diff --git "a/log/debug_0.log" "b/log/debug_0.log" --- "a/log/debug_0.log" +++ "b/log/debug_0.log" @@ -1,60046 +1,3 @@ -11/06/2021 21:16:12 - INFO - __main__ - Distributed environment: MULTI_GPU Backend: nccl -Num processes: 16 -Process index: 0 -Local process index: 0 -Device: cuda:0 -Use FP16 precision: True - -11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - /home/leandro/codeparrot-small/./ is already a clone of https://huggingface.co/lvwerra/codeparrot-small. Make sure you pull the latest changes with `repo.git_pull()`. -11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - Revision `proud-haze-135` does not exist. Created and checked out branch `proud-haze-135`. -11/06/2021 21:16:13 - WARNING - huggingface_hub.repository - -11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0b/f3/0bf3cd1320065c163f47a112458dc107650e3e862094b703b76073bd0b68663d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/37/26/3726a0239b5cb7d0ef3ea36886c533d0becc7404217763015559edb546d53c94'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e7/a9/e7a9ccbfe6bd92476f83eba205c47ed23732ace4c1bd7458d76d666ebbba3b1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/73/73/737327c2b47693e00050aa3410c5eb402c66211a79740ab57f1c763a1e557563'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2a/7e/2a7e50bbdb90d6c4cec534c3f1dc7ec0e6a0dada15c07cfd94615940c632ce02'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5a/5f/5a5fbc19e0e76787f668ada7235203c10b0cbcdea0ecf8f873f8ec281cfe3494'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/74/31/7431977a8e3a6eb0348b821009495f85d9373c1f730f4a74b0db43326568f77d'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/50/38/503872def2ac44733fbefc2602ab16224caca0896aa1eba045025ef2d60efcdc'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/ce/b6ce495492aedfc91b66efdfd214b2dfe44867c719d51590e1868e42f4e9b6dd'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/df/08/df0840d1657530c8fa9f82864be5999c515f54341d926c430a82528a6bb83740'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2f/62/2f628d890bceee216f87edb3c45d2e384ee2501ce41a4c4169efaa3363bef1d2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/0f/7a/0f7a67cd83c1c069995f0f2510ebf818dcc71d9658f189de1231d2b7aac8883c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/05/39/053944e1daead0b6de8e46ea2e0bc68b9247604c63a55d444ac3b9adb12e2cd2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/dc/ac/dcacb03d8f43f7879c5eab4422644d7b3797b47dbb0c9c84d88cbc85822d8306'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/e3/ace3ac440b380d604ab198cf8e838a2a375e7b0a6b5699ec74a8c79648f4bab8'), PosixPath('/home/leandro/codeparrot-clean-train/.git/description'), PosixPath('/home/leandro/codeparrot-clean-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d4/9f/d49f1929644619c39cff677367ff2e18223a8046ec8f61e224954a10aa2ccf8f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/2e/aa/2eaa21b832ed1496fb7f0b259666dbfc36ed483d81494d1e8705f9d601509c12'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/a7/f1a7a250e1f6164a7fb602131ff54b69deb305258792f2358075403769d58fe5'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/d0/02/d0024828eece6d4d1c25cb4e539328be97fa28ce66a3b8d2374a117711cfd520'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/90/a5/90a573501de640c3e0e6f1b3508306febc96faf6061bb33c67894c168a1879c6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5d/42/5d42ba9f195510757a3699005a7c43ddede4b598caf8a5f2f8c84d1125fa6324'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/5f/d1/5fd1bb56db810b65d1fd3866dc43d9c7b690c8f52b9ca8119b2a5f4c49d13eec'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/7c/0e/7c0ef87edb0e556939282c859c7c893a91b5b0f931394ca4cca4f4ec98a61951'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ee/c1/eec1a9546aac0444a706c09f6aab67cd64403940657417e30212b7ff1e16665c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/b6/55b6989a41ae296337356153e6081c61484d0b6734b6905683823e7317d01c42'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cc/58/cc58b22515c4fd7d891287ee717c2054290b20c17b1c34693fd8964ab730687b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b6/8a/b68a74f9784402dcb311f4db72a873035e47b98b185a1813ab2c1645cb7255a2'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fb/84/fb84ca8000808f62718994e4b44e79d88a05b345e9638d9f6cf6c8a5472da01f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.pack'), PosixPath('/home/leandro/codeparrot-clean-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/12/8d/128d56e09d9d741b2778d733e595838a50a5e82fdc9adbb0aa8645457716b97e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/objects/pack/pack-12438cb8112d3b4104fefcb88d751872b5e0fd6e.idx'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/b4/83/b4836655e350f0796acd2b1a206e657c2808d9f136afae095e0b94a790c704e1'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/3e/f2/3ef240d0b394384803ae1bbe3b30974e11eb9b1b6ad4f49afc2ed0f7c9eae0d6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/14/08/14089cad26037080ee900bede2fd42d5cac70738b2e77402b36681e1d2a521f6'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/86/0e/860eda34e90456533e9dd41a5c0fdb74c54dc8d9cf43d6c60b887b2c858be831'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/15/ac/15ac016e4cd702bb184457cbf5674d71b632fc34c29611ba4de549b85c67acfb'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/a4/6b/a46b5c08d39691524b46fadf78eab5efefa29978edfee799ec3587d928dc1302'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/fa/e6/fae6b44a24c1c35f15053a19a6b2b2af5cc9fb8bdaf0da409068a2a1f333f28e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/5e/175e7375d6f65993071aa653bdd4e8b117cc02d1d2353cd7bcdbaaf7fe8b3c9c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ac/36/ac36d12d37c1dc8ee8d3b8f0eae93966ae73482ef725615bb1a715802ddd4dd4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/17/96/1796f12729d0407cc57500c9c87959e0e7becd729f37374702868ed8765015f4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/67/f1/67f1ff0d590fbf4aa9afa161c290fe9be17538d4b723278bb21fd6408b0e6a3e'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/55/c9/55c9c0b2f26de96e0311ee43e8eaa78ad1af387d0c59a26f22c5ebd507dda321'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/config'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9f/7e/9f7e18a3980d4b3d5ed9469ab7a2d67b608e8aa6fff38d876f86719c8f2a7a82'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/e6/48/e6484a578778beccab26c8549608ec13970e6bcdb9541cdccad20f4d984e8181'), PosixPath('/home/leandro/codeparrot-clean-train/.git/index'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/54/60/5460223b92bb118814a7777a939f4005b7426a7e4a068c193c10d1b86eeb862b'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ae/45/ae45741df674456bc63bad91374d2ba5ef988d33d6e2a322ef0a5ac8af040371'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/60/41/604177fe5560efd99d93091fadab6293afe7cd7d12f81638c301de1c937c1583'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/ef/e1/efe1759837b74b5b5ed3df1a09d4c880f9ad20413d958f79d35bf1cb6a2a09d4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/32/be/32beb30e381ff02fb71854b5534306f395ef00f51f02b62da1f027c8c7fab26f'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/9b/1b/9b1b8e52b9262f03f1719d3950dc8dfa2b9719dc2e273603023f6f329c1b2068'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/56/80/56803c607a19ccb576c90bdb10a02cfa7b3affc67dd150fa41b00cc22213b174'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/4e/39/4e392fcaae564652d234d07b4f71eeed90efe51b1b714831e39d77f3e537d3df'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/cd/33/cd339656799518495d23aedf1503459be6d3086e22672e80edab8403d12ded1c'), PosixPath('/home/leandro/codeparrot-clean-train/.git/lfs/objects/f1/62/f162b06b5dca01aa85ef9a675d396c0fbab1d009b5bee1c5b7ea6b415c6f12a4'), PosixPath('/home/leandro/codeparrot-clean-train/.git/hooks/post-merge')] -11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-train-e839c6c1585da466 -11/06/2021 21:16:15 - INFO - datasets.data_files - Some files matched the pattern '*' at /home/leandro/codeparrot-clean-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/60/0dc2964cf471fa4aac706659009777cf176497'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/95/7b2579c6ef20995a09efd9a17f8fd90606f5ed'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/config'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/index'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/25/747fcf966f2b7b3a2f4149130bff69ebe83718'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/15/4f5f07c68026fb069c4bdfe3966893737035f4'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/6d/d1188965fcd7feab0efc3506668a615805e13f'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/description'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/d9/cd7ad451bcd8a388471b341a961d0e6e6ff558'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/55/36bbd68dd8f283092b22eb77a051175c1b727a'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/lfs/objects/7f/8c/7f8c20a737c9084779bcdb853325ad4774d0db52c74aa2a63fd658d6787eb35b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/09/e6a70d1aadc53ed29b9890332f184f89d0a39b'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/objects/5e/d5325308cb9a07b2c5807dad51120c9a75b6db'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-clean-valid/.git/hooks/pre-receive.sample')] -11/06/2021 21:16:15 - WARNING - datasets.builder - Using custom data configuration codeparrot-clean-valid-ced470bd23403144 -11/06/2021 21:16:43 - INFO - __main__ - Step 1: {'lr': 0.0, 'samples': 192, 'steps': 0, 'loss/train': 10.55798625946045} -11/06/2021 21:16:43 - INFO - root - Reducer buckets have been rebuilt in this iteration. -11/06/2021 21:16:43 - INFO - __main__ - Step 2: {'lr': 2.5e-07, 'samples': 384, 'steps': 1, 'loss/train': 10.535750389099121} -11/06/2021 21:16:43 - INFO - __main__ - Step 3: {'lr': 5e-07, 'samples': 576, 'steps': 2, 'loss/train': 10.530282974243164} -11/06/2021 21:16:44 - INFO - __main__ - Step 4: {'lr': 7.5e-07, 'samples': 768, 'steps': 3, 'loss/train': 10.527787208557129} -11/06/2021 21:16:45 - INFO - __main__ - Step 5: {'lr': 1e-06, 'samples': 960, 'steps': 4, 'loss/train': 10.491048812866211} -11/06/2021 21:16:46 - INFO - __main__ - Step 6: {'lr': 1.25e-06, 'samples': 1152, 'steps': 5, 'loss/train': 10.409588813781738} -11/06/2021 21:16:46 - INFO - __main__ - Step 7: {'lr': 1.5e-06, 'samples': 1344, 'steps': 6, 'loss/train': 10.350728034973145} -11/06/2021 21:16:46 - INFO - __main__ - Step 8: {'lr': 1.75e-06, 'samples': 1536, 'steps': 7, 'loss/train': 10.252238273620605} -11/06/2021 21:16:47 - INFO - __main__ - Step 9: {'lr': 2e-06, 'samples': 1728, 'steps': 8, 'loss/train': 10.193534851074219} -11/06/2021 21:16:47 - INFO - __main__ - Step 10: {'lr': 2.25e-06, 'samples': 1920, 'steps': 9, 'loss/train': 9.953790664672852} -11/06/2021 21:16:48 - INFO - __main__ - Step 11: {'lr': 2.5e-06, 'samples': 2112, 'steps': 10, 'loss/train': 10.194929122924805} -11/06/2021 21:16:49 - INFO - __main__ - Step 12: {'lr': 2.75e-06, 'samples': 2304, 'steps': 11, 'loss/train': 9.89802074432373} -11/06/2021 21:16:49 - INFO - __main__ - Step 13: {'lr': 3e-06, 'samples': 2496, 'steps': 12, 'loss/train': 9.843729972839355} -11/06/2021 21:16:49 - INFO - __main__ - Step 14: {'lr': 3.25e-06, 'samples': 2688, 'steps': 13, 'loss/train': 9.845044136047363} -11/06/2021 21:16:50 - INFO - __main__ - Step 15: {'lr': 3.5e-06, 'samples': 2880, 'steps': 14, 'loss/train': 9.869210243225098} -11/06/2021 21:16:51 - INFO - __main__ - Step 16: {'lr': 3.75e-06, 'samples': 3072, 'steps': 15, 'loss/train': 9.587459564208984} -11/06/2021 21:16:51 - INFO - __main__ - Step 17: {'lr': 4e-06, 'samples': 3264, 'steps': 16, 'loss/train': 9.667202949523926} -11/06/2021 21:16:51 - INFO - __main__ - Step 18: {'lr': 4.250000000000001e-06, 'samples': 3456, 'steps': 17, 'loss/train': 9.495230674743652} -11/06/2021 21:16:52 - INFO - __main__ - Step 19: {'lr': 4.5e-06, 'samples': 3648, 'steps': 18, 'loss/train': 9.640376091003418} -11/06/2021 21:16:52 - INFO - __main__ - Step 20: {'lr': 4.75e-06, 'samples': 3840, 'steps': 19, 'loss/train': 9.428448677062988} -11/06/2021 21:16:52 - INFO - __main__ - Step 21: {'lr': 5e-06, 'samples': 4032, 'steps': 20, 'loss/train': 9.341026306152344} -11/06/2021 21:16:54 - INFO - __main__ - Step 22: {'lr': 5.2500000000000006e-06, 'samples': 4224, 'steps': 21, 'loss/train': 9.372577667236328} -11/06/2021 21:16:54 - INFO - __main__ - Step 23: {'lr': 5.5e-06, 'samples': 4416, 'steps': 22, 'loss/train': 8.967851638793945} -11/06/2021 21:16:54 - INFO - __main__ - Step 24: {'lr': 5.75e-06, 'samples': 4608, 'steps': 23, 'loss/train': 8.74506950378418} -11/06/2021 21:16:55 - INFO - __main__ - Step 25: {'lr': 6e-06, 'samples': 4800, 'steps': 24, 'loss/train': 9.786674499511719} -11/06/2021 21:16:55 - INFO - __main__ - Step 26: {'lr': 6.25e-06, 'samples': 4992, 'steps': 25, 'loss/train': 9.504456520080566} -11/06/2021 21:16:56 - INFO - __main__ - Step 27: {'lr': 6.5e-06, 'samples': 5184, 'steps': 26, 'loss/train': 9.166744232177734} -11/06/2021 21:16:56 - INFO - __main__ - Step 28: {'lr': 6.75e-06, 'samples': 5376, 'steps': 27, 'loss/train': 8.682860374450684} -11/06/2021 21:16:57 - INFO - __main__ - Step 29: {'lr': 7e-06, 'samples': 5568, 'steps': 28, 'loss/train': 8.596318244934082} -11/06/2021 21:16:57 - INFO - __main__ - Step 30: {'lr': 7.250000000000001e-06, 'samples': 5760, 'steps': 29, 'loss/train': 9.048979759216309} -11/06/2021 21:16:57 - INFO - __main__ - Step 31: {'lr': 7.5e-06, 'samples': 5952, 'steps': 30, 'loss/train': 9.320890426635742} -11/06/2021 21:16:58 - INFO - __main__ - Step 32: {'lr': 7.75e-06, 'samples': 6144, 'steps': 31, 'loss/train': 8.952228546142578} -11/06/2021 21:16:59 - INFO - __main__ - Step 33: {'lr': 8e-06, 'samples': 6336, 'steps': 32, 'loss/train': 8.751225471496582} -11/06/2021 21:16:59 - INFO - __main__ - Step 34: {'lr': 8.25e-06, 'samples': 6528, 'steps': 33, 'loss/train': 9.156981468200684} -11/06/2021 21:17:00 - INFO - __main__ - Step 35: {'lr': 8.500000000000002e-06, 'samples': 6720, 'steps': 34, 'loss/train': 8.837956428527832} -11/06/2021 21:17:00 - INFO - __main__ - Step 36: {'lr': 8.750000000000001e-06, 'samples': 6912, 'steps': 35, 'loss/train': 8.935142517089844} -11/06/2021 21:17:01 - INFO - __main__ - Step 37: {'lr': 9e-06, 'samples': 7104, 'steps': 36, 'loss/train': 9.019933700561523} -11/06/2021 21:17:02 - INFO - __main__ - Step 38: {'lr': 9.25e-06, 'samples': 7296, 'steps': 37, 'loss/train': 8.594483375549316} -11/06/2021 21:17:02 - INFO - __main__ - Step 39: {'lr': 9.5e-06, 'samples': 7488, 'steps': 38, 'loss/train': 9.565625190734863} -11/06/2021 21:17:02 - INFO - __main__ - Step 40: {'lr': 9.75e-06, 'samples': 7680, 'steps': 39, 'loss/train': 9.195219039916992} -11/06/2021 21:17:03 - INFO - __main__ - Step 41: {'lr': 1e-05, 'samples': 7872, 'steps': 40, 'loss/train': 9.008049011230469} -11/06/2021 21:17:04 - INFO - __main__ - Step 42: {'lr': 1.025e-05, 'samples': 8064, 'steps': 41, 'loss/train': 9.54212760925293} -11/06/2021 21:17:04 - INFO - __main__ - Step 43: {'lr': 1.0500000000000001e-05, 'samples': 8256, 'steps': 42, 'loss/train': 9.074606895446777} -11/06/2021 21:17:04 - INFO - __main__ - Step 44: {'lr': 1.0749999999999999e-05, 'samples': 8448, 'steps': 43, 'loss/train': 9.575305938720703} -11/06/2021 21:17:05 - INFO - __main__ - Step 45: {'lr': 1.1e-05, 'samples': 8640, 'steps': 44, 'loss/train': 9.862631797790527} -11/06/2021 21:17:05 - INFO - __main__ - Step 46: {'lr': 1.1249999999999999e-05, 'samples': 8832, 'steps': 45, 'loss/train': 8.833338737487793} -11/06/2021 21:17:06 - INFO - __main__ - Step 47: {'lr': 1.15e-05, 'samples': 9024, 'steps': 46, 'loss/train': 8.830769538879395} -11/06/2021 21:17:07 - INFO - __main__ - Step 48: {'lr': 1.1750000000000001e-05, 'samples': 9216, 'steps': 47, 'loss/train': 8.828520774841309} -11/06/2021 21:17:07 - INFO - __main__ - Step 49: {'lr': 1.2e-05, 'samples': 9408, 'steps': 48, 'loss/train': 8.692312240600586} -11/06/2021 21:17:07 - INFO - __main__ - Step 50: {'lr': 1.2250000000000001e-05, 'samples': 9600, 'steps': 49, 'loss/train': 8.698874473571777} -11/06/2021 21:17:08 - INFO - __main__ - Step 51: {'lr': 1.25e-05, 'samples': 9792, 'steps': 50, 'loss/train': 8.904641151428223} -11/06/2021 21:17:09 - INFO - __main__ - Step 52: {'lr': 1.275e-05, 'samples': 9984, 'steps': 51, 'loss/train': 8.66476821899414} -11/06/2021 21:17:09 - INFO - __main__ - Step 53: {'lr': 1.3e-05, 'samples': 10176, 'steps': 52, 'loss/train': 8.561541557312012} -11/06/2021 21:17:10 - INFO - __main__ - Step 54: {'lr': 1.325e-05, 'samples': 10368, 'steps': 53, 'loss/train': 8.71354866027832} -11/06/2021 21:17:10 - INFO - __main__ - Step 55: {'lr': 1.35e-05, 'samples': 10560, 'steps': 54, 'loss/train': 8.084650993347168} -11/06/2021 21:17:10 - INFO - __main__ - Step 56: {'lr': 1.375e-05, 'samples': 10752, 'steps': 55, 'loss/train': 8.701323509216309} -11/06/2021 21:17:11 - INFO - __main__ - Step 57: {'lr': 1.4e-05, 'samples': 10944, 'steps': 56, 'loss/train': 8.886054039001465} -11/06/2021 21:17:12 - INFO - __main__ - Step 58: {'lr': 1.425e-05, 'samples': 11136, 'steps': 57, 'loss/train': 8.962408065795898} -11/06/2021 21:17:12 - INFO - __main__ - Step 59: {'lr': 1.4500000000000002e-05, 'samples': 11328, 'steps': 58, 'loss/train': 8.731340408325195} -11/06/2021 21:17:13 - INFO - __main__ - Step 60: {'lr': 1.475e-05, 'samples': 11520, 'steps': 59, 'loss/train': 8.48225212097168} -11/06/2021 21:17:13 - INFO - __main__ - Step 61: {'lr': 1.5e-05, 'samples': 11712, 'steps': 60, 'loss/train': 8.860502243041992} -11/06/2021 21:17:14 - INFO - __main__ - Step 62: {'lr': 1.525e-05, 'samples': 11904, 'steps': 61, 'loss/train': 8.848859786987305} -11/06/2021 21:17:15 - INFO - __main__ - Step 63: {'lr': 1.55e-05, 'samples': 12096, 'steps': 62, 'loss/train': 8.20711612701416} -11/06/2021 21:17:15 - INFO - __main__ - Step 64: {'lr': 1.575e-05, 'samples': 12288, 'steps': 63, 'loss/train': 10.296394348144531} -11/06/2021 21:17:15 - INFO - __main__ - Step 65: {'lr': 1.6e-05, 'samples': 12480, 'steps': 64, 'loss/train': 7.71311092376709} -11/06/2021 21:17:16 - INFO - __main__ - Step 66: {'lr': 1.6250000000000002e-05, 'samples': 12672, 'steps': 65, 'loss/train': 8.466562271118164} -11/06/2021 21:17:16 - INFO - __main__ - Step 67: {'lr': 1.65e-05, 'samples': 12864, 'steps': 66, 'loss/train': 8.35257339477539} -11/06/2021 21:17:17 - INFO - __main__ - Step 68: {'lr': 1.675e-05, 'samples': 13056, 'steps': 67, 'loss/train': 8.386396408081055} -11/06/2021 21:17:18 - INFO - __main__ - Step 69: {'lr': 1.7000000000000003e-05, 'samples': 13248, 'steps': 68, 'loss/train': 8.12002944946289} -11/06/2021 21:17:18 - INFO - __main__ - Step 70: {'lr': 1.7250000000000003e-05, 'samples': 13440, 'steps': 69, 'loss/train': 8.70462417602539} -11/06/2021 21:17:18 - INFO - __main__ - Step 71: {'lr': 1.7500000000000002e-05, 'samples': 13632, 'steps': 70, 'loss/train': 8.239697456359863} -11/06/2021 21:17:19 - INFO - __main__ - Step 72: {'lr': 1.7749999999999998e-05, 'samples': 13824, 'steps': 71, 'loss/train': 7.610179424285889} -11/06/2021 21:17:20 - INFO - __main__ - Step 73: {'lr': 1.8e-05, 'samples': 14016, 'steps': 72, 'loss/train': 7.8869452476501465} -11/06/2021 21:17:20 - INFO - __main__ - Step 74: {'lr': 1.825e-05, 'samples': 14208, 'steps': 73, 'loss/train': 7.692283630371094} -11/06/2021 21:17:21 - INFO - __main__ - Step 75: {'lr': 1.85e-05, 'samples': 14400, 'steps': 74, 'loss/train': 8.208292007446289} -11/06/2021 21:17:21 - INFO - __main__ - Step 76: {'lr': 1.875e-05, 'samples': 14592, 'steps': 75, 'loss/train': 7.97852897644043} -11/06/2021 21:17:21 - INFO - __main__ - Step 77: {'lr': 1.9e-05, 'samples': 14784, 'steps': 76, 'loss/train': 8.777739524841309} -11/06/2021 21:17:22 - INFO - __main__ - Step 78: {'lr': 1.925e-05, 'samples': 14976, 'steps': 77, 'loss/train': 7.68981409072876} -11/06/2021 21:17:23 - INFO - __main__ - Step 79: {'lr': 1.95e-05, 'samples': 15168, 'steps': 78, 'loss/train': 7.656458854675293} -11/06/2021 21:17:23 - INFO - __main__ - Step 80: {'lr': 1.975e-05, 'samples': 15360, 'steps': 79, 'loss/train': 8.30695915222168} -11/06/2021 21:17:23 - INFO - __main__ - Step 81: {'lr': 2e-05, 'samples': 15552, 'steps': 80, 'loss/train': 7.897383689880371} -11/06/2021 21:17:24 - INFO - __main__ - Step 82: {'lr': 2.025e-05, 'samples': 15744, 'steps': 81, 'loss/train': 8.267080307006836} -11/06/2021 21:17:25 - INFO - __main__ - Step 83: {'lr': 2.05e-05, 'samples': 15936, 'steps': 82, 'loss/train': 8.247127532958984} -11/06/2021 21:17:25 - INFO - __main__ - Step 84: {'lr': 2.0750000000000003e-05, 'samples': 16128, 'steps': 83, 'loss/train': 8.18776798248291} -11/06/2021 21:17:25 - INFO - __main__ - Step 85: {'lr': 2.1000000000000002e-05, 'samples': 16320, 'steps': 84, 'loss/train': 7.7213358879089355} -11/06/2021 21:17:26 - INFO - __main__ - Step 86: {'lr': 2.125e-05, 'samples': 16512, 'steps': 85, 'loss/train': 7.880347728729248} -11/06/2021 21:17:26 - INFO - __main__ - Step 87: {'lr': 2.1499999999999997e-05, 'samples': 16704, 'steps': 86, 'loss/train': 8.094650268554688} -11/06/2021 21:17:27 - INFO - __main__ - Step 88: {'lr': 2.175e-05, 'samples': 16896, 'steps': 87, 'loss/train': 7.1267242431640625} -11/06/2021 21:17:27 - INFO - __main__ - Step 89: {'lr': 2.2e-05, 'samples': 17088, 'steps': 88, 'loss/train': 7.992337703704834} -11/06/2021 21:17:28 - INFO - __main__ - Step 90: {'lr': 2.225e-05, 'samples': 17280, 'steps': 89, 'loss/train': 7.918111801147461} -11/06/2021 21:17:28 - INFO - __main__ - Step 91: {'lr': 2.2499999999999998e-05, 'samples': 17472, 'steps': 90, 'loss/train': 7.4610795974731445} -11/06/2021 21:17:29 - INFO - __main__ - Step 92: {'lr': 2.275e-05, 'samples': 17664, 'steps': 91, 'loss/train': 7.861474990844727} -11/06/2021 21:17:29 - INFO - __main__ - Step 93: {'lr': 2.3e-05, 'samples': 17856, 'steps': 92, 'loss/train': 7.493942737579346} -11/06/2021 21:17:30 - INFO - __main__ - Step 94: {'lr': 2.325e-05, 'samples': 18048, 'steps': 93, 'loss/train': 8.051450729370117} -11/06/2021 21:17:30 - INFO - __main__ - Step 95: {'lr': 2.3500000000000002e-05, 'samples': 18240, 'steps': 94, 'loss/train': 7.800515651702881} -11/06/2021 21:17:31 - INFO - __main__ - Step 96: {'lr': 2.375e-05, 'samples': 18432, 'steps': 95, 'loss/train': 7.40056037902832} -11/06/2021 21:17:31 - INFO - __main__ - Step 97: {'lr': 2.4e-05, 'samples': 18624, 'steps': 96, 'loss/train': 7.518774032592773} -11/06/2021 21:17:31 - INFO - __main__ - Step 98: {'lr': 2.425e-05, 'samples': 18816, 'steps': 97, 'loss/train': 7.735995292663574} -11/06/2021 21:17:32 - INFO - __main__ - Step 99: {'lr': 2.4500000000000003e-05, 'samples': 19008, 'steps': 98, 'loss/train': 7.60399866104126} -11/06/2021 21:17:33 - INFO - __main__ - Step 100: {'lr': 2.4750000000000002e-05, 'samples': 19200, 'steps': 99, 'loss/train': 7.875792980194092} -11/06/2021 21:17:33 - INFO - __main__ - Step 101: {'lr': 2.5e-05, 'samples': 19392, 'steps': 100, 'loss/train': 7.704280853271484} -11/06/2021 21:17:34 - INFO - __main__ - Step 102: {'lr': 2.525e-05, 'samples': 19584, 'steps': 101, 'loss/train': 7.629642009735107} -11/06/2021 21:17:34 - INFO - __main__ - Step 103: {'lr': 2.55e-05, 'samples': 19776, 'steps': 102, 'loss/train': 7.427465915679932} -11/06/2021 21:17:35 - INFO - __main__ - Step 104: {'lr': 2.575e-05, 'samples': 19968, 'steps': 103, 'loss/train': 7.325517654418945} -11/06/2021 21:17:35 - INFO - __main__ - Step 105: {'lr': 2.6e-05, 'samples': 20160, 'steps': 104, 'loss/train': 7.825165271759033} -11/06/2021 21:17:36 - INFO - __main__ - Step 106: {'lr': 2.625e-05, 'samples': 20352, 'steps': 105, 'loss/train': 7.557342529296875} -11/06/2021 21:17:36 - INFO - __main__ - Step 107: {'lr': 2.65e-05, 'samples': 20544, 'steps': 106, 'loss/train': 7.5471510887146} -11/06/2021 21:17:36 - INFO - __main__ - Step 108: {'lr': 2.675e-05, 'samples': 20736, 'steps': 107, 'loss/train': 7.51965856552124} -11/06/2021 21:17:37 - INFO - __main__ - Step 109: {'lr': 2.7e-05, 'samples': 20928, 'steps': 108, 'loss/train': 7.727786540985107} -11/06/2021 21:17:38 - INFO - __main__ - Step 110: {'lr': 2.725e-05, 'samples': 21120, 'steps': 109, 'loss/train': 8.008770942687988} -11/06/2021 21:17:38 - INFO - __main__ - Step 111: {'lr': 2.75e-05, 'samples': 21312, 'steps': 110, 'loss/train': 7.874051094055176} -11/06/2021 21:17:38 - INFO - __main__ - Step 112: {'lr': 2.775e-05, 'samples': 21504, 'steps': 111, 'loss/train': 7.637380599975586} -11/06/2021 21:17:39 - INFO - __main__ - Step 113: {'lr': 2.8e-05, 'samples': 21696, 'steps': 112, 'loss/train': 7.677240371704102} -11/06/2021 21:17:40 - INFO - __main__ - Step 114: {'lr': 2.8250000000000002e-05, 'samples': 21888, 'steps': 113, 'loss/train': 7.03343391418457} -11/06/2021 21:17:40 - INFO - __main__ - Step 115: {'lr': 2.85e-05, 'samples': 22080, 'steps': 114, 'loss/train': 7.615724563598633} -11/06/2021 21:17:41 - INFO - __main__ - Step 116: {'lr': 2.875e-05, 'samples': 22272, 'steps': 115, 'loss/train': 7.741561412811279} -11/06/2021 21:17:41 - INFO - __main__ - Step 117: {'lr': 2.9000000000000004e-05, 'samples': 22464, 'steps': 116, 'loss/train': 8.360411643981934} -11/06/2021 21:17:41 - INFO - __main__ - Step 118: {'lr': 2.9250000000000003e-05, 'samples': 22656, 'steps': 117, 'loss/train': 7.302130222320557} -11/06/2021 21:17:42 - INFO - __main__ - Step 119: {'lr': 2.95e-05, 'samples': 22848, 'steps': 118, 'loss/train': 7.071781158447266} -11/06/2021 21:17:43 - INFO - __main__ - Step 120: {'lr': 2.9749999999999998e-05, 'samples': 23040, 'steps': 119, 'loss/train': 7.1986308097839355} -11/06/2021 21:17:43 - INFO - __main__ - Step 121: {'lr': 3e-05, 'samples': 23232, 'steps': 120, 'loss/train': 6.897414684295654} -11/06/2021 21:17:43 - INFO - __main__ - Step 122: {'lr': 3.025e-05, 'samples': 23424, 'steps': 121, 'loss/train': 6.9648213386535645} -11/06/2021 21:17:44 - INFO - __main__ - Step 123: {'lr': 3.05e-05, 'samples': 23616, 'steps': 122, 'loss/train': 7.184485912322998} -11/06/2021 21:17:45 - INFO - __main__ - Step 124: {'lr': 3.075e-05, 'samples': 23808, 'steps': 123, 'loss/train': 6.945891857147217} -11/06/2021 21:17:45 - INFO - __main__ - Step 125: {'lr': 3.1e-05, 'samples': 24000, 'steps': 124, 'loss/train': 7.381505489349365} -11/06/2021 21:17:46 - INFO - __main__ - Step 126: {'lr': 3.125e-05, 'samples': 24192, 'steps': 125, 'loss/train': 7.457914352416992} -11/06/2021 21:17:46 - INFO - __main__ - Step 127: {'lr': 3.15e-05, 'samples': 24384, 'steps': 126, 'loss/train': 7.405432224273682} -11/06/2021 21:17:47 - INFO - __main__ - Step 128: {'lr': 3.175e-05, 'samples': 24576, 'steps': 127, 'loss/train': 7.172966003417969} -11/06/2021 21:17:48 - INFO - __main__ - Step 129: {'lr': 3.2e-05, 'samples': 24768, 'steps': 128, 'loss/train': 7.367163181304932} -11/06/2021 21:17:48 - INFO - __main__ - Step 130: {'lr': 3.2250000000000005e-05, 'samples': 24960, 'steps': 129, 'loss/train': 6.170543670654297} -11/06/2021 21:17:48 - INFO - __main__ - Step 131: {'lr': 3.2500000000000004e-05, 'samples': 25152, 'steps': 130, 'loss/train': 6.940507411956787} -11/06/2021 21:17:49 - INFO - __main__ - Step 132: {'lr': 3.275e-05, 'samples': 25344, 'steps': 131, 'loss/train': 7.2779364585876465} -11/06/2021 21:17:49 - INFO - __main__ - Step 133: {'lr': 3.3e-05, 'samples': 25536, 'steps': 132, 'loss/train': 6.9434428215026855} -11/06/2021 21:17:49 - INFO - __main__ - Step 134: {'lr': 3.325e-05, 'samples': 25728, 'steps': 133, 'loss/train': 7.035802841186523} -11/06/2021 21:17:50 - INFO - __main__ - Step 135: {'lr': 3.35e-05, 'samples': 25920, 'steps': 134, 'loss/train': 8.246500015258789} -11/06/2021 21:17:51 - INFO - __main__ - Step 136: {'lr': 3.375e-05, 'samples': 26112, 'steps': 135, 'loss/train': 6.835116386413574} -11/06/2021 21:17:51 - INFO - __main__ - Step 137: {'lr': 3.4000000000000007e-05, 'samples': 26304, 'steps': 136, 'loss/train': 6.883285999298096} -11/06/2021 21:17:51 - INFO - __main__ - Step 138: {'lr': 3.4250000000000006e-05, 'samples': 26496, 'steps': 137, 'loss/train': 7.106326103210449} -11/06/2021 21:17:52 - INFO - __main__ - Step 139: {'lr': 3.4500000000000005e-05, 'samples': 26688, 'steps': 138, 'loss/train': 7.33680534362793} -11/06/2021 21:17:53 - INFO - __main__ - Step 140: {'lr': 3.4750000000000004e-05, 'samples': 26880, 'steps': 139, 'loss/train': 6.972182273864746} -11/06/2021 21:17:53 - INFO - __main__ - Step 141: {'lr': 3.5000000000000004e-05, 'samples': 27072, 'steps': 140, 'loss/train': 6.676812171936035} -11/06/2021 21:17:54 - INFO - __main__ - Step 142: {'lr': 3.5249999999999996e-05, 'samples': 27264, 'steps': 141, 'loss/train': 7.476287364959717} -11/06/2021 21:17:54 - INFO - __main__ - Step 143: {'lr': 3.5499999999999996e-05, 'samples': 27456, 'steps': 142, 'loss/train': 6.697681903839111} -11/06/2021 21:17:54 - INFO - __main__ - Step 144: {'lr': 3.5749999999999995e-05, 'samples': 27648, 'steps': 143, 'loss/train': 6.98452091217041} -11/06/2021 21:17:55 - INFO - __main__ - Step 145: {'lr': 3.6e-05, 'samples': 27840, 'steps': 144, 'loss/train': 6.702653408050537} -11/06/2021 21:17:56 - INFO - __main__ - Step 146: {'lr': 3.625e-05, 'samples': 28032, 'steps': 145, 'loss/train': 7.03615140914917} -11/06/2021 21:17:56 - INFO - __main__ - Step 147: {'lr': 3.65e-05, 'samples': 28224, 'steps': 146, 'loss/train': 6.963271617889404} -11/06/2021 21:17:56 - INFO - __main__ - Step 148: {'lr': 3.675e-05, 'samples': 28416, 'steps': 147, 'loss/train': 6.389257907867432} -11/06/2021 21:17:57 - INFO - __main__ - Step 149: {'lr': 3.7e-05, 'samples': 28608, 'steps': 148, 'loss/train': 6.685713768005371} -11/06/2021 21:17:58 - INFO - __main__ - Step 150: {'lr': 3.725e-05, 'samples': 28800, 'steps': 149, 'loss/train': 6.8497772216796875} -11/06/2021 21:17:58 - INFO - __main__ - Step 151: {'lr': 3.75e-05, 'samples': 28992, 'steps': 150, 'loss/train': 6.36531925201416} -11/06/2021 21:17:59 - INFO - __main__ - Step 152: {'lr': 3.775e-05, 'samples': 29184, 'steps': 151, 'loss/train': 6.523715019226074} -11/06/2021 21:17:59 - INFO - __main__ - Step 153: {'lr': 3.8e-05, 'samples': 29376, 'steps': 152, 'loss/train': 7.334853172302246} -11/06/2021 21:17:59 - INFO - __main__ - Step 154: {'lr': 3.825e-05, 'samples': 29568, 'steps': 153, 'loss/train': 6.311091423034668} -11/06/2021 21:18:00 - INFO - __main__ - Step 155: {'lr': 3.85e-05, 'samples': 29760, 'steps': 154, 'loss/train': 6.930693626403809} -11/06/2021 21:18:01 - INFO - __main__ - Step 156: {'lr': 3.875e-05, 'samples': 29952, 'steps': 155, 'loss/train': 7.10976505279541} -11/06/2021 21:18:01 - INFO - __main__ - Step 157: {'lr': 3.9e-05, 'samples': 30144, 'steps': 156, 'loss/train': 6.257956504821777} -11/06/2021 21:18:01 - INFO - __main__ - Step 158: {'lr': 3.925e-05, 'samples': 30336, 'steps': 157, 'loss/train': 6.675495624542236} -11/06/2021 21:18:02 - INFO - __main__ - Step 159: {'lr': 3.95e-05, 'samples': 30528, 'steps': 158, 'loss/train': 6.756046295166016} -11/06/2021 21:18:03 - INFO - __main__ - Step 160: {'lr': 3.9750000000000004e-05, 'samples': 30720, 'steps': 159, 'loss/train': 7.092185020446777} -11/06/2021 21:18:03 - INFO - __main__ - Step 161: {'lr': 4e-05, 'samples': 30912, 'steps': 160, 'loss/train': 6.609521389007568} -11/06/2021 21:18:04 - INFO - __main__ - Step 162: {'lr': 4.025e-05, 'samples': 31104, 'steps': 161, 'loss/train': 6.6135945320129395} -11/06/2021 21:18:04 - INFO - __main__ - Step 163: {'lr': 4.05e-05, 'samples': 31296, 'steps': 162, 'loss/train': 6.731355667114258} -11/06/2021 21:18:04 - INFO - __main__ - Step 164: {'lr': 4.075e-05, 'samples': 31488, 'steps': 163, 'loss/train': 6.836953163146973} -11/06/2021 21:18:05 - INFO - __main__ - Step 165: {'lr': 4.1e-05, 'samples': 31680, 'steps': 164, 'loss/train': 6.64618444442749} -11/06/2021 21:18:06 - INFO - __main__ - Step 166: {'lr': 4.125e-05, 'samples': 31872, 'steps': 165, 'loss/train': 6.482452869415283} -11/06/2021 21:18:06 - INFO - __main__ - Step 167: {'lr': 4.1500000000000006e-05, 'samples': 32064, 'steps': 166, 'loss/train': 6.185523509979248} -11/06/2021 21:18:06 - INFO - __main__ - Step 168: {'lr': 4.1750000000000005e-05, 'samples': 32256, 'steps': 167, 'loss/train': 6.377339839935303} -11/06/2021 21:18:07 - INFO - __main__ - Step 169: {'lr': 4.2000000000000004e-05, 'samples': 32448, 'steps': 168, 'loss/train': 6.502751350402832} -11/06/2021 21:18:08 - INFO - __main__ - Step 170: {'lr': 4.2250000000000004e-05, 'samples': 32640, 'steps': 169, 'loss/train': 7.073266506195068} -11/06/2021 21:18:08 - INFO - __main__ - Step 171: {'lr': 4.25e-05, 'samples': 32832, 'steps': 170, 'loss/train': 6.543142318725586} -11/06/2021 21:18:08 - INFO - __main__ - Step 172: {'lr': 4.275e-05, 'samples': 33024, 'steps': 171, 'loss/train': 6.489956378936768} -11/06/2021 21:18:09 - INFO - __main__ - Step 173: {'lr': 4.2999999999999995e-05, 'samples': 33216, 'steps': 172, 'loss/train': 6.199307918548584} -11/06/2021 21:18:09 - INFO - __main__ - Step 174: {'lr': 4.325e-05, 'samples': 33408, 'steps': 173, 'loss/train': 6.356565475463867} -11/06/2021 21:18:10 - INFO - __main__ - Step 175: {'lr': 4.35e-05, 'samples': 33600, 'steps': 174, 'loss/train': 5.826794147491455} -11/06/2021 21:18:11 - INFO - __main__ - Step 176: {'lr': 4.375e-05, 'samples': 33792, 'steps': 175, 'loss/train': 7.043330192565918} -11/06/2021 21:18:11 - INFO - __main__ - Step 177: {'lr': 4.4e-05, 'samples': 33984, 'steps': 176, 'loss/train': 6.09688663482666} -11/06/2021 21:18:11 - INFO - __main__ - Step 178: {'lr': 4.425e-05, 'samples': 34176, 'steps': 177, 'loss/train': 6.213244915008545} -11/06/2021 21:18:12 - INFO - __main__ - Step 179: {'lr': 4.45e-05, 'samples': 34368, 'steps': 178, 'loss/train': 6.990470886230469} -11/06/2021 21:18:13 - INFO - __main__ - Step 180: {'lr': 4.475e-05, 'samples': 34560, 'steps': 179, 'loss/train': 6.256852149963379} -11/06/2021 21:18:13 - INFO - __main__ - Step 181: {'lr': 4.4999999999999996e-05, 'samples': 34752, 'steps': 180, 'loss/train': 7.177120685577393} -11/06/2021 21:18:13 - INFO - __main__ - Step 182: {'lr': 4.525e-05, 'samples': 34944, 'steps': 181, 'loss/train': 6.373216152191162} -11/06/2021 21:18:14 - INFO - __main__ - Step 183: {'lr': 4.55e-05, 'samples': 35136, 'steps': 182, 'loss/train': 7.0793328285217285} -11/06/2021 21:18:14 - INFO - __main__ - Step 184: {'lr': 4.575e-05, 'samples': 35328, 'steps': 183, 'loss/train': 6.392989158630371} -11/06/2021 21:18:15 - INFO - __main__ - Step 185: {'lr': 4.6e-05, 'samples': 35520, 'steps': 184, 'loss/train': 8.500471115112305} -11/06/2021 21:18:16 - INFO - __main__ - Step 186: {'lr': 4.625e-05, 'samples': 35712, 'steps': 185, 'loss/train': 6.313254356384277} -11/06/2021 21:18:16 - INFO - __main__ - Step 187: {'lr': 4.65e-05, 'samples': 35904, 'steps': 186, 'loss/train': 6.720587253570557} -11/06/2021 21:18:16 - INFO - __main__ - Step 188: {'lr': 4.675e-05, 'samples': 36096, 'steps': 187, 'loss/train': 5.526083469390869} -11/06/2021 21:18:17 - INFO - __main__ - Step 189: {'lr': 4.7000000000000004e-05, 'samples': 36288, 'steps': 188, 'loss/train': 5.93545389175415} -11/06/2021 21:18:17 - INFO - __main__ - Step 190: {'lr': 4.725e-05, 'samples': 36480, 'steps': 189, 'loss/train': 7.147458553314209} -11/06/2021 21:18:18 - INFO - __main__ - Step 191: {'lr': 4.75e-05, 'samples': 36672, 'steps': 190, 'loss/train': 6.479673385620117} -11/06/2021 21:18:18 - INFO - __main__ - Step 192: {'lr': 4.775e-05, 'samples': 36864, 'steps': 191, 'loss/train': 6.075639247894287} -11/06/2021 21:18:19 - INFO - __main__ - Step 193: {'lr': 4.8e-05, 'samples': 37056, 'steps': 192, 'loss/train': 6.69281005859375} -11/06/2021 21:18:19 - INFO - __main__ - Step 194: {'lr': 4.825e-05, 'samples': 37248, 'steps': 193, 'loss/train': 6.355683326721191} -11/06/2021 21:18:20 - INFO - __main__ - Step 195: {'lr': 4.85e-05, 'samples': 37440, 'steps': 194, 'loss/train': 6.180767059326172} -11/06/2021 21:18:20 - INFO - __main__ - Step 196: {'lr': 4.8750000000000006e-05, 'samples': 37632, 'steps': 195, 'loss/train': 5.40876579284668} -11/06/2021 21:18:21 - INFO - __main__ - Step 197: {'lr': 4.9000000000000005e-05, 'samples': 37824, 'steps': 196, 'loss/train': 7.284364700317383} -11/06/2021 21:18:21 - INFO - __main__ - Step 198: {'lr': 4.9250000000000004e-05, 'samples': 38016, 'steps': 197, 'loss/train': 6.532893180847168} -11/06/2021 21:18:22 - INFO - __main__ - Step 199: {'lr': 4.9500000000000004e-05, 'samples': 38208, 'steps': 198, 'loss/train': 6.542242527008057} -11/06/2021 21:18:22 - INFO - __main__ - Step 200: {'lr': 4.975e-05, 'samples': 38400, 'steps': 199, 'loss/train': 6.113000392913818} -11/06/2021 21:18:22 - INFO - __main__ - Step 201: {'lr': 5e-05, 'samples': 38592, 'steps': 200, 'loss/train': 6.284862995147705} -11/06/2021 21:18:23 - INFO - __main__ - Step 202: {'lr': 5.025e-05, 'samples': 38784, 'steps': 201, 'loss/train': 6.143826007843018} -11/06/2021 21:18:24 - INFO - __main__ - Step 203: {'lr': 5.05e-05, 'samples': 38976, 'steps': 202, 'loss/train': 6.595575332641602} -11/06/2021 21:18:24 - INFO - __main__ - Step 204: {'lr': 5.075000000000001e-05, 'samples': 39168, 'steps': 203, 'loss/train': 6.1036787033081055} -11/06/2021 21:18:24 - INFO - __main__ - Step 205: {'lr': 5.1e-05, 'samples': 39360, 'steps': 204, 'loss/train': 6.222804546356201} -11/06/2021 21:18:25 - INFO - __main__ - Step 206: {'lr': 5.125e-05, 'samples': 39552, 'steps': 205, 'loss/train': 5.817543029785156} -11/06/2021 21:18:26 - INFO - __main__ - Step 207: {'lr': 5.15e-05, 'samples': 39744, 'steps': 206, 'loss/train': 6.056823253631592} -11/06/2021 21:18:26 - INFO - __main__ - Step 208: {'lr': 5.175e-05, 'samples': 39936, 'steps': 207, 'loss/train': 6.261317729949951} -11/06/2021 21:18:27 - INFO - __main__ - Step 209: {'lr': 5.2e-05, 'samples': 40128, 'steps': 208, 'loss/train': 6.321830749511719} -11/06/2021 21:18:27 - INFO - __main__ - Step 210: {'lr': 5.2249999999999996e-05, 'samples': 40320, 'steps': 209, 'loss/train': 5.724458694458008} -11/06/2021 21:18:27 - INFO - __main__ - Step 211: {'lr': 5.25e-05, 'samples': 40512, 'steps': 210, 'loss/train': 6.434157371520996} -11/06/2021 21:18:28 - INFO - __main__ - Step 212: {'lr': 5.275e-05, 'samples': 40704, 'steps': 211, 'loss/train': 5.677988529205322} -11/06/2021 21:18:29 - INFO - __main__ - Step 213: {'lr': 5.3e-05, 'samples': 40896, 'steps': 212, 'loss/train': 5.744022846221924} -11/06/2021 21:18:29 - INFO - __main__ - Step 214: {'lr': 5.325e-05, 'samples': 41088, 'steps': 213, 'loss/train': 5.744656562805176} -11/06/2021 21:18:29 - INFO - __main__ - Step 215: {'lr': 5.35e-05, 'samples': 41280, 'steps': 214, 'loss/train': 5.984218597412109} -11/06/2021 21:18:30 - INFO - __main__ - Step 216: {'lr': 5.375e-05, 'samples': 41472, 'steps': 215, 'loss/train': 6.307746887207031} -11/06/2021 21:18:31 - INFO - __main__ - Step 217: {'lr': 5.4e-05, 'samples': 41664, 'steps': 216, 'loss/train': 6.040472030639648} -11/06/2021 21:18:31 - INFO - __main__ - Step 218: {'lr': 5.4250000000000004e-05, 'samples': 41856, 'steps': 217, 'loss/train': 6.029814720153809} -11/06/2021 21:18:31 - INFO - __main__ - Step 219: {'lr': 5.45e-05, 'samples': 42048, 'steps': 218, 'loss/train': 6.033048629760742} -11/06/2021 21:18:32 - INFO - __main__ - Step 220: {'lr': 5.475e-05, 'samples': 42240, 'steps': 219, 'loss/train': 5.9049153327941895} -11/06/2021 21:18:32 - INFO - __main__ - Step 221: {'lr': 5.5e-05, 'samples': 42432, 'steps': 220, 'loss/train': 6.097071170806885} -11/06/2021 21:18:33 - INFO - __main__ - Step 222: {'lr': 5.525e-05, 'samples': 42624, 'steps': 221, 'loss/train': 6.372702598571777} -11/06/2021 21:18:33 - INFO - __main__ - Step 223: {'lr': 5.55e-05, 'samples': 42816, 'steps': 222, 'loss/train': 7.301460266113281} -11/06/2021 21:18:34 - INFO - __main__ - Step 224: {'lr': 5.575e-05, 'samples': 43008, 'steps': 223, 'loss/train': 6.467023849487305} -11/06/2021 21:18:34 - INFO - __main__ - Step 225: {'lr': 5.6e-05, 'samples': 43200, 'steps': 224, 'loss/train': 6.188560962677002} -11/06/2021 21:18:34 - INFO - __main__ - Step 226: {'lr': 5.6250000000000005e-05, 'samples': 43392, 'steps': 225, 'loss/train': 5.94260311126709} -11/06/2021 21:18:36 - INFO - __main__ - Step 227: {'lr': 5.6500000000000005e-05, 'samples': 43584, 'steps': 226, 'loss/train': 5.925175189971924} -11/06/2021 21:18:36 - INFO - __main__ - Step 228: {'lr': 5.6750000000000004e-05, 'samples': 43776, 'steps': 227, 'loss/train': 5.587348937988281} -11/06/2021 21:18:36 - INFO - __main__ - Step 229: {'lr': 5.7e-05, 'samples': 43968, 'steps': 228, 'loss/train': 5.978050231933594} -11/06/2021 21:18:37 - INFO - __main__ - Step 230: {'lr': 5.725e-05, 'samples': 44160, 'steps': 229, 'loss/train': 5.728048324584961} -11/06/2021 21:18:37 - INFO - __main__ - Step 231: {'lr': 5.75e-05, 'samples': 44352, 'steps': 230, 'loss/train': 6.196109771728516} -11/06/2021 21:18:37 - INFO - __main__ - Step 232: {'lr': 5.775e-05, 'samples': 44544, 'steps': 231, 'loss/train': 6.567146301269531} -11/06/2021 21:18:38 - INFO - __main__ - Step 233: {'lr': 5.800000000000001e-05, 'samples': 44736, 'steps': 232, 'loss/train': 5.301417827606201} -11/06/2021 21:18:39 - INFO - __main__ - Step 234: {'lr': 5.8250000000000006e-05, 'samples': 44928, 'steps': 233, 'loss/train': 5.6201348304748535} -11/06/2021 21:18:39 - INFO - __main__ - Step 235: {'lr': 5.8500000000000006e-05, 'samples': 45120, 'steps': 234, 'loss/train': 5.957462787628174} -11/06/2021 21:18:39 - INFO - __main__ - Step 236: {'lr': 5.875e-05, 'samples': 45312, 'steps': 235, 'loss/train': 6.2582688331604} -11/06/2021 21:18:40 - INFO - __main__ - Step 237: {'lr': 5.9e-05, 'samples': 45504, 'steps': 236, 'loss/train': 5.807918071746826} -11/06/2021 21:18:41 - INFO - __main__ - Step 238: {'lr': 5.925e-05, 'samples': 45696, 'steps': 237, 'loss/train': 5.977503299713135} -11/06/2021 21:18:41 - INFO - __main__ - Step 239: {'lr': 5.9499999999999996e-05, 'samples': 45888, 'steps': 238, 'loss/train': 5.574709892272949} -11/06/2021 21:18:42 - INFO - __main__ - Step 240: {'lr': 5.9749999999999995e-05, 'samples': 46080, 'steps': 239, 'loss/train': 5.93025016784668} -11/06/2021 21:18:42 - INFO - __main__ - Step 241: {'lr': 6e-05, 'samples': 46272, 'steps': 240, 'loss/train': 5.585808277130127} -11/06/2021 21:18:42 - INFO - __main__ - Step 242: {'lr': 6.025e-05, 'samples': 46464, 'steps': 241, 'loss/train': 6.203149318695068} -11/06/2021 21:18:43 - INFO - __main__ - Step 243: {'lr': 6.05e-05, 'samples': 46656, 'steps': 242, 'loss/train': 4.716400623321533} -11/06/2021 21:18:44 - INFO - __main__ - Step 244: {'lr': 6.075e-05, 'samples': 46848, 'steps': 243, 'loss/train': 5.850978851318359} -11/06/2021 21:18:44 - INFO - __main__ - Step 245: {'lr': 6.1e-05, 'samples': 47040, 'steps': 244, 'loss/train': 5.889804840087891} -11/06/2021 21:18:44 - INFO - __main__ - Step 246: {'lr': 6.125e-05, 'samples': 47232, 'steps': 245, 'loss/train': 5.8663225173950195} -11/06/2021 21:18:45 - INFO - __main__ - Step 247: {'lr': 6.15e-05, 'samples': 47424, 'steps': 246, 'loss/train': 5.8062334060668945} -11/06/2021 21:18:45 - INFO - __main__ - Step 248: {'lr': 6.175e-05, 'samples': 47616, 'steps': 247, 'loss/train': 5.754123210906982} -11/06/2021 21:18:46 - INFO - __main__ - Step 249: {'lr': 6.2e-05, 'samples': 47808, 'steps': 248, 'loss/train': 5.87885856628418} -11/06/2021 21:18:47 - INFO - __main__ - Step 250: {'lr': 6.225e-05, 'samples': 48000, 'steps': 249, 'loss/train': 5.715115070343018} -11/06/2021 21:18:47 - INFO - __main__ - Step 251: {'lr': 6.25e-05, 'samples': 48192, 'steps': 250, 'loss/train': 5.726807594299316} -11/06/2021 21:18:47 - INFO - __main__ - Step 252: {'lr': 6.275000000000001e-05, 'samples': 48384, 'steps': 251, 'loss/train': 5.94719934463501} -11/06/2021 21:18:48 - INFO - __main__ - Step 253: {'lr': 6.3e-05, 'samples': 48576, 'steps': 252, 'loss/train': 5.911177158355713} -11/06/2021 21:18:49 - INFO - __main__ - Step 254: {'lr': 6.325e-05, 'samples': 48768, 'steps': 253, 'loss/train': 5.7925004959106445} -11/06/2021 21:18:49 - INFO - __main__ - Step 255: {'lr': 6.35e-05, 'samples': 48960, 'steps': 254, 'loss/train': 5.541946887969971} -11/06/2021 21:18:50 - INFO - __main__ - Step 256: {'lr': 6.375e-05, 'samples': 49152, 'steps': 255, 'loss/train': 5.5716233253479} -11/06/2021 21:18:50 - INFO - __main__ - Step 257: {'lr': 6.4e-05, 'samples': 49344, 'steps': 256, 'loss/train': 6.297529697418213} -11/06/2021 21:18:50 - INFO - __main__ - Step 258: {'lr': 6.425e-05, 'samples': 49536, 'steps': 257, 'loss/train': 4.350067138671875} -11/06/2021 21:18:51 - INFO - __main__ - Step 259: {'lr': 6.450000000000001e-05, 'samples': 49728, 'steps': 258, 'loss/train': 5.1816887855529785} -11/06/2021 21:18:52 - INFO - __main__ - Step 260: {'lr': 6.475e-05, 'samples': 49920, 'steps': 259, 'loss/train': 3.9729881286621094} -11/06/2021 21:18:52 - INFO - __main__ - Step 261: {'lr': 6.500000000000001e-05, 'samples': 50112, 'steps': 260, 'loss/train': 5.403891563415527} -11/06/2021 21:18:52 - INFO - __main__ - Step 262: {'lr': 6.525e-05, 'samples': 50304, 'steps': 261, 'loss/train': 6.115725517272949} -11/06/2021 21:18:53 - INFO - __main__ - Step 263: {'lr': 6.55e-05, 'samples': 50496, 'steps': 262, 'loss/train': 6.0679426193237305} -11/06/2021 21:18:53 - INFO - __main__ - Step 264: {'lr': 6.575e-05, 'samples': 50688, 'steps': 263, 'loss/train': 5.964505195617676} -11/06/2021 21:18:54 - INFO - __main__ - Step 265: {'lr': 6.6e-05, 'samples': 50880, 'steps': 264, 'loss/train': 5.48927640914917} -11/06/2021 21:18:55 - INFO - __main__ - Step 266: {'lr': 6.625000000000001e-05, 'samples': 51072, 'steps': 265, 'loss/train': 6.112322807312012} -11/06/2021 21:18:55 - INFO - __main__ - Step 267: {'lr': 6.65e-05, 'samples': 51264, 'steps': 266, 'loss/train': 6.019900798797607} -11/06/2021 21:18:55 - INFO - __main__ - Step 268: {'lr': 6.675000000000001e-05, 'samples': 51456, 'steps': 267, 'loss/train': 6.1478657722473145} -11/06/2021 21:18:56 - INFO - __main__ - Step 269: {'lr': 6.7e-05, 'samples': 51648, 'steps': 268, 'loss/train': 5.52264404296875} -11/06/2021 21:18:57 - INFO - __main__ - Step 270: {'lr': 6.725000000000001e-05, 'samples': 51840, 'steps': 269, 'loss/train': 5.913082599639893} -11/06/2021 21:18:57 - INFO - __main__ - Step 271: {'lr': 6.75e-05, 'samples': 52032, 'steps': 270, 'loss/train': 5.843954086303711} -11/06/2021 21:18:57 - INFO - __main__ - Step 272: {'lr': 6.775000000000001e-05, 'samples': 52224, 'steps': 271, 'loss/train': 5.43068790435791} -11/06/2021 21:18:58 - INFO - __main__ - Step 273: {'lr': 6.800000000000001e-05, 'samples': 52416, 'steps': 272, 'loss/train': 5.731388568878174} -11/06/2021 21:18:58 - INFO - __main__ - Step 274: {'lr': 6.825e-05, 'samples': 52608, 'steps': 273, 'loss/train': 6.002760887145996} -11/06/2021 21:18:59 - INFO - __main__ - Step 275: {'lr': 6.850000000000001e-05, 'samples': 52800, 'steps': 274, 'loss/train': 5.909034729003906} -11/06/2021 21:18:59 - INFO - __main__ - Step 276: {'lr': 6.875e-05, 'samples': 52992, 'steps': 275, 'loss/train': 5.980253219604492} -11/06/2021 21:19:00 - INFO - __main__ - Step 277: {'lr': 6.900000000000001e-05, 'samples': 53184, 'steps': 276, 'loss/train': 5.36932373046875} -11/06/2021 21:19:00 - INFO - __main__ - Step 278: {'lr': 6.925e-05, 'samples': 53376, 'steps': 277, 'loss/train': 5.7302045822143555} -11/06/2021 21:19:00 - INFO - __main__ - Step 279: {'lr': 6.950000000000001e-05, 'samples': 53568, 'steps': 278, 'loss/train': 5.460746765136719} -11/06/2021 21:19:01 - INFO - __main__ - Step 280: {'lr': 6.975e-05, 'samples': 53760, 'steps': 279, 'loss/train': 5.948640823364258} -11/06/2021 21:19:02 - INFO - __main__ - Step 281: {'lr': 7.000000000000001e-05, 'samples': 53952, 'steps': 280, 'loss/train': 5.746571063995361} -11/06/2021 21:19:02 - INFO - __main__ - Step 282: {'lr': 7.025000000000001e-05, 'samples': 54144, 'steps': 281, 'loss/train': 6.098116874694824} -11/06/2021 21:19:03 - INFO - __main__ - Step 283: {'lr': 7.049999999999999e-05, 'samples': 54336, 'steps': 282, 'loss/train': 5.805056571960449} -11/06/2021 21:19:03 - INFO - __main__ - Step 284: {'lr': 7.075e-05, 'samples': 54528, 'steps': 283, 'loss/train': 5.200248718261719} -11/06/2021 21:19:04 - INFO - __main__ - Step 285: {'lr': 7.099999999999999e-05, 'samples': 54720, 'steps': 284, 'loss/train': 6.579744815826416} -11/06/2021 21:19:04 - INFO - __main__ - Step 286: {'lr': 7.125e-05, 'samples': 54912, 'steps': 285, 'loss/train': 5.594106197357178} -11/06/2021 21:19:05 - INFO - __main__ - Step 287: {'lr': 7.149999999999999e-05, 'samples': 55104, 'steps': 286, 'loss/train': 6.083644390106201} -11/06/2021 21:19:05 - INFO - __main__ - Step 288: {'lr': 7.175e-05, 'samples': 55296, 'steps': 287, 'loss/train': 5.514430999755859} -11/06/2021 21:19:05 - INFO - __main__ - Step 289: {'lr': 7.2e-05, 'samples': 55488, 'steps': 288, 'loss/train': 5.3459954261779785} -11/06/2021 21:19:06 - INFO - __main__ - Step 290: {'lr': 7.225e-05, 'samples': 55680, 'steps': 289, 'loss/train': 6.18521785736084} -11/06/2021 21:19:07 - INFO - __main__ - Step 291: {'lr': 7.25e-05, 'samples': 55872, 'steps': 290, 'loss/train': 6.124849319458008} -11/06/2021 21:19:07 - INFO - __main__ - Step 292: {'lr': 7.274999999999999e-05, 'samples': 56064, 'steps': 291, 'loss/train': 5.46663761138916} -11/06/2021 21:19:07 - INFO - __main__ - Step 293: {'lr': 7.3e-05, 'samples': 56256, 'steps': 292, 'loss/train': 5.0395188331604} -11/06/2021 21:19:08 - INFO - __main__ - Step 294: {'lr': 7.324999999999999e-05, 'samples': 56448, 'steps': 293, 'loss/train': 5.422224998474121} -11/06/2021 21:19:08 - INFO - __main__ - Step 295: {'lr': 7.35e-05, 'samples': 56640, 'steps': 294, 'loss/train': 5.153810024261475} -11/06/2021 21:19:09 - INFO - __main__ - Step 296: {'lr': 7.375e-05, 'samples': 56832, 'steps': 295, 'loss/train': 5.397673606872559} -11/06/2021 21:19:10 - INFO - __main__ - Step 297: {'lr': 7.4e-05, 'samples': 57024, 'steps': 296, 'loss/train': 5.323544979095459} -11/06/2021 21:19:10 - INFO - __main__ - Step 298: {'lr': 7.425e-05, 'samples': 57216, 'steps': 297, 'loss/train': 5.2873454093933105} -11/06/2021 21:19:10 - INFO - __main__ - Step 299: {'lr': 7.45e-05, 'samples': 57408, 'steps': 298, 'loss/train': 5.626234531402588} -11/06/2021 21:19:11 - INFO - __main__ - Step 300: {'lr': 7.475e-05, 'samples': 57600, 'steps': 299, 'loss/train': 5.648954391479492} -11/06/2021 21:19:12 - INFO - __main__ - Step 301: {'lr': 7.5e-05, 'samples': 57792, 'steps': 300, 'loss/train': 6.47790002822876} -11/06/2021 21:19:12 - INFO - __main__ - Step 302: {'lr': 7.525e-05, 'samples': 57984, 'steps': 301, 'loss/train': 5.377347469329834} -11/06/2021 21:19:12 - INFO - __main__ - Step 303: {'lr': 7.55e-05, 'samples': 58176, 'steps': 302, 'loss/train': 5.396330833435059} -11/06/2021 21:19:13 - INFO - __main__ - Step 304: {'lr': 7.575e-05, 'samples': 58368, 'steps': 303, 'loss/train': 6.444887161254883} -11/06/2021 21:19:13 - INFO - __main__ - Step 305: {'lr': 7.6e-05, 'samples': 58560, 'steps': 304, 'loss/train': 5.51333475112915} -11/06/2021 21:19:14 - INFO - __main__ - Step 306: {'lr': 7.625e-05, 'samples': 58752, 'steps': 305, 'loss/train': 5.4495744705200195} -11/06/2021 21:19:15 - INFO - __main__ - Step 307: {'lr': 7.65e-05, 'samples': 58944, 'steps': 306, 'loss/train': 5.420361518859863} -11/06/2021 21:19:15 - INFO - __main__ - Step 308: {'lr': 7.675e-05, 'samples': 59136, 'steps': 307, 'loss/train': 5.876494407653809} -11/06/2021 21:19:15 - INFO - __main__ - Step 309: {'lr': 7.7e-05, 'samples': 59328, 'steps': 308, 'loss/train': 5.0450520515441895} -11/06/2021 21:19:16 - INFO - __main__ - Step 310: {'lr': 7.725000000000001e-05, 'samples': 59520, 'steps': 309, 'loss/train': 5.425472736358643} -11/06/2021 21:19:17 - INFO - __main__ - Step 311: {'lr': 7.75e-05, 'samples': 59712, 'steps': 310, 'loss/train': 5.596251010894775} -11/06/2021 21:19:17 - INFO - __main__ - Step 312: {'lr': 7.775e-05, 'samples': 59904, 'steps': 311, 'loss/train': 5.2670392990112305} -11/06/2021 21:19:17 - INFO - __main__ - Step 313: {'lr': 7.8e-05, 'samples': 60096, 'steps': 312, 'loss/train': 7.779051780700684} -11/06/2021 21:19:18 - INFO - __main__ - Step 314: {'lr': 7.825e-05, 'samples': 60288, 'steps': 313, 'loss/train': 5.498117923736572} -11/06/2021 21:19:18 - INFO - __main__ - Step 315: {'lr': 7.85e-05, 'samples': 60480, 'steps': 314, 'loss/train': 5.533538341522217} -11/06/2021 21:19:19 - INFO - __main__ - Step 316: {'lr': 7.875e-05, 'samples': 60672, 'steps': 315, 'loss/train': 5.794958591461182} -11/06/2021 21:19:19 - INFO - __main__ - Step 317: {'lr': 7.9e-05, 'samples': 60864, 'steps': 316, 'loss/train': 5.267005443572998} -11/06/2021 21:19:20 - INFO - __main__ - Step 318: {'lr': 7.925e-05, 'samples': 61056, 'steps': 317, 'loss/train': 5.625141143798828} -11/06/2021 21:19:20 - INFO - __main__ - Step 319: {'lr': 7.950000000000001e-05, 'samples': 61248, 'steps': 318, 'loss/train': 5.229969024658203} -11/06/2021 21:19:21 - INFO - __main__ - Step 320: {'lr': 7.975e-05, 'samples': 61440, 'steps': 319, 'loss/train': 5.5839314460754395} -11/06/2021 21:19:21 - INFO - __main__ - Step 321: {'lr': 8e-05, 'samples': 61632, 'steps': 320, 'loss/train': 5.807913303375244} -11/06/2021 21:19:22 - INFO - __main__ - Step 322: {'lr': 8.025e-05, 'samples': 61824, 'steps': 321, 'loss/train': 5.966512203216553} -11/06/2021 21:19:22 - INFO - __main__ - Step 323: {'lr': 8.05e-05, 'samples': 62016, 'steps': 322, 'loss/train': 5.348308563232422} -11/06/2021 21:19:23 - INFO - __main__ - Step 324: {'lr': 8.075e-05, 'samples': 62208, 'steps': 323, 'loss/train': 5.878225326538086} -11/06/2021 21:19:23 - INFO - __main__ - Step 325: {'lr': 8.1e-05, 'samples': 62400, 'steps': 324, 'loss/train': 5.854434013366699} -11/06/2021 21:19:23 - INFO - __main__ - Step 326: {'lr': 8.125000000000001e-05, 'samples': 62592, 'steps': 325, 'loss/train': 5.428937911987305} -11/06/2021 21:19:24 - INFO - __main__ - Step 327: {'lr': 8.15e-05, 'samples': 62784, 'steps': 326, 'loss/train': 5.665132522583008} -11/06/2021 21:19:25 - INFO - __main__ - Step 328: {'lr': 8.175000000000001e-05, 'samples': 62976, 'steps': 327, 'loss/train': 5.691938400268555} -11/06/2021 21:19:25 - INFO - __main__ - Step 329: {'lr': 8.2e-05, 'samples': 63168, 'steps': 328, 'loss/train': 6.869819641113281} -11/06/2021 21:19:26 - INFO - __main__ - Step 330: {'lr': 8.225000000000001e-05, 'samples': 63360, 'steps': 329, 'loss/train': 4.917605876922607} -11/06/2021 21:19:26 - INFO - __main__ - Step 331: {'lr': 8.25e-05, 'samples': 63552, 'steps': 330, 'loss/train': 5.495372295379639} -11/06/2021 21:19:27 - INFO - __main__ - Step 332: {'lr': 8.275e-05, 'samples': 63744, 'steps': 331, 'loss/train': 5.180616855621338} -11/06/2021 21:19:27 - INFO - __main__ - Step 333: {'lr': 8.300000000000001e-05, 'samples': 63936, 'steps': 332, 'loss/train': 5.5182318687438965} -11/06/2021 21:19:28 - INFO - __main__ - Step 334: {'lr': 8.325e-05, 'samples': 64128, 'steps': 333, 'loss/train': 5.079967975616455} -11/06/2021 21:19:28 - INFO - __main__ - Step 335: {'lr': 8.350000000000001e-05, 'samples': 64320, 'steps': 334, 'loss/train': 5.6893181800842285} -11/06/2021 21:19:28 - INFO - __main__ - Step 336: {'lr': 8.375e-05, 'samples': 64512, 'steps': 335, 'loss/train': 5.519853115081787} -11/06/2021 21:19:29 - INFO - __main__ - Step 337: {'lr': 8.400000000000001e-05, 'samples': 64704, 'steps': 336, 'loss/train': 5.515233516693115} -11/06/2021 21:19:30 - INFO - __main__ - Step 338: {'lr': 8.425e-05, 'samples': 64896, 'steps': 337, 'loss/train': 4.627192974090576} -11/06/2021 21:19:30 - INFO - __main__ - Step 339: {'lr': 8.450000000000001e-05, 'samples': 65088, 'steps': 338, 'loss/train': 5.647910118103027} -11/06/2021 21:19:30 - INFO - __main__ - Step 340: {'lr': 8.475000000000001e-05, 'samples': 65280, 'steps': 339, 'loss/train': 5.477786540985107} -11/06/2021 21:19:31 - INFO - __main__ - Step 341: {'lr': 8.5e-05, 'samples': 65472, 'steps': 340, 'loss/train': 5.654776573181152} -11/06/2021 21:19:32 - INFO - __main__ - Step 342: {'lr': 8.525000000000001e-05, 'samples': 65664, 'steps': 341, 'loss/train': 5.568868637084961} -11/06/2021 21:19:32 - INFO - __main__ - Step 343: {'lr': 8.55e-05, 'samples': 65856, 'steps': 342, 'loss/train': 3.5874297618865967} -11/06/2021 21:19:33 - INFO - __main__ - Step 344: {'lr': 8.575000000000001e-05, 'samples': 66048, 'steps': 343, 'loss/train': 5.646244525909424} -11/06/2021 21:19:33 - INFO - __main__ - Step 345: {'lr': 8.599999999999999e-05, 'samples': 66240, 'steps': 344, 'loss/train': 5.599254131317139} -11/06/2021 21:19:33 - INFO - __main__ - Step 346: {'lr': 8.625e-05, 'samples': 66432, 'steps': 345, 'loss/train': 5.349778652191162} -11/06/2021 21:19:34 - INFO - __main__ - Step 347: {'lr': 8.65e-05, 'samples': 66624, 'steps': 346, 'loss/train': 5.612128257751465} -11/06/2021 21:19:35 - INFO - __main__ - Step 348: {'lr': 8.675e-05, 'samples': 66816, 'steps': 347, 'loss/train': 5.6107988357543945} -11/06/2021 21:19:35 - INFO - __main__ - Step 349: {'lr': 8.7e-05, 'samples': 67008, 'steps': 348, 'loss/train': 5.735456943511963} -11/06/2021 21:19:35 - INFO - __main__ - Step 350: {'lr': 8.724999999999999e-05, 'samples': 67200, 'steps': 349, 'loss/train': 5.3645172119140625} -11/06/2021 21:19:36 - INFO - __main__ - Step 351: {'lr': 8.75e-05, 'samples': 67392, 'steps': 350, 'loss/train': 5.467144966125488} -11/06/2021 21:19:36 - INFO - __main__ - Step 352: {'lr': 8.774999999999999e-05, 'samples': 67584, 'steps': 351, 'loss/train': 6.211921215057373} -11/06/2021 21:19:37 - INFO - __main__ - Step 353: {'lr': 8.8e-05, 'samples': 67776, 'steps': 352, 'loss/train': 5.452548980712891} -11/06/2021 21:19:37 - INFO - __main__ - Step 354: {'lr': 8.824999999999999e-05, 'samples': 67968, 'steps': 353, 'loss/train': 5.824997901916504} -11/06/2021 21:19:38 - INFO - __main__ - Step 355: {'lr': 8.85e-05, 'samples': 68160, 'steps': 354, 'loss/train': 5.646512985229492} -11/06/2021 21:19:38 - INFO - __main__ - Step 356: {'lr': 8.875e-05, 'samples': 68352, 'steps': 355, 'loss/train': 5.443009853363037} -11/06/2021 21:19:39 - INFO - __main__ - Step 357: {'lr': 8.9e-05, 'samples': 68544, 'steps': 356, 'loss/train': 5.597517490386963} -11/06/2021 21:19:40 - INFO - __main__ - Step 358: {'lr': 8.925e-05, 'samples': 68736, 'steps': 357, 'loss/train': 5.510553359985352} -11/06/2021 21:19:40 - INFO - __main__ - Step 359: {'lr': 8.95e-05, 'samples': 68928, 'steps': 358, 'loss/train': 5.271029949188232} -11/06/2021 21:19:40 - INFO - __main__ - Step 360: {'lr': 8.975e-05, 'samples': 69120, 'steps': 359, 'loss/train': 5.6077141761779785} -11/06/2021 21:19:41 - INFO - __main__ - Step 361: {'lr': 8.999999999999999e-05, 'samples': 69312, 'steps': 360, 'loss/train': 7.289037227630615} -11/06/2021 21:19:41 - INFO - __main__ - Step 362: {'lr': 9.025e-05, 'samples': 69504, 'steps': 361, 'loss/train': 5.1300740242004395} -11/06/2021 21:19:42 - INFO - __main__ - Step 363: {'lr': 9.05e-05, 'samples': 69696, 'steps': 362, 'loss/train': 5.349740982055664} -11/06/2021 21:19:42 - INFO - __main__ - Step 364: {'lr': 9.075e-05, 'samples': 69888, 'steps': 363, 'loss/train': 5.435561656951904} -11/06/2021 21:19:43 - INFO - __main__ - Step 365: {'lr': 9.1e-05, 'samples': 70080, 'steps': 364, 'loss/train': 5.4572978019714355} -11/06/2021 21:19:43 - INFO - __main__ - Step 366: {'lr': 9.125e-05, 'samples': 70272, 'steps': 365, 'loss/train': 5.351955890655518} -11/06/2021 21:19:43 - INFO - __main__ - Step 367: {'lr': 9.15e-05, 'samples': 70464, 'steps': 366, 'loss/train': 5.565761089324951} -11/06/2021 21:19:44 - INFO - __main__ - Step 368: {'lr': 9.175e-05, 'samples': 70656, 'steps': 367, 'loss/train': 5.959819316864014} -11/06/2021 21:19:45 - INFO - __main__ - Step 369: {'lr': 9.2e-05, 'samples': 70848, 'steps': 368, 'loss/train': 5.474288463592529} -11/06/2021 21:19:45 - INFO - __main__ - Step 370: {'lr': 9.225e-05, 'samples': 71040, 'steps': 369, 'loss/train': 5.607541561126709} -11/06/2021 21:19:46 - INFO - __main__ - Step 371: {'lr': 9.25e-05, 'samples': 71232, 'steps': 370, 'loss/train': 5.084637641906738} -11/06/2021 21:19:46 - INFO - __main__ - Step 372: {'lr': 9.275e-05, 'samples': 71424, 'steps': 371, 'loss/train': 4.969635009765625} -11/06/2021 21:19:46 - INFO - __main__ - Step 373: {'lr': 9.3e-05, 'samples': 71616, 'steps': 372, 'loss/train': 5.273648262023926} -11/06/2021 21:19:47 - INFO - __main__ - Step 374: {'lr': 9.325e-05, 'samples': 71808, 'steps': 373, 'loss/train': 5.385776042938232} -11/06/2021 21:19:48 - INFO - __main__ - Step 375: {'lr': 9.35e-05, 'samples': 72000, 'steps': 374, 'loss/train': 4.57074499130249} -11/06/2021 21:19:48 - INFO - __main__ - Step 376: {'lr': 9.375e-05, 'samples': 72192, 'steps': 375, 'loss/train': 5.399175643920898} -11/06/2021 21:19:48 - INFO - __main__ - Step 377: {'lr': 9.400000000000001e-05, 'samples': 72384, 'steps': 376, 'loss/train': 5.5180864334106445} -11/06/2021 21:19:49 - INFO - __main__ - Step 378: {'lr': 9.425e-05, 'samples': 72576, 'steps': 377, 'loss/train': 5.192264556884766} -11/06/2021 21:19:50 - INFO - __main__ - Step 379: {'lr': 9.45e-05, 'samples': 72768, 'steps': 378, 'loss/train': 5.126402854919434} -11/06/2021 21:19:50 - INFO - __main__ - Step 380: {'lr': 9.475e-05, 'samples': 72960, 'steps': 379, 'loss/train': 5.3973708152771} -11/06/2021 21:19:50 - INFO - __main__ - Step 381: {'lr': 9.5e-05, 'samples': 73152, 'steps': 380, 'loss/train': 5.583156585693359} -11/06/2021 21:19:51 - INFO - __main__ - Step 382: {'lr': 9.525e-05, 'samples': 73344, 'steps': 381, 'loss/train': 5.458894729614258} -11/06/2021 21:19:51 - INFO - __main__ - Step 383: {'lr': 9.55e-05, 'samples': 73536, 'steps': 382, 'loss/train': 5.020319938659668} -11/06/2021 21:19:52 - INFO - __main__ - Step 384: {'lr': 9.575000000000001e-05, 'samples': 73728, 'steps': 383, 'loss/train': 5.400721073150635} -11/06/2021 21:19:53 - INFO - __main__ - Step 385: {'lr': 9.6e-05, 'samples': 73920, 'steps': 384, 'loss/train': 5.1949381828308105} -11/06/2021 21:19:53 - INFO - __main__ - Step 386: {'lr': 9.625000000000001e-05, 'samples': 74112, 'steps': 385, 'loss/train': 5.291417121887207} -11/06/2021 21:19:53 - INFO - __main__ - Step 387: {'lr': 9.65e-05, 'samples': 74304, 'steps': 386, 'loss/train': 6.089571475982666} -11/06/2021 21:19:54 - INFO - __main__ - Step 388: {'lr': 9.675000000000001e-05, 'samples': 74496, 'steps': 387, 'loss/train': 5.51926326751709} -11/06/2021 21:19:55 - INFO - __main__ - Step 389: {'lr': 9.7e-05, 'samples': 74688, 'steps': 388, 'loss/train': 5.781015396118164} -11/06/2021 21:19:55 - INFO - __main__ - Step 390: {'lr': 9.725e-05, 'samples': 74880, 'steps': 389, 'loss/train': 4.908177852630615} -11/06/2021 21:19:55 - INFO - __main__ - Step 391: {'lr': 9.750000000000001e-05, 'samples': 75072, 'steps': 390, 'loss/train': 5.012897968292236} -11/06/2021 21:19:56 - INFO - __main__ - Step 392: {'lr': 9.775e-05, 'samples': 75264, 'steps': 391, 'loss/train': 5.399777889251709} -11/06/2021 21:19:56 - INFO - __main__ - Step 393: {'lr': 9.800000000000001e-05, 'samples': 75456, 'steps': 392, 'loss/train': 5.350080966949463} -11/06/2021 21:19:57 - INFO - __main__ - Step 394: {'lr': 9.825e-05, 'samples': 75648, 'steps': 393, 'loss/train': 5.737140655517578} -11/06/2021 21:19:57 - INFO - __main__ - Step 395: {'lr': 9.850000000000001e-05, 'samples': 75840, 'steps': 394, 'loss/train': 5.23768949508667} -11/06/2021 21:19:58 - INFO - __main__ - Step 396: {'lr': 9.875e-05, 'samples': 76032, 'steps': 395, 'loss/train': 5.202757358551025} -11/06/2021 21:19:58 - INFO - __main__ - Step 397: {'lr': 9.900000000000001e-05, 'samples': 76224, 'steps': 396, 'loss/train': 5.724830150604248} -11/06/2021 21:19:59 - INFO - __main__ - Step 398: {'lr': 9.925000000000001e-05, 'samples': 76416, 'steps': 397, 'loss/train': 6.981353282928467} -11/06/2021 21:19:59 - INFO - __main__ - Step 399: {'lr': 9.95e-05, 'samples': 76608, 'steps': 398, 'loss/train': 7.47460412979126} -11/06/2021 21:20:00 - INFO - __main__ - Step 400: {'lr': 9.975000000000001e-05, 'samples': 76800, 'steps': 399, 'loss/train': 5.741088390350342} -11/06/2021 21:20:00 - INFO - __main__ - Step 401: {'lr': 0.0001, 'samples': 76992, 'steps': 400, 'loss/train': 5.029991626739502} -11/06/2021 21:20:01 - INFO - __main__ - Step 402: {'lr': 0.00010025000000000001, 'samples': 77184, 'steps': 401, 'loss/train': 5.318662166595459} -11/06/2021 21:20:01 - INFO - __main__ - Step 403: {'lr': 0.0001005, 'samples': 77376, 'steps': 402, 'loss/train': 5.997198104858398} -11/06/2021 21:20:01 - INFO - __main__ - Step 404: {'lr': 0.00010075000000000001, 'samples': 77568, 'steps': 403, 'loss/train': 6.158583641052246} -11/06/2021 21:20:02 - INFO - __main__ - Step 405: {'lr': 0.000101, 'samples': 77760, 'steps': 404, 'loss/train': 5.336831569671631} -11/06/2021 21:20:03 - INFO - __main__ - Step 406: {'lr': 0.00010125000000000001, 'samples': 77952, 'steps': 405, 'loss/train': 5.227279186248779} -11/06/2021 21:20:03 - INFO - __main__ - Step 407: {'lr': 0.00010150000000000001, 'samples': 78144, 'steps': 406, 'loss/train': 5.527342319488525} -11/06/2021 21:20:03 - INFO - __main__ - Step 408: {'lr': 0.00010174999999999999, 'samples': 78336, 'steps': 407, 'loss/train': 5.73346471786499} -11/06/2021 21:20:04 - INFO - __main__ - Step 409: {'lr': 0.000102, 'samples': 78528, 'steps': 408, 'loss/train': 6.215020179748535} -11/06/2021 21:20:05 - INFO - __main__ - Step 410: {'lr': 0.00010224999999999999, 'samples': 78720, 'steps': 409, 'loss/train': 5.491655349731445} -11/06/2021 21:20:05 - INFO - __main__ - Step 411: {'lr': 0.0001025, 'samples': 78912, 'steps': 410, 'loss/train': 4.847282886505127} -11/06/2021 21:20:05 - INFO - __main__ - Step 412: {'lr': 0.00010274999999999999, 'samples': 79104, 'steps': 411, 'loss/train': 5.18861198425293} -11/06/2021 21:20:06 - INFO - __main__ - Step 413: {'lr': 0.000103, 'samples': 79296, 'steps': 412, 'loss/train': 5.54094934463501} -11/06/2021 21:20:06 - INFO - __main__ - Step 414: {'lr': 0.00010325, 'samples': 79488, 'steps': 413, 'loss/train': 5.201007843017578} -11/06/2021 21:20:07 - INFO - __main__ - Step 415: {'lr': 0.0001035, 'samples': 79680, 'steps': 414, 'loss/train': 5.937044143676758} -11/06/2021 21:20:08 - INFO - __main__ - Step 416: {'lr': 0.00010375, 'samples': 79872, 'steps': 415, 'loss/train': 5.265571117401123} -11/06/2021 21:20:08 - INFO - __main__ - Step 417: {'lr': 0.000104, 'samples': 80064, 'steps': 416, 'loss/train': 4.91490364074707} -11/06/2021 21:20:08 - INFO - __main__ - Step 418: {'lr': 0.00010425, 'samples': 80256, 'steps': 417, 'loss/train': 5.490600109100342} -11/06/2021 21:20:09 - INFO - __main__ - Step 419: {'lr': 0.00010449999999999999, 'samples': 80448, 'steps': 418, 'loss/train': 4.848526954650879} -11/06/2021 21:20:10 - INFO - __main__ - Step 420: {'lr': 0.00010475, 'samples': 80640, 'steps': 419, 'loss/train': 5.088794231414795} -11/06/2021 21:20:10 - INFO - __main__ - Step 421: {'lr': 0.000105, 'samples': 80832, 'steps': 420, 'loss/train': 5.438802719116211} -11/06/2021 21:20:10 - INFO - __main__ - Step 422: {'lr': 0.00010525, 'samples': 81024, 'steps': 421, 'loss/train': 5.321382522583008} -11/06/2021 21:20:11 - INFO - __main__ - Step 423: {'lr': 0.0001055, 'samples': 81216, 'steps': 422, 'loss/train': 5.291647434234619} -11/06/2021 21:20:11 - INFO - __main__ - Step 424: {'lr': 0.00010575, 'samples': 81408, 'steps': 423, 'loss/train': 4.753524303436279} -11/06/2021 21:20:11 - INFO - __main__ - Step 425: {'lr': 0.000106, 'samples': 81600, 'steps': 424, 'loss/train': 5.298032760620117} -11/06/2021 21:20:13 - INFO - __main__ - Step 426: {'lr': 0.00010625, 'samples': 81792, 'steps': 425, 'loss/train': 6.007701873779297} -11/06/2021 21:20:13 - INFO - __main__ - Step 427: {'lr': 0.0001065, 'samples': 81984, 'steps': 426, 'loss/train': 5.437173366546631} -11/06/2021 21:20:13 - INFO - __main__ - Step 428: {'lr': 0.00010675, 'samples': 82176, 'steps': 427, 'loss/train': 5.345945358276367} -11/06/2021 21:20:14 - INFO - __main__ - Step 429: {'lr': 0.000107, 'samples': 82368, 'steps': 428, 'loss/train': 5.066455841064453} -11/06/2021 21:20:14 - INFO - __main__ - Step 430: {'lr': 0.00010725, 'samples': 82560, 'steps': 429, 'loss/train': 3.3696258068084717} -11/06/2021 21:20:15 - INFO - __main__ - Step 431: {'lr': 0.0001075, 'samples': 82752, 'steps': 430, 'loss/train': 4.334190845489502} -11/06/2021 21:20:15 - INFO - __main__ - Step 432: {'lr': 0.00010775, 'samples': 82944, 'steps': 431, 'loss/train': 5.169923305511475} -11/06/2021 21:20:16 - INFO - __main__ - Step 433: {'lr': 0.000108, 'samples': 83136, 'steps': 432, 'loss/train': 5.3268537521362305} -11/06/2021 21:20:16 - INFO - __main__ - Step 434: {'lr': 0.00010825, 'samples': 83328, 'steps': 433, 'loss/train': 5.3919854164123535} -11/06/2021 21:20:16 - INFO - __main__ - Step 435: {'lr': 0.00010850000000000001, 'samples': 83520, 'steps': 434, 'loss/train': 5.3725810050964355} -11/06/2021 21:20:17 - INFO - __main__ - Step 436: {'lr': 0.00010875, 'samples': 83712, 'steps': 435, 'loss/train': 5.403895854949951} -11/06/2021 21:20:18 - INFO - __main__ - Step 437: {'lr': 0.000109, 'samples': 83904, 'steps': 436, 'loss/train': 5.205580711364746} -11/06/2021 21:20:18 - INFO - __main__ - Step 438: {'lr': 0.00010925, 'samples': 84096, 'steps': 437, 'loss/train': 5.33302640914917} -11/06/2021 21:20:18 - INFO - __main__ - Step 439: {'lr': 0.0001095, 'samples': 84288, 'steps': 438, 'loss/train': 5.41857385635376} -11/06/2021 21:20:19 - INFO - __main__ - Step 440: {'lr': 0.00010975, 'samples': 84480, 'steps': 439, 'loss/train': 5.0854315757751465} -11/06/2021 21:20:20 - INFO - __main__ - Step 441: {'lr': 0.00011, 'samples': 84672, 'steps': 440, 'loss/train': 4.953428745269775} -11/06/2021 21:20:21 - INFO - __main__ - Step 442: {'lr': 0.00011025, 'samples': 84864, 'steps': 441, 'loss/train': 5.355175495147705} -11/06/2021 21:20:21 - INFO - __main__ - Step 443: {'lr': 0.0001105, 'samples': 85056, 'steps': 442, 'loss/train': 5.322221279144287} -11/06/2021 21:20:21 - INFO - __main__ - Step 444: {'lr': 0.00011075000000000001, 'samples': 85248, 'steps': 443, 'loss/train': 5.694289207458496} -11/06/2021 21:20:22 - INFO - __main__ - Step 445: {'lr': 0.000111, 'samples': 85440, 'steps': 444, 'loss/train': 5.615618705749512} -11/06/2021 21:20:23 - INFO - __main__ - Step 446: {'lr': 0.00011125000000000001, 'samples': 85632, 'steps': 445, 'loss/train': 4.579447269439697} -11/06/2021 21:20:23 - INFO - __main__ - Step 447: {'lr': 0.0001115, 'samples': 85824, 'steps': 446, 'loss/train': 5.4635491371154785} -11/06/2021 21:20:23 - INFO - __main__ - Step 448: {'lr': 0.00011175, 'samples': 86016, 'steps': 447, 'loss/train': 5.6371636390686035} -11/06/2021 21:20:24 - INFO - __main__ - Step 449: {'lr': 0.000112, 'samples': 86208, 'steps': 448, 'loss/train': 5.192485332489014} -11/06/2021 21:20:24 - INFO - __main__ - Step 450: {'lr': 0.00011225, 'samples': 86400, 'steps': 449, 'loss/train': 5.126009464263916} -11/06/2021 21:20:25 - INFO - __main__ - Step 451: {'lr': 0.00011250000000000001, 'samples': 86592, 'steps': 450, 'loss/train': 4.955085754394531} -11/06/2021 21:20:25 - INFO - __main__ - Step 452: {'lr': 0.00011275, 'samples': 86784, 'steps': 451, 'loss/train': 4.919888973236084} -11/06/2021 21:20:26 - INFO - __main__ - Step 453: {'lr': 0.00011300000000000001, 'samples': 86976, 'steps': 452, 'loss/train': 5.37556266784668} -11/06/2021 21:20:26 - INFO - __main__ - Step 454: {'lr': 0.00011325, 'samples': 87168, 'steps': 453, 'loss/train': 5.237241744995117} -11/06/2021 21:20:26 - INFO - __main__ - Step 455: {'lr': 0.00011350000000000001, 'samples': 87360, 'steps': 454, 'loss/train': 4.927133083343506} -11/06/2021 21:20:27 - INFO - __main__ - Step 456: {'lr': 0.00011375, 'samples': 87552, 'steps': 455, 'loss/train': 5.2103400230407715} -11/06/2021 21:20:28 - INFO - __main__ - Step 457: {'lr': 0.000114, 'samples': 87744, 'steps': 456, 'loss/train': 5.820415496826172} -11/06/2021 21:20:28 - INFO - __main__ - Step 458: {'lr': 0.00011425000000000001, 'samples': 87936, 'steps': 457, 'loss/train': 3.8978383541107178} -11/06/2021 21:20:29 - INFO - __main__ - Step 459: {'lr': 0.0001145, 'samples': 88128, 'steps': 458, 'loss/train': 6.301289081573486} -11/06/2021 21:20:29 - INFO - __main__ - Step 460: {'lr': 0.00011475000000000001, 'samples': 88320, 'steps': 459, 'loss/train': 5.069262504577637} -11/06/2021 21:20:30 - INFO - __main__ - Step 461: {'lr': 0.000115, 'samples': 88512, 'steps': 460, 'loss/train': 5.043389320373535} -11/06/2021 21:20:30 - INFO - __main__ - Step 462: {'lr': 0.00011525000000000001, 'samples': 88704, 'steps': 461, 'loss/train': 5.780721664428711} -11/06/2021 21:20:31 - INFO - __main__ - Step 463: {'lr': 0.0001155, 'samples': 88896, 'steps': 462, 'loss/train': 4.882776737213135} -11/06/2021 21:20:31 - INFO - __main__ - Step 464: {'lr': 0.00011575000000000001, 'samples': 89088, 'steps': 463, 'loss/train': 4.844412326812744} -11/06/2021 21:20:31 - INFO - __main__ - Step 465: {'lr': 0.00011600000000000001, 'samples': 89280, 'steps': 464, 'loss/train': 5.012292385101318} -11/06/2021 21:20:32 - INFO - __main__ - Step 466: {'lr': 0.00011625, 'samples': 89472, 'steps': 465, 'loss/train': 5.141354084014893} -11/06/2021 21:20:33 - INFO - __main__ - Step 467: {'lr': 0.00011650000000000001, 'samples': 89664, 'steps': 466, 'loss/train': 5.3636956214904785} -11/06/2021 21:20:33 - INFO - __main__ - Step 468: {'lr': 0.00011675, 'samples': 89856, 'steps': 467, 'loss/train': 5.613701820373535} -11/06/2021 21:20:33 - INFO - __main__ - Step 469: {'lr': 0.00011700000000000001, 'samples': 90048, 'steps': 468, 'loss/train': 4.824275493621826} -11/06/2021 21:20:34 - INFO - __main__ - Step 470: {'lr': 0.00011724999999999999, 'samples': 90240, 'steps': 469, 'loss/train': 4.927989482879639} -11/06/2021 21:20:34 - INFO - __main__ - Step 471: {'lr': 0.0001175, 'samples': 90432, 'steps': 470, 'loss/train': 5.5396223068237305} -11/06/2021 21:20:35 - INFO - __main__ - Step 472: {'lr': 0.00011775, 'samples': 90624, 'steps': 471, 'loss/train': 5.157430648803711} -11/06/2021 21:20:36 - INFO - __main__ - Step 473: {'lr': 0.000118, 'samples': 90816, 'steps': 472, 'loss/train': 4.571201324462891} -11/06/2021 21:20:36 - INFO - __main__ - Step 474: {'lr': 0.00011825, 'samples': 91008, 'steps': 473, 'loss/train': 5.168905735015869} -11/06/2021 21:20:36 - INFO - __main__ - Step 475: {'lr': 0.0001185, 'samples': 91200, 'steps': 474, 'loss/train': 5.4914021492004395} -11/06/2021 21:20:37 - INFO - __main__ - Step 476: {'lr': 0.00011875, 'samples': 91392, 'steps': 475, 'loss/train': 5.1100382804870605} -11/06/2021 21:20:38 - INFO - __main__ - Step 477: {'lr': 0.00011899999999999999, 'samples': 91584, 'steps': 476, 'loss/train': 5.027097225189209} -11/06/2021 21:20:38 - INFO - __main__ - Step 478: {'lr': 0.00011925, 'samples': 91776, 'steps': 477, 'loss/train': 3.3699212074279785} -11/06/2021 21:20:38 - INFO - __main__ - Step 479: {'lr': 0.00011949999999999999, 'samples': 91968, 'steps': 478, 'loss/train': 5.552117824554443} -11/06/2021 21:20:39 - INFO - __main__ - Step 480: {'lr': 0.00011975, 'samples': 92160, 'steps': 479, 'loss/train': 5.236664295196533} -11/06/2021 21:20:39 - INFO - __main__ - Step 481: {'lr': 0.00012, 'samples': 92352, 'steps': 480, 'loss/train': 5.218561172485352} -11/06/2021 21:20:40 - INFO - __main__ - Step 482: {'lr': 0.00012025, 'samples': 92544, 'steps': 481, 'loss/train': 4.788586139678955} -11/06/2021 21:20:41 - INFO - __main__ - Step 483: {'lr': 0.0001205, 'samples': 92736, 'steps': 482, 'loss/train': 4.982636451721191} -11/06/2021 21:20:41 - INFO - __main__ - Step 484: {'lr': 0.00012075, 'samples': 92928, 'steps': 483, 'loss/train': 4.840455055236816} -11/06/2021 21:20:41 - INFO - __main__ - Step 485: {'lr': 0.000121, 'samples': 93120, 'steps': 484, 'loss/train': 5.3554840087890625} -11/06/2021 21:20:42 - INFO - __main__ - Step 486: {'lr': 0.00012124999999999999, 'samples': 93312, 'steps': 485, 'loss/train': 5.182967185974121} -11/06/2021 21:20:43 - INFO - __main__ - Step 487: {'lr': 0.0001215, 'samples': 93504, 'steps': 486, 'loss/train': 5.115420818328857} -11/06/2021 21:20:43 - INFO - __main__ - Step 488: {'lr': 0.00012175, 'samples': 93696, 'steps': 487, 'loss/train': 5.1655683517456055} -11/06/2021 21:20:43 - INFO - __main__ - Step 489: {'lr': 0.000122, 'samples': 93888, 'steps': 488, 'loss/train': 5.405882835388184} -11/06/2021 21:20:44 - INFO - __main__ - Step 490: {'lr': 0.00012225, 'samples': 94080, 'steps': 489, 'loss/train': 5.127898693084717} -11/06/2021 21:20:44 - INFO - __main__ - Step 491: {'lr': 0.0001225, 'samples': 94272, 'steps': 490, 'loss/train': 5.024046421051025} -11/06/2021 21:20:45 - INFO - __main__ - Step 492: {'lr': 0.00012275, 'samples': 94464, 'steps': 491, 'loss/train': 5.145169734954834} -11/06/2021 21:20:45 - INFO - __main__ - Step 493: {'lr': 0.000123, 'samples': 94656, 'steps': 492, 'loss/train': 4.954655170440674} -11/06/2021 21:20:46 - INFO - __main__ - Step 494: {'lr': 0.00012325000000000001, 'samples': 94848, 'steps': 493, 'loss/train': 5.174392223358154} -11/06/2021 21:20:46 - INFO - __main__ - Step 495: {'lr': 0.0001235, 'samples': 95040, 'steps': 494, 'loss/train': 4.580348014831543} -11/06/2021 21:20:47 - INFO - __main__ - Step 496: {'lr': 0.00012375, 'samples': 95232, 'steps': 495, 'loss/train': 4.821667194366455} -11/06/2021 21:20:47 - INFO - __main__ - Step 497: {'lr': 0.000124, 'samples': 95424, 'steps': 496, 'loss/train': 5.254716873168945} -11/06/2021 21:20:48 - INFO - __main__ - Step 498: {'lr': 0.00012425, 'samples': 95616, 'steps': 497, 'loss/train': 4.732685565948486} -11/06/2021 21:20:48 - INFO - __main__ - Step 499: {'lr': 0.0001245, 'samples': 95808, 'steps': 498, 'loss/train': 5.048670291900635} -11/06/2021 21:20:49 - INFO - __main__ - Step 500: {'lr': 0.00012475, 'samples': 96000, 'steps': 499, 'loss/train': 4.834158420562744} -11/06/2021 21:20:49 - INFO - __main__ - Step 501: {'lr': 0.000125, 'samples': 96192, 'steps': 500, 'loss/train': 5.50537109375} -11/06/2021 21:20:49 - INFO - __main__ - Step 502: {'lr': 0.00012525, 'samples': 96384, 'steps': 501, 'loss/train': 4.96640157699585} -11/06/2021 21:20:50 - INFO - __main__ - Step 503: {'lr': 0.00012550000000000001, 'samples': 96576, 'steps': 502, 'loss/train': 4.255295753479004} -11/06/2021 21:20:51 - INFO - __main__ - Step 504: {'lr': 0.00012575, 'samples': 96768, 'steps': 503, 'loss/train': 3.4102871417999268} -11/06/2021 21:20:51 - INFO - __main__ - Step 505: {'lr': 0.000126, 'samples': 96960, 'steps': 504, 'loss/train': 5.220231056213379} -11/06/2021 21:20:51 - INFO - __main__ - Step 506: {'lr': 0.00012625, 'samples': 97152, 'steps': 505, 'loss/train': 4.843728542327881} -11/06/2021 21:20:52 - INFO - __main__ - Step 507: {'lr': 0.0001265, 'samples': 97344, 'steps': 506, 'loss/train': 4.380231857299805} -11/06/2021 21:20:53 - INFO - __main__ - Step 508: {'lr': 0.00012675, 'samples': 97536, 'steps': 507, 'loss/train': 4.899729251861572} -11/06/2021 21:20:54 - INFO - __main__ - Step 509: {'lr': 0.000127, 'samples': 97728, 'steps': 508, 'loss/train': 4.977561950683594} -11/06/2021 21:20:54 - INFO - __main__ - Step 510: {'lr': 0.00012725, 'samples': 97920, 'steps': 509, 'loss/train': 5.346168518066406} -11/06/2021 21:20:54 - INFO - __main__ - Step 511: {'lr': 0.0001275, 'samples': 98112, 'steps': 510, 'loss/train': 4.873198509216309} -11/06/2021 21:20:55 - INFO - __main__ - Step 512: {'lr': 0.00012775000000000002, 'samples': 98304, 'steps': 511, 'loss/train': 5.125716686248779} -11/06/2021 21:20:56 - INFO - __main__ - Step 513: {'lr': 0.000128, 'samples': 98496, 'steps': 512, 'loss/train': 5.299740314483643} -11/06/2021 21:20:56 - INFO - __main__ - Step 514: {'lr': 0.00012825, 'samples': 98688, 'steps': 513, 'loss/train': 5.17880916595459} -11/06/2021 21:20:57 - INFO - __main__ - Step 515: {'lr': 0.0001285, 'samples': 98880, 'steps': 514, 'loss/train': 5.38531494140625} -11/06/2021 21:20:57 - INFO - __main__ - Step 516: {'lr': 0.00012875, 'samples': 99072, 'steps': 515, 'loss/train': 5.111538410186768} -11/06/2021 21:20:58 - INFO - __main__ - Step 517: {'lr': 0.00012900000000000002, 'samples': 99264, 'steps': 516, 'loss/train': 4.971146583557129} -11/06/2021 21:20:59 - INFO - __main__ - Step 518: {'lr': 0.00012925, 'samples': 99456, 'steps': 517, 'loss/train': 4.8264899253845215} -11/06/2021 21:20:59 - INFO - __main__ - Step 519: {'lr': 0.0001295, 'samples': 99648, 'steps': 518, 'loss/train': 4.728095054626465} -11/06/2021 21:20:59 - INFO - __main__ - Step 520: {'lr': 0.00012975, 'samples': 99840, 'steps': 519, 'loss/train': 4.82402229309082} -11/06/2021 21:21:00 - INFO - __main__ - Step 521: {'lr': 0.00013000000000000002, 'samples': 100032, 'steps': 520, 'loss/train': 4.82277774810791} -11/06/2021 21:21:00 - INFO - __main__ - Step 522: {'lr': 0.00013025, 'samples': 100224, 'steps': 521, 'loss/train': 4.736476898193359} -11/06/2021 21:21:01 - INFO - __main__ - Step 523: {'lr': 0.0001305, 'samples': 100416, 'steps': 522, 'loss/train': 5.3957390785217285} -11/06/2021 21:21:02 - INFO - __main__ - Step 524: {'lr': 0.00013075, 'samples': 100608, 'steps': 523, 'loss/train': 4.804849624633789} -11/06/2021 21:21:02 - INFO - __main__ - Step 525: {'lr': 0.000131, 'samples': 100800, 'steps': 524, 'loss/train': 5.213521957397461} -11/06/2021 21:21:02 - INFO - __main__ - Step 526: {'lr': 0.00013125000000000002, 'samples': 100992, 'steps': 525, 'loss/train': 4.800134181976318} -11/06/2021 21:21:03 - INFO - __main__ - Step 527: {'lr': 0.0001315, 'samples': 101184, 'steps': 526, 'loss/train': 5.979576587677002} -11/06/2021 21:21:04 - INFO - __main__ - Step 528: {'lr': 0.00013175, 'samples': 101376, 'steps': 527, 'loss/train': 4.6841630935668945} -11/06/2021 21:21:04 - INFO - __main__ - Step 529: {'lr': 0.000132, 'samples': 101568, 'steps': 528, 'loss/train': 5.14123010635376} -11/06/2021 21:21:04 - INFO - __main__ - Step 530: {'lr': 0.00013225000000000002, 'samples': 101760, 'steps': 529, 'loss/train': 4.850307941436768} -11/06/2021 21:21:05 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 4.945707321166992} -11/06/2021 21:21:05 - INFO - __main__ - Step 532: {'lr': 0.00013275, 'samples': 102144, 'steps': 531, 'loss/train': 5.073093891143799} -11/06/2021 21:21:06 - INFO - __main__ - Step 533: {'lr': 0.000133, 'samples': 102336, 'steps': 532, 'loss/train': 4.880060195922852} -11/06/2021 21:21:07 - INFO - __main__ - Step 534: {'lr': 0.00013325, 'samples': 102528, 'steps': 533, 'loss/train': 5.960422039031982} -11/06/2021 21:21:07 - INFO - __main__ - Step 535: {'lr': 0.00013350000000000002, 'samples': 102720, 'steps': 534, 'loss/train': 4.578385829925537} -11/06/2021 21:21:07 - INFO - __main__ - Step 536: {'lr': 0.00013375, 'samples': 102912, 'steps': 535, 'loss/train': 5.22959566116333} -11/06/2021 21:21:08 - INFO - __main__ - Step 537: {'lr': 0.000134, 'samples': 103104, 'steps': 536, 'loss/train': 5.195213317871094} -11/06/2021 21:21:08 - INFO - __main__ - Step 538: {'lr': 0.00013425, 'samples': 103296, 'steps': 537, 'loss/train': 5.1764912605285645} -11/06/2021 21:21:09 - INFO - __main__ - Step 539: {'lr': 0.00013450000000000002, 'samples': 103488, 'steps': 538, 'loss/train': 4.329580783843994} -11/06/2021 21:21:09 - INFO - __main__ - Step 540: {'lr': 0.00013475000000000002, 'samples': 103680, 'steps': 539, 'loss/train': 5.327682971954346} -11/06/2021 21:21:10 - INFO - __main__ - Step 541: {'lr': 0.000135, 'samples': 103872, 'steps': 540, 'loss/train': 5.050226211547852} -11/06/2021 21:21:10 - INFO - __main__ - Step 542: {'lr': 0.00013525, 'samples': 104064, 'steps': 541, 'loss/train': 6.563281059265137} -11/06/2021 21:21:10 - INFO - __main__ - Step 543: {'lr': 0.00013550000000000001, 'samples': 104256, 'steps': 542, 'loss/train': 5.260067462921143} -11/06/2021 21:21:12 - INFO - __main__ - Step 544: {'lr': 0.00013575000000000002, 'samples': 104448, 'steps': 543, 'loss/train': 5.054920196533203} -11/06/2021 21:21:12 - INFO - __main__ - Step 545: {'lr': 0.00013600000000000003, 'samples': 104640, 'steps': 544, 'loss/train': 4.304242134094238} -11/06/2021 21:21:12 - INFO - __main__ - Step 546: {'lr': 0.00013625, 'samples': 104832, 'steps': 545, 'loss/train': 5.143182277679443} -11/06/2021 21:21:13 - INFO - __main__ - Step 547: {'lr': 0.0001365, 'samples': 105024, 'steps': 546, 'loss/train': 5.063644886016846} -11/06/2021 21:21:13 - INFO - __main__ - Step 548: {'lr': 0.00013675000000000002, 'samples': 105216, 'steps': 547, 'loss/train': 4.523825168609619} -11/06/2021 21:21:14 - INFO - __main__ - Step 549: {'lr': 0.00013700000000000002, 'samples': 105408, 'steps': 548, 'loss/train': 5.415563583374023} -11/06/2021 21:21:14 - INFO - __main__ - Step 550: {'lr': 0.00013725, 'samples': 105600, 'steps': 549, 'loss/train': 5.242093086242676} -11/06/2021 21:21:15 - INFO - __main__ - Step 551: {'lr': 0.0001375, 'samples': 105792, 'steps': 550, 'loss/train': 5.3217949867248535} -11/06/2021 21:21:15 - INFO - __main__ - Step 552: {'lr': 0.00013775000000000001, 'samples': 105984, 'steps': 551, 'loss/train': 4.965686798095703} -11/06/2021 21:21:15 - INFO - __main__ - Step 553: {'lr': 0.00013800000000000002, 'samples': 106176, 'steps': 552, 'loss/train': 4.69637393951416} -11/06/2021 21:21:16 - INFO - __main__ - Step 554: {'lr': 0.00013825000000000003, 'samples': 106368, 'steps': 553, 'loss/train': 5.67413854598999} -11/06/2021 21:21:17 - INFO - __main__ - Step 555: {'lr': 0.0001385, 'samples': 106560, 'steps': 554, 'loss/train': 1.4391024112701416} -11/06/2021 21:21:17 - INFO - __main__ - Step 556: {'lr': 0.00013875, 'samples': 106752, 'steps': 555, 'loss/train': 4.693598747253418} -11/06/2021 21:21:18 - INFO - __main__ - Step 557: {'lr': 0.00013900000000000002, 'samples': 106944, 'steps': 556, 'loss/train': 4.811655521392822} -11/06/2021 21:21:18 - INFO - __main__ - Step 558: {'lr': 0.00013925000000000002, 'samples': 107136, 'steps': 557, 'loss/train': 5.708633899688721} -11/06/2021 21:21:18 - INFO - __main__ - Step 559: {'lr': 0.0001395, 'samples': 107328, 'steps': 558, 'loss/train': 5.34543514251709} -11/06/2021 21:21:19 - INFO - __main__ - Step 560: {'lr': 0.00013975, 'samples': 107520, 'steps': 559, 'loss/train': 4.994585990905762} -11/06/2021 21:21:20 - INFO - __main__ - Step 561: {'lr': 0.00014000000000000001, 'samples': 107712, 'steps': 560, 'loss/train': 4.977428913116455} -11/06/2021 21:21:20 - INFO - __main__ - Step 562: {'lr': 0.00014025000000000002, 'samples': 107904, 'steps': 561, 'loss/train': 5.134328365325928} -11/06/2021 21:21:20 - INFO - __main__ - Step 563: {'lr': 0.00014050000000000003, 'samples': 108096, 'steps': 562, 'loss/train': 5.075902462005615} -11/06/2021 21:21:21 - INFO - __main__ - Step 564: {'lr': 0.00014074999999999998, 'samples': 108288, 'steps': 563, 'loss/train': 4.605697154998779} -11/06/2021 21:21:22 - INFO - __main__ - Step 565: {'lr': 0.00014099999999999998, 'samples': 108480, 'steps': 564, 'loss/train': 4.873136520385742} -11/06/2021 21:21:22 - INFO - __main__ - Step 566: {'lr': 0.00014125, 'samples': 108672, 'steps': 565, 'loss/train': 4.94666862487793} -11/06/2021 21:21:22 - INFO - __main__ - Step 567: {'lr': 0.0001415, 'samples': 108864, 'steps': 566, 'loss/train': 4.661070823669434} -11/06/2021 21:21:23 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 5.004296779632568} -11/06/2021 21:21:23 - INFO - __main__ - Step 569: {'lr': 0.00014199999999999998, 'samples': 109248, 'steps': 568, 'loss/train': 4.945058345794678} -11/06/2021 21:21:24 - INFO - __main__ - Step 570: {'lr': 0.00014225, 'samples': 109440, 'steps': 569, 'loss/train': 4.626468658447266} -11/06/2021 21:21:25 - INFO - __main__ - Step 571: {'lr': 0.0001425, 'samples': 109632, 'steps': 570, 'loss/train': 4.994494915008545} -11/06/2021 21:21:25 - INFO - __main__ - Step 572: {'lr': 0.00014275, 'samples': 109824, 'steps': 571, 'loss/train': 5.284569263458252} -11/06/2021 21:21:26 - INFO - __main__ - Step 573: {'lr': 0.00014299999999999998, 'samples': 110016, 'steps': 572, 'loss/train': 5.315004348754883} -11/06/2021 21:21:26 - INFO - __main__ - Step 574: {'lr': 0.00014324999999999999, 'samples': 110208, 'steps': 573, 'loss/train': 4.810165882110596} -11/06/2021 21:21:27 - INFO - __main__ - Step 575: {'lr': 0.0001435, 'samples': 110400, 'steps': 574, 'loss/train': 5.227445125579834} -11/06/2021 21:21:27 - INFO - __main__ - Step 576: {'lr': 0.00014375, 'samples': 110592, 'steps': 575, 'loss/train': 5.34274435043335} -11/06/2021 21:21:28 - INFO - __main__ - Step 577: {'lr': 0.000144, 'samples': 110784, 'steps': 576, 'loss/train': 5.176715850830078} -11/06/2021 21:21:28 - INFO - __main__ - Step 578: {'lr': 0.00014424999999999998, 'samples': 110976, 'steps': 577, 'loss/train': 4.281363487243652} -11/06/2021 21:21:28 - INFO - __main__ - Step 579: {'lr': 0.0001445, 'samples': 111168, 'steps': 578, 'loss/train': 5.460202217102051} -11/06/2021 21:21:29 - INFO - __main__ - Step 580: {'lr': 0.00014475, 'samples': 111360, 'steps': 579, 'loss/train': 5.397484302520752} -11/06/2021 21:21:30 - INFO - __main__ - Step 581: {'lr': 0.000145, 'samples': 111552, 'steps': 580, 'loss/train': 4.4818291664123535} -11/06/2021 21:21:30 - INFO - __main__ - Step 582: {'lr': 0.00014524999999999998, 'samples': 111744, 'steps': 581, 'loss/train': 4.609002590179443} -11/06/2021 21:21:31 - INFO - __main__ - Step 583: {'lr': 0.00014549999999999999, 'samples': 111936, 'steps': 582, 'loss/train': 5.447309970855713} -11/06/2021 21:21:31 - INFO - __main__ - Step 584: {'lr': 0.00014575, 'samples': 112128, 'steps': 583, 'loss/train': 5.413631439208984} -11/06/2021 21:21:32 - INFO - __main__ - Step 585: {'lr': 0.000146, 'samples': 112320, 'steps': 584, 'loss/train': 6.304897308349609} -11/06/2021 21:21:32 - INFO - __main__ - Step 586: {'lr': 0.00014625, 'samples': 112512, 'steps': 585, 'loss/train': 3.9225189685821533} -11/06/2021 21:21:33 - INFO - __main__ - Step 587: {'lr': 0.00014649999999999998, 'samples': 112704, 'steps': 586, 'loss/train': 4.575343132019043} -11/06/2021 21:21:33 - INFO - __main__ - Step 588: {'lr': 0.00014675, 'samples': 112896, 'steps': 587, 'loss/train': 4.97996711730957} -11/06/2021 21:21:34 - INFO - __main__ - Step 589: {'lr': 0.000147, 'samples': 113088, 'steps': 588, 'loss/train': 5.520531177520752} -11/06/2021 21:21:35 - INFO - __main__ - Step 590: {'lr': 0.00014725, 'samples': 113280, 'steps': 589, 'loss/train': 4.435773849487305} -11/06/2021 21:21:35 - INFO - __main__ - Step 591: {'lr': 0.0001475, 'samples': 113472, 'steps': 590, 'loss/train': 5.016930103302002} -11/06/2021 21:21:35 - INFO - __main__ - Step 592: {'lr': 0.00014774999999999999, 'samples': 113664, 'steps': 591, 'loss/train': 4.882648468017578} -11/06/2021 21:21:36 - INFO - __main__ - Step 593: {'lr': 0.000148, 'samples': 113856, 'steps': 592, 'loss/train': 6.573506832122803} -11/06/2021 21:21:36 - INFO - __main__ - Step 594: {'lr': 0.00014825, 'samples': 114048, 'steps': 593, 'loss/train': 4.22829532623291} -11/06/2021 21:21:36 - INFO - __main__ - Step 595: {'lr': 0.0001485, 'samples': 114240, 'steps': 594, 'loss/train': 4.915690898895264} -11/06/2021 21:21:37 - INFO - __main__ - Step 596: {'lr': 0.00014874999999999998, 'samples': 114432, 'steps': 595, 'loss/train': 4.756763458251953} -11/06/2021 21:21:38 - INFO - __main__ - Step 597: {'lr': 0.000149, 'samples': 114624, 'steps': 596, 'loss/train': 4.910470485687256} -11/06/2021 21:21:38 - INFO - __main__ - Step 598: {'lr': 0.00014925, 'samples': 114816, 'steps': 597, 'loss/train': 4.912417411804199} -11/06/2021 21:21:38 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 4.568467140197754} -11/06/2021 21:21:39 - INFO - __main__ - Step 600: {'lr': 0.00014975, 'samples': 115200, 'steps': 599, 'loss/train': 4.727468967437744} -11/06/2021 21:21:40 - INFO - __main__ - Step 601: {'lr': 0.00015, 'samples': 115392, 'steps': 600, 'loss/train': 4.731727123260498} -11/06/2021 21:21:40 - INFO - __main__ - Step 602: {'lr': 0.00015025, 'samples': 115584, 'steps': 601, 'loss/train': 5.941672325134277} -11/06/2021 21:21:41 - INFO - __main__ - Step 603: {'lr': 0.0001505, 'samples': 115776, 'steps': 602, 'loss/train': 4.752991676330566} -11/06/2021 21:21:41 - INFO - __main__ - Step 604: {'lr': 0.00015075, 'samples': 115968, 'steps': 603, 'loss/train': 4.749768257141113} -11/06/2021 21:21:41 - INFO - __main__ - Step 605: {'lr': 0.000151, 'samples': 116160, 'steps': 604, 'loss/train': 4.868316650390625} -11/06/2021 21:21:43 - INFO - __main__ - Step 606: {'lr': 0.00015125, 'samples': 116352, 'steps': 605, 'loss/train': 4.696784973144531} -11/06/2021 21:21:43 - INFO - __main__ - Step 607: {'lr': 0.0001515, 'samples': 116544, 'steps': 606, 'loss/train': 5.38928747177124} -11/06/2021 21:21:43 - INFO - __main__ - Step 608: {'lr': 0.00015175, 'samples': 116736, 'steps': 607, 'loss/train': 4.822604179382324} -11/06/2021 21:21:44 - INFO - __main__ - Step 609: {'lr': 0.000152, 'samples': 116928, 'steps': 608, 'loss/train': 4.739031791687012} -11/06/2021 21:21:44 - INFO - __main__ - Step 610: {'lr': 0.00015225, 'samples': 117120, 'steps': 609, 'loss/train': 4.78218412399292} -11/06/2021 21:21:44 - INFO - __main__ - Step 611: {'lr': 0.0001525, 'samples': 117312, 'steps': 610, 'loss/train': 5.469936370849609} -11/06/2021 21:21:46 - INFO - __main__ - Step 612: {'lr': 0.00015275, 'samples': 117504, 'steps': 611, 'loss/train': 5.018012523651123} -11/06/2021 21:21:46 - INFO - __main__ - Step 613: {'lr': 0.000153, 'samples': 117696, 'steps': 612, 'loss/train': 4.723076343536377} -11/06/2021 21:21:46 - INFO - __main__ - Step 614: {'lr': 0.00015325, 'samples': 117888, 'steps': 613, 'loss/train': 4.444612503051758} -11/06/2021 21:21:47 - INFO - __main__ - Step 615: {'lr': 0.0001535, 'samples': 118080, 'steps': 614, 'loss/train': 5.002647876739502} -11/06/2021 21:21:47 - INFO - __main__ - Step 616: {'lr': 0.00015375, 'samples': 118272, 'steps': 615, 'loss/train': 5.234433174133301} -11/06/2021 21:21:48 - INFO - __main__ - Step 617: {'lr': 0.000154, 'samples': 118464, 'steps': 616, 'loss/train': 5.180642604827881} -11/06/2021 21:21:48 - INFO - __main__ - Step 618: {'lr': 0.00015425, 'samples': 118656, 'steps': 617, 'loss/train': 4.186741828918457} -11/06/2021 21:21:49 - INFO - __main__ - Step 619: {'lr': 0.00015450000000000001, 'samples': 118848, 'steps': 618, 'loss/train': 4.601840019226074} -11/06/2021 21:21:49 - INFO - __main__ - Step 620: {'lr': 0.00015475, 'samples': 119040, 'steps': 619, 'loss/train': 5.070303440093994} -11/06/2021 21:21:50 - INFO - __main__ - Step 621: {'lr': 0.000155, 'samples': 119232, 'steps': 620, 'loss/train': 4.981260776519775} -11/06/2021 21:21:50 - INFO - __main__ - Step 622: {'lr': 0.00015525, 'samples': 119424, 'steps': 621, 'loss/train': 4.912421703338623} -11/06/2021 21:21:51 - INFO - __main__ - Step 623: {'lr': 0.0001555, 'samples': 119616, 'steps': 622, 'loss/train': 4.604945182800293} -11/06/2021 21:21:51 - INFO - __main__ - Step 624: {'lr': 0.00015575, 'samples': 119808, 'steps': 623, 'loss/train': 4.606297969818115} -11/06/2021 21:21:52 - INFO - __main__ - Step 625: {'lr': 0.000156, 'samples': 120000, 'steps': 624, 'loss/train': 4.950876235961914} -11/06/2021 21:21:52 - INFO - __main__ - Step 626: {'lr': 0.00015625, 'samples': 120192, 'steps': 625, 'loss/train': 4.56068229675293} -11/06/2021 21:21:52 - INFO - __main__ - Step 627: {'lr': 0.0001565, 'samples': 120384, 'steps': 626, 'loss/train': 4.22480583190918} -11/06/2021 21:21:53 - INFO - __main__ - Step 628: {'lr': 0.00015675000000000002, 'samples': 120576, 'steps': 627, 'loss/train': 5.061352729797363} -11/06/2021 21:21:54 - INFO - __main__ - Step 629: {'lr': 0.000157, 'samples': 120768, 'steps': 628, 'loss/train': 4.828984260559082} -11/06/2021 21:21:54 - INFO - __main__ - Step 630: {'lr': 0.00015725, 'samples': 120960, 'steps': 629, 'loss/train': 4.675282955169678} -11/06/2021 21:21:55 - INFO - __main__ - Step 631: {'lr': 0.0001575, 'samples': 121152, 'steps': 630, 'loss/train': 4.3496575355529785} -11/06/2021 21:21:55 - INFO - __main__ - Step 632: {'lr': 0.00015775, 'samples': 121344, 'steps': 631, 'loss/train': 4.719287872314453} -11/06/2021 21:21:56 - INFO - __main__ - Step 633: {'lr': 0.000158, 'samples': 121536, 'steps': 632, 'loss/train': 4.833708763122559} -11/06/2021 21:21:56 - INFO - __main__ - Step 634: {'lr': 0.00015825, 'samples': 121728, 'steps': 633, 'loss/train': 4.082372665405273} -11/06/2021 21:21:57 - INFO - __main__ - Step 635: {'lr': 0.0001585, 'samples': 121920, 'steps': 634, 'loss/train': 4.89099645614624} -11/06/2021 21:21:57 - INFO - __main__ - Step 636: {'lr': 0.00015875, 'samples': 122112, 'steps': 635, 'loss/train': 5.596816062927246} -11/06/2021 21:21:57 - INFO - __main__ - Step 637: {'lr': 0.00015900000000000002, 'samples': 122304, 'steps': 636, 'loss/train': 4.681394100189209} -11/06/2021 21:21:58 - INFO - __main__ - Step 638: {'lr': 0.00015925, 'samples': 122496, 'steps': 637, 'loss/train': 4.834127426147461} -11/06/2021 21:21:59 - INFO - __main__ - Step 639: {'lr': 0.0001595, 'samples': 122688, 'steps': 638, 'loss/train': 5.277633190155029} -11/06/2021 21:21:59 - INFO - __main__ - Step 640: {'lr': 0.00015975, 'samples': 122880, 'steps': 639, 'loss/train': 5.002859115600586} -11/06/2021 21:21:59 - INFO - __main__ - Step 641: {'lr': 0.00016, 'samples': 123072, 'steps': 640, 'loss/train': 5.2396440505981445} -11/06/2021 21:22:00 - INFO - __main__ - Step 642: {'lr': 0.00016025000000000002, 'samples': 123264, 'steps': 641, 'loss/train': 5.183033466339111} -11/06/2021 21:22:01 - INFO - __main__ - Step 643: {'lr': 0.0001605, 'samples': 123456, 'steps': 642, 'loss/train': 4.6580305099487305} -11/06/2021 21:22:01 - INFO - __main__ - Step 644: {'lr': 0.00016075, 'samples': 123648, 'steps': 643, 'loss/train': 4.906527519226074} -11/06/2021 21:22:02 - INFO - __main__ - Step 645: {'lr': 0.000161, 'samples': 123840, 'steps': 644, 'loss/train': 4.350686073303223} -11/06/2021 21:22:02 - INFO - __main__ - Step 646: {'lr': 0.00016125000000000002, 'samples': 124032, 'steps': 645, 'loss/train': 4.576035499572754} -11/06/2021 21:22:02 - INFO - __main__ - Step 647: {'lr': 0.0001615, 'samples': 124224, 'steps': 646, 'loss/train': 4.445610046386719} -11/06/2021 21:22:03 - INFO - __main__ - Step 648: {'lr': 0.00016175, 'samples': 124416, 'steps': 647, 'loss/train': 4.549352645874023} -11/06/2021 21:22:04 - INFO - __main__ - Step 649: {'lr': 0.000162, 'samples': 124608, 'steps': 648, 'loss/train': 4.443591117858887} -11/06/2021 21:22:04 - INFO - __main__ - Step 650: {'lr': 0.00016225000000000001, 'samples': 124800, 'steps': 649, 'loss/train': 4.2263288497924805} -11/06/2021 21:22:04 - INFO - __main__ - Step 651: {'lr': 0.00016250000000000002, 'samples': 124992, 'steps': 650, 'loss/train': 4.449684143066406} -11/06/2021 21:22:05 - INFO - __main__ - Step 652: {'lr': 0.00016275, 'samples': 125184, 'steps': 651, 'loss/train': 5.221400737762451} -11/06/2021 21:22:06 - INFO - __main__ - Step 653: {'lr': 0.000163, 'samples': 125376, 'steps': 652, 'loss/train': 5.1638994216918945} -11/06/2021 21:22:06 - INFO - __main__ - Step 654: {'lr': 0.00016325, 'samples': 125568, 'steps': 653, 'loss/train': 4.728190898895264} -11/06/2021 21:22:06 - INFO - __main__ - Step 655: {'lr': 0.00016350000000000002, 'samples': 125760, 'steps': 654, 'loss/train': 4.6709394454956055} -11/06/2021 21:22:07 - INFO - __main__ - Step 656: {'lr': 0.00016375000000000002, 'samples': 125952, 'steps': 655, 'loss/train': 4.627468109130859} -11/06/2021 21:22:07 - INFO - __main__ - Step 657: {'lr': 0.000164, 'samples': 126144, 'steps': 656, 'loss/train': 4.362966060638428} -11/06/2021 21:22:08 - INFO - __main__ - Step 658: {'lr': 0.00016425, 'samples': 126336, 'steps': 657, 'loss/train': 5.120889663696289} -11/06/2021 21:22:08 - INFO - __main__ - Step 659: {'lr': 0.00016450000000000001, 'samples': 126528, 'steps': 658, 'loss/train': 4.917827129364014} -11/06/2021 21:22:09 - INFO - __main__ - Step 660: {'lr': 0.00016475000000000002, 'samples': 126720, 'steps': 659, 'loss/train': 4.704123020172119} -11/06/2021 21:22:09 - INFO - __main__ - Step 661: {'lr': 0.000165, 'samples': 126912, 'steps': 660, 'loss/train': 4.710036277770996} -11/06/2021 21:22:10 - INFO - __main__ - Step 662: {'lr': 0.00016525, 'samples': 127104, 'steps': 661, 'loss/train': 4.979597091674805} -11/06/2021 21:22:10 - INFO - __main__ - Step 663: {'lr': 0.0001655, 'samples': 127296, 'steps': 662, 'loss/train': 4.606518268585205} -11/06/2021 21:22:11 - INFO - __main__ - Step 664: {'lr': 0.00016575000000000002, 'samples': 127488, 'steps': 663, 'loss/train': 4.490879058837891} -11/06/2021 21:22:11 - INFO - __main__ - Step 665: {'lr': 0.00016600000000000002, 'samples': 127680, 'steps': 664, 'loss/train': 4.3809075355529785} -11/06/2021 21:22:12 - INFO - __main__ - Step 666: {'lr': 0.00016625, 'samples': 127872, 'steps': 665, 'loss/train': 4.735256195068359} -11/06/2021 21:22:12 - INFO - __main__ - Step 667: {'lr': 0.0001665, 'samples': 128064, 'steps': 666, 'loss/train': 4.7257890701293945} -11/06/2021 21:22:12 - INFO - __main__ - Step 668: {'lr': 0.00016675000000000001, 'samples': 128256, 'steps': 667, 'loss/train': 4.959212303161621} -11/06/2021 21:22:13 - INFO - __main__ - Step 669: {'lr': 0.00016700000000000002, 'samples': 128448, 'steps': 668, 'loss/train': 4.34332275390625} -11/06/2021 21:22:14 - INFO - __main__ - Step 670: {'lr': 0.00016725000000000003, 'samples': 128640, 'steps': 669, 'loss/train': 4.633439064025879} -11/06/2021 21:22:14 - INFO - __main__ - Step 671: {'lr': 0.0001675, 'samples': 128832, 'steps': 670, 'loss/train': 4.631658554077148} -11/06/2021 21:22:15 - INFO - __main__ - Step 672: {'lr': 0.00016775, 'samples': 129024, 'steps': 671, 'loss/train': 4.435437202453613} -11/06/2021 21:22:15 - INFO - __main__ - Step 673: {'lr': 0.00016800000000000002, 'samples': 129216, 'steps': 672, 'loss/train': 3.3415842056274414} -11/06/2021 21:22:16 - INFO - __main__ - Step 674: {'lr': 0.00016825000000000002, 'samples': 129408, 'steps': 673, 'loss/train': 4.65171480178833} -11/06/2021 21:22:16 - INFO - __main__ - Step 675: {'lr': 0.0001685, 'samples': 129600, 'steps': 674, 'loss/train': 4.98203182220459} -11/06/2021 21:22:17 - INFO - __main__ - Step 676: {'lr': 0.00016875, 'samples': 129792, 'steps': 675, 'loss/train': 5.456784248352051} -11/06/2021 21:22:17 - INFO - __main__ - Step 677: {'lr': 0.00016900000000000002, 'samples': 129984, 'steps': 676, 'loss/train': 4.679195880889893} -11/06/2021 21:22:17 - INFO - __main__ - Step 678: {'lr': 0.00016925000000000002, 'samples': 130176, 'steps': 677, 'loss/train': 4.434994697570801} -11/06/2021 21:22:18 - INFO - __main__ - Step 679: {'lr': 0.00016950000000000003, 'samples': 130368, 'steps': 678, 'loss/train': 4.650574684143066} -11/06/2021 21:22:19 - INFO - __main__ - Step 680: {'lr': 0.00016975, 'samples': 130560, 'steps': 679, 'loss/train': 4.444644451141357} -11/06/2021 21:22:19 - INFO - __main__ - Step 681: {'lr': 0.00017, 'samples': 130752, 'steps': 680, 'loss/train': 4.423855781555176} -11/06/2021 21:22:20 - INFO - __main__ - Step 682: {'lr': 0.00017025000000000002, 'samples': 130944, 'steps': 681, 'loss/train': 4.7202301025390625} -11/06/2021 21:22:20 - INFO - __main__ - Step 683: {'lr': 0.00017050000000000002, 'samples': 131136, 'steps': 682, 'loss/train': 4.4818854331970215} -11/06/2021 21:22:21 - INFO - __main__ - Step 684: {'lr': 0.00017075, 'samples': 131328, 'steps': 683, 'loss/train': 5.359105587005615} -11/06/2021 21:22:21 - INFO - __main__ - Step 685: {'lr': 0.000171, 'samples': 131520, 'steps': 684, 'loss/train': 4.730793476104736} -11/06/2021 21:22:22 - INFO - __main__ - Step 686: {'lr': 0.00017125000000000002, 'samples': 131712, 'steps': 685, 'loss/train': 4.558211803436279} -11/06/2021 21:22:22 - INFO - __main__ - Step 687: {'lr': 0.00017150000000000002, 'samples': 131904, 'steps': 686, 'loss/train': 4.429317951202393} -11/06/2021 21:22:22 - INFO - __main__ - Step 688: {'lr': 0.00017175000000000003, 'samples': 132096, 'steps': 687, 'loss/train': 4.6293816566467285} -11/06/2021 21:22:24 - INFO - __main__ - Step 689: {'lr': 0.00017199999999999998, 'samples': 132288, 'steps': 688, 'loss/train': 5.065909385681152} -11/06/2021 21:22:24 - INFO - __main__ - Step 690: {'lr': 0.00017224999999999999, 'samples': 132480, 'steps': 689, 'loss/train': 4.581766605377197} -11/06/2021 21:22:24 - INFO - __main__ - Step 691: {'lr': 0.0001725, 'samples': 132672, 'steps': 690, 'loss/train': 4.165865421295166} -11/06/2021 21:22:25 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 4.4996209144592285} -11/06/2021 21:22:25 - INFO - __main__ - Step 693: {'lr': 0.000173, 'samples': 133056, 'steps': 692, 'loss/train': 4.5448150634765625} -11/06/2021 21:22:25 - INFO - __main__ - Step 694: {'lr': 0.00017324999999999998, 'samples': 133248, 'steps': 693, 'loss/train': 3.898272752761841} -11/06/2021 21:22:26 - INFO - __main__ - Step 695: {'lr': 0.0001735, 'samples': 133440, 'steps': 694, 'loss/train': 4.2713165283203125} -11/06/2021 21:22:27 - INFO - __main__ - Step 696: {'lr': 0.00017375, 'samples': 133632, 'steps': 695, 'loss/train': 5.151446342468262} -11/06/2021 21:22:27 - INFO - __main__ - Step 697: {'lr': 0.000174, 'samples': 133824, 'steps': 696, 'loss/train': 4.418706893920898} -11/06/2021 21:22:28 - INFO - __main__ - Step 698: {'lr': 0.00017424999999999998, 'samples': 134016, 'steps': 697, 'loss/train': 4.960476875305176} -11/06/2021 21:22:28 - INFO - __main__ - Step 699: {'lr': 0.00017449999999999999, 'samples': 134208, 'steps': 698, 'loss/train': 4.722470760345459} -11/06/2021 21:22:30 - INFO - __main__ - Step 700: {'lr': 0.00017475, 'samples': 134400, 'steps': 699, 'loss/train': 4.800037384033203} -11/06/2021 21:22:30 - INFO - __main__ - Step 701: {'lr': 0.000175, 'samples': 134592, 'steps': 700, 'loss/train': 4.3655500411987305} -11/06/2021 21:22:30 - INFO - __main__ - Step 702: {'lr': 0.00017525, 'samples': 134784, 'steps': 701, 'loss/train': 4.725539684295654} -11/06/2021 21:22:31 - INFO - __main__ - Step 703: {'lr': 0.00017549999999999998, 'samples': 134976, 'steps': 702, 'loss/train': 4.290457248687744} -11/06/2021 21:22:31 - INFO - __main__ - Step 704: {'lr': 0.00017575, 'samples': 135168, 'steps': 703, 'loss/train': 4.849248886108398} -11/06/2021 21:22:31 - INFO - __main__ - Step 705: {'lr': 0.000176, 'samples': 135360, 'steps': 704, 'loss/train': 2.431931734085083} -11/06/2021 21:22:32 - INFO - __main__ - Step 706: {'lr': 0.00017625, 'samples': 135552, 'steps': 705, 'loss/train': 2.3060343265533447} -11/06/2021 21:22:33 - INFO - __main__ - Step 707: {'lr': 0.00017649999999999998, 'samples': 135744, 'steps': 706, 'loss/train': 2.4550411701202393} -11/06/2021 21:22:33 - INFO - __main__ - Step 708: {'lr': 0.00017675, 'samples': 135936, 'steps': 707, 'loss/train': 4.702536106109619} -11/06/2021 21:22:33 - INFO - __main__ - Step 709: {'lr': 0.000177, 'samples': 136128, 'steps': 708, 'loss/train': 4.986819267272949} -11/06/2021 21:22:34 - INFO - __main__ - Step 710: {'lr': 0.00017725, 'samples': 136320, 'steps': 709, 'loss/train': 4.857694149017334} -11/06/2021 21:22:34 - INFO - __main__ - Step 711: {'lr': 0.0001775, 'samples': 136512, 'steps': 710, 'loss/train': 4.735157012939453} -11/06/2021 21:22:35 - INFO - __main__ - Step 712: {'lr': 0.00017774999999999998, 'samples': 136704, 'steps': 711, 'loss/train': 4.753922462463379} -11/06/2021 21:22:36 - INFO - __main__ - Step 713: {'lr': 0.000178, 'samples': 136896, 'steps': 712, 'loss/train': 4.611956596374512} -11/06/2021 21:22:36 - INFO - __main__ - Step 714: {'lr': 0.00017825, 'samples': 137088, 'steps': 713, 'loss/train': 4.634572982788086} -11/06/2021 21:22:36 - INFO - __main__ - Step 715: {'lr': 0.0001785, 'samples': 137280, 'steps': 714, 'loss/train': 4.737353801727295} -11/06/2021 21:22:37 - INFO - __main__ - Step 716: {'lr': 0.00017875, 'samples': 137472, 'steps': 715, 'loss/train': 4.557127475738525} -11/06/2021 21:22:38 - INFO - __main__ - Step 717: {'lr': 0.000179, 'samples': 137664, 'steps': 716, 'loss/train': 5.090901851654053} -11/06/2021 21:22:38 - INFO - __main__ - Step 718: {'lr': 0.00017925, 'samples': 137856, 'steps': 717, 'loss/train': 4.926265716552734} -11/06/2021 21:22:39 - INFO - __main__ - Step 719: {'lr': 0.0001795, 'samples': 138048, 'steps': 718, 'loss/train': 4.575839519500732} -11/06/2021 21:22:39 - INFO - __main__ - Step 720: {'lr': 0.00017975, 'samples': 138240, 'steps': 719, 'loss/train': 4.539857864379883} -11/06/2021 21:22:39 - INFO - __main__ - Step 721: {'lr': 0.00017999999999999998, 'samples': 138432, 'steps': 720, 'loss/train': 5.017696380615234} -11/06/2021 21:22:41 - INFO - __main__ - Step 722: {'lr': 0.00018025, 'samples': 138624, 'steps': 721, 'loss/train': 4.860723495483398} -11/06/2021 21:22:41 - INFO - __main__ - Step 723: {'lr': 0.0001805, 'samples': 138816, 'steps': 722, 'loss/train': 4.767000675201416} -11/06/2021 21:22:41 - INFO - __main__ - Step 724: {'lr': 0.00018075, 'samples': 139008, 'steps': 723, 'loss/train': 4.792560577392578} -11/06/2021 21:22:42 - INFO - __main__ - Step 725: {'lr': 0.000181, 'samples': 139200, 'steps': 724, 'loss/train': 4.775363922119141} -11/06/2021 21:22:42 - INFO - __main__ - Step 726: {'lr': 0.00018125, 'samples': 139392, 'steps': 725, 'loss/train': 4.8343377113342285} -11/06/2021 21:22:42 - INFO - __main__ - Step 727: {'lr': 0.0001815, 'samples': 139584, 'steps': 726, 'loss/train': 4.501916885375977} -11/06/2021 21:22:43 - INFO - __main__ - Step 728: {'lr': 0.00018175, 'samples': 139776, 'steps': 727, 'loss/train': 4.543506145477295} -11/06/2021 21:22:44 - INFO - __main__ - Step 729: {'lr': 0.000182, 'samples': 139968, 'steps': 728, 'loss/train': 4.346724033355713} -11/06/2021 21:22:44 - INFO - __main__ - Step 730: {'lr': 0.00018225, 'samples': 140160, 'steps': 729, 'loss/train': 4.893301486968994} -11/06/2021 21:22:44 - INFO - __main__ - Step 731: {'lr': 0.0001825, 'samples': 140352, 'steps': 730, 'loss/train': 4.508211612701416} -11/06/2021 21:22:45 - INFO - __main__ - Step 732: {'lr': 0.00018275, 'samples': 140544, 'steps': 731, 'loss/train': 4.329798221588135} -11/06/2021 21:22:46 - INFO - __main__ - Step 733: {'lr': 0.000183, 'samples': 140736, 'steps': 732, 'loss/train': 4.946159362792969} -11/06/2021 21:22:46 - INFO - __main__ - Step 734: {'lr': 0.00018325, 'samples': 140928, 'steps': 733, 'loss/train': 4.753419399261475} -11/06/2021 21:22:47 - INFO - __main__ - Step 735: {'lr': 0.0001835, 'samples': 141120, 'steps': 734, 'loss/train': 5.069578170776367} -11/06/2021 21:22:47 - INFO - __main__ - Step 736: {'lr': 0.00018375, 'samples': 141312, 'steps': 735, 'loss/train': 5.126845359802246} -11/06/2021 21:22:47 - INFO - __main__ - Step 737: {'lr': 0.000184, 'samples': 141504, 'steps': 736, 'loss/train': 4.666621685028076} -11/06/2021 21:22:48 - INFO - __main__ - Step 738: {'lr': 0.00018425, 'samples': 141696, 'steps': 737, 'loss/train': 4.2837958335876465} -11/06/2021 21:22:49 - INFO - __main__ - Step 739: {'lr': 0.0001845, 'samples': 141888, 'steps': 738, 'loss/train': 4.565089702606201} -11/06/2021 21:22:49 - INFO - __main__ - Step 740: {'lr': 0.00018475, 'samples': 142080, 'steps': 739, 'loss/train': 4.330541133880615} -11/06/2021 21:22:49 - INFO - __main__ - Step 741: {'lr': 0.000185, 'samples': 142272, 'steps': 740, 'loss/train': 4.524784564971924} -11/06/2021 21:22:50 - INFO - __main__ - Step 742: {'lr': 0.00018525, 'samples': 142464, 'steps': 741, 'loss/train': 4.280323505401611} -11/06/2021 21:22:51 - INFO - __main__ - Step 743: {'lr': 0.0001855, 'samples': 142656, 'steps': 742, 'loss/train': 4.447424411773682} -11/06/2021 21:22:51 - INFO - __main__ - Step 744: {'lr': 0.00018575000000000002, 'samples': 142848, 'steps': 743, 'loss/train': 4.917816638946533} -11/06/2021 21:22:51 - INFO - __main__ - Step 745: {'lr': 0.000186, 'samples': 143040, 'steps': 744, 'loss/train': 4.4243059158325195} -11/06/2021 21:22:52 - INFO - __main__ - Step 746: {'lr': 0.00018625, 'samples': 143232, 'steps': 745, 'loss/train': 5.763511657714844} -11/06/2021 21:22:52 - INFO - __main__ - Step 747: {'lr': 0.0001865, 'samples': 143424, 'steps': 746, 'loss/train': 4.306034564971924} -11/06/2021 21:22:53 - INFO - __main__ - Step 748: {'lr': 0.00018675, 'samples': 143616, 'steps': 747, 'loss/train': 5.227732181549072} -11/06/2021 21:22:54 - INFO - __main__ - Step 749: {'lr': 0.000187, 'samples': 143808, 'steps': 748, 'loss/train': 5.433281421661377} -11/06/2021 21:22:54 - INFO - __main__ - Step 750: {'lr': 0.00018725, 'samples': 144000, 'steps': 749, 'loss/train': 4.236339092254639} -11/06/2021 21:22:54 - INFO - __main__ - Step 751: {'lr': 0.0001875, 'samples': 144192, 'steps': 750, 'loss/train': 4.570340633392334} -11/06/2021 21:22:55 - INFO - __main__ - Step 752: {'lr': 0.00018775, 'samples': 144384, 'steps': 751, 'loss/train': 4.103482723236084} -11/06/2021 21:22:55 - INFO - __main__ - Step 753: {'lr': 0.00018800000000000002, 'samples': 144576, 'steps': 752, 'loss/train': 4.504870891571045} -11/06/2021 21:22:56 - INFO - __main__ - Step 754: {'lr': 0.00018825, 'samples': 144768, 'steps': 753, 'loss/train': 4.6825480461120605} -11/06/2021 21:22:57 - INFO - __main__ - Step 755: {'lr': 0.0001885, 'samples': 144960, 'steps': 754, 'loss/train': 4.360548973083496} -11/06/2021 21:22:57 - INFO - __main__ - Step 756: {'lr': 0.00018875, 'samples': 145152, 'steps': 755, 'loss/train': 4.626955032348633} -11/06/2021 21:22:57 - INFO - __main__ - Step 757: {'lr': 0.000189, 'samples': 145344, 'steps': 756, 'loss/train': 4.462242126464844} -11/06/2021 21:22:58 - INFO - __main__ - Step 758: {'lr': 0.00018925, 'samples': 145536, 'steps': 757, 'loss/train': 4.262608528137207} -11/06/2021 21:22:59 - INFO - __main__ - Step 759: {'lr': 0.0001895, 'samples': 145728, 'steps': 758, 'loss/train': 4.549057960510254} -11/06/2021 21:22:59 - INFO - __main__ - Step 760: {'lr': 0.00018975, 'samples': 145920, 'steps': 759, 'loss/train': 4.4868574142456055} -11/06/2021 21:22:59 - INFO - __main__ - Step 761: {'lr': 0.00019, 'samples': 146112, 'steps': 760, 'loss/train': 4.394392013549805} -11/06/2021 21:23:00 - INFO - __main__ - Step 762: {'lr': 0.00019025000000000002, 'samples': 146304, 'steps': 761, 'loss/train': 4.9143500328063965} -11/06/2021 21:23:00 - INFO - __main__ - Step 763: {'lr': 0.0001905, 'samples': 146496, 'steps': 762, 'loss/train': 4.456435680389404} -11/06/2021 21:23:01 - INFO - __main__ - Step 764: {'lr': 0.00019075, 'samples': 146688, 'steps': 763, 'loss/train': 5.696299076080322} -11/06/2021 21:23:02 - INFO - __main__ - Step 765: {'lr': 0.000191, 'samples': 146880, 'steps': 764, 'loss/train': 4.935421466827393} -11/06/2021 21:23:02 - INFO - __main__ - Step 766: {'lr': 0.00019125000000000001, 'samples': 147072, 'steps': 765, 'loss/train': 4.943374156951904} -11/06/2021 21:23:02 - INFO - __main__ - Step 767: {'lr': 0.00019150000000000002, 'samples': 147264, 'steps': 766, 'loss/train': 5.322519302368164} -11/06/2021 21:23:03 - INFO - __main__ - Step 768: {'lr': 0.00019175, 'samples': 147456, 'steps': 767, 'loss/train': 4.189104080200195} -11/06/2021 21:23:04 - INFO - __main__ - Step 769: {'lr': 0.000192, 'samples': 147648, 'steps': 768, 'loss/train': 5.1701979637146} -11/06/2021 21:23:04 - INFO - __main__ - Step 770: {'lr': 0.00019225, 'samples': 147840, 'steps': 769, 'loss/train': 4.428781032562256} -11/06/2021 21:23:04 - INFO - __main__ - Step 771: {'lr': 0.00019250000000000002, 'samples': 148032, 'steps': 770, 'loss/train': 4.415109157562256} -11/06/2021 21:23:05 - INFO - __main__ - Step 772: {'lr': 0.00019275, 'samples': 148224, 'steps': 771, 'loss/train': 4.811757564544678} -11/06/2021 21:23:05 - INFO - __main__ - Step 773: {'lr': 0.000193, 'samples': 148416, 'steps': 772, 'loss/train': 4.7581634521484375} -11/06/2021 21:23:06 - INFO - __main__ - Step 774: {'lr': 0.00019325, 'samples': 148608, 'steps': 773, 'loss/train': 4.4999098777771} -11/06/2021 21:23:06 - INFO - __main__ - Step 775: {'lr': 0.00019350000000000001, 'samples': 148800, 'steps': 774, 'loss/train': 4.690352439880371} -11/06/2021 21:23:07 - INFO - __main__ - Step 776: {'lr': 0.00019375000000000002, 'samples': 148992, 'steps': 775, 'loss/train': 4.419637203216553} -11/06/2021 21:23:07 - INFO - __main__ - Step 777: {'lr': 0.000194, 'samples': 149184, 'steps': 776, 'loss/train': 4.947287559509277} -11/06/2021 21:23:08 - INFO - __main__ - Step 778: {'lr': 0.00019425, 'samples': 149376, 'steps': 777, 'loss/train': 5.457443714141846} -11/06/2021 21:23:09 - INFO - __main__ - Step 779: {'lr': 0.0001945, 'samples': 149568, 'steps': 778, 'loss/train': 4.38627815246582} -11/06/2021 21:23:09 - INFO - __main__ - Step 780: {'lr': 0.00019475000000000002, 'samples': 149760, 'steps': 779, 'loss/train': 5.3790178298950195} -11/06/2021 21:23:09 - INFO - __main__ - Step 781: {'lr': 0.00019500000000000002, 'samples': 149952, 'steps': 780, 'loss/train': 4.04803466796875} -11/06/2021 21:23:10 - INFO - __main__ - Step 782: {'lr': 0.00019525, 'samples': 150144, 'steps': 781, 'loss/train': 4.558263301849365} -11/06/2021 21:23:10 - INFO - __main__ - Step 783: {'lr': 0.0001955, 'samples': 150336, 'steps': 782, 'loss/train': 4.308804988861084} -11/06/2021 21:23:11 - INFO - __main__ - Step 784: {'lr': 0.00019575000000000001, 'samples': 150528, 'steps': 783, 'loss/train': 5.033785820007324} -11/06/2021 21:23:11 - INFO - __main__ - Step 785: {'lr': 0.00019600000000000002, 'samples': 150720, 'steps': 784, 'loss/train': 4.059752464294434} -11/06/2021 21:23:12 - INFO - __main__ - Step 786: {'lr': 0.00019625, 'samples': 150912, 'steps': 785, 'loss/train': 4.140824317932129} -11/06/2021 21:23:12 - INFO - __main__ - Step 787: {'lr': 0.0001965, 'samples': 151104, 'steps': 786, 'loss/train': 4.625868797302246} -11/06/2021 21:23:12 - INFO - __main__ - Step 788: {'lr': 0.00019675, 'samples': 151296, 'steps': 787, 'loss/train': 4.85765266418457} -11/06/2021 21:23:14 - INFO - __main__ - Step 789: {'lr': 0.00019700000000000002, 'samples': 151488, 'steps': 788, 'loss/train': 4.904588222503662} -11/06/2021 21:23:14 - INFO - __main__ - Step 790: {'lr': 0.00019725000000000002, 'samples': 151680, 'steps': 789, 'loss/train': 4.804408550262451} -11/06/2021 21:23:14 - INFO - __main__ - Step 791: {'lr': 0.0001975, 'samples': 151872, 'steps': 790, 'loss/train': 4.8462114334106445} -11/06/2021 21:23:15 - INFO - __main__ - Step 792: {'lr': 0.00019775, 'samples': 152064, 'steps': 791, 'loss/train': 4.475534439086914} -11/06/2021 21:23:15 - INFO - __main__ - Step 793: {'lr': 0.00019800000000000002, 'samples': 152256, 'steps': 792, 'loss/train': 4.764225482940674} -11/06/2021 21:23:16 - INFO - __main__ - Step 794: {'lr': 0.00019825000000000002, 'samples': 152448, 'steps': 793, 'loss/train': 4.824385643005371} -11/06/2021 21:23:16 - INFO - __main__ - Step 795: {'lr': 0.00019850000000000003, 'samples': 152640, 'steps': 794, 'loss/train': 4.384396076202393} -11/06/2021 21:23:17 - INFO - __main__ - Step 796: {'lr': 0.00019875, 'samples': 152832, 'steps': 795, 'loss/train': 4.154908657073975} -11/06/2021 21:23:17 - INFO - __main__ - Step 797: {'lr': 0.000199, 'samples': 153024, 'steps': 796, 'loss/train': 4.558513641357422} -11/06/2021 21:23:18 - INFO - __main__ - Step 798: {'lr': 0.00019925000000000002, 'samples': 153216, 'steps': 797, 'loss/train': 4.913057327270508} -11/06/2021 21:23:18 - INFO - __main__ - Step 799: {'lr': 0.00019950000000000002, 'samples': 153408, 'steps': 798, 'loss/train': 4.051199913024902} -11/06/2021 21:23:20 - INFO - __main__ - Step 800: {'lr': 0.00019975, 'samples': 153600, 'steps': 799, 'loss/train': 3.938993215560913} -11/06/2021 21:23:20 - INFO - __main__ - Step 801: {'lr': 0.0002, 'samples': 153792, 'steps': 800, 'loss/train': 4.724459648132324} -11/06/2021 21:23:20 - INFO - __main__ - Step 802: {'lr': 0.00020025000000000002, 'samples': 153984, 'steps': 801, 'loss/train': 6.338046550750732} -11/06/2021 21:23:21 - INFO - __main__ - Step 803: {'lr': 0.00020050000000000002, 'samples': 154176, 'steps': 802, 'loss/train': 2.221121072769165} -11/06/2021 21:23:21 - INFO - __main__ - Step 804: {'lr': 0.00020075000000000003, 'samples': 154368, 'steps': 803, 'loss/train': 2.2776834964752197} -11/06/2021 21:23:21 - INFO - __main__ - Step 805: {'lr': 0.000201, 'samples': 154560, 'steps': 804, 'loss/train': 2.1242752075195312} -11/06/2021 21:23:22 - INFO - __main__ - Step 806: {'lr': 0.00020125, 'samples': 154752, 'steps': 805, 'loss/train': 3.73689603805542} -11/06/2021 21:23:23 - INFO - __main__ - Step 807: {'lr': 0.00020150000000000002, 'samples': 154944, 'steps': 806, 'loss/train': 4.354226112365723} -11/06/2021 21:23:23 - INFO - __main__ - Step 808: {'lr': 0.00020175000000000003, 'samples': 155136, 'steps': 807, 'loss/train': 4.5094475746154785} -11/06/2021 21:23:24 - INFO - __main__ - Step 809: {'lr': 0.000202, 'samples': 155328, 'steps': 808, 'loss/train': 4.677899360656738} -11/06/2021 21:23:24 - INFO - __main__ - Step 810: {'lr': 0.00020225, 'samples': 155520, 'steps': 809, 'loss/train': 4.373321533203125} -11/06/2021 21:23:25 - INFO - __main__ - Step 811: {'lr': 0.00020250000000000002, 'samples': 155712, 'steps': 810, 'loss/train': 5.149594306945801} -11/06/2021 21:23:26 - INFO - __main__ - Step 812: {'lr': 0.00020275000000000002, 'samples': 155904, 'steps': 811, 'loss/train': 4.3080902099609375} -11/06/2021 21:23:26 - INFO - __main__ - Step 813: {'lr': 0.00020300000000000003, 'samples': 156096, 'steps': 812, 'loss/train': 4.42739725112915} -11/06/2021 21:23:26 - INFO - __main__ - Step 814: {'lr': 0.00020324999999999998, 'samples': 156288, 'steps': 813, 'loss/train': 4.6587677001953125} -11/06/2021 21:23:27 - INFO - __main__ - Step 815: {'lr': 0.00020349999999999999, 'samples': 156480, 'steps': 814, 'loss/train': 4.584706783294678} -11/06/2021 21:23:27 - INFO - __main__ - Step 816: {'lr': 0.00020375, 'samples': 156672, 'steps': 815, 'loss/train': 4.675464153289795} -11/06/2021 21:23:28 - INFO - __main__ - Step 817: {'lr': 0.000204, 'samples': 156864, 'steps': 816, 'loss/train': 4.275284767150879} -11/06/2021 21:23:28 - INFO - __main__ - Step 818: {'lr': 0.00020425, 'samples': 157056, 'steps': 817, 'loss/train': 4.487129211425781} -11/06/2021 21:23:29 - INFO - __main__ - Step 819: {'lr': 0.00020449999999999998, 'samples': 157248, 'steps': 818, 'loss/train': 3.8839242458343506} -11/06/2021 21:23:29 - INFO - __main__ - Step 820: {'lr': 0.00020475, 'samples': 157440, 'steps': 819, 'loss/train': 5.175144672393799} -11/06/2021 21:23:30 - INFO - __main__ - Step 821: {'lr': 0.000205, 'samples': 157632, 'steps': 820, 'loss/train': 4.6907877922058105} -11/06/2021 21:23:31 - INFO - __main__ - Step 822: {'lr': 0.00020525, 'samples': 157824, 'steps': 821, 'loss/train': 5.107820987701416} -11/06/2021 21:23:31 - INFO - __main__ - Step 823: {'lr': 0.00020549999999999998, 'samples': 158016, 'steps': 822, 'loss/train': 4.4801106452941895} -11/06/2021 21:23:31 - INFO - __main__ - Step 824: {'lr': 0.00020575, 'samples': 158208, 'steps': 823, 'loss/train': 4.510085105895996} -11/06/2021 21:23:32 - INFO - __main__ - Step 825: {'lr': 0.000206, 'samples': 158400, 'steps': 824, 'loss/train': 4.396790981292725} -11/06/2021 21:23:32 - INFO - __main__ - Step 826: {'lr': 0.00020625, 'samples': 158592, 'steps': 825, 'loss/train': 4.010310649871826} -11/06/2021 21:23:32 - INFO - __main__ - Step 827: {'lr': 0.0002065, 'samples': 158784, 'steps': 826, 'loss/train': 4.797766208648682} -11/06/2021 21:23:33 - INFO - __main__ - Step 828: {'lr': 0.00020674999999999998, 'samples': 158976, 'steps': 827, 'loss/train': 4.619658470153809} -11/06/2021 21:23:34 - INFO - __main__ - Step 829: {'lr': 0.000207, 'samples': 159168, 'steps': 828, 'loss/train': 4.163397312164307} -11/06/2021 21:23:34 - INFO - __main__ - Step 830: {'lr': 0.00020725, 'samples': 159360, 'steps': 829, 'loss/train': 4.228115081787109} -11/06/2021 21:23:34 - INFO - __main__ - Step 831: {'lr': 0.0002075, 'samples': 159552, 'steps': 830, 'loss/train': 4.451252460479736} -11/06/2021 21:23:35 - INFO - __main__ - Step 832: {'lr': 0.00020774999999999998, 'samples': 159744, 'steps': 831, 'loss/train': 4.284130096435547} -11/06/2021 21:23:36 - INFO - __main__ - Step 833: {'lr': 0.000208, 'samples': 159936, 'steps': 832, 'loss/train': 4.7883687019348145} -11/06/2021 21:23:36 - INFO - __main__ - Step 834: {'lr': 0.00020825, 'samples': 160128, 'steps': 833, 'loss/train': 4.043850898742676} -11/06/2021 21:23:37 - INFO - __main__ - Step 835: {'lr': 0.0002085, 'samples': 160320, 'steps': 834, 'loss/train': 4.566141128540039} -11/06/2021 21:23:37 - INFO - __main__ - Step 836: {'lr': 0.00020875, 'samples': 160512, 'steps': 835, 'loss/train': 5.373464584350586} -11/06/2021 21:23:37 - INFO - __main__ - Step 837: {'lr': 0.00020899999999999998, 'samples': 160704, 'steps': 836, 'loss/train': 4.873067378997803} -11/06/2021 21:23:39 - INFO - __main__ - Step 838: {'lr': 0.00020925, 'samples': 160896, 'steps': 837, 'loss/train': 4.9676995277404785} -11/06/2021 21:23:39 - INFO - __main__ - Step 839: {'lr': 0.0002095, 'samples': 161088, 'steps': 838, 'loss/train': 4.646881103515625} -11/06/2021 21:23:39 - INFO - __main__ - Step 840: {'lr': 0.00020975, 'samples': 161280, 'steps': 839, 'loss/train': 4.013716220855713} -11/06/2021 21:23:40 - INFO - __main__ - Step 841: {'lr': 0.00021, 'samples': 161472, 'steps': 840, 'loss/train': 6.019371509552002} -11/06/2021 21:23:40 - INFO - __main__ - Step 842: {'lr': 0.00021025, 'samples': 161664, 'steps': 841, 'loss/train': 3.9948506355285645} -11/06/2021 21:23:41 - INFO - __main__ - Step 843: {'lr': 0.0002105, 'samples': 161856, 'steps': 842, 'loss/train': 4.164978504180908} -11/06/2021 21:23:42 - INFO - __main__ - Step 844: {'lr': 0.00021075, 'samples': 162048, 'steps': 843, 'loss/train': 4.208803176879883} -11/06/2021 21:23:42 - INFO - __main__ - Step 845: {'lr': 0.000211, 'samples': 162240, 'steps': 844, 'loss/train': 5.149277210235596} -11/06/2021 21:23:42 - INFO - __main__ - Step 846: {'lr': 0.00021124999999999998, 'samples': 162432, 'steps': 845, 'loss/train': 4.742812156677246} -11/06/2021 21:23:43 - INFO - __main__ - Step 847: {'lr': 0.0002115, 'samples': 162624, 'steps': 846, 'loss/train': 4.207589149475098} -11/06/2021 21:23:43 - INFO - __main__ - Step 848: {'lr': 0.00021175, 'samples': 162816, 'steps': 847, 'loss/train': 4.035452842712402} -11/06/2021 21:23:44 - INFO - __main__ - Step 849: {'lr': 0.000212, 'samples': 163008, 'steps': 848, 'loss/train': 4.860066890716553} -11/06/2021 21:23:45 - INFO - __main__ - Step 850: {'lr': 0.00021225, 'samples': 163200, 'steps': 849, 'loss/train': 3.371035575866699} -11/06/2021 21:23:45 - INFO - __main__ - Step 851: {'lr': 0.0002125, 'samples': 163392, 'steps': 850, 'loss/train': 4.5741753578186035} -11/06/2021 21:23:45 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.537678241729736} -11/06/2021 21:23:46 - INFO - __main__ - Step 853: {'lr': 0.000213, 'samples': 163776, 'steps': 852, 'loss/train': 4.552616119384766} -11/06/2021 21:23:47 - INFO - __main__ - Step 854: {'lr': 0.00021325, 'samples': 163968, 'steps': 853, 'loss/train': 4.6721577644348145} -11/06/2021 21:23:47 - INFO - __main__ - Step 855: {'lr': 0.0002135, 'samples': 164160, 'steps': 854, 'loss/train': 4.655636310577393} -11/06/2021 21:23:47 - INFO - __main__ - Step 856: {'lr': 0.00021375, 'samples': 164352, 'steps': 855, 'loss/train': 4.305333614349365} -11/06/2021 21:23:48 - INFO - __main__ - Step 857: {'lr': 0.000214, 'samples': 164544, 'steps': 856, 'loss/train': 4.127890110015869} -11/06/2021 21:23:48 - INFO - __main__ - Step 858: {'lr': 0.00021425, 'samples': 164736, 'steps': 857, 'loss/train': 4.549274921417236} -11/06/2021 21:23:49 - INFO - __main__ - Step 859: {'lr': 0.0002145, 'samples': 164928, 'steps': 858, 'loss/train': 3.803431510925293} -11/06/2021 21:23:50 - INFO - __main__ - Step 860: {'lr': 0.00021475, 'samples': 165120, 'steps': 859, 'loss/train': 4.316712379455566} -11/06/2021 21:23:50 - INFO - __main__ - Step 861: {'lr': 0.000215, 'samples': 165312, 'steps': 860, 'loss/train': 4.917266845703125} -11/06/2021 21:23:50 - INFO - __main__ - Step 862: {'lr': 0.00021525, 'samples': 165504, 'steps': 861, 'loss/train': 4.41719913482666} -11/06/2021 21:23:51 - INFO - __main__ - Step 863: {'lr': 0.0002155, 'samples': 165696, 'steps': 862, 'loss/train': 4.436905384063721} -11/06/2021 21:23:52 - INFO - __main__ - Step 864: {'lr': 0.00021575, 'samples': 165888, 'steps': 863, 'loss/train': 4.34383487701416} -11/06/2021 21:23:52 - INFO - __main__ - Step 865: {'lr': 0.000216, 'samples': 166080, 'steps': 864, 'loss/train': 4.4350080490112305} -11/06/2021 21:23:52 - INFO - __main__ - Step 866: {'lr': 0.00021625, 'samples': 166272, 'steps': 865, 'loss/train': 4.548778057098389} -11/06/2021 21:23:53 - INFO - __main__ - Step 867: {'lr': 0.0002165, 'samples': 166464, 'steps': 866, 'loss/train': 4.653875827789307} -11/06/2021 21:23:53 - INFO - __main__ - Step 868: {'lr': 0.00021675, 'samples': 166656, 'steps': 867, 'loss/train': 4.1312150955200195} -11/06/2021 21:23:54 - INFO - __main__ - Step 869: {'lr': 0.00021700000000000002, 'samples': 166848, 'steps': 868, 'loss/train': 4.243196964263916} -11/06/2021 21:23:54 - INFO - __main__ - Step 870: {'lr': 0.00021725, 'samples': 167040, 'steps': 869, 'loss/train': 4.393092155456543} -11/06/2021 21:23:55 - INFO - __main__ - Step 871: {'lr': 0.0002175, 'samples': 167232, 'steps': 870, 'loss/train': 4.559785842895508} -11/06/2021 21:23:55 - INFO - __main__ - Step 872: {'lr': 0.00021775, 'samples': 167424, 'steps': 871, 'loss/train': 1.9217588901519775} -11/06/2021 21:23:55 - INFO - __main__ - Step 873: {'lr': 0.000218, 'samples': 167616, 'steps': 872, 'loss/train': 4.757959365844727} -11/06/2021 21:23:57 - INFO - __main__ - Step 874: {'lr': 0.00021825, 'samples': 167808, 'steps': 873, 'loss/train': 4.589957237243652} -11/06/2021 21:23:57 - INFO - __main__ - Step 875: {'lr': 0.0002185, 'samples': 168000, 'steps': 874, 'loss/train': 4.484537124633789} -11/06/2021 21:23:57 - INFO - __main__ - Step 876: {'lr': 0.00021875, 'samples': 168192, 'steps': 875, 'loss/train': 4.340537071228027} -11/06/2021 21:23:58 - INFO - __main__ - Step 877: {'lr': 0.000219, 'samples': 168384, 'steps': 876, 'loss/train': 4.769442558288574} -11/06/2021 21:23:58 - INFO - __main__ - Step 878: {'lr': 0.00021925000000000002, 'samples': 168576, 'steps': 877, 'loss/train': 4.576560974121094} -11/06/2021 21:23:59 - INFO - __main__ - Step 879: {'lr': 0.0002195, 'samples': 168768, 'steps': 878, 'loss/train': 4.7822418212890625} -11/06/2021 21:23:59 - INFO - __main__ - Step 880: {'lr': 0.00021975, 'samples': 168960, 'steps': 879, 'loss/train': 4.239711284637451} -11/06/2021 21:24:00 - INFO - __main__ - Step 881: {'lr': 0.00022, 'samples': 169152, 'steps': 880, 'loss/train': 4.899833679199219} -11/06/2021 21:24:00 - INFO - __main__ - Step 882: {'lr': 0.00022025000000000001, 'samples': 169344, 'steps': 881, 'loss/train': 4.500170707702637} -11/06/2021 21:24:00 - INFO - __main__ - Step 883: {'lr': 0.0002205, 'samples': 169536, 'steps': 882, 'loss/train': 4.454834938049316} -11/06/2021 21:24:02 - INFO - __main__ - Step 884: {'lr': 0.00022075, 'samples': 169728, 'steps': 883, 'loss/train': 4.347689151763916} -11/06/2021 21:24:02 - INFO - __main__ - Step 885: {'lr': 0.000221, 'samples': 169920, 'steps': 884, 'loss/train': 4.470192909240723} -11/06/2021 21:24:02 - INFO - __main__ - Step 886: {'lr': 0.00022125, 'samples': 170112, 'steps': 885, 'loss/train': 3.8449060916900635} -11/06/2021 21:24:03 - INFO - __main__ - Step 887: {'lr': 0.00022150000000000002, 'samples': 170304, 'steps': 886, 'loss/train': 3.2878403663635254} -11/06/2021 21:24:03 - INFO - __main__ - Step 888: {'lr': 0.00022175, 'samples': 170496, 'steps': 887, 'loss/train': 4.312256813049316} -11/06/2021 21:24:04 - INFO - __main__ - Step 889: {'lr': 0.000222, 'samples': 170688, 'steps': 888, 'loss/train': 4.553658962249756} -11/06/2021 21:24:04 - INFO - __main__ - Step 890: {'lr': 0.00022225, 'samples': 170880, 'steps': 889, 'loss/train': 4.031077861785889} -11/06/2021 21:24:05 - INFO - __main__ - Step 891: {'lr': 0.00022250000000000001, 'samples': 171072, 'steps': 890, 'loss/train': 4.104956150054932} -11/06/2021 21:24:05 - INFO - __main__ - Step 892: {'lr': 0.00022275000000000002, 'samples': 171264, 'steps': 891, 'loss/train': 4.234619617462158} -11/06/2021 21:24:05 - INFO - __main__ - Step 893: {'lr': 0.000223, 'samples': 171456, 'steps': 892, 'loss/train': 3.9380950927734375} -11/06/2021 21:24:06 - INFO - __main__ - Step 894: {'lr': 0.00022325, 'samples': 171648, 'steps': 893, 'loss/train': 3.4913272857666016} -11/06/2021 21:24:07 - INFO - __main__ - Step 895: {'lr': 0.0002235, 'samples': 171840, 'steps': 894, 'loss/train': 2.99515700340271} -11/06/2021 21:24:07 - INFO - __main__ - Step 896: {'lr': 0.00022375000000000002, 'samples': 172032, 'steps': 895, 'loss/train': 4.716649055480957} -11/06/2021 21:24:07 - INFO - __main__ - Step 897: {'lr': 0.000224, 'samples': 172224, 'steps': 896, 'loss/train': 3.291337251663208} -11/06/2021 21:24:08 - INFO - __main__ - Step 898: {'lr': 0.00022425, 'samples': 172416, 'steps': 897, 'loss/train': 4.090959548950195} -11/06/2021 21:24:08 - INFO - __main__ - Step 899: {'lr': 0.0002245, 'samples': 172608, 'steps': 898, 'loss/train': 4.231109142303467} -11/06/2021 21:24:09 - INFO - __main__ - Step 900: {'lr': 0.00022475000000000001, 'samples': 172800, 'steps': 899, 'loss/train': 3.5604536533355713} -11/06/2021 21:24:09 - INFO - __main__ - Step 901: {'lr': 0.00022500000000000002, 'samples': 172992, 'steps': 900, 'loss/train': 4.001966953277588} -11/06/2021 21:24:10 - INFO - __main__ - Step 902: {'lr': 0.00022525, 'samples': 173184, 'steps': 901, 'loss/train': 4.180810928344727} -11/06/2021 21:24:10 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 4.559982776641846} -11/06/2021 21:24:11 - INFO - __main__ - Step 904: {'lr': 0.00022575, 'samples': 173568, 'steps': 903, 'loss/train': 4.321451663970947} -11/06/2021 21:24:12 - INFO - __main__ - Step 905: {'lr': 0.00022600000000000002, 'samples': 173760, 'steps': 904, 'loss/train': 4.82120943069458} -11/06/2021 21:24:12 - INFO - __main__ - Step 906: {'lr': 0.00022625000000000002, 'samples': 173952, 'steps': 905, 'loss/train': 4.165206432342529} -11/06/2021 21:24:12 - INFO - __main__ - Step 907: {'lr': 0.0002265, 'samples': 174144, 'steps': 906, 'loss/train': 2.5543439388275146} -11/06/2021 21:24:13 - INFO - __main__ - Step 908: {'lr': 0.00022675, 'samples': 174336, 'steps': 907, 'loss/train': 4.742263317108154} -11/06/2021 21:24:13 - INFO - __main__ - Step 909: {'lr': 0.00022700000000000002, 'samples': 174528, 'steps': 908, 'loss/train': 4.112782001495361} -11/06/2021 21:24:14 - INFO - __main__ - Step 910: {'lr': 0.00022725000000000002, 'samples': 174720, 'steps': 909, 'loss/train': 4.566103458404541} -11/06/2021 21:24:15 - INFO - __main__ - Step 911: {'lr': 0.0002275, 'samples': 174912, 'steps': 910, 'loss/train': 4.344858169555664} -11/06/2021 21:24:15 - INFO - __main__ - Step 912: {'lr': 0.00022775, 'samples': 175104, 'steps': 911, 'loss/train': 3.5020289421081543} -11/06/2021 21:24:15 - INFO - __main__ - Step 913: {'lr': 0.000228, 'samples': 175296, 'steps': 912, 'loss/train': 4.5875163078308105} -11/06/2021 21:24:16 - INFO - __main__ - Step 914: {'lr': 0.00022825000000000002, 'samples': 175488, 'steps': 913, 'loss/train': 4.796538352966309} -11/06/2021 21:24:17 - INFO - __main__ - Step 915: {'lr': 0.00022850000000000002, 'samples': 175680, 'steps': 914, 'loss/train': 4.283998966217041} -11/06/2021 21:24:17 - INFO - __main__ - Step 916: {'lr': 0.00022875, 'samples': 175872, 'steps': 915, 'loss/train': 4.674391746520996} -11/06/2021 21:24:17 - INFO - __main__ - Step 917: {'lr': 0.000229, 'samples': 176064, 'steps': 916, 'loss/train': 5.0381999015808105} -11/06/2021 21:24:18 - INFO - __main__ - Step 918: {'lr': 0.00022925000000000002, 'samples': 176256, 'steps': 917, 'loss/train': 4.393980503082275} -11/06/2021 21:24:18 - INFO - __main__ - Step 919: {'lr': 0.00022950000000000002, 'samples': 176448, 'steps': 918, 'loss/train': 3.857478141784668} -11/06/2021 21:24:19 - INFO - __main__ - Step 920: {'lr': 0.00022975000000000003, 'samples': 176640, 'steps': 919, 'loss/train': 4.180598258972168} -11/06/2021 21:24:19 - INFO - __main__ - Step 921: {'lr': 0.00023, 'samples': 176832, 'steps': 920, 'loss/train': 4.508198261260986} -11/06/2021 21:24:20 - INFO - __main__ - Step 922: {'lr': 0.00023025, 'samples': 177024, 'steps': 921, 'loss/train': 4.902273654937744} -11/06/2021 21:24:20 - INFO - __main__ - Step 923: {'lr': 0.00023050000000000002, 'samples': 177216, 'steps': 922, 'loss/train': 3.9419641494750977} -11/06/2021 21:24:21 - INFO - __main__ - Step 924: {'lr': 0.00023075000000000003, 'samples': 177408, 'steps': 923, 'loss/train': 4.182397365570068} -11/06/2021 21:24:21 - INFO - __main__ - Step 925: {'lr': 0.000231, 'samples': 177600, 'steps': 924, 'loss/train': 5.673306941986084} -11/06/2021 21:24:22 - INFO - __main__ - Step 926: {'lr': 0.00023125, 'samples': 177792, 'steps': 925, 'loss/train': 4.469267845153809} -11/06/2021 21:24:22 - INFO - __main__ - Step 927: {'lr': 0.00023150000000000002, 'samples': 177984, 'steps': 926, 'loss/train': 4.016385078430176} -11/06/2021 21:24:23 - INFO - __main__ - Step 928: {'lr': 0.00023175000000000002, 'samples': 178176, 'steps': 927, 'loss/train': 4.510035037994385} -11/06/2021 21:24:23 - INFO - __main__ - Step 929: {'lr': 0.00023200000000000003, 'samples': 178368, 'steps': 928, 'loss/train': 3.650172233581543} -11/06/2021 21:24:23 - INFO - __main__ - Step 930: {'lr': 0.00023225, 'samples': 178560, 'steps': 929, 'loss/train': 3.8825185298919678} -11/06/2021 21:24:24 - INFO - __main__ - Step 931: {'lr': 0.0002325, 'samples': 178752, 'steps': 930, 'loss/train': 4.376020908355713} -11/06/2021 21:24:25 - INFO - __main__ - Step 932: {'lr': 0.00023275000000000002, 'samples': 178944, 'steps': 931, 'loss/train': 4.174633979797363} -11/06/2021 21:24:25 - INFO - __main__ - Step 933: {'lr': 0.00023300000000000003, 'samples': 179136, 'steps': 932, 'loss/train': 4.296014785766602} -11/06/2021 21:24:25 - INFO - __main__ - Step 934: {'lr': 0.00023325, 'samples': 179328, 'steps': 933, 'loss/train': 3.821877956390381} -11/06/2021 21:24:26 - INFO - __main__ - Step 935: {'lr': 0.0002335, 'samples': 179520, 'steps': 934, 'loss/train': 4.20390510559082} -11/06/2021 21:24:27 - INFO - __main__ - Step 936: {'lr': 0.00023375000000000002, 'samples': 179712, 'steps': 935, 'loss/train': 4.282657623291016} -11/06/2021 21:24:27 - INFO - __main__ - Step 937: {'lr': 0.00023400000000000002, 'samples': 179904, 'steps': 936, 'loss/train': 3.8457953929901123} -11/06/2021 21:24:28 - INFO - __main__ - Step 938: {'lr': 0.00023425000000000003, 'samples': 180096, 'steps': 937, 'loss/train': 4.099065780639648} -11/06/2021 21:24:28 - INFO - __main__ - Step 939: {'lr': 0.00023449999999999998, 'samples': 180288, 'steps': 938, 'loss/train': 4.02554988861084} -11/06/2021 21:24:28 - INFO - __main__ - Step 940: {'lr': 0.00023475, 'samples': 180480, 'steps': 939, 'loss/train': 4.181853294372559} -11/06/2021 21:24:29 - INFO - __main__ - Step 941: {'lr': 0.000235, 'samples': 180672, 'steps': 940, 'loss/train': 4.0363969802856445} -11/06/2021 21:24:30 - INFO - __main__ - Step 942: {'lr': 0.00023525, 'samples': 180864, 'steps': 941, 'loss/train': 4.118391036987305} -11/06/2021 21:24:30 - INFO - __main__ - Step 943: {'lr': 0.0002355, 'samples': 181056, 'steps': 942, 'loss/train': 4.28350830078125} -11/06/2021 21:24:30 - INFO - __main__ - Step 944: {'lr': 0.00023574999999999998, 'samples': 181248, 'steps': 943, 'loss/train': 3.8540680408477783} -11/06/2021 21:24:31 - INFO - __main__ - Step 945: {'lr': 0.000236, 'samples': 181440, 'steps': 944, 'loss/train': 4.089186191558838} -11/06/2021 21:24:32 - INFO - __main__ - Step 946: {'lr': 0.00023625, 'samples': 181632, 'steps': 945, 'loss/train': 4.698647975921631} -11/06/2021 21:24:32 - INFO - __main__ - Step 947: {'lr': 0.0002365, 'samples': 181824, 'steps': 946, 'loss/train': 4.4743123054504395} -11/06/2021 21:24:32 - INFO - __main__ - Step 948: {'lr': 0.00023674999999999998, 'samples': 182016, 'steps': 947, 'loss/train': 4.072103500366211} -11/06/2021 21:24:33 - INFO - __main__ - Step 949: {'lr': 0.000237, 'samples': 182208, 'steps': 948, 'loss/train': 4.225581169128418} -11/06/2021 21:24:33 - INFO - __main__ - Step 950: {'lr': 0.00023725, 'samples': 182400, 'steps': 949, 'loss/train': 4.038322448730469} -11/06/2021 21:24:34 - INFO - __main__ - Step 951: {'lr': 0.0002375, 'samples': 182592, 'steps': 950, 'loss/train': 4.349215984344482} -11/06/2021 21:24:35 - INFO - __main__ - Step 952: {'lr': 0.00023775, 'samples': 182784, 'steps': 951, 'loss/train': 4.141671180725098} -11/06/2021 21:24:35 - INFO - __main__ - Step 953: {'lr': 0.00023799999999999998, 'samples': 182976, 'steps': 952, 'loss/train': 3.437227725982666} -11/06/2021 21:24:35 - INFO - __main__ - Step 954: {'lr': 0.00023825, 'samples': 183168, 'steps': 953, 'loss/train': 4.3065505027771} -11/06/2021 21:24:36 - INFO - __main__ - Step 955: {'lr': 0.0002385, 'samples': 183360, 'steps': 954, 'loss/train': 4.3600687980651855} -11/06/2021 21:24:36 - INFO - __main__ - Step 956: {'lr': 0.00023875, 'samples': 183552, 'steps': 955, 'loss/train': 3.731297731399536} -11/06/2021 21:24:37 - INFO - __main__ - Step 957: {'lr': 0.00023899999999999998, 'samples': 183744, 'steps': 956, 'loss/train': 4.126706600189209} -11/06/2021 21:24:37 - INFO - __main__ - Step 958: {'lr': 0.00023925, 'samples': 183936, 'steps': 957, 'loss/train': 4.03998327255249} -11/06/2021 21:24:38 - INFO - __main__ - Step 959: {'lr': 0.0002395, 'samples': 184128, 'steps': 958, 'loss/train': 4.376034259796143} -11/06/2021 21:24:38 - INFO - __main__ - Step 960: {'lr': 0.00023975, 'samples': 184320, 'steps': 959, 'loss/train': 4.163696765899658} -11/06/2021 21:24:39 - INFO - __main__ - Step 961: {'lr': 0.00024, 'samples': 184512, 'steps': 960, 'loss/train': 3.9525156021118164} -11/06/2021 21:24:40 - INFO - __main__ - Step 962: {'lr': 0.00024024999999999999, 'samples': 184704, 'steps': 961, 'loss/train': 4.245794296264648} -11/06/2021 21:24:40 - INFO - __main__ - Step 963: {'lr': 0.0002405, 'samples': 184896, 'steps': 962, 'loss/train': 4.1179914474487305} -11/06/2021 21:24:41 - INFO - __main__ - Step 964: {'lr': 0.00024075, 'samples': 185088, 'steps': 963, 'loss/train': 3.9547386169433594} -11/06/2021 21:24:41 - INFO - __main__ - Step 965: {'lr': 0.000241, 'samples': 185280, 'steps': 964, 'loss/train': 5.651031494140625} -11/06/2021 21:24:41 - INFO - __main__ - Step 966: {'lr': 0.00024125, 'samples': 185472, 'steps': 965, 'loss/train': 4.45121431350708} -11/06/2021 21:24:42 - INFO - __main__ - Step 967: {'lr': 0.0002415, 'samples': 185664, 'steps': 966, 'loss/train': 4.361720561981201} -11/06/2021 21:24:43 - INFO - __main__ - Step 968: {'lr': 0.00024175, 'samples': 185856, 'steps': 967, 'loss/train': 4.614392280578613} -11/06/2021 21:24:43 - INFO - __main__ - Step 969: {'lr': 0.000242, 'samples': 186048, 'steps': 968, 'loss/train': 4.159306526184082} -11/06/2021 21:24:43 - INFO - __main__ - Step 970: {'lr': 0.00024225, 'samples': 186240, 'steps': 969, 'loss/train': 4.633758544921875} -11/06/2021 21:24:44 - INFO - __main__ - Step 971: {'lr': 0.00024249999999999999, 'samples': 186432, 'steps': 970, 'loss/train': 3.539381742477417} -11/06/2021 21:24:45 - INFO - __main__ - Step 972: {'lr': 0.00024275, 'samples': 186624, 'steps': 971, 'loss/train': 4.320156097412109} -11/06/2021 21:24:45 - INFO - __main__ - Step 973: {'lr': 0.000243, 'samples': 186816, 'steps': 972, 'loss/train': 4.2555952072143555} -11/06/2021 21:24:45 - INFO - __main__ - Step 974: {'lr': 0.00024325, 'samples': 187008, 'steps': 973, 'loss/train': 4.501039505004883} -11/06/2021 21:24:46 - INFO - __main__ - Step 975: {'lr': 0.0002435, 'samples': 187200, 'steps': 974, 'loss/train': 4.149434566497803} -11/06/2021 21:24:46 - INFO - __main__ - Step 976: {'lr': 0.00024375, 'samples': 187392, 'steps': 975, 'loss/train': 4.1013922691345215} -11/06/2021 21:24:47 - INFO - __main__ - Step 977: {'lr': 0.000244, 'samples': 187584, 'steps': 976, 'loss/train': 4.386606216430664} -11/06/2021 21:24:47 - INFO - __main__ - Step 978: {'lr': 0.00024425, 'samples': 187776, 'steps': 977, 'loss/train': 5.693066596984863} -11/06/2021 21:24:48 - INFO - __main__ - Step 979: {'lr': 0.0002445, 'samples': 187968, 'steps': 978, 'loss/train': 4.069120407104492} -11/06/2021 21:24:48 - INFO - __main__ - Step 980: {'lr': 0.00024475, 'samples': 188160, 'steps': 979, 'loss/train': 3.942934513092041} -11/06/2021 21:24:49 - INFO - __main__ - Step 981: {'lr': 0.000245, 'samples': 188352, 'steps': 980, 'loss/train': 4.399833679199219} -11/06/2021 21:24:49 - INFO - __main__ - Step 982: {'lr': 0.00024525, 'samples': 188544, 'steps': 981, 'loss/train': 4.462058067321777} -11/06/2021 21:24:50 - INFO - __main__ - Step 983: {'lr': 0.0002455, 'samples': 188736, 'steps': 982, 'loss/train': 4.437088966369629} -11/06/2021 21:24:50 - INFO - __main__ - Step 984: {'lr': 0.00024575, 'samples': 188928, 'steps': 983, 'loss/train': 3.954718828201294} -11/06/2021 21:24:51 - INFO - __main__ - Step 985: {'lr': 0.000246, 'samples': 189120, 'steps': 984, 'loss/train': 3.88590669631958} -11/06/2021 21:24:51 - INFO - __main__ - Step 986: {'lr': 0.00024625, 'samples': 189312, 'steps': 985, 'loss/train': 4.265262603759766} -11/06/2021 21:24:51 - INFO - __main__ - Step 987: {'lr': 0.00024650000000000003, 'samples': 189504, 'steps': 986, 'loss/train': 3.8113763332366943} -11/06/2021 21:24:52 - INFO - __main__ - Step 988: {'lr': 0.00024675, 'samples': 189696, 'steps': 987, 'loss/train': 4.336015701293945} -11/06/2021 21:24:53 - INFO - __main__ - Step 989: {'lr': 0.000247, 'samples': 189888, 'steps': 988, 'loss/train': 3.8807554244995117} -11/06/2021 21:24:53 - INFO - __main__ - Step 990: {'lr': 0.00024725, 'samples': 190080, 'steps': 989, 'loss/train': 3.6231210231781006} -11/06/2021 21:24:53 - INFO - __main__ - Step 991: {'lr': 0.0002475, 'samples': 190272, 'steps': 990, 'loss/train': 4.3600897789001465} -11/06/2021 21:24:54 - INFO - __main__ - Step 992: {'lr': 0.00024775, 'samples': 190464, 'steps': 991, 'loss/train': 4.003350734710693} -11/06/2021 21:24:55 - INFO - __main__ - Step 993: {'lr': 0.000248, 'samples': 190656, 'steps': 992, 'loss/train': 4.158915996551514} -11/06/2021 21:24:55 - INFO - __main__ - Step 994: {'lr': 0.00024825, 'samples': 190848, 'steps': 993, 'loss/train': 4.062311172485352} -11/06/2021 21:24:55 - INFO - __main__ - Step 995: {'lr': 0.0002485, 'samples': 191040, 'steps': 994, 'loss/train': 4.686992645263672} -11/06/2021 21:24:56 - INFO - __main__ - Step 996: {'lr': 0.00024875, 'samples': 191232, 'steps': 995, 'loss/train': 4.652307510375977} -11/06/2021 21:24:57 - INFO - __main__ - Step 997: {'lr': 0.000249, 'samples': 191424, 'steps': 996, 'loss/train': 4.7089762687683105} -11/06/2021 21:24:57 - INFO - __main__ - Step 998: {'lr': 0.00024925, 'samples': 191616, 'steps': 997, 'loss/train': 4.194471836090088} -11/06/2021 21:24:57 - INFO - __main__ - Step 999: {'lr': 0.0002495, 'samples': 191808, 'steps': 998, 'loss/train': 4.319421768188477} -11/06/2021 21:24:58 - INFO - __main__ - Step 1000: {'lr': 0.00024975, 'samples': 192000, 'steps': 999, 'loss/train': 4.688298225402832} -11/06/2021 21:24:58 - INFO - __main__ - Step 1001: {'lr': 0.00025, 'samples': 192192, 'steps': 1000, 'loss/train': 5.178300857543945} -11/06/2021 21:24:58 - INFO - __main__ - Step 1002: {'lr': 0.00025025, 'samples': 192384, 'steps': 1001, 'loss/train': 4.494810104370117} -11/06/2021 21:25:00 - INFO - __main__ - Step 1003: {'lr': 0.0002505, 'samples': 192576, 'steps': 1002, 'loss/train': 4.467245101928711} -11/06/2021 21:25:00 - INFO - __main__ - Step 1004: {'lr': 0.00025075, 'samples': 192768, 'steps': 1003, 'loss/train': 3.843966484069824} -11/06/2021 21:25:00 - INFO - __main__ - Step 1005: {'lr': 0.00025100000000000003, 'samples': 192960, 'steps': 1004, 'loss/train': 3.936264753341675} -11/06/2021 21:25:01 - INFO - __main__ - Step 1006: {'lr': 0.00025124999999999995, 'samples': 193152, 'steps': 1005, 'loss/train': 2.070441961288452} -11/06/2021 21:25:01 - INFO - __main__ - Step 1007: {'lr': 0.0002515, 'samples': 193344, 'steps': 1006, 'loss/train': 2.1154818534851074} -11/06/2021 21:25:01 - INFO - __main__ - Step 1008: {'lr': 0.00025174999999999997, 'samples': 193536, 'steps': 1007, 'loss/train': 4.228350639343262} -11/06/2021 21:25:02 - INFO - __main__ - Step 1009: {'lr': 0.000252, 'samples': 193728, 'steps': 1008, 'loss/train': 3.9860525131225586} -11/06/2021 21:25:03 - INFO - __main__ - Step 1010: {'lr': 0.00025225, 'samples': 193920, 'steps': 1009, 'loss/train': 4.507659912109375} -11/06/2021 21:25:03 - INFO - __main__ - Step 1011: {'lr': 0.0002525, 'samples': 194112, 'steps': 1010, 'loss/train': 4.104220867156982} -11/06/2021 21:25:04 - INFO - __main__ - Step 1012: {'lr': 0.00025275, 'samples': 194304, 'steps': 1011, 'loss/train': 3.661561965942383} -11/06/2021 21:25:04 - INFO - __main__ - Step 1013: {'lr': 0.000253, 'samples': 194496, 'steps': 1012, 'loss/train': 4.302820682525635} -11/06/2021 21:25:05 - INFO - __main__ - Step 1014: {'lr': 0.00025325, 'samples': 194688, 'steps': 1013, 'loss/train': 4.471502780914307} -11/06/2021 21:25:05 - INFO - __main__ - Step 1015: {'lr': 0.0002535, 'samples': 194880, 'steps': 1014, 'loss/train': 4.165027141571045} -11/06/2021 21:25:06 - INFO - __main__ - Step 1016: {'lr': 0.00025374999999999996, 'samples': 195072, 'steps': 1015, 'loss/train': 3.9462151527404785} -11/06/2021 21:25:06 - INFO - __main__ - Step 1017: {'lr': 0.000254, 'samples': 195264, 'steps': 1016, 'loss/train': 6.699620723724365} -11/06/2021 21:25:06 - INFO - __main__ - Step 1018: {'lr': 0.00025425, 'samples': 195456, 'steps': 1017, 'loss/train': 3.6332051753997803} -11/06/2021 21:25:07 - INFO - __main__ - Step 1019: {'lr': 0.0002545, 'samples': 195648, 'steps': 1018, 'loss/train': 4.286611080169678} -11/06/2021 21:25:08 - INFO - __main__ - Step 1020: {'lr': 0.00025475, 'samples': 195840, 'steps': 1019, 'loss/train': 3.8143672943115234} -11/06/2021 21:25:08 - INFO - __main__ - Step 1021: {'lr': 0.000255, 'samples': 196032, 'steps': 1020, 'loss/train': 3.97232723236084} -11/06/2021 21:25:08 - INFO - __main__ - Step 1022: {'lr': 0.00025525, 'samples': 196224, 'steps': 1021, 'loss/train': 4.28098726272583} -11/06/2021 21:25:09 - INFO - __main__ - Step 1023: {'lr': 0.00025550000000000003, 'samples': 196416, 'steps': 1022, 'loss/train': 4.043383598327637} -11/06/2021 21:25:10 - INFO - __main__ - Step 1024: {'lr': 0.00025575, 'samples': 196608, 'steps': 1023, 'loss/train': 4.659992218017578} -11/06/2021 21:25:10 - INFO - __main__ - Step 1025: {'lr': 0.000256, 'samples': 196800, 'steps': 1024, 'loss/train': 4.093658924102783} -11/06/2021 21:25:10 - INFO - __main__ - Step 1026: {'lr': 0.00025624999999999997, 'samples': 196992, 'steps': 1025, 'loss/train': 3.535585880279541} -11/06/2021 21:25:11 - INFO - __main__ - Step 1027: {'lr': 0.0002565, 'samples': 197184, 'steps': 1026, 'loss/train': 4.1824493408203125} -11/06/2021 21:25:11 - INFO - __main__ - Step 1028: {'lr': 0.00025675, 'samples': 197376, 'steps': 1027, 'loss/train': 4.0930609703063965} -11/06/2021 21:25:11 - INFO - __main__ - Step 1029: {'lr': 0.000257, 'samples': 197568, 'steps': 1028, 'loss/train': 3.6540799140930176} -11/06/2021 21:25:13 - INFO - __main__ - Step 1030: {'lr': 0.00025725, 'samples': 197760, 'steps': 1029, 'loss/train': 4.0925822257995605} -11/06/2021 21:25:13 - INFO - __main__ - Step 1031: {'lr': 0.0002575, 'samples': 197952, 'steps': 1030, 'loss/train': 3.85776424407959} -11/06/2021 21:25:13 - INFO - __main__ - Step 1032: {'lr': 0.00025775, 'samples': 198144, 'steps': 1031, 'loss/train': 4.097292423248291} -11/06/2021 21:25:14 - INFO - __main__ - Step 1033: {'lr': 0.00025800000000000004, 'samples': 198336, 'steps': 1032, 'loss/train': 1.9851371049880981} -11/06/2021 21:25:14 - INFO - __main__ - Step 1034: {'lr': 0.00025824999999999996, 'samples': 198528, 'steps': 1033, 'loss/train': 4.119291305541992} -11/06/2021 21:25:15 - INFO - __main__ - Step 1035: {'lr': 0.0002585, 'samples': 198720, 'steps': 1034, 'loss/train': 4.1994733810424805} -11/06/2021 21:25:15 - INFO - __main__ - Step 1036: {'lr': 0.00025875, 'samples': 198912, 'steps': 1035, 'loss/train': 4.295950412750244} -11/06/2021 21:25:16 - INFO - __main__ - Step 1037: {'lr': 0.000259, 'samples': 199104, 'steps': 1036, 'loss/train': 3.5869834423065186} -11/06/2021 21:25:16 - INFO - __main__ - Step 1038: {'lr': 0.00025925, 'samples': 199296, 'steps': 1037, 'loss/train': 5.716175556182861} -11/06/2021 21:25:16 - INFO - __main__ - Step 1039: {'lr': 0.0002595, 'samples': 199488, 'steps': 1038, 'loss/train': 4.104729175567627} -11/06/2021 21:25:18 - INFO - __main__ - Step 1040: {'lr': 0.00025975, 'samples': 199680, 'steps': 1039, 'loss/train': 4.121339321136475} -11/06/2021 21:25:18 - INFO - __main__ - Step 1041: {'lr': 0.00026000000000000003, 'samples': 199872, 'steps': 1040, 'loss/train': 4.044469356536865} -11/06/2021 21:25:18 - INFO - __main__ - Step 1042: {'lr': 0.00026025, 'samples': 200064, 'steps': 1041, 'loss/train': 4.489924430847168} -11/06/2021 21:25:19 - INFO - __main__ - Step 1043: {'lr': 0.0002605, 'samples': 200256, 'steps': 1042, 'loss/train': 4.626270771026611} -11/06/2021 21:25:19 - INFO - __main__ - Step 1044: {'lr': 0.00026074999999999997, 'samples': 200448, 'steps': 1043, 'loss/train': 3.788095712661743} -11/06/2021 21:25:20 - INFO - __main__ - Step 1045: {'lr': 0.000261, 'samples': 200640, 'steps': 1044, 'loss/train': 4.697029113769531} -11/06/2021 21:25:20 - INFO - __main__ - Step 1046: {'lr': 0.00026125, 'samples': 200832, 'steps': 1045, 'loss/train': 3.7859976291656494} -11/06/2021 21:25:21 - INFO - __main__ - Step 1047: {'lr': 0.0002615, 'samples': 201024, 'steps': 1046, 'loss/train': 4.636324405670166} -11/06/2021 21:25:21 - INFO - __main__ - Step 1048: {'lr': 0.00026175, 'samples': 201216, 'steps': 1047, 'loss/train': 4.295483112335205} -11/06/2021 21:25:21 - INFO - __main__ - Step 1049: {'lr': 0.000262, 'samples': 201408, 'steps': 1048, 'loss/train': 3.938405990600586} -11/06/2021 21:25:22 - INFO - __main__ - Step 1050: {'lr': 0.00026225, 'samples': 201600, 'steps': 1049, 'loss/train': 5.09901762008667} -11/06/2021 21:25:23 - INFO - __main__ - Step 1051: {'lr': 0.00026250000000000004, 'samples': 201792, 'steps': 1050, 'loss/train': 4.2966108322143555} -11/06/2021 21:25:23 - INFO - __main__ - Step 1052: {'lr': 0.00026274999999999996, 'samples': 201984, 'steps': 1051, 'loss/train': 3.858107805252075} -11/06/2021 21:25:23 - INFO - __main__ - Step 1053: {'lr': 0.000263, 'samples': 202176, 'steps': 1052, 'loss/train': 4.3338303565979} -11/06/2021 21:25:24 - INFO - __main__ - Step 1054: {'lr': 0.00026325, 'samples': 202368, 'steps': 1053, 'loss/train': 4.086007118225098} -11/06/2021 21:25:25 - INFO - __main__ - Step 1055: {'lr': 0.0002635, 'samples': 202560, 'steps': 1054, 'loss/train': 3.4907381534576416} -11/06/2021 21:25:25 - INFO - __main__ - Step 1056: {'lr': 0.00026375, 'samples': 202752, 'steps': 1055, 'loss/train': 6.328280925750732} -11/06/2021 21:25:26 - INFO - __main__ - Step 1057: {'lr': 0.000264, 'samples': 202944, 'steps': 1056, 'loss/train': 4.75831413269043} -11/06/2021 21:25:26 - INFO - __main__ - Step 1058: {'lr': 0.00026425, 'samples': 203136, 'steps': 1057, 'loss/train': 4.140725135803223} -11/06/2021 21:25:26 - INFO - __main__ - Step 1059: {'lr': 0.00026450000000000003, 'samples': 203328, 'steps': 1058, 'loss/train': 4.232659339904785} -11/06/2021 21:25:27 - INFO - __main__ - Step 1060: {'lr': 0.00026475, 'samples': 203520, 'steps': 1059, 'loss/train': 3.662130117416382} -11/06/2021 21:25:28 - INFO - __main__ - Step 1061: {'lr': 0.00026500000000000004, 'samples': 203712, 'steps': 1060, 'loss/train': 4.175182819366455} -11/06/2021 21:25:28 - INFO - __main__ - Step 1062: {'lr': 0.00026524999999999997, 'samples': 203904, 'steps': 1061, 'loss/train': 4.066892623901367} -11/06/2021 21:25:28 - INFO - __main__ - Step 1063: {'lr': 0.0002655, 'samples': 204096, 'steps': 1062, 'loss/train': 3.988063335418701} -11/06/2021 21:25:29 - INFO - __main__ - Step 1064: {'lr': 0.00026575, 'samples': 204288, 'steps': 1063, 'loss/train': 5.1581830978393555} -11/06/2021 21:25:29 - INFO - __main__ - Step 1065: {'lr': 0.000266, 'samples': 204480, 'steps': 1064, 'loss/train': 3.77549409866333} -11/06/2021 21:25:30 - INFO - __main__ - Step 1066: {'lr': 0.00026625, 'samples': 204672, 'steps': 1065, 'loss/train': 3.962754011154175} -11/06/2021 21:25:30 - INFO - __main__ - Step 1067: {'lr': 0.0002665, 'samples': 204864, 'steps': 1066, 'loss/train': 4.140915393829346} -11/06/2021 21:25:31 - INFO - __main__ - Step 1068: {'lr': 0.00026675, 'samples': 205056, 'steps': 1067, 'loss/train': 3.9314892292022705} -11/06/2021 21:25:31 - INFO - __main__ - Step 1069: {'lr': 0.00026700000000000004, 'samples': 205248, 'steps': 1068, 'loss/train': 4.5690155029296875} -11/06/2021 21:25:31 - INFO - __main__ - Step 1070: {'lr': 0.00026725, 'samples': 205440, 'steps': 1069, 'loss/train': 2.362624168395996} -11/06/2021 21:25:33 - INFO - __main__ - Step 1071: {'lr': 0.0002675, 'samples': 205632, 'steps': 1070, 'loss/train': 3.6357979774475098} -11/06/2021 21:25:33 - INFO - __main__ - Step 1072: {'lr': 0.00026775, 'samples': 205824, 'steps': 1071, 'loss/train': 4.618821144104004} -11/06/2021 21:25:33 - INFO - __main__ - Step 1073: {'lr': 0.000268, 'samples': 206016, 'steps': 1072, 'loss/train': 3.773068904876709} -11/06/2021 21:25:34 - INFO - __main__ - Step 1074: {'lr': 0.00026825, 'samples': 206208, 'steps': 1073, 'loss/train': 3.240086078643799} -11/06/2021 21:25:34 - INFO - __main__ - Step 1075: {'lr': 0.0002685, 'samples': 206400, 'steps': 1074, 'loss/train': 5.478127479553223} -11/06/2021 21:25:35 - INFO - __main__ - Step 1076: {'lr': 0.00026875, 'samples': 206592, 'steps': 1075, 'loss/train': 4.112662315368652} -11/06/2021 21:25:35 - INFO - __main__ - Step 1077: {'lr': 0.00026900000000000003, 'samples': 206784, 'steps': 1076, 'loss/train': 4.273911476135254} -11/06/2021 21:25:36 - INFO - __main__ - Step 1078: {'lr': 0.00026925, 'samples': 206976, 'steps': 1077, 'loss/train': 4.561737060546875} -11/06/2021 21:25:36 - INFO - __main__ - Step 1079: {'lr': 0.00026950000000000005, 'samples': 207168, 'steps': 1078, 'loss/train': 4.370131015777588} -11/06/2021 21:25:36 - INFO - __main__ - Step 1080: {'lr': 0.00026974999999999997, 'samples': 207360, 'steps': 1079, 'loss/train': 4.151457786560059} -11/06/2021 21:25:37 - INFO - __main__ - Step 1081: {'lr': 0.00027, 'samples': 207552, 'steps': 1080, 'loss/train': 4.187550067901611} -11/06/2021 21:25:38 - INFO - __main__ - Step 1082: {'lr': 0.00027025, 'samples': 207744, 'steps': 1081, 'loss/train': 3.7700130939483643} -11/06/2021 21:25:38 - INFO - __main__ - Step 1083: {'lr': 0.0002705, 'samples': 207936, 'steps': 1082, 'loss/train': 3.5349581241607666} -11/06/2021 21:25:38 - INFO - __main__ - Step 1084: {'lr': 0.00027075, 'samples': 208128, 'steps': 1083, 'loss/train': 3.959185838699341} -11/06/2021 21:25:39 - INFO - __main__ - Step 1085: {'lr': 0.00027100000000000003, 'samples': 208320, 'steps': 1084, 'loss/train': 4.234473705291748} -11/06/2021 21:25:40 - INFO - __main__ - Step 1086: {'lr': 0.00027125, 'samples': 208512, 'steps': 1085, 'loss/train': 4.3777313232421875} -11/06/2021 21:25:40 - INFO - __main__ - Step 1087: {'lr': 0.00027150000000000004, 'samples': 208704, 'steps': 1086, 'loss/train': 4.0575103759765625} -11/06/2021 21:25:41 - INFO - __main__ - Step 1088: {'lr': 0.00027175, 'samples': 208896, 'steps': 1087, 'loss/train': 3.6606838703155518} -11/06/2021 21:25:41 - INFO - __main__ - Step 1089: {'lr': 0.00027200000000000005, 'samples': 209088, 'steps': 1088, 'loss/train': 4.134492874145508} -11/06/2021 21:25:41 - INFO - __main__ - Step 1090: {'lr': 0.00027225, 'samples': 209280, 'steps': 1089, 'loss/train': 3.7823238372802734} -11/06/2021 21:25:42 - INFO - __main__ - Step 1091: {'lr': 0.0002725, 'samples': 209472, 'steps': 1090, 'loss/train': 3.5656397342681885} -11/06/2021 21:25:43 - INFO - __main__ - Step 1092: {'lr': 0.00027275, 'samples': 209664, 'steps': 1091, 'loss/train': 4.612241744995117} -11/06/2021 21:25:43 - INFO - __main__ - Step 1093: {'lr': 0.000273, 'samples': 209856, 'steps': 1092, 'loss/train': 4.211349010467529} -11/06/2021 21:25:43 - INFO - __main__ - Step 1094: {'lr': 0.00027325, 'samples': 210048, 'steps': 1093, 'loss/train': 3.8772196769714355} -11/06/2021 21:25:44 - INFO - __main__ - Step 1095: {'lr': 0.00027350000000000003, 'samples': 210240, 'steps': 1094, 'loss/train': 4.242520332336426} -11/06/2021 21:25:45 - INFO - __main__ - Step 1096: {'lr': 0.00027375, 'samples': 210432, 'steps': 1095, 'loss/train': 4.067473411560059} -11/06/2021 21:25:45 - INFO - __main__ - Step 1097: {'lr': 0.00027400000000000005, 'samples': 210624, 'steps': 1096, 'loss/train': 4.022539138793945} -11/06/2021 21:25:46 - INFO - __main__ - Step 1098: {'lr': 0.00027425, 'samples': 210816, 'steps': 1097, 'loss/train': 3.810528516769409} -11/06/2021 21:25:46 - INFO - __main__ - Step 1099: {'lr': 0.0002745, 'samples': 211008, 'steps': 1098, 'loss/train': 4.089423179626465} -11/06/2021 21:25:47 - INFO - __main__ - Step 1100: {'lr': 0.00027475, 'samples': 211200, 'steps': 1099, 'loss/train': 4.257665157318115} -11/06/2021 21:25:48 - INFO - __main__ - Step 1101: {'lr': 0.000275, 'samples': 211392, 'steps': 1100, 'loss/train': 4.2323384284973145} -11/06/2021 21:25:48 - INFO - __main__ - Step 1102: {'lr': 0.00027525, 'samples': 211584, 'steps': 1101, 'loss/train': 4.789181709289551} -11/06/2021 21:25:48 - INFO - __main__ - Step 1103: {'lr': 0.00027550000000000003, 'samples': 211776, 'steps': 1102, 'loss/train': 6.588270664215088} -11/06/2021 21:25:49 - INFO - __main__ - Step 1104: {'lr': 0.00027575, 'samples': 211968, 'steps': 1103, 'loss/train': 3.7694168090820312} -11/06/2021 21:25:49 - INFO - __main__ - Step 1105: {'lr': 0.00027600000000000004, 'samples': 212160, 'steps': 1104, 'loss/train': 3.7395424842834473} -11/06/2021 21:25:50 - INFO - __main__ - Step 1106: {'lr': 0.00027625, 'samples': 212352, 'steps': 1105, 'loss/train': 4.408657073974609} -11/06/2021 21:25:51 - INFO - __main__ - Step 1107: {'lr': 0.00027650000000000005, 'samples': 212544, 'steps': 1106, 'loss/train': 4.209283828735352} -11/06/2021 21:25:51 - INFO - __main__ - Step 1108: {'lr': 0.00027675, 'samples': 212736, 'steps': 1107, 'loss/train': 4.449584007263184} -11/06/2021 21:25:51 - INFO - __main__ - Step 1109: {'lr': 0.000277, 'samples': 212928, 'steps': 1108, 'loss/train': 3.7549164295196533} -11/06/2021 21:25:52 - INFO - __main__ - Step 1110: {'lr': 0.00027725, 'samples': 213120, 'steps': 1109, 'loss/train': 4.272808074951172} -11/06/2021 21:25:52 - INFO - __main__ - Step 1111: {'lr': 0.0002775, 'samples': 213312, 'steps': 1110, 'loss/train': 4.251165390014648} -11/06/2021 21:25:53 - INFO - __main__ - Step 1112: {'lr': 0.00027775, 'samples': 213504, 'steps': 1111, 'loss/train': 4.609951972961426} -11/06/2021 21:25:54 - INFO - __main__ - Step 1113: {'lr': 0.00027800000000000004, 'samples': 213696, 'steps': 1112, 'loss/train': 4.141632556915283} -11/06/2021 21:25:54 - INFO - __main__ - Step 1114: {'lr': 0.00027825, 'samples': 213888, 'steps': 1113, 'loss/train': 4.153262615203857} -11/06/2021 21:25:54 - INFO - __main__ - Step 1115: {'lr': 0.00027850000000000005, 'samples': 214080, 'steps': 1114, 'loss/train': 3.717008113861084} -11/06/2021 21:25:55 - INFO - __main__ - Step 1116: {'lr': 0.00027875, 'samples': 214272, 'steps': 1115, 'loss/train': 3.0349667072296143} -11/06/2021 21:25:56 - INFO - __main__ - Step 1117: {'lr': 0.000279, 'samples': 214464, 'steps': 1116, 'loss/train': 5.148609161376953} -11/06/2021 21:25:56 - INFO - __main__ - Step 1118: {'lr': 0.00027925, 'samples': 214656, 'steps': 1117, 'loss/train': 4.0414958000183105} -11/06/2021 21:25:56 - INFO - __main__ - Step 1119: {'lr': 0.0002795, 'samples': 214848, 'steps': 1118, 'loss/train': 3.6977531909942627} -11/06/2021 21:25:57 - INFO - __main__ - Step 1120: {'lr': 0.00027975, 'samples': 215040, 'steps': 1119, 'loss/train': 3.3791584968566895} -11/06/2021 21:25:57 - INFO - __main__ - Step 1121: {'lr': 0.00028000000000000003, 'samples': 215232, 'steps': 1120, 'loss/train': 3.486509084701538} -11/06/2021 21:25:57 - INFO - __main__ - Step 1122: {'lr': 0.00028025, 'samples': 215424, 'steps': 1121, 'loss/train': 4.281680583953857} -11/06/2021 21:25:59 - INFO - __main__ - Step 1123: {'lr': 0.00028050000000000004, 'samples': 215616, 'steps': 1122, 'loss/train': 5.040244102478027} -11/06/2021 21:25:59 - INFO - __main__ - Step 1124: {'lr': 0.00028075, 'samples': 215808, 'steps': 1123, 'loss/train': 3.963624954223633} -11/06/2021 21:25:59 - INFO - __main__ - Step 1125: {'lr': 0.00028100000000000005, 'samples': 216000, 'steps': 1124, 'loss/train': 3.8375720977783203} -11/06/2021 21:26:00 - INFO - __main__ - Step 1126: {'lr': 0.00028125000000000003, 'samples': 216192, 'steps': 1125, 'loss/train': 4.240171432495117} -11/06/2021 21:26:00 - INFO - __main__ - Step 1127: {'lr': 0.00028149999999999996, 'samples': 216384, 'steps': 1126, 'loss/train': 3.637873888015747} -11/06/2021 21:26:01 - INFO - __main__ - Step 1128: {'lr': 0.00028175, 'samples': 216576, 'steps': 1127, 'loss/train': 3.8652379512786865} -11/06/2021 21:26:01 - INFO - __main__ - Step 1129: {'lr': 0.00028199999999999997, 'samples': 216768, 'steps': 1128, 'loss/train': 4.120966911315918} -11/06/2021 21:26:02 - INFO - __main__ - Step 1130: {'lr': 0.00028225, 'samples': 216960, 'steps': 1129, 'loss/train': 4.294138431549072} -11/06/2021 21:26:02 - INFO - __main__ - Step 1131: {'lr': 0.0002825, 'samples': 217152, 'steps': 1130, 'loss/train': 3.7788121700286865} -11/06/2021 21:26:02 - INFO - __main__ - Step 1132: {'lr': 0.00028275, 'samples': 217344, 'steps': 1131, 'loss/train': 3.901336908340454} -11/06/2021 21:26:03 - INFO - __main__ - Step 1133: {'lr': 0.000283, 'samples': 217536, 'steps': 1132, 'loss/train': 4.027707099914551} -11/06/2021 21:26:04 - INFO - __main__ - Step 1134: {'lr': 0.00028325000000000003, 'samples': 217728, 'steps': 1133, 'loss/train': 4.218957424163818} -11/06/2021 21:26:04 - INFO - __main__ - Step 1135: {'lr': 0.0002835, 'samples': 217920, 'steps': 1134, 'loss/train': 4.311142444610596} -11/06/2021 21:26:05 - INFO - __main__ - Step 1136: {'lr': 0.00028375, 'samples': 218112, 'steps': 1135, 'loss/train': 4.181615352630615} -11/06/2021 21:26:05 - INFO - __main__ - Step 1137: {'lr': 0.00028399999999999996, 'samples': 218304, 'steps': 1136, 'loss/train': 3.916645050048828} -11/06/2021 21:26:06 - INFO - __main__ - Step 1138: {'lr': 0.00028425, 'samples': 218496, 'steps': 1137, 'loss/train': 4.085984706878662} -11/06/2021 21:26:06 - INFO - __main__ - Step 1139: {'lr': 0.0002845, 'samples': 218688, 'steps': 1138, 'loss/train': 4.673676013946533} -11/06/2021 21:26:07 - INFO - __main__ - Step 1140: {'lr': 0.00028475, 'samples': 218880, 'steps': 1139, 'loss/train': 4.280994415283203} -11/06/2021 21:26:07 - INFO - __main__ - Step 1141: {'lr': 0.000285, 'samples': 219072, 'steps': 1140, 'loss/train': 4.047427177429199} -11/06/2021 21:26:07 - INFO - __main__ - Step 1142: {'lr': 0.00028525, 'samples': 219264, 'steps': 1141, 'loss/train': 3.885024070739746} -11/06/2021 21:26:08 - INFO - __main__ - Step 1143: {'lr': 0.0002855, 'samples': 219456, 'steps': 1142, 'loss/train': 4.40393590927124} -11/06/2021 21:26:09 - INFO - __main__ - Step 1144: {'lr': 0.00028575000000000003, 'samples': 219648, 'steps': 1143, 'loss/train': 4.992481708526611} -11/06/2021 21:26:09 - INFO - __main__ - Step 1145: {'lr': 0.00028599999999999996, 'samples': 219840, 'steps': 1144, 'loss/train': 4.026183128356934} -11/06/2021 21:26:10 - INFO - __main__ - Step 1146: {'lr': 0.00028625, 'samples': 220032, 'steps': 1145, 'loss/train': 3.5987935066223145} -11/06/2021 21:26:10 - INFO - __main__ - Step 1147: {'lr': 0.00028649999999999997, 'samples': 220224, 'steps': 1146, 'loss/train': 4.403866767883301} -11/06/2021 21:26:11 - INFO - __main__ - Step 1148: {'lr': 0.00028675, 'samples': 220416, 'steps': 1147, 'loss/train': 3.9268059730529785} -11/06/2021 21:26:11 - INFO - __main__ - Step 1149: {'lr': 0.000287, 'samples': 220608, 'steps': 1148, 'loss/train': 3.6902759075164795} -11/06/2021 21:26:12 - INFO - __main__ - Step 1150: {'lr': 0.00028725, 'samples': 220800, 'steps': 1149, 'loss/train': 4.134997367858887} -11/06/2021 21:26:12 - INFO - __main__ - Step 1151: {'lr': 0.0002875, 'samples': 220992, 'steps': 1150, 'loss/train': 3.9367594718933105} -11/06/2021 21:26:12 - INFO - __main__ - Step 1152: {'lr': 0.00028775000000000003, 'samples': 221184, 'steps': 1151, 'loss/train': 3.4053988456726074} -11/06/2021 21:26:13 - INFO - __main__ - Step 1153: {'lr': 0.000288, 'samples': 221376, 'steps': 1152, 'loss/train': 4.11300802230835} -11/06/2021 21:26:14 - INFO - __main__ - Step 1154: {'lr': 0.00028825, 'samples': 221568, 'steps': 1153, 'loss/train': 3.790684700012207} -11/06/2021 21:26:14 - INFO - __main__ - Step 1155: {'lr': 0.00028849999999999997, 'samples': 221760, 'steps': 1154, 'loss/train': 4.096200942993164} -11/06/2021 21:26:14 - INFO - __main__ - Step 1156: {'lr': 0.00028875, 'samples': 221952, 'steps': 1155, 'loss/train': 4.3799262046813965} -11/06/2021 21:26:15 - INFO - __main__ - Step 1157: {'lr': 0.000289, 'samples': 222144, 'steps': 1156, 'loss/train': 4.1134748458862305} -11/06/2021 21:26:15 - INFO - __main__ - Step 1158: {'lr': 0.00028925, 'samples': 222336, 'steps': 1157, 'loss/train': 4.462249755859375} -11/06/2021 21:26:16 - INFO - __main__ - Step 1159: {'lr': 0.0002895, 'samples': 222528, 'steps': 1158, 'loss/train': 2.7520174980163574} -11/06/2021 21:26:16 - INFO - __main__ - Step 1160: {'lr': 0.00028975, 'samples': 222720, 'steps': 1159, 'loss/train': 4.172967910766602} -11/06/2021 21:26:17 - INFO - __main__ - Step 1161: {'lr': 0.00029, 'samples': 222912, 'steps': 1160, 'loss/train': 3.451906204223633} -11/06/2021 21:26:17 - INFO - __main__ - Step 1162: {'lr': 0.00029025000000000003, 'samples': 223104, 'steps': 1161, 'loss/train': 4.355815887451172} -11/06/2021 21:26:18 - INFO - __main__ - Step 1163: {'lr': 0.00029049999999999996, 'samples': 223296, 'steps': 1162, 'loss/train': 4.1517109870910645} -11/06/2021 21:26:19 - INFO - __main__ - Step 1164: {'lr': 0.00029075, 'samples': 223488, 'steps': 1163, 'loss/train': 4.004212856292725} -11/06/2021 21:26:19 - INFO - __main__ - Step 1165: {'lr': 0.00029099999999999997, 'samples': 223680, 'steps': 1164, 'loss/train': 4.073708534240723} -11/06/2021 21:26:19 - INFO - __main__ - Step 1166: {'lr': 0.00029125, 'samples': 223872, 'steps': 1165, 'loss/train': 4.045283317565918} -11/06/2021 21:26:20 - INFO - __main__ - Step 1167: {'lr': 0.0002915, 'samples': 224064, 'steps': 1166, 'loss/train': 3.959521770477295} -11/06/2021 21:26:20 - INFO - __main__ - Step 1168: {'lr': 0.00029175, 'samples': 224256, 'steps': 1167, 'loss/train': 3.8172402381896973} -11/06/2021 21:26:21 - INFO - __main__ - Step 1169: {'lr': 0.000292, 'samples': 224448, 'steps': 1168, 'loss/train': 3.809446096420288} -11/06/2021 21:26:21 - INFO - __main__ - Step 1170: {'lr': 0.00029225000000000003, 'samples': 224640, 'steps': 1169, 'loss/train': 4.352285385131836} -11/06/2021 21:26:22 - INFO - __main__ - Step 1171: {'lr': 0.0002925, 'samples': 224832, 'steps': 1170, 'loss/train': 3.0493404865264893} -11/06/2021 21:26:22 - INFO - __main__ - Step 1172: {'lr': 0.00029275000000000004, 'samples': 225024, 'steps': 1171, 'loss/train': 4.092573642730713} -11/06/2021 21:26:22 - INFO - __main__ - Step 1173: {'lr': 0.00029299999999999997, 'samples': 225216, 'steps': 1172, 'loss/train': 4.186103820800781} -11/06/2021 21:26:23 - INFO - __main__ - Step 1174: {'lr': 0.00029325, 'samples': 225408, 'steps': 1173, 'loss/train': 3.786396026611328} -11/06/2021 21:26:24 - INFO - __main__ - Step 1175: {'lr': 0.0002935, 'samples': 225600, 'steps': 1174, 'loss/train': 4.53329610824585} -11/06/2021 21:26:24 - INFO - __main__ - Step 1176: {'lr': 0.00029375, 'samples': 225792, 'steps': 1175, 'loss/train': 3.6532394886016846} -11/06/2021 21:26:24 - INFO - __main__ - Step 1177: {'lr': 0.000294, 'samples': 225984, 'steps': 1176, 'loss/train': 3.6320600509643555} -11/06/2021 21:26:25 - INFO - __main__ - Step 1178: {'lr': 0.00029425, 'samples': 226176, 'steps': 1177, 'loss/train': 3.9214487075805664} -11/06/2021 21:26:26 - INFO - __main__ - Step 1179: {'lr': 0.0002945, 'samples': 226368, 'steps': 1178, 'loss/train': 3.6811251640319824} -11/06/2021 21:26:26 - INFO - __main__ - Step 1180: {'lr': 0.00029475000000000004, 'samples': 226560, 'steps': 1179, 'loss/train': 3.892512559890747} -11/06/2021 21:26:27 - INFO - __main__ - Step 1181: {'lr': 0.000295, 'samples': 226752, 'steps': 1180, 'loss/train': 4.335596561431885} -11/06/2021 21:26:27 - INFO - __main__ - Step 1182: {'lr': 0.00029525, 'samples': 226944, 'steps': 1181, 'loss/train': 3.9504594802856445} -11/06/2021 21:26:27 - INFO - __main__ - Step 1183: {'lr': 0.00029549999999999997, 'samples': 227136, 'steps': 1182, 'loss/train': 4.172230243682861} -11/06/2021 21:26:28 - INFO - __main__ - Step 1184: {'lr': 0.00029575, 'samples': 227328, 'steps': 1183, 'loss/train': 4.093757152557373} -11/06/2021 21:26:29 - INFO - __main__ - Step 1185: {'lr': 0.000296, 'samples': 227520, 'steps': 1184, 'loss/train': 3.9272379875183105} -11/06/2021 21:26:29 - INFO - __main__ - Step 1186: {'lr': 0.00029625, 'samples': 227712, 'steps': 1185, 'loss/train': 3.678920269012451} -11/06/2021 21:26:29 - INFO - __main__ - Step 1187: {'lr': 0.0002965, 'samples': 227904, 'steps': 1186, 'loss/train': 3.9552578926086426} -11/06/2021 21:26:30 - INFO - __main__ - Step 1188: {'lr': 0.00029675000000000003, 'samples': 228096, 'steps': 1187, 'loss/train': 3.7164466381073} -11/06/2021 21:26:30 - INFO - __main__ - Step 1189: {'lr': 0.000297, 'samples': 228288, 'steps': 1188, 'loss/train': 4.196506977081299} -11/06/2021 21:26:31 - INFO - __main__ - Step 1190: {'lr': 0.00029725000000000004, 'samples': 228480, 'steps': 1189, 'loss/train': 3.887439489364624} -11/06/2021 21:26:31 - INFO - __main__ - Step 1191: {'lr': 0.00029749999999999997, 'samples': 228672, 'steps': 1190, 'loss/train': 3.7323334217071533} -11/06/2021 21:26:32 - INFO - __main__ - Step 1192: {'lr': 0.00029775, 'samples': 228864, 'steps': 1191, 'loss/train': 4.008239269256592} -11/06/2021 21:26:32 - INFO - __main__ - Step 1193: {'lr': 0.000298, 'samples': 229056, 'steps': 1192, 'loss/train': 5.458200454711914} -11/06/2021 21:26:33 - INFO - __main__ - Step 1194: {'lr': 0.00029825, 'samples': 229248, 'steps': 1193, 'loss/train': 3.7591049671173096} -11/06/2021 21:26:34 - INFO - __main__ - Step 1195: {'lr': 0.0002985, 'samples': 229440, 'steps': 1194, 'loss/train': 4.328658103942871} -11/06/2021 21:26:34 - INFO - __main__ - Step 1196: {'lr': 0.00029875, 'samples': 229632, 'steps': 1195, 'loss/train': 3.8931264877319336} -11/06/2021 21:26:34 - INFO - __main__ - Step 1197: {'lr': 0.000299, 'samples': 229824, 'steps': 1196, 'loss/train': 4.966779708862305} -11/06/2021 21:26:35 - INFO - __main__ - Step 1198: {'lr': 0.00029925000000000004, 'samples': 230016, 'steps': 1197, 'loss/train': 3.1090831756591797} -11/06/2021 21:26:35 - INFO - __main__ - Step 1199: {'lr': 0.0002995, 'samples': 230208, 'steps': 1198, 'loss/train': 3.9816088676452637} -11/06/2021 21:26:36 - INFO - __main__ - Step 1200: {'lr': 0.00029975000000000005, 'samples': 230400, 'steps': 1199, 'loss/train': 4.041784286499023} -11/06/2021 21:26:36 - INFO - __main__ - Step 1201: {'lr': 0.0003, 'samples': 230592, 'steps': 1200, 'loss/train': 3.73962664604187} -11/06/2021 21:26:37 - INFO - __main__ - Step 1202: {'lr': 0.00030025, 'samples': 230784, 'steps': 1201, 'loss/train': 3.259591579437256} -11/06/2021 21:26:37 - INFO - __main__ - Step 1203: {'lr': 0.0003005, 'samples': 230976, 'steps': 1202, 'loss/train': 4.60701322555542} -11/06/2021 21:26:37 - INFO - __main__ - Step 1204: {'lr': 0.00030075, 'samples': 231168, 'steps': 1203, 'loss/train': 4.123647689819336} -11/06/2021 21:26:39 - INFO - __main__ - Step 1205: {'lr': 0.000301, 'samples': 231360, 'steps': 1204, 'loss/train': 4.385739326477051} -11/06/2021 21:26:39 - INFO - __main__ - Step 1206: {'lr': 0.00030125000000000003, 'samples': 231552, 'steps': 1205, 'loss/train': 3.796212911605835} -11/06/2021 21:26:39 - INFO - __main__ - Step 1207: {'lr': 0.0003015, 'samples': 231744, 'steps': 1206, 'loss/train': 4.638833999633789} -11/06/2021 21:26:40 - INFO - __main__ - Step 1208: {'lr': 0.00030175000000000004, 'samples': 231936, 'steps': 1207, 'loss/train': 4.022327423095703} -11/06/2021 21:26:40 - INFO - __main__ - Step 1209: {'lr': 0.000302, 'samples': 232128, 'steps': 1208, 'loss/train': 4.19215202331543} -11/06/2021 21:26:41 - INFO - __main__ - Step 1210: {'lr': 0.00030225, 'samples': 232320, 'steps': 1209, 'loss/train': 4.021753787994385} -11/06/2021 21:26:41 - INFO - __main__ - Step 1211: {'lr': 0.0003025, 'samples': 232512, 'steps': 1210, 'loss/train': 3.7708232402801514} -11/06/2021 21:26:42 - INFO - __main__ - Step 1212: {'lr': 0.00030275, 'samples': 232704, 'steps': 1211, 'loss/train': 3.500831365585327} -11/06/2021 21:26:42 - INFO - __main__ - Step 1213: {'lr': 0.000303, 'samples': 232896, 'steps': 1212, 'loss/train': 3.7347517013549805} -11/06/2021 21:26:42 - INFO - __main__ - Step 1214: {'lr': 0.00030325, 'samples': 233088, 'steps': 1213, 'loss/train': 3.712738275527954} -11/06/2021 21:26:43 - INFO - __main__ - Step 1215: {'lr': 0.0003035, 'samples': 233280, 'steps': 1214, 'loss/train': 4.544304370880127} -11/06/2021 21:26:44 - INFO - __main__ - Step 1216: {'lr': 0.00030375000000000004, 'samples': 233472, 'steps': 1215, 'loss/train': 3.8694875240325928} -11/06/2021 21:26:44 - INFO - __main__ - Step 1217: {'lr': 0.000304, 'samples': 233664, 'steps': 1216, 'loss/train': 3.3171164989471436} -11/06/2021 21:26:44 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 3.7530202865600586} -11/06/2021 21:26:45 - INFO - __main__ - Step 1219: {'lr': 0.0003045, 'samples': 234048, 'steps': 1218, 'loss/train': 3.967923879623413} -11/06/2021 21:26:45 - INFO - __main__ - Step 1220: {'lr': 0.00030475, 'samples': 234240, 'steps': 1219, 'loss/train': 3.715089797973633} -11/06/2021 21:26:46 - INFO - __main__ - Step 1221: {'lr': 0.000305, 'samples': 234432, 'steps': 1220, 'loss/train': 3.693310260772705} -11/06/2021 21:26:46 - INFO - __main__ - Step 1222: {'lr': 0.00030525, 'samples': 234624, 'steps': 1221, 'loss/train': 3.5755531787872314} -11/06/2021 21:26:47 - INFO - __main__ - Step 1223: {'lr': 0.0003055, 'samples': 234816, 'steps': 1222, 'loss/train': 4.144630432128906} -11/06/2021 21:26:47 - INFO - __main__ - Step 1224: {'lr': 0.00030575000000000003, 'samples': 235008, 'steps': 1223, 'loss/train': 3.8937008380889893} -11/06/2021 21:26:48 - INFO - __main__ - Step 1225: {'lr': 0.000306, 'samples': 235200, 'steps': 1224, 'loss/train': 3.7765586376190186} -11/06/2021 21:26:48 - INFO - __main__ - Step 1226: {'lr': 0.00030625000000000004, 'samples': 235392, 'steps': 1225, 'loss/train': 4.3001017570495605} -11/06/2021 21:26:49 - INFO - __main__ - Step 1227: {'lr': 0.0003065, 'samples': 235584, 'steps': 1226, 'loss/train': 3.861295461654663} -11/06/2021 21:26:49 - INFO - __main__ - Step 1228: {'lr': 0.00030675, 'samples': 235776, 'steps': 1227, 'loss/train': 4.244755268096924} -11/06/2021 21:26:50 - INFO - __main__ - Step 1229: {'lr': 0.000307, 'samples': 235968, 'steps': 1228, 'loss/train': 4.392697811126709} -11/06/2021 21:26:50 - INFO - __main__ - Step 1230: {'lr': 0.00030725, 'samples': 236160, 'steps': 1229, 'loss/train': 4.003592014312744} -11/06/2021 21:26:51 - INFO - __main__ - Step 1231: {'lr': 0.0003075, 'samples': 236352, 'steps': 1230, 'loss/train': 3.7558765411376953} -11/06/2021 21:26:51 - INFO - __main__ - Step 1232: {'lr': 0.00030775, 'samples': 236544, 'steps': 1231, 'loss/train': 3.535252571105957} -11/06/2021 21:26:52 - INFO - __main__ - Step 1233: {'lr': 0.000308, 'samples': 236736, 'steps': 1232, 'loss/train': 3.4438316822052} -11/06/2021 21:26:52 - INFO - __main__ - Step 1234: {'lr': 0.00030825000000000004, 'samples': 236928, 'steps': 1233, 'loss/train': 3.6062018871307373} -11/06/2021 21:26:52 - INFO - __main__ - Step 1235: {'lr': 0.0003085, 'samples': 237120, 'steps': 1234, 'loss/train': 3.9174911975860596} -11/06/2021 21:26:53 - INFO - __main__ - Step 1236: {'lr': 0.00030875000000000005, 'samples': 237312, 'steps': 1235, 'loss/train': 3.6126482486724854} -11/06/2021 21:26:54 - INFO - __main__ - Step 1237: {'lr': 0.00030900000000000003, 'samples': 237504, 'steps': 1236, 'loss/train': 3.4603700637817383} -11/06/2021 21:26:54 - INFO - __main__ - Step 1238: {'lr': 0.00030925, 'samples': 237696, 'steps': 1237, 'loss/train': 5.033356666564941} -11/06/2021 21:26:54 - INFO - __main__ - Step 1239: {'lr': 0.0003095, 'samples': 237888, 'steps': 1238, 'loss/train': 3.9721944332122803} -11/06/2021 21:26:55 - INFO - __main__ - Step 1240: {'lr': 0.00030975, 'samples': 238080, 'steps': 1239, 'loss/train': 3.999577045440674} -11/06/2021 21:26:56 - INFO - __main__ - Step 1241: {'lr': 0.00031, 'samples': 238272, 'steps': 1240, 'loss/train': 3.221419334411621} -11/06/2021 21:26:56 - INFO - __main__ - Step 1242: {'lr': 0.00031025000000000003, 'samples': 238464, 'steps': 1241, 'loss/train': 3.553842067718506} -11/06/2021 21:26:57 - INFO - __main__ - Step 1243: {'lr': 0.0003105, 'samples': 238656, 'steps': 1242, 'loss/train': 3.4750494956970215} -11/06/2021 21:26:57 - INFO - __main__ - Step 1244: {'lr': 0.00031075000000000005, 'samples': 238848, 'steps': 1243, 'loss/train': 3.7925238609313965} -11/06/2021 21:26:57 - INFO - __main__ - Step 1245: {'lr': 0.000311, 'samples': 239040, 'steps': 1244, 'loss/train': 4.293489456176758} -11/06/2021 21:26:58 - INFO - __main__ - Step 1246: {'lr': 0.00031125000000000006, 'samples': 239232, 'steps': 1245, 'loss/train': 3.7371480464935303} -11/06/2021 21:26:59 - INFO - __main__ - Step 1247: {'lr': 0.0003115, 'samples': 239424, 'steps': 1246, 'loss/train': 4.00302791595459} -11/06/2021 21:26:59 - INFO - __main__ - Step 1248: {'lr': 0.00031175, 'samples': 239616, 'steps': 1247, 'loss/train': 3.7047793865203857} -11/06/2021 21:27:00 - INFO - __main__ - Step 1249: {'lr': 0.000312, 'samples': 239808, 'steps': 1248, 'loss/train': 4.603279113769531} -11/06/2021 21:27:00 - INFO - __main__ - Step 1250: {'lr': 0.00031225000000000003, 'samples': 240000, 'steps': 1249, 'loss/train': 3.6074068546295166} -11/06/2021 21:27:00 - INFO - __main__ - Step 1251: {'lr': 0.0003125, 'samples': 240192, 'steps': 1250, 'loss/train': 4.296557903289795} -11/06/2021 21:27:01 - INFO - __main__ - Step 1252: {'lr': 0.00031275, 'samples': 240384, 'steps': 1251, 'loss/train': 3.7983367443084717} -11/06/2021 21:27:02 - INFO - __main__ - Step 1253: {'lr': 0.000313, 'samples': 240576, 'steps': 1252, 'loss/train': 3.8672046661376953} -11/06/2021 21:27:02 - INFO - __main__ - Step 1254: {'lr': 0.00031325, 'samples': 240768, 'steps': 1253, 'loss/train': 3.8182613849639893} -11/06/2021 21:27:02 - INFO - __main__ - Step 1255: {'lr': 0.00031350000000000003, 'samples': 240960, 'steps': 1254, 'loss/train': 3.425907850265503} -11/06/2021 21:27:03 - INFO - __main__ - Step 1256: {'lr': 0.00031374999999999996, 'samples': 241152, 'steps': 1255, 'loss/train': 3.5726277828216553} -11/06/2021 21:27:04 - INFO - __main__ - Step 1257: {'lr': 0.000314, 'samples': 241344, 'steps': 1256, 'loss/train': 3.928713083267212} -11/06/2021 21:27:04 - INFO - __main__ - Step 1258: {'lr': 0.00031424999999999997, 'samples': 241536, 'steps': 1257, 'loss/train': 3.986309289932251} -11/06/2021 21:27:04 - INFO - __main__ - Step 1259: {'lr': 0.0003145, 'samples': 241728, 'steps': 1258, 'loss/train': 4.367678642272949} -11/06/2021 21:27:05 - INFO - __main__ - Step 1260: {'lr': 0.00031475, 'samples': 241920, 'steps': 1259, 'loss/train': 3.995647430419922} -11/06/2021 21:27:05 - INFO - __main__ - Step 1261: {'lr': 0.000315, 'samples': 242112, 'steps': 1260, 'loss/train': 3.605346441268921} -11/06/2021 21:27:06 - INFO - __main__ - Step 1262: {'lr': 0.00031525, 'samples': 242304, 'steps': 1261, 'loss/train': 3.96653413772583} -11/06/2021 21:27:06 - INFO - __main__ - Step 1263: {'lr': 0.0003155, 'samples': 242496, 'steps': 1262, 'loss/train': 3.9042797088623047} -11/06/2021 21:27:07 - INFO - __main__ - Step 1264: {'lr': 0.00031575, 'samples': 242688, 'steps': 1263, 'loss/train': 3.5482776165008545} -11/06/2021 21:27:07 - INFO - __main__ - Step 1265: {'lr': 0.000316, 'samples': 242880, 'steps': 1264, 'loss/train': 3.473890781402588} -11/06/2021 21:27:07 - INFO - __main__ - Step 1266: {'lr': 0.00031624999999999996, 'samples': 243072, 'steps': 1265, 'loss/train': 3.6147239208221436} -11/06/2021 21:27:08 - INFO - __main__ - Step 1267: {'lr': 0.0003165, 'samples': 243264, 'steps': 1266, 'loss/train': 3.760866403579712} -11/06/2021 21:27:09 - INFO - __main__ - Step 1268: {'lr': 0.00031675, 'samples': 243456, 'steps': 1267, 'loss/train': 3.5120933055877686} -11/06/2021 21:27:10 - INFO - __main__ - Step 1269: {'lr': 0.000317, 'samples': 243648, 'steps': 1268, 'loss/train': 4.119743824005127} -11/06/2021 21:27:10 - INFO - __main__ - Step 1270: {'lr': 0.00031725, 'samples': 243840, 'steps': 1269, 'loss/train': 4.16604471206665} -11/06/2021 21:27:10 - INFO - __main__ - Step 1271: {'lr': 0.0003175, 'samples': 244032, 'steps': 1270, 'loss/train': 3.718264102935791} -11/06/2021 21:27:11 - INFO - __main__ - Step 1272: {'lr': 0.00031775, 'samples': 244224, 'steps': 1271, 'loss/train': 3.804915428161621} -11/06/2021 21:27:12 - INFO - __main__ - Step 1273: {'lr': 0.00031800000000000003, 'samples': 244416, 'steps': 1272, 'loss/train': 3.632591724395752} -11/06/2021 21:27:12 - INFO - __main__ - Step 1274: {'lr': 0.00031825, 'samples': 244608, 'steps': 1273, 'loss/train': 3.5990989208221436} -11/06/2021 21:27:12 - INFO - __main__ - Step 1275: {'lr': 0.0003185, 'samples': 244800, 'steps': 1274, 'loss/train': 3.5454981327056885} -11/06/2021 21:27:13 - INFO - __main__ - Step 1276: {'lr': 0.00031874999999999997, 'samples': 244992, 'steps': 1275, 'loss/train': 2.8243398666381836} -11/06/2021 21:27:13 - INFO - __main__ - Step 1277: {'lr': 0.000319, 'samples': 245184, 'steps': 1276, 'loss/train': 4.374372959136963} -11/06/2021 21:27:14 - INFO - __main__ - Step 1278: {'lr': 0.00031925, 'samples': 245376, 'steps': 1277, 'loss/train': 2.880706548690796} -11/06/2021 21:27:15 - INFO - __main__ - Step 1279: {'lr': 0.0003195, 'samples': 245568, 'steps': 1278, 'loss/train': 3.749918222427368} -11/06/2021 21:27:15 - INFO - __main__ - Step 1280: {'lr': 0.00031975, 'samples': 245760, 'steps': 1279, 'loss/train': 3.91780686378479} -11/06/2021 21:27:15 - INFO - __main__ - Step 1281: {'lr': 0.00032, 'samples': 245952, 'steps': 1280, 'loss/train': 3.8567497730255127} -11/06/2021 21:27:16 - INFO - __main__ - Step 1282: {'lr': 0.00032025, 'samples': 246144, 'steps': 1281, 'loss/train': 2.492274761199951} -11/06/2021 21:27:17 - INFO - __main__ - Step 1283: {'lr': 0.00032050000000000004, 'samples': 246336, 'steps': 1282, 'loss/train': 4.012140274047852} -11/06/2021 21:27:17 - INFO - __main__ - Step 1284: {'lr': 0.00032074999999999996, 'samples': 246528, 'steps': 1283, 'loss/train': 3.700061559677124} -11/06/2021 21:27:17 - INFO - __main__ - Step 1285: {'lr': 0.000321, 'samples': 246720, 'steps': 1284, 'loss/train': 4.031924724578857} -11/06/2021 21:27:18 - INFO - __main__ - Step 1286: {'lr': 0.00032125, 'samples': 246912, 'steps': 1285, 'loss/train': 4.252817153930664} -11/06/2021 21:27:18 - INFO - __main__ - Step 1287: {'lr': 0.0003215, 'samples': 247104, 'steps': 1286, 'loss/train': 3.6342227458953857} -11/06/2021 21:27:19 - INFO - __main__ - Step 1288: {'lr': 0.00032175, 'samples': 247296, 'steps': 1287, 'loss/train': 3.6176106929779053} -11/06/2021 21:27:20 - INFO - __main__ - Step 1289: {'lr': 0.000322, 'samples': 247488, 'steps': 1288, 'loss/train': 5.5985236167907715} -11/06/2021 21:27:20 - INFO - __main__ - Step 1290: {'lr': 0.00032225, 'samples': 247680, 'steps': 1289, 'loss/train': 3.5907435417175293} -11/06/2021 21:27:20 - INFO - __main__ - Step 1291: {'lr': 0.00032250000000000003, 'samples': 247872, 'steps': 1290, 'loss/train': 3.7204911708831787} -11/06/2021 21:27:21 - INFO - __main__ - Step 1292: {'lr': 0.00032275, 'samples': 248064, 'steps': 1291, 'loss/train': 3.9456405639648438} -11/06/2021 21:27:22 - INFO - __main__ - Step 1293: {'lr': 0.000323, 'samples': 248256, 'steps': 1292, 'loss/train': 3.7843210697174072} -11/06/2021 21:27:22 - INFO - __main__ - Step 1294: {'lr': 0.00032324999999999997, 'samples': 248448, 'steps': 1293, 'loss/train': 3.915496349334717} -11/06/2021 21:27:22 - INFO - __main__ - Step 1295: {'lr': 0.0003235, 'samples': 248640, 'steps': 1294, 'loss/train': 4.2259440422058105} -11/06/2021 21:27:23 - INFO - __main__ - Step 1296: {'lr': 0.00032375, 'samples': 248832, 'steps': 1295, 'loss/train': 3.61068058013916} -11/06/2021 21:27:23 - INFO - __main__ - Step 1297: {'lr': 0.000324, 'samples': 249024, 'steps': 1296, 'loss/train': 3.682305097579956} -11/06/2021 21:27:24 - INFO - __main__ - Step 1298: {'lr': 0.00032425, 'samples': 249216, 'steps': 1297, 'loss/train': 3.750075340270996} -11/06/2021 21:27:25 - INFO - __main__ - Step 1299: {'lr': 0.00032450000000000003, 'samples': 249408, 'steps': 1298, 'loss/train': 3.9268178939819336} -11/06/2021 21:27:25 - INFO - __main__ - Step 1300: {'lr': 0.00032475, 'samples': 249600, 'steps': 1299, 'loss/train': 3.8040266036987305} -11/06/2021 21:27:25 - INFO - __main__ - Step 1301: {'lr': 0.00032500000000000004, 'samples': 249792, 'steps': 1300, 'loss/train': 3.4303956031799316} -11/06/2021 21:27:26 - INFO - __main__ - Step 1302: {'lr': 0.00032524999999999996, 'samples': 249984, 'steps': 1301, 'loss/train': 4.067983150482178} -11/06/2021 21:27:27 - INFO - __main__ - Step 1303: {'lr': 0.0003255, 'samples': 250176, 'steps': 1302, 'loss/train': 3.6090753078460693} -11/06/2021 21:27:27 - INFO - __main__ - Step 1304: {'lr': 0.00032575, 'samples': 250368, 'steps': 1303, 'loss/train': 3.846041440963745} -11/06/2021 21:27:27 - INFO - __main__ - Step 1305: {'lr': 0.000326, 'samples': 250560, 'steps': 1304, 'loss/train': 4.3484272956848145} -11/06/2021 21:27:28 - INFO - __main__ - Step 1306: {'lr': 0.00032625, 'samples': 250752, 'steps': 1305, 'loss/train': 3.714219331741333} -11/06/2021 21:27:28 - INFO - __main__ - Step 1307: {'lr': 0.0003265, 'samples': 250944, 'steps': 1306, 'loss/train': 3.670234441757202} -11/06/2021 21:27:29 - INFO - __main__ - Step 1308: {'lr': 0.00032675, 'samples': 251136, 'steps': 1307, 'loss/train': 4.2095441818237305} -11/06/2021 21:27:29 - INFO - __main__ - Step 1309: {'lr': 0.00032700000000000003, 'samples': 251328, 'steps': 1308, 'loss/train': 3.6904191970825195} -11/06/2021 21:27:30 - INFO - __main__ - Step 1310: {'lr': 0.00032725, 'samples': 251520, 'steps': 1309, 'loss/train': 3.5426836013793945} -11/06/2021 21:27:30 - INFO - __main__ - Step 1311: {'lr': 0.00032750000000000005, 'samples': 251712, 'steps': 1310, 'loss/train': 3.8077216148376465} -11/06/2021 21:27:31 - INFO - __main__ - Step 1312: {'lr': 0.00032774999999999997, 'samples': 251904, 'steps': 1311, 'loss/train': 3.6772751808166504} -11/06/2021 21:27:31 - INFO - __main__ - Step 1313: {'lr': 0.000328, 'samples': 252096, 'steps': 1312, 'loss/train': 4.283506393432617} -11/06/2021 21:27:32 - INFO - __main__ - Step 1314: {'lr': 0.00032825, 'samples': 252288, 'steps': 1313, 'loss/train': 3.820636510848999} -11/06/2021 21:27:32 - INFO - __main__ - Step 1315: {'lr': 0.0003285, 'samples': 252480, 'steps': 1314, 'loss/train': 3.645063877105713} -11/06/2021 21:27:33 - INFO - __main__ - Step 1316: {'lr': 0.00032875, 'samples': 252672, 'steps': 1315, 'loss/train': 3.96279239654541} -11/06/2021 21:27:33 - INFO - __main__ - Step 1317: {'lr': 0.00032900000000000003, 'samples': 252864, 'steps': 1316, 'loss/train': 3.848276138305664} -11/06/2021 21:27:33 - INFO - __main__ - Step 1318: {'lr': 0.00032925, 'samples': 253056, 'steps': 1317, 'loss/train': 3.3637754917144775} -11/06/2021 21:27:34 - INFO - __main__ - Step 1319: {'lr': 0.00032950000000000004, 'samples': 253248, 'steps': 1318, 'loss/train': 3.951634168624878} -11/06/2021 21:27:35 - INFO - __main__ - Step 1320: {'lr': 0.00032975, 'samples': 253440, 'steps': 1319, 'loss/train': 4.035619735717773} -11/06/2021 21:27:35 - INFO - __main__ - Step 1321: {'lr': 0.00033, 'samples': 253632, 'steps': 1320, 'loss/train': 3.623622179031372} -11/06/2021 21:27:35 - INFO - __main__ - Step 1322: {'lr': 0.00033025, 'samples': 253824, 'steps': 1321, 'loss/train': 4.259491920471191} -11/06/2021 21:27:36 - INFO - __main__ - Step 1323: {'lr': 0.0003305, 'samples': 254016, 'steps': 1322, 'loss/train': 3.655144214630127} -11/06/2021 21:27:37 - INFO - __main__ - Step 1324: {'lr': 0.00033075, 'samples': 254208, 'steps': 1323, 'loss/train': 3.6705875396728516} -11/06/2021 21:27:37 - INFO - __main__ - Step 1325: {'lr': 0.000331, 'samples': 254400, 'steps': 1324, 'loss/train': 3.493577480316162} -11/06/2021 21:27:38 - INFO - __main__ - Step 1326: {'lr': 0.00033125, 'samples': 254592, 'steps': 1325, 'loss/train': 3.0190889835357666} -11/06/2021 21:27:38 - INFO - __main__ - Step 1327: {'lr': 0.00033150000000000003, 'samples': 254784, 'steps': 1326, 'loss/train': 4.079080104827881} -11/06/2021 21:27:38 - INFO - __main__ - Step 1328: {'lr': 0.00033175, 'samples': 254976, 'steps': 1327, 'loss/train': 3.815504550933838} -11/06/2021 21:27:39 - INFO - __main__ - Step 1329: {'lr': 0.00033200000000000005, 'samples': 255168, 'steps': 1328, 'loss/train': 3.4887773990631104} -11/06/2021 21:27:40 - INFO - __main__ - Step 1330: {'lr': 0.00033224999999999997, 'samples': 255360, 'steps': 1329, 'loss/train': 3.8788294792175293} -11/06/2021 21:27:40 - INFO - __main__ - Step 1331: {'lr': 0.0003325, 'samples': 255552, 'steps': 1330, 'loss/train': 3.5784215927124023} -11/06/2021 21:27:40 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 3.404329299926758} -11/06/2021 21:27:41 - INFO - __main__ - Step 1333: {'lr': 0.000333, 'samples': 255936, 'steps': 1332, 'loss/train': 3.8690433502197266} -11/06/2021 21:27:42 - INFO - __main__ - Step 1334: {'lr': 0.00033325, 'samples': 256128, 'steps': 1333, 'loss/train': 3.4080007076263428} -11/06/2021 21:27:42 - INFO - __main__ - Step 1335: {'lr': 0.00033350000000000003, 'samples': 256320, 'steps': 1334, 'loss/train': 3.692984104156494} -11/06/2021 21:27:42 - INFO - __main__ - Step 1336: {'lr': 0.00033375, 'samples': 256512, 'steps': 1335, 'loss/train': 3.570852756500244} -11/06/2021 21:27:43 - INFO - __main__ - Step 1337: {'lr': 0.00033400000000000004, 'samples': 256704, 'steps': 1336, 'loss/train': 3.4716129302978516} -11/06/2021 21:27:43 - INFO - __main__ - Step 1338: {'lr': 0.00033425, 'samples': 256896, 'steps': 1337, 'loss/train': 3.4797582626342773} -11/06/2021 21:27:44 - INFO - __main__ - Step 1339: {'lr': 0.00033450000000000005, 'samples': 257088, 'steps': 1338, 'loss/train': 3.386270046234131} -11/06/2021 21:27:45 - INFO - __main__ - Step 1340: {'lr': 0.00033475, 'samples': 257280, 'steps': 1339, 'loss/train': 4.1568217277526855} -11/06/2021 21:27:45 - INFO - __main__ - Step 1341: {'lr': 0.000335, 'samples': 257472, 'steps': 1340, 'loss/train': 3.2953333854675293} -11/06/2021 21:27:45 - INFO - __main__ - Step 1342: {'lr': 0.00033525, 'samples': 257664, 'steps': 1341, 'loss/train': 3.355146646499634} -11/06/2021 21:27:46 - INFO - __main__ - Step 1343: {'lr': 0.0003355, 'samples': 257856, 'steps': 1342, 'loss/train': 3.234477996826172} -11/06/2021 21:27:47 - INFO - __main__ - Step 1344: {'lr': 0.00033575, 'samples': 258048, 'steps': 1343, 'loss/train': 3.457892656326294} -11/06/2021 21:27:47 - INFO - __main__ - Step 1345: {'lr': 0.00033600000000000004, 'samples': 258240, 'steps': 1344, 'loss/train': 3.948150634765625} -11/06/2021 21:27:47 - INFO - __main__ - Step 1346: {'lr': 0.00033625, 'samples': 258432, 'steps': 1345, 'loss/train': 3.7880961894989014} -11/06/2021 21:27:48 - INFO - __main__ - Step 1347: {'lr': 0.00033650000000000005, 'samples': 258624, 'steps': 1346, 'loss/train': 3.310671329498291} -11/06/2021 21:27:48 - INFO - __main__ - Step 1348: {'lr': 0.00033675, 'samples': 258816, 'steps': 1347, 'loss/train': 3.0229480266571045} -11/06/2021 21:27:49 - INFO - __main__ - Step 1349: {'lr': 0.000337, 'samples': 259008, 'steps': 1348, 'loss/train': 3.778203010559082} -11/06/2021 21:27:50 - INFO - __main__ - Step 1350: {'lr': 0.00033725, 'samples': 259200, 'steps': 1349, 'loss/train': 3.488584280014038} -11/06/2021 21:27:50 - INFO - __main__ - Step 1351: {'lr': 0.0003375, 'samples': 259392, 'steps': 1350, 'loss/train': 2.763584613800049} -11/06/2021 21:27:50 - INFO - __main__ - Step 1352: {'lr': 0.00033775, 'samples': 259584, 'steps': 1351, 'loss/train': 3.3598763942718506} -11/06/2021 21:27:51 - INFO - __main__ - Step 1353: {'lr': 0.00033800000000000003, 'samples': 259776, 'steps': 1352, 'loss/train': 3.7228636741638184} -11/06/2021 21:27:51 - INFO - __main__ - Step 1354: {'lr': 0.00033825, 'samples': 259968, 'steps': 1353, 'loss/train': 4.054864883422852} -11/06/2021 21:27:52 - INFO - __main__ - Step 1355: {'lr': 0.00033850000000000004, 'samples': 260160, 'steps': 1354, 'loss/train': 3.6283679008483887} -11/06/2021 21:27:53 - INFO - __main__ - Step 1356: {'lr': 0.00033875, 'samples': 260352, 'steps': 1355, 'loss/train': 3.3796229362487793} -11/06/2021 21:27:53 - INFO - __main__ - Step 1357: {'lr': 0.00033900000000000005, 'samples': 260544, 'steps': 1356, 'loss/train': 3.939152717590332} -11/06/2021 21:27:53 - INFO - __main__ - Step 1358: {'lr': 0.00033925, 'samples': 260736, 'steps': 1357, 'loss/train': 4.031463623046875} -11/06/2021 21:27:54 - INFO - __main__ - Step 1359: {'lr': 0.0003395, 'samples': 260928, 'steps': 1358, 'loss/train': 4.39647912979126} -11/06/2021 21:27:55 - INFO - __main__ - Step 1360: {'lr': 0.00033975, 'samples': 261120, 'steps': 1359, 'loss/train': 3.659208059310913} -11/06/2021 21:27:55 - INFO - __main__ - Step 1361: {'lr': 0.00034, 'samples': 261312, 'steps': 1360, 'loss/train': 4.465490341186523} -11/06/2021 21:27:55 - INFO - __main__ - Step 1362: {'lr': 0.00034025, 'samples': 261504, 'steps': 1361, 'loss/train': 4.4638543128967285} -11/06/2021 21:27:56 - INFO - __main__ - Step 1363: {'lr': 0.00034050000000000004, 'samples': 261696, 'steps': 1362, 'loss/train': 4.332038402557373} -11/06/2021 21:27:56 - INFO - __main__ - Step 1364: {'lr': 0.00034075, 'samples': 261888, 'steps': 1363, 'loss/train': 4.257739543914795} -11/06/2021 21:27:57 - INFO - __main__ - Step 1365: {'lr': 0.00034100000000000005, 'samples': 262080, 'steps': 1364, 'loss/train': 3.7311654090881348} -11/06/2021 21:27:57 - INFO - __main__ - Step 1366: {'lr': 0.00034125000000000003, 'samples': 262272, 'steps': 1365, 'loss/train': 3.6005234718322754} -11/06/2021 21:27:58 - INFO - __main__ - Step 1367: {'lr': 0.0003415, 'samples': 262464, 'steps': 1366, 'loss/train': 3.586486339569092} -11/06/2021 21:27:58 - INFO - __main__ - Step 1368: {'lr': 0.00034175, 'samples': 262656, 'steps': 1367, 'loss/train': 2.7847213745117188} -11/06/2021 21:27:59 - INFO - __main__ - Step 1369: {'lr': 0.000342, 'samples': 262848, 'steps': 1368, 'loss/train': 3.146930456161499} -11/06/2021 21:28:00 - INFO - __main__ - Step 1370: {'lr': 0.00034225, 'samples': 263040, 'steps': 1369, 'loss/train': 3.4413974285125732} -11/06/2021 21:28:00 - INFO - __main__ - Step 1371: {'lr': 0.00034250000000000003, 'samples': 263232, 'steps': 1370, 'loss/train': 3.6233880519866943} -11/06/2021 21:28:00 - INFO - __main__ - Step 1372: {'lr': 0.00034275, 'samples': 263424, 'steps': 1371, 'loss/train': 3.721611261367798} -11/06/2021 21:28:01 - INFO - __main__ - Step 1373: {'lr': 0.00034300000000000004, 'samples': 263616, 'steps': 1372, 'loss/train': 4.222573757171631} -11/06/2021 21:28:01 - INFO - __main__ - Step 1374: {'lr': 0.00034325, 'samples': 263808, 'steps': 1373, 'loss/train': 3.599992513656616} -11/06/2021 21:28:02 - INFO - __main__ - Step 1375: {'lr': 0.00034350000000000006, 'samples': 264000, 'steps': 1374, 'loss/train': 3.8981473445892334} -11/06/2021 21:28:03 - INFO - __main__ - Step 1376: {'lr': 0.00034375, 'samples': 264192, 'steps': 1375, 'loss/train': 3.6449296474456787} -11/06/2021 21:28:03 - INFO - __main__ - Step 1377: {'lr': 0.00034399999999999996, 'samples': 264384, 'steps': 1376, 'loss/train': 3.2894580364227295} -11/06/2021 21:28:03 - INFO - __main__ - Step 1378: {'lr': 0.00034425, 'samples': 264576, 'steps': 1377, 'loss/train': 3.513908624649048} -11/06/2021 21:28:04 - INFO - __main__ - Step 1379: {'lr': 0.00034449999999999997, 'samples': 264768, 'steps': 1378, 'loss/train': 4.0787034034729} -11/06/2021 21:28:05 - INFO - __main__ - Step 1380: {'lr': 0.00034475, 'samples': 264960, 'steps': 1379, 'loss/train': 3.7418301105499268} -11/06/2021 21:28:05 - INFO - __main__ - Step 1381: {'lr': 0.000345, 'samples': 265152, 'steps': 1380, 'loss/train': 3.700737237930298} -11/06/2021 21:28:05 - INFO - __main__ - Step 1382: {'lr': 0.00034525, 'samples': 265344, 'steps': 1381, 'loss/train': 3.3428897857666016} -11/06/2021 21:28:06 - INFO - __main__ - Step 1383: {'lr': 0.0003455, 'samples': 265536, 'steps': 1382, 'loss/train': 3.495915651321411} -11/06/2021 21:28:06 - INFO - __main__ - Step 1384: {'lr': 0.00034575000000000003, 'samples': 265728, 'steps': 1383, 'loss/train': 3.5448079109191895} -11/06/2021 21:28:07 - INFO - __main__ - Step 1385: {'lr': 0.000346, 'samples': 265920, 'steps': 1384, 'loss/train': 3.691251277923584} -11/06/2021 21:28:07 - INFO - __main__ - Step 1386: {'lr': 0.00034625, 'samples': 266112, 'steps': 1385, 'loss/train': 2.9062933921813965} -11/06/2021 21:28:08 - INFO - __main__ - Step 1387: {'lr': 0.00034649999999999997, 'samples': 266304, 'steps': 1386, 'loss/train': 3.5462396144866943} -11/06/2021 21:28:08 - INFO - __main__ - Step 1388: {'lr': 0.00034675, 'samples': 266496, 'steps': 1387, 'loss/train': 5.252135276794434} -11/06/2021 21:28:08 - INFO - __main__ - Step 1389: {'lr': 0.000347, 'samples': 266688, 'steps': 1388, 'loss/train': 3.7084007263183594} -11/06/2021 21:28:09 - INFO - __main__ - Step 1390: {'lr': 0.00034725, 'samples': 266880, 'steps': 1389, 'loss/train': 4.000763893127441} -11/06/2021 21:28:10 - INFO - __main__ - Step 1391: {'lr': 0.0003475, 'samples': 267072, 'steps': 1390, 'loss/train': 3.437042474746704} -11/06/2021 21:28:10 - INFO - __main__ - Step 1392: {'lr': 0.00034775, 'samples': 267264, 'steps': 1391, 'loss/train': 3.971050977706909} -11/06/2021 21:28:11 - INFO - __main__ - Step 1393: {'lr': 0.000348, 'samples': 267456, 'steps': 1392, 'loss/train': 3.698169231414795} -11/06/2021 21:28:11 - INFO - __main__ - Step 1394: {'lr': 0.00034825000000000004, 'samples': 267648, 'steps': 1393, 'loss/train': 3.2756340503692627} -11/06/2021 21:28:11 - INFO - __main__ - Step 1395: {'lr': 0.00034849999999999996, 'samples': 267840, 'steps': 1394, 'loss/train': 3.3742105960845947} -11/06/2021 21:28:12 - INFO - __main__ - Step 1396: {'lr': 0.00034875, 'samples': 268032, 'steps': 1395, 'loss/train': 3.8026742935180664} -11/06/2021 21:28:13 - INFO - __main__ - Step 1397: {'lr': 0.00034899999999999997, 'samples': 268224, 'steps': 1396, 'loss/train': 3.521596908569336} -11/06/2021 21:28:13 - INFO - __main__ - Step 1398: {'lr': 0.00034925, 'samples': 268416, 'steps': 1397, 'loss/train': 3.4449994564056396} -11/06/2021 21:28:13 - INFO - __main__ - Step 1399: {'lr': 0.0003495, 'samples': 268608, 'steps': 1398, 'loss/train': 3.146643877029419} -11/06/2021 21:28:14 - INFO - __main__ - Step 1400: {'lr': 0.00034975, 'samples': 268800, 'steps': 1399, 'loss/train': 3.3726940155029297} -11/06/2021 21:28:15 - INFO - __main__ - Step 1401: {'lr': 0.00035, 'samples': 268992, 'steps': 1400, 'loss/train': 3.4211158752441406} -11/06/2021 21:28:15 - INFO - __main__ - Step 1402: {'lr': 0.00035025000000000003, 'samples': 269184, 'steps': 1401, 'loss/train': 3.7196311950683594} -11/06/2021 21:28:15 - INFO - __main__ - Step 1403: {'lr': 0.0003505, 'samples': 269376, 'steps': 1402, 'loss/train': 3.6825990676879883} -11/06/2021 21:28:16 - INFO - __main__ - Step 1404: {'lr': 0.00035075, 'samples': 269568, 'steps': 1403, 'loss/train': 3.5246872901916504} -11/06/2021 21:28:16 - INFO - __main__ - Step 1405: {'lr': 0.00035099999999999997, 'samples': 269760, 'steps': 1404, 'loss/train': 3.948554277420044} -11/06/2021 21:28:17 - INFO - __main__ - Step 1406: {'lr': 0.00035125, 'samples': 269952, 'steps': 1405, 'loss/train': 3.4808645248413086} -11/06/2021 21:28:18 - INFO - __main__ - Step 1407: {'lr': 0.0003515, 'samples': 270144, 'steps': 1406, 'loss/train': 3.6043059825897217} -11/06/2021 21:28:18 - INFO - __main__ - Step 1408: {'lr': 0.00035175, 'samples': 270336, 'steps': 1407, 'loss/train': 3.91089129447937} -11/06/2021 21:28:18 - INFO - __main__ - Step 1409: {'lr': 0.000352, 'samples': 270528, 'steps': 1408, 'loss/train': 3.544276237487793} -11/06/2021 21:28:19 - INFO - __main__ - Step 1410: {'lr': 0.00035225, 'samples': 270720, 'steps': 1409, 'loss/train': 3.8686203956604004} -11/06/2021 21:28:20 - INFO - __main__ - Step 1411: {'lr': 0.0003525, 'samples': 270912, 'steps': 1410, 'loss/train': 3.5301620960235596} -11/06/2021 21:28:20 - INFO - __main__ - Step 1412: {'lr': 0.00035275000000000004, 'samples': 271104, 'steps': 1411, 'loss/train': 3.6756720542907715} -11/06/2021 21:28:21 - INFO - __main__ - Step 1413: {'lr': 0.00035299999999999996, 'samples': 271296, 'steps': 1412, 'loss/train': 3.3864593505859375} -11/06/2021 21:28:21 - INFO - __main__ - Step 1414: {'lr': 0.00035325, 'samples': 271488, 'steps': 1413, 'loss/train': 3.0657331943511963} -11/06/2021 21:28:21 - INFO - __main__ - Step 1415: {'lr': 0.0003535, 'samples': 271680, 'steps': 1414, 'loss/train': 3.454667091369629} -11/06/2021 21:28:22 - INFO - __main__ - Step 1416: {'lr': 0.00035375, 'samples': 271872, 'steps': 1415, 'loss/train': 3.242163896560669} -11/06/2021 21:28:23 - INFO - __main__ - Step 1417: {'lr': 0.000354, 'samples': 272064, 'steps': 1416, 'loss/train': 3.9992828369140625} -11/06/2021 21:28:23 - INFO - __main__ - Step 1418: {'lr': 0.00035425, 'samples': 272256, 'steps': 1417, 'loss/train': 3.688415050506592} -11/06/2021 21:28:23 - INFO - __main__ - Step 1419: {'lr': 0.0003545, 'samples': 272448, 'steps': 1418, 'loss/train': 3.7804338932037354} -11/06/2021 21:28:24 - INFO - __main__ - Step 1420: {'lr': 0.00035475000000000003, 'samples': 272640, 'steps': 1419, 'loss/train': 3.729741096496582} -11/06/2021 21:28:25 - INFO - __main__ - Step 1421: {'lr': 0.000355, 'samples': 272832, 'steps': 1420, 'loss/train': 4.303407192230225} -11/06/2021 21:28:25 - INFO - __main__ - Step 1422: {'lr': 0.00035525000000000004, 'samples': 273024, 'steps': 1421, 'loss/train': 3.4556620121002197} -11/06/2021 21:28:26 - INFO - __main__ - Step 1423: {'lr': 0.00035549999999999997, 'samples': 273216, 'steps': 1422, 'loss/train': 2.991054058074951} -11/06/2021 21:28:26 - INFO - __main__ - Step 1424: {'lr': 0.00035575, 'samples': 273408, 'steps': 1423, 'loss/train': 4.185265064239502} -11/06/2021 21:28:26 - INFO - __main__ - Step 1425: {'lr': 0.000356, 'samples': 273600, 'steps': 1424, 'loss/train': 3.529508590698242} -11/06/2021 21:28:27 - INFO - __main__ - Step 1426: {'lr': 0.00035625, 'samples': 273792, 'steps': 1425, 'loss/train': 3.394829034805298} -11/06/2021 21:28:28 - INFO - __main__ - Step 1427: {'lr': 0.0003565, 'samples': 273984, 'steps': 1426, 'loss/train': 4.052621364593506} -11/06/2021 21:28:28 - INFO - __main__ - Step 1428: {'lr': 0.00035675, 'samples': 274176, 'steps': 1427, 'loss/train': 3.0512208938598633} -11/06/2021 21:28:28 - INFO - __main__ - Step 1429: {'lr': 0.000357, 'samples': 274368, 'steps': 1428, 'loss/train': 3.3234691619873047} -11/06/2021 21:28:29 - INFO - __main__ - Step 1430: {'lr': 0.00035725000000000004, 'samples': 274560, 'steps': 1429, 'loss/train': 3.588322162628174} -11/06/2021 21:28:29 - INFO - __main__ - Step 1431: {'lr': 0.0003575, 'samples': 274752, 'steps': 1430, 'loss/train': 3.39493727684021} -11/06/2021 21:28:30 - INFO - __main__ - Step 1432: {'lr': 0.00035775, 'samples': 274944, 'steps': 1431, 'loss/train': 2.880502939224243} -11/06/2021 21:28:30 - INFO - __main__ - Step 1433: {'lr': 0.000358, 'samples': 275136, 'steps': 1432, 'loss/train': 3.7747838497161865} -11/06/2021 21:28:31 - INFO - __main__ - Step 1434: {'lr': 0.00035825, 'samples': 275328, 'steps': 1433, 'loss/train': 3.3060061931610107} -11/06/2021 21:28:31 - INFO - __main__ - Step 1435: {'lr': 0.0003585, 'samples': 275520, 'steps': 1434, 'loss/train': 3.7018392086029053} -11/06/2021 21:28:32 - INFO - __main__ - Step 1436: {'lr': 0.00035875, 'samples': 275712, 'steps': 1435, 'loss/train': 3.0778818130493164} -11/06/2021 21:28:33 - INFO - __main__ - Step 1437: {'lr': 0.000359, 'samples': 275904, 'steps': 1436, 'loss/train': 3.736198902130127} -11/06/2021 21:28:33 - INFO - __main__ - Step 1438: {'lr': 0.00035925000000000003, 'samples': 276096, 'steps': 1437, 'loss/train': 3.045379877090454} -11/06/2021 21:28:33 - INFO - __main__ - Step 1439: {'lr': 0.0003595, 'samples': 276288, 'steps': 1438, 'loss/train': 3.695364475250244} -11/06/2021 21:28:34 - INFO - __main__ - Step 1440: {'lr': 0.00035975000000000004, 'samples': 276480, 'steps': 1439, 'loss/train': 3.711172342300415} -11/06/2021 21:28:34 - INFO - __main__ - Step 1441: {'lr': 0.00035999999999999997, 'samples': 276672, 'steps': 1440, 'loss/train': 2.9761195182800293} -11/06/2021 21:28:35 - INFO - __main__ - Step 1442: {'lr': 0.00036025, 'samples': 276864, 'steps': 1441, 'loss/train': 3.2470874786376953} -11/06/2021 21:28:35 - INFO - __main__ - Step 1443: {'lr': 0.0003605, 'samples': 277056, 'steps': 1442, 'loss/train': 3.0125174522399902} -11/06/2021 21:28:36 - INFO - __main__ - Step 1444: {'lr': 0.00036075, 'samples': 277248, 'steps': 1443, 'loss/train': 3.5066580772399902} -11/06/2021 21:28:36 - INFO - __main__ - Step 1445: {'lr': 0.000361, 'samples': 277440, 'steps': 1444, 'loss/train': 3.245635747909546} -11/06/2021 21:28:36 - INFO - __main__ - Step 1446: {'lr': 0.00036125, 'samples': 277632, 'steps': 1445, 'loss/train': 4.3313374519348145} -11/06/2021 21:28:38 - INFO - __main__ - Step 1447: {'lr': 0.0003615, 'samples': 277824, 'steps': 1446, 'loss/train': 3.90049409866333} -11/06/2021 21:28:38 - INFO - __main__ - Step 1448: {'lr': 0.00036175000000000004, 'samples': 278016, 'steps': 1447, 'loss/train': 2.849242687225342} -11/06/2021 21:28:38 - INFO - __main__ - Step 1449: {'lr': 0.000362, 'samples': 278208, 'steps': 1448, 'loss/train': 3.8985612392425537} -11/06/2021 21:28:39 - INFO - __main__ - Step 1450: {'lr': 0.00036225000000000005, 'samples': 278400, 'steps': 1449, 'loss/train': 3.1428816318511963} -11/06/2021 21:28:39 - INFO - __main__ - Step 1451: {'lr': 0.0003625, 'samples': 278592, 'steps': 1450, 'loss/train': 3.8840200901031494} -11/06/2021 21:28:39 - INFO - __main__ - Step 1452: {'lr': 0.00036275, 'samples': 278784, 'steps': 1451, 'loss/train': 3.16904354095459} -11/06/2021 21:28:40 - INFO - __main__ - Step 1453: {'lr': 0.000363, 'samples': 278976, 'steps': 1452, 'loss/train': 2.8679397106170654} -11/06/2021 21:28:41 - INFO - __main__ - Step 1454: {'lr': 0.00036325, 'samples': 279168, 'steps': 1453, 'loss/train': 3.2666327953338623} -11/06/2021 21:28:41 - INFO - __main__ - Step 1455: {'lr': 0.0003635, 'samples': 279360, 'steps': 1454, 'loss/train': 3.257840871810913} -11/06/2021 21:28:41 - INFO - __main__ - Step 1456: {'lr': 0.00036375000000000003, 'samples': 279552, 'steps': 1455, 'loss/train': 3.4981942176818848} -11/06/2021 21:28:42 - INFO - __main__ - Step 1457: {'lr': 0.000364, 'samples': 279744, 'steps': 1456, 'loss/train': 3.474823236465454} -11/06/2021 21:28:43 - INFO - __main__ - Step 1458: {'lr': 0.00036425000000000004, 'samples': 279936, 'steps': 1457, 'loss/train': 3.6593263149261475} -11/06/2021 21:28:43 - INFO - __main__ - Step 1459: {'lr': 0.0003645, 'samples': 280128, 'steps': 1458, 'loss/train': 3.4789998531341553} -11/06/2021 21:28:43 - INFO - __main__ - Step 1460: {'lr': 0.00036475, 'samples': 280320, 'steps': 1459, 'loss/train': 3.415144920349121} -11/06/2021 21:28:44 - INFO - __main__ - Step 1461: {'lr': 0.000365, 'samples': 280512, 'steps': 1460, 'loss/train': 3.892705202102661} -11/06/2021 21:28:44 - INFO - __main__ - Step 1462: {'lr': 0.00036525, 'samples': 280704, 'steps': 1461, 'loss/train': 3.5692012310028076} -11/06/2021 21:28:45 - INFO - __main__ - Step 1463: {'lr': 0.0003655, 'samples': 280896, 'steps': 1462, 'loss/train': 3.964817762374878} -11/06/2021 21:28:46 - INFO - __main__ - Step 1464: {'lr': 0.00036575, 'samples': 281088, 'steps': 1463, 'loss/train': 3.4829154014587402} -11/06/2021 21:28:46 - INFO - __main__ - Step 1465: {'lr': 0.000366, 'samples': 281280, 'steps': 1464, 'loss/train': 3.2892184257507324} -11/06/2021 21:28:46 - INFO - __main__ - Step 1466: {'lr': 0.00036625000000000004, 'samples': 281472, 'steps': 1465, 'loss/train': 3.158153772354126} -11/06/2021 21:28:47 - INFO - __main__ - Step 1467: {'lr': 0.0003665, 'samples': 281664, 'steps': 1466, 'loss/train': 3.4137485027313232} -11/06/2021 21:28:48 - INFO - __main__ - Step 1468: {'lr': 0.00036675000000000005, 'samples': 281856, 'steps': 1467, 'loss/train': 3.1349167823791504} -11/06/2021 21:28:48 - INFO - __main__ - Step 1469: {'lr': 0.000367, 'samples': 282048, 'steps': 1468, 'loss/train': 2.7978010177612305} -11/06/2021 21:28:48 - INFO - __main__ - Step 1470: {'lr': 0.00036725, 'samples': 282240, 'steps': 1469, 'loss/train': 3.418675184249878} -11/06/2021 21:28:49 - INFO - __main__ - Step 1471: {'lr': 0.0003675, 'samples': 282432, 'steps': 1470, 'loss/train': 3.3369407653808594} -11/06/2021 21:28:49 - INFO - __main__ - Step 1472: {'lr': 0.00036775, 'samples': 282624, 'steps': 1471, 'loss/train': 3.0756335258483887} -11/06/2021 21:28:50 - INFO - __main__ - Step 1473: {'lr': 0.000368, 'samples': 282816, 'steps': 1472, 'loss/train': 3.3924009799957275} -11/06/2021 21:28:51 - INFO - __main__ - Step 1474: {'lr': 0.00036825000000000003, 'samples': 283008, 'steps': 1473, 'loss/train': 3.3130877017974854} -11/06/2021 21:28:51 - INFO - __main__ - Step 1475: {'lr': 0.0003685, 'samples': 283200, 'steps': 1474, 'loss/train': 2.7034976482391357} -11/06/2021 21:28:51 - INFO - __main__ - Step 1476: {'lr': 0.00036875000000000005, 'samples': 283392, 'steps': 1475, 'loss/train': 2.9324753284454346} -11/06/2021 21:28:52 - INFO - __main__ - Step 1477: {'lr': 0.000369, 'samples': 283584, 'steps': 1476, 'loss/train': 3.632042407989502} -11/06/2021 21:28:53 - INFO - __main__ - Step 1478: {'lr': 0.00036925, 'samples': 283776, 'steps': 1477, 'loss/train': 3.7734642028808594} -11/06/2021 21:28:54 - INFO - __main__ - Step 1479: {'lr': 0.0003695, 'samples': 283968, 'steps': 1478, 'loss/train': 3.285372018814087} -11/06/2021 21:28:54 - INFO - __main__ - Step 1480: {'lr': 0.00036975, 'samples': 284160, 'steps': 1479, 'loss/train': 3.5449750423431396} -11/06/2021 21:28:54 - INFO - __main__ - Step 1481: {'lr': 0.00037, 'samples': 284352, 'steps': 1480, 'loss/train': 3.1665492057800293} -11/06/2021 21:28:55 - INFO - __main__ - Step 1482: {'lr': 0.00037025000000000003, 'samples': 284544, 'steps': 1481, 'loss/train': 2.68510103225708} -11/06/2021 21:28:55 - INFO - __main__ - Step 1483: {'lr': 0.0003705, 'samples': 284736, 'steps': 1482, 'loss/train': 3.09177303314209} -11/06/2021 21:28:56 - INFO - __main__ - Step 1484: {'lr': 0.00037075000000000004, 'samples': 284928, 'steps': 1483, 'loss/train': 0.934282124042511} -11/06/2021 21:28:57 - INFO - __main__ - Step 1485: {'lr': 0.000371, 'samples': 285120, 'steps': 1484, 'loss/train': 0.7881891131401062} -11/06/2021 21:28:57 - INFO - __main__ - Step 1486: {'lr': 0.00037125000000000005, 'samples': 285312, 'steps': 1485, 'loss/train': 3.3031082153320312} -11/06/2021 21:28:58 - INFO - __main__ - Step 1487: {'lr': 0.00037150000000000003, 'samples': 285504, 'steps': 1486, 'loss/train': 3.4887430667877197} -11/06/2021 21:28:58 - INFO - __main__ - Step 1488: {'lr': 0.00037175, 'samples': 285696, 'steps': 1487, 'loss/train': 3.392094850540161} -11/06/2021 21:28:58 - INFO - __main__ - Step 1489: {'lr': 0.000372, 'samples': 285888, 'steps': 1488, 'loss/train': 3.5077946186065674} -11/06/2021 21:28:59 - INFO - __main__ - Step 1490: {'lr': 0.00037225, 'samples': 286080, 'steps': 1489, 'loss/train': 3.9329774379730225} -11/06/2021 21:29:00 - INFO - __main__ - Step 1491: {'lr': 0.0003725, 'samples': 286272, 'steps': 1490, 'loss/train': 3.5324740409851074} -11/06/2021 21:29:00 - INFO - __main__ - Step 1492: {'lr': 0.00037275000000000003, 'samples': 286464, 'steps': 1491, 'loss/train': 2.4463398456573486} -11/06/2021 21:29:00 - INFO - __main__ - Step 1493: {'lr': 0.000373, 'samples': 286656, 'steps': 1492, 'loss/train': 3.127577066421509} -11/06/2021 21:29:01 - INFO - __main__ - Step 1494: {'lr': 0.00037325000000000005, 'samples': 286848, 'steps': 1493, 'loss/train': 1.6627174615859985} -11/06/2021 21:29:03 - INFO - __main__ - Step 1495: {'lr': 0.0003735, 'samples': 287040, 'steps': 1494, 'loss/train': 3.5371575355529785} -11/06/2021 21:29:03 - INFO - __main__ - Step 1496: {'lr': 0.00037375000000000006, 'samples': 287232, 'steps': 1495, 'loss/train': 3.178628921508789} -11/06/2021 21:29:03 - INFO - __main__ - Step 1497: {'lr': 0.000374, 'samples': 287424, 'steps': 1496, 'loss/train': 2.7111098766326904} -11/06/2021 21:29:04 - INFO - __main__ - Step 1498: {'lr': 0.00037425, 'samples': 287616, 'steps': 1497, 'loss/train': 4.202212810516357} -11/06/2021 21:29:04 - INFO - __main__ - Step 1499: {'lr': 0.0003745, 'samples': 287808, 'steps': 1498, 'loss/train': 3.379865884780884} -11/06/2021 21:29:04 - INFO - __main__ - Step 1500: {'lr': 0.00037475000000000003, 'samples': 288000, 'steps': 1499, 'loss/train': 3.4952762126922607} -11/06/2021 21:29:05 - INFO - __main__ - Step 1501: {'lr': 0.000375, 'samples': 288192, 'steps': 1500, 'loss/train': 4.174196720123291} -11/06/2021 21:29:06 - INFO - __main__ - Step 1502: {'lr': 0.00037525, 'samples': 288384, 'steps': 1501, 'loss/train': 3.272667169570923} -11/06/2021 21:29:06 - INFO - __main__ - Step 1503: {'lr': 0.0003755, 'samples': 288576, 'steps': 1502, 'loss/train': 2.8478939533233643} -11/06/2021 21:29:07 - INFO - __main__ - Step 1504: {'lr': 0.00037575, 'samples': 288768, 'steps': 1503, 'loss/train': 4.3909077644348145} -11/06/2021 21:29:07 - INFO - __main__ - Step 1505: {'lr': 0.00037600000000000003, 'samples': 288960, 'steps': 1504, 'loss/train': 3.602169990539551} -11/06/2021 21:29:08 - INFO - __main__ - Step 1506: {'lr': 0.00037624999999999996, 'samples': 289152, 'steps': 1505, 'loss/train': 3.1311495304107666} -11/06/2021 21:29:08 - INFO - __main__ - Step 1507: {'lr': 0.0003765, 'samples': 289344, 'steps': 1506, 'loss/train': 2.88991379737854} -11/06/2021 21:29:09 - INFO - __main__ - Step 1508: {'lr': 0.00037674999999999997, 'samples': 289536, 'steps': 1507, 'loss/train': 2.8797428607940674} -11/06/2021 21:29:09 - INFO - __main__ - Step 1509: {'lr': 0.000377, 'samples': 289728, 'steps': 1508, 'loss/train': 3.3940863609313965} -11/06/2021 21:29:09 - INFO - __main__ - Step 1510: {'lr': 0.00037725, 'samples': 289920, 'steps': 1509, 'loss/train': 3.036484479904175} -11/06/2021 21:29:10 - INFO - __main__ - Step 1511: {'lr': 0.0003775, 'samples': 290112, 'steps': 1510, 'loss/train': 4.253868579864502} -11/06/2021 21:29:11 - INFO - __main__ - Step 1512: {'lr': 0.00037775, 'samples': 290304, 'steps': 1511, 'loss/train': 3.5372188091278076} -11/06/2021 21:29:11 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 3.0633351802825928} -11/06/2021 21:29:12 - INFO - __main__ - Step 1514: {'lr': 0.00037825, 'samples': 290688, 'steps': 1513, 'loss/train': 3.378868818283081} -11/06/2021 21:29:12 - INFO - __main__ - Step 1515: {'lr': 0.0003785, 'samples': 290880, 'steps': 1514, 'loss/train': 4.058987140655518} -11/06/2021 21:29:12 - INFO - __main__ - Step 1516: {'lr': 0.00037874999999999996, 'samples': 291072, 'steps': 1515, 'loss/train': 3.8939054012298584} -11/06/2021 21:29:14 - INFO - __main__ - Step 1517: {'lr': 0.000379, 'samples': 291264, 'steps': 1516, 'loss/train': 3.405064344406128} -11/06/2021 21:29:15 - INFO - __main__ - Step 1518: {'lr': 0.00037925, 'samples': 291456, 'steps': 1517, 'loss/train': 3.7268097400665283} -11/06/2021 21:29:15 - INFO - __main__ - Step 1519: {'lr': 0.0003795, 'samples': 291648, 'steps': 1518, 'loss/train': 3.949538469314575} -11/06/2021 21:29:16 - INFO - __main__ - Step 1520: {'lr': 0.00037975, 'samples': 291840, 'steps': 1519, 'loss/train': 2.9000167846679688} -11/06/2021 21:29:16 - INFO - __main__ - Step 1521: {'lr': 0.00038, 'samples': 292032, 'steps': 1520, 'loss/train': 1.4307708740234375} -11/06/2021 21:29:16 - INFO - __main__ - Step 1522: {'lr': 0.00038025, 'samples': 292224, 'steps': 1521, 'loss/train': 1.3860046863555908} -11/06/2021 21:29:17 - INFO - __main__ - Step 1523: {'lr': 0.00038050000000000003, 'samples': 292416, 'steps': 1522, 'loss/train': 1.1130292415618896} -11/06/2021 21:29:18 - INFO - __main__ - Step 1524: {'lr': 0.00038075, 'samples': 292608, 'steps': 1523, 'loss/train': 3.4155771732330322} -11/06/2021 21:29:18 - INFO - __main__ - Step 1525: {'lr': 0.000381, 'samples': 292800, 'steps': 1524, 'loss/train': 3.0278680324554443} -11/06/2021 21:29:19 - INFO - __main__ - Step 1526: {'lr': 0.00038124999999999997, 'samples': 292992, 'steps': 1525, 'loss/train': 3.4204211235046387} -11/06/2021 21:29:19 - INFO - __main__ - Step 1527: {'lr': 0.0003815, 'samples': 293184, 'steps': 1526, 'loss/train': 2.968132972717285} -11/06/2021 21:29:19 - INFO - __main__ - Step 1528: {'lr': 0.00038175, 'samples': 293376, 'steps': 1527, 'loss/train': 3.8879196643829346} -11/06/2021 21:29:20 - INFO - __main__ - Step 1529: {'lr': 0.000382, 'samples': 293568, 'steps': 1528, 'loss/train': 3.570026159286499} -11/06/2021 21:29:21 - INFO - __main__ - Step 1530: {'lr': 0.00038225, 'samples': 293760, 'steps': 1529, 'loss/train': 3.1837944984436035} -11/06/2021 21:29:21 - INFO - __main__ - Step 1531: {'lr': 0.00038250000000000003, 'samples': 293952, 'steps': 1530, 'loss/train': 2.6540393829345703} -11/06/2021 21:29:22 - INFO - __main__ - Step 1532: {'lr': 0.00038275, 'samples': 294144, 'steps': 1531, 'loss/train': 2.824615478515625} -11/06/2021 21:29:22 - INFO - __main__ - Step 1533: {'lr': 0.00038300000000000004, 'samples': 294336, 'steps': 1532, 'loss/train': 2.8562939167022705} -11/06/2021 21:29:23 - INFO - __main__ - Step 1534: {'lr': 0.00038324999999999996, 'samples': 294528, 'steps': 1533, 'loss/train': 3.2858169078826904} -11/06/2021 21:29:23 - INFO - __main__ - Step 1535: {'lr': 0.0003835, 'samples': 294720, 'steps': 1534, 'loss/train': 3.5091545581817627} -11/06/2021 21:29:24 - INFO - __main__ - Step 1536: {'lr': 0.00038375, 'samples': 294912, 'steps': 1535, 'loss/train': 3.2510337829589844} -11/06/2021 21:29:24 - INFO - __main__ - Step 1537: {'lr': 0.000384, 'samples': 295104, 'steps': 1536, 'loss/train': 3.5380523204803467} -11/06/2021 21:29:24 - INFO - __main__ - Step 1538: {'lr': 0.00038425, 'samples': 295296, 'steps': 1537, 'loss/train': 2.9871280193328857} -11/06/2021 21:29:25 - INFO - __main__ - Step 1539: {'lr': 0.0003845, 'samples': 295488, 'steps': 1538, 'loss/train': 3.5664308071136475} -11/06/2021 21:29:26 - INFO - __main__ - Step 1540: {'lr': 0.00038475, 'samples': 295680, 'steps': 1539, 'loss/train': 3.1113128662109375} -11/06/2021 21:29:26 - INFO - __main__ - Step 1541: {'lr': 0.00038500000000000003, 'samples': 295872, 'steps': 1540, 'loss/train': 4.263197422027588} -11/06/2021 21:29:26 - INFO - __main__ - Step 1542: {'lr': 0.00038525, 'samples': 296064, 'steps': 1541, 'loss/train': 3.313586711883545} -11/06/2021 21:29:27 - INFO - __main__ - Step 1543: {'lr': 0.0003855, 'samples': 296256, 'steps': 1542, 'loss/train': 3.427462100982666} -11/06/2021 21:29:27 - INFO - __main__ - Step 1544: {'lr': 0.00038574999999999997, 'samples': 296448, 'steps': 1543, 'loss/train': 4.165167808532715} -11/06/2021 21:29:28 - INFO - __main__ - Step 1545: {'lr': 0.000386, 'samples': 296640, 'steps': 1544, 'loss/train': 3.6539011001586914} -11/06/2021 21:29:29 - INFO - __main__ - Step 1546: {'lr': 0.00038625, 'samples': 296832, 'steps': 1545, 'loss/train': 3.510122060775757} -11/06/2021 21:29:29 - INFO - __main__ - Step 1547: {'lr': 0.0003865, 'samples': 297024, 'steps': 1546, 'loss/train': 3.2956809997558594} -11/06/2021 21:29:29 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 3.2712979316711426} -11/06/2021 21:29:30 - INFO - __main__ - Step 1549: {'lr': 0.00038700000000000003, 'samples': 297408, 'steps': 1548, 'loss/train': 2.8422179222106934} -11/06/2021 21:29:31 - INFO - __main__ - Step 1550: {'lr': 0.00038725, 'samples': 297600, 'steps': 1549, 'loss/train': 3.2148244380950928} -11/06/2021 21:29:31 - INFO - __main__ - Step 1551: {'lr': 0.00038750000000000004, 'samples': 297792, 'steps': 1550, 'loss/train': 3.082228422164917} -11/06/2021 21:29:31 - INFO - __main__ - Step 1552: {'lr': 0.00038774999999999997, 'samples': 297984, 'steps': 1551, 'loss/train': 3.0857651233673096} -11/06/2021 21:29:32 - INFO - __main__ - Step 1553: {'lr': 0.000388, 'samples': 298176, 'steps': 1552, 'loss/train': 3.537327289581299} -11/06/2021 21:29:32 - INFO - __main__ - Step 1554: {'lr': 0.00038825, 'samples': 298368, 'steps': 1553, 'loss/train': 3.118391275405884} -11/06/2021 21:29:33 - INFO - __main__ - Step 1555: {'lr': 0.0003885, 'samples': 298560, 'steps': 1554, 'loss/train': 3.2976584434509277} -11/06/2021 21:29:34 - INFO - __main__ - Step 1556: {'lr': 0.00038875, 'samples': 298752, 'steps': 1555, 'loss/train': 3.208622694015503} -11/06/2021 21:29:34 - INFO - __main__ - Step 1557: {'lr': 0.000389, 'samples': 298944, 'steps': 1556, 'loss/train': 2.393932580947876} -11/06/2021 21:29:35 - INFO - __main__ - Step 1558: {'lr': 0.00038925, 'samples': 299136, 'steps': 1557, 'loss/train': 3.1180825233459473} -11/06/2021 21:29:35 - INFO - __main__ - Step 1559: {'lr': 0.00038950000000000003, 'samples': 299328, 'steps': 1558, 'loss/train': 3.363607406616211} -11/06/2021 21:29:35 - INFO - __main__ - Step 1560: {'lr': 0.00038975, 'samples': 299520, 'steps': 1559, 'loss/train': 3.7669551372528076} -11/06/2021 21:29:36 - INFO - __main__ - Step 1561: {'lr': 0.00039000000000000005, 'samples': 299712, 'steps': 1560, 'loss/train': 2.959444284439087} -11/06/2021 21:29:37 - INFO - __main__ - Step 1562: {'lr': 0.00039024999999999997, 'samples': 299904, 'steps': 1561, 'loss/train': 3.453453779220581} -11/06/2021 21:29:37 - INFO - __main__ - Step 1563: {'lr': 0.0003905, 'samples': 300096, 'steps': 1562, 'loss/train': 3.2474799156188965} -11/06/2021 21:29:37 - INFO - __main__ - Step 1564: {'lr': 0.00039075, 'samples': 300288, 'steps': 1563, 'loss/train': 3.6809487342834473} -11/06/2021 21:29:38 - INFO - __main__ - Step 1565: {'lr': 0.000391, 'samples': 300480, 'steps': 1564, 'loss/train': 3.5540361404418945} -11/06/2021 21:29:39 - INFO - __main__ - Step 1566: {'lr': 0.00039125, 'samples': 300672, 'steps': 1565, 'loss/train': 3.8347136974334717} -11/06/2021 21:29:39 - INFO - __main__ - Step 1567: {'lr': 0.00039150000000000003, 'samples': 300864, 'steps': 1566, 'loss/train': 3.0421507358551025} -11/06/2021 21:29:40 - INFO - __main__ - Step 1568: {'lr': 0.00039175, 'samples': 301056, 'steps': 1567, 'loss/train': 2.8751606941223145} -11/06/2021 21:29:40 - INFO - __main__ - Step 1569: {'lr': 0.00039200000000000004, 'samples': 301248, 'steps': 1568, 'loss/train': 2.795197010040283} -11/06/2021 21:29:40 - INFO - __main__ - Step 1570: {'lr': 0.00039225, 'samples': 301440, 'steps': 1569, 'loss/train': 2.370975971221924} -11/06/2021 21:29:41 - INFO - __main__ - Step 1571: {'lr': 0.0003925, 'samples': 301632, 'steps': 1570, 'loss/train': 2.498239040374756} -11/06/2021 21:29:42 - INFO - __main__ - Step 1572: {'lr': 0.00039275, 'samples': 301824, 'steps': 1571, 'loss/train': 1.6988508701324463} -11/06/2021 21:29:42 - INFO - __main__ - Step 1573: {'lr': 0.000393, 'samples': 302016, 'steps': 1572, 'loss/train': 4.021992206573486} -11/06/2021 21:29:42 - INFO - __main__ - Step 1574: {'lr': 0.00039325, 'samples': 302208, 'steps': 1573, 'loss/train': 2.898738145828247} -11/06/2021 21:29:43 - INFO - __main__ - Step 1575: {'lr': 0.0003935, 'samples': 302400, 'steps': 1574, 'loss/train': 2.607938289642334} -11/06/2021 21:29:43 - INFO - __main__ - Step 1576: {'lr': 0.00039375, 'samples': 302592, 'steps': 1575, 'loss/train': 3.263978958129883} -11/06/2021 21:29:44 - INFO - __main__ - Step 1577: {'lr': 0.00039400000000000004, 'samples': 302784, 'steps': 1576, 'loss/train': 2.8440113067626953} -11/06/2021 21:29:44 - INFO - __main__ - Step 1578: {'lr': 0.00039425, 'samples': 302976, 'steps': 1577, 'loss/train': 3.6558189392089844} -11/06/2021 21:29:45 - INFO - __main__ - Step 1579: {'lr': 0.00039450000000000005, 'samples': 303168, 'steps': 1578, 'loss/train': 3.0387959480285645} -11/06/2021 21:29:45 - INFO - __main__ - Step 1580: {'lr': 0.00039474999999999997, 'samples': 303360, 'steps': 1579, 'loss/train': 3.356081008911133} -11/06/2021 21:29:46 - INFO - __main__ - Step 1581: {'lr': 0.000395, 'samples': 303552, 'steps': 1580, 'loss/train': 2.985703706741333} -11/06/2021 21:29:47 - INFO - __main__ - Step 1582: {'lr': 0.00039525, 'samples': 303744, 'steps': 1581, 'loss/train': 3.263591766357422} -11/06/2021 21:29:47 - INFO - __main__ - Step 1583: {'lr': 0.0003955, 'samples': 303936, 'steps': 1582, 'loss/train': 3.0408103466033936} -11/06/2021 21:29:47 - INFO - __main__ - Step 1584: {'lr': 0.00039575, 'samples': 304128, 'steps': 1583, 'loss/train': 3.310321807861328} -11/06/2021 21:29:48 - INFO - __main__ - Step 1585: {'lr': 0.00039600000000000003, 'samples': 304320, 'steps': 1584, 'loss/train': 2.9202144145965576} -11/06/2021 21:29:48 - INFO - __main__ - Step 1586: {'lr': 0.00039625, 'samples': 304512, 'steps': 1585, 'loss/train': 3.2440686225891113} -11/06/2021 21:29:49 - INFO - __main__ - Step 1587: {'lr': 0.00039650000000000004, 'samples': 304704, 'steps': 1586, 'loss/train': 3.232225179672241} -11/06/2021 21:29:49 - INFO - __main__ - Step 1588: {'lr': 0.00039675, 'samples': 304896, 'steps': 1587, 'loss/train': 3.2099974155426025} -11/06/2021 21:29:50 - INFO - __main__ - Step 1589: {'lr': 0.00039700000000000005, 'samples': 305088, 'steps': 1588, 'loss/train': 2.729403018951416} -11/06/2021 21:29:50 - INFO - __main__ - Step 1590: {'lr': 0.00039725, 'samples': 305280, 'steps': 1589, 'loss/train': 2.7173776626586914} -11/06/2021 21:29:50 - INFO - __main__ - Step 1591: {'lr': 0.0003975, 'samples': 305472, 'steps': 1590, 'loss/train': 3.206320285797119} -11/06/2021 21:29:51 - INFO - __main__ - Step 1592: {'lr': 0.00039775, 'samples': 305664, 'steps': 1591, 'loss/train': 2.313783884048462} -11/06/2021 21:29:52 - INFO - __main__ - Step 1593: {'lr': 0.000398, 'samples': 305856, 'steps': 1592, 'loss/train': 3.254606008529663} -11/06/2021 21:29:52 - INFO - __main__ - Step 1594: {'lr': 0.00039825, 'samples': 306048, 'steps': 1593, 'loss/train': 3.374396324157715} -11/06/2021 21:29:52 - INFO - __main__ - Step 1595: {'lr': 0.00039850000000000004, 'samples': 306240, 'steps': 1594, 'loss/train': 3.533506155014038} -11/06/2021 21:29:53 - INFO - __main__ - Step 1596: {'lr': 0.00039875, 'samples': 306432, 'steps': 1595, 'loss/train': 2.543515205383301} -11/06/2021 21:29:54 - INFO - __main__ - Step 1597: {'lr': 0.00039900000000000005, 'samples': 306624, 'steps': 1596, 'loss/train': 2.980104684829712} -11/06/2021 21:29:54 - INFO - __main__ - Step 1598: {'lr': 0.00039925000000000003, 'samples': 306816, 'steps': 1597, 'loss/train': 2.649993896484375} -11/06/2021 21:29:55 - INFO - __main__ - Step 1599: {'lr': 0.0003995, 'samples': 307008, 'steps': 1598, 'loss/train': 2.8795385360717773} -11/06/2021 21:29:55 - INFO - __main__ - Step 1600: {'lr': 0.00039975, 'samples': 307200, 'steps': 1599, 'loss/train': 3.1416678428649902} -11/06/2021 21:29:55 - INFO - __main__ - Step 1601: {'lr': 0.0004, 'samples': 307392, 'steps': 1600, 'loss/train': 2.955704689025879} -11/06/2021 21:29:56 - INFO - __main__ - Step 1602: {'lr': 0.00040025, 'samples': 307584, 'steps': 1601, 'loss/train': 3.7033560276031494} -11/06/2021 21:29:57 - INFO - __main__ - Step 1603: {'lr': 0.00040050000000000003, 'samples': 307776, 'steps': 1602, 'loss/train': 2.7389466762542725} -11/06/2021 21:29:57 - INFO - __main__ - Step 1604: {'lr': 0.00040075, 'samples': 307968, 'steps': 1603, 'loss/train': 3.5183396339416504} -11/06/2021 21:29:58 - INFO - __main__ - Step 1605: {'lr': 0.00040100000000000004, 'samples': 308160, 'steps': 1604, 'loss/train': 3.134627103805542} -11/06/2021 21:29:58 - INFO - __main__ - Step 1606: {'lr': 0.00040125, 'samples': 308352, 'steps': 1605, 'loss/train': 2.952859878540039} -11/06/2021 21:29:58 - INFO - __main__ - Step 1607: {'lr': 0.00040150000000000006, 'samples': 308544, 'steps': 1606, 'loss/train': 3.224421977996826} -11/06/2021 21:29:59 - INFO - __main__ - Step 1608: {'lr': 0.00040175, 'samples': 308736, 'steps': 1607, 'loss/train': 2.4461114406585693} -11/06/2021 21:30:00 - INFO - __main__ - Step 1609: {'lr': 0.000402, 'samples': 308928, 'steps': 1608, 'loss/train': 3.342259645462036} -11/06/2021 21:30:00 - INFO - __main__ - Step 1610: {'lr': 0.00040225, 'samples': 309120, 'steps': 1609, 'loss/train': 3.2026968002319336} -11/06/2021 21:30:00 - INFO - __main__ - Step 1611: {'lr': 0.0004025, 'samples': 309312, 'steps': 1610, 'loss/train': 3.4691827297210693} -11/06/2021 21:30:01 - INFO - __main__ - Step 1612: {'lr': 0.00040275, 'samples': 309504, 'steps': 1611, 'loss/train': 3.279484987258911} -11/06/2021 21:30:02 - INFO - __main__ - Step 1613: {'lr': 0.00040300000000000004, 'samples': 309696, 'steps': 1612, 'loss/train': 3.016733407974243} -11/06/2021 21:30:02 - INFO - __main__ - Step 1614: {'lr': 0.00040325, 'samples': 309888, 'steps': 1613, 'loss/train': 3.192936897277832} -11/06/2021 21:30:02 - INFO - __main__ - Step 1615: {'lr': 0.00040350000000000005, 'samples': 310080, 'steps': 1614, 'loss/train': 3.0827951431274414} -11/06/2021 21:30:03 - INFO - __main__ - Step 1616: {'lr': 0.00040375000000000003, 'samples': 310272, 'steps': 1615, 'loss/train': 2.6593739986419678} -11/06/2021 21:30:03 - INFO - __main__ - Step 1617: {'lr': 0.000404, 'samples': 310464, 'steps': 1616, 'loss/train': 2.6806726455688477} -11/06/2021 21:30:04 - INFO - __main__ - Step 1618: {'lr': 0.00040425, 'samples': 310656, 'steps': 1617, 'loss/train': 2.476854085922241} -11/06/2021 21:30:04 - INFO - __main__ - Step 1619: {'lr': 0.0004045, 'samples': 310848, 'steps': 1618, 'loss/train': 3.110135793685913} -11/06/2021 21:30:05 - INFO - __main__ - Step 1620: {'lr': 0.00040475, 'samples': 311040, 'steps': 1619, 'loss/train': 2.908262014389038} -11/06/2021 21:30:05 - INFO - __main__ - Step 1621: {'lr': 0.00040500000000000003, 'samples': 311232, 'steps': 1620, 'loss/train': 3.027345657348633} -11/06/2021 21:30:05 - INFO - __main__ - Step 1622: {'lr': 0.00040525, 'samples': 311424, 'steps': 1621, 'loss/train': 3.2688331604003906} -11/06/2021 21:30:07 - INFO - __main__ - Step 1623: {'lr': 0.00040550000000000004, 'samples': 311616, 'steps': 1622, 'loss/train': 2.6070456504821777} -11/06/2021 21:30:07 - INFO - __main__ - Step 1624: {'lr': 0.00040575, 'samples': 311808, 'steps': 1623, 'loss/train': 3.40415620803833} -11/06/2021 21:30:07 - INFO - __main__ - Step 1625: {'lr': 0.00040600000000000006, 'samples': 312000, 'steps': 1624, 'loss/train': 3.013209819793701} -11/06/2021 21:30:08 - INFO - __main__ - Step 1626: {'lr': 0.00040625000000000004, 'samples': 312192, 'steps': 1625, 'loss/train': 2.7747411727905273} -11/06/2021 21:30:08 - INFO - __main__ - Step 1627: {'lr': 0.00040649999999999996, 'samples': 312384, 'steps': 1626, 'loss/train': 2.614873170852661} -11/06/2021 21:30:09 - INFO - __main__ - Step 1628: {'lr': 0.00040675, 'samples': 312576, 'steps': 1627, 'loss/train': 2.9833312034606934} -11/06/2021 21:30:09 - INFO - __main__ - Step 1629: {'lr': 0.00040699999999999997, 'samples': 312768, 'steps': 1628, 'loss/train': 3.6013989448547363} -11/06/2021 21:30:10 - INFO - __main__ - Step 1630: {'lr': 0.00040725, 'samples': 312960, 'steps': 1629, 'loss/train': 3.32792067527771} -11/06/2021 21:30:10 - INFO - __main__ - Step 1631: {'lr': 0.0004075, 'samples': 313152, 'steps': 1630, 'loss/train': 2.2372703552246094} -11/06/2021 21:30:10 - INFO - __main__ - Step 1632: {'lr': 0.00040775, 'samples': 313344, 'steps': 1631, 'loss/train': 3.2227723598480225} -11/06/2021 21:30:11 - INFO - __main__ - Step 1633: {'lr': 0.000408, 'samples': 313536, 'steps': 1632, 'loss/train': 2.9736287593841553} -11/06/2021 21:30:12 - INFO - __main__ - Step 1634: {'lr': 0.00040825000000000003, 'samples': 313728, 'steps': 1633, 'loss/train': 3.227055072784424} -11/06/2021 21:30:12 - INFO - __main__ - Step 1635: {'lr': 0.0004085, 'samples': 313920, 'steps': 1634, 'loss/train': 4.195490837097168} -11/06/2021 21:30:13 - INFO - __main__ - Step 1636: {'lr': 0.00040875, 'samples': 314112, 'steps': 1635, 'loss/train': 2.5357518196105957} -11/06/2021 21:30:13 - INFO - __main__ - Step 1637: {'lr': 0.00040899999999999997, 'samples': 314304, 'steps': 1636, 'loss/train': 3.0355074405670166} -11/06/2021 21:30:13 - INFO - __main__ - Step 1638: {'lr': 0.00040925, 'samples': 314496, 'steps': 1637, 'loss/train': 3.301243305206299} -11/06/2021 21:30:14 - INFO - __main__ - Step 1639: {'lr': 0.0004095, 'samples': 314688, 'steps': 1638, 'loss/train': 3.4538841247558594} -11/06/2021 21:30:15 - INFO - __main__ - Step 1640: {'lr': 0.00040975, 'samples': 314880, 'steps': 1639, 'loss/train': 3.0793862342834473} -11/06/2021 21:30:15 - INFO - __main__ - Step 1641: {'lr': 0.00041, 'samples': 315072, 'steps': 1640, 'loss/train': 3.042006492614746} -11/06/2021 21:30:15 - INFO - __main__ - Step 1642: {'lr': 0.00041025, 'samples': 315264, 'steps': 1641, 'loss/train': 2.085822105407715} -11/06/2021 21:30:16 - INFO - __main__ - Step 1643: {'lr': 0.0004105, 'samples': 315456, 'steps': 1642, 'loss/train': 3.430644989013672} -11/06/2021 21:30:17 - INFO - __main__ - Step 1644: {'lr': 0.00041075000000000004, 'samples': 315648, 'steps': 1643, 'loss/train': 2.801948308944702} -11/06/2021 21:30:17 - INFO - __main__ - Step 1645: {'lr': 0.00041099999999999996, 'samples': 315840, 'steps': 1644, 'loss/train': 2.5270915031433105} -11/06/2021 21:30:18 - INFO - __main__ - Step 1646: {'lr': 0.00041125, 'samples': 316032, 'steps': 1645, 'loss/train': 2.423734188079834} -11/06/2021 21:30:18 - INFO - __main__ - Step 1647: {'lr': 0.0004115, 'samples': 316224, 'steps': 1646, 'loss/train': 3.113656520843506} -11/06/2021 21:30:18 - INFO - __main__ - Step 1648: {'lr': 0.00041175, 'samples': 316416, 'steps': 1647, 'loss/train': 3.738720655441284} -11/06/2021 21:30:19 - INFO - __main__ - Step 1649: {'lr': 0.000412, 'samples': 316608, 'steps': 1648, 'loss/train': 3.3871734142303467} -11/06/2021 21:30:20 - INFO - __main__ - Step 1650: {'lr': 0.00041225, 'samples': 316800, 'steps': 1649, 'loss/train': 3.1259071826934814} -11/06/2021 21:30:20 - INFO - __main__ - Step 1651: {'lr': 0.0004125, 'samples': 316992, 'steps': 1650, 'loss/train': 2.9349560737609863} -11/06/2021 21:30:21 - INFO - __main__ - Step 1652: {'lr': 0.00041275000000000003, 'samples': 317184, 'steps': 1651, 'loss/train': 2.337951183319092} -11/06/2021 21:30:21 - INFO - __main__ - Step 1653: {'lr': 0.000413, 'samples': 317376, 'steps': 1652, 'loss/train': 3.269364595413208} -11/06/2021 21:30:21 - INFO - __main__ - Step 1654: {'lr': 0.00041325, 'samples': 317568, 'steps': 1653, 'loss/train': 2.937201499938965} -11/06/2021 21:30:22 - INFO - __main__ - Step 1655: {'lr': 0.00041349999999999997, 'samples': 317760, 'steps': 1654, 'loss/train': 3.1462650299072266} -11/06/2021 21:30:23 - INFO - __main__ - Step 1656: {'lr': 0.00041375, 'samples': 317952, 'steps': 1655, 'loss/train': 3.218020439147949} -11/06/2021 21:30:23 - INFO - __main__ - Step 1657: {'lr': 0.000414, 'samples': 318144, 'steps': 1656, 'loss/train': 2.919787645339966} -11/06/2021 21:30:23 - INFO - __main__ - Step 1658: {'lr': 0.00041425, 'samples': 318336, 'steps': 1657, 'loss/train': 2.882232666015625} -11/06/2021 21:30:24 - INFO - __main__ - Step 1659: {'lr': 0.0004145, 'samples': 318528, 'steps': 1658, 'loss/train': 3.018845558166504} -11/06/2021 21:30:24 - INFO - __main__ - Step 1660: {'lr': 0.00041475, 'samples': 318720, 'steps': 1659, 'loss/train': 3.1834557056427} -11/06/2021 21:30:25 - INFO - __main__ - Step 1661: {'lr': 0.000415, 'samples': 318912, 'steps': 1660, 'loss/train': 2.9305548667907715} -11/06/2021 21:30:26 - INFO - __main__ - Step 1662: {'lr': 0.00041525000000000004, 'samples': 319104, 'steps': 1661, 'loss/train': 2.6207032203674316} -11/06/2021 21:30:26 - INFO - __main__ - Step 1663: {'lr': 0.00041549999999999996, 'samples': 319296, 'steps': 1662, 'loss/train': 2.4517478942871094} -11/06/2021 21:30:26 - INFO - __main__ - Step 1664: {'lr': 0.00041575, 'samples': 319488, 'steps': 1663, 'loss/train': 3.7537591457366943} -11/06/2021 21:30:27 - INFO - __main__ - Step 1665: {'lr': 0.000416, 'samples': 319680, 'steps': 1664, 'loss/train': 2.756814956665039} -11/06/2021 21:30:28 - INFO - __main__ - Step 1666: {'lr': 0.00041625, 'samples': 319872, 'steps': 1665, 'loss/train': 1.4056485891342163} -11/06/2021 21:30:28 - INFO - __main__ - Step 1667: {'lr': 0.0004165, 'samples': 320064, 'steps': 1666, 'loss/train': 3.1112024784088135} -11/06/2021 21:30:29 - INFO - __main__ - Step 1668: {'lr': 0.00041675, 'samples': 320256, 'steps': 1667, 'loss/train': 2.9976048469543457} -11/06/2021 21:30:29 - INFO - __main__ - Step 1669: {'lr': 0.000417, 'samples': 320448, 'steps': 1668, 'loss/train': 2.675729274749756} -11/06/2021 21:30:29 - INFO - __main__ - Step 1670: {'lr': 0.00041725000000000003, 'samples': 320640, 'steps': 1669, 'loss/train': 3.3706750869750977} -11/06/2021 21:30:30 - INFO - __main__ - Step 1671: {'lr': 0.0004175, 'samples': 320832, 'steps': 1670, 'loss/train': 2.178697109222412} -11/06/2021 21:30:31 - INFO - __main__ - Step 1672: {'lr': 0.00041775000000000004, 'samples': 321024, 'steps': 1671, 'loss/train': 3.380084753036499} -11/06/2021 21:30:31 - INFO - __main__ - Step 1673: {'lr': 0.00041799999999999997, 'samples': 321216, 'steps': 1672, 'loss/train': 3.366750717163086} -11/06/2021 21:30:31 - INFO - __main__ - Step 1674: {'lr': 0.00041825, 'samples': 321408, 'steps': 1673, 'loss/train': 3.209273338317871} -11/06/2021 21:30:32 - INFO - __main__ - Step 1675: {'lr': 0.0004185, 'samples': 321600, 'steps': 1674, 'loss/train': 2.97452449798584} -11/06/2021 21:30:32 - INFO - __main__ - Step 1676: {'lr': 0.00041875, 'samples': 321792, 'steps': 1675, 'loss/train': 2.767279863357544} -11/06/2021 21:30:33 - INFO - __main__ - Step 1677: {'lr': 0.000419, 'samples': 321984, 'steps': 1676, 'loss/train': 2.001840114593506} -11/06/2021 21:30:34 - INFO - __main__ - Step 1678: {'lr': 0.00041925, 'samples': 322176, 'steps': 1677, 'loss/train': 2.869393825531006} -11/06/2021 21:30:34 - INFO - __main__ - Step 1679: {'lr': 0.0004195, 'samples': 322368, 'steps': 1678, 'loss/train': 3.0054664611816406} -11/06/2021 21:30:34 - INFO - __main__ - Step 1680: {'lr': 0.00041975000000000004, 'samples': 322560, 'steps': 1679, 'loss/train': 3.0030410289764404} -11/06/2021 21:30:35 - INFO - __main__ - Step 1681: {'lr': 0.00042, 'samples': 322752, 'steps': 1680, 'loss/train': 3.1293513774871826} -11/06/2021 21:30:36 - INFO - __main__ - Step 1682: {'lr': 0.00042025, 'samples': 322944, 'steps': 1681, 'loss/train': 2.867621421813965} -11/06/2021 21:30:36 - INFO - __main__ - Step 1683: {'lr': 0.0004205, 'samples': 323136, 'steps': 1682, 'loss/train': 3.148564100265503} -11/06/2021 21:30:36 - INFO - __main__ - Step 1684: {'lr': 0.00042075, 'samples': 323328, 'steps': 1683, 'loss/train': 3.7352867126464844} -11/06/2021 21:30:37 - INFO - __main__ - Step 1685: {'lr': 0.000421, 'samples': 323520, 'steps': 1684, 'loss/train': 2.9373221397399902} -11/06/2021 21:30:37 - INFO - __main__ - Step 1686: {'lr': 0.00042125, 'samples': 323712, 'steps': 1685, 'loss/train': 3.0616962909698486} -11/06/2021 21:30:38 - INFO - __main__ - Step 1687: {'lr': 0.0004215, 'samples': 323904, 'steps': 1686, 'loss/train': 3.012714147567749} -11/06/2021 21:30:38 - INFO - __main__ - Step 1688: {'lr': 0.00042175000000000003, 'samples': 324096, 'steps': 1687, 'loss/train': 2.1148290634155273} -11/06/2021 21:30:39 - INFO - __main__ - Step 1689: {'lr': 0.000422, 'samples': 324288, 'steps': 1688, 'loss/train': 2.7919063568115234} -11/06/2021 21:30:39 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 2.9707889556884766} -11/06/2021 21:30:39 - INFO - __main__ - Step 1691: {'lr': 0.00042249999999999997, 'samples': 324672, 'steps': 1690, 'loss/train': 2.998028039932251} -11/06/2021 21:30:40 - INFO - __main__ - Step 1692: {'lr': 0.00042275, 'samples': 324864, 'steps': 1691, 'loss/train': 2.591597557067871} -11/06/2021 21:30:41 - INFO - __main__ - Step 1693: {'lr': 0.000423, 'samples': 325056, 'steps': 1692, 'loss/train': 1.9363735914230347} -11/06/2021 21:30:41 - INFO - __main__ - Step 1694: {'lr': 0.00042325, 'samples': 325248, 'steps': 1693, 'loss/train': 4.028586387634277} -11/06/2021 21:30:42 - INFO - __main__ - Step 1695: {'lr': 0.0004235, 'samples': 325440, 'steps': 1694, 'loss/train': 2.9330668449401855} -11/06/2021 21:30:42 - INFO - __main__ - Step 1696: {'lr': 0.00042375000000000003, 'samples': 325632, 'steps': 1695, 'loss/train': 2.7509193420410156} -11/06/2021 21:30:42 - INFO - __main__ - Step 1697: {'lr': 0.000424, 'samples': 325824, 'steps': 1696, 'loss/train': 2.7954797744750977} -11/06/2021 21:30:44 - INFO - __main__ - Step 1698: {'lr': 0.00042425000000000004, 'samples': 326016, 'steps': 1697, 'loss/train': 2.988008499145508} -11/06/2021 21:30:44 - INFO - __main__ - Step 1699: {'lr': 0.0004245, 'samples': 326208, 'steps': 1698, 'loss/train': 1.511644959449768} -11/06/2021 21:30:44 - INFO - __main__ - Step 1700: {'lr': 0.00042475000000000005, 'samples': 326400, 'steps': 1699, 'loss/train': 2.778535842895508} -11/06/2021 21:30:45 - INFO - __main__ - Step 1701: {'lr': 0.000425, 'samples': 326592, 'steps': 1700, 'loss/train': 3.4467451572418213} -11/06/2021 21:30:45 - INFO - __main__ - Step 1702: {'lr': 0.00042525, 'samples': 326784, 'steps': 1701, 'loss/train': 2.888021469116211} -11/06/2021 21:30:46 - INFO - __main__ - Step 1703: {'lr': 0.0004255, 'samples': 326976, 'steps': 1702, 'loss/train': 3.509974718093872} -11/06/2021 21:30:46 - INFO - __main__ - Step 1704: {'lr': 0.00042575, 'samples': 327168, 'steps': 1703, 'loss/train': 3.2961580753326416} -11/06/2021 21:30:47 - INFO - __main__ - Step 1705: {'lr': 0.000426, 'samples': 327360, 'steps': 1704, 'loss/train': 2.881072521209717} -11/06/2021 21:30:47 - INFO - __main__ - Step 1706: {'lr': 0.00042625000000000003, 'samples': 327552, 'steps': 1705, 'loss/train': 2.8724474906921387} -11/06/2021 21:30:48 - INFO - __main__ - Step 1707: {'lr': 0.0004265, 'samples': 327744, 'steps': 1706, 'loss/train': 2.812833547592163} -11/06/2021 21:30:49 - INFO - __main__ - Step 1708: {'lr': 0.00042675000000000005, 'samples': 327936, 'steps': 1707, 'loss/train': 2.946378231048584} -11/06/2021 21:30:49 - INFO - __main__ - Step 1709: {'lr': 0.000427, 'samples': 328128, 'steps': 1708, 'loss/train': 3.0991225242614746} -11/06/2021 21:30:49 - INFO - __main__ - Step 1710: {'lr': 0.00042725, 'samples': 328320, 'steps': 1709, 'loss/train': 2.76066517829895} -11/06/2021 21:30:50 - INFO - __main__ - Step 1711: {'lr': 0.0004275, 'samples': 328512, 'steps': 1710, 'loss/train': 3.4125115871429443} -11/06/2021 21:30:50 - INFO - __main__ - Step 1712: {'lr': 0.00042775, 'samples': 328704, 'steps': 1711, 'loss/train': 3.148629903793335} -11/06/2021 21:30:51 - INFO - __main__ - Step 1713: {'lr': 0.000428, 'samples': 328896, 'steps': 1712, 'loss/train': 2.9542479515075684} -11/06/2021 21:30:51 - INFO - __main__ - Step 1714: {'lr': 0.00042825000000000003, 'samples': 329088, 'steps': 1713, 'loss/train': 2.862802743911743} -11/06/2021 21:30:52 - INFO - __main__ - Step 1715: {'lr': 0.0004285, 'samples': 329280, 'steps': 1714, 'loss/train': 3.073770046234131} -11/06/2021 21:30:52 - INFO - __main__ - Step 1716: {'lr': 0.00042875000000000004, 'samples': 329472, 'steps': 1715, 'loss/train': 3.261838436126709} -11/06/2021 21:30:52 - INFO - __main__ - Step 1717: {'lr': 0.000429, 'samples': 329664, 'steps': 1716, 'loss/train': 2.599968194961548} -11/06/2021 21:30:53 - INFO - __main__ - Step 1718: {'lr': 0.00042925000000000005, 'samples': 329856, 'steps': 1717, 'loss/train': 2.516638994216919} -11/06/2021 21:30:54 - INFO - __main__ - Step 1719: {'lr': 0.0004295, 'samples': 330048, 'steps': 1718, 'loss/train': 3.0501821041107178} -11/06/2021 21:30:54 - INFO - __main__ - Step 1720: {'lr': 0.00042975, 'samples': 330240, 'steps': 1719, 'loss/train': 2.847111225128174} -11/06/2021 21:30:55 - INFO - __main__ - Step 1721: {'lr': 0.00043, 'samples': 330432, 'steps': 1720, 'loss/train': 3.3006772994995117} -11/06/2021 21:30:55 - INFO - __main__ - Step 1722: {'lr': 0.00043025, 'samples': 330624, 'steps': 1721, 'loss/train': 2.7652220726013184} -11/06/2021 21:30:55 - INFO - __main__ - Step 1723: {'lr': 0.0004305, 'samples': 330816, 'steps': 1722, 'loss/train': 2.9833667278289795} -11/06/2021 21:30:56 - INFO - __main__ - Step 1724: {'lr': 0.00043075000000000003, 'samples': 331008, 'steps': 1723, 'loss/train': 2.814836263656616} -11/06/2021 21:30:57 - INFO - __main__ - Step 1725: {'lr': 0.000431, 'samples': 331200, 'steps': 1724, 'loss/train': 2.774881601333618} -11/06/2021 21:30:57 - INFO - __main__ - Step 1726: {'lr': 0.00043125000000000005, 'samples': 331392, 'steps': 1725, 'loss/train': 2.4785728454589844} -11/06/2021 21:30:57 - INFO - __main__ - Step 1727: {'lr': 0.0004315, 'samples': 331584, 'steps': 1726, 'loss/train': 2.6767044067382812} -11/06/2021 21:30:58 - INFO - __main__ - Step 1728: {'lr': 0.00043175, 'samples': 331776, 'steps': 1727, 'loss/train': 2.493360757827759} -11/06/2021 21:30:59 - INFO - __main__ - Step 1729: {'lr': 0.000432, 'samples': 331968, 'steps': 1728, 'loss/train': 2.8869781494140625} -11/06/2021 21:30:59 - INFO - __main__ - Step 1730: {'lr': 0.00043225, 'samples': 332160, 'steps': 1729, 'loss/train': 3.2163848876953125} -11/06/2021 21:30:59 - INFO - __main__ - Step 1731: {'lr': 0.0004325, 'samples': 332352, 'steps': 1730, 'loss/train': 2.487175703048706} -11/06/2021 21:31:00 - INFO - __main__ - Step 1732: {'lr': 0.00043275000000000003, 'samples': 332544, 'steps': 1731, 'loss/train': 3.1521098613739014} -11/06/2021 21:31:00 - INFO - __main__ - Step 1733: {'lr': 0.000433, 'samples': 332736, 'steps': 1732, 'loss/train': 2.8074662685394287} -11/06/2021 21:31:01 - INFO - __main__ - Step 1734: {'lr': 0.00043325000000000004, 'samples': 332928, 'steps': 1733, 'loss/train': 3.05580735206604} -11/06/2021 21:31:01 - INFO - __main__ - Step 1735: {'lr': 0.0004335, 'samples': 333120, 'steps': 1734, 'loss/train': 3.6109087467193604} -11/06/2021 21:31:02 - INFO - __main__ - Step 1736: {'lr': 0.00043375000000000005, 'samples': 333312, 'steps': 1735, 'loss/train': 2.645113945007324} -11/06/2021 21:31:02 - INFO - __main__ - Step 1737: {'lr': 0.00043400000000000003, 'samples': 333504, 'steps': 1736, 'loss/train': 3.2458112239837646} -11/06/2021 21:31:02 - INFO - __main__ - Step 1738: {'lr': 0.00043425, 'samples': 333696, 'steps': 1737, 'loss/train': 2.0575199127197266} -11/06/2021 21:31:03 - INFO - __main__ - Step 1739: {'lr': 0.0004345, 'samples': 333888, 'steps': 1738, 'loss/train': 2.66829514503479} -11/06/2021 21:31:04 - INFO - __main__ - Step 1740: {'lr': 0.00043475, 'samples': 334080, 'steps': 1739, 'loss/train': 2.9333367347717285} -11/06/2021 21:31:04 - INFO - __main__ - Step 1741: {'lr': 0.000435, 'samples': 334272, 'steps': 1740, 'loss/train': 3.1755714416503906} -11/06/2021 21:31:04 - INFO - __main__ - Step 1742: {'lr': 0.00043525000000000004, 'samples': 334464, 'steps': 1741, 'loss/train': 3.1603219509124756} -11/06/2021 21:31:05 - INFO - __main__ - Step 1743: {'lr': 0.0004355, 'samples': 334656, 'steps': 1742, 'loss/train': 2.6941590309143066} -11/06/2021 21:31:05 - INFO - __main__ - Step 1744: {'lr': 0.00043575000000000005, 'samples': 334848, 'steps': 1743, 'loss/train': 2.652301788330078} -11/06/2021 21:31:06 - INFO - __main__ - Step 1745: {'lr': 0.000436, 'samples': 335040, 'steps': 1744, 'loss/train': 2.9104788303375244} -11/06/2021 21:31:06 - INFO - __main__ - Step 1746: {'lr': 0.00043625000000000006, 'samples': 335232, 'steps': 1745, 'loss/train': 2.98048996925354} -11/06/2021 21:31:07 - INFO - __main__ - Step 1747: {'lr': 0.0004365, 'samples': 335424, 'steps': 1746, 'loss/train': 2.9957258701324463} -11/06/2021 21:31:07 - INFO - __main__ - Step 1748: {'lr': 0.00043675, 'samples': 335616, 'steps': 1747, 'loss/train': 2.979066848754883} -11/06/2021 21:31:08 - INFO - __main__ - Step 1749: {'lr': 0.000437, 'samples': 335808, 'steps': 1748, 'loss/train': 2.8784215450286865} -11/06/2021 21:31:09 - INFO - __main__ - Step 1750: {'lr': 0.00043725000000000003, 'samples': 336000, 'steps': 1749, 'loss/train': 2.7070152759552} -11/06/2021 21:31:09 - INFO - __main__ - Step 1751: {'lr': 0.0004375, 'samples': 336192, 'steps': 1750, 'loss/train': 3.0066816806793213} -11/06/2021 21:31:09 - INFO - __main__ - Step 1752: {'lr': 0.00043775, 'samples': 336384, 'steps': 1751, 'loss/train': 2.9297680854797363} -11/06/2021 21:31:10 - INFO - __main__ - Step 1753: {'lr': 0.000438, 'samples': 336576, 'steps': 1752, 'loss/train': 2.3090498447418213} -11/06/2021 21:31:10 - INFO - __main__ - Step 1754: {'lr': 0.00043825, 'samples': 336768, 'steps': 1753, 'loss/train': 2.7136483192443848} -11/06/2021 21:31:11 - INFO - __main__ - Step 1755: {'lr': 0.00043850000000000003, 'samples': 336960, 'steps': 1754, 'loss/train': 2.4475595951080322} -11/06/2021 21:31:11 - INFO - __main__ - Step 1756: {'lr': 0.00043874999999999996, 'samples': 337152, 'steps': 1755, 'loss/train': 2.8239781856536865} -11/06/2021 21:31:12 - INFO - __main__ - Step 1757: {'lr': 0.000439, 'samples': 337344, 'steps': 1756, 'loss/train': 3.583254337310791} -11/06/2021 21:31:12 - INFO - __main__ - Step 1758: {'lr': 0.00043924999999999997, 'samples': 337536, 'steps': 1757, 'loss/train': 2.8755791187286377} -11/06/2021 21:31:12 - INFO - __main__ - Step 1759: {'lr': 0.0004395, 'samples': 337728, 'steps': 1758, 'loss/train': 2.466693878173828} -11/06/2021 21:31:14 - INFO - __main__ - Step 1760: {'lr': 0.00043975, 'samples': 337920, 'steps': 1759, 'loss/train': 1.9713040590286255} -11/06/2021 21:31:14 - INFO - __main__ - Step 1761: {'lr': 0.00044, 'samples': 338112, 'steps': 1760, 'loss/train': 2.958988904953003} -11/06/2021 21:31:14 - INFO - __main__ - Step 1762: {'lr': 0.00044025, 'samples': 338304, 'steps': 1761, 'loss/train': 2.85742449760437} -11/06/2021 21:31:15 - INFO - __main__ - Step 1763: {'lr': 0.00044050000000000003, 'samples': 338496, 'steps': 1762, 'loss/train': 3.1893415451049805} -11/06/2021 21:31:15 - INFO - __main__ - Step 1764: {'lr': 0.00044075, 'samples': 338688, 'steps': 1763, 'loss/train': 2.489380121231079} -11/06/2021 21:31:16 - INFO - __main__ - Step 1765: {'lr': 0.000441, 'samples': 338880, 'steps': 1764, 'loss/train': 2.26016902923584} -11/06/2021 21:31:16 - INFO - __main__ - Step 1766: {'lr': 0.00044124999999999996, 'samples': 339072, 'steps': 1765, 'loss/train': 2.8823275566101074} -11/06/2021 21:31:17 - INFO - __main__ - Step 1767: {'lr': 0.0004415, 'samples': 339264, 'steps': 1766, 'loss/train': 3.0336639881134033} -11/06/2021 21:31:17 - INFO - __main__ - Step 1768: {'lr': 0.00044175, 'samples': 339456, 'steps': 1767, 'loss/train': 2.4429008960723877} -11/06/2021 21:31:17 - INFO - __main__ - Step 1769: {'lr': 0.000442, 'samples': 339648, 'steps': 1768, 'loss/train': 3.196798086166382} -11/06/2021 21:31:18 - INFO - __main__ - Step 1770: {'lr': 0.00044225, 'samples': 339840, 'steps': 1769, 'loss/train': 3.4543304443359375} -11/06/2021 21:31:19 - INFO - __main__ - Step 1771: {'lr': 0.0004425, 'samples': 340032, 'steps': 1770, 'loss/train': 2.851696252822876} -11/06/2021 21:31:19 - INFO - __main__ - Step 1772: {'lr': 0.00044275, 'samples': 340224, 'steps': 1771, 'loss/train': 3.060702085494995} -11/06/2021 21:31:19 - INFO - __main__ - Step 1773: {'lr': 0.00044300000000000003, 'samples': 340416, 'steps': 1772, 'loss/train': 2.7474842071533203} -11/06/2021 21:31:20 - INFO - __main__ - Step 1774: {'lr': 0.00044325, 'samples': 340608, 'steps': 1773, 'loss/train': 2.9190454483032227} -11/06/2021 21:31:21 - INFO - __main__ - Step 1775: {'lr': 0.0004435, 'samples': 340800, 'steps': 1774, 'loss/train': 2.802793025970459} -11/06/2021 21:31:21 - INFO - __main__ - Step 1776: {'lr': 0.00044374999999999997, 'samples': 340992, 'steps': 1775, 'loss/train': 2.8785560131073} -11/06/2021 21:31:21 - INFO - __main__ - Step 1777: {'lr': 0.000444, 'samples': 341184, 'steps': 1776, 'loss/train': 2.995643138885498} -11/06/2021 21:31:22 - INFO - __main__ - Step 1778: {'lr': 0.00044425, 'samples': 341376, 'steps': 1777, 'loss/train': 1.8993228673934937} -11/06/2021 21:31:22 - INFO - __main__ - Step 1779: {'lr': 0.0004445, 'samples': 341568, 'steps': 1778, 'loss/train': 2.85463547706604} -11/06/2021 21:31:23 - INFO - __main__ - Step 1780: {'lr': 0.00044475, 'samples': 341760, 'steps': 1779, 'loss/train': 2.185767650604248} -11/06/2021 21:31:24 - INFO - __main__ - Step 1781: {'lr': 0.00044500000000000003, 'samples': 341952, 'steps': 1780, 'loss/train': 2.92201828956604} -11/06/2021 21:31:24 - INFO - __main__ - Step 1782: {'lr': 0.00044525, 'samples': 342144, 'steps': 1781, 'loss/train': 3.134248971939087} -11/06/2021 21:31:24 - INFO - __main__ - Step 1783: {'lr': 0.00044550000000000004, 'samples': 342336, 'steps': 1782, 'loss/train': 2.170048952102661} -11/06/2021 21:31:25 - INFO - __main__ - Step 1784: {'lr': 0.00044574999999999997, 'samples': 342528, 'steps': 1783, 'loss/train': 3.8918814659118652} -11/06/2021 21:31:26 - INFO - __main__ - Step 1785: {'lr': 0.000446, 'samples': 342720, 'steps': 1784, 'loss/train': 2.8046724796295166} -11/06/2021 21:31:26 - INFO - __main__ - Step 1786: {'lr': 0.00044625, 'samples': 342912, 'steps': 1785, 'loss/train': 1.7093374729156494} -11/06/2021 21:31:26 - INFO - __main__ - Step 1787: {'lr': 0.0004465, 'samples': 343104, 'steps': 1786, 'loss/train': 2.761946678161621} -11/06/2021 21:31:27 - INFO - __main__ - Step 1788: {'lr': 0.00044675, 'samples': 343296, 'steps': 1787, 'loss/train': 3.1174871921539307} -11/06/2021 21:31:27 - INFO - __main__ - Step 1789: {'lr': 0.000447, 'samples': 343488, 'steps': 1788, 'loss/train': 0.9450645446777344} -11/06/2021 21:31:27 - INFO - __main__ - Step 1790: {'lr': 0.00044725, 'samples': 343680, 'steps': 1789, 'loss/train': 2.685868263244629} -11/06/2021 21:31:28 - INFO - __main__ - Step 1791: {'lr': 0.00044750000000000004, 'samples': 343872, 'steps': 1790, 'loss/train': 3.149627685546875} -11/06/2021 21:31:29 - INFO - __main__ - Step 1792: {'lr': 0.00044775, 'samples': 344064, 'steps': 1791, 'loss/train': 2.8557493686676025} -11/06/2021 21:31:29 - INFO - __main__ - Step 1793: {'lr': 0.000448, 'samples': 344256, 'steps': 1792, 'loss/train': 2.3917579650878906} -11/06/2021 21:31:29 - INFO - __main__ - Step 1794: {'lr': 0.00044824999999999997, 'samples': 344448, 'steps': 1793, 'loss/train': 2.5539019107818604} -11/06/2021 21:31:30 - INFO - __main__ - Step 1795: {'lr': 0.0004485, 'samples': 344640, 'steps': 1794, 'loss/train': 2.866556167602539} -11/06/2021 21:31:31 - INFO - __main__ - Step 1796: {'lr': 0.00044875, 'samples': 344832, 'steps': 1795, 'loss/train': 2.69342303276062} -11/06/2021 21:31:31 - INFO - __main__ - Step 1797: {'lr': 0.000449, 'samples': 345024, 'steps': 1796, 'loss/train': 3.4725310802459717} -11/06/2021 21:31:32 - INFO - __main__ - Step 1798: {'lr': 0.00044925, 'samples': 345216, 'steps': 1797, 'loss/train': 3.1553845405578613} -11/06/2021 21:31:32 - INFO - __main__ - Step 1799: {'lr': 0.00044950000000000003, 'samples': 345408, 'steps': 1798, 'loss/train': 2.5512850284576416} -11/06/2021 21:31:32 - INFO - __main__ - Step 1800: {'lr': 0.00044975, 'samples': 345600, 'steps': 1799, 'loss/train': 2.6328558921813965} -11/06/2021 21:31:33 - INFO - __main__ - Step 1801: {'lr': 0.00045000000000000004, 'samples': 345792, 'steps': 1800, 'loss/train': 2.415855646133423} -11/06/2021 21:31:34 - INFO - __main__ - Step 1802: {'lr': 0.00045024999999999997, 'samples': 345984, 'steps': 1801, 'loss/train': 2.065478801727295} -11/06/2021 21:31:34 - INFO - __main__ - Step 1803: {'lr': 0.0004505, 'samples': 346176, 'steps': 1802, 'loss/train': 3.1000237464904785} -11/06/2021 21:31:34 - INFO - __main__ - Step 1804: {'lr': 0.00045075, 'samples': 346368, 'steps': 1803, 'loss/train': 3.079942464828491} -11/06/2021 21:31:35 - INFO - __main__ - Step 1805: {'lr': 0.000451, 'samples': 346560, 'steps': 1804, 'loss/train': 2.9212794303894043} -11/06/2021 21:31:36 - INFO - __main__ - Step 1806: {'lr': 0.00045125, 'samples': 346752, 'steps': 1805, 'loss/train': 2.327099323272705} -11/06/2021 21:31:36 - INFO - __main__ - Step 1807: {'lr': 0.0004515, 'samples': 346944, 'steps': 1806, 'loss/train': 2.2962563037872314} -11/06/2021 21:31:36 - INFO - __main__ - Step 1808: {'lr': 0.00045175, 'samples': 347136, 'steps': 1807, 'loss/train': 2.611140012741089} -11/06/2021 21:31:37 - INFO - __main__ - Step 1809: {'lr': 0.00045200000000000004, 'samples': 347328, 'steps': 1808, 'loss/train': 2.6826744079589844} -11/06/2021 21:31:37 - INFO - __main__ - Step 1810: {'lr': 0.00045225, 'samples': 347520, 'steps': 1809, 'loss/train': 1.936403512954712} -11/06/2021 21:31:38 - INFO - __main__ - Step 1811: {'lr': 0.00045250000000000005, 'samples': 347712, 'steps': 1810, 'loss/train': 2.373436450958252} -11/06/2021 21:31:39 - INFO - __main__ - Step 1812: {'lr': 0.00045275, 'samples': 347904, 'steps': 1811, 'loss/train': 2.730616807937622} -11/06/2021 21:31:39 - INFO - __main__ - Step 1813: {'lr': 0.000453, 'samples': 348096, 'steps': 1812, 'loss/train': 2.415011405944824} -11/06/2021 21:31:39 - INFO - __main__ - Step 1814: {'lr': 0.00045325, 'samples': 348288, 'steps': 1813, 'loss/train': 3.2586300373077393} -11/06/2021 21:31:40 - INFO - __main__ - Step 1815: {'lr': 0.0004535, 'samples': 348480, 'steps': 1814, 'loss/train': 2.568127155303955} -11/06/2021 21:31:40 - INFO - __main__ - Step 1816: {'lr': 0.00045375, 'samples': 348672, 'steps': 1815, 'loss/train': 2.9116480350494385} -11/06/2021 21:31:41 - INFO - __main__ - Step 1817: {'lr': 0.00045400000000000003, 'samples': 348864, 'steps': 1816, 'loss/train': 2.36753249168396} -11/06/2021 21:31:41 - INFO - __main__ - Step 1818: {'lr': 0.00045425, 'samples': 349056, 'steps': 1817, 'loss/train': 1.9278064966201782} -11/06/2021 21:31:42 - INFO - __main__ - Step 1819: {'lr': 0.00045450000000000004, 'samples': 349248, 'steps': 1818, 'loss/train': 3.1639034748077393} -11/06/2021 21:31:42 - INFO - __main__ - Step 1820: {'lr': 0.00045475, 'samples': 349440, 'steps': 1819, 'loss/train': 2.775869846343994} -11/06/2021 21:31:42 - INFO - __main__ - Step 1821: {'lr': 0.000455, 'samples': 349632, 'steps': 1820, 'loss/train': 1.739648699760437} -11/06/2021 21:31:44 - INFO - __main__ - Step 1822: {'lr': 0.00045525, 'samples': 349824, 'steps': 1821, 'loss/train': 2.914762258529663} -11/06/2021 21:31:44 - INFO - __main__ - Step 1823: {'lr': 0.0004555, 'samples': 350016, 'steps': 1822, 'loss/train': 2.881727457046509} -11/06/2021 21:31:44 - INFO - __main__ - Step 1824: {'lr': 0.00045575, 'samples': 350208, 'steps': 1823, 'loss/train': 2.6797189712524414} -11/06/2021 21:31:45 - INFO - __main__ - Step 1825: {'lr': 0.000456, 'samples': 350400, 'steps': 1824, 'loss/train': 3.1673336029052734} -11/06/2021 21:31:45 - INFO - __main__ - Step 1826: {'lr': 0.00045625, 'samples': 350592, 'steps': 1825, 'loss/train': 2.9814321994781494} -11/06/2021 21:31:45 - INFO - __main__ - Step 1827: {'lr': 0.00045650000000000004, 'samples': 350784, 'steps': 1826, 'loss/train': 2.706651210784912} -11/06/2021 21:31:47 - INFO - __main__ - Step 1828: {'lr': 0.00045675, 'samples': 350976, 'steps': 1827, 'loss/train': 2.262235403060913} -11/06/2021 21:31:47 - INFO - __main__ - Step 1829: {'lr': 0.00045700000000000005, 'samples': 351168, 'steps': 1828, 'loss/train': 3.5420644283294678} -11/06/2021 21:31:47 - INFO - __main__ - Step 1830: {'lr': 0.00045725, 'samples': 351360, 'steps': 1829, 'loss/train': 2.597929000854492} -11/06/2021 21:31:48 - INFO - __main__ - Step 1831: {'lr': 0.0004575, 'samples': 351552, 'steps': 1830, 'loss/train': 3.1444313526153564} -11/06/2021 21:31:48 - INFO - __main__ - Step 1832: {'lr': 0.00045775, 'samples': 351744, 'steps': 1831, 'loss/train': 2.755781650543213} -11/06/2021 21:31:49 - INFO - __main__ - Step 1833: {'lr': 0.000458, 'samples': 351936, 'steps': 1832, 'loss/train': 2.7278811931610107} -11/06/2021 21:31:50 - INFO - __main__ - Step 1834: {'lr': 0.00045825, 'samples': 352128, 'steps': 1833, 'loss/train': 3.7509689331054688} -11/06/2021 21:31:50 - INFO - __main__ - Step 1835: {'lr': 0.00045850000000000003, 'samples': 352320, 'steps': 1834, 'loss/train': 2.9152324199676514} -11/06/2021 21:31:50 - INFO - __main__ - Step 1836: {'lr': 0.00045875, 'samples': 352512, 'steps': 1835, 'loss/train': 3.254568338394165} -11/06/2021 21:31:51 - INFO - __main__ - Step 1837: {'lr': 0.00045900000000000004, 'samples': 352704, 'steps': 1836, 'loss/train': 3.5360164642333984} -11/06/2021 21:31:51 - INFO - __main__ - Step 1838: {'lr': 0.00045925, 'samples': 352896, 'steps': 1837, 'loss/train': 2.5410776138305664} -11/06/2021 21:31:52 - INFO - __main__ - Step 1839: {'lr': 0.00045950000000000006, 'samples': 353088, 'steps': 1838, 'loss/train': 3.515568971633911} -11/06/2021 21:31:52 - INFO - __main__ - Step 1840: {'lr': 0.00045975, 'samples': 353280, 'steps': 1839, 'loss/train': 2.9194540977478027} -11/06/2021 21:31:53 - INFO - __main__ - Step 1841: {'lr': 0.00046, 'samples': 353472, 'steps': 1840, 'loss/train': 3.339538335800171} -11/06/2021 21:31:53 - INFO - __main__ - Step 1842: {'lr': 0.00046025, 'samples': 353664, 'steps': 1841, 'loss/train': 3.2247955799102783} -11/06/2021 21:31:53 - INFO - __main__ - Step 1843: {'lr': 0.0004605, 'samples': 353856, 'steps': 1842, 'loss/train': 2.9142487049102783} -11/06/2021 21:31:54 - INFO - __main__ - Step 1844: {'lr': 0.00046075, 'samples': 354048, 'steps': 1843, 'loss/train': 3.003730058670044} -11/06/2021 21:31:55 - INFO - __main__ - Step 1845: {'lr': 0.00046100000000000004, 'samples': 354240, 'steps': 1844, 'loss/train': 2.9719865322113037} -11/06/2021 21:31:55 - INFO - __main__ - Step 1846: {'lr': 0.00046125, 'samples': 354432, 'steps': 1845, 'loss/train': 2.9568333625793457} -11/06/2021 21:31:55 - INFO - __main__ - Step 1847: {'lr': 0.00046150000000000005, 'samples': 354624, 'steps': 1846, 'loss/train': 3.0182647705078125} -11/06/2021 21:31:56 - INFO - __main__ - Step 1848: {'lr': 0.00046175000000000003, 'samples': 354816, 'steps': 1847, 'loss/train': 2.928616762161255} -11/06/2021 21:31:57 - INFO - __main__ - Step 1849: {'lr': 0.000462, 'samples': 355008, 'steps': 1848, 'loss/train': 2.610539674758911} -11/06/2021 21:31:57 - INFO - __main__ - Step 1850: {'lr': 0.00046225, 'samples': 355200, 'steps': 1849, 'loss/train': 2.6568455696105957} -11/06/2021 21:31:57 - INFO - __main__ - Step 1851: {'lr': 0.0004625, 'samples': 355392, 'steps': 1850, 'loss/train': 3.0052649974823} -11/06/2021 21:31:58 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 2.291944980621338} -11/06/2021 21:31:58 - INFO - __main__ - Step 1853: {'lr': 0.00046300000000000003, 'samples': 355776, 'steps': 1852, 'loss/train': 2.464561700820923} -11/06/2021 21:31:59 - INFO - __main__ - Step 1854: {'lr': 0.00046325, 'samples': 355968, 'steps': 1853, 'loss/train': 2.724757671356201} -11/06/2021 21:32:00 - INFO - __main__ - Step 1855: {'lr': 0.00046350000000000004, 'samples': 356160, 'steps': 1854, 'loss/train': 2.5522210597991943} -11/06/2021 21:32:00 - INFO - __main__ - Step 1856: {'lr': 0.00046375, 'samples': 356352, 'steps': 1855, 'loss/train': 2.9748101234436035} -11/06/2021 21:32:00 - INFO - __main__ - Step 1857: {'lr': 0.00046400000000000006, 'samples': 356544, 'steps': 1856, 'loss/train': 2.8747081756591797} -11/06/2021 21:32:01 - INFO - __main__ - Step 1858: {'lr': 0.00046425, 'samples': 356736, 'steps': 1857, 'loss/train': 3.183314085006714} -11/06/2021 21:32:01 - INFO - __main__ - Step 1859: {'lr': 0.0004645, 'samples': 356928, 'steps': 1858, 'loss/train': 2.9345762729644775} -11/06/2021 21:32:02 - INFO - __main__ - Step 1860: {'lr': 0.00046475, 'samples': 357120, 'steps': 1859, 'loss/train': 2.89750337600708} -11/06/2021 21:32:02 - INFO - __main__ - Step 1861: {'lr': 0.000465, 'samples': 357312, 'steps': 1860, 'loss/train': 2.8957128524780273} -11/06/2021 21:32:03 - INFO - __main__ - Step 1862: {'lr': 0.00046525, 'samples': 357504, 'steps': 1861, 'loss/train': 3.1396281719207764} -11/06/2021 21:32:03 - INFO - __main__ - Step 1863: {'lr': 0.00046550000000000004, 'samples': 357696, 'steps': 1862, 'loss/train': 2.8213651180267334} -11/06/2021 21:32:03 - INFO - __main__ - Step 1864: {'lr': 0.00046575, 'samples': 357888, 'steps': 1863, 'loss/train': 3.4859542846679688} -11/06/2021 21:32:04 - INFO - __main__ - Step 1865: {'lr': 0.00046600000000000005, 'samples': 358080, 'steps': 1864, 'loss/train': 2.8421342372894287} -11/06/2021 21:32:05 - INFO - __main__ - Step 1866: {'lr': 0.00046625000000000003, 'samples': 358272, 'steps': 1865, 'loss/train': 2.0108532905578613} -11/06/2021 21:32:05 - INFO - __main__ - Step 1867: {'lr': 0.0004665, 'samples': 358464, 'steps': 1866, 'loss/train': 3.0010299682617188} -11/06/2021 21:32:05 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 2.391618013381958} -11/06/2021 21:32:06 - INFO - __main__ - Step 1869: {'lr': 0.000467, 'samples': 358848, 'steps': 1868, 'loss/train': 1.2518956661224365} -11/06/2021 21:32:07 - INFO - __main__ - Step 1870: {'lr': 0.00046725, 'samples': 359040, 'steps': 1869, 'loss/train': 2.0170106887817383} -11/06/2021 21:32:07 - INFO - __main__ - Step 1871: {'lr': 0.00046750000000000003, 'samples': 359232, 'steps': 1870, 'loss/train': 1.179073691368103} -11/06/2021 21:32:08 - INFO - __main__ - Step 1872: {'lr': 0.00046775, 'samples': 359424, 'steps': 1871, 'loss/train': 2.682760715484619} -11/06/2021 21:32:08 - INFO - __main__ - Step 1873: {'lr': 0.00046800000000000005, 'samples': 359616, 'steps': 1872, 'loss/train': 2.571380138397217} -11/06/2021 21:32:08 - INFO - __main__ - Step 1874: {'lr': 0.00046825, 'samples': 359808, 'steps': 1873, 'loss/train': 3.113672971725464} -11/06/2021 21:32:10 - INFO - __main__ - Step 1875: {'lr': 0.00046850000000000006, 'samples': 360000, 'steps': 1874, 'loss/train': 3.40779447555542} -11/06/2021 21:32:10 - INFO - __main__ - Step 1876: {'lr': 0.00046875, 'samples': 360192, 'steps': 1875, 'loss/train': 2.6321020126342773} -11/06/2021 21:32:10 - INFO - __main__ - Step 1877: {'lr': 0.00046899999999999996, 'samples': 360384, 'steps': 1876, 'loss/train': 2.4527957439422607} -11/06/2021 21:32:11 - INFO - __main__ - Step 1878: {'lr': 0.00046925, 'samples': 360576, 'steps': 1877, 'loss/train': 2.8265886306762695} -11/06/2021 21:32:11 - INFO - __main__ - Step 1879: {'lr': 0.0004695, 'samples': 360768, 'steps': 1878, 'loss/train': 2.863210916519165} -11/06/2021 21:32:11 - INFO - __main__ - Step 1880: {'lr': 0.00046975, 'samples': 360960, 'steps': 1879, 'loss/train': 2.7804150581359863} -11/06/2021 21:32:12 - INFO - __main__ - Step 1881: {'lr': 0.00047, 'samples': 361152, 'steps': 1880, 'loss/train': 2.7934844493865967} -11/06/2021 21:32:13 - INFO - __main__ - Step 1882: {'lr': 0.00047025, 'samples': 361344, 'steps': 1881, 'loss/train': 2.5030977725982666} -11/06/2021 21:32:13 - INFO - __main__ - Step 1883: {'lr': 0.0004705, 'samples': 361536, 'steps': 1882, 'loss/train': 2.1091949939727783} -11/06/2021 21:32:13 - INFO - __main__ - Step 1884: {'lr': 0.00047075000000000003, 'samples': 361728, 'steps': 1883, 'loss/train': 2.5549018383026123} -11/06/2021 21:32:14 - INFO - __main__ - Step 1885: {'lr': 0.000471, 'samples': 361920, 'steps': 1884, 'loss/train': 2.7697577476501465} -11/06/2021 21:32:15 - INFO - __main__ - Step 1886: {'lr': 0.00047125, 'samples': 362112, 'steps': 1885, 'loss/train': 2.8604817390441895} -11/06/2021 21:32:15 - INFO - __main__ - Step 1887: {'lr': 0.00047149999999999997, 'samples': 362304, 'steps': 1886, 'loss/train': 2.9714930057525635} -11/06/2021 21:32:16 - INFO - __main__ - Step 1888: {'lr': 0.00047175, 'samples': 362496, 'steps': 1887, 'loss/train': 3.0450122356414795} -11/06/2021 21:32:16 - INFO - __main__ - Step 1889: {'lr': 0.000472, 'samples': 362688, 'steps': 1888, 'loss/train': 2.69807505607605} -11/06/2021 21:32:16 - INFO - __main__ - Step 1890: {'lr': 0.00047225, 'samples': 362880, 'steps': 1889, 'loss/train': 2.992997884750366} -11/06/2021 21:32:17 - INFO - __main__ - Step 1891: {'lr': 0.0004725, 'samples': 363072, 'steps': 1890, 'loss/train': 2.015784740447998} -11/06/2021 21:32:18 - INFO - __main__ - Step 1892: {'lr': 0.00047275, 'samples': 363264, 'steps': 1891, 'loss/train': 2.8816325664520264} -11/06/2021 21:32:18 - INFO - __main__ - Step 1893: {'lr': 0.000473, 'samples': 363456, 'steps': 1892, 'loss/train': 3.2066597938537598} -11/06/2021 21:32:18 - INFO - __main__ - Step 1894: {'lr': 0.00047325000000000004, 'samples': 363648, 'steps': 1893, 'loss/train': 2.5090718269348145} -11/06/2021 21:32:19 - INFO - __main__ - Step 1895: {'lr': 0.00047349999999999996, 'samples': 363840, 'steps': 1894, 'loss/train': 2.715529680252075} -11/06/2021 21:32:19 - INFO - __main__ - Step 1896: {'lr': 0.00047375, 'samples': 364032, 'steps': 1895, 'loss/train': 2.8144490718841553} -11/06/2021 21:32:20 - INFO - __main__ - Step 1897: {'lr': 0.000474, 'samples': 364224, 'steps': 1896, 'loss/train': 2.670848846435547} -11/06/2021 21:32:21 - INFO - __main__ - Step 1898: {'lr': 0.00047425, 'samples': 364416, 'steps': 1897, 'loss/train': 2.614722728729248} -11/06/2021 21:32:21 - INFO - __main__ - Step 1899: {'lr': 0.0004745, 'samples': 364608, 'steps': 1898, 'loss/train': 2.741778612136841} -11/06/2021 21:32:21 - INFO - __main__ - Step 1900: {'lr': 0.00047475, 'samples': 364800, 'steps': 1899, 'loss/train': 3.1232104301452637} -11/06/2021 21:32:22 - INFO - __main__ - Step 1901: {'lr': 0.000475, 'samples': 364992, 'steps': 1900, 'loss/train': 2.564000368118286} -11/06/2021 21:32:23 - INFO - __main__ - Step 1902: {'lr': 0.00047525000000000003, 'samples': 365184, 'steps': 1901, 'loss/train': 2.7664237022399902} -11/06/2021 21:32:23 - INFO - __main__ - Step 1903: {'lr': 0.0004755, 'samples': 365376, 'steps': 1902, 'loss/train': 2.554410934448242} -11/06/2021 21:32:23 - INFO - __main__ - Step 1904: {'lr': 0.00047575, 'samples': 365568, 'steps': 1903, 'loss/train': 2.5446524620056152} -11/06/2021 21:32:24 - INFO - __main__ - Step 1905: {'lr': 0.00047599999999999997, 'samples': 365760, 'steps': 1904, 'loss/train': 2.754312515258789} -11/06/2021 21:32:24 - INFO - __main__ - Step 1906: {'lr': 0.00047625, 'samples': 365952, 'steps': 1905, 'loss/train': 2.7138187885284424} -11/06/2021 21:32:25 - INFO - __main__ - Step 1907: {'lr': 0.0004765, 'samples': 366144, 'steps': 1906, 'loss/train': 2.9011712074279785} -11/06/2021 21:32:25 - INFO - __main__ - Step 1908: {'lr': 0.00047675, 'samples': 366336, 'steps': 1907, 'loss/train': 2.7939672470092773} -11/06/2021 21:32:26 - INFO - __main__ - Step 1909: {'lr': 0.000477, 'samples': 366528, 'steps': 1908, 'loss/train': 3.0879056453704834} -11/06/2021 21:32:26 - INFO - __main__ - Step 1910: {'lr': 0.00047725, 'samples': 366720, 'steps': 1909, 'loss/train': 2.4980082511901855} -11/06/2021 21:32:26 - INFO - __main__ - Step 1911: {'lr': 0.0004775, 'samples': 366912, 'steps': 1910, 'loss/train': 2.949843645095825} -11/06/2021 21:32:27 - INFO - __main__ - Step 1912: {'lr': 0.00047775000000000004, 'samples': 367104, 'steps': 1911, 'loss/train': 2.661370277404785} -11/06/2021 21:32:28 - INFO - __main__ - Step 1913: {'lr': 0.00047799999999999996, 'samples': 367296, 'steps': 1912, 'loss/train': 2.855457305908203} -11/06/2021 21:32:28 - INFO - __main__ - Step 1914: {'lr': 0.00047825, 'samples': 367488, 'steps': 1913, 'loss/train': 2.790748119354248} -11/06/2021 21:32:28 - INFO - __main__ - Step 1915: {'lr': 0.0004785, 'samples': 367680, 'steps': 1914, 'loss/train': 2.1920478343963623} -11/06/2021 21:32:29 - INFO - __main__ - Step 1916: {'lr': 0.00047875, 'samples': 367872, 'steps': 1915, 'loss/train': 3.010140895843506} -11/06/2021 21:32:30 - INFO - __main__ - Step 1917: {'lr': 0.000479, 'samples': 368064, 'steps': 1916, 'loss/train': 2.7934629917144775} -11/06/2021 21:32:30 - INFO - __main__ - Step 1918: {'lr': 0.00047925, 'samples': 368256, 'steps': 1917, 'loss/train': 2.759575128555298} -11/06/2021 21:32:31 - INFO - __main__ - Step 1919: {'lr': 0.0004795, 'samples': 368448, 'steps': 1918, 'loss/train': 2.1986517906188965} -11/06/2021 21:32:31 - INFO - __main__ - Step 1920: {'lr': 0.00047975000000000003, 'samples': 368640, 'steps': 1919, 'loss/train': 2.7708301544189453} -11/06/2021 21:32:31 - INFO - __main__ - Step 1921: {'lr': 0.00048, 'samples': 368832, 'steps': 1920, 'loss/train': 4.627929210662842} -11/06/2021 21:32:32 - INFO - __main__ - Step 1922: {'lr': 0.00048025000000000005, 'samples': 369024, 'steps': 1921, 'loss/train': 2.932852029800415} -11/06/2021 21:32:33 - INFO - __main__ - Step 1923: {'lr': 0.00048049999999999997, 'samples': 369216, 'steps': 1922, 'loss/train': 2.970147132873535} -11/06/2021 21:32:33 - INFO - __main__ - Step 1924: {'lr': 0.00048075, 'samples': 369408, 'steps': 1923, 'loss/train': 3.2570888996124268} -11/06/2021 21:32:33 - INFO - __main__ - Step 1925: {'lr': 0.000481, 'samples': 369600, 'steps': 1924, 'loss/train': 2.7547266483306885} -11/06/2021 21:32:34 - INFO - __main__ - Step 1926: {'lr': 0.00048125, 'samples': 369792, 'steps': 1925, 'loss/train': 2.5552988052368164} -11/06/2021 21:32:34 - INFO - __main__ - Step 1927: {'lr': 0.0004815, 'samples': 369984, 'steps': 1926, 'loss/train': 2.8720643520355225} -11/06/2021 21:32:35 - INFO - __main__ - Step 1928: {'lr': 0.00048175000000000003, 'samples': 370176, 'steps': 1927, 'loss/train': 3.4235241413116455} -11/06/2021 21:32:35 - INFO - __main__ - Step 1929: {'lr': 0.000482, 'samples': 370368, 'steps': 1928, 'loss/train': 2.794508457183838} -11/06/2021 21:32:36 - INFO - __main__ - Step 1930: {'lr': 0.00048225000000000004, 'samples': 370560, 'steps': 1929, 'loss/train': 3.3702750205993652} -11/06/2021 21:32:36 - INFO - __main__ - Step 1931: {'lr': 0.0004825, 'samples': 370752, 'steps': 1930, 'loss/train': 3.3786303997039795} -11/06/2021 21:32:36 - INFO - __main__ - Step 1932: {'lr': 0.00048275, 'samples': 370944, 'steps': 1931, 'loss/train': 2.7347774505615234} -11/06/2021 21:32:37 - INFO - __main__ - Step 1933: {'lr': 0.000483, 'samples': 371136, 'steps': 1932, 'loss/train': 2.8218722343444824} -11/06/2021 21:32:38 - INFO - __main__ - Step 1934: {'lr': 0.00048325, 'samples': 371328, 'steps': 1933, 'loss/train': 1.854628324508667} -11/06/2021 21:32:38 - INFO - __main__ - Step 1935: {'lr': 0.0004835, 'samples': 371520, 'steps': 1934, 'loss/train': 2.730201244354248} -11/06/2021 21:32:38 - INFO - __main__ - Step 1936: {'lr': 0.00048375, 'samples': 371712, 'steps': 1935, 'loss/train': 2.558645725250244} -11/06/2021 21:32:39 - INFO - __main__ - Step 1937: {'lr': 0.000484, 'samples': 371904, 'steps': 1936, 'loss/train': 2.328354597091675} -11/06/2021 21:32:40 - INFO - __main__ - Step 1938: {'lr': 0.00048425000000000003, 'samples': 372096, 'steps': 1937, 'loss/train': 2.217445135116577} -11/06/2021 21:32:40 - INFO - __main__ - Step 1939: {'lr': 0.0004845, 'samples': 372288, 'steps': 1938, 'loss/train': 2.765631675720215} -11/06/2021 21:32:41 - INFO - __main__ - Step 1940: {'lr': 0.00048475000000000005, 'samples': 372480, 'steps': 1939, 'loss/train': 2.3212947845458984} -11/06/2021 21:32:41 - INFO - __main__ - Step 1941: {'lr': 0.00048499999999999997, 'samples': 372672, 'steps': 1940, 'loss/train': 2.563457727432251} -11/06/2021 21:32:41 - INFO - __main__ - Step 1942: {'lr': 0.00048525, 'samples': 372864, 'steps': 1941, 'loss/train': 2.725562334060669} -11/06/2021 21:32:42 - INFO - __main__ - Step 1943: {'lr': 0.0004855, 'samples': 373056, 'steps': 1942, 'loss/train': 2.3403518199920654} -11/06/2021 21:32:43 - INFO - __main__ - Step 1944: {'lr': 0.00048575, 'samples': 373248, 'steps': 1943, 'loss/train': 2.5952484607696533} -11/06/2021 21:32:43 - INFO - __main__ - Step 1945: {'lr': 0.000486, 'samples': 373440, 'steps': 1944, 'loss/train': 3.019125461578369} -11/06/2021 21:32:43 - INFO - __main__ - Step 1946: {'lr': 0.00048625000000000003, 'samples': 373632, 'steps': 1945, 'loss/train': 2.831516981124878} -11/06/2021 21:32:44 - INFO - __main__ - Step 1947: {'lr': 0.0004865, 'samples': 373824, 'steps': 1946, 'loss/train': 2.3622794151306152} -11/06/2021 21:32:45 - INFO - __main__ - Step 1948: {'lr': 0.00048675000000000004, 'samples': 374016, 'steps': 1947, 'loss/train': 2.709298849105835} -11/06/2021 21:32:45 - INFO - __main__ - Step 1949: {'lr': 0.000487, 'samples': 374208, 'steps': 1948, 'loss/train': 2.702164888381958} -11/06/2021 21:32:45 - INFO - __main__ - Step 1950: {'lr': 0.00048725000000000005, 'samples': 374400, 'steps': 1949, 'loss/train': 2.7699882984161377} -11/06/2021 21:32:46 - INFO - __main__ - Step 1951: {'lr': 0.0004875, 'samples': 374592, 'steps': 1950, 'loss/train': 3.081878900527954} -11/06/2021 21:32:46 - INFO - __main__ - Step 1952: {'lr': 0.00048775, 'samples': 374784, 'steps': 1951, 'loss/train': 2.322448492050171} -11/06/2021 21:32:47 - INFO - __main__ - Step 1953: {'lr': 0.000488, 'samples': 374976, 'steps': 1952, 'loss/train': 3.033129930496216} -11/06/2021 21:32:48 - INFO - __main__ - Step 1954: {'lr': 0.00048825, 'samples': 375168, 'steps': 1953, 'loss/train': 3.0832743644714355} -11/06/2021 21:32:48 - INFO - __main__ - Step 1955: {'lr': 0.0004885, 'samples': 375360, 'steps': 1954, 'loss/train': 2.644732713699341} -11/06/2021 21:32:48 - INFO - __main__ - Step 1956: {'lr': 0.00048875, 'samples': 375552, 'steps': 1955, 'loss/train': 2.585529327392578} -11/06/2021 21:32:49 - INFO - __main__ - Step 1957: {'lr': 0.000489, 'samples': 375744, 'steps': 1956, 'loss/train': 2.618997812271118} -11/06/2021 21:32:49 - INFO - __main__ - Step 1958: {'lr': 0.00048925, 'samples': 375936, 'steps': 1957, 'loss/train': 2.3187615871429443} -11/06/2021 21:32:50 - INFO - __main__ - Step 1959: {'lr': 0.0004895, 'samples': 376128, 'steps': 1958, 'loss/train': 0.9907362461090088} -11/06/2021 21:32:50 - INFO - __main__ - Step 1960: {'lr': 0.0004897500000000001, 'samples': 376320, 'steps': 1959, 'loss/train': 2.583451986312866} -11/06/2021 21:32:51 - INFO - __main__ - Step 1961: {'lr': 0.00049, 'samples': 376512, 'steps': 1960, 'loss/train': 2.766582489013672} -11/06/2021 21:32:51 - INFO - __main__ - Step 1962: {'lr': 0.00049025, 'samples': 376704, 'steps': 1961, 'loss/train': 2.8893637657165527} -11/06/2021 21:32:51 - INFO - __main__ - Step 1963: {'lr': 0.0004905, 'samples': 376896, 'steps': 1962, 'loss/train': 2.1860101222991943} -11/06/2021 21:32:53 - INFO - __main__ - Step 1964: {'lr': 0.0004907500000000001, 'samples': 377088, 'steps': 1963, 'loss/train': 2.513594150543213} -11/06/2021 21:32:53 - INFO - __main__ - Step 1965: {'lr': 0.000491, 'samples': 377280, 'steps': 1964, 'loss/train': 1.6197631359100342} -11/06/2021 21:32:53 - INFO - __main__ - Step 1966: {'lr': 0.00049125, 'samples': 377472, 'steps': 1965, 'loss/train': 2.5828354358673096} -11/06/2021 21:32:54 - INFO - __main__ - Step 1967: {'lr': 0.0004915, 'samples': 377664, 'steps': 1966, 'loss/train': 3.0170748233795166} -11/06/2021 21:32:54 - INFO - __main__ - Step 1968: {'lr': 0.00049175, 'samples': 377856, 'steps': 1967, 'loss/train': 1.9359134435653687} -11/06/2021 21:32:55 - INFO - __main__ - Step 1969: {'lr': 0.000492, 'samples': 378048, 'steps': 1968, 'loss/train': 2.57096266746521} -11/06/2021 21:32:55 - INFO - __main__ - Step 1970: {'lr': 0.0004922500000000001, 'samples': 378240, 'steps': 1969, 'loss/train': 2.656981945037842} -11/06/2021 21:32:56 - INFO - __main__ - Step 1971: {'lr': 0.0004925, 'samples': 378432, 'steps': 1970, 'loss/train': 2.5854079723358154} -11/06/2021 21:32:56 - INFO - __main__ - Step 1972: {'lr': 0.00049275, 'samples': 378624, 'steps': 1971, 'loss/train': 2.834716796875} -11/06/2021 21:32:56 - INFO - __main__ - Step 1973: {'lr': 0.0004930000000000001, 'samples': 378816, 'steps': 1972, 'loss/train': 2.5970420837402344} -11/06/2021 21:32:57 - INFO - __main__ - Step 1974: {'lr': 0.00049325, 'samples': 379008, 'steps': 1973, 'loss/train': 2.524550676345825} -11/06/2021 21:32:58 - INFO - __main__ - Step 1975: {'lr': 0.0004935, 'samples': 379200, 'steps': 1974, 'loss/train': 2.7941884994506836} -11/06/2021 21:32:58 - INFO - __main__ - Step 1976: {'lr': 0.00049375, 'samples': 379392, 'steps': 1975, 'loss/train': 2.233511447906494} -11/06/2021 21:32:58 - INFO - __main__ - Step 1977: {'lr': 0.000494, 'samples': 379584, 'steps': 1976, 'loss/train': 2.7673490047454834} -11/06/2021 21:32:59 - INFO - __main__ - Step 1978: {'lr': 0.00049425, 'samples': 379776, 'steps': 1977, 'loss/train': 2.7276995182037354} -11/06/2021 21:32:59 - INFO - __main__ - Step 1979: {'lr': 0.0004945, 'samples': 379968, 'steps': 1978, 'loss/train': 3.163912534713745} -11/06/2021 21:33:00 - INFO - __main__ - Step 1980: {'lr': 0.0004947500000000001, 'samples': 380160, 'steps': 1979, 'loss/train': 2.734490394592285} -11/06/2021 21:33:00 - INFO - __main__ - Step 1981: {'lr': 0.000495, 'samples': 380352, 'steps': 1980, 'loss/train': 2.695145845413208} -11/06/2021 21:33:01 - INFO - __main__ - Step 1982: {'lr': 0.00049525, 'samples': 380544, 'steps': 1981, 'loss/train': 2.7770211696624756} -11/06/2021 21:33:01 - INFO - __main__ - Step 1983: {'lr': 0.0004955, 'samples': 380736, 'steps': 1982, 'loss/train': 2.7686867713928223} -11/06/2021 21:33:02 - INFO - __main__ - Step 1984: {'lr': 0.00049575, 'samples': 380928, 'steps': 1983, 'loss/train': 2.8708817958831787} -11/06/2021 21:33:03 - INFO - __main__ - Step 1985: {'lr': 0.000496, 'samples': 381120, 'steps': 1984, 'loss/train': 2.6449930667877197} -11/06/2021 21:33:03 - INFO - __main__ - Step 1986: {'lr': 0.0004962500000000001, 'samples': 381312, 'steps': 1985, 'loss/train': 2.249175786972046} -11/06/2021 21:33:03 - INFO - __main__ - Step 1987: {'lr': 0.0004965, 'samples': 381504, 'steps': 1986, 'loss/train': 2.399980068206787} -11/06/2021 21:33:04 - INFO - __main__ - Step 1988: {'lr': 0.00049675, 'samples': 381696, 'steps': 1987, 'loss/train': 2.932748556137085} -11/06/2021 21:33:04 - INFO - __main__ - Step 1989: {'lr': 0.000497, 'samples': 381888, 'steps': 1988, 'loss/train': 2.3569090366363525} -11/06/2021 21:33:05 - INFO - __main__ - Step 1990: {'lr': 0.0004972500000000001, 'samples': 382080, 'steps': 1989, 'loss/train': 2.4476397037506104} -11/06/2021 21:33:05 - INFO - __main__ - Step 1991: {'lr': 0.0004975, 'samples': 382272, 'steps': 1990, 'loss/train': 3.7033238410949707} -11/06/2021 21:33:06 - INFO - __main__ - Step 1992: {'lr': 0.00049775, 'samples': 382464, 'steps': 1991, 'loss/train': 2.872666835784912} -11/06/2021 21:33:06 - INFO - __main__ - Step 1993: {'lr': 0.000498, 'samples': 382656, 'steps': 1992, 'loss/train': 2.463730573654175} -11/06/2021 21:33:06 - INFO - __main__ - Step 1994: {'lr': 0.00049825, 'samples': 382848, 'steps': 1993, 'loss/train': 2.2862772941589355} -11/06/2021 21:33:07 - INFO - __main__ - Step 1995: {'lr': 0.0004985, 'samples': 383040, 'steps': 1994, 'loss/train': 2.9158213138580322} -11/06/2021 21:33:08 - INFO - __main__ - Step 1996: {'lr': 0.0004987500000000001, 'samples': 383232, 'steps': 1995, 'loss/train': 2.440356731414795} -11/06/2021 21:33:08 - INFO - __main__ - Step 1997: {'lr': 0.000499, 'samples': 383424, 'steps': 1996, 'loss/train': 2.8165547847747803} -11/06/2021 21:33:08 - INFO - __main__ - Step 1998: {'lr': 0.00049925, 'samples': 383616, 'steps': 1997, 'loss/train': 2.460160970687866} -11/06/2021 21:33:09 - INFO - __main__ - Step 1999: {'lr': 0.0004995, 'samples': 383808, 'steps': 1998, 'loss/train': 2.8963072299957275} -11/06/2021 21:33:10 - INFO - __main__ - Step 2000: {'lr': 0.0004997500000000001, 'samples': 384000, 'steps': 1999, 'loss/train': 2.667146921157837} -11/06/2021 21:33:10 - INFO - __main__ - Step 2001: {'lr': 0.0005, 'samples': 384192, 'steps': 2000, 'loss/train': 1.9915542602539062} -11/06/2021 21:33:10 - INFO - __main__ - Step 2002: {'lr': 0.0004999999999436769, 'samples': 384384, 'steps': 2001, 'loss/train': 2.369316816329956} -11/06/2021 21:33:11 - INFO - __main__ - Step 2003: {'lr': 0.0004999999997747077, 'samples': 384576, 'steps': 2002, 'loss/train': 2.117219924926758} -11/06/2021 21:33:11 - INFO - __main__ - Step 2004: {'lr': 0.0004999999994930923, 'samples': 384768, 'steps': 2003, 'loss/train': 3.217236280441284} -11/06/2021 21:33:12 - INFO - __main__ - Step 2005: {'lr': 0.0004999999990988309, 'samples': 384960, 'steps': 2004, 'loss/train': 2.4494330883026123} -11/06/2021 21:33:13 - INFO - __main__ - Step 2006: {'lr': 0.0004999999985919232, 'samples': 385152, 'steps': 2005, 'loss/train': 2.7397634983062744} -11/06/2021 21:33:13 - INFO - __main__ - Step 2007: {'lr': 0.0004999999979723695, 'samples': 385344, 'steps': 2006, 'loss/train': 1.72874915599823} -11/06/2021 21:33:13 - INFO - __main__ - Step 2008: {'lr': 0.0004999999972401696, 'samples': 385536, 'steps': 2007, 'loss/train': 2.854842185974121} -11/06/2021 21:33:14 - INFO - __main__ - Step 2009: {'lr': 0.0004999999963953234, 'samples': 385728, 'steps': 2008, 'loss/train': 2.8656506538391113} -11/06/2021 21:33:14 - INFO - __main__ - Step 2010: {'lr': 0.0004999999954378312, 'samples': 385920, 'steps': 2009, 'loss/train': 2.108156681060791} -11/06/2021 21:33:15 - INFO - __main__ - Step 2011: {'lr': 0.000499999994367693, 'samples': 386112, 'steps': 2010, 'loss/train': 2.626335382461548} -11/06/2021 21:33:15 - INFO - __main__ - Step 2012: {'lr': 0.0004999999931849084, 'samples': 386304, 'steps': 2011, 'loss/train': 2.684321403503418} -11/06/2021 21:33:16 - INFO - __main__ - Step 2013: {'lr': 0.0004999999918894778, 'samples': 386496, 'steps': 2012, 'loss/train': 2.6967201232910156} -11/06/2021 21:33:16 - INFO - __main__ - Step 2014: {'lr': 0.000499999990481401, 'samples': 386688, 'steps': 2013, 'loss/train': 2.6608567237854004} -11/06/2021 21:33:16 - INFO - __main__ - Step 2015: {'lr': 0.0004999999889606781, 'samples': 386880, 'steps': 2014, 'loss/train': 2.773587942123413} -11/06/2021 21:33:17 - INFO - __main__ - Step 2016: {'lr': 0.0004999999873273091, 'samples': 387072, 'steps': 2015, 'loss/train': 2.5396175384521484} -11/06/2021 21:33:18 - INFO - __main__ - Step 2017: {'lr': 0.000499999985581294, 'samples': 387264, 'steps': 2016, 'loss/train': 2.9286653995513916} -11/06/2021 21:33:18 - INFO - __main__ - Step 2018: {'lr': 0.0004999999837226326, 'samples': 387456, 'steps': 2017, 'loss/train': 2.4174294471740723} -11/06/2021 21:33:18 - INFO - __main__ - Step 2019: {'lr': 0.0004999999817513252, 'samples': 387648, 'steps': 2018, 'loss/train': 2.4650332927703857} -11/06/2021 21:33:19 - INFO - __main__ - Step 2020: {'lr': 0.0004999999796673716, 'samples': 387840, 'steps': 2019, 'loss/train': 2.799029588699341} -11/06/2021 21:33:20 - INFO - __main__ - Step 2021: {'lr': 0.0004999999774707719, 'samples': 388032, 'steps': 2020, 'loss/train': 2.8545684814453125} -11/06/2021 21:33:20 - INFO - __main__ - Step 2022: {'lr': 0.0004999999751615261, 'samples': 388224, 'steps': 2021, 'loss/train': 2.4763200283050537} -11/06/2021 21:33:20 - INFO - __main__ - Step 2023: {'lr': 0.0004999999727396341, 'samples': 388416, 'steps': 2022, 'loss/train': 2.094083309173584} -11/06/2021 21:33:21 - INFO - __main__ - Step 2024: {'lr': 0.0004999999702050959, 'samples': 388608, 'steps': 2023, 'loss/train': 2.4490573406219482} -11/06/2021 21:33:21 - INFO - __main__ - Step 2025: {'lr': 0.0004999999675579118, 'samples': 388800, 'steps': 2024, 'loss/train': 3.2666213512420654} -11/06/2021 21:33:22 - INFO - __main__ - Step 2026: {'lr': 0.0004999999647980814, 'samples': 388992, 'steps': 2025, 'loss/train': 2.2224512100219727} -11/06/2021 21:33:23 - INFO - __main__ - Step 2027: {'lr': 0.0004999999619256049, 'samples': 389184, 'steps': 2026, 'loss/train': 3.0559303760528564} -11/06/2021 21:33:23 - INFO - __main__ - Step 2028: {'lr': 0.0004999999589404822, 'samples': 389376, 'steps': 2027, 'loss/train': 2.4753761291503906} -11/06/2021 21:33:23 - INFO - __main__ - Step 2029: {'lr': 0.0004999999558427136, 'samples': 389568, 'steps': 2028, 'loss/train': 2.350665807723999} -11/06/2021 21:33:24 - INFO - __main__ - Step 2030: {'lr': 0.0004999999526322987, 'samples': 389760, 'steps': 2029, 'loss/train': 2.9428741931915283} -11/06/2021 21:33:24 - INFO - __main__ - Step 2031: {'lr': 0.0004999999493092377, 'samples': 389952, 'steps': 2030, 'loss/train': 2.561460018157959} -11/06/2021 21:33:25 - INFO - __main__ - Step 2032: {'lr': 0.0004999999458735306, 'samples': 390144, 'steps': 2031, 'loss/train': 2.2386529445648193} -11/06/2021 21:33:26 - INFO - __main__ - Step 2033: {'lr': 0.0004999999423251774, 'samples': 390336, 'steps': 2032, 'loss/train': 2.3020198345184326} -11/06/2021 21:33:26 - INFO - __main__ - Step 2034: {'lr': 0.0004999999386641781, 'samples': 390528, 'steps': 2033, 'loss/train': 2.7840397357940674} -11/06/2021 21:33:26 - INFO - __main__ - Step 2035: {'lr': 0.0004999999348905326, 'samples': 390720, 'steps': 2034, 'loss/train': 2.2460341453552246} -11/06/2021 21:33:27 - INFO - __main__ - Step 2036: {'lr': 0.000499999931004241, 'samples': 390912, 'steps': 2035, 'loss/train': 2.3942503929138184} -11/06/2021 21:33:28 - INFO - __main__ - Step 2037: {'lr': 0.0004999999270053034, 'samples': 391104, 'steps': 2036, 'loss/train': 3.297150135040283} -11/06/2021 21:33:28 - INFO - __main__ - Step 2038: {'lr': 0.0004999999228937196, 'samples': 391296, 'steps': 2037, 'loss/train': 2.8241195678710938} -11/06/2021 21:33:28 - INFO - __main__ - Step 2039: {'lr': 0.0004999999186694897, 'samples': 391488, 'steps': 2038, 'loss/train': 2.7766733169555664} -11/06/2021 21:33:29 - INFO - __main__ - Step 2040: {'lr': 0.0004999999143326137, 'samples': 391680, 'steps': 2039, 'loss/train': 2.7513749599456787} -11/06/2021 21:33:29 - INFO - __main__ - Step 2041: {'lr': 0.0004999999098830916, 'samples': 391872, 'steps': 2040, 'loss/train': 2.4639899730682373} -11/06/2021 21:33:30 - INFO - __main__ - Step 2042: {'lr': 0.0004999999053209235, 'samples': 392064, 'steps': 2041, 'loss/train': 2.83908748626709} -11/06/2021 21:33:30 - INFO - __main__ - Step 2043: {'lr': 0.0004999999006461091, 'samples': 392256, 'steps': 2042, 'loss/train': 2.7250239849090576} -11/06/2021 21:33:31 - INFO - __main__ - Step 2044: {'lr': 0.0004999998958586487, 'samples': 392448, 'steps': 2043, 'loss/train': 2.2710461616516113} -11/06/2021 21:33:31 - INFO - __main__ - Step 2045: {'lr': 0.0004999998909585423, 'samples': 392640, 'steps': 2044, 'loss/train': 2.9703567028045654} -11/06/2021 21:33:31 - INFO - __main__ - Step 2046: {'lr': 0.0004999998859457896, 'samples': 392832, 'steps': 2045, 'loss/train': 1.9827837944030762} -11/06/2021 21:33:33 - INFO - __main__ - Step 2047: {'lr': 0.0004999998808203909, 'samples': 393024, 'steps': 2046, 'loss/train': 2.4545347690582275} -11/06/2021 21:33:33 - INFO - __main__ - Step 2048: {'lr': 0.0004999998755823462, 'samples': 393216, 'steps': 2047, 'loss/train': 2.7062439918518066} -11/06/2021 21:33:33 - INFO - __main__ - Step 2049: {'lr': 0.0004999998702316553, 'samples': 393408, 'steps': 2048, 'loss/train': 2.6722590923309326} -11/06/2021 21:33:34 - INFO - __main__ - Step 2050: {'lr': 0.0004999998647683184, 'samples': 393600, 'steps': 2049, 'loss/train': 2.4513065814971924} -11/06/2021 21:33:34 - INFO - __main__ - Step 2051: {'lr': 0.0004999998591923353, 'samples': 393792, 'steps': 2050, 'loss/train': 2.691094398498535} -11/06/2021 21:33:34 - INFO - __main__ - Step 2052: {'lr': 0.0004999998535037063, 'samples': 393984, 'steps': 2051, 'loss/train': 2.209742307662964} -11/06/2021 21:33:35 - INFO - __main__ - Step 2053: {'lr': 0.0004999998477024311, 'samples': 394176, 'steps': 2052, 'loss/train': 2.50882887840271} -11/06/2021 21:33:36 - INFO - __main__ - Step 2054: {'lr': 0.0004999998417885099, 'samples': 394368, 'steps': 2053, 'loss/train': 2.435020685195923} -11/06/2021 21:33:36 - INFO - __main__ - Step 2055: {'lr': 0.0004999998357619425, 'samples': 394560, 'steps': 2054, 'loss/train': 2.0775961875915527} -11/06/2021 21:33:36 - INFO - __main__ - Step 2056: {'lr': 0.0004999998296227291, 'samples': 394752, 'steps': 2055, 'loss/train': 2.863607168197632} -11/06/2021 21:33:37 - INFO - __main__ - Step 2057: {'lr': 0.0004999998233708697, 'samples': 394944, 'steps': 2056, 'loss/train': 2.371857166290283} -11/06/2021 21:33:38 - INFO - __main__ - Step 2058: {'lr': 0.0004999998170063642, 'samples': 395136, 'steps': 2057, 'loss/train': 2.9623489379882812} -11/06/2021 21:33:38 - INFO - __main__ - Step 2059: {'lr': 0.0004999998105292126, 'samples': 395328, 'steps': 2058, 'loss/train': 2.637700319290161} -11/06/2021 21:33:39 - INFO - __main__ - Step 2060: {'lr': 0.000499999803939415, 'samples': 395520, 'steps': 2059, 'loss/train': 2.8465237617492676} -11/06/2021 21:33:39 - INFO - __main__ - Step 2061: {'lr': 0.0004999997972369713, 'samples': 395712, 'steps': 2060, 'loss/train': 2.0144639015197754} -11/06/2021 21:33:39 - INFO - __main__ - Step 2062: {'lr': 0.0004999997904218816, 'samples': 395904, 'steps': 2061, 'loss/train': 2.385756254196167} -11/06/2021 21:33:40 - INFO - __main__ - Step 2063: {'lr': 0.0004999997834941459, 'samples': 396096, 'steps': 2062, 'loss/train': 3.102501153945923} -11/06/2021 21:33:41 - INFO - __main__ - Step 2064: {'lr': 0.000499999776453764, 'samples': 396288, 'steps': 2063, 'loss/train': 1.95815908908844} -11/06/2021 21:33:41 - INFO - __main__ - Step 2065: {'lr': 0.0004999997693007361, 'samples': 396480, 'steps': 2064, 'loss/train': 2.9032347202301025} -11/06/2021 21:33:41 - INFO - __main__ - Step 2066: {'lr': 0.0004999997620350622, 'samples': 396672, 'steps': 2065, 'loss/train': 2.321173906326294} -11/06/2021 21:33:42 - INFO - __main__ - Step 2067: {'lr': 0.0004999997546567423, 'samples': 396864, 'steps': 2066, 'loss/train': 2.925659418106079} -11/06/2021 21:33:42 - INFO - __main__ - Step 2068: {'lr': 0.0004999997471657763, 'samples': 397056, 'steps': 2067, 'loss/train': 2.795663356781006} -11/06/2021 21:33:43 - INFO - __main__ - Step 2069: {'lr': 0.0004999997395621642, 'samples': 397248, 'steps': 2068, 'loss/train': 2.198864698410034} -11/06/2021 21:33:43 - INFO - __main__ - Step 2070: {'lr': 0.0004999997318459064, 'samples': 397440, 'steps': 2069, 'loss/train': 2.6380443572998047} -11/06/2021 21:33:44 - INFO - __main__ - Step 2071: {'lr': 0.0004999997240170023, 'samples': 397632, 'steps': 2070, 'loss/train': 1.3615984916687012} -11/06/2021 21:33:44 - INFO - __main__ - Step 2072: {'lr': 0.0004999997160754522, 'samples': 397824, 'steps': 2071, 'loss/train': 2.0112996101379395} -11/06/2021 21:33:45 - INFO - __main__ - Step 2073: {'lr': 0.0004999997080212561, 'samples': 398016, 'steps': 2072, 'loss/train': 2.477386236190796} -11/06/2021 21:33:46 - INFO - __main__ - Step 2074: {'lr': 0.000499999699854414, 'samples': 398208, 'steps': 2073, 'loss/train': 3.2133283615112305} -11/06/2021 21:33:46 - INFO - __main__ - Step 2075: {'lr': 0.0004999996915749259, 'samples': 398400, 'steps': 2074, 'loss/train': 2.5600574016571045} -11/06/2021 21:33:46 - INFO - __main__ - Step 2076: {'lr': 0.0004999996831827918, 'samples': 398592, 'steps': 2075, 'loss/train': 2.0490965843200684} -11/06/2021 21:33:47 - INFO - __main__ - Step 2077: {'lr': 0.0004999996746780117, 'samples': 398784, 'steps': 2076, 'loss/train': 2.4900460243225098} -11/06/2021 21:33:47 - INFO - __main__ - Step 2078: {'lr': 0.0004999996660605856, 'samples': 398976, 'steps': 2077, 'loss/train': 2.7026772499084473} -11/06/2021 21:33:47 - INFO - __main__ - Step 2079: {'lr': 0.0004999996573305135, 'samples': 399168, 'steps': 2078, 'loss/train': 1.7970755100250244} -11/06/2021 21:33:48 - INFO - __main__ - Step 2080: {'lr': 0.0004999996484877955, 'samples': 399360, 'steps': 2079, 'loss/train': 2.834831953048706} -11/06/2021 21:33:49 - INFO - __main__ - Step 2081: {'lr': 0.0004999996395324313, 'samples': 399552, 'steps': 2080, 'loss/train': 2.1271467208862305} -11/06/2021 21:33:49 - INFO - __main__ - Step 2082: {'lr': 0.0004999996304644213, 'samples': 399744, 'steps': 2081, 'loss/train': 2.7261979579925537} -11/06/2021 21:33:49 - INFO - __main__ - Step 2083: {'lr': 0.0004999996212837653, 'samples': 399936, 'steps': 2082, 'loss/train': 2.50911021232605} -11/06/2021 21:33:50 - INFO - __main__ - Step 2084: {'lr': 0.0004999996119904633, 'samples': 400128, 'steps': 2083, 'loss/train': 2.5453062057495117} -11/06/2021 21:33:51 - INFO - __main__ - Step 2085: {'lr': 0.0004999996025845154, 'samples': 400320, 'steps': 2084, 'loss/train': 2.562901496887207} -11/06/2021 21:33:51 - INFO - __main__ - Step 2086: {'lr': 0.0004999995930659215, 'samples': 400512, 'steps': 2085, 'loss/train': 2.8472900390625} -11/06/2021 21:33:51 - INFO - __main__ - Step 2087: {'lr': 0.0004999995834346815, 'samples': 400704, 'steps': 2086, 'loss/train': 2.197766065597534} -11/06/2021 21:33:52 - INFO - __main__ - Step 2088: {'lr': 0.0004999995736907957, 'samples': 400896, 'steps': 2087, 'loss/train': 2.4093174934387207} -11/06/2021 21:33:52 - INFO - __main__ - Step 2089: {'lr': 0.000499999563834264, 'samples': 401088, 'steps': 2088, 'loss/train': 2.8441734313964844} -11/06/2021 21:33:53 - INFO - __main__ - Step 2090: {'lr': 0.0004999995538650862, 'samples': 401280, 'steps': 2089, 'loss/train': 2.863389492034912} -11/06/2021 21:33:53 - INFO - __main__ - Step 2091: {'lr': 0.0004999995437832626, 'samples': 401472, 'steps': 2090, 'loss/train': 2.4036967754364014} -11/06/2021 21:33:54 - INFO - __main__ - Step 2092: {'lr': 0.0004999995335887929, 'samples': 401664, 'steps': 2091, 'loss/train': 2.5592567920684814} -11/06/2021 21:33:54 - INFO - __main__ - Step 2093: {'lr': 0.0004999995232816774, 'samples': 401856, 'steps': 2092, 'loss/train': 2.0404558181762695} -11/06/2021 21:33:54 - INFO - __main__ - Step 2094: {'lr': 0.000499999512861916, 'samples': 402048, 'steps': 2093, 'loss/train': 2.452481985092163} -11/06/2021 21:33:56 - INFO - __main__ - Step 2095: {'lr': 0.0004999995023295086, 'samples': 402240, 'steps': 2094, 'loss/train': 2.8676137924194336} -11/06/2021 21:33:56 - INFO - __main__ - Step 2096: {'lr': 0.0004999994916844552, 'samples': 402432, 'steps': 2095, 'loss/train': 2.586151599884033} -11/06/2021 21:33:56 - INFO - __main__ - Step 2097: {'lr': 0.0004999994809267561, 'samples': 402624, 'steps': 2096, 'loss/train': 2.180725574493408} -11/06/2021 21:33:57 - INFO - __main__ - Step 2098: {'lr': 0.0004999994700564109, 'samples': 402816, 'steps': 2097, 'loss/train': 2.6748390197753906} -11/06/2021 21:33:57 - INFO - __main__ - Step 2099: {'lr': 0.0004999994590734199, 'samples': 403008, 'steps': 2098, 'loss/train': 2.2900843620300293} -11/06/2021 21:33:58 - INFO - __main__ - Step 2100: {'lr': 0.000499999447977783, 'samples': 403200, 'steps': 2099, 'loss/train': 2.7498953342437744} -11/06/2021 21:33:58 - INFO - __main__ - Step 2101: {'lr': 0.0004999994367695001, 'samples': 403392, 'steps': 2100, 'loss/train': 2.9146597385406494} -11/06/2021 21:33:59 - INFO - __main__ - Step 2102: {'lr': 0.0004999994254485714, 'samples': 403584, 'steps': 2101, 'loss/train': 2.650158166885376} -11/06/2021 21:33:59 - INFO - __main__ - Step 2103: {'lr': 0.0004999994140149969, 'samples': 403776, 'steps': 2102, 'loss/train': 2.6396777629852295} -11/06/2021 21:33:59 - INFO - __main__ - Step 2104: {'lr': 0.0004999994024687764, 'samples': 403968, 'steps': 2103, 'loss/train': 2.664414644241333} -11/06/2021 21:34:00 - INFO - __main__ - Step 2105: {'lr': 0.00049999939080991, 'samples': 404160, 'steps': 2104, 'loss/train': 1.7636381387710571} -11/06/2021 21:34:01 - INFO - __main__ - Step 2106: {'lr': 0.0004999993790383978, 'samples': 404352, 'steps': 2105, 'loss/train': 2.3601715564727783} -11/06/2021 21:34:01 - INFO - __main__ - Step 2107: {'lr': 0.0004999993671542397, 'samples': 404544, 'steps': 2106, 'loss/train': 1.9566963911056519} -11/06/2021 21:34:01 - INFO - __main__ - Step 2108: {'lr': 0.0004999993551574358, 'samples': 404736, 'steps': 2107, 'loss/train': 1.9892882108688354} -11/06/2021 21:34:02 - INFO - __main__ - Step 2109: {'lr': 0.000499999343047986, 'samples': 404928, 'steps': 2108, 'loss/train': 2.693075180053711} -11/06/2021 21:34:02 - INFO - __main__ - Step 2110: {'lr': 0.0004999993308258904, 'samples': 405120, 'steps': 2109, 'loss/train': 2.1097216606140137} -11/06/2021 21:34:03 - INFO - __main__ - Step 2111: {'lr': 0.0004999993184911489, 'samples': 405312, 'steps': 2110, 'loss/train': 2.149388074874878} -11/06/2021 21:34:04 - INFO - __main__ - Step 2112: {'lr': 0.0004999993060437616, 'samples': 405504, 'steps': 2111, 'loss/train': 1.7287077903747559} -11/06/2021 21:34:04 - INFO - __main__ - Step 2113: {'lr': 0.0004999992934837284, 'samples': 405696, 'steps': 2112, 'loss/train': 2.66508150100708} -11/06/2021 21:34:04 - INFO - __main__ - Step 2114: {'lr': 0.0004999992808110495, 'samples': 405888, 'steps': 2113, 'loss/train': 2.4178295135498047} -11/06/2021 21:34:05 - INFO - __main__ - Step 2115: {'lr': 0.0004999992680257247, 'samples': 406080, 'steps': 2114, 'loss/train': 2.6689789295196533} -11/06/2021 21:34:06 - INFO - __main__ - Step 2116: {'lr': 0.0004999992551277541, 'samples': 406272, 'steps': 2115, 'loss/train': 2.902282953262329} -11/06/2021 21:34:06 - INFO - __main__ - Step 2117: {'lr': 0.0004999992421171377, 'samples': 406464, 'steps': 2116, 'loss/train': 2.81160306930542} -11/06/2021 21:34:06 - INFO - __main__ - Step 2118: {'lr': 0.0004999992289938755, 'samples': 406656, 'steps': 2117, 'loss/train': 2.694124698638916} -11/06/2021 21:34:07 - INFO - __main__ - Step 2119: {'lr': 0.0004999992157579676, 'samples': 406848, 'steps': 2118, 'loss/train': 3.20439076423645} -11/06/2021 21:34:07 - INFO - __main__ - Step 2120: {'lr': 0.0004999992024094138, 'samples': 407040, 'steps': 2119, 'loss/train': 2.9919791221618652} -11/06/2021 21:34:08 - INFO - __main__ - Step 2121: {'lr': 0.0004999991889482142, 'samples': 407232, 'steps': 2120, 'loss/train': 2.432868003845215} -11/06/2021 21:34:08 - INFO - __main__ - Step 2122: {'lr': 0.0004999991753743689, 'samples': 407424, 'steps': 2121, 'loss/train': 2.5452983379364014} -11/06/2021 21:34:09 - INFO - __main__ - Step 2123: {'lr': 0.0004999991616878777, 'samples': 407616, 'steps': 2122, 'loss/train': 2.8512609004974365} -11/06/2021 21:34:09 - INFO - __main__ - Step 2124: {'lr': 0.0004999991478887409, 'samples': 407808, 'steps': 2123, 'loss/train': 2.363013505935669} -11/06/2021 21:34:09 - INFO - __main__ - Step 2125: {'lr': 0.0004999991339769582, 'samples': 408000, 'steps': 2124, 'loss/train': 2.3409323692321777} -11/06/2021 21:34:10 - INFO - __main__ - Step 2126: {'lr': 0.0004999991199525299, 'samples': 408192, 'steps': 2125, 'loss/train': 2.357633113861084} -11/06/2021 21:34:11 - INFO - __main__ - Step 2127: {'lr': 0.0004999991058154557, 'samples': 408384, 'steps': 2126, 'loss/train': 2.454667091369629} -11/06/2021 21:34:11 - INFO - __main__ - Step 2128: {'lr': 0.0004999990915657359, 'samples': 408576, 'steps': 2127, 'loss/train': 1.9439713954925537} -11/06/2021 21:34:11 - INFO - __main__ - Step 2129: {'lr': 0.0004999990772033702, 'samples': 408768, 'steps': 2128, 'loss/train': 2.639913320541382} -11/06/2021 21:34:12 - INFO - __main__ - Step 2130: {'lr': 0.000499999062728359, 'samples': 408960, 'steps': 2129, 'loss/train': 2.727692127227783} -11/06/2021 21:34:12 - INFO - __main__ - Step 2131: {'lr': 0.0004999990481407018, 'samples': 409152, 'steps': 2130, 'loss/train': 2.4127743244171143} -11/06/2021 21:34:13 - INFO - __main__ - Step 2132: {'lr': 0.0004999990334403991, 'samples': 409344, 'steps': 2131, 'loss/train': 2.539153575897217} -11/06/2021 21:34:14 - INFO - __main__ - Step 2133: {'lr': 0.0004999990186274506, 'samples': 409536, 'steps': 2132, 'loss/train': 2.580580949783325} -11/06/2021 21:34:14 - INFO - __main__ - Step 2134: {'lr': 0.0004999990037018564, 'samples': 409728, 'steps': 2133, 'loss/train': 2.830368757247925} -11/06/2021 21:34:14 - INFO - __main__ - Step 2135: {'lr': 0.0004999989886636166, 'samples': 409920, 'steps': 2134, 'loss/train': 2.996830463409424} -11/06/2021 21:34:15 - INFO - __main__ - Step 2136: {'lr': 0.000499998973512731, 'samples': 410112, 'steps': 2135, 'loss/train': 2.449648141860962} -11/06/2021 21:34:16 - INFO - __main__ - Step 2137: {'lr': 0.0004999989582491998, 'samples': 410304, 'steps': 2136, 'loss/train': 2.1310882568359375} -11/06/2021 21:34:16 - INFO - __main__ - Step 2138: {'lr': 0.0004999989428730229, 'samples': 410496, 'steps': 2137, 'loss/train': 2.7264044284820557} -11/06/2021 21:34:17 - INFO - __main__ - Step 2139: {'lr': 0.0004999989273842003, 'samples': 410688, 'steps': 2138, 'loss/train': 2.348263740539551} -11/06/2021 21:34:17 - INFO - __main__ - Step 2140: {'lr': 0.0004999989117827321, 'samples': 410880, 'steps': 2139, 'loss/train': 2.6819005012512207} -11/06/2021 21:34:17 - INFO - __main__ - Step 2141: {'lr': 0.0004999988960686182, 'samples': 411072, 'steps': 2140, 'loss/train': 1.7351843118667603} -11/06/2021 21:34:18 - INFO - __main__ - Step 2142: {'lr': 0.0004999988802418587, 'samples': 411264, 'steps': 2141, 'loss/train': 2.5951883792877197} -11/06/2021 21:34:19 - INFO - __main__ - Step 2143: {'lr': 0.0004999988643024536, 'samples': 411456, 'steps': 2142, 'loss/train': 2.5091636180877686} -11/06/2021 21:34:19 - INFO - __main__ - Step 2144: {'lr': 0.0004999988482504027, 'samples': 411648, 'steps': 2143, 'loss/train': 2.721625804901123} -11/06/2021 21:34:19 - INFO - __main__ - Step 2145: {'lr': 0.0004999988320857063, 'samples': 411840, 'steps': 2144, 'loss/train': 2.778151750564575} -11/06/2021 21:34:20 - INFO - __main__ - Step 2146: {'lr': 0.0004999988158083643, 'samples': 412032, 'steps': 2145, 'loss/train': 2.607226848602295} -11/06/2021 21:34:20 - INFO - __main__ - Step 2147: {'lr': 0.0004999987994183766, 'samples': 412224, 'steps': 2146, 'loss/train': 2.325345277786255} -11/06/2021 21:34:21 - INFO - __main__ - Step 2148: {'lr': 0.0004999987829157434, 'samples': 412416, 'steps': 2147, 'loss/train': 2.363879442214966} -11/06/2021 21:34:21 - INFO - __main__ - Step 2149: {'lr': 0.0004999987663004646, 'samples': 412608, 'steps': 2148, 'loss/train': 2.3791654109954834} -11/06/2021 21:34:22 - INFO - __main__ - Step 2150: {'lr': 0.0004999987495725401, 'samples': 412800, 'steps': 2149, 'loss/train': 1.6959710121154785} -11/06/2021 21:34:22 - INFO - __main__ - Step 2151: {'lr': 0.0004999987327319701, 'samples': 412992, 'steps': 2150, 'loss/train': 2.9837472438812256} -11/06/2021 21:34:22 - INFO - __main__ - Step 2152: {'lr': 0.0004999987157787546, 'samples': 413184, 'steps': 2151, 'loss/train': 2.8918848037719727} -11/06/2021 21:34:24 - INFO - __main__ - Step 2153: {'lr': 0.0004999986987128934, 'samples': 413376, 'steps': 2152, 'loss/train': 2.0959744453430176} -11/06/2021 21:34:24 - INFO - __main__ - Step 2154: {'lr': 0.0004999986815343867, 'samples': 413568, 'steps': 2153, 'loss/train': 2.464357614517212} -11/06/2021 21:34:24 - INFO - __main__ - Step 2155: {'lr': 0.0004999986642432345, 'samples': 413760, 'steps': 2154, 'loss/train': 2.6230199337005615} -11/06/2021 21:34:25 - INFO - __main__ - Step 2156: {'lr': 0.0004999986468394367, 'samples': 413952, 'steps': 2155, 'loss/train': 2.50052547454834} -11/06/2021 21:34:25 - INFO - __main__ - Step 2157: {'lr': 0.0004999986293229934, 'samples': 414144, 'steps': 2156, 'loss/train': 2.743523359298706} -11/06/2021 21:34:26 - INFO - __main__ - Step 2158: {'lr': 0.0004999986116939045, 'samples': 414336, 'steps': 2157, 'loss/train': 2.9330990314483643} -11/06/2021 21:34:26 - INFO - __main__ - Step 2159: {'lr': 0.0004999985939521702, 'samples': 414528, 'steps': 2158, 'loss/train': 3.325244426727295} -11/06/2021 21:34:27 - INFO - __main__ - Step 2160: {'lr': 0.0004999985760977903, 'samples': 414720, 'steps': 2159, 'loss/train': 2.2128641605377197} -11/06/2021 21:34:27 - INFO - __main__ - Step 2161: {'lr': 0.000499998558130765, 'samples': 414912, 'steps': 2160, 'loss/train': 2.9361557960510254} -11/06/2021 21:34:27 - INFO - __main__ - Step 2162: {'lr': 0.0004999985400510941, 'samples': 415104, 'steps': 2161, 'loss/train': 2.5086746215820312} -11/06/2021 21:34:28 - INFO - __main__ - Step 2163: {'lr': 0.0004999985218587777, 'samples': 415296, 'steps': 2162, 'loss/train': 1.6962592601776123} -11/06/2021 21:34:29 - INFO - __main__ - Step 2164: {'lr': 0.0004999985035538159, 'samples': 415488, 'steps': 2163, 'loss/train': 2.615097761154175} -11/06/2021 21:34:29 - INFO - __main__ - Step 2165: {'lr': 0.0004999984851362086, 'samples': 415680, 'steps': 2164, 'loss/train': 2.722036600112915} -11/06/2021 21:34:29 - INFO - __main__ - Step 2166: {'lr': 0.0004999984666059559, 'samples': 415872, 'steps': 2165, 'loss/train': 2.560600996017456} -11/06/2021 21:34:30 - INFO - __main__ - Step 2167: {'lr': 0.0004999984479630577, 'samples': 416064, 'steps': 2166, 'loss/train': 2.6970345973968506} -11/06/2021 21:34:30 - INFO - __main__ - Step 2168: {'lr': 0.000499998429207514, 'samples': 416256, 'steps': 2167, 'loss/train': 2.9107210636138916} -11/06/2021 21:34:31 - INFO - __main__ - Step 2169: {'lr': 0.000499998410339325, 'samples': 416448, 'steps': 2168, 'loss/train': 2.580718994140625} -11/06/2021 21:34:32 - INFO - __main__ - Step 2170: {'lr': 0.0004999983913584904, 'samples': 416640, 'steps': 2169, 'loss/train': 2.8567304611206055} -11/06/2021 21:34:32 - INFO - __main__ - Step 2171: {'lr': 0.0004999983722650106, 'samples': 416832, 'steps': 2170, 'loss/train': 2.371682643890381} -11/06/2021 21:34:32 - INFO - __main__ - Step 2172: {'lr': 0.0004999983530588853, 'samples': 417024, 'steps': 2171, 'loss/train': 2.061142921447754} -11/06/2021 21:34:33 - INFO - __main__ - Step 2173: {'lr': 0.0004999983337401145, 'samples': 417216, 'steps': 2172, 'loss/train': 2.451244354248047} -11/06/2021 21:34:34 - INFO - __main__ - Step 2174: {'lr': 0.0004999983143086984, 'samples': 417408, 'steps': 2173, 'loss/train': 1.99120032787323} -11/06/2021 21:34:34 - INFO - __main__ - Step 2175: {'lr': 0.0004999982947646368, 'samples': 417600, 'steps': 2174, 'loss/train': 2.0224850177764893} -11/06/2021 21:34:34 - INFO - __main__ - Step 2176: {'lr': 0.00049999827510793, 'samples': 417792, 'steps': 2175, 'loss/train': 2.3628859519958496} -11/06/2021 21:34:35 - INFO - __main__ - Step 2177: {'lr': 0.0004999982553385778, 'samples': 417984, 'steps': 2176, 'loss/train': 2.5779266357421875} -11/06/2021 21:34:35 - INFO - __main__ - Step 2178: {'lr': 0.0004999982354565802, 'samples': 418176, 'steps': 2177, 'loss/train': 2.631287097930908} -11/06/2021 21:34:36 - INFO - __main__ - Step 2179: {'lr': 0.0004999982154619372, 'samples': 418368, 'steps': 2178, 'loss/train': 2.691127300262451} -11/06/2021 21:34:36 - INFO - __main__ - Step 2180: {'lr': 0.000499998195354649, 'samples': 418560, 'steps': 2179, 'loss/train': 2.6451637744903564} -11/06/2021 21:34:37 - INFO - __main__ - Step 2181: {'lr': 0.0004999981751347153, 'samples': 418752, 'steps': 2180, 'loss/train': 3.3670623302459717} -11/06/2021 21:34:37 - INFO - __main__ - Step 2182: {'lr': 0.0004999981548021364, 'samples': 418944, 'steps': 2181, 'loss/train': 2.2093632221221924} -11/06/2021 21:34:37 - INFO - __main__ - Step 2183: {'lr': 0.0004999981343569122, 'samples': 419136, 'steps': 2182, 'loss/train': 2.704352855682373} -11/06/2021 21:34:38 - INFO - __main__ - Step 2184: {'lr': 0.0004999981137990425, 'samples': 419328, 'steps': 2183, 'loss/train': 3.1171112060546875} -11/06/2021 21:34:39 - INFO - __main__ - Step 2185: {'lr': 0.0004999980931285278, 'samples': 419520, 'steps': 2184, 'loss/train': 2.5423855781555176} -11/06/2021 21:34:39 - INFO - __main__ - Step 2186: {'lr': 0.0004999980723453676, 'samples': 419712, 'steps': 2185, 'loss/train': 1.9052900075912476} -11/06/2021 21:34:40 - INFO - __main__ - Step 2187: {'lr': 0.0004999980514495623, 'samples': 419904, 'steps': 2186, 'loss/train': 2.7308359146118164} -11/06/2021 21:34:40 - INFO - __main__ - Step 2188: {'lr': 0.0004999980304411116, 'samples': 420096, 'steps': 2187, 'loss/train': 2.344801902770996} -11/06/2021 21:34:40 - INFO - __main__ - Step 2189: {'lr': 0.0004999980093200157, 'samples': 420288, 'steps': 2188, 'loss/train': 2.7158095836639404} -11/06/2021 21:34:41 - INFO - __main__ - Step 2190: {'lr': 0.0004999979880862745, 'samples': 420480, 'steps': 2189, 'loss/train': 1.4334872961044312} -11/06/2021 21:34:42 - INFO - __main__ - Step 2191: {'lr': 0.0004999979667398882, 'samples': 420672, 'steps': 2190, 'loss/train': 2.5495493412017822} -11/06/2021 21:34:42 - INFO - __main__ - Step 2192: {'lr': 0.0004999979452808565, 'samples': 420864, 'steps': 2191, 'loss/train': 2.356931447982788} -11/06/2021 21:34:42 - INFO - __main__ - Step 2193: {'lr': 0.0004999979237091796, 'samples': 421056, 'steps': 2192, 'loss/train': 2.551086902618408} -11/06/2021 21:34:43 - INFO - __main__ - Step 2194: {'lr': 0.0004999979020248577, 'samples': 421248, 'steps': 2193, 'loss/train': 2.4983091354370117} -11/06/2021 21:34:43 - INFO - __main__ - Step 2195: {'lr': 0.0004999978802278904, 'samples': 421440, 'steps': 2194, 'loss/train': 2.6009490489959717} -11/06/2021 21:34:44 - INFO - __main__ - Step 2196: {'lr': 0.000499997858318278, 'samples': 421632, 'steps': 2195, 'loss/train': 2.3032186031341553} -11/06/2021 21:34:45 - INFO - __main__ - Step 2197: {'lr': 0.0004999978362960204, 'samples': 421824, 'steps': 2196, 'loss/train': 2.835674285888672} -11/06/2021 21:34:45 - INFO - __main__ - Step 2198: {'lr': 0.0004999978141611176, 'samples': 422016, 'steps': 2197, 'loss/train': 3.615586042404175} -11/06/2021 21:34:45 - INFO - __main__ - Step 2199: {'lr': 0.0004999977919135696, 'samples': 422208, 'steps': 2198, 'loss/train': 1.8978424072265625} -11/06/2021 21:34:46 - INFO - __main__ - Step 2200: {'lr': 0.0004999977695533766, 'samples': 422400, 'steps': 2199, 'loss/train': 2.526134967803955} -11/06/2021 21:34:47 - INFO - __main__ - Step 2201: {'lr': 0.0004999977470805383, 'samples': 422592, 'steps': 2200, 'loss/train': 2.3798577785491943} -11/06/2021 21:34:47 - INFO - __main__ - Step 2202: {'lr': 0.0004999977244950551, 'samples': 422784, 'steps': 2201, 'loss/train': 2.6443750858306885} -11/06/2021 21:34:47 - INFO - __main__ - Step 2203: {'lr': 0.0004999977017969266, 'samples': 422976, 'steps': 2202, 'loss/train': 1.9695329666137695} -11/06/2021 21:34:48 - INFO - __main__ - Step 2204: {'lr': 0.000499997678986153, 'samples': 423168, 'steps': 2203, 'loss/train': 2.704178810119629} -11/06/2021 21:34:48 - INFO - __main__ - Step 2205: {'lr': 0.0004999976560627344, 'samples': 423360, 'steps': 2204, 'loss/train': 2.8710994720458984} -11/06/2021 21:34:49 - INFO - __main__ - Step 2206: {'lr': 0.0004999976330266707, 'samples': 423552, 'steps': 2205, 'loss/train': 2.6105599403381348} -11/06/2021 21:34:49 - INFO - __main__ - Step 2207: {'lr': 0.0004999976098779618, 'samples': 423744, 'steps': 2206, 'loss/train': 2.541774272918701} -11/06/2021 21:34:50 - INFO - __main__ - Step 2208: {'lr': 0.0004999975866166079, 'samples': 423936, 'steps': 2207, 'loss/train': 2.3094847202301025} -11/06/2021 21:34:50 - INFO - __main__ - Step 2209: {'lr': 0.000499997563242609, 'samples': 424128, 'steps': 2208, 'loss/train': 2.5492539405822754} -11/06/2021 21:34:50 - INFO - __main__ - Step 2210: {'lr': 0.0004999975397559649, 'samples': 424320, 'steps': 2209, 'loss/train': 2.095379114151001} -11/06/2021 21:34:52 - INFO - __main__ - Step 2211: {'lr': 0.000499997516156676, 'samples': 424512, 'steps': 2210, 'loss/train': 2.605085849761963} -11/06/2021 21:34:52 - INFO - __main__ - Step 2212: {'lr': 0.000499997492444742, 'samples': 424704, 'steps': 2211, 'loss/train': 2.455345630645752} -11/06/2021 21:34:52 - INFO - __main__ - Step 2213: {'lr': 0.0004999974686201629, 'samples': 424896, 'steps': 2212, 'loss/train': 2.637754201889038} -11/06/2021 21:34:53 - INFO - __main__ - Step 2214: {'lr': 0.0004999974446829389, 'samples': 425088, 'steps': 2213, 'loss/train': 2.4633007049560547} -11/06/2021 21:34:53 - INFO - __main__ - Step 2215: {'lr': 0.0004999974206330698, 'samples': 425280, 'steps': 2214, 'loss/train': 2.5374715328216553} -11/06/2021 21:34:53 - INFO - __main__ - Step 2216: {'lr': 0.0004999973964705558, 'samples': 425472, 'steps': 2215, 'loss/train': 2.7447330951690674} -11/06/2021 21:34:54 - INFO - __main__ - Step 2217: {'lr': 0.0004999973721953968, 'samples': 425664, 'steps': 2216, 'loss/train': 2.3357722759246826} -11/06/2021 21:34:55 - INFO - __main__ - Step 2218: {'lr': 0.0004999973478075928, 'samples': 425856, 'steps': 2217, 'loss/train': 2.6798555850982666} -11/06/2021 21:34:55 - INFO - __main__ - Step 2219: {'lr': 0.0004999973233071438, 'samples': 426048, 'steps': 2218, 'loss/train': 2.2830727100372314} -11/06/2021 21:34:55 - INFO - __main__ - Step 2220: {'lr': 0.00049999729869405, 'samples': 426240, 'steps': 2219, 'loss/train': 2.466994524002075} -11/06/2021 21:34:56 - INFO - __main__ - Step 2221: {'lr': 0.0004999972739683113, 'samples': 426432, 'steps': 2220, 'loss/train': 2.3057074546813965} -11/06/2021 21:34:57 - INFO - __main__ - Step 2222: {'lr': 0.0004999972491299276, 'samples': 426624, 'steps': 2221, 'loss/train': 2.5645909309387207} -11/06/2021 21:34:57 - INFO - __main__ - Step 2223: {'lr': 0.000499997224178899, 'samples': 426816, 'steps': 2222, 'loss/train': 2.493025064468384} -11/06/2021 21:34:57 - INFO - __main__ - Step 2224: {'lr': 0.0004999971991152256, 'samples': 427008, 'steps': 2223, 'loss/train': 3.2061784267425537} -11/06/2021 21:34:58 - INFO - __main__ - Step 2225: {'lr': 0.0004999971739389072, 'samples': 427200, 'steps': 2224, 'loss/train': 2.114089250564575} -11/06/2021 21:34:58 - INFO - __main__ - Step 2226: {'lr': 0.000499997148649944, 'samples': 427392, 'steps': 2225, 'loss/train': 2.6324121952056885} -11/06/2021 21:34:59 - INFO - __main__ - Step 2227: {'lr': 0.0004999971232483359, 'samples': 427584, 'steps': 2226, 'loss/train': 2.3817732334136963} -11/06/2021 21:34:59 - INFO - __main__ - Step 2228: {'lr': 0.0004999970977340829, 'samples': 427776, 'steps': 2227, 'loss/train': 2.323068380355835} -11/06/2021 21:35:00 - INFO - __main__ - Step 2229: {'lr': 0.0004999970721071852, 'samples': 427968, 'steps': 2228, 'loss/train': 2.610438585281372} -11/06/2021 21:35:00 - INFO - __main__ - Step 2230: {'lr': 0.0004999970463676427, 'samples': 428160, 'steps': 2229, 'loss/train': 2.492368221282959} -11/06/2021 21:35:00 - INFO - __main__ - Step 2231: {'lr': 0.0004999970205154553, 'samples': 428352, 'steps': 2230, 'loss/train': 2.369539499282837} -11/06/2021 21:35:02 - INFO - __main__ - Step 2232: {'lr': 0.000499996994550623, 'samples': 428544, 'steps': 2231, 'loss/train': 2.712465524673462} -11/06/2021 21:35:02 - INFO - __main__ - Step 2233: {'lr': 0.000499996968473146, 'samples': 428736, 'steps': 2232, 'loss/train': 3.136364221572876} -11/06/2021 21:35:02 - INFO - __main__ - Step 2234: {'lr': 0.0004999969422830242, 'samples': 428928, 'steps': 2233, 'loss/train': 1.8193436861038208} -11/06/2021 21:35:03 - INFO - __main__ - Step 2235: {'lr': 0.0004999969159802577, 'samples': 429120, 'steps': 2234, 'loss/train': 2.6638810634613037} -11/06/2021 21:35:03 - INFO - __main__ - Step 2236: {'lr': 0.0004999968895648464, 'samples': 429312, 'steps': 2235, 'loss/train': 2.946650505065918} -11/06/2021 21:35:03 - INFO - __main__ - Step 2237: {'lr': 0.0004999968630367905, 'samples': 429504, 'steps': 2236, 'loss/train': 1.9133739471435547} -11/06/2021 21:35:04 - INFO - __main__ - Step 2238: {'lr': 0.0004999968363960897, 'samples': 429696, 'steps': 2237, 'loss/train': 2.461745023727417} -11/06/2021 21:35:05 - INFO - __main__ - Step 2239: {'lr': 0.0004999968096427443, 'samples': 429888, 'steps': 2238, 'loss/train': 1.956204891204834} -11/06/2021 21:35:05 - INFO - __main__ - Step 2240: {'lr': 0.0004999967827767541, 'samples': 430080, 'steps': 2239, 'loss/train': 2.4149010181427} -11/06/2021 21:35:05 - INFO - __main__ - Step 2241: {'lr': 0.0004999967557981192, 'samples': 430272, 'steps': 2240, 'loss/train': 2.339151382446289} -11/06/2021 21:35:06 - INFO - __main__ - Step 2242: {'lr': 0.0004999967287068396, 'samples': 430464, 'steps': 2241, 'loss/train': 1.5045028924942017} -11/06/2021 21:35:07 - INFO - __main__ - Step 2243: {'lr': 0.0004999967015029155, 'samples': 430656, 'steps': 2242, 'loss/train': 2.4464919567108154} -11/06/2021 21:35:07 - INFO - __main__ - Step 2244: {'lr': 0.0004999966741863467, 'samples': 430848, 'steps': 2243, 'loss/train': 2.7989583015441895} -11/06/2021 21:35:07 - INFO - __main__ - Step 2245: {'lr': 0.000499996646757133, 'samples': 431040, 'steps': 2244, 'loss/train': 2.849099636077881} -11/06/2021 21:35:08 - INFO - __main__ - Step 2246: {'lr': 0.0004999966192152749, 'samples': 431232, 'steps': 2245, 'loss/train': 2.3336470127105713} -11/06/2021 21:35:08 - INFO - __main__ - Step 2247: {'lr': 0.0004999965915607722, 'samples': 431424, 'steps': 2246, 'loss/train': 1.3028373718261719} -11/06/2021 21:35:09 - INFO - __main__ - Step 2248: {'lr': 0.0004999965637936248, 'samples': 431616, 'steps': 2247, 'loss/train': 2.4899795055389404} -11/06/2021 21:35:10 - INFO - __main__ - Step 2249: {'lr': 0.0004999965359138329, 'samples': 431808, 'steps': 2248, 'loss/train': 3.0825843811035156} -11/06/2021 21:35:10 - INFO - __main__ - Step 2250: {'lr': 0.0004999965079213964, 'samples': 432000, 'steps': 2249, 'loss/train': 2.510723352432251} -11/06/2021 21:35:10 - INFO - __main__ - Step 2251: {'lr': 0.0004999964798163152, 'samples': 432192, 'steps': 2250, 'loss/train': 2.384847640991211} -11/06/2021 21:35:11 - INFO - __main__ - Step 2252: {'lr': 0.0004999964515985896, 'samples': 432384, 'steps': 2251, 'loss/train': 2.7811596393585205} -11/06/2021 21:35:12 - INFO - __main__ - Step 2253: {'lr': 0.0004999964232682194, 'samples': 432576, 'steps': 2252, 'loss/train': 3.195866823196411} -11/06/2021 21:35:12 - INFO - __main__ - Step 2254: {'lr': 0.0004999963948252046, 'samples': 432768, 'steps': 2253, 'loss/train': 1.684893012046814} -11/06/2021 21:35:12 - INFO - __main__ - Step 2255: {'lr': 0.0004999963662695453, 'samples': 432960, 'steps': 2254, 'loss/train': 2.470139265060425} -11/06/2021 21:35:13 - INFO - __main__ - Step 2256: {'lr': 0.0004999963376012416, 'samples': 433152, 'steps': 2255, 'loss/train': 2.2551157474517822} -11/06/2021 21:35:13 - INFO - __main__ - Step 2257: {'lr': 0.0004999963088202934, 'samples': 433344, 'steps': 2256, 'loss/train': 1.778255581855774} -11/06/2021 21:35:13 - INFO - __main__ - Step 2258: {'lr': 0.0004999962799267006, 'samples': 433536, 'steps': 2257, 'loss/train': 2.4314968585968018} -11/06/2021 21:35:14 - INFO - __main__ - Step 2259: {'lr': 0.0004999962509204634, 'samples': 433728, 'steps': 2258, 'loss/train': 2.8687584400177} -11/06/2021 21:35:15 - INFO - __main__ - Step 2260: {'lr': 0.0004999962218015818, 'samples': 433920, 'steps': 2259, 'loss/train': 2.5391645431518555} -11/06/2021 21:35:15 - INFO - __main__ - Step 2261: {'lr': 0.0004999961925700557, 'samples': 434112, 'steps': 2260, 'loss/train': 2.284990072250366} -11/06/2021 21:35:15 - INFO - __main__ - Step 2262: {'lr': 0.0004999961632258851, 'samples': 434304, 'steps': 2261, 'loss/train': 2.2912981510162354} -11/06/2021 21:35:16 - INFO - __main__ - Step 2263: {'lr': 0.0004999961337690703, 'samples': 434496, 'steps': 2262, 'loss/train': 2.5647494792938232} -11/06/2021 21:35:17 - INFO - __main__ - Step 2264: {'lr': 0.0004999961041996109, 'samples': 434688, 'steps': 2263, 'loss/train': 2.3833937644958496} -11/06/2021 21:35:17 - INFO - __main__ - Step 2265: {'lr': 0.0004999960745175071, 'samples': 434880, 'steps': 2264, 'loss/train': 2.4869725704193115} -11/06/2021 21:35:18 - INFO - __main__ - Step 2266: {'lr': 0.0004999960447227591, 'samples': 435072, 'steps': 2265, 'loss/train': 2.0234827995300293} -11/06/2021 21:35:18 - INFO - __main__ - Step 2267: {'lr': 0.0004999960148153667, 'samples': 435264, 'steps': 2266, 'loss/train': 2.4819018840789795} -11/06/2021 21:35:18 - INFO - __main__ - Step 2268: {'lr': 0.0004999959847953299, 'samples': 435456, 'steps': 2267, 'loss/train': 1.9739242792129517} -11/06/2021 21:35:19 - INFO - __main__ - Step 2269: {'lr': 0.0004999959546626487, 'samples': 435648, 'steps': 2268, 'loss/train': 2.5445456504821777} -11/06/2021 21:35:20 - INFO - __main__ - Step 2270: {'lr': 0.0004999959244173232, 'samples': 435840, 'steps': 2269, 'loss/train': 1.6040853261947632} -11/06/2021 21:35:20 - INFO - __main__ - Step 2271: {'lr': 0.0004999958940593535, 'samples': 436032, 'steps': 2270, 'loss/train': 2.391418218612671} -11/06/2021 21:35:20 - INFO - __main__ - Step 2272: {'lr': 0.0004999958635887394, 'samples': 436224, 'steps': 2271, 'loss/train': 2.7278921604156494} -11/06/2021 21:35:21 - INFO - __main__ - Step 2273: {'lr': 0.0004999958330054811, 'samples': 436416, 'steps': 2272, 'loss/train': 2.206878900527954} -11/06/2021 21:35:21 - INFO - __main__ - Step 2274: {'lr': 0.0004999958023095785, 'samples': 436608, 'steps': 2273, 'loss/train': 2.4823598861694336} -11/06/2021 21:35:22 - INFO - __main__ - Step 2275: {'lr': 0.0004999957715010317, 'samples': 436800, 'steps': 2274, 'loss/train': 2.0036473274230957} -11/06/2021 21:35:22 - INFO - __main__ - Step 2276: {'lr': 0.0004999957405798405, 'samples': 436992, 'steps': 2275, 'loss/train': 2.6134819984436035} -11/06/2021 21:35:23 - INFO - __main__ - Step 2277: {'lr': 0.0004999957095460052, 'samples': 437184, 'steps': 2276, 'loss/train': 2.5736441612243652} -11/06/2021 21:35:23 - INFO - __main__ - Step 2278: {'lr': 0.0004999956783995257, 'samples': 437376, 'steps': 2277, 'loss/train': 2.585498809814453} -11/06/2021 21:35:23 - INFO - __main__ - Step 2279: {'lr': 0.0004999956471404021, 'samples': 437568, 'steps': 2278, 'loss/train': 2.7420217990875244} -11/06/2021 21:35:24 - INFO - __main__ - Step 2280: {'lr': 0.0004999956157686341, 'samples': 437760, 'steps': 2279, 'loss/train': 2.3299975395202637} -11/06/2021 21:35:25 - INFO - __main__ - Step 2281: {'lr': 0.0004999955842842222, 'samples': 437952, 'steps': 2280, 'loss/train': 2.463308334350586} -11/06/2021 21:35:25 - INFO - __main__ - Step 2282: {'lr': 0.0004999955526871659, 'samples': 438144, 'steps': 2281, 'loss/train': 1.7193819284439087} -11/06/2021 21:35:26 - INFO - __main__ - Step 2283: {'lr': 0.0004999955209774656, 'samples': 438336, 'steps': 2282, 'loss/train': 2.3171699047088623} -11/06/2021 21:35:26 - INFO - __main__ - Step 2284: {'lr': 0.0004999954891551211, 'samples': 438528, 'steps': 2283, 'loss/train': 3.057791233062744} -11/06/2021 21:35:27 - INFO - __main__ - Step 2285: {'lr': 0.0004999954572201326, 'samples': 438720, 'steps': 2284, 'loss/train': 2.662093162536621} -11/06/2021 21:35:27 - INFO - __main__ - Step 2286: {'lr': 0.0004999954251724999, 'samples': 438912, 'steps': 2285, 'loss/train': 2.635653495788574} -11/06/2021 21:35:28 - INFO - __main__ - Step 2287: {'lr': 0.0004999953930122231, 'samples': 439104, 'steps': 2286, 'loss/train': 2.4084901809692383} -11/06/2021 21:35:28 - INFO - __main__ - Step 2288: {'lr': 0.0004999953607393023, 'samples': 439296, 'steps': 2287, 'loss/train': 2.4325740337371826} -11/06/2021 21:35:28 - INFO - __main__ - Step 2289: {'lr': 0.0004999953283537374, 'samples': 439488, 'steps': 2288, 'loss/train': 2.2441446781158447} -11/06/2021 21:35:29 - INFO - __main__ - Step 2290: {'lr': 0.0004999952958555285, 'samples': 439680, 'steps': 2289, 'loss/train': 3.243093729019165} -11/06/2021 21:35:30 - INFO - __main__ - Step 2291: {'lr': 0.0004999952632446756, 'samples': 439872, 'steps': 2290, 'loss/train': 2.7363367080688477} -11/06/2021 21:35:30 - INFO - __main__ - Step 2292: {'lr': 0.0004999952305211786, 'samples': 440064, 'steps': 2291, 'loss/train': 1.7157084941864014} -11/06/2021 21:35:31 - INFO - __main__ - Step 2293: {'lr': 0.0004999951976850377, 'samples': 440256, 'steps': 2292, 'loss/train': 1.871019721031189} -11/06/2021 21:35:31 - INFO - __main__ - Step 2294: {'lr': 0.0004999951647362527, 'samples': 440448, 'steps': 2293, 'loss/train': 2.4851877689361572} -11/06/2021 21:35:32 - INFO - __main__ - Step 2295: {'lr': 0.0004999951316748239, 'samples': 440640, 'steps': 2294, 'loss/train': 2.7389845848083496} -11/06/2021 21:35:32 - INFO - __main__ - Step 2296: {'lr': 0.0004999950985007511, 'samples': 440832, 'steps': 2295, 'loss/train': 1.447107195854187} -11/06/2021 21:35:33 - INFO - __main__ - Step 2297: {'lr': 0.0004999950652140343, 'samples': 441024, 'steps': 2296, 'loss/train': 2.8587417602539062} -11/06/2021 21:35:33 - INFO - __main__ - Step 2298: {'lr': 0.0004999950318146737, 'samples': 441216, 'steps': 2297, 'loss/train': 2.5910117626190186} -11/06/2021 21:35:33 - INFO - __main__ - Step 2299: {'lr': 0.0004999949983026691, 'samples': 441408, 'steps': 2298, 'loss/train': 2.3904645442962646} -11/06/2021 21:35:34 - INFO - __main__ - Step 2300: {'lr': 0.0004999949646780205, 'samples': 441600, 'steps': 2299, 'loss/train': 2.857335329055786} -11/06/2021 21:35:35 - INFO - __main__ - Step 2301: {'lr': 0.0004999949309407283, 'samples': 441792, 'steps': 2300, 'loss/train': 2.917921543121338} -11/06/2021 21:35:35 - INFO - __main__ - Step 2302: {'lr': 0.0004999948970907921, 'samples': 441984, 'steps': 2301, 'loss/train': 2.345691442489624} -11/06/2021 21:35:36 - INFO - __main__ - Step 2303: {'lr': 0.0004999948631282119, 'samples': 442176, 'steps': 2302, 'loss/train': 1.4263627529144287} -11/06/2021 21:35:36 - INFO - __main__ - Step 2304: {'lr': 0.0004999948290529881, 'samples': 442368, 'steps': 2303, 'loss/train': 2.424299955368042} -11/06/2021 21:35:36 - INFO - __main__ - Step 2305: {'lr': 0.0004999947948651204, 'samples': 442560, 'steps': 2304, 'loss/train': 1.874759316444397} -11/06/2021 21:35:37 - INFO - __main__ - Step 2306: {'lr': 0.0004999947605646089, 'samples': 442752, 'steps': 2305, 'loss/train': 2.55169677734375} -11/06/2021 21:35:38 - INFO - __main__ - Step 2307: {'lr': 0.0004999947261514537, 'samples': 442944, 'steps': 2306, 'loss/train': 2.5056583881378174} -11/06/2021 21:35:38 - INFO - __main__ - Step 2308: {'lr': 0.0004999946916256547, 'samples': 443136, 'steps': 2307, 'loss/train': 2.708646535873413} -11/06/2021 21:35:38 - INFO - __main__ - Step 2309: {'lr': 0.0004999946569872118, 'samples': 443328, 'steps': 2308, 'loss/train': 2.174234628677368} -11/06/2021 21:35:39 - INFO - __main__ - Step 2310: {'lr': 0.0004999946222361254, 'samples': 443520, 'steps': 2309, 'loss/train': 2.365739107131958} -11/06/2021 21:35:40 - INFO - __main__ - Step 2311: {'lr': 0.0004999945873723951, 'samples': 443712, 'steps': 2310, 'loss/train': 2.3640260696411133} -11/06/2021 21:35:40 - INFO - __main__ - Step 2312: {'lr': 0.0004999945523960212, 'samples': 443904, 'steps': 2311, 'loss/train': 1.8592215776443481} -11/06/2021 21:35:40 - INFO - __main__ - Step 2313: {'lr': 0.0004999945173070035, 'samples': 444096, 'steps': 2312, 'loss/train': 2.9647116661071777} -11/06/2021 21:35:41 - INFO - __main__ - Step 2314: {'lr': 0.0004999944821053422, 'samples': 444288, 'steps': 2313, 'loss/train': 2.653313636779785} -11/06/2021 21:35:41 - INFO - __main__ - Step 2315: {'lr': 0.0004999944467910372, 'samples': 444480, 'steps': 2314, 'loss/train': 2.4893155097961426} -11/06/2021 21:35:42 - INFO - __main__ - Step 2316: {'lr': 0.0004999944113640887, 'samples': 444672, 'steps': 2315, 'loss/train': 2.724855422973633} -11/06/2021 21:35:43 - INFO - __main__ - Step 2317: {'lr': 0.0004999943758244964, 'samples': 444864, 'steps': 2316, 'loss/train': 2.472731590270996} -11/06/2021 21:35:43 - INFO - __main__ - Step 2318: {'lr': 0.0004999943401722606, 'samples': 445056, 'steps': 2317, 'loss/train': 2.70874285697937} -11/06/2021 21:35:43 - INFO - __main__ - Step 2319: {'lr': 0.0004999943044073813, 'samples': 445248, 'steps': 2318, 'loss/train': 2.925724983215332} -11/06/2021 21:35:44 - INFO - __main__ - Step 2320: {'lr': 0.0004999942685298582, 'samples': 445440, 'steps': 2319, 'loss/train': 2.7367475032806396} -11/06/2021 21:35:44 - INFO - __main__ - Step 2321: {'lr': 0.0004999942325396916, 'samples': 445632, 'steps': 2320, 'loss/train': 2.439120054244995} -11/06/2021 21:35:45 - INFO - __main__ - Step 2322: {'lr': 0.0004999941964368817, 'samples': 445824, 'steps': 2321, 'loss/train': 2.9538588523864746} -11/06/2021 21:35:45 - INFO - __main__ - Step 2323: {'lr': 0.000499994160221428, 'samples': 446016, 'steps': 2322, 'loss/train': 2.5466785430908203} -11/06/2021 21:35:46 - INFO - __main__ - Step 2324: {'lr': 0.0004999941238933308, 'samples': 446208, 'steps': 2323, 'loss/train': 2.833611488342285} -11/06/2021 21:35:46 - INFO - __main__ - Step 2325: {'lr': 0.0004999940874525902, 'samples': 446400, 'steps': 2324, 'loss/train': 2.2067928314208984} -11/06/2021 21:35:46 - INFO - __main__ - Step 2326: {'lr': 0.0004999940508992061, 'samples': 446592, 'steps': 2325, 'loss/train': 2.688612222671509} -11/06/2021 21:35:48 - INFO - __main__ - Step 2327: {'lr': 0.0004999940142331785, 'samples': 446784, 'steps': 2326, 'loss/train': 2.2611327171325684} -11/06/2021 21:35:48 - INFO - __main__ - Step 2328: {'lr': 0.0004999939774545074, 'samples': 446976, 'steps': 2327, 'loss/train': 2.940781593322754} -11/06/2021 21:35:48 - INFO - __main__ - Step 2329: {'lr': 0.000499993940563193, 'samples': 447168, 'steps': 2328, 'loss/train': 1.4350242614746094} -11/06/2021 21:35:49 - INFO - __main__ - Step 2330: {'lr': 0.0004999939035592351, 'samples': 447360, 'steps': 2329, 'loss/train': 1.2856340408325195} -11/06/2021 21:35:49 - INFO - __main__ - Step 2331: {'lr': 0.0004999938664426339, 'samples': 447552, 'steps': 2330, 'loss/train': 2.2000558376312256} -11/06/2021 21:35:50 - INFO - __main__ - Step 2332: {'lr': 0.0004999938292133894, 'samples': 447744, 'steps': 2331, 'loss/train': 2.552149534225464} -11/06/2021 21:35:51 - INFO - __main__ - Step 2333: {'lr': 0.0004999937918715013, 'samples': 447936, 'steps': 2332, 'loss/train': 2.23763370513916} -11/06/2021 21:35:51 - INFO - __main__ - Step 2334: {'lr': 0.00049999375441697, 'samples': 448128, 'steps': 2333, 'loss/train': 2.5193448066711426} -11/06/2021 21:35:51 - INFO - __main__ - Step 2335: {'lr': 0.0004999937168497954, 'samples': 448320, 'steps': 2334, 'loss/train': 2.982269763946533} -11/06/2021 21:35:52 - INFO - __main__ - Step 2336: {'lr': 0.0004999936791699773, 'samples': 448512, 'steps': 2335, 'loss/train': 2.2376298904418945} -11/06/2021 21:35:53 - INFO - __main__ - Step 2337: {'lr': 0.0004999936413775161, 'samples': 448704, 'steps': 2336, 'loss/train': 2.544750928878784} -11/06/2021 21:35:53 - INFO - __main__ - Step 2338: {'lr': 0.0004999936034724115, 'samples': 448896, 'steps': 2337, 'loss/train': 2.562856912612915} -11/06/2021 21:35:53 - INFO - __main__ - Step 2339: {'lr': 0.0004999935654546638, 'samples': 449088, 'steps': 2338, 'loss/train': 2.4741744995117188} -11/06/2021 21:35:54 - INFO - __main__ - Step 2340: {'lr': 0.0004999935273242727, 'samples': 449280, 'steps': 2339, 'loss/train': 2.637646198272705} -11/06/2021 21:35:54 - INFO - __main__ - Step 2341: {'lr': 0.0004999934890812384, 'samples': 449472, 'steps': 2340, 'loss/train': 2.313438892364502} -11/06/2021 21:35:55 - INFO - __main__ - Step 2342: {'lr': 0.0004999934507255609, 'samples': 449664, 'steps': 2341, 'loss/train': 1.6301710605621338} -11/06/2021 21:35:55 - INFO - __main__ - Step 2343: {'lr': 0.0004999934122572403, 'samples': 449856, 'steps': 2342, 'loss/train': 2.490684747695923} -11/06/2021 21:35:56 - INFO - __main__ - Step 2344: {'lr': 0.0004999933736762763, 'samples': 450048, 'steps': 2343, 'loss/train': 2.5411455631256104} -11/06/2021 21:35:56 - INFO - __main__ - Step 2345: {'lr': 0.0004999933349826694, 'samples': 450240, 'steps': 2344, 'loss/train': 2.634213924407959} -11/06/2021 21:35:57 - INFO - __main__ - Step 2346: {'lr': 0.0004999932961764192, 'samples': 450432, 'steps': 2345, 'loss/train': 2.2040252685546875} -11/06/2021 21:35:58 - INFO - __main__ - Step 2347: {'lr': 0.000499993257257526, 'samples': 450624, 'steps': 2346, 'loss/train': 3.1868784427642822} -11/06/2021 21:35:58 - INFO - __main__ - Step 2348: {'lr': 0.0004999932182259897, 'samples': 450816, 'steps': 2347, 'loss/train': 2.624990940093994} -11/06/2021 21:35:58 - INFO - __main__ - Step 2349: {'lr': 0.0004999931790818102, 'samples': 451008, 'steps': 2348, 'loss/train': 2.1832830905914307} -11/06/2021 21:35:59 - INFO - __main__ - Step 2350: {'lr': 0.0004999931398249876, 'samples': 451200, 'steps': 2349, 'loss/train': 1.3503772020339966} -11/06/2021 21:35:59 - INFO - __main__ - Step 2351: {'lr': 0.0004999931004555221, 'samples': 451392, 'steps': 2350, 'loss/train': 2.434903383255005} -11/06/2021 21:36:00 - INFO - __main__ - Step 2352: {'lr': 0.0004999930609734135, 'samples': 451584, 'steps': 2351, 'loss/train': 1.9292891025543213} -11/06/2021 21:36:01 - INFO - __main__ - Step 2353: {'lr': 0.0004999930213786619, 'samples': 451776, 'steps': 2352, 'loss/train': 2.576533555984497} -11/06/2021 21:36:01 - INFO - __main__ - Step 2354: {'lr': 0.0004999929816712672, 'samples': 451968, 'steps': 2353, 'loss/train': 2.6374588012695312} -11/06/2021 21:36:01 - INFO - __main__ - Step 2355: {'lr': 0.0004999929418512296, 'samples': 452160, 'steps': 2354, 'loss/train': 2.645233392715454} -11/06/2021 21:36:02 - INFO - __main__ - Step 2356: {'lr': 0.0004999929019185491, 'samples': 452352, 'steps': 2355, 'loss/train': 2.3898088932037354} -11/06/2021 21:36:02 - INFO - __main__ - Step 2357: {'lr': 0.0004999928618732256, 'samples': 452544, 'steps': 2356, 'loss/train': 2.8378491401672363} -11/06/2021 21:36:03 - INFO - __main__ - Step 2358: {'lr': 0.0004999928217152591, 'samples': 452736, 'steps': 2357, 'loss/train': 2.8093080520629883} -11/06/2021 21:36:03 - INFO - __main__ - Step 2359: {'lr': 0.0004999927814446498, 'samples': 452928, 'steps': 2358, 'loss/train': 2.382434844970703} -11/06/2021 21:36:04 - INFO - __main__ - Step 2360: {'lr': 0.0004999927410613975, 'samples': 453120, 'steps': 2359, 'loss/train': 2.509754180908203} -11/06/2021 21:36:04 - INFO - __main__ - Step 2361: {'lr': 0.0004999927005655024, 'samples': 453312, 'steps': 2360, 'loss/train': 2.2279305458068848} -11/06/2021 21:36:04 - INFO - __main__ - Step 2362: {'lr': 0.0004999926599569644, 'samples': 453504, 'steps': 2361, 'loss/train': 2.2018115520477295} -11/06/2021 21:36:05 - INFO - __main__ - Step 2363: {'lr': 0.0004999926192357836, 'samples': 453696, 'steps': 2362, 'loss/train': 2.667649269104004} -11/06/2021 21:36:06 - INFO - __main__ - Step 2364: {'lr': 0.00049999257840196, 'samples': 453888, 'steps': 2363, 'loss/train': 1.9997769594192505} -11/06/2021 21:36:06 - INFO - __main__ - Step 2365: {'lr': 0.0004999925374554936, 'samples': 454080, 'steps': 2364, 'loss/train': 2.3278563022613525} -11/06/2021 21:36:06 - INFO - __main__ - Step 2366: {'lr': 0.0004999924963963845, 'samples': 454272, 'steps': 2365, 'loss/train': 2.7401719093322754} -11/06/2021 21:36:07 - INFO - __main__ - Step 2367: {'lr': 0.0004999924552246324, 'samples': 454464, 'steps': 2366, 'loss/train': 2.5451650619506836} -11/06/2021 21:36:08 - INFO - __main__ - Step 2368: {'lr': 0.0004999924139402378, 'samples': 454656, 'steps': 2367, 'loss/train': 2.171853542327881} -11/06/2021 21:36:08 - INFO - __main__ - Step 2369: {'lr': 0.0004999923725432004, 'samples': 454848, 'steps': 2368, 'loss/train': 2.3794937133789062} -11/06/2021 21:36:09 - INFO - __main__ - Step 2370: {'lr': 0.0004999923310335202, 'samples': 455040, 'steps': 2369, 'loss/train': 2.2186713218688965} -11/06/2021 21:36:09 - INFO - __main__ - Step 2371: {'lr': 0.0004999922894111975, 'samples': 455232, 'steps': 2370, 'loss/train': 2.5309088230133057} -11/06/2021 21:36:09 - INFO - __main__ - Step 2372: {'lr': 0.000499992247676232, 'samples': 455424, 'steps': 2371, 'loss/train': 2.399653196334839} -11/06/2021 21:36:10 - INFO - __main__ - Step 2373: {'lr': 0.0004999922058286238, 'samples': 455616, 'steps': 2372, 'loss/train': 2.432457208633423} -11/06/2021 21:36:11 - INFO - __main__ - Step 2374: {'lr': 0.0004999921638683731, 'samples': 455808, 'steps': 2373, 'loss/train': 2.936699390411377} -11/06/2021 21:36:11 - INFO - __main__ - Step 2375: {'lr': 0.0004999921217954797, 'samples': 456000, 'steps': 2374, 'loss/train': 2.8602395057678223} -11/06/2021 21:36:11 - INFO - __main__ - Step 2376: {'lr': 0.0004999920796099437, 'samples': 456192, 'steps': 2375, 'loss/train': 2.113866090774536} -11/06/2021 21:36:12 - INFO - __main__ - Step 2377: {'lr': 0.0004999920373117652, 'samples': 456384, 'steps': 2376, 'loss/train': 2.382596492767334} -11/06/2021 21:36:13 - INFO - __main__ - Step 2378: {'lr': 0.0004999919949009442, 'samples': 456576, 'steps': 2377, 'loss/train': 1.9662163257598877} -11/06/2021 21:36:13 - INFO - __main__ - Step 2379: {'lr': 0.0004999919523774806, 'samples': 456768, 'steps': 2378, 'loss/train': 2.765549659729004} -11/06/2021 21:36:13 - INFO - __main__ - Step 2380: {'lr': 0.0004999919097413743, 'samples': 456960, 'steps': 2379, 'loss/train': 2.0128252506256104} -11/06/2021 21:36:14 - INFO - __main__ - Step 2381: {'lr': 0.0004999918669926258, 'samples': 457152, 'steps': 2380, 'loss/train': 2.4427826404571533} -11/06/2021 21:36:14 - INFO - __main__ - Step 2382: {'lr': 0.0004999918241312346, 'samples': 457344, 'steps': 2381, 'loss/train': 3.2769882678985596} -11/06/2021 21:36:15 - INFO - __main__ - Step 2383: {'lr': 0.0004999917811572011, 'samples': 457536, 'steps': 2382, 'loss/train': 2.264770030975342} -11/06/2021 21:36:16 - INFO - __main__ - Step 2384: {'lr': 0.000499991738070525, 'samples': 457728, 'steps': 2383, 'loss/train': 2.820688247680664} -11/06/2021 21:36:16 - INFO - __main__ - Step 2385: {'lr': 0.0004999916948712066, 'samples': 457920, 'steps': 2384, 'loss/train': 2.739671230316162} -11/06/2021 21:36:16 - INFO - __main__ - Step 2386: {'lr': 0.0004999916515592458, 'samples': 458112, 'steps': 2385, 'loss/train': 2.355753183364868} -11/06/2021 21:36:17 - INFO - __main__ - Step 2387: {'lr': 0.0004999916081346426, 'samples': 458304, 'steps': 2386, 'loss/train': 2.6739003658294678} -11/06/2021 21:36:17 - INFO - __main__ - Step 2388: {'lr': 0.000499991564597397, 'samples': 458496, 'steps': 2387, 'loss/train': 2.985884189605713} -11/06/2021 21:36:18 - INFO - __main__ - Step 2389: {'lr': 0.0004999915209475091, 'samples': 458688, 'steps': 2388, 'loss/train': 2.5510177612304688} -11/06/2021 21:36:18 - INFO - __main__ - Step 2390: {'lr': 0.0004999914771849788, 'samples': 458880, 'steps': 2389, 'loss/train': 2.628279447555542} -11/06/2021 21:36:19 - INFO - __main__ - Step 2391: {'lr': 0.0004999914333098063, 'samples': 459072, 'steps': 2390, 'loss/train': 2.3192155361175537} -11/06/2021 21:36:19 - INFO - __main__ - Step 2392: {'lr': 0.0004999913893219915, 'samples': 459264, 'steps': 2391, 'loss/train': 2.4803824424743652} -11/06/2021 21:36:19 - INFO - __main__ - Step 2393: {'lr': 0.0004999913452215345, 'samples': 459456, 'steps': 2392, 'loss/train': 2.0477797985076904} -11/06/2021 21:36:20 - INFO - __main__ - Step 2394: {'lr': 0.0004999913010084351, 'samples': 459648, 'steps': 2393, 'loss/train': 2.529292583465576} -11/06/2021 21:36:21 - INFO - __main__ - Step 2395: {'lr': 0.0004999912566826935, 'samples': 459840, 'steps': 2394, 'loss/train': 2.484360456466675} -11/06/2021 21:36:21 - INFO - __main__ - Step 2396: {'lr': 0.0004999912122443098, 'samples': 460032, 'steps': 2395, 'loss/train': 2.425950288772583} -11/06/2021 21:36:22 - INFO - __main__ - Step 2397: {'lr': 0.0004999911676932838, 'samples': 460224, 'steps': 2396, 'loss/train': 2.7710964679718018} -11/06/2021 21:36:22 - INFO - __main__ - Step 2398: {'lr': 0.0004999911230296158, 'samples': 460416, 'steps': 2397, 'loss/train': 2.69278883934021} -11/06/2021 21:36:23 - INFO - __main__ - Step 2399: {'lr': 0.0004999910782533055, 'samples': 460608, 'steps': 2398, 'loss/train': 2.1563870906829834} -11/06/2021 21:36:23 - INFO - __main__ - Step 2400: {'lr': 0.0004999910333643531, 'samples': 460800, 'steps': 2399, 'loss/train': 2.21958327293396} -11/06/2021 21:36:24 - INFO - __main__ - Step 2401: {'lr': 0.0004999909883627587, 'samples': 460992, 'steps': 2400, 'loss/train': 2.3043596744537354} -11/06/2021 21:36:24 - INFO - __main__ - Step 2402: {'lr': 0.0004999909432485221, 'samples': 461184, 'steps': 2401, 'loss/train': 2.142707586288452} -11/06/2021 21:36:24 - INFO - __main__ - Step 2403: {'lr': 0.0004999908980216436, 'samples': 461376, 'steps': 2402, 'loss/train': 2.6707916259765625} -11/06/2021 21:36:25 - INFO - __main__ - Step 2404: {'lr': 0.0004999908526821229, 'samples': 461568, 'steps': 2403, 'loss/train': 2.7008554935455322} -11/06/2021 21:36:26 - INFO - __main__ - Step 2405: {'lr': 0.0004999908072299602, 'samples': 461760, 'steps': 2404, 'loss/train': 2.4561195373535156} -11/06/2021 21:36:26 - INFO - __main__ - Step 2406: {'lr': 0.0004999907616651556, 'samples': 461952, 'steps': 2405, 'loss/train': 2.6300549507141113} -11/06/2021 21:36:26 - INFO - __main__ - Step 2407: {'lr': 0.000499990715987709, 'samples': 462144, 'steps': 2406, 'loss/train': 2.5278778076171875} -11/06/2021 21:36:27 - INFO - __main__ - Step 2408: {'lr': 0.0004999906701976203, 'samples': 462336, 'steps': 2407, 'loss/train': 2.5817818641662598} -11/06/2021 21:36:28 - INFO - __main__ - Step 2409: {'lr': 0.0004999906242948898, 'samples': 462528, 'steps': 2408, 'loss/train': 2.7424280643463135} -11/06/2021 21:36:28 - INFO - __main__ - Step 2410: {'lr': 0.0004999905782795173, 'samples': 462720, 'steps': 2409, 'loss/train': 2.3306918144226074} -11/06/2021 21:36:29 - INFO - __main__ - Step 2411: {'lr': 0.000499990532151503, 'samples': 462912, 'steps': 2410, 'loss/train': 2.3240315914154053} -11/06/2021 21:36:29 - INFO - __main__ - Step 2412: {'lr': 0.0004999904859108467, 'samples': 463104, 'steps': 2411, 'loss/train': 2.3780782222747803} -11/06/2021 21:36:29 - INFO - __main__ - Step 2413: {'lr': 0.0004999904395575486, 'samples': 463296, 'steps': 2412, 'loss/train': 2.3109028339385986} -11/06/2021 21:36:30 - INFO - __main__ - Step 2414: {'lr': 0.0004999903930916087, 'samples': 463488, 'steps': 2413, 'loss/train': 2.878998279571533} -11/06/2021 21:36:31 - INFO - __main__ - Step 2415: {'lr': 0.000499990346513027, 'samples': 463680, 'steps': 2414, 'loss/train': 2.0418524742126465} -11/06/2021 21:36:31 - INFO - __main__ - Step 2416: {'lr': 0.0004999902998218034, 'samples': 463872, 'steps': 2415, 'loss/train': 2.2002334594726562} -11/06/2021 21:36:31 - INFO - __main__ - Step 2417: {'lr': 0.000499990253017938, 'samples': 464064, 'steps': 2416, 'loss/train': 2.537015438079834} -11/06/2021 21:36:32 - INFO - __main__ - Step 2418: {'lr': 0.0004999902061014311, 'samples': 464256, 'steps': 2417, 'loss/train': 2.3986918926239014} -11/06/2021 21:36:32 - INFO - __main__ - Step 2419: {'lr': 0.0004999901590722823, 'samples': 464448, 'steps': 2418, 'loss/train': 2.3698606491088867} -11/06/2021 21:36:33 - INFO - __main__ - Step 2420: {'lr': 0.0004999901119304919, 'samples': 464640, 'steps': 2419, 'loss/train': 2.4910922050476074} -11/06/2021 21:36:33 - INFO - __main__ - Step 2421: {'lr': 0.0004999900646760597, 'samples': 464832, 'steps': 2420, 'loss/train': 2.2482521533966064} -11/06/2021 21:36:34 - INFO - __main__ - Step 2422: {'lr': 0.0004999900173089858, 'samples': 465024, 'steps': 2421, 'loss/train': 3.0635385513305664} -11/06/2021 21:36:34 - INFO - __main__ - Step 2423: {'lr': 0.0004999899698292703, 'samples': 465216, 'steps': 2422, 'loss/train': 2.6223621368408203} -11/06/2021 21:36:35 - INFO - __main__ - Step 2424: {'lr': 0.0004999899222369132, 'samples': 465408, 'steps': 2423, 'loss/train': 2.0457282066345215} -11/06/2021 21:36:35 - INFO - __main__ - Step 2425: {'lr': 0.0004999898745319145, 'samples': 465600, 'steps': 2424, 'loss/train': 2.419081449508667} -11/06/2021 21:36:36 - INFO - __main__ - Step 2426: {'lr': 0.0004999898267142741, 'samples': 465792, 'steps': 2425, 'loss/train': 2.6468558311462402} -11/06/2021 21:36:36 - INFO - __main__ - Step 2427: {'lr': 0.0004999897787839923, 'samples': 465984, 'steps': 2426, 'loss/train': 2.8656837940216064} -11/06/2021 21:36:37 - INFO - __main__ - Step 2428: {'lr': 0.000499989730741069, 'samples': 466176, 'steps': 2427, 'loss/train': 2.517319679260254} -11/06/2021 21:36:37 - INFO - __main__ - Step 2429: {'lr': 0.000499989682585504, 'samples': 466368, 'steps': 2428, 'loss/train': 1.5299700498580933} -11/06/2021 21:36:37 - INFO - __main__ - Step 2430: {'lr': 0.0004999896343172976, 'samples': 466560, 'steps': 2429, 'loss/train': 1.4747153520584106} -11/06/2021 21:36:38 - INFO - __main__ - Step 2431: {'lr': 0.0004999895859364498, 'samples': 466752, 'steps': 2430, 'loss/train': 1.975550651550293} -11/06/2021 21:36:39 - INFO - __main__ - Step 2432: {'lr': 0.0004999895374429605, 'samples': 466944, 'steps': 2431, 'loss/train': 2.7396199703216553} -11/06/2021 21:36:39 - INFO - __main__ - Step 2433: {'lr': 0.0004999894888368297, 'samples': 467136, 'steps': 2432, 'loss/train': 2.1605048179626465} -11/06/2021 21:36:39 - INFO - __main__ - Step 2434: {'lr': 0.0004999894401180576, 'samples': 467328, 'steps': 2433, 'loss/train': 2.631399631500244} -11/06/2021 21:36:40 - INFO - __main__ - Step 2435: {'lr': 0.0004999893912866441, 'samples': 467520, 'steps': 2434, 'loss/train': 2.6873080730438232} -11/06/2021 21:36:41 - INFO - __main__ - Step 2436: {'lr': 0.0004999893423425892, 'samples': 467712, 'steps': 2435, 'loss/train': 2.2480852603912354} -11/06/2021 21:36:41 - INFO - __main__ - Step 2437: {'lr': 0.0004999892932858929, 'samples': 467904, 'steps': 2436, 'loss/train': 2.1071290969848633} -11/06/2021 21:36:42 - INFO - __main__ - Step 2438: {'lr': 0.0004999892441165554, 'samples': 468096, 'steps': 2437, 'loss/train': 2.8640754222869873} -11/06/2021 21:36:42 - INFO - __main__ - Step 2439: {'lr': 0.0004999891948345765, 'samples': 468288, 'steps': 2438, 'loss/train': 2.4221558570861816} -11/06/2021 21:36:42 - INFO - __main__ - Step 2440: {'lr': 0.0004999891454399565, 'samples': 468480, 'steps': 2439, 'loss/train': 2.7163968086242676} -11/06/2021 21:36:43 - INFO - __main__ - Step 2441: {'lr': 0.000499989095932695, 'samples': 468672, 'steps': 2440, 'loss/train': 2.371148109436035} -11/06/2021 21:36:44 - INFO - __main__ - Step 2442: {'lr': 0.0004999890463127924, 'samples': 468864, 'steps': 2441, 'loss/train': 2.5758795738220215} -11/06/2021 21:36:44 - INFO - __main__ - Step 2443: {'lr': 0.0004999889965802486, 'samples': 469056, 'steps': 2442, 'loss/train': 2.778921127319336} -11/06/2021 21:36:44 - INFO - __main__ - Step 2444: {'lr': 0.0004999889467350636, 'samples': 469248, 'steps': 2443, 'loss/train': 1.8492902517318726} -11/06/2021 21:36:45 - INFO - __main__ - Step 2445: {'lr': 0.0004999888967772375, 'samples': 469440, 'steps': 2444, 'loss/train': 2.191366672515869} -11/06/2021 21:36:45 - INFO - __main__ - Step 2446: {'lr': 0.0004999888467067702, 'samples': 469632, 'steps': 2445, 'loss/train': 2.458528757095337} -11/06/2021 21:36:46 - INFO - __main__ - Step 2447: {'lr': 0.0004999887965236617, 'samples': 469824, 'steps': 2446, 'loss/train': 2.605138063430786} -11/06/2021 21:36:46 - INFO - __main__ - Step 2448: {'lr': 0.0004999887462279123, 'samples': 470016, 'steps': 2447, 'loss/train': 2.1305642127990723} -11/06/2021 21:36:47 - INFO - __main__ - Step 2449: {'lr': 0.0004999886958195216, 'samples': 470208, 'steps': 2448, 'loss/train': 2.6707427501678467} -11/06/2021 21:36:47 - INFO - __main__ - Step 2450: {'lr': 0.00049998864529849, 'samples': 470400, 'steps': 2449, 'loss/train': 1.814773440361023} -11/06/2021 21:36:47 - INFO - __main__ - Step 2451: {'lr': 0.0004999885946648174, 'samples': 470592, 'steps': 2450, 'loss/train': 2.4460277557373047} -11/06/2021 21:36:48 - INFO - __main__ - Step 2452: {'lr': 0.0004999885439185037, 'samples': 470784, 'steps': 2451, 'loss/train': 2.429396390914917} -11/06/2021 21:36:49 - INFO - __main__ - Step 2453: {'lr': 0.0004999884930595491, 'samples': 470976, 'steps': 2452, 'loss/train': 2.094714879989624} -11/06/2021 21:36:49 - INFO - __main__ - Step 2454: {'lr': 0.0004999884420879534, 'samples': 471168, 'steps': 2453, 'loss/train': 2.2643680572509766} -11/06/2021 21:36:49 - INFO - __main__ - Step 2455: {'lr': 0.000499988391003717, 'samples': 471360, 'steps': 2454, 'loss/train': 2.5920233726501465} -11/06/2021 21:36:50 - INFO - __main__ - Step 2456: {'lr': 0.0004999883398068396, 'samples': 471552, 'steps': 2455, 'loss/train': 3.2174901962280273} -11/06/2021 21:36:51 - INFO - __main__ - Step 2457: {'lr': 0.0004999882884973212, 'samples': 471744, 'steps': 2456, 'loss/train': 2.311598062515259} -11/06/2021 21:36:52 - INFO - __main__ - Step 2458: {'lr': 0.000499988237075162, 'samples': 471936, 'steps': 2457, 'loss/train': 2.8705482482910156} -11/06/2021 21:36:52 - INFO - __main__ - Step 2459: {'lr': 0.000499988185540362, 'samples': 472128, 'steps': 2458, 'loss/train': 3.6789543628692627} -11/06/2021 21:36:52 - INFO - __main__ - Step 2460: {'lr': 0.0004999881338929211, 'samples': 472320, 'steps': 2459, 'loss/train': 2.2293074131011963} -11/06/2021 21:36:53 - INFO - __main__ - Step 2461: {'lr': 0.0004999880821328395, 'samples': 472512, 'steps': 2460, 'loss/train': 2.13460373878479} -11/06/2021 21:36:53 - INFO - __main__ - Step 2462: {'lr': 0.000499988030260117, 'samples': 472704, 'steps': 2461, 'loss/train': 2.2145402431488037} -11/06/2021 21:36:54 - INFO - __main__ - Step 2463: {'lr': 0.0004999879782747539, 'samples': 472896, 'steps': 2462, 'loss/train': 2.412808418273926} -11/06/2021 21:36:55 - INFO - __main__ - Step 2464: {'lr': 0.00049998792617675, 'samples': 473088, 'steps': 2463, 'loss/train': 1.355026125907898} -11/06/2021 21:36:55 - INFO - __main__ - Step 2465: {'lr': 0.0004999878739661053, 'samples': 473280, 'steps': 2464, 'loss/train': 2.797194242477417} -11/06/2021 21:36:55 - INFO - __main__ - Step 2466: {'lr': 0.0004999878216428201, 'samples': 473472, 'steps': 2465, 'loss/train': 3.099053144454956} -11/06/2021 21:36:56 - INFO - __main__ - Step 2467: {'lr': 0.0004999877692068942, 'samples': 473664, 'steps': 2466, 'loss/train': 2.666736602783203} -11/06/2021 21:36:57 - INFO - __main__ - Step 2468: {'lr': 0.0004999877166583276, 'samples': 473856, 'steps': 2467, 'loss/train': 2.2007715702056885} -11/06/2021 21:36:57 - INFO - __main__ - Step 2469: {'lr': 0.0004999876639971204, 'samples': 474048, 'steps': 2468, 'loss/train': 2.5760223865509033} -11/06/2021 21:36:57 - INFO - __main__ - Step 2470: {'lr': 0.0004999876112232726, 'samples': 474240, 'steps': 2469, 'loss/train': 2.2806897163391113} -11/06/2021 21:36:58 - INFO - __main__ - Step 2471: {'lr': 0.0004999875583367844, 'samples': 474432, 'steps': 2470, 'loss/train': 2.3899688720703125} -11/06/2021 21:36:58 - INFO - __main__ - Step 2472: {'lr': 0.0004999875053376555, 'samples': 474624, 'steps': 2471, 'loss/train': 2.720411539077759} -11/06/2021 21:36:59 - INFO - __main__ - Step 2473: {'lr': 0.0004999874522258861, 'samples': 474816, 'steps': 2472, 'loss/train': 2.3538568019866943} -11/06/2021 21:36:59 - INFO - __main__ - Step 2474: {'lr': 0.0004999873990014763, 'samples': 475008, 'steps': 2473, 'loss/train': 2.296961784362793} -11/06/2021 21:37:00 - INFO - __main__ - Step 2475: {'lr': 0.0004999873456644259, 'samples': 475200, 'steps': 2474, 'loss/train': 3.126654624938965} -11/06/2021 21:37:00 - INFO - __main__ - Step 2476: {'lr': 0.0004999872922147352, 'samples': 475392, 'steps': 2475, 'loss/train': 2.8180599212646484} -11/06/2021 21:37:01 - INFO - __main__ - Step 2477: {'lr': 0.0004999872386524041, 'samples': 475584, 'steps': 2476, 'loss/train': 2.209730625152588} -11/06/2021 21:37:02 - INFO - __main__ - Step 2478: {'lr': 0.0004999871849774325, 'samples': 475776, 'steps': 2477, 'loss/train': 2.773592472076416} -11/06/2021 21:37:02 - INFO - __main__ - Step 2479: {'lr': 0.0004999871311898205, 'samples': 475968, 'steps': 2478, 'loss/train': 2.503931760787964} -11/06/2021 21:37:02 - INFO - __main__ - Step 2480: {'lr': 0.0004999870772895683, 'samples': 476160, 'steps': 2479, 'loss/train': 2.848806858062744} -11/06/2021 21:37:03 - INFO - __main__ - Step 2481: {'lr': 0.0004999870232766756, 'samples': 476352, 'steps': 2480, 'loss/train': 2.6014020442962646} -11/06/2021 21:37:03 - INFO - __main__ - Step 2482: {'lr': 0.0004999869691511428, 'samples': 476544, 'steps': 2481, 'loss/train': 2.4127416610717773} -11/06/2021 21:37:04 - INFO - __main__ - Step 2483: {'lr': 0.0004999869149129696, 'samples': 476736, 'steps': 2482, 'loss/train': 1.9022128582000732} -11/06/2021 21:37:04 - INFO - __main__ - Step 2484: {'lr': 0.0004999868605621563, 'samples': 476928, 'steps': 2483, 'loss/train': 2.502490282058716} -11/06/2021 21:37:05 - INFO - __main__ - Step 2485: {'lr': 0.0004999868060987027, 'samples': 477120, 'steps': 2484, 'loss/train': 2.5162899494171143} -11/06/2021 21:37:05 - INFO - __main__ - Step 2486: {'lr': 0.0004999867515226088, 'samples': 477312, 'steps': 2485, 'loss/train': 2.565920829772949} -11/06/2021 21:37:05 - INFO - __main__ - Step 2487: {'lr': 0.0004999866968338748, 'samples': 477504, 'steps': 2486, 'loss/train': 2.152040481567383} -11/06/2021 21:37:07 - INFO - __main__ - Step 2488: {'lr': 0.0004999866420325006, 'samples': 477696, 'steps': 2487, 'loss/train': 2.5506532192230225} -11/06/2021 21:37:07 - INFO - __main__ - Step 2489: {'lr': 0.0004999865871184863, 'samples': 477888, 'steps': 2488, 'loss/train': 2.6349217891693115} -11/06/2021 21:37:07 - INFO - __main__ - Step 2490: {'lr': 0.000499986532091832, 'samples': 478080, 'steps': 2489, 'loss/train': 1.8564928770065308} -11/06/2021 21:37:08 - INFO - __main__ - Step 2491: {'lr': 0.0004999864769525375, 'samples': 478272, 'steps': 2490, 'loss/train': 2.035461664199829} -11/06/2021 21:37:08 - INFO - __main__ - Step 2492: {'lr': 0.000499986421700603, 'samples': 478464, 'steps': 2491, 'loss/train': 2.712242364883423} -11/06/2021 21:37:09 - INFO - __main__ - Step 2493: {'lr': 0.0004999863663360285, 'samples': 478656, 'steps': 2492, 'loss/train': 1.668128490447998} -11/06/2021 21:37:09 - INFO - __main__ - Step 2494: {'lr': 0.000499986310858814, 'samples': 478848, 'steps': 2493, 'loss/train': 2.30643892288208} -11/06/2021 21:37:10 - INFO - __main__ - Step 2495: {'lr': 0.0004999862552689595, 'samples': 479040, 'steps': 2494, 'loss/train': 2.329277992248535} -11/06/2021 21:37:10 - INFO - __main__ - Step 2496: {'lr': 0.000499986199566465, 'samples': 479232, 'steps': 2495, 'loss/train': 2.888967275619507} -11/06/2021 21:37:10 - INFO - __main__ - Step 2497: {'lr': 0.0004999861437513306, 'samples': 479424, 'steps': 2496, 'loss/train': 2.5283238887786865} -11/06/2021 21:37:11 - INFO - __main__ - Step 2498: {'lr': 0.0004999860878235564, 'samples': 479616, 'steps': 2497, 'loss/train': 2.4118523597717285} -11/06/2021 21:37:12 - INFO - __main__ - Step 2499: {'lr': 0.0004999860317831423, 'samples': 479808, 'steps': 2498, 'loss/train': 1.975379228591919} -11/06/2021 21:37:12 - INFO - __main__ - Step 2500: {'lr': 0.0004999859756300883, 'samples': 480000, 'steps': 2499, 'loss/train': 2.776916027069092} -11/06/2021 21:37:13 - INFO - __main__ - Step 2501: {'lr': 0.0004999859193643945, 'samples': 480192, 'steps': 2500, 'loss/train': 1.9438010454177856} -11/06/2021 21:37:13 - INFO - __main__ - Step 2502: {'lr': 0.0004999858629860609, 'samples': 480384, 'steps': 2501, 'loss/train': 2.3400754928588867} -11/06/2021 21:37:14 - INFO - __main__ - Step 2503: {'lr': 0.0004999858064950875, 'samples': 480576, 'steps': 2502, 'loss/train': 2.453505516052246} -11/06/2021 21:37:14 - INFO - __main__ - Step 2504: {'lr': 0.0004999857498914744, 'samples': 480768, 'steps': 2503, 'loss/train': 1.737013339996338} -11/06/2021 21:37:15 - INFO - __main__ - Step 2505: {'lr': 0.0004999856931752215, 'samples': 480960, 'steps': 2504, 'loss/train': 2.44512677192688} -11/06/2021 21:37:15 - INFO - __main__ - Step 2506: {'lr': 0.000499985636346329, 'samples': 481152, 'steps': 2505, 'loss/train': 2.2163236141204834} -11/06/2021 21:37:15 - INFO - __main__ - Step 2507: {'lr': 0.0004999855794047968, 'samples': 481344, 'steps': 2506, 'loss/train': 2.2586050033569336} -11/06/2021 21:37:16 - INFO - __main__ - Step 2508: {'lr': 0.000499985522350625, 'samples': 481536, 'steps': 2507, 'loss/train': 2.6702263355255127} -11/06/2021 21:37:17 - INFO - __main__ - Step 2509: {'lr': 0.0004999854651838134, 'samples': 481728, 'steps': 2508, 'loss/train': 1.7556337118148804} -11/06/2021 21:37:17 - INFO - __main__ - Step 2510: {'lr': 0.0004999854079043624, 'samples': 481920, 'steps': 2509, 'loss/train': 2.5938799381256104} -11/06/2021 21:37:17 - INFO - __main__ - Step 2511: {'lr': 0.0004999853505122718, 'samples': 482112, 'steps': 2510, 'loss/train': 2.314603567123413} -11/06/2021 21:37:18 - INFO - __main__ - Step 2512: {'lr': 0.0004999852930075416, 'samples': 482304, 'steps': 2511, 'loss/train': 3.3958892822265625} -11/06/2021 21:37:18 - INFO - __main__ - Step 2513: {'lr': 0.0004999852353901719, 'samples': 482496, 'steps': 2512, 'loss/train': 2.0846526622772217} -11/06/2021 21:37:19 - INFO - __main__ - Step 2514: {'lr': 0.0004999851776601627, 'samples': 482688, 'steps': 2513, 'loss/train': 2.1145737171173096} -11/06/2021 21:37:19 - INFO - __main__ - Step 2515: {'lr': 0.0004999851198175141, 'samples': 482880, 'steps': 2514, 'loss/train': 2.3666229248046875} -11/06/2021 21:37:20 - INFO - __main__ - Step 2516: {'lr': 0.0004999850618622259, 'samples': 483072, 'steps': 2515, 'loss/train': 1.9783778190612793} -11/06/2021 21:37:20 - INFO - __main__ - Step 2517: {'lr': 0.0004999850037942984, 'samples': 483264, 'steps': 2516, 'loss/train': 1.6819298267364502} -11/06/2021 21:37:21 - INFO - __main__ - Step 2518: {'lr': 0.0004999849456137316, 'samples': 483456, 'steps': 2517, 'loss/train': 2.5427420139312744} -11/06/2021 21:37:22 - INFO - __main__ - Step 2519: {'lr': 0.0004999848873205254, 'samples': 483648, 'steps': 2518, 'loss/train': 1.944232702255249} -11/06/2021 21:37:22 - INFO - __main__ - Step 2520: {'lr': 0.0004999848289146798, 'samples': 483840, 'steps': 2519, 'loss/train': 2.538642644882202} -11/06/2021 21:37:22 - INFO - __main__ - Step 2521: {'lr': 0.0004999847703961948, 'samples': 484032, 'steps': 2520, 'loss/train': 2.035733699798584} -11/06/2021 21:37:23 - INFO - __main__ - Step 2522: {'lr': 0.0004999847117650708, 'samples': 484224, 'steps': 2521, 'loss/train': 2.2497646808624268} -11/06/2021 21:37:23 - INFO - __main__ - Step 2523: {'lr': 0.0004999846530213074, 'samples': 484416, 'steps': 2522, 'loss/train': 2.4687421321868896} -11/06/2021 21:37:24 - INFO - __main__ - Step 2524: {'lr': 0.0004999845941649048, 'samples': 484608, 'steps': 2523, 'loss/train': 2.6273131370544434} -11/06/2021 21:37:25 - INFO - __main__ - Step 2525: {'lr': 0.0004999845351958629, 'samples': 484800, 'steps': 2524, 'loss/train': 2.2162749767303467} -11/06/2021 21:37:25 - INFO - __main__ - Step 2526: {'lr': 0.0004999844761141818, 'samples': 484992, 'steps': 2525, 'loss/train': 2.4674794673919678} -11/06/2021 21:37:25 - INFO - __main__ - Step 2527: {'lr': 0.0004999844169198617, 'samples': 485184, 'steps': 2526, 'loss/train': 2.444234609603882} -11/06/2021 21:37:26 - INFO - __main__ - Step 2528: {'lr': 0.0004999843576129024, 'samples': 485376, 'steps': 2527, 'loss/train': 2.046820640563965} -11/06/2021 21:37:27 - INFO - __main__ - Step 2529: {'lr': 0.000499984298193304, 'samples': 485568, 'steps': 2528, 'loss/train': 3.3430094718933105} -11/06/2021 21:37:27 - INFO - __main__ - Step 2530: {'lr': 0.0004999842386610666, 'samples': 485760, 'steps': 2529, 'loss/train': 2.4798810482025146} -11/06/2021 21:37:27 - INFO - __main__ - Step 2531: {'lr': 0.0004999841790161901, 'samples': 485952, 'steps': 2530, 'loss/train': 2.1105799674987793} -11/06/2021 21:37:28 - INFO - __main__ - Step 2532: {'lr': 0.0004999841192586746, 'samples': 486144, 'steps': 2531, 'loss/train': 2.247392177581787} -11/06/2021 21:37:28 - INFO - __main__ - Step 2533: {'lr': 0.0004999840593885201, 'samples': 486336, 'steps': 2532, 'loss/train': 2.632009983062744} -11/06/2021 21:37:29 - INFO - __main__ - Step 2534: {'lr': 0.0004999839994057266, 'samples': 486528, 'steps': 2533, 'loss/train': 2.2957653999328613} -11/06/2021 21:37:29 - INFO - __main__ - Step 2535: {'lr': 0.0004999839393102943, 'samples': 486720, 'steps': 2534, 'loss/train': 2.15610671043396} -11/06/2021 21:37:30 - INFO - __main__ - Step 2536: {'lr': 0.0004999838791022229, 'samples': 486912, 'steps': 2535, 'loss/train': 1.8324062824249268} -11/06/2021 21:37:30 - INFO - __main__ - Step 2537: {'lr': 0.0004999838187815128, 'samples': 487104, 'steps': 2536, 'loss/train': 2.1403756141662598} -11/06/2021 21:37:30 - INFO - __main__ - Step 2538: {'lr': 0.0004999837583481638, 'samples': 487296, 'steps': 2537, 'loss/train': 2.4630844593048096} -11/06/2021 21:37:31 - INFO - __main__ - Step 2539: {'lr': 0.000499983697802176, 'samples': 487488, 'steps': 2538, 'loss/train': 2.763502836227417} -11/06/2021 21:37:32 - INFO - __main__ - Step 2540: {'lr': 0.0004999836371435494, 'samples': 487680, 'steps': 2539, 'loss/train': 1.6404800415039062} -11/06/2021 21:37:32 - INFO - __main__ - Step 2541: {'lr': 0.000499983576372284, 'samples': 487872, 'steps': 2540, 'loss/train': 0.7703345417976379} -11/06/2021 21:37:32 - INFO - __main__ - Step 2542: {'lr': 0.0004999835154883798, 'samples': 488064, 'steps': 2541, 'loss/train': 2.3808321952819824} -11/06/2021 21:37:33 - INFO - __main__ - Step 2543: {'lr': 0.0004999834544918369, 'samples': 488256, 'steps': 2542, 'loss/train': 1.3541216850280762} -11/06/2021 21:37:33 - INFO - __main__ - Step 2544: {'lr': 0.0004999833933826554, 'samples': 488448, 'steps': 2543, 'loss/train': 2.6432573795318604} -11/06/2021 21:37:34 - INFO - __main__ - Step 2545: {'lr': 0.0004999833321608351, 'samples': 488640, 'steps': 2544, 'loss/train': 2.655363082885742} -11/06/2021 21:37:35 - INFO - __main__ - Step 2546: {'lr': 0.0004999832708263764, 'samples': 488832, 'steps': 2545, 'loss/train': 1.829182744026184} -11/06/2021 21:37:35 - INFO - __main__ - Step 2547: {'lr': 0.000499983209379279, 'samples': 489024, 'steps': 2546, 'loss/train': 2.714189291000366} -11/06/2021 21:37:35 - INFO - __main__ - Step 2548: {'lr': 0.0004999831478195429, 'samples': 489216, 'steps': 2547, 'loss/train': 2.1510307788848877} -11/06/2021 21:37:36 - INFO - __main__ - Step 2549: {'lr': 0.0004999830861471684, 'samples': 489408, 'steps': 2548, 'loss/train': 2.5913808345794678} -11/06/2021 21:37:37 - INFO - __main__ - Step 2550: {'lr': 0.0004999830243621553, 'samples': 489600, 'steps': 2549, 'loss/train': 2.1029839515686035} -11/06/2021 21:37:37 - INFO - __main__ - Step 2551: {'lr': 0.0004999829624645037, 'samples': 489792, 'steps': 2550, 'loss/train': 2.4384331703186035} -11/06/2021 21:37:37 - INFO - __main__ - Step 2552: {'lr': 0.0004999829004542136, 'samples': 489984, 'steps': 2551, 'loss/train': 2.5452609062194824} -11/06/2021 21:37:38 - INFO - __main__ - Step 2553: {'lr': 0.0004999828383312851, 'samples': 490176, 'steps': 2552, 'loss/train': 2.293485403060913} -11/06/2021 21:37:38 - INFO - __main__ - Step 2554: {'lr': 0.0004999827760957182, 'samples': 490368, 'steps': 2553, 'loss/train': 2.1594653129577637} -11/06/2021 21:37:39 - INFO - __main__ - Step 2555: {'lr': 0.000499982713747513, 'samples': 490560, 'steps': 2554, 'loss/train': 2.2348339557647705} -11/06/2021 21:37:39 - INFO - __main__ - Step 2556: {'lr': 0.0004999826512866693, 'samples': 490752, 'steps': 2555, 'loss/train': 2.039029598236084} -11/06/2021 21:37:40 - INFO - __main__ - Step 2557: {'lr': 0.0004999825887131874, 'samples': 490944, 'steps': 2556, 'loss/train': 2.3221940994262695} -11/06/2021 21:37:40 - INFO - __main__ - Step 2558: {'lr': 0.0004999825260270671, 'samples': 491136, 'steps': 2557, 'loss/train': 1.9088735580444336} -11/06/2021 21:37:40 - INFO - __main__ - Step 2559: {'lr': 0.0004999824632283086, 'samples': 491328, 'steps': 2558, 'loss/train': 2.34741473197937} -11/06/2021 21:37:41 - INFO - __main__ - Step 2560: {'lr': 0.0004999824003169119, 'samples': 491520, 'steps': 2559, 'loss/train': 2.832210063934326} -11/06/2021 21:37:42 - INFO - __main__ - Step 2561: {'lr': 0.000499982337292877, 'samples': 491712, 'steps': 2560, 'loss/train': 2.518115758895874} -11/06/2021 21:37:42 - INFO - __main__ - Step 2562: {'lr': 0.0004999822741562038, 'samples': 491904, 'steps': 2561, 'loss/train': 1.5568736791610718} -11/06/2021 21:37:42 - INFO - __main__ - Step 2563: {'lr': 0.0004999822109068925, 'samples': 492096, 'steps': 2562, 'loss/train': 2.128868818283081} -11/06/2021 21:37:43 - INFO - __main__ - Step 2564: {'lr': 0.000499982147544943, 'samples': 492288, 'steps': 2563, 'loss/train': 2.274667739868164} -11/06/2021 21:37:44 - INFO - __main__ - Step 2565: {'lr': 0.0004999820840703554, 'samples': 492480, 'steps': 2564, 'loss/train': 2.438570022583008} -11/06/2021 21:37:44 - INFO - __main__ - Step 2566: {'lr': 0.0004999820204831298, 'samples': 492672, 'steps': 2565, 'loss/train': 1.8974850177764893} -11/06/2021 21:37:44 - INFO - __main__ - Step 2567: {'lr': 0.0004999819567832661, 'samples': 492864, 'steps': 2566, 'loss/train': 1.991250991821289} -11/06/2021 21:37:45 - INFO - __main__ - Step 2568: {'lr': 0.0004999818929707645, 'samples': 493056, 'steps': 2567, 'loss/train': 2.29544734954834} -11/06/2021 21:37:45 - INFO - __main__ - Step 2569: {'lr': 0.0004999818290456249, 'samples': 493248, 'steps': 2568, 'loss/train': 2.5977227687835693} -11/06/2021 21:37:45 - INFO - __main__ - Step 2570: {'lr': 0.0004999817650078474, 'samples': 493440, 'steps': 2569, 'loss/train': 2.2066221237182617} -11/06/2021 21:37:47 - INFO - __main__ - Step 2571: {'lr': 0.0004999817008574318, 'samples': 493632, 'steps': 2570, 'loss/train': 2.1649460792541504} -11/06/2021 21:37:47 - INFO - __main__ - Step 2572: {'lr': 0.0004999816365943784, 'samples': 493824, 'steps': 2571, 'loss/train': 2.5640785694122314} -11/06/2021 21:37:47 - INFO - __main__ - Step 2573: {'lr': 0.000499981572218687, 'samples': 494016, 'steps': 2572, 'loss/train': 2.131150007247925} -11/06/2021 21:37:48 - INFO - __main__ - Step 2574: {'lr': 0.0004999815077303579, 'samples': 494208, 'steps': 2573, 'loss/train': 2.548187017440796} -11/06/2021 21:37:48 - INFO - __main__ - Step 2575: {'lr': 0.000499981443129391, 'samples': 494400, 'steps': 2574, 'loss/train': 1.7672605514526367} -11/06/2021 21:37:49 - INFO - __main__ - Step 2576: {'lr': 0.0004999813784157863, 'samples': 494592, 'steps': 2575, 'loss/train': 1.979129433631897} -11/06/2021 21:37:49 - INFO - __main__ - Step 2577: {'lr': 0.0004999813135895438, 'samples': 494784, 'steps': 2576, 'loss/train': 2.5306124687194824} -11/06/2021 21:37:50 - INFO - __main__ - Step 2578: {'lr': 0.0004999812486506637, 'samples': 494976, 'steps': 2577, 'loss/train': 1.985874056816101} -11/06/2021 21:37:50 - INFO - __main__ - Step 2579: {'lr': 0.0004999811835991457, 'samples': 495168, 'steps': 2578, 'loss/train': 2.2465949058532715} -11/06/2021 21:37:50 - INFO - __main__ - Step 2580: {'lr': 0.0004999811184349902, 'samples': 495360, 'steps': 2579, 'loss/train': 1.718479871749878} -11/06/2021 21:37:51 - INFO - __main__ - Step 2581: {'lr': 0.000499981053158197, 'samples': 495552, 'steps': 2580, 'loss/train': 2.3030970096588135} -11/06/2021 21:37:52 - INFO - __main__ - Step 2582: {'lr': 0.0004999809877687662, 'samples': 495744, 'steps': 2581, 'loss/train': 2.4952125549316406} -11/06/2021 21:37:52 - INFO - __main__ - Step 2583: {'lr': 0.0004999809222666978, 'samples': 495936, 'steps': 2582, 'loss/train': 2.9251458644866943} -11/06/2021 21:37:52 - INFO - __main__ - Step 2584: {'lr': 0.0004999808566519919, 'samples': 496128, 'steps': 2583, 'loss/train': 2.0826971530914307} -11/06/2021 21:37:53 - INFO - __main__ - Step 2585: {'lr': 0.0004999807909246485, 'samples': 496320, 'steps': 2584, 'loss/train': 2.6530747413635254} -11/06/2021 21:37:54 - INFO - __main__ - Step 2586: {'lr': 0.0004999807250846676, 'samples': 496512, 'steps': 2585, 'loss/train': 2.023077964782715} -11/06/2021 21:37:54 - INFO - __main__ - Step 2587: {'lr': 0.0004999806591320492, 'samples': 496704, 'steps': 2586, 'loss/train': 2.128833532333374} -11/06/2021 21:37:54 - INFO - __main__ - Step 2588: {'lr': 0.0004999805930667934, 'samples': 496896, 'steps': 2587, 'loss/train': 2.2073006629943848} -11/06/2021 21:37:55 - INFO - __main__ - Step 2589: {'lr': 0.0004999805268889003, 'samples': 497088, 'steps': 2588, 'loss/train': 2.542658567428589} -11/06/2021 21:37:55 - INFO - __main__ - Step 2590: {'lr': 0.0004999804605983697, 'samples': 497280, 'steps': 2589, 'loss/train': 1.7954328060150146} -11/06/2021 21:37:56 - INFO - __main__ - Step 2591: {'lr': 0.0004999803941952018, 'samples': 497472, 'steps': 2590, 'loss/train': 1.970054030418396} -11/06/2021 21:37:57 - INFO - __main__ - Step 2592: {'lr': 0.0004999803276793965, 'samples': 497664, 'steps': 2591, 'loss/train': 2.5273969173431396} -11/06/2021 21:37:57 - INFO - __main__ - Step 2593: {'lr': 0.0004999802610509541, 'samples': 497856, 'steps': 2592, 'loss/train': 2.8750476837158203} -11/06/2021 21:37:57 - INFO - __main__ - Step 2594: {'lr': 0.0004999801943098743, 'samples': 498048, 'steps': 2593, 'loss/train': 2.145956039428711} -11/06/2021 21:37:58 - INFO - __main__ - Step 2595: {'lr': 0.0004999801274561573, 'samples': 498240, 'steps': 2594, 'loss/train': 1.3880176544189453} -11/06/2021 21:37:58 - INFO - __main__ - Step 2596: {'lr': 0.0004999800604898032, 'samples': 498432, 'steps': 2595, 'loss/train': 2.8618476390838623} -11/06/2021 21:37:59 - INFO - __main__ - Step 2597: {'lr': 0.000499979993410812, 'samples': 498624, 'steps': 2596, 'loss/train': 1.0421839952468872} -11/06/2021 21:37:59 - INFO - __main__ - Step 2598: {'lr': 0.0004999799262191835, 'samples': 498816, 'steps': 2597, 'loss/train': 2.2791144847869873} -11/06/2021 21:38:00 - INFO - __main__ - Step 2599: {'lr': 0.0004999798589149179, 'samples': 499008, 'steps': 2598, 'loss/train': 1.718825101852417} -11/06/2021 21:38:00 - INFO - __main__ - Step 2600: {'lr': 0.0004999797914980154, 'samples': 499200, 'steps': 2599, 'loss/train': 2.3873207569122314} -11/06/2021 21:38:01 - INFO - __main__ - Step 2601: {'lr': 0.0004999797239684757, 'samples': 499392, 'steps': 2600, 'loss/train': 1.5167217254638672} -11/06/2021 21:38:02 - INFO - __main__ - Step 2602: {'lr': 0.0004999796563262991, 'samples': 499584, 'steps': 2601, 'loss/train': 2.33709454536438} -11/06/2021 21:38:02 - INFO - __main__ - Step 2603: {'lr': 0.0004999795885714855, 'samples': 499776, 'steps': 2602, 'loss/train': 1.5589454174041748} -11/06/2021 21:38:02 - INFO - __main__ - Step 2604: {'lr': 0.0004999795207040349, 'samples': 499968, 'steps': 2603, 'loss/train': 3.2038750648498535} -11/06/2021 21:38:03 - INFO - __main__ - Step 2605: {'lr': 0.0004999794527239474, 'samples': 500160, 'steps': 2604, 'loss/train': 2.761178731918335} -11/06/2021 21:38:03 - INFO - __main__ - Step 2606: {'lr': 0.000499979384631223, 'samples': 500352, 'steps': 2605, 'loss/train': 2.426281690597534} -11/06/2021 21:38:03 - INFO - __main__ - Step 2607: {'lr': 0.000499979316425862, 'samples': 500544, 'steps': 2606, 'loss/train': 2.246225118637085} -11/06/2021 21:38:04 - INFO - __main__ - Step 2608: {'lr': 0.0004999792481078639, 'samples': 500736, 'steps': 2607, 'loss/train': 1.7112780809402466} -11/06/2021 21:38:05 - INFO - __main__ - Step 2609: {'lr': 0.000499979179677229, 'samples': 500928, 'steps': 2608, 'loss/train': 2.6037216186523438} -11/06/2021 21:38:05 - INFO - __main__ - Step 2610: {'lr': 0.0004999791111339574, 'samples': 501120, 'steps': 2609, 'loss/train': 2.3880434036254883} -11/06/2021 21:38:05 - INFO - __main__ - Step 2611: {'lr': 0.0004999790424780492, 'samples': 501312, 'steps': 2610, 'loss/train': 2.595461368560791} -11/06/2021 21:38:06 - INFO - __main__ - Step 2612: {'lr': 0.0004999789737095041, 'samples': 501504, 'steps': 2611, 'loss/train': 1.1569690704345703} -11/06/2021 21:38:07 - INFO - __main__ - Step 2613: {'lr': 0.0004999789048283224, 'samples': 501696, 'steps': 2612, 'loss/train': 3.0552828311920166} -11/06/2021 21:38:07 - INFO - __main__ - Step 2614: {'lr': 0.0004999788358345041, 'samples': 501888, 'steps': 2613, 'loss/train': 2.318122386932373} -11/06/2021 21:38:08 - INFO - __main__ - Step 2615: {'lr': 0.0004999787667280492, 'samples': 502080, 'steps': 2614, 'loss/train': 2.3980915546417236} -11/06/2021 21:38:08 - INFO - __main__ - Step 2616: {'lr': 0.0004999786975089577, 'samples': 502272, 'steps': 2615, 'loss/train': 4.580399513244629} -11/06/2021 21:38:08 - INFO - __main__ - Step 2617: {'lr': 0.0004999786281772296, 'samples': 502464, 'steps': 2616, 'loss/train': 2.6063055992126465} -11/06/2021 21:38:09 - INFO - __main__ - Step 2618: {'lr': 0.0004999785587328651, 'samples': 502656, 'steps': 2617, 'loss/train': 2.637915849685669} -11/06/2021 21:38:10 - INFO - __main__ - Step 2619: {'lr': 0.0004999784891758641, 'samples': 502848, 'steps': 2618, 'loss/train': 2.712459087371826} -11/06/2021 21:38:10 - INFO - __main__ - Step 2620: {'lr': 0.0004999784195062266, 'samples': 503040, 'steps': 2619, 'loss/train': 1.5384448766708374} -11/06/2021 21:38:10 - INFO - __main__ - Step 2621: {'lr': 0.0004999783497239526, 'samples': 503232, 'steps': 2620, 'loss/train': 2.1913907527923584} -11/06/2021 21:38:11 - INFO - __main__ - Step 2622: {'lr': 0.0004999782798290424, 'samples': 503424, 'steps': 2621, 'loss/train': 2.0295615196228027} -11/06/2021 21:38:11 - INFO - __main__ - Step 2623: {'lr': 0.0004999782098214957, 'samples': 503616, 'steps': 2622, 'loss/train': 2.4918506145477295} -11/06/2021 21:38:12 - INFO - __main__ - Step 2624: {'lr': 0.0004999781397013127, 'samples': 503808, 'steps': 2623, 'loss/train': 2.2522714138031006} -11/06/2021 21:38:13 - INFO - __main__ - Step 2625: {'lr': 0.0004999780694684934, 'samples': 504000, 'steps': 2624, 'loss/train': 2.477266550064087} -11/06/2021 21:38:13 - INFO - __main__ - Step 2626: {'lr': 0.000499977999123038, 'samples': 504192, 'steps': 2625, 'loss/train': 2.451108455657959} -11/06/2021 21:38:13 - INFO - __main__ - Step 2627: {'lr': 0.0004999779286649461, 'samples': 504384, 'steps': 2626, 'loss/train': 2.620913028717041} -11/06/2021 21:38:14 - INFO - __main__ - Step 2628: {'lr': 0.0004999778580942183, 'samples': 504576, 'steps': 2627, 'loss/train': 1.3361049890518188} -11/06/2021 21:38:15 - INFO - __main__ - Step 2629: {'lr': 0.000499977787410854, 'samples': 504768, 'steps': 2628, 'loss/train': 2.3474013805389404} -11/06/2021 21:38:15 - INFO - __main__ - Step 2630: {'lr': 0.0004999777166148539, 'samples': 504960, 'steps': 2629, 'loss/train': 2.328670024871826} -11/06/2021 21:38:15 - INFO - __main__ - Step 2631: {'lr': 0.0004999776457062175, 'samples': 505152, 'steps': 2630, 'loss/train': 2.4533984661102295} -11/06/2021 21:38:16 - INFO - __main__ - Step 2632: {'lr': 0.0004999775746849451, 'samples': 505344, 'steps': 2631, 'loss/train': 1.9219590425491333} -11/06/2021 21:38:16 - INFO - __main__ - Step 2633: {'lr': 0.0004999775035510367, 'samples': 505536, 'steps': 2632, 'loss/train': 1.3246666193008423} -11/06/2021 21:38:17 - INFO - __main__ - Step 2634: {'lr': 0.0004999774323044922, 'samples': 505728, 'steps': 2633, 'loss/train': 2.5250437259674072} -11/06/2021 21:38:17 - INFO - __main__ - Step 2635: {'lr': 0.0004999773609453118, 'samples': 505920, 'steps': 2634, 'loss/train': 2.8457674980163574} -11/06/2021 21:38:18 - INFO - __main__ - Step 2636: {'lr': 0.0004999772894734954, 'samples': 506112, 'steps': 2635, 'loss/train': 1.6440210342407227} -11/06/2021 21:38:18 - INFO - __main__ - Step 2637: {'lr': 0.000499977217889043, 'samples': 506304, 'steps': 2636, 'loss/train': 2.209573984146118} -11/06/2021 21:38:18 - INFO - __main__ - Step 2638: {'lr': 0.0004999771461919549, 'samples': 506496, 'steps': 2637, 'loss/train': 2.6149797439575195} -11/06/2021 21:38:20 - INFO - __main__ - Step 2639: {'lr': 0.0004999770743822309, 'samples': 506688, 'steps': 2638, 'loss/train': 1.8034636974334717} -11/06/2021 21:38:20 - INFO - __main__ - Step 2640: {'lr': 0.0004999770024598711, 'samples': 506880, 'steps': 2639, 'loss/train': 2.848144054412842} -11/06/2021 21:38:20 - INFO - __main__ - Step 2641: {'lr': 0.0004999769304248754, 'samples': 507072, 'steps': 2640, 'loss/train': 2.00382661819458} -11/06/2021 21:38:21 - INFO - __main__ - Step 2642: {'lr': 0.0004999768582772442, 'samples': 507264, 'steps': 2641, 'loss/train': 2.284688711166382} -11/06/2021 21:38:21 - INFO - __main__ - Step 2643: {'lr': 0.000499976786016977, 'samples': 507456, 'steps': 2642, 'loss/train': 2.6324987411499023} -11/06/2021 21:38:22 - INFO - __main__ - Step 2644: {'lr': 0.0004999767136440742, 'samples': 507648, 'steps': 2643, 'loss/train': 2.4299545288085938} -11/06/2021 21:38:22 - INFO - __main__ - Step 2645: {'lr': 0.0004999766411585359, 'samples': 507840, 'steps': 2644, 'loss/train': 2.3650753498077393} -11/06/2021 21:38:23 - INFO - __main__ - Step 2646: {'lr': 0.0004999765685603618, 'samples': 508032, 'steps': 2645, 'loss/train': 1.2427858114242554} -11/06/2021 21:38:23 - INFO - __main__ - Step 2647: {'lr': 0.0004999764958495522, 'samples': 508224, 'steps': 2646, 'loss/train': 1.7125329971313477} -11/06/2021 21:38:23 - INFO - __main__ - Step 2648: {'lr': 0.0004999764230261072, 'samples': 508416, 'steps': 2647, 'loss/train': 2.69739031791687} -11/06/2021 21:38:24 - INFO - __main__ - Step 2649: {'lr': 0.0004999763500900265, 'samples': 508608, 'steps': 2648, 'loss/train': 2.207709550857544} -11/06/2021 21:38:25 - INFO - __main__ - Step 2650: {'lr': 0.0004999762770413103, 'samples': 508800, 'steps': 2649, 'loss/train': 2.108356237411499} -11/06/2021 21:38:25 - INFO - __main__ - Step 2651: {'lr': 0.0004999762038799587, 'samples': 508992, 'steps': 2650, 'loss/train': 2.2225661277770996} -11/06/2021 21:38:25 - INFO - __main__ - Step 2652: {'lr': 0.0004999761306059717, 'samples': 509184, 'steps': 2651, 'loss/train': 2.4659764766693115} -11/06/2021 21:38:26 - INFO - __main__ - Step 2653: {'lr': 0.0004999760572193492, 'samples': 509376, 'steps': 2652, 'loss/train': 2.0966432094573975} -11/06/2021 21:38:26 - INFO - __main__ - Step 2654: {'lr': 0.0004999759837200914, 'samples': 509568, 'steps': 2653, 'loss/train': 2.6494579315185547} -11/06/2021 21:38:27 - INFO - __main__ - Step 2655: {'lr': 0.0004999759101081984, 'samples': 509760, 'steps': 2654, 'loss/train': 2.213627815246582} -11/06/2021 21:38:28 - INFO - __main__ - Step 2656: {'lr': 0.0004999758363836701, 'samples': 509952, 'steps': 2655, 'loss/train': 2.514630079269409} -11/06/2021 21:38:28 - INFO - __main__ - Step 2657: {'lr': 0.0004999757625465063, 'samples': 510144, 'steps': 2656, 'loss/train': 1.6061630249023438} -11/06/2021 21:38:28 - INFO - __main__ - Step 2658: {'lr': 0.0004999756885967075, 'samples': 510336, 'steps': 2657, 'loss/train': 1.924759030342102} -11/06/2021 21:38:29 - INFO - __main__ - Step 2659: {'lr': 0.0004999756145342735, 'samples': 510528, 'steps': 2658, 'loss/train': 1.7294937372207642} -11/06/2021 21:38:30 - INFO - __main__ - Step 2660: {'lr': 0.0004999755403592043, 'samples': 510720, 'steps': 2659, 'loss/train': 2.623060941696167} -11/06/2021 21:38:30 - INFO - __main__ - Step 2661: {'lr': 0.0004999754660714999, 'samples': 510912, 'steps': 2660, 'loss/train': 2.1438426971435547} -11/06/2021 21:38:30 - INFO - __main__ - Step 2662: {'lr': 0.0004999753916711606, 'samples': 511104, 'steps': 2661, 'loss/train': 1.9994590282440186} -11/06/2021 21:38:31 - INFO - __main__ - Step 2663: {'lr': 0.0004999753171581862, 'samples': 511296, 'steps': 2662, 'loss/train': 2.382080554962158} -11/06/2021 21:38:31 - INFO - __main__ - Step 2664: {'lr': 0.0004999752425325766, 'samples': 511488, 'steps': 2663, 'loss/train': 2.0769588947296143} -11/06/2021 21:38:32 - INFO - __main__ - Step 2665: {'lr': 0.0004999751677943322, 'samples': 511680, 'steps': 2664, 'loss/train': 1.7713021039962769} -11/06/2021 21:38:32 - INFO - __main__ - Step 2666: {'lr': 0.0004999750929434527, 'samples': 511872, 'steps': 2665, 'loss/train': 2.075993537902832} -11/06/2021 21:38:33 - INFO - __main__ - Step 2667: {'lr': 0.0004999750179799383, 'samples': 512064, 'steps': 2666, 'loss/train': 2.5356898307800293} -11/06/2021 21:38:33 - INFO - __main__ - Step 2668: {'lr': 0.0004999749429037892, 'samples': 512256, 'steps': 2667, 'loss/train': 2.999053716659546} -11/06/2021 21:38:33 - INFO - __main__ - Step 2669: {'lr': 0.0004999748677150051, 'samples': 512448, 'steps': 2668, 'loss/train': 2.6738812923431396} -11/06/2021 21:38:34 - INFO - __main__ - Step 2670: {'lr': 0.0004999747924135862, 'samples': 512640, 'steps': 2669, 'loss/train': 2.2657175064086914} -11/06/2021 21:38:35 - INFO - __main__ - Step 2671: {'lr': 0.0004999747169995325, 'samples': 512832, 'steps': 2670, 'loss/train': 2.049834966659546} -11/06/2021 21:38:35 - INFO - __main__ - Step 2672: {'lr': 0.0004999746414728441, 'samples': 513024, 'steps': 2671, 'loss/train': 2.0094645023345947} -11/06/2021 21:38:35 - INFO - __main__ - Step 2673: {'lr': 0.0004999745658335209, 'samples': 513216, 'steps': 2672, 'loss/train': 2.6007511615753174} -11/06/2021 21:38:36 - INFO - __main__ - Step 2674: {'lr': 0.000499974490081563, 'samples': 513408, 'steps': 2673, 'loss/train': 2.5795583724975586} -11/06/2021 21:38:37 - INFO - __main__ - Step 2675: {'lr': 0.0004999744142169707, 'samples': 513600, 'steps': 2674, 'loss/train': 1.848941445350647} -11/06/2021 21:38:37 - INFO - __main__ - Step 2676: {'lr': 0.0004999743382397435, 'samples': 513792, 'steps': 2675, 'loss/train': 2.2464025020599365} -11/06/2021 21:38:38 - INFO - __main__ - Step 2677: {'lr': 0.0004999742621498818, 'samples': 513984, 'steps': 2676, 'loss/train': 2.2649552822113037} -11/06/2021 21:38:38 - INFO - __main__ - Step 2678: {'lr': 0.0004999741859473857, 'samples': 514176, 'steps': 2677, 'loss/train': 2.3065757751464844} -11/06/2021 21:38:38 - INFO - __main__ - Step 2679: {'lr': 0.0004999741096322549, 'samples': 514368, 'steps': 2678, 'loss/train': 2.34328031539917} -11/06/2021 21:38:39 - INFO - __main__ - Step 2680: {'lr': 0.0004999740332044898, 'samples': 514560, 'steps': 2679, 'loss/train': 2.229511022567749} -11/06/2021 21:38:40 - INFO - __main__ - Step 2681: {'lr': 0.0004999739566640901, 'samples': 514752, 'steps': 2680, 'loss/train': 2.1822242736816406} -11/06/2021 21:38:40 - INFO - __main__ - Step 2682: {'lr': 0.000499973880011056, 'samples': 514944, 'steps': 2681, 'loss/train': 2.409409999847412} -11/06/2021 21:38:41 - INFO - __main__ - Step 2683: {'lr': 0.0004999738032453876, 'samples': 515136, 'steps': 2682, 'loss/train': 2.3872311115264893} -11/06/2021 21:38:41 - INFO - __main__ - Step 2684: {'lr': 0.0004999737263670848, 'samples': 515328, 'steps': 2683, 'loss/train': 2.3661561012268066} -11/06/2021 21:38:41 - INFO - __main__ - Step 2685: {'lr': 0.0004999736493761477, 'samples': 515520, 'steps': 2684, 'loss/train': 2.4622879028320312} -11/06/2021 21:38:42 - INFO - __main__ - Step 2686: {'lr': 0.0004999735722725765, 'samples': 515712, 'steps': 2685, 'loss/train': 1.6226389408111572} -11/06/2021 21:38:43 - INFO - __main__ - Step 2687: {'lr': 0.0004999734950563709, 'samples': 515904, 'steps': 2686, 'loss/train': 2.3979785442352295} -11/06/2021 21:38:43 - INFO - __main__ - Step 2688: {'lr': 0.0004999734177275311, 'samples': 516096, 'steps': 2687, 'loss/train': 2.707308769226074} -11/06/2021 21:38:43 - INFO - __main__ - Step 2689: {'lr': 0.0004999733402860572, 'samples': 516288, 'steps': 2688, 'loss/train': 2.6095635890960693} -11/06/2021 21:38:44 - INFO - __main__ - Step 2690: {'lr': 0.0004999732627319491, 'samples': 516480, 'steps': 2689, 'loss/train': 2.480802297592163} -11/06/2021 21:38:45 - INFO - __main__ - Step 2691: {'lr': 0.000499973185065207, 'samples': 516672, 'steps': 2690, 'loss/train': 2.4791250228881836} -11/06/2021 21:38:45 - INFO - __main__ - Step 2692: {'lr': 0.0004999731072858307, 'samples': 516864, 'steps': 2691, 'loss/train': 2.2488434314727783} -11/06/2021 21:38:45 - INFO - __main__ - Step 2693: {'lr': 0.0004999730293938205, 'samples': 517056, 'steps': 2692, 'loss/train': 2.4395229816436768} -11/06/2021 21:38:46 - INFO - __main__ - Step 2694: {'lr': 0.0004999729513891762, 'samples': 517248, 'steps': 2693, 'loss/train': 2.7909016609191895} -11/06/2021 21:38:46 - INFO - __main__ - Step 2695: {'lr': 0.000499972873271898, 'samples': 517440, 'steps': 2694, 'loss/train': 2.6461949348449707} -11/06/2021 21:38:47 - INFO - __main__ - Step 2696: {'lr': 0.0004999727950419859, 'samples': 517632, 'steps': 2695, 'loss/train': 2.5715339183807373} -11/06/2021 21:38:48 - INFO - __main__ - Step 2697: {'lr': 0.0004999727166994399, 'samples': 517824, 'steps': 2696, 'loss/train': 2.065563917160034} -11/06/2021 21:38:48 - INFO - __main__ - Step 2698: {'lr': 0.0004999726382442601, 'samples': 518016, 'steps': 2697, 'loss/train': 1.9356613159179688} -11/06/2021 21:38:48 - INFO - __main__ - Step 2699: {'lr': 0.0004999725596764465, 'samples': 518208, 'steps': 2698, 'loss/train': 1.576759934425354} -11/06/2021 21:38:49 - INFO - __main__ - Step 2700: {'lr': 0.000499972480995999, 'samples': 518400, 'steps': 2699, 'loss/train': 2.4644877910614014} -11/06/2021 21:38:49 - INFO - __main__ - Step 2701: {'lr': 0.0004999724022029179, 'samples': 518592, 'steps': 2700, 'loss/train': 2.8699357509613037} -11/06/2021 21:38:51 - INFO - __main__ - Step 2702: {'lr': 0.000499972323297203, 'samples': 518784, 'steps': 2701, 'loss/train': 2.5225210189819336} -11/06/2021 21:38:51 - INFO - __main__ - Step 2703: {'lr': 0.0004999722442788544, 'samples': 518976, 'steps': 2702, 'loss/train': 2.4827229976654053} -11/06/2021 21:38:51 - INFO - __main__ - Step 2704: {'lr': 0.0004999721651478723, 'samples': 519168, 'steps': 2703, 'loss/train': 1.9105079174041748} -11/06/2021 21:38:52 - INFO - __main__ - Step 2705: {'lr': 0.0004999720859042565, 'samples': 519360, 'steps': 2704, 'loss/train': 2.2500193119049072} -11/06/2021 21:38:52 - INFO - __main__ - Step 2706: {'lr': 0.0004999720065480071, 'samples': 519552, 'steps': 2705, 'loss/train': 2.6277735233306885} -11/06/2021 21:38:52 - INFO - __main__ - Step 2707: {'lr': 0.0004999719270791242, 'samples': 519744, 'steps': 2706, 'loss/train': 1.4648323059082031} -11/06/2021 21:38:53 - INFO - __main__ - Step 2708: {'lr': 0.0004999718474976078, 'samples': 519936, 'steps': 2707, 'loss/train': 2.773413896560669} -11/06/2021 21:38:54 - INFO - __main__ - Step 2709: {'lr': 0.000499971767803458, 'samples': 520128, 'steps': 2708, 'loss/train': 2.3420262336730957} -11/06/2021 21:38:54 - INFO - __main__ - Step 2710: {'lr': 0.0004999716879966747, 'samples': 520320, 'steps': 2709, 'loss/train': 2.6745805740356445} -11/06/2021 21:38:54 - INFO - __main__ - Step 2711: {'lr': 0.000499971608077258, 'samples': 520512, 'steps': 2710, 'loss/train': 1.5498085021972656} -11/06/2021 21:38:55 - INFO - __main__ - Step 2712: {'lr': 0.000499971528045208, 'samples': 520704, 'steps': 2711, 'loss/train': 2.7040622234344482} -11/06/2021 21:38:55 - INFO - __main__ - Step 2713: {'lr': 0.0004999714479005248, 'samples': 520896, 'steps': 2712, 'loss/train': 3.5146377086639404} -11/06/2021 21:38:56 - INFO - __main__ - Step 2714: {'lr': 0.0004999713676432082, 'samples': 521088, 'steps': 2713, 'loss/train': 2.1871511936187744} -11/06/2021 21:38:56 - INFO - __main__ - Step 2715: {'lr': 0.0004999712872732584, 'samples': 521280, 'steps': 2714, 'loss/train': 2.5216920375823975} -11/06/2021 21:38:57 - INFO - __main__ - Step 2716: {'lr': 0.0004999712067906754, 'samples': 521472, 'steps': 2715, 'loss/train': 2.882300615310669} -11/06/2021 21:38:57 - INFO - __main__ - Step 2717: {'lr': 0.0004999711261954591, 'samples': 521664, 'steps': 2716, 'loss/train': 2.44183349609375} -11/06/2021 21:38:57 - INFO - __main__ - Step 2718: {'lr': 0.0004999710454876099, 'samples': 521856, 'steps': 2717, 'loss/train': 2.10378360748291} -11/06/2021 21:38:59 - INFO - __main__ - Step 2719: {'lr': 0.0004999709646671274, 'samples': 522048, 'steps': 2718, 'loss/train': 2.456674098968506} -11/06/2021 21:38:59 - INFO - __main__ - Step 2720: {'lr': 0.0004999708837340119, 'samples': 522240, 'steps': 2719, 'loss/train': 2.4138710498809814} -11/06/2021 21:38:59 - INFO - __main__ - Step 2721: {'lr': 0.0004999708026882635, 'samples': 522432, 'steps': 2720, 'loss/train': 2.910074234008789} -11/06/2021 21:39:00 - INFO - __main__ - Step 2722: {'lr': 0.000499970721529882, 'samples': 522624, 'steps': 2721, 'loss/train': 3.079136848449707} -11/06/2021 21:39:00 - INFO - __main__ - Step 2723: {'lr': 0.0004999706402588675, 'samples': 522816, 'steps': 2722, 'loss/train': 2.3095333576202393} -11/06/2021 21:39:01 - INFO - __main__ - Step 2724: {'lr': 0.0004999705588752202, 'samples': 523008, 'steps': 2723, 'loss/train': 1.8380732536315918} -11/06/2021 21:39:01 - INFO - __main__ - Step 2725: {'lr': 0.00049997047737894, 'samples': 523200, 'steps': 2724, 'loss/train': 2.072640895843506} -11/06/2021 21:39:02 - INFO - __main__ - Step 2726: {'lr': 0.0004999703957700269, 'samples': 523392, 'steps': 2725, 'loss/train': 2.321617603302002} -11/06/2021 21:39:02 - INFO - __main__ - Step 2727: {'lr': 0.000499970314048481, 'samples': 523584, 'steps': 2726, 'loss/train': 2.2870664596557617} -11/06/2021 21:39:02 - INFO - __main__ - Step 2728: {'lr': 0.0004999702322143023, 'samples': 523776, 'steps': 2727, 'loss/train': 2.508100748062134} -11/06/2021 21:39:03 - INFO - __main__ - Step 2729: {'lr': 0.000499970150267491, 'samples': 523968, 'steps': 2728, 'loss/train': 2.8131275177001953} -11/06/2021 21:39:04 - INFO - __main__ - Step 2730: {'lr': 0.0004999700682080469, 'samples': 524160, 'steps': 2729, 'loss/train': 2.412299871444702} -11/06/2021 21:39:04 - INFO - __main__ - Step 2731: {'lr': 0.0004999699860359702, 'samples': 524352, 'steps': 2730, 'loss/train': 2.656719446182251} -11/06/2021 21:39:04 - INFO - __main__ - Step 2732: {'lr': 0.0004999699037512608, 'samples': 524544, 'steps': 2731, 'loss/train': 2.0453786849975586} -11/06/2021 21:39:05 - INFO - __main__ - Step 2733: {'lr': 0.000499969821353919, 'samples': 524736, 'steps': 2732, 'loss/train': 1.5553648471832275} -11/06/2021 21:39:06 - INFO - __main__ - Step 2734: {'lr': 0.0004999697388439444, 'samples': 524928, 'steps': 2733, 'loss/train': 2.4622724056243896} -11/06/2021 21:39:06 - INFO - __main__ - Step 2735: {'lr': 0.0004999696562213375, 'samples': 525120, 'steps': 2734, 'loss/train': 2.221712827682495} -11/06/2021 21:39:06 - INFO - __main__ - Step 2736: {'lr': 0.0004999695734860981, 'samples': 525312, 'steps': 2735, 'loss/train': 2.3038675785064697} -11/06/2021 21:39:07 - INFO - __main__ - Step 2737: {'lr': 0.0004999694906382262, 'samples': 525504, 'steps': 2736, 'loss/train': 2.3742024898529053} -11/06/2021 21:39:07 - INFO - __main__ - Step 2738: {'lr': 0.0004999694076777219, 'samples': 525696, 'steps': 2737, 'loss/train': 2.387545347213745} -11/06/2021 21:39:08 - INFO - __main__ - Step 2739: {'lr': 0.0004999693246045854, 'samples': 525888, 'steps': 2738, 'loss/train': 2.2682254314422607} -11/06/2021 21:39:08 - INFO - __main__ - Step 2740: {'lr': 0.0004999692414188164, 'samples': 526080, 'steps': 2739, 'loss/train': 1.0920865535736084} -11/06/2021 21:39:09 - INFO - __main__ - Step 2741: {'lr': 0.0004999691581204152, 'samples': 526272, 'steps': 2740, 'loss/train': 2.4095451831817627} -11/06/2021 21:39:09 - INFO - __main__ - Step 2742: {'lr': 0.0004999690747093816, 'samples': 526464, 'steps': 2741, 'loss/train': 2.6026110649108887} -11/06/2021 21:39:09 - INFO - __main__ - Step 2743: {'lr': 0.000499968991185716, 'samples': 526656, 'steps': 2742, 'loss/train': 2.7001304626464844} -11/06/2021 21:39:10 - INFO - __main__ - Step 2744: {'lr': 0.0004999689075494182, 'samples': 526848, 'steps': 2743, 'loss/train': 2.8792505264282227} -11/06/2021 21:39:11 - INFO - __main__ - Step 2745: {'lr': 0.0004999688238004882, 'samples': 527040, 'steps': 2744, 'loss/train': 1.739349603652954} -11/06/2021 21:39:11 - INFO - __main__ - Step 2746: {'lr': 0.0004999687399389262, 'samples': 527232, 'steps': 2745, 'loss/train': 1.9313324689865112} -11/06/2021 21:39:11 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 2.5279910564422607} -11/06/2021 21:39:12 - INFO - __main__ - Step 2748: {'lr': 0.0004999685718779058, 'samples': 527616, 'steps': 2747, 'loss/train': 2.2004690170288086} -11/06/2021 21:39:12 - INFO - __main__ - Step 2749: {'lr': 0.0004999684876784477, 'samples': 527808, 'steps': 2748, 'loss/train': 2.4345414638519287} -11/06/2021 21:39:13 - INFO - __main__ - Step 2750: {'lr': 0.0004999684033663576, 'samples': 528000, 'steps': 2749, 'loss/train': 1.688835620880127} -11/06/2021 21:39:14 - INFO - __main__ - Step 2751: {'lr': 0.0004999683189416356, 'samples': 528192, 'steps': 2750, 'loss/train': 1.597861647605896} -11/06/2021 21:39:14 - INFO - __main__ - Step 2752: {'lr': 0.0004999682344042817, 'samples': 528384, 'steps': 2751, 'loss/train': 2.844277858734131} -11/06/2021 21:39:14 - INFO - __main__ - Step 2753: {'lr': 0.000499968149754296, 'samples': 528576, 'steps': 2752, 'loss/train': 2.3030660152435303} -11/06/2021 21:39:15 - INFO - __main__ - Step 2754: {'lr': 0.0004999680649916786, 'samples': 528768, 'steps': 2753, 'loss/train': 2.6878316402435303} -11/06/2021 21:39:16 - INFO - __main__ - Step 2755: {'lr': 0.0004999679801164295, 'samples': 528960, 'steps': 2754, 'loss/train': 0.8238305449485779} -11/06/2021 21:39:17 - INFO - __main__ - Step 2756: {'lr': 0.0004999678951285485, 'samples': 529152, 'steps': 2755, 'loss/train': 2.0880188941955566} -11/06/2021 21:39:17 - INFO - __main__ - Step 2757: {'lr': 0.0004999678100280358, 'samples': 529344, 'steps': 2756, 'loss/train': 2.4757795333862305} -11/06/2021 21:39:17 - INFO - __main__ - Step 2758: {'lr': 0.0004999677248148916, 'samples': 529536, 'steps': 2757, 'loss/train': 2.4732248783111572} -11/06/2021 21:39:18 - INFO - __main__ - Step 2759: {'lr': 0.0004999676394891158, 'samples': 529728, 'steps': 2758, 'loss/train': 2.1484673023223877} -11/06/2021 21:39:18 - INFO - __main__ - Step 2760: {'lr': 0.0004999675540507083, 'samples': 529920, 'steps': 2759, 'loss/train': 3.0172383785247803} -11/06/2021 21:39:19 - INFO - __main__ - Step 2761: {'lr': 0.0004999674684996694, 'samples': 530112, 'steps': 2760, 'loss/train': 2.785417079925537} -11/06/2021 21:39:19 - INFO - __main__ - Step 2762: {'lr': 0.0004999673828359989, 'samples': 530304, 'steps': 2761, 'loss/train': 2.5744974613189697} -11/06/2021 21:39:20 - INFO - __main__ - Step 2763: {'lr': 0.0004999672970596971, 'samples': 530496, 'steps': 2762, 'loss/train': 2.5258822441101074} -11/06/2021 21:39:20 - INFO - __main__ - Step 2764: {'lr': 0.0004999672111707639, 'samples': 530688, 'steps': 2763, 'loss/train': 3.058380603790283} -11/06/2021 21:39:21 - INFO - __main__ - Step 2765: {'lr': 0.0004999671251691991, 'samples': 530880, 'steps': 2764, 'loss/train': 2.8081789016723633} -11/06/2021 21:39:21 - INFO - __main__ - Step 2766: {'lr': 0.0004999670390550032, 'samples': 531072, 'steps': 2765, 'loss/train': 2.2795279026031494} -11/06/2021 21:39:22 - INFO - __main__ - Step 2767: {'lr': 0.000499966952828176, 'samples': 531264, 'steps': 2766, 'loss/train': 1.8465057611465454} -11/06/2021 21:39:22 - INFO - __main__ - Step 2768: {'lr': 0.0004999668664887175, 'samples': 531456, 'steps': 2767, 'loss/train': 2.2657551765441895} -11/06/2021 21:39:23 - INFO - __main__ - Step 2769: {'lr': 0.0004999667800366278, 'samples': 531648, 'steps': 2768, 'loss/train': 2.2362067699432373} -11/06/2021 21:39:23 - INFO - __main__ - Step 2770: {'lr': 0.0004999666934719069, 'samples': 531840, 'steps': 2769, 'loss/train': 1.8398356437683105} -11/06/2021 21:39:23 - INFO - __main__ - Step 2771: {'lr': 0.0004999666067945548, 'samples': 532032, 'steps': 2770, 'loss/train': 2.37894868850708} -11/06/2021 21:39:24 - INFO - __main__ - Step 2772: {'lr': 0.0004999665200045716, 'samples': 532224, 'steps': 2771, 'loss/train': 1.0660734176635742} -11/06/2021 21:39:25 - INFO - __main__ - Step 2773: {'lr': 0.0004999664331019574, 'samples': 532416, 'steps': 2772, 'loss/train': 2.489011287689209} -11/06/2021 21:39:25 - INFO - __main__ - Step 2774: {'lr': 0.0004999663460867123, 'samples': 532608, 'steps': 2773, 'loss/train': 2.3319153785705566} -11/06/2021 21:39:25 - INFO - __main__ - Step 2775: {'lr': 0.000499966258958836, 'samples': 532800, 'steps': 2774, 'loss/train': 2.5055582523345947} -11/06/2021 21:39:26 - INFO - __main__ - Step 2776: {'lr': 0.000499966171718329, 'samples': 532992, 'steps': 2775, 'loss/train': 2.4398868083953857} -11/06/2021 21:39:27 - INFO - __main__ - Step 2777: {'lr': 0.000499966084365191, 'samples': 533184, 'steps': 2776, 'loss/train': 2.4442226886749268} -11/06/2021 21:39:27 - INFO - __main__ - Step 2778: {'lr': 0.0004999659968994221, 'samples': 533376, 'steps': 2777, 'loss/train': 2.8139424324035645} -11/06/2021 21:39:28 - INFO - __main__ - Step 2779: {'lr': 0.0004999659093210223, 'samples': 533568, 'steps': 2778, 'loss/train': 2.4639973640441895} -11/06/2021 21:39:28 - INFO - __main__ - Step 2780: {'lr': 0.0004999658216299919, 'samples': 533760, 'steps': 2779, 'loss/train': 2.217278242111206} -11/06/2021 21:39:28 - INFO - __main__ - Step 2781: {'lr': 0.0004999657338263308, 'samples': 533952, 'steps': 2780, 'loss/train': 2.8546433448791504} -11/06/2021 21:39:29 - INFO - __main__ - Step 2782: {'lr': 0.0004999656459100388, 'samples': 534144, 'steps': 2781, 'loss/train': 2.2053894996643066} -11/06/2021 21:39:30 - INFO - __main__ - Step 2783: {'lr': 0.0004999655578811161, 'samples': 534336, 'steps': 2782, 'loss/train': 2.2209572792053223} -11/06/2021 21:39:30 - INFO - __main__ - Step 2784: {'lr': 0.0004999654697395629, 'samples': 534528, 'steps': 2783, 'loss/train': 2.64697527885437} -11/06/2021 21:39:30 - INFO - __main__ - Step 2785: {'lr': 0.0004999653814853791, 'samples': 534720, 'steps': 2784, 'loss/train': 2.1000912189483643} -11/06/2021 21:39:31 - INFO - __main__ - Step 2786: {'lr': 0.0004999652931185648, 'samples': 534912, 'steps': 2785, 'loss/train': 2.200310468673706} -11/06/2021 21:39:32 - INFO - __main__ - Step 2787: {'lr': 0.00049996520463912, 'samples': 535104, 'steps': 2786, 'loss/train': 2.8074491024017334} -11/06/2021 21:39:32 - INFO - __main__ - Step 2788: {'lr': 0.0004999651160470447, 'samples': 535296, 'steps': 2787, 'loss/train': 2.2512643337249756} -11/06/2021 21:39:32 - INFO - __main__ - Step 2789: {'lr': 0.0004999650273423389, 'samples': 535488, 'steps': 2788, 'loss/train': 2.207897663116455} -11/06/2021 21:39:33 - INFO - __main__ - Step 2790: {'lr': 0.0004999649385250028, 'samples': 535680, 'steps': 2789, 'loss/train': 2.473784923553467} -11/06/2021 21:39:33 - INFO - __main__ - Step 2791: {'lr': 0.0004999648495950363, 'samples': 535872, 'steps': 2790, 'loss/train': 2.487807273864746} -11/06/2021 21:39:34 - INFO - __main__ - Step 2792: {'lr': 0.0004999647605524396, 'samples': 536064, 'steps': 2791, 'loss/train': 2.234999895095825} -11/06/2021 21:39:35 - INFO - __main__ - Step 2793: {'lr': 0.0004999646713972126, 'samples': 536256, 'steps': 2792, 'loss/train': 2.1799986362457275} -11/06/2021 21:39:35 - INFO - __main__ - Step 2794: {'lr': 0.0004999645821293552, 'samples': 536448, 'steps': 2793, 'loss/train': 1.1634377241134644} -11/06/2021 21:39:35 - INFO - __main__ - Step 2795: {'lr': 0.0004999644927488678, 'samples': 536640, 'steps': 2794, 'loss/train': 2.290945529937744} -11/06/2021 21:39:36 - INFO - __main__ - Step 2796: {'lr': 0.0004999644032557503, 'samples': 536832, 'steps': 2795, 'loss/train': 2.273956537246704} -11/06/2021 21:39:37 - INFO - __main__ - Step 2797: {'lr': 0.0004999643136500027, 'samples': 537024, 'steps': 2796, 'loss/train': 1.5732803344726562} -11/06/2021 21:39:37 - INFO - __main__ - Step 2798: {'lr': 0.0004999642239316249, 'samples': 537216, 'steps': 2797, 'loss/train': 2.646408796310425} -11/06/2021 21:39:38 - INFO - __main__ - Step 2799: {'lr': 0.000499964134100617, 'samples': 537408, 'steps': 2798, 'loss/train': 2.802149772644043} -11/06/2021 21:39:38 - INFO - __main__ - Step 2800: {'lr': 0.0004999640441569793, 'samples': 537600, 'steps': 2799, 'loss/train': 1.9303408861160278} -11/06/2021 21:39:38 - INFO - __main__ - Step 2801: {'lr': 0.0004999639541007116, 'samples': 537792, 'steps': 2800, 'loss/train': 2.0123252868652344} -11/06/2021 21:39:39 - INFO - __main__ - Step 2802: {'lr': 0.0004999638639318141, 'samples': 537984, 'steps': 2801, 'loss/train': 2.5675606727600098} -11/06/2021 21:39:40 - INFO - __main__ - Step 2803: {'lr': 0.0004999637736502866, 'samples': 538176, 'steps': 2802, 'loss/train': 2.3583943843841553} -11/06/2021 21:39:40 - INFO - __main__ - Step 2804: {'lr': 0.0004999636832561293, 'samples': 538368, 'steps': 2803, 'loss/train': 2.4021947383880615} -11/06/2021 21:39:40 - INFO - __main__ - Step 2805: {'lr': 0.0004999635927493423, 'samples': 538560, 'steps': 2804, 'loss/train': 2.4244282245635986} -11/06/2021 21:39:41 - INFO - __main__ - Step 2806: {'lr': 0.0004999635021299255, 'samples': 538752, 'steps': 2805, 'loss/train': 2.661571741104126} -11/06/2021 21:39:41 - INFO - __main__ - Step 2807: {'lr': 0.0004999634113978791, 'samples': 538944, 'steps': 2806, 'loss/train': 2.562166929244995} -11/06/2021 21:39:42 - INFO - __main__ - Step 2808: {'lr': 0.0004999633205532029, 'samples': 539136, 'steps': 2807, 'loss/train': 2.0239551067352295} -11/06/2021 21:39:43 - INFO - __main__ - Step 2809: {'lr': 0.0004999632295958972, 'samples': 539328, 'steps': 2808, 'loss/train': 2.355177164077759} -11/06/2021 21:39:43 - INFO - __main__ - Step 2810: {'lr': 0.0004999631385259617, 'samples': 539520, 'steps': 2809, 'loss/train': 2.7225186824798584} -11/06/2021 21:39:43 - INFO - __main__ - Step 2811: {'lr': 0.000499963047343397, 'samples': 539712, 'steps': 2810, 'loss/train': 1.7809796333312988} -11/06/2021 21:39:44 - INFO - __main__ - Step 2812: {'lr': 0.0004999629560482026, 'samples': 539904, 'steps': 2811, 'loss/train': 1.2682995796203613} -11/06/2021 21:39:45 - INFO - __main__ - Step 2813: {'lr': 0.0004999628646403788, 'samples': 540096, 'steps': 2812, 'loss/train': 2.061248302459717} -11/06/2021 21:39:45 - INFO - __main__ - Step 2814: {'lr': 0.0004999627731199256, 'samples': 540288, 'steps': 2813, 'loss/train': 2.505889654159546} -11/06/2021 21:39:45 - INFO - __main__ - Step 2815: {'lr': 0.0004999626814868429, 'samples': 540480, 'steps': 2814, 'loss/train': 1.8169455528259277} -11/06/2021 21:39:46 - INFO - __main__ - Step 2816: {'lr': 0.0004999625897411311, 'samples': 540672, 'steps': 2815, 'loss/train': 2.5656561851501465} -11/06/2021 21:39:46 - INFO - __main__ - Step 2817: {'lr': 0.0004999624978827899, 'samples': 540864, 'steps': 2816, 'loss/train': 2.479475736618042} -11/06/2021 21:39:47 - INFO - __main__ - Step 2818: {'lr': 0.0004999624059118194, 'samples': 541056, 'steps': 2817, 'loss/train': 1.6999139785766602} -11/06/2021 21:39:47 - INFO - __main__ - Step 2819: {'lr': 0.0004999623138282198, 'samples': 541248, 'steps': 2818, 'loss/train': 2.207723617553711} -11/06/2021 21:39:48 - INFO - __main__ - Step 2820: {'lr': 0.000499962221631991, 'samples': 541440, 'steps': 2819, 'loss/train': 2.569610357284546} -11/06/2021 21:39:48 - INFO - __main__ - Step 2821: {'lr': 0.0004999621293231331, 'samples': 541632, 'steps': 2820, 'loss/train': 2.8650639057159424} -11/06/2021 21:39:48 - INFO - __main__ - Step 2822: {'lr': 0.0004999620369016461, 'samples': 541824, 'steps': 2821, 'loss/train': 2.0223443508148193} -11/06/2021 21:39:49 - INFO - __main__ - Step 2823: {'lr': 0.00049996194436753, 'samples': 542016, 'steps': 2822, 'loss/train': 2.039158344268799} -11/06/2021 21:39:50 - INFO - __main__ - Step 2824: {'lr': 0.000499961851720785, 'samples': 542208, 'steps': 2823, 'loss/train': 2.3247768878936768} -11/06/2021 21:39:50 - INFO - __main__ - Step 2825: {'lr': 0.000499961758961411, 'samples': 542400, 'steps': 2824, 'loss/train': 2.4017333984375} -11/06/2021 21:39:50 - INFO - __main__ - Step 2826: {'lr': 0.0004999616660894081, 'samples': 542592, 'steps': 2825, 'loss/train': 2.326307535171509} -11/06/2021 21:39:51 - INFO - __main__ - Step 2827: {'lr': 0.0004999615731047762, 'samples': 542784, 'steps': 2826, 'loss/train': 2.21771240234375} -11/06/2021 21:39:52 - INFO - __main__ - Step 2828: {'lr': 0.0004999614800075158, 'samples': 542976, 'steps': 2827, 'loss/train': 1.7368288040161133} -11/06/2021 21:39:52 - INFO - __main__ - Step 2829: {'lr': 0.0004999613867976264, 'samples': 543168, 'steps': 2828, 'loss/train': 2.7821502685546875} -11/06/2021 21:39:53 - INFO - __main__ - Step 2830: {'lr': 0.0004999612934751082, 'samples': 543360, 'steps': 2829, 'loss/train': 2.315138101577759} -11/06/2021 21:39:53 - INFO - __main__ - Step 2831: {'lr': 0.0004999612000399614, 'samples': 543552, 'steps': 2830, 'loss/train': 2.502418041229248} -11/06/2021 21:39:53 - INFO - __main__ - Step 2832: {'lr': 0.0004999611064921859, 'samples': 543744, 'steps': 2831, 'loss/train': 2.381127119064331} -11/06/2021 21:39:54 - INFO - __main__ - Step 2833: {'lr': 0.0004999610128317818, 'samples': 543936, 'steps': 2832, 'loss/train': 1.7340575456619263} -11/06/2021 21:39:55 - INFO - __main__ - Step 2834: {'lr': 0.0004999609190587492, 'samples': 544128, 'steps': 2833, 'loss/train': 2.435819387435913} -11/06/2021 21:39:55 - INFO - __main__ - Step 2835: {'lr': 0.000499960825173088, 'samples': 544320, 'steps': 2834, 'loss/train': 2.3425838947296143} -11/06/2021 21:39:55 - INFO - __main__ - Step 2836: {'lr': 0.0004999607311747983, 'samples': 544512, 'steps': 2835, 'loss/train': 1.7845638990402222} -11/06/2021 21:39:56 - INFO - __main__ - Step 2837: {'lr': 0.0004999606370638801, 'samples': 544704, 'steps': 2836, 'loss/train': 1.946204423904419} -11/06/2021 21:39:56 - INFO - __main__ - Step 2838: {'lr': 0.0004999605428403336, 'samples': 544896, 'steps': 2837, 'loss/train': 2.6006252765655518} -11/06/2021 21:39:57 - INFO - __main__ - Step 2839: {'lr': 0.0004999604485041585, 'samples': 545088, 'steps': 2838, 'loss/train': 2.409191131591797} -11/06/2021 21:39:57 - INFO - __main__ - Step 2840: {'lr': 0.0004999603540553554, 'samples': 545280, 'steps': 2839, 'loss/train': 2.562089204788208} -11/06/2021 21:39:58 - INFO - __main__ - Step 2841: {'lr': 0.0004999602594939238, 'samples': 545472, 'steps': 2840, 'loss/train': 2.2880022525787354} -11/06/2021 21:39:58 - INFO - __main__ - Step 2842: {'lr': 0.0004999601648198641, 'samples': 545664, 'steps': 2841, 'loss/train': 2.791858434677124} -11/06/2021 21:39:58 - INFO - __main__ - Step 2843: {'lr': 0.0004999600700331761, 'samples': 545856, 'steps': 2842, 'loss/train': 2.366997003555298} -11/06/2021 21:40:00 - INFO - __main__ - Step 2844: {'lr': 0.0004999599751338601, 'samples': 546048, 'steps': 2843, 'loss/train': 2.355536937713623} -11/06/2021 21:40:00 - INFO - __main__ - Step 2845: {'lr': 0.0004999598801219158, 'samples': 546240, 'steps': 2844, 'loss/train': 1.3548896312713623} -11/06/2021 21:40:00 - INFO - __main__ - Step 2846: {'lr': 0.0004999597849973435, 'samples': 546432, 'steps': 2845, 'loss/train': 2.1477577686309814} -11/06/2021 21:40:01 - INFO - __main__ - Step 2847: {'lr': 0.0004999596897601432, 'samples': 546624, 'steps': 2846, 'loss/train': 1.9438403844833374} -11/06/2021 21:40:01 - INFO - __main__ - Step 2848: {'lr': 0.0004999595944103149, 'samples': 546816, 'steps': 2847, 'loss/train': 2.6734774112701416} -11/06/2021 21:40:02 - INFO - __main__ - Step 2849: {'lr': 0.0004999594989478587, 'samples': 547008, 'steps': 2848, 'loss/train': 2.6153666973114014} -11/06/2021 21:40:02 - INFO - __main__ - Step 2850: {'lr': 0.0004999594033727747, 'samples': 547200, 'steps': 2849, 'loss/train': 2.0793142318725586} -11/06/2021 21:40:03 - INFO - __main__ - Step 2851: {'lr': 0.0004999593076850627, 'samples': 547392, 'steps': 2850, 'loss/train': 2.2441251277923584} -11/06/2021 21:40:03 - INFO - __main__ - Step 2852: {'lr': 0.0004999592118847229, 'samples': 547584, 'steps': 2851, 'loss/train': 2.7743895053863525} -11/06/2021 21:40:03 - INFO - __main__ - Step 2853: {'lr': 0.0004999591159717554, 'samples': 547776, 'steps': 2852, 'loss/train': 2.089233160018921} -11/06/2021 21:40:04 - INFO - __main__ - Step 2854: {'lr': 0.0004999590199461602, 'samples': 547968, 'steps': 2853, 'loss/train': 2.220766067504883} -11/06/2021 21:40:05 - INFO - __main__ - Step 2855: {'lr': 0.0004999589238079373, 'samples': 548160, 'steps': 2854, 'loss/train': 2.098376989364624} -11/06/2021 21:40:05 - INFO - __main__ - Step 2856: {'lr': 0.0004999588275570868, 'samples': 548352, 'steps': 2855, 'loss/train': 2.4644670486450195} -11/06/2021 21:40:05 - INFO - __main__ - Step 2857: {'lr': 0.0004999587311936086, 'samples': 548544, 'steps': 2856, 'loss/train': 2.239152193069458} -11/06/2021 21:40:06 - INFO - __main__ - Step 2858: {'lr': 0.000499958634717503, 'samples': 548736, 'steps': 2857, 'loss/train': 1.4249017238616943} -11/06/2021 21:40:07 - INFO - __main__ - Step 2859: {'lr': 0.0004999585381287696, 'samples': 548928, 'steps': 2858, 'loss/train': 2.2999162673950195} -11/06/2021 21:40:07 - INFO - __main__ - Step 2860: {'lr': 0.000499958441427409, 'samples': 549120, 'steps': 2859, 'loss/train': 2.8387157917022705} -11/06/2021 21:40:08 - INFO - __main__ - Step 2861: {'lr': 0.0004999583446134209, 'samples': 549312, 'steps': 2860, 'loss/train': 2.874333620071411} -11/06/2021 21:40:08 - INFO - __main__ - Step 2862: {'lr': 0.0004999582476868055, 'samples': 549504, 'steps': 2861, 'loss/train': 2.6905484199523926} -11/06/2021 21:40:08 - INFO - __main__ - Step 2863: {'lr': 0.0004999581506475627, 'samples': 549696, 'steps': 2862, 'loss/train': 2.1297647953033447} -11/06/2021 21:40:09 - INFO - __main__ - Step 2864: {'lr': 0.0004999580534956927, 'samples': 549888, 'steps': 2863, 'loss/train': 2.871276378631592} -11/06/2021 21:40:10 - INFO - __main__ - Step 2865: {'lr': 0.0004999579562311953, 'samples': 550080, 'steps': 2864, 'loss/train': 1.109349012374878} -11/06/2021 21:40:10 - INFO - __main__ - Step 2866: {'lr': 0.0004999578588540709, 'samples': 550272, 'steps': 2865, 'loss/train': 2.0491299629211426} -11/06/2021 21:40:10 - INFO - __main__ - Step 2867: {'lr': 0.0004999577613643192, 'samples': 550464, 'steps': 2866, 'loss/train': 2.0363290309906006} -11/06/2021 21:40:11 - INFO - __main__ - Step 2868: {'lr': 0.0004999576637619404, 'samples': 550656, 'steps': 2867, 'loss/train': 2.5006585121154785} -11/06/2021 21:40:11 - INFO - __main__ - Step 2869: {'lr': 0.0004999575660469347, 'samples': 550848, 'steps': 2868, 'loss/train': 2.5980803966522217} -11/06/2021 21:40:12 - INFO - __main__ - Step 2870: {'lr': 0.0004999574682193017, 'samples': 551040, 'steps': 2869, 'loss/train': 1.786831259727478} -11/06/2021 21:40:13 - INFO - __main__ - Step 2871: {'lr': 0.0004999573702790419, 'samples': 551232, 'steps': 2870, 'loss/train': 1.8787875175476074} -11/06/2021 21:40:13 - INFO - __main__ - Step 2872: {'lr': 0.0004999572722261551, 'samples': 551424, 'steps': 2871, 'loss/train': 1.8773044347763062} -11/06/2021 21:40:13 - INFO - __main__ - Step 2873: {'lr': 0.0004999571740606415, 'samples': 551616, 'steps': 2872, 'loss/train': 2.097402572631836} -11/06/2021 21:40:14 - INFO - __main__ - Step 2874: {'lr': 0.000499957075782501, 'samples': 551808, 'steps': 2873, 'loss/train': 1.8168832063674927} -11/06/2021 21:40:15 - INFO - __main__ - Step 2875: {'lr': 0.0004999569773917337, 'samples': 552000, 'steps': 2874, 'loss/train': 2.0323092937469482} -11/06/2021 21:40:15 - INFO - __main__ - Step 2876: {'lr': 0.0004999568788883397, 'samples': 552192, 'steps': 2875, 'loss/train': 1.8158880472183228} -11/06/2021 21:40:15 - INFO - __main__ - Step 2877: {'lr': 0.0004999567802723188, 'samples': 552384, 'steps': 2876, 'loss/train': 2.2598671913146973} -11/06/2021 21:40:16 - INFO - __main__ - Step 2878: {'lr': 0.0004999566815436715, 'samples': 552576, 'steps': 2877, 'loss/train': 2.445081949234009} -11/06/2021 21:40:16 - INFO - __main__ - Step 2879: {'lr': 0.0004999565827023974, 'samples': 552768, 'steps': 2878, 'loss/train': 2.130836009979248} -11/06/2021 21:40:17 - INFO - __main__ - Step 2880: {'lr': 0.0004999564837484967, 'samples': 552960, 'steps': 2879, 'loss/train': 2.3038902282714844} -11/06/2021 21:40:17 - INFO - __main__ - Step 2881: {'lr': 0.0004999563846819696, 'samples': 553152, 'steps': 2880, 'loss/train': 2.3476128578186035} -11/06/2021 21:40:18 - INFO - __main__ - Step 2882: {'lr': 0.0004999562855028159, 'samples': 553344, 'steps': 2881, 'loss/train': 2.6095919609069824} -11/06/2021 21:40:18 - INFO - __main__ - Step 2883: {'lr': 0.0004999561862110358, 'samples': 553536, 'steps': 2882, 'loss/train': 1.861746072769165} -11/06/2021 21:40:18 - INFO - __main__ - Step 2884: {'lr': 0.0004999560868066293, 'samples': 553728, 'steps': 2883, 'loss/train': 2.09774112701416} -11/06/2021 21:40:20 - INFO - __main__ - Step 2885: {'lr': 0.0004999559872895964, 'samples': 553920, 'steps': 2884, 'loss/train': 1.9192487001419067} -11/06/2021 21:40:20 - INFO - __main__ - Step 2886: {'lr': 0.0004999558876599373, 'samples': 554112, 'steps': 2885, 'loss/train': 2.2191450595855713} -11/06/2021 21:40:20 - INFO - __main__ - Step 2887: {'lr': 0.0004999557879176518, 'samples': 554304, 'steps': 2886, 'loss/train': 2.411027193069458} -11/06/2021 21:40:21 - INFO - __main__ - Step 2888: {'lr': 0.0004999556880627401, 'samples': 554496, 'steps': 2887, 'loss/train': 2.7569634914398193} -11/06/2021 21:40:21 - INFO - __main__ - Step 2889: {'lr': 0.0004999555880952023, 'samples': 554688, 'steps': 2888, 'loss/train': 2.49636173248291} -11/06/2021 21:40:22 - INFO - __main__ - Step 2890: {'lr': 0.0004999554880150383, 'samples': 554880, 'steps': 2889, 'loss/train': 2.0643162727355957} -11/06/2021 21:40:22 - INFO - __main__ - Step 2891: {'lr': 0.0004999553878222482, 'samples': 555072, 'steps': 2890, 'loss/train': 1.2182731628417969} -11/06/2021 21:40:23 - INFO - __main__ - Step 2892: {'lr': 0.0004999552875168321, 'samples': 555264, 'steps': 2891, 'loss/train': 2.110027551651001} -11/06/2021 21:40:23 - INFO - __main__ - Step 2893: {'lr': 0.0004999551870987901, 'samples': 555456, 'steps': 2892, 'loss/train': 2.0621578693389893} -11/06/2021 21:40:23 - INFO - __main__ - Step 2894: {'lr': 0.000499955086568122, 'samples': 555648, 'steps': 2893, 'loss/train': 2.4326114654541016} -11/06/2021 21:40:24 - INFO - __main__ - Step 2895: {'lr': 0.000499954985924828, 'samples': 555840, 'steps': 2894, 'loss/train': 1.992488980293274} -11/06/2021 21:40:25 - INFO - __main__ - Step 2896: {'lr': 0.0004999548851689082, 'samples': 556032, 'steps': 2895, 'loss/train': 1.6926281452178955} -11/06/2021 21:40:25 - INFO - __main__ - Step 2897: {'lr': 0.0004999547843003627, 'samples': 556224, 'steps': 2896, 'loss/train': 2.2497506141662598} -11/06/2021 21:40:25 - INFO - __main__ - Step 2898: {'lr': 0.0004999546833191912, 'samples': 556416, 'steps': 2897, 'loss/train': 2.4135076999664307} -11/06/2021 21:40:26 - INFO - __main__ - Step 2899: {'lr': 0.0004999545822253941, 'samples': 556608, 'steps': 2898, 'loss/train': 1.9909908771514893} -11/06/2021 21:40:27 - INFO - __main__ - Step 2900: {'lr': 0.0004999544810189713, 'samples': 556800, 'steps': 2899, 'loss/train': 1.9784951210021973} -11/06/2021 21:40:27 - INFO - __main__ - Step 2901: {'lr': 0.0004999543796999228, 'samples': 556992, 'steps': 2900, 'loss/train': 2.4324984550476074} -11/06/2021 21:40:27 - INFO - __main__ - Step 2902: {'lr': 0.0004999542782682489, 'samples': 557184, 'steps': 2901, 'loss/train': 1.6676363945007324} -11/06/2021 21:40:28 - INFO - __main__ - Step 2903: {'lr': 0.0004999541767239493, 'samples': 557376, 'steps': 2902, 'loss/train': 2.2086076736450195} -11/06/2021 21:40:28 - INFO - __main__ - Step 2904: {'lr': 0.0004999540750670243, 'samples': 557568, 'steps': 2903, 'loss/train': 2.221266746520996} -11/06/2021 21:40:28 - INFO - __main__ - Step 2905: {'lr': 0.0004999539732974738, 'samples': 557760, 'steps': 2904, 'loss/train': 1.9565421342849731} -11/06/2021 21:40:29 - INFO - __main__ - Step 2906: {'lr': 0.0004999538714152978, 'samples': 557952, 'steps': 2905, 'loss/train': 2.1874446868896484} -11/06/2021 21:40:30 - INFO - __main__ - Step 2907: {'lr': 0.0004999537694204966, 'samples': 558144, 'steps': 2906, 'loss/train': 1.4559849500656128} -11/06/2021 21:40:30 - INFO - __main__ - Step 2908: {'lr': 0.0004999536673130701, 'samples': 558336, 'steps': 2907, 'loss/train': 2.1022891998291016} -11/06/2021 21:40:30 - INFO - __main__ - Step 2909: {'lr': 0.0004999535650930182, 'samples': 558528, 'steps': 2908, 'loss/train': 1.6833531856536865} -11/06/2021 21:40:31 - INFO - __main__ - Step 2910: {'lr': 0.0004999534627603411, 'samples': 558720, 'steps': 2909, 'loss/train': 1.6895768642425537} -11/06/2021 21:40:33 - INFO - __main__ - Step 2911: {'lr': 0.0004999533603150389, 'samples': 558912, 'steps': 2910, 'loss/train': 2.199605703353882} -11/06/2021 21:40:33 - INFO - __main__ - Step 2912: {'lr': 0.0004999532577571116, 'samples': 559104, 'steps': 2911, 'loss/train': 2.348113536834717} -11/06/2021 21:40:33 - INFO - __main__ - Step 2913: {'lr': 0.0004999531550865592, 'samples': 559296, 'steps': 2912, 'loss/train': 1.9907268285751343} -11/06/2021 21:40:34 - INFO - __main__ - Step 2914: {'lr': 0.0004999530523033817, 'samples': 559488, 'steps': 2913, 'loss/train': 1.3060599565505981} -11/06/2021 21:40:34 - INFO - __main__ - Step 2915: {'lr': 0.0004999529494075792, 'samples': 559680, 'steps': 2914, 'loss/train': 2.2429051399230957} -11/06/2021 21:40:34 - INFO - __main__ - Step 2916: {'lr': 0.0004999528463991518, 'samples': 559872, 'steps': 2915, 'loss/train': 3.520594596862793} -11/06/2021 21:40:35 - INFO - __main__ - Step 2917: {'lr': 0.0004999527432780995, 'samples': 560064, 'steps': 2916, 'loss/train': 2.8024425506591797} -11/06/2021 21:40:36 - INFO - __main__ - Step 2918: {'lr': 0.0004999526400444223, 'samples': 560256, 'steps': 2917, 'loss/train': 2.3068015575408936} -11/06/2021 21:40:36 - INFO - __main__ - Step 2919: {'lr': 0.0004999525366981204, 'samples': 560448, 'steps': 2918, 'loss/train': 2.4727816581726074} -11/06/2021 21:40:36 - INFO - __main__ - Step 2920: {'lr': 0.0004999524332391937, 'samples': 560640, 'steps': 2919, 'loss/train': 1.4589003324508667} -11/06/2021 21:40:37 - INFO - __main__ - Step 2921: {'lr': 0.0004999523296676423, 'samples': 560832, 'steps': 2920, 'loss/train': 2.8546531200408936} -11/06/2021 21:40:38 - INFO - __main__ - Step 2922: {'lr': 0.0004999522259834662, 'samples': 561024, 'steps': 2921, 'loss/train': 2.01436185836792} -11/06/2021 21:40:38 - INFO - __main__ - Step 2923: {'lr': 0.0004999521221866655, 'samples': 561216, 'steps': 2922, 'loss/train': 2.9022979736328125} -11/06/2021 21:40:38 - INFO - __main__ - Step 2924: {'lr': 0.0004999520182772402, 'samples': 561408, 'steps': 2923, 'loss/train': 2.112090826034546} -11/06/2021 21:40:39 - INFO - __main__ - Step 2925: {'lr': 0.0004999519142551905, 'samples': 561600, 'steps': 2924, 'loss/train': 2.724461317062378} -11/06/2021 21:40:39 - INFO - __main__ - Step 2926: {'lr': 0.0004999518101205162, 'samples': 561792, 'steps': 2925, 'loss/train': 3.0705063343048096} -11/06/2021 21:40:40 - INFO - __main__ - Step 2927: {'lr': 0.0004999517058732175, 'samples': 561984, 'steps': 2926, 'loss/train': 2.3945233821868896} -11/06/2021 21:40:41 - INFO - __main__ - Step 2928: {'lr': 0.0004999516015132945, 'samples': 562176, 'steps': 2927, 'loss/train': 1.2997283935546875} -11/06/2021 21:40:41 - INFO - __main__ - Step 2929: {'lr': 0.0004999514970407471, 'samples': 562368, 'steps': 2928, 'loss/train': 1.4309011697769165} -11/06/2021 21:40:41 - INFO - __main__ - Step 2930: {'lr': 0.0004999513924555754, 'samples': 562560, 'steps': 2929, 'loss/train': 1.5472474098205566} -11/06/2021 21:40:42 - INFO - __main__ - Step 2931: {'lr': 0.0004999512877577794, 'samples': 562752, 'steps': 2930, 'loss/train': 2.173020601272583} -11/06/2021 21:40:43 - INFO - __main__ - Step 2932: {'lr': 0.0004999511829473593, 'samples': 562944, 'steps': 2931, 'loss/train': 1.8353915214538574} -11/06/2021 21:40:43 - INFO - __main__ - Step 2933: {'lr': 0.0004999510780243151, 'samples': 563136, 'steps': 2932, 'loss/train': 1.7260181903839111} -11/06/2021 21:40:43 - INFO - __main__ - Step 2934: {'lr': 0.0004999509729886467, 'samples': 563328, 'steps': 2933, 'loss/train': 2.6757678985595703} -11/06/2021 21:40:44 - INFO - __main__ - Step 2935: {'lr': 0.0004999508678403542, 'samples': 563520, 'steps': 2934, 'loss/train': 2.1792075634002686} -11/06/2021 21:40:44 - INFO - __main__ - Step 2936: {'lr': 0.0004999507625794378, 'samples': 563712, 'steps': 2935, 'loss/train': 2.2181787490844727} -11/06/2021 21:40:45 - INFO - __main__ - Step 2937: {'lr': 0.0004999506572058974, 'samples': 563904, 'steps': 2936, 'loss/train': 2.060746192932129} -11/06/2021 21:40:45 - INFO - __main__ - Step 2938: {'lr': 0.0004999505517197331, 'samples': 564096, 'steps': 2937, 'loss/train': 2.2606637477874756} -11/06/2021 21:40:46 - INFO - __main__ - Step 2939: {'lr': 0.000499950446120945, 'samples': 564288, 'steps': 2938, 'loss/train': 1.9064645767211914} -11/06/2021 21:40:46 - INFO - __main__ - Step 2940: {'lr': 0.000499950340409533, 'samples': 564480, 'steps': 2939, 'loss/train': 2.1608986854553223} -11/06/2021 21:40:46 - INFO - __main__ - Step 2941: {'lr': 0.0004999502345854973, 'samples': 564672, 'steps': 2940, 'loss/train': 2.2429375648498535} -11/06/2021 21:40:47 - INFO - __main__ - Step 2942: {'lr': 0.0004999501286488378, 'samples': 564864, 'steps': 2941, 'loss/train': 2.142625093460083} -11/06/2021 21:40:48 - INFO - __main__ - Step 2943: {'lr': 0.0004999500225995547, 'samples': 565056, 'steps': 2942, 'loss/train': 2.0483415126800537} -11/06/2021 21:40:48 - INFO - __main__ - Step 2944: {'lr': 0.000499949916437648, 'samples': 565248, 'steps': 2943, 'loss/train': 2.363560199737549} -11/06/2021 21:40:49 - INFO - __main__ - Step 2945: {'lr': 0.0004999498101631177, 'samples': 565440, 'steps': 2944, 'loss/train': 2.750171422958374} -11/06/2021 21:40:49 - INFO - __main__ - Step 2946: {'lr': 0.0004999497037759638, 'samples': 565632, 'steps': 2945, 'loss/train': 2.285203218460083} -11/06/2021 21:40:49 - INFO - __main__ - Step 2947: {'lr': 0.0004999495972761865, 'samples': 565824, 'steps': 2946, 'loss/train': 2.084728479385376} -11/06/2021 21:40:50 - INFO - __main__ - Step 2948: {'lr': 0.0004999494906637857, 'samples': 566016, 'steps': 2947, 'loss/train': 2.138784646987915} -11/06/2021 21:40:51 - INFO - __main__ - Step 2949: {'lr': 0.0004999493839387615, 'samples': 566208, 'steps': 2948, 'loss/train': 0.8493632674217224} -11/06/2021 21:40:51 - INFO - __main__ - Step 2950: {'lr': 0.000499949277101114, 'samples': 566400, 'steps': 2949, 'loss/train': 2.2582223415374756} -11/06/2021 21:40:51 - INFO - __main__ - Step 2951: {'lr': 0.0004999491701508433, 'samples': 566592, 'steps': 2950, 'loss/train': 2.1516506671905518} -11/06/2021 21:40:52 - INFO - __main__ - Step 2952: {'lr': 0.0004999490630879493, 'samples': 566784, 'steps': 2951, 'loss/train': 1.5355583429336548} -11/06/2021 21:40:53 - INFO - __main__ - Step 2953: {'lr': 0.0004999489559124321, 'samples': 566976, 'steps': 2952, 'loss/train': 1.9333853721618652} -11/06/2021 21:40:53 - INFO - __main__ - Step 2954: {'lr': 0.0004999488486242918, 'samples': 567168, 'steps': 2953, 'loss/train': 1.470977783203125} -11/06/2021 21:40:53 - INFO - __main__ - Step 2955: {'lr': 0.0004999487412235284, 'samples': 567360, 'steps': 2954, 'loss/train': 2.435324192047119} -11/06/2021 21:40:54 - INFO - __main__ - Step 2956: {'lr': 0.0004999486337101419, 'samples': 567552, 'steps': 2955, 'loss/train': 2.1768510341644287} -11/06/2021 21:40:54 - INFO - __main__ - Step 2957: {'lr': 0.0004999485260841324, 'samples': 567744, 'steps': 2956, 'loss/train': 2.5534868240356445} -11/06/2021 21:40:55 - INFO - __main__ - Step 2958: {'lr': 0.0004999484183455, 'samples': 567936, 'steps': 2957, 'loss/train': 2.551486015319824} -11/06/2021 21:40:55 - INFO - __main__ - Step 2959: {'lr': 0.0004999483104942446, 'samples': 568128, 'steps': 2958, 'loss/train': 2.710608720779419} -11/06/2021 21:40:56 - INFO - __main__ - Step 2960: {'lr': 0.0004999482025303665, 'samples': 568320, 'steps': 2959, 'loss/train': 2.0834438800811768} -11/06/2021 21:40:56 - INFO - __main__ - Step 2961: {'lr': 0.0004999480944538655, 'samples': 568512, 'steps': 2960, 'loss/train': 2.1335995197296143} -11/06/2021 21:40:57 - INFO - __main__ - Step 2962: {'lr': 0.0004999479862647417, 'samples': 568704, 'steps': 2961, 'loss/train': 1.7323172092437744} -11/06/2021 21:40:57 - INFO - __main__ - Step 2963: {'lr': 0.0004999478779629953, 'samples': 568896, 'steps': 2962, 'loss/train': 1.3542144298553467} -11/06/2021 21:40:58 - INFO - __main__ - Step 2964: {'lr': 0.0004999477695486261, 'samples': 569088, 'steps': 2963, 'loss/train': 2.248361349105835} -11/06/2021 21:40:58 - INFO - __main__ - Step 2965: {'lr': 0.0004999476610216345, 'samples': 569280, 'steps': 2964, 'loss/train': 1.651444673538208} -11/06/2021 21:40:59 - INFO - __main__ - Step 2966: {'lr': 0.0004999475523820203, 'samples': 569472, 'steps': 2965, 'loss/train': 1.6673521995544434} -11/06/2021 21:40:59 - INFO - __main__ - Step 2967: {'lr': 0.0004999474436297835, 'samples': 569664, 'steps': 2966, 'loss/train': 2.576014995574951} -11/06/2021 21:40:59 - INFO - __main__ - Step 2968: {'lr': 0.0004999473347649242, 'samples': 569856, 'steps': 2967, 'loss/train': 2.7090260982513428} -11/06/2021 21:41:00 - INFO - __main__ - Step 2969: {'lr': 0.0004999472257874426, 'samples': 570048, 'steps': 2968, 'loss/train': 2.4172799587249756} -11/06/2021 21:41:01 - INFO - __main__ - Step 2970: {'lr': 0.0004999471166973385, 'samples': 570240, 'steps': 2969, 'loss/train': 2.754880905151367} -11/06/2021 21:41:01 - INFO - __main__ - Step 2971: {'lr': 0.0004999470074946122, 'samples': 570432, 'steps': 2970, 'loss/train': 2.2452704906463623} -11/06/2021 21:41:01 - INFO - __main__ - Step 2972: {'lr': 0.0004999468981792636, 'samples': 570624, 'steps': 2971, 'loss/train': 1.8505585193634033} -11/06/2021 21:41:02 - INFO - __main__ - Step 2973: {'lr': 0.0004999467887512928, 'samples': 570816, 'steps': 2972, 'loss/train': 2.324302911758423} -11/06/2021 21:41:03 - INFO - __main__ - Step 2974: {'lr': 0.0004999466792106998, 'samples': 571008, 'steps': 2973, 'loss/train': 2.198997974395752} -11/06/2021 21:41:03 - INFO - __main__ - Step 2975: {'lr': 0.0004999465695574848, 'samples': 571200, 'steps': 2974, 'loss/train': 2.4964334964752197} -11/06/2021 21:41:03 - INFO - __main__ - Step 2976: {'lr': 0.0004999464597916476, 'samples': 571392, 'steps': 2975, 'loss/train': 2.4963150024414062} -11/06/2021 21:41:04 - INFO - __main__ - Step 2977: {'lr': 0.0004999463499131884, 'samples': 571584, 'steps': 2976, 'loss/train': 2.5181667804718018} -11/06/2021 21:41:04 - INFO - __main__ - Step 2978: {'lr': 0.0004999462399221073, 'samples': 571776, 'steps': 2977, 'loss/train': 3.5236194133758545} -11/06/2021 21:41:05 - INFO - __main__ - Step 2979: {'lr': 0.0004999461298184042, 'samples': 571968, 'steps': 2978, 'loss/train': 2.367652416229248} -11/06/2021 21:41:06 - INFO - __main__ - Step 2980: {'lr': 0.0004999460196020793, 'samples': 572160, 'steps': 2979, 'loss/train': 2.657733201980591} -11/06/2021 21:41:06 - INFO - __main__ - Step 2981: {'lr': 0.0004999459092731326, 'samples': 572352, 'steps': 2980, 'loss/train': 2.142723321914673} -11/06/2021 21:41:06 - INFO - __main__ - Step 2982: {'lr': 0.000499945798831564, 'samples': 572544, 'steps': 2981, 'loss/train': 2.780032157897949} -11/06/2021 21:41:07 - INFO - __main__ - Step 2983: {'lr': 0.0004999456882773737, 'samples': 572736, 'steps': 2982, 'loss/train': 2.4689583778381348} -11/06/2021 21:41:08 - INFO - __main__ - Step 2984: {'lr': 0.0004999455776105618, 'samples': 572928, 'steps': 2983, 'loss/train': 1.9315149784088135} -11/06/2021 21:41:08 - INFO - __main__ - Step 2985: {'lr': 0.0004999454668311283, 'samples': 573120, 'steps': 2984, 'loss/train': 2.1817145347595215} -11/06/2021 21:41:08 - INFO - __main__ - Step 2986: {'lr': 0.0004999453559390731, 'samples': 573312, 'steps': 2985, 'loss/train': 2.152888774871826} -11/06/2021 21:41:09 - INFO - __main__ - Step 2987: {'lr': 0.0004999452449343967, 'samples': 573504, 'steps': 2986, 'loss/train': 2.3532779216766357} -11/06/2021 21:41:09 - INFO - __main__ - Step 2988: {'lr': 0.0004999451338170985, 'samples': 573696, 'steps': 2987, 'loss/train': 2.4001834392547607} -11/06/2021 21:41:10 - INFO - __main__ - Step 2989: {'lr': 0.000499945022587179, 'samples': 573888, 'steps': 2988, 'loss/train': 2.3787949085235596} -11/06/2021 21:41:10 - INFO - __main__ - Step 2990: {'lr': 0.0004999449112446381, 'samples': 574080, 'steps': 2989, 'loss/train': 2.610903263092041} -11/06/2021 21:41:11 - INFO - __main__ - Step 2991: {'lr': 0.000499944799789476, 'samples': 574272, 'steps': 2990, 'loss/train': 2.203000545501709} -11/06/2021 21:41:11 - INFO - __main__ - Step 2992: {'lr': 0.0004999446882216925, 'samples': 574464, 'steps': 2991, 'loss/train': 1.9404032230377197} -11/06/2021 21:41:11 - INFO - __main__ - Step 2993: {'lr': 0.0004999445765412878, 'samples': 574656, 'steps': 2992, 'loss/train': 2.0062878131866455} -11/06/2021 21:41:12 - INFO - __main__ - Step 2994: {'lr': 0.0004999444647482619, 'samples': 574848, 'steps': 2993, 'loss/train': 2.512753963470459} -11/06/2021 21:41:13 - INFO - __main__ - Step 2995: {'lr': 0.0004999443528426149, 'samples': 575040, 'steps': 2994, 'loss/train': 2.4999752044677734} -11/06/2021 21:41:13 - INFO - __main__ - Step 2996: {'lr': 0.0004999442408243469, 'samples': 575232, 'steps': 2995, 'loss/train': 2.140004873275757} -11/06/2021 21:41:13 - INFO - __main__ - Step 2997: {'lr': 0.0004999441286934578, 'samples': 575424, 'steps': 2996, 'loss/train': 2.258283853530884} -11/06/2021 21:41:14 - INFO - __main__ - Step 2998: {'lr': 0.0004999440164499478, 'samples': 575616, 'steps': 2997, 'loss/train': 2.103290557861328} -11/06/2021 21:41:14 - INFO - __main__ - Step 2999: {'lr': 0.0004999439040938168, 'samples': 575808, 'steps': 2998, 'loss/train': 2.217271327972412} -11/06/2021 21:41:15 - INFO - __main__ - Step 3000: {'lr': 0.000499943791625065, 'samples': 576000, 'steps': 2999, 'loss/train': 2.1993706226348877} -11/06/2021 21:41:15 - INFO - __main__ - Step 3001: {'lr': 0.0004999436790436923, 'samples': 576192, 'steps': 3000, 'loss/train': 1.9046951532363892} -11/06/2021 21:41:16 - INFO - __main__ - Step 3002: {'lr': 0.000499943566349699, 'samples': 576384, 'steps': 3001, 'loss/train': 2.5663747787475586} -11/06/2021 21:41:16 - INFO - __main__ - Step 3003: {'lr': 0.0004999434535430848, 'samples': 576576, 'steps': 3002, 'loss/train': 2.3395111560821533} -11/06/2021 21:41:17 - INFO - __main__ - Step 3004: {'lr': 0.0004999433406238501, 'samples': 576768, 'steps': 3003, 'loss/train': 2.3144681453704834} -11/06/2021 21:41:18 - INFO - __main__ - Step 3005: {'lr': 0.0004999432275919947, 'samples': 576960, 'steps': 3004, 'loss/train': 2.3449320793151855} -11/06/2021 21:41:18 - INFO - __main__ - Step 3006: {'lr': 0.0004999431144475187, 'samples': 577152, 'steps': 3005, 'loss/train': 2.1510040760040283} -11/06/2021 21:41:18 - INFO - __main__ - Step 3007: {'lr': 0.0004999430011904222, 'samples': 577344, 'steps': 3006, 'loss/train': 0.7324512004852295} -11/06/2021 21:41:19 - INFO - __main__ - Step 3008: {'lr': 0.0004999428878207054, 'samples': 577536, 'steps': 3007, 'loss/train': 2.3040289878845215} -11/06/2021 21:41:19 - INFO - __main__ - Step 3009: {'lr': 0.000499942774338368, 'samples': 577728, 'steps': 3008, 'loss/train': 2.3875339031219482} -11/06/2021 21:41:20 - INFO - __main__ - Step 3010: {'lr': 0.0004999426607434104, 'samples': 577920, 'steps': 3009, 'loss/train': 2.562206268310547} -11/06/2021 21:41:20 - INFO - __main__ - Step 3011: {'lr': 0.0004999425470358324, 'samples': 578112, 'steps': 3010, 'loss/train': 2.1042847633361816} -11/06/2021 21:41:21 - INFO - __main__ - Step 3012: {'lr': 0.0004999424332156341, 'samples': 578304, 'steps': 3011, 'loss/train': 1.8335940837860107} -11/06/2021 21:41:21 - INFO - __main__ - Step 3013: {'lr': 0.0004999423192828156, 'samples': 578496, 'steps': 3012, 'loss/train': 2.3943774700164795} -11/06/2021 21:41:21 - INFO - __main__ - Step 3014: {'lr': 0.0004999422052373771, 'samples': 578688, 'steps': 3013, 'loss/train': 2.3687760829925537} -11/06/2021 21:41:23 - INFO - __main__ - Step 3015: {'lr': 0.0004999420910793183, 'samples': 578880, 'steps': 3014, 'loss/train': 2.2933881282806396} -11/06/2021 21:41:23 - INFO - __main__ - Step 3016: {'lr': 0.0004999419768086397, 'samples': 579072, 'steps': 3015, 'loss/train': 2.4723987579345703} -11/06/2021 21:41:23 - INFO - __main__ - Step 3017: {'lr': 0.0004999418624253408, 'samples': 579264, 'steps': 3016, 'loss/train': 2.3024117946624756} -11/06/2021 21:41:24 - INFO - __main__ - Step 3018: {'lr': 0.0004999417479294221, 'samples': 579456, 'steps': 3017, 'loss/train': 2.373169183731079} -11/06/2021 21:41:24 - INFO - __main__ - Step 3019: {'lr': 0.0004999416333208835, 'samples': 579648, 'steps': 3018, 'loss/train': 1.6759024858474731} -11/06/2021 21:41:25 - INFO - __main__ - Step 3020: {'lr': 0.0004999415185997252, 'samples': 579840, 'steps': 3019, 'loss/train': 2.323343515396118} -11/06/2021 21:41:25 - INFO - __main__ - Step 3021: {'lr': 0.0004999414037659468, 'samples': 580032, 'steps': 3020, 'loss/train': 1.5138059854507446} -11/06/2021 21:41:26 - INFO - __main__ - Step 3022: {'lr': 0.000499941288819549, 'samples': 580224, 'steps': 3021, 'loss/train': 1.5361846685409546} -11/06/2021 21:41:26 - INFO - __main__ - Step 3023: {'lr': 0.0004999411737605313, 'samples': 580416, 'steps': 3022, 'loss/train': 1.946350336074829} -11/06/2021 21:41:27 - INFO - __main__ - Step 3024: {'lr': 0.000499941058588894, 'samples': 580608, 'steps': 3023, 'loss/train': 2.60408091545105} -11/06/2021 21:41:28 - INFO - __main__ - Step 3025: {'lr': 0.0004999409433046371, 'samples': 580800, 'steps': 3024, 'loss/train': 2.4534120559692383} -11/06/2021 21:41:28 - INFO - __main__ - Step 3026: {'lr': 0.0004999408279077607, 'samples': 580992, 'steps': 3025, 'loss/train': 2.68884015083313} -11/06/2021 21:41:29 - INFO - __main__ - Step 3027: {'lr': 0.0004999407123982649, 'samples': 581184, 'steps': 3026, 'loss/train': 2.0190529823303223} -11/06/2021 21:41:29 - INFO - __main__ - Step 3028: {'lr': 0.0004999405967761495, 'samples': 581376, 'steps': 3027, 'loss/train': 1.0339617729187012} -11/06/2021 21:41:29 - INFO - __main__ - Step 3029: {'lr': 0.0004999404810414149, 'samples': 581568, 'steps': 3028, 'loss/train': 0.895268440246582} -11/06/2021 21:41:31 - INFO - __main__ - Step 3030: {'lr': 0.0004999403651940608, 'samples': 581760, 'steps': 3029, 'loss/train': 2.5212795734405518} -11/06/2021 21:41:31 - INFO - __main__ - Step 3031: {'lr': 0.0004999402492340875, 'samples': 581952, 'steps': 3030, 'loss/train': 2.4372713565826416} -11/06/2021 21:41:31 - INFO - __main__ - Step 3032: {'lr': 0.000499940133161495, 'samples': 582144, 'steps': 3031, 'loss/train': 2.357042074203491} -11/06/2021 21:41:32 - INFO - __main__ - Step 3033: {'lr': 0.0004999400169762834, 'samples': 582336, 'steps': 3032, 'loss/train': 1.6500097513198853} -11/06/2021 21:41:32 - INFO - __main__ - Step 3034: {'lr': 0.0004999399006784525, 'samples': 582528, 'steps': 3033, 'loss/train': 2.2816481590270996} -11/06/2021 21:41:33 - INFO - __main__ - Step 3035: {'lr': 0.0004999397842680027, 'samples': 582720, 'steps': 3034, 'loss/train': 2.364650249481201} -11/06/2021 21:41:33 - INFO - __main__ - Step 3036: {'lr': 0.0004999396677449338, 'samples': 582912, 'steps': 3035, 'loss/train': 0.6538060307502747} -11/06/2021 21:41:34 - INFO - __main__ - Step 3037: {'lr': 0.000499939551109246, 'samples': 583104, 'steps': 3036, 'loss/train': 2.646855354309082} -11/06/2021 21:41:34 - INFO - __main__ - Step 3038: {'lr': 0.0004999394343609393, 'samples': 583296, 'steps': 3037, 'loss/train': 2.262348175048828} -11/06/2021 21:41:34 - INFO - __main__ - Step 3039: {'lr': 0.0004999393175000137, 'samples': 583488, 'steps': 3038, 'loss/train': 2.1946680545806885} -11/06/2021 21:41:35 - INFO - __main__ - Step 3040: {'lr': 0.0004999392005264694, 'samples': 583680, 'steps': 3039, 'loss/train': 2.3588778972625732} -11/06/2021 21:41:36 - INFO - __main__ - Step 3041: {'lr': 0.0004999390834403062, 'samples': 583872, 'steps': 3040, 'loss/train': 1.918365716934204} -11/06/2021 21:41:36 - INFO - __main__ - Step 3042: {'lr': 0.0004999389662415244, 'samples': 584064, 'steps': 3041, 'loss/train': 2.238910436630249} -11/06/2021 21:41:37 - INFO - __main__ - Step 3043: {'lr': 0.000499938848930124, 'samples': 584256, 'steps': 3042, 'loss/train': 1.9267772436141968} -11/06/2021 21:41:37 - INFO - __main__ - Step 3044: {'lr': 0.0004999387315061049, 'samples': 584448, 'steps': 3043, 'loss/train': 2.763803005218506} -11/06/2021 21:41:37 - INFO - __main__ - Step 3045: {'lr': 0.0004999386139694673, 'samples': 584640, 'steps': 3044, 'loss/train': 5.723489761352539} -11/06/2021 21:41:38 - INFO - __main__ - Step 3046: {'lr': 0.0004999384963202113, 'samples': 584832, 'steps': 3045, 'loss/train': 2.657350778579712} -11/06/2021 21:41:39 - INFO - __main__ - Step 3047: {'lr': 0.0004999383785583368, 'samples': 585024, 'steps': 3046, 'loss/train': 2.1708598136901855} -11/06/2021 21:41:39 - INFO - __main__ - Step 3048: {'lr': 0.0004999382606838439, 'samples': 585216, 'steps': 3047, 'loss/train': 2.4225125312805176} -11/06/2021 21:41:39 - INFO - __main__ - Step 3049: {'lr': 0.0004999381426967327, 'samples': 585408, 'steps': 3048, 'loss/train': 2.1795241832733154} -11/06/2021 21:41:40 - INFO - __main__ - Step 3050: {'lr': 0.0004999380245970033, 'samples': 585600, 'steps': 3049, 'loss/train': 2.3345532417297363} -11/06/2021 21:41:40 - INFO - __main__ - Step 3051: {'lr': 0.0004999379063846555, 'samples': 585792, 'steps': 3050, 'loss/train': 2.1658904552459717} -11/06/2021 21:41:41 - INFO - __main__ - Step 3052: {'lr': 0.0004999377880596897, 'samples': 585984, 'steps': 3051, 'loss/train': 2.3104407787323} -11/06/2021 21:41:41 - INFO - __main__ - Step 3053: {'lr': 0.0004999376696221057, 'samples': 586176, 'steps': 3052, 'loss/train': 2.1022863388061523} -11/06/2021 21:41:42 - INFO - __main__ - Step 3054: {'lr': 0.0004999375510719037, 'samples': 586368, 'steps': 3053, 'loss/train': 2.1373109817504883} -11/06/2021 21:41:42 - INFO - __main__ - Step 3055: {'lr': 0.0004999374324090837, 'samples': 586560, 'steps': 3054, 'loss/train': 2.6458959579467773} -11/06/2021 21:41:43 - INFO - __main__ - Step 3056: {'lr': 0.0004999373136336457, 'samples': 586752, 'steps': 3055, 'loss/train': 2.1818501949310303} -11/06/2021 21:41:44 - INFO - __main__ - Step 3057: {'lr': 0.0004999371947455899, 'samples': 586944, 'steps': 3056, 'loss/train': 3.2870852947235107} -11/06/2021 21:41:44 - INFO - __main__ - Step 3058: {'lr': 0.0004999370757449162, 'samples': 587136, 'steps': 3057, 'loss/train': 1.6503088474273682} -11/06/2021 21:41:45 - INFO - __main__ - Step 3059: {'lr': 0.0004999369566316247, 'samples': 587328, 'steps': 3058, 'loss/train': 3.2985236644744873} -11/06/2021 21:41:45 - INFO - __main__ - Step 3060: {'lr': 0.0004999368374057155, 'samples': 587520, 'steps': 3059, 'loss/train': 2.637629985809326} -11/06/2021 21:41:45 - INFO - __main__ - Step 3061: {'lr': 0.0004999367180671886, 'samples': 587712, 'steps': 3060, 'loss/train': 2.058300733566284} -11/06/2021 21:41:46 - INFO - __main__ - Step 3062: {'lr': 0.000499936598616044, 'samples': 587904, 'steps': 3061, 'loss/train': 2.2234086990356445} -11/06/2021 21:41:46 - INFO - __main__ - Step 3063: {'lr': 0.0004999364790522819, 'samples': 588096, 'steps': 3062, 'loss/train': 1.9552711248397827} -11/06/2021 21:41:47 - INFO - __main__ - Step 3064: {'lr': 0.0004999363593759022, 'samples': 588288, 'steps': 3063, 'loss/train': 2.5826447010040283} -11/06/2021 21:41:47 - INFO - __main__ - Step 3065: {'lr': 0.0004999362395869052, 'samples': 588480, 'steps': 3064, 'loss/train': 2.5143256187438965} -11/06/2021 21:41:48 - INFO - __main__ - Step 3066: {'lr': 0.0004999361196852906, 'samples': 588672, 'steps': 3065, 'loss/train': 2.092707633972168} -11/06/2021 21:41:48 - INFO - __main__ - Step 3067: {'lr': 0.0004999359996710588, 'samples': 588864, 'steps': 3066, 'loss/train': 2.1652286052703857} -11/06/2021 21:41:49 - INFO - __main__ - Step 3068: {'lr': 0.0004999358795442096, 'samples': 589056, 'steps': 3067, 'loss/train': 2.3341615200042725} -11/06/2021 21:41:50 - INFO - __main__ - Step 3069: {'lr': 0.0004999357593047431, 'samples': 589248, 'steps': 3068, 'loss/train': 1.7487068176269531} -11/06/2021 21:41:50 - INFO - __main__ - Step 3070: {'lr': 0.0004999356389526595, 'samples': 589440, 'steps': 3069, 'loss/train': 2.2745633125305176} -11/06/2021 21:41:50 - INFO - __main__ - Step 3071: {'lr': 0.0004999355184879587, 'samples': 589632, 'steps': 3070, 'loss/train': 1.911078691482544} -11/06/2021 21:41:51 - INFO - __main__ - Step 3072: {'lr': 0.0004999353979106409, 'samples': 589824, 'steps': 3071, 'loss/train': 2.032170057296753} -11/06/2021 21:41:52 - INFO - __main__ - Step 3073: {'lr': 0.000499935277220706, 'samples': 590016, 'steps': 3072, 'loss/train': 0.5505169034004211} -11/06/2021 21:41:52 - INFO - __main__ - Step 3074: {'lr': 0.0004999351564181541, 'samples': 590208, 'steps': 3073, 'loss/train': 2.0557284355163574} -11/06/2021 21:41:53 - INFO - __main__ - Step 3075: {'lr': 0.0004999350355029854, 'samples': 590400, 'steps': 3074, 'loss/train': 2.871734857559204} -11/06/2021 21:41:53 - INFO - __main__ - Step 3076: {'lr': 0.0004999349144751997, 'samples': 590592, 'steps': 3075, 'loss/train': 2.093614339828491} -11/06/2021 21:41:53 - INFO - __main__ - Step 3077: {'lr': 0.0004999347933347972, 'samples': 590784, 'steps': 3076, 'loss/train': 2.2639260292053223} -11/06/2021 21:41:55 - INFO - __main__ - Step 3078: {'lr': 0.0004999346720817779, 'samples': 590976, 'steps': 3077, 'loss/train': 1.5730407238006592} -11/06/2021 21:41:55 - INFO - __main__ - Step 3079: {'lr': 0.000499934550716142, 'samples': 591168, 'steps': 3078, 'loss/train': 2.4267160892486572} -11/06/2021 21:41:55 - INFO - __main__ - Step 3080: {'lr': 0.0004999344292378893, 'samples': 591360, 'steps': 3079, 'loss/train': 3.6418893337249756} -11/06/2021 21:41:56 - INFO - __main__ - Step 3081: {'lr': 0.0004999343076470202, 'samples': 591552, 'steps': 3080, 'loss/train': 1.6918516159057617} -11/06/2021 21:41:56 - INFO - __main__ - Step 3082: {'lr': 0.0004999341859435345, 'samples': 591744, 'steps': 3081, 'loss/train': 2.610215902328491} -11/06/2021 21:41:57 - INFO - __main__ - Step 3083: {'lr': 0.0004999340641274322, 'samples': 591936, 'steps': 3082, 'loss/train': 2.330768346786499} -11/06/2021 21:41:57 - INFO - __main__ - Step 3084: {'lr': 0.0004999339421987136, 'samples': 592128, 'steps': 3083, 'loss/train': 1.9727678298950195} -11/06/2021 21:41:58 - INFO - __main__ - Step 3085: {'lr': 0.0004999338201573786, 'samples': 592320, 'steps': 3084, 'loss/train': 2.6285154819488525} -11/06/2021 21:41:58 - INFO - __main__ - Step 3086: {'lr': 0.0004999336980034271, 'samples': 592512, 'steps': 3085, 'loss/train': 2.5483882427215576} -11/06/2021 21:41:59 - INFO - __main__ - Step 3087: {'lr': 0.0004999335757368595, 'samples': 592704, 'steps': 3086, 'loss/train': 2.4830641746520996} -11/06/2021 21:41:59 - INFO - __main__ - Step 3088: {'lr': 0.0004999334533576757, 'samples': 592896, 'steps': 3087, 'loss/train': 2.06929087638855} -11/06/2021 21:41:59 - INFO - __main__ - Step 3089: {'lr': 0.0004999333308658756, 'samples': 593088, 'steps': 3088, 'loss/train': 2.439222812652588} -11/06/2021 21:42:01 - INFO - __main__ - Step 3090: {'lr': 0.0004999332082614597, 'samples': 593280, 'steps': 3089, 'loss/train': 1.6735726594924927} -11/06/2021 21:42:01 - INFO - __main__ - Step 3091: {'lr': 0.0004999330855444274, 'samples': 593472, 'steps': 3090, 'loss/train': 2.4830446243286133} -11/06/2021 21:42:01 - INFO - __main__ - Step 3092: {'lr': 0.0004999329627147792, 'samples': 593664, 'steps': 3091, 'loss/train': 1.9454426765441895} -11/06/2021 21:42:02 - INFO - __main__ - Step 3093: {'lr': 0.0004999328397725152, 'samples': 593856, 'steps': 3092, 'loss/train': 2.445350408554077} -11/06/2021 21:42:02 - INFO - __main__ - Step 3094: {'lr': 0.0004999327167176352, 'samples': 594048, 'steps': 3093, 'loss/train': 2.219423532485962} -11/06/2021 21:42:02 - INFO - __main__ - Step 3095: {'lr': 0.0004999325935501395, 'samples': 594240, 'steps': 3094, 'loss/train': 2.2615649700164795} -11/06/2021 21:42:03 - INFO - __main__ - Step 3096: {'lr': 0.0004999324702700279, 'samples': 594432, 'steps': 3095, 'loss/train': 2.060243844985962} -11/06/2021 21:42:04 - INFO - __main__ - Step 3097: {'lr': 0.0004999323468773007, 'samples': 594624, 'steps': 3096, 'loss/train': 1.7364767789840698} -11/06/2021 21:42:04 - INFO - __main__ - Step 3098: {'lr': 0.0004999322233719578, 'samples': 594816, 'steps': 3097, 'loss/train': 2.3466086387634277} -11/06/2021 21:42:04 - INFO - __main__ - Step 3099: {'lr': 0.0004999320997539992, 'samples': 595008, 'steps': 3098, 'loss/train': 2.1478734016418457} -11/06/2021 21:42:05 - INFO - __main__ - Step 3100: {'lr': 0.0004999319760234251, 'samples': 595200, 'steps': 3099, 'loss/train': 1.8214367628097534} -11/06/2021 21:42:06 - INFO - __main__ - Step 3101: {'lr': 0.0004999318521802356, 'samples': 595392, 'steps': 3100, 'loss/train': 2.0618221759796143} -11/06/2021 21:42:06 - INFO - __main__ - Step 3102: {'lr': 0.0004999317282244305, 'samples': 595584, 'steps': 3101, 'loss/train': 2.218130350112915} -11/06/2021 21:42:07 - INFO - __main__ - Step 3103: {'lr': 0.0004999316041560102, 'samples': 595776, 'steps': 3102, 'loss/train': 1.9381036758422852} -11/06/2021 21:42:07 - INFO - __main__ - Step 3104: {'lr': 0.0004999314799749745, 'samples': 595968, 'steps': 3103, 'loss/train': 3.2617650032043457} -11/06/2021 21:42:07 - INFO - __main__ - Step 3105: {'lr': 0.0004999313556813235, 'samples': 596160, 'steps': 3104, 'loss/train': 2.255150079727173} -11/06/2021 21:42:08 - INFO - __main__ - Step 3106: {'lr': 0.0004999312312750573, 'samples': 596352, 'steps': 3105, 'loss/train': 1.6376298666000366} -11/06/2021 21:42:09 - INFO - __main__ - Step 3107: {'lr': 0.000499931106756176, 'samples': 596544, 'steps': 3106, 'loss/train': 2.3858001232147217} -11/06/2021 21:42:09 - INFO - __main__ - Step 3108: {'lr': 0.0004999309821246795, 'samples': 596736, 'steps': 3107, 'loss/train': 2.6677393913269043} -11/06/2021 21:42:10 - INFO - __main__ - Step 3109: {'lr': 0.000499930857380568, 'samples': 596928, 'steps': 3108, 'loss/train': 1.4987972974777222} -11/06/2021 21:42:10 - INFO - __main__ - Step 3110: {'lr': 0.0004999307325238416, 'samples': 597120, 'steps': 3109, 'loss/train': 1.9903048276901245} -11/06/2021 21:42:10 - INFO - __main__ - Step 3111: {'lr': 0.0004999306075545002, 'samples': 597312, 'steps': 3110, 'loss/train': 2.7295010089874268} -11/06/2021 21:42:11 - INFO - __main__ - Step 3112: {'lr': 0.0004999304824725439, 'samples': 597504, 'steps': 3111, 'loss/train': 2.1662516593933105} -11/06/2021 21:42:12 - INFO - __main__ - Step 3113: {'lr': 0.0004999303572779727, 'samples': 597696, 'steps': 3112, 'loss/train': 1.8486442565917969} -11/06/2021 21:42:12 - INFO - __main__ - Step 3114: {'lr': 0.0004999302319707869, 'samples': 597888, 'steps': 3113, 'loss/train': 2.575617551803589} -11/06/2021 21:42:12 - INFO - __main__ - Step 3115: {'lr': 0.0004999301065509863, 'samples': 598080, 'steps': 3114, 'loss/train': 2.4557383060455322} -11/06/2021 21:42:13 - INFO - __main__ - Step 3116: {'lr': 0.0004999299810185712, 'samples': 598272, 'steps': 3115, 'loss/train': 1.887520670890808} -11/06/2021 21:42:14 - INFO - __main__ - Step 3117: {'lr': 0.0004999298553735413, 'samples': 598464, 'steps': 3116, 'loss/train': 2.2960591316223145} -11/06/2021 21:42:14 - INFO - __main__ - Step 3118: {'lr': 0.000499929729615897, 'samples': 598656, 'steps': 3117, 'loss/train': 2.5776569843292236} -11/06/2021 21:42:14 - INFO - __main__ - Step 3119: {'lr': 0.0004999296037456381, 'samples': 598848, 'steps': 3118, 'loss/train': 2.3189525604248047} -11/06/2021 21:42:15 - INFO - __main__ - Step 3120: {'lr': 0.0004999294777627649, 'samples': 599040, 'steps': 3119, 'loss/train': 1.3478337526321411} -11/06/2021 21:42:15 - INFO - __main__ - Step 3121: {'lr': 0.0004999293516672773, 'samples': 599232, 'steps': 3120, 'loss/train': 2.864377021789551} -11/06/2021 21:42:16 - INFO - __main__ - Step 3122: {'lr': 0.0004999292254591754, 'samples': 599424, 'steps': 3121, 'loss/train': 2.7079334259033203} -11/06/2021 21:42:16 - INFO - __main__ - Step 3123: {'lr': 0.0004999290991384591, 'samples': 599616, 'steps': 3122, 'loss/train': 2.133533477783203} -11/06/2021 21:42:17 - INFO - __main__ - Step 3124: {'lr': 0.0004999289727051289, 'samples': 599808, 'steps': 3123, 'loss/train': 2.1969847679138184} -11/06/2021 21:42:17 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 1.7113127708435059} -11/06/2021 21:42:17 - INFO - __main__ - Step 3126: {'lr': 0.0004999287195006257, 'samples': 600192, 'steps': 3125, 'loss/train': 2.617366313934326} -11/06/2021 21:42:19 - INFO - __main__ - Step 3127: {'lr': 0.000499928592729453, 'samples': 600384, 'steps': 3126, 'loss/train': 2.459381103515625} -11/06/2021 21:42:19 - INFO - __main__ - Step 3128: {'lr': 0.0004999284658456665, 'samples': 600576, 'steps': 3127, 'loss/train': 2.3718807697296143} -11/06/2021 21:42:19 - INFO - __main__ - Step 3129: {'lr': 0.000499928338849266, 'samples': 600768, 'steps': 3128, 'loss/train': 2.543180465698242} -11/06/2021 21:42:20 - INFO - __main__ - Step 3130: {'lr': 0.0004999282117402516, 'samples': 600960, 'steps': 3129, 'loss/train': 1.7423886060714722} -11/06/2021 21:42:20 - INFO - __main__ - Step 3131: {'lr': 0.0004999280845186235, 'samples': 601152, 'steps': 3130, 'loss/train': 2.2052173614501953} -11/06/2021 21:42:21 - INFO - __main__ - Step 3132: {'lr': 0.0004999279571843816, 'samples': 601344, 'steps': 3131, 'loss/train': 1.9484204053878784} -11/06/2021 21:42:22 - INFO - __main__ - Step 3133: {'lr': 0.000499927829737526, 'samples': 601536, 'steps': 3132, 'loss/train': 2.428269147872925} -11/06/2021 21:42:22 - INFO - __main__ - Step 3134: {'lr': 0.0004999277021780569, 'samples': 601728, 'steps': 3133, 'loss/train': 2.089491128921509} -11/06/2021 21:42:22 - INFO - __main__ - Step 3135: {'lr': 0.0004999275745059741, 'samples': 601920, 'steps': 3134, 'loss/train': 2.9237546920776367} -11/06/2021 21:42:23 - INFO - __main__ - Step 3136: {'lr': 0.0004999274467212779, 'samples': 602112, 'steps': 3135, 'loss/train': 2.297293186187744} -11/06/2021 21:42:23 - INFO - __main__ - Step 3137: {'lr': 0.0004999273188239681, 'samples': 602304, 'steps': 3136, 'loss/train': 2.1000170707702637} -11/06/2021 21:42:24 - INFO - __main__ - Step 3138: {'lr': 0.0004999271908140451, 'samples': 602496, 'steps': 3137, 'loss/train': 2.391845703125} -11/06/2021 21:42:24 - INFO - __main__ - Step 3139: {'lr': 0.0004999270626915086, 'samples': 602688, 'steps': 3138, 'loss/train': 2.167910099029541} -11/06/2021 21:42:25 - INFO - __main__ - Step 3140: {'lr': 0.0004999269344563589, 'samples': 602880, 'steps': 3139, 'loss/train': 2.10351300239563} -11/06/2021 21:42:25 - INFO - __main__ - Step 3141: {'lr': 0.0004999268061085959, 'samples': 603072, 'steps': 3140, 'loss/train': 2.418550968170166} -11/06/2021 21:42:25 - INFO - __main__ - Step 3142: {'lr': 0.0004999266776482199, 'samples': 603264, 'steps': 3141, 'loss/train': 2.0939297676086426} -11/06/2021 21:42:27 - INFO - __main__ - Step 3143: {'lr': 0.0004999265490752306, 'samples': 603456, 'steps': 3142, 'loss/train': 2.4321014881134033} -11/06/2021 21:42:27 - INFO - __main__ - Step 3144: {'lr': 0.0004999264203896284, 'samples': 603648, 'steps': 3143, 'loss/train': 2.1129066944122314} -11/06/2021 21:42:27 - INFO - __main__ - Step 3145: {'lr': 0.0004999262915914132, 'samples': 603840, 'steps': 3144, 'loss/train': 1.9223228693008423} -11/06/2021 21:42:28 - INFO - __main__ - Step 3146: {'lr': 0.000499926162680585, 'samples': 604032, 'steps': 3145, 'loss/train': 1.9708632230758667} -11/06/2021 21:42:28 - INFO - __main__ - Step 3147: {'lr': 0.000499926033657144, 'samples': 604224, 'steps': 3146, 'loss/train': 2.535964250564575} -11/06/2021 21:42:29 - INFO - __main__ - Step 3148: {'lr': 0.0004999259045210901, 'samples': 604416, 'steps': 3147, 'loss/train': 1.4385805130004883} -11/06/2021 21:42:29 - INFO - __main__ - Step 3149: {'lr': 0.0004999257752724234, 'samples': 604608, 'steps': 3148, 'loss/train': 2.0960731506347656} -11/06/2021 21:42:30 - INFO - __main__ - Step 3150: {'lr': 0.0004999256459111443, 'samples': 604800, 'steps': 3149, 'loss/train': 1.577193021774292} -11/06/2021 21:42:30 - INFO - __main__ - Step 3151: {'lr': 0.0004999255164372523, 'samples': 604992, 'steps': 3150, 'loss/train': 1.8809454441070557} -11/06/2021 21:42:30 - INFO - __main__ - Step 3152: {'lr': 0.0004999253868507476, 'samples': 605184, 'steps': 3151, 'loss/train': 2.5812270641326904} -11/06/2021 21:42:31 - INFO - __main__ - Step 3153: {'lr': 0.0004999252571516306, 'samples': 605376, 'steps': 3152, 'loss/train': 2.324453353881836} -11/06/2021 21:42:32 - INFO - __main__ - Step 3154: {'lr': 0.0004999251273399011, 'samples': 605568, 'steps': 3153, 'loss/train': 1.5840191841125488} -11/06/2021 21:42:32 - INFO - __main__ - Step 3155: {'lr': 0.0004999249974155592, 'samples': 605760, 'steps': 3154, 'loss/train': 2.419705390930176} -11/06/2021 21:42:33 - INFO - __main__ - Step 3156: {'lr': 0.0004999248673786049, 'samples': 605952, 'steps': 3155, 'loss/train': 1.7660547494888306} -11/06/2021 21:42:33 - INFO - __main__ - Step 3157: {'lr': 0.0004999247372290383, 'samples': 606144, 'steps': 3156, 'loss/train': 3.5126683712005615} -11/06/2021 21:42:33 - INFO - __main__ - Step 3158: {'lr': 0.0004999246069668596, 'samples': 606336, 'steps': 3157, 'loss/train': 2.0734901428222656} -11/06/2021 21:42:34 - INFO - __main__ - Step 3159: {'lr': 0.0004999244765920687, 'samples': 606528, 'steps': 3158, 'loss/train': 2.5572397708892822} -11/06/2021 21:42:35 - INFO - __main__ - Step 3160: {'lr': 0.0004999243461046656, 'samples': 606720, 'steps': 3159, 'loss/train': 1.9452892541885376} -11/06/2021 21:42:35 - INFO - __main__ - Step 3161: {'lr': 0.0004999242155046504, 'samples': 606912, 'steps': 3160, 'loss/train': 0.912672221660614} -11/06/2021 21:42:35 - INFO - __main__ - Step 3162: {'lr': 0.0004999240847920233, 'samples': 607104, 'steps': 3161, 'loss/train': 1.7738767862319946} -11/06/2021 21:42:36 - INFO - __main__ - Step 3163: {'lr': 0.0004999239539667842, 'samples': 607296, 'steps': 3162, 'loss/train': 1.6333916187286377} -11/06/2021 21:42:37 - INFO - __main__ - Step 3164: {'lr': 0.0004999238230289333, 'samples': 607488, 'steps': 3163, 'loss/train': 2.6016409397125244} -11/06/2021 21:42:37 - INFO - __main__ - Step 3165: {'lr': 0.0004999236919784705, 'samples': 607680, 'steps': 3164, 'loss/train': 2.146538734436035} -11/06/2021 21:42:37 - INFO - __main__ - Step 3166: {'lr': 0.0004999235608153961, 'samples': 607872, 'steps': 3165, 'loss/train': 1.9972015619277954} -11/06/2021 21:42:38 - INFO - __main__ - Step 3167: {'lr': 0.0004999234295397098, 'samples': 608064, 'steps': 3166, 'loss/train': 2.117999315261841} -11/06/2021 21:42:38 - INFO - __main__ - Step 3168: {'lr': 0.000499923298151412, 'samples': 608256, 'steps': 3167, 'loss/train': 2.080382823944092} -11/06/2021 21:42:39 - INFO - __main__ - Step 3169: {'lr': 0.0004999231666505025, 'samples': 608448, 'steps': 3168, 'loss/train': 2.333287239074707} -11/06/2021 21:42:39 - INFO - __main__ - Step 3170: {'lr': 0.0004999230350369816, 'samples': 608640, 'steps': 3169, 'loss/train': 2.8902382850646973} -11/06/2021 21:42:40 - INFO - __main__ - Step 3171: {'lr': 0.0004999229033108492, 'samples': 608832, 'steps': 3170, 'loss/train': 1.6683903932571411} -11/06/2021 21:42:40 - INFO - __main__ - Step 3172: {'lr': 0.0004999227714721054, 'samples': 609024, 'steps': 3171, 'loss/train': 1.9496757984161377} -11/06/2021 21:42:40 - INFO - __main__ - Step 3173: {'lr': 0.0004999226395207501, 'samples': 609216, 'steps': 3172, 'loss/train': 2.0327744483947754} -11/06/2021 21:42:41 - INFO - __main__ - Step 3174: {'lr': 0.0004999225074567837, 'samples': 609408, 'steps': 3173, 'loss/train': 2.1947336196899414} -11/06/2021 21:42:42 - INFO - __main__ - Step 3175: {'lr': 0.000499922375280206, 'samples': 609600, 'steps': 3174, 'loss/train': 2.3255155086517334} -11/06/2021 21:42:42 - INFO - __main__ - Step 3176: {'lr': 0.0004999222429910171, 'samples': 609792, 'steps': 3175, 'loss/train': 2.275817394256592} -11/06/2021 21:42:42 - INFO - __main__ - Step 3177: {'lr': 0.0004999221105892172, 'samples': 609984, 'steps': 3176, 'loss/train': 2.14980411529541} -11/06/2021 21:42:43 - INFO - __main__ - Step 3178: {'lr': 0.0004999219780748062, 'samples': 610176, 'steps': 3177, 'loss/train': 3.107052803039551} -11/06/2021 21:42:44 - INFO - __main__ - Step 3179: {'lr': 0.0004999218454477843, 'samples': 610368, 'steps': 3178, 'loss/train': 1.9000006914138794} -11/06/2021 21:42:44 - INFO - __main__ - Step 3180: {'lr': 0.0004999217127081514, 'samples': 610560, 'steps': 3179, 'loss/train': 2.2246599197387695} -11/06/2021 21:42:44 - INFO - __main__ - Step 3181: {'lr': 0.0004999215798559076, 'samples': 610752, 'steps': 3180, 'loss/train': 2.3011488914489746} -11/06/2021 21:42:45 - INFO - __main__ - Step 3182: {'lr': 0.000499921446891053, 'samples': 610944, 'steps': 3181, 'loss/train': 2.965468168258667} -11/06/2021 21:42:45 - INFO - __main__ - Step 3183: {'lr': 0.0004999213138135877, 'samples': 611136, 'steps': 3182, 'loss/train': 2.451305389404297} -11/06/2021 21:42:46 - INFO - __main__ - Step 3184: {'lr': 0.0004999211806235117, 'samples': 611328, 'steps': 3183, 'loss/train': 2.616995334625244} -11/06/2021 21:42:47 - INFO - __main__ - Step 3185: {'lr': 0.000499921047320825, 'samples': 611520, 'steps': 3184, 'loss/train': 1.994917869567871} -11/06/2021 21:42:47 - INFO - __main__ - Step 3186: {'lr': 0.0004999209139055278, 'samples': 611712, 'steps': 3185, 'loss/train': 2.5971717834472656} -11/06/2021 21:42:47 - INFO - __main__ - Step 3187: {'lr': 0.0004999207803776201, 'samples': 611904, 'steps': 3186, 'loss/train': 2.031585693359375} -11/06/2021 21:42:48 - INFO - __main__ - Step 3188: {'lr': 0.000499920646737102, 'samples': 612096, 'steps': 3187, 'loss/train': 2.4705827236175537} -11/06/2021 21:42:48 - INFO - __main__ - Step 3189: {'lr': 0.0004999205129839734, 'samples': 612288, 'steps': 3188, 'loss/train': 2.301380157470703} -11/06/2021 21:42:49 - INFO - __main__ - Step 3190: {'lr': 0.0004999203791182345, 'samples': 612480, 'steps': 3189, 'loss/train': 2.5135273933410645} -11/06/2021 21:42:49 - INFO - __main__ - Step 3191: {'lr': 0.0004999202451398853, 'samples': 612672, 'steps': 3190, 'loss/train': 2.0862905979156494} -11/06/2021 21:42:50 - INFO - __main__ - Step 3192: {'lr': 0.000499920111048926, 'samples': 612864, 'steps': 3191, 'loss/train': 2.3521876335144043} -11/06/2021 21:42:50 - INFO - __main__ - Step 3193: {'lr': 0.0004999199768453565, 'samples': 613056, 'steps': 3192, 'loss/train': 5.900242328643799} -11/06/2021 21:42:50 - INFO - __main__ - Step 3194: {'lr': 0.0004999198425291769, 'samples': 613248, 'steps': 3193, 'loss/train': 2.1287336349487305} -11/06/2021 21:42:52 - INFO - __main__ - Step 3195: {'lr': 0.0004999197081003873, 'samples': 613440, 'steps': 3194, 'loss/train': 1.8804785013198853} -11/06/2021 21:42:52 - INFO - __main__ - Step 3196: {'lr': 0.0004999195735589877, 'samples': 613632, 'steps': 3195, 'loss/train': 2.1079533100128174} -11/06/2021 21:42:52 - INFO - __main__ - Step 3197: {'lr': 0.0004999194389049783, 'samples': 613824, 'steps': 3196, 'loss/train': 2.4482831954956055} -11/06/2021 21:42:53 - INFO - __main__ - Step 3198: {'lr': 0.0004999193041383588, 'samples': 614016, 'steps': 3197, 'loss/train': 2.2492079734802246} -11/06/2021 21:42:53 - INFO - __main__ - Step 3199: {'lr': 0.0004999191692591299, 'samples': 614208, 'steps': 3198, 'loss/train': 1.8088970184326172} -11/06/2021 21:42:54 - INFO - __main__ - Step 3200: {'lr': 0.000499919034267291, 'samples': 614400, 'steps': 3199, 'loss/train': 2.175657272338867} -11/06/2021 21:42:54 - INFO - __main__ - Step 3201: {'lr': 0.0004999188991628425, 'samples': 614592, 'steps': 3200, 'loss/train': 2.242400646209717} -11/06/2021 21:42:55 - INFO - __main__ - Step 3202: {'lr': 0.0004999187639457844, 'samples': 614784, 'steps': 3201, 'loss/train': 2.0254077911376953} -11/06/2021 21:42:55 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.909585952758789} -11/06/2021 21:42:55 - INFO - __main__ - Step 3204: {'lr': 0.0004999184931738397, 'samples': 615168, 'steps': 3203, 'loss/train': 1.7180776596069336} -11/06/2021 21:42:56 - INFO - __main__ - Step 3205: {'lr': 0.0004999183576189532, 'samples': 615360, 'steps': 3204, 'loss/train': 2.3504021167755127} -11/06/2021 21:42:57 - INFO - __main__ - Step 3206: {'lr': 0.0004999182219514573, 'samples': 615552, 'steps': 3205, 'loss/train': 2.0548884868621826} -11/06/2021 21:42:57 - INFO - __main__ - Step 3207: {'lr': 0.0004999180861713522, 'samples': 615744, 'steps': 3206, 'loss/train': 2.1941933631896973} -11/06/2021 21:42:58 - INFO - __main__ - Step 3208: {'lr': 0.0004999179502786377, 'samples': 615936, 'steps': 3207, 'loss/train': 6.997474193572998} -11/06/2021 21:42:58 - INFO - __main__ - Step 3209: {'lr': 0.0004999178142733141, 'samples': 616128, 'steps': 3208, 'loss/train': 2.0363223552703857} -11/06/2021 21:42:59 - INFO - __main__ - Step 3210: {'lr': 0.0004999176781553815, 'samples': 616320, 'steps': 3209, 'loss/train': 2.108640432357788} -11/06/2021 21:42:59 - INFO - __main__ - Step 3211: {'lr': 0.0004999175419248398, 'samples': 616512, 'steps': 3210, 'loss/train': 2.0920512676239014} -11/06/2021 21:43:00 - INFO - __main__ - Step 3212: {'lr': 0.0004999174055816891, 'samples': 616704, 'steps': 3211, 'loss/train': 2.339956760406494} -11/06/2021 21:43:00 - INFO - __main__ - Step 3213: {'lr': 0.0004999172691259293, 'samples': 616896, 'steps': 3212, 'loss/train': 1.8541127443313599} -11/06/2021 21:43:01 - INFO - __main__ - Step 3214: {'lr': 0.0004999171325575609, 'samples': 617088, 'steps': 3213, 'loss/train': 1.9735697507858276} -11/06/2021 21:43:01 - INFO - __main__ - Step 3215: {'lr': 0.0004999169958765836, 'samples': 617280, 'steps': 3214, 'loss/train': 2.325428009033203} -11/06/2021 21:43:02 - INFO - __main__ - Step 3216: {'lr': 0.0004999168590829975, 'samples': 617472, 'steps': 3215, 'loss/train': 2.0824670791625977} -11/06/2021 21:43:02 - INFO - __main__ - Step 3217: {'lr': 0.0004999167221768028, 'samples': 617664, 'steps': 3216, 'loss/train': 2.0834946632385254} -11/06/2021 21:43:03 - INFO - __main__ - Step 3218: {'lr': 0.0004999165851579994, 'samples': 617856, 'steps': 3217, 'loss/train': 1.993496060371399} -11/06/2021 21:43:03 - INFO - __main__ - Step 3219: {'lr': 0.0004999164480265875, 'samples': 618048, 'steps': 3218, 'loss/train': 2.200866460800171} -11/06/2021 21:43:03 - INFO - __main__ - Step 3220: {'lr': 0.0004999163107825671, 'samples': 618240, 'steps': 3219, 'loss/train': 2.439110040664673} -11/06/2021 21:43:04 - INFO - __main__ - Step 3221: {'lr': 0.0004999161734259383, 'samples': 618432, 'steps': 3220, 'loss/train': 1.0018621683120728} -11/06/2021 21:43:05 - INFO - __main__ - Step 3222: {'lr': 0.0004999160359567011, 'samples': 618624, 'steps': 3221, 'loss/train': 1.9945106506347656} -11/06/2021 21:43:05 - INFO - __main__ - Step 3223: {'lr': 0.0004999158983748555, 'samples': 618816, 'steps': 3222, 'loss/train': 2.565582036972046} -11/06/2021 21:43:06 - INFO - __main__ - Step 3224: {'lr': 0.0004999157606804018, 'samples': 619008, 'steps': 3223, 'loss/train': 2.3982090950012207} -11/06/2021 21:43:06 - INFO - __main__ - Step 3225: {'lr': 0.0004999156228733398, 'samples': 619200, 'steps': 3224, 'loss/train': 2.0050203800201416} -11/06/2021 21:43:07 - INFO - __main__ - Step 3226: {'lr': 0.0004999154849536698, 'samples': 619392, 'steps': 3225, 'loss/train': 2.3978424072265625} -11/06/2021 21:43:07 - INFO - __main__ - Step 3227: {'lr': 0.0004999153469213917, 'samples': 619584, 'steps': 3226, 'loss/train': 1.5546318292617798} -11/06/2021 21:43:08 - INFO - __main__ - Step 3228: {'lr': 0.0004999152087765055, 'samples': 619776, 'steps': 3227, 'loss/train': 1.9464197158813477} -11/06/2021 21:43:08 - INFO - __main__ - Step 3229: {'lr': 0.0004999150705190114, 'samples': 619968, 'steps': 3228, 'loss/train': 2.4329493045806885} -11/06/2021 21:43:08 - INFO - __main__ - Step 3230: {'lr': 0.0004999149321489095, 'samples': 620160, 'steps': 3229, 'loss/train': 3.806713581085205} -11/06/2021 21:43:09 - INFO - __main__ - Step 3231: {'lr': 0.0004999147936661997, 'samples': 620352, 'steps': 3230, 'loss/train': 1.9667352437973022} -11/06/2021 21:43:10 - INFO - __main__ - Step 3232: {'lr': 0.0004999146550708822, 'samples': 620544, 'steps': 3231, 'loss/train': 2.300558567047119} -11/06/2021 21:43:10 - INFO - __main__ - Step 3233: {'lr': 0.000499914516362957, 'samples': 620736, 'steps': 3232, 'loss/train': 1.624573826789856} -11/06/2021 21:43:10 - INFO - __main__ - Step 3234: {'lr': 0.0004999143775424241, 'samples': 620928, 'steps': 3233, 'loss/train': 2.1690218448638916} -11/06/2021 21:43:11 - INFO - __main__ - Step 3235: {'lr': 0.0004999142386092838, 'samples': 621120, 'steps': 3234, 'loss/train': 1.306965708732605} -11/06/2021 21:43:12 - INFO - __main__ - Step 3236: {'lr': 0.000499914099563536, 'samples': 621312, 'steps': 3235, 'loss/train': 2.066814422607422} -11/06/2021 21:43:12 - INFO - __main__ - Step 3237: {'lr': 0.0004999139604051806, 'samples': 621504, 'steps': 3236, 'loss/train': 2.289586305618286} -11/06/2021 21:43:12 - INFO - __main__ - Step 3238: {'lr': 0.0004999138211342179, 'samples': 621696, 'steps': 3237, 'loss/train': 2.0394601821899414} -11/06/2021 21:43:13 - INFO - __main__ - Step 3239: {'lr': 0.0004999136817506478, 'samples': 621888, 'steps': 3238, 'loss/train': 2.375570297241211} -11/06/2021 21:43:13 - INFO - __main__ - Step 3240: {'lr': 0.0004999135422544707, 'samples': 622080, 'steps': 3239, 'loss/train': 1.8367230892181396} -11/06/2021 21:43:14 - INFO - __main__ - Step 3241: {'lr': 0.0004999134026456862, 'samples': 622272, 'steps': 3240, 'loss/train': 2.2936620712280273} -11/06/2021 21:43:14 - INFO - __main__ - Step 3242: {'lr': 0.0004999132629242946, 'samples': 622464, 'steps': 3241, 'loss/train': 2.675550937652588} -11/06/2021 21:43:15 - INFO - __main__ - Step 3243: {'lr': 0.000499913123090296, 'samples': 622656, 'steps': 3242, 'loss/train': 2.318620204925537} -11/06/2021 21:43:15 - INFO - __main__ - Step 3244: {'lr': 0.0004999129831436904, 'samples': 622848, 'steps': 3243, 'loss/train': 2.7929880619049072} -11/06/2021 21:43:15 - INFO - __main__ - Step 3245: {'lr': 0.0004999128430844778, 'samples': 623040, 'steps': 3244, 'loss/train': 1.8520056009292603} -11/06/2021 21:43:16 - INFO - __main__ - Step 3246: {'lr': 0.0004999127029126585, 'samples': 623232, 'steps': 3245, 'loss/train': 1.9427516460418701} -11/06/2021 21:43:17 - INFO - __main__ - Step 3247: {'lr': 0.0004999125626282322, 'samples': 623424, 'steps': 3246, 'loss/train': 2.054605484008789} -11/06/2021 21:43:17 - INFO - __main__ - Step 3248: {'lr': 0.0004999124222311993, 'samples': 623616, 'steps': 3247, 'loss/train': 1.6573278903961182} -11/06/2021 21:43:17 - INFO - __main__ - Step 3249: {'lr': 0.0004999122817215595, 'samples': 623808, 'steps': 3248, 'loss/train': 1.8662605285644531} -11/06/2021 21:43:18 - INFO - __main__ - Step 3250: {'lr': 0.0004999121410993133, 'samples': 624000, 'steps': 3249, 'loss/train': 2.0213828086853027} -11/06/2021 21:43:19 - INFO - __main__ - Step 3251: {'lr': 0.0004999120003644604, 'samples': 624192, 'steps': 3250, 'loss/train': 2.3014163970947266} -11/06/2021 21:43:19 - INFO - __main__ - Step 3252: {'lr': 0.0004999118595170011, 'samples': 624384, 'steps': 3251, 'loss/train': 2.2614598274230957} -11/06/2021 21:43:20 - INFO - __main__ - Step 3253: {'lr': 0.0004999117185569354, 'samples': 624576, 'steps': 3252, 'loss/train': 2.0688071250915527} -11/06/2021 21:43:20 - INFO - __main__ - Step 3254: {'lr': 0.0004999115774842633, 'samples': 624768, 'steps': 3253, 'loss/train': 1.5158661603927612} -11/06/2021 21:43:20 - INFO - __main__ - Step 3255: {'lr': 0.0004999114362989849, 'samples': 624960, 'steps': 3254, 'loss/train': 2.2318007946014404} -11/06/2021 21:43:21 - INFO - __main__ - Step 3256: {'lr': 0.0004999112950011002, 'samples': 625152, 'steps': 3255, 'loss/train': 1.8678102493286133} -11/06/2021 21:43:22 - INFO - __main__ - Step 3257: {'lr': 0.0004999111535906094, 'samples': 625344, 'steps': 3256, 'loss/train': 2.0674848556518555} -11/06/2021 21:43:22 - INFO - __main__ - Step 3258: {'lr': 0.0004999110120675125, 'samples': 625536, 'steps': 3257, 'loss/train': 1.557898998260498} -11/06/2021 21:43:23 - INFO - __main__ - Step 3259: {'lr': 0.0004999108704318095, 'samples': 625728, 'steps': 3258, 'loss/train': 1.9527461528778076} -11/06/2021 21:43:23 - INFO - __main__ - Step 3260: {'lr': 0.0004999107286835006, 'samples': 625920, 'steps': 3259, 'loss/train': 0.5624179244041443} -11/06/2021 21:43:23 - INFO - __main__ - Step 3261: {'lr': 0.0004999105868225858, 'samples': 626112, 'steps': 3260, 'loss/train': 2.3505382537841797} -11/06/2021 21:43:24 - INFO - __main__ - Step 3262: {'lr': 0.0004999104448490649, 'samples': 626304, 'steps': 3261, 'loss/train': 1.716923475265503} -11/06/2021 21:43:25 - INFO - __main__ - Step 3263: {'lr': 0.0004999103027629384, 'samples': 626496, 'steps': 3262, 'loss/train': 2.0216355323791504} -11/06/2021 21:43:25 - INFO - __main__ - Step 3264: {'lr': 0.0004999101605642061, 'samples': 626688, 'steps': 3263, 'loss/train': 2.3034634590148926} -11/06/2021 21:43:25 - INFO - __main__ - Step 3265: {'lr': 0.0004999100182528683, 'samples': 626880, 'steps': 3264, 'loss/train': 2.1556177139282227} -11/06/2021 21:43:26 - INFO - __main__ - Step 3266: {'lr': 0.0004999098758289248, 'samples': 627072, 'steps': 3265, 'loss/train': 2.250798463821411} -11/06/2021 21:43:27 - INFO - __main__ - Step 3267: {'lr': 0.0004999097332923758, 'samples': 627264, 'steps': 3266, 'loss/train': 2.280691623687744} -11/06/2021 21:43:27 - INFO - __main__ - Step 3268: {'lr': 0.0004999095906432213, 'samples': 627456, 'steps': 3267, 'loss/train': 2.3557052612304688} -11/06/2021 21:43:28 - INFO - __main__ - Step 3269: {'lr': 0.0004999094478814613, 'samples': 627648, 'steps': 3268, 'loss/train': 2.4633193016052246} -11/06/2021 21:43:28 - INFO - __main__ - Step 3270: {'lr': 0.0004999093050070961, 'samples': 627840, 'steps': 3269, 'loss/train': 5.240302562713623} -11/06/2021 21:43:28 - INFO - __main__ - Step 3271: {'lr': 0.0004999091620201255, 'samples': 628032, 'steps': 3270, 'loss/train': 4.105412006378174} -11/06/2021 21:43:29 - INFO - __main__ - Step 3272: {'lr': 0.0004999090189205498, 'samples': 628224, 'steps': 3271, 'loss/train': 2.502105951309204} -11/06/2021 21:43:29 - INFO - __main__ - Step 3273: {'lr': 0.0004999088757083689, 'samples': 628416, 'steps': 3272, 'loss/train': 2.263211250305176} -11/06/2021 21:43:30 - INFO - __main__ - Step 3274: {'lr': 0.0004999087323835829, 'samples': 628608, 'steps': 3273, 'loss/train': 1.1719061136245728} -11/06/2021 21:43:31 - INFO - __main__ - Step 3275: {'lr': 0.0004999085889461919, 'samples': 628800, 'steps': 3274, 'loss/train': 2.298391103744507} -11/06/2021 21:43:31 - INFO - __main__ - Step 3276: {'lr': 0.0004999084453961959, 'samples': 628992, 'steps': 3275, 'loss/train': 1.848705530166626} -11/06/2021 21:43:31 - INFO - __main__ - Step 3277: {'lr': 0.0004999083017335951, 'samples': 629184, 'steps': 3276, 'loss/train': 2.3697509765625} -11/06/2021 21:43:32 - INFO - __main__ - Step 3278: {'lr': 0.0004999081579583895, 'samples': 629376, 'steps': 3277, 'loss/train': 1.937208652496338} -11/06/2021 21:43:33 - INFO - __main__ - Step 3279: {'lr': 0.0004999080140705791, 'samples': 629568, 'steps': 3278, 'loss/train': 2.3870885372161865} -11/06/2021 21:43:33 - INFO - __main__ - Step 3280: {'lr': 0.0004999078700701639, 'samples': 629760, 'steps': 3279, 'loss/train': 2.4358227252960205} -11/06/2021 21:43:33 - INFO - __main__ - Step 3281: {'lr': 0.0004999077259571442, 'samples': 629952, 'steps': 3280, 'loss/train': 2.139662504196167} -11/06/2021 21:43:34 - INFO - __main__ - Step 3282: {'lr': 0.0004999075817315199, 'samples': 630144, 'steps': 3281, 'loss/train': 2.3960695266723633} -11/06/2021 21:43:34 - INFO - __main__ - Step 3283: {'lr': 0.0004999074373932911, 'samples': 630336, 'steps': 3282, 'loss/train': 1.9690511226654053} -11/06/2021 21:43:35 - INFO - __main__ - Step 3284: {'lr': 0.0004999072929424579, 'samples': 630528, 'steps': 3283, 'loss/train': 1.8000233173370361} -11/06/2021 21:43:35 - INFO - __main__ - Step 3285: {'lr': 0.0004999071483790203, 'samples': 630720, 'steps': 3284, 'loss/train': 2.917104721069336} -11/06/2021 21:43:36 - INFO - __main__ - Step 3286: {'lr': 0.0004999070037029783, 'samples': 630912, 'steps': 3285, 'loss/train': 2.3763699531555176} -11/06/2021 21:43:36 - INFO - __main__ - Step 3287: {'lr': 0.0004999068589143322, 'samples': 631104, 'steps': 3286, 'loss/train': 2.728950023651123} -11/06/2021 21:43:36 - INFO - __main__ - Step 3288: {'lr': 0.0004999067140130819, 'samples': 631296, 'steps': 3287, 'loss/train': 2.0896875858306885} -11/06/2021 21:43:37 - INFO - __main__ - Step 3289: {'lr': 0.0004999065689992273, 'samples': 631488, 'steps': 3288, 'loss/train': 2.303443431854248} -11/06/2021 21:43:38 - INFO - __main__ - Step 3290: {'lr': 0.0004999064238727689, 'samples': 631680, 'steps': 3289, 'loss/train': 2.483797073364258} -11/06/2021 21:43:38 - INFO - __main__ - Step 3291: {'lr': 0.0004999062786337064, 'samples': 631872, 'steps': 3290, 'loss/train': 1.8650814294815063} -11/06/2021 21:43:39 - INFO - __main__ - Step 3292: {'lr': 0.0004999061332820401, 'samples': 632064, 'steps': 3291, 'loss/train': 1.7333624362945557} -11/06/2021 21:43:39 - INFO - __main__ - Step 3293: {'lr': 0.0004999059878177699, 'samples': 632256, 'steps': 3292, 'loss/train': 2.357539176940918} -11/06/2021 21:43:40 - INFO - __main__ - Step 3294: {'lr': 0.0004999058422408959, 'samples': 632448, 'steps': 3293, 'loss/train': 2.1987416744232178} -11/06/2021 21:43:40 - INFO - __main__ - Step 3295: {'lr': 0.0004999056965514181, 'samples': 632640, 'steps': 3294, 'loss/train': 1.9118432998657227} -11/06/2021 21:43:41 - INFO - __main__ - Step 3296: {'lr': 0.0004999055507493368, 'samples': 632832, 'steps': 3295, 'loss/train': 2.26961612701416} -11/06/2021 21:43:41 - INFO - __main__ - Step 3297: {'lr': 0.0004999054048346517, 'samples': 633024, 'steps': 3296, 'loss/train': 2.7712512016296387} -11/06/2021 21:43:41 - INFO - __main__ - Step 3298: {'lr': 0.0004999052588073633, 'samples': 633216, 'steps': 3297, 'loss/train': 2.1366281509399414} -11/06/2021 21:43:42 - INFO - __main__ - Step 3299: {'lr': 0.0004999051126674714, 'samples': 633408, 'steps': 3298, 'loss/train': 1.3426307439804077} -11/06/2021 21:43:43 - INFO - __main__ - Step 3300: {'lr': 0.0004999049664149761, 'samples': 633600, 'steps': 3299, 'loss/train': 3.066981315612793} -11/06/2021 21:43:43 - INFO - __main__ - Step 3301: {'lr': 0.0004999048200498774, 'samples': 633792, 'steps': 3300, 'loss/train': 2.1740355491638184} -11/06/2021 21:43:43 - INFO - __main__ - Step 3302: {'lr': 0.0004999046735721755, 'samples': 633984, 'steps': 3301, 'loss/train': 2.4104175567626953} -11/06/2021 21:43:44 - INFO - __main__ - Step 3303: {'lr': 0.0004999045269818704, 'samples': 634176, 'steps': 3302, 'loss/train': 2.4756033420562744} -11/06/2021 21:43:45 - INFO - __main__ - Step 3304: {'lr': 0.0004999043802789622, 'samples': 634368, 'steps': 3303, 'loss/train': 1.4023329019546509} -11/06/2021 21:43:45 - INFO - __main__ - Step 3305: {'lr': 0.000499904233463451, 'samples': 634560, 'steps': 3304, 'loss/train': 1.6189985275268555} -11/06/2021 21:43:45 - INFO - __main__ - Step 3306: {'lr': 0.0004999040865353367, 'samples': 634752, 'steps': 3305, 'loss/train': 1.5078233480453491} -11/06/2021 21:43:46 - INFO - __main__ - Step 3307: {'lr': 0.0004999039394946196, 'samples': 634944, 'steps': 3306, 'loss/train': 1.8554377555847168} -11/06/2021 21:43:46 - INFO - __main__ - Step 3308: {'lr': 0.0004999037923412995, 'samples': 635136, 'steps': 3307, 'loss/train': 2.242231845855713} -11/06/2021 21:43:47 - INFO - __main__ - Step 3309: {'lr': 0.0004999036450753767, 'samples': 635328, 'steps': 3308, 'loss/train': 2.1639621257781982} -11/06/2021 21:43:47 - INFO - __main__ - Step 3310: {'lr': 0.0004999034976968511, 'samples': 635520, 'steps': 3309, 'loss/train': 2.1223878860473633} -11/06/2021 21:43:48 - INFO - __main__ - Step 3311: {'lr': 0.0004999033502057228, 'samples': 635712, 'steps': 3310, 'loss/train': 2.3255131244659424} -11/06/2021 21:43:48 - INFO - __main__ - Step 3312: {'lr': 0.000499903202601992, 'samples': 635904, 'steps': 3311, 'loss/train': 2.050856113433838} -11/06/2021 21:43:48 - INFO - __main__ - Step 3313: {'lr': 0.0004999030548856586, 'samples': 636096, 'steps': 3312, 'loss/train': 1.3736777305603027} -11/06/2021 21:43:49 - INFO - __main__ - Step 3314: {'lr': 0.0004999029070567229, 'samples': 636288, 'steps': 3313, 'loss/train': 2.3344199657440186} -11/06/2021 21:43:50 - INFO - __main__ - Step 3315: {'lr': 0.0004999027591151847, 'samples': 636480, 'steps': 3314, 'loss/train': 2.361743927001953} -11/06/2021 21:43:50 - INFO - __main__ - Step 3316: {'lr': 0.0004999026110610442, 'samples': 636672, 'steps': 3315, 'loss/train': 1.3730331659317017} -11/06/2021 21:43:51 - INFO - __main__ - Step 3317: {'lr': 0.0004999024628943014, 'samples': 636864, 'steps': 3316, 'loss/train': 2.4670941829681396} -11/06/2021 21:43:51 - INFO - __main__ - Step 3318: {'lr': 0.0004999023146149565, 'samples': 637056, 'steps': 3317, 'loss/train': 1.93985116481781} -11/06/2021 21:43:51 - INFO - __main__ - Step 3319: {'lr': 0.0004999021662230093, 'samples': 637248, 'steps': 3318, 'loss/train': 1.4250794649124146} -11/06/2021 21:43:52 - INFO - __main__ - Step 3320: {'lr': 0.0004999020177184601, 'samples': 637440, 'steps': 3319, 'loss/train': 2.3671536445617676} -11/06/2021 21:43:53 - INFO - __main__ - Step 3321: {'lr': 0.000499901869101309, 'samples': 637632, 'steps': 3320, 'loss/train': 2.1804182529449463} -11/06/2021 21:43:53 - INFO - __main__ - Step 3322: {'lr': 0.0004999017203715559, 'samples': 637824, 'steps': 3321, 'loss/train': 2.0329232215881348} -11/06/2021 21:43:53 - INFO - __main__ - Step 3323: {'lr': 0.000499901571529201, 'samples': 638016, 'steps': 3322, 'loss/train': 1.9539903402328491} -11/06/2021 21:43:54 - INFO - __main__ - Step 3324: {'lr': 0.0004999014225742442, 'samples': 638208, 'steps': 3323, 'loss/train': 1.762226939201355} -11/06/2021 21:43:55 - INFO - __main__ - Step 3325: {'lr': 0.0004999012735066858, 'samples': 638400, 'steps': 3324, 'loss/train': 2.084671974182129} -11/06/2021 21:43:55 - INFO - __main__ - Step 3326: {'lr': 0.0004999011243265257, 'samples': 638592, 'steps': 3325, 'loss/train': 2.541097402572632} -11/06/2021 21:43:55 - INFO - __main__ - Step 3327: {'lr': 0.000499900975033764, 'samples': 638784, 'steps': 3326, 'loss/train': 2.444103240966797} -11/06/2021 21:43:56 - INFO - __main__ - Step 3328: {'lr': 0.0004999008256284008, 'samples': 638976, 'steps': 3327, 'loss/train': 2.3885836601257324} -11/06/2021 21:43:56 - INFO - __main__ - Step 3329: {'lr': 0.0004999006761104361, 'samples': 639168, 'steps': 3328, 'loss/train': 1.9459644556045532} -11/06/2021 21:43:57 - INFO - __main__ - Step 3330: {'lr': 0.0004999005264798701, 'samples': 639360, 'steps': 3329, 'loss/train': 2.031470775604248} -11/06/2021 21:43:58 - INFO - __main__ - Step 3331: {'lr': 0.0004999003767367027, 'samples': 639552, 'steps': 3330, 'loss/train': 2.199577808380127} -11/06/2021 21:43:58 - INFO - __main__ - Step 3332: {'lr': 0.0004999002268809339, 'samples': 639744, 'steps': 3331, 'loss/train': 2.1211884021759033} -11/06/2021 21:43:59 - INFO - __main__ - Step 3333: {'lr': 0.0004999000769125642, 'samples': 639936, 'steps': 3332, 'loss/train': 3.076802968978882} -11/06/2021 21:43:59 - INFO - __main__ - Step 3334: {'lr': 0.0004998999268315932, 'samples': 640128, 'steps': 3333, 'loss/train': 2.300365447998047} -11/06/2021 21:43:59 - INFO - __main__ - Step 3335: {'lr': 0.0004998997766380212, 'samples': 640320, 'steps': 3334, 'loss/train': 2.047560214996338} -11/06/2021 21:44:00 - INFO - __main__ - Step 3336: {'lr': 0.0004998996263318482, 'samples': 640512, 'steps': 3335, 'loss/train': 2.0564115047454834} -11/06/2021 21:44:00 - INFO - __main__ - Step 3337: {'lr': 0.0004998994759130743, 'samples': 640704, 'steps': 3336, 'loss/train': 1.807005763053894} -11/06/2021 21:44:01 - INFO - __main__ - Step 3338: {'lr': 0.0004998993253816996, 'samples': 640896, 'steps': 3337, 'loss/train': 2.106369733810425} -11/06/2021 21:44:01 - INFO - __main__ - Step 3339: {'lr': 0.000499899174737724, 'samples': 641088, 'steps': 3338, 'loss/train': 2.363450765609741} -11/06/2021 21:44:02 - INFO - __main__ - Step 3340: {'lr': 0.0004998990239811477, 'samples': 641280, 'steps': 3339, 'loss/train': 1.9341990947723389} -11/06/2021 21:44:03 - INFO - __main__ - Step 3341: {'lr': 0.0004998988731119709, 'samples': 641472, 'steps': 3340, 'loss/train': 2.0908918380737305} -11/06/2021 21:44:03 - INFO - __main__ - Step 3342: {'lr': 0.0004998987221301935, 'samples': 641664, 'steps': 3341, 'loss/train': 2.078077793121338} -11/06/2021 21:44:03 - INFO - __main__ - Step 3343: {'lr': 0.0004998985710358155, 'samples': 641856, 'steps': 3342, 'loss/train': 1.9851315021514893} -11/06/2021 21:44:04 - INFO - __main__ - Step 3344: {'lr': 0.0004998984198288371, 'samples': 642048, 'steps': 3343, 'loss/train': 2.1168434619903564} -11/06/2021 21:44:04 - INFO - __main__ - Step 3345: {'lr': 0.0004998982685092583, 'samples': 642240, 'steps': 3344, 'loss/train': 2.281632900238037} -11/06/2021 21:44:05 - INFO - __main__ - Step 3346: {'lr': 0.0004998981170770792, 'samples': 642432, 'steps': 3345, 'loss/train': 2.356718063354492} -11/06/2021 21:44:05 - INFO - __main__ - Step 3347: {'lr': 0.0004998979655323, 'samples': 642624, 'steps': 3346, 'loss/train': 1.8560844659805298} -11/06/2021 21:44:06 - INFO - __main__ - Step 3348: {'lr': 0.0004998978138749204, 'samples': 642816, 'steps': 3347, 'loss/train': 1.9993972778320312} -11/06/2021 21:44:06 - INFO - __main__ - Step 3349: {'lr': 0.0004998976621049408, 'samples': 643008, 'steps': 3348, 'loss/train': 2.5754454135894775} -11/06/2021 21:44:06 - INFO - __main__ - Step 3350: {'lr': 0.0004998975102223612, 'samples': 643200, 'steps': 3349, 'loss/train': 2.1721551418304443} -11/06/2021 21:44:08 - INFO - __main__ - Step 3351: {'lr': 0.0004998973582271817, 'samples': 643392, 'steps': 3350, 'loss/train': 1.9218946695327759} -11/06/2021 21:44:08 - INFO - __main__ - Step 3352: {'lr': 0.0004998972061194022, 'samples': 643584, 'steps': 3351, 'loss/train': 2.063539743423462} -11/06/2021 21:44:08 - INFO - __main__ - Step 3353: {'lr': 0.0004998970538990228, 'samples': 643776, 'steps': 3352, 'loss/train': 2.91345477104187} -11/06/2021 21:44:09 - INFO - __main__ - Step 3354: {'lr': 0.0004998969015660438, 'samples': 643968, 'steps': 3353, 'loss/train': 1.8647414445877075} -11/06/2021 21:44:09 - INFO - __main__ - Step 3355: {'lr': 0.0004998967491204651, 'samples': 644160, 'steps': 3354, 'loss/train': 2.418487787246704} -11/06/2021 21:44:09 - INFO - __main__ - Step 3356: {'lr': 0.0004998965965622867, 'samples': 644352, 'steps': 3355, 'loss/train': 1.3407362699508667} -11/06/2021 21:44:11 - INFO - __main__ - Step 3357: {'lr': 0.0004998964438915088, 'samples': 644544, 'steps': 3356, 'loss/train': 2.0935134887695312} -11/06/2021 21:44:11 - INFO - __main__ - Step 3358: {'lr': 0.0004998962911081314, 'samples': 644736, 'steps': 3357, 'loss/train': 2.340810775756836} -11/06/2021 21:44:11 - INFO - __main__ - Step 3359: {'lr': 0.0004998961382121546, 'samples': 644928, 'steps': 3358, 'loss/train': 2.3082637786865234} -11/06/2021 21:44:12 - INFO - __main__ - Step 3360: {'lr': 0.0004998959852035785, 'samples': 645120, 'steps': 3359, 'loss/train': 1.8081005811691284} -11/06/2021 21:44:12 - INFO - __main__ - Step 3361: {'lr': 0.0004998958320824031, 'samples': 645312, 'steps': 3360, 'loss/train': 2.52008318901062} -11/06/2021 21:44:13 - INFO - __main__ - Step 3362: {'lr': 0.0004998956788486284, 'samples': 645504, 'steps': 3361, 'loss/train': 2.574852228164673} -11/06/2021 21:44:13 - INFO - __main__ - Step 3363: {'lr': 0.0004998955255022547, 'samples': 645696, 'steps': 3362, 'loss/train': 2.9360525608062744} -11/06/2021 21:44:14 - INFO - __main__ - Step 3364: {'lr': 0.0004998953720432818, 'samples': 645888, 'steps': 3363, 'loss/train': 2.0350911617279053} -11/06/2021 21:44:14 - INFO - __main__ - Step 3365: {'lr': 0.00049989521847171, 'samples': 646080, 'steps': 3364, 'loss/train': 1.7591485977172852} -11/06/2021 21:44:14 - INFO - __main__ - Step 3366: {'lr': 0.0004998950647875392, 'samples': 646272, 'steps': 3365, 'loss/train': 1.764539122581482} -11/06/2021 21:44:15 - INFO - __main__ - Step 3367: {'lr': 0.0004998949109907697, 'samples': 646464, 'steps': 3366, 'loss/train': 2.29533052444458} -11/06/2021 21:44:16 - INFO - __main__ - Step 3368: {'lr': 0.0004998947570814012, 'samples': 646656, 'steps': 3367, 'loss/train': 2.4703001976013184} -11/06/2021 21:44:16 - INFO - __main__ - Step 3369: {'lr': 0.0004998946030594341, 'samples': 646848, 'steps': 3368, 'loss/train': 2.0543324947357178} -11/06/2021 21:44:16 - INFO - __main__ - Step 3370: {'lr': 0.0004998944489248683, 'samples': 647040, 'steps': 3369, 'loss/train': 2.8122878074645996} -11/06/2021 21:44:17 - INFO - __main__ - Step 3371: {'lr': 0.000499894294677704, 'samples': 647232, 'steps': 3370, 'loss/train': 2.024826765060425} -11/06/2021 21:44:18 - INFO - __main__ - Step 3372: {'lr': 0.000499894140317941, 'samples': 647424, 'steps': 3371, 'loss/train': 2.372493267059326} -11/06/2021 21:44:18 - INFO - __main__ - Step 3373: {'lr': 0.0004998939858455798, 'samples': 647616, 'steps': 3372, 'loss/train': 1.8553732633590698} -11/06/2021 21:44:19 - INFO - __main__ - Step 3374: {'lr': 0.0004998938312606201, 'samples': 647808, 'steps': 3373, 'loss/train': 6.488889694213867} -11/06/2021 21:44:19 - INFO - __main__ - Step 3375: {'lr': 0.000499893676563062, 'samples': 648000, 'steps': 3374, 'loss/train': 2.1932318210601807} -11/06/2021 21:44:19 - INFO - __main__ - Step 3376: {'lr': 0.0004998935217529058, 'samples': 648192, 'steps': 3375, 'loss/train': 2.0442917346954346} -11/06/2021 21:44:20 - INFO - __main__ - Step 3377: {'lr': 0.0004998933668301514, 'samples': 648384, 'steps': 3376, 'loss/train': 1.9358372688293457} -11/06/2021 21:44:21 - INFO - __main__ - Step 3378: {'lr': 0.0004998932117947989, 'samples': 648576, 'steps': 3377, 'loss/train': 1.9061901569366455} -11/06/2021 21:44:21 - INFO - __main__ - Step 3379: {'lr': 0.0004998930566468484, 'samples': 648768, 'steps': 3378, 'loss/train': 2.5020077228546143} -11/06/2021 21:44:21 - INFO - __main__ - Step 3380: {'lr': 0.0004998929013863, 'samples': 648960, 'steps': 3379, 'loss/train': 1.080916404724121} -11/06/2021 21:44:22 - INFO - __main__ - Step 3381: {'lr': 0.0004998927460131535, 'samples': 649152, 'steps': 3380, 'loss/train': 2.488973379135132} -11/06/2021 21:44:22 - INFO - __main__ - Step 3382: {'lr': 0.0004998925905274094, 'samples': 649344, 'steps': 3381, 'loss/train': 1.9152915477752686} -11/06/2021 21:44:23 - INFO - __main__ - Step 3383: {'lr': 0.0004998924349290674, 'samples': 649536, 'steps': 3382, 'loss/train': 0.7557737827301025} -11/06/2021 21:44:24 - INFO - __main__ - Step 3384: {'lr': 0.0004998922792181278, 'samples': 649728, 'steps': 3383, 'loss/train': 1.4994975328445435} -11/06/2021 21:44:24 - INFO - __main__ - Step 3385: {'lr': 0.0004998921233945907, 'samples': 649920, 'steps': 3384, 'loss/train': 1.6330103874206543} -11/06/2021 21:44:24 - INFO - __main__ - Step 3386: {'lr': 0.0004998919674584559, 'samples': 650112, 'steps': 3385, 'loss/train': 1.484663486480713} -11/06/2021 21:44:25 - INFO - __main__ - Step 3387: {'lr': 0.0004998918114097237, 'samples': 650304, 'steps': 3386, 'loss/train': 2.346414566040039} -11/06/2021 21:44:26 - INFO - __main__ - Step 3388: {'lr': 0.0004998916552483941, 'samples': 650496, 'steps': 3387, 'loss/train': 1.351393699645996} -11/06/2021 21:44:26 - INFO - __main__ - Step 3389: {'lr': 0.0004998914989744671, 'samples': 650688, 'steps': 3388, 'loss/train': 2.10522198677063} -11/06/2021 21:44:26 - INFO - __main__ - Step 3390: {'lr': 0.000499891342587943, 'samples': 650880, 'steps': 3389, 'loss/train': 1.9814081192016602} -11/06/2021 21:44:27 - INFO - __main__ - Step 3391: {'lr': 0.0004998911860888217, 'samples': 651072, 'steps': 3390, 'loss/train': 1.96201491355896} -11/06/2021 21:44:27 - INFO - __main__ - Step 3392: {'lr': 0.0004998910294771032, 'samples': 651264, 'steps': 3391, 'loss/train': 2.6143369674682617} -11/06/2021 21:44:28 - INFO - __main__ - Step 3393: {'lr': 0.0004998908727527877, 'samples': 651456, 'steps': 3392, 'loss/train': 2.523289442062378} -11/06/2021 21:44:28 - INFO - __main__ - Step 3394: {'lr': 0.0004998907159158752, 'samples': 651648, 'steps': 3393, 'loss/train': 1.4275950193405151} -11/06/2021 21:44:29 - INFO - __main__ - Step 3395: {'lr': 0.0004998905589663658, 'samples': 651840, 'steps': 3394, 'loss/train': 2.1565451622009277} -11/06/2021 21:44:29 - INFO - __main__ - Step 3396: {'lr': 0.0004998904019042596, 'samples': 652032, 'steps': 3395, 'loss/train': 2.2461233139038086} -11/06/2021 21:44:30 - INFO - __main__ - Step 3397: {'lr': 0.0004998902447295567, 'samples': 652224, 'steps': 3396, 'loss/train': 2.1691172122955322} -11/06/2021 21:44:31 - INFO - __main__ - Step 3398: {'lr': 0.000499890087442257, 'samples': 652416, 'steps': 3397, 'loss/train': 2.0089993476867676} -11/06/2021 21:44:31 - INFO - __main__ - Step 3399: {'lr': 0.0004998899300423607, 'samples': 652608, 'steps': 3398, 'loss/train': 2.1266562938690186} -11/06/2021 21:44:31 - INFO - __main__ - Step 3400: {'lr': 0.0004998897725298679, 'samples': 652800, 'steps': 3399, 'loss/train': 1.9188565015792847} -11/06/2021 21:44:32 - INFO - __main__ - Step 3401: {'lr': 0.0004998896149047786, 'samples': 652992, 'steps': 3400, 'loss/train': 2.4505343437194824} -11/06/2021 21:44:32 - INFO - __main__ - Step 3402: {'lr': 0.0004998894571670929, 'samples': 653184, 'steps': 3401, 'loss/train': 2.3925869464874268} -11/06/2021 21:44:32 - INFO - __main__ - Step 3403: {'lr': 0.0004998892993168109, 'samples': 653376, 'steps': 3402, 'loss/train': 2.170724391937256} -11/06/2021 21:44:33 - INFO - __main__ - Step 3404: {'lr': 0.0004998891413539326, 'samples': 653568, 'steps': 3403, 'loss/train': 1.9499857425689697} -11/06/2021 21:44:34 - INFO - __main__ - Step 3405: {'lr': 0.0004998889832784581, 'samples': 653760, 'steps': 3404, 'loss/train': 2.608039379119873} -11/06/2021 21:44:34 - INFO - __main__ - Step 3406: {'lr': 0.0004998888250903875, 'samples': 653952, 'steps': 3405, 'loss/train': 2.1653521060943604} -11/06/2021 21:44:34 - INFO - __main__ - Step 3407: {'lr': 0.0004998886667897209, 'samples': 654144, 'steps': 3406, 'loss/train': 2.1557538509368896} -11/06/2021 21:44:35 - INFO - __main__ - Step 3408: {'lr': 0.0004998885083764582, 'samples': 654336, 'steps': 3407, 'loss/train': 2.54028582572937} -11/06/2021 21:44:36 - INFO - __main__ - Step 3409: {'lr': 0.0004998883498505996, 'samples': 654528, 'steps': 3408, 'loss/train': 2.0685014724731445} -11/06/2021 21:44:36 - INFO - __main__ - Step 3410: {'lr': 0.0004998881912121453, 'samples': 654720, 'steps': 3409, 'loss/train': 1.7899914979934692} -11/06/2021 21:44:37 - INFO - __main__ - Step 3411: {'lr': 0.0004998880324610952, 'samples': 654912, 'steps': 3410, 'loss/train': 2.2215492725372314} -11/06/2021 21:44:37 - INFO - __main__ - Step 3412: {'lr': 0.0004998878735974493, 'samples': 655104, 'steps': 3411, 'loss/train': 2.2348644733428955} -11/06/2021 21:44:37 - INFO - __main__ - Step 3413: {'lr': 0.0004998877146212079, 'samples': 655296, 'steps': 3412, 'loss/train': 2.385568618774414} -11/06/2021 21:44:38 - INFO - __main__ - Step 3414: {'lr': 0.0004998875555323708, 'samples': 655488, 'steps': 3413, 'loss/train': 2.1982250213623047} -11/06/2021 21:44:38 - INFO - __main__ - Step 3415: {'lr': 0.0004998873963309384, 'samples': 655680, 'steps': 3414, 'loss/train': 2.085184097290039} -11/06/2021 21:44:39 - INFO - __main__ - Step 3416: {'lr': 0.0004998872370169105, 'samples': 655872, 'steps': 3415, 'loss/train': 2.228264808654785} -11/06/2021 21:44:39 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.356597900390625} -11/06/2021 21:44:40 - INFO - __main__ - Step 3418: {'lr': 0.0004998869180510688, 'samples': 656256, 'steps': 3417, 'loss/train': 1.9543739557266235} -11/06/2021 21:44:41 - INFO - __main__ - Step 3419: {'lr': 0.0004998867583992551, 'samples': 656448, 'steps': 3418, 'loss/train': 1.8418172597885132} -11/06/2021 21:44:41 - INFO - __main__ - Step 3420: {'lr': 0.0004998865986348464, 'samples': 656640, 'steps': 3419, 'loss/train': 1.725966453552246} -11/06/2021 21:44:42 - INFO - __main__ - Step 3421: {'lr': 0.0004998864387578426, 'samples': 656832, 'steps': 3420, 'loss/train': 1.9191683530807495} -11/06/2021 21:44:42 - INFO - __main__ - Step 3422: {'lr': 0.0004998862787682438, 'samples': 657024, 'steps': 3421, 'loss/train': 2.177302598953247} -11/06/2021 21:44:42 - INFO - __main__ - Step 3423: {'lr': 0.00049988611866605, 'samples': 657216, 'steps': 3422, 'loss/train': 1.9818519353866577} -11/06/2021 21:44:43 - INFO - __main__ - Step 3424: {'lr': 0.0004998859584512615, 'samples': 657408, 'steps': 3423, 'loss/train': 2.42037296295166} -11/06/2021 21:44:44 - INFO - __main__ - Step 3425: {'lr': 0.0004998857981238782, 'samples': 657600, 'steps': 3424, 'loss/train': 0.6604869961738586} -11/06/2021 21:44:44 - INFO - __main__ - Step 3426: {'lr': 0.0004998856376839003, 'samples': 657792, 'steps': 3425, 'loss/train': 0.3991982340812683} -11/06/2021 21:44:45 - INFO - __main__ - Step 3427: {'lr': 0.0004998854771313277, 'samples': 657984, 'steps': 3426, 'loss/train': 2.094467878341675} -11/06/2021 21:44:45 - INFO - __main__ - Step 3428: {'lr': 0.0004998853164661606, 'samples': 658176, 'steps': 3427, 'loss/train': 1.7819459438323975} -11/06/2021 21:44:45 - INFO - __main__ - Step 3429: {'lr': 0.000499885155688399, 'samples': 658368, 'steps': 3428, 'loss/train': 2.345151901245117} -11/06/2021 21:44:46 - INFO - __main__ - Step 3430: {'lr': 0.000499884994798043, 'samples': 658560, 'steps': 3429, 'loss/train': 1.721934199333191} -11/06/2021 21:44:47 - INFO - __main__ - Step 3431: {'lr': 0.0004998848337950927, 'samples': 658752, 'steps': 3430, 'loss/train': 1.6747421026229858} -11/06/2021 21:44:47 - INFO - __main__ - Step 3432: {'lr': 0.0004998846726795482, 'samples': 658944, 'steps': 3431, 'loss/train': 2.4393625259399414} -11/06/2021 21:44:47 - INFO - __main__ - Step 3433: {'lr': 0.0004998845114514095, 'samples': 659136, 'steps': 3432, 'loss/train': 1.8727471828460693} -11/06/2021 21:44:48 - INFO - __main__ - Step 3434: {'lr': 0.0004998843501106766, 'samples': 659328, 'steps': 3433, 'loss/train': 2.1409528255462646} -11/06/2021 21:44:49 - INFO - __main__ - Step 3435: {'lr': 0.0004998841886573496, 'samples': 659520, 'steps': 3434, 'loss/train': 2.510873317718506} -11/06/2021 21:44:49 - INFO - __main__ - Step 3436: {'lr': 0.0004998840270914288, 'samples': 659712, 'steps': 3435, 'loss/train': 1.8569953441619873} -11/06/2021 21:44:50 - INFO - __main__ - Step 3437: {'lr': 0.0004998838654129142, 'samples': 659904, 'steps': 3436, 'loss/train': 1.0409950017929077} -11/06/2021 21:44:50 - INFO - __main__ - Step 3438: {'lr': 0.0004998837036218056, 'samples': 660096, 'steps': 3437, 'loss/train': 2.066178798675537} -11/06/2021 21:44:51 - INFO - __main__ - Step 3439: {'lr': 0.0004998835417181033, 'samples': 660288, 'steps': 3438, 'loss/train': 1.7412632703781128} -11/06/2021 21:44:52 - INFO - __main__ - Step 3440: {'lr': 0.0004998833797018074, 'samples': 660480, 'steps': 3439, 'loss/train': 1.823896050453186} -11/06/2021 21:44:52 - INFO - __main__ - Step 3441: {'lr': 0.0004998832175729179, 'samples': 660672, 'steps': 3440, 'loss/train': 2.1356678009033203} -11/06/2021 21:44:52 - INFO - __main__ - Step 3442: {'lr': 0.0004998830553314349, 'samples': 660864, 'steps': 3441, 'loss/train': 1.7477060556411743} -11/06/2021 21:44:53 - INFO - __main__ - Step 3443: {'lr': 0.0004998828929773583, 'samples': 661056, 'steps': 3442, 'loss/train': 2.1472830772399902} -11/06/2021 21:44:53 - INFO - __main__ - Step 3444: {'lr': 0.0004998827305106884, 'samples': 661248, 'steps': 3443, 'loss/train': 1.7395120859146118} -11/06/2021 21:44:54 - INFO - __main__ - Step 3445: {'lr': 0.0004998825679314253, 'samples': 661440, 'steps': 3444, 'loss/train': 2.5220179557800293} -11/06/2021 21:44:54 - INFO - __main__ - Step 3446: {'lr': 0.0004998824052395689, 'samples': 661632, 'steps': 3445, 'loss/train': 2.2687270641326904} -11/06/2021 21:44:55 - INFO - __main__ - Step 3447: {'lr': 0.0004998822424351193, 'samples': 661824, 'steps': 3446, 'loss/train': 2.2349984645843506} -11/06/2021 21:44:55 - INFO - __main__ - Step 3448: {'lr': 0.0004998820795180766, 'samples': 662016, 'steps': 3447, 'loss/train': 2.5539913177490234} -11/06/2021 21:44:55 - INFO - __main__ - Step 3449: {'lr': 0.000499881916488441, 'samples': 662208, 'steps': 3448, 'loss/train': 1.9206302165985107} -11/06/2021 21:44:57 - INFO - __main__ - Step 3450: {'lr': 0.0004998817533462123, 'samples': 662400, 'steps': 3449, 'loss/train': 2.2440977096557617} -11/06/2021 21:44:57 - INFO - __main__ - Step 3451: {'lr': 0.0004998815900913909, 'samples': 662592, 'steps': 3450, 'loss/train': 1.2015467882156372} -11/06/2021 21:44:57 - INFO - __main__ - Step 3452: {'lr': 0.0004998814267239767, 'samples': 662784, 'steps': 3451, 'loss/train': 2.6361520290374756} -11/06/2021 21:44:58 - INFO - __main__ - Step 3453: {'lr': 0.0004998812632439697, 'samples': 662976, 'steps': 3452, 'loss/train': 1.7184646129608154} -11/06/2021 21:44:58 - INFO - __main__ - Step 3454: {'lr': 0.00049988109965137, 'samples': 663168, 'steps': 3453, 'loss/train': 2.2237768173217773} -11/06/2021 21:44:58 - INFO - __main__ - Step 3455: {'lr': 0.000499880935946178, 'samples': 663360, 'steps': 3454, 'loss/train': 1.60335111618042} -11/06/2021 21:44:59 - INFO - __main__ - Step 3456: {'lr': 0.0004998807721283932, 'samples': 663552, 'steps': 3455, 'loss/train': 4.451015472412109} -11/06/2021 21:45:00 - INFO - __main__ - Step 3457: {'lr': 0.0004998806081980162, 'samples': 663744, 'steps': 3456, 'loss/train': 2.589240074157715} -11/06/2021 21:45:00 - INFO - __main__ - Step 3458: {'lr': 0.0004998804441550467, 'samples': 663936, 'steps': 3457, 'loss/train': 1.5202341079711914} -11/06/2021 21:45:00 - INFO - __main__ - Step 3459: {'lr': 0.000499880279999485, 'samples': 664128, 'steps': 3458, 'loss/train': 2.2377476692199707} -11/06/2021 21:45:01 - INFO - __main__ - Step 3460: {'lr': 0.0004998801157313311, 'samples': 664320, 'steps': 3459, 'loss/train': 2.0967650413513184} -11/06/2021 21:45:02 - INFO - __main__ - Step 3461: {'lr': 0.0004998799513505851, 'samples': 664512, 'steps': 3460, 'loss/train': 2.196791648864746} -11/06/2021 21:45:02 - INFO - __main__ - Step 3462: {'lr': 0.000499879786857247, 'samples': 664704, 'steps': 3461, 'loss/train': 2.2895452976226807} -11/06/2021 21:45:02 - INFO - __main__ - Step 3463: {'lr': 0.0004998796222513169, 'samples': 664896, 'steps': 3462, 'loss/train': 2.4116644859313965} -11/06/2021 21:45:03 - INFO - __main__ - Step 3464: {'lr': 0.000499879457532795, 'samples': 665088, 'steps': 3463, 'loss/train': 2.3247618675231934} -11/06/2021 21:45:03 - INFO - __main__ - Step 3465: {'lr': 0.0004998792927016812, 'samples': 665280, 'steps': 3464, 'loss/train': 2.557910203933716} -11/06/2021 21:45:04 - INFO - __main__ - Step 3466: {'lr': 0.0004998791277579757, 'samples': 665472, 'steps': 3465, 'loss/train': 2.2992501258850098} -11/06/2021 21:45:04 - INFO - __main__ - Step 3467: {'lr': 0.0004998789627016784, 'samples': 665664, 'steps': 3466, 'loss/train': 2.114197254180908} -11/06/2021 21:45:05 - INFO - __main__ - Step 3468: {'lr': 0.0004998787975327896, 'samples': 665856, 'steps': 3467, 'loss/train': 2.2296416759490967} -11/06/2021 21:45:05 - INFO - __main__ - Step 3469: {'lr': 0.0004998786322513093, 'samples': 666048, 'steps': 3468, 'loss/train': 2.309483528137207} -11/06/2021 21:45:05 - INFO - __main__ - Step 3470: {'lr': 0.0004998784668572375, 'samples': 666240, 'steps': 3469, 'loss/train': 1.9443069696426392} -11/06/2021 21:45:06 - INFO - __main__ - Step 3471: {'lr': 0.0004998783013505743, 'samples': 666432, 'steps': 3470, 'loss/train': 2.0072755813598633} -11/06/2021 21:45:07 - INFO - __main__ - Step 3472: {'lr': 0.0004998781357313198, 'samples': 666624, 'steps': 3471, 'loss/train': 2.455528974533081} -11/06/2021 21:45:07 - INFO - __main__ - Step 3473: {'lr': 0.0004998779699994741, 'samples': 666816, 'steps': 3472, 'loss/train': 2.9603943824768066} -11/06/2021 21:45:07 - INFO - __main__ - Step 3474: {'lr': 0.0004998778041550372, 'samples': 667008, 'steps': 3473, 'loss/train': 2.1143574714660645} -11/06/2021 21:45:08 - INFO - __main__ - Step 3475: {'lr': 0.0004998776381980092, 'samples': 667200, 'steps': 3474, 'loss/train': 2.124244213104248} -11/06/2021 21:45:08 - INFO - __main__ - Step 3476: {'lr': 0.0004998774721283903, 'samples': 667392, 'steps': 3475, 'loss/train': 2.0879619121551514} -11/06/2021 21:45:09 - INFO - __main__ - Step 3477: {'lr': 0.0004998773059461803, 'samples': 667584, 'steps': 3476, 'loss/train': 2.3110809326171875} -11/06/2021 21:45:10 - INFO - __main__ - Step 3478: {'lr': 0.0004998771396513796, 'samples': 667776, 'steps': 3477, 'loss/train': 2.4501490592956543} -11/06/2021 21:45:10 - INFO - __main__ - Step 3479: {'lr': 0.000499876973243988, 'samples': 667968, 'steps': 3478, 'loss/train': 1.411661148071289} -11/06/2021 21:45:10 - INFO - __main__ - Step 3480: {'lr': 0.0004998768067240059, 'samples': 668160, 'steps': 3479, 'loss/train': 2.6114776134490967} -11/06/2021 21:45:11 - INFO - __main__ - Step 3481: {'lr': 0.0004998766400914329, 'samples': 668352, 'steps': 3480, 'loss/train': 2.1029934883117676} -11/06/2021 21:45:12 - INFO - __main__ - Step 3482: {'lr': 0.0004998764733462694, 'samples': 668544, 'steps': 3481, 'loss/train': 1.7680230140686035} -11/06/2021 21:45:12 - INFO - __main__ - Step 3483: {'lr': 0.0004998763064885155, 'samples': 668736, 'steps': 3482, 'loss/train': 2.153639554977417} -11/06/2021 21:45:12 - INFO - __main__ - Step 3484: {'lr': 0.0004998761395181712, 'samples': 668928, 'steps': 3483, 'loss/train': 2.03013014793396} -11/06/2021 21:45:13 - INFO - __main__ - Step 3485: {'lr': 0.0004998759724352365, 'samples': 669120, 'steps': 3484, 'loss/train': 0.6211015582084656} -11/06/2021 21:45:13 - INFO - __main__ - Step 3486: {'lr': 0.0004998758052397115, 'samples': 669312, 'steps': 3485, 'loss/train': 1.9367340803146362} -11/06/2021 21:45:14 - INFO - __main__ - Step 3487: {'lr': 0.0004998756379315964, 'samples': 669504, 'steps': 3486, 'loss/train': 1.8777623176574707} -11/06/2021 21:45:14 - INFO - __main__ - Step 3488: {'lr': 0.0004998754705108912, 'samples': 669696, 'steps': 3487, 'loss/train': 2.432539939880371} -11/06/2021 21:45:15 - INFO - __main__ - Step 3489: {'lr': 0.000499875302977596, 'samples': 669888, 'steps': 3488, 'loss/train': 2.30979585647583} -11/06/2021 21:45:15 - INFO - __main__ - Step 3490: {'lr': 0.0004998751353317108, 'samples': 670080, 'steps': 3489, 'loss/train': 2.282562017440796} -11/06/2021 21:45:15 - INFO - __main__ - Step 3491: {'lr': 0.0004998749675732357, 'samples': 670272, 'steps': 3490, 'loss/train': 2.008915662765503} -11/06/2021 21:45:17 - INFO - __main__ - Step 3492: {'lr': 0.0004998747997021708, 'samples': 670464, 'steps': 3491, 'loss/train': 2.295339584350586} -11/06/2021 21:45:17 - INFO - __main__ - Step 3493: {'lr': 0.0004998746317185162, 'samples': 670656, 'steps': 3492, 'loss/train': 2.1820249557495117} -11/06/2021 21:45:18 - INFO - __main__ - Step 3494: {'lr': 0.000499874463622272, 'samples': 670848, 'steps': 3493, 'loss/train': 2.051396131515503} -11/06/2021 21:45:18 - INFO - __main__ - Step 3495: {'lr': 0.000499874295413438, 'samples': 671040, 'steps': 3494, 'loss/train': 1.9268534183502197} -11/06/2021 21:45:18 - INFO - __main__ - Step 3496: {'lr': 0.0004998741270920147, 'samples': 671232, 'steps': 3495, 'loss/train': 2.2112491130828857} -11/06/2021 21:45:19 - INFO - __main__ - Step 3497: {'lr': 0.0004998739586580019, 'samples': 671424, 'steps': 3496, 'loss/train': 2.0771069526672363} -11/06/2021 21:45:19 - INFO - __main__ - Step 3498: {'lr': 0.0004998737901113999, 'samples': 671616, 'steps': 3497, 'loss/train': 5.947204113006592} -11/06/2021 21:45:20 - INFO - __main__ - Step 3499: {'lr': 0.0004998736214522084, 'samples': 671808, 'steps': 3498, 'loss/train': 3.6572864055633545} -11/06/2021 21:45:20 - INFO - __main__ - Step 3500: {'lr': 0.0004998734526804278, 'samples': 672000, 'steps': 3499, 'loss/train': 2.2772557735443115} -11/06/2021 21:45:21 - INFO - __main__ - Step 3501: {'lr': 0.0004998732837960581, 'samples': 672192, 'steps': 3500, 'loss/train': 1.6389656066894531} -11/06/2021 21:45:21 - INFO - __main__ - Step 3502: {'lr': 0.0004998731147990993, 'samples': 672384, 'steps': 3501, 'loss/train': 2.0018649101257324} -11/06/2021 21:45:21 - INFO - __main__ - Step 3503: {'lr': 0.0004998729456895516, 'samples': 672576, 'steps': 3502, 'loss/train': 2.645084857940674} -11/06/2021 21:45:23 - INFO - __main__ - Step 3504: {'lr': 0.0004998727764674149, 'samples': 672768, 'steps': 3503, 'loss/train': 2.0491695404052734} -11/06/2021 21:45:23 - INFO - __main__ - Step 3505: {'lr': 0.0004998726071326896, 'samples': 672960, 'steps': 3504, 'loss/train': 1.6065165996551514} -11/06/2021 21:45:23 - INFO - __main__ - Step 3506: {'lr': 0.0004998724376853754, 'samples': 673152, 'steps': 3505, 'loss/train': 1.9586995840072632} -11/06/2021 21:45:24 - INFO - __main__ - Step 3507: {'lr': 0.0004998722681254725, 'samples': 673344, 'steps': 3506, 'loss/train': 1.835058569908142} -11/06/2021 21:45:24 - INFO - __main__ - Step 3508: {'lr': 0.0004998720984529811, 'samples': 673536, 'steps': 3507, 'loss/train': 2.592658519744873} -11/06/2021 21:45:25 - INFO - __main__ - Step 3509: {'lr': 0.0004998719286679011, 'samples': 673728, 'steps': 3508, 'loss/train': 1.8576128482818604} -11/06/2021 21:45:25 - INFO - __main__ - Step 3510: {'lr': 0.0004998717587702328, 'samples': 673920, 'steps': 3509, 'loss/train': 1.9809731245040894} -11/06/2021 21:45:26 - INFO - __main__ - Step 3511: {'lr': 0.0004998715887599759, 'samples': 674112, 'steps': 3510, 'loss/train': 1.734330415725708} -11/06/2021 21:45:26 - INFO - __main__ - Step 3512: {'lr': 0.000499871418637131, 'samples': 674304, 'steps': 3511, 'loss/train': 1.7968868017196655} -11/06/2021 21:45:26 - INFO - __main__ - Step 3513: {'lr': 0.0004998712484016977, 'samples': 674496, 'steps': 3512, 'loss/train': 2.3915631771087646} -11/06/2021 21:45:27 - INFO - __main__ - Step 3514: {'lr': 0.0004998710780536763, 'samples': 674688, 'steps': 3513, 'loss/train': 2.1563174724578857} -11/06/2021 21:45:28 - INFO - __main__ - Step 3515: {'lr': 0.0004998709075930669, 'samples': 674880, 'steps': 3514, 'loss/train': 1.6511495113372803} -11/06/2021 21:45:28 - INFO - __main__ - Step 3516: {'lr': 0.0004998707370198695, 'samples': 675072, 'steps': 3515, 'loss/train': 2.0000085830688477} -11/06/2021 21:45:28 - INFO - __main__ - Step 3517: {'lr': 0.0004998705663340843, 'samples': 675264, 'steps': 3516, 'loss/train': 1.445250153541565} -11/06/2021 21:45:29 - INFO - __main__ - Step 3518: {'lr': 0.0004998703955357111, 'samples': 675456, 'steps': 3517, 'loss/train': 1.4034719467163086} -11/06/2021 21:45:30 - INFO - __main__ - Step 3519: {'lr': 0.0004998702246247502, 'samples': 675648, 'steps': 3518, 'loss/train': 2.529625415802002} -11/06/2021 21:45:30 - INFO - __main__ - Step 3520: {'lr': 0.0004998700536012017, 'samples': 675840, 'steps': 3519, 'loss/train': 2.3188982009887695} -11/06/2021 21:45:30 - INFO - __main__ - Step 3521: {'lr': 0.0004998698824650655, 'samples': 676032, 'steps': 3520, 'loss/train': 0.6927474737167358} -11/06/2021 21:45:31 - INFO - __main__ - Step 3522: {'lr': 0.000499869711216342, 'samples': 676224, 'steps': 3521, 'loss/train': 1.4308483600616455} -11/06/2021 21:45:31 - INFO - __main__ - Step 3523: {'lr': 0.0004998695398550309, 'samples': 676416, 'steps': 3522, 'loss/train': 2.8342642784118652} -11/06/2021 21:45:32 - INFO - __main__ - Step 3524: {'lr': 0.0004998693683811325, 'samples': 676608, 'steps': 3523, 'loss/train': 2.05680513381958} -11/06/2021 21:45:32 - INFO - __main__ - Step 3525: {'lr': 0.0004998691967946468, 'samples': 676800, 'steps': 3524, 'loss/train': 2.1919660568237305} -11/06/2021 21:45:33 - INFO - __main__ - Step 3526: {'lr': 0.000499869025095574, 'samples': 676992, 'steps': 3525, 'loss/train': 1.6675937175750732} -11/06/2021 21:45:33 - INFO - __main__ - Step 3527: {'lr': 0.0004998688532839139, 'samples': 677184, 'steps': 3526, 'loss/train': 2.5993382930755615} -11/06/2021 21:45:34 - INFO - __main__ - Step 3528: {'lr': 0.0004998686813596668, 'samples': 677376, 'steps': 3527, 'loss/train': 2.326568126678467} -11/06/2021 21:45:34 - INFO - __main__ - Step 3529: {'lr': 0.0004998685093228327, 'samples': 677568, 'steps': 3528, 'loss/train': 1.6023788452148438} -11/06/2021 21:45:35 - INFO - __main__ - Step 3530: {'lr': 0.0004998683371734118, 'samples': 677760, 'steps': 3529, 'loss/train': 1.248134732246399} -11/06/2021 21:45:35 - INFO - __main__ - Step 3531: {'lr': 0.000499868164911404, 'samples': 677952, 'steps': 3530, 'loss/train': 1.8184454441070557} -11/06/2021 21:45:36 - INFO - __main__ - Step 3532: {'lr': 0.0004998679925368094, 'samples': 678144, 'steps': 3531, 'loss/train': 1.9451133012771606} -11/06/2021 21:45:36 - INFO - __main__ - Step 3533: {'lr': 0.0004998678200496283, 'samples': 678336, 'steps': 3532, 'loss/train': 2.026451587677002} -11/06/2021 21:45:36 - INFO - __main__ - Step 3534: {'lr': 0.0004998676474498606, 'samples': 678528, 'steps': 3533, 'loss/train': 1.7797132730484009} -11/06/2021 21:45:37 - INFO - __main__ - Step 3535: {'lr': 0.0004998674747375063, 'samples': 678720, 'steps': 3534, 'loss/train': 2.1139495372772217} -11/06/2021 21:45:38 - INFO - __main__ - Step 3536: {'lr': 0.0004998673019125657, 'samples': 678912, 'steps': 3535, 'loss/train': 2.0227255821228027} -11/06/2021 21:45:38 - INFO - __main__ - Step 3537: {'lr': 0.0004998671289750386, 'samples': 679104, 'steps': 3536, 'loss/train': 2.357372283935547} -11/06/2021 21:45:38 - INFO - __main__ - Step 3538: {'lr': 0.0004998669559249252, 'samples': 679296, 'steps': 3537, 'loss/train': 2.0382673740386963} -11/06/2021 21:45:39 - INFO - __main__ - Step 3539: {'lr': 0.0004998667827622258, 'samples': 679488, 'steps': 3538, 'loss/train': 1.8378405570983887} -11/06/2021 21:45:40 - INFO - __main__ - Step 3540: {'lr': 0.0004998666094869402, 'samples': 679680, 'steps': 3539, 'loss/train': 1.9578657150268555} -11/06/2021 21:45:40 - INFO - __main__ - Step 3541: {'lr': 0.0004998664360990685, 'samples': 679872, 'steps': 3540, 'loss/train': 2.1692068576812744} -11/06/2021 21:45:41 - INFO - __main__ - Step 3542: {'lr': 0.0004998662625986109, 'samples': 680064, 'steps': 3541, 'loss/train': 1.96601140499115} -11/06/2021 21:45:41 - INFO - __main__ - Step 3543: {'lr': 0.0004998660889855674, 'samples': 680256, 'steps': 3542, 'loss/train': 2.4479618072509766} -11/06/2021 21:45:41 - INFO - __main__ - Step 3544: {'lr': 0.0004998659152599381, 'samples': 680448, 'steps': 3543, 'loss/train': 2.9186902046203613} -11/06/2021 21:45:43 - INFO - __main__ - Step 3545: {'lr': 0.000499865741421723, 'samples': 680640, 'steps': 3544, 'loss/train': 1.9552292823791504} -11/06/2021 21:45:43 - INFO - __main__ - Step 3546: {'lr': 0.0004998655674709224, 'samples': 680832, 'steps': 3545, 'loss/train': 2.1400067806243896} -11/06/2021 21:45:43 - INFO - __main__ - Step 3547: {'lr': 0.0004998653934075361, 'samples': 681024, 'steps': 3546, 'loss/train': 2.2904787063598633} -11/06/2021 21:45:44 - INFO - __main__ - Step 3548: {'lr': 0.0004998652192315644, 'samples': 681216, 'steps': 3547, 'loss/train': 1.8039276599884033} -11/06/2021 21:45:44 - INFO - __main__ - Step 3549: {'lr': 0.0004998650449430073, 'samples': 681408, 'steps': 3548, 'loss/train': 1.7798856496810913} -11/06/2021 21:45:45 - INFO - __main__ - Step 3550: {'lr': 0.0004998648705418648, 'samples': 681600, 'steps': 3549, 'loss/train': 1.5824065208435059} -11/06/2021 21:45:45 - INFO - __main__ - Step 3551: {'lr': 0.000499864696028137, 'samples': 681792, 'steps': 3550, 'loss/train': 1.8516236543655396} -11/06/2021 21:45:46 - INFO - __main__ - Step 3552: {'lr': 0.000499864521401824, 'samples': 681984, 'steps': 3551, 'loss/train': 2.100595474243164} -11/06/2021 21:45:46 - INFO - __main__ - Step 3553: {'lr': 0.000499864346662926, 'samples': 682176, 'steps': 3552, 'loss/train': 2.4325428009033203} -11/06/2021 21:45:46 - INFO - __main__ - Step 3554: {'lr': 0.000499864171811443, 'samples': 682368, 'steps': 3553, 'loss/train': 1.2289140224456787} -11/06/2021 21:45:47 - INFO - __main__ - Step 3555: {'lr': 0.0004998639968473751, 'samples': 682560, 'steps': 3554, 'loss/train': 2.2943685054779053} -11/06/2021 21:45:48 - INFO - __main__ - Step 3556: {'lr': 0.0004998638217707222, 'samples': 682752, 'steps': 3555, 'loss/train': 2.264774799346924} -11/06/2021 21:45:48 - INFO - __main__ - Step 3557: {'lr': 0.0004998636465814846, 'samples': 682944, 'steps': 3556, 'loss/train': 1.637046217918396} -11/06/2021 21:45:48 - INFO - __main__ - Step 3558: {'lr': 0.0004998634712796622, 'samples': 683136, 'steps': 3557, 'loss/train': 2.0852251052856445} -11/06/2021 21:45:49 - INFO - __main__ - Step 3559: {'lr': 0.0004998632958652554, 'samples': 683328, 'steps': 3558, 'loss/train': 1.820117473602295} -11/06/2021 21:45:50 - INFO - __main__ - Step 3560: {'lr': 0.0004998631203382639, 'samples': 683520, 'steps': 3559, 'loss/train': 2.074711561203003} -11/06/2021 21:45:50 - INFO - __main__ - Step 3561: {'lr': 0.0004998629446986879, 'samples': 683712, 'steps': 3560, 'loss/train': 2.1228792667388916} -11/06/2021 21:45:51 - INFO - __main__ - Step 3562: {'lr': 0.0004998627689465276, 'samples': 683904, 'steps': 3561, 'loss/train': 2.0950121879577637} -11/06/2021 21:45:51 - INFO - __main__ - Step 3563: {'lr': 0.0004998625930817829, 'samples': 684096, 'steps': 3562, 'loss/train': 2.041194200515747} -11/06/2021 21:45:51 - INFO - __main__ - Step 3564: {'lr': 0.0004998624171044541, 'samples': 684288, 'steps': 3563, 'loss/train': 1.9695250988006592} -11/06/2021 21:45:52 - INFO - __main__ - Step 3565: {'lr': 0.000499862241014541, 'samples': 684480, 'steps': 3564, 'loss/train': 2.691624164581299} -11/06/2021 21:45:53 - INFO - __main__ - Step 3566: {'lr': 0.0004998620648120439, 'samples': 684672, 'steps': 3565, 'loss/train': 1.932613730430603} -11/06/2021 21:45:53 - INFO - __main__ - Step 3567: {'lr': 0.0004998618884969628, 'samples': 684864, 'steps': 3566, 'loss/train': 2.155407190322876} -11/06/2021 21:45:53 - INFO - __main__ - Step 3568: {'lr': 0.0004998617120692977, 'samples': 685056, 'steps': 3567, 'loss/train': 1.8647109270095825} -11/06/2021 21:45:54 - INFO - __main__ - Step 3569: {'lr': 0.0004998615355290489, 'samples': 685248, 'steps': 3568, 'loss/train': 0.48862022161483765} -11/06/2021 21:45:55 - INFO - __main__ - Step 3570: {'lr': 0.0004998613588762163, 'samples': 685440, 'steps': 3569, 'loss/train': 2.087411642074585} -11/06/2021 21:45:55 - INFO - __main__ - Step 3571: {'lr': 0.0004998611821108001, 'samples': 685632, 'steps': 3570, 'loss/train': 2.365281820297241} -11/06/2021 21:45:55 - INFO - __main__ - Step 3572: {'lr': 0.0004998610052328002, 'samples': 685824, 'steps': 3571, 'loss/train': 1.9633747339248657} -11/06/2021 21:45:56 - INFO - __main__ - Step 3573: {'lr': 0.0004998608282422169, 'samples': 686016, 'steps': 3572, 'loss/train': 2.195950746536255} -11/06/2021 21:45:56 - INFO - __main__ - Step 3574: {'lr': 0.0004998606511390501, 'samples': 686208, 'steps': 3573, 'loss/train': 1.7376683950424194} -11/06/2021 21:45:56 - INFO - __main__ - Step 3575: {'lr': 0.0004998604739232999, 'samples': 686400, 'steps': 3574, 'loss/train': 2.2785563468933105} -11/06/2021 21:45:58 - INFO - __main__ - Step 3576: {'lr': 0.0004998602965949664, 'samples': 686592, 'steps': 3575, 'loss/train': 1.848177433013916} -11/06/2021 21:45:58 - INFO - __main__ - Step 3577: {'lr': 0.0004998601191540499, 'samples': 686784, 'steps': 3576, 'loss/train': 2.7372477054595947} -11/06/2021 21:45:58 - INFO - __main__ - Step 3578: {'lr': 0.0004998599416005502, 'samples': 686976, 'steps': 3577, 'loss/train': 2.2560975551605225} -11/06/2021 21:45:59 - INFO - __main__ - Step 3579: {'lr': 0.0004998597639344674, 'samples': 687168, 'steps': 3578, 'loss/train': 2.355379819869995} -11/06/2021 21:45:59 - INFO - __main__ - Step 3580: {'lr': 0.0004998595861558016, 'samples': 687360, 'steps': 3579, 'loss/train': 2.119218111038208} -11/06/2021 21:46:00 - INFO - __main__ - Step 3581: {'lr': 0.000499859408264553, 'samples': 687552, 'steps': 3580, 'loss/train': 1.7983760833740234} -11/06/2021 21:46:00 - INFO - __main__ - Step 3582: {'lr': 0.0004998592302607217, 'samples': 687744, 'steps': 3581, 'loss/train': 2.229571580886841} -11/06/2021 21:46:01 - INFO - __main__ - Step 3583: {'lr': 0.0004998590521443075, 'samples': 687936, 'steps': 3582, 'loss/train': 1.9575389623641968} -11/06/2021 21:46:01 - INFO - __main__ - Step 3584: {'lr': 0.0004998588739153108, 'samples': 688128, 'steps': 3583, 'loss/train': 1.7447315454483032} -11/06/2021 21:46:01 - INFO - __main__ - Step 3585: {'lr': 0.0004998586955737316, 'samples': 688320, 'steps': 3584, 'loss/train': 2.1006550788879395} -11/06/2021 21:46:02 - INFO - __main__ - Step 3586: {'lr': 0.0004998585171195698, 'samples': 688512, 'steps': 3585, 'loss/train': 3.3587646484375} -11/06/2021 21:46:03 - INFO - __main__ - Step 3587: {'lr': 0.0004998583385528256, 'samples': 688704, 'steps': 3586, 'loss/train': 2.2408502101898193} -11/06/2021 21:46:03 - INFO - __main__ - Step 3588: {'lr': 0.0004998581598734991, 'samples': 688896, 'steps': 3587, 'loss/train': 1.8953609466552734} -11/06/2021 21:46:04 - INFO - __main__ - Step 3589: {'lr': 0.0004998579810815905, 'samples': 689088, 'steps': 3588, 'loss/train': 2.701934576034546} -11/06/2021 21:46:04 - INFO - __main__ - Step 3590: {'lr': 0.0004998578021770995, 'samples': 689280, 'steps': 3589, 'loss/train': 1.9593024253845215} -11/06/2021 21:46:05 - INFO - __main__ - Step 3591: {'lr': 0.0004998576231600267, 'samples': 689472, 'steps': 3590, 'loss/train': 1.8404669761657715} -11/06/2021 21:46:05 - INFO - __main__ - Step 3592: {'lr': 0.0004998574440303718, 'samples': 689664, 'steps': 3591, 'loss/train': 2.3145079612731934} -11/06/2021 21:46:06 - INFO - __main__ - Step 3593: {'lr': 0.0004998572647881349, 'samples': 689856, 'steps': 3592, 'loss/train': 1.889504075050354} -11/06/2021 21:46:06 - INFO - __main__ - Step 3594: {'lr': 0.0004998570854333163, 'samples': 690048, 'steps': 3593, 'loss/train': 1.687559962272644} -11/06/2021 21:46:06 - INFO - __main__ - Step 3595: {'lr': 0.0004998569059659158, 'samples': 690240, 'steps': 3594, 'loss/train': 1.928205966949463} -11/06/2021 21:46:07 - INFO - __main__ - Step 3596: {'lr': 0.0004998567263859338, 'samples': 690432, 'steps': 3595, 'loss/train': 2.1471500396728516} -11/06/2021 21:46:08 - INFO - __main__ - Step 3597: {'lr': 0.0004998565466933702, 'samples': 690624, 'steps': 3596, 'loss/train': 2.6100289821624756} -11/06/2021 21:46:08 - INFO - __main__ - Step 3598: {'lr': 0.000499856366888225, 'samples': 690816, 'steps': 3597, 'loss/train': 1.6505409479141235} -11/06/2021 21:46:08 - INFO - __main__ - Step 3599: {'lr': 0.0004998561869704983, 'samples': 691008, 'steps': 3598, 'loss/train': 1.5047534704208374} -11/06/2021 21:46:09 - INFO - __main__ - Step 3600: {'lr': 0.0004998560069401905, 'samples': 691200, 'steps': 3599, 'loss/train': 2.1573095321655273} -11/06/2021 21:46:10 - INFO - __main__ - Step 3601: {'lr': 0.0004998558267973013, 'samples': 691392, 'steps': 3600, 'loss/train': 2.1335763931274414} -11/06/2021 21:46:10 - INFO - __main__ - Step 3602: {'lr': 0.0004998556465418309, 'samples': 691584, 'steps': 3601, 'loss/train': 2.135831832885742} -11/06/2021 21:46:11 - INFO - __main__ - Step 3603: {'lr': 0.0004998554661737795, 'samples': 691776, 'steps': 3602, 'loss/train': 2.5998644828796387} -11/06/2021 21:46:11 - INFO - __main__ - Step 3604: {'lr': 0.000499855285693147, 'samples': 691968, 'steps': 3603, 'loss/train': 2.1776552200317383} -11/06/2021 21:46:11 - INFO - __main__ - Step 3605: {'lr': 0.0004998551050999336, 'samples': 692160, 'steps': 3604, 'loss/train': 1.8231139183044434} -11/06/2021 21:46:12 - INFO - __main__ - Step 3606: {'lr': 0.0004998549243941393, 'samples': 692352, 'steps': 3605, 'loss/train': 1.756971001625061} -11/06/2021 21:46:13 - INFO - __main__ - Step 3607: {'lr': 0.0004998547435757643, 'samples': 692544, 'steps': 3606, 'loss/train': 1.6793618202209473} -11/06/2021 21:46:13 - INFO - __main__ - Step 3608: {'lr': 0.0004998545626448087, 'samples': 692736, 'steps': 3607, 'loss/train': 2.033261299133301} -11/06/2021 21:46:13 - INFO - __main__ - Step 3609: {'lr': 0.0004998543816012723, 'samples': 692928, 'steps': 3608, 'loss/train': 2.1296401023864746} -11/06/2021 21:46:14 - INFO - __main__ - Step 3610: {'lr': 0.0004998542004451554, 'samples': 693120, 'steps': 3609, 'loss/train': 2.213966131210327} -11/06/2021 21:46:14 - INFO - __main__ - Step 3611: {'lr': 0.000499854019176458, 'samples': 693312, 'steps': 3610, 'loss/train': 2.0920517444610596} -11/06/2021 21:46:15 - INFO - __main__ - Step 3612: {'lr': 0.0004998538377951803, 'samples': 693504, 'steps': 3611, 'loss/train': 0.8657620549201965} -11/06/2021 21:46:15 - INFO - __main__ - Step 3613: {'lr': 0.0004998536563013224, 'samples': 693696, 'steps': 3612, 'loss/train': 2.072887659072876} -11/06/2021 21:46:16 - INFO - __main__ - Step 3614: {'lr': 0.0004998534746948843, 'samples': 693888, 'steps': 3613, 'loss/train': 1.9264954328536987} -11/06/2021 21:46:16 - INFO - __main__ - Step 3615: {'lr': 0.000499853292975866, 'samples': 694080, 'steps': 3614, 'loss/train': 0.808038592338562} -11/06/2021 21:46:16 - INFO - __main__ - Step 3616: {'lr': 0.0004998531111442676, 'samples': 694272, 'steps': 3615, 'loss/train': 1.6517269611358643} -11/06/2021 21:46:18 - INFO - __main__ - Step 3617: {'lr': 0.0004998529292000893, 'samples': 694464, 'steps': 3616, 'loss/train': 2.1595749855041504} -11/06/2021 21:46:18 - INFO - __main__ - Step 3618: {'lr': 0.0004998527471433312, 'samples': 694656, 'steps': 3617, 'loss/train': 1.3440548181533813} -11/06/2021 21:46:18 - INFO - __main__ - Step 3619: {'lr': 0.0004998525649739932, 'samples': 694848, 'steps': 3618, 'loss/train': 1.8935426473617554} -11/06/2021 21:46:19 - INFO - __main__ - Step 3620: {'lr': 0.0004998523826920756, 'samples': 695040, 'steps': 3619, 'loss/train': 2.0238497257232666} -11/06/2021 21:46:19 - INFO - __main__ - Step 3621: {'lr': 0.0004998522002975783, 'samples': 695232, 'steps': 3620, 'loss/train': 2.4836816787719727} -11/06/2021 21:46:20 - INFO - __main__ - Step 3622: {'lr': 0.0004998520177905015, 'samples': 695424, 'steps': 3621, 'loss/train': 1.8629294633865356} -11/06/2021 21:46:20 - INFO - __main__ - Step 3623: {'lr': 0.0004998518351708452, 'samples': 695616, 'steps': 3622, 'loss/train': 2.230546712875366} -11/06/2021 21:46:21 - INFO - __main__ - Step 3624: {'lr': 0.0004998516524386095, 'samples': 695808, 'steps': 3623, 'loss/train': 2.3679111003875732} -11/06/2021 21:46:21 - INFO - __main__ - Step 3625: {'lr': 0.0004998514695937945, 'samples': 696000, 'steps': 3624, 'loss/train': 2.3775951862335205} -11/06/2021 21:46:21 - INFO - __main__ - Step 3626: {'lr': 0.0004998512866364003, 'samples': 696192, 'steps': 3625, 'loss/train': 1.8260321617126465} -11/06/2021 21:46:23 - INFO - __main__ - Step 3627: {'lr': 0.000499851103566427, 'samples': 696384, 'steps': 3626, 'loss/train': 2.3718161582946777} -11/06/2021 21:46:24 - INFO - __main__ - Step 3628: {'lr': 0.0004998509203838746, 'samples': 696576, 'steps': 3627, 'loss/train': 2.2593507766723633} -11/06/2021 21:46:24 - INFO - __main__ - Step 3629: {'lr': 0.0004998507370887433, 'samples': 696768, 'steps': 3628, 'loss/train': 2.683199882507324} -11/06/2021 21:46:24 - INFO - __main__ - Step 3630: {'lr': 0.000499850553681033, 'samples': 696960, 'steps': 3629, 'loss/train': 3.9143762588500977} -11/06/2021 21:46:25 - INFO - __main__ - Step 3631: {'lr': 0.000499850370160744, 'samples': 697152, 'steps': 3630, 'loss/train': 5.931422233581543} -11/06/2021 21:46:25 - INFO - __main__ - Step 3632: {'lr': 0.0004998501865278762, 'samples': 697344, 'steps': 3631, 'loss/train': 1.1052885055541992} -11/06/2021 21:46:25 - INFO - __main__ - Step 3633: {'lr': 0.0004998500027824298, 'samples': 697536, 'steps': 3632, 'loss/train': 1.352131724357605} -11/06/2021 21:46:26 - INFO - __main__ - Step 3634: {'lr': 0.0004998498189244049, 'samples': 697728, 'steps': 3633, 'loss/train': 2.097627639770508} -11/06/2021 21:46:27 - INFO - __main__ - Step 3635: {'lr': 0.0004998496349538015, 'samples': 697920, 'steps': 3634, 'loss/train': 2.872110605239868} -11/06/2021 21:46:27 - INFO - __main__ - Step 3636: {'lr': 0.0004998494508706196, 'samples': 698112, 'steps': 3635, 'loss/train': 1.6961387395858765} -11/06/2021 21:46:27 - INFO - __main__ - Step 3637: {'lr': 0.0004998492666748594, 'samples': 698304, 'steps': 3636, 'loss/train': 2.1306369304656982} -11/06/2021 21:46:28 - INFO - __main__ - Step 3638: {'lr': 0.0004998490823665211, 'samples': 698496, 'steps': 3637, 'loss/train': 2.1220192909240723} -11/06/2021 21:46:29 - INFO - __main__ - Step 3639: {'lr': 0.0004998488979456046, 'samples': 698688, 'steps': 3638, 'loss/train': 2.4169700145721436} -11/06/2021 21:46:29 - INFO - __main__ - Step 3640: {'lr': 0.00049984871341211, 'samples': 698880, 'steps': 3639, 'loss/train': 2.1508548259735107} -11/06/2021 21:46:30 - INFO - __main__ - Step 3641: {'lr': 0.0004998485287660375, 'samples': 699072, 'steps': 3640, 'loss/train': 2.348625898361206} -11/06/2021 21:46:30 - INFO - __main__ - Step 3642: {'lr': 0.0004998483440073871, 'samples': 699264, 'steps': 3641, 'loss/train': 2.3207335472106934} -11/06/2021 21:46:30 - INFO - __main__ - Step 3643: {'lr': 0.0004998481591361589, 'samples': 699456, 'steps': 3642, 'loss/train': 2.584690570831299} -11/06/2021 21:46:31 - INFO - __main__ - Step 3644: {'lr': 0.000499847974152353, 'samples': 699648, 'steps': 3643, 'loss/train': 1.8976331949234009} -11/06/2021 21:46:32 - INFO - __main__ - Step 3645: {'lr': 0.0004998477890559693, 'samples': 699840, 'steps': 3644, 'loss/train': 1.7949036359786987} -11/06/2021 21:46:32 - INFO - __main__ - Step 3646: {'lr': 0.0004998476038470082, 'samples': 700032, 'steps': 3645, 'loss/train': 2.1402628421783447} -11/06/2021 21:46:32 - INFO - __main__ - Step 3647: {'lr': 0.0004998474185254696, 'samples': 700224, 'steps': 3646, 'loss/train': 2.140929937362671} -11/06/2021 21:46:33 - INFO - __main__ - Step 3648: {'lr': 0.0004998472330913535, 'samples': 700416, 'steps': 3647, 'loss/train': 1.1526223421096802} -11/06/2021 21:46:34 - INFO - __main__ - Step 3649: {'lr': 0.0004998470475446603, 'samples': 700608, 'steps': 3648, 'loss/train': 2.2785234451293945} -11/06/2021 21:46:34 - INFO - __main__ - Step 3650: {'lr': 0.0004998468618853896, 'samples': 700800, 'steps': 3649, 'loss/train': 2.1500542163848877} -11/06/2021 21:46:35 - INFO - __main__ - Step 3651: {'lr': 0.000499846676113542, 'samples': 700992, 'steps': 3650, 'loss/train': 2.041510820388794} -11/06/2021 21:46:35 - INFO - __main__ - Step 3652: {'lr': 0.0004998464902291173, 'samples': 701184, 'steps': 3651, 'loss/train': 2.313647985458374} -11/06/2021 21:46:35 - INFO - __main__ - Step 3653: {'lr': 0.0004998463042321155, 'samples': 701376, 'steps': 3652, 'loss/train': 1.6131926774978638} -11/06/2021 21:46:36 - INFO - __main__ - Step 3654: {'lr': 0.0004998461181225369, 'samples': 701568, 'steps': 3653, 'loss/train': 2.0128300189971924} -11/06/2021 21:46:37 - INFO - __main__ - Step 3655: {'lr': 0.0004998459319003815, 'samples': 701760, 'steps': 3654, 'loss/train': 2.388474464416504} -11/06/2021 21:46:37 - INFO - __main__ - Step 3656: {'lr': 0.0004998457455656493, 'samples': 701952, 'steps': 3655, 'loss/train': 1.8429226875305176} -11/06/2021 21:46:37 - INFO - __main__ - Step 3657: {'lr': 0.0004998455591183406, 'samples': 702144, 'steps': 3656, 'loss/train': 2.267188310623169} -11/06/2021 21:46:38 - INFO - __main__ - Step 3658: {'lr': 0.0004998453725584552, 'samples': 702336, 'steps': 3657, 'loss/train': 2.0592057704925537} -11/06/2021 21:46:39 - INFO - __main__ - Step 3659: {'lr': 0.0004998451858859934, 'samples': 702528, 'steps': 3658, 'loss/train': 1.9567612409591675} -11/06/2021 21:46:39 - INFO - __main__ - Step 3660: {'lr': 0.0004998449991009552, 'samples': 702720, 'steps': 3659, 'loss/train': 2.084226608276367} -11/06/2021 21:46:39 - INFO - __main__ - Step 3661: {'lr': 0.0004998448122033408, 'samples': 702912, 'steps': 3660, 'loss/train': 2.5636651515960693} -11/06/2021 21:46:40 - INFO - __main__ - Step 3662: {'lr': 0.00049984462519315, 'samples': 703104, 'steps': 3661, 'loss/train': 2.506985664367676} -11/06/2021 21:46:40 - INFO - __main__ - Step 3663: {'lr': 0.0004998444380703832, 'samples': 703296, 'steps': 3662, 'loss/train': 2.208871603012085} -11/06/2021 21:46:41 - INFO - __main__ - Step 3664: {'lr': 0.0004998442508350404, 'samples': 703488, 'steps': 3663, 'loss/train': 2.199995994567871} -11/06/2021 21:46:41 - INFO - __main__ - Step 3665: {'lr': 0.0004998440634871215, 'samples': 703680, 'steps': 3664, 'loss/train': 1.8999465703964233} -11/06/2021 21:46:42 - INFO - __main__ - Step 3666: {'lr': 0.0004998438760266267, 'samples': 703872, 'steps': 3665, 'loss/train': 2.107455253601074} -11/06/2021 21:46:42 - INFO - __main__ - Step 3667: {'lr': 0.0004998436884535562, 'samples': 704064, 'steps': 3666, 'loss/train': 1.854463815689087} -11/06/2021 21:46:42 - INFO - __main__ - Step 3668: {'lr': 0.00049984350076791, 'samples': 704256, 'steps': 3667, 'loss/train': 2.7667548656463623} -11/06/2021 21:46:44 - INFO - __main__ - Step 3669: {'lr': 0.0004998433129696882, 'samples': 704448, 'steps': 3668, 'loss/train': 1.5981824398040771} -11/06/2021 21:46:44 - INFO - __main__ - Step 3670: {'lr': 0.0004998431250588907, 'samples': 704640, 'steps': 3669, 'loss/train': 2.160209894180298} -11/06/2021 21:46:44 - INFO - __main__ - Step 3671: {'lr': 0.0004998429370355179, 'samples': 704832, 'steps': 3670, 'loss/train': 1.8680161237716675} -11/06/2021 21:46:45 - INFO - __main__ - Step 3672: {'lr': 0.0004998427488995697, 'samples': 705024, 'steps': 3671, 'loss/train': 2.518526315689087} -11/06/2021 21:46:45 - INFO - __main__ - Step 3673: {'lr': 0.0004998425606510461, 'samples': 705216, 'steps': 3672, 'loss/train': 2.714362621307373} -11/06/2021 21:46:45 - INFO - __main__ - Step 3674: {'lr': 0.0004998423722899475, 'samples': 705408, 'steps': 3673, 'loss/train': 1.8246042728424072} -11/06/2021 21:46:46 - INFO - __main__ - Step 3675: {'lr': 0.0004998421838162735, 'samples': 705600, 'steps': 3674, 'loss/train': 0.9275121688842773} -11/06/2021 21:46:47 - INFO - __main__ - Step 3676: {'lr': 0.0004998419952300247, 'samples': 705792, 'steps': 3675, 'loss/train': 2.0111794471740723} -11/06/2021 21:46:47 - INFO - __main__ - Step 3677: {'lr': 0.0004998418065312009, 'samples': 705984, 'steps': 3676, 'loss/train': 1.89971923828125} -11/06/2021 21:46:47 - INFO - __main__ - Step 3678: {'lr': 0.0004998416177198022, 'samples': 706176, 'steps': 3677, 'loss/train': 1.930174708366394} -11/06/2021 21:46:48 - INFO - __main__ - Step 3679: {'lr': 0.0004998414287958288, 'samples': 706368, 'steps': 3678, 'loss/train': 2.1186258792877197} -11/06/2021 21:46:49 - INFO - __main__ - Step 3680: {'lr': 0.0004998412397592807, 'samples': 706560, 'steps': 3679, 'loss/train': 2.1540133953094482} -11/06/2021 21:46:49 - INFO - __main__ - Step 3681: {'lr': 0.0004998410506101579, 'samples': 706752, 'steps': 3680, 'loss/train': 1.5001546144485474} -11/06/2021 21:46:50 - INFO - __main__ - Step 3682: {'lr': 0.0004998408613484605, 'samples': 706944, 'steps': 3681, 'loss/train': 1.7224041223526} -11/06/2021 21:46:50 - INFO - __main__ - Step 3683: {'lr': 0.0004998406719741888, 'samples': 707136, 'steps': 3682, 'loss/train': 1.118072509765625} -11/06/2021 21:46:51 - INFO - __main__ - Step 3684: {'lr': 0.0004998404824873428, 'samples': 707328, 'steps': 3683, 'loss/train': 1.8773263692855835} -11/06/2021 21:46:51 - INFO - __main__ - Step 3685: {'lr': 0.0004998402928879225, 'samples': 707520, 'steps': 3684, 'loss/train': 1.9647787809371948} -11/06/2021 21:46:52 - INFO - __main__ - Step 3686: {'lr': 0.000499840103175928, 'samples': 707712, 'steps': 3685, 'loss/train': 2.2132978439331055} -11/06/2021 21:46:52 - INFO - __main__ - Step 3687: {'lr': 0.0004998399133513594, 'samples': 707904, 'steps': 3686, 'loss/train': 2.232158899307251} -11/06/2021 21:46:53 - INFO - __main__ - Step 3688: {'lr': 0.0004998397234142167, 'samples': 708096, 'steps': 3687, 'loss/train': 2.528634786605835} -11/06/2021 21:46:53 - INFO - __main__ - Step 3689: {'lr': 0.0004998395333645002, 'samples': 708288, 'steps': 3688, 'loss/train': 2.5124094486236572} -11/06/2021 21:46:54 - INFO - __main__ - Step 3690: {'lr': 0.0004998393432022098, 'samples': 708480, 'steps': 3689, 'loss/train': 2.4985034465789795} -11/06/2021 21:46:54 - INFO - __main__ - Step 3691: {'lr': 0.0004998391529273457, 'samples': 708672, 'steps': 3690, 'loss/train': 2.0140085220336914} -11/06/2021 21:46:55 - INFO - __main__ - Step 3692: {'lr': 0.0004998389625399079, 'samples': 708864, 'steps': 3691, 'loss/train': 1.7472585439682007} -11/06/2021 21:46:55 - INFO - __main__ - Step 3693: {'lr': 0.0004998387720398965, 'samples': 709056, 'steps': 3692, 'loss/train': 2.138169527053833} -11/06/2021 21:46:55 - INFO - __main__ - Step 3694: {'lr': 0.0004998385814273116, 'samples': 709248, 'steps': 3693, 'loss/train': 1.8398798704147339} -11/06/2021 21:46:56 - INFO - __main__ - Step 3695: {'lr': 0.0004998383907021533, 'samples': 709440, 'steps': 3694, 'loss/train': 2.2453384399414062} -11/06/2021 21:46:57 - INFO - __main__ - Step 3696: {'lr': 0.0004998381998644217, 'samples': 709632, 'steps': 3695, 'loss/train': 2.210822105407715} -11/06/2021 21:46:57 - INFO - __main__ - Step 3697: {'lr': 0.0004998380089141169, 'samples': 709824, 'steps': 3696, 'loss/train': 1.83198082447052} -11/06/2021 21:46:57 - INFO - __main__ - Step 3698: {'lr': 0.0004998378178512388, 'samples': 710016, 'steps': 3697, 'loss/train': 2.363736391067505} -11/06/2021 21:46:58 - INFO - __main__ - Step 3699: {'lr': 0.0004998376266757878, 'samples': 710208, 'steps': 3698, 'loss/train': 1.7178457975387573} -11/06/2021 21:46:58 - INFO - __main__ - Step 3700: {'lr': 0.0004998374353877638, 'samples': 710400, 'steps': 3699, 'loss/train': 1.9114118814468384} -11/06/2021 21:46:59 - INFO - __main__ - Step 3701: {'lr': 0.0004998372439871668, 'samples': 710592, 'steps': 3700, 'loss/train': 2.2929277420043945} -11/06/2021 21:46:59 - INFO - __main__ - Step 3702: {'lr': 0.000499837052473997, 'samples': 710784, 'steps': 3701, 'loss/train': 2.206447124481201} -11/06/2021 21:47:00 - INFO - __main__ - Step 3703: {'lr': 0.0004998368608482546, 'samples': 710976, 'steps': 3702, 'loss/train': 2.2719476222991943} -11/06/2021 21:47:00 - INFO - __main__ - Step 3704: {'lr': 0.0004998366691099395, 'samples': 711168, 'steps': 3703, 'loss/train': 1.9696950912475586} -11/06/2021 21:47:01 - INFO - __main__ - Step 3705: {'lr': 0.0004998364772590518, 'samples': 711360, 'steps': 3704, 'loss/train': 1.9279074668884277} -11/06/2021 21:47:02 - INFO - __main__ - Step 3706: {'lr': 0.0004998362852955918, 'samples': 711552, 'steps': 3705, 'loss/train': 2.3700718879699707} -11/06/2021 21:47:02 - INFO - __main__ - Step 3707: {'lr': 0.0004998360932195593, 'samples': 711744, 'steps': 3706, 'loss/train': 2.2039358615875244} -11/06/2021 21:47:02 - INFO - __main__ - Step 3708: {'lr': 0.0004998359010309544, 'samples': 711936, 'steps': 3707, 'loss/train': 2.483283758163452} -11/06/2021 21:47:03 - INFO - __main__ - Step 3709: {'lr': 0.0004998357087297775, 'samples': 712128, 'steps': 3708, 'loss/train': 1.5728569030761719} -11/06/2021 21:47:03 - INFO - __main__ - Step 3710: {'lr': 0.0004998355163160285, 'samples': 712320, 'steps': 3709, 'loss/train': 1.6009992361068726} -11/06/2021 21:47:04 - INFO - __main__ - Step 3711: {'lr': 0.0004998353237897073, 'samples': 712512, 'steps': 3710, 'loss/train': 2.459540605545044} -11/06/2021 21:47:04 - INFO - __main__ - Step 3712: {'lr': 0.0004998351311508143, 'samples': 712704, 'steps': 3711, 'loss/train': 1.7308366298675537} -11/06/2021 21:47:05 - INFO - __main__ - Step 3713: {'lr': 0.0004998349383993493, 'samples': 712896, 'steps': 3712, 'loss/train': 2.191849708557129} -11/06/2021 21:47:05 - INFO - __main__ - Step 3714: {'lr': 0.0004998347455353126, 'samples': 713088, 'steps': 3713, 'loss/train': 2.918881893157959} -11/06/2021 21:47:05 - INFO - __main__ - Step 3715: {'lr': 0.0004998345525587042, 'samples': 713280, 'steps': 3714, 'loss/train': 2.113539695739746} -11/06/2021 21:47:06 - INFO - __main__ - Step 3716: {'lr': 0.0004998343594695242, 'samples': 713472, 'steps': 3715, 'loss/train': 1.7858660221099854} -11/06/2021 21:47:07 - INFO - __main__ - Step 3717: {'lr': 0.0004998341662677728, 'samples': 713664, 'steps': 3716, 'loss/train': 1.8981730937957764} -11/06/2021 21:47:07 - INFO - __main__ - Step 3718: {'lr': 0.0004998339729534499, 'samples': 713856, 'steps': 3717, 'loss/train': 2.5536508560180664} -11/06/2021 21:47:07 - INFO - __main__ - Step 3719: {'lr': 0.0004998337795265557, 'samples': 714048, 'steps': 3718, 'loss/train': 2.2563905715942383} -11/06/2021 21:47:08 - INFO - __main__ - Step 3720: {'lr': 0.0004998335859870903, 'samples': 714240, 'steps': 3719, 'loss/train': 1.7998706102371216} -11/06/2021 21:47:09 - INFO - __main__ - Step 3721: {'lr': 0.0004998333923350536, 'samples': 714432, 'steps': 3720, 'loss/train': 2.0226428508758545} -11/06/2021 21:47:09 - INFO - __main__ - Step 3722: {'lr': 0.000499833198570446, 'samples': 714624, 'steps': 3721, 'loss/train': 1.3011538982391357} -11/06/2021 21:47:10 - INFO - __main__ - Step 3723: {'lr': 0.0004998330046932672, 'samples': 714816, 'steps': 3722, 'loss/train': 2.5336453914642334} -11/06/2021 21:47:10 - INFO - __main__ - Step 3724: {'lr': 0.0004998328107035176, 'samples': 715008, 'steps': 3723, 'loss/train': 2.392589807510376} -11/06/2021 21:47:10 - INFO - __main__ - Step 3725: {'lr': 0.0004998326166011973, 'samples': 715200, 'steps': 3724, 'loss/train': 2.1815335750579834} -11/06/2021 21:47:11 - INFO - __main__ - Step 3726: {'lr': 0.0004998324223863061, 'samples': 715392, 'steps': 3725, 'loss/train': 6.898614406585693} -11/06/2021 21:47:12 - INFO - __main__ - Step 3727: {'lr': 0.0004998322280588445, 'samples': 715584, 'steps': 3726, 'loss/train': 1.5503253936767578} -11/06/2021 21:47:12 - INFO - __main__ - Step 3728: {'lr': 0.0004998320336188121, 'samples': 715776, 'steps': 3727, 'loss/train': 2.2275030612945557} -11/06/2021 21:47:12 - INFO - __main__ - Step 3729: {'lr': 0.0004998318390662095, 'samples': 715968, 'steps': 3728, 'loss/train': 1.9741984605789185} -11/06/2021 21:47:13 - INFO - __main__ - Step 3730: {'lr': 0.0004998316444010363, 'samples': 716160, 'steps': 3729, 'loss/train': 1.3006471395492554} -11/06/2021 21:47:13 - INFO - __main__ - Step 3731: {'lr': 0.0004998314496232929, 'samples': 716352, 'steps': 3730, 'loss/train': 2.1504995822906494} -11/06/2021 21:47:14 - INFO - __main__ - Step 3732: {'lr': 0.0004998312547329793, 'samples': 716544, 'steps': 3731, 'loss/train': 2.3918561935424805} -11/06/2021 21:47:14 - INFO - __main__ - Step 3733: {'lr': 0.0004998310597300956, 'samples': 716736, 'steps': 3732, 'loss/train': 2.505441665649414} -11/06/2021 21:47:15 - INFO - __main__ - Step 3734: {'lr': 0.0004998308646146419, 'samples': 716928, 'steps': 3733, 'loss/train': 1.6491429805755615} -11/06/2021 21:47:15 - INFO - __main__ - Step 3735: {'lr': 0.0004998306693866181, 'samples': 717120, 'steps': 3734, 'loss/train': 2.3682384490966797} -11/06/2021 21:47:15 - INFO - __main__ - Step 3736: {'lr': 0.0004998304740460247, 'samples': 717312, 'steps': 3735, 'loss/train': 1.748855471611023} -11/06/2021 21:47:16 - INFO - __main__ - Step 3737: {'lr': 0.0004998302785928614, 'samples': 717504, 'steps': 3736, 'loss/train': 3.4032115936279297} -11/06/2021 21:47:17 - INFO - __main__ - Step 3738: {'lr': 0.0004998300830271285, 'samples': 717696, 'steps': 3737, 'loss/train': 2.2181355953216553} -11/06/2021 21:47:17 - INFO - __main__ - Step 3739: {'lr': 0.000499829887348826, 'samples': 717888, 'steps': 3738, 'loss/train': 2.0063092708587646} -11/06/2021 21:47:17 - INFO - __main__ - Step 3740: {'lr': 0.0004998296915579539, 'samples': 718080, 'steps': 3739, 'loss/train': 2.2116055488586426} -11/06/2021 21:47:18 - INFO - __main__ - Step 3741: {'lr': 0.0004998294956545125, 'samples': 718272, 'steps': 3740, 'loss/train': 2.458434820175171} -11/06/2021 21:47:19 - INFO - __main__ - Step 3742: {'lr': 0.0004998292996385019, 'samples': 718464, 'steps': 3741, 'loss/train': 2.001145839691162} -11/06/2021 21:47:19 - INFO - __main__ - Step 3743: {'lr': 0.0004998291035099219, 'samples': 718656, 'steps': 3742, 'loss/train': 1.889823079109192} -11/06/2021 21:47:20 - INFO - __main__ - Step 3744: {'lr': 0.0004998289072687728, 'samples': 718848, 'steps': 3743, 'loss/train': 2.2206709384918213} -11/06/2021 21:47:20 - INFO - __main__ - Step 3745: {'lr': 0.0004998287109150547, 'samples': 719040, 'steps': 3744, 'loss/train': 1.8798199892044067} -11/06/2021 21:47:20 - INFO - __main__ - Step 3746: {'lr': 0.0004998285144487676, 'samples': 719232, 'steps': 3745, 'loss/train': 2.057377576828003} -11/06/2021 21:47:21 - INFO - __main__ - Step 3747: {'lr': 0.0004998283178699116, 'samples': 719424, 'steps': 3746, 'loss/train': 1.8531581163406372} -11/06/2021 21:47:22 - INFO - __main__ - Step 3748: {'lr': 0.0004998281211784869, 'samples': 719616, 'steps': 3747, 'loss/train': 2.3435657024383545} -11/06/2021 21:47:22 - INFO - __main__ - Step 3749: {'lr': 0.0004998279243744934, 'samples': 719808, 'steps': 3748, 'loss/train': 2.2125914096832275} -11/06/2021 21:47:22 - INFO - __main__ - Step 3750: {'lr': 0.0004998277274579313, 'samples': 720000, 'steps': 3749, 'loss/train': 2.172743558883667} -11/06/2021 21:47:23 - INFO - __main__ - Step 3751: {'lr': 0.0004998275304288007, 'samples': 720192, 'steps': 3750, 'loss/train': 1.698510766029358} -11/06/2021 21:47:24 - INFO - __main__ - Step 3752: {'lr': 0.0004998273332871017, 'samples': 720384, 'steps': 3751, 'loss/train': 2.1584572792053223} -11/06/2021 21:47:24 - INFO - __main__ - Step 3753: {'lr': 0.0004998271360328344, 'samples': 720576, 'steps': 3752, 'loss/train': 1.8731579780578613} -11/06/2021 21:47:24 - INFO - __main__ - Step 3754: {'lr': 0.0004998269386659988, 'samples': 720768, 'steps': 3753, 'loss/train': 2.281588077545166} -11/06/2021 21:47:25 - INFO - __main__ - Step 3755: {'lr': 0.000499826741186595, 'samples': 720960, 'steps': 3754, 'loss/train': 2.172957420349121} -11/06/2021 21:47:25 - INFO - __main__ - Step 3756: {'lr': 0.0004998265435946232, 'samples': 721152, 'steps': 3755, 'loss/train': 2.0597519874572754} -11/06/2021 21:47:26 - INFO - __main__ - Step 3757: {'lr': 0.0004998263458900833, 'samples': 721344, 'steps': 3756, 'loss/train': 1.874323844909668} -11/06/2021 21:47:26 - INFO - __main__ - Step 3758: {'lr': 0.0004998261480729755, 'samples': 721536, 'steps': 3757, 'loss/train': 2.4779069423675537} -11/06/2021 21:47:27 - INFO - __main__ - Step 3759: {'lr': 0.0004998259501433, 'samples': 721728, 'steps': 3758, 'loss/train': 2.595695734024048} -11/06/2021 21:47:27 - INFO - __main__ - Step 3760: {'lr': 0.0004998257521010567, 'samples': 721920, 'steps': 3759, 'loss/train': 2.313114643096924} -11/06/2021 21:47:27 - INFO - __main__ - Step 3761: {'lr': 0.0004998255539462459, 'samples': 722112, 'steps': 3760, 'loss/train': 1.7417014837265015} -11/06/2021 21:47:28 - INFO - __main__ - Step 3762: {'lr': 0.0004998253556788675, 'samples': 722304, 'steps': 3761, 'loss/train': 2.088002920150757} -11/06/2021 21:47:29 - INFO - __main__ - Step 3763: {'lr': 0.0004998251572989217, 'samples': 722496, 'steps': 3762, 'loss/train': 2.2535784244537354} -11/06/2021 21:47:29 - INFO - __main__ - Step 3764: {'lr': 0.0004998249588064085, 'samples': 722688, 'steps': 3763, 'loss/train': 1.551037073135376} -11/06/2021 21:47:30 - INFO - __main__ - Step 3765: {'lr': 0.0004998247602013278, 'samples': 722880, 'steps': 3764, 'loss/train': 2.5815794467926025} -11/06/2021 21:47:30 - INFO - __main__ - Step 3766: {'lr': 0.0004998245614836802, 'samples': 723072, 'steps': 3765, 'loss/train': 2.278775930404663} -11/06/2021 21:47:30 - INFO - __main__ - Step 3767: {'lr': 0.0004998243626534655, 'samples': 723264, 'steps': 3766, 'loss/train': 2.4035115242004395} -11/06/2021 21:47:31 - INFO - __main__ - Step 3768: {'lr': 0.0004998241637106836, 'samples': 723456, 'steps': 3767, 'loss/train': 2.4984121322631836} -11/06/2021 21:47:32 - INFO - __main__ - Step 3769: {'lr': 0.0004998239646553349, 'samples': 723648, 'steps': 3768, 'loss/train': 1.8377968072891235} -11/06/2021 21:47:32 - INFO - __main__ - Step 3770: {'lr': 0.0004998237654874195, 'samples': 723840, 'steps': 3769, 'loss/train': 2.3453054428100586} -11/06/2021 21:47:32 - INFO - __main__ - Step 3771: {'lr': 0.0004998235662069372, 'samples': 724032, 'steps': 3770, 'loss/train': 1.7649283409118652} -11/06/2021 21:47:33 - INFO - __main__ - Step 3772: {'lr': 0.0004998233668138883, 'samples': 724224, 'steps': 3771, 'loss/train': 1.8481817245483398} -11/06/2021 21:47:34 - INFO - __main__ - Step 3773: {'lr': 0.0004998231673082729, 'samples': 724416, 'steps': 3772, 'loss/train': 2.0594215393066406} -11/06/2021 21:47:34 - INFO - __main__ - Step 3774: {'lr': 0.000499822967690091, 'samples': 724608, 'steps': 3773, 'loss/train': 2.3945000171661377} -11/06/2021 21:47:35 - INFO - __main__ - Step 3775: {'lr': 0.0004998227679593426, 'samples': 724800, 'steps': 3774, 'loss/train': 1.9772299528121948} -11/06/2021 21:47:35 - INFO - __main__ - Step 3776: {'lr': 0.0004998225681160281, 'samples': 724992, 'steps': 3775, 'loss/train': 1.82159423828125} -11/06/2021 21:47:35 - INFO - __main__ - Step 3777: {'lr': 0.0004998223681601474, 'samples': 725184, 'steps': 3776, 'loss/train': 2.3857104778289795} -11/06/2021 21:47:36 - INFO - __main__ - Step 3778: {'lr': 0.0004998221680917004, 'samples': 725376, 'steps': 3777, 'loss/train': 2.202800989151001} -11/06/2021 21:47:37 - INFO - __main__ - Step 3779: {'lr': 0.0004998219679106876, 'samples': 725568, 'steps': 3778, 'loss/train': 2.383378028869629} -11/06/2021 21:47:37 - INFO - __main__ - Step 3780: {'lr': 0.0004998217676171088, 'samples': 725760, 'steps': 3779, 'loss/train': 2.38877010345459} -11/06/2021 21:47:37 - INFO - __main__ - Step 3781: {'lr': 0.0004998215672109641, 'samples': 725952, 'steps': 3780, 'loss/train': 2.0370190143585205} -11/06/2021 21:47:38 - INFO - __main__ - Step 3782: {'lr': 0.0004998213666922537, 'samples': 726144, 'steps': 3781, 'loss/train': 1.9329248666763306} -11/06/2021 21:47:39 - INFO - __main__ - Step 3783: {'lr': 0.0004998211660609777, 'samples': 726336, 'steps': 3782, 'loss/train': 3.1192450523376465} -11/06/2021 21:47:39 - INFO - __main__ - Step 3784: {'lr': 0.0004998209653171361, 'samples': 726528, 'steps': 3783, 'loss/train': 0.4665497839450836} -11/06/2021 21:47:39 - INFO - __main__ - Step 3785: {'lr': 0.0004998207644607291, 'samples': 726720, 'steps': 3784, 'loss/train': 2.076326370239258} -11/06/2021 21:47:40 - INFO - __main__ - Step 3786: {'lr': 0.0004998205634917566, 'samples': 726912, 'steps': 3785, 'loss/train': 2.1383769512176514} -11/06/2021 21:47:40 - INFO - __main__ - Step 3787: {'lr': 0.0004998203624102188, 'samples': 727104, 'steps': 3786, 'loss/train': 2.3829987049102783} -11/06/2021 21:47:41 - INFO - __main__ - Step 3788: {'lr': 0.0004998201612161159, 'samples': 727296, 'steps': 3787, 'loss/train': 1.7519925832748413} -11/06/2021 21:47:42 - INFO - __main__ - Step 3789: {'lr': 0.0004998199599094478, 'samples': 727488, 'steps': 3788, 'loss/train': 1.9867311716079712} -11/06/2021 21:47:42 - INFO - __main__ - Step 3790: {'lr': 0.0004998197584902147, 'samples': 727680, 'steps': 3789, 'loss/train': 1.7998645305633545} -11/06/2021 21:47:42 - INFO - __main__ - Step 3791: {'lr': 0.0004998195569584168, 'samples': 727872, 'steps': 3790, 'loss/train': 2.279456377029419} -11/06/2021 21:47:43 - INFO - __main__ - Step 3792: {'lr': 0.0004998193553140539, 'samples': 728064, 'steps': 3791, 'loss/train': 1.8781626224517822} -11/06/2021 21:47:44 - INFO - __main__ - Step 3793: {'lr': 0.0004998191535571264, 'samples': 728256, 'steps': 3792, 'loss/train': 2.181241750717163} -11/06/2021 21:47:44 - INFO - __main__ - Step 3794: {'lr': 0.0004998189516876342, 'samples': 728448, 'steps': 3793, 'loss/train': 2.345247983932495} -11/06/2021 21:47:44 - INFO - __main__ - Step 3795: {'lr': 0.0004998187497055773, 'samples': 728640, 'steps': 3794, 'loss/train': 0.6545143723487854} -11/06/2021 21:47:45 - INFO - __main__ - Step 3796: {'lr': 0.000499818547610956, 'samples': 728832, 'steps': 3795, 'loss/train': 1.8099079132080078} -11/06/2021 21:47:45 - INFO - __main__ - Step 3797: {'lr': 0.0004998183454037703, 'samples': 729024, 'steps': 3796, 'loss/train': 1.515761137008667} -11/06/2021 21:47:45 - INFO - __main__ - Step 3798: {'lr': 0.0004998181430840204, 'samples': 729216, 'steps': 3797, 'loss/train': 1.9123553037643433} -11/06/2021 21:47:46 - INFO - __main__ - Step 3799: {'lr': 0.0004998179406517063, 'samples': 729408, 'steps': 3798, 'loss/train': 1.983812689781189} -11/06/2021 21:47:47 - INFO - __main__ - Step 3800: {'lr': 0.000499817738106828, 'samples': 729600, 'steps': 3799, 'loss/train': 5.782630920410156} -11/06/2021 21:47:47 - INFO - __main__ - Step 3801: {'lr': 0.0004998175354493857, 'samples': 729792, 'steps': 3800, 'loss/train': 1.7894034385681152} -11/06/2021 21:47:47 - INFO - __main__ - Step 3802: {'lr': 0.0004998173326793795, 'samples': 729984, 'steps': 3801, 'loss/train': 1.8084430694580078} -11/06/2021 21:47:48 - INFO - __main__ - Step 3803: {'lr': 0.0004998171297968095, 'samples': 730176, 'steps': 3802, 'loss/train': 2.3628175258636475} -11/06/2021 21:47:49 - INFO - __main__ - Step 3804: {'lr': 0.0004998169268016757, 'samples': 730368, 'steps': 3803, 'loss/train': 2.064181089401245} -11/06/2021 21:47:49 - INFO - __main__ - Step 3805: {'lr': 0.0004998167236939783, 'samples': 730560, 'steps': 3804, 'loss/train': 2.378023147583008} -11/06/2021 21:47:50 - INFO - __main__ - Step 3806: {'lr': 0.0004998165204737173, 'samples': 730752, 'steps': 3805, 'loss/train': 1.9755092859268188} -11/06/2021 21:47:50 - INFO - __main__ - Step 3807: {'lr': 0.0004998163171408928, 'samples': 730944, 'steps': 3806, 'loss/train': 2.0892038345336914} -11/06/2021 21:47:50 - INFO - __main__ - Step 3808: {'lr': 0.000499816113695505, 'samples': 731136, 'steps': 3807, 'loss/train': 2.038058042526245} -11/06/2021 21:47:52 - INFO - __main__ - Step 3809: {'lr': 0.0004998159101375538, 'samples': 731328, 'steps': 3808, 'loss/train': 2.4071855545043945} -11/06/2021 21:47:52 - INFO - __main__ - Step 3810: {'lr': 0.0004998157064670395, 'samples': 731520, 'steps': 3809, 'loss/train': 1.957269549369812} -11/06/2021 21:47:52 - INFO - __main__ - Step 3811: {'lr': 0.0004998155026839621, 'samples': 731712, 'steps': 3810, 'loss/train': 1.6153275966644287} -11/06/2021 21:47:53 - INFO - __main__ - Step 3812: {'lr': 0.0004998152987883217, 'samples': 731904, 'steps': 3811, 'loss/train': 1.7951699495315552} -11/06/2021 21:47:53 - INFO - __main__ - Step 3813: {'lr': 0.0004998150947801182, 'samples': 732096, 'steps': 3812, 'loss/train': 1.9503369331359863} -11/06/2021 21:47:54 - INFO - __main__ - Step 3814: {'lr': 0.000499814890659352, 'samples': 732288, 'steps': 3813, 'loss/train': 1.8731478452682495} -11/06/2021 21:47:55 - INFO - __main__ - Step 3815: {'lr': 0.0004998146864260231, 'samples': 732480, 'steps': 3814, 'loss/train': 2.178349733352661} -11/06/2021 21:47:55 - INFO - __main__ - Step 3816: {'lr': 0.0004998144820801316, 'samples': 732672, 'steps': 3815, 'loss/train': 2.257465124130249} -11/06/2021 21:47:55 - INFO - __main__ - Step 3817: {'lr': 0.0004998142776216775, 'samples': 732864, 'steps': 3816, 'loss/train': 2.292968988418579} -11/06/2021 21:47:56 - INFO - __main__ - Step 3818: {'lr': 0.0004998140730506609, 'samples': 733056, 'steps': 3817, 'loss/train': 1.7161427736282349} -11/06/2021 21:47:56 - INFO - __main__ - Step 3819: {'lr': 0.000499813868367082, 'samples': 733248, 'steps': 3818, 'loss/train': 1.899258017539978} -11/06/2021 21:47:57 - INFO - __main__ - Step 3820: {'lr': 0.0004998136635709408, 'samples': 733440, 'steps': 3819, 'loss/train': 2.3737716674804688} -11/06/2021 21:47:57 - INFO - __main__ - Step 3821: {'lr': 0.0004998134586622374, 'samples': 733632, 'steps': 3820, 'loss/train': 2.9889981746673584} -11/06/2021 21:47:58 - INFO - __main__ - Step 3822: {'lr': 0.0004998132536409718, 'samples': 733824, 'steps': 3821, 'loss/train': 1.6760238409042358} -11/06/2021 21:47:58 - INFO - __main__ - Step 3823: {'lr': 0.0004998130485071444, 'samples': 734016, 'steps': 3822, 'loss/train': 2.2223479747772217} -11/06/2021 21:47:58 - INFO - __main__ - Step 3824: {'lr': 0.000499812843260755, 'samples': 734208, 'steps': 3823, 'loss/train': 2.103163480758667} -11/06/2021 21:47:59 - INFO - __main__ - Step 3825: {'lr': 0.0004998126379018038, 'samples': 734400, 'steps': 3824, 'loss/train': 1.4351319074630737} -11/06/2021 21:48:00 - INFO - __main__ - Step 3826: {'lr': 0.000499812432430291, 'samples': 734592, 'steps': 3825, 'loss/train': 2.600419282913208} -11/06/2021 21:48:00 - INFO - __main__ - Step 3827: {'lr': 0.0004998122268462164, 'samples': 734784, 'steps': 3826, 'loss/train': 1.890721082687378} -11/06/2021 21:48:00 - INFO - __main__ - Step 3828: {'lr': 0.0004998120211495803, 'samples': 734976, 'steps': 3827, 'loss/train': 1.8643083572387695} -11/06/2021 21:48:01 - INFO - __main__ - Step 3829: {'lr': 0.0004998118153403827, 'samples': 735168, 'steps': 3828, 'loss/train': 2.375256299972534} -11/06/2021 21:48:02 - INFO - __main__ - Step 3830: {'lr': 0.0004998116094186239, 'samples': 735360, 'steps': 3829, 'loss/train': 1.937308430671692} -11/06/2021 21:48:02 - INFO - __main__ - Step 3831: {'lr': 0.0004998114033843038, 'samples': 735552, 'steps': 3830, 'loss/train': 2.2312798500061035} -11/06/2021 21:48:03 - INFO - __main__ - Step 3832: {'lr': 0.0004998111972374225, 'samples': 735744, 'steps': 3831, 'loss/train': 2.345470905303955} -11/06/2021 21:48:03 - INFO - __main__ - Step 3833: {'lr': 0.0004998109909779801, 'samples': 735936, 'steps': 3832, 'loss/train': 2.126286745071411} -11/06/2021 21:48:03 - INFO - __main__ - Step 3834: {'lr': 0.0004998107846059768, 'samples': 736128, 'steps': 3833, 'loss/train': 2.274366855621338} -11/06/2021 21:48:04 - INFO - __main__ - Step 3835: {'lr': 0.0004998105781214126, 'samples': 736320, 'steps': 3834, 'loss/train': 2.0822598934173584} -11/06/2021 21:48:05 - INFO - __main__ - Step 3836: {'lr': 0.0004998103715242875, 'samples': 736512, 'steps': 3835, 'loss/train': 2.376988649368286} -11/06/2021 21:48:05 - INFO - __main__ - Step 3837: {'lr': 0.0004998101648146018, 'samples': 736704, 'steps': 3836, 'loss/train': 2.1825759410858154} -11/06/2021 21:48:05 - INFO - __main__ - Step 3838: {'lr': 0.0004998099579923555, 'samples': 736896, 'steps': 3837, 'loss/train': 2.2881062030792236} -11/06/2021 21:48:06 - INFO - __main__ - Step 3839: {'lr': 0.0004998097510575487, 'samples': 737088, 'steps': 3838, 'loss/train': 2.04844069480896} -11/06/2021 21:48:06 - INFO - __main__ - Step 3840: {'lr': 0.0004998095440101815, 'samples': 737280, 'steps': 3839, 'loss/train': 2.203437089920044} -11/06/2021 21:48:07 - INFO - __main__ - Step 3841: {'lr': 0.0004998093368502539, 'samples': 737472, 'steps': 3840, 'loss/train': 2.4474103450775146} -11/06/2021 21:48:07 - INFO - __main__ - Step 3842: {'lr': 0.000499809129577766, 'samples': 737664, 'steps': 3841, 'loss/train': 1.3475080728530884} -11/06/2021 21:48:08 - INFO - __main__ - Step 3843: {'lr': 0.0004998089221927182, 'samples': 737856, 'steps': 3842, 'loss/train': 6.6313982009887695} -11/06/2021 21:48:08 - INFO - __main__ - Step 3844: {'lr': 0.0004998087146951101, 'samples': 738048, 'steps': 3843, 'loss/train': 0.9520333409309387} -11/06/2021 21:48:09 - INFO - __main__ - Step 3845: {'lr': 0.0004998085070849422, 'samples': 738240, 'steps': 3844, 'loss/train': 2.355161428451538} -11/06/2021 21:48:09 - INFO - __main__ - Step 3846: {'lr': 0.0004998082993622144, 'samples': 738432, 'steps': 3845, 'loss/train': 1.7078429460525513} -11/06/2021 21:48:10 - INFO - __main__ - Step 3847: {'lr': 0.0004998080915269268, 'samples': 738624, 'steps': 3846, 'loss/train': 1.6196483373641968} -11/06/2021 21:48:10 - INFO - __main__ - Step 3848: {'lr': 0.0004998078835790796, 'samples': 738816, 'steps': 3847, 'loss/train': 1.4258253574371338} -11/06/2021 21:48:11 - INFO - __main__ - Step 3849: {'lr': 0.0004998076755186727, 'samples': 739008, 'steps': 3848, 'loss/train': 1.7136802673339844} -11/06/2021 21:48:11 - INFO - __main__ - Step 3850: {'lr': 0.0004998074673457064, 'samples': 739200, 'steps': 3849, 'loss/train': 2.093299627304077} -11/06/2021 21:48:12 - INFO - __main__ - Step 3851: {'lr': 0.0004998072590601808, 'samples': 739392, 'steps': 3850, 'loss/train': 1.7674520015716553} -11/06/2021 21:48:12 - INFO - __main__ - Step 3852: {'lr': 0.0004998070506620957, 'samples': 739584, 'steps': 3851, 'loss/train': 2.6275033950805664} -11/06/2021 21:48:13 - INFO - __main__ - Step 3853: {'lr': 0.0004998068421514515, 'samples': 739776, 'steps': 3852, 'loss/train': 1.4663965702056885} -11/06/2021 21:48:13 - INFO - __main__ - Step 3854: {'lr': 0.0004998066335282483, 'samples': 739968, 'steps': 3853, 'loss/train': 1.9457613229751587} -11/06/2021 21:48:13 - INFO - __main__ - Step 3855: {'lr': 0.0004998064247924859, 'samples': 740160, 'steps': 3854, 'loss/train': 2.18340802192688} -11/06/2021 21:48:14 - INFO - __main__ - Step 3856: {'lr': 0.0004998062159441648, 'samples': 740352, 'steps': 3855, 'loss/train': 2.0008771419525146} -11/06/2021 21:48:15 - INFO - __main__ - Step 3857: {'lr': 0.0004998060069832846, 'samples': 740544, 'steps': 3856, 'loss/train': 1.8760361671447754} -11/06/2021 21:48:15 - INFO - __main__ - Step 3858: {'lr': 0.0004998057979098459, 'samples': 740736, 'steps': 3857, 'loss/train': 2.1014292240142822} -11/06/2021 21:48:15 - INFO - __main__ - Step 3859: {'lr': 0.0004998055887238485, 'samples': 740928, 'steps': 3858, 'loss/train': 1.7220332622528076} -11/06/2021 21:48:16 - INFO - __main__ - Step 3860: {'lr': 0.0004998053794252925, 'samples': 741120, 'steps': 3859, 'loss/train': 1.1343226432800293} -11/06/2021 21:48:16 - INFO - __main__ - Step 3861: {'lr': 0.0004998051700141781, 'samples': 741312, 'steps': 3860, 'loss/train': 1.9412497282028198} -11/06/2021 21:48:17 - INFO - __main__ - Step 3862: {'lr': 0.0004998049604905052, 'samples': 741504, 'steps': 3861, 'loss/train': 2.0013692378997803} -11/06/2021 21:48:17 - INFO - __main__ - Step 3863: {'lr': 0.0004998047508542742, 'samples': 741696, 'steps': 3862, 'loss/train': 2.296785593032837} -11/06/2021 21:48:18 - INFO - __main__ - Step 3864: {'lr': 0.000499804541105485, 'samples': 741888, 'steps': 3863, 'loss/train': 2.1500766277313232} -11/06/2021 21:48:18 - INFO - __main__ - Step 3865: {'lr': 0.0004998043312441378, 'samples': 742080, 'steps': 3864, 'loss/train': 2.002265214920044} -11/06/2021 21:48:18 - INFO - __main__ - Step 3866: {'lr': 0.0004998041212702325, 'samples': 742272, 'steps': 3865, 'loss/train': 1.9484808444976807} -11/06/2021 21:48:20 - INFO - __main__ - Step 3867: {'lr': 0.0004998039111837694, 'samples': 742464, 'steps': 3866, 'loss/train': 2.214564323425293} -11/06/2021 21:48:20 - INFO - __main__ - Step 3868: {'lr': 0.0004998037009847485, 'samples': 742656, 'steps': 3867, 'loss/train': 2.071249485015869} -11/06/2021 21:48:20 - INFO - __main__ - Step 3869: {'lr': 0.0004998034906731699, 'samples': 742848, 'steps': 3868, 'loss/train': 1.7390302419662476} -11/06/2021 21:48:21 - INFO - __main__ - Step 3870: {'lr': 0.0004998032802490337, 'samples': 743040, 'steps': 3869, 'loss/train': 1.92386794090271} -11/06/2021 21:48:21 - INFO - __main__ - Step 3871: {'lr': 0.0004998030697123399, 'samples': 743232, 'steps': 3870, 'loss/train': 2.0642926692962646} -11/06/2021 21:48:22 - INFO - __main__ - Step 3872: {'lr': 0.0004998028590630887, 'samples': 743424, 'steps': 3871, 'loss/train': 2.2832822799682617} -11/06/2021 21:48:22 - INFO - __main__ - Step 3873: {'lr': 0.0004998026483012803, 'samples': 743616, 'steps': 3872, 'loss/train': 0.3874906599521637} -11/06/2021 21:48:23 - INFO - __main__ - Step 3874: {'lr': 0.0004998024374269147, 'samples': 743808, 'steps': 3873, 'loss/train': 1.9504804611206055} -11/06/2021 21:48:23 - INFO - __main__ - Step 3875: {'lr': 0.000499802226439992, 'samples': 744000, 'steps': 3874, 'loss/train': 1.7076032161712646} -11/06/2021 21:48:23 - INFO - __main__ - Step 3876: {'lr': 0.0004998020153405121, 'samples': 744192, 'steps': 3875, 'loss/train': 2.5436949729919434} -11/06/2021 21:48:25 - INFO - __main__ - Step 3877: {'lr': 0.0004998018041284754, 'samples': 744384, 'steps': 3876, 'loss/train': 1.7179841995239258} -11/06/2021 21:48:25 - INFO - __main__ - Step 3878: {'lr': 0.0004998015928038819, 'samples': 744576, 'steps': 3877, 'loss/train': 1.9025819301605225} -11/06/2021 21:48:25 - INFO - __main__ - Step 3879: {'lr': 0.0004998013813667315, 'samples': 744768, 'steps': 3878, 'loss/train': 6.284189701080322} -11/06/2021 21:48:26 - INFO - __main__ - Step 3880: {'lr': 0.0004998011698170245, 'samples': 744960, 'steps': 3879, 'loss/train': 2.270320415496826} -11/06/2021 21:48:26 - INFO - __main__ - Step 3881: {'lr': 0.000499800958154761, 'samples': 745152, 'steps': 3880, 'loss/train': 1.9726059436798096} -11/06/2021 21:48:27 - INFO - __main__ - Step 3882: {'lr': 0.000499800746379941, 'samples': 745344, 'steps': 3881, 'loss/train': 2.072402000427246} -11/06/2021 21:48:28 - INFO - __main__ - Step 3883: {'lr': 0.0004998005344925647, 'samples': 745536, 'steps': 3882, 'loss/train': 1.0873523950576782} -11/06/2021 21:48:28 - INFO - __main__ - Step 3884: {'lr': 0.0004998003224926321, 'samples': 745728, 'steps': 3883, 'loss/train': 1.970503807067871} -11/06/2021 21:48:29 - INFO - __main__ - Step 3885: {'lr': 0.0004998001103801433, 'samples': 745920, 'steps': 3884, 'loss/train': 2.3565833568573} -11/06/2021 21:48:29 - INFO - __main__ - Step 3886: {'lr': 0.0004997998981550985, 'samples': 746112, 'steps': 3885, 'loss/train': 1.7249259948730469} -11/06/2021 21:48:29 - INFO - __main__ - Step 3887: {'lr': 0.0004997996858174976, 'samples': 746304, 'steps': 3886, 'loss/train': 2.158630132675171} -11/06/2021 21:48:30 - INFO - __main__ - Step 3888: {'lr': 0.0004997994733673409, 'samples': 746496, 'steps': 3887, 'loss/train': 2.0216381549835205} -11/06/2021 21:48:31 - INFO - __main__ - Step 3889: {'lr': 0.0004997992608046283, 'samples': 746688, 'steps': 3888, 'loss/train': 2.1885178089141846} -11/06/2021 21:48:31 - INFO - __main__ - Step 3890: {'lr': 0.0004997990481293602, 'samples': 746880, 'steps': 3889, 'loss/train': 2.567704916000366} -11/06/2021 21:48:31 - INFO - __main__ - Step 3891: {'lr': 0.0004997988353415364, 'samples': 747072, 'steps': 3890, 'loss/train': 2.117457389831543} -11/06/2021 21:48:32 - INFO - __main__ - Step 3892: {'lr': 0.0004997986224411571, 'samples': 747264, 'steps': 3891, 'loss/train': 1.900480031967163} -11/06/2021 21:48:32 - INFO - __main__ - Step 3893: {'lr': 0.0004997984094282224, 'samples': 747456, 'steps': 3892, 'loss/train': 1.8909573554992676} -11/06/2021 21:48:33 - INFO - __main__ - Step 3894: {'lr': 0.0004997981963027324, 'samples': 747648, 'steps': 3893, 'loss/train': 2.2381651401519775} -11/06/2021 21:48:33 - INFO - __main__ - Step 3895: {'lr': 0.0004997979830646871, 'samples': 747840, 'steps': 3894, 'loss/train': 1.9018830060958862} -11/06/2021 21:48:34 - INFO - __main__ - Step 3896: {'lr': 0.0004997977697140868, 'samples': 748032, 'steps': 3895, 'loss/train': 4.09332799911499} -11/06/2021 21:48:34 - INFO - __main__ - Step 3897: {'lr': 0.0004997975562509315, 'samples': 748224, 'steps': 3896, 'loss/train': 1.9882245063781738} -11/06/2021 21:48:34 - INFO - __main__ - Step 3898: {'lr': 0.0004997973426752212, 'samples': 748416, 'steps': 3897, 'loss/train': 2.2893571853637695} -11/06/2021 21:48:35 - INFO - __main__ - Step 3899: {'lr': 0.0004997971289869561, 'samples': 748608, 'steps': 3898, 'loss/train': 2.5305356979370117} -11/06/2021 21:48:36 - INFO - __main__ - Step 3900: {'lr': 0.0004997969151861362, 'samples': 748800, 'steps': 3899, 'loss/train': 1.9628640413284302} -11/06/2021 21:48:36 - INFO - __main__ - Step 3901: {'lr': 0.0004997967012727618, 'samples': 748992, 'steps': 3900, 'loss/train': 1.784785270690918} -11/06/2021 21:48:37 - INFO - __main__ - Step 3902: {'lr': 0.0004997964872468327, 'samples': 749184, 'steps': 3901, 'loss/train': 2.4843428134918213} -11/06/2021 21:48:37 - INFO - __main__ - Step 3903: {'lr': 0.0004997962731083492, 'samples': 749376, 'steps': 3902, 'loss/train': 2.3795173168182373} -11/06/2021 21:48:37 - INFO - __main__ - Step 3904: {'lr': 0.0004997960588573115, 'samples': 749568, 'steps': 3903, 'loss/train': 1.7460960149765015} -11/06/2021 21:48:38 - INFO - __main__ - Step 3905: {'lr': 0.0004997958444937193, 'samples': 749760, 'steps': 3904, 'loss/train': 2.3648343086242676} -11/06/2021 21:48:39 - INFO - __main__ - Step 3906: {'lr': 0.0004997956300175732, 'samples': 749952, 'steps': 3905, 'loss/train': 2.6430604457855225} -11/06/2021 21:48:39 - INFO - __main__ - Step 3907: {'lr': 0.000499795415428873, 'samples': 750144, 'steps': 3906, 'loss/train': 1.1248779296875} -11/06/2021 21:48:39 - INFO - __main__ - Step 3908: {'lr': 0.0004997952007276187, 'samples': 750336, 'steps': 3907, 'loss/train': 1.4855318069458008} -11/06/2021 21:48:40 - INFO - __main__ - Step 3909: {'lr': 0.0004997949859138106, 'samples': 750528, 'steps': 3908, 'loss/train': 2.541107177734375} -11/06/2021 21:48:41 - INFO - __main__ - Step 3910: {'lr': 0.0004997947709874487, 'samples': 750720, 'steps': 3909, 'loss/train': 2.4403843879699707} -11/06/2021 21:48:41 - INFO - __main__ - Step 3911: {'lr': 0.0004997945559485333, 'samples': 750912, 'steps': 3910, 'loss/train': 2.18257212638855} -11/06/2021 21:48:41 - INFO - __main__ - Step 3912: {'lr': 0.0004997943407970642, 'samples': 751104, 'steps': 3911, 'loss/train': 2.1708099842071533} -11/06/2021 21:48:42 - INFO - __main__ - Step 3913: {'lr': 0.0004997941255330416, 'samples': 751296, 'steps': 3912, 'loss/train': 1.9108836650848389} -11/06/2021 21:48:42 - INFO - __main__ - Step 3914: {'lr': 0.0004997939101564656, 'samples': 751488, 'steps': 3913, 'loss/train': 9.35435676574707} -11/06/2021 21:48:43 - INFO - __main__ - Step 3915: {'lr': 0.0004997936946673365, 'samples': 751680, 'steps': 3914, 'loss/train': 1.6310161352157593} -11/06/2021 21:48:44 - INFO - __main__ - Step 3916: {'lr': 0.000499793479065654, 'samples': 751872, 'steps': 3915, 'loss/train': 2.2418010234832764} -11/06/2021 21:48:44 - INFO - __main__ - Step 3917: {'lr': 0.0004997932633514185, 'samples': 752064, 'steps': 3916, 'loss/train': 2.000413417816162} -11/06/2021 21:48:44 - INFO - __main__ - Step 3918: {'lr': 0.00049979304752463, 'samples': 752256, 'steps': 3917, 'loss/train': 1.5085346698760986} -11/06/2021 21:48:45 - INFO - __main__ - Step 3919: {'lr': 0.0004997928315852887, 'samples': 752448, 'steps': 3918, 'loss/train': 2.0506739616394043} -11/06/2021 21:48:46 - INFO - __main__ - Step 3920: {'lr': 0.0004997926155333944, 'samples': 752640, 'steps': 3919, 'loss/train': 1.832281231880188} -11/06/2021 21:48:46 - INFO - __main__ - Step 3921: {'lr': 0.0004997923993689476, 'samples': 752832, 'steps': 3920, 'loss/train': 1.8612034320831299} -11/06/2021 21:48:46 - INFO - __main__ - Step 3922: {'lr': 0.0004997921830919481, 'samples': 753024, 'steps': 3921, 'loss/train': 0.8128635287284851} -11/06/2021 21:48:47 - INFO - __main__ - Step 3923: {'lr': 0.0004997919667023962, 'samples': 753216, 'steps': 3922, 'loss/train': 6.834549903869629} -11/06/2021 21:48:47 - INFO - __main__ - Step 3924: {'lr': 0.0004997917502002917, 'samples': 753408, 'steps': 3923, 'loss/train': 2.564049243927002} -11/06/2021 21:48:47 - INFO - __main__ - Step 3925: {'lr': 0.000499791533585635, 'samples': 753600, 'steps': 3924, 'loss/train': 1.4833868741989136} -11/06/2021 21:48:49 - INFO - __main__ - Step 3926: {'lr': 0.0004997913168584262, 'samples': 753792, 'steps': 3925, 'loss/train': 1.9561244249343872} -11/06/2021 21:48:49 - INFO - __main__ - Step 3927: {'lr': 0.0004997911000186651, 'samples': 753984, 'steps': 3926, 'loss/train': 2.2300021648406982} -11/06/2021 21:48:49 - INFO - __main__ - Step 3928: {'lr': 0.0004997908830663521, 'samples': 754176, 'steps': 3927, 'loss/train': 2.1345834732055664} -11/06/2021 21:48:50 - INFO - __main__ - Step 3929: {'lr': 0.0004997906660014871, 'samples': 754368, 'steps': 3928, 'loss/train': 1.8014755249023438} -11/06/2021 21:48:50 - INFO - __main__ - Step 3930: {'lr': 0.0004997904488240704, 'samples': 754560, 'steps': 3929, 'loss/train': 1.9056246280670166} -11/06/2021 21:48:51 - INFO - __main__ - Step 3931: {'lr': 0.0004997902315341019, 'samples': 754752, 'steps': 3930, 'loss/train': 2.0737431049346924} -11/06/2021 21:48:51 - INFO - __main__ - Step 3932: {'lr': 0.0004997900141315817, 'samples': 754944, 'steps': 3931, 'loss/train': 2.1492855548858643} -11/06/2021 21:48:52 - INFO - __main__ - Step 3933: {'lr': 0.0004997897966165101, 'samples': 755136, 'steps': 3932, 'loss/train': 1.6962233781814575} -11/06/2021 21:48:52 - INFO - __main__ - Step 3934: {'lr': 0.000499789578988887, 'samples': 755328, 'steps': 3933, 'loss/train': 2.532392740249634} -11/06/2021 21:48:52 - INFO - __main__ - Step 3935: {'lr': 0.0004997893612487126, 'samples': 755520, 'steps': 3934, 'loss/train': 2.003080368041992} -11/06/2021 21:48:53 - INFO - __main__ - Step 3936: {'lr': 0.000499789143395987, 'samples': 755712, 'steps': 3935, 'loss/train': 2.3303253650665283} -11/06/2021 21:48:54 - INFO - __main__ - Step 3937: {'lr': 0.0004997889254307103, 'samples': 755904, 'steps': 3936, 'loss/train': 2.4294395446777344} -11/06/2021 21:48:54 - INFO - __main__ - Step 3938: {'lr': 0.0004997887073528825, 'samples': 756096, 'steps': 3937, 'loss/train': 2.0944905281066895} -11/06/2021 21:48:54 - INFO - __main__ - Step 3939: {'lr': 0.0004997884891625037, 'samples': 756288, 'steps': 3938, 'loss/train': 2.200429916381836} -11/06/2021 21:48:55 - INFO - __main__ - Step 3940: {'lr': 0.0004997882708595742, 'samples': 756480, 'steps': 3939, 'loss/train': 1.588007926940918} -11/06/2021 21:48:55 - INFO - __main__ - Step 3941: {'lr': 0.0004997880524440939, 'samples': 756672, 'steps': 3940, 'loss/train': 2.470881700515747} -11/06/2021 21:48:56 - INFO - __main__ - Step 3942: {'lr': 0.0004997878339160628, 'samples': 756864, 'steps': 3941, 'loss/train': 2.125309705734253} -11/06/2021 21:48:56 - INFO - __main__ - Step 3943: {'lr': 0.0004997876152754814, 'samples': 757056, 'steps': 3942, 'loss/train': 1.4756630659103394} -11/06/2021 21:48:57 - INFO - __main__ - Step 3944: {'lr': 0.0004997873965223495, 'samples': 757248, 'steps': 3943, 'loss/train': 2.6807804107666016} -11/06/2021 21:48:57 - INFO - __main__ - Step 3945: {'lr': 0.0004997871776566672, 'samples': 757440, 'steps': 3944, 'loss/train': 2.2836551666259766} -11/06/2021 21:48:58 - INFO - __main__ - Step 3946: {'lr': 0.0004997869586784346, 'samples': 757632, 'steps': 3945, 'loss/train': 2.121295690536499} -11/06/2021 21:48:59 - INFO - __main__ - Step 3947: {'lr': 0.0004997867395876519, 'samples': 757824, 'steps': 3946, 'loss/train': 2.3428549766540527} -11/06/2021 21:48:59 - INFO - __main__ - Step 3948: {'lr': 0.0004997865203843192, 'samples': 758016, 'steps': 3947, 'loss/train': 1.777374267578125} -11/06/2021 21:48:59 - INFO - __main__ - Step 3949: {'lr': 0.0004997863010684365, 'samples': 758208, 'steps': 3948, 'loss/train': 0.35795682668685913} -11/06/2021 21:49:00 - INFO - __main__ - Step 3950: {'lr': 0.0004997860816400039, 'samples': 758400, 'steps': 3949, 'loss/train': 2.5950117111206055} -11/06/2021 21:49:00 - INFO - __main__ - Step 3951: {'lr': 0.0004997858620990217, 'samples': 758592, 'steps': 3950, 'loss/train': 1.9574391841888428} -11/06/2021 21:49:01 - INFO - __main__ - Step 3952: {'lr': 0.0004997856424454897, 'samples': 758784, 'steps': 3951, 'loss/train': 1.4650882482528687} -11/06/2021 21:49:02 - INFO - __main__ - Step 3953: {'lr': 0.0004997854226794082, 'samples': 758976, 'steps': 3952, 'loss/train': 2.324097156524658} -11/06/2021 21:49:02 - INFO - __main__ - Step 3954: {'lr': 0.0004997852028007772, 'samples': 759168, 'steps': 3953, 'loss/train': 1.7094135284423828} -11/06/2021 21:49:02 - INFO - __main__ - Step 3955: {'lr': 0.0004997849828095969, 'samples': 759360, 'steps': 3954, 'loss/train': 2.0461413860321045} -11/06/2021 21:49:03 - INFO - __main__ - Step 3956: {'lr': 0.0004997847627058673, 'samples': 759552, 'steps': 3955, 'loss/train': 1.8901828527450562} -11/06/2021 21:49:04 - INFO - __main__ - Step 3957: {'lr': 0.0004997845424895886, 'samples': 759744, 'steps': 3956, 'loss/train': 2.1595001220703125} -11/06/2021 21:49:04 - INFO - __main__ - Step 3958: {'lr': 0.0004997843221607607, 'samples': 759936, 'steps': 3957, 'loss/train': 2.0419363975524902} -11/06/2021 21:49:04 - INFO - __main__ - Step 3959: {'lr': 0.0004997841017193841, 'samples': 760128, 'steps': 3958, 'loss/train': 2.1688108444213867} -11/06/2021 21:49:05 - INFO - __main__ - Step 3960: {'lr': 0.0004997838811654584, 'samples': 760320, 'steps': 3959, 'loss/train': 2.6631009578704834} -11/06/2021 21:49:05 - INFO - __main__ - Step 3961: {'lr': 0.000499783660498984, 'samples': 760512, 'steps': 3960, 'loss/train': 2.2320704460144043} -11/06/2021 21:49:06 - INFO - __main__ - Step 3962: {'lr': 0.0004997834397199609, 'samples': 760704, 'steps': 3961, 'loss/train': 2.1878163814544678} -11/06/2021 21:49:06 - INFO - __main__ - Step 3963: {'lr': 0.0004997832188283893, 'samples': 760896, 'steps': 3962, 'loss/train': 2.8972058296203613} -11/06/2021 21:49:07 - INFO - __main__ - Step 3964: {'lr': 0.0004997829978242693, 'samples': 761088, 'steps': 3963, 'loss/train': 1.9565014839172363} -11/06/2021 21:49:07 - INFO - __main__ - Step 3965: {'lr': 0.0004997827767076008, 'samples': 761280, 'steps': 3964, 'loss/train': 1.7469931840896606} -11/06/2021 21:49:07 - INFO - __main__ - Step 3966: {'lr': 0.0004997825554783841, 'samples': 761472, 'steps': 3965, 'loss/train': 1.9404348134994507} -11/06/2021 21:49:09 - INFO - __main__ - Step 3967: {'lr': 0.0004997823341366192, 'samples': 761664, 'steps': 3966, 'loss/train': 2.1852457523345947} -11/06/2021 21:49:09 - INFO - __main__ - Step 3968: {'lr': 0.0004997821126823062, 'samples': 761856, 'steps': 3967, 'loss/train': 2.048008680343628} -11/06/2021 21:49:09 - INFO - __main__ - Step 3969: {'lr': 0.0004997818911154454, 'samples': 762048, 'steps': 3968, 'loss/train': 2.4784631729125977} -11/06/2021 21:49:10 - INFO - __main__ - Step 3970: {'lr': 0.0004997816694360367, 'samples': 762240, 'steps': 3969, 'loss/train': 2.501253128051758} -11/06/2021 21:49:10 - INFO - __main__ - Step 3971: {'lr': 0.00049978144764408, 'samples': 762432, 'steps': 3970, 'loss/train': 2.0882301330566406} -11/06/2021 21:49:10 - INFO - __main__ - Step 3972: {'lr': 0.0004997812257395758, 'samples': 762624, 'steps': 3971, 'loss/train': 0.8743030428886414} -11/06/2021 21:49:11 - INFO - __main__ - Step 3973: {'lr': 0.0004997810037225241, 'samples': 762816, 'steps': 3972, 'loss/train': 1.5809043645858765} -11/06/2021 21:49:12 - INFO - __main__ - Step 3974: {'lr': 0.0004997807815929248, 'samples': 763008, 'steps': 3973, 'loss/train': 2.1613574028015137} -11/06/2021 21:49:12 - INFO - __main__ - Step 3975: {'lr': 0.0004997805593507783, 'samples': 763200, 'steps': 3974, 'loss/train': 1.512646198272705} -11/06/2021 21:49:12 - INFO - __main__ - Step 3976: {'lr': 0.0004997803369960844, 'samples': 763392, 'steps': 3975, 'loss/train': 1.4740993976593018} -11/06/2021 21:49:13 - INFO - __main__ - Step 3977: {'lr': 0.0004997801145288433, 'samples': 763584, 'steps': 3976, 'loss/train': 1.5394988059997559} -11/06/2021 21:49:14 - INFO - __main__ - Step 3978: {'lr': 0.0004997798919490553, 'samples': 763776, 'steps': 3977, 'loss/train': 1.7356780767440796} -11/06/2021 21:49:14 - INFO - __main__ - Step 3979: {'lr': 0.0004997796692567202, 'samples': 763968, 'steps': 3978, 'loss/train': 2.2947258949279785} -11/06/2021 21:49:14 - INFO - __main__ - Step 3980: {'lr': 0.0004997794464518383, 'samples': 764160, 'steps': 3979, 'loss/train': 2.025333881378174} -11/06/2021 21:49:15 - INFO - __main__ - Step 3981: {'lr': 0.0004997792235344096, 'samples': 764352, 'steps': 3980, 'loss/train': 2.1326520442962646} -11/06/2021 21:49:15 - INFO - __main__ - Step 3982: {'lr': 0.0004997790005044343, 'samples': 764544, 'steps': 3981, 'loss/train': 1.8855067491531372} -11/06/2021 21:49:16 - INFO - __main__ - Step 3983: {'lr': 0.0004997787773619123, 'samples': 764736, 'steps': 3982, 'loss/train': 2.2183456420898438} -11/06/2021 21:49:17 - INFO - __main__ - Step 3984: {'lr': 0.0004997785541068439, 'samples': 764928, 'steps': 3983, 'loss/train': 2.175524950027466} -11/06/2021 21:49:17 - INFO - __main__ - Step 3985: {'lr': 0.0004997783307392292, 'samples': 765120, 'steps': 3984, 'loss/train': 1.8312244415283203} -11/06/2021 21:49:17 - INFO - __main__ - Step 3986: {'lr': 0.0004997781072590683, 'samples': 765312, 'steps': 3985, 'loss/train': 5.831401348114014} -11/06/2021 21:49:18 - INFO - __main__ - Step 3987: {'lr': 0.000499777883666361, 'samples': 765504, 'steps': 3986, 'loss/train': 2.1856584548950195} -11/06/2021 21:49:19 - INFO - __main__ - Step 3988: {'lr': 0.0004997776599611078, 'samples': 765696, 'steps': 3987, 'loss/train': 1.9828382730484009} -11/06/2021 21:49:19 - INFO - __main__ - Step 3989: {'lr': 0.0004997774361433086, 'samples': 765888, 'steps': 3988, 'loss/train': 2.3569905757904053} -11/06/2021 21:49:19 - INFO - __main__ - Step 3990: {'lr': 0.0004997772122129635, 'samples': 766080, 'steps': 3989, 'loss/train': 1.4840973615646362} -11/06/2021 21:49:20 - INFO - __main__ - Step 3991: {'lr': 0.0004997769881700727, 'samples': 766272, 'steps': 3990, 'loss/train': 2.4721338748931885} -11/06/2021 21:49:20 - INFO - __main__ - Step 3992: {'lr': 0.0004997767640146363, 'samples': 766464, 'steps': 3991, 'loss/train': 1.890811800956726} -11/06/2021 21:49:21 - INFO - __main__ - Step 3993: {'lr': 0.0004997765397466543, 'samples': 766656, 'steps': 3992, 'loss/train': 1.7789920568466187} -11/06/2021 21:49:22 - INFO - __main__ - Step 3994: {'lr': 0.0004997763153661269, 'samples': 766848, 'steps': 3993, 'loss/train': 0.7541496157646179} -11/06/2021 21:49:22 - INFO - __main__ - Step 3995: {'lr': 0.000499776090873054, 'samples': 767040, 'steps': 3994, 'loss/train': 1.7700446844100952} -11/06/2021 21:49:22 - INFO - __main__ - Step 3996: {'lr': 0.000499775866267436, 'samples': 767232, 'steps': 3995, 'loss/train': 2.0774638652801514} -11/06/2021 21:49:23 - INFO - __main__ - Step 3997: {'lr': 0.0004997756415492727, 'samples': 767424, 'steps': 3996, 'loss/train': 2.1475741863250732} -11/06/2021 21:49:23 - INFO - __main__ - Step 3998: {'lr': 0.0004997754167185644, 'samples': 767616, 'steps': 3997, 'loss/train': 2.2139883041381836} -11/06/2021 21:49:24 - INFO - __main__ - Step 3999: {'lr': 0.0004997751917753113, 'samples': 767808, 'steps': 3998, 'loss/train': 1.3149014711380005} -11/06/2021 21:49:24 - INFO - __main__ - Step 4000: {'lr': 0.0004997749667195132, 'samples': 768000, 'steps': 3999, 'loss/train': 2.0716893672943115} -11/06/2021 21:49:25 - INFO - __main__ - Step 4001: {'lr': 0.0004997747415511704, 'samples': 768192, 'steps': 4000, 'loss/train': 2.3865301609039307} -11/06/2021 21:49:25 - INFO - __main__ - Step 4002: {'lr': 0.000499774516270283, 'samples': 768384, 'steps': 4001, 'loss/train': 2.4549617767333984} -11/06/2021 21:49:25 - INFO - __main__ - Step 4003: {'lr': 0.0004997742908768508, 'samples': 768576, 'steps': 4002, 'loss/train': 2.512511968612671} -11/06/2021 21:49:27 - INFO - __main__ - Step 4004: {'lr': 0.0004997740653708744, 'samples': 768768, 'steps': 4003, 'loss/train': 1.9932130575180054} -11/06/2021 21:49:27 - INFO - __main__ - Step 4005: {'lr': 0.0004997738397523537, 'samples': 768960, 'steps': 4004, 'loss/train': 2.0718185901641846} -11/06/2021 21:49:27 - INFO - __main__ - Step 4006: {'lr': 0.0004997736140212887, 'samples': 769152, 'steps': 4005, 'loss/train': 2.311023712158203} -11/06/2021 21:49:28 - INFO - __main__ - Step 4007: {'lr': 0.0004997733881776796, 'samples': 769344, 'steps': 4006, 'loss/train': 2.1917130947113037} -11/06/2021 21:49:28 - INFO - __main__ - Step 4008: {'lr': 0.0004997731622215264, 'samples': 769536, 'steps': 4007, 'loss/train': 2.4064438343048096} -11/06/2021 21:49:29 - INFO - __main__ - Step 4009: {'lr': 0.0004997729361528292, 'samples': 769728, 'steps': 4008, 'loss/train': 2.3731486797332764} -11/06/2021 21:49:29 - INFO - __main__ - Step 4010: {'lr': 0.0004997727099715882, 'samples': 769920, 'steps': 4009, 'loss/train': 1.5370467901229858} -11/06/2021 21:49:30 - INFO - __main__ - Step 4011: {'lr': 0.0004997724836778036, 'samples': 770112, 'steps': 4010, 'loss/train': 1.7078628540039062} -11/06/2021 21:49:30 - INFO - __main__ - Step 4012: {'lr': 0.0004997722572714753, 'samples': 770304, 'steps': 4011, 'loss/train': 1.5252915620803833} -11/06/2021 21:49:30 - INFO - __main__ - Step 4013: {'lr': 0.0004997720307526034, 'samples': 770496, 'steps': 4012, 'loss/train': 2.1763927936553955} -11/06/2021 21:49:31 - INFO - __main__ - Step 4014: {'lr': 0.0004997718041211881, 'samples': 770688, 'steps': 4013, 'loss/train': 2.195366382598877} -11/06/2021 21:49:32 - INFO - __main__ - Step 4015: {'lr': 0.0004997715773772296, 'samples': 770880, 'steps': 4014, 'loss/train': 1.1582077741622925} -11/06/2021 21:49:32 - INFO - __main__ - Step 4016: {'lr': 0.0004997713505207278, 'samples': 771072, 'steps': 4015, 'loss/train': 1.8005876541137695} -11/06/2021 21:49:32 - INFO - __main__ - Step 4017: {'lr': 0.0004997711235516829, 'samples': 771264, 'steps': 4016, 'loss/train': 1.86122727394104} -11/06/2021 21:49:33 - INFO - __main__ - Step 4018: {'lr': 0.000499770896470095, 'samples': 771456, 'steps': 4017, 'loss/train': 1.915101170539856} -11/06/2021 21:49:34 - INFO - __main__ - Step 4019: {'lr': 0.0004997706692759642, 'samples': 771648, 'steps': 4018, 'loss/train': 2.1200358867645264} -11/06/2021 21:49:34 - INFO - __main__ - Step 4020: {'lr': 0.0004997704419692905, 'samples': 771840, 'steps': 4019, 'loss/train': 2.1703789234161377} -11/06/2021 21:49:34 - INFO - __main__ - Step 4021: {'lr': 0.0004997702145500741, 'samples': 772032, 'steps': 4020, 'loss/train': 2.4524030685424805} -11/06/2021 21:49:35 - INFO - __main__ - Step 4022: {'lr': 0.0004997699870183151, 'samples': 772224, 'steps': 4021, 'loss/train': 2.2087340354919434} -11/06/2021 21:49:35 - INFO - __main__ - Step 4023: {'lr': 0.0004997697593740137, 'samples': 772416, 'steps': 4022, 'loss/train': 1.8903212547302246} -11/06/2021 21:49:36 - INFO - __main__ - Step 4024: {'lr': 0.0004997695316171698, 'samples': 772608, 'steps': 4023, 'loss/train': 2.31099534034729} -11/06/2021 21:49:37 - INFO - __main__ - Step 4025: {'lr': 0.0004997693037477837, 'samples': 772800, 'steps': 4024, 'loss/train': 2.07493257522583} -11/06/2021 21:49:37 - INFO - __main__ - Step 4026: {'lr': 0.0004997690757658552, 'samples': 772992, 'steps': 4025, 'loss/train': 1.9826215505599976} -11/06/2021 21:49:37 - INFO - __main__ - Step 4027: {'lr': 0.0004997688476713848, 'samples': 773184, 'steps': 4026, 'loss/train': 2.102391004562378} -11/06/2021 21:49:38 - INFO - __main__ - Step 4028: {'lr': 0.0004997686194643724, 'samples': 773376, 'steps': 4027, 'loss/train': 1.9948838949203491} -11/06/2021 21:49:38 - INFO - __main__ - Step 4029: {'lr': 0.0004997683911448181, 'samples': 773568, 'steps': 4028, 'loss/train': 1.7805095911026} -11/06/2021 21:49:39 - INFO - __main__ - Step 4030: {'lr': 0.000499768162712722, 'samples': 773760, 'steps': 4029, 'loss/train': 2.1849615573883057} -11/06/2021 21:49:39 - INFO - __main__ - Step 4031: {'lr': 0.0004997679341680843, 'samples': 773952, 'steps': 4030, 'loss/train': 2.313040256500244} -11/06/2021 21:49:40 - INFO - __main__ - Step 4032: {'lr': 0.0004997677055109049, 'samples': 774144, 'steps': 4031, 'loss/train': 1.893852949142456} -11/06/2021 21:49:40 - INFO - __main__ - Step 4033: {'lr': 0.0004997674767411841, 'samples': 774336, 'steps': 4032, 'loss/train': 2.130466938018799} -11/06/2021 21:49:40 - INFO - __main__ - Step 4034: {'lr': 0.0004997672478589219, 'samples': 774528, 'steps': 4033, 'loss/train': 1.615881085395813} -11/06/2021 21:49:41 - INFO - __main__ - Step 4035: {'lr': 0.0004997670188641183, 'samples': 774720, 'steps': 4034, 'loss/train': 2.1269845962524414} -11/06/2021 21:49:42 - INFO - __main__ - Step 4036: {'lr': 0.0004997667897567738, 'samples': 774912, 'steps': 4035, 'loss/train': 2.2043027877807617} -11/06/2021 21:49:42 - INFO - __main__ - Step 4037: {'lr': 0.0004997665605368881, 'samples': 775104, 'steps': 4036, 'loss/train': 1.7043681144714355} -11/06/2021 21:49:42 - INFO - __main__ - Step 4038: {'lr': 0.0004997663312044614, 'samples': 775296, 'steps': 4037, 'loss/train': 1.8073010444641113} -11/06/2021 21:49:43 - INFO - __main__ - Step 4039: {'lr': 0.0004997661017594939, 'samples': 775488, 'steps': 4038, 'loss/train': 2.2743730545043945} -11/06/2021 21:49:44 - INFO - __main__ - Step 4040: {'lr': 0.0004997658722019857, 'samples': 775680, 'steps': 4039, 'loss/train': 1.5168383121490479} -11/06/2021 21:49:44 - INFO - __main__ - Step 4041: {'lr': 0.0004997656425319367, 'samples': 775872, 'steps': 4040, 'loss/train': 2.3586344718933105} -11/06/2021 21:49:44 - INFO - __main__ - Step 4042: {'lr': 0.0004997654127493473, 'samples': 776064, 'steps': 4041, 'loss/train': 2.290358066558838} -11/06/2021 21:49:45 - INFO - __main__ - Step 4043: {'lr': 0.0004997651828542173, 'samples': 776256, 'steps': 4042, 'loss/train': 2.349440336227417} -11/06/2021 21:49:45 - INFO - __main__ - Step 4044: {'lr': 0.0004997649528465471, 'samples': 776448, 'steps': 4043, 'loss/train': 2.3541646003723145} -11/06/2021 21:49:46 - INFO - __main__ - Step 4045: {'lr': 0.0004997647227263367, 'samples': 776640, 'steps': 4044, 'loss/train': 2.01802396774292} -11/06/2021 21:49:47 - INFO - __main__ - Step 4046: {'lr': 0.000499764492493586, 'samples': 776832, 'steps': 4045, 'loss/train': 1.9747871160507202} -11/06/2021 21:49:47 - INFO - __main__ - Step 4047: {'lr': 0.0004997642621482955, 'samples': 777024, 'steps': 4046, 'loss/train': 3.536803960800171} -11/06/2021 21:49:47 - INFO - __main__ - Step 4048: {'lr': 0.0004997640316904649, 'samples': 777216, 'steps': 4047, 'loss/train': 2.313307523727417} -11/06/2021 21:49:48 - INFO - __main__ - Step 4049: {'lr': 0.0004997638011200946, 'samples': 777408, 'steps': 4048, 'loss/train': 1.8340681791305542} -11/06/2021 21:49:49 - INFO - __main__ - Step 4050: {'lr': 0.0004997635704371844, 'samples': 777600, 'steps': 4049, 'loss/train': 2.015902519226074} -11/06/2021 21:49:49 - INFO - __main__ - Step 4051: {'lr': 0.0004997633396417348, 'samples': 777792, 'steps': 4050, 'loss/train': 2.1511425971984863} -11/06/2021 21:49:49 - INFO - __main__ - Step 4052: {'lr': 0.0004997631087337456, 'samples': 777984, 'steps': 4051, 'loss/train': 1.9303054809570312} -11/06/2021 21:49:50 - INFO - __main__ - Step 4053: {'lr': 0.000499762877713217, 'samples': 778176, 'steps': 4052, 'loss/train': 2.202286720275879} -11/06/2021 21:49:50 - INFO - __main__ - Step 4054: {'lr': 0.0004997626465801492, 'samples': 778368, 'steps': 4053, 'loss/train': 2.0874695777893066} -11/06/2021 21:49:51 - INFO - __main__ - Step 4055: {'lr': 0.000499762415334542, 'samples': 778560, 'steps': 4054, 'loss/train': 1.871009111404419} -11/06/2021 21:49:51 - INFO - __main__ - Step 4056: {'lr': 0.0004997621839763958, 'samples': 778752, 'steps': 4055, 'loss/train': 1.8566710948944092} -11/06/2021 21:49:52 - INFO - __main__ - Step 4057: {'lr': 0.0004997619525057106, 'samples': 778944, 'steps': 4056, 'loss/train': 1.2701704502105713} -11/06/2021 21:49:52 - INFO - __main__ - Step 4058: {'lr': 0.0004997617209224866, 'samples': 779136, 'steps': 4057, 'loss/train': 2.2687175273895264} -11/06/2021 21:49:52 - INFO - __main__ - Step 4059: {'lr': 0.0004997614892267238, 'samples': 779328, 'steps': 4058, 'loss/train': 1.7731740474700928} -11/06/2021 21:49:53 - INFO - __main__ - Step 4060: {'lr': 0.0004997612574184223, 'samples': 779520, 'steps': 4059, 'loss/train': 2.616718292236328} -11/06/2021 21:49:54 - INFO - __main__ - Step 4061: {'lr': 0.0004997610254975823, 'samples': 779712, 'steps': 4060, 'loss/train': 1.441390872001648} -11/06/2021 21:49:54 - INFO - __main__ - Step 4062: {'lr': 0.0004997607934642038, 'samples': 779904, 'steps': 4061, 'loss/train': 2.379161834716797} -11/06/2021 21:49:55 - INFO - __main__ - Step 4063: {'lr': 0.0004997605613182868, 'samples': 780096, 'steps': 4062, 'loss/train': 2.2010395526885986} -11/06/2021 21:49:55 - INFO - __main__ - Step 4064: {'lr': 0.0004997603290598317, 'samples': 780288, 'steps': 4063, 'loss/train': 1.8180835247039795} -11/06/2021 21:49:55 - INFO - __main__ - Step 4065: {'lr': 0.0004997600966888384, 'samples': 780480, 'steps': 4064, 'loss/train': 1.5754492282867432} -11/06/2021 21:49:56 - INFO - __main__ - Step 4066: {'lr': 0.000499759864205307, 'samples': 780672, 'steps': 4065, 'loss/train': 1.9471435546875} -11/06/2021 21:49:57 - INFO - __main__ - Step 4067: {'lr': 0.0004997596316092378, 'samples': 780864, 'steps': 4066, 'loss/train': 0.3540392220020294} -11/06/2021 21:49:57 - INFO - __main__ - Step 4068: {'lr': 0.0004997593989006306, 'samples': 781056, 'steps': 4067, 'loss/train': 1.7563910484313965} -11/06/2021 21:49:58 - INFO - __main__ - Step 4069: {'lr': 0.0004997591660794858, 'samples': 781248, 'steps': 4068, 'loss/train': 2.3376967906951904} -11/06/2021 21:49:58 - INFO - __main__ - Step 4070: {'lr': 0.0004997589331458034, 'samples': 781440, 'steps': 4069, 'loss/train': 2.6819803714752197} -11/06/2021 21:49:59 - INFO - __main__ - Step 4071: {'lr': 0.0004997587000995833, 'samples': 781632, 'steps': 4070, 'loss/train': 2.0289735794067383} -11/06/2021 21:49:59 - INFO - __main__ - Step 4072: {'lr': 0.000499758466940826, 'samples': 781824, 'steps': 4071, 'loss/train': 1.8696802854537964} -11/06/2021 21:50:00 - INFO - __main__ - Step 4073: {'lr': 0.0004997582336695312, 'samples': 782016, 'steps': 4072, 'loss/train': 2.1343019008636475} -11/06/2021 21:50:00 - INFO - __main__ - Step 4074: {'lr': 0.0004997580002856993, 'samples': 782208, 'steps': 4073, 'loss/train': 2.6347973346710205} -11/06/2021 21:50:00 - INFO - __main__ - Step 4075: {'lr': 0.0004997577667893303, 'samples': 782400, 'steps': 4074, 'loss/train': 2.238234519958496} -11/06/2021 21:50:01 - INFO - __main__ - Step 4076: {'lr': 0.0004997575331804243, 'samples': 782592, 'steps': 4075, 'loss/train': 1.6434662342071533} -11/06/2021 21:50:02 - INFO - __main__ - Step 4077: {'lr': 0.0004997572994589812, 'samples': 782784, 'steps': 4076, 'loss/train': 2.2874550819396973} -11/06/2021 21:50:02 - INFO - __main__ - Step 4078: {'lr': 0.0004997570656250016, 'samples': 782976, 'steps': 4077, 'loss/train': 2.18599009513855} -11/06/2021 21:50:02 - INFO - __main__ - Step 4079: {'lr': 0.0004997568316784852, 'samples': 783168, 'steps': 4078, 'loss/train': 2.6030142307281494} -11/06/2021 21:50:03 - INFO - __main__ - Step 4080: {'lr': 0.0004997565976194323, 'samples': 783360, 'steps': 4079, 'loss/train': 2.873201608657837} -11/06/2021 21:50:03 - INFO - __main__ - Step 4081: {'lr': 0.0004997563634478429, 'samples': 783552, 'steps': 4080, 'loss/train': 1.6083195209503174} -11/06/2021 21:50:04 - INFO - __main__ - Step 4082: {'lr': 0.000499756129163717, 'samples': 783744, 'steps': 4081, 'loss/train': 2.6470818519592285} -11/06/2021 21:50:05 - INFO - __main__ - Step 4083: {'lr': 0.000499755894767055, 'samples': 783936, 'steps': 4082, 'loss/train': 2.0863211154937744} -11/06/2021 21:50:05 - INFO - __main__ - Step 4084: {'lr': 0.0004997556602578568, 'samples': 784128, 'steps': 4083, 'loss/train': 2.274592161178589} -11/06/2021 21:50:05 - INFO - __main__ - Step 4085: {'lr': 0.0004997554256361225, 'samples': 784320, 'steps': 4084, 'loss/train': 1.7604327201843262} -11/06/2021 21:50:06 - INFO - __main__ - Step 4086: {'lr': 0.0004997551909018524, 'samples': 784512, 'steps': 4085, 'loss/train': 1.6476736068725586} -11/06/2021 21:50:07 - INFO - __main__ - Step 4087: {'lr': 0.0004997549560550464, 'samples': 784704, 'steps': 4086, 'loss/train': 2.3296737670898438} -11/06/2021 21:50:07 - INFO - __main__ - Step 4088: {'lr': 0.0004997547210957047, 'samples': 784896, 'steps': 4087, 'loss/train': 1.9330281019210815} -11/06/2021 21:50:07 - INFO - __main__ - Step 4089: {'lr': 0.0004997544860238272, 'samples': 785088, 'steps': 4088, 'loss/train': 2.002901315689087} -11/06/2021 21:50:08 - INFO - __main__ - Step 4090: {'lr': 0.0004997542508394144, 'samples': 785280, 'steps': 4089, 'loss/train': 2.227198362350464} -11/06/2021 21:50:08 - INFO - __main__ - Step 4091: {'lr': 0.000499754015542466, 'samples': 785472, 'steps': 4090, 'loss/train': 2.175802707672119} -11/06/2021 21:50:09 - INFO - __main__ - Step 4092: {'lr': 0.0004997537801329824, 'samples': 785664, 'steps': 4091, 'loss/train': 1.697835087776184} -11/06/2021 21:50:10 - INFO - __main__ - Step 4093: {'lr': 0.0004997535446109637, 'samples': 785856, 'steps': 4092, 'loss/train': 1.8053069114685059} -11/06/2021 21:50:10 - INFO - __main__ - Step 4094: {'lr': 0.0004997533089764097, 'samples': 786048, 'steps': 4093, 'loss/train': 1.4036602973937988} -11/06/2021 21:50:10 - INFO - __main__ - Step 4095: {'lr': 0.0004997530732293209, 'samples': 786240, 'steps': 4094, 'loss/train': 1.8951164484024048} -11/06/2021 21:50:11 - INFO - __main__ - Step 4096: {'lr': 0.000499752837369697, 'samples': 786432, 'steps': 4095, 'loss/train': 2.195209264755249} -11/06/2021 21:50:12 - INFO - __main__ - Step 4097: {'lr': 0.0004997526013975385, 'samples': 786624, 'steps': 4096, 'loss/train': 1.7116293907165527} -11/06/2021 21:50:12 - INFO - __main__ - Step 4098: {'lr': 0.0004997523653128453, 'samples': 786816, 'steps': 4097, 'loss/train': 1.4756605625152588} -11/06/2021 21:50:12 - INFO - __main__ - Step 4099: {'lr': 0.0004997521291156175, 'samples': 787008, 'steps': 4098, 'loss/train': 2.56708025932312} -11/06/2021 21:50:13 - INFO - __main__ - Step 4100: {'lr': 0.0004997518928058553, 'samples': 787200, 'steps': 4099, 'loss/train': 1.9039506912231445} -11/06/2021 21:50:13 - INFO - __main__ - Step 4101: {'lr': 0.0004997516563835587, 'samples': 787392, 'steps': 4100, 'loss/train': 2.242305040359497} -11/06/2021 21:50:14 - INFO - __main__ - Step 4102: {'lr': 0.0004997514198487279, 'samples': 787584, 'steps': 4101, 'loss/train': 1.7869306802749634} -11/06/2021 21:50:15 - INFO - __main__ - Step 4103: {'lr': 0.0004997511832013629, 'samples': 787776, 'steps': 4102, 'loss/train': 1.4681452512741089} -11/06/2021 21:50:15 - INFO - __main__ - Step 4104: {'lr': 0.0004997509464414639, 'samples': 787968, 'steps': 4103, 'loss/train': 1.8288829326629639} -11/06/2021 21:50:15 - INFO - __main__ - Step 4105: {'lr': 0.000499750709569031, 'samples': 788160, 'steps': 4104, 'loss/train': 2.145322322845459} -11/06/2021 21:50:16 - INFO - __main__ - Step 4106: {'lr': 0.0004997504725840644, 'samples': 788352, 'steps': 4105, 'loss/train': 1.8525432348251343} -11/06/2021 21:50:17 - INFO - __main__ - Step 4107: {'lr': 0.0004997502354865639, 'samples': 788544, 'steps': 4106, 'loss/train': 2.4128339290618896} -11/06/2021 21:50:17 - INFO - __main__ - Step 4108: {'lr': 0.0004997499982765299, 'samples': 788736, 'steps': 4107, 'loss/train': 2.3028995990753174} -11/06/2021 21:50:17 - INFO - __main__ - Step 4109: {'lr': 0.0004997497609539623, 'samples': 788928, 'steps': 4108, 'loss/train': 1.7529590129852295} -11/06/2021 21:50:18 - INFO - __main__ - Step 4110: {'lr': 0.0004997495235188614, 'samples': 789120, 'steps': 4109, 'loss/train': 2.2879607677459717} -11/06/2021 21:50:18 - INFO - __main__ - Step 4111: {'lr': 0.0004997492859712272, 'samples': 789312, 'steps': 4110, 'loss/train': 2.290275812149048} -11/06/2021 21:50:19 - INFO - __main__ - Step 4112: {'lr': 0.0004997490483110599, 'samples': 789504, 'steps': 4111, 'loss/train': 2.2251839637756348} -11/06/2021 21:50:19 - INFO - __main__ - Step 4113: {'lr': 0.0004997488105383594, 'samples': 789696, 'steps': 4112, 'loss/train': 1.8223003149032593} -11/06/2021 21:50:20 - INFO - __main__ - Step 4114: {'lr': 0.000499748572653126, 'samples': 789888, 'steps': 4113, 'loss/train': 2.5275418758392334} -11/06/2021 21:50:20 - INFO - __main__ - Step 4115: {'lr': 0.0004997483346553597, 'samples': 790080, 'steps': 4114, 'loss/train': 2.204193592071533} -11/06/2021 21:50:21 - INFO - __main__ - Step 4116: {'lr': 0.0004997480965450607, 'samples': 790272, 'steps': 4115, 'loss/train': 2.2369582653045654} -11/06/2021 21:50:21 - INFO - __main__ - Step 4117: {'lr': 0.0004997478583222291, 'samples': 790464, 'steps': 4116, 'loss/train': 1.5711380243301392} -11/06/2021 21:50:22 - INFO - __main__ - Step 4118: {'lr': 0.0004997476199868649, 'samples': 790656, 'steps': 4117, 'loss/train': 2.431384563446045} -11/06/2021 21:50:22 - INFO - __main__ - Step 4119: {'lr': 0.0004997473815389683, 'samples': 790848, 'steps': 4118, 'loss/train': 2.284108877182007} -11/06/2021 21:50:23 - INFO - __main__ - Step 4120: {'lr': 0.0004997471429785394, 'samples': 791040, 'steps': 4119, 'loss/train': 2.340329170227051} -11/06/2021 21:50:23 - INFO - __main__ - Step 4121: {'lr': 0.0004997469043055784, 'samples': 791232, 'steps': 4120, 'loss/train': 1.350162386894226} -11/06/2021 21:50:24 - INFO - __main__ - Step 4122: {'lr': 0.000499746665520085, 'samples': 791424, 'steps': 4121, 'loss/train': 2.2945504188537598} -11/06/2021 21:50:24 - INFO - __main__ - Step 4123: {'lr': 0.0004997464266220599, 'samples': 791616, 'steps': 4122, 'loss/train': 1.9403982162475586} -11/06/2021 21:50:25 - INFO - __main__ - Step 4124: {'lr': 0.0004997461876115029, 'samples': 791808, 'steps': 4123, 'loss/train': 1.7669719457626343} -11/06/2021 21:50:25 - INFO - __main__ - Step 4125: {'lr': 0.0004997459484884139, 'samples': 792000, 'steps': 4124, 'loss/train': 2.5181665420532227} -11/06/2021 21:50:25 - INFO - __main__ - Step 4126: {'lr': 0.0004997457092527934, 'samples': 792192, 'steps': 4125, 'loss/train': 1.4069466590881348} -11/06/2021 21:50:26 - INFO - __main__ - Step 4127: {'lr': 0.0004997454699046412, 'samples': 792384, 'steps': 4126, 'loss/train': 1.1352291107177734} -11/06/2021 21:50:27 - INFO - __main__ - Step 4128: {'lr': 0.0004997452304439577, 'samples': 792576, 'steps': 4127, 'loss/train': 2.2297260761260986} -11/06/2021 21:50:27 - INFO - __main__ - Step 4129: {'lr': 0.0004997449908707428, 'samples': 792768, 'steps': 4128, 'loss/train': 1.6142773628234863} -11/06/2021 21:50:27 - INFO - __main__ - Step 4130: {'lr': 0.0004997447511849966, 'samples': 792960, 'steps': 4129, 'loss/train': 0.43251675367355347} -11/06/2021 21:50:28 - INFO - __main__ - Step 4131: {'lr': 0.0004997445113867193, 'samples': 793152, 'steps': 4130, 'loss/train': 2.1551005840301514} -11/06/2021 21:50:28 - INFO - __main__ - Step 4132: {'lr': 0.000499744271475911, 'samples': 793344, 'steps': 4131, 'loss/train': 1.9457584619522095} -11/06/2021 21:50:29 - INFO - __main__ - Step 4133: {'lr': 0.0004997440314525718, 'samples': 793536, 'steps': 4132, 'loss/train': 1.7447444200515747} -11/06/2021 21:50:29 - INFO - __main__ - Step 4134: {'lr': 0.0004997437913167018, 'samples': 793728, 'steps': 4133, 'loss/train': 2.1197428703308105} -11/06/2021 21:50:30 - INFO - __main__ - Step 4135: {'lr': 0.0004997435510683011, 'samples': 793920, 'steps': 4134, 'loss/train': 1.950053095817566} -11/06/2021 21:50:30 - INFO - __main__ - Step 4136: {'lr': 0.0004997433107073697, 'samples': 794112, 'steps': 4135, 'loss/train': 2.236959457397461} -11/06/2021 21:50:30 - INFO - __main__ - Step 4137: {'lr': 0.000499743070233908, 'samples': 794304, 'steps': 4136, 'loss/train': 2.2369892597198486} -11/06/2021 21:50:31 - INFO - __main__ - Step 4138: {'lr': 0.0004997428296479158, 'samples': 794496, 'steps': 4137, 'loss/train': 1.6959571838378906} -11/06/2021 21:50:32 - INFO - __main__ - Step 4139: {'lr': 0.0004997425889493933, 'samples': 794688, 'steps': 4138, 'loss/train': 2.1793487071990967} -11/06/2021 21:50:32 - INFO - __main__ - Step 4140: {'lr': 0.0004997423481383407, 'samples': 794880, 'steps': 4139, 'loss/train': 1.875229001045227} -11/06/2021 21:50:33 - INFO - __main__ - Step 4141: {'lr': 0.0004997421072147581, 'samples': 795072, 'steps': 4140, 'loss/train': 2.0105512142181396} -11/06/2021 21:50:33 - INFO - __main__ - Step 4142: {'lr': 0.0004997418661786455, 'samples': 795264, 'steps': 4141, 'loss/train': 2.1727404594421387} -11/06/2021 21:50:34 - INFO - __main__ - Step 4143: {'lr': 0.0004997416250300031, 'samples': 795456, 'steps': 4142, 'loss/train': 2.191661834716797} -11/06/2021 21:50:34 - INFO - __main__ - Step 4144: {'lr': 0.0004997413837688309, 'samples': 795648, 'steps': 4143, 'loss/train': 1.4901235103607178} -11/06/2021 21:50:35 - INFO - __main__ - Step 4145: {'lr': 0.0004997411423951292, 'samples': 795840, 'steps': 4144, 'loss/train': 2.327420234680176} -11/06/2021 21:50:35 - INFO - __main__ - Step 4146: {'lr': 0.0004997409009088979, 'samples': 796032, 'steps': 4145, 'loss/train': 2.225456476211548} -11/06/2021 21:50:35 - INFO - __main__ - Step 4147: {'lr': 0.0004997406593101373, 'samples': 796224, 'steps': 4146, 'loss/train': 1.6128720045089722} -11/06/2021 21:50:36 - INFO - __main__ - Step 4148: {'lr': 0.0004997404175988474, 'samples': 796416, 'steps': 4147, 'loss/train': 1.3797961473464966} -11/06/2021 21:50:37 - INFO - __main__ - Step 4149: {'lr': 0.0004997401757750282, 'samples': 796608, 'steps': 4148, 'loss/train': 2.3454394340515137} -11/06/2021 21:50:37 - INFO - __main__ - Step 4150: {'lr': 0.00049973993383868, 'samples': 796800, 'steps': 4149, 'loss/train': 1.4798073768615723} -11/06/2021 21:50:37 - INFO - __main__ - Step 4151: {'lr': 0.0004997396917898029, 'samples': 796992, 'steps': 4150, 'loss/train': 1.8693385124206543} -11/06/2021 21:50:38 - INFO - __main__ - Step 4152: {'lr': 0.0004997394496283969, 'samples': 797184, 'steps': 4151, 'loss/train': 1.895919919013977} -11/06/2021 21:50:39 - INFO - __main__ - Step 4153: {'lr': 0.0004997392073544622, 'samples': 797376, 'steps': 4152, 'loss/train': 2.0135254859924316} -11/06/2021 21:50:39 - INFO - __main__ - Step 4154: {'lr': 0.0004997389649679987, 'samples': 797568, 'steps': 4153, 'loss/train': 1.9823795557022095} -11/06/2021 21:50:39 - INFO - __main__ - Step 4155: {'lr': 0.0004997387224690068, 'samples': 797760, 'steps': 4154, 'loss/train': 2.079752206802368} -11/06/2021 21:50:40 - INFO - __main__ - Step 4156: {'lr': 0.0004997384798574865, 'samples': 797952, 'steps': 4155, 'loss/train': 1.7831960916519165} -11/06/2021 21:50:40 - INFO - __main__ - Step 4157: {'lr': 0.0004997382371334379, 'samples': 798144, 'steps': 4156, 'loss/train': 1.613570213317871} -11/06/2021 21:50:41 - INFO - __main__ - Step 4158: {'lr': 0.0004997379942968611, 'samples': 798336, 'steps': 4157, 'loss/train': 2.2602744102478027} -11/06/2021 21:50:41 - INFO - __main__ - Step 4159: {'lr': 0.0004997377513477562, 'samples': 798528, 'steps': 4158, 'loss/train': 1.372780203819275} -11/06/2021 21:50:42 - INFO - __main__ - Step 4160: {'lr': 0.0004997375082861234, 'samples': 798720, 'steps': 4159, 'loss/train': 0.5014187693595886} -11/06/2021 21:50:42 - INFO - __main__ - Step 4161: {'lr': 0.0004997372651119626, 'samples': 798912, 'steps': 4160, 'loss/train': 2.1681416034698486} -11/06/2021 21:50:42 - INFO - __main__ - Step 4162: {'lr': 0.0004997370218252741, 'samples': 799104, 'steps': 4161, 'loss/train': 1.6607433557510376} -11/06/2021 21:50:44 - INFO - __main__ - Step 4163: {'lr': 0.000499736778426058, 'samples': 799296, 'steps': 4162, 'loss/train': 1.9761664867401123} -11/06/2021 21:50:44 - INFO - __main__ - Step 4164: {'lr': 0.0004997365349143142, 'samples': 799488, 'steps': 4163, 'loss/train': 2.0288639068603516} -11/06/2021 21:50:44 - INFO - __main__ - Step 4165: {'lr': 0.0004997362912900432, 'samples': 799680, 'steps': 4164, 'loss/train': 2.2376766204833984} -11/06/2021 21:50:45 - INFO - __main__ - Step 4166: {'lr': 0.0004997360475532447, 'samples': 799872, 'steps': 4165, 'loss/train': 2.014327049255371} -11/06/2021 21:50:45 - INFO - __main__ - Step 4167: {'lr': 0.000499735803703919, 'samples': 800064, 'steps': 4166, 'loss/train': 2.371185302734375} -11/06/2021 21:50:46 - INFO - __main__ - Step 4168: {'lr': 0.0004997355597420663, 'samples': 800256, 'steps': 4167, 'loss/train': 1.7514441013336182} -11/06/2021 21:50:46 - INFO - __main__ - Step 4169: {'lr': 0.0004997353156676866, 'samples': 800448, 'steps': 4168, 'loss/train': 2.4108896255493164} -11/06/2021 21:50:47 - INFO - __main__ - Step 4170: {'lr': 0.0004997350714807799, 'samples': 800640, 'steps': 4169, 'loss/train': 1.9724844694137573} -11/06/2021 21:50:47 - INFO - __main__ - Step 4171: {'lr': 0.0004997348271813466, 'samples': 800832, 'steps': 4170, 'loss/train': 2.2488949298858643} -11/06/2021 21:50:47 - INFO - __main__ - Step 4172: {'lr': 0.0004997345827693865, 'samples': 801024, 'steps': 4171, 'loss/train': 2.0820884704589844} -11/06/2021 21:50:48 - INFO - __main__ - Step 4173: {'lr': 0.0004997343382448999, 'samples': 801216, 'steps': 4172, 'loss/train': 1.9005787372589111} -11/06/2021 21:50:49 - INFO - __main__ - Step 4174: {'lr': 0.0004997340936078869, 'samples': 801408, 'steps': 4173, 'loss/train': 2.1329050064086914} -11/06/2021 21:50:49 - INFO - __main__ - Step 4175: {'lr': 0.0004997338488583475, 'samples': 801600, 'steps': 4174, 'loss/train': 2.015869617462158} -11/06/2021 21:50:50 - INFO - __main__ - Step 4176: {'lr': 0.000499733603996282, 'samples': 801792, 'steps': 4175, 'loss/train': 1.6287065744400024} -11/06/2021 21:50:50 - INFO - __main__ - Step 4177: {'lr': 0.0004997333590216902, 'samples': 801984, 'steps': 4176, 'loss/train': 2.286756753921509} -11/06/2021 21:50:50 - INFO - __main__ - Step 4178: {'lr': 0.0004997331139345725, 'samples': 802176, 'steps': 4177, 'loss/train': 2.0928821563720703} -11/06/2021 21:50:51 - INFO - __main__ - Step 4179: {'lr': 0.000499732868734929, 'samples': 802368, 'steps': 4178, 'loss/train': 1.4197605848312378} -11/06/2021 21:50:52 - INFO - __main__ - Step 4180: {'lr': 0.0004997326234227596, 'samples': 802560, 'steps': 4179, 'loss/train': 1.9068725109100342} -11/06/2021 21:50:52 - INFO - __main__ - Step 4181: {'lr': 0.0004997323779980646, 'samples': 802752, 'steps': 4180, 'loss/train': 0.9633380174636841} -11/06/2021 21:50:52 - INFO - __main__ - Step 4182: {'lr': 0.0004997321324608441, 'samples': 802944, 'steps': 4181, 'loss/train': 2.2076642513275146} -11/06/2021 21:50:53 - INFO - __main__ - Step 4183: {'lr': 0.0004997318868110981, 'samples': 803136, 'steps': 4182, 'loss/train': 2.6250104904174805} -11/06/2021 21:50:54 - INFO - __main__ - Step 4184: {'lr': 0.0004997316410488267, 'samples': 803328, 'steps': 4183, 'loss/train': 2.3980045318603516} -11/06/2021 21:50:54 - INFO - __main__ - Step 4185: {'lr': 0.0004997313951740301, 'samples': 803520, 'steps': 4184, 'loss/train': 1.4753458499908447} -11/06/2021 21:50:54 - INFO - __main__ - Step 4186: {'lr': 0.0004997311491867083, 'samples': 803712, 'steps': 4185, 'loss/train': 1.5125452280044556} -11/06/2021 21:50:55 - INFO - __main__ - Step 4187: {'lr': 0.0004997309030868617, 'samples': 803904, 'steps': 4186, 'loss/train': 1.2969268560409546} -11/06/2021 21:50:55 - INFO - __main__ - Step 4188: {'lr': 0.0004997306568744901, 'samples': 804096, 'steps': 4187, 'loss/train': 2.0338566303253174} -11/06/2021 21:50:56 - INFO - __main__ - Step 4189: {'lr': 0.0004997304105495938, 'samples': 804288, 'steps': 4188, 'loss/train': 1.7441582679748535} -11/06/2021 21:50:57 - INFO - __main__ - Step 4190: {'lr': 0.0004997301641121727, 'samples': 804480, 'steps': 4189, 'loss/train': 2.200920581817627} -11/06/2021 21:50:57 - INFO - __main__ - Step 4191: {'lr': 0.0004997299175622271, 'samples': 804672, 'steps': 4190, 'loss/train': 2.2595231533050537} -11/06/2021 21:50:57 - INFO - __main__ - Step 4192: {'lr': 0.000499729670899757, 'samples': 804864, 'steps': 4191, 'loss/train': 2.5529255867004395} -11/06/2021 21:50:58 - INFO - __main__ - Step 4193: {'lr': 0.0004997294241247627, 'samples': 805056, 'steps': 4192, 'loss/train': 1.6093616485595703} -11/06/2021 21:50:59 - INFO - __main__ - Step 4194: {'lr': 0.0004997291772372441, 'samples': 805248, 'steps': 4193, 'loss/train': 1.4874943494796753} -11/06/2021 21:50:59 - INFO - __main__ - Step 4195: {'lr': 0.0004997289302372014, 'samples': 805440, 'steps': 4194, 'loss/train': 2.0579819679260254} -11/06/2021 21:51:00 - INFO - __main__ - Step 4196: {'lr': 0.0004997286831246347, 'samples': 805632, 'steps': 4195, 'loss/train': 2.4122848510742188} -11/06/2021 21:51:00 - INFO - __main__ - Step 4197: {'lr': 0.0004997284358995441, 'samples': 805824, 'steps': 4196, 'loss/train': 2.2387192249298096} -11/06/2021 21:51:00 - INFO - __main__ - Step 4198: {'lr': 0.0004997281885619297, 'samples': 806016, 'steps': 4197, 'loss/train': 1.6527743339538574} -11/06/2021 21:51:01 - INFO - __main__ - Step 4199: {'lr': 0.0004997279411117916, 'samples': 806208, 'steps': 4198, 'loss/train': 0.3961840569972992} -11/06/2021 21:51:02 - INFO - __main__ - Step 4200: {'lr': 0.00049972769354913, 'samples': 806400, 'steps': 4199, 'loss/train': 1.9782782793045044} -11/06/2021 21:51:02 - INFO - __main__ - Step 4201: {'lr': 0.0004997274458739449, 'samples': 806592, 'steps': 4200, 'loss/train': 2.000523328781128} -11/06/2021 21:51:02 - INFO - __main__ - Step 4202: {'lr': 0.0004997271980862366, 'samples': 806784, 'steps': 4201, 'loss/train': 2.5717737674713135} -11/06/2021 21:51:03 - INFO - __main__ - Step 4203: {'lr': 0.000499726950186005, 'samples': 806976, 'steps': 4202, 'loss/train': 2.567746639251709} -11/06/2021 21:51:03 - INFO - __main__ - Step 4204: {'lr': 0.0004997267021732502, 'samples': 807168, 'steps': 4203, 'loss/train': 2.4571382999420166} -11/06/2021 21:51:04 - INFO - __main__ - Step 4205: {'lr': 0.0004997264540479724, 'samples': 807360, 'steps': 4204, 'loss/train': 1.8436121940612793} -11/06/2021 21:51:05 - INFO - __main__ - Step 4206: {'lr': 0.0004997262058101719, 'samples': 807552, 'steps': 4205, 'loss/train': 2.192099094390869} -11/06/2021 21:51:05 - INFO - __main__ - Step 4207: {'lr': 0.0004997259574598485, 'samples': 807744, 'steps': 4206, 'loss/train': 2.6766111850738525} -11/06/2021 21:51:05 - INFO - __main__ - Step 4208: {'lr': 0.0004997257089970024, 'samples': 807936, 'steps': 4207, 'loss/train': 2.0918617248535156} -11/06/2021 21:51:06 - INFO - __main__ - Step 4209: {'lr': 0.0004997254604216338, 'samples': 808128, 'steps': 4208, 'loss/train': 2.2900002002716064} -11/06/2021 21:51:07 - INFO - __main__ - Step 4210: {'lr': 0.0004997252117337428, 'samples': 808320, 'steps': 4209, 'loss/train': 1.7111936807632446} -11/06/2021 21:51:07 - INFO - __main__ - Step 4211: {'lr': 0.0004997249629333294, 'samples': 808512, 'steps': 4210, 'loss/train': 2.1886565685272217} -11/06/2021 21:51:07 - INFO - __main__ - Step 4212: {'lr': 0.0004997247140203939, 'samples': 808704, 'steps': 4211, 'loss/train': 2.0272629261016846} -11/06/2021 21:51:08 - INFO - __main__ - Step 4213: {'lr': 0.0004997244649949362, 'samples': 808896, 'steps': 4212, 'loss/train': 1.792849063873291} -11/06/2021 21:51:08 - INFO - __main__ - Step 4214: {'lr': 0.0004997242158569564, 'samples': 809088, 'steps': 4213, 'loss/train': 1.8342564105987549} -11/06/2021 21:51:09 - INFO - __main__ - Step 4215: {'lr': 0.0004997239666064549, 'samples': 809280, 'steps': 4214, 'loss/train': 2.516932249069214} -11/06/2021 21:51:09 - INFO - __main__ - Step 4216: {'lr': 0.0004997237172434316, 'samples': 809472, 'steps': 4215, 'loss/train': 1.893647313117981} -11/06/2021 21:51:10 - INFO - __main__ - Step 4217: {'lr': 0.0004997234677678867, 'samples': 809664, 'steps': 4216, 'loss/train': 2.4590060710906982} -11/06/2021 21:51:10 - INFO - __main__ - Step 4218: {'lr': 0.0004997232181798201, 'samples': 809856, 'steps': 4217, 'loss/train': 1.6287667751312256} -11/06/2021 21:51:10 - INFO - __main__ - Step 4219: {'lr': 0.0004997229684792322, 'samples': 810048, 'steps': 4218, 'loss/train': 2.320136070251465} -11/06/2021 21:51:12 - INFO - __main__ - Step 4220: {'lr': 0.000499722718666123, 'samples': 810240, 'steps': 4219, 'loss/train': 2.140002965927124} -11/06/2021 21:51:12 - INFO - __main__ - Step 4221: {'lr': 0.0004997224687404926, 'samples': 810432, 'steps': 4220, 'loss/train': 2.0114235877990723} -11/06/2021 21:51:12 - INFO - __main__ - Step 4222: {'lr': 0.0004997222187023409, 'samples': 810624, 'steps': 4221, 'loss/train': 1.9719492197036743} -11/06/2021 21:51:13 - INFO - __main__ - Step 4223: {'lr': 0.0004997219685516684, 'samples': 810816, 'steps': 4222, 'loss/train': 2.0050837993621826} -11/06/2021 21:51:13 - INFO - __main__ - Step 4224: {'lr': 0.000499721718288475, 'samples': 811008, 'steps': 4223, 'loss/train': 1.0554298162460327} -11/06/2021 21:51:14 - INFO - __main__ - Step 4225: {'lr': 0.0004997214679127609, 'samples': 811200, 'steps': 4224, 'loss/train': 2.309093713760376} -11/06/2021 21:51:14 - INFO - __main__ - Step 4226: {'lr': 0.000499721217424526, 'samples': 811392, 'steps': 4225, 'loss/train': 1.7864500284194946} -11/06/2021 21:51:15 - INFO - __main__ - Step 4227: {'lr': 0.0004997209668237707, 'samples': 811584, 'steps': 4226, 'loss/train': 2.3149712085723877} -11/06/2021 21:51:15 - INFO - __main__ - Step 4228: {'lr': 0.0004997207161104951, 'samples': 811776, 'steps': 4227, 'loss/train': 2.2613799571990967} -11/06/2021 21:51:15 - INFO - __main__ - Step 4229: {'lr': 0.0004997204652846991, 'samples': 811968, 'steps': 4228, 'loss/train': 1.9725654125213623} -11/06/2021 21:51:16 - INFO - __main__ - Step 4230: {'lr': 0.0004997202143463828, 'samples': 812160, 'steps': 4229, 'loss/train': 2.0676584243774414} -11/06/2021 21:51:17 - INFO - __main__ - Step 4231: {'lr': 0.0004997199632955464, 'samples': 812352, 'steps': 4230, 'loss/train': 2.0852909088134766} -11/06/2021 21:51:17 - INFO - __main__ - Step 4232: {'lr': 0.0004997197121321903, 'samples': 812544, 'steps': 4231, 'loss/train': 2.0031850337982178} -11/06/2021 21:51:18 - INFO - __main__ - Step 4233: {'lr': 0.0004997194608563142, 'samples': 812736, 'steps': 4232, 'loss/train': 1.9812066555023193} -11/06/2021 21:51:18 - INFO - __main__ - Step 4234: {'lr': 0.0004997192094679183, 'samples': 812928, 'steps': 4233, 'loss/train': 2.6864309310913086} -11/06/2021 21:51:18 - INFO - __main__ - Step 4235: {'lr': 0.0004997189579670028, 'samples': 813120, 'steps': 4234, 'loss/train': 2.032951831817627} -11/06/2021 21:51:19 - INFO - __main__ - Step 4236: {'lr': 0.0004997187063535679, 'samples': 813312, 'steps': 4235, 'loss/train': 2.289562463760376} -11/06/2021 21:51:20 - INFO - __main__ - Step 4237: {'lr': 0.0004997184546276135, 'samples': 813504, 'steps': 4236, 'loss/train': 1.5230915546417236} -11/06/2021 21:51:20 - INFO - __main__ - Step 4238: {'lr': 0.0004997182027891399, 'samples': 813696, 'steps': 4237, 'loss/train': 2.07342529296875} -11/06/2021 21:51:21 - INFO - __main__ - Step 4239: {'lr': 0.000499717950838147, 'samples': 813888, 'steps': 4238, 'loss/train': 1.0521665811538696} -11/06/2021 21:51:21 - INFO - __main__ - Step 4240: {'lr': 0.0004997176987746352, 'samples': 814080, 'steps': 4239, 'loss/train': 2.1802866458892822} -11/06/2021 21:51:21 - INFO - __main__ - Step 4241: {'lr': 0.0004997174465986043, 'samples': 814272, 'steps': 4240, 'loss/train': 1.9899753332138062} -11/06/2021 21:51:23 - INFO - __main__ - Step 4242: {'lr': 0.0004997171943100547, 'samples': 814464, 'steps': 4241, 'loss/train': 1.9145240783691406} -11/06/2021 21:51:23 - INFO - __main__ - Step 4243: {'lr': 0.0004997169419089863, 'samples': 814656, 'steps': 4242, 'loss/train': 2.2730929851531982} -11/06/2021 21:51:23 - INFO - __main__ - Step 4244: {'lr': 0.0004997166893953994, 'samples': 814848, 'steps': 4243, 'loss/train': 2.227478504180908} -11/06/2021 21:51:24 - INFO - __main__ - Step 4245: {'lr': 0.000499716436769294, 'samples': 815040, 'steps': 4244, 'loss/train': 1.7130650281906128} -11/06/2021 21:51:24 - INFO - __main__ - Step 4246: {'lr': 0.0004997161840306701, 'samples': 815232, 'steps': 4245, 'loss/train': 2.1107656955718994} -11/06/2021 21:51:25 - INFO - __main__ - Step 4247: {'lr': 0.0004997159311795281, 'samples': 815424, 'steps': 4246, 'loss/train': 2.0193605422973633} -11/06/2021 21:51:25 - INFO - __main__ - Step 4248: {'lr': 0.0004997156782158679, 'samples': 815616, 'steps': 4247, 'loss/train': 2.169619083404541} -11/06/2021 21:51:26 - INFO - __main__ - Step 4249: {'lr': 0.0004997154251396896, 'samples': 815808, 'steps': 4248, 'loss/train': 1.5952482223510742} -11/06/2021 21:51:26 - INFO - __main__ - Step 4250: {'lr': 0.0004997151719509935, 'samples': 816000, 'steps': 4249, 'loss/train': 2.200782060623169} -11/06/2021 21:51:26 - INFO - __main__ - Step 4251: {'lr': 0.0004997149186497795, 'samples': 816192, 'steps': 4250, 'loss/train': 2.353931188583374} -11/06/2021 21:51:27 - INFO - __main__ - Step 4252: {'lr': 0.0004997146652360478, 'samples': 816384, 'steps': 4251, 'loss/train': 1.8407737016677856} -11/06/2021 21:51:28 - INFO - __main__ - Step 4253: {'lr': 0.0004997144117097986, 'samples': 816576, 'steps': 4252, 'loss/train': 1.8652644157409668} -11/06/2021 21:51:28 - INFO - __main__ - Step 4254: {'lr': 0.0004997141580710318, 'samples': 816768, 'steps': 4253, 'loss/train': 2.0572428703308105} -11/06/2021 21:51:28 - INFO - __main__ - Step 4255: {'lr': 0.0004997139043197478, 'samples': 816960, 'steps': 4254, 'loss/train': 1.7917412519454956} -11/06/2021 21:51:29 - INFO - __main__ - Step 4256: {'lr': 0.0004997136504559465, 'samples': 817152, 'steps': 4255, 'loss/train': 1.9230844974517822} -11/06/2021 21:51:30 - INFO - __main__ - Step 4257: {'lr': 0.0004997133964796281, 'samples': 817344, 'steps': 4256, 'loss/train': 2.0481159687042236} -11/06/2021 21:51:30 - INFO - __main__ - Step 4258: {'lr': 0.0004997131423907927, 'samples': 817536, 'steps': 4257, 'loss/train': 2.003450632095337} -11/06/2021 21:51:31 - INFO - __main__ - Step 4259: {'lr': 0.0004997128881894404, 'samples': 817728, 'steps': 4258, 'loss/train': 2.5174543857574463} -11/06/2021 21:51:31 - INFO - __main__ - Step 4260: {'lr': 0.0004997126338755714, 'samples': 817920, 'steps': 4259, 'loss/train': 2.247880697250366} -11/06/2021 21:51:31 - INFO - __main__ - Step 4261: {'lr': 0.0004997123794491856, 'samples': 818112, 'steps': 4260, 'loss/train': 2.505103349685669} -11/06/2021 21:51:32 - INFO - __main__ - Step 4262: {'lr': 0.0004997121249102834, 'samples': 818304, 'steps': 4261, 'loss/train': 1.9285527467727661} -11/06/2021 21:51:33 - INFO - __main__ - Step 4263: {'lr': 0.0004997118702588647, 'samples': 818496, 'steps': 4262, 'loss/train': 2.225656509399414} -11/06/2021 21:51:33 - INFO - __main__ - Step 4264: {'lr': 0.0004997116154949297, 'samples': 818688, 'steps': 4263, 'loss/train': 1.5641311407089233} -11/06/2021 21:51:34 - INFO - __main__ - Step 4265: {'lr': 0.0004997113606184785, 'samples': 818880, 'steps': 4264, 'loss/train': 1.9400560855865479} -11/06/2021 21:51:34 - INFO - __main__ - Step 4266: {'lr': 0.0004997111056295111, 'samples': 819072, 'steps': 4265, 'loss/train': 2.0672645568847656} -11/06/2021 21:51:35 - INFO - __main__ - Step 4267: {'lr': 0.0004997108505280279, 'samples': 819264, 'steps': 4266, 'loss/train': 2.7679026126861572} -11/06/2021 21:51:35 - INFO - __main__ - Step 4268: {'lr': 0.0004997105953140288, 'samples': 819456, 'steps': 4267, 'loss/train': 1.6954803466796875} -11/06/2021 21:51:36 - INFO - __main__ - Step 4269: {'lr': 0.0004997103399875139, 'samples': 819648, 'steps': 4268, 'loss/train': 1.9309132099151611} -11/06/2021 21:51:36 - INFO - __main__ - Step 4270: {'lr': 0.0004997100845484834, 'samples': 819840, 'steps': 4269, 'loss/train': 1.524571418762207} -11/06/2021 21:51:37 - INFO - __main__ - Step 4271: {'lr': 0.0004997098289969374, 'samples': 820032, 'steps': 4270, 'loss/train': 1.9430183172225952} -11/06/2021 21:51:37 - INFO - __main__ - Step 4272: {'lr': 0.0004997095733328761, 'samples': 820224, 'steps': 4271, 'loss/train': 2.232881784439087} -11/06/2021 21:51:38 - INFO - __main__ - Step 4273: {'lr': 0.0004997093175562994, 'samples': 820416, 'steps': 4272, 'loss/train': 2.1205177307128906} -11/06/2021 21:51:38 - INFO - __main__ - Step 4274: {'lr': 0.0004997090616672076, 'samples': 820608, 'steps': 4273, 'loss/train': 2.2687668800354004} -11/06/2021 21:51:39 - INFO - __main__ - Step 4275: {'lr': 0.0004997088056656006, 'samples': 820800, 'steps': 4274, 'loss/train': 2.34332275390625} -11/06/2021 21:51:39 - INFO - __main__ - Step 4276: {'lr': 0.0004997085495514788, 'samples': 820992, 'steps': 4275, 'loss/train': 2.0807552337646484} -11/06/2021 21:51:39 - INFO - __main__ - Step 4277: {'lr': 0.0004997082933248421, 'samples': 821184, 'steps': 4276, 'loss/train': 2.0649728775024414} -11/06/2021 21:51:40 - INFO - __main__ - Step 4278: {'lr': 0.0004997080369856907, 'samples': 821376, 'steps': 4277, 'loss/train': 2.0820047855377197} -11/06/2021 21:51:41 - INFO - __main__ - Step 4279: {'lr': 0.0004997077805340248, 'samples': 821568, 'steps': 4278, 'loss/train': 1.6447721719741821} -11/06/2021 21:51:41 - INFO - __main__ - Step 4280: {'lr': 0.0004997075239698445, 'samples': 821760, 'steps': 4279, 'loss/train': 1.9901349544525146} -11/06/2021 21:51:41 - INFO - __main__ - Step 4281: {'lr': 0.0004997072672931497, 'samples': 821952, 'steps': 4280, 'loss/train': 2.4467787742614746} -11/06/2021 21:51:42 - INFO - __main__ - Step 4282: {'lr': 0.0004997070105039407, 'samples': 822144, 'steps': 4281, 'loss/train': 1.6936836242675781} -11/06/2021 21:51:43 - INFO - __main__ - Step 4283: {'lr': 0.0004997067536022176, 'samples': 822336, 'steps': 4282, 'loss/train': 2.122401475906372} -11/06/2021 21:51:43 - INFO - __main__ - Step 4284: {'lr': 0.0004997064965879804, 'samples': 822528, 'steps': 4283, 'loss/train': 2.0260608196258545} -11/06/2021 21:51:44 - INFO - __main__ - Step 4285: {'lr': 0.0004997062394612293, 'samples': 822720, 'steps': 4284, 'loss/train': 2.1867868900299072} -11/06/2021 21:51:44 - INFO - __main__ - Step 4286: {'lr': 0.0004997059822219645, 'samples': 822912, 'steps': 4285, 'loss/train': 2.057260274887085} -11/06/2021 21:51:44 - INFO - __main__ - Step 4287: {'lr': 0.000499705724870186, 'samples': 823104, 'steps': 4286, 'loss/train': 2.2277965545654297} -11/06/2021 21:51:45 - INFO - __main__ - Step 4288: {'lr': 0.0004997054674058941, 'samples': 823296, 'steps': 4287, 'loss/train': 2.590022325515747} -11/06/2021 21:51:46 - INFO - __main__ - Step 4289: {'lr': 0.0004997052098290886, 'samples': 823488, 'steps': 4288, 'loss/train': 2.015610694885254} -11/06/2021 21:51:46 - INFO - __main__ - Step 4290: {'lr': 0.0004997049521397698, 'samples': 823680, 'steps': 4289, 'loss/train': 2.311326503753662} -11/06/2021 21:51:46 - INFO - __main__ - Step 4291: {'lr': 0.0004997046943379379, 'samples': 823872, 'steps': 4290, 'loss/train': 1.8215492963790894} -11/06/2021 21:51:47 - INFO - __main__ - Step 4292: {'lr': 0.0004997044364235928, 'samples': 824064, 'steps': 4291, 'loss/train': 1.7921706438064575} -11/06/2021 21:51:47 - INFO - __main__ - Step 4293: {'lr': 0.0004997041783967348, 'samples': 824256, 'steps': 4292, 'loss/train': 2.276956558227539} -11/06/2021 21:51:48 - INFO - __main__ - Step 4294: {'lr': 0.0004997039202573639, 'samples': 824448, 'steps': 4293, 'loss/train': 1.8650037050247192} -11/06/2021 21:51:48 - INFO - __main__ - Step 4295: {'lr': 0.0004997036620054803, 'samples': 824640, 'steps': 4294, 'loss/train': 2.3925178050994873} -11/06/2021 21:51:49 - INFO - __main__ - Step 4296: {'lr': 0.0004997034036410841, 'samples': 824832, 'steps': 4295, 'loss/train': 1.9569441080093384} -11/06/2021 21:51:49 - INFO - __main__ - Step 4297: {'lr': 0.0004997031451641754, 'samples': 825024, 'steps': 4296, 'loss/train': 1.8525234460830688} -11/06/2021 21:51:49 - INFO - __main__ - Step 4298: {'lr': 0.0004997028865747542, 'samples': 825216, 'steps': 4297, 'loss/train': 2.4801597595214844} -11/06/2021 21:51:51 - INFO - __main__ - Step 4299: {'lr': 0.0004997026278728209, 'samples': 825408, 'steps': 4298, 'loss/train': 2.3479583263397217} -11/06/2021 21:51:51 - INFO - __main__ - Step 4300: {'lr': 0.0004997023690583753, 'samples': 825600, 'steps': 4299, 'loss/train': 1.8593815565109253} -11/06/2021 21:51:51 - INFO - __main__ - Step 4301: {'lr': 0.0004997021101314179, 'samples': 825792, 'steps': 4300, 'loss/train': 2.492985248565674} -11/06/2021 21:51:52 - INFO - __main__ - Step 4302: {'lr': 0.0004997018510919483, 'samples': 825984, 'steps': 4301, 'loss/train': 1.1239334344863892} -11/06/2021 21:51:52 - INFO - __main__ - Step 4303: {'lr': 0.0004997015919399671, 'samples': 826176, 'steps': 4302, 'loss/train': 2.068119525909424} -11/06/2021 21:51:53 - INFO - __main__ - Step 4304: {'lr': 0.0004997013326754742, 'samples': 826368, 'steps': 4303, 'loss/train': 2.1923468112945557} -11/06/2021 21:51:53 - INFO - __main__ - Step 4305: {'lr': 0.0004997010732984696, 'samples': 826560, 'steps': 4304, 'loss/train': 2.267517566680908} -11/06/2021 21:51:54 - INFO - __main__ - Step 4306: {'lr': 0.0004997008138089536, 'samples': 826752, 'steps': 4305, 'loss/train': 2.289822816848755} -11/06/2021 21:51:54 - INFO - __main__ - Step 4307: {'lr': 0.0004997005542069263, 'samples': 826944, 'steps': 4306, 'loss/train': 2.516078233718872} -11/06/2021 21:51:54 - INFO - __main__ - Step 4308: {'lr': 0.0004997002944923878, 'samples': 827136, 'steps': 4307, 'loss/train': 2.071676731109619} -11/06/2021 21:51:55 - INFO - __main__ - Step 4309: {'lr': 0.0004997000346653381, 'samples': 827328, 'steps': 4308, 'loss/train': 2.0077381134033203} -11/06/2021 21:51:56 - INFO - __main__ - Step 4310: {'lr': 0.0004996997747257775, 'samples': 827520, 'steps': 4309, 'loss/train': 2.347663640975952} -11/06/2021 21:51:56 - INFO - __main__ - Step 4311: {'lr': 0.000499699514673706, 'samples': 827712, 'steps': 4310, 'loss/train': 1.8493750095367432} -11/06/2021 21:51:56 - INFO - __main__ - Step 4312: {'lr': 0.0004996992545091239, 'samples': 827904, 'steps': 4311, 'loss/train': 1.9490984678268433} -11/06/2021 21:51:57 - INFO - __main__ - Step 4313: {'lr': 0.000499698994232031, 'samples': 828096, 'steps': 4312, 'loss/train': 2.2209248542785645} -11/06/2021 21:51:57 - INFO - __main__ - Step 4314: {'lr': 0.0004996987338424276, 'samples': 828288, 'steps': 4313, 'loss/train': 2.120884418487549} -11/06/2021 21:51:58 - INFO - __main__ - Step 4315: {'lr': 0.0004996984733403138, 'samples': 828480, 'steps': 4314, 'loss/train': 2.1321933269500732} -11/06/2021 21:51:59 - INFO - __main__ - Step 4316: {'lr': 0.0004996982127256898, 'samples': 828672, 'steps': 4315, 'loss/train': 2.0887527465820312} -11/06/2021 21:51:59 - INFO - __main__ - Step 4317: {'lr': 0.0004996979519985556, 'samples': 828864, 'steps': 4316, 'loss/train': 2.1263225078582764} -11/06/2021 21:51:59 - INFO - __main__ - Step 4318: {'lr': 0.0004996976911589114, 'samples': 829056, 'steps': 4317, 'loss/train': 1.8161555528640747} -11/06/2021 21:52:00 - INFO - __main__ - Step 4319: {'lr': 0.0004996974302067572, 'samples': 829248, 'steps': 4318, 'loss/train': 1.67631995677948} -11/06/2021 21:52:01 - INFO - __main__ - Step 4320: {'lr': 0.0004996971691420931, 'samples': 829440, 'steps': 4319, 'loss/train': 1.9163763523101807} -11/06/2021 21:52:01 - INFO - __main__ - Step 4321: {'lr': 0.0004996969079649195, 'samples': 829632, 'steps': 4320, 'loss/train': 1.8467737436294556} -11/06/2021 21:52:01 - INFO - __main__ - Step 4322: {'lr': 0.0004996966466752362, 'samples': 829824, 'steps': 4321, 'loss/train': 2.3159868717193604} -11/06/2021 21:52:02 - INFO - __main__ - Step 4323: {'lr': 0.0004996963852730436, 'samples': 830016, 'steps': 4322, 'loss/train': 1.9152145385742188} -11/06/2021 21:52:02 - INFO - __main__ - Step 4324: {'lr': 0.0004996961237583415, 'samples': 830208, 'steps': 4323, 'loss/train': 2.11564302444458} -11/06/2021 21:52:03 - INFO - __main__ - Step 4325: {'lr': 0.0004996958621311302, 'samples': 830400, 'steps': 4324, 'loss/train': 2.3892369270324707} -11/06/2021 21:52:03 - INFO - __main__ - Step 4326: {'lr': 0.00049969560039141, 'samples': 830592, 'steps': 4325, 'loss/train': 1.4963157176971436} -11/06/2021 21:52:04 - INFO - __main__ - Step 4327: {'lr': 0.0004996953385391806, 'samples': 830784, 'steps': 4326, 'loss/train': 2.2413148880004883} -11/06/2021 21:52:04 - INFO - __main__ - Step 4328: {'lr': 0.0004996950765744424, 'samples': 830976, 'steps': 4327, 'loss/train': 1.8104511499404907} -11/06/2021 21:52:04 - INFO - __main__ - Step 4329: {'lr': 0.0004996948144971953, 'samples': 831168, 'steps': 4328, 'loss/train': 1.7227517366409302} -11/06/2021 21:52:05 - INFO - __main__ - Step 4330: {'lr': 0.0004996945523074398, 'samples': 831360, 'steps': 4329, 'loss/train': 1.6873306035995483} -11/06/2021 21:52:06 - INFO - __main__ - Step 4331: {'lr': 0.0004996942900051757, 'samples': 831552, 'steps': 4330, 'loss/train': 2.224438190460205} -11/06/2021 21:52:06 - INFO - __main__ - Step 4332: {'lr': 0.0004996940275904031, 'samples': 831744, 'steps': 4331, 'loss/train': 2.1473422050476074} -11/06/2021 21:52:07 - INFO - __main__ - Step 4333: {'lr': 0.0004996937650631224, 'samples': 831936, 'steps': 4332, 'loss/train': 2.5668904781341553} -11/06/2021 21:52:07 - INFO - __main__ - Step 4334: {'lr': 0.0004996935024233335, 'samples': 832128, 'steps': 4333, 'loss/train': 2.192603349685669} -11/06/2021 21:52:08 - INFO - __main__ - Step 4335: {'lr': 0.0004996932396710365, 'samples': 832320, 'steps': 4334, 'loss/train': 1.7712533473968506} -11/06/2021 21:52:08 - INFO - __main__ - Step 4336: {'lr': 0.0004996929768062316, 'samples': 832512, 'steps': 4335, 'loss/train': 1.558101773262024} -11/06/2021 21:52:09 - INFO - __main__ - Step 4337: {'lr': 0.0004996927138289189, 'samples': 832704, 'steps': 4336, 'loss/train': 2.441239833831787} -11/06/2021 21:52:09 - INFO - __main__ - Step 4338: {'lr': 0.0004996924507390985, 'samples': 832896, 'steps': 4337, 'loss/train': 2.24872088432312} -11/06/2021 21:52:09 - INFO - __main__ - Step 4339: {'lr': 0.0004996921875367705, 'samples': 833088, 'steps': 4338, 'loss/train': 2.0886828899383545} -11/06/2021 21:52:10 - INFO - __main__ - Step 4340: {'lr': 0.0004996919242219352, 'samples': 833280, 'steps': 4339, 'loss/train': 2.2574408054351807} -11/06/2021 21:52:11 - INFO - __main__ - Step 4341: {'lr': 0.0004996916607945925, 'samples': 833472, 'steps': 4340, 'loss/train': 1.8286736011505127} -11/06/2021 21:52:11 - INFO - __main__ - Step 4342: {'lr': 0.0004996913972547426, 'samples': 833664, 'steps': 4341, 'loss/train': 2.018918037414551} -11/06/2021 21:52:11 - INFO - __main__ - Step 4343: {'lr': 0.0004996911336023855, 'samples': 833856, 'steps': 4342, 'loss/train': 2.208406925201416} -11/06/2021 21:52:12 - INFO - __main__ - Step 4344: {'lr': 0.0004996908698375216, 'samples': 834048, 'steps': 4343, 'loss/train': 1.9386653900146484} -11/06/2021 21:52:12 - INFO - __main__ - Step 4345: {'lr': 0.0004996906059601507, 'samples': 834240, 'steps': 4344, 'loss/train': 1.8494505882263184} -11/06/2021 21:52:13 - INFO - __main__ - Step 4346: {'lr': 0.0004996903419702731, 'samples': 834432, 'steps': 4345, 'loss/train': 2.3450777530670166} -11/06/2021 21:52:13 - INFO - __main__ - Step 4347: {'lr': 0.0004996900778678889, 'samples': 834624, 'steps': 4346, 'loss/train': 2.0560898780822754} -11/06/2021 21:52:14 - INFO - __main__ - Step 4348: {'lr': 0.0004996898136529982, 'samples': 834816, 'steps': 4347, 'loss/train': 2.482868194580078} -11/06/2021 21:52:14 - INFO - __main__ - Step 4349: {'lr': 0.0004996895493256012, 'samples': 835008, 'steps': 4348, 'loss/train': 1.759129524230957} -11/06/2021 21:52:14 - INFO - __main__ - Step 4350: {'lr': 0.0004996892848856978, 'samples': 835200, 'steps': 4349, 'loss/train': 1.8137215375900269} -11/06/2021 21:52:16 - INFO - __main__ - Step 4351: {'lr': 0.0004996890203332883, 'samples': 835392, 'steps': 4350, 'loss/train': 1.9098490476608276} -11/06/2021 21:52:16 - INFO - __main__ - Step 4352: {'lr': 0.0004996887556683729, 'samples': 835584, 'steps': 4351, 'loss/train': 2.027623414993286} -11/06/2021 21:52:16 - INFO - __main__ - Step 4353: {'lr': 0.0004996884908909515, 'samples': 835776, 'steps': 4352, 'loss/train': 2.083651304244995} -11/06/2021 21:52:17 - INFO - __main__ - Step 4354: {'lr': 0.0004996882260010243, 'samples': 835968, 'steps': 4353, 'loss/train': 1.6562211513519287} -11/06/2021 21:52:17 - INFO - __main__ - Step 4355: {'lr': 0.0004996879609985915, 'samples': 836160, 'steps': 4354, 'loss/train': 1.846291422843933} -11/06/2021 21:52:18 - INFO - __main__ - Step 4356: {'lr': 0.0004996876958836532, 'samples': 836352, 'steps': 4355, 'loss/train': 2.066518783569336} -11/06/2021 21:52:19 - INFO - __main__ - Step 4357: {'lr': 0.0004996874306562093, 'samples': 836544, 'steps': 4356, 'loss/train': 2.2601191997528076} -11/06/2021 21:52:19 - INFO - __main__ - Step 4358: {'lr': 0.0004996871653162602, 'samples': 836736, 'steps': 4357, 'loss/train': 2.134087562561035} -11/06/2021 21:52:19 - INFO - __main__ - Step 4359: {'lr': 0.0004996868998638059, 'samples': 836928, 'steps': 4358, 'loss/train': 2.3234333992004395} -11/06/2021 21:52:20 - INFO - __main__ - Step 4360: {'lr': 0.0004996866342988467, 'samples': 837120, 'steps': 4359, 'loss/train': 2.3369786739349365} -11/06/2021 21:52:20 - INFO - __main__ - Step 4361: {'lr': 0.0004996863686213823, 'samples': 837312, 'steps': 4360, 'loss/train': 2.203856945037842} -11/06/2021 21:52:21 - INFO - __main__ - Step 4362: {'lr': 0.0004996861028314133, 'samples': 837504, 'steps': 4361, 'loss/train': 2.04062557220459} -11/06/2021 21:52:21 - INFO - __main__ - Step 4363: {'lr': 0.0004996858369289394, 'samples': 837696, 'steps': 4362, 'loss/train': 2.0130574703216553} -11/06/2021 21:52:22 - INFO - __main__ - Step 4364: {'lr': 0.000499685570913961, 'samples': 837888, 'steps': 4363, 'loss/train': 1.978306770324707} -11/06/2021 21:52:22 - INFO - __main__ - Step 4365: {'lr': 0.0004996853047864781, 'samples': 838080, 'steps': 4364, 'loss/train': 2.3143999576568604} -11/06/2021 21:52:22 - INFO - __main__ - Step 4366: {'lr': 0.0004996850385464909, 'samples': 838272, 'steps': 4365, 'loss/train': 2.2573633193969727} -11/06/2021 21:52:23 - INFO - __main__ - Step 4367: {'lr': 0.0004996847721939994, 'samples': 838464, 'steps': 4366, 'loss/train': 1.7779031991958618} -11/06/2021 21:52:24 - INFO - __main__ - Step 4368: {'lr': 0.0004996845057290039, 'samples': 838656, 'steps': 4367, 'loss/train': 2.1156513690948486} -11/06/2021 21:52:24 - INFO - __main__ - Step 4369: {'lr': 0.0004996842391515044, 'samples': 838848, 'steps': 4368, 'loss/train': 1.8346737623214722} -11/06/2021 21:52:25 - INFO - __main__ - Step 4370: {'lr': 0.000499683972461501, 'samples': 839040, 'steps': 4369, 'loss/train': 1.7656928300857544} -11/06/2021 21:52:25 - INFO - __main__ - Step 4371: {'lr': 0.0004996837056589938, 'samples': 839232, 'steps': 4370, 'loss/train': 1.4817529916763306} -11/06/2021 21:52:25 - INFO - __main__ - Step 4372: {'lr': 0.0004996834387439831, 'samples': 839424, 'steps': 4371, 'loss/train': 2.4186854362487793} -11/06/2021 21:52:26 - INFO - __main__ - Step 4373: {'lr': 0.0004996831717164689, 'samples': 839616, 'steps': 4372, 'loss/train': 2.3830738067626953} -11/06/2021 21:52:27 - INFO - __main__ - Step 4374: {'lr': 0.0004996829045764512, 'samples': 839808, 'steps': 4373, 'loss/train': 2.039133310317993} -11/06/2021 21:52:27 - INFO - __main__ - Step 4375: {'lr': 0.0004996826373239303, 'samples': 840000, 'steps': 4374, 'loss/train': 1.8050706386566162} -11/06/2021 21:52:27 - INFO - __main__ - Step 4376: {'lr': 0.0004996823699589062, 'samples': 840192, 'steps': 4375, 'loss/train': 2.005566120147705} -11/06/2021 21:52:28 - INFO - __main__ - Step 4377: {'lr': 0.0004996821024813791, 'samples': 840384, 'steps': 4376, 'loss/train': 2.3006296157836914} -11/06/2021 21:52:29 - INFO - __main__ - Step 4378: {'lr': 0.0004996818348913491, 'samples': 840576, 'steps': 4377, 'loss/train': 1.9584013223648071} -11/06/2021 21:52:29 - INFO - __main__ - Step 4379: {'lr': 0.0004996815671888163, 'samples': 840768, 'steps': 4378, 'loss/train': 2.180757522583008} -11/06/2021 21:52:29 - INFO - __main__ - Step 4380: {'lr': 0.000499681299373781, 'samples': 840960, 'steps': 4379, 'loss/train': 2.559288740158081} -11/06/2021 21:52:30 - INFO - __main__ - Step 4381: {'lr': 0.0004996810314462429, 'samples': 841152, 'steps': 4380, 'loss/train': 1.7387698888778687} -11/06/2021 21:52:30 - INFO - __main__ - Step 4382: {'lr': 0.0004996807634062025, 'samples': 841344, 'steps': 4381, 'loss/train': 2.247429847717285} -11/06/2021 21:52:31 - INFO - __main__ - Step 4383: {'lr': 0.0004996804952536599, 'samples': 841536, 'steps': 4382, 'loss/train': 2.5863077640533447} -11/06/2021 21:52:31 - INFO - __main__ - Step 4384: {'lr': 0.0004996802269886149, 'samples': 841728, 'steps': 4383, 'loss/train': 1.9979889392852783} -11/06/2021 21:52:32 - INFO - __main__ - Step 4385: {'lr': 0.0004996799586110681, 'samples': 841920, 'steps': 4384, 'loss/train': 2.161149501800537} -11/06/2021 21:52:32 - INFO - __main__ - Step 4386: {'lr': 0.0004996796901210192, 'samples': 842112, 'steps': 4385, 'loss/train': 2.0866355895996094} -11/06/2021 21:52:32 - INFO - __main__ - Step 4387: {'lr': 0.0004996794215184685, 'samples': 842304, 'steps': 4386, 'loss/train': 2.5882389545440674} -11/06/2021 21:52:33 - INFO - __main__ - Step 4388: {'lr': 0.0004996791528034161, 'samples': 842496, 'steps': 4387, 'loss/train': 1.5546870231628418} -11/06/2021 21:52:34 - INFO - __main__ - Step 4389: {'lr': 0.0004996788839758622, 'samples': 842688, 'steps': 4388, 'loss/train': 2.4196763038635254} -11/06/2021 21:52:34 - INFO - __main__ - Step 4390: {'lr': 0.0004996786150358068, 'samples': 842880, 'steps': 4389, 'loss/train': 1.6892547607421875} -11/06/2021 21:52:35 - INFO - __main__ - Step 4391: {'lr': 0.00049967834598325, 'samples': 843072, 'steps': 4390, 'loss/train': 2.1776304244995117} -11/06/2021 21:52:35 - INFO - __main__ - Step 4392: {'lr': 0.0004996780768181921, 'samples': 843264, 'steps': 4391, 'loss/train': 2.4177329540252686} -11/06/2021 21:52:35 - INFO - __main__ - Step 4393: {'lr': 0.0004996778075406331, 'samples': 843456, 'steps': 4392, 'loss/train': 1.8474143743515015} -11/06/2021 21:52:36 - INFO - __main__ - Step 4394: {'lr': 0.0004996775381505731, 'samples': 843648, 'steps': 4393, 'loss/train': 1.766103744506836} -11/06/2021 21:52:37 - INFO - __main__ - Step 4395: {'lr': 0.0004996772686480122, 'samples': 843840, 'steps': 4394, 'loss/train': 2.221249580383301} -11/06/2021 21:52:37 - INFO - __main__ - Step 4396: {'lr': 0.0004996769990329507, 'samples': 844032, 'steps': 4395, 'loss/train': 1.950240135192871} -11/06/2021 21:52:37 - INFO - __main__ - Step 4397: {'lr': 0.0004996767293053885, 'samples': 844224, 'steps': 4396, 'loss/train': 1.8675569295883179} -11/06/2021 21:52:38 - INFO - __main__ - Step 4398: {'lr': 0.0004996764594653258, 'samples': 844416, 'steps': 4397, 'loss/train': 2.6407816410064697} -11/06/2021 21:52:39 - INFO - __main__ - Step 4399: {'lr': 0.0004996761895127628, 'samples': 844608, 'steps': 4398, 'loss/train': 1.6900591850280762} -11/06/2021 21:52:39 - INFO - __main__ - Step 4400: {'lr': 0.0004996759194476996, 'samples': 844800, 'steps': 4399, 'loss/train': 0.33388879895210266} -11/06/2021 21:52:39 - INFO - __main__ - Step 4401: {'lr': 0.0004996756492701362, 'samples': 844992, 'steps': 4400, 'loss/train': 1.999221682548523} -11/06/2021 21:52:40 - INFO - __main__ - Step 4402: {'lr': 0.0004996753789800729, 'samples': 845184, 'steps': 4401, 'loss/train': 2.3262462615966797} -11/06/2021 21:52:40 - INFO - __main__ - Step 4403: {'lr': 0.0004996751085775096, 'samples': 845376, 'steps': 4402, 'loss/train': 2.0857207775115967} -11/06/2021 21:52:41 - INFO - __main__ - Step 4404: {'lr': 0.0004996748380624467, 'samples': 845568, 'steps': 4403, 'loss/train': 1.382709264755249} -11/06/2021 21:52:41 - INFO - __main__ - Step 4405: {'lr': 0.000499674567434884, 'samples': 845760, 'steps': 4404, 'loss/train': 2.260540008544922} -11/06/2021 21:52:42 - INFO - __main__ - Step 4406: {'lr': 0.0004996742966948219, 'samples': 845952, 'steps': 4405, 'loss/train': 1.8191969394683838} -11/06/2021 21:52:42 - INFO - __main__ - Step 4407: {'lr': 0.0004996740258422604, 'samples': 846144, 'steps': 4406, 'loss/train': 2.2261736392974854} -11/06/2021 21:52:43 - INFO - __main__ - Step 4408: {'lr': 0.0004996737548771997, 'samples': 846336, 'steps': 4407, 'loss/train': 1.8432106971740723} -11/06/2021 21:52:44 - INFO - __main__ - Step 4409: {'lr': 0.0004996734837996397, 'samples': 846528, 'steps': 4408, 'loss/train': 2.118229627609253} -11/06/2021 21:52:44 - INFO - __main__ - Step 4410: {'lr': 0.0004996732126095807, 'samples': 846720, 'steps': 4409, 'loss/train': 1.7854758501052856} -11/06/2021 21:52:44 - INFO - __main__ - Step 4411: {'lr': 0.0004996729413070229, 'samples': 846912, 'steps': 4410, 'loss/train': 2.3659751415252686} -11/06/2021 21:52:45 - INFO - __main__ - Step 4412: {'lr': 0.0004996726698919664, 'samples': 847104, 'steps': 4411, 'loss/train': 1.817520260810852} -11/06/2021 21:52:45 - INFO - __main__ - Step 4413: {'lr': 0.0004996723983644112, 'samples': 847296, 'steps': 4412, 'loss/train': 1.4988713264465332} -11/06/2021 21:52:46 - INFO - __main__ - Step 4414: {'lr': 0.0004996721267243573, 'samples': 847488, 'steps': 4413, 'loss/train': 1.2573717832565308} -11/06/2021 21:52:47 - INFO - __main__ - Step 4415: {'lr': 0.0004996718549718051, 'samples': 847680, 'steps': 4414, 'loss/train': 1.9494376182556152} -11/06/2021 21:52:47 - INFO - __main__ - Step 4416: {'lr': 0.0004996715831067546, 'samples': 847872, 'steps': 4415, 'loss/train': 0.341790109872818} -11/06/2021 21:52:47 - INFO - __main__ - Step 4417: {'lr': 0.000499671311129206, 'samples': 848064, 'steps': 4416, 'loss/train': 1.7873398065567017} -11/06/2021 21:52:48 - INFO - __main__ - Step 4418: {'lr': 0.0004996710390391593, 'samples': 848256, 'steps': 4417, 'loss/train': 2.2925448417663574} -11/06/2021 21:52:49 - INFO - __main__ - Step 4419: {'lr': 0.0004996707668366147, 'samples': 848448, 'steps': 4418, 'loss/train': 2.3310353755950928} -11/06/2021 21:52:49 - INFO - __main__ - Step 4420: {'lr': 0.0004996704945215724, 'samples': 848640, 'steps': 4419, 'loss/train': 1.234442949295044} -11/06/2021 21:52:49 - INFO - __main__ - Step 4421: {'lr': 0.0004996702220940322, 'samples': 848832, 'steps': 4420, 'loss/train': 2.263622522354126} -11/06/2021 21:52:50 - INFO - __main__ - Step 4422: {'lr': 0.0004996699495539947, 'samples': 849024, 'steps': 4421, 'loss/train': 2.1597673892974854} -11/06/2021 21:52:50 - INFO - __main__ - Step 4423: {'lr': 0.0004996696769014596, 'samples': 849216, 'steps': 4422, 'loss/train': 2.2731714248657227} -11/06/2021 21:52:50 - INFO - __main__ - Step 4424: {'lr': 0.0004996694041364272, 'samples': 849408, 'steps': 4423, 'loss/train': 2.049422264099121} -11/06/2021 21:52:51 - INFO - __main__ - Step 4425: {'lr': 0.0004996691312588977, 'samples': 849600, 'steps': 4424, 'loss/train': 1.7566492557525635} -11/06/2021 21:52:52 - INFO - __main__ - Step 4426: {'lr': 0.0004996688582688711, 'samples': 849792, 'steps': 4425, 'loss/train': 2.2029178142547607} -11/06/2021 21:52:52 - INFO - __main__ - Step 4427: {'lr': 0.0004996685851663477, 'samples': 849984, 'steps': 4426, 'loss/train': 2.1259970664978027} -11/06/2021 21:52:52 - INFO - __main__ - Step 4428: {'lr': 0.0004996683119513274, 'samples': 850176, 'steps': 4427, 'loss/train': 1.6493570804595947} -11/06/2021 21:52:53 - INFO - __main__ - Step 4429: {'lr': 0.0004996680386238103, 'samples': 850368, 'steps': 4428, 'loss/train': 1.9351447820663452} -11/06/2021 21:52:54 - INFO - __main__ - Step 4430: {'lr': 0.0004996677651837967, 'samples': 850560, 'steps': 4429, 'loss/train': 2.663370132446289} -11/06/2021 21:52:54 - INFO - __main__ - Step 4431: {'lr': 0.0004996674916312867, 'samples': 850752, 'steps': 4430, 'loss/train': 2.205284595489502} -11/06/2021 21:52:55 - INFO - __main__ - Step 4432: {'lr': 0.0004996672179662803, 'samples': 850944, 'steps': 4431, 'loss/train': 0.6293364763259888} -11/06/2021 21:52:55 - INFO - __main__ - Step 4433: {'lr': 0.0004996669441887778, 'samples': 851136, 'steps': 4432, 'loss/train': 1.934459924697876} -11/06/2021 21:52:55 - INFO - __main__ - Step 4434: {'lr': 0.0004996666702987791, 'samples': 851328, 'steps': 4433, 'loss/train': 1.715638518333435} -11/06/2021 21:52:56 - INFO - __main__ - Step 4435: {'lr': 0.0004996663962962846, 'samples': 851520, 'steps': 4434, 'loss/train': 2.070112705230713} -11/06/2021 21:52:57 - INFO - __main__ - Step 4436: {'lr': 0.0004996661221812942, 'samples': 851712, 'steps': 4435, 'loss/train': 2.642328977584839} -11/06/2021 21:52:57 - INFO - __main__ - Step 4437: {'lr': 0.0004996658479538081, 'samples': 851904, 'steps': 4436, 'loss/train': 2.1696090698242188} -11/06/2021 21:52:57 - INFO - __main__ - Step 4438: {'lr': 0.0004996655736138265, 'samples': 852096, 'steps': 4437, 'loss/train': 2.149383783340454} -11/06/2021 21:52:58 - INFO - __main__ - Step 4439: {'lr': 0.0004996652991613494, 'samples': 852288, 'steps': 4438, 'loss/train': 1.425952434539795} -11/06/2021 21:52:59 - INFO - __main__ - Step 4440: {'lr': 0.0004996650245963768, 'samples': 852480, 'steps': 4439, 'loss/train': 1.9291316270828247} -11/06/2021 21:53:00 - INFO - __main__ - Step 4441: {'lr': 0.0004996647499189092, 'samples': 852672, 'steps': 4440, 'loss/train': 1.8874024152755737} -11/06/2021 21:53:00 - INFO - __main__ - Step 4442: {'lr': 0.0004996644751289464, 'samples': 852864, 'steps': 4441, 'loss/train': 1.797756552696228} -11/06/2021 21:53:00 - INFO - __main__ - Step 4443: {'lr': 0.0004996642002264887, 'samples': 853056, 'steps': 4442, 'loss/train': 2.348628282546997} -11/06/2021 21:53:01 - INFO - __main__ - Step 4444: {'lr': 0.0004996639252115362, 'samples': 853248, 'steps': 4443, 'loss/train': 1.8861411809921265} -11/06/2021 21:53:01 - INFO - __main__ - Step 4445: {'lr': 0.000499663650084089, 'samples': 853440, 'steps': 4444, 'loss/train': 2.2785558700561523} -11/06/2021 21:53:01 - INFO - __main__ - Step 4446: {'lr': 0.0004996633748441472, 'samples': 853632, 'steps': 4445, 'loss/train': 2.116128444671631} -11/06/2021 21:53:03 - INFO - __main__ - Step 4447: {'lr': 0.0004996630994917108, 'samples': 853824, 'steps': 4446, 'loss/train': 1.9847468137741089} -11/06/2021 21:53:03 - INFO - __main__ - Step 4448: {'lr': 0.0004996628240267802, 'samples': 854016, 'steps': 4447, 'loss/train': 2.634124755859375} -11/06/2021 21:53:03 - INFO - __main__ - Step 4449: {'lr': 0.0004996625484493554, 'samples': 854208, 'steps': 4448, 'loss/train': 1.749208927154541} -11/06/2021 21:53:04 - INFO - __main__ - Step 4450: {'lr': 0.0004996622727594363, 'samples': 854400, 'steps': 4449, 'loss/train': 1.287934422492981} -11/06/2021 21:53:04 - INFO - __main__ - Step 4451: {'lr': 0.0004996619969570234, 'samples': 854592, 'steps': 4450, 'loss/train': 2.1173369884490967} -11/06/2021 21:53:05 - INFO - __main__ - Step 4452: {'lr': 0.0004996617210421166, 'samples': 854784, 'steps': 4451, 'loss/train': 1.4185445308685303} -11/06/2021 21:53:05 - INFO - __main__ - Step 4453: {'lr': 0.0004996614450147161, 'samples': 854976, 'steps': 4452, 'loss/train': 2.3131630420684814} -11/06/2021 21:53:06 - INFO - __main__ - Step 4454: {'lr': 0.0004996611688748221, 'samples': 855168, 'steps': 4453, 'loss/train': 0.5444425940513611} -11/06/2021 21:53:06 - INFO - __main__ - Step 4455: {'lr': 0.0004996608926224345, 'samples': 855360, 'steps': 4454, 'loss/train': 2.0416908264160156} -11/06/2021 21:53:06 - INFO - __main__ - Step 4456: {'lr': 0.0004996606162575536, 'samples': 855552, 'steps': 4455, 'loss/train': 1.4575010538101196} -11/06/2021 21:53:07 - INFO - __main__ - Step 4457: {'lr': 0.0004996603397801795, 'samples': 855744, 'steps': 4456, 'loss/train': 2.1322479248046875} -11/06/2021 21:53:08 - INFO - __main__ - Step 4458: {'lr': 0.0004996600631903123, 'samples': 855936, 'steps': 4457, 'loss/train': 2.1813089847564697} -11/06/2021 21:53:08 - INFO - __main__ - Step 4459: {'lr': 0.0004996597864879521, 'samples': 856128, 'steps': 4458, 'loss/train': 2.2517218589782715} -11/06/2021 21:53:08 - INFO - __main__ - Step 4460: {'lr': 0.000499659509673099, 'samples': 856320, 'steps': 4459, 'loss/train': 2.0033187866210938} -11/06/2021 21:53:09 - INFO - __main__ - Step 4461: {'lr': 0.0004996592327457533, 'samples': 856512, 'steps': 4460, 'loss/train': 1.793095350265503} -11/06/2021 21:53:10 - INFO - __main__ - Step 4462: {'lr': 0.000499658955705915, 'samples': 856704, 'steps': 4461, 'loss/train': 2.264535665512085} -11/06/2021 21:53:10 - INFO - __main__ - Step 4463: {'lr': 0.0004996586785535841, 'samples': 856896, 'steps': 4462, 'loss/train': 2.0258359909057617} -11/06/2021 21:53:11 - INFO - __main__ - Step 4464: {'lr': 0.000499658401288761, 'samples': 857088, 'steps': 4463, 'loss/train': 1.9607642889022827} -11/06/2021 21:53:11 - INFO - __main__ - Step 4465: {'lr': 0.0004996581239114456, 'samples': 857280, 'steps': 4464, 'loss/train': 1.6711504459381104} -11/06/2021 21:53:11 - INFO - __main__ - Step 4466: {'lr': 0.0004996578464216381, 'samples': 857472, 'steps': 4465, 'loss/train': 2.1529288291931152} -11/06/2021 21:53:12 - INFO - __main__ - Step 4467: {'lr': 0.0004996575688193386, 'samples': 857664, 'steps': 4466, 'loss/train': 1.737178087234497} -11/06/2021 21:53:13 - INFO - __main__ - Step 4468: {'lr': 0.0004996572911045473, 'samples': 857856, 'steps': 4467, 'loss/train': 2.233004570007324} -11/06/2021 21:53:13 - INFO - __main__ - Step 4469: {'lr': 0.0004996570132772642, 'samples': 858048, 'steps': 4468, 'loss/train': 1.742701530456543} -11/06/2021 21:53:13 - INFO - __main__ - Step 4470: {'lr': 0.0004996567353374896, 'samples': 858240, 'steps': 4469, 'loss/train': 2.380733013153076} -11/06/2021 21:53:14 - INFO - __main__ - Step 4471: {'lr': 0.0004996564572852235, 'samples': 858432, 'steps': 4470, 'loss/train': 2.0802853107452393} -11/06/2021 21:53:14 - INFO - __main__ - Step 4472: {'lr': 0.000499656179120466, 'samples': 858624, 'steps': 4471, 'loss/train': 1.6092973947525024} -11/06/2021 21:53:15 - INFO - __main__ - Step 4473: {'lr': 0.0004996559008432173, 'samples': 858816, 'steps': 4472, 'loss/train': 3.0951523780822754} -11/06/2021 21:53:16 - INFO - __main__ - Step 4474: {'lr': 0.0004996556224534776, 'samples': 859008, 'steps': 4473, 'loss/train': 2.4669737815856934} -11/06/2021 21:53:16 - INFO - __main__ - Step 4475: {'lr': 0.0004996553439512468, 'samples': 859200, 'steps': 4474, 'loss/train': 2.577219247817993} -11/06/2021 21:53:16 - INFO - __main__ - Step 4476: {'lr': 0.0004996550653365253, 'samples': 859392, 'steps': 4475, 'loss/train': 1.7655971050262451} -11/06/2021 21:53:17 - INFO - __main__ - Step 4477: {'lr': 0.0004996547866093129, 'samples': 859584, 'steps': 4476, 'loss/train': 2.026312828063965} -11/06/2021 21:53:17 - INFO - __main__ - Step 4478: {'lr': 0.00049965450776961, 'samples': 859776, 'steps': 4477, 'loss/train': 2.0732200145721436} -11/06/2021 21:53:18 - INFO - __main__ - Step 4479: {'lr': 0.0004996542288174166, 'samples': 859968, 'steps': 4478, 'loss/train': 2.4320411682128906} -11/06/2021 21:53:18 - INFO - __main__ - Step 4480: {'lr': 0.0004996539497527329, 'samples': 860160, 'steps': 4479, 'loss/train': 1.8877087831497192} -11/06/2021 21:53:19 - INFO - __main__ - Step 4481: {'lr': 0.000499653670575559, 'samples': 860352, 'steps': 4480, 'loss/train': 1.376404047012329} -11/06/2021 21:53:19 - INFO - __main__ - Step 4482: {'lr': 0.0004996533912858949, 'samples': 860544, 'steps': 4481, 'loss/train': 1.817132592201233} -11/06/2021 21:53:19 - INFO - __main__ - Step 4483: {'lr': 0.000499653111883741, 'samples': 860736, 'steps': 4482, 'loss/train': 2.1700544357299805} -11/06/2021 21:53:20 - INFO - __main__ - Step 4484: {'lr': 0.0004996528323690971, 'samples': 860928, 'steps': 4483, 'loss/train': 1.9818646907806396} -11/06/2021 21:53:21 - INFO - __main__ - Step 4485: {'lr': 0.0004996525527419636, 'samples': 861120, 'steps': 4484, 'loss/train': 1.9006667137145996} -11/06/2021 21:53:21 - INFO - __main__ - Step 4486: {'lr': 0.0004996522730023404, 'samples': 861312, 'steps': 4485, 'loss/train': 1.9432722330093384} -11/06/2021 21:53:21 - INFO - __main__ - Step 4487: {'lr': 0.0004996519931502279, 'samples': 861504, 'steps': 4486, 'loss/train': 2.3324050903320312} -11/06/2021 21:53:22 - INFO - __main__ - Step 4488: {'lr': 0.0004996517131856259, 'samples': 861696, 'steps': 4487, 'loss/train': 1.8573492765426636} -11/06/2021 21:53:23 - INFO - __main__ - Step 4489: {'lr': 0.0004996514331085348, 'samples': 861888, 'steps': 4488, 'loss/train': 1.8287177085876465} -11/06/2021 21:53:23 - INFO - __main__ - Step 4490: {'lr': 0.0004996511529189546, 'samples': 862080, 'steps': 4489, 'loss/train': 1.9560521841049194} -11/06/2021 21:53:24 - INFO - __main__ - Step 4491: {'lr': 0.0004996508726168854, 'samples': 862272, 'steps': 4490, 'loss/train': 2.2228381633758545} -11/06/2021 21:53:24 - INFO - __main__ - Step 4492: {'lr': 0.0004996505922023274, 'samples': 862464, 'steps': 4491, 'loss/train': 2.6008143424987793} -11/06/2021 21:53:24 - INFO - __main__ - Step 4493: {'lr': 0.0004996503116752807, 'samples': 862656, 'steps': 4492, 'loss/train': 2.061739206314087} -11/06/2021 21:53:25 - INFO - __main__ - Step 4494: {'lr': 0.0004996500310357454, 'samples': 862848, 'steps': 4493, 'loss/train': 1.7886160612106323} -11/06/2021 21:53:26 - INFO - __main__ - Step 4495: {'lr': 0.0004996497502837217, 'samples': 863040, 'steps': 4494, 'loss/train': 1.68747878074646} -11/06/2021 21:53:26 - INFO - __main__ - Step 4496: {'lr': 0.0004996494694192096, 'samples': 863232, 'steps': 4495, 'loss/train': 1.7942966222763062} -11/06/2021 21:53:26 - INFO - __main__ - Step 4497: {'lr': 0.0004996491884422092, 'samples': 863424, 'steps': 4496, 'loss/train': 2.276155948638916} -11/06/2021 21:53:27 - INFO - __main__ - Step 4498: {'lr': 0.0004996489073527208, 'samples': 863616, 'steps': 4497, 'loss/train': 2.0408365726470947} -11/06/2021 21:53:28 - INFO - __main__ - Step 4499: {'lr': 0.0004996486261507445, 'samples': 863808, 'steps': 4498, 'loss/train': 2.200601816177368} -11/06/2021 21:53:28 - INFO - __main__ - Step 4500: {'lr': 0.0004996483448362805, 'samples': 864000, 'steps': 4499, 'loss/train': 2.0834293365478516} -11/06/2021 21:53:28 - INFO - __main__ - Step 4501: {'lr': 0.0004996480634093287, 'samples': 864192, 'steps': 4500, 'loss/train': 1.751892328262329} -11/06/2021 21:53:29 - INFO - __main__ - Step 4502: {'lr': 0.0004996477818698893, 'samples': 864384, 'steps': 4501, 'loss/train': 2.13613224029541} -11/06/2021 21:53:29 - INFO - __main__ - Step 4503: {'lr': 0.0004996475002179625, 'samples': 864576, 'steps': 4502, 'loss/train': 2.1853764057159424} -11/06/2021 21:53:30 - INFO - __main__ - Step 4504: {'lr': 0.0004996472184535484, 'samples': 864768, 'steps': 4503, 'loss/train': 1.418428659439087} -11/06/2021 21:53:30 - INFO - __main__ - Step 4505: {'lr': 0.0004996469365766471, 'samples': 864960, 'steps': 4504, 'loss/train': 1.7238401174545288} -11/06/2021 21:53:31 - INFO - __main__ - Step 4506: {'lr': 0.0004996466545872588, 'samples': 865152, 'steps': 4505, 'loss/train': 1.999024510383606} -11/06/2021 21:53:31 - INFO - __main__ - Step 4507: {'lr': 0.0004996463724853834, 'samples': 865344, 'steps': 4506, 'loss/train': 2.0768072605133057} -11/06/2021 21:53:31 - INFO - __main__ - Step 4508: {'lr': 0.0004996460902710214, 'samples': 865536, 'steps': 4507, 'loss/train': 1.8393359184265137} -11/06/2021 21:53:32 - INFO - __main__ - Step 4509: {'lr': 0.0004996458079441727, 'samples': 865728, 'steps': 4508, 'loss/train': 1.8585339784622192} -11/06/2021 21:53:33 - INFO - __main__ - Step 4510: {'lr': 0.0004996455255048373, 'samples': 865920, 'steps': 4509, 'loss/train': 1.3014329671859741} -11/06/2021 21:53:33 - INFO - __main__ - Step 4511: {'lr': 0.0004996452429530156, 'samples': 866112, 'steps': 4510, 'loss/train': 2.1434712409973145} -11/06/2021 21:53:33 - INFO - __main__ - Step 4512: {'lr': 0.0004996449602887075, 'samples': 866304, 'steps': 4511, 'loss/train': 1.680091142654419} -11/06/2021 21:53:34 - INFO - __main__ - Step 4513: {'lr': 0.0004996446775119134, 'samples': 866496, 'steps': 4512, 'loss/train': 1.8141558170318604} -11/06/2021 21:53:35 - INFO - __main__ - Step 4514: {'lr': 0.0004996443946226331, 'samples': 866688, 'steps': 4513, 'loss/train': 1.9032708406448364} -11/06/2021 21:53:35 - INFO - __main__ - Step 4515: {'lr': 0.000499644111620867, 'samples': 866880, 'steps': 4514, 'loss/train': 1.6730246543884277} -11/06/2021 21:53:36 - INFO - __main__ - Step 4516: {'lr': 0.000499643828506615, 'samples': 867072, 'steps': 4515, 'loss/train': 2.1784026622772217} -11/06/2021 21:53:36 - INFO - __main__ - Step 4517: {'lr': 0.0004996435452798775, 'samples': 867264, 'steps': 4516, 'loss/train': 1.8776859045028687} -11/06/2021 21:53:36 - INFO - __main__ - Step 4518: {'lr': 0.0004996432619406543, 'samples': 867456, 'steps': 4517, 'loss/train': 2.0420169830322266} -11/06/2021 21:53:37 - INFO - __main__ - Step 4519: {'lr': 0.0004996429784889458, 'samples': 867648, 'steps': 4518, 'loss/train': 2.412881851196289} -11/06/2021 21:53:38 - INFO - __main__ - Step 4520: {'lr': 0.000499642694924752, 'samples': 867840, 'steps': 4519, 'loss/train': 1.9957324266433716} -11/06/2021 21:53:38 - INFO - __main__ - Step 4521: {'lr': 0.000499642411248073, 'samples': 868032, 'steps': 4520, 'loss/train': 1.6232712268829346} -11/06/2021 21:53:38 - INFO - __main__ - Step 4522: {'lr': 0.0004996421274589091, 'samples': 868224, 'steps': 4521, 'loss/train': 2.311401128768921} -11/06/2021 21:53:39 - INFO - __main__ - Step 4523: {'lr': 0.0004996418435572603, 'samples': 868416, 'steps': 4522, 'loss/train': 2.561228036880493} -11/06/2021 21:53:39 - INFO - __main__ - Step 4524: {'lr': 0.0004996415595431267, 'samples': 868608, 'steps': 4523, 'loss/train': 2.3829054832458496} -11/06/2021 21:53:40 - INFO - __main__ - Step 4525: {'lr': 0.0004996412754165084, 'samples': 868800, 'steps': 4524, 'loss/train': 1.9954290390014648} -11/06/2021 21:53:40 - INFO - __main__ - Step 4526: {'lr': 0.0004996409911774056, 'samples': 868992, 'steps': 4525, 'loss/train': 1.9752427339553833} -11/06/2021 21:53:41 - INFO - __main__ - Step 4527: {'lr': 0.0004996407068258186, 'samples': 869184, 'steps': 4526, 'loss/train': 2.2408523559570312} -11/06/2021 21:53:41 - INFO - __main__ - Step 4528: {'lr': 0.0004996404223617471, 'samples': 869376, 'steps': 4527, 'loss/train': 1.6397135257720947} -11/06/2021 21:53:41 - INFO - __main__ - Step 4529: {'lr': 0.0004996401377851917, 'samples': 869568, 'steps': 4528, 'loss/train': 2.1448097229003906} -11/06/2021 21:53:42 - INFO - __main__ - Step 4530: {'lr': 0.0004996398530961522, 'samples': 869760, 'steps': 4529, 'loss/train': 1.8006598949432373} -11/06/2021 21:53:43 - INFO - __main__ - Step 4531: {'lr': 0.0004996395682946288, 'samples': 869952, 'steps': 4530, 'loss/train': 1.2451746463775635} -11/06/2021 21:53:43 - INFO - __main__ - Step 4532: {'lr': 0.0004996392833806217, 'samples': 870144, 'steps': 4531, 'loss/train': 1.7764043807983398} -11/06/2021 21:53:44 - INFO - __main__ - Step 4533: {'lr': 0.000499638998354131, 'samples': 870336, 'steps': 4532, 'loss/train': 2.118048667907715} -11/06/2021 21:53:44 - INFO - __main__ - Step 4534: {'lr': 0.0004996387132151567, 'samples': 870528, 'steps': 4533, 'loss/train': 2.315908908843994} -11/06/2021 21:53:45 - INFO - __main__ - Step 4535: {'lr': 0.0004996384279636993, 'samples': 870720, 'steps': 4534, 'loss/train': 2.341172218322754} -11/06/2021 21:53:45 - INFO - __main__ - Step 4536: {'lr': 0.0004996381425997584, 'samples': 870912, 'steps': 4535, 'loss/train': 2.5195581912994385} -11/06/2021 21:53:46 - INFO - __main__ - Step 4537: {'lr': 0.0004996378571233347, 'samples': 871104, 'steps': 4536, 'loss/train': 2.251058578491211} -11/06/2021 21:53:46 - INFO - __main__ - Step 4538: {'lr': 0.0004996375715344278, 'samples': 871296, 'steps': 4537, 'loss/train': 2.1683661937713623} -11/06/2021 21:53:46 - INFO - __main__ - Step 4539: {'lr': 0.0004996372858330382, 'samples': 871488, 'steps': 4538, 'loss/train': 2.623131275177002} -11/06/2021 21:53:47 - INFO - __main__ - Step 4540: {'lr': 0.0004996370000191657, 'samples': 871680, 'steps': 4539, 'loss/train': 2.218451738357544} -11/06/2021 21:53:48 - INFO - __main__ - Step 4541: {'lr': 0.0004996367140928107, 'samples': 871872, 'steps': 4540, 'loss/train': 2.884366989135742} -11/06/2021 21:53:48 - INFO - __main__ - Step 4542: {'lr': 0.0004996364280539734, 'samples': 872064, 'steps': 4541, 'loss/train': 2.3906033039093018} -11/06/2021 21:53:48 - INFO - __main__ - Step 4543: {'lr': 0.0004996361419026537, 'samples': 872256, 'steps': 4542, 'loss/train': 2.0911548137664795} -11/06/2021 21:53:49 - INFO - __main__ - Step 4544: {'lr': 0.0004996358556388518, 'samples': 872448, 'steps': 4543, 'loss/train': 2.255887269973755} -11/06/2021 21:53:49 - INFO - __main__ - Step 4545: {'lr': 0.0004996355692625678, 'samples': 872640, 'steps': 4544, 'loss/train': 2.3875391483306885} -11/06/2021 21:53:50 - INFO - __main__ - Step 4546: {'lr': 0.0004996352827738018, 'samples': 872832, 'steps': 4545, 'loss/train': 1.9046090841293335} -11/06/2021 21:53:50 - INFO - __main__ - Step 4547: {'lr': 0.0004996349961725542, 'samples': 873024, 'steps': 4546, 'loss/train': 1.6704214811325073} -11/06/2021 21:53:51 - INFO - __main__ - Step 4548: {'lr': 0.0004996347094588247, 'samples': 873216, 'steps': 4547, 'loss/train': 1.5265803337097168} -11/06/2021 21:53:51 - INFO - __main__ - Step 4549: {'lr': 0.0004996344226326137, 'samples': 873408, 'steps': 4548, 'loss/train': 2.1202685832977295} -11/06/2021 21:53:52 - INFO - __main__ - Step 4550: {'lr': 0.0004996341356939214, 'samples': 873600, 'steps': 4549, 'loss/train': 2.068074941635132} -11/06/2021 21:53:53 - INFO - __main__ - Step 4551: {'lr': 0.0004996338486427477, 'samples': 873792, 'steps': 4550, 'loss/train': 2.596259593963623} -11/06/2021 21:53:53 - INFO - __main__ - Step 4552: {'lr': 0.0004996335614790929, 'samples': 873984, 'steps': 4551, 'loss/train': 1.9318180084228516} -11/06/2021 21:53:53 - INFO - __main__ - Step 4553: {'lr': 0.0004996332742029571, 'samples': 874176, 'steps': 4552, 'loss/train': 1.7639127969741821} -11/06/2021 21:53:54 - INFO - __main__ - Step 4554: {'lr': 0.0004996329868143404, 'samples': 874368, 'steps': 4553, 'loss/train': 2.062023639678955} -11/06/2021 21:53:54 - INFO - __main__ - Step 4555: {'lr': 0.0004996326993132428, 'samples': 874560, 'steps': 4554, 'loss/train': 2.341677665710449} -11/06/2021 21:53:55 - INFO - __main__ - Step 4556: {'lr': 0.0004996324116996647, 'samples': 874752, 'steps': 4555, 'loss/train': 1.2803831100463867} -11/06/2021 21:53:55 - INFO - __main__ - Step 4557: {'lr': 0.0004996321239736059, 'samples': 874944, 'steps': 4556, 'loss/train': 1.2265723943710327} -11/06/2021 21:53:56 - INFO - __main__ - Step 4558: {'lr': 0.000499631836135067, 'samples': 875136, 'steps': 4557, 'loss/train': 1.5673511028289795} -11/06/2021 21:53:56 - INFO - __main__ - Step 4559: {'lr': 0.0004996315481840476, 'samples': 875328, 'steps': 4558, 'loss/train': 2.2120308876037598} -11/06/2021 21:53:56 - INFO - __main__ - Step 4560: {'lr': 0.0004996312601205482, 'samples': 875520, 'steps': 4559, 'loss/train': 1.771849513053894} -11/06/2021 21:53:57 - INFO - __main__ - Step 4561: {'lr': 0.0004996309719445687, 'samples': 875712, 'steps': 4560, 'loss/train': 1.6283718347549438} -11/06/2021 21:53:58 - INFO - __main__ - Step 4562: {'lr': 0.0004996306836561094, 'samples': 875904, 'steps': 4561, 'loss/train': 2.1488685607910156} -11/06/2021 21:53:58 - INFO - __main__ - Step 4563: {'lr': 0.0004996303952551704, 'samples': 876096, 'steps': 4562, 'loss/train': 3.6791834831237793} -11/06/2021 21:53:58 - INFO - __main__ - Step 4564: {'lr': 0.0004996301067417517, 'samples': 876288, 'steps': 4563, 'loss/train': 1.914914846420288} -11/06/2021 21:53:59 - INFO - __main__ - Step 4565: {'lr': 0.0004996298181158536, 'samples': 876480, 'steps': 4564, 'loss/train': 2.1919569969177246} -11/06/2021 21:53:59 - INFO - __main__ - Step 4566: {'lr': 0.0004996295293774762, 'samples': 876672, 'steps': 4565, 'loss/train': 2.0341947078704834} -11/06/2021 21:54:00 - INFO - __main__ - Step 4567: {'lr': 0.0004996292405266195, 'samples': 876864, 'steps': 4566, 'loss/train': 3.0565133094787598} -11/06/2021 21:54:01 - INFO - __main__ - Step 4568: {'lr': 0.0004996289515632838, 'samples': 877056, 'steps': 4567, 'loss/train': 1.6455254554748535} -11/06/2021 21:54:01 - INFO - __main__ - Step 4569: {'lr': 0.0004996286624874691, 'samples': 877248, 'steps': 4568, 'loss/train': 2.0319526195526123} -11/06/2021 21:54:01 - INFO - __main__ - Step 4570: {'lr': 0.0004996283732991755, 'samples': 877440, 'steps': 4569, 'loss/train': 2.2277791500091553} -11/06/2021 21:54:02 - INFO - __main__ - Step 4571: {'lr': 0.0004996280839984033, 'samples': 877632, 'steps': 4570, 'loss/train': 1.485971450805664} -11/06/2021 21:54:03 - INFO - __main__ - Step 4572: {'lr': 0.0004996277945851525, 'samples': 877824, 'steps': 4571, 'loss/train': 2.180328369140625} -11/06/2021 21:54:03 - INFO - __main__ - Step 4573: {'lr': 0.0004996275050594233, 'samples': 878016, 'steps': 4572, 'loss/train': 1.8692883253097534} -11/06/2021 21:54:03 - INFO - __main__ - Step 4574: {'lr': 0.0004996272154212158, 'samples': 878208, 'steps': 4573, 'loss/train': 0.9339056611061096} -11/06/2021 21:54:04 - INFO - __main__ - Step 4575: {'lr': 0.0004996269256705301, 'samples': 878400, 'steps': 4574, 'loss/train': 2.103940486907959} -11/06/2021 21:54:04 - INFO - __main__ - Step 4576: {'lr': 0.0004996266358073664, 'samples': 878592, 'steps': 4575, 'loss/train': 1.7924268245697021} -11/06/2021 21:54:05 - INFO - __main__ - Step 4577: {'lr': 0.0004996263458317248, 'samples': 878784, 'steps': 4576, 'loss/train': 1.6914095878601074} -11/06/2021 21:54:05 - INFO - __main__ - Step 4578: {'lr': 0.0004996260557436053, 'samples': 878976, 'steps': 4577, 'loss/train': 1.528101921081543} -11/06/2021 21:54:06 - INFO - __main__ - Step 4579: {'lr': 0.0004996257655430083, 'samples': 879168, 'steps': 4578, 'loss/train': 1.8863238096237183} -11/06/2021 21:54:06 - INFO - __main__ - Step 4580: {'lr': 0.0004996254752299337, 'samples': 879360, 'steps': 4579, 'loss/train': 1.8763165473937988} -11/06/2021 21:54:06 - INFO - __main__ - Step 4581: {'lr': 0.0004996251848043817, 'samples': 879552, 'steps': 4580, 'loss/train': 1.885318636894226} -11/06/2021 21:54:07 - INFO - __main__ - Step 4582: {'lr': 0.0004996248942663525, 'samples': 879744, 'steps': 4581, 'loss/train': 1.8357065916061401} -11/06/2021 21:54:08 - INFO - __main__ - Step 4583: {'lr': 0.000499624603615846, 'samples': 879936, 'steps': 4582, 'loss/train': 1.8866019248962402} -11/06/2021 21:54:08 - INFO - __main__ - Step 4584: {'lr': 0.0004996243128528628, 'samples': 880128, 'steps': 4583, 'loss/train': 2.051255464553833} -11/06/2021 21:54:08 - INFO - __main__ - Step 4585: {'lr': 0.0004996240219774025, 'samples': 880320, 'steps': 4584, 'loss/train': 1.9675004482269287} -11/06/2021 21:54:09 - INFO - __main__ - Step 4586: {'lr': 0.0004996237309894656, 'samples': 880512, 'steps': 4585, 'loss/train': 2.283939838409424} -11/06/2021 21:54:10 - INFO - __main__ - Step 4587: {'lr': 0.0004996234398890521, 'samples': 880704, 'steps': 4586, 'loss/train': 1.3432775735855103} -11/06/2021 21:54:10 - INFO - __main__ - Step 4588: {'lr': 0.000499623148676162, 'samples': 880896, 'steps': 4587, 'loss/train': 2.1022074222564697} -11/06/2021 21:54:10 - INFO - __main__ - Step 4589: {'lr': 0.0004996228573507957, 'samples': 881088, 'steps': 4588, 'loss/train': 2.6343271732330322} -11/06/2021 21:54:11 - INFO - __main__ - Step 4590: {'lr': 0.0004996225659129531, 'samples': 881280, 'steps': 4589, 'loss/train': 1.8193244934082031} -11/06/2021 21:54:11 - INFO - __main__ - Step 4591: {'lr': 0.0004996222743626345, 'samples': 881472, 'steps': 4590, 'loss/train': 2.7049386501312256} -11/06/2021 21:54:12 - INFO - __main__ - Step 4592: {'lr': 0.0004996219826998399, 'samples': 881664, 'steps': 4591, 'loss/train': 2.1974246501922607} -11/06/2021 21:54:13 - INFO - __main__ - Step 4593: {'lr': 0.0004996216909245695, 'samples': 881856, 'steps': 4592, 'loss/train': 2.143535852432251} -11/06/2021 21:54:13 - INFO - __main__ - Step 4594: {'lr': 0.0004996213990368234, 'samples': 882048, 'steps': 4593, 'loss/train': 2.2130115032196045} -11/06/2021 21:54:13 - INFO - __main__ - Step 4595: {'lr': 0.0004996211070366018, 'samples': 882240, 'steps': 4594, 'loss/train': 2.191429376602173} -11/06/2021 21:54:14 - INFO - __main__ - Step 4596: {'lr': 0.0004996208149239047, 'samples': 882432, 'steps': 4595, 'loss/train': 2.114386558532715} -11/06/2021 21:54:14 - INFO - __main__ - Step 4597: {'lr': 0.0004996205226987324, 'samples': 882624, 'steps': 4596, 'loss/train': 1.8462443351745605} -11/06/2021 21:54:15 - INFO - __main__ - Step 4598: {'lr': 0.0004996202303610849, 'samples': 882816, 'steps': 4597, 'loss/train': 1.8497729301452637} -11/06/2021 21:54:15 - INFO - __main__ - Step 4599: {'lr': 0.0004996199379109624, 'samples': 883008, 'steps': 4598, 'loss/train': 1.8294633626937866} -11/06/2021 21:54:16 - INFO - __main__ - Step 4600: {'lr': 0.000499619645348365, 'samples': 883200, 'steps': 4599, 'loss/train': 2.2398879528045654} -11/06/2021 21:54:16 - INFO - __main__ - Step 4601: {'lr': 0.0004996193526732929, 'samples': 883392, 'steps': 4600, 'loss/train': 2.352756977081299} -11/06/2021 21:54:16 - INFO - __main__ - Step 4602: {'lr': 0.0004996190598857461, 'samples': 883584, 'steps': 4601, 'loss/train': 1.9614698886871338} -11/06/2021 21:54:17 - INFO - __main__ - Step 4603: {'lr': 0.0004996187669857247, 'samples': 883776, 'steps': 4602, 'loss/train': 1.7905255556106567} -11/06/2021 21:54:18 - INFO - __main__ - Step 4604: {'lr': 0.0004996184739732291, 'samples': 883968, 'steps': 4603, 'loss/train': 2.1833322048187256} -11/06/2021 21:54:18 - INFO - __main__ - Step 4605: {'lr': 0.0004996181808482592, 'samples': 884160, 'steps': 4604, 'loss/train': 1.840651035308838} -11/06/2021 21:54:18 - INFO - __main__ - Step 4606: {'lr': 0.0004996178876108152, 'samples': 884352, 'steps': 4605, 'loss/train': 1.8321231603622437} -11/06/2021 21:54:19 - INFO - __main__ - Step 4607: {'lr': 0.0004996175942608973, 'samples': 884544, 'steps': 4606, 'loss/train': 2.244662284851074} -11/06/2021 21:54:20 - INFO - __main__ - Step 4608: {'lr': 0.0004996173007985055, 'samples': 884736, 'steps': 4607, 'loss/train': 1.933355689048767} -11/06/2021 21:54:20 - INFO - __main__ - Step 4609: {'lr': 0.00049961700722364, 'samples': 884928, 'steps': 4608, 'loss/train': 1.835882306098938} -11/06/2021 21:54:21 - INFO - __main__ - Step 4610: {'lr': 0.0004996167135363009, 'samples': 885120, 'steps': 4609, 'loss/train': 0.5920076966285706} -11/06/2021 21:54:21 - INFO - __main__ - Step 4611: {'lr': 0.0004996164197364884, 'samples': 885312, 'steps': 4610, 'loss/train': 2.2849209308624268} -11/06/2021 21:54:21 - INFO - __main__ - Step 4612: {'lr': 0.0004996161258242025, 'samples': 885504, 'steps': 4611, 'loss/train': 2.7224349975585938} -11/06/2021 21:54:22 - INFO - __main__ - Step 4613: {'lr': 0.0004996158317994436, 'samples': 885696, 'steps': 4612, 'loss/train': 2.293109893798828} -11/06/2021 21:54:23 - INFO - __main__ - Step 4614: {'lr': 0.0004996155376622115, 'samples': 885888, 'steps': 4613, 'loss/train': 2.077742099761963} -11/06/2021 21:54:23 - INFO - __main__ - Step 4615: {'lr': 0.0004996152434125066, 'samples': 886080, 'steps': 4614, 'loss/train': 2.129293441772461} -11/06/2021 21:54:23 - INFO - __main__ - Step 4616: {'lr': 0.0004996149490503289, 'samples': 886272, 'steps': 4615, 'loss/train': 1.7415257692337036} -11/06/2021 21:54:24 - INFO - __main__ - Step 4617: {'lr': 0.0004996146545756786, 'samples': 886464, 'steps': 4616, 'loss/train': 1.9531595706939697} -11/06/2021 21:54:25 - INFO - __main__ - Step 4618: {'lr': 0.0004996143599885557, 'samples': 886656, 'steps': 4617, 'loss/train': 2.034966468811035} -11/06/2021 21:54:25 - INFO - __main__ - Step 4619: {'lr': 0.0004996140652889603, 'samples': 886848, 'steps': 4618, 'loss/train': 1.855339765548706} -11/06/2021 21:54:25 - INFO - __main__ - Step 4620: {'lr': 0.0004996137704768929, 'samples': 887040, 'steps': 4619, 'loss/train': 2.010745048522949} -11/06/2021 21:54:26 - INFO - __main__ - Step 4621: {'lr': 0.0004996134755523532, 'samples': 887232, 'steps': 4620, 'loss/train': 1.572229027748108} -11/06/2021 21:54:26 - INFO - __main__ - Step 4622: {'lr': 0.0004996131805153417, 'samples': 887424, 'steps': 4621, 'loss/train': 2.434321880340576} -11/06/2021 21:54:27 - INFO - __main__ - Step 4623: {'lr': 0.0004996128853658583, 'samples': 887616, 'steps': 4622, 'loss/train': 1.803308129310608} -11/06/2021 21:54:27 - INFO - __main__ - Step 4624: {'lr': 0.0004996125901039031, 'samples': 887808, 'steps': 4623, 'loss/train': 2.078205108642578} -11/06/2021 21:54:28 - INFO - __main__ - Step 4625: {'lr': 0.0004996122947294764, 'samples': 888000, 'steps': 4624, 'loss/train': 1.3897693157196045} -11/06/2021 21:54:28 - INFO - __main__ - Step 4626: {'lr': 0.0004996119992425782, 'samples': 888192, 'steps': 4625, 'loss/train': 2.1612305641174316} -11/06/2021 21:54:28 - INFO - __main__ - Step 4627: {'lr': 0.0004996117036432087, 'samples': 888384, 'steps': 4626, 'loss/train': 1.204795479774475} -11/06/2021 21:54:29 - INFO - __main__ - Step 4628: {'lr': 0.000499611407931368, 'samples': 888576, 'steps': 4627, 'loss/train': 1.87538480758667} -11/06/2021 21:54:30 - INFO - __main__ - Step 4629: {'lr': 0.0004996111121070562, 'samples': 888768, 'steps': 4628, 'loss/train': 1.9798368215560913} -11/06/2021 21:54:30 - INFO - __main__ - Step 4630: {'lr': 0.0004996108161702736, 'samples': 888960, 'steps': 4629, 'loss/train': 1.8879029750823975} -11/06/2021 21:54:30 - INFO - __main__ - Step 4631: {'lr': 0.0004996105201210202, 'samples': 889152, 'steps': 4630, 'loss/train': 1.498540997505188} -11/06/2021 21:54:31 - INFO - __main__ - Step 4632: {'lr': 0.0004996102239592961, 'samples': 889344, 'steps': 4631, 'loss/train': 2.450267791748047} -11/06/2021 21:54:31 - INFO - __main__ - Step 4633: {'lr': 0.0004996099276851015, 'samples': 889536, 'steps': 4632, 'loss/train': 1.960253357887268} -11/06/2021 21:54:32 - INFO - __main__ - Step 4634: {'lr': 0.0004996096312984365, 'samples': 889728, 'steps': 4633, 'loss/train': 2.13409423828125} -11/06/2021 21:54:33 - INFO - __main__ - Step 4635: {'lr': 0.0004996093347993013, 'samples': 889920, 'steps': 4634, 'loss/train': 2.0862467288970947} -11/06/2021 21:54:33 - INFO - __main__ - Step 4636: {'lr': 0.000499609038187696, 'samples': 890112, 'steps': 4635, 'loss/train': 1.7066518068313599} -11/06/2021 21:54:33 - INFO - __main__ - Step 4637: {'lr': 0.0004996087414636207, 'samples': 890304, 'steps': 4636, 'loss/train': 1.917240858078003} -11/06/2021 21:54:34 - INFO - __main__ - Step 4638: {'lr': 0.0004996084446270755, 'samples': 890496, 'steps': 4637, 'loss/train': 1.5188076496124268} -11/06/2021 21:54:35 - INFO - __main__ - Step 4639: {'lr': 0.0004996081476780607, 'samples': 890688, 'steps': 4638, 'loss/train': 2.3080358505249023} -11/06/2021 21:54:35 - INFO - __main__ - Step 4640: {'lr': 0.0004996078506165762, 'samples': 890880, 'steps': 4639, 'loss/train': 1.5977153778076172} -11/06/2021 21:54:35 - INFO - __main__ - Step 4641: {'lr': 0.0004996075534426222, 'samples': 891072, 'steps': 4640, 'loss/train': 1.9571729898452759} -11/06/2021 21:54:36 - INFO - __main__ - Step 4642: {'lr': 0.000499607256156199, 'samples': 891264, 'steps': 4641, 'loss/train': 1.8053956031799316} -11/06/2021 21:54:36 - INFO - __main__ - Step 4643: {'lr': 0.0004996069587573067, 'samples': 891456, 'steps': 4642, 'loss/train': 1.5705664157867432} -11/06/2021 21:54:37 - INFO - __main__ - Step 4644: {'lr': 0.0004996066612459452, 'samples': 891648, 'steps': 4643, 'loss/train': 1.735826849937439} -11/06/2021 21:54:37 - INFO - __main__ - Step 4645: {'lr': 0.0004996063636221148, 'samples': 891840, 'steps': 4644, 'loss/train': 2.2214009761810303} -11/06/2021 21:54:38 - INFO - __main__ - Step 4646: {'lr': 0.0004996060658858158, 'samples': 892032, 'steps': 4645, 'loss/train': 2.121854305267334} -11/06/2021 21:54:38 - INFO - __main__ - Step 4647: {'lr': 0.000499605768037048, 'samples': 892224, 'steps': 4646, 'loss/train': 2.353457450866699} -11/06/2021 21:54:39 - INFO - __main__ - Step 4648: {'lr': 0.0004996054700758117, 'samples': 892416, 'steps': 4647, 'loss/train': 2.0667355060577393} -11/06/2021 21:54:40 - INFO - __main__ - Step 4649: {'lr': 0.0004996051720021071, 'samples': 892608, 'steps': 4648, 'loss/train': 2.009962558746338} -11/06/2021 21:54:40 - INFO - __main__ - Step 4650: {'lr': 0.0004996048738159342, 'samples': 892800, 'steps': 4649, 'loss/train': 0.5192378163337708} -11/06/2021 21:54:40 - INFO - __main__ - Step 4651: {'lr': 0.0004996045755172932, 'samples': 892992, 'steps': 4650, 'loss/train': 1.84172785282135} -11/06/2021 21:54:41 - INFO - __main__ - Step 4652: {'lr': 0.0004996042771061843, 'samples': 893184, 'steps': 4651, 'loss/train': 2.217998504638672} -11/06/2021 21:54:41 - INFO - __main__ - Step 4653: {'lr': 0.0004996039785826075, 'samples': 893376, 'steps': 4652, 'loss/train': 1.648202657699585} -11/06/2021 21:54:42 - INFO - __main__ - Step 4654: {'lr': 0.000499603679946563, 'samples': 893568, 'steps': 4653, 'loss/train': 2.03910756111145} -11/06/2021 21:54:43 - INFO - __main__ - Step 4655: {'lr': 0.0004996033811980509, 'samples': 893760, 'steps': 4654, 'loss/train': 1.7975298166275024} -11/06/2021 21:54:43 - INFO - __main__ - Step 4656: {'lr': 0.0004996030823370715, 'samples': 893952, 'steps': 4655, 'loss/train': 1.8534296751022339} -11/06/2021 21:54:43 - INFO - __main__ - Step 4657: {'lr': 0.0004996027833636247, 'samples': 894144, 'steps': 4656, 'loss/train': 2.475618600845337} -11/06/2021 21:54:44 - INFO - __main__ - Step 4658: {'lr': 0.0004996024842777106, 'samples': 894336, 'steps': 4657, 'loss/train': 1.9979157447814941} -11/06/2021 21:54:44 - INFO - __main__ - Step 4659: {'lr': 0.0004996021850793297, 'samples': 894528, 'steps': 4658, 'loss/train': 2.030845880508423} -11/06/2021 21:54:45 - INFO - __main__ - Step 4660: {'lr': 0.0004996018857684818, 'samples': 894720, 'steps': 4659, 'loss/train': 2.158336877822876} -11/06/2021 21:54:45 - INFO - __main__ - Step 4661: {'lr': 0.0004996015863451672, 'samples': 894912, 'steps': 4660, 'loss/train': 1.8965908288955688} -11/06/2021 21:54:46 - INFO - __main__ - Step 4662: {'lr': 0.0004996012868093859, 'samples': 895104, 'steps': 4661, 'loss/train': 2.2160189151763916} -11/06/2021 21:54:46 - INFO - __main__ - Step 4663: {'lr': 0.0004996009871611382, 'samples': 895296, 'steps': 4662, 'loss/train': 2.1121556758880615} -11/06/2021 21:54:46 - INFO - __main__ - Step 4664: {'lr': 0.0004996006874004241, 'samples': 895488, 'steps': 4663, 'loss/train': 1.954535961151123} -11/06/2021 21:54:49 - INFO - __main__ - Step 4665: {'lr': 0.0004996003875272438, 'samples': 895680, 'steps': 4664, 'loss/train': 1.9362295866012573} -11/06/2021 21:54:49 - INFO - __main__ - Step 4666: {'lr': 0.0004996000875415973, 'samples': 895872, 'steps': 4665, 'loss/train': 1.841673731803894} -11/06/2021 21:54:50 - INFO - __main__ - Step 4667: {'lr': 0.000499599787443485, 'samples': 896064, 'steps': 4666, 'loss/train': 1.7296624183654785} -11/06/2021 21:54:50 - INFO - __main__ - Step 4668: {'lr': 0.0004995994872329069, 'samples': 896256, 'steps': 4667, 'loss/train': 2.1744236946105957} -11/06/2021 21:54:50 - INFO - __main__ - Step 4669: {'lr': 0.000499599186909863, 'samples': 896448, 'steps': 4668, 'loss/train': 2.424499273300171} -11/06/2021 21:54:51 - INFO - __main__ - Step 4670: {'lr': 0.0004995988864743536, 'samples': 896640, 'steps': 4669, 'loss/train': 2.350759744644165} -11/06/2021 21:54:51 - INFO - __main__ - Step 4671: {'lr': 0.0004995985859263789, 'samples': 896832, 'steps': 4670, 'loss/train': 1.975557804107666} -11/06/2021 21:54:51 - INFO - __main__ - Step 4672: {'lr': 0.0004995982852659388, 'samples': 897024, 'steps': 4671, 'loss/train': 2.1741600036621094} -11/06/2021 21:54:52 - INFO - __main__ - Step 4673: {'lr': 0.0004995979844930336, 'samples': 897216, 'steps': 4672, 'loss/train': 2.133139133453369} -11/06/2021 21:54:53 - INFO - __main__ - Step 4674: {'lr': 0.0004995976836076635, 'samples': 897408, 'steps': 4673, 'loss/train': 2.012343168258667} -11/06/2021 21:54:53 - INFO - __main__ - Step 4675: {'lr': 0.0004995973826098283, 'samples': 897600, 'steps': 4674, 'loss/train': 1.9310002326965332} -11/06/2021 21:54:53 - INFO - __main__ - Step 4676: {'lr': 0.0004995970814995285, 'samples': 897792, 'steps': 4675, 'loss/train': 1.969705581665039} -11/06/2021 21:54:54 - INFO - __main__ - Step 4677: {'lr': 0.0004995967802767641, 'samples': 897984, 'steps': 4676, 'loss/train': 0.5457145571708679} -11/06/2021 21:54:55 - INFO - __main__ - Step 4678: {'lr': 0.0004995964789415353, 'samples': 898176, 'steps': 4677, 'loss/train': 2.1169257164001465} -11/06/2021 21:54:55 - INFO - __main__ - Step 4679: {'lr': 0.0004995961774938423, 'samples': 898368, 'steps': 4678, 'loss/train': 2.047304630279541} -11/06/2021 21:54:56 - INFO - __main__ - Step 4680: {'lr': 0.0004995958759336849, 'samples': 898560, 'steps': 4679, 'loss/train': 2.2334115505218506} -11/06/2021 21:54:56 - INFO - __main__ - Step 4681: {'lr': 0.0004995955742610635, 'samples': 898752, 'steps': 4680, 'loss/train': 1.9930462837219238} -11/06/2021 21:54:56 - INFO - __main__ - Step 4682: {'lr': 0.0004995952724759781, 'samples': 898944, 'steps': 4681, 'loss/train': 2.6837527751922607} -11/06/2021 21:54:57 - INFO - __main__ - Step 4683: {'lr': 0.0004995949705784291, 'samples': 899136, 'steps': 4682, 'loss/train': 2.2613110542297363} -11/06/2021 21:54:58 - INFO - __main__ - Step 4684: {'lr': 0.0004995946685684164, 'samples': 899328, 'steps': 4683, 'loss/train': 1.6057881116867065} -11/06/2021 21:54:58 - INFO - __main__ - Step 4685: {'lr': 0.0004995943664459401, 'samples': 899520, 'steps': 4684, 'loss/train': 4.826809406280518} -11/06/2021 21:54:58 - INFO - __main__ - Step 4686: {'lr': 0.0004995940642110005, 'samples': 899712, 'steps': 4685, 'loss/train': 2.056427478790283} -11/06/2021 21:54:59 - INFO - __main__ - Step 4687: {'lr': 0.0004995937618635977, 'samples': 899904, 'steps': 4686, 'loss/train': 2.5549728870391846} -11/06/2021 21:55:00 - INFO - __main__ - Step 4688: {'lr': 0.0004995934594037316, 'samples': 900096, 'steps': 4687, 'loss/train': 1.6349835395812988} -11/06/2021 21:55:00 - INFO - __main__ - Step 4689: {'lr': 0.0004995931568314028, 'samples': 900288, 'steps': 4688, 'loss/train': 2.1520705223083496} -11/06/2021 21:55:00 - INFO - __main__ - Step 4690: {'lr': 0.0004995928541466111, 'samples': 900480, 'steps': 4689, 'loss/train': 2.086479902267456} -11/06/2021 21:55:01 - INFO - __main__ - Step 4691: {'lr': 0.0004995925513493567, 'samples': 900672, 'steps': 4690, 'loss/train': 2.070526123046875} -11/06/2021 21:55:01 - INFO - __main__ - Step 4692: {'lr': 0.0004995922484396397, 'samples': 900864, 'steps': 4691, 'loss/train': 1.8946828842163086} -11/06/2021 21:55:01 - INFO - __main__ - Step 4693: {'lr': 0.0004995919454174603, 'samples': 901056, 'steps': 4692, 'loss/train': 2.0533816814422607} -11/06/2021 21:55:02 - INFO - __main__ - Step 4694: {'lr': 0.0004995916422828187, 'samples': 901248, 'steps': 4693, 'loss/train': 1.6909483671188354} -11/06/2021 21:55:03 - INFO - __main__ - Step 4695: {'lr': 0.0004995913390357148, 'samples': 901440, 'steps': 4694, 'loss/train': 2.1296300888061523} -11/06/2021 21:55:03 - INFO - __main__ - Step 4696: {'lr': 0.0004995910356761491, 'samples': 901632, 'steps': 4695, 'loss/train': 1.5140820741653442} -11/06/2021 21:55:03 - INFO - __main__ - Step 4697: {'lr': 0.0004995907322041214, 'samples': 901824, 'steps': 4696, 'loss/train': 2.322920560836792} -11/06/2021 21:55:04 - INFO - __main__ - Step 4698: {'lr': 0.000499590428619632, 'samples': 902016, 'steps': 4697, 'loss/train': 1.875250220298767} -11/06/2021 21:55:05 - INFO - __main__ - Step 4699: {'lr': 0.000499590124922681, 'samples': 902208, 'steps': 4698, 'loss/train': 0.6247835159301758} -11/06/2021 21:55:05 - INFO - __main__ - Step 4700: {'lr': 0.0004995898211132685, 'samples': 902400, 'steps': 4699, 'loss/train': 2.233553171157837} -11/06/2021 21:55:06 - INFO - __main__ - Step 4701: {'lr': 0.0004995895171913947, 'samples': 902592, 'steps': 4700, 'loss/train': 2.2635233402252197} -11/06/2021 21:55:06 - INFO - __main__ - Step 4702: {'lr': 0.0004995892131570598, 'samples': 902784, 'steps': 4701, 'loss/train': 1.2235736846923828} -11/06/2021 21:55:06 - INFO - __main__ - Step 4703: {'lr': 0.0004995889090102638, 'samples': 902976, 'steps': 4702, 'loss/train': 1.9816572666168213} -11/06/2021 21:55:07 - INFO - __main__ - Step 4704: {'lr': 0.0004995886047510068, 'samples': 903168, 'steps': 4703, 'loss/train': 2.1657280921936035} -11/06/2021 21:55:08 - INFO - __main__ - Step 4705: {'lr': 0.0004995883003792891, 'samples': 903360, 'steps': 4704, 'loss/train': 2.1573469638824463} -11/06/2021 21:55:08 - INFO - __main__ - Step 4706: {'lr': 0.0004995879958951107, 'samples': 903552, 'steps': 4705, 'loss/train': 1.8357532024383545} -11/06/2021 21:55:08 - INFO - __main__ - Step 4707: {'lr': 0.0004995876912984719, 'samples': 903744, 'steps': 4706, 'loss/train': 2.194171667098999} -11/06/2021 21:55:09 - INFO - __main__ - Step 4708: {'lr': 0.0004995873865893727, 'samples': 903936, 'steps': 4707, 'loss/train': 2.122776985168457} -11/06/2021 21:55:10 - INFO - __main__ - Step 4709: {'lr': 0.0004995870817678133, 'samples': 904128, 'steps': 4708, 'loss/train': 1.9645999670028687} -11/06/2021 21:55:10 - INFO - __main__ - Step 4710: {'lr': 0.0004995867768337938, 'samples': 904320, 'steps': 4709, 'loss/train': 2.073693037033081} -11/06/2021 21:55:10 - INFO - __main__ - Step 4711: {'lr': 0.0004995864717873143, 'samples': 904512, 'steps': 4710, 'loss/train': 1.3138636350631714} -11/06/2021 21:55:11 - INFO - __main__ - Step 4712: {'lr': 0.000499586166628375, 'samples': 904704, 'steps': 4711, 'loss/train': 2.1905508041381836} -11/06/2021 21:55:11 - INFO - __main__ - Step 4713: {'lr': 0.0004995858613569761, 'samples': 904896, 'steps': 4712, 'loss/train': 2.189453363418579} -11/06/2021 21:55:12 - INFO - __main__ - Step 4714: {'lr': 0.0004995855559731176, 'samples': 905088, 'steps': 4713, 'loss/train': 2.266838550567627} -11/06/2021 21:55:12 - INFO - __main__ - Step 4715: {'lr': 0.0004995852504767997, 'samples': 905280, 'steps': 4714, 'loss/train': 2.4359450340270996} -11/06/2021 21:55:13 - INFO - __main__ - Step 4716: {'lr': 0.0004995849448680225, 'samples': 905472, 'steps': 4715, 'loss/train': 2.0849661827087402} -11/06/2021 21:55:13 - INFO - __main__ - Step 4717: {'lr': 0.0004995846391467862, 'samples': 905664, 'steps': 4716, 'loss/train': 2.252028465270996} -11/06/2021 21:55:13 - INFO - __main__ - Step 4718: {'lr': 0.000499584333313091, 'samples': 905856, 'steps': 4717, 'loss/train': 1.7350718975067139} -11/06/2021 21:55:14 - INFO - __main__ - Step 4719: {'lr': 0.0004995840273669369, 'samples': 906048, 'steps': 4718, 'loss/train': 2.1980574131011963} -11/06/2021 21:55:15 - INFO - __main__ - Step 4720: {'lr': 0.0004995837213083241, 'samples': 906240, 'steps': 4719, 'loss/train': 2.655808925628662} -11/06/2021 21:55:15 - INFO - __main__ - Step 4721: {'lr': 0.0004995834151372526, 'samples': 906432, 'steps': 4720, 'loss/train': 1.8203097581863403} -11/06/2021 21:55:16 - INFO - __main__ - Step 4722: {'lr': 0.0004995831088537229, 'samples': 906624, 'steps': 4721, 'loss/train': 1.9288336038589478} -11/06/2021 21:55:16 - INFO - __main__ - Step 4723: {'lr': 0.0004995828024577346, 'samples': 906816, 'steps': 4722, 'loss/train': 2.221000909805298} -11/06/2021 21:55:16 - INFO - __main__ - Step 4724: {'lr': 0.0004995824959492884, 'samples': 907008, 'steps': 4723, 'loss/train': 2.1988742351531982} -11/06/2021 21:55:17 - INFO - __main__ - Step 4725: {'lr': 0.0004995821893283841, 'samples': 907200, 'steps': 4724, 'loss/train': 1.5321357250213623} -11/06/2021 21:55:18 - INFO - __main__ - Step 4726: {'lr': 0.0004995818825950218, 'samples': 907392, 'steps': 4725, 'loss/train': 2.327254295349121} -11/06/2021 21:55:18 - INFO - __main__ - Step 4727: {'lr': 0.0004995815757492019, 'samples': 907584, 'steps': 4726, 'loss/train': 1.697227954864502} -11/06/2021 21:55:18 - INFO - __main__ - Step 4728: {'lr': 0.0004995812687909243, 'samples': 907776, 'steps': 4727, 'loss/train': 1.925517201423645} -11/06/2021 21:55:19 - INFO - __main__ - Step 4729: {'lr': 0.0004995809617201894, 'samples': 907968, 'steps': 4728, 'loss/train': 2.1235063076019287} -11/06/2021 21:55:20 - INFO - __main__ - Step 4730: {'lr': 0.000499580654536997, 'samples': 908160, 'steps': 4729, 'loss/train': 1.6067290306091309} -11/06/2021 21:55:20 - INFO - __main__ - Step 4731: {'lr': 0.0004995803472413474, 'samples': 908352, 'steps': 4730, 'loss/train': 2.062716245651245} -11/06/2021 21:55:21 - INFO - __main__ - Step 4732: {'lr': 0.0004995800398332409, 'samples': 908544, 'steps': 4731, 'loss/train': 2.0088040828704834} -11/06/2021 21:55:21 - INFO - __main__ - Step 4733: {'lr': 0.0004995797323126774, 'samples': 908736, 'steps': 4732, 'loss/train': 2.1273770332336426} -11/06/2021 21:55:21 - INFO - __main__ - Step 4734: {'lr': 0.0004995794246796571, 'samples': 908928, 'steps': 4733, 'loss/train': 1.9056154489517212} -11/06/2021 21:55:22 - INFO - __main__ - Step 4735: {'lr': 0.0004995791169341801, 'samples': 909120, 'steps': 4734, 'loss/train': 1.6100257635116577} -11/06/2021 21:55:23 - INFO - __main__ - Step 4736: {'lr': 0.0004995788090762467, 'samples': 909312, 'steps': 4735, 'loss/train': 1.8864790201187134} -11/06/2021 21:55:23 - INFO - __main__ - Step 4737: {'lr': 0.000499578501105857, 'samples': 909504, 'steps': 4736, 'loss/train': 1.9987335205078125} -11/06/2021 21:55:23 - INFO - __main__ - Step 4738: {'lr': 0.000499578193023011, 'samples': 909696, 'steps': 4737, 'loss/train': 2.262216567993164} -11/06/2021 21:55:24 - INFO - __main__ - Step 4739: {'lr': 0.0004995778848277088, 'samples': 909888, 'steps': 4738, 'loss/train': 1.9893282651901245} -11/06/2021 21:55:24 - INFO - __main__ - Step 4740: {'lr': 0.0004995775765199509, 'samples': 910080, 'steps': 4739, 'loss/train': 2.1088781356811523} -11/06/2021 21:55:25 - INFO - __main__ - Step 4741: {'lr': 0.000499577268099737, 'samples': 910272, 'steps': 4740, 'loss/train': 1.7496652603149414} -11/06/2021 21:55:25 - INFO - __main__ - Step 4742: {'lr': 0.0004995769595670675, 'samples': 910464, 'steps': 4741, 'loss/train': 1.8243907690048218} -11/06/2021 21:55:26 - INFO - __main__ - Step 4743: {'lr': 0.0004995766509219425, 'samples': 910656, 'steps': 4742, 'loss/train': 1.8536678552627563} -11/06/2021 21:55:26 - INFO - __main__ - Step 4744: {'lr': 0.0004995763421643621, 'samples': 910848, 'steps': 4743, 'loss/train': 2.054396152496338} -11/06/2021 21:55:26 - INFO - __main__ - Step 4745: {'lr': 0.0004995760332943264, 'samples': 911040, 'steps': 4744, 'loss/train': 2.0926995277404785} -11/06/2021 21:55:28 - INFO - __main__ - Step 4746: {'lr': 0.0004995757243118356, 'samples': 911232, 'steps': 4745, 'loss/train': 2.342751979827881} -11/06/2021 21:55:28 - INFO - __main__ - Step 4747: {'lr': 0.0004995754152168899, 'samples': 911424, 'steps': 4746, 'loss/train': 1.4246360063552856} -11/06/2021 21:55:28 - INFO - __main__ - Step 4748: {'lr': 0.0004995751060094893, 'samples': 911616, 'steps': 4747, 'loss/train': 1.6921579837799072} -11/06/2021 21:55:29 - INFO - __main__ - Step 4749: {'lr': 0.000499574796689634, 'samples': 911808, 'steps': 4748, 'loss/train': 1.5545167922973633} -11/06/2021 21:55:29 - INFO - __main__ - Step 4750: {'lr': 0.0004995744872573242, 'samples': 912000, 'steps': 4749, 'loss/train': 1.6792792081832886} -11/06/2021 21:55:30 - INFO - __main__ - Step 4751: {'lr': 0.00049957417771256, 'samples': 912192, 'steps': 4750, 'loss/train': 2.301424741744995} -11/06/2021 21:55:31 - INFO - __main__ - Step 4752: {'lr': 0.0004995738680553415, 'samples': 912384, 'steps': 4751, 'loss/train': 2.0780701637268066} -11/06/2021 21:55:31 - INFO - __main__ - Step 4753: {'lr': 0.0004995735582856689, 'samples': 912576, 'steps': 4752, 'loss/train': 2.5025558471679688} -11/06/2021 21:55:31 - INFO - __main__ - Step 4754: {'lr': 0.0004995732484035422, 'samples': 912768, 'steps': 4753, 'loss/train': 1.6821069717407227} -11/06/2021 21:55:32 - INFO - __main__ - Step 4755: {'lr': 0.0004995729384089618, 'samples': 912960, 'steps': 4754, 'loss/train': 1.8580917119979858} -11/06/2021 21:55:32 - INFO - __main__ - Step 4756: {'lr': 0.0004995726283019275, 'samples': 913152, 'steps': 4755, 'loss/train': 5.469394207000732} -11/06/2021 21:55:33 - INFO - __main__ - Step 4757: {'lr': 0.0004995723180824397, 'samples': 913344, 'steps': 4756, 'loss/train': 2.1818153858184814} -11/06/2021 21:55:33 - INFO - __main__ - Step 4758: {'lr': 0.0004995720077504986, 'samples': 913536, 'steps': 4757, 'loss/train': 1.8625547885894775} -11/06/2021 21:55:34 - INFO - __main__ - Step 4759: {'lr': 0.0004995716973061041, 'samples': 913728, 'steps': 4758, 'loss/train': 2.1026546955108643} -11/06/2021 21:55:34 - INFO - __main__ - Step 4760: {'lr': 0.0004995713867492564, 'samples': 913920, 'steps': 4759, 'loss/train': 2.178823471069336} -11/06/2021 21:55:34 - INFO - __main__ - Step 4761: {'lr': 0.0004995710760799557, 'samples': 914112, 'steps': 4760, 'loss/train': 1.872559905052185} -11/06/2021 21:55:36 - INFO - __main__ - Step 4762: {'lr': 0.0004995707652982022, 'samples': 914304, 'steps': 4761, 'loss/train': 1.871140718460083} -11/06/2021 21:55:36 - INFO - __main__ - Step 4763: {'lr': 0.0004995704544039958, 'samples': 914496, 'steps': 4762, 'loss/train': 2.3007659912109375} -11/06/2021 21:55:36 - INFO - __main__ - Step 4764: {'lr': 0.0004995701433973369, 'samples': 914688, 'steps': 4763, 'loss/train': 0.6473186016082764} -11/06/2021 21:55:37 - INFO - __main__ - Step 4765: {'lr': 0.0004995698322782257, 'samples': 914880, 'steps': 4764, 'loss/train': 1.983769416809082} -11/06/2021 21:55:37 - INFO - __main__ - Step 4766: {'lr': 0.0004995695210466619, 'samples': 915072, 'steps': 4765, 'loss/train': 1.983061671257019} -11/06/2021 21:55:37 - INFO - __main__ - Step 4767: {'lr': 0.0004995692097026461, 'samples': 915264, 'steps': 4766, 'loss/train': 1.7104268074035645} -11/06/2021 21:55:38 - INFO - __main__ - Step 4768: {'lr': 0.0004995688982461783, 'samples': 915456, 'steps': 4767, 'loss/train': 2.606029748916626} -11/06/2021 21:55:39 - INFO - __main__ - Step 4769: {'lr': 0.0004995685866772586, 'samples': 915648, 'steps': 4768, 'loss/train': 1.642903447151184} -11/06/2021 21:55:39 - INFO - __main__ - Step 4770: {'lr': 0.000499568274995887, 'samples': 915840, 'steps': 4769, 'loss/train': 2.383634328842163} -11/06/2021 21:55:39 - INFO - __main__ - Step 4771: {'lr': 0.0004995679632020639, 'samples': 916032, 'steps': 4770, 'loss/train': 2.0660829544067383} -11/06/2021 21:55:40 - INFO - __main__ - Step 4772: {'lr': 0.0004995676512957892, 'samples': 916224, 'steps': 4771, 'loss/train': 2.0167953968048096} -11/06/2021 21:55:41 - INFO - __main__ - Step 4773: {'lr': 0.0004995673392770634, 'samples': 916416, 'steps': 4772, 'loss/train': 2.2633042335510254} -11/06/2021 21:55:41 - INFO - __main__ - Step 4774: {'lr': 0.0004995670271458863, 'samples': 916608, 'steps': 4773, 'loss/train': 2.0929172039031982} -11/06/2021 21:55:42 - INFO - __main__ - Step 4775: {'lr': 0.0004995667149022581, 'samples': 916800, 'steps': 4774, 'loss/train': 2.1483800411224365} -11/06/2021 21:55:42 - INFO - __main__ - Step 4776: {'lr': 0.000499566402546179, 'samples': 916992, 'steps': 4775, 'loss/train': 1.7766259908676147} -11/06/2021 21:55:42 - INFO - __main__ - Step 4777: {'lr': 0.0004995660900776491, 'samples': 917184, 'steps': 4776, 'loss/train': 1.8469535112380981} -11/06/2021 21:55:43 - INFO - __main__ - Step 4778: {'lr': 0.0004995657774966686, 'samples': 917376, 'steps': 4777, 'loss/train': 2.0229592323303223} -11/06/2021 21:55:44 - INFO - __main__ - Step 4779: {'lr': 0.0004995654648032377, 'samples': 917568, 'steps': 4778, 'loss/train': 1.3622205257415771} -11/06/2021 21:55:44 - INFO - __main__ - Step 4780: {'lr': 0.0004995651519973563, 'samples': 917760, 'steps': 4779, 'loss/train': 2.1144587993621826} -11/06/2021 21:55:44 - INFO - __main__ - Step 4781: {'lr': 0.0004995648390790249, 'samples': 917952, 'steps': 4780, 'loss/train': 1.954245686531067} -11/06/2021 21:55:45 - INFO - __main__ - Step 4782: {'lr': 0.0004995645260482432, 'samples': 918144, 'steps': 4781, 'loss/train': 2.7569739818573} -11/06/2021 21:55:46 - INFO - __main__ - Step 4783: {'lr': 0.0004995642129050117, 'samples': 918336, 'steps': 4782, 'loss/train': 1.3092371225357056} -11/06/2021 21:55:46 - INFO - __main__ - Step 4784: {'lr': 0.0004995638996493304, 'samples': 918528, 'steps': 4783, 'loss/train': 1.6529567241668701} -11/06/2021 21:55:46 - INFO - __main__ - Step 4785: {'lr': 0.0004995635862811994, 'samples': 918720, 'steps': 4784, 'loss/train': 2.129288911819458} -11/06/2021 21:55:47 - INFO - __main__ - Step 4786: {'lr': 0.000499563272800619, 'samples': 918912, 'steps': 4785, 'loss/train': 2.2793755531311035} -11/06/2021 21:55:47 - INFO - __main__ - Step 4787: {'lr': 0.0004995629592075892, 'samples': 919104, 'steps': 4786, 'loss/train': 2.265683174133301} -11/06/2021 21:55:48 - INFO - __main__ - Step 4788: {'lr': 0.0004995626455021101, 'samples': 919296, 'steps': 4787, 'loss/train': 2.4997894763946533} -11/06/2021 21:55:49 - INFO - __main__ - Step 4789: {'lr': 0.0004995623316841821, 'samples': 919488, 'steps': 4788, 'loss/train': 2.061391592025757} -11/06/2021 21:55:49 - INFO - __main__ - Step 4790: {'lr': 0.0004995620177538051, 'samples': 919680, 'steps': 4789, 'loss/train': 2.428020715713501} -11/06/2021 21:55:50 - INFO - __main__ - Step 4791: {'lr': 0.0004995617037109792, 'samples': 919872, 'steps': 4790, 'loss/train': 1.7995200157165527} -11/06/2021 21:55:50 - INFO - __main__ - Step 4792: {'lr': 0.0004995613895557048, 'samples': 920064, 'steps': 4791, 'loss/train': 1.883157730102539} -11/06/2021 21:55:51 - INFO - __main__ - Step 4793: {'lr': 0.0004995610752879818, 'samples': 920256, 'steps': 4792, 'loss/train': 2.25808048248291} -11/06/2021 21:55:51 - INFO - __main__ - Step 4794: {'lr': 0.0004995607609078104, 'samples': 920448, 'steps': 4793, 'loss/train': 2.118656873703003} -11/06/2021 21:55:52 - INFO - __main__ - Step 4795: {'lr': 0.0004995604464151908, 'samples': 920640, 'steps': 4794, 'loss/train': 2.104627847671509} -11/06/2021 21:55:52 - INFO - __main__ - Step 4796: {'lr': 0.0004995601318101231, 'samples': 920832, 'steps': 4795, 'loss/train': 2.0214784145355225} -11/06/2021 21:55:52 - INFO - __main__ - Step 4797: {'lr': 0.0004995598170926074, 'samples': 921024, 'steps': 4796, 'loss/train': 1.9268819093704224} -11/06/2021 21:55:53 - INFO - __main__ - Step 4798: {'lr': 0.000499559502262644, 'samples': 921216, 'steps': 4797, 'loss/train': 1.5341185331344604} -11/06/2021 21:55:54 - INFO - __main__ - Step 4799: {'lr': 0.000499559187320233, 'samples': 921408, 'steps': 4798, 'loss/train': 2.1940500736236572} -11/06/2021 21:55:54 - INFO - __main__ - Step 4800: {'lr': 0.0004995588722653743, 'samples': 921600, 'steps': 4799, 'loss/train': 1.9055429697036743} -11/06/2021 21:55:54 - INFO - __main__ - Step 4801: {'lr': 0.0004995585570980684, 'samples': 921792, 'steps': 4800, 'loss/train': 2.3950815200805664} -11/06/2021 21:55:55 - INFO - __main__ - Step 4802: {'lr': 0.0004995582418183151, 'samples': 921984, 'steps': 4801, 'loss/train': 1.969565510749817} -11/06/2021 21:55:55 - INFO - __main__ - Step 4803: {'lr': 0.0004995579264261148, 'samples': 922176, 'steps': 4802, 'loss/train': 1.7654180526733398} -11/06/2021 21:55:56 - INFO - __main__ - Step 4804: {'lr': 0.0004995576109214676, 'samples': 922368, 'steps': 4803, 'loss/train': 2.6347360610961914} -11/06/2021 21:55:57 - INFO - __main__ - Step 4805: {'lr': 0.0004995572953043736, 'samples': 922560, 'steps': 4804, 'loss/train': 1.7408865690231323} -11/06/2021 21:55:57 - INFO - __main__ - Step 4806: {'lr': 0.0004995569795748328, 'samples': 922752, 'steps': 4805, 'loss/train': 1.1435315608978271} -11/06/2021 21:55:57 - INFO - __main__ - Step 4807: {'lr': 0.0004995566637328456, 'samples': 922944, 'steps': 4806, 'loss/train': 1.0032495260238647} -11/06/2021 21:55:58 - INFO - __main__ - Step 4808: {'lr': 0.0004995563477784119, 'samples': 923136, 'steps': 4807, 'loss/train': 2.07177472114563} -11/06/2021 21:55:59 - INFO - __main__ - Step 4809: {'lr': 0.000499556031711532, 'samples': 923328, 'steps': 4808, 'loss/train': 2.4952619075775146} -11/06/2021 21:55:59 - INFO - __main__ - Step 4810: {'lr': 0.000499555715532206, 'samples': 923520, 'steps': 4809, 'loss/train': 1.7936309576034546} -11/06/2021 21:55:59 - INFO - __main__ - Step 4811: {'lr': 0.0004995553992404342, 'samples': 923712, 'steps': 4810, 'loss/train': 1.8712501525878906} -11/06/2021 21:56:00 - INFO - __main__ - Step 4812: {'lr': 0.0004995550828362163, 'samples': 923904, 'steps': 4811, 'loss/train': 2.1187033653259277} -11/06/2021 21:56:00 - INFO - __main__ - Step 4813: {'lr': 0.000499554766319553, 'samples': 924096, 'steps': 4812, 'loss/train': 1.8378645181655884} -11/06/2021 21:56:01 - INFO - __main__ - Step 4814: {'lr': 0.0004995544496904441, 'samples': 924288, 'steps': 4813, 'loss/train': 2.4952051639556885} -11/06/2021 21:56:01 - INFO - __main__ - Step 4815: {'lr': 0.0004995541329488897, 'samples': 924480, 'steps': 4814, 'loss/train': 1.766731858253479} -11/06/2021 21:56:02 - INFO - __main__ - Step 4816: {'lr': 0.0004995538160948901, 'samples': 924672, 'steps': 4815, 'loss/train': 1.933300495147705} -11/06/2021 21:56:02 - INFO - __main__ - Step 4817: {'lr': 0.0004995534991284455, 'samples': 924864, 'steps': 4816, 'loss/train': 1.8735243082046509} -11/06/2021 21:56:02 - INFO - __main__ - Step 4818: {'lr': 0.0004995531820495559, 'samples': 925056, 'steps': 4817, 'loss/train': 2.582186460494995} -11/06/2021 21:56:03 - INFO - __main__ - Step 4819: {'lr': 0.0004995528648582214, 'samples': 925248, 'steps': 4818, 'loss/train': 2.391286611557007} -11/06/2021 21:56:04 - INFO - __main__ - Step 4820: {'lr': 0.0004995525475544423, 'samples': 925440, 'steps': 4819, 'loss/train': 2.931082248687744} -11/06/2021 21:56:04 - INFO - __main__ - Step 4821: {'lr': 0.0004995522301382187, 'samples': 925632, 'steps': 4820, 'loss/train': 1.65629243850708} -11/06/2021 21:56:05 - INFO - __main__ - Step 4822: {'lr': 0.0004995519126095506, 'samples': 925824, 'steps': 4821, 'loss/train': 2.3707022666931152} -11/06/2021 21:56:05 - INFO - __main__ - Step 4823: {'lr': 0.0004995515949684384, 'samples': 926016, 'steps': 4822, 'loss/train': 1.6298257112503052} -11/06/2021 21:56:05 - INFO - __main__ - Step 4824: {'lr': 0.000499551277214882, 'samples': 926208, 'steps': 4823, 'loss/train': 1.6904128789901733} -11/06/2021 21:56:06 - INFO - __main__ - Step 4825: {'lr': 0.0004995509593488818, 'samples': 926400, 'steps': 4824, 'loss/train': 2.1001079082489014} -11/06/2021 21:56:07 - INFO - __main__ - Step 4826: {'lr': 0.0004995506413704376, 'samples': 926592, 'steps': 4825, 'loss/train': 1.8763246536254883} -11/06/2021 21:56:07 - INFO - __main__ - Step 4827: {'lr': 0.0004995503232795498, 'samples': 926784, 'steps': 4826, 'loss/train': 1.9993937015533447} -11/06/2021 21:56:07 - INFO - __main__ - Step 4828: {'lr': 0.0004995500050762185, 'samples': 926976, 'steps': 4827, 'loss/train': 2.1457080841064453} -11/06/2021 21:56:08 - INFO - __main__ - Step 4829: {'lr': 0.0004995496867604438, 'samples': 927168, 'steps': 4828, 'loss/train': 1.929814338684082} -11/06/2021 21:56:09 - INFO - __main__ - Step 4830: {'lr': 0.0004995493683322259, 'samples': 927360, 'steps': 4829, 'loss/train': 1.904067873954773} -11/06/2021 21:56:09 - INFO - __main__ - Step 4831: {'lr': 0.0004995490497915649, 'samples': 927552, 'steps': 4830, 'loss/train': 2.4040565490722656} -11/06/2021 21:56:09 - INFO - __main__ - Step 4832: {'lr': 0.0004995487311384609, 'samples': 927744, 'steps': 4831, 'loss/train': 2.00188946723938} -11/06/2021 21:56:10 - INFO - __main__ - Step 4833: {'lr': 0.0004995484123729141, 'samples': 927936, 'steps': 4832, 'loss/train': 2.0301706790924072} -11/06/2021 21:56:10 - INFO - __main__ - Step 4834: {'lr': 0.0004995480934949247, 'samples': 928128, 'steps': 4833, 'loss/train': 1.7859026193618774} -11/06/2021 21:56:11 - INFO - __main__ - Step 4835: {'lr': 0.0004995477745044927, 'samples': 928320, 'steps': 4834, 'loss/train': 1.3403795957565308} -11/06/2021 21:56:12 - INFO - __main__ - Step 4836: {'lr': 0.0004995474554016184, 'samples': 928512, 'steps': 4835, 'loss/train': 2.4826717376708984} -11/06/2021 21:56:12 - INFO - __main__ - Step 4837: {'lr': 0.0004995471361863017, 'samples': 928704, 'steps': 4836, 'loss/train': 2.1667168140411377} -11/06/2021 21:56:12 - INFO - __main__ - Step 4838: {'lr': 0.0004995468168585431, 'samples': 928896, 'steps': 4837, 'loss/train': 1.3020102977752686} -11/06/2021 21:56:13 - INFO - __main__ - Step 4839: {'lr': 0.0004995464974183424, 'samples': 929088, 'steps': 4838, 'loss/train': 2.1668708324432373} -11/06/2021 21:56:14 - INFO - __main__ - Step 4840: {'lr': 0.0004995461778657002, 'samples': 929280, 'steps': 4839, 'loss/train': 1.8353111743927002} -11/06/2021 21:56:14 - INFO - __main__ - Step 4841: {'lr': 0.000499545858200616, 'samples': 929472, 'steps': 4840, 'loss/train': 1.82950758934021} -11/06/2021 21:56:14 - INFO - __main__ - Step 4842: {'lr': 0.0004995455384230904, 'samples': 929664, 'steps': 4841, 'loss/train': 1.8687033653259277} -11/06/2021 21:56:15 - INFO - __main__ - Step 4843: {'lr': 0.0004995452185331235, 'samples': 929856, 'steps': 4842, 'loss/train': 0.33405929803848267} -11/06/2021 21:56:15 - INFO - __main__ - Step 4844: {'lr': 0.0004995448985307153, 'samples': 930048, 'steps': 4843, 'loss/train': 1.0525949001312256} -11/06/2021 21:56:16 - INFO - __main__ - Step 4845: {'lr': 0.0004995445784158661, 'samples': 930240, 'steps': 4844, 'loss/train': 2.037909507751465} -11/06/2021 21:56:16 - INFO - __main__ - Step 4846: {'lr': 0.0004995442581885759, 'samples': 930432, 'steps': 4845, 'loss/train': 1.789475679397583} -11/06/2021 21:56:17 - INFO - __main__ - Step 4847: {'lr': 0.0004995439378488449, 'samples': 930624, 'steps': 4846, 'loss/train': 1.7952702045440674} -11/06/2021 21:56:17 - INFO - __main__ - Step 4848: {'lr': 0.0004995436173966733, 'samples': 930816, 'steps': 4847, 'loss/train': 1.640943169593811} -11/06/2021 21:56:17 - INFO - __main__ - Step 4849: {'lr': 0.0004995432968320611, 'samples': 931008, 'steps': 4848, 'loss/train': 2.3322298526763916} -11/06/2021 21:56:19 - INFO - __main__ - Step 4850: {'lr': 0.0004995429761550086, 'samples': 931200, 'steps': 4849, 'loss/train': 2.3583528995513916} -11/06/2021 21:56:19 - INFO - __main__ - Step 4851: {'lr': 0.0004995426553655159, 'samples': 931392, 'steps': 4850, 'loss/train': 1.6499428749084473} -11/06/2021 21:56:19 - INFO - __main__ - Step 4852: {'lr': 0.0004995423344635831, 'samples': 931584, 'steps': 4851, 'loss/train': 1.9984158277511597} -11/06/2021 21:56:20 - INFO - __main__ - Step 4853: {'lr': 0.0004995420134492105, 'samples': 931776, 'steps': 4852, 'loss/train': 2.299149513244629} -11/06/2021 21:56:20 - INFO - __main__ - Step 4854: {'lr': 0.0004995416923223979, 'samples': 931968, 'steps': 4853, 'loss/train': 2.4122209548950195} -11/06/2021 21:56:20 - INFO - __main__ - Step 4855: {'lr': 0.0004995413710831458, 'samples': 932160, 'steps': 4854, 'loss/train': 2.0572216510772705} -11/06/2021 21:56:21 - INFO - __main__ - Step 4856: {'lr': 0.0004995410497314542, 'samples': 932352, 'steps': 4855, 'loss/train': 1.9187612533569336} -11/06/2021 21:56:22 - INFO - __main__ - Step 4857: {'lr': 0.0004995407282673232, 'samples': 932544, 'steps': 4856, 'loss/train': 1.4883348941802979} -11/06/2021 21:56:22 - INFO - __main__ - Step 4858: {'lr': 0.000499540406690753, 'samples': 932736, 'steps': 4857, 'loss/train': 1.9691627025604248} -11/06/2021 21:56:22 - INFO - __main__ - Step 4859: {'lr': 0.0004995400850017438, 'samples': 932928, 'steps': 4858, 'loss/train': 1.930557131767273} -11/06/2021 21:56:23 - INFO - __main__ - Step 4860: {'lr': 0.0004995397632002957, 'samples': 933120, 'steps': 4859, 'loss/train': 1.965431809425354} -11/06/2021 21:56:24 - INFO - __main__ - Step 4861: {'lr': 0.0004995394412864088, 'samples': 933312, 'steps': 4860, 'loss/train': 1.9139984846115112} -11/06/2021 21:56:24 - INFO - __main__ - Step 4862: {'lr': 0.0004995391192600834, 'samples': 933504, 'steps': 4861, 'loss/train': 2.268007516860962} -11/06/2021 21:56:24 - INFO - __main__ - Step 4863: {'lr': 0.0004995387971213194, 'samples': 933696, 'steps': 4862, 'loss/train': 1.8037782907485962} -11/06/2021 21:56:25 - INFO - __main__ - Step 4864: {'lr': 0.000499538474870117, 'samples': 933888, 'steps': 4863, 'loss/train': 1.7647819519042969} -11/06/2021 21:56:25 - INFO - __main__ - Step 4865: {'lr': 0.0004995381525064765, 'samples': 934080, 'steps': 4864, 'loss/train': 2.0817017555236816} -11/06/2021 21:56:26 - INFO - __main__ - Step 4866: {'lr': 0.0004995378300303979, 'samples': 934272, 'steps': 4865, 'loss/train': 2.1606099605560303} -11/06/2021 21:56:27 - INFO - __main__ - Step 4867: {'lr': 0.0004995375074418815, 'samples': 934464, 'steps': 4866, 'loss/train': 2.0382091999053955} -11/06/2021 21:56:27 - INFO - __main__ - Step 4868: {'lr': 0.0004995371847409273, 'samples': 934656, 'steps': 4867, 'loss/train': 0.9957026243209839} -11/06/2021 21:56:27 - INFO - __main__ - Step 4869: {'lr': 0.0004995368619275355, 'samples': 934848, 'steps': 4868, 'loss/train': 1.8586081266403198} -11/06/2021 21:56:28 - INFO - __main__ - Step 4870: {'lr': 0.0004995365390017062, 'samples': 935040, 'steps': 4869, 'loss/train': 1.3379945755004883} -11/06/2021 21:56:28 - INFO - __main__ - Step 4871: {'lr': 0.0004995362159634396, 'samples': 935232, 'steps': 4870, 'loss/train': 1.8667609691619873} -11/06/2021 21:56:29 - INFO - __main__ - Step 4872: {'lr': 0.0004995358928127359, 'samples': 935424, 'steps': 4871, 'loss/train': 1.3676517009735107} -11/06/2021 21:56:29 - INFO - __main__ - Step 4873: {'lr': 0.0004995355695495952, 'samples': 935616, 'steps': 4872, 'loss/train': 1.948101282119751} -11/06/2021 21:56:30 - INFO - __main__ - Step 4874: {'lr': 0.0004995352461740174, 'samples': 935808, 'steps': 4873, 'loss/train': 1.8517183065414429} -11/06/2021 21:56:30 - INFO - __main__ - Step 4875: {'lr': 0.0004995349226860031, 'samples': 936000, 'steps': 4874, 'loss/train': 1.5299654006958008} -11/06/2021 21:56:30 - INFO - __main__ - Step 4876: {'lr': 0.0004995345990855522, 'samples': 936192, 'steps': 4875, 'loss/train': 2.013723850250244} -11/06/2021 21:56:31 - INFO - __main__ - Step 4877: {'lr': 0.0004995342753726647, 'samples': 936384, 'steps': 4876, 'loss/train': 2.0262885093688965} -11/06/2021 21:56:32 - INFO - __main__ - Step 4878: {'lr': 0.0004995339515473411, 'samples': 936576, 'steps': 4877, 'loss/train': 1.6470019817352295} -11/06/2021 21:56:32 - INFO - __main__ - Step 4879: {'lr': 0.0004995336276095812, 'samples': 936768, 'steps': 4878, 'loss/train': 1.9853967428207397} -11/06/2021 21:56:32 - INFO - __main__ - Step 4880: {'lr': 0.0004995333035593853, 'samples': 936960, 'steps': 4879, 'loss/train': 1.7942310571670532} -11/06/2021 21:56:33 - INFO - __main__ - Step 4881: {'lr': 0.0004995329793967537, 'samples': 937152, 'steps': 4880, 'loss/train': 2.1231250762939453} -11/06/2021 21:56:34 - INFO - __main__ - Step 4882: {'lr': 0.0004995326551216862, 'samples': 937344, 'steps': 4881, 'loss/train': 1.599252700805664} -11/06/2021 21:56:34 - INFO - __main__ - Step 4883: {'lr': 0.0004995323307341832, 'samples': 937536, 'steps': 4882, 'loss/train': 1.833884596824646} -11/06/2021 21:56:34 - INFO - __main__ - Step 4884: {'lr': 0.0004995320062342449, 'samples': 937728, 'steps': 4883, 'loss/train': 1.6169829368591309} -11/06/2021 21:56:35 - INFO - __main__ - Step 4885: {'lr': 0.0004995316816218712, 'samples': 937920, 'steps': 4884, 'loss/train': 2.102433681488037} -11/06/2021 21:56:35 - INFO - __main__ - Step 4886: {'lr': 0.0004995313568970625, 'samples': 938112, 'steps': 4885, 'loss/train': 2.166229724884033} -11/06/2021 21:56:36 - INFO - __main__ - Step 4887: {'lr': 0.0004995310320598187, 'samples': 938304, 'steps': 4886, 'loss/train': 2.130415916442871} -11/06/2021 21:56:36 - INFO - __main__ - Step 4888: {'lr': 0.0004995307071101401, 'samples': 938496, 'steps': 4887, 'loss/train': 2.281303882598877} -11/06/2021 21:56:37 - INFO - __main__ - Step 4889: {'lr': 0.0004995303820480268, 'samples': 938688, 'steps': 4888, 'loss/train': 1.7925283908843994} -11/06/2021 21:56:37 - INFO - __main__ - Step 4890: {'lr': 0.000499530056873479, 'samples': 938880, 'steps': 4889, 'loss/train': 2.1150357723236084} -11/06/2021 21:56:37 - INFO - __main__ - Step 4891: {'lr': 0.0004995297315864968, 'samples': 939072, 'steps': 4890, 'loss/train': 1.8841792345046997} -11/06/2021 21:56:39 - INFO - __main__ - Step 4892: {'lr': 0.0004995294061870802, 'samples': 939264, 'steps': 4891, 'loss/train': 1.9895226955413818} -11/06/2021 21:56:39 - INFO - __main__ - Step 4893: {'lr': 0.0004995290806752297, 'samples': 939456, 'steps': 4892, 'loss/train': 2.05294132232666} -11/06/2021 21:56:39 - INFO - __main__ - Step 4894: {'lr': 0.0004995287550509452, 'samples': 939648, 'steps': 4893, 'loss/train': 1.6693605184555054} -11/06/2021 21:56:40 - INFO - __main__ - Step 4895: {'lr': 0.0004995284293142268, 'samples': 939840, 'steps': 4894, 'loss/train': 2.2964420318603516} -11/06/2021 21:56:40 - INFO - __main__ - Step 4896: {'lr': 0.0004995281034650748, 'samples': 940032, 'steps': 4895, 'loss/train': 2.0679450035095215} -11/06/2021 21:56:41 - INFO - __main__ - Step 4897: {'lr': 0.0004995277775034894, 'samples': 940224, 'steps': 4896, 'loss/train': 1.8550939559936523} -11/06/2021 21:56:41 - INFO - __main__ - Step 4898: {'lr': 0.0004995274514294706, 'samples': 940416, 'steps': 4897, 'loss/train': 1.983759880065918} -11/06/2021 21:56:42 - INFO - __main__ - Step 4899: {'lr': 0.0004995271252430184, 'samples': 940608, 'steps': 4898, 'loss/train': 2.2435123920440674} -11/06/2021 21:56:42 - INFO - __main__ - Step 4900: {'lr': 0.0004995267989441332, 'samples': 940800, 'steps': 4899, 'loss/train': 1.9692909717559814} -11/06/2021 21:56:42 - INFO - __main__ - Step 4901: {'lr': 0.0004995264725328151, 'samples': 940992, 'steps': 4900, 'loss/train': 1.1252635717391968} -11/06/2021 21:56:43 - INFO - __main__ - Step 4902: {'lr': 0.0004995261460090644, 'samples': 941184, 'steps': 4901, 'loss/train': 2.1014087200164795} -11/06/2021 21:56:44 - INFO - __main__ - Step 4903: {'lr': 0.0004995258193728809, 'samples': 941376, 'steps': 4902, 'loss/train': 2.087357521057129} -11/06/2021 21:56:44 - INFO - __main__ - Step 4904: {'lr': 0.0004995254926242649, 'samples': 941568, 'steps': 4903, 'loss/train': 1.3872030973434448} -11/06/2021 21:56:44 - INFO - __main__ - Step 4905: {'lr': 0.0004995251657632165, 'samples': 941760, 'steps': 4904, 'loss/train': 1.6950825452804565} -11/06/2021 21:56:45 - INFO - __main__ - Step 4906: {'lr': 0.000499524838789736, 'samples': 941952, 'steps': 4905, 'loss/train': 2.146413803100586} -11/06/2021 21:56:46 - INFO - __main__ - Step 4907: {'lr': 0.0004995245117038235, 'samples': 942144, 'steps': 4906, 'loss/train': 2.0605762004852295} -11/06/2021 21:56:46 - INFO - __main__ - Step 4908: {'lr': 0.0004995241845054791, 'samples': 942336, 'steps': 4907, 'loss/train': 2.1872684955596924} -11/06/2021 21:56:46 - INFO - __main__ - Step 4909: {'lr': 0.0004995238571947029, 'samples': 942528, 'steps': 4908, 'loss/train': 1.7782576084136963} -11/06/2021 21:56:47 - INFO - __main__ - Step 4910: {'lr': 0.0004995235297714951, 'samples': 942720, 'steps': 4909, 'loss/train': 1.769343614578247} -11/06/2021 21:56:47 - INFO - __main__ - Step 4911: {'lr': 0.0004995232022358559, 'samples': 942912, 'steps': 4910, 'loss/train': 2.6425294876098633} -11/06/2021 21:56:48 - INFO - __main__ - Step 4912: {'lr': 0.0004995228745877853, 'samples': 943104, 'steps': 4911, 'loss/train': 1.9566208124160767} -11/06/2021 21:56:49 - INFO - __main__ - Step 4913: {'lr': 0.0004995225468272836, 'samples': 943296, 'steps': 4912, 'loss/train': 1.9008264541625977} -11/06/2021 21:56:49 - INFO - __main__ - Step 4914: {'lr': 0.0004995222189543509, 'samples': 943488, 'steps': 4913, 'loss/train': 6.304197311401367} -11/06/2021 21:56:49 - INFO - __main__ - Step 4915: {'lr': 0.0004995218909689873, 'samples': 943680, 'steps': 4914, 'loss/train': 1.216681718826294} -11/06/2021 21:56:50 - INFO - __main__ - Step 4916: {'lr': 0.0004995215628711931, 'samples': 943872, 'steps': 4915, 'loss/train': 2.1877267360687256} -11/06/2021 21:56:50 - INFO - __main__ - Step 4917: {'lr': 0.0004995212346609682, 'samples': 944064, 'steps': 4916, 'loss/train': 2.259002923965454} -11/06/2021 21:56:51 - INFO - __main__ - Step 4918: {'lr': 0.0004995209063383129, 'samples': 944256, 'steps': 4917, 'loss/train': 1.607182264328003} -11/06/2021 21:56:51 - INFO - __main__ - Step 4919: {'lr': 0.0004995205779032274, 'samples': 944448, 'steps': 4918, 'loss/train': 2.302341938018799} -11/06/2021 21:56:52 - INFO - __main__ - Step 4920: {'lr': 0.0004995202493557118, 'samples': 944640, 'steps': 4919, 'loss/train': 1.7484567165374756} -11/06/2021 21:56:52 - INFO - __main__ - Step 4921: {'lr': 0.0004995199206957662, 'samples': 944832, 'steps': 4920, 'loss/train': 2.0463926792144775} -11/06/2021 21:56:53 - INFO - __main__ - Step 4922: {'lr': 0.0004995195919233906, 'samples': 945024, 'steps': 4921, 'loss/train': 2.1027209758758545} -11/06/2021 21:56:54 - INFO - __main__ - Step 4923: {'lr': 0.0004995192630385855, 'samples': 945216, 'steps': 4922, 'loss/train': 1.897849678993225} -11/06/2021 21:56:54 - INFO - __main__ - Step 4924: {'lr': 0.0004995189340413509, 'samples': 945408, 'steps': 4923, 'loss/train': 1.5796188116073608} -11/06/2021 21:56:55 - INFO - __main__ - Step 4925: {'lr': 0.0004995186049316868, 'samples': 945600, 'steps': 4924, 'loss/train': 2.1608316898345947} -11/06/2021 21:56:55 - INFO - __main__ - Step 4926: {'lr': 0.0004995182757095935, 'samples': 945792, 'steps': 4925, 'loss/train': 2.3778295516967773} -11/06/2021 21:56:55 - INFO - __main__ - Step 4927: {'lr': 0.0004995179463750712, 'samples': 945984, 'steps': 4926, 'loss/train': 2.6206376552581787} -11/06/2021 21:56:56 - INFO - __main__ - Step 4928: {'lr': 0.0004995176169281199, 'samples': 946176, 'steps': 4927, 'loss/train': 2.371328115463257} -11/06/2021 21:56:57 - INFO - __main__ - Step 4929: {'lr': 0.0004995172873687398, 'samples': 946368, 'steps': 4928, 'loss/train': 2.762335777282715} -11/06/2021 21:56:57 - INFO - __main__ - Step 4930: {'lr': 0.0004995169576969311, 'samples': 946560, 'steps': 4929, 'loss/train': 1.838969349861145} -11/06/2021 21:56:58 - INFO - __main__ - Step 4931: {'lr': 0.0004995166279126938, 'samples': 946752, 'steps': 4930, 'loss/train': 1.8372935056686401} -11/06/2021 21:56:58 - INFO - __main__ - Step 4932: {'lr': 0.0004995162980160283, 'samples': 946944, 'steps': 4931, 'loss/train': 1.7743967771530151} -11/06/2021 21:56:58 - INFO - __main__ - Step 4933: {'lr': 0.0004995159680069346, 'samples': 947136, 'steps': 4932, 'loss/train': 1.8914155960083008} -11/06/2021 21:56:59 - INFO - __main__ - Step 4934: {'lr': 0.0004995156378854127, 'samples': 947328, 'steps': 4933, 'loss/train': 1.7607487440109253} -11/06/2021 21:57:00 - INFO - __main__ - Step 4935: {'lr': 0.000499515307651463, 'samples': 947520, 'steps': 4934, 'loss/train': 2.1030728816986084} -11/06/2021 21:57:00 - INFO - __main__ - Step 4936: {'lr': 0.0004995149773050857, 'samples': 947712, 'steps': 4935, 'loss/train': 2.1479721069335938} -11/06/2021 21:57:01 - INFO - __main__ - Step 4937: {'lr': 0.0004995146468462806, 'samples': 947904, 'steps': 4936, 'loss/train': 1.576684832572937} -11/06/2021 21:57:01 - INFO - __main__ - Step 4938: {'lr': 0.0004995143162750481, 'samples': 948096, 'steps': 4937, 'loss/train': 2.200626850128174} -11/06/2021 21:57:02 - INFO - __main__ - Step 4939: {'lr': 0.0004995139855913883, 'samples': 948288, 'steps': 4938, 'loss/train': 2.6972954273223877} -11/06/2021 21:57:02 - INFO - __main__ - Step 4940: {'lr': 0.0004995136547953014, 'samples': 948480, 'steps': 4939, 'loss/train': 2.025506019592285} -11/06/2021 21:57:02 - INFO - __main__ - Step 4941: {'lr': 0.0004995133238867874, 'samples': 948672, 'steps': 4940, 'loss/train': 2.79832124710083} -11/06/2021 21:57:03 - INFO - __main__ - Step 4942: {'lr': 0.0004995129928658466, 'samples': 948864, 'steps': 4941, 'loss/train': 1.9636731147766113} -11/06/2021 21:57:03 - INFO - __main__ - Step 4943: {'lr': 0.0004995126617324791, 'samples': 949056, 'steps': 4942, 'loss/train': 2.302797317504883} -11/06/2021 21:57:04 - INFO - __main__ - Step 4944: {'lr': 0.000499512330486685, 'samples': 949248, 'steps': 4943, 'loss/train': 1.3910671472549438} -11/06/2021 21:57:05 - INFO - __main__ - Step 4945: {'lr': 0.0004995119991284645, 'samples': 949440, 'steps': 4944, 'loss/train': 1.6283067464828491} -11/06/2021 21:57:05 - INFO - __main__ - Step 4946: {'lr': 0.0004995116676578178, 'samples': 949632, 'steps': 4945, 'loss/train': 2.0636019706726074} -11/06/2021 21:57:05 - INFO - __main__ - Step 4947: {'lr': 0.000499511336074745, 'samples': 949824, 'steps': 4946, 'loss/train': 1.653847575187683} -11/06/2021 21:57:06 - INFO - __main__ - Step 4948: {'lr': 0.0004995110043792462, 'samples': 950016, 'steps': 4947, 'loss/train': 1.9270820617675781} -11/06/2021 21:57:06 - INFO - __main__ - Step 4949: {'lr': 0.0004995106725713217, 'samples': 950208, 'steps': 4948, 'loss/train': 2.0320072174072266} -11/06/2021 21:57:07 - INFO - __main__ - Step 4950: {'lr': 0.0004995103406509713, 'samples': 950400, 'steps': 4949, 'loss/train': 1.9087032079696655} -11/06/2021 21:57:07 - INFO - __main__ - Step 4951: {'lr': 0.0004995100086181957, 'samples': 950592, 'steps': 4950, 'loss/train': 2.294539451599121} -11/06/2021 21:57:08 - INFO - __main__ - Step 4952: {'lr': 0.0004995096764729945, 'samples': 950784, 'steps': 4951, 'loss/train': 1.427341341972351} -11/06/2021 21:57:08 - INFO - __main__ - Step 4953: {'lr': 0.0004995093442153681, 'samples': 950976, 'steps': 4952, 'loss/train': 1.223702073097229} -11/06/2021 21:57:09 - INFO - __main__ - Step 4954: {'lr': 0.0004995090118453167, 'samples': 951168, 'steps': 4953, 'loss/train': 1.9926605224609375} -11/06/2021 21:57:09 - INFO - __main__ - Step 4955: {'lr': 0.0004995086793628405, 'samples': 951360, 'steps': 4954, 'loss/train': 2.119666337966919} -11/06/2021 21:57:10 - INFO - __main__ - Step 4956: {'lr': 0.0004995083467679394, 'samples': 951552, 'steps': 4955, 'loss/train': 1.4242171049118042} -11/06/2021 21:57:10 - INFO - __main__ - Step 4957: {'lr': 0.0004995080140606137, 'samples': 951744, 'steps': 4956, 'loss/train': 2.439540147781372} -11/06/2021 21:57:11 - INFO - __main__ - Step 4958: {'lr': 0.0004995076812408636, 'samples': 951936, 'steps': 4957, 'loss/train': 1.9032562971115112} -11/06/2021 21:57:11 - INFO - __main__ - Step 4959: {'lr': 0.0004995073483086891, 'samples': 952128, 'steps': 4958, 'loss/train': 1.8582649230957031} -11/06/2021 21:57:12 - INFO - __main__ - Step 4960: {'lr': 0.0004995070152640905, 'samples': 952320, 'steps': 4959, 'loss/train': 2.372265100479126} -11/06/2021 21:57:12 - INFO - __main__ - Step 4961: {'lr': 0.0004995066821070679, 'samples': 952512, 'steps': 4960, 'loss/train': 1.438249945640564} -11/06/2021 21:57:13 - INFO - __main__ - Step 4962: {'lr': 0.0004995063488376214, 'samples': 952704, 'steps': 4961, 'loss/train': 2.022662401199341} -11/06/2021 21:57:13 - INFO - __main__ - Step 4963: {'lr': 0.0004995060154557513, 'samples': 952896, 'steps': 4962, 'loss/train': 2.1550307273864746} -11/06/2021 21:57:13 - INFO - __main__ - Step 4964: {'lr': 0.0004995056819614575, 'samples': 953088, 'steps': 4963, 'loss/train': 1.8373814821243286} -11/06/2021 21:57:14 - INFO - __main__ - Step 4965: {'lr': 0.0004995053483547404, 'samples': 953280, 'steps': 4964, 'loss/train': 2.0746841430664062} -11/06/2021 21:57:15 - INFO - __main__ - Step 4966: {'lr': 0.0004995050146355999, 'samples': 953472, 'steps': 4965, 'loss/train': 1.7231754064559937} -11/06/2021 21:57:15 - INFO - __main__ - Step 4967: {'lr': 0.0004995046808040363, 'samples': 953664, 'steps': 4966, 'loss/train': 2.3439464569091797} -11/06/2021 21:57:15 - INFO - __main__ - Step 4968: {'lr': 0.0004995043468600499, 'samples': 953856, 'steps': 4967, 'loss/train': 1.1684303283691406} -11/06/2021 21:57:16 - INFO - __main__ - Step 4969: {'lr': 0.0004995040128036405, 'samples': 954048, 'steps': 4968, 'loss/train': 1.818418264389038} -11/06/2021 21:57:16 - INFO - __main__ - Step 4970: {'lr': 0.0004995036786348086, 'samples': 954240, 'steps': 4969, 'loss/train': 2.059702157974243} -11/06/2021 21:57:17 - INFO - __main__ - Step 4971: {'lr': 0.0004995033443535541, 'samples': 954432, 'steps': 4970, 'loss/train': 1.7052550315856934} -11/06/2021 21:57:17 - INFO - __main__ - Step 4972: {'lr': 0.0004995030099598773, 'samples': 954624, 'steps': 4971, 'loss/train': 2.043684720993042} -11/06/2021 21:57:18 - INFO - __main__ - Step 4973: {'lr': 0.0004995026754537783, 'samples': 954816, 'steps': 4972, 'loss/train': 1.259334683418274} -11/06/2021 21:57:18 - INFO - __main__ - Step 4974: {'lr': 0.0004995023408352572, 'samples': 955008, 'steps': 4973, 'loss/train': 2.089118242263794} -11/06/2021 21:57:18 - INFO - __main__ - Step 4975: {'lr': 0.0004995020061043142, 'samples': 955200, 'steps': 4974, 'loss/train': 2.190615177154541} -11/06/2021 21:57:20 - INFO - __main__ - Step 4976: {'lr': 0.0004995016712609495, 'samples': 955392, 'steps': 4975, 'loss/train': 2.123932361602783} -11/06/2021 21:57:20 - INFO - __main__ - Step 4977: {'lr': 0.0004995013363051631, 'samples': 955584, 'steps': 4976, 'loss/train': 2.357672929763794} -11/06/2021 21:57:20 - INFO - __main__ - Step 4978: {'lr': 0.0004995010012369554, 'samples': 955776, 'steps': 4977, 'loss/train': 2.4011850357055664} -11/06/2021 21:57:21 - INFO - __main__ - Step 4979: {'lr': 0.0004995006660563262, 'samples': 955968, 'steps': 4978, 'loss/train': 2.2604053020477295} -11/06/2021 21:57:21 - INFO - __main__ - Step 4980: {'lr': 0.000499500330763276, 'samples': 956160, 'steps': 4979, 'loss/train': 1.697622537612915} -11/06/2021 21:57:22 - INFO - __main__ - Step 4981: {'lr': 0.0004994999953578048, 'samples': 956352, 'steps': 4980, 'loss/train': 2.418104887008667} -11/06/2021 21:57:22 - INFO - __main__ - Step 4982: {'lr': 0.0004994996598399127, 'samples': 956544, 'steps': 4981, 'loss/train': 1.7995312213897705} -11/06/2021 21:57:23 - INFO - __main__ - Step 4983: {'lr': 0.0004994993242095999, 'samples': 956736, 'steps': 4982, 'loss/train': 1.0818099975585938} -11/06/2021 21:57:23 - INFO - __main__ - Step 4984: {'lr': 0.0004994989884668665, 'samples': 956928, 'steps': 4983, 'loss/train': 1.7262250185012817} -11/06/2021 21:57:23 - INFO - __main__ - Step 4985: {'lr': 0.0004994986526117127, 'samples': 957120, 'steps': 4984, 'loss/train': 1.8972023725509644} -11/06/2021 21:57:24 - INFO - __main__ - Step 4986: {'lr': 0.0004994983166441388, 'samples': 957312, 'steps': 4985, 'loss/train': 1.5889555215835571} -11/06/2021 21:57:25 - INFO - __main__ - Step 4987: {'lr': 0.0004994979805641448, 'samples': 957504, 'steps': 4986, 'loss/train': 2.0608432292938232} -11/06/2021 21:57:25 - INFO - __main__ - Step 4988: {'lr': 0.0004994976443717308, 'samples': 957696, 'steps': 4987, 'loss/train': 2.1303555965423584} -11/06/2021 21:57:25 - INFO - __main__ - Step 4989: {'lr': 0.000499497308066897, 'samples': 957888, 'steps': 4988, 'loss/train': 1.3450038433074951} -11/06/2021 21:57:26 - INFO - __main__ - Step 4990: {'lr': 0.0004994969716496435, 'samples': 958080, 'steps': 4989, 'loss/train': 1.9656953811645508} -11/06/2021 21:57:27 - INFO - __main__ - Step 4991: {'lr': 0.0004994966351199706, 'samples': 958272, 'steps': 4990, 'loss/train': 1.8768229484558105} -11/06/2021 21:57:27 - INFO - __main__ - Step 4992: {'lr': 0.0004994962984778784, 'samples': 958464, 'steps': 4991, 'loss/train': 0.9767778515815735} -11/06/2021 21:57:27 - INFO - __main__ - Step 4993: {'lr': 0.0004994959617233669, 'samples': 958656, 'steps': 4992, 'loss/train': 1.952646255493164} -11/06/2021 21:57:28 - INFO - __main__ - Step 4994: {'lr': 0.0004994956248564364, 'samples': 958848, 'steps': 4993, 'loss/train': 2.012577533721924} -11/06/2021 21:57:28 - INFO - __main__ - Step 4995: {'lr': 0.000499495287877087, 'samples': 959040, 'steps': 4994, 'loss/train': 2.6770846843719482} -11/06/2021 21:57:29 - INFO - __main__ - Step 4996: {'lr': 0.000499494950785319, 'samples': 959232, 'steps': 4995, 'loss/train': 0.9503514766693115} -11/06/2021 21:57:30 - INFO - __main__ - Step 4997: {'lr': 0.0004994946135811324, 'samples': 959424, 'steps': 4996, 'loss/train': 1.3578064441680908} -11/06/2021 21:57:30 - INFO - __main__ - Step 4998: {'lr': 0.0004994942762645274, 'samples': 959616, 'steps': 4997, 'loss/train': 1.6439087390899658} -11/06/2021 21:57:30 - INFO - __main__ - Step 4999: {'lr': 0.000499493938835504, 'samples': 959808, 'steps': 4998, 'loss/train': 1.955640196800232} -11/06/2021 21:57:31 - INFO - __main__ - Step 5000: {'lr': 0.0004994936012940626, 'samples': 960000, 'steps': 4999, 'loss/train': 2.0416653156280518} -11/06/2021 21:57:32 - INFO - __main__ - Step 5001: {'lr': 0.0004994932636402031, 'samples': 960192, 'steps': 5000, 'loss/train': 2.211860418319702} -11/06/2021 21:57:32 - INFO - __main__ - Step 5002: {'lr': 0.000499492925873926, 'samples': 960384, 'steps': 5001, 'loss/train': 2.095062017440796} -11/06/2021 21:57:33 - INFO - __main__ - Step 5003: {'lr': 0.000499492587995231, 'samples': 960576, 'steps': 5002, 'loss/train': 2.049713611602783} -11/06/2021 21:57:33 - INFO - __main__ - Step 5004: {'lr': 0.0004994922500041186, 'samples': 960768, 'steps': 5003, 'loss/train': 1.5910391807556152} -11/06/2021 21:57:33 - INFO - __main__ - Step 5005: {'lr': 0.0004994919119005888, 'samples': 960960, 'steps': 5004, 'loss/train': 2.3668973445892334} -11/06/2021 21:57:34 - INFO - __main__ - Step 5006: {'lr': 0.0004994915736846418, 'samples': 961152, 'steps': 5005, 'loss/train': 2.0674057006835938} -11/06/2021 21:57:35 - INFO - __main__ - Step 5007: {'lr': 0.0004994912353562778, 'samples': 961344, 'steps': 5006, 'loss/train': 2.0364692211151123} -11/06/2021 21:57:35 - INFO - __main__ - Step 5008: {'lr': 0.0004994908969154968, 'samples': 961536, 'steps': 5007, 'loss/train': 1.763395071029663} -11/06/2021 21:57:36 - INFO - __main__ - Step 5009: {'lr': 0.0004994905583622992, 'samples': 961728, 'steps': 5008, 'loss/train': 1.6759827136993408} -11/06/2021 21:57:36 - INFO - __main__ - Step 5010: {'lr': 0.000499490219696685, 'samples': 961920, 'steps': 5009, 'loss/train': 1.3407360315322876} -11/06/2021 21:57:36 - INFO - __main__ - Step 5011: {'lr': 0.0004994898809186542, 'samples': 962112, 'steps': 5010, 'loss/train': 2.153372049331665} -11/06/2021 21:57:37 - INFO - __main__ - Step 5012: {'lr': 0.0004994895420282072, 'samples': 962304, 'steps': 5011, 'loss/train': 2.228909969329834} -11/06/2021 21:57:38 - INFO - __main__ - Step 5013: {'lr': 0.000499489203025344, 'samples': 962496, 'steps': 5012, 'loss/train': 1.8992091417312622} -11/06/2021 21:57:38 - INFO - __main__ - Step 5014: {'lr': 0.000499488863910065, 'samples': 962688, 'steps': 5013, 'loss/train': 1.6911919116973877} -11/06/2021 21:57:38 - INFO - __main__ - Step 5015: {'lr': 0.00049948852468237, 'samples': 962880, 'steps': 5014, 'loss/train': 1.5895403623580933} -11/06/2021 21:57:39 - INFO - __main__ - Step 5016: {'lr': 0.0004994881853422594, 'samples': 963072, 'steps': 5015, 'loss/train': 1.8377931118011475} -11/06/2021 21:57:40 - INFO - __main__ - Step 5017: {'lr': 0.0004994878458897332, 'samples': 963264, 'steps': 5016, 'loss/train': 2.5478765964508057} -11/06/2021 21:57:40 - INFO - __main__ - Step 5018: {'lr': 0.0004994875063247916, 'samples': 963456, 'steps': 5017, 'loss/train': 1.8936893939971924} -11/06/2021 21:57:41 - INFO - __main__ - Step 5019: {'lr': 0.0004994871666474348, 'samples': 963648, 'steps': 5018, 'loss/train': 2.324462890625} -11/06/2021 21:57:41 - INFO - __main__ - Step 5020: {'lr': 0.000499486826857663, 'samples': 963840, 'steps': 5019, 'loss/train': 1.8107075691223145} -11/06/2021 21:57:41 - INFO - __main__ - Step 5021: {'lr': 0.0004994864869554763, 'samples': 964032, 'steps': 5020, 'loss/train': 1.989519476890564} -11/06/2021 21:57:42 - INFO - __main__ - Step 5022: {'lr': 0.0004994861469408748, 'samples': 964224, 'steps': 5021, 'loss/train': 1.991037368774414} -11/06/2021 21:57:43 - INFO - __main__ - Step 5023: {'lr': 0.0004994858068138587, 'samples': 964416, 'steps': 5022, 'loss/train': 1.7982574701309204} -11/06/2021 21:57:43 - INFO - __main__ - Step 5024: {'lr': 0.0004994854665744282, 'samples': 964608, 'steps': 5023, 'loss/train': 2.380490303039551} -11/06/2021 21:57:43 - INFO - __main__ - Step 5025: {'lr': 0.0004994851262225832, 'samples': 964800, 'steps': 5024, 'loss/train': 1.3919230699539185} -11/06/2021 21:57:44 - INFO - __main__ - Step 5026: {'lr': 0.0004994847857583242, 'samples': 964992, 'steps': 5025, 'loss/train': 2.2827370166778564} -11/06/2021 21:57:45 - INFO - __main__ - Step 5027: {'lr': 0.0004994844451816512, 'samples': 965184, 'steps': 5026, 'loss/train': 2.1347203254699707} -11/06/2021 21:57:45 - INFO - __main__ - Step 5028: {'lr': 0.0004994841044925644, 'samples': 965376, 'steps': 5027, 'loss/train': 1.6065678596496582} -11/06/2021 21:57:45 - INFO - __main__ - Step 5029: {'lr': 0.0004994837636910638, 'samples': 965568, 'steps': 5028, 'loss/train': 1.7136719226837158} -11/06/2021 21:57:46 - INFO - __main__ - Step 5030: {'lr': 0.0004994834227771498, 'samples': 965760, 'steps': 5029, 'loss/train': 2.129387617111206} -11/06/2021 21:57:46 - INFO - __main__ - Step 5031: {'lr': 0.0004994830817508224, 'samples': 965952, 'steps': 5030, 'loss/train': 2.3650991916656494} -11/06/2021 21:57:47 - INFO - __main__ - Step 5032: {'lr': 0.0004994827406120816, 'samples': 966144, 'steps': 5031, 'loss/train': 1.8486300706863403} -11/06/2021 21:57:47 - INFO - __main__ - Step 5033: {'lr': 0.0004994823993609279, 'samples': 966336, 'steps': 5032, 'loss/train': 0.8590723872184753} -11/06/2021 21:57:48 - INFO - __main__ - Step 5034: {'lr': 0.0004994820579973612, 'samples': 966528, 'steps': 5033, 'loss/train': 1.7398724555969238} -11/06/2021 21:57:48 - INFO - __main__ - Step 5035: {'lr': 0.0004994817165213817, 'samples': 966720, 'steps': 5034, 'loss/train': 2.0410008430480957} -11/06/2021 21:57:48 - INFO - __main__ - Step 5036: {'lr': 0.0004994813749329897, 'samples': 966912, 'steps': 5035, 'loss/train': 1.631545066833496} -11/06/2021 21:57:50 - INFO - __main__ - Step 5037: {'lr': 0.0004994810332321852, 'samples': 967104, 'steps': 5036, 'loss/train': 1.492642879486084} -11/06/2021 21:57:50 - INFO - __main__ - Step 5038: {'lr': 0.0004994806914189684, 'samples': 967296, 'steps': 5037, 'loss/train': 2.159714460372925} -11/06/2021 21:57:50 - INFO - __main__ - Step 5039: {'lr': 0.0004994803494933394, 'samples': 967488, 'steps': 5038, 'loss/train': 2.5530550479888916} -11/06/2021 21:57:51 - INFO - __main__ - Step 5040: {'lr': 0.0004994800074552985, 'samples': 967680, 'steps': 5039, 'loss/train': 1.7678231000900269} -11/06/2021 21:57:51 - INFO - __main__ - Step 5041: {'lr': 0.0004994796653048457, 'samples': 967872, 'steps': 5040, 'loss/train': 2.178983211517334} -11/06/2021 21:57:51 - INFO - __main__ - Step 5042: {'lr': 0.0004994793230419812, 'samples': 968064, 'steps': 5041, 'loss/train': 2.832493305206299} -11/06/2021 21:57:52 - INFO - __main__ - Step 5043: {'lr': 0.0004994789806667052, 'samples': 968256, 'steps': 5042, 'loss/train': 1.9693965911865234} -11/06/2021 21:57:53 - INFO - __main__ - Step 5044: {'lr': 0.0004994786381790178, 'samples': 968448, 'steps': 5043, 'loss/train': 1.6492239236831665} -11/06/2021 21:57:53 - INFO - __main__ - Step 5045: {'lr': 0.0004994782955789191, 'samples': 968640, 'steps': 5044, 'loss/train': 1.885124683380127} -11/06/2021 21:57:53 - INFO - __main__ - Step 5046: {'lr': 0.0004994779528664095, 'samples': 968832, 'steps': 5045, 'loss/train': 2.0043511390686035} -11/06/2021 21:57:54 - INFO - __main__ - Step 5047: {'lr': 0.0004994776100414888, 'samples': 969024, 'steps': 5046, 'loss/train': 2.129291534423828} -11/06/2021 21:57:55 - INFO - __main__ - Step 5048: {'lr': 0.0004994772671041575, 'samples': 969216, 'steps': 5047, 'loss/train': 2.2023603916168213} -11/06/2021 21:57:55 - INFO - __main__ - Step 5049: {'lr': 0.0004994769240544155, 'samples': 969408, 'steps': 5048, 'loss/train': 2.209613084793091} -11/06/2021 21:57:55 - INFO - __main__ - Step 5050: {'lr': 0.000499476580892263, 'samples': 969600, 'steps': 5049, 'loss/train': 1.4724314212799072} -11/06/2021 21:57:56 - INFO - __main__ - Step 5051: {'lr': 0.0004994762376177004, 'samples': 969792, 'steps': 5050, 'loss/train': 2.012944459915161} -11/06/2021 21:57:56 - INFO - __main__ - Step 5052: {'lr': 0.0004994758942307274, 'samples': 969984, 'steps': 5051, 'loss/train': 1.9832876920700073} -11/06/2021 21:57:57 - INFO - __main__ - Step 5053: {'lr': 0.0004994755507313446, 'samples': 970176, 'steps': 5052, 'loss/train': 2.164370536804199} -11/06/2021 21:57:58 - INFO - __main__ - Step 5054: {'lr': 0.000499475207119552, 'samples': 970368, 'steps': 5053, 'loss/train': 2.118231773376465} -11/06/2021 21:57:58 - INFO - __main__ - Step 5055: {'lr': 0.0004994748633953495, 'samples': 970560, 'steps': 5054, 'loss/train': 1.800482153892517} -11/06/2021 21:57:58 - INFO - __main__ - Step 5056: {'lr': 0.0004994745195587376, 'samples': 970752, 'steps': 5055, 'loss/train': 2.163815975189209} -11/06/2021 21:57:59 - INFO - __main__ - Step 5057: {'lr': 0.0004994741756097164, 'samples': 970944, 'steps': 5056, 'loss/train': 2.414111852645874} -11/06/2021 21:58:00 - INFO - __main__ - Step 5058: {'lr': 0.0004994738315482859, 'samples': 971136, 'steps': 5057, 'loss/train': 1.5080969333648682} -11/06/2021 21:58:00 - INFO - __main__ - Step 5059: {'lr': 0.0004994734873744464, 'samples': 971328, 'steps': 5058, 'loss/train': 2.688166379928589} -11/06/2021 21:58:00 - INFO - __main__ - Step 5060: {'lr': 0.0004994731430881979, 'samples': 971520, 'steps': 5059, 'loss/train': 2.305680990219116} -11/06/2021 21:58:01 - INFO - __main__ - Step 5061: {'lr': 0.0004994727986895408, 'samples': 971712, 'steps': 5060, 'loss/train': 1.9738892316818237} -11/06/2021 21:58:01 - INFO - __main__ - Step 5062: {'lr': 0.0004994724541784749, 'samples': 971904, 'steps': 5061, 'loss/train': 2.3541839122772217} -11/06/2021 21:58:02 - INFO - __main__ - Step 5063: {'lr': 0.0004994721095550008, 'samples': 972096, 'steps': 5062, 'loss/train': 1.869810938835144} -11/06/2021 21:58:02 - INFO - __main__ - Step 5064: {'lr': 0.0004994717648191182, 'samples': 972288, 'steps': 5063, 'loss/train': 1.6675723791122437} -11/06/2021 21:58:03 - INFO - __main__ - Step 5065: {'lr': 0.0004994714199708276, 'samples': 972480, 'steps': 5064, 'loss/train': 0.3723197877407074} -11/06/2021 21:58:03 - INFO - __main__ - Step 5066: {'lr': 0.000499471075010129, 'samples': 972672, 'steps': 5065, 'loss/train': 6.243468761444092} -11/06/2021 21:58:03 - INFO - __main__ - Step 5067: {'lr': 0.0004994707299370226, 'samples': 972864, 'steps': 5066, 'loss/train': 2.330059051513672} -11/06/2021 21:58:04 - INFO - __main__ - Step 5068: {'lr': 0.0004994703847515084, 'samples': 973056, 'steps': 5067, 'loss/train': 1.0603464841842651} -11/06/2021 21:58:05 - INFO - __main__ - Step 5069: {'lr': 0.0004994700394535869, 'samples': 973248, 'steps': 5068, 'loss/train': 2.0306475162506104} -11/06/2021 21:58:05 - INFO - __main__ - Step 5070: {'lr': 0.000499469694043258, 'samples': 973440, 'steps': 5069, 'loss/train': 2.2023260593414307} -11/06/2021 21:58:06 - INFO - __main__ - Step 5071: {'lr': 0.0004994693485205218, 'samples': 973632, 'steps': 5070, 'loss/train': 1.8960644006729126} -11/06/2021 21:58:06 - INFO - __main__ - Step 5072: {'lr': 0.0004994690028853787, 'samples': 973824, 'steps': 5071, 'loss/train': 1.8335449695587158} -11/06/2021 21:58:07 - INFO - __main__ - Step 5073: {'lr': 0.0004994686571378286, 'samples': 974016, 'steps': 5072, 'loss/train': 0.4239940643310547} -11/06/2021 21:58:08 - INFO - __main__ - Step 5074: {'lr': 0.0004994683112778718, 'samples': 974208, 'steps': 5073, 'loss/train': 1.9211030006408691} -11/06/2021 21:58:08 - INFO - __main__ - Step 5075: {'lr': 0.0004994679653055085, 'samples': 974400, 'steps': 5074, 'loss/train': 2.271078109741211} -11/06/2021 21:58:08 - INFO - __main__ - Step 5076: {'lr': 0.0004994676192207387, 'samples': 974592, 'steps': 5075, 'loss/train': 1.9957528114318848} -11/06/2021 21:58:09 - INFO - __main__ - Step 5077: {'lr': 0.0004994672730235626, 'samples': 974784, 'steps': 5076, 'loss/train': 2.396184206008911} -11/06/2021 21:58:09 - INFO - __main__ - Step 5078: {'lr': 0.0004994669267139806, 'samples': 974976, 'steps': 5077, 'loss/train': 2.0437135696411133} -11/06/2021 21:58:10 - INFO - __main__ - Step 5079: {'lr': 0.0004994665802919925, 'samples': 975168, 'steps': 5078, 'loss/train': 2.0462563037872314} -11/06/2021 21:58:11 - INFO - __main__ - Step 5080: {'lr': 0.0004994662337575986, 'samples': 975360, 'steps': 5079, 'loss/train': 2.834306478500366} -11/06/2021 21:58:11 - INFO - __main__ - Step 5081: {'lr': 0.000499465887110799, 'samples': 975552, 'steps': 5080, 'loss/train': 2.6196563243865967} -11/06/2021 21:58:11 - INFO - __main__ - Step 5082: {'lr': 0.0004994655403515941, 'samples': 975744, 'steps': 5081, 'loss/train': 1.8559695482254028} -11/06/2021 21:58:12 - INFO - __main__ - Step 5083: {'lr': 0.0004994651934799837, 'samples': 975936, 'steps': 5082, 'loss/train': 2.3033602237701416} -11/06/2021 21:58:12 - INFO - __main__ - Step 5084: {'lr': 0.0004994648464959683, 'samples': 976128, 'steps': 5083, 'loss/train': 1.8257298469543457} -11/06/2021 21:58:13 - INFO - __main__ - Step 5085: {'lr': 0.0004994644993995478, 'samples': 976320, 'steps': 5084, 'loss/train': 2.538905143737793} -11/06/2021 21:58:13 - INFO - __main__ - Step 5086: {'lr': 0.0004994641521907224, 'samples': 976512, 'steps': 5085, 'loss/train': 2.443490743637085} -11/06/2021 21:58:14 - INFO - __main__ - Step 5087: {'lr': 0.0004994638048694924, 'samples': 976704, 'steps': 5086, 'loss/train': 2.3946332931518555} -11/06/2021 21:58:14 - INFO - __main__ - Step 5088: {'lr': 0.0004994634574358579, 'samples': 976896, 'steps': 5087, 'loss/train': 1.450162649154663} -11/06/2021 21:58:14 - INFO - __main__ - Step 5089: {'lr': 0.0004994631098898188, 'samples': 977088, 'steps': 5088, 'loss/train': 1.5360685586929321} -11/06/2021 21:58:15 - INFO - __main__ - Step 5090: {'lr': 0.0004994627622313757, 'samples': 977280, 'steps': 5089, 'loss/train': 1.8420456647872925} -11/06/2021 21:58:16 - INFO - __main__ - Step 5091: {'lr': 0.0004994624144605284, 'samples': 977472, 'steps': 5090, 'loss/train': 2.4474048614501953} -11/06/2021 21:58:16 - INFO - __main__ - Step 5092: {'lr': 0.0004994620665772772, 'samples': 977664, 'steps': 5091, 'loss/train': 1.8615306615829468} -11/06/2021 21:58:16 - INFO - __main__ - Step 5093: {'lr': 0.0004994617185816222, 'samples': 977856, 'steps': 5092, 'loss/train': 2.000317335128784} -11/06/2021 21:58:17 - INFO - __main__ - Step 5094: {'lr': 0.0004994613704735638, 'samples': 978048, 'steps': 5093, 'loss/train': 2.3359320163726807} -11/06/2021 21:58:18 - INFO - __main__ - Step 5095: {'lr': 0.0004994610222531018, 'samples': 978240, 'steps': 5094, 'loss/train': 2.213413953781128} -11/06/2021 21:58:18 - INFO - __main__ - Step 5096: {'lr': 0.0004994606739202365, 'samples': 978432, 'steps': 5095, 'loss/train': 2.049318552017212} -11/06/2021 21:58:19 - INFO - __main__ - Step 5097: {'lr': 0.0004994603254749681, 'samples': 978624, 'steps': 5096, 'loss/train': 2.276933431625366} -11/06/2021 21:58:19 - INFO - __main__ - Step 5098: {'lr': 0.0004994599769172967, 'samples': 978816, 'steps': 5097, 'loss/train': 2.2054691314697266} -11/06/2021 21:58:19 - INFO - __main__ - Step 5099: {'lr': 0.0004994596282472225, 'samples': 979008, 'steps': 5098, 'loss/train': 1.958910346031189} -11/06/2021 21:58:20 - INFO - __main__ - Step 5100: {'lr': 0.0004994592794647457, 'samples': 979200, 'steps': 5099, 'loss/train': 2.0862319469451904} -11/06/2021 21:58:21 - INFO - __main__ - Step 5101: {'lr': 0.0004994589305698663, 'samples': 979392, 'steps': 5100, 'loss/train': 1.7089622020721436} -11/06/2021 21:58:21 - INFO - __main__ - Step 5102: {'lr': 0.0004994585815625847, 'samples': 979584, 'steps': 5101, 'loss/train': 1.952847957611084} -11/06/2021 21:58:21 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 1.894245982170105} -11/06/2021 21:58:22 - INFO - __main__ - Step 5104: {'lr': 0.0004994578832108148, 'samples': 979968, 'steps': 5103, 'loss/train': 1.3645782470703125} -11/06/2021 21:58:22 - INFO - __main__ - Step 5105: {'lr': 0.000499457533866327, 'samples': 980160, 'steps': 5104, 'loss/train': 2.4554972648620605} -11/06/2021 21:58:23 - INFO - __main__ - Step 5106: {'lr': 0.0004994571844094375, 'samples': 980352, 'steps': 5105, 'loss/train': 2.340075731277466} -11/06/2021 21:58:23 - INFO - __main__ - Step 5107: {'lr': 0.0004994568348401466, 'samples': 980544, 'steps': 5106, 'loss/train': 1.1222628355026245} -11/06/2021 21:58:24 - INFO - __main__ - Step 5108: {'lr': 0.0004994564851584541, 'samples': 980736, 'steps': 5107, 'loss/train': 1.5331889390945435} -11/06/2021 21:58:24 - INFO - __main__ - Step 5109: {'lr': 0.0004994561353643604, 'samples': 980928, 'steps': 5108, 'loss/train': 1.8134424686431885} -11/06/2021 21:58:25 - INFO - __main__ - Step 5110: {'lr': 0.0004994557854578656, 'samples': 981120, 'steps': 5109, 'loss/train': 1.9003137350082397} -11/06/2021 21:58:26 - INFO - __main__ - Step 5111: {'lr': 0.0004994554354389699, 'samples': 981312, 'steps': 5110, 'loss/train': 1.9330469369888306} -11/06/2021 21:58:26 - INFO - __main__ - Step 5112: {'lr': 0.0004994550853076734, 'samples': 981504, 'steps': 5111, 'loss/train': 1.9353581666946411} -11/06/2021 21:58:27 - INFO - __main__ - Step 5113: {'lr': 0.0004994547350639764, 'samples': 981696, 'steps': 5112, 'loss/train': 2.078845500946045} -11/06/2021 21:58:27 - INFO - __main__ - Step 5114: {'lr': 0.0004994543847078787, 'samples': 981888, 'steps': 5113, 'loss/train': 1.3129998445510864} -11/06/2021 21:58:27 - INFO - __main__ - Step 5115: {'lr': 0.000499454034239381, 'samples': 982080, 'steps': 5114, 'loss/train': 1.7932987213134766} -11/06/2021 21:58:28 - INFO - __main__ - Step 5116: {'lr': 0.000499453683658483, 'samples': 982272, 'steps': 5115, 'loss/train': 2.2063400745391846} -11/06/2021 21:58:28 - INFO - __main__ - Step 5117: {'lr': 0.0004994533329651849, 'samples': 982464, 'steps': 5116, 'loss/train': 1.820799469947815} -11/06/2021 21:58:29 - INFO - __main__ - Step 5118: {'lr': 0.0004994529821594872, 'samples': 982656, 'steps': 5117, 'loss/train': 2.5855801105499268} -11/06/2021 21:58:29 - INFO - __main__ - Step 5119: {'lr': 0.0004994526312413897, 'samples': 982848, 'steps': 5118, 'loss/train': 1.6690380573272705} -11/06/2021 21:58:30 - INFO - __main__ - Step 5120: {'lr': 0.0004994522802108927, 'samples': 983040, 'steps': 5119, 'loss/train': 1.896449327468872} -11/06/2021 21:58:30 - INFO - __main__ - Step 5121: {'lr': 0.0004994519290679964, 'samples': 983232, 'steps': 5120, 'loss/train': 1.6968704462051392} -11/06/2021 21:58:31 - INFO - __main__ - Step 5122: {'lr': 0.0004994515778127009, 'samples': 983424, 'steps': 5121, 'loss/train': 1.7569773197174072} -11/06/2021 21:58:31 - INFO - __main__ - Step 5123: {'lr': 0.0004994512264450064, 'samples': 983616, 'steps': 5122, 'loss/train': 2.063852310180664} -11/06/2021 21:58:32 - INFO - __main__ - Step 5124: {'lr': 0.000499450874964913, 'samples': 983808, 'steps': 5123, 'loss/train': 2.1291959285736084} -11/06/2021 21:58:32 - INFO - __main__ - Step 5125: {'lr': 0.000499450523372421, 'samples': 984000, 'steps': 5124, 'loss/train': 2.469874143600464} -11/06/2021 21:58:32 - INFO - __main__ - Step 5126: {'lr': 0.0004994501716675303, 'samples': 984192, 'steps': 5125, 'loss/train': 1.7951209545135498} -11/06/2021 21:58:33 - INFO - __main__ - Step 5127: {'lr': 0.0004994498198502412, 'samples': 984384, 'steps': 5126, 'loss/train': 2.0104482173919678} -11/06/2021 21:58:34 - INFO - __main__ - Step 5128: {'lr': 0.0004994494679205539, 'samples': 984576, 'steps': 5127, 'loss/train': 2.0760858058929443} -11/06/2021 21:58:34 - INFO - __main__ - Step 5129: {'lr': 0.0004994491158784684, 'samples': 984768, 'steps': 5128, 'loss/train': 2.1686079502105713} -11/06/2021 21:58:34 - INFO - __main__ - Step 5130: {'lr': 0.0004994487637239851, 'samples': 984960, 'steps': 5129, 'loss/train': 1.1807832717895508} -11/06/2021 21:58:35 - INFO - __main__ - Step 5131: {'lr': 0.0004994484114571041, 'samples': 985152, 'steps': 5130, 'loss/train': 1.4355896711349487} -11/06/2021 21:58:36 - INFO - __main__ - Step 5132: {'lr': 0.0004994480590778254, 'samples': 985344, 'steps': 5131, 'loss/train': 1.8569763898849487} -11/06/2021 21:58:36 - INFO - __main__ - Step 5133: {'lr': 0.0004994477065861493, 'samples': 985536, 'steps': 5132, 'loss/train': 2.1365954875946045} -11/06/2021 21:58:37 - INFO - __main__ - Step 5134: {'lr': 0.0004994473539820758, 'samples': 985728, 'steps': 5133, 'loss/train': 1.7661622762680054} -11/06/2021 21:58:37 - INFO - __main__ - Step 5135: {'lr': 0.0004994470012656052, 'samples': 985920, 'steps': 5134, 'loss/train': 2.2697160243988037} -11/06/2021 21:58:37 - INFO - __main__ - Step 5136: {'lr': 0.0004994466484367378, 'samples': 986112, 'steps': 5135, 'loss/train': 2.3424150943756104} -11/06/2021 21:58:38 - INFO - __main__ - Step 5137: {'lr': 0.0004994462954954734, 'samples': 986304, 'steps': 5136, 'loss/train': 1.250626564025879} -11/06/2021 21:58:39 - INFO - __main__ - Step 5138: {'lr': 0.0004994459424418125, 'samples': 986496, 'steps': 5137, 'loss/train': 2.22953462600708} -11/06/2021 21:58:39 - INFO - __main__ - Step 5139: {'lr': 0.000499445589275755, 'samples': 986688, 'steps': 5138, 'loss/train': 2.005419969558716} -11/06/2021 21:58:39 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 1.6053614616394043} -11/06/2021 21:58:40 - INFO - __main__ - Step 5141: {'lr': 0.0004994448826064512, 'samples': 987072, 'steps': 5140, 'loss/train': 2.132984161376953} -11/06/2021 21:58:41 - INFO - __main__ - Step 5142: {'lr': 0.0004994445291032053, 'samples': 987264, 'steps': 5141, 'loss/train': 1.4963831901550293} -11/06/2021 21:58:41 - INFO - __main__ - Step 5143: {'lr': 0.0004994441754875634, 'samples': 987456, 'steps': 5142, 'loss/train': 2.0756425857543945} -11/06/2021 21:58:41 - INFO - __main__ - Step 5144: {'lr': 0.0004994438217595259, 'samples': 987648, 'steps': 5143, 'loss/train': 2.1674396991729736} -11/06/2021 21:58:42 - INFO - __main__ - Step 5145: {'lr': 0.0004994434679190928, 'samples': 987840, 'steps': 5144, 'loss/train': 2.1360890865325928} -11/06/2021 21:58:42 - INFO - __main__ - Step 5146: {'lr': 0.0004994431139662643, 'samples': 988032, 'steps': 5145, 'loss/train': 2.855836868286133} -11/06/2021 21:58:43 - INFO - __main__ - Step 5147: {'lr': 0.0004994427599010406, 'samples': 988224, 'steps': 5146, 'loss/train': 2.0516815185546875} -11/06/2021 21:58:44 - INFO - __main__ - Step 5148: {'lr': 0.0004994424057234219, 'samples': 988416, 'steps': 5147, 'loss/train': 1.951188087463379} -11/06/2021 21:58:45 - INFO - __main__ - Step 5149: {'lr': 0.0004994420514334082, 'samples': 988608, 'steps': 5148, 'loss/train': 1.9776523113250732} -11/06/2021 21:58:45 - INFO - __main__ - Step 5150: {'lr': 0.0004994416970309999, 'samples': 988800, 'steps': 5149, 'loss/train': 2.2853457927703857} -11/06/2021 21:58:45 - INFO - __main__ - Step 5151: {'lr': 0.0004994413425161969, 'samples': 988992, 'steps': 5150, 'loss/train': 1.2515465021133423} -11/06/2021 21:58:46 - INFO - __main__ - Step 5152: {'lr': 0.0004994409878889995, 'samples': 989184, 'steps': 5151, 'loss/train': 1.107923984527588} -11/06/2021 21:58:46 - INFO - __main__ - Step 5153: {'lr': 0.0004994406331494079, 'samples': 989376, 'steps': 5152, 'loss/train': 0.8732290267944336} -11/06/2021 21:58:47 - INFO - __main__ - Step 5154: {'lr': 0.0004994402782974222, 'samples': 989568, 'steps': 5153, 'loss/train': 1.9641544818878174} -11/06/2021 21:58:47 - INFO - __main__ - Step 5155: {'lr': 0.0004994399233330426, 'samples': 989760, 'steps': 5154, 'loss/train': 2.2096810340881348} -11/06/2021 21:58:48 - INFO - __main__ - Step 5156: {'lr': 0.000499439568256269, 'samples': 989952, 'steps': 5155, 'loss/train': 1.8779668807983398} -11/06/2021 21:58:48 - INFO - __main__ - Step 5157: {'lr': 0.000499439213067102, 'samples': 990144, 'steps': 5156, 'loss/train': 2.0117697715759277} -11/06/2021 21:58:48 - INFO - __main__ - Step 5158: {'lr': 0.0004994388577655415, 'samples': 990336, 'steps': 5157, 'loss/train': 1.9738129377365112} -11/06/2021 21:58:49 - INFO - __main__ - Step 5159: {'lr': 0.0004994385023515876, 'samples': 990528, 'steps': 5158, 'loss/train': 2.6475677490234375} -11/06/2021 21:58:50 - INFO - __main__ - Step 5160: {'lr': 0.0004994381468252406, 'samples': 990720, 'steps': 5159, 'loss/train': 2.463541269302368} -11/06/2021 21:58:50 - INFO - __main__ - Step 5161: {'lr': 0.0004994377911865007, 'samples': 990912, 'steps': 5160, 'loss/train': 2.4826114177703857} -11/06/2021 21:58:51 - INFO - __main__ - Step 5162: {'lr': 0.0004994374354353679, 'samples': 991104, 'steps': 5161, 'loss/train': 2.0047404766082764} -11/06/2021 21:58:51 - INFO - __main__ - Step 5163: {'lr': 0.0004994370795718425, 'samples': 991296, 'steps': 5162, 'loss/train': 2.0610859394073486} -11/06/2021 21:58:51 - INFO - __main__ - Step 5164: {'lr': 0.0004994367235959245, 'samples': 991488, 'steps': 5163, 'loss/train': 1.4020670652389526} -11/06/2021 21:58:52 - INFO - __main__ - Step 5165: {'lr': 0.0004994363675076143, 'samples': 991680, 'steps': 5164, 'loss/train': 1.8617390394210815} -11/06/2021 21:58:53 - INFO - __main__ - Step 5166: {'lr': 0.0004994360113069118, 'samples': 991872, 'steps': 5165, 'loss/train': 2.2617647647857666} -11/06/2021 21:58:53 - INFO - __main__ - Step 5167: {'lr': 0.0004994356549938173, 'samples': 992064, 'steps': 5166, 'loss/train': 2.5071494579315186} -11/06/2021 21:58:53 - INFO - __main__ - Step 5168: {'lr': 0.000499435298568331, 'samples': 992256, 'steps': 5167, 'loss/train': 2.4085593223571777} -11/06/2021 21:58:54 - INFO - __main__ - Step 5169: {'lr': 0.000499434942030453, 'samples': 992448, 'steps': 5168, 'loss/train': 1.7436469793319702} -11/06/2021 21:58:55 - INFO - __main__ - Step 5170: {'lr': 0.0004994345853801834, 'samples': 992640, 'steps': 5169, 'loss/train': 1.887163758277893} -11/06/2021 21:58:55 - INFO - __main__ - Step 5171: {'lr': 0.0004994342286175225, 'samples': 992832, 'steps': 5170, 'loss/train': 1.4238390922546387} -11/06/2021 21:58:56 - INFO - __main__ - Step 5172: {'lr': 0.0004994338717424704, 'samples': 993024, 'steps': 5171, 'loss/train': 1.6073421239852905} -11/06/2021 21:58:56 - INFO - __main__ - Step 5173: {'lr': 0.0004994335147550272, 'samples': 993216, 'steps': 5172, 'loss/train': 2.328388214111328} -11/06/2021 21:58:56 - INFO - __main__ - Step 5174: {'lr': 0.0004994331576551931, 'samples': 993408, 'steps': 5173, 'loss/train': 2.2518372535705566} -11/06/2021 21:58:57 - INFO - __main__ - Step 5175: {'lr': 0.0004994328004429683, 'samples': 993600, 'steps': 5174, 'loss/train': 1.5607566833496094} -11/06/2021 21:58:58 - INFO - __main__ - Step 5176: {'lr': 0.000499432443118353, 'samples': 993792, 'steps': 5175, 'loss/train': 2.3936564922332764} -11/06/2021 21:58:58 - INFO - __main__ - Step 5177: {'lr': 0.0004994320856813471, 'samples': 993984, 'steps': 5176, 'loss/train': 1.8367432355880737} -11/06/2021 21:58:58 - INFO - __main__ - Step 5178: {'lr': 0.000499431728131951, 'samples': 994176, 'steps': 5177, 'loss/train': 1.9661235809326172} -11/06/2021 21:58:59 - INFO - __main__ - Step 5179: {'lr': 0.0004994313704701648, 'samples': 994368, 'steps': 5178, 'loss/train': 2.193740129470825} -11/06/2021 21:59:00 - INFO - __main__ - Step 5180: {'lr': 0.0004994310126959887, 'samples': 994560, 'steps': 5179, 'loss/train': 1.998255968093872} -11/06/2021 21:59:00 - INFO - __main__ - Step 5181: {'lr': 0.000499430654809423, 'samples': 994752, 'steps': 5180, 'loss/train': 2.1848907470703125} -11/06/2021 21:59:00 - INFO - __main__ - Step 5182: {'lr': 0.0004994302968104675, 'samples': 994944, 'steps': 5181, 'loss/train': 2.1371874809265137} -11/06/2021 21:59:01 - INFO - __main__ - Step 5183: {'lr': 0.0004994299386991227, 'samples': 995136, 'steps': 5182, 'loss/train': 2.302549362182617} -11/06/2021 21:59:01 - INFO - __main__ - Step 5184: {'lr': 0.0004994295804753885, 'samples': 995328, 'steps': 5183, 'loss/train': 1.9894294738769531} -11/06/2021 21:59:02 - INFO - __main__ - Step 5185: {'lr': 0.0004994292221392652, 'samples': 995520, 'steps': 5184, 'loss/train': 2.0415422916412354} -11/06/2021 21:59:02 - INFO - __main__ - Step 5186: {'lr': 0.000499428863690753, 'samples': 995712, 'steps': 5185, 'loss/train': 2.606383800506592} -11/06/2021 21:59:03 - INFO - __main__ - Step 5187: {'lr': 0.0004994285051298519, 'samples': 995904, 'steps': 5186, 'loss/train': 2.254190444946289} -11/06/2021 21:59:03 - INFO - __main__ - Step 5188: {'lr': 0.0004994281464565623, 'samples': 996096, 'steps': 5187, 'loss/train': 1.9112964868545532} -11/06/2021 21:59:03 - INFO - __main__ - Step 5189: {'lr': 0.0004994277876708841, 'samples': 996288, 'steps': 5188, 'loss/train': 1.7943540811538696} -11/06/2021 21:59:05 - INFO - __main__ - Step 5190: {'lr': 0.0004994274287728177, 'samples': 996480, 'steps': 5189, 'loss/train': 2.0679004192352295} -11/06/2021 21:59:05 - INFO - __main__ - Step 5191: {'lr': 0.0004994270697623631, 'samples': 996672, 'steps': 5190, 'loss/train': 1.3824659585952759} -11/06/2021 21:59:06 - INFO - __main__ - Step 5192: {'lr': 0.0004994267106395205, 'samples': 996864, 'steps': 5191, 'loss/train': 1.7324517965316772} -11/06/2021 21:59:06 - INFO - __main__ - Step 5193: {'lr': 0.0004994263514042901, 'samples': 997056, 'steps': 5192, 'loss/train': 0.9526032209396362} -11/06/2021 21:59:06 - INFO - __main__ - Step 5194: {'lr': 0.0004994259920566719, 'samples': 997248, 'steps': 5193, 'loss/train': 0.5770443677902222} -11/06/2021 21:59:07 - INFO - __main__ - Step 5195: {'lr': 0.0004994256325966663, 'samples': 997440, 'steps': 5194, 'loss/train': 1.4841455221176147} -11/06/2021 21:59:08 - INFO - __main__ - Step 5196: {'lr': 0.0004994252730242734, 'samples': 997632, 'steps': 5195, 'loss/train': 2.2125959396362305} -11/06/2021 21:59:08 - INFO - __main__ - Step 5197: {'lr': 0.0004994249133394933, 'samples': 997824, 'steps': 5196, 'loss/train': 1.9928648471832275} -11/06/2021 21:59:08 - INFO - __main__ - Step 5198: {'lr': 0.0004994245535423262, 'samples': 998016, 'steps': 5197, 'loss/train': 2.454911947250366} -11/06/2021 21:59:09 - INFO - __main__ - Step 5199: {'lr': 0.0004994241936327722, 'samples': 998208, 'steps': 5198, 'loss/train': 1.8284403085708618} -11/06/2021 21:59:10 - INFO - __main__ - Step 5200: {'lr': 0.0004994238336108315, 'samples': 998400, 'steps': 5199, 'loss/train': 1.941856861114502} -11/06/2021 21:59:10 - INFO - __main__ - Step 5201: {'lr': 0.0004994234734765043, 'samples': 998592, 'steps': 5200, 'loss/train': 1.9864927530288696} -11/06/2021 21:59:10 - INFO - __main__ - Step 5202: {'lr': 0.0004994231132297907, 'samples': 998784, 'steps': 5201, 'loss/train': 1.9978981018066406} -11/06/2021 21:59:11 - INFO - __main__ - Step 5203: {'lr': 0.0004994227528706909, 'samples': 998976, 'steps': 5202, 'loss/train': 0.5917396545410156} -11/06/2021 21:59:11 - INFO - __main__ - Step 5204: {'lr': 0.0004994223923992052, 'samples': 999168, 'steps': 5203, 'loss/train': 1.8816064596176147} -11/06/2021 21:59:12 - INFO - __main__ - Step 5205: {'lr': 0.0004994220318153334, 'samples': 999360, 'steps': 5204, 'loss/train': 1.95060133934021} -11/06/2021 21:59:13 - INFO - __main__ - Step 5206: {'lr': 0.000499421671119076, 'samples': 999552, 'steps': 5205, 'loss/train': 2.2630045413970947} -11/06/2021 21:59:13 - INFO - __main__ - Step 5207: {'lr': 0.0004994213103104331, 'samples': 999744, 'steps': 5206, 'loss/train': 1.9655598402023315} -11/06/2021 21:59:13 - INFO - __main__ - Step 5208: {'lr': 0.0004994209493894046, 'samples': 999936, 'steps': 5207, 'loss/train': 2.0341320037841797} -11/06/2021 21:59:14 - INFO - __main__ - Step 5209: {'lr': 0.000499420588355991, 'samples': 1000128, 'steps': 5208, 'loss/train': 2.1907718181610107} -11/06/2021 21:59:14 - INFO - __main__ - Step 5210: {'lr': 0.0004994202272101923, 'samples': 1000320, 'steps': 5209, 'loss/train': 2.0395348072052} -11/06/2021 21:59:15 - INFO - __main__ - Step 5211: {'lr': 0.0004994198659520087, 'samples': 1000512, 'steps': 5210, 'loss/train': 1.4296295642852783} -11/06/2021 21:59:15 - INFO - __main__ - Step 5212: {'lr': 0.0004994195045814404, 'samples': 1000704, 'steps': 5211, 'loss/train': 1.9126372337341309} -11/06/2021 21:59:16 - INFO - __main__ - Step 5213: {'lr': 0.0004994191430984876, 'samples': 1000896, 'steps': 5212, 'loss/train': 1.5323981046676636} -11/06/2021 21:59:16 - INFO - __main__ - Step 5214: {'lr': 0.0004994187815031502, 'samples': 1001088, 'steps': 5213, 'loss/train': 2.079664468765259} -11/06/2021 21:59:16 - INFO - __main__ - Step 5215: {'lr': 0.0004994184197954286, 'samples': 1001280, 'steps': 5214, 'loss/train': 2.4426677227020264} -11/06/2021 21:59:18 - INFO - __main__ - Step 5216: {'lr': 0.000499418057975323, 'samples': 1001472, 'steps': 5215, 'loss/train': 1.766026258468628} -11/06/2021 21:59:18 - INFO - __main__ - Step 5217: {'lr': 0.0004994176960428333, 'samples': 1001664, 'steps': 5216, 'loss/train': 2.4069254398345947} -11/06/2021 21:59:18 - INFO - __main__ - Step 5218: {'lr': 0.00049941733399796, 'samples': 1001856, 'steps': 5217, 'loss/train': 2.27449369430542} -11/06/2021 21:59:19 - INFO - __main__ - Step 5219: {'lr': 0.000499416971840703, 'samples': 1002048, 'steps': 5218, 'loss/train': 1.5242971181869507} -11/06/2021 21:59:19 - INFO - __main__ - Step 5220: {'lr': 0.0004994166095710626, 'samples': 1002240, 'steps': 5219, 'loss/train': 1.8974841833114624} -11/06/2021 21:59:20 - INFO - __main__ - Step 5221: {'lr': 0.000499416247189039, 'samples': 1002432, 'steps': 5220, 'loss/train': 1.832592248916626} -11/06/2021 21:59:21 - INFO - __main__ - Step 5222: {'lr': 0.0004994158846946321, 'samples': 1002624, 'steps': 5221, 'loss/train': 1.9344158172607422} -11/06/2021 21:59:21 - INFO - __main__ - Step 5223: {'lr': 0.0004994155220878425, 'samples': 1002816, 'steps': 5222, 'loss/train': 1.6130883693695068} -11/06/2021 21:59:21 - INFO - __main__ - Step 5224: {'lr': 0.0004994151593686699, 'samples': 1003008, 'steps': 5223, 'loss/train': 0.5793285965919495} -11/06/2021 21:59:22 - INFO - __main__ - Step 5225: {'lr': 0.0004994147965371147, 'samples': 1003200, 'steps': 5224, 'loss/train': 2.1755013465881348} -11/06/2021 21:59:23 - INFO - __main__ - Step 5226: {'lr': 0.0004994144335931772, 'samples': 1003392, 'steps': 5225, 'loss/train': 1.7877094745635986} -11/06/2021 21:59:23 - INFO - __main__ - Step 5227: {'lr': 0.0004994140705368573, 'samples': 1003584, 'steps': 5226, 'loss/train': 2.2187447547912598} -11/06/2021 21:59:24 - INFO - __main__ - Step 5228: {'lr': 0.0004994137073681552, 'samples': 1003776, 'steps': 5227, 'loss/train': 1.6575233936309814} -11/06/2021 21:59:24 - INFO - __main__ - Step 5229: {'lr': 0.0004994133440870712, 'samples': 1003968, 'steps': 5228, 'loss/train': 2.3762245178222656} -11/06/2021 21:59:24 - INFO - __main__ - Step 5230: {'lr': 0.0004994129806936054, 'samples': 1004160, 'steps': 5229, 'loss/train': 2.717776298522949} -11/06/2021 21:59:25 - INFO - __main__ - Step 5231: {'lr': 0.000499412617187758, 'samples': 1004352, 'steps': 5230, 'loss/train': 1.9042540788650513} -11/06/2021 21:59:26 - INFO - __main__ - Step 5232: {'lr': 0.0004994122535695291, 'samples': 1004544, 'steps': 5231, 'loss/train': 2.3282763957977295} -11/06/2021 21:59:26 - INFO - __main__ - Step 5233: {'lr': 0.0004994118898389189, 'samples': 1004736, 'steps': 5232, 'loss/train': 1.996087670326233} -11/06/2021 21:59:26 - INFO - __main__ - Step 5234: {'lr': 0.0004994115259959274, 'samples': 1004928, 'steps': 5233, 'loss/train': 1.9831849336624146} -11/06/2021 21:59:27 - INFO - __main__ - Step 5235: {'lr': 0.0004994111620405551, 'samples': 1005120, 'steps': 5234, 'loss/train': 1.956398844718933} -11/06/2021 21:59:28 - INFO - __main__ - Step 5236: {'lr': 0.0004994107979728019, 'samples': 1005312, 'steps': 5235, 'loss/train': 1.0656429529190063} -11/06/2021 21:59:28 - INFO - __main__ - Step 5237: {'lr': 0.0004994104337926681, 'samples': 1005504, 'steps': 5236, 'loss/train': 2.004157066345215} -11/06/2021 21:59:28 - INFO - __main__ - Step 5238: {'lr': 0.0004994100695001537, 'samples': 1005696, 'steps': 5237, 'loss/train': 1.8911778926849365} -11/06/2021 21:59:29 - INFO - __main__ - Step 5239: {'lr': 0.0004994097050952591, 'samples': 1005888, 'steps': 5238, 'loss/train': 2.1261074542999268} -11/06/2021 21:59:29 - INFO - __main__ - Step 5240: {'lr': 0.0004994093405779842, 'samples': 1006080, 'steps': 5239, 'loss/train': 1.9837573766708374} -11/06/2021 21:59:29 - INFO - __main__ - Step 5241: {'lr': 0.0004994089759483294, 'samples': 1006272, 'steps': 5240, 'loss/train': 1.9001221656799316} -11/06/2021 21:59:31 - INFO - __main__ - Step 5242: {'lr': 0.0004994086112062948, 'samples': 1006464, 'steps': 5241, 'loss/train': 1.5564855337142944} -11/06/2021 21:59:31 - INFO - __main__ - Step 5243: {'lr': 0.0004994082463518804, 'samples': 1006656, 'steps': 5242, 'loss/train': 1.7091917991638184} -11/06/2021 21:59:31 - INFO - __main__ - Step 5244: {'lr': 0.0004994078813850865, 'samples': 1006848, 'steps': 5243, 'loss/train': 2.3507444858551025} -11/06/2021 21:59:32 - INFO - __main__ - Step 5245: {'lr': 0.0004994075163059134, 'samples': 1007040, 'steps': 5244, 'loss/train': 1.456217646598816} -11/06/2021 21:59:32 - INFO - __main__ - Step 5246: {'lr': 0.0004994071511143609, 'samples': 1007232, 'steps': 5245, 'loss/train': 2.2415311336517334} -11/06/2021 21:59:33 - INFO - __main__ - Step 5247: {'lr': 0.0004994067858104296, 'samples': 1007424, 'steps': 5246, 'loss/train': 1.7924270629882812} -11/06/2021 21:59:33 - INFO - __main__ - Step 5248: {'lr': 0.0004994064203941195, 'samples': 1007616, 'steps': 5247, 'loss/train': 1.7448370456695557} -11/06/2021 21:59:34 - INFO - __main__ - Step 5249: {'lr': 0.0004994060548654304, 'samples': 1007808, 'steps': 5248, 'loss/train': 2.0024914741516113} -11/06/2021 21:59:34 - INFO - __main__ - Step 5250: {'lr': 0.000499405689224363, 'samples': 1008000, 'steps': 5249, 'loss/train': 2.1484951972961426} -11/06/2021 21:59:35 - INFO - __main__ - Step 5251: {'lr': 0.0004994053234709172, 'samples': 1008192, 'steps': 5250, 'loss/train': 2.0290279388427734} -11/06/2021 21:59:35 - INFO - __main__ - Step 5252: {'lr': 0.0004994049576050933, 'samples': 1008384, 'steps': 5251, 'loss/train': 1.8063730001449585} -11/06/2021 21:59:36 - INFO - __main__ - Step 5253: {'lr': 0.0004994045916268913, 'samples': 1008576, 'steps': 5252, 'loss/train': 1.8525824546813965} -11/06/2021 21:59:36 - INFO - __main__ - Step 5254: {'lr': 0.0004994042255363115, 'samples': 1008768, 'steps': 5253, 'loss/train': 1.7812204360961914} -11/06/2021 21:59:37 - INFO - __main__ - Step 5255: {'lr': 0.0004994038593333539, 'samples': 1008960, 'steps': 5254, 'loss/train': 1.8962163925170898} -11/06/2021 21:59:37 - INFO - __main__ - Step 5256: {'lr': 0.0004994034930180188, 'samples': 1009152, 'steps': 5255, 'loss/train': 1.78254234790802} -11/06/2021 21:59:38 - INFO - __main__ - Step 5257: {'lr': 0.0004994031265903063, 'samples': 1009344, 'steps': 5256, 'loss/train': 2.477855920791626} -11/06/2021 21:59:38 - INFO - __main__ - Step 5258: {'lr': 0.0004994027600502167, 'samples': 1009536, 'steps': 5257, 'loss/train': 1.9207967519760132} -11/06/2021 21:59:39 - INFO - __main__ - Step 5259: {'lr': 0.00049940239339775, 'samples': 1009728, 'steps': 5258, 'loss/train': 1.7611019611358643} -11/06/2021 21:59:39 - INFO - __main__ - Step 5260: {'lr': 0.0004994020266329064, 'samples': 1009920, 'steps': 5259, 'loss/train': 1.293487548828125} -11/06/2021 21:59:39 - INFO - __main__ - Step 5261: {'lr': 0.0004994016597556862, 'samples': 1010112, 'steps': 5260, 'loss/train': 2.4520223140716553} -11/06/2021 21:59:40 - INFO - __main__ - Step 5262: {'lr': 0.0004994012927660894, 'samples': 1010304, 'steps': 5261, 'loss/train': 2.1690826416015625} -11/06/2021 21:59:41 - INFO - __main__ - Step 5263: {'lr': 0.0004994009256641162, 'samples': 1010496, 'steps': 5262, 'loss/train': 1.7376418113708496} -11/06/2021 21:59:41 - INFO - __main__ - Step 5264: {'lr': 0.0004994005584497667, 'samples': 1010688, 'steps': 5263, 'loss/train': 1.8751423358917236} -11/06/2021 21:59:41 - INFO - __main__ - Step 5265: {'lr': 0.0004994001911230413, 'samples': 1010880, 'steps': 5264, 'loss/train': 1.917157769203186} -11/06/2021 21:59:42 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 1.825718879699707} -11/06/2021 21:59:42 - INFO - __main__ - Step 5267: {'lr': 0.000499399456132463, 'samples': 1011264, 'steps': 5266, 'loss/train': 2.2549986839294434} -11/06/2021 21:59:44 - INFO - __main__ - Step 5268: {'lr': 0.0004993990884686105, 'samples': 1011456, 'steps': 5267, 'loss/train': 1.5457383394241333} -11/06/2021 21:59:44 - INFO - __main__ - Step 5269: {'lr': 0.0004993987206923825, 'samples': 1011648, 'steps': 5268, 'loss/train': 1.0259302854537964} -11/06/2021 21:59:44 - INFO - __main__ - Step 5270: {'lr': 0.0004993983528037793, 'samples': 1011840, 'steps': 5269, 'loss/train': 1.1901259422302246} -11/06/2021 21:59:45 - INFO - __main__ - Step 5271: {'lr': 0.0004993979848028011, 'samples': 1012032, 'steps': 5270, 'loss/train': 2.2096664905548096} -11/06/2021 21:59:45 - INFO - __main__ - Step 5272: {'lr': 0.000499397616689448, 'samples': 1012224, 'steps': 5271, 'loss/train': 1.2520197629928589} -11/06/2021 21:59:46 - INFO - __main__ - Step 5273: {'lr': 0.0004993972484637202, 'samples': 1012416, 'steps': 5272, 'loss/train': 1.571405053138733} -11/06/2021 21:59:47 - INFO - __main__ - Step 5274: {'lr': 0.0004993968801256178, 'samples': 1012608, 'steps': 5273, 'loss/train': 2.2659175395965576} -11/06/2021 21:59:47 - INFO - __main__ - Step 5275: {'lr': 0.0004993965116751411, 'samples': 1012800, 'steps': 5274, 'loss/train': 1.6691346168518066} -11/06/2021 21:59:47 - INFO - __main__ - Step 5276: {'lr': 0.0004993961431122901, 'samples': 1012992, 'steps': 5275, 'loss/train': 2.171734094619751} -11/06/2021 21:59:48 - INFO - __main__ - Step 5277: {'lr': 0.0004993957744370651, 'samples': 1013184, 'steps': 5276, 'loss/train': 2.206928253173828} -11/06/2021 21:59:49 - INFO - __main__ - Step 5278: {'lr': 0.0004993954056494662, 'samples': 1013376, 'steps': 5277, 'loss/train': 1.2756541967391968} -11/06/2021 21:59:49 - INFO - __main__ - Step 5279: {'lr': 0.0004993950367494936, 'samples': 1013568, 'steps': 5278, 'loss/train': 2.2866268157958984} -11/06/2021 21:59:49 - INFO - __main__ - Step 5280: {'lr': 0.0004993946677371474, 'samples': 1013760, 'steps': 5279, 'loss/train': 2.0941381454467773} -11/06/2021 21:59:50 - INFO - __main__ - Step 5281: {'lr': 0.0004993942986124278, 'samples': 1013952, 'steps': 5280, 'loss/train': 1.8966882228851318} -11/06/2021 21:59:50 - INFO - __main__ - Step 5282: {'lr': 0.000499393929375335, 'samples': 1014144, 'steps': 5281, 'loss/train': 1.9149951934814453} -11/06/2021 21:59:51 - INFO - __main__ - Step 5283: {'lr': 0.0004993935600258691, 'samples': 1014336, 'steps': 5282, 'loss/train': 2.0702826976776123} -11/06/2021 21:59:51 - INFO - __main__ - Step 5284: {'lr': 0.0004993931905640305, 'samples': 1014528, 'steps': 5283, 'loss/train': 2.0960628986358643} -11/06/2021 21:59:52 - INFO - __main__ - Step 5285: {'lr': 0.000499392820989819, 'samples': 1014720, 'steps': 5284, 'loss/train': 1.8415803909301758} -11/06/2021 21:59:52 - INFO - __main__ - Step 5286: {'lr': 0.0004993924513032349, 'samples': 1014912, 'steps': 5285, 'loss/train': 2.124772071838379} -11/06/2021 21:59:52 - INFO - __main__ - Step 5287: {'lr': 0.0004993920815042785, 'samples': 1015104, 'steps': 5286, 'loss/train': 1.629605770111084} -11/06/2021 21:59:53 - INFO - __main__ - Step 5288: {'lr': 0.0004993917115929498, 'samples': 1015296, 'steps': 5287, 'loss/train': 2.094998359680176} -11/06/2021 21:59:54 - INFO - __main__ - Step 5289: {'lr': 0.0004993913415692492, 'samples': 1015488, 'steps': 5288, 'loss/train': 0.9913315176963806} -11/06/2021 21:59:54 - INFO - __main__ - Step 5290: {'lr': 0.0004993909714331766, 'samples': 1015680, 'steps': 5289, 'loss/train': 2.3629143238067627} -11/06/2021 21:59:54 - INFO - __main__ - Step 5291: {'lr': 0.0004993906011847323, 'samples': 1015872, 'steps': 5290, 'loss/train': 1.4902851581573486} -11/06/2021 21:59:55 - INFO - __main__ - Step 5292: {'lr': 0.0004993902308239164, 'samples': 1016064, 'steps': 5291, 'loss/train': 2.1800575256347656} -11/06/2021 21:59:55 - INFO - __main__ - Step 5293: {'lr': 0.0004993898603507292, 'samples': 1016256, 'steps': 5292, 'loss/train': 1.8672491312026978} -11/06/2021 21:59:56 - INFO - __main__ - Step 5294: {'lr': 0.0004993894897651706, 'samples': 1016448, 'steps': 5293, 'loss/train': 1.4217222929000854} -11/06/2021 21:59:57 - INFO - __main__ - Step 5295: {'lr': 0.0004993891190672411, 'samples': 1016640, 'steps': 5294, 'loss/train': 2.300929307937622} -11/06/2021 21:59:57 - INFO - __main__ - Step 5296: {'lr': 0.0004993887482569407, 'samples': 1016832, 'steps': 5295, 'loss/train': 1.8544442653656006} -11/06/2021 21:59:57 - INFO - __main__ - Step 5297: {'lr': 0.0004993883773342695, 'samples': 1017024, 'steps': 5296, 'loss/train': 1.9744642972946167} -11/06/2021 21:59:58 - INFO - __main__ - Step 5298: {'lr': 0.0004993880062992279, 'samples': 1017216, 'steps': 5297, 'loss/train': 1.6615900993347168} -11/06/2021 21:59:58 - INFO - __main__ - Step 5299: {'lr': 0.0004993876351518157, 'samples': 1017408, 'steps': 5298, 'loss/train': 1.865243911743164} -11/06/2021 21:59:59 - INFO - __main__ - Step 5300: {'lr': 0.0004993872638920335, 'samples': 1017600, 'steps': 5299, 'loss/train': 1.881446123123169} -11/06/2021 22:00:00 - INFO - __main__ - Step 5301: {'lr': 0.0004993868925198811, 'samples': 1017792, 'steps': 5300, 'loss/train': 2.0153396129608154} -11/06/2021 22:00:00 - INFO - __main__ - Step 5302: {'lr': 0.0004993865210353588, 'samples': 1017984, 'steps': 5301, 'loss/train': 1.8959330320358276} -11/06/2021 22:00:00 - INFO - __main__ - Step 5303: {'lr': 0.0004993861494384669, 'samples': 1018176, 'steps': 5302, 'loss/train': 1.8540432453155518} -11/06/2021 22:00:01 - INFO - __main__ - Step 5304: {'lr': 0.0004993857777292053, 'samples': 1018368, 'steps': 5303, 'loss/train': 1.6123359203338623} -11/06/2021 22:00:02 - INFO - __main__ - Step 5305: {'lr': 0.0004993854059075745, 'samples': 1018560, 'steps': 5304, 'loss/train': 2.1076877117156982} -11/06/2021 22:00:02 - INFO - __main__ - Step 5306: {'lr': 0.0004993850339735744, 'samples': 1018752, 'steps': 5305, 'loss/train': 1.8283599615097046} -11/06/2021 22:00:02 - INFO - __main__ - Step 5307: {'lr': 0.0004993846619272052, 'samples': 1018944, 'steps': 5306, 'loss/train': 2.057713508605957} -11/06/2021 22:00:03 - INFO - __main__ - Step 5308: {'lr': 0.0004993842897684672, 'samples': 1019136, 'steps': 5307, 'loss/train': 1.3499886989593506} -11/06/2021 22:00:03 - INFO - __main__ - Step 5309: {'lr': 0.0004993839174973604, 'samples': 1019328, 'steps': 5308, 'loss/train': 1.8223806619644165} -11/06/2021 22:00:04 - INFO - __main__ - Step 5310: {'lr': 0.0004993835451138851, 'samples': 1019520, 'steps': 5309, 'loss/train': 1.0041699409484863} -11/06/2021 22:00:04 - INFO - __main__ - Step 5311: {'lr': 0.0004993831726180414, 'samples': 1019712, 'steps': 5310, 'loss/train': 0.6815013289451599} -11/06/2021 22:00:05 - INFO - __main__ - Step 5312: {'lr': 0.0004993828000098296, 'samples': 1019904, 'steps': 5311, 'loss/train': 1.6194506883621216} -11/06/2021 22:00:05 - INFO - __main__ - Step 5313: {'lr': 0.0004993824272892497, 'samples': 1020096, 'steps': 5312, 'loss/train': 1.8829015493392944} -11/06/2021 22:00:05 - INFO - __main__ - Step 5314: {'lr': 0.0004993820544563018, 'samples': 1020288, 'steps': 5313, 'loss/train': 2.2411489486694336} -11/06/2021 22:00:06 - INFO - __main__ - Step 5315: {'lr': 0.0004993816815109863, 'samples': 1020480, 'steps': 5314, 'loss/train': 1.758228063583374} -11/06/2021 22:00:07 - INFO - __main__ - Step 5316: {'lr': 0.0004993813084533033, 'samples': 1020672, 'steps': 5315, 'loss/train': 1.9328948259353638} -11/06/2021 22:00:07 - INFO - __main__ - Step 5317: {'lr': 0.0004993809352832529, 'samples': 1020864, 'steps': 5316, 'loss/train': 1.9451228380203247} -11/06/2021 22:00:08 - INFO - __main__ - Step 5318: {'lr': 0.0004993805620008353, 'samples': 1021056, 'steps': 5317, 'loss/train': 2.118875026702881} -11/06/2021 22:00:08 - INFO - __main__ - Step 5319: {'lr': 0.0004993801886060506, 'samples': 1021248, 'steps': 5318, 'loss/train': 2.0214946269989014} -11/06/2021 22:00:09 - INFO - __main__ - Step 5320: {'lr': 0.0004993798150988991, 'samples': 1021440, 'steps': 5319, 'loss/train': 2.4562036991119385} -11/06/2021 22:00:09 - INFO - __main__ - Step 5321: {'lr': 0.0004993794414793808, 'samples': 1021632, 'steps': 5320, 'loss/train': 1.9569580554962158} -11/06/2021 22:00:10 - INFO - __main__ - Step 5322: {'lr': 0.0004993790677474962, 'samples': 1021824, 'steps': 5321, 'loss/train': 1.3694133758544922} -11/06/2021 22:00:10 - INFO - __main__ - Step 5323: {'lr': 0.0004993786939032451, 'samples': 1022016, 'steps': 5322, 'loss/train': 1.7816057205200195} -11/06/2021 22:00:10 - INFO - __main__ - Step 5324: {'lr': 0.0004993783199466278, 'samples': 1022208, 'steps': 5323, 'loss/train': 2.492426633834839} -11/06/2021 22:00:11 - INFO - __main__ - Step 5325: {'lr': 0.0004993779458776444, 'samples': 1022400, 'steps': 5324, 'loss/train': 2.574648857116699} -11/06/2021 22:00:12 - INFO - __main__ - Step 5326: {'lr': 0.0004993775716962953, 'samples': 1022592, 'steps': 5325, 'loss/train': 1.6549577713012695} -11/06/2021 22:00:12 - INFO - __main__ - Step 5327: {'lr': 0.0004993771974025805, 'samples': 1022784, 'steps': 5326, 'loss/train': 1.884212851524353} -11/06/2021 22:00:12 - INFO - __main__ - Step 5328: {'lr': 0.0004993768229965001, 'samples': 1022976, 'steps': 5327, 'loss/train': 2.4046313762664795} -11/06/2021 22:00:13 - INFO - __main__ - Step 5329: {'lr': 0.0004993764484780543, 'samples': 1023168, 'steps': 5328, 'loss/train': 1.4917925596237183} -11/06/2021 22:00:13 - INFO - __main__ - Step 5330: {'lr': 0.0004993760738472435, 'samples': 1023360, 'steps': 5329, 'loss/train': 1.8615087270736694} -11/06/2021 22:00:14 - INFO - __main__ - Step 5331: {'lr': 0.0004993756991040675, 'samples': 1023552, 'steps': 5330, 'loss/train': 1.8130137920379639} -11/06/2021 22:00:14 - INFO - __main__ - Step 5332: {'lr': 0.0004993753242485268, 'samples': 1023744, 'steps': 5331, 'loss/train': 2.364469051361084} -11/06/2021 22:00:15 - INFO - __main__ - Step 5333: {'lr': 0.0004993749492806214, 'samples': 1023936, 'steps': 5332, 'loss/train': 2.498106002807617} -11/06/2021 22:00:15 - INFO - __main__ - Step 5334: {'lr': 0.0004993745742003515, 'samples': 1024128, 'steps': 5333, 'loss/train': 1.809753656387329} -11/06/2021 22:00:16 - INFO - __main__ - Step 5335: {'lr': 0.0004993741990077172, 'samples': 1024320, 'steps': 5334, 'loss/train': 2.3342111110687256} -11/06/2021 22:00:16 - INFO - __main__ - Step 5336: {'lr': 0.0004993738237027188, 'samples': 1024512, 'steps': 5335, 'loss/train': 2.1999897956848145} -11/06/2021 22:00:17 - INFO - __main__ - Step 5337: {'lr': 0.0004993734482853563, 'samples': 1024704, 'steps': 5336, 'loss/train': 2.134817123413086} -11/06/2021 22:00:17 - INFO - __main__ - Step 5338: {'lr': 0.0004993730727556301, 'samples': 1024896, 'steps': 5337, 'loss/train': 1.9797841310501099} -11/06/2021 22:00:17 - INFO - __main__ - Step 5339: {'lr': 0.0004993726971135402, 'samples': 1025088, 'steps': 5338, 'loss/train': 1.4383511543273926} -11/06/2021 22:00:18 - INFO - __main__ - Step 5340: {'lr': 0.0004993723213590868, 'samples': 1025280, 'steps': 5339, 'loss/train': 2.2036027908325195} -11/06/2021 22:00:19 - INFO - __main__ - Step 5341: {'lr': 0.0004993719454922701, 'samples': 1025472, 'steps': 5340, 'loss/train': 2.0086007118225098} -11/06/2021 22:00:19 - INFO - __main__ - Step 5342: {'lr': 0.0004993715695130902, 'samples': 1025664, 'steps': 5341, 'loss/train': 1.6373944282531738} -11/06/2021 22:00:20 - INFO - __main__ - Step 5343: {'lr': 0.0004993711934215473, 'samples': 1025856, 'steps': 5342, 'loss/train': 1.591683268547058} -11/06/2021 22:00:20 - INFO - __main__ - Step 5344: {'lr': 0.0004993708172176417, 'samples': 1026048, 'steps': 5343, 'loss/train': 1.9710315465927124} -11/06/2021 22:00:20 - INFO - __main__ - Step 5345: {'lr': 0.0004993704409013734, 'samples': 1026240, 'steps': 5344, 'loss/train': 2.084678888320923} -11/06/2021 22:00:21 - INFO - __main__ - Step 5346: {'lr': 0.0004993700644727425, 'samples': 1026432, 'steps': 5345, 'loss/train': 2.1554689407348633} -11/06/2021 22:00:22 - INFO - __main__ - Step 5347: {'lr': 0.0004993696879317495, 'samples': 1026624, 'steps': 5346, 'loss/train': 1.5472863912582397} -11/06/2021 22:00:22 - INFO - __main__ - Step 5348: {'lr': 0.0004993693112783943, 'samples': 1026816, 'steps': 5347, 'loss/train': 1.995734691619873} -11/06/2021 22:00:22 - INFO - __main__ - Step 5349: {'lr': 0.0004993689345126771, 'samples': 1027008, 'steps': 5348, 'loss/train': 2.151108503341675} -11/06/2021 22:00:23 - INFO - __main__ - Step 5350: {'lr': 0.0004993685576345981, 'samples': 1027200, 'steps': 5349, 'loss/train': 2.3165838718414307} -11/06/2021 22:00:24 - INFO - __main__ - Step 5351: {'lr': 0.0004993681806441575, 'samples': 1027392, 'steps': 5350, 'loss/train': 2.325005292892456} -11/06/2021 22:00:24 - INFO - __main__ - Step 5352: {'lr': 0.0004993678035413554, 'samples': 1027584, 'steps': 5351, 'loss/train': 1.954711675643921} -11/06/2021 22:00:24 - INFO - __main__ - Step 5353: {'lr': 0.0004993674263261921, 'samples': 1027776, 'steps': 5352, 'loss/train': 1.639163851737976} -11/06/2021 22:00:25 - INFO - __main__ - Step 5354: {'lr': 0.0004993670489986677, 'samples': 1027968, 'steps': 5353, 'loss/train': 2.0933964252471924} -11/06/2021 22:00:25 - INFO - __main__ - Step 5355: {'lr': 0.0004993666715587823, 'samples': 1028160, 'steps': 5354, 'loss/train': 2.3471012115478516} -11/06/2021 22:00:26 - INFO - __main__ - Step 5356: {'lr': 0.0004993662940065361, 'samples': 1028352, 'steps': 5355, 'loss/train': 1.8415415287017822} -11/06/2021 22:00:26 - INFO - __main__ - Step 5357: {'lr': 0.0004993659163419294, 'samples': 1028544, 'steps': 5356, 'loss/train': 2.263580322265625} -11/06/2021 22:00:27 - INFO - __main__ - Step 5358: {'lr': 0.0004993655385649621, 'samples': 1028736, 'steps': 5357, 'loss/train': 1.8695333003997803} -11/06/2021 22:00:27 - INFO - __main__ - Step 5359: {'lr': 0.0004993651606756347, 'samples': 1028928, 'steps': 5358, 'loss/train': 2.1542937755584717} -11/06/2021 22:00:28 - INFO - __main__ - Step 5360: {'lr': 0.0004993647826739471, 'samples': 1029120, 'steps': 5359, 'loss/train': 1.7459410429000854} -11/06/2021 22:00:28 - INFO - __main__ - Step 5361: {'lr': 0.0004993644045598997, 'samples': 1029312, 'steps': 5360, 'loss/train': 2.4149515628814697} -11/06/2021 22:00:29 - INFO - __main__ - Step 5362: {'lr': 0.0004993640263334924, 'samples': 1029504, 'steps': 5361, 'loss/train': 1.8618431091308594} -11/06/2021 22:00:29 - INFO - __main__ - Step 5363: {'lr': 0.0004993636479947256, 'samples': 1029696, 'steps': 5362, 'loss/train': 1.1702266931533813} -11/06/2021 22:00:30 - INFO - __main__ - Step 5364: {'lr': 0.0004993632695435993, 'samples': 1029888, 'steps': 5363, 'loss/train': 2.124359369277954} -11/06/2021 22:00:30 - INFO - __main__ - Step 5365: {'lr': 0.0004993628909801138, 'samples': 1030080, 'steps': 5364, 'loss/train': 1.8695933818817139} -11/06/2021 22:00:31 - INFO - __main__ - Step 5366: {'lr': 0.0004993625123042694, 'samples': 1030272, 'steps': 5365, 'loss/train': 2.126741409301758} -11/06/2021 22:00:31 - INFO - __main__ - Step 5367: {'lr': 0.0004993621335160659, 'samples': 1030464, 'steps': 5366, 'loss/train': 2.1236331462860107} -11/06/2021 22:00:32 - INFO - __main__ - Step 5368: {'lr': 0.0004993617546155037, 'samples': 1030656, 'steps': 5367, 'loss/train': 1.1388921737670898} -11/06/2021 22:00:32 - INFO - __main__ - Step 5369: {'lr': 0.000499361375602583, 'samples': 1030848, 'steps': 5368, 'loss/train': 2.0226683616638184} -11/06/2021 22:00:32 - INFO - __main__ - Step 5370: {'lr': 0.0004993609964773039, 'samples': 1031040, 'steps': 5369, 'loss/train': 1.933193325996399} -11/06/2021 22:00:33 - INFO - __main__ - Step 5371: {'lr': 0.0004993606172396665, 'samples': 1031232, 'steps': 5370, 'loss/train': 1.9464812278747559} -11/06/2021 22:00:34 - INFO - __main__ - Step 5372: {'lr': 0.0004993602378896712, 'samples': 1031424, 'steps': 5371, 'loss/train': 1.1575310230255127} -11/06/2021 22:00:34 - INFO - __main__ - Step 5373: {'lr': 0.0004993598584273179, 'samples': 1031616, 'steps': 5372, 'loss/train': 2.0827817916870117} -11/06/2021 22:00:34 - INFO - __main__ - Step 5374: {'lr': 0.0004993594788526069, 'samples': 1031808, 'steps': 5373, 'loss/train': 2.1130635738372803} -11/06/2021 22:00:35 - INFO - __main__ - Step 5375: {'lr': 0.0004993590991655384, 'samples': 1032000, 'steps': 5374, 'loss/train': 2.0169715881347656} -11/06/2021 22:00:35 - INFO - __main__ - Step 5376: {'lr': 0.0004993587193661126, 'samples': 1032192, 'steps': 5375, 'loss/train': 2.4737699031829834} -11/06/2021 22:00:36 - INFO - __main__ - Step 5377: {'lr': 0.0004993583394543295, 'samples': 1032384, 'steps': 5376, 'loss/train': 1.8116259574890137} -11/06/2021 22:00:37 - INFO - __main__ - Step 5378: {'lr': 0.0004993579594301895, 'samples': 1032576, 'steps': 5377, 'loss/train': 1.8319172859191895} -11/06/2021 22:00:37 - INFO - __main__ - Step 5379: {'lr': 0.0004993575792936925, 'samples': 1032768, 'steps': 5378, 'loss/train': 1.6784554719924927} -11/06/2021 22:00:37 - INFO - __main__ - Step 5380: {'lr': 0.000499357199044839, 'samples': 1032960, 'steps': 5379, 'loss/train': 1.458201289176941} -11/06/2021 22:00:38 - INFO - __main__ - Step 5381: {'lr': 0.0004993568186836288, 'samples': 1033152, 'steps': 5380, 'loss/train': 1.8276842832565308} -11/06/2021 22:00:39 - INFO - __main__ - Step 5382: {'lr': 0.0004993564382100624, 'samples': 1033344, 'steps': 5381, 'loss/train': 1.3644241094589233} -11/06/2021 22:00:39 - INFO - __main__ - Step 5383: {'lr': 0.0004993560576241398, 'samples': 1033536, 'steps': 5382, 'loss/train': 1.386871337890625} -11/06/2021 22:00:39 - INFO - __main__ - Step 5384: {'lr': 0.0004993556769258612, 'samples': 1033728, 'steps': 5383, 'loss/train': 1.235226035118103} -11/06/2021 22:00:40 - INFO - __main__ - Step 5385: {'lr': 0.0004993552961152268, 'samples': 1033920, 'steps': 5384, 'loss/train': 1.334904670715332} -11/06/2021 22:00:40 - INFO - __main__ - Step 5386: {'lr': 0.0004993549151922367, 'samples': 1034112, 'steps': 5385, 'loss/train': 2.5312018394470215} -11/06/2021 22:00:41 - INFO - __main__ - Step 5387: {'lr': 0.0004993545341568912, 'samples': 1034304, 'steps': 5386, 'loss/train': 1.546046257019043} -11/06/2021 22:00:41 - INFO - __main__ - Step 5388: {'lr': 0.0004993541530091903, 'samples': 1034496, 'steps': 5387, 'loss/train': 1.8282663822174072} -11/06/2021 22:00:42 - INFO - __main__ - Step 5389: {'lr': 0.0004993537717491343, 'samples': 1034688, 'steps': 5388, 'loss/train': 2.0151655673980713} -11/06/2021 22:00:42 - INFO - __main__ - Step 5390: {'lr': 0.0004993533903767235, 'samples': 1034880, 'steps': 5389, 'loss/train': 1.5707823038101196} -11/06/2021 22:00:42 - INFO - __main__ - Step 5391: {'lr': 0.0004993530088919577, 'samples': 1035072, 'steps': 5390, 'loss/train': 1.7136812210083008} -11/06/2021 22:00:43 - INFO - __main__ - Step 5392: {'lr': 0.0004993526272948374, 'samples': 1035264, 'steps': 5391, 'loss/train': 0.6717694401741028} -11/06/2021 22:00:44 - INFO - __main__ - Step 5393: {'lr': 0.0004993522455853626, 'samples': 1035456, 'steps': 5392, 'loss/train': 1.5146379470825195} -11/06/2021 22:00:44 - INFO - __main__ - Step 5394: {'lr': 0.0004993518637635334, 'samples': 1035648, 'steps': 5393, 'loss/train': 1.4863612651824951} -11/06/2021 22:00:45 - INFO - __main__ - Step 5395: {'lr': 0.0004993514818293503, 'samples': 1035840, 'steps': 5394, 'loss/train': 1.7902588844299316} -11/06/2021 22:00:45 - INFO - __main__ - Step 5396: {'lr': 0.0004993510997828132, 'samples': 1036032, 'steps': 5395, 'loss/train': 1.7345638275146484} -11/06/2021 22:00:45 - INFO - __main__ - Step 5397: {'lr': 0.0004993507176239224, 'samples': 1036224, 'steps': 5396, 'loss/train': 1.4879080057144165} -11/06/2021 22:00:46 - INFO - __main__ - Step 5398: {'lr': 0.0004993503353526779, 'samples': 1036416, 'steps': 5397, 'loss/train': 1.566808819770813} -11/06/2021 22:00:47 - INFO - __main__ - Step 5399: {'lr': 0.0004993499529690801, 'samples': 1036608, 'steps': 5398, 'loss/train': 1.6237696409225464} -11/06/2021 22:00:47 - INFO - __main__ - Step 5400: {'lr': 0.000499349570473129, 'samples': 1036800, 'steps': 5399, 'loss/train': 2.0763614177703857} -11/06/2021 22:00:47 - INFO - __main__ - Step 5401: {'lr': 0.0004993491878648249, 'samples': 1036992, 'steps': 5400, 'loss/train': 2.139653444290161} -11/06/2021 22:00:48 - INFO - __main__ - Step 5402: {'lr': 0.0004993488051441677, 'samples': 1037184, 'steps': 5401, 'loss/train': 1.2702760696411133} -11/06/2021 22:00:49 - INFO - __main__ - Step 5403: {'lr': 0.000499348422311158, 'samples': 1037376, 'steps': 5402, 'loss/train': 1.7422914505004883} -11/06/2021 22:00:49 - INFO - __main__ - Step 5404: {'lr': 0.0004993480393657956, 'samples': 1037568, 'steps': 5403, 'loss/train': 1.667367935180664} -11/06/2021 22:00:50 - INFO - __main__ - Step 5405: {'lr': 0.0004993476563080809, 'samples': 1037760, 'steps': 5404, 'loss/train': 1.849706768989563} -11/06/2021 22:00:50 - INFO - __main__ - Step 5406: {'lr': 0.000499347273138014, 'samples': 1037952, 'steps': 5405, 'loss/train': 1.485642433166504} -11/06/2021 22:00:50 - INFO - __main__ - Step 5407: {'lr': 0.000499346889855595, 'samples': 1038144, 'steps': 5406, 'loss/train': 1.8878998756408691} -11/06/2021 22:00:51 - INFO - __main__ - Step 5408: {'lr': 0.0004993465064608242, 'samples': 1038336, 'steps': 5407, 'loss/train': 2.2448551654815674} -11/06/2021 22:00:52 - INFO - __main__ - Step 5409: {'lr': 0.0004993461229537017, 'samples': 1038528, 'steps': 5408, 'loss/train': 1.8952325582504272} -11/06/2021 22:00:52 - INFO - __main__ - Step 5410: {'lr': 0.0004993457393342276, 'samples': 1038720, 'steps': 5409, 'loss/train': 1.7118123769760132} -11/06/2021 22:00:52 - INFO - __main__ - Step 5411: {'lr': 0.0004993453556024023, 'samples': 1038912, 'steps': 5410, 'loss/train': 1.6171423196792603} -11/06/2021 22:00:53 - INFO - __main__ - Step 5412: {'lr': 0.0004993449717582258, 'samples': 1039104, 'steps': 5411, 'loss/train': 1.8556959629058838} -11/06/2021 22:00:53 - INFO - __main__ - Step 5413: {'lr': 0.0004993445878016982, 'samples': 1039296, 'steps': 5412, 'loss/train': 2.079441547393799} -11/06/2021 22:00:54 - INFO - __main__ - Step 5414: {'lr': 0.0004993442037328199, 'samples': 1039488, 'steps': 5413, 'loss/train': 2.005168914794922} -11/06/2021 22:00:54 - INFO - __main__ - Step 5415: {'lr': 0.0004993438195515909, 'samples': 1039680, 'steps': 5414, 'loss/train': 1.7402551174163818} -11/06/2021 22:00:55 - INFO - __main__ - Step 5416: {'lr': 0.0004993434352580115, 'samples': 1039872, 'steps': 5415, 'loss/train': 1.5889499187469482} -11/06/2021 22:00:55 - INFO - __main__ - Step 5417: {'lr': 0.0004993430508520816, 'samples': 1040064, 'steps': 5416, 'loss/train': 2.1305549144744873} -11/06/2021 22:00:55 - INFO - __main__ - Step 5418: {'lr': 0.0004993426663338018, 'samples': 1040256, 'steps': 5417, 'loss/train': 1.9073415994644165} -11/06/2021 22:00:57 - INFO - __main__ - Step 5419: {'lr': 0.0004993422817031719, 'samples': 1040448, 'steps': 5418, 'loss/train': 2.1884820461273193} -11/06/2021 22:00:57 - INFO - __main__ - Step 5420: {'lr': 0.0004993418969601921, 'samples': 1040640, 'steps': 5419, 'loss/train': 2.154372215270996} -11/06/2021 22:00:57 - INFO - __main__ - Step 5421: {'lr': 0.0004993415121048629, 'samples': 1040832, 'steps': 5420, 'loss/train': 1.9942115545272827} -11/06/2021 22:00:58 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 1.9106769561767578} -11/06/2021 22:00:58 - INFO - __main__ - Step 5423: {'lr': 0.0004993407420571563, 'samples': 1041216, 'steps': 5422, 'loss/train': 1.0730233192443848} -11/06/2021 22:00:59 - INFO - __main__ - Step 5424: {'lr': 0.0004993403568647792, 'samples': 1041408, 'steps': 5423, 'loss/train': 2.985499143600464} -11/06/2021 22:01:00 - INFO - __main__ - Step 5425: {'lr': 0.0004993399715600531, 'samples': 1041600, 'steps': 5424, 'loss/train': 1.9801826477050781} -11/06/2021 22:01:00 - INFO - __main__ - Step 5426: {'lr': 0.0004993395861429785, 'samples': 1041792, 'steps': 5425, 'loss/train': 2.2979655265808105} -11/06/2021 22:01:00 - INFO - __main__ - Step 5427: {'lr': 0.0004993392006135552, 'samples': 1041984, 'steps': 5426, 'loss/train': 1.975477933883667} -11/06/2021 22:01:01 - INFO - __main__ - Step 5428: {'lr': 0.0004993388149717834, 'samples': 1042176, 'steps': 5427, 'loss/train': 1.659934639930725} -11/06/2021 22:01:02 - INFO - __main__ - Step 5429: {'lr': 0.0004993384292176636, 'samples': 1042368, 'steps': 5428, 'loss/train': 0.41693881154060364} -11/06/2021 22:01:02 - INFO - __main__ - Step 5430: {'lr': 0.0004993380433511956, 'samples': 1042560, 'steps': 5429, 'loss/train': 1.881492257118225} -11/06/2021 22:01:03 - INFO - __main__ - Step 5431: {'lr': 0.0004993376573723798, 'samples': 1042752, 'steps': 5430, 'loss/train': 2.2154150009155273} -11/06/2021 22:01:03 - INFO - __main__ - Step 5432: {'lr': 0.0004993372712812162, 'samples': 1042944, 'steps': 5431, 'loss/train': 2.0306501388549805} -11/06/2021 22:01:04 - INFO - __main__ - Step 5433: {'lr': 0.0004993368850777052, 'samples': 1043136, 'steps': 5432, 'loss/train': 2.2101669311523438} -11/06/2021 22:01:04 - INFO - __main__ - Step 5434: {'lr': 0.0004993364987618468, 'samples': 1043328, 'steps': 5433, 'loss/train': 2.0793869495391846} -11/06/2021 22:01:05 - INFO - __main__ - Step 5435: {'lr': 0.0004993361123336412, 'samples': 1043520, 'steps': 5434, 'loss/train': 1.7962534427642822} -11/06/2021 22:01:05 - INFO - __main__ - Step 5436: {'lr': 0.0004993357257930887, 'samples': 1043712, 'steps': 5435, 'loss/train': 2.5018160343170166} -11/06/2021 22:01:06 - INFO - __main__ - Step 5437: {'lr': 0.0004993353391401892, 'samples': 1043904, 'steps': 5436, 'loss/train': 2.258634567260742} -11/06/2021 22:01:06 - INFO - __main__ - Step 5438: {'lr': 0.0004993349523749431, 'samples': 1044096, 'steps': 5437, 'loss/train': 1.8289518356323242} -11/06/2021 22:01:07 - INFO - __main__ - Step 5439: {'lr': 0.0004993345654973505, 'samples': 1044288, 'steps': 5438, 'loss/train': 1.9161920547485352} -11/06/2021 22:01:07 - INFO - __main__ - Step 5440: {'lr': 0.0004993341785074116, 'samples': 1044480, 'steps': 5439, 'loss/train': 2.753596305847168} -11/06/2021 22:01:07 - INFO - __main__ - Step 5441: {'lr': 0.0004993337914051266, 'samples': 1044672, 'steps': 5440, 'loss/train': 1.9837926626205444} -11/06/2021 22:01:08 - INFO - __main__ - Step 5442: {'lr': 0.0004993334041904957, 'samples': 1044864, 'steps': 5441, 'loss/train': 0.3798553943634033} -11/06/2021 22:01:09 - INFO - __main__ - Step 5443: {'lr': 0.0004993330168635189, 'samples': 1045056, 'steps': 5442, 'loss/train': 1.5008134841918945} -11/06/2021 22:01:09 - INFO - __main__ - Step 5444: {'lr': 0.0004993326294241966, 'samples': 1045248, 'steps': 5443, 'loss/train': 0.524370014667511} -11/06/2021 22:01:09 - INFO - __main__ - Step 5445: {'lr': 0.0004993322418725286, 'samples': 1045440, 'steps': 5444, 'loss/train': 1.8944960832595825} -11/06/2021 22:01:10 - INFO - __main__ - Step 5446: {'lr': 0.0004993318542085157, 'samples': 1045632, 'steps': 5445, 'loss/train': 2.161842107772827} -11/06/2021 22:01:11 - INFO - __main__ - Step 5447: {'lr': 0.0004993314664321575, 'samples': 1045824, 'steps': 5446, 'loss/train': 2.0262186527252197} -11/06/2021 22:01:11 - INFO - __main__ - Step 5448: {'lr': 0.0004993310785434544, 'samples': 1046016, 'steps': 5447, 'loss/train': 1.3276009559631348} -11/06/2021 22:01:11 - INFO - __main__ - Step 5449: {'lr': 0.0004993306905424067, 'samples': 1046208, 'steps': 5448, 'loss/train': 1.6204453706741333} -11/06/2021 22:01:12 - INFO - __main__ - Step 5450: {'lr': 0.0004993303024290143, 'samples': 1046400, 'steps': 5449, 'loss/train': 2.0517914295196533} -11/06/2021 22:01:12 - INFO - __main__ - Step 5451: {'lr': 0.0004993299142032776, 'samples': 1046592, 'steps': 5450, 'loss/train': 1.5047802925109863} -11/06/2021 22:01:13 - INFO - __main__ - Step 5452: {'lr': 0.0004993295258651966, 'samples': 1046784, 'steps': 5451, 'loss/train': 2.418118953704834} -11/06/2021 22:01:14 - INFO - __main__ - Step 5453: {'lr': 0.0004993291374147716, 'samples': 1046976, 'steps': 5452, 'loss/train': 0.4726817011833191} -11/06/2021 22:01:14 - INFO - __main__ - Step 5454: {'lr': 0.0004993287488520027, 'samples': 1047168, 'steps': 5453, 'loss/train': 2.1030688285827637} -11/06/2021 22:01:14 - INFO - __main__ - Step 5455: {'lr': 0.0004993283601768902, 'samples': 1047360, 'steps': 5454, 'loss/train': 2.6343281269073486} -11/06/2021 22:01:15 - INFO - __main__ - Step 5456: {'lr': 0.0004993279713894342, 'samples': 1047552, 'steps': 5455, 'loss/train': 2.150969982147217} -11/06/2021 22:01:16 - INFO - __main__ - Step 5457: {'lr': 0.0004993275824896348, 'samples': 1047744, 'steps': 5456, 'loss/train': 1.408422827720642} -11/06/2021 22:01:16 - INFO - __main__ - Step 5458: {'lr': 0.0004993271934774922, 'samples': 1047936, 'steps': 5457, 'loss/train': 1.94776451587677} -11/06/2021 22:01:16 - INFO - __main__ - Step 5459: {'lr': 0.0004993268043530067, 'samples': 1048128, 'steps': 5458, 'loss/train': 1.2634351253509521} -11/06/2021 22:01:17 - INFO - __main__ - Step 5460: {'lr': 0.0004993264151161783, 'samples': 1048320, 'steps': 5459, 'loss/train': 1.6682987213134766} -11/06/2021 22:01:17 - INFO - __main__ - Step 5461: {'lr': 0.0004993260257670074, 'samples': 1048512, 'steps': 5460, 'loss/train': 2.2864060401916504} -11/06/2021 22:01:18 - INFO - __main__ - Step 5462: {'lr': 0.000499325636305494, 'samples': 1048704, 'steps': 5461, 'loss/train': 1.3038978576660156} -11/06/2021 22:01:18 - INFO - __main__ - Step 5463: {'lr': 0.0004993252467316382, 'samples': 1048896, 'steps': 5462, 'loss/train': 1.608263373374939} -11/06/2021 22:01:19 - INFO - __main__ - Step 5464: {'lr': 0.0004993248570454404, 'samples': 1049088, 'steps': 5463, 'loss/train': 1.6738258600234985} -11/06/2021 22:01:19 - INFO - __main__ - Step 5465: {'lr': 0.0004993244672469007, 'samples': 1049280, 'steps': 5464, 'loss/train': 2.2814807891845703} -11/06/2021 22:01:19 - INFO - __main__ - Step 5466: {'lr': 0.000499324077336019, 'samples': 1049472, 'steps': 5465, 'loss/train': 1.8330951929092407} -11/06/2021 22:01:20 - INFO - __main__ - Step 5467: {'lr': 0.000499323687312796, 'samples': 1049664, 'steps': 5466, 'loss/train': 1.905300498008728} -11/06/2021 22:01:21 - INFO - __main__ - Step 5468: {'lr': 0.0004993232971772315, 'samples': 1049856, 'steps': 5467, 'loss/train': 1.9987244606018066} -11/06/2021 22:01:21 - INFO - __main__ - Step 5469: {'lr': 0.0004993229069293257, 'samples': 1050048, 'steps': 5468, 'loss/train': 2.0383851528167725} -11/06/2021 22:01:21 - INFO - __main__ - Step 5470: {'lr': 0.0004993225165690789, 'samples': 1050240, 'steps': 5469, 'loss/train': 1.96856689453125} -11/06/2021 22:01:22 - INFO - __main__ - Step 5471: {'lr': 0.0004993221260964912, 'samples': 1050432, 'steps': 5470, 'loss/train': 2.155994415283203} -11/06/2021 22:01:22 - INFO - __main__ - Step 5472: {'lr': 0.0004993217355115628, 'samples': 1050624, 'steps': 5471, 'loss/train': 2.175236463546753} -11/06/2021 22:01:23 - INFO - __main__ - Step 5473: {'lr': 0.0004993213448142939, 'samples': 1050816, 'steps': 5472, 'loss/train': 2.2860300540924072} -11/06/2021 22:01:24 - INFO - __main__ - Step 5474: {'lr': 0.0004993209540046846, 'samples': 1051008, 'steps': 5473, 'loss/train': 2.309166431427002} -11/06/2021 22:01:24 - INFO - __main__ - Step 5475: {'lr': 0.0004993205630827352, 'samples': 1051200, 'steps': 5474, 'loss/train': 1.8463259935379028} -11/06/2021 22:01:24 - INFO - __main__ - Step 5476: {'lr': 0.0004993201720484458, 'samples': 1051392, 'steps': 5475, 'loss/train': 1.8536326885223389} -11/06/2021 22:01:25 - INFO - __main__ - Step 5477: {'lr': 0.0004993197809018165, 'samples': 1051584, 'steps': 5476, 'loss/train': 1.8011512756347656} -11/06/2021 22:01:26 - INFO - __main__ - Step 5478: {'lr': 0.0004993193896428476, 'samples': 1051776, 'steps': 5477, 'loss/train': 1.370781421661377} -11/06/2021 22:01:26 - INFO - __main__ - Step 5479: {'lr': 0.0004993189982715392, 'samples': 1051968, 'steps': 5478, 'loss/train': 1.9263511896133423} -11/06/2021 22:01:26 - INFO - __main__ - Step 5480: {'lr': 0.0004993186067878916, 'samples': 1052160, 'steps': 5479, 'loss/train': 1.3620198965072632} -11/06/2021 22:01:27 - INFO - __main__ - Step 5481: {'lr': 0.0004993182151919049, 'samples': 1052352, 'steps': 5480, 'loss/train': 2.0209407806396484} -11/06/2021 22:01:27 - INFO - __main__ - Step 5482: {'lr': 0.0004993178234835792, 'samples': 1052544, 'steps': 5481, 'loss/train': 1.6855971813201904} -11/06/2021 22:01:28 - INFO - __main__ - Step 5483: {'lr': 0.0004993174316629146, 'samples': 1052736, 'steps': 5482, 'loss/train': 2.446448802947998} -11/06/2021 22:01:28 - INFO - __main__ - Step 5484: {'lr': 0.0004993170397299116, 'samples': 1052928, 'steps': 5483, 'loss/train': 1.8740376234054565} -11/06/2021 22:01:29 - INFO - __main__ - Step 5485: {'lr': 0.0004993166476845701, 'samples': 1053120, 'steps': 5484, 'loss/train': 2.2243385314941406} -11/06/2021 22:01:29 - INFO - __main__ - Step 5486: {'lr': 0.0004993162555268903, 'samples': 1053312, 'steps': 5485, 'loss/train': 1.9227041006088257} -11/06/2021 22:01:29 - INFO - __main__ - Step 5487: {'lr': 0.0004993158632568726, 'samples': 1053504, 'steps': 5486, 'loss/train': 2.1195530891418457} -11/06/2021 22:01:30 - INFO - __main__ - Step 5488: {'lr': 0.000499315470874517, 'samples': 1053696, 'steps': 5487, 'loss/train': 2.2419090270996094} -11/06/2021 22:01:31 - INFO - __main__ - Step 5489: {'lr': 0.0004993150783798236, 'samples': 1053888, 'steps': 5488, 'loss/train': 2.4271090030670166} -11/06/2021 22:01:31 - INFO - __main__ - Step 5490: {'lr': 0.0004993146857727927, 'samples': 1054080, 'steps': 5489, 'loss/train': 1.7117938995361328} -11/06/2021 22:01:31 - INFO - __main__ - Step 5491: {'lr': 0.0004993142930534245, 'samples': 1054272, 'steps': 5490, 'loss/train': 1.232141375541687} -11/06/2021 22:01:32 - INFO - __main__ - Step 5492: {'lr': 0.000499313900221719, 'samples': 1054464, 'steps': 5491, 'loss/train': 1.8107589483261108} -11/06/2021 22:01:33 - INFO - __main__ - Step 5493: {'lr': 0.0004993135072776766, 'samples': 1054656, 'steps': 5492, 'loss/train': 2.035764694213867} -11/06/2021 22:01:33 - INFO - __main__ - Step 5494: {'lr': 0.0004993131142212974, 'samples': 1054848, 'steps': 5493, 'loss/train': 1.9107087850570679} -11/06/2021 22:01:33 - INFO - __main__ - Step 5495: {'lr': 0.0004993127210525815, 'samples': 1055040, 'steps': 5494, 'loss/train': 1.5598526000976562} -11/06/2021 22:01:34 - INFO - __main__ - Step 5496: {'lr': 0.0004993123277715292, 'samples': 1055232, 'steps': 5495, 'loss/train': 1.6145435571670532} -11/06/2021 22:01:34 - INFO - __main__ - Step 5497: {'lr': 0.0004993119343781406, 'samples': 1055424, 'steps': 5496, 'loss/train': 1.697355031967163} -11/06/2021 22:01:35 - INFO - __main__ - Step 5498: {'lr': 0.0004993115408724159, 'samples': 1055616, 'steps': 5497, 'loss/train': 1.3558404445648193} -11/06/2021 22:01:36 - INFO - __main__ - Step 5499: {'lr': 0.0004993111472543552, 'samples': 1055808, 'steps': 5498, 'loss/train': 1.6926814317703247} -11/06/2021 22:01:36 - INFO - __main__ - Step 5500: {'lr': 0.0004993107535239588, 'samples': 1056000, 'steps': 5499, 'loss/train': 1.3640247583389282} -11/06/2021 22:01:36 - INFO - __main__ - Step 5501: {'lr': 0.0004993103596812267, 'samples': 1056192, 'steps': 5500, 'loss/train': 1.8864690065383911} -11/06/2021 22:01:37 - INFO - __main__ - Step 5502: {'lr': 0.0004993099657261594, 'samples': 1056384, 'steps': 5501, 'loss/train': 2.0299696922302246} -11/06/2021 22:01:37 - INFO - __main__ - Step 5503: {'lr': 0.0004993095716587568, 'samples': 1056576, 'steps': 5502, 'loss/train': 2.2388596534729004} -11/06/2021 22:01:38 - INFO - __main__ - Step 5504: {'lr': 0.0004993091774790191, 'samples': 1056768, 'steps': 5503, 'loss/train': 1.5079683065414429} -11/06/2021 22:01:38 - INFO - __main__ - Step 5505: {'lr': 0.0004993087831869466, 'samples': 1056960, 'steps': 5504, 'loss/train': 2.0037267208099365} -11/06/2021 22:01:39 - INFO - __main__ - Step 5506: {'lr': 0.0004993083887825393, 'samples': 1057152, 'steps': 5505, 'loss/train': 2.18703556060791} -11/06/2021 22:01:39 - INFO - __main__ - Step 5507: {'lr': 0.0004993079942657976, 'samples': 1057344, 'steps': 5506, 'loss/train': 1.9802910089492798} -11/06/2021 22:01:39 - INFO - __main__ - Step 5508: {'lr': 0.0004993075996367215, 'samples': 1057536, 'steps': 5507, 'loss/train': 2.6383426189422607} -11/06/2021 22:01:40 - INFO - __main__ - Step 5509: {'lr': 0.0004993072048953113, 'samples': 1057728, 'steps': 5508, 'loss/train': 2.038627862930298} -11/06/2021 22:01:41 - INFO - __main__ - Step 5510: {'lr': 0.0004993068100415671, 'samples': 1057920, 'steps': 5509, 'loss/train': 1.877155065536499} -11/06/2021 22:01:41 - INFO - __main__ - Step 5511: {'lr': 0.000499306415075489, 'samples': 1058112, 'steps': 5510, 'loss/train': 1.7391774654388428} -11/06/2021 22:01:41 - INFO - __main__ - Step 5512: {'lr': 0.0004993060199970774, 'samples': 1058304, 'steps': 5511, 'loss/train': 2.053729772567749} -11/06/2021 22:01:42 - INFO - __main__ - Step 5513: {'lr': 0.0004993056248063323, 'samples': 1058496, 'steps': 5512, 'loss/train': 2.05024790763855} -11/06/2021 22:01:43 - INFO - __main__ - Step 5514: {'lr': 0.000499305229503254, 'samples': 1058688, 'steps': 5513, 'loss/train': 1.8646981716156006} -11/06/2021 22:01:43 - INFO - __main__ - Step 5515: {'lr': 0.0004993048340878425, 'samples': 1058880, 'steps': 5514, 'loss/train': 2.1601507663726807} -11/06/2021 22:01:44 - INFO - __main__ - Step 5516: {'lr': 0.0004993044385600982, 'samples': 1059072, 'steps': 5515, 'loss/train': 1.9711893796920776} -11/06/2021 22:01:44 - INFO - __main__ - Step 5517: {'lr': 0.0004993040429200211, 'samples': 1059264, 'steps': 5516, 'loss/train': 2.012702465057373} -11/06/2021 22:01:44 - INFO - __main__ - Step 5518: {'lr': 0.0004993036471676115, 'samples': 1059456, 'steps': 5517, 'loss/train': 1.4311362504959106} -11/06/2021 22:01:45 - INFO - __main__ - Step 5519: {'lr': 0.0004993032513028695, 'samples': 1059648, 'steps': 5518, 'loss/train': 1.7759687900543213} -11/06/2021 22:01:45 - INFO - __main__ - Step 5520: {'lr': 0.0004993028553257952, 'samples': 1059840, 'steps': 5519, 'loss/train': 2.569220781326294} -11/06/2021 22:01:46 - INFO - __main__ - Step 5521: {'lr': 0.000499302459236389, 'samples': 1060032, 'steps': 5520, 'loss/train': 1.6093146800994873} -11/06/2021 22:01:46 - INFO - __main__ - Step 5522: {'lr': 0.0004993020630346509, 'samples': 1060224, 'steps': 5521, 'loss/train': 2.444692611694336} -11/06/2021 22:01:47 - INFO - __main__ - Step 5523: {'lr': 0.0004993016667205812, 'samples': 1060416, 'steps': 5522, 'loss/train': 2.1542999744415283} -11/06/2021 22:01:48 - INFO - __main__ - Step 5524: {'lr': 0.0004993012702941799, 'samples': 1060608, 'steps': 5523, 'loss/train': 1.754870891571045} -11/06/2021 22:01:48 - INFO - __main__ - Step 5525: {'lr': 0.0004993008737554474, 'samples': 1060800, 'steps': 5524, 'loss/train': 1.7959246635437012} -11/06/2021 22:01:48 - INFO - __main__ - Step 5526: {'lr': 0.0004993004771043837, 'samples': 1060992, 'steps': 5525, 'loss/train': 2.041109800338745} -11/06/2021 22:01:49 - INFO - __main__ - Step 5527: {'lr': 0.0004993000803409891, 'samples': 1061184, 'steps': 5526, 'loss/train': 2.20894455909729} -11/06/2021 22:01:49 - INFO - __main__ - Step 5528: {'lr': 0.0004992996834652638, 'samples': 1061376, 'steps': 5527, 'loss/train': 1.942233681678772} -11/06/2021 22:01:50 - INFO - __main__ - Step 5529: {'lr': 0.0004992992864772079, 'samples': 1061568, 'steps': 5528, 'loss/train': 1.7475767135620117} -11/06/2021 22:01:50 - INFO - __main__ - Step 5530: {'lr': 0.0004992988893768214, 'samples': 1061760, 'steps': 5529, 'loss/train': 2.076091766357422} -11/06/2021 22:01:51 - INFO - __main__ - Step 5531: {'lr': 0.0004992984921641048, 'samples': 1061952, 'steps': 5530, 'loss/train': 2.0082509517669678} -11/06/2021 22:01:51 - INFO - __main__ - Step 5532: {'lr': 0.0004992980948390582, 'samples': 1062144, 'steps': 5531, 'loss/train': 1.9930384159088135} -11/06/2021 22:01:51 - INFO - __main__ - Step 5533: {'lr': 0.0004992976974016817, 'samples': 1062336, 'steps': 5532, 'loss/train': 2.128443479537964} -11/06/2021 22:01:52 - INFO - __main__ - Step 5534: {'lr': 0.0004992972998519755, 'samples': 1062528, 'steps': 5533, 'loss/train': 1.8396596908569336} -11/06/2021 22:01:53 - INFO - __main__ - Step 5535: {'lr': 0.0004992969021899397, 'samples': 1062720, 'steps': 5534, 'loss/train': 1.7834552526474} -11/06/2021 22:01:53 - INFO - __main__ - Step 5536: {'lr': 0.0004992965044155746, 'samples': 1062912, 'steps': 5535, 'loss/train': 1.7400227785110474} -11/06/2021 22:01:54 - INFO - __main__ - Step 5537: {'lr': 0.0004992961065288803, 'samples': 1063104, 'steps': 5536, 'loss/train': 1.9240829944610596} -11/06/2021 22:01:54 - INFO - __main__ - Step 5538: {'lr': 0.0004992957085298571, 'samples': 1063296, 'steps': 5537, 'loss/train': 1.3260631561279297} -11/06/2021 22:01:54 - INFO - __main__ - Step 5539: {'lr': 0.0004992953104185052, 'samples': 1063488, 'steps': 5538, 'loss/train': 1.4942200183868408} -11/06/2021 22:01:55 - INFO - __main__ - Step 5540: {'lr': 0.0004992949121948245, 'samples': 1063680, 'steps': 5539, 'loss/train': 1.48552668094635} -11/06/2021 22:01:56 - INFO - __main__ - Step 5541: {'lr': 0.0004992945138588154, 'samples': 1063872, 'steps': 5540, 'loss/train': 1.611240267753601} -11/06/2021 22:01:56 - INFO - __main__ - Step 5542: {'lr': 0.0004992941154104781, 'samples': 1064064, 'steps': 5541, 'loss/train': 1.437373399734497} -11/06/2021 22:01:56 - INFO - __main__ - Step 5543: {'lr': 0.0004992937168498126, 'samples': 1064256, 'steps': 5542, 'loss/train': 1.7761310338974} -11/06/2021 22:01:57 - INFO - __main__ - Step 5544: {'lr': 0.0004992933181768194, 'samples': 1064448, 'steps': 5543, 'loss/train': 2.0214922428131104} -11/06/2021 22:01:58 - INFO - __main__ - Step 5545: {'lr': 0.0004992929193914983, 'samples': 1064640, 'steps': 5544, 'loss/train': 1.7681033611297607} -11/06/2021 22:01:58 - INFO - __main__ - Step 5546: {'lr': 0.0004992925204938498, 'samples': 1064832, 'steps': 5545, 'loss/train': 2.075996160507202} -11/06/2021 22:01:59 - INFO - __main__ - Step 5547: {'lr': 0.0004992921214838738, 'samples': 1065024, 'steps': 5546, 'loss/train': 1.834026575088501} -11/06/2021 22:01:59 - INFO - __main__ - Step 5548: {'lr': 0.0004992917223615706, 'samples': 1065216, 'steps': 5547, 'loss/train': 1.4636272192001343} -11/06/2021 22:01:59 - INFO - __main__ - Step 5549: {'lr': 0.0004992913231269405, 'samples': 1065408, 'steps': 5548, 'loss/train': 1.9245575666427612} -11/06/2021 22:02:00 - INFO - __main__ - Step 5550: {'lr': 0.0004992909237799835, 'samples': 1065600, 'steps': 5549, 'loss/train': 2.2728660106658936} -11/06/2021 22:02:01 - INFO - __main__ - Step 5551: {'lr': 0.0004992905243206999, 'samples': 1065792, 'steps': 5550, 'loss/train': 1.8605475425720215} -11/06/2021 22:02:01 - INFO - __main__ - Step 5552: {'lr': 0.0004992901247490899, 'samples': 1065984, 'steps': 5551, 'loss/train': 2.065237522125244} -11/06/2021 22:02:01 - INFO - __main__ - Step 5553: {'lr': 0.0004992897250651535, 'samples': 1066176, 'steps': 5552, 'loss/train': 2.103445529937744} -11/06/2021 22:02:02 - INFO - __main__ - Step 5554: {'lr': 0.000499289325268891, 'samples': 1066368, 'steps': 5553, 'loss/train': 1.8733552694320679} -11/06/2021 22:02:03 - INFO - __main__ - Step 5555: {'lr': 0.0004992889253603027, 'samples': 1066560, 'steps': 5554, 'loss/train': 1.6204419136047363} -11/06/2021 22:02:03 - INFO - __main__ - Step 5556: {'lr': 0.0004992885253393885, 'samples': 1066752, 'steps': 5555, 'loss/train': 1.7640080451965332} -11/06/2021 22:02:04 - INFO - __main__ - Step 5557: {'lr': 0.0004992881252061489, 'samples': 1066944, 'steps': 5556, 'loss/train': 1.724705457687378} -11/06/2021 22:02:04 - INFO - __main__ - Step 5558: {'lr': 0.0004992877249605838, 'samples': 1067136, 'steps': 5557, 'loss/train': 2.2034895420074463} -11/06/2021 22:02:04 - INFO - __main__ - Step 5559: {'lr': 0.0004992873246026935, 'samples': 1067328, 'steps': 5558, 'loss/train': 2.039024591445923} -11/06/2021 22:02:05 - INFO - __main__ - Step 5560: {'lr': 0.0004992869241324783, 'samples': 1067520, 'steps': 5559, 'loss/train': 1.9477410316467285} -11/06/2021 22:02:06 - INFO - __main__ - Step 5561: {'lr': 0.000499286523549938, 'samples': 1067712, 'steps': 5560, 'loss/train': 1.9774774312973022} -11/06/2021 22:02:06 - INFO - __main__ - Step 5562: {'lr': 0.0004992861228550733, 'samples': 1067904, 'steps': 5561, 'loss/train': 2.137509822845459} -11/06/2021 22:02:06 - INFO - __main__ - Step 5563: {'lr': 0.0004992857220478841, 'samples': 1068096, 'steps': 5562, 'loss/train': 1.9436842203140259} -11/06/2021 22:02:07 - INFO - __main__ - Step 5564: {'lr': 0.0004992853211283705, 'samples': 1068288, 'steps': 5563, 'loss/train': 2.0045459270477295} -11/06/2021 22:02:08 - INFO - __main__ - Step 5565: {'lr': 0.0004992849200965327, 'samples': 1068480, 'steps': 5564, 'loss/train': 1.8353327512741089} -11/06/2021 22:02:08 - INFO - __main__ - Step 5566: {'lr': 0.0004992845189523711, 'samples': 1068672, 'steps': 5565, 'loss/train': 2.0094947814941406} -11/06/2021 22:02:08 - INFO - __main__ - Step 5567: {'lr': 0.0004992841176958858, 'samples': 1068864, 'steps': 5566, 'loss/train': 1.8892325162887573} -11/06/2021 22:02:09 - INFO - __main__ - Step 5568: {'lr': 0.0004992837163270769, 'samples': 1069056, 'steps': 5567, 'loss/train': 1.280644178390503} -11/06/2021 22:02:09 - INFO - __main__ - Step 5569: {'lr': 0.0004992833148459445, 'samples': 1069248, 'steps': 5568, 'loss/train': 2.168335199356079} -11/06/2021 22:02:10 - INFO - __main__ - Step 5570: {'lr': 0.0004992829132524889, 'samples': 1069440, 'steps': 5569, 'loss/train': 1.7364050149917603} -11/06/2021 22:02:11 - INFO - __main__ - Step 5571: {'lr': 0.0004992825115467102, 'samples': 1069632, 'steps': 5570, 'loss/train': 1.8209835290908813} -11/06/2021 22:02:11 - INFO - __main__ - Step 5572: {'lr': 0.0004992821097286088, 'samples': 1069824, 'steps': 5571, 'loss/train': 2.0928235054016113} -11/06/2021 22:02:11 - INFO - __main__ - Step 5573: {'lr': 0.0004992817077981846, 'samples': 1070016, 'steps': 5572, 'loss/train': 1.939453125} -11/06/2021 22:02:12 - INFO - __main__ - Step 5574: {'lr': 0.000499281305755438, 'samples': 1070208, 'steps': 5573, 'loss/train': 1.4345474243164062} -11/06/2021 22:02:13 - INFO - __main__ - Step 5575: {'lr': 0.0004992809036003691, 'samples': 1070400, 'steps': 5574, 'loss/train': 1.5226601362228394} -11/06/2021 22:02:13 - INFO - __main__ - Step 5576: {'lr': 0.000499280501332978, 'samples': 1070592, 'steps': 5575, 'loss/train': 1.6950485706329346} -11/06/2021 22:02:13 - INFO - __main__ - Step 5577: {'lr': 0.000499280098953265, 'samples': 1070784, 'steps': 5576, 'loss/train': 1.7863175868988037} -11/06/2021 22:02:14 - INFO - __main__ - Step 5578: {'lr': 0.0004992796964612302, 'samples': 1070976, 'steps': 5577, 'loss/train': 2.1370227336883545} -11/06/2021 22:02:14 - INFO - __main__ - Step 5579: {'lr': 0.0004992792938568739, 'samples': 1071168, 'steps': 5578, 'loss/train': 1.6954041719436646} -11/06/2021 22:02:15 - INFO - __main__ - Step 5580: {'lr': 0.0004992788911401961, 'samples': 1071360, 'steps': 5579, 'loss/train': 1.965846300125122} -11/06/2021 22:02:15 - INFO - __main__ - Step 5581: {'lr': 0.0004992784883111972, 'samples': 1071552, 'steps': 5580, 'loss/train': 2.0566160678863525} -11/06/2021 22:02:16 - INFO - __main__ - Step 5582: {'lr': 0.0004992780853698771, 'samples': 1071744, 'steps': 5581, 'loss/train': 2.0826704502105713} -11/06/2021 22:02:16 - INFO - __main__ - Step 5583: {'lr': 0.0004992776823162362, 'samples': 1071936, 'steps': 5582, 'loss/train': 1.6253973245620728} -11/06/2021 22:02:16 - INFO - __main__ - Step 5584: {'lr': 0.0004992772791502746, 'samples': 1072128, 'steps': 5583, 'loss/train': 1.7292557954788208} -11/06/2021 22:02:18 - INFO - __main__ - Step 5585: {'lr': 0.0004992768758719926, 'samples': 1072320, 'steps': 5584, 'loss/train': 2.4336965084075928} -11/06/2021 22:02:18 - INFO - __main__ - Step 5586: {'lr': 0.0004992764724813902, 'samples': 1072512, 'steps': 5585, 'loss/train': 1.5816513299942017} -11/06/2021 22:02:18 - INFO - __main__ - Step 5587: {'lr': 0.0004992760689784677, 'samples': 1072704, 'steps': 5586, 'loss/train': 1.2834484577178955} -11/06/2021 22:02:19 - INFO - __main__ - Step 5588: {'lr': 0.0004992756653632252, 'samples': 1072896, 'steps': 5587, 'loss/train': 2.1524899005889893} -11/06/2021 22:02:19 - INFO - __main__ - Step 5589: {'lr': 0.0004992752616356631, 'samples': 1073088, 'steps': 5588, 'loss/train': 2.2790422439575195} -11/06/2021 22:02:19 - INFO - __main__ - Step 5590: {'lr': 0.0004992748577957812, 'samples': 1073280, 'steps': 5589, 'loss/train': 1.7279716730117798} -11/06/2021 22:02:21 - INFO - __main__ - Step 5591: {'lr': 0.00049927445384358, 'samples': 1073472, 'steps': 5590, 'loss/train': 1.8624963760375977} -11/06/2021 22:02:21 - INFO - __main__ - Step 5592: {'lr': 0.0004992740497790595, 'samples': 1073664, 'steps': 5591, 'loss/train': 2.11755108833313} -11/06/2021 22:02:21 - INFO - __main__ - Step 5593: {'lr': 0.0004992736456022201, 'samples': 1073856, 'steps': 5592, 'loss/train': 6.259105205535889} -11/06/2021 22:02:22 - INFO - __main__ - Step 5594: {'lr': 0.0004992732413130617, 'samples': 1074048, 'steps': 5593, 'loss/train': 2.766812562942505} -11/06/2021 22:02:22 - INFO - __main__ - Step 5595: {'lr': 0.0004992728369115848, 'samples': 1074240, 'steps': 5594, 'loss/train': 0.8529731631278992} -11/06/2021 22:02:22 - INFO - __main__ - Step 5596: {'lr': 0.0004992724323977893, 'samples': 1074432, 'steps': 5595, 'loss/train': 1.5423051118850708} -11/06/2021 22:02:23 - INFO - __main__ - Step 5597: {'lr': 0.0004992720277716755, 'samples': 1074624, 'steps': 5596, 'loss/train': 1.7895461320877075} -11/06/2021 22:02:24 - INFO - __main__ - Step 5598: {'lr': 0.0004992716230332435, 'samples': 1074816, 'steps': 5597, 'loss/train': 1.8931951522827148} -11/06/2021 22:02:24 - INFO - __main__ - Step 5599: {'lr': 0.0004992712181824936, 'samples': 1075008, 'steps': 5598, 'loss/train': 2.938845634460449} -11/06/2021 22:02:24 - INFO - __main__ - Step 5600: {'lr': 0.0004992708132194259, 'samples': 1075200, 'steps': 5599, 'loss/train': 1.7190282344818115} -11/06/2021 22:02:25 - INFO - __main__ - Step 5601: {'lr': 0.0004992704081440407, 'samples': 1075392, 'steps': 5600, 'loss/train': 2.1930367946624756} -11/06/2021 22:02:26 - INFO - __main__ - Step 5602: {'lr': 0.0004992700029563381, 'samples': 1075584, 'steps': 5601, 'loss/train': 1.8844269514083862} -11/06/2021 22:02:26 - INFO - __main__ - Step 5603: {'lr': 0.0004992695976563182, 'samples': 1075776, 'steps': 5602, 'loss/train': 2.1230838298797607} -11/06/2021 22:02:26 - INFO - __main__ - Step 5604: {'lr': 0.0004992691922439814, 'samples': 1075968, 'steps': 5603, 'loss/train': 1.6668339967727661} -11/06/2021 22:02:27 - INFO - __main__ - Step 5605: {'lr': 0.0004992687867193277, 'samples': 1076160, 'steps': 5604, 'loss/train': 1.7833575010299683} -11/06/2021 22:02:27 - INFO - __main__ - Step 5606: {'lr': 0.0004992683810823572, 'samples': 1076352, 'steps': 5605, 'loss/train': 1.914794683456421} -11/06/2021 22:02:28 - INFO - __main__ - Step 5607: {'lr': 0.0004992679753330703, 'samples': 1076544, 'steps': 5606, 'loss/train': 1.698716163635254} -11/06/2021 22:02:28 - INFO - __main__ - Step 5608: {'lr': 0.0004992675694714671, 'samples': 1076736, 'steps': 5607, 'loss/train': 2.1556620597839355} -11/06/2021 22:02:29 - INFO - __main__ - Step 5609: {'lr': 0.0004992671634975477, 'samples': 1076928, 'steps': 5608, 'loss/train': 1.4872366189956665} -11/06/2021 22:02:29 - INFO - __main__ - Step 5610: {'lr': 0.0004992667574113125, 'samples': 1077120, 'steps': 5609, 'loss/train': 1.928450345993042} -11/06/2021 22:02:29 - INFO - __main__ - Step 5611: {'lr': 0.0004992663512127615, 'samples': 1077312, 'steps': 5610, 'loss/train': 2.2512283325195312} -11/06/2021 22:02:31 - INFO - __main__ - Step 5612: {'lr': 0.0004992659449018949, 'samples': 1077504, 'steps': 5611, 'loss/train': 1.50386643409729} -11/06/2021 22:02:31 - INFO - __main__ - Step 5613: {'lr': 0.0004992655384787129, 'samples': 1077696, 'steps': 5612, 'loss/train': 2.3416426181793213} -11/06/2021 22:02:31 - INFO - __main__ - Step 5614: {'lr': 0.0004992651319432157, 'samples': 1077888, 'steps': 5613, 'loss/train': 2.967033863067627} -11/06/2021 22:02:32 - INFO - __main__ - Step 5615: {'lr': 0.0004992647252954035, 'samples': 1078080, 'steps': 5614, 'loss/train': 2.203519582748413} -11/06/2021 22:02:32 - INFO - __main__ - Step 5616: {'lr': 0.0004992643185352765, 'samples': 1078272, 'steps': 5615, 'loss/train': 2.0697097778320312} -11/06/2021 22:02:32 - INFO - __main__ - Step 5617: {'lr': 0.0004992639116628349, 'samples': 1078464, 'steps': 5616, 'loss/train': 2.1669209003448486} -11/06/2021 22:02:34 - INFO - __main__ - Step 5618: {'lr': 0.0004992635046780786, 'samples': 1078656, 'steps': 5617, 'loss/train': 2.434951066970825} -11/06/2021 22:02:34 - INFO - __main__ - Step 5619: {'lr': 0.0004992630975810083, 'samples': 1078848, 'steps': 5618, 'loss/train': 2.055948257446289} -11/06/2021 22:02:35 - INFO - __main__ - Step 5620: {'lr': 0.0004992626903716237, 'samples': 1079040, 'steps': 5619, 'loss/train': 0.3906489312648773} -11/06/2021 22:02:35 - INFO - __main__ - Step 5621: {'lr': 0.0004992622830499252, 'samples': 1079232, 'steps': 5620, 'loss/train': 0.3192686438560486} -11/06/2021 22:02:35 - INFO - __main__ - Step 5622: {'lr': 0.000499261875615913, 'samples': 1079424, 'steps': 5621, 'loss/train': 1.627442479133606} -11/06/2021 22:02:36 - INFO - __main__ - Step 5623: {'lr': 0.0004992614680695872, 'samples': 1079616, 'steps': 5622, 'loss/train': 2.138500452041626} -11/06/2021 22:02:37 - INFO - __main__ - Step 5624: {'lr': 0.0004992610604109481, 'samples': 1079808, 'steps': 5623, 'loss/train': 2.165574312210083} -11/06/2021 22:02:37 - INFO - __main__ - Step 5625: {'lr': 0.0004992606526399957, 'samples': 1080000, 'steps': 5624, 'loss/train': 1.8479472398757935} -11/06/2021 22:02:37 - INFO - __main__ - Step 5626: {'lr': 0.0004992602447567304, 'samples': 1080192, 'steps': 5625, 'loss/train': 2.4740467071533203} -11/06/2021 22:02:38 - INFO - __main__ - Step 5627: {'lr': 0.0004992598367611523, 'samples': 1080384, 'steps': 5626, 'loss/train': 1.5033149719238281} -11/06/2021 22:02:38 - INFO - __main__ - Step 5628: {'lr': 0.0004992594286532615, 'samples': 1080576, 'steps': 5627, 'loss/train': 1.958828330039978} -11/06/2021 22:02:39 - INFO - __main__ - Step 5629: {'lr': 0.0004992590204330583, 'samples': 1080768, 'steps': 5628, 'loss/train': 1.696641445159912} -11/06/2021 22:02:39 - INFO - __main__ - Step 5630: {'lr': 0.0004992586121005427, 'samples': 1080960, 'steps': 5629, 'loss/train': 0.8877306580543518} -11/06/2021 22:02:40 - INFO - __main__ - Step 5631: {'lr': 0.0004992582036557152, 'samples': 1081152, 'steps': 5630, 'loss/train': 2.333393096923828} -11/06/2021 22:02:40 - INFO - __main__ - Step 5632: {'lr': 0.0004992577950985757, 'samples': 1081344, 'steps': 5631, 'loss/train': 2.0259532928466797} -11/06/2021 22:02:40 - INFO - __main__ - Step 5633: {'lr': 0.0004992573864291244, 'samples': 1081536, 'steps': 5632, 'loss/train': 1.8936342000961304} -11/06/2021 22:02:41 - INFO - __main__ - Step 5634: {'lr': 0.0004992569776473616, 'samples': 1081728, 'steps': 5633, 'loss/train': 1.8749663829803467} -11/06/2021 22:02:42 - INFO - __main__ - Step 5635: {'lr': 0.0004992565687532875, 'samples': 1081920, 'steps': 5634, 'loss/train': 1.5571837425231934} -11/06/2021 22:02:42 - INFO - __main__ - Step 5636: {'lr': 0.0004992561597469023, 'samples': 1082112, 'steps': 5635, 'loss/train': 2.0260841846466064} -11/06/2021 22:02:42 - INFO - __main__ - Step 5637: {'lr': 0.0004992557506282061, 'samples': 1082304, 'steps': 5636, 'loss/train': 1.9845712184906006} -11/06/2021 22:02:43 - INFO - __main__ - Step 5638: {'lr': 0.0004992553413971991, 'samples': 1082496, 'steps': 5637, 'loss/train': 1.8022942543029785} -11/06/2021 22:02:44 - INFO - __main__ - Step 5639: {'lr': 0.0004992549320538814, 'samples': 1082688, 'steps': 5638, 'loss/train': 2.3104302883148193} -11/06/2021 22:02:44 - INFO - __main__ - Step 5640: {'lr': 0.0004992545225982533, 'samples': 1082880, 'steps': 5639, 'loss/train': 1.7610740661621094} -11/06/2021 22:02:45 - INFO - __main__ - Step 5641: {'lr': 0.000499254113030315, 'samples': 1083072, 'steps': 5640, 'loss/train': 1.8128447532653809} -11/06/2021 22:02:45 - INFO - __main__ - Step 5642: {'lr': 0.0004992537033500667, 'samples': 1083264, 'steps': 5641, 'loss/train': 1.8965189456939697} -11/06/2021 22:02:45 - INFO - __main__ - Step 5643: {'lr': 0.0004992532935575084, 'samples': 1083456, 'steps': 5642, 'loss/train': 2.2873661518096924} -11/06/2021 22:02:46 - INFO - __main__ - Step 5644: {'lr': 0.0004992528836526405, 'samples': 1083648, 'steps': 5643, 'loss/train': 2.314706325531006} -11/06/2021 22:02:47 - INFO - __main__ - Step 5645: {'lr': 0.0004992524736354631, 'samples': 1083840, 'steps': 5644, 'loss/train': 2.096315622329712} -11/06/2021 22:02:47 - INFO - __main__ - Step 5646: {'lr': 0.0004992520635059762, 'samples': 1084032, 'steps': 5645, 'loss/train': 1.736008644104004} -11/06/2021 22:02:47 - INFO - __main__ - Step 5647: {'lr': 0.0004992516532641804, 'samples': 1084224, 'steps': 5646, 'loss/train': 1.71793794631958} -11/06/2021 22:02:48 - INFO - __main__ - Step 5648: {'lr': 0.0004992512429100757, 'samples': 1084416, 'steps': 5647, 'loss/train': 1.7612890005111694} -11/06/2021 22:02:49 - INFO - __main__ - Step 5649: {'lr': 0.000499250832443662, 'samples': 1084608, 'steps': 5648, 'loss/train': 2.2662413120269775} -11/06/2021 22:02:49 - INFO - __main__ - Step 5650: {'lr': 0.0004992504218649398, 'samples': 1084800, 'steps': 5649, 'loss/train': 1.443153977394104} -11/06/2021 22:02:50 - INFO - __main__ - Step 5651: {'lr': 0.0004992500111739093, 'samples': 1084992, 'steps': 5650, 'loss/train': 2.055508852005005} -11/06/2021 22:02:50 - INFO - __main__ - Step 5652: {'lr': 0.0004992496003705705, 'samples': 1085184, 'steps': 5651, 'loss/train': 2.131808042526245} -11/06/2021 22:02:50 - INFO - __main__ - Step 5653: {'lr': 0.0004992491894549236, 'samples': 1085376, 'steps': 5652, 'loss/train': 1.7326874732971191} -11/06/2021 22:02:51 - INFO - __main__ - Step 5654: {'lr': 0.000499248778426969, 'samples': 1085568, 'steps': 5653, 'loss/train': 2.14742374420166} -11/06/2021 22:02:52 - INFO - __main__ - Step 5655: {'lr': 0.0004992483672867068, 'samples': 1085760, 'steps': 5654, 'loss/train': 1.887015461921692} -11/06/2021 22:02:52 - INFO - __main__ - Step 5656: {'lr': 0.000499247956034137, 'samples': 1085952, 'steps': 5655, 'loss/train': 0.4538571536540985} -11/06/2021 22:02:52 - INFO - __main__ - Step 5657: {'lr': 0.00049924754466926, 'samples': 1086144, 'steps': 5656, 'loss/train': 2.187472105026245} -11/06/2021 22:02:53 - INFO - __main__ - Step 5658: {'lr': 0.0004992471331920758, 'samples': 1086336, 'steps': 5657, 'loss/train': 1.9629387855529785} -11/06/2021 22:02:53 - INFO - __main__ - Step 5659: {'lr': 0.0004992467216025848, 'samples': 1086528, 'steps': 5658, 'loss/train': 2.4174067974090576} -11/06/2021 22:02:54 - INFO - __main__ - Step 5660: {'lr': 0.0004992463099007871, 'samples': 1086720, 'steps': 5659, 'loss/train': 1.6454474925994873} -11/06/2021 22:02:54 - INFO - __main__ - Step 5661: {'lr': 0.0004992458980866827, 'samples': 1086912, 'steps': 5660, 'loss/train': 1.8920400142669678} -11/06/2021 22:02:55 - INFO - __main__ - Step 5662: {'lr': 0.000499245486160272, 'samples': 1087104, 'steps': 5661, 'loss/train': 1.9282915592193604} -11/06/2021 22:02:55 - INFO - __main__ - Step 5663: {'lr': 0.0004992450741215552, 'samples': 1087296, 'steps': 5662, 'loss/train': 1.9078826904296875} -11/06/2021 22:02:55 - INFO - __main__ - Step 5664: {'lr': 0.0004992446619705324, 'samples': 1087488, 'steps': 5663, 'loss/train': 1.9330226182937622} -11/06/2021 22:02:56 - INFO - __main__ - Step 5665: {'lr': 0.0004992442497072037, 'samples': 1087680, 'steps': 5664, 'loss/train': 1.8962855339050293} -11/06/2021 22:02:57 - INFO - __main__ - Step 5666: {'lr': 0.0004992438373315694, 'samples': 1087872, 'steps': 5665, 'loss/train': 1.5366052389144897} -11/06/2021 22:02:57 - INFO - __main__ - Step 5667: {'lr': 0.0004992434248436298, 'samples': 1088064, 'steps': 5666, 'loss/train': 1.221272587776184} -11/06/2021 22:02:57 - INFO - __main__ - Step 5668: {'lr': 0.0004992430122433848, 'samples': 1088256, 'steps': 5667, 'loss/train': 1.9391791820526123} -11/06/2021 22:02:58 - INFO - __main__ - Step 5669: {'lr': 0.0004992425995308349, 'samples': 1088448, 'steps': 5668, 'loss/train': 1.7548898458480835} -11/06/2021 22:02:59 - INFO - __main__ - Step 5670: {'lr': 0.0004992421867059801, 'samples': 1088640, 'steps': 5669, 'loss/train': 1.8856055736541748} -11/06/2021 22:02:59 - INFO - __main__ - Step 5671: {'lr': 0.0004992417737688206, 'samples': 1088832, 'steps': 5670, 'loss/train': 1.850290298461914} -11/06/2021 22:02:59 - INFO - __main__ - Step 5672: {'lr': 0.0004992413607193566, 'samples': 1089024, 'steps': 5671, 'loss/train': 2.0641515254974365} -11/06/2021 22:03:00 - INFO - __main__ - Step 5673: {'lr': 0.0004992409475575882, 'samples': 1089216, 'steps': 5672, 'loss/train': 2.626786231994629} -11/06/2021 22:03:00 - INFO - __main__ - Step 5674: {'lr': 0.0004992405342835158, 'samples': 1089408, 'steps': 5673, 'loss/train': 1.913179636001587} -11/06/2021 22:03:01 - INFO - __main__ - Step 5675: {'lr': 0.0004992401208971394, 'samples': 1089600, 'steps': 5674, 'loss/train': 2.4290151596069336} -11/06/2021 22:03:02 - INFO - __main__ - Step 5676: {'lr': 0.0004992397073984592, 'samples': 1089792, 'steps': 5675, 'loss/train': 1.8842289447784424} -11/06/2021 22:03:02 - INFO - __main__ - Step 5677: {'lr': 0.0004992392937874755, 'samples': 1089984, 'steps': 5676, 'loss/train': 1.9053252935409546} -11/06/2021 22:03:02 - INFO - __main__ - Step 5678: {'lr': 0.0004992388800641885, 'samples': 1090176, 'steps': 5677, 'loss/train': 2.1851115226745605} -11/06/2021 22:03:03 - INFO - __main__ - Step 5679: {'lr': 0.0004992384662285981, 'samples': 1090368, 'steps': 5678, 'loss/train': 1.9551331996917725} -11/06/2021 22:03:04 - INFO - __main__ - Step 5680: {'lr': 0.0004992380522807049, 'samples': 1090560, 'steps': 5679, 'loss/train': 2.1385090351104736} -11/06/2021 22:03:04 - INFO - __main__ - Step 5681: {'lr': 0.0004992376382205088, 'samples': 1090752, 'steps': 5680, 'loss/train': 0.955967903137207} -11/06/2021 22:03:04 - INFO - __main__ - Step 5682: {'lr': 0.00049923722404801, 'samples': 1090944, 'steps': 5681, 'loss/train': 1.333667278289795} -11/06/2021 22:03:05 - INFO - __main__ - Step 5683: {'lr': 0.0004992368097632089, 'samples': 1091136, 'steps': 5682, 'loss/train': 2.1074047088623047} -11/06/2021 22:03:05 - INFO - __main__ - Step 5684: {'lr': 0.0004992363953661054, 'samples': 1091328, 'steps': 5683, 'loss/train': 1.597164273262024} -11/06/2021 22:03:06 - INFO - __main__ - Step 5685: {'lr': 0.0004992359808566999, 'samples': 1091520, 'steps': 5684, 'loss/train': 4.272282600402832} -11/06/2021 22:03:06 - INFO - __main__ - Step 5686: {'lr': 0.0004992355662349925, 'samples': 1091712, 'steps': 5685, 'loss/train': 2.0851457118988037} -11/06/2021 22:03:07 - INFO - __main__ - Step 5687: {'lr': 0.0004992351515009833, 'samples': 1091904, 'steps': 5686, 'loss/train': 1.8593014478683472} -11/06/2021 22:03:07 - INFO - __main__ - Step 5688: {'lr': 0.0004992347366546727, 'samples': 1092096, 'steps': 5687, 'loss/train': 2.107888698577881} -11/06/2021 22:03:07 - INFO - __main__ - Step 5689: {'lr': 0.0004992343216960607, 'samples': 1092288, 'steps': 5688, 'loss/train': 1.92064368724823} -11/06/2021 22:03:09 - INFO - __main__ - Step 5690: {'lr': 0.0004992339066251476, 'samples': 1092480, 'steps': 5689, 'loss/train': 1.6505532264709473} -11/06/2021 22:03:09 - INFO - __main__ - Step 5691: {'lr': 0.0004992334914419337, 'samples': 1092672, 'steps': 5690, 'loss/train': 1.4800523519515991} -11/06/2021 22:03:09 - INFO - __main__ - Step 5692: {'lr': 0.0004992330761464188, 'samples': 1092864, 'steps': 5691, 'loss/train': 1.566269874572754} -11/06/2021 22:03:10 - INFO - __main__ - Step 5693: {'lr': 0.0004992326607386034, 'samples': 1093056, 'steps': 5692, 'loss/train': 2.7816977500915527} -11/06/2021 22:03:10 - INFO - __main__ - Step 5694: {'lr': 0.0004992322452184876, 'samples': 1093248, 'steps': 5693, 'loss/train': 2.2784321308135986} -11/06/2021 22:03:10 - INFO - __main__ - Step 5695: {'lr': 0.0004992318295860718, 'samples': 1093440, 'steps': 5694, 'loss/train': 1.6132631301879883} -11/06/2021 22:03:11 - INFO - __main__ - Step 5696: {'lr': 0.0004992314138413557, 'samples': 1093632, 'steps': 5695, 'loss/train': 1.0506314039230347} -11/06/2021 22:03:12 - INFO - __main__ - Step 5697: {'lr': 0.0004992309979843398, 'samples': 1093824, 'steps': 5696, 'loss/train': 1.6640676259994507} -11/06/2021 22:03:12 - INFO - __main__ - Step 5698: {'lr': 0.0004992305820150243, 'samples': 1094016, 'steps': 5697, 'loss/train': 2.264589548110962} -11/06/2021 22:03:12 - INFO - __main__ - Step 5699: {'lr': 0.0004992301659334095, 'samples': 1094208, 'steps': 5698, 'loss/train': 1.779240369796753} -11/06/2021 22:03:13 - INFO - __main__ - Step 5700: {'lr': 0.0004992297497394953, 'samples': 1094400, 'steps': 5699, 'loss/train': 1.5789347887039185} -11/06/2021 22:03:14 - INFO - __main__ - Step 5701: {'lr': 0.000499229333433282, 'samples': 1094592, 'steps': 5700, 'loss/train': 1.8561713695526123} -11/06/2021 22:03:14 - INFO - __main__ - Step 5702: {'lr': 0.0004992289170147699, 'samples': 1094784, 'steps': 5701, 'loss/train': 2.206258535385132} -11/06/2021 22:03:15 - INFO - __main__ - Step 5703: {'lr': 0.000499228500483959, 'samples': 1094976, 'steps': 5702, 'loss/train': 1.1616374254226685} -11/06/2021 22:03:15 - INFO - __main__ - Step 5704: {'lr': 0.0004992280838408496, 'samples': 1095168, 'steps': 5703, 'loss/train': 2.011932611465454} -11/06/2021 22:03:15 - INFO - __main__ - Step 5705: {'lr': 0.0004992276670854419, 'samples': 1095360, 'steps': 5704, 'loss/train': 2.265223503112793} -11/06/2021 22:03:16 - INFO - __main__ - Step 5706: {'lr': 0.000499227250217736, 'samples': 1095552, 'steps': 5705, 'loss/train': 1.879677414894104} -11/06/2021 22:03:17 - INFO - __main__ - Step 5707: {'lr': 0.0004992268332377323, 'samples': 1095744, 'steps': 5706, 'loss/train': 1.6559354066848755} -11/06/2021 22:03:17 - INFO - __main__ - Step 5708: {'lr': 0.0004992264161454306, 'samples': 1095936, 'steps': 5707, 'loss/train': 2.132072925567627} -11/06/2021 22:03:17 - INFO - __main__ - Step 5709: {'lr': 0.0004992259989408316, 'samples': 1096128, 'steps': 5708, 'loss/train': 3.037383556365967} -11/06/2021 22:03:18 - INFO - __main__ - Step 5710: {'lr': 0.000499225581623935, 'samples': 1096320, 'steps': 5709, 'loss/train': 2.0813891887664795} -11/06/2021 22:03:18 - INFO - __main__ - Step 5711: {'lr': 0.0004992251641947412, 'samples': 1096512, 'steps': 5710, 'loss/train': 1.6070504188537598} -11/06/2021 22:03:19 - INFO - __main__ - Step 5712: {'lr': 0.0004992247466532504, 'samples': 1096704, 'steps': 5711, 'loss/train': 1.8336153030395508} -11/06/2021 22:03:20 - INFO - __main__ - Step 5713: {'lr': 0.0004992243289994629, 'samples': 1096896, 'steps': 5712, 'loss/train': 1.5240449905395508} -11/06/2021 22:03:20 - INFO - __main__ - Step 5714: {'lr': 0.0004992239112333787, 'samples': 1097088, 'steps': 5713, 'loss/train': 2.0184898376464844} -11/06/2021 22:03:20 - INFO - __main__ - Step 5715: {'lr': 0.000499223493354998, 'samples': 1097280, 'steps': 5714, 'loss/train': 1.668257713317871} -11/06/2021 22:03:21 - INFO - __main__ - Step 5716: {'lr': 0.0004992230753643211, 'samples': 1097472, 'steps': 5715, 'loss/train': 2.1014792919158936} -11/06/2021 22:03:22 - INFO - __main__ - Step 5717: {'lr': 0.0004992226572613481, 'samples': 1097664, 'steps': 5716, 'loss/train': 2.5767147541046143} -11/06/2021 22:03:22 - INFO - __main__ - Step 5718: {'lr': 0.0004992222390460792, 'samples': 1097856, 'steps': 5717, 'loss/train': 1.6296945810317993} -11/06/2021 22:03:23 - INFO - __main__ - Step 5719: {'lr': 0.0004992218207185146, 'samples': 1098048, 'steps': 5718, 'loss/train': 1.9573607444763184} -11/06/2021 22:03:23 - INFO - __main__ - Step 5720: {'lr': 0.0004992214022786546, 'samples': 1098240, 'steps': 5719, 'loss/train': 2.1646392345428467} -11/06/2021 22:03:23 - INFO - __main__ - Step 5721: {'lr': 0.0004992209837264991, 'samples': 1098432, 'steps': 5720, 'loss/train': 1.7333484888076782} -11/06/2021 22:03:24 - INFO - __main__ - Step 5722: {'lr': 0.0004992205650620487, 'samples': 1098624, 'steps': 5721, 'loss/train': 0.6370934844017029} -11/06/2021 22:03:25 - INFO - __main__ - Step 5723: {'lr': 0.0004992201462853032, 'samples': 1098816, 'steps': 5722, 'loss/train': 1.629151701927185} -11/06/2021 22:03:25 - INFO - __main__ - Step 5724: {'lr': 0.000499219727396263, 'samples': 1099008, 'steps': 5723, 'loss/train': 1.9365618228912354} -11/06/2021 22:03:25 - INFO - __main__ - Step 5725: {'lr': 0.0004992193083949282, 'samples': 1099200, 'steps': 5724, 'loss/train': 1.9601372480392456} -11/06/2021 22:03:26 - INFO - __main__ - Step 5726: {'lr': 0.000499218889281299, 'samples': 1099392, 'steps': 5725, 'loss/train': 2.3020355701446533} -11/06/2021 22:03:27 - INFO - __main__ - Step 5727: {'lr': 0.0004992184700553756, 'samples': 1099584, 'steps': 5726, 'loss/train': 1.6674587726593018} -11/06/2021 22:03:27 - INFO - __main__ - Step 5728: {'lr': 0.0004992180507171583, 'samples': 1099776, 'steps': 5727, 'loss/train': 1.6533688306808472} -11/06/2021 22:03:28 - INFO - __main__ - Step 5729: {'lr': 0.0004992176312666472, 'samples': 1099968, 'steps': 5728, 'loss/train': 2.2179229259490967} -11/06/2021 22:03:28 - INFO - __main__ - Step 5730: {'lr': 0.0004992172117038424, 'samples': 1100160, 'steps': 5729, 'loss/train': 1.1370854377746582} -11/06/2021 22:03:28 - INFO - __main__ - Step 5731: {'lr': 0.0004992167920287443, 'samples': 1100352, 'steps': 5730, 'loss/train': 1.7039726972579956} -11/06/2021 22:03:29 - INFO - __main__ - Step 5732: {'lr': 0.0004992163722413528, 'samples': 1100544, 'steps': 5731, 'loss/train': 1.9213690757751465} -11/06/2021 22:03:30 - INFO - __main__ - Step 5733: {'lr': 0.0004992159523416683, 'samples': 1100736, 'steps': 5732, 'loss/train': 1.352500081062317} -11/06/2021 22:03:30 - INFO - __main__ - Step 5734: {'lr': 0.000499215532329691, 'samples': 1100928, 'steps': 5733, 'loss/train': 2.3343346118927} -11/06/2021 22:03:30 - INFO - __main__ - Step 5735: {'lr': 0.000499215112205421, 'samples': 1101120, 'steps': 5734, 'loss/train': 2.6258137226104736} -11/06/2021 22:03:31 - INFO - __main__ - Step 5736: {'lr': 0.0004992146919688584, 'samples': 1101312, 'steps': 5735, 'loss/train': 2.2007718086242676} -11/06/2021 22:03:31 - INFO - __main__ - Step 5737: {'lr': 0.0004992142716200036, 'samples': 1101504, 'steps': 5736, 'loss/train': 1.8303169012069702} -11/06/2021 22:03:32 - INFO - __main__ - Step 5738: {'lr': 0.0004992138511588567, 'samples': 1101696, 'steps': 5737, 'loss/train': 1.5697263479232788} -11/06/2021 22:03:33 - INFO - __main__ - Step 5739: {'lr': 0.0004992134305854179, 'samples': 1101888, 'steps': 5738, 'loss/train': 1.949165940284729} -11/06/2021 22:03:33 - INFO - __main__ - Step 5740: {'lr': 0.0004992130098996873, 'samples': 1102080, 'steps': 5739, 'loss/train': 2.357881784439087} -11/06/2021 22:03:33 - INFO - __main__ - Step 5741: {'lr': 0.0004992125891016652, 'samples': 1102272, 'steps': 5740, 'loss/train': 2.1080918312072754} -11/06/2021 22:03:34 - INFO - __main__ - Step 5742: {'lr': 0.0004992121681913518, 'samples': 1102464, 'steps': 5741, 'loss/train': 1.897286295890808} -11/06/2021 22:03:35 - INFO - __main__ - Step 5743: {'lr': 0.0004992117471687472, 'samples': 1102656, 'steps': 5742, 'loss/train': 1.7857768535614014} -11/06/2021 22:03:35 - INFO - __main__ - Step 5744: {'lr': 0.0004992113260338517, 'samples': 1102848, 'steps': 5743, 'loss/train': 1.731091022491455} -11/06/2021 22:03:36 - INFO - __main__ - Step 5745: {'lr': 0.0004992109047866653, 'samples': 1103040, 'steps': 5744, 'loss/train': 0.806926429271698} -11/06/2021 22:03:36 - INFO - __main__ - Step 5746: {'lr': 0.0004992104834271884, 'samples': 1103232, 'steps': 5745, 'loss/train': 1.5223336219787598} -11/06/2021 22:03:36 - INFO - __main__ - Step 5747: {'lr': 0.0004992100619554211, 'samples': 1103424, 'steps': 5746, 'loss/train': 0.8918942809104919} -11/06/2021 22:03:37 - INFO - __main__ - Step 5748: {'lr': 0.0004992096403713635, 'samples': 1103616, 'steps': 5747, 'loss/train': 2.426661491394043} -11/06/2021 22:03:38 - INFO - __main__ - Step 5749: {'lr': 0.000499209218675016, 'samples': 1103808, 'steps': 5748, 'loss/train': 1.9452520608901978} -11/06/2021 22:03:38 - INFO - __main__ - Step 5750: {'lr': 0.0004992087968663786, 'samples': 1104000, 'steps': 5749, 'loss/train': 2.1779873371124268} -11/06/2021 22:03:38 - INFO - __main__ - Step 5751: {'lr': 0.0004992083749454515, 'samples': 1104192, 'steps': 5750, 'loss/train': 2.161979913711548} -11/06/2021 22:03:39 - INFO - __main__ - Step 5752: {'lr': 0.0004992079529122351, 'samples': 1104384, 'steps': 5751, 'loss/train': 2.0824427604675293} -11/06/2021 22:03:39 - INFO - __main__ - Step 5753: {'lr': 0.0004992075307667294, 'samples': 1104576, 'steps': 5752, 'loss/train': 1.917615532875061} -11/06/2021 22:03:40 - INFO - __main__ - Step 5754: {'lr': 0.0004992071085089346, 'samples': 1104768, 'steps': 5753, 'loss/train': 1.9957177639007568} -11/06/2021 22:03:40 - INFO - __main__ - Step 5755: {'lr': 0.0004992066861388509, 'samples': 1104960, 'steps': 5754, 'loss/train': 2.4890198707580566} -11/06/2021 22:03:41 - INFO - __main__ - Step 5756: {'lr': 0.0004992062636564786, 'samples': 1105152, 'steps': 5755, 'loss/train': 2.0366508960723877} -11/06/2021 22:03:41 - INFO - __main__ - Step 5757: {'lr': 0.0004992058410618177, 'samples': 1105344, 'steps': 5756, 'loss/train': 1.8771767616271973} -11/06/2021 22:03:41 - INFO - __main__ - Step 5758: {'lr': 0.0004992054183548685, 'samples': 1105536, 'steps': 5757, 'loss/train': 1.831110954284668} -11/06/2021 22:03:42 - INFO - __main__ - Step 5759: {'lr': 0.0004992049955356313, 'samples': 1105728, 'steps': 5758, 'loss/train': 1.9998888969421387} -11/06/2021 22:03:43 - INFO - __main__ - Step 5760: {'lr': 0.0004992045726041061, 'samples': 1105920, 'steps': 5759, 'loss/train': 1.6390290260314941} -11/06/2021 22:03:43 - INFO - __main__ - Step 5761: {'lr': 0.0004992041495602931, 'samples': 1106112, 'steps': 5760, 'loss/train': 1.8871279954910278} -11/06/2021 22:03:43 - INFO - __main__ - Step 5762: {'lr': 0.0004992037264041927, 'samples': 1106304, 'steps': 5761, 'loss/train': 2.7481179237365723} -11/06/2021 22:03:44 - INFO - __main__ - Step 5763: {'lr': 0.0004992033031358048, 'samples': 1106496, 'steps': 5762, 'loss/train': 2.292053699493408} -11/06/2021 22:03:45 - INFO - __main__ - Step 5764: {'lr': 0.0004992028797551298, 'samples': 1106688, 'steps': 5763, 'loss/train': 1.911152720451355} -11/06/2021 22:03:45 - INFO - __main__ - Step 5765: {'lr': 0.0004992024562621678, 'samples': 1106880, 'steps': 5764, 'loss/train': 2.004040479660034} -11/06/2021 22:03:46 - INFO - __main__ - Step 5766: {'lr': 0.0004992020326569191, 'samples': 1107072, 'steps': 5765, 'loss/train': 2.0469226837158203} -11/06/2021 22:03:46 - INFO - __main__ - Step 5767: {'lr': 0.0004992016089393837, 'samples': 1107264, 'steps': 5766, 'loss/train': 1.93135666847229} -11/06/2021 22:03:46 - INFO - __main__ - Step 5768: {'lr': 0.000499201185109562, 'samples': 1107456, 'steps': 5767, 'loss/train': 2.3704495429992676} -11/06/2021 22:03:47 - INFO - __main__ - Step 5769: {'lr': 0.000499200761167454, 'samples': 1107648, 'steps': 5768, 'loss/train': 1.7773163318634033} -11/06/2021 22:03:48 - INFO - __main__ - Step 5770: {'lr': 0.0004992003371130601, 'samples': 1107840, 'steps': 5769, 'loss/train': 1.401180386543274} -11/06/2021 22:03:48 - INFO - __main__ - Step 5771: {'lr': 0.0004991999129463803, 'samples': 1108032, 'steps': 5770, 'loss/train': 2.0761475563049316} -11/06/2021 22:03:48 - INFO - __main__ - Step 5772: {'lr': 0.0004991994886674148, 'samples': 1108224, 'steps': 5771, 'loss/train': 2.294243574142456} -11/06/2021 22:03:49 - INFO - __main__ - Step 5773: {'lr': 0.000499199064276164, 'samples': 1108416, 'steps': 5772, 'loss/train': 2.8149049282073975} -11/06/2021 22:03:50 - INFO - __main__ - Step 5774: {'lr': 0.0004991986397726278, 'samples': 1108608, 'steps': 5773, 'loss/train': 1.9633965492248535} -11/06/2021 22:03:50 - INFO - __main__ - Step 5775: {'lr': 0.0004991982151568066, 'samples': 1108800, 'steps': 5774, 'loss/train': 2.1700239181518555} -11/06/2021 22:03:50 - INFO - __main__ - Step 5776: {'lr': 0.0004991977904287006, 'samples': 1108992, 'steps': 5775, 'loss/train': 1.5528236627578735} -11/06/2021 22:03:51 - INFO - __main__ - Step 5777: {'lr': 0.0004991973655883099, 'samples': 1109184, 'steps': 5776, 'loss/train': 1.8211041688919067} -11/06/2021 22:03:51 - INFO - __main__ - Step 5778: {'lr': 0.0004991969406356346, 'samples': 1109376, 'steps': 5777, 'loss/train': 2.413984775543213} -11/06/2021 22:03:51 - INFO - __main__ - Step 5779: {'lr': 0.0004991965155706752, 'samples': 1109568, 'steps': 5778, 'loss/train': 1.5177364349365234} -11/06/2021 22:03:52 - INFO - __main__ - Step 5780: {'lr': 0.0004991960903934315, 'samples': 1109760, 'steps': 5779, 'loss/train': 1.6337430477142334} -11/06/2021 22:03:53 - INFO - __main__ - Step 5781: {'lr': 0.0004991956651039039, 'samples': 1109952, 'steps': 5780, 'loss/train': 1.6799068450927734} -11/06/2021 22:03:53 - INFO - __main__ - Step 5782: {'lr': 0.0004991952397020927, 'samples': 1110144, 'steps': 5781, 'loss/train': 1.9769641160964966} -11/06/2021 22:03:54 - INFO - __main__ - Step 5783: {'lr': 0.0004991948141879978, 'samples': 1110336, 'steps': 5782, 'loss/train': 1.8195029497146606} -11/06/2021 22:03:54 - INFO - __main__ - Step 5784: {'lr': 0.0004991943885616198, 'samples': 1110528, 'steps': 5783, 'loss/train': 1.771957516670227} -11/06/2021 22:03:55 - INFO - __main__ - Step 5785: {'lr': 0.0004991939628229585, 'samples': 1110720, 'steps': 5784, 'loss/train': 1.7779532670974731} -11/06/2021 22:03:55 - INFO - __main__ - Step 5786: {'lr': 0.0004991935369720143, 'samples': 1110912, 'steps': 5785, 'loss/train': 2.5987279415130615} -11/06/2021 22:03:56 - INFO - __main__ - Step 5787: {'lr': 0.0004991931110087873, 'samples': 1111104, 'steps': 5786, 'loss/train': 2.056739568710327} -11/06/2021 22:03:56 - INFO - __main__ - Step 5788: {'lr': 0.0004991926849332777, 'samples': 1111296, 'steps': 5787, 'loss/train': 2.098029851913452} -11/06/2021 22:03:56 - INFO - __main__ - Step 5789: {'lr': 0.0004991922587454858, 'samples': 1111488, 'steps': 5788, 'loss/train': 1.8450032472610474} -11/06/2021 22:03:57 - INFO - __main__ - Step 5790: {'lr': 0.0004991918324454117, 'samples': 1111680, 'steps': 5789, 'loss/train': 1.8697025775909424} -11/06/2021 22:03:58 - INFO - __main__ - Step 5791: {'lr': 0.0004991914060330556, 'samples': 1111872, 'steps': 5790, 'loss/train': 2.107398271560669} -11/06/2021 22:03:58 - INFO - __main__ - Step 5792: {'lr': 0.0004991909795084177, 'samples': 1112064, 'steps': 5791, 'loss/train': 1.6011704206466675} -11/06/2021 22:03:58 - INFO - __main__ - Step 5793: {'lr': 0.0004991905528714981, 'samples': 1112256, 'steps': 5792, 'loss/train': 1.8442002534866333} -11/06/2021 22:03:59 - INFO - __main__ - Step 5794: {'lr': 0.0004991901261222971, 'samples': 1112448, 'steps': 5793, 'loss/train': 2.1112143993377686} -11/06/2021 22:04:00 - INFO - __main__ - Step 5795: {'lr': 0.000499189699260815, 'samples': 1112640, 'steps': 5794, 'loss/train': 1.3628276586532593} -11/06/2021 22:04:00 - INFO - __main__ - Step 5796: {'lr': 0.0004991892722870517, 'samples': 1112832, 'steps': 5795, 'loss/train': 1.7392164468765259} -11/06/2021 22:04:00 - INFO - __main__ - Step 5797: {'lr': 0.0004991888452010076, 'samples': 1113024, 'steps': 5796, 'loss/train': 2.1500654220581055} -11/06/2021 22:04:01 - INFO - __main__ - Step 5798: {'lr': 0.000499188418002683, 'samples': 1113216, 'steps': 5797, 'loss/train': 2.0395941734313965} -11/06/2021 22:04:01 - INFO - __main__ - Step 5799: {'lr': 0.0004991879906920779, 'samples': 1113408, 'steps': 5798, 'loss/train': 1.4463250637054443} -11/06/2021 22:04:02 - INFO - __main__ - Step 5800: {'lr': 0.0004991875632691924, 'samples': 1113600, 'steps': 5799, 'loss/train': 2.434201717376709} -11/06/2021 22:04:02 - INFO - __main__ - Step 5801: {'lr': 0.0004991871357340269, 'samples': 1113792, 'steps': 5800, 'loss/train': 2.0661230087280273} -11/06/2021 22:04:03 - INFO - __main__ - Step 5802: {'lr': 0.0004991867080865815, 'samples': 1113984, 'steps': 5801, 'loss/train': 2.2368245124816895} -11/06/2021 22:04:03 - INFO - __main__ - Step 5803: {'lr': 0.0004991862803268564, 'samples': 1114176, 'steps': 5802, 'loss/train': 2.107743501663208} -11/06/2021 22:04:03 - INFO - __main__ - Step 5804: {'lr': 0.0004991858524548519, 'samples': 1114368, 'steps': 5803, 'loss/train': 1.269503116607666} -11/06/2021 22:04:05 - INFO - __main__ - Step 5805: {'lr': 0.000499185424470568, 'samples': 1114560, 'steps': 5804, 'loss/train': 1.8158258199691772} -11/06/2021 22:04:05 - INFO - __main__ - Step 5806: {'lr': 0.0004991849963740052, 'samples': 1114752, 'steps': 5805, 'loss/train': 1.9110217094421387} -11/06/2021 22:04:06 - INFO - __main__ - Step 5807: {'lr': 0.0004991845681651632, 'samples': 1114944, 'steps': 5806, 'loss/train': 1.8827478885650635} -11/06/2021 22:04:06 - INFO - __main__ - Step 5808: {'lr': 0.0004991841398440427, 'samples': 1115136, 'steps': 5807, 'loss/train': 1.9933255910873413} -11/06/2021 22:04:06 - INFO - __main__ - Step 5809: {'lr': 0.0004991837114106436, 'samples': 1115328, 'steps': 5808, 'loss/train': 2.1655633449554443} -11/06/2021 22:04:07 - INFO - __main__ - Step 5810: {'lr': 0.0004991832828649661, 'samples': 1115520, 'steps': 5809, 'loss/train': 1.6817560195922852} -11/06/2021 22:04:08 - INFO - __main__ - Step 5811: {'lr': 0.0004991828542070105, 'samples': 1115712, 'steps': 5810, 'loss/train': 0.6421383023262024} -11/06/2021 22:04:08 - INFO - __main__ - Step 5812: {'lr': 0.000499182425436777, 'samples': 1115904, 'steps': 5811, 'loss/train': 1.786048173904419} -11/06/2021 22:04:08 - INFO - __main__ - Step 5813: {'lr': 0.0004991819965542657, 'samples': 1116096, 'steps': 5812, 'loss/train': 1.7168254852294922} -11/06/2021 22:04:09 - INFO - __main__ - Step 5814: {'lr': 0.0004991815675594768, 'samples': 1116288, 'steps': 5813, 'loss/train': 1.5646218061447144} -11/06/2021 22:04:09 - INFO - __main__ - Step 5815: {'lr': 0.0004991811384524106, 'samples': 1116480, 'steps': 5814, 'loss/train': 1.233889102935791} -11/06/2021 22:04:10 - INFO - __main__ - Step 5816: {'lr': 0.0004991807092330671, 'samples': 1116672, 'steps': 5815, 'loss/train': 1.7671700716018677} -11/06/2021 22:04:10 - INFO - __main__ - Step 5817: {'lr': 0.0004991802799014467, 'samples': 1116864, 'steps': 5816, 'loss/train': 2.299095630645752} -11/06/2021 22:04:11 - INFO - __main__ - Step 5818: {'lr': 0.0004991798504575495, 'samples': 1117056, 'steps': 5817, 'loss/train': 1.8498998880386353} -11/06/2021 22:04:11 - INFO - __main__ - Step 5819: {'lr': 0.0004991794209013758, 'samples': 1117248, 'steps': 5818, 'loss/train': 1.8572213649749756} -11/06/2021 22:04:11 - INFO - __main__ - Step 5820: {'lr': 0.0004991789912329257, 'samples': 1117440, 'steps': 5819, 'loss/train': 0.8670408725738525} -11/06/2021 22:04:12 - INFO - __main__ - Step 5821: {'lr': 0.0004991785614521993, 'samples': 1117632, 'steps': 5820, 'loss/train': 3.0006051063537598} -11/06/2021 22:04:13 - INFO - __main__ - Step 5822: {'lr': 0.0004991781315591969, 'samples': 1117824, 'steps': 5821, 'loss/train': 2.1679015159606934} -11/06/2021 22:04:13 - INFO - __main__ - Step 5823: {'lr': 0.0004991777015539186, 'samples': 1118016, 'steps': 5822, 'loss/train': 2.232862710952759} -11/06/2021 22:04:13 - INFO - __main__ - Step 5824: {'lr': 0.0004991772714363649, 'samples': 1118208, 'steps': 5823, 'loss/train': 1.790226936340332} -11/06/2021 22:04:14 - INFO - __main__ - Step 5825: {'lr': 0.0004991768412065355, 'samples': 1118400, 'steps': 5824, 'loss/train': 1.278944492340088} -11/06/2021 22:04:15 - INFO - __main__ - Step 5826: {'lr': 0.000499176410864431, 'samples': 1118592, 'steps': 5825, 'loss/train': 1.5651650428771973} -11/06/2021 22:04:15 - INFO - __main__ - Step 5827: {'lr': 0.0004991759804100515, 'samples': 1118784, 'steps': 5826, 'loss/train': 1.8785316944122314} -11/06/2021 22:04:16 - INFO - __main__ - Step 5828: {'lr': 0.000499175549843397, 'samples': 1118976, 'steps': 5827, 'loss/train': 2.057476282119751} -11/06/2021 22:04:16 - INFO - __main__ - Step 5829: {'lr': 0.0004991751191644679, 'samples': 1119168, 'steps': 5828, 'loss/train': 2.047145366668701} -11/06/2021 22:04:16 - INFO - __main__ - Step 5830: {'lr': 0.0004991746883732644, 'samples': 1119360, 'steps': 5829, 'loss/train': 1.9324302673339844} -11/06/2021 22:04:17 - INFO - __main__ - Step 5831: {'lr': 0.0004991742574697866, 'samples': 1119552, 'steps': 5830, 'loss/train': 1.9625569581985474} -11/06/2021 22:04:18 - INFO - __main__ - Step 5832: {'lr': 0.0004991738264540347, 'samples': 1119744, 'steps': 5831, 'loss/train': 2.0301690101623535} -11/06/2021 22:04:18 - INFO - __main__ - Step 5833: {'lr': 0.0004991733953260089, 'samples': 1119936, 'steps': 5832, 'loss/train': 2.2081518173217773} -11/06/2021 22:04:18 - INFO - __main__ - Step 5834: {'lr': 0.0004991729640857095, 'samples': 1120128, 'steps': 5833, 'loss/train': 1.706737756729126} -11/06/2021 22:04:19 - INFO - __main__ - Step 5835: {'lr': 0.0004991725327331366, 'samples': 1120320, 'steps': 5834, 'loss/train': 1.6535284519195557} -11/06/2021 22:04:19 - INFO - __main__ - Step 5836: {'lr': 0.0004991721012682903, 'samples': 1120512, 'steps': 5835, 'loss/train': 1.5109832286834717} -11/06/2021 22:04:20 - INFO - __main__ - Step 5837: {'lr': 0.0004991716696911709, 'samples': 1120704, 'steps': 5836, 'loss/train': 1.7255332469940186} -11/06/2021 22:04:21 - INFO - __main__ - Step 5838: {'lr': 0.0004991712380017786, 'samples': 1120896, 'steps': 5837, 'loss/train': 2.3126747608184814} -11/06/2021 22:04:21 - INFO - __main__ - Step 5839: {'lr': 0.0004991708062001137, 'samples': 1121088, 'steps': 5838, 'loss/train': 1.5363658666610718} -11/06/2021 22:04:22 - INFO - __main__ - Step 5840: {'lr': 0.0004991703742861762, 'samples': 1121280, 'steps': 5839, 'loss/train': 2.014793872833252} -11/06/2021 22:04:22 - INFO - __main__ - Step 5841: {'lr': 0.0004991699422599664, 'samples': 1121472, 'steps': 5840, 'loss/train': 5.858007907867432} -11/06/2021 22:04:22 - INFO - __main__ - Step 5842: {'lr': 0.0004991695101214844, 'samples': 1121664, 'steps': 5841, 'loss/train': 6.085140228271484} -11/06/2021 22:04:23 - INFO - __main__ - Step 5843: {'lr': 0.0004991690778707305, 'samples': 1121856, 'steps': 5842, 'loss/train': 1.8172892332077026} -11/06/2021 22:04:24 - INFO - __main__ - Step 5844: {'lr': 0.0004991686455077049, 'samples': 1122048, 'steps': 5843, 'loss/train': 2.0172688961029053} -11/06/2021 22:04:24 - INFO - __main__ - Step 5845: {'lr': 0.0004991682130324078, 'samples': 1122240, 'steps': 5844, 'loss/train': 1.5611968040466309} -11/06/2021 22:04:24 - INFO - __main__ - Step 5846: {'lr': 0.0004991677804448392, 'samples': 1122432, 'steps': 5845, 'loss/train': 2.0921804904937744} -11/06/2021 22:04:25 - INFO - __main__ - Step 5847: {'lr': 0.0004991673477449995, 'samples': 1122624, 'steps': 5846, 'loss/train': 1.8288406133651733} -11/06/2021 22:04:25 - INFO - __main__ - Step 5848: {'lr': 0.0004991669149328889, 'samples': 1122816, 'steps': 5847, 'loss/train': 1.8865562677383423} -11/06/2021 22:04:26 - INFO - __main__ - Step 5849: {'lr': 0.0004991664820085074, 'samples': 1123008, 'steps': 5848, 'loss/train': 2.1795449256896973} -11/06/2021 22:04:27 - INFO - __main__ - Step 5850: {'lr': 0.0004991660489718554, 'samples': 1123200, 'steps': 5849, 'loss/train': 1.6964969635009766} -11/06/2021 22:04:27 - INFO - __main__ - Step 5851: {'lr': 0.0004991656158229331, 'samples': 1123392, 'steps': 5850, 'loss/train': 1.9025615453720093} -11/06/2021 22:04:27 - INFO - __main__ - Step 5852: {'lr': 0.0004991651825617406, 'samples': 1123584, 'steps': 5851, 'loss/train': 2.156768560409546} -11/06/2021 22:04:28 - INFO - __main__ - Step 5853: {'lr': 0.000499164749188278, 'samples': 1123776, 'steps': 5852, 'loss/train': 2.2558553218841553} -11/06/2021 22:04:29 - INFO - __main__ - Step 5854: {'lr': 0.0004991643157025458, 'samples': 1123968, 'steps': 5853, 'loss/train': 1.9887200593948364} -11/06/2021 22:04:29 - INFO - __main__ - Step 5855: {'lr': 0.0004991638821045439, 'samples': 1124160, 'steps': 5854, 'loss/train': 2.0848309993743896} -11/06/2021 22:04:29 - INFO - __main__ - Step 5856: {'lr': 0.0004991634483942725, 'samples': 1124352, 'steps': 5855, 'loss/train': 1.9906128644943237} -11/06/2021 22:04:30 - INFO - __main__ - Step 5857: {'lr': 0.000499163014571732, 'samples': 1124544, 'steps': 5856, 'loss/train': 1.9705578088760376} -11/06/2021 22:04:30 - INFO - __main__ - Step 5858: {'lr': 0.0004991625806369225, 'samples': 1124736, 'steps': 5857, 'loss/train': 1.9932202100753784} -11/06/2021 22:04:32 - INFO - __main__ - Step 5859: {'lr': 0.0004991621465898441, 'samples': 1124928, 'steps': 5858, 'loss/train': 1.7375214099884033} -11/06/2021 22:04:32 - INFO - __main__ - Step 5860: {'lr': 0.0004991617124304971, 'samples': 1125120, 'steps': 5859, 'loss/train': 1.9731206893920898} -11/06/2021 22:04:32 - INFO - __main__ - Step 5861: {'lr': 0.0004991612781588818, 'samples': 1125312, 'steps': 5860, 'loss/train': 0.45900076627731323} -11/06/2021 22:04:33 - INFO - __main__ - Step 5862: {'lr': 0.0004991608437749981, 'samples': 1125504, 'steps': 5861, 'loss/train': 2.0371387004852295} -11/06/2021 22:04:33 - INFO - __main__ - Step 5863: {'lr': 0.0004991604092788465, 'samples': 1125696, 'steps': 5862, 'loss/train': 3.404467821121216} -11/06/2021 22:04:33 - INFO - __main__ - Step 5864: {'lr': 0.000499159974670427, 'samples': 1125888, 'steps': 5863, 'loss/train': 1.9706652164459229} -11/06/2021 22:04:34 - INFO - __main__ - Step 5865: {'lr': 0.00049915953994974, 'samples': 1126080, 'steps': 5864, 'loss/train': 1.71634042263031} -11/06/2021 22:04:35 - INFO - __main__ - Step 5866: {'lr': 0.0004991591051167853, 'samples': 1126272, 'steps': 5865, 'loss/train': 2.338533401489258} -11/06/2021 22:04:35 - INFO - __main__ - Step 5867: {'lr': 0.0004991586701715635, 'samples': 1126464, 'steps': 5866, 'loss/train': 0.339321494102478} -11/06/2021 22:04:36 - INFO - __main__ - Step 5868: {'lr': 0.0004991582351140747, 'samples': 1126656, 'steps': 5867, 'loss/train': 1.8088363409042358} -11/06/2021 22:04:36 - INFO - __main__ - Step 5869: {'lr': 0.000499157799944319, 'samples': 1126848, 'steps': 5868, 'loss/train': 1.787323236465454} -11/06/2021 22:04:36 - INFO - __main__ - Step 5870: {'lr': 0.0004991573646622965, 'samples': 1127040, 'steps': 5869, 'loss/train': 1.9397883415222168} -11/06/2021 22:04:37 - INFO - __main__ - Step 5871: {'lr': 0.0004991569292680078, 'samples': 1127232, 'steps': 5870, 'loss/train': 0.43821990489959717} -11/06/2021 22:04:38 - INFO - __main__ - Step 5872: {'lr': 0.0004991564937614526, 'samples': 1127424, 'steps': 5871, 'loss/train': 2.1050267219543457} -11/06/2021 22:04:38 - INFO - __main__ - Step 5873: {'lr': 0.0004991560581426314, 'samples': 1127616, 'steps': 5872, 'loss/train': 2.0710291862487793} -11/06/2021 22:04:38 - INFO - __main__ - Step 5874: {'lr': 0.0004991556224115444, 'samples': 1127808, 'steps': 5873, 'loss/train': 2.220693349838257} -11/06/2021 22:04:39 - INFO - __main__ - Step 5875: {'lr': 0.0004991551865681916, 'samples': 1128000, 'steps': 5874, 'loss/train': 1.8416770696640015} -11/06/2021 22:04:40 - INFO - __main__ - Step 5876: {'lr': 0.0004991547506125734, 'samples': 1128192, 'steps': 5875, 'loss/train': 2.190176248550415} -11/06/2021 22:04:40 - INFO - __main__ - Step 5877: {'lr': 0.0004991543145446899, 'samples': 1128384, 'steps': 5876, 'loss/train': 1.174869418144226} -11/06/2021 22:04:40 - INFO - __main__ - Step 5878: {'lr': 0.0004991538783645413, 'samples': 1128576, 'steps': 5877, 'loss/train': 2.180773973464966} -11/06/2021 22:04:41 - INFO - __main__ - Step 5879: {'lr': 0.0004991534420721278, 'samples': 1128768, 'steps': 5878, 'loss/train': 1.775754451751709} -11/06/2021 22:04:41 - INFO - __main__ - Step 5880: {'lr': 0.0004991530056674496, 'samples': 1128960, 'steps': 5879, 'loss/train': 1.8799948692321777} -11/06/2021 22:04:42 - INFO - __main__ - Step 5881: {'lr': 0.000499152569150507, 'samples': 1129152, 'steps': 5880, 'loss/train': 2.05820894241333} -11/06/2021 22:04:43 - INFO - __main__ - Step 5882: {'lr': 0.0004991521325213, 'samples': 1129344, 'steps': 5881, 'loss/train': 1.8497810363769531} -11/06/2021 22:04:43 - INFO - __main__ - Step 5883: {'lr': 0.0004991516957798289, 'samples': 1129536, 'steps': 5882, 'loss/train': 2.388411521911621} -11/06/2021 22:04:43 - INFO - __main__ - Step 5884: {'lr': 0.0004991512589260939, 'samples': 1129728, 'steps': 5883, 'loss/train': 2.0570759773254395} -11/06/2021 22:04:44 - INFO - __main__ - Step 5885: {'lr': 0.0004991508219600952, 'samples': 1129920, 'steps': 5884, 'loss/train': 2.236051321029663} -11/06/2021 22:04:45 - INFO - __main__ - Step 5886: {'lr': 0.000499150384881833, 'samples': 1130112, 'steps': 5885, 'loss/train': 1.3894482851028442} -11/06/2021 22:04:45 - INFO - __main__ - Step 5887: {'lr': 0.0004991499476913074, 'samples': 1130304, 'steps': 5886, 'loss/train': 1.8141835927963257} -11/06/2021 22:04:45 - INFO - __main__ - Step 5888: {'lr': 0.0004991495103885187, 'samples': 1130496, 'steps': 5887, 'loss/train': 1.7120885848999023} -11/06/2021 22:04:46 - INFO - __main__ - Step 5889: {'lr': 0.0004991490729734672, 'samples': 1130688, 'steps': 5888, 'loss/train': 1.4462894201278687} -11/06/2021 22:04:46 - INFO - __main__ - Step 5890: {'lr': 0.0004991486354461528, 'samples': 1130880, 'steps': 5889, 'loss/train': 2.2380330562591553} -11/06/2021 22:04:46 - INFO - __main__ - Step 5891: {'lr': 0.000499148197806576, 'samples': 1131072, 'steps': 5890, 'loss/train': 1.384273648262024} -11/06/2021 22:04:47 - INFO - __main__ - Step 5892: {'lr': 0.0004991477600547367, 'samples': 1131264, 'steps': 5891, 'loss/train': 1.8132703304290771} -11/06/2021 22:04:48 - INFO - __main__ - Step 5893: {'lr': 0.0004991473221906354, 'samples': 1131456, 'steps': 5892, 'loss/train': 2.0042428970336914} -11/06/2021 22:04:48 - INFO - __main__ - Step 5894: {'lr': 0.0004991468842142722, 'samples': 1131648, 'steps': 5893, 'loss/train': 2.088541030883789} -11/06/2021 22:04:48 - INFO - __main__ - Step 5895: {'lr': 0.0004991464461256472, 'samples': 1131840, 'steps': 5894, 'loss/train': 1.8709157705307007} -11/06/2021 22:04:49 - INFO - __main__ - Step 5896: {'lr': 0.0004991460079247606, 'samples': 1132032, 'steps': 5895, 'loss/train': 1.9683117866516113} -11/06/2021 22:04:50 - INFO - __main__ - Step 5897: {'lr': 0.0004991455696116128, 'samples': 1132224, 'steps': 5896, 'loss/train': 1.7423728704452515} -11/06/2021 22:04:50 - INFO - __main__ - Step 5898: {'lr': 0.0004991451311862037, 'samples': 1132416, 'steps': 5897, 'loss/train': 1.5214271545410156} -11/06/2021 22:04:50 - INFO - __main__ - Step 5899: {'lr': 0.0004991446926485337, 'samples': 1132608, 'steps': 5898, 'loss/train': 1.8397377729415894} -11/06/2021 22:04:51 - INFO - __main__ - Step 5900: {'lr': 0.0004991442539986029, 'samples': 1132800, 'steps': 5899, 'loss/train': 2.119931697845459} -11/06/2021 22:04:51 - INFO - __main__ - Step 5901: {'lr': 0.0004991438152364117, 'samples': 1132992, 'steps': 5900, 'loss/train': 1.960817813873291} -11/06/2021 22:04:52 - INFO - __main__ - Step 5902: {'lr': 0.0004991433763619599, 'samples': 1133184, 'steps': 5901, 'loss/train': 1.7662793397903442} -11/06/2021 22:04:52 - INFO - __main__ - Step 5903: {'lr': 0.0004991429373752482, 'samples': 1133376, 'steps': 5902, 'loss/train': 1.5504059791564941} -11/06/2021 22:04:53 - INFO - __main__ - Step 5904: {'lr': 0.0004991424982762763, 'samples': 1133568, 'steps': 5903, 'loss/train': 2.349090576171875} -11/06/2021 22:04:53 - INFO - __main__ - Step 5905: {'lr': 0.0004991420590650448, 'samples': 1133760, 'steps': 5904, 'loss/train': 1.9303275346755981} -11/06/2021 22:04:54 - INFO - __main__ - Step 5906: {'lr': 0.0004991416197415537, 'samples': 1133952, 'steps': 5905, 'loss/train': 1.6415051221847534} -11/06/2021 22:04:55 - INFO - __main__ - Step 5907: {'lr': 0.0004991411803058032, 'samples': 1134144, 'steps': 5906, 'loss/train': 1.6599597930908203} -11/06/2021 22:04:55 - INFO - __main__ - Step 5908: {'lr': 0.0004991407407577936, 'samples': 1134336, 'steps': 5907, 'loss/train': 1.926432728767395} -11/06/2021 22:04:55 - INFO - __main__ - Step 5909: {'lr': 0.0004991403010975249, 'samples': 1134528, 'steps': 5908, 'loss/train': 1.6873294115066528} -11/06/2021 22:04:56 - INFO - __main__ - Step 5910: {'lr': 0.0004991398613249976, 'samples': 1134720, 'steps': 5909, 'loss/train': 2.0104522705078125} -11/06/2021 22:04:56 - INFO - __main__ - Step 5911: {'lr': 0.0004991394214402115, 'samples': 1134912, 'steps': 5910, 'loss/train': 1.2183507680892944} -11/06/2021 22:04:57 - INFO - __main__ - Step 5912: {'lr': 0.0004991389814431672, 'samples': 1135104, 'steps': 5911, 'loss/train': 2.336418390274048} -11/06/2021 22:04:57 - INFO - __main__ - Step 5913: {'lr': 0.0004991385413338646, 'samples': 1135296, 'steps': 5912, 'loss/train': 1.6936346292495728} -11/06/2021 22:04:58 - INFO - __main__ - Step 5914: {'lr': 0.0004991381011123041, 'samples': 1135488, 'steps': 5913, 'loss/train': 1.936176061630249} -11/06/2021 22:04:58 - INFO - __main__ - Step 5915: {'lr': 0.0004991376607784857, 'samples': 1135680, 'steps': 5914, 'loss/train': 2.222874402999878} -11/06/2021 22:04:58 - INFO - __main__ - Step 5916: {'lr': 0.0004991372203324098, 'samples': 1135872, 'steps': 5915, 'loss/train': 1.72451913356781} -11/06/2021 22:04:59 - INFO - __main__ - Step 5917: {'lr': 0.0004991367797740765, 'samples': 1136064, 'steps': 5916, 'loss/train': 2.277719736099243} -11/06/2021 22:05:00 - INFO - __main__ - Step 5918: {'lr': 0.0004991363391034861, 'samples': 1136256, 'steps': 5917, 'loss/train': 1.82767915725708} -11/06/2021 22:05:00 - INFO - __main__ - Step 5919: {'lr': 0.0004991358983206386, 'samples': 1136448, 'steps': 5918, 'loss/train': 1.7569984197616577} -11/06/2021 22:05:00 - INFO - __main__ - Step 5920: {'lr': 0.0004991354574255344, 'samples': 1136640, 'steps': 5919, 'loss/train': 1.7401177883148193} -11/06/2021 22:05:01 - INFO - __main__ - Step 5921: {'lr': 0.0004991350164181735, 'samples': 1136832, 'steps': 5920, 'loss/train': 1.826175332069397} -11/06/2021 22:05:02 - INFO - __main__ - Step 5922: {'lr': 0.0004991345752985563, 'samples': 1137024, 'steps': 5921, 'loss/train': 1.4562937021255493} -11/06/2021 22:05:02 - INFO - __main__ - Step 5923: {'lr': 0.0004991341340666828, 'samples': 1137216, 'steps': 5922, 'loss/train': 2.3827600479125977} -11/06/2021 22:05:03 - INFO - __main__ - Step 5924: {'lr': 0.0004991336927225534, 'samples': 1137408, 'steps': 5923, 'loss/train': 1.9076972007751465} -11/06/2021 22:05:03 - INFO - __main__ - Step 5925: {'lr': 0.0004991332512661682, 'samples': 1137600, 'steps': 5924, 'loss/train': 1.9979768991470337} -11/06/2021 22:05:03 - INFO - __main__ - Step 5926: {'lr': 0.0004991328096975273, 'samples': 1137792, 'steps': 5925, 'loss/train': 2.118201971054077} -11/06/2021 22:05:04 - INFO - __main__ - Step 5927: {'lr': 0.0004991323680166312, 'samples': 1137984, 'steps': 5926, 'loss/train': 2.161531925201416} -11/06/2021 22:05:05 - INFO - __main__ - Step 5928: {'lr': 0.0004991319262234797, 'samples': 1138176, 'steps': 5927, 'loss/train': 1.8950947523117065} -11/06/2021 22:05:05 - INFO - __main__ - Step 5929: {'lr': 0.0004991314843180733, 'samples': 1138368, 'steps': 5928, 'loss/train': 1.211108684539795} -11/06/2021 22:05:05 - INFO - __main__ - Step 5930: {'lr': 0.0004991310423004121, 'samples': 1138560, 'steps': 5929, 'loss/train': 2.195322275161743} -11/06/2021 22:05:06 - INFO - __main__ - Step 5931: {'lr': 0.0004991306001704962, 'samples': 1138752, 'steps': 5930, 'loss/train': 2.2083332538604736} -11/06/2021 22:05:06 - INFO - __main__ - Step 5932: {'lr': 0.000499130157928326, 'samples': 1138944, 'steps': 5931, 'loss/train': 1.8265712261199951} -11/06/2021 22:05:07 - INFO - __main__ - Step 5933: {'lr': 0.0004991297155739015, 'samples': 1139136, 'steps': 5932, 'loss/train': 2.3104774951934814} -11/06/2021 22:05:08 - INFO - __main__ - Step 5934: {'lr': 0.0004991292731072231, 'samples': 1139328, 'steps': 5933, 'loss/train': 1.6424787044525146} -11/06/2021 22:05:08 - INFO - __main__ - Step 5935: {'lr': 0.0004991288305282908, 'samples': 1139520, 'steps': 5934, 'loss/train': 1.7371667623519897} -11/06/2021 22:05:08 - INFO - __main__ - Step 5936: {'lr': 0.0004991283878371049, 'samples': 1139712, 'steps': 5935, 'loss/train': 2.0819458961486816} -11/06/2021 22:05:09 - INFO - __main__ - Step 5937: {'lr': 0.0004991279450336656, 'samples': 1139904, 'steps': 5936, 'loss/train': 2.049226999282837} -11/06/2021 22:05:09 - INFO - __main__ - Step 5938: {'lr': 0.0004991275021179732, 'samples': 1140096, 'steps': 5937, 'loss/train': 1.6424188613891602} -11/06/2021 22:05:10 - INFO - __main__ - Step 5939: {'lr': 0.0004991270590900277, 'samples': 1140288, 'steps': 5938, 'loss/train': 2.0688111782073975} -11/06/2021 22:05:11 - INFO - __main__ - Step 5940: {'lr': 0.0004991266159498294, 'samples': 1140480, 'steps': 5939, 'loss/train': 1.3544045686721802} -11/06/2021 22:05:11 - INFO - __main__ - Step 5941: {'lr': 0.0004991261726973784, 'samples': 1140672, 'steps': 5940, 'loss/train': 2.6650118827819824} -11/06/2021 22:05:11 - INFO - __main__ - Step 5942: {'lr': 0.0004991257293326752, 'samples': 1140864, 'steps': 5941, 'loss/train': 1.340391993522644} -11/06/2021 22:05:12 - INFO - __main__ - Step 5943: {'lr': 0.0004991252858557196, 'samples': 1141056, 'steps': 5942, 'loss/train': 1.737450122833252} -11/06/2021 22:05:12 - INFO - __main__ - Step 5944: {'lr': 0.0004991248422665122, 'samples': 1141248, 'steps': 5943, 'loss/train': 2.2285938262939453} -11/06/2021 22:05:13 - INFO - __main__ - Step 5945: {'lr': 0.0004991243985650528, 'samples': 1141440, 'steps': 5944, 'loss/train': 2.2643086910247803} -11/06/2021 22:05:13 - INFO - __main__ - Step 5946: {'lr': 0.0004991239547513419, 'samples': 1141632, 'steps': 5945, 'loss/train': 1.9071139097213745} -11/06/2021 22:05:14 - INFO - __main__ - Step 5947: {'lr': 0.0004991235108253795, 'samples': 1141824, 'steps': 5946, 'loss/train': 1.679957628250122} -11/06/2021 22:05:14 - INFO - __main__ - Step 5948: {'lr': 0.0004991230667871659, 'samples': 1142016, 'steps': 5947, 'loss/train': 0.8383622765541077} -11/06/2021 22:05:16 - INFO - __main__ - Step 5949: {'lr': 0.0004991226226367013, 'samples': 1142208, 'steps': 5948, 'loss/train': 1.7677212953567505} -11/06/2021 22:05:16 - INFO - __main__ - Step 5950: {'lr': 0.0004991221783739859, 'samples': 1142400, 'steps': 5949, 'loss/train': 2.1849448680877686} -11/06/2021 22:05:16 - INFO - __main__ - Step 5951: {'lr': 0.0004991217339990199, 'samples': 1142592, 'steps': 5950, 'loss/train': 1.8535935878753662} -11/06/2021 22:05:17 - INFO - __main__ - Step 5952: {'lr': 0.0004991212895118035, 'samples': 1142784, 'steps': 5951, 'loss/train': 2.292984962463379} -11/06/2021 22:05:17 - INFO - __main__ - Step 5953: {'lr': 0.0004991208449123369, 'samples': 1142976, 'steps': 5952, 'loss/train': 2.318779468536377} -11/06/2021 22:05:17 - INFO - __main__ - Step 5954: {'lr': 0.0004991204002006203, 'samples': 1143168, 'steps': 5953, 'loss/train': 2.651663064956665} -11/06/2021 22:05:18 - INFO - __main__ - Step 5955: {'lr': 0.0004991199553766538, 'samples': 1143360, 'steps': 5954, 'loss/train': 2.468550205230713} -11/06/2021 22:05:19 - INFO - __main__ - Step 5956: {'lr': 0.0004991195104404378, 'samples': 1143552, 'steps': 5955, 'loss/train': 1.74437415599823} -11/06/2021 22:05:19 - INFO - __main__ - Step 5957: {'lr': 0.0004991190653919723, 'samples': 1143744, 'steps': 5956, 'loss/train': 1.5060465335845947} -11/06/2021 22:05:19 - INFO - __main__ - Step 5958: {'lr': 0.0004991186202312576, 'samples': 1143936, 'steps': 5957, 'loss/train': 2.46972393989563} -11/06/2021 22:05:20 - INFO - __main__ - Step 5959: {'lr': 0.0004991181749582941, 'samples': 1144128, 'steps': 5958, 'loss/train': 1.874528408050537} -11/06/2021 22:05:20 - INFO - __main__ - Step 5960: {'lr': 0.0004991177295730815, 'samples': 1144320, 'steps': 5959, 'loss/train': 1.015513300895691} -11/06/2021 22:05:21 - INFO - __main__ - Step 5961: {'lr': 0.0004991172840756204, 'samples': 1144512, 'steps': 5960, 'loss/train': 1.6141202449798584} -11/06/2021 22:05:22 - INFO - __main__ - Step 5962: {'lr': 0.000499116838465911, 'samples': 1144704, 'steps': 5961, 'loss/train': 2.2520675659179688} -11/06/2021 22:05:22 - INFO - __main__ - Step 5963: {'lr': 0.0004991163927439533, 'samples': 1144896, 'steps': 5962, 'loss/train': 2.061602830886841} -11/06/2021 22:05:22 - INFO - __main__ - Step 5964: {'lr': 0.0004991159469097476, 'samples': 1145088, 'steps': 5963, 'loss/train': 1.7788499593734741} -11/06/2021 22:05:23 - INFO - __main__ - Step 5965: {'lr': 0.0004991155009632941, 'samples': 1145280, 'steps': 5964, 'loss/train': 2.016207456588745} -11/06/2021 22:05:23 - INFO - __main__ - Step 5966: {'lr': 0.0004991150549045931, 'samples': 1145472, 'steps': 5965, 'loss/train': 2.390394926071167} -11/06/2021 22:05:24 - INFO - __main__ - Step 5967: {'lr': 0.0004991146087336446, 'samples': 1145664, 'steps': 5966, 'loss/train': 2.1438944339752197} -11/06/2021 22:05:24 - INFO - __main__ - Step 5968: {'lr': 0.0004991141624504489, 'samples': 1145856, 'steps': 5967, 'loss/train': 2.0830070972442627} -11/06/2021 22:05:25 - INFO - __main__ - Step 5969: {'lr': 0.0004991137160550062, 'samples': 1146048, 'steps': 5968, 'loss/train': 1.9556607007980347} -11/06/2021 22:05:25 - INFO - __main__ - Step 5970: {'lr': 0.0004991132695473167, 'samples': 1146240, 'steps': 5969, 'loss/train': 1.7997961044311523} -11/06/2021 22:05:25 - INFO - __main__ - Step 5971: {'lr': 0.0004991128229273807, 'samples': 1146432, 'steps': 5970, 'loss/train': 2.2100391387939453} -11/06/2021 22:05:26 - INFO - __main__ - Step 5972: {'lr': 0.0004991123761951982, 'samples': 1146624, 'steps': 5971, 'loss/train': 2.2720751762390137} -11/06/2021 22:05:27 - INFO - __main__ - Step 5973: {'lr': 0.0004991119293507695, 'samples': 1146816, 'steps': 5972, 'loss/train': 2.5560436248779297} -11/06/2021 22:05:27 - INFO - __main__ - Step 5974: {'lr': 0.0004991114823940948, 'samples': 1147008, 'steps': 5973, 'loss/train': 1.9444048404693604} -11/06/2021 22:05:27 - INFO - __main__ - Step 5975: {'lr': 0.0004991110353251744, 'samples': 1147200, 'steps': 5974, 'loss/train': 1.894894003868103} -11/06/2021 22:05:28 - INFO - __main__ - Step 5976: {'lr': 0.0004991105881440084, 'samples': 1147392, 'steps': 5975, 'loss/train': 1.42281174659729} -11/06/2021 22:05:29 - INFO - __main__ - Step 5977: {'lr': 0.000499110140850597, 'samples': 1147584, 'steps': 5976, 'loss/train': 1.4847767353057861} -11/06/2021 22:05:29 - INFO - __main__ - Step 5978: {'lr': 0.0004991096934449404, 'samples': 1147776, 'steps': 5977, 'loss/train': 1.5438770055770874} -11/06/2021 22:05:30 - INFO - __main__ - Step 5979: {'lr': 0.0004991092459270388, 'samples': 1147968, 'steps': 5978, 'loss/train': 1.8954336643218994} -11/06/2021 22:05:30 - INFO - __main__ - Step 5980: {'lr': 0.0004991087982968924, 'samples': 1148160, 'steps': 5979, 'loss/train': 1.413256287574768} -11/06/2021 22:05:30 - INFO - __main__ - Step 5981: {'lr': 0.0004991083505545014, 'samples': 1148352, 'steps': 5980, 'loss/train': 2.335400104522705} -11/06/2021 22:05:31 - INFO - __main__ - Step 5982: {'lr': 0.0004991079026998662, 'samples': 1148544, 'steps': 5981, 'loss/train': 1.8564774990081787} -11/06/2021 22:05:32 - INFO - __main__ - Step 5983: {'lr': 0.0004991074547329867, 'samples': 1148736, 'steps': 5982, 'loss/train': 2.0363080501556396} -11/06/2021 22:05:32 - INFO - __main__ - Step 5984: {'lr': 0.0004991070066538632, 'samples': 1148928, 'steps': 5983, 'loss/train': 1.7715718746185303} -11/06/2021 22:05:32 - INFO - __main__ - Step 5985: {'lr': 0.0004991065584624959, 'samples': 1149120, 'steps': 5984, 'loss/train': 2.119075059890747} -11/06/2021 22:05:33 - INFO - __main__ - Step 5986: {'lr': 0.0004991061101588851, 'samples': 1149312, 'steps': 5985, 'loss/train': 1.6880245208740234} -11/06/2021 22:05:33 - INFO - __main__ - Step 5987: {'lr': 0.0004991056617430308, 'samples': 1149504, 'steps': 5986, 'loss/train': 1.5863991975784302} -11/06/2021 22:05:34 - INFO - __main__ - Step 5988: {'lr': 0.0004991052132149336, 'samples': 1149696, 'steps': 5987, 'loss/train': 1.918567419052124} -11/06/2021 22:05:35 - INFO - __main__ - Step 5989: {'lr': 0.0004991047645745932, 'samples': 1149888, 'steps': 5988, 'loss/train': 2.1846141815185547} -11/06/2021 22:05:35 - INFO - __main__ - Step 5990: {'lr': 0.0004991043158220101, 'samples': 1150080, 'steps': 5989, 'loss/train': 0.287127822637558} -11/06/2021 22:05:35 - INFO - __main__ - Step 5991: {'lr': 0.0004991038669571844, 'samples': 1150272, 'steps': 5990, 'loss/train': 2.2613940238952637} -11/06/2021 22:05:36 - INFO - __main__ - Step 5992: {'lr': 0.0004991034179801165, 'samples': 1150464, 'steps': 5991, 'loss/train': 2.2237813472747803} -11/06/2021 22:05:37 - INFO - __main__ - Step 5993: {'lr': 0.0004991029688908063, 'samples': 1150656, 'steps': 5992, 'loss/train': 1.6125682592391968} -11/06/2021 22:05:37 - INFO - __main__ - Step 5994: {'lr': 0.0004991025196892542, 'samples': 1150848, 'steps': 5993, 'loss/train': 2.0412638187408447} -11/06/2021 22:05:37 - INFO - __main__ - Step 5995: {'lr': 0.0004991020703754603, 'samples': 1151040, 'steps': 5994, 'loss/train': 2.479659080505371} -11/06/2021 22:05:38 - INFO - __main__ - Step 5996: {'lr': 0.0004991016209494249, 'samples': 1151232, 'steps': 5995, 'loss/train': 1.6935555934906006} -11/06/2021 22:05:38 - INFO - __main__ - Step 5997: {'lr': 0.000499101171411148, 'samples': 1151424, 'steps': 5996, 'loss/train': 1.8328980207443237} -11/06/2021 22:05:39 - INFO - __main__ - Step 5998: {'lr': 0.0004991007217606303, 'samples': 1151616, 'steps': 5997, 'loss/train': 1.736120343208313} -11/06/2021 22:05:39 - INFO - __main__ - Step 5999: {'lr': 0.0004991002719978713, 'samples': 1151808, 'steps': 5998, 'loss/train': 1.7928426265716553} -11/06/2021 22:05:40 - INFO - __main__ - Step 6000: {'lr': 0.0004990998221228718, 'samples': 1152000, 'steps': 5999, 'loss/train': 2.1965417861938477} -11/06/2021 22:05:40 - INFO - __main__ - Step 6001: {'lr': 0.0004990993721356316, 'samples': 1152192, 'steps': 6000, 'loss/train': 1.9689626693725586} -11/06/2021 22:05:41 - INFO - __main__ - Step 6002: {'lr': 0.0004990989220361511, 'samples': 1152384, 'steps': 6001, 'loss/train': 2.398984670639038} -11/06/2021 22:05:42 - INFO - __main__ - Step 6003: {'lr': 0.0004990984718244306, 'samples': 1152576, 'steps': 6002, 'loss/train': 1.8467917442321777} -11/06/2021 22:05:42 - INFO - __main__ - Step 6004: {'lr': 0.00049909802150047, 'samples': 1152768, 'steps': 6003, 'loss/train': 1.9117133617401123} -11/06/2021 22:05:42 - INFO - __main__ - Step 6005: {'lr': 0.0004990975710642699, 'samples': 1152960, 'steps': 6004, 'loss/train': 2.0805423259735107} -11/06/2021 22:05:43 - INFO - __main__ - Step 6006: {'lr': 0.0004990971205158301, 'samples': 1153152, 'steps': 6005, 'loss/train': 1.9245171546936035} -11/06/2021 22:05:43 - INFO - __main__ - Step 6007: {'lr': 0.000499096669855151, 'samples': 1153344, 'steps': 6006, 'loss/train': 1.9373234510421753} -11/06/2021 22:05:44 - INFO - __main__ - Step 6008: {'lr': 0.0004990962190822328, 'samples': 1153536, 'steps': 6007, 'loss/train': 2.0879454612731934} -11/06/2021 22:05:44 - INFO - __main__ - Step 6009: {'lr': 0.0004990957681970757, 'samples': 1153728, 'steps': 6008, 'loss/train': 1.5155565738677979} -11/06/2021 22:05:45 - INFO - __main__ - Step 6010: {'lr': 0.0004990953171996798, 'samples': 1153920, 'steps': 6009, 'loss/train': 1.890929937362671} -11/06/2021 22:05:45 - INFO - __main__ - Step 6011: {'lr': 0.0004990948660900455, 'samples': 1154112, 'steps': 6010, 'loss/train': 1.6468206644058228} -11/06/2021 22:05:45 - INFO - __main__ - Step 6012: {'lr': 0.0004990944148681729, 'samples': 1154304, 'steps': 6011, 'loss/train': 1.8808773756027222} -11/06/2021 22:05:46 - INFO - __main__ - Step 6013: {'lr': 0.0004990939635340621, 'samples': 1154496, 'steps': 6012, 'loss/train': 1.6922487020492554} -11/06/2021 22:05:47 - INFO - __main__ - Step 6014: {'lr': 0.0004990935120877136, 'samples': 1154688, 'steps': 6013, 'loss/train': 1.5045371055603027} -11/06/2021 22:05:47 - INFO - __main__ - Step 6015: {'lr': 0.0004990930605291272, 'samples': 1154880, 'steps': 6014, 'loss/train': 1.9965391159057617} -11/06/2021 22:05:47 - INFO - __main__ - Step 6016: {'lr': 0.0004990926088583034, 'samples': 1155072, 'steps': 6015, 'loss/train': 1.9830745458602905} -11/06/2021 22:05:48 - INFO - __main__ - Step 6017: {'lr': 0.0004990921570752424, 'samples': 1155264, 'steps': 6016, 'loss/train': 1.850488305091858} -11/06/2021 22:05:49 - INFO - __main__ - Step 6018: {'lr': 0.0004990917051799442, 'samples': 1155456, 'steps': 6017, 'loss/train': 2.0463662147521973} -11/06/2021 22:05:49 - INFO - __main__ - Step 6019: {'lr': 0.0004990912531724092, 'samples': 1155648, 'steps': 6018, 'loss/train': 1.561757206916809} -11/06/2021 22:05:50 - INFO - __main__ - Step 6020: {'lr': 0.0004990908010526374, 'samples': 1155840, 'steps': 6019, 'loss/train': 2.3812918663024902} -11/06/2021 22:05:50 - INFO - __main__ - Step 6021: {'lr': 0.0004990903488206292, 'samples': 1156032, 'steps': 6020, 'loss/train': 1.9738842248916626} -11/06/2021 22:05:50 - INFO - __main__ - Step 6022: {'lr': 0.0004990898964763847, 'samples': 1156224, 'steps': 6021, 'loss/train': 1.0704938173294067} -11/06/2021 22:05:51 - INFO - __main__ - Step 6023: {'lr': 0.0004990894440199042, 'samples': 1156416, 'steps': 6022, 'loss/train': 2.2078778743743896} -11/06/2021 22:05:52 - INFO - __main__ - Step 6024: {'lr': 0.0004990889914511878, 'samples': 1156608, 'steps': 6023, 'loss/train': 1.3262114524841309} -11/06/2021 22:05:52 - INFO - __main__ - Step 6025: {'lr': 0.0004990885387702357, 'samples': 1156800, 'steps': 6024, 'loss/train': 2.6244781017303467} -11/06/2021 22:05:52 - INFO - __main__ - Step 6026: {'lr': 0.0004990880859770483, 'samples': 1156992, 'steps': 6025, 'loss/train': 2.0771734714508057} -11/06/2021 22:05:53 - INFO - __main__ - Step 6027: {'lr': 0.0004990876330716256, 'samples': 1157184, 'steps': 6026, 'loss/train': 1.7819007635116577} -11/06/2021 22:05:53 - INFO - __main__ - Step 6028: {'lr': 0.0004990871800539677, 'samples': 1157376, 'steps': 6027, 'loss/train': 2.1311354637145996} -11/06/2021 22:05:54 - INFO - __main__ - Step 6029: {'lr': 0.0004990867269240751, 'samples': 1157568, 'steps': 6028, 'loss/train': 2.2152881622314453} -11/06/2021 22:05:55 - INFO - __main__ - Step 6030: {'lr': 0.0004990862736819478, 'samples': 1157760, 'steps': 6029, 'loss/train': 2.027174949645996} -11/06/2021 22:05:55 - INFO - __main__ - Step 6031: {'lr': 0.000499085820327586, 'samples': 1157952, 'steps': 6030, 'loss/train': 1.750157356262207} -11/06/2021 22:05:55 - INFO - __main__ - Step 6032: {'lr': 0.0004990853668609902, 'samples': 1158144, 'steps': 6031, 'loss/train': 1.8239428997039795} -11/06/2021 22:05:56 - INFO - __main__ - Step 6033: {'lr': 0.0004990849132821602, 'samples': 1158336, 'steps': 6032, 'loss/train': 1.92527437210083} -11/06/2021 22:05:57 - INFO - __main__ - Step 6034: {'lr': 0.0004990844595910965, 'samples': 1158528, 'steps': 6033, 'loss/train': 2.1087069511413574} -11/06/2021 22:05:57 - INFO - __main__ - Step 6035: {'lr': 0.0004990840057877991, 'samples': 1158720, 'steps': 6034, 'loss/train': 1.7086195945739746} -11/06/2021 22:05:57 - INFO - __main__ - Step 6036: {'lr': 0.0004990835518722683, 'samples': 1158912, 'steps': 6035, 'loss/train': 1.736742615699768} -11/06/2021 22:05:58 - INFO - __main__ - Step 6037: {'lr': 0.0004990830978445043, 'samples': 1159104, 'steps': 6036, 'loss/train': 2.061073064804077} -11/06/2021 22:05:58 - INFO - __main__ - Step 6038: {'lr': 0.0004990826437045073, 'samples': 1159296, 'steps': 6037, 'loss/train': 1.51176917552948} -11/06/2021 22:05:59 - INFO - __main__ - Step 6039: {'lr': 0.0004990821894522775, 'samples': 1159488, 'steps': 6038, 'loss/train': 2.080949306488037} -11/06/2021 22:05:59 - INFO - __main__ - Step 6040: {'lr': 0.0004990817350878152, 'samples': 1159680, 'steps': 6039, 'loss/train': 1.2319962978363037} -11/06/2021 22:06:00 - INFO - __main__ - Step 6041: {'lr': 0.0004990812806111205, 'samples': 1159872, 'steps': 6040, 'loss/train': 2.2004785537719727} -11/06/2021 22:06:00 - INFO - __main__ - Step 6042: {'lr': 0.0004990808260221934, 'samples': 1160064, 'steps': 6041, 'loss/train': 2.198143243789673} -11/06/2021 22:06:00 - INFO - __main__ - Step 6043: {'lr': 0.0004990803713210345, 'samples': 1160256, 'steps': 6042, 'loss/train': 2.189502716064453} -11/06/2021 22:06:01 - INFO - __main__ - Step 6044: {'lr': 0.0004990799165076438, 'samples': 1160448, 'steps': 6043, 'loss/train': 0.32099586725234985} -11/06/2021 22:06:02 - INFO - __main__ - Step 6045: {'lr': 0.0004990794615820216, 'samples': 1160640, 'steps': 6044, 'loss/train': 2.055501937866211} -11/06/2021 22:06:02 - INFO - __main__ - Step 6046: {'lr': 0.0004990790065441679, 'samples': 1160832, 'steps': 6045, 'loss/train': 2.4283854961395264} -11/06/2021 22:06:03 - INFO - __main__ - Step 6047: {'lr': 0.0004990785513940832, 'samples': 1161024, 'steps': 6046, 'loss/train': 1.5293772220611572} -11/06/2021 22:06:03 - INFO - __main__ - Step 6048: {'lr': 0.0004990780961317674, 'samples': 1161216, 'steps': 6047, 'loss/train': 1.82656729221344} -11/06/2021 22:06:04 - INFO - __main__ - Step 6049: {'lr': 0.0004990776407572209, 'samples': 1161408, 'steps': 6048, 'loss/train': 2.004995107650757} -11/06/2021 22:06:04 - INFO - __main__ - Step 6050: {'lr': 0.000499077185270444, 'samples': 1161600, 'steps': 6049, 'loss/train': 1.4372830390930176} -11/06/2021 22:06:05 - INFO - __main__ - Step 6051: {'lr': 0.0004990767296714365, 'samples': 1161792, 'steps': 6050, 'loss/train': 1.7014871835708618} -11/06/2021 22:06:05 - INFO - __main__ - Step 6052: {'lr': 0.000499076273960199, 'samples': 1161984, 'steps': 6051, 'loss/train': 2.0586600303649902} -11/06/2021 22:06:05 - INFO - __main__ - Step 6053: {'lr': 0.0004990758181367316, 'samples': 1162176, 'steps': 6052, 'loss/train': 1.914888858795166} -11/06/2021 22:06:06 - INFO - __main__ - Step 6054: {'lr': 0.0004990753622010345, 'samples': 1162368, 'steps': 6053, 'loss/train': 2.2003793716430664} -11/06/2021 22:06:06 - INFO - __main__ - Step 6055: {'lr': 0.0004990749061531079, 'samples': 1162560, 'steps': 6054, 'loss/train': 2.1446890830993652} -11/06/2021 22:06:07 - INFO - __main__ - Step 6056: {'lr': 0.0004990744499929519, 'samples': 1162752, 'steps': 6055, 'loss/train': 1.890893578529358} -11/06/2021 22:06:07 - INFO - __main__ - Step 6057: {'lr': 0.0004990739937205668, 'samples': 1162944, 'steps': 6056, 'loss/train': 1.2735779285430908} -11/06/2021 22:06:08 - INFO - __main__ - Step 6058: {'lr': 0.0004990735373359529, 'samples': 1163136, 'steps': 6057, 'loss/train': 1.9701690673828125} -11/06/2021 22:06:08 - INFO - __main__ - Step 6059: {'lr': 0.0004990730808391102, 'samples': 1163328, 'steps': 6058, 'loss/train': 2.143030881881714} -11/06/2021 22:06:09 - INFO - __main__ - Step 6060: {'lr': 0.0004990726242300391, 'samples': 1163520, 'steps': 6059, 'loss/train': 2.049363613128662} -11/06/2021 22:06:09 - INFO - __main__ - Step 6061: {'lr': 0.0004990721675087397, 'samples': 1163712, 'steps': 6060, 'loss/train': 2.1596553325653076} -11/06/2021 22:06:10 - INFO - __main__ - Step 6062: {'lr': 0.0004990717106752122, 'samples': 1163904, 'steps': 6061, 'loss/train': 2.0180513858795166} -11/06/2021 22:06:10 - INFO - __main__ - Step 6063: {'lr': 0.0004990712537294568, 'samples': 1164096, 'steps': 6062, 'loss/train': 2.0434930324554443} -11/06/2021 22:06:10 - INFO - __main__ - Step 6064: {'lr': 0.0004990707966714738, 'samples': 1164288, 'steps': 6063, 'loss/train': 1.9746204614639282} -11/06/2021 22:06:11 - INFO - __main__ - Step 6065: {'lr': 0.0004990703395012634, 'samples': 1164480, 'steps': 6064, 'loss/train': 2.094088554382324} -11/06/2021 22:06:12 - INFO - __main__ - Step 6066: {'lr': 0.0004990698822188255, 'samples': 1164672, 'steps': 6065, 'loss/train': 1.3795504570007324} -11/06/2021 22:06:12 - INFO - __main__ - Step 6067: {'lr': 0.0004990694248241608, 'samples': 1164864, 'steps': 6066, 'loss/train': 2.1936051845550537} -11/06/2021 22:06:12 - INFO - __main__ - Step 6068: {'lr': 0.0004990689673172691, 'samples': 1165056, 'steps': 6067, 'loss/train': 2.1371805667877197} -11/06/2021 22:06:13 - INFO - __main__ - Step 6069: {'lr': 0.000499068509698151, 'samples': 1165248, 'steps': 6068, 'loss/train': 1.7530931234359741} -11/06/2021 22:06:14 - INFO - __main__ - Step 6070: {'lr': 0.0004990680519668063, 'samples': 1165440, 'steps': 6069, 'loss/train': 2.192474842071533} -11/06/2021 22:06:14 - INFO - __main__ - Step 6071: {'lr': 0.0004990675941232354, 'samples': 1165632, 'steps': 6070, 'loss/train': 1.666622281074524} -11/06/2021 22:06:15 - INFO - __main__ - Step 6072: {'lr': 0.0004990671361674384, 'samples': 1165824, 'steps': 6071, 'loss/train': 1.9727286100387573} -11/06/2021 22:06:15 - INFO - __main__ - Step 6073: {'lr': 0.0004990666780994156, 'samples': 1166016, 'steps': 6072, 'loss/train': 2.116274356842041} -11/06/2021 22:06:15 - INFO - __main__ - Step 6074: {'lr': 0.0004990662199191673, 'samples': 1166208, 'steps': 6073, 'loss/train': 2.271106243133545} -11/06/2021 22:06:16 - INFO - __main__ - Step 6075: {'lr': 0.0004990657616266936, 'samples': 1166400, 'steps': 6074, 'loss/train': 1.8674793243408203} -11/06/2021 22:06:17 - INFO - __main__ - Step 6076: {'lr': 0.0004990653032219947, 'samples': 1166592, 'steps': 6075, 'loss/train': 1.4734982252120972} -11/06/2021 22:06:17 - INFO - __main__ - Step 6077: {'lr': 0.0004990648447050709, 'samples': 1166784, 'steps': 6076, 'loss/train': 1.8218048810958862} -11/06/2021 22:06:17 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.642020583152771} -11/06/2021 22:06:18 - INFO - __main__ - Step 6079: {'lr': 0.0004990639273345489, 'samples': 1167168, 'steps': 6078, 'loss/train': 1.3877575397491455} -11/06/2021 22:06:18 - INFO - __main__ - Step 6080: {'lr': 0.0004990634684809513, 'samples': 1167360, 'steps': 6079, 'loss/train': 1.8536438941955566} -11/06/2021 22:06:19 - INFO - __main__ - Step 6081: {'lr': 0.0004990630095151296, 'samples': 1167552, 'steps': 6080, 'loss/train': 2.0661253929138184} -11/06/2021 22:06:19 - INFO - __main__ - Step 6082: {'lr': 0.0004990625504370838, 'samples': 1167744, 'steps': 6081, 'loss/train': 1.9790138006210327} -11/06/2021 22:06:20 - INFO - __main__ - Step 6083: {'lr': 0.0004990620912468143, 'samples': 1167936, 'steps': 6082, 'loss/train': 1.5834496021270752} -11/06/2021 22:06:20 - INFO - __main__ - Step 6084: {'lr': 0.0004990616319443214, 'samples': 1168128, 'steps': 6083, 'loss/train': 1.8926007747650146} -11/06/2021 22:06:20 - INFO - __main__ - Step 6085: {'lr': 0.0004990611725296052, 'samples': 1168320, 'steps': 6084, 'loss/train': 1.9960976839065552} -11/06/2021 22:06:21 - INFO - __main__ - Step 6086: {'lr': 0.0004990607130026657, 'samples': 1168512, 'steps': 6085, 'loss/train': 2.563918113708496} -11/06/2021 22:06:22 - INFO - __main__ - Step 6087: {'lr': 0.0004990602533635033, 'samples': 1168704, 'steps': 6086, 'loss/train': 1.8031913042068481} -11/06/2021 22:06:22 - INFO - __main__ - Step 6088: {'lr': 0.0004990597936121182, 'samples': 1168896, 'steps': 6087, 'loss/train': 1.5920250415802002} -11/06/2021 22:06:22 - INFO - __main__ - Step 6089: {'lr': 0.0004990593337485108, 'samples': 1169088, 'steps': 6088, 'loss/train': 2.1160354614257812} -11/06/2021 22:06:23 - INFO - __main__ - Step 6090: {'lr': 0.0004990588737726809, 'samples': 1169280, 'steps': 6089, 'loss/train': 2.0593221187591553} -11/06/2021 22:06:24 - INFO - __main__ - Step 6091: {'lr': 0.0004990584136846289, 'samples': 1169472, 'steps': 6090, 'loss/train': 2.7556521892547607} -11/06/2021 22:06:24 - INFO - __main__ - Step 6092: {'lr': 0.0004990579534843551, 'samples': 1169664, 'steps': 6091, 'loss/train': 2.4434940814971924} -11/06/2021 22:06:24 - INFO - __main__ - Step 6093: {'lr': 0.0004990574931718597, 'samples': 1169856, 'steps': 6092, 'loss/train': 2.342974901199341} -11/06/2021 22:06:25 - INFO - __main__ - Step 6094: {'lr': 0.0004990570327471427, 'samples': 1170048, 'steps': 6093, 'loss/train': 1.9696969985961914} -11/06/2021 22:06:25 - INFO - __main__ - Step 6095: {'lr': 0.0004990565722102045, 'samples': 1170240, 'steps': 6094, 'loss/train': 1.6603606939315796} -11/06/2021 22:06:26 - INFO - __main__ - Step 6096: {'lr': 0.0004990561115610452, 'samples': 1170432, 'steps': 6095, 'loss/train': 1.3589533567428589} -11/06/2021 22:06:26 - INFO - __main__ - Step 6097: {'lr': 0.0004990556507996652, 'samples': 1170624, 'steps': 6096, 'loss/train': 1.9999220371246338} -11/06/2021 22:06:27 - INFO - __main__ - Step 6098: {'lr': 0.0004990551899260644, 'samples': 1170816, 'steps': 6097, 'loss/train': 1.987586498260498} -11/06/2021 22:06:27 - INFO - __main__ - Step 6099: {'lr': 0.0004990547289402433, 'samples': 1171008, 'steps': 6098, 'loss/train': 1.9792393445968628} -11/06/2021 22:06:27 - INFO - __main__ - Step 6100: {'lr': 0.0004990542678422019, 'samples': 1171200, 'steps': 6099, 'loss/train': 1.7970731258392334} -11/06/2021 22:06:29 - INFO - __main__ - Step 6101: {'lr': 0.0004990538066319406, 'samples': 1171392, 'steps': 6100, 'loss/train': 1.9069502353668213} -11/06/2021 22:06:29 - INFO - __main__ - Step 6102: {'lr': 0.0004990533453094594, 'samples': 1171584, 'steps': 6101, 'loss/train': 1.354381799697876} -11/06/2021 22:06:29 - INFO - __main__ - Step 6103: {'lr': 0.0004990528838747586, 'samples': 1171776, 'steps': 6102, 'loss/train': 1.948202133178711} -11/06/2021 22:06:30 - INFO - __main__ - Step 6104: {'lr': 0.0004990524223278384, 'samples': 1171968, 'steps': 6103, 'loss/train': 1.6591429710388184} -11/06/2021 22:06:30 - INFO - __main__ - Step 6105: {'lr': 0.0004990519606686991, 'samples': 1172160, 'steps': 6104, 'loss/train': 2.1720986366271973} -11/06/2021 22:06:31 - INFO - __main__ - Step 6106: {'lr': 0.0004990514988973408, 'samples': 1172352, 'steps': 6105, 'loss/train': 2.1691129207611084} -11/06/2021 22:06:31 - INFO - __main__ - Step 6107: {'lr': 0.0004990510370137637, 'samples': 1172544, 'steps': 6106, 'loss/train': 1.6799395084381104} -11/06/2021 22:06:32 - INFO - __main__ - Step 6108: {'lr': 0.0004990505750179682, 'samples': 1172736, 'steps': 6107, 'loss/train': 1.9363466501235962} -11/06/2021 22:06:32 - INFO - __main__ - Step 6109: {'lr': 0.0004990501129099542, 'samples': 1172928, 'steps': 6108, 'loss/train': 1.7905744314193726} -11/06/2021 22:06:32 - INFO - __main__ - Step 6110: {'lr': 0.000499049650689722, 'samples': 1173120, 'steps': 6109, 'loss/train': 1.5997885465621948} -11/06/2021 22:06:33 - INFO - __main__ - Step 6111: {'lr': 0.000499049188357272, 'samples': 1173312, 'steps': 6110, 'loss/train': 2.1724469661712646} -11/06/2021 22:06:34 - INFO - __main__ - Step 6112: {'lr': 0.0004990487259126043, 'samples': 1173504, 'steps': 6111, 'loss/train': 1.6976191997528076} -11/06/2021 22:06:34 - INFO - __main__ - Step 6113: {'lr': 0.0004990482633557189, 'samples': 1173696, 'steps': 6112, 'loss/train': 1.716886281967163} -11/06/2021 22:06:34 - INFO - __main__ - Step 6114: {'lr': 0.0004990478006866165, 'samples': 1173888, 'steps': 6113, 'loss/train': 1.6597141027450562} -11/06/2021 22:06:35 - INFO - __main__ - Step 6115: {'lr': 0.0004990473379052968, 'samples': 1174080, 'steps': 6114, 'loss/train': 2.12764835357666} -11/06/2021 22:06:36 - INFO - __main__ - Step 6116: {'lr': 0.0004990468750117602, 'samples': 1174272, 'steps': 6115, 'loss/train': 1.4543788433074951} -11/06/2021 22:06:36 - INFO - __main__ - Step 6117: {'lr': 0.000499046412006007, 'samples': 1174464, 'steps': 6116, 'loss/train': 1.662864327430725} -11/06/2021 22:06:37 - INFO - __main__ - Step 6118: {'lr': 0.0004990459488880372, 'samples': 1174656, 'steps': 6117, 'loss/train': 1.5874830484390259} -11/06/2021 22:06:37 - INFO - __main__ - Step 6119: {'lr': 0.0004990454856578513, 'samples': 1174848, 'steps': 6118, 'loss/train': 1.8817105293273926} -11/06/2021 22:06:37 - INFO - __main__ - Step 6120: {'lr': 0.0004990450223154492, 'samples': 1175040, 'steps': 6119, 'loss/train': 1.8093229532241821} -11/06/2021 22:06:38 - INFO - __main__ - Step 6121: {'lr': 0.0004990445588608313, 'samples': 1175232, 'steps': 6120, 'loss/train': 1.6032285690307617} -11/06/2021 22:06:39 - INFO - __main__ - Step 6122: {'lr': 0.0004990440952939979, 'samples': 1175424, 'steps': 6121, 'loss/train': 2.429919719696045} -11/06/2021 22:06:39 - INFO - __main__ - Step 6123: {'lr': 0.0004990436316149489, 'samples': 1175616, 'steps': 6122, 'loss/train': 1.6632248163223267} -11/06/2021 22:06:40 - INFO - __main__ - Step 6124: {'lr': 0.0004990431678236849, 'samples': 1175808, 'steps': 6123, 'loss/train': 1.8044439554214478} -11/06/2021 22:06:40 - INFO - __main__ - Step 6125: {'lr': 0.0004990427039202057, 'samples': 1176000, 'steps': 6124, 'loss/train': 1.9963434934616089} -11/06/2021 22:06:40 - INFO - __main__ - Step 6126: {'lr': 0.0004990422399045117, 'samples': 1176192, 'steps': 6125, 'loss/train': 1.9155720472335815} -11/06/2021 22:06:41 - INFO - __main__ - Step 6127: {'lr': 0.0004990417757766031, 'samples': 1176384, 'steps': 6126, 'loss/train': 1.775386929512024} -11/06/2021 22:06:42 - INFO - __main__ - Step 6128: {'lr': 0.0004990413115364803, 'samples': 1176576, 'steps': 6127, 'loss/train': 1.5602920055389404} -11/06/2021 22:06:42 - INFO - __main__ - Step 6129: {'lr': 0.0004990408471841431, 'samples': 1176768, 'steps': 6128, 'loss/train': 2.0410501956939697} -11/06/2021 22:06:42 - INFO - __main__ - Step 6130: {'lr': 0.0004990403827195921, 'samples': 1176960, 'steps': 6129, 'loss/train': 2.2790169715881348} -11/06/2021 22:06:43 - INFO - __main__ - Step 6131: {'lr': 0.0004990399181428273, 'samples': 1177152, 'steps': 6130, 'loss/train': 2.0821285247802734} -11/06/2021 22:06:44 - INFO - __main__ - Step 6132: {'lr': 0.000499039453453849, 'samples': 1177344, 'steps': 6131, 'loss/train': 1.8965604305267334} -11/06/2021 22:06:44 - INFO - __main__ - Step 6133: {'lr': 0.0004990389886526573, 'samples': 1177536, 'steps': 6132, 'loss/train': 1.8164457082748413} -11/06/2021 22:06:44 - INFO - __main__ - Step 6134: {'lr': 0.0004990385237392524, 'samples': 1177728, 'steps': 6133, 'loss/train': 1.9925854206085205} -11/06/2021 22:06:45 - INFO - __main__ - Step 6135: {'lr': 0.0004990380587136347, 'samples': 1177920, 'steps': 6134, 'loss/train': 1.2192782163619995} -11/06/2021 22:06:45 - INFO - __main__ - Step 6136: {'lr': 0.0004990375935758042, 'samples': 1178112, 'steps': 6135, 'loss/train': 1.5371315479278564} -11/06/2021 22:06:46 - INFO - __main__ - Step 6137: {'lr': 0.0004990371283257613, 'samples': 1178304, 'steps': 6136, 'loss/train': 1.8077142238616943} -11/06/2021 22:06:47 - INFO - __main__ - Step 6138: {'lr': 0.0004990366629635062, 'samples': 1178496, 'steps': 6137, 'loss/train': 2.013735771179199} -11/06/2021 22:06:47 - INFO - __main__ - Step 6139: {'lr': 0.0004990361974890388, 'samples': 1178688, 'steps': 6138, 'loss/train': 2.858919620513916} -11/06/2021 22:06:47 - INFO - __main__ - Step 6140: {'lr': 0.0004990357319023597, 'samples': 1178880, 'steps': 6139, 'loss/train': 1.368839144706726} -11/06/2021 22:06:48 - INFO - __main__ - Step 6141: {'lr': 0.0004990352662034689, 'samples': 1179072, 'steps': 6140, 'loss/train': 1.362464427947998} -11/06/2021 22:06:49 - INFO - __main__ - Step 6142: {'lr': 0.0004990348003923665, 'samples': 1179264, 'steps': 6141, 'loss/train': 1.9596736431121826} -11/06/2021 22:06:49 - INFO - __main__ - Step 6143: {'lr': 0.000499034334469053, 'samples': 1179456, 'steps': 6142, 'loss/train': 2.131988048553467} -11/06/2021 22:06:50 - INFO - __main__ - Step 6144: {'lr': 0.0004990338684335285, 'samples': 1179648, 'steps': 6143, 'loss/train': 1.4277572631835938} -11/06/2021 22:06:50 - INFO - __main__ - Step 6145: {'lr': 0.0004990334022857932, 'samples': 1179840, 'steps': 6144, 'loss/train': 1.9954853057861328} -11/06/2021 22:06:50 - INFO - __main__ - Step 6146: {'lr': 0.0004990329360258472, 'samples': 1180032, 'steps': 6145, 'loss/train': 1.7441011667251587} -11/06/2021 22:06:51 - INFO - __main__ - Step 6147: {'lr': 0.0004990324696536908, 'samples': 1180224, 'steps': 6146, 'loss/train': 0.7077341079711914} -11/06/2021 22:06:52 - INFO - __main__ - Step 6148: {'lr': 0.0004990320031693242, 'samples': 1180416, 'steps': 6147, 'loss/train': 2.2118520736694336} -11/06/2021 22:06:52 - INFO - __main__ - Step 6149: {'lr': 0.0004990315365727476, 'samples': 1180608, 'steps': 6148, 'loss/train': 2.055332660675049} -11/06/2021 22:06:52 - INFO - __main__ - Step 6150: {'lr': 0.0004990310698639614, 'samples': 1180800, 'steps': 6149, 'loss/train': 2.1165621280670166} -11/06/2021 22:06:53 - INFO - __main__ - Step 6151: {'lr': 0.0004990306030429655, 'samples': 1180992, 'steps': 6150, 'loss/train': 1.5419307947158813} -11/06/2021 22:06:53 - INFO - __main__ - Step 6152: {'lr': 0.0004990301361097603, 'samples': 1181184, 'steps': 6151, 'loss/train': 1.1245484352111816} -11/06/2021 22:06:54 - INFO - __main__ - Step 6153: {'lr': 0.000499029669064346, 'samples': 1181376, 'steps': 6152, 'loss/train': 2.3590290546417236} -11/06/2021 22:06:54 - INFO - __main__ - Step 6154: {'lr': 0.0004990292019067227, 'samples': 1181568, 'steps': 6153, 'loss/train': 1.9370914697647095} -11/06/2021 22:06:55 - INFO - __main__ - Step 6155: {'lr': 0.0004990287346368908, 'samples': 1181760, 'steps': 6154, 'loss/train': 2.3206193447113037} -11/06/2021 22:06:55 - INFO - __main__ - Step 6156: {'lr': 0.0004990282672548503, 'samples': 1181952, 'steps': 6155, 'loss/train': 1.679478645324707} -11/06/2021 22:06:56 - INFO - __main__ - Step 6157: {'lr': 0.0004990277997606016, 'samples': 1182144, 'steps': 6156, 'loss/train': 1.524378776550293} -11/06/2021 22:06:56 - INFO - __main__ - Step 6158: {'lr': 0.0004990273321541447, 'samples': 1182336, 'steps': 6157, 'loss/train': 0.6619194149971008} -11/06/2021 22:06:57 - INFO - __main__ - Step 6159: {'lr': 0.0004990268644354799, 'samples': 1182528, 'steps': 6158, 'loss/train': 1.9400123357772827} -11/06/2021 22:06:57 - INFO - __main__ - Step 6160: {'lr': 0.0004990263966046075, 'samples': 1182720, 'steps': 6159, 'loss/train': 1.8187702894210815} -11/06/2021 22:06:57 - INFO - __main__ - Step 6161: {'lr': 0.0004990259286615276, 'samples': 1182912, 'steps': 6160, 'loss/train': 1.444914698600769} -11/06/2021 22:06:58 - INFO - __main__ - Step 6162: {'lr': 0.0004990254606062406, 'samples': 1183104, 'steps': 6161, 'loss/train': 1.4133529663085938} -11/06/2021 22:06:59 - INFO - __main__ - Step 6163: {'lr': 0.0004990249924387465, 'samples': 1183296, 'steps': 6162, 'loss/train': 1.8153014183044434} -11/06/2021 22:06:59 - INFO - __main__ - Step 6164: {'lr': 0.0004990245241590455, 'samples': 1183488, 'steps': 6163, 'loss/train': 1.761313796043396} -11/06/2021 22:07:00 - INFO - __main__ - Step 6165: {'lr': 0.0004990240557671379, 'samples': 1183680, 'steps': 6164, 'loss/train': 0.9687419533729553} -11/06/2021 22:07:00 - INFO - __main__ - Step 6166: {'lr': 0.000499023587263024, 'samples': 1183872, 'steps': 6165, 'loss/train': 1.6445512771606445} -11/06/2021 22:07:00 - INFO - __main__ - Step 6167: {'lr': 0.0004990231186467039, 'samples': 1184064, 'steps': 6166, 'loss/train': 1.3879804611206055} -11/06/2021 22:07:01 - INFO - __main__ - Step 6168: {'lr': 0.0004990226499181778, 'samples': 1184256, 'steps': 6167, 'loss/train': 2.506103992462158} -11/06/2021 22:07:02 - INFO - __main__ - Step 6169: {'lr': 0.0004990221810774459, 'samples': 1184448, 'steps': 6168, 'loss/train': 2.4504177570343018} -11/06/2021 22:07:02 - INFO - __main__ - Step 6170: {'lr': 0.0004990217121245084, 'samples': 1184640, 'steps': 6169, 'loss/train': 1.9792548418045044} -11/06/2021 22:07:02 - INFO - __main__ - Step 6171: {'lr': 0.0004990212430593657, 'samples': 1184832, 'steps': 6170, 'loss/train': 1.8940435647964478} -11/06/2021 22:07:03 - INFO - __main__ - Step 6172: {'lr': 0.0004990207738820178, 'samples': 1185024, 'steps': 6171, 'loss/train': 1.8361660242080688} -11/06/2021 22:07:04 - INFO - __main__ - Step 6173: {'lr': 0.000499020304592465, 'samples': 1185216, 'steps': 6172, 'loss/train': 2.492899179458618} -11/06/2021 22:07:04 - INFO - __main__ - Step 6174: {'lr': 0.0004990198351907075, 'samples': 1185408, 'steps': 6173, 'loss/train': 1.5003889799118042} -11/06/2021 22:07:04 - INFO - __main__ - Step 6175: {'lr': 0.0004990193656767455, 'samples': 1185600, 'steps': 6174, 'loss/train': 2.0811853408813477} -11/06/2021 22:07:05 - INFO - __main__ - Step 6176: {'lr': 0.0004990188960505792, 'samples': 1185792, 'steps': 6175, 'loss/train': 3.0719258785247803} -11/06/2021 22:07:05 - INFO - __main__ - Step 6177: {'lr': 0.0004990184263122088, 'samples': 1185984, 'steps': 6176, 'loss/train': 1.861528754234314} -11/06/2021 22:07:05 - INFO - __main__ - Step 6178: {'lr': 0.0004990179564616346, 'samples': 1186176, 'steps': 6177, 'loss/train': 5.958117485046387} -11/06/2021 22:07:07 - INFO - __main__ - Step 6179: {'lr': 0.0004990174864988566, 'samples': 1186368, 'steps': 6178, 'loss/train': 1.926222562789917} -11/06/2021 22:07:07 - INFO - __main__ - Step 6180: {'lr': 0.0004990170164238754, 'samples': 1186560, 'steps': 6179, 'loss/train': 1.9009610414505005} -11/06/2021 22:07:07 - INFO - __main__ - Step 6181: {'lr': 0.0004990165462366909, 'samples': 1186752, 'steps': 6180, 'loss/train': 2.4664011001586914} -11/06/2021 22:07:08 - INFO - __main__ - Step 6182: {'lr': 0.0004990160759373033, 'samples': 1186944, 'steps': 6181, 'loss/train': 2.10902738571167} -11/06/2021 22:07:08 - INFO - __main__ - Step 6183: {'lr': 0.0004990156055257129, 'samples': 1187136, 'steps': 6182, 'loss/train': 1.813493251800537} -11/06/2021 22:07:09 - INFO - __main__ - Step 6184: {'lr': 0.00049901513500192, 'samples': 1187328, 'steps': 6183, 'loss/train': 2.25309681892395} -11/06/2021 22:07:09 - INFO - __main__ - Step 6185: {'lr': 0.0004990146643659247, 'samples': 1187520, 'steps': 6184, 'loss/train': 2.2059273719787598} -11/06/2021 22:07:10 - INFO - __main__ - Step 6186: {'lr': 0.0004990141936177272, 'samples': 1187712, 'steps': 6185, 'loss/train': 2.0499684810638428} -11/06/2021 22:07:10 - INFO - __main__ - Step 6187: {'lr': 0.0004990137227573278, 'samples': 1187904, 'steps': 6186, 'loss/train': 3.2400269508361816} -11/06/2021 22:07:10 - INFO - __main__ - Step 6188: {'lr': 0.0004990132517847266, 'samples': 1188096, 'steps': 6187, 'loss/train': 1.8898727893829346} -11/06/2021 22:07:11 - INFO - __main__ - Step 6189: {'lr': 0.0004990127806999239, 'samples': 1188288, 'steps': 6188, 'loss/train': 0.9931958317756653} -11/06/2021 22:07:12 - INFO - __main__ - Step 6190: {'lr': 0.0004990123095029199, 'samples': 1188480, 'steps': 6189, 'loss/train': 1.6618373394012451} -11/06/2021 22:07:12 - INFO - __main__ - Step 6191: {'lr': 0.0004990118381937148, 'samples': 1188672, 'steps': 6190, 'loss/train': 1.4901134967803955} -11/06/2021 22:07:12 - INFO - __main__ - Step 6192: {'lr': 0.0004990113667723088, 'samples': 1188864, 'steps': 6191, 'loss/train': 1.1681599617004395} -11/06/2021 22:07:13 - INFO - __main__ - Step 6193: {'lr': 0.000499010895238702, 'samples': 1189056, 'steps': 6192, 'loss/train': 1.8815301656723022} -11/06/2021 22:07:14 - INFO - __main__ - Step 6194: {'lr': 0.0004990104235928948, 'samples': 1189248, 'steps': 6193, 'loss/train': 1.8837906122207642} -11/06/2021 22:07:14 - INFO - __main__ - Step 6195: {'lr': 0.0004990099518348874, 'samples': 1189440, 'steps': 6194, 'loss/train': 2.526460647583008} -11/06/2021 22:07:14 - INFO - __main__ - Step 6196: {'lr': 0.00049900947996468, 'samples': 1189632, 'steps': 6195, 'loss/train': 1.910827875137329} -11/06/2021 22:07:15 - INFO - __main__ - Step 6197: {'lr': 0.0004990090079822726, 'samples': 1189824, 'steps': 6196, 'loss/train': 2.300349473953247} -11/06/2021 22:07:15 - INFO - __main__ - Step 6198: {'lr': 0.0004990085358876658, 'samples': 1190016, 'steps': 6197, 'loss/train': 1.6927975416183472} -11/06/2021 22:07:16 - INFO - __main__ - Step 6199: {'lr': 0.0004990080636808595, 'samples': 1190208, 'steps': 6198, 'loss/train': 2.1126410961151123} -11/06/2021 22:07:17 - INFO - __main__ - Step 6200: {'lr': 0.000499007591361854, 'samples': 1190400, 'steps': 6199, 'loss/train': 1.71726393699646} -11/06/2021 22:07:17 - INFO - __main__ - Step 6201: {'lr': 0.0004990071189306495, 'samples': 1190592, 'steps': 6200, 'loss/train': 2.024538040161133} -11/06/2021 22:07:17 - INFO - __main__ - Step 6202: {'lr': 0.0004990066463872462, 'samples': 1190784, 'steps': 6201, 'loss/train': 1.7335742712020874} -11/06/2021 22:07:18 - INFO - __main__ - Step 6203: {'lr': 0.0004990061737316445, 'samples': 1190976, 'steps': 6202, 'loss/train': 1.7096867561340332} -11/06/2021 22:07:18 - INFO - __main__ - Step 6204: {'lr': 0.0004990057009638443, 'samples': 1191168, 'steps': 6203, 'loss/train': 1.5593353509902954} -11/06/2021 22:07:19 - INFO - __main__ - Step 6205: {'lr': 0.000499005228083846, 'samples': 1191360, 'steps': 6204, 'loss/train': 2.450568437576294} -11/06/2021 22:07:20 - INFO - __main__ - Step 6206: {'lr': 0.0004990047550916498, 'samples': 1191552, 'steps': 6205, 'loss/train': 2.2195775508880615} -11/06/2021 22:07:20 - INFO - __main__ - Step 6207: {'lr': 0.000499004281987256, 'samples': 1191744, 'steps': 6206, 'loss/train': 1.6635841131210327} -11/06/2021 22:07:20 - INFO - __main__ - Step 6208: {'lr': 0.0004990038087706646, 'samples': 1191936, 'steps': 6207, 'loss/train': 1.9627450704574585} -11/06/2021 22:07:21 - INFO - __main__ - Step 6209: {'lr': 0.000499003335441876, 'samples': 1192128, 'steps': 6208, 'loss/train': 2.254753351211548} -11/06/2021 22:07:22 - INFO - __main__ - Step 6210: {'lr': 0.0004990028620008903, 'samples': 1192320, 'steps': 6209, 'loss/train': 1.8182693719863892} -11/06/2021 22:07:22 - INFO - __main__ - Step 6211: {'lr': 0.0004990023884477077, 'samples': 1192512, 'steps': 6210, 'loss/train': 2.1537516117095947} -11/06/2021 22:07:23 - INFO - __main__ - Step 6212: {'lr': 0.0004990019147823286, 'samples': 1192704, 'steps': 6211, 'loss/train': 1.6900304555892944} -11/06/2021 22:07:23 - INFO - __main__ - Step 6213: {'lr': 0.000499001441004753, 'samples': 1192896, 'steps': 6212, 'loss/train': 0.32827237248420715} -11/06/2021 22:07:23 - INFO - __main__ - Step 6214: {'lr': 0.0004990009671149811, 'samples': 1193088, 'steps': 6213, 'loss/train': 1.9133497476577759} -11/06/2021 22:07:24 - INFO - __main__ - Step 6215: {'lr': 0.0004990004931130133, 'samples': 1193280, 'steps': 6214, 'loss/train': 2.055999994277954} -11/06/2021 22:07:25 - INFO - __main__ - Step 6216: {'lr': 0.0004990000189988497, 'samples': 1193472, 'steps': 6215, 'loss/train': 2.248798370361328} -11/06/2021 22:07:25 - INFO - __main__ - Step 6217: {'lr': 0.0004989995447724907, 'samples': 1193664, 'steps': 6216, 'loss/train': 1.8303406238555908} -11/06/2021 22:07:26 - INFO - __main__ - Step 6218: {'lr': 0.0004989990704339361, 'samples': 1193856, 'steps': 6217, 'loss/train': 1.0167715549468994} -11/06/2021 22:07:26 - INFO - __main__ - Step 6219: {'lr': 0.0004989985959831865, 'samples': 1194048, 'steps': 6218, 'loss/train': 1.4236408472061157} -11/06/2021 22:07:27 - INFO - __main__ - Step 6220: {'lr': 0.0004989981214202419, 'samples': 1194240, 'steps': 6219, 'loss/train': 2.0307483673095703} -11/06/2021 22:07:28 - INFO - __main__ - Step 6221: {'lr': 0.0004989976467451026, 'samples': 1194432, 'steps': 6220, 'loss/train': 2.141268253326416} -11/06/2021 22:07:28 - INFO - __main__ - Step 6222: {'lr': 0.0004989971719577688, 'samples': 1194624, 'steps': 6221, 'loss/train': 1.8791309595108032} -11/06/2021 22:07:28 - INFO - __main__ - Step 6223: {'lr': 0.0004989966970582408, 'samples': 1194816, 'steps': 6222, 'loss/train': 1.7829779386520386} -11/06/2021 22:07:29 - INFO - __main__ - Step 6224: {'lr': 0.0004989962220465187, 'samples': 1195008, 'steps': 6223, 'loss/train': 4.018397331237793} -11/06/2021 22:07:29 - INFO - __main__ - Step 6225: {'lr': 0.0004989957469226027, 'samples': 1195200, 'steps': 6224, 'loss/train': 0.3159443736076355} -11/06/2021 22:07:30 - INFO - __main__ - Step 6226: {'lr': 0.0004989952716864931, 'samples': 1195392, 'steps': 6225, 'loss/train': 2.1702065467834473} -11/06/2021 22:07:30 - INFO - __main__ - Step 6227: {'lr': 0.00049899479633819, 'samples': 1195584, 'steps': 6226, 'loss/train': 1.8308675289154053} -11/06/2021 22:07:31 - INFO - __main__ - Step 6228: {'lr': 0.0004989943208776938, 'samples': 1195776, 'steps': 6227, 'loss/train': 2.180677890777588} -11/06/2021 22:07:31 - INFO - __main__ - Step 6229: {'lr': 0.0004989938453050045, 'samples': 1195968, 'steps': 6228, 'loss/train': 1.6663007736206055} -11/06/2021 22:07:31 - INFO - __main__ - Step 6230: {'lr': 0.0004989933696201225, 'samples': 1196160, 'steps': 6229, 'loss/train': 1.936288595199585} -11/06/2021 22:07:33 - INFO - __main__ - Step 6231: {'lr': 0.0004989928938230478, 'samples': 1196352, 'steps': 6230, 'loss/train': 2.008770227432251} -11/06/2021 22:07:33 - INFO - __main__ - Step 6232: {'lr': 0.0004989924179137808, 'samples': 1196544, 'steps': 6231, 'loss/train': 2.004091501235962} -11/06/2021 22:07:33 - INFO - __main__ - Step 6233: {'lr': 0.0004989919418923218, 'samples': 1196736, 'steps': 6232, 'loss/train': 1.9655420780181885} -11/06/2021 22:07:34 - INFO - __main__ - Step 6234: {'lr': 0.0004989914657586707, 'samples': 1196928, 'steps': 6233, 'loss/train': 1.8493226766586304} -11/06/2021 22:07:34 - INFO - __main__ - Step 6235: {'lr': 0.000498990989512828, 'samples': 1197120, 'steps': 6234, 'loss/train': 2.194037675857544} -11/06/2021 22:07:35 - INFO - __main__ - Step 6236: {'lr': 0.0004989905131547937, 'samples': 1197312, 'steps': 6235, 'loss/train': 2.581127643585205} -11/06/2021 22:07:35 - INFO - __main__ - Step 6237: {'lr': 0.0004989900366845682, 'samples': 1197504, 'steps': 6236, 'loss/train': 2.2226333618164062} -11/06/2021 22:07:36 - INFO - __main__ - Step 6238: {'lr': 0.0004989895601021515, 'samples': 1197696, 'steps': 6237, 'loss/train': 2.466501235961914} -11/06/2021 22:07:36 - INFO - __main__ - Step 6239: {'lr': 0.0004989890834075441, 'samples': 1197888, 'steps': 6238, 'loss/train': 1.5966987609863281} -11/06/2021 22:07:36 - INFO - __main__ - Step 6240: {'lr': 0.000498988606600746, 'samples': 1198080, 'steps': 6239, 'loss/train': 1.8267741203308105} -11/06/2021 22:07:37 - INFO - __main__ - Step 6241: {'lr': 0.0004989881296817575, 'samples': 1198272, 'steps': 6240, 'loss/train': 2.1044561862945557} -11/06/2021 22:07:38 - INFO - __main__ - Step 6242: {'lr': 0.0004989876526505788, 'samples': 1198464, 'steps': 6241, 'loss/train': 1.7580589056015015} -11/06/2021 22:07:38 - INFO - __main__ - Step 6243: {'lr': 0.0004989871755072101, 'samples': 1198656, 'steps': 6242, 'loss/train': 1.8593974113464355} -11/06/2021 22:07:38 - INFO - __main__ - Step 6244: {'lr': 0.0004989866982516516, 'samples': 1198848, 'steps': 6243, 'loss/train': 1.7739224433898926} -11/06/2021 22:07:39 - INFO - __main__ - Step 6245: {'lr': 0.0004989862208839035, 'samples': 1199040, 'steps': 6244, 'loss/train': 2.1439409255981445} -11/06/2021 22:07:40 - INFO - __main__ - Step 6246: {'lr': 0.0004989857434039661, 'samples': 1199232, 'steps': 6245, 'loss/train': 1.7785552740097046} -11/06/2021 22:07:40 - INFO - __main__ - Step 6247: {'lr': 0.0004989852658118395, 'samples': 1199424, 'steps': 6246, 'loss/train': 0.6885305047035217} -11/06/2021 22:07:41 - INFO - __main__ - Step 6248: {'lr': 0.000498984788107524, 'samples': 1199616, 'steps': 6247, 'loss/train': 1.918849229812622} -11/06/2021 22:07:41 - INFO - __main__ - Step 6249: {'lr': 0.0004989843102910198, 'samples': 1199808, 'steps': 6248, 'loss/train': 1.5366085767745972} -11/06/2021 22:07:41 - INFO - __main__ - Step 6250: {'lr': 0.0004989838323623272, 'samples': 1200000, 'steps': 6249, 'loss/train': 2.3803365230560303} -11/06/2021 22:07:42 - INFO - __main__ - Step 6251: {'lr': 0.0004989833543214463, 'samples': 1200192, 'steps': 6250, 'loss/train': 1.9775062799453735} -11/06/2021 22:07:43 - INFO - __main__ - Step 6252: {'lr': 0.0004989828761683774, 'samples': 1200384, 'steps': 6251, 'loss/train': 1.7551454305648804} -11/06/2021 22:07:43 - INFO - __main__ - Step 6253: {'lr': 0.0004989823979031205, 'samples': 1200576, 'steps': 6252, 'loss/train': 1.5888711214065552} -11/06/2021 22:07:43 - INFO - __main__ - Step 6254: {'lr': 0.000498981919525676, 'samples': 1200768, 'steps': 6253, 'loss/train': 1.925179362297058} -11/06/2021 22:07:44 - INFO - __main__ - Step 6255: {'lr': 0.0004989814410360442, 'samples': 1200960, 'steps': 6254, 'loss/train': 0.6360993981361389} -11/06/2021 22:07:45 - INFO - __main__ - Step 6256: {'lr': 0.0004989809624342251, 'samples': 1201152, 'steps': 6255, 'loss/train': 1.8095260858535767} -11/06/2021 22:07:45 - INFO - __main__ - Step 6257: {'lr': 0.000498980483720219, 'samples': 1201344, 'steps': 6256, 'loss/train': 1.7746502161026} -11/06/2021 22:07:46 - INFO - __main__ - Step 6258: {'lr': 0.0004989800048940263, 'samples': 1201536, 'steps': 6257, 'loss/train': 2.096313953399658} -11/06/2021 22:07:46 - INFO - __main__ - Step 6259: {'lr': 0.0004989795259556469, 'samples': 1201728, 'steps': 6258, 'loss/train': 2.1959168910980225} -11/06/2021 22:07:46 - INFO - __main__ - Step 6260: {'lr': 0.0004989790469050813, 'samples': 1201920, 'steps': 6259, 'loss/train': 1.8663018941879272} -11/06/2021 22:07:47 - INFO - __main__ - Step 6261: {'lr': 0.0004989785677423295, 'samples': 1202112, 'steps': 6260, 'loss/train': 1.3765881061553955} -11/06/2021 22:07:47 - INFO - __main__ - Step 6262: {'lr': 0.0004989780884673917, 'samples': 1202304, 'steps': 6261, 'loss/train': 2.113983631134033} -11/06/2021 22:07:48 - INFO - __main__ - Step 6263: {'lr': 0.0004989776090802683, 'samples': 1202496, 'steps': 6262, 'loss/train': 2.6338729858398438} -11/06/2021 22:07:48 - INFO - __main__ - Step 6264: {'lr': 0.0004989771295809594, 'samples': 1202688, 'steps': 6263, 'loss/train': 1.5440324544906616} -11/06/2021 22:07:49 - INFO - __main__ - Step 6265: {'lr': 0.0004989766499694653, 'samples': 1202880, 'steps': 6264, 'loss/train': 2.112800121307373} -11/06/2021 22:07:50 - INFO - __main__ - Step 6266: {'lr': 0.0004989761702457862, 'samples': 1203072, 'steps': 6265, 'loss/train': 1.9621334075927734} -11/06/2021 22:07:50 - INFO - __main__ - Step 6267: {'lr': 0.0004989756904099222, 'samples': 1203264, 'steps': 6266, 'loss/train': 2.0875959396362305} -11/06/2021 22:07:50 - INFO - __main__ - Step 6268: {'lr': 0.0004989752104618736, 'samples': 1203456, 'steps': 6267, 'loss/train': 2.009376287460327} -11/06/2021 22:07:51 - INFO - __main__ - Step 6269: {'lr': 0.0004989747304016407, 'samples': 1203648, 'steps': 6268, 'loss/train': 2.29427433013916} -11/06/2021 22:07:51 - INFO - __main__ - Step 6270: {'lr': 0.0004989742502292235, 'samples': 1203840, 'steps': 6269, 'loss/train': 2.1417438983917236} -11/06/2021 22:07:52 - INFO - __main__ - Step 6271: {'lr': 0.0004989737699446225, 'samples': 1204032, 'steps': 6270, 'loss/train': 1.981139063835144} -11/06/2021 22:07:52 - INFO - __main__ - Step 6272: {'lr': 0.0004989732895478376, 'samples': 1204224, 'steps': 6271, 'loss/train': 1.8909876346588135} -11/06/2021 22:07:53 - INFO - __main__ - Step 6273: {'lr': 0.0004989728090388693, 'samples': 1204416, 'steps': 6272, 'loss/train': 1.6940367221832275} -11/06/2021 22:07:53 - INFO - __main__ - Step 6274: {'lr': 0.0004989723284177177, 'samples': 1204608, 'steps': 6273, 'loss/train': 2.325897216796875} -11/06/2021 22:07:53 - INFO - __main__ - Step 6275: {'lr': 0.0004989718476843828, 'samples': 1204800, 'steps': 6274, 'loss/train': 1.9315811395645142} -11/06/2021 22:07:54 - INFO - __main__ - Step 6276: {'lr': 0.0004989713668388652, 'samples': 1204992, 'steps': 6275, 'loss/train': 1.894089937210083} -11/06/2021 22:07:55 - INFO - __main__ - Step 6277: {'lr': 0.000498970885881165, 'samples': 1205184, 'steps': 6276, 'loss/train': 1.7275776863098145} -11/06/2021 22:07:55 - INFO - __main__ - Step 6278: {'lr': 0.0004989704048112823, 'samples': 1205376, 'steps': 6277, 'loss/train': 2.880239486694336} -11/06/2021 22:07:55 - INFO - __main__ - Step 6279: {'lr': 0.0004989699236292173, 'samples': 1205568, 'steps': 6278, 'loss/train': 1.9111852645874023} -11/06/2021 22:07:56 - INFO - __main__ - Step 6280: {'lr': 0.0004989694423349704, 'samples': 1205760, 'steps': 6279, 'loss/train': 2.0868144035339355} -11/06/2021 22:07:57 - INFO - __main__ - Step 6281: {'lr': 0.0004989689609285417, 'samples': 1205952, 'steps': 6280, 'loss/train': 2.3991446495056152} -11/06/2021 22:07:57 - INFO - __main__ - Step 6282: {'lr': 0.0004989684794099314, 'samples': 1206144, 'steps': 6281, 'loss/train': 1.962192177772522} -11/06/2021 22:07:57 - INFO - __main__ - Step 6283: {'lr': 0.0004989679977791397, 'samples': 1206336, 'steps': 6282, 'loss/train': 2.007171630859375} -11/06/2021 22:07:58 - INFO - __main__ - Step 6284: {'lr': 0.0004989675160361669, 'samples': 1206528, 'steps': 6283, 'loss/train': 2.0830070972442627} -11/06/2021 22:07:58 - INFO - __main__ - Step 6285: {'lr': 0.0004989670341810132, 'samples': 1206720, 'steps': 6284, 'loss/train': 1.7555127143859863} -11/06/2021 22:07:59 - INFO - __main__ - Step 6286: {'lr': 0.0004989665522136789, 'samples': 1206912, 'steps': 6285, 'loss/train': 1.7010811567306519} -11/06/2021 22:08:00 - INFO - __main__ - Step 6287: {'lr': 0.0004989660701341639, 'samples': 1207104, 'steps': 6286, 'loss/train': 1.6270495653152466} -11/06/2021 22:08:00 - INFO - __main__ - Step 6288: {'lr': 0.0004989655879424687, 'samples': 1207296, 'steps': 6287, 'loss/train': 0.33006778359413147} -11/06/2021 22:08:00 - INFO - __main__ - Step 6289: {'lr': 0.0004989651056385936, 'samples': 1207488, 'steps': 6288, 'loss/train': 1.9551554918289185} -11/06/2021 22:08:01 - INFO - __main__ - Step 6290: {'lr': 0.0004989646232225384, 'samples': 1207680, 'steps': 6289, 'loss/train': 5.657275199890137} -11/06/2021 22:08:01 - INFO - __main__ - Step 6291: {'lr': 0.0004989641406943037, 'samples': 1207872, 'steps': 6290, 'loss/train': 1.931122899055481} -11/06/2021 22:08:02 - INFO - __main__ - Step 6292: {'lr': 0.0004989636580538896, 'samples': 1208064, 'steps': 6291, 'loss/train': 1.3750081062316895} -11/06/2021 22:08:02 - INFO - __main__ - Step 6293: {'lr': 0.0004989631753012964, 'samples': 1208256, 'steps': 6292, 'loss/train': 2.0061533451080322} -11/06/2021 22:08:03 - INFO - __main__ - Step 6294: {'lr': 0.0004989626924365242, 'samples': 1208448, 'steps': 6293, 'loss/train': 1.9302148818969727} -11/06/2021 22:08:03 - INFO - __main__ - Step 6295: {'lr': 0.0004989622094595733, 'samples': 1208640, 'steps': 6294, 'loss/train': 2.0548641681671143} -11/06/2021 22:08:03 - INFO - __main__ - Step 6296: {'lr': 0.0004989617263704437, 'samples': 1208832, 'steps': 6295, 'loss/train': 1.7614363431930542} -11/06/2021 22:08:05 - INFO - __main__ - Step 6297: {'lr': 0.0004989612431691359, 'samples': 1209024, 'steps': 6296, 'loss/train': 1.5389564037322998} -11/06/2021 22:08:05 - INFO - __main__ - Step 6298: {'lr': 0.0004989607598556501, 'samples': 1209216, 'steps': 6297, 'loss/train': 2.1703968048095703} -11/06/2021 22:08:05 - INFO - __main__ - Step 6299: {'lr': 0.0004989602764299862, 'samples': 1209408, 'steps': 6298, 'loss/train': 1.22577702999115} -11/06/2021 22:08:06 - INFO - __main__ - Step 6300: {'lr': 0.0004989597928921447, 'samples': 1209600, 'steps': 6299, 'loss/train': 2.2829113006591797} -11/06/2021 22:08:06 - INFO - __main__ - Step 6301: {'lr': 0.0004989593092421258, 'samples': 1209792, 'steps': 6300, 'loss/train': 1.3044848442077637} -11/06/2021 22:08:06 - INFO - __main__ - Step 6302: {'lr': 0.0004989588254799297, 'samples': 1209984, 'steps': 6301, 'loss/train': 1.8990617990493774} -11/06/2021 22:08:07 - INFO - __main__ - Step 6303: {'lr': 0.0004989583416055566, 'samples': 1210176, 'steps': 6302, 'loss/train': 1.9017807245254517} -11/06/2021 22:08:08 - INFO - __main__ - Step 6304: {'lr': 0.0004989578576190068, 'samples': 1210368, 'steps': 6303, 'loss/train': 2.0887370109558105} -11/06/2021 22:08:08 - INFO - __main__ - Step 6305: {'lr': 0.0004989573735202802, 'samples': 1210560, 'steps': 6304, 'loss/train': 1.910634994506836} -11/06/2021 22:08:08 - INFO - __main__ - Step 6306: {'lr': 0.0004989568893093774, 'samples': 1210752, 'steps': 6305, 'loss/train': 1.4305139780044556} -11/06/2021 22:08:09 - INFO - __main__ - Step 6307: {'lr': 0.0004989564049862986, 'samples': 1210944, 'steps': 6306, 'loss/train': 1.7775681018829346} -11/06/2021 22:08:10 - INFO - __main__ - Step 6308: {'lr': 0.0004989559205510436, 'samples': 1211136, 'steps': 6307, 'loss/train': 1.7592074871063232} -11/06/2021 22:08:10 - INFO - __main__ - Step 6309: {'lr': 0.000498955436003613, 'samples': 1211328, 'steps': 6308, 'loss/train': 1.7411454916000366} -11/06/2021 22:08:10 - INFO - __main__ - Step 6310: {'lr': 0.0004989549513440071, 'samples': 1211520, 'steps': 6309, 'loss/train': 2.116926431655884} -11/06/2021 22:08:11 - INFO - __main__ - Step 6311: {'lr': 0.0004989544665722258, 'samples': 1211712, 'steps': 6310, 'loss/train': 1.8361932039260864} -11/06/2021 22:08:11 - INFO - __main__ - Step 6312: {'lr': 0.0004989539816882694, 'samples': 1211904, 'steps': 6311, 'loss/train': 1.3926923274993896} -11/06/2021 22:08:12 - INFO - __main__ - Step 6313: {'lr': 0.0004989534966921382, 'samples': 1212096, 'steps': 6312, 'loss/train': 1.8578460216522217} -11/06/2021 22:08:13 - INFO - __main__ - Step 6314: {'lr': 0.0004989530115838324, 'samples': 1212288, 'steps': 6313, 'loss/train': 2.0698132514953613} -11/06/2021 22:08:13 - INFO - __main__ - Step 6315: {'lr': 0.0004989525263633523, 'samples': 1212480, 'steps': 6314, 'loss/train': 1.3116508722305298} -11/06/2021 22:08:13 - INFO - __main__ - Step 6316: {'lr': 0.0004989520410306979, 'samples': 1212672, 'steps': 6315, 'loss/train': 1.9149450063705444} -11/06/2021 22:08:14 - INFO - __main__ - Step 6317: {'lr': 0.0004989515555858697, 'samples': 1212864, 'steps': 6316, 'loss/train': 2.206059694290161} -11/06/2021 22:08:15 - INFO - __main__ - Step 6318: {'lr': 0.0004989510700288678, 'samples': 1213056, 'steps': 6317, 'loss/train': 1.6991815567016602} -11/06/2021 22:08:15 - INFO - __main__ - Step 6319: {'lr': 0.0004989505843596922, 'samples': 1213248, 'steps': 6318, 'loss/train': 2.7226216793060303} -11/06/2021 22:08:15 - INFO - __main__ - Step 6320: {'lr': 0.0004989500985783434, 'samples': 1213440, 'steps': 6319, 'loss/train': 2.1540679931640625} -11/06/2021 22:08:16 - INFO - __main__ - Step 6321: {'lr': 0.0004989496126848215, 'samples': 1213632, 'steps': 6320, 'loss/train': 1.8948540687561035} -11/06/2021 22:08:16 - INFO - __main__ - Step 6322: {'lr': 0.0004989491266791268, 'samples': 1213824, 'steps': 6321, 'loss/train': 1.8643752336502075} -11/06/2021 22:08:17 - INFO - __main__ - Step 6323: {'lr': 0.0004989486405612595, 'samples': 1214016, 'steps': 6322, 'loss/train': 1.8771063089370728} -11/06/2021 22:08:18 - INFO - __main__ - Step 6324: {'lr': 0.0004989481543312196, 'samples': 1214208, 'steps': 6323, 'loss/train': 1.7344616651535034} -11/06/2021 22:08:18 - INFO - __main__ - Step 6325: {'lr': 0.0004989476679890077, 'samples': 1214400, 'steps': 6324, 'loss/train': 1.7559272050857544} -11/06/2021 22:08:18 - INFO - __main__ - Step 6326: {'lr': 0.0004989471815346237, 'samples': 1214592, 'steps': 6325, 'loss/train': 2.1662731170654297} -11/06/2021 22:08:19 - INFO - __main__ - Step 6327: {'lr': 0.000498946694968068, 'samples': 1214784, 'steps': 6326, 'loss/train': 2.0608224868774414} -11/06/2021 22:08:19 - INFO - __main__ - Step 6328: {'lr': 0.0004989462082893407, 'samples': 1214976, 'steps': 6327, 'loss/train': 2.2688443660736084} -11/06/2021 22:08:20 - INFO - __main__ - Step 6329: {'lr': 0.0004989457214984421, 'samples': 1215168, 'steps': 6328, 'loss/train': 2.0150251388549805} -11/06/2021 22:08:20 - INFO - __main__ - Step 6330: {'lr': 0.0004989452345953725, 'samples': 1215360, 'steps': 6329, 'loss/train': 1.8572430610656738} -11/06/2021 22:08:21 - INFO - __main__ - Step 6331: {'lr': 0.000498944747580132, 'samples': 1215552, 'steps': 6330, 'loss/train': 1.986055850982666} -11/06/2021 22:08:21 - INFO - __main__ - Step 6332: {'lr': 0.0004989442604527208, 'samples': 1215744, 'steps': 6331, 'loss/train': 1.7587941884994507} -11/06/2021 22:08:21 - INFO - __main__ - Step 6333: {'lr': 0.0004989437732131391, 'samples': 1215936, 'steps': 6332, 'loss/train': 1.8428518772125244} -11/06/2021 22:08:23 - INFO - __main__ - Step 6334: {'lr': 0.0004989432858613873, 'samples': 1216128, 'steps': 6333, 'loss/train': 2.1033074855804443} -11/06/2021 22:08:23 - INFO - __main__ - Step 6335: {'lr': 0.0004989427983974653, 'samples': 1216320, 'steps': 6334, 'loss/train': 1.3180185556411743} -11/06/2021 22:08:23 - INFO - __main__ - Step 6336: {'lr': 0.0004989423108213737, 'samples': 1216512, 'steps': 6335, 'loss/train': 2.3260984420776367} -11/06/2021 22:08:24 - INFO - __main__ - Step 6337: {'lr': 0.0004989418231331124, 'samples': 1216704, 'steps': 6336, 'loss/train': 2.056525230407715} -11/06/2021 22:08:24 - INFO - __main__ - Step 6338: {'lr': 0.0004989413353326818, 'samples': 1216896, 'steps': 6337, 'loss/train': 2.151630401611328} -11/06/2021 22:08:25 - INFO - __main__ - Step 6339: {'lr': 0.0004989408474200821, 'samples': 1217088, 'steps': 6338, 'loss/train': 0.4232385456562042} -11/06/2021 22:08:25 - INFO - __main__ - Step 6340: {'lr': 0.0004989403593953135, 'samples': 1217280, 'steps': 6339, 'loss/train': 2.0424396991729736} -11/06/2021 22:08:26 - INFO - __main__ - Step 6341: {'lr': 0.0004989398712583762, 'samples': 1217472, 'steps': 6340, 'loss/train': 1.5621088743209839} -11/06/2021 22:08:26 - INFO - __main__ - Step 6342: {'lr': 0.0004989393830092705, 'samples': 1217664, 'steps': 6341, 'loss/train': 2.555983781814575} -11/06/2021 22:08:26 - INFO - __main__ - Step 6343: {'lr': 0.0004989388946479965, 'samples': 1217856, 'steps': 6342, 'loss/train': 1.820717692375183} -11/06/2021 22:08:27 - INFO - __main__ - Step 6344: {'lr': 0.0004989384061745545, 'samples': 1218048, 'steps': 6343, 'loss/train': 1.8627382516860962} -11/06/2021 22:08:28 - INFO - __main__ - Step 6345: {'lr': 0.0004989379175889447, 'samples': 1218240, 'steps': 6344, 'loss/train': 2.2447197437286377} -11/06/2021 22:08:28 - INFO - __main__ - Step 6346: {'lr': 0.0004989374288911672, 'samples': 1218432, 'steps': 6345, 'loss/train': 2.0814595222473145} -11/06/2021 22:08:28 - INFO - __main__ - Step 6347: {'lr': 0.0004989369400812225, 'samples': 1218624, 'steps': 6346, 'loss/train': 1.2773443460464478} -11/06/2021 22:08:29 - INFO - __main__ - Step 6348: {'lr': 0.0004989364511591106, 'samples': 1218816, 'steps': 6347, 'loss/train': 1.5852837562561035} -11/06/2021 22:08:29 - INFO - __main__ - Step 6349: {'lr': 0.0004989359621248317, 'samples': 1219008, 'steps': 6348, 'loss/train': 1.5508657693862915} -11/06/2021 22:08:30 - INFO - __main__ - Step 6350: {'lr': 0.0004989354729783861, 'samples': 1219200, 'steps': 6349, 'loss/train': 1.6555392742156982} -11/06/2021 22:08:31 - INFO - __main__ - Step 6351: {'lr': 0.0004989349837197742, 'samples': 1219392, 'steps': 6350, 'loss/train': 1.6861871480941772} -11/06/2021 22:08:31 - INFO - __main__ - Step 6352: {'lr': 0.0004989344943489958, 'samples': 1219584, 'steps': 6351, 'loss/train': 2.0413320064544678} -11/06/2021 22:08:31 - INFO - __main__ - Step 6353: {'lr': 0.0004989340048660515, 'samples': 1219776, 'steps': 6352, 'loss/train': 2.444296360015869} -11/06/2021 22:08:32 - INFO - __main__ - Step 6354: {'lr': 0.0004989335152709414, 'samples': 1219968, 'steps': 6353, 'loss/train': 2.159029245376587} -11/06/2021 22:08:33 - INFO - __main__ - Step 6355: {'lr': 0.0004989330255636656, 'samples': 1220160, 'steps': 6354, 'loss/train': 1.5128992795944214} -11/06/2021 22:08:33 - INFO - __main__ - Step 6356: {'lr': 0.0004989325357442245, 'samples': 1220352, 'steps': 6355, 'loss/train': 1.8759398460388184} -11/06/2021 22:08:33 - INFO - __main__ - Step 6357: {'lr': 0.0004989320458126182, 'samples': 1220544, 'steps': 6356, 'loss/train': 1.6384868621826172} -11/06/2021 22:08:34 - INFO - __main__ - Step 6358: {'lr': 0.0004989315557688469, 'samples': 1220736, 'steps': 6357, 'loss/train': 2.0724997520446777} -11/06/2021 22:08:34 - INFO - __main__ - Step 6359: {'lr': 0.000498931065612911, 'samples': 1220928, 'steps': 6358, 'loss/train': 1.3788177967071533} -11/06/2021 22:08:35 - INFO - __main__ - Step 6360: {'lr': 0.0004989305753448106, 'samples': 1221120, 'steps': 6359, 'loss/train': 1.6440093517303467} -11/06/2021 22:08:35 - INFO - __main__ - Step 6361: {'lr': 0.0004989300849645459, 'samples': 1221312, 'steps': 6360, 'loss/train': 0.8680780529975891} -11/06/2021 22:08:36 - INFO - __main__ - Step 6362: {'lr': 0.0004989295944721171, 'samples': 1221504, 'steps': 6361, 'loss/train': 1.834447979927063} -11/06/2021 22:08:36 - INFO - __main__ - Step 6363: {'lr': 0.0004989291038675245, 'samples': 1221696, 'steps': 6362, 'loss/train': 2.109246015548706} -11/06/2021 22:08:36 - INFO - __main__ - Step 6364: {'lr': 0.0004989286131507682, 'samples': 1221888, 'steps': 6363, 'loss/train': 2.3124148845672607} -11/06/2021 22:08:37 - INFO - __main__ - Step 6365: {'lr': 0.0004989281223218486, 'samples': 1222080, 'steps': 6364, 'loss/train': 2.2666964530944824} -11/06/2021 22:08:38 - INFO - __main__ - Step 6366: {'lr': 0.0004989276313807658, 'samples': 1222272, 'steps': 6365, 'loss/train': 2.1086597442626953} -11/06/2021 22:08:38 - INFO - __main__ - Step 6367: {'lr': 0.00049892714032752, 'samples': 1222464, 'steps': 6366, 'loss/train': 1.7961052656173706} -11/06/2021 22:08:39 - INFO - __main__ - Step 6368: {'lr': 0.0004989266491621117, 'samples': 1222656, 'steps': 6367, 'loss/train': 1.7916598320007324} -11/06/2021 22:08:39 - INFO - __main__ - Step 6369: {'lr': 0.0004989261578845406, 'samples': 1222848, 'steps': 6368, 'loss/train': 2.015110731124878} -11/06/2021 22:08:40 - INFO - __main__ - Step 6370: {'lr': 0.0004989256664948073, 'samples': 1223040, 'steps': 6369, 'loss/train': 1.7681583166122437} -11/06/2021 22:08:40 - INFO - __main__ - Step 6371: {'lr': 0.000498925174992912, 'samples': 1223232, 'steps': 6370, 'loss/train': 2.142261266708374} -11/06/2021 22:08:41 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 1.6870710849761963} -11/06/2021 22:08:41 - INFO - __main__ - Step 6373: {'lr': 0.000498924191652636, 'samples': 1223616, 'steps': 6372, 'loss/train': 1.6174527406692505} -11/06/2021 22:08:41 - INFO - __main__ - Step 6374: {'lr': 0.0004989236998142559, 'samples': 1223808, 'steps': 6373, 'loss/train': 1.6731904745101929} -11/06/2021 22:08:42 - INFO - __main__ - Step 6375: {'lr': 0.0004989232078637145, 'samples': 1224000, 'steps': 6374, 'loss/train': 1.9477375745773315} -11/06/2021 22:08:44 - INFO - __main__ - Step 6376: {'lr': 0.0004989227158010123, 'samples': 1224192, 'steps': 6375, 'loss/train': 1.9696638584136963} -11/06/2021 22:08:44 - INFO - __main__ - Step 6377: {'lr': 0.0004989222236261491, 'samples': 1224384, 'steps': 6376, 'loss/train': 2.0389769077301025} -11/06/2021 22:08:45 - INFO - __main__ - Step 6378: {'lr': 0.0004989217313391256, 'samples': 1224576, 'steps': 6377, 'loss/train': 1.981373906135559} -11/06/2021 22:08:45 - INFO - __main__ - Step 6379: {'lr': 0.0004989212389399417, 'samples': 1224768, 'steps': 6378, 'loss/train': 1.8569397926330566} -11/06/2021 22:08:46 - INFO - __main__ - Step 6380: {'lr': 0.0004989207464285978, 'samples': 1224960, 'steps': 6379, 'loss/train': 1.8618382215499878} -11/06/2021 22:08:46 - INFO - __main__ - Step 6381: {'lr': 0.0004989202538050939, 'samples': 1225152, 'steps': 6380, 'loss/train': 1.969157099723816} -11/06/2021 22:08:46 - INFO - __main__ - Step 6382: {'lr': 0.0004989197610694306, 'samples': 1225344, 'steps': 6381, 'loss/train': 4.056380748748779} -11/06/2021 22:08:47 - INFO - __main__ - Step 6383: {'lr': 0.0004989192682216078, 'samples': 1225536, 'steps': 6382, 'loss/train': 2.3175463676452637} -11/06/2021 22:08:48 - INFO - __main__ - Step 6384: {'lr': 0.0004989187752616258, 'samples': 1225728, 'steps': 6383, 'loss/train': 2.1582441329956055} -11/06/2021 22:08:48 - INFO - __main__ - Step 6385: {'lr': 0.0004989182821894849, 'samples': 1225920, 'steps': 6384, 'loss/train': 1.9625952243804932} -11/06/2021 22:08:48 - INFO - __main__ - Step 6386: {'lr': 0.0004989177890051852, 'samples': 1226112, 'steps': 6385, 'loss/train': 2.3441145420074463} -11/06/2021 22:08:49 - INFO - __main__ - Step 6387: {'lr': 0.000498917295708727, 'samples': 1226304, 'steps': 6386, 'loss/train': 2.260986328125} -11/06/2021 22:08:49 - INFO - __main__ - Step 6388: {'lr': 0.0004989168023001105, 'samples': 1226496, 'steps': 6387, 'loss/train': 2.005218029022217} -11/06/2021 22:08:50 - INFO - __main__ - Step 6389: {'lr': 0.0004989163087793359, 'samples': 1226688, 'steps': 6388, 'loss/train': 1.657336950302124} -11/06/2021 22:08:50 - INFO - __main__ - Step 6390: {'lr': 0.0004989158151464036, 'samples': 1226880, 'steps': 6389, 'loss/train': 1.1649143695831299} -11/06/2021 22:08:51 - INFO - __main__ - Step 6391: {'lr': 0.0004989153214013135, 'samples': 1227072, 'steps': 6390, 'loss/train': 2.1878926753997803} -11/06/2021 22:08:51 - INFO - __main__ - Step 6392: {'lr': 0.0004989148275440661, 'samples': 1227264, 'steps': 6391, 'loss/train': 2.312974691390991} -11/06/2021 22:08:51 - INFO - __main__ - Step 6393: {'lr': 0.0004989143335746614, 'samples': 1227456, 'steps': 6392, 'loss/train': 2.0476460456848145} -11/06/2021 22:08:52 - INFO - __main__ - Step 6394: {'lr': 0.0004989138394930998, 'samples': 1227648, 'steps': 6393, 'loss/train': 2.358633518218994} -11/06/2021 22:08:53 - INFO - __main__ - Step 6395: {'lr': 0.0004989133452993816, 'samples': 1227840, 'steps': 6394, 'loss/train': 1.8311744928359985} -11/06/2021 22:08:53 - INFO - __main__ - Step 6396: {'lr': 0.0004989128509935068, 'samples': 1228032, 'steps': 6395, 'loss/train': 1.4626703262329102} -11/06/2021 22:08:53 - INFO - __main__ - Step 6397: {'lr': 0.0004989123565754756, 'samples': 1228224, 'steps': 6396, 'loss/train': 2.180896043777466} -11/06/2021 22:08:54 - INFO - __main__ - Step 6398: {'lr': 0.0004989118620452884, 'samples': 1228416, 'steps': 6397, 'loss/train': 1.6816266775131226} -11/06/2021 22:08:55 - INFO - __main__ - Step 6399: {'lr': 0.0004989113674029454, 'samples': 1228608, 'steps': 6398, 'loss/train': 2.068782091140747} -11/06/2021 22:08:55 - INFO - __main__ - Step 6400: {'lr': 0.0004989108726484469, 'samples': 1228800, 'steps': 6399, 'loss/train': 2.064892530441284} -11/06/2021 22:08:55 - INFO - __main__ - Step 6401: {'lr': 0.0004989103777817928, 'samples': 1228992, 'steps': 6400, 'loss/train': 1.7987390756607056} -11/06/2021 22:08:56 - INFO - __main__ - Step 6402: {'lr': 0.0004989098828029836, 'samples': 1229184, 'steps': 6401, 'loss/train': 2.1822431087493896} -11/06/2021 22:08:56 - INFO - __main__ - Step 6403: {'lr': 0.0004989093877120194, 'samples': 1229376, 'steps': 6402, 'loss/train': 1.9657015800476074} -11/06/2021 22:08:58 - INFO - __main__ - Step 6404: {'lr': 0.0004989088925089005, 'samples': 1229568, 'steps': 6403, 'loss/train': 1.4904416799545288} -11/06/2021 22:08:58 - INFO - __main__ - Step 6405: {'lr': 0.0004989083971936271, 'samples': 1229760, 'steps': 6404, 'loss/train': 2.7258121967315674} -11/06/2021 22:08:58 - INFO - __main__ - Step 6406: {'lr': 0.0004989079017661994, 'samples': 1229952, 'steps': 6405, 'loss/train': 1.961512804031372} -11/06/2021 22:08:59 - INFO - __main__ - Step 6407: {'lr': 0.0004989074062266177, 'samples': 1230144, 'steps': 6406, 'loss/train': 5.536162853240967} -11/06/2021 22:08:59 - INFO - __main__ - Step 6408: {'lr': 0.0004989069105748821, 'samples': 1230336, 'steps': 6407, 'loss/train': 1.5103638172149658} -11/06/2021 22:08:59 - INFO - __main__ - Step 6409: {'lr': 0.0004989064148109929, 'samples': 1230528, 'steps': 6408, 'loss/train': 1.6851413249969482} -11/06/2021 22:09:00 - INFO - __main__ - Step 6410: {'lr': 0.0004989059189349503, 'samples': 1230720, 'steps': 6409, 'loss/train': 1.7821619510650635} -11/06/2021 22:09:01 - INFO - __main__ - Step 6411: {'lr': 0.0004989054229467546, 'samples': 1230912, 'steps': 6410, 'loss/train': 1.9058226346969604} -11/06/2021 22:09:01 - INFO - __main__ - Step 6412: {'lr': 0.0004989049268464058, 'samples': 1231104, 'steps': 6411, 'loss/train': 1.1312766075134277} -11/06/2021 22:09:01 - INFO - __main__ - Step 6413: {'lr': 0.0004989044306339044, 'samples': 1231296, 'steps': 6412, 'loss/train': 2.2100672721862793} -11/06/2021 22:09:02 - INFO - __main__ - Step 6414: {'lr': 0.0004989039343092505, 'samples': 1231488, 'steps': 6413, 'loss/train': 1.6702120304107666} -11/06/2021 22:09:03 - INFO - __main__ - Step 6415: {'lr': 0.0004989034378724443, 'samples': 1231680, 'steps': 6414, 'loss/train': 2.1043949127197266} -11/06/2021 22:09:03 - INFO - __main__ - Step 6416: {'lr': 0.0004989029413234861, 'samples': 1231872, 'steps': 6415, 'loss/train': 1.9456948041915894} -11/06/2021 22:09:03 - INFO - __main__ - Step 6417: {'lr': 0.000498902444662376, 'samples': 1232064, 'steps': 6416, 'loss/train': 2.429739475250244} -11/06/2021 22:09:04 - INFO - __main__ - Step 6418: {'lr': 0.0004989019478891144, 'samples': 1232256, 'steps': 6417, 'loss/train': 2.0660645961761475} -11/06/2021 22:09:04 - INFO - __main__ - Step 6419: {'lr': 0.0004989014510037013, 'samples': 1232448, 'steps': 6418, 'loss/train': 1.0096818208694458} -11/06/2021 22:09:05 - INFO - __main__ - Step 6420: {'lr': 0.0004989009540061373, 'samples': 1232640, 'steps': 6419, 'loss/train': 1.7009047269821167} -11/06/2021 22:09:05 - INFO - __main__ - Step 6421: {'lr': 0.0004989004568964221, 'samples': 1232832, 'steps': 6420, 'loss/train': 1.8998950719833374} -11/06/2021 22:09:06 - INFO - __main__ - Step 6422: {'lr': 0.0004988999596745562, 'samples': 1233024, 'steps': 6421, 'loss/train': 2.2160139083862305} -11/06/2021 22:09:06 - INFO - __main__ - Step 6423: {'lr': 0.00049889946234054, 'samples': 1233216, 'steps': 6422, 'loss/train': 1.466779351234436} -11/06/2021 22:09:07 - INFO - __main__ - Step 6424: {'lr': 0.0004988989648943734, 'samples': 1233408, 'steps': 6423, 'loss/train': 1.9524688720703125} -11/06/2021 22:09:08 - INFO - __main__ - Step 6425: {'lr': 0.0004988984673360568, 'samples': 1233600, 'steps': 6424, 'loss/train': 1.4690804481506348} -11/06/2021 22:09:08 - INFO - __main__ - Step 6426: {'lr': 0.0004988979696655904, 'samples': 1233792, 'steps': 6425, 'loss/train': 1.6141606569290161} -11/06/2021 22:09:08 - INFO - __main__ - Step 6427: {'lr': 0.0004988974718829744, 'samples': 1233984, 'steps': 6426, 'loss/train': 1.9417755603790283} -11/06/2021 22:09:09 - INFO - __main__ - Step 6428: {'lr': 0.0004988969739882091, 'samples': 1234176, 'steps': 6427, 'loss/train': 1.8715691566467285} -11/06/2021 22:09:09 - INFO - __main__ - Step 6429: {'lr': 0.0004988964759812946, 'samples': 1234368, 'steps': 6428, 'loss/train': 1.668321132659912} -11/06/2021 22:09:11 - INFO - __main__ - Step 6430: {'lr': 0.0004988959778622313, 'samples': 1234560, 'steps': 6429, 'loss/train': 1.9378490447998047} -11/06/2021 22:09:11 - INFO - __main__ - Step 6431: {'lr': 0.0004988954796310191, 'samples': 1234752, 'steps': 6430, 'loss/train': 1.9765774011611938} -11/06/2021 22:09:12 - INFO - __main__ - Step 6432: {'lr': 0.0004988949812876586, 'samples': 1234944, 'steps': 6431, 'loss/train': 1.7189645767211914} -11/06/2021 22:09:12 - INFO - __main__ - Step 6433: {'lr': 0.0004988944828321499, 'samples': 1235136, 'steps': 6432, 'loss/train': 1.8814183473587036} -11/06/2021 22:09:12 - INFO - __main__ - Step 6434: {'lr': 0.0004988939842644931, 'samples': 1235328, 'steps': 6433, 'loss/train': 1.60706627368927} -11/06/2021 22:09:13 - INFO - __main__ - Step 6435: {'lr': 0.0004988934855846885, 'samples': 1235520, 'steps': 6434, 'loss/train': 1.5853242874145508} -11/06/2021 22:09:13 - INFO - __main__ - Step 6436: {'lr': 0.0004988929867927363, 'samples': 1235712, 'steps': 6435, 'loss/train': 1.9436169862747192} -11/06/2021 22:09:13 - INFO - __main__ - Step 6437: {'lr': 0.0004988924878886368, 'samples': 1235904, 'steps': 6436, 'loss/train': 1.9640707969665527} -11/06/2021 22:09:15 - INFO - __main__ - Step 6438: {'lr': 0.0004988919888723902, 'samples': 1236096, 'steps': 6437, 'loss/train': 1.9225521087646484} -11/06/2021 22:09:15 - INFO - __main__ - Step 6439: {'lr': 0.0004988914897439968, 'samples': 1236288, 'steps': 6438, 'loss/train': 1.5273348093032837} -11/06/2021 22:09:15 - INFO - __main__ - Step 6440: {'lr': 0.0004988909905034566, 'samples': 1236480, 'steps': 6439, 'loss/train': 1.8240584135055542} -11/06/2021 22:09:16 - INFO - __main__ - Step 6441: {'lr': 0.00049889049115077, 'samples': 1236672, 'steps': 6440, 'loss/train': 1.741806983947754} -11/06/2021 22:09:16 - INFO - __main__ - Step 6442: {'lr': 0.0004988899916859372, 'samples': 1236864, 'steps': 6441, 'loss/train': 2.750673294067383} -11/06/2021 22:09:17 - INFO - __main__ - Step 6443: {'lr': 0.0004988894921089584, 'samples': 1237056, 'steps': 6442, 'loss/train': 1.7780988216400146} -11/06/2021 22:09:17 - INFO - __main__ - Step 6444: {'lr': 0.0004988889924198339, 'samples': 1237248, 'steps': 6443, 'loss/train': 1.9567726850509644} -11/06/2021 22:09:18 - INFO - __main__ - Step 6445: {'lr': 0.0004988884926185637, 'samples': 1237440, 'steps': 6444, 'loss/train': 1.8130319118499756} -11/06/2021 22:09:18 - INFO - __main__ - Step 6446: {'lr': 0.0004988879927051484, 'samples': 1237632, 'steps': 6445, 'loss/train': 1.573569655418396} -11/06/2021 22:09:18 - INFO - __main__ - Step 6447: {'lr': 0.0004988874926795878, 'samples': 1237824, 'steps': 6446, 'loss/train': 1.8743444681167603} -11/06/2021 22:09:19 - INFO - __main__ - Step 6448: {'lr': 0.0004988869925418825, 'samples': 1238016, 'steps': 6447, 'loss/train': 1.5253403186798096} -11/06/2021 22:09:20 - INFO - __main__ - Step 6449: {'lr': 0.0004988864922920325, 'samples': 1238208, 'steps': 6448, 'loss/train': 1.7076308727264404} -11/06/2021 22:09:20 - INFO - __main__ - Step 6450: {'lr': 0.000498885991930038, 'samples': 1238400, 'steps': 6449, 'loss/train': 2.227938413619995} -11/06/2021 22:09:20 - INFO - __main__ - Step 6451: {'lr': 0.0004988854914558994, 'samples': 1238592, 'steps': 6450, 'loss/train': 1.7760518789291382} -11/06/2021 22:09:21 - INFO - __main__ - Step 6452: {'lr': 0.0004988849908696169, 'samples': 1238784, 'steps': 6451, 'loss/train': 2.213900566101074} -11/06/2021 22:09:21 - INFO - __main__ - Step 6453: {'lr': 0.0004988844901711905, 'samples': 1238976, 'steps': 6452, 'loss/train': 2.0823049545288086} -11/06/2021 22:09:22 - INFO - __main__ - Step 6454: {'lr': 0.0004988839893606208, 'samples': 1239168, 'steps': 6453, 'loss/train': 1.9034770727157593} -11/06/2021 22:09:23 - INFO - __main__ - Step 6455: {'lr': 0.0004988834884379076, 'samples': 1239360, 'steps': 6454, 'loss/train': 1.2255651950836182} -11/06/2021 22:09:23 - INFO - __main__ - Step 6456: {'lr': 0.0004988829874030514, 'samples': 1239552, 'steps': 6455, 'loss/train': 2.5880677700042725} -11/06/2021 22:09:23 - INFO - __main__ - Step 6457: {'lr': 0.0004988824862560525, 'samples': 1239744, 'steps': 6456, 'loss/train': 4.904447078704834} -11/06/2021 22:09:24 - INFO - __main__ - Step 6458: {'lr': 0.0004988819849969109, 'samples': 1239936, 'steps': 6457, 'loss/train': 1.9330166578292847} -11/06/2021 22:09:25 - INFO - __main__ - Step 6459: {'lr': 0.0004988814836256269, 'samples': 1240128, 'steps': 6458, 'loss/train': 1.4734045267105103} -11/06/2021 22:09:25 - INFO - __main__ - Step 6460: {'lr': 0.0004988809821422008, 'samples': 1240320, 'steps': 6459, 'loss/train': 2.5002269744873047} -11/06/2021 22:09:25 - INFO - __main__ - Step 6461: {'lr': 0.0004988804805466327, 'samples': 1240512, 'steps': 6460, 'loss/train': 1.7648297548294067} -11/06/2021 22:09:26 - INFO - __main__ - Step 6462: {'lr': 0.000498879978838923, 'samples': 1240704, 'steps': 6461, 'loss/train': 2.2282261848449707} -11/06/2021 22:09:26 - INFO - __main__ - Step 6463: {'lr': 0.0004988794770190717, 'samples': 1240896, 'steps': 6462, 'loss/train': 2.106597661972046} -11/06/2021 22:09:27 - INFO - __main__ - Step 6464: {'lr': 0.0004988789750870792, 'samples': 1241088, 'steps': 6463, 'loss/train': 2.194019317626953} -11/06/2021 22:09:28 - INFO - __main__ - Step 6465: {'lr': 0.0004988784730429457, 'samples': 1241280, 'steps': 6464, 'loss/train': 2.4788918495178223} -11/06/2021 22:09:28 - INFO - __main__ - Step 6466: {'lr': 0.0004988779708866714, 'samples': 1241472, 'steps': 6465, 'loss/train': 2.1936397552490234} -11/06/2021 22:09:28 - INFO - __main__ - Step 6467: {'lr': 0.0004988774686182564, 'samples': 1241664, 'steps': 6466, 'loss/train': 1.6836004257202148} -11/06/2021 22:09:29 - INFO - __main__ - Step 6468: {'lr': 0.0004988769662377013, 'samples': 1241856, 'steps': 6467, 'loss/train': 2.2871172428131104} -11/06/2021 22:09:29 - INFO - __main__ - Step 6469: {'lr': 0.0004988764637450058, 'samples': 1242048, 'steps': 6468, 'loss/train': 2.1349170207977295} -11/06/2021 22:09:30 - INFO - __main__ - Step 6470: {'lr': 0.0004988759611401706, 'samples': 1242240, 'steps': 6469, 'loss/train': 2.350022315979004} -11/06/2021 22:09:30 - INFO - __main__ - Step 6471: {'lr': 0.0004988754584231957, 'samples': 1242432, 'steps': 6470, 'loss/train': 1.986899971961975} -11/06/2021 22:09:31 - INFO - __main__ - Step 6472: {'lr': 0.0004988749555940814, 'samples': 1242624, 'steps': 6471, 'loss/train': 1.6348545551300049} -11/06/2021 22:09:31 - INFO - __main__ - Step 6473: {'lr': 0.0004988744526528277, 'samples': 1242816, 'steps': 6472, 'loss/train': 2.23770809173584} -11/06/2021 22:09:31 - INFO - __main__ - Step 6474: {'lr': 0.0004988739495994352, 'samples': 1243008, 'steps': 6473, 'loss/train': 1.4470930099487305} -11/06/2021 22:09:32 - INFO - __main__ - Step 6475: {'lr': 0.0004988734464339038, 'samples': 1243200, 'steps': 6474, 'loss/train': 1.8867287635803223} -11/06/2021 22:09:33 - INFO - __main__ - Step 6476: {'lr': 0.0004988729431562339, 'samples': 1243392, 'steps': 6475, 'loss/train': 2.184319496154785} -11/06/2021 22:09:33 - INFO - __main__ - Step 6477: {'lr': 0.0004988724397664258, 'samples': 1243584, 'steps': 6476, 'loss/train': 2.0487940311431885} -11/06/2021 22:09:33 - INFO - __main__ - Step 6478: {'lr': 0.0004988719362644795, 'samples': 1243776, 'steps': 6477, 'loss/train': 2.7399888038635254} -11/06/2021 22:09:34 - INFO - __main__ - Step 6479: {'lr': 0.0004988714326503953, 'samples': 1243968, 'steps': 6478, 'loss/train': 1.4962778091430664} -11/06/2021 22:09:35 - INFO - __main__ - Step 6480: {'lr': 0.0004988709289241736, 'samples': 1244160, 'steps': 6479, 'loss/train': 2.1878020763397217} -11/06/2021 22:09:35 - INFO - __main__ - Step 6481: {'lr': 0.0004988704250858145, 'samples': 1244352, 'steps': 6480, 'loss/train': 1.851172685623169} -11/06/2021 22:09:36 - INFO - __main__ - Step 6482: {'lr': 0.0004988699211353182, 'samples': 1244544, 'steps': 6481, 'loss/train': 1.0221189260482788} -11/06/2021 22:09:36 - INFO - __main__ - Step 6483: {'lr': 0.000498869417072685, 'samples': 1244736, 'steps': 6482, 'loss/train': 1.667419672012329} -11/06/2021 22:09:36 - INFO - __main__ - Step 6484: {'lr': 0.000498868912897915, 'samples': 1244928, 'steps': 6483, 'loss/train': 1.5354762077331543} -11/06/2021 22:09:37 - INFO - __main__ - Step 6485: {'lr': 0.0004988684086110085, 'samples': 1245120, 'steps': 6484, 'loss/train': 1.7448598146438599} -11/06/2021 22:09:38 - INFO - __main__ - Step 6486: {'lr': 0.0004988679042119658, 'samples': 1245312, 'steps': 6485, 'loss/train': 1.7529888153076172} -11/06/2021 22:09:38 - INFO - __main__ - Step 6487: {'lr': 0.000498867399700787, 'samples': 1245504, 'steps': 6486, 'loss/train': 2.0920798778533936} -11/06/2021 22:09:38 - INFO - __main__ - Step 6488: {'lr': 0.0004988668950774724, 'samples': 1245696, 'steps': 6487, 'loss/train': 2.620828151702881} -11/06/2021 22:09:39 - INFO - __main__ - Step 6489: {'lr': 0.0004988663903420222, 'samples': 1245888, 'steps': 6488, 'loss/train': 2.216024398803711} -11/06/2021 22:09:39 - INFO - __main__ - Step 6490: {'lr': 0.0004988658854944367, 'samples': 1246080, 'steps': 6489, 'loss/train': 2.130100727081299} -11/06/2021 22:09:40 - INFO - __main__ - Step 6491: {'lr': 0.0004988653805347161, 'samples': 1246272, 'steps': 6490, 'loss/train': 1.8137882947921753} -11/06/2021 22:09:40 - INFO - __main__ - Step 6492: {'lr': 0.0004988648754628605, 'samples': 1246464, 'steps': 6491, 'loss/train': 1.7981539964675903} -11/06/2021 22:09:41 - INFO - __main__ - Step 6493: {'lr': 0.0004988643702788703, 'samples': 1246656, 'steps': 6492, 'loss/train': 2.0300815105438232} -11/06/2021 22:09:41 - INFO - __main__ - Step 6494: {'lr': 0.0004988638649827456, 'samples': 1246848, 'steps': 6493, 'loss/train': 2.65700101852417} -11/06/2021 22:09:41 - INFO - __main__ - Step 6495: {'lr': 0.0004988633595744867, 'samples': 1247040, 'steps': 6494, 'loss/train': 2.369478940963745} -11/06/2021 22:09:43 - INFO - __main__ - Step 6496: {'lr': 0.0004988628540540939, 'samples': 1247232, 'steps': 6495, 'loss/train': 1.5928741693496704} -11/06/2021 22:09:43 - INFO - __main__ - Step 6497: {'lr': 0.0004988623484215673, 'samples': 1247424, 'steps': 6496, 'loss/train': 0.6462783217430115} -11/06/2021 22:09:43 - INFO - __main__ - Step 6498: {'lr': 0.0004988618426769071, 'samples': 1247616, 'steps': 6497, 'loss/train': 1.936950922012329} -11/06/2021 22:09:44 - INFO - __main__ - Step 6499: {'lr': 0.0004988613368201135, 'samples': 1247808, 'steps': 6498, 'loss/train': 2.1868393421173096} -11/06/2021 22:09:44 - INFO - __main__ - Step 6500: {'lr': 0.0004988608308511871, 'samples': 1248000, 'steps': 6499, 'loss/train': 1.6641846895217896} -11/06/2021 22:09:45 - INFO - __main__ - Step 6501: {'lr': 0.0004988603247701276, 'samples': 1248192, 'steps': 6500, 'loss/train': 1.803402066230774} -11/06/2021 22:09:45 - INFO - __main__ - Step 6502: {'lr': 0.0004988598185769357, 'samples': 1248384, 'steps': 6501, 'loss/train': 2.2652242183685303} -11/06/2021 22:09:46 - INFO - __main__ - Step 6503: {'lr': 0.0004988593122716112, 'samples': 1248576, 'steps': 6502, 'loss/train': 1.5960944890975952} -11/06/2021 22:09:46 - INFO - __main__ - Step 6504: {'lr': 0.0004988588058541547, 'samples': 1248768, 'steps': 6503, 'loss/train': 1.9997038841247559} -11/06/2021 22:09:46 - INFO - __main__ - Step 6505: {'lr': 0.0004988582993245661, 'samples': 1248960, 'steps': 6504, 'loss/train': 2.119647264480591} -11/06/2021 22:09:47 - INFO - __main__ - Step 6506: {'lr': 0.0004988577926828459, 'samples': 1249152, 'steps': 6505, 'loss/train': 1.9104197025299072} -11/06/2021 22:09:48 - INFO - __main__ - Step 6507: {'lr': 0.0004988572859289941, 'samples': 1249344, 'steps': 6506, 'loss/train': 0.5368994474411011} -11/06/2021 22:09:48 - INFO - __main__ - Step 6508: {'lr': 0.0004988567790630111, 'samples': 1249536, 'steps': 6507, 'loss/train': 1.2611361742019653} -11/06/2021 22:09:48 - INFO - __main__ - Step 6509: {'lr': 0.0004988562720848973, 'samples': 1249728, 'steps': 6508, 'loss/train': 2.310293674468994} -11/06/2021 22:09:49 - INFO - __main__ - Step 6510: {'lr': 0.0004988557649946525, 'samples': 1249920, 'steps': 6509, 'loss/train': 1.3652870655059814} -11/06/2021 22:09:50 - INFO - __main__ - Step 6511: {'lr': 0.000498855257792277, 'samples': 1250112, 'steps': 6510, 'loss/train': 2.2352139949798584} -11/06/2021 22:09:50 - INFO - __main__ - Step 6512: {'lr': 0.0004988547504777714, 'samples': 1250304, 'steps': 6511, 'loss/train': 1.4359506368637085} -11/06/2021 22:09:50 - INFO - __main__ - Step 6513: {'lr': 0.0004988542430511356, 'samples': 1250496, 'steps': 6512, 'loss/train': 2.3191769123077393} -11/06/2021 22:09:51 - INFO - __main__ - Step 6514: {'lr': 0.0004988537355123699, 'samples': 1250688, 'steps': 6513, 'loss/train': 2.3833720684051514} -11/06/2021 22:09:51 - INFO - __main__ - Step 6515: {'lr': 0.0004988532278614745, 'samples': 1250880, 'steps': 6514, 'loss/train': 1.4373453855514526} -11/06/2021 22:09:52 - INFO - __main__ - Step 6516: {'lr': 0.0004988527200984498, 'samples': 1251072, 'steps': 6515, 'loss/train': 1.5178534984588623} -11/06/2021 22:09:52 - INFO - __main__ - Step 6517: {'lr': 0.0004988522122232958, 'samples': 1251264, 'steps': 6516, 'loss/train': 1.9620566368103027} -11/06/2021 22:09:53 - INFO - __main__ - Step 6518: {'lr': 0.0004988517042360128, 'samples': 1251456, 'steps': 6517, 'loss/train': 1.9547860622406006} -11/06/2021 22:09:53 - INFO - __main__ - Step 6519: {'lr': 0.0004988511961366012, 'samples': 1251648, 'steps': 6518, 'loss/train': 5.9194560050964355} -11/06/2021 22:09:54 - INFO - __main__ - Step 6520: {'lr': 0.000498850687925061, 'samples': 1251840, 'steps': 6519, 'loss/train': 2.1525418758392334} -11/06/2021 22:09:54 - INFO - __main__ - Step 6521: {'lr': 0.0004988501796013926, 'samples': 1252032, 'steps': 6520, 'loss/train': 1.9909714460372925} -11/06/2021 22:09:55 - INFO - __main__ - Step 6522: {'lr': 0.0004988496711655961, 'samples': 1252224, 'steps': 6521, 'loss/train': 1.5848283767700195} -11/06/2021 22:09:55 - INFO - __main__ - Step 6523: {'lr': 0.0004988491626176718, 'samples': 1252416, 'steps': 6522, 'loss/train': 1.9467501640319824} -11/06/2021 22:09:56 - INFO - __main__ - Step 6524: {'lr': 0.0004988486539576198, 'samples': 1252608, 'steps': 6523, 'loss/train': 2.0624489784240723} -11/06/2021 22:09:56 - INFO - __main__ - Step 6525: {'lr': 0.0004988481451854406, 'samples': 1252800, 'steps': 6524, 'loss/train': 1.9637494087219238} -11/06/2021 22:09:56 - INFO - __main__ - Step 6526: {'lr': 0.0004988476363011341, 'samples': 1252992, 'steps': 6525, 'loss/train': 2.017069101333618} -11/06/2021 22:09:57 - INFO - __main__ - Step 6527: {'lr': 0.0004988471273047008, 'samples': 1253184, 'steps': 6526, 'loss/train': 1.8356379270553589} -11/06/2021 22:09:58 - INFO - __main__ - Step 6528: {'lr': 0.0004988466181961408, 'samples': 1253376, 'steps': 6527, 'loss/train': 1.6690013408660889} -11/06/2021 22:09:58 - INFO - __main__ - Step 6529: {'lr': 0.0004988461089754544, 'samples': 1253568, 'steps': 6528, 'loss/train': 1.86026930809021} -11/06/2021 22:09:58 - INFO - __main__ - Step 6530: {'lr': 0.0004988455996426418, 'samples': 1253760, 'steps': 6529, 'loss/train': 1.9897722005844116} -11/06/2021 22:09:59 - INFO - __main__ - Step 6531: {'lr': 0.0004988450901977031, 'samples': 1253952, 'steps': 6530, 'loss/train': 2.079590082168579} -11/06/2021 22:10:00 - INFO - __main__ - Step 6532: {'lr': 0.0004988445806406387, 'samples': 1254144, 'steps': 6531, 'loss/train': 3.077930212020874} -11/06/2021 22:10:00 - INFO - __main__ - Step 6533: {'lr': 0.0004988440709714487, 'samples': 1254336, 'steps': 6532, 'loss/train': 2.232908010482788} -11/06/2021 22:10:01 - INFO - __main__ - Step 6534: {'lr': 0.0004988435611901335, 'samples': 1254528, 'steps': 6533, 'loss/train': 1.569143533706665} -11/06/2021 22:10:01 - INFO - __main__ - Step 6535: {'lr': 0.0004988430512966932, 'samples': 1254720, 'steps': 6534, 'loss/train': 2.3683085441589355} -11/06/2021 22:10:01 - INFO - __main__ - Step 6536: {'lr': 0.000498842541291128, 'samples': 1254912, 'steps': 6535, 'loss/train': 1.7087137699127197} -11/06/2021 22:10:02 - INFO - __main__ - Step 6537: {'lr': 0.0004988420311734383, 'samples': 1255104, 'steps': 6536, 'loss/train': 2.1297061443328857} -11/06/2021 22:10:03 - INFO - __main__ - Step 6538: {'lr': 0.0004988415209436243, 'samples': 1255296, 'steps': 6537, 'loss/train': 1.857115387916565} -11/06/2021 22:10:03 - INFO - __main__ - Step 6539: {'lr': 0.000498841010601686, 'samples': 1255488, 'steps': 6538, 'loss/train': 2.037982225418091} -11/06/2021 22:10:03 - INFO - __main__ - Step 6540: {'lr': 0.0004988405001476237, 'samples': 1255680, 'steps': 6539, 'loss/train': 2.1346702575683594} -11/06/2021 22:10:04 - INFO - __main__ - Step 6541: {'lr': 0.0004988399895814378, 'samples': 1255872, 'steps': 6540, 'loss/train': 1.6024067401885986} -11/06/2021 22:10:05 - INFO - __main__ - Step 6542: {'lr': 0.0004988394789031286, 'samples': 1256064, 'steps': 6541, 'loss/train': 2.4668922424316406} -11/06/2021 22:10:05 - INFO - __main__ - Step 6543: {'lr': 0.000498838968112696, 'samples': 1256256, 'steps': 6542, 'loss/train': 1.6090011596679688} -11/06/2021 22:10:05 - INFO - __main__ - Step 6544: {'lr': 0.0004988384572101403, 'samples': 1256448, 'steps': 6543, 'loss/train': 1.8808883428573608} -11/06/2021 22:10:06 - INFO - __main__ - Step 6545: {'lr': 0.000498837946195462, 'samples': 1256640, 'steps': 6544, 'loss/train': 1.728848934173584} -11/06/2021 22:10:06 - INFO - __main__ - Step 6546: {'lr': 0.0004988374350686611, 'samples': 1256832, 'steps': 6545, 'loss/train': 1.9686365127563477} -11/06/2021 22:10:07 - INFO - __main__ - Step 6547: {'lr': 0.000498836923829738, 'samples': 1257024, 'steps': 6546, 'loss/train': 1.8499354124069214} -11/06/2021 22:10:07 - INFO - __main__ - Step 6548: {'lr': 0.0004988364124786927, 'samples': 1257216, 'steps': 6547, 'loss/train': 1.4615224599838257} -11/06/2021 22:10:08 - INFO - __main__ - Step 6549: {'lr': 0.0004988359010155255, 'samples': 1257408, 'steps': 6548, 'loss/train': 1.7403419017791748} -11/06/2021 22:10:08 - INFO - __main__ - Step 6550: {'lr': 0.0004988353894402368, 'samples': 1257600, 'steps': 6549, 'loss/train': 1.965841293334961} -11/06/2021 22:10:09 - INFO - __main__ - Step 6551: {'lr': 0.0004988348777528267, 'samples': 1257792, 'steps': 6550, 'loss/train': 2.171156883239746} -11/06/2021 22:10:09 - INFO - __main__ - Step 6552: {'lr': 0.0004988343659532954, 'samples': 1257984, 'steps': 6551, 'loss/train': 2.217395782470703} -11/06/2021 22:10:10 - INFO - __main__ - Step 6553: {'lr': 0.0004988338540416432, 'samples': 1258176, 'steps': 6552, 'loss/train': 2.0271527767181396} -11/06/2021 22:10:10 - INFO - __main__ - Step 6554: {'lr': 0.0004988333420178704, 'samples': 1258368, 'steps': 6553, 'loss/train': 1.7768346071243286} -11/06/2021 22:10:11 - INFO - __main__ - Step 6555: {'lr': 0.000498832829881977, 'samples': 1258560, 'steps': 6554, 'loss/train': 2.1017751693725586} -11/06/2021 22:10:11 - INFO - __main__ - Step 6556: {'lr': 0.0004988323176339633, 'samples': 1258752, 'steps': 6555, 'loss/train': 1.467564582824707} -11/06/2021 22:10:11 - INFO - __main__ - Step 6557: {'lr': 0.0004988318052738298, 'samples': 1258944, 'steps': 6556, 'loss/train': 1.9192558526992798} -11/06/2021 22:10:12 - INFO - __main__ - Step 6558: {'lr': 0.0004988312928015763, 'samples': 1259136, 'steps': 6557, 'loss/train': 1.927575945854187} -11/06/2021 22:10:13 - INFO - __main__ - Step 6559: {'lr': 0.0004988307802172035, 'samples': 1259328, 'steps': 6558, 'loss/train': 2.1528429985046387} -11/06/2021 22:10:13 - INFO - __main__ - Step 6560: {'lr': 0.0004988302675207112, 'samples': 1259520, 'steps': 6559, 'loss/train': 2.317401170730591} -11/06/2021 22:10:13 - INFO - __main__ - Step 6561: {'lr': 0.0004988297547121, 'samples': 1259712, 'steps': 6560, 'loss/train': 1.843315839767456} -11/06/2021 22:10:14 - INFO - __main__ - Step 6562: {'lr': 0.0004988292417913698, 'samples': 1259904, 'steps': 6561, 'loss/train': 2.109565019607544} -11/06/2021 22:10:15 - INFO - __main__ - Step 6563: {'lr': 0.0004988287287585211, 'samples': 1260096, 'steps': 6562, 'loss/train': 0.9284586906433105} -11/06/2021 22:10:15 - INFO - __main__ - Step 6564: {'lr': 0.0004988282156135539, 'samples': 1260288, 'steps': 6563, 'loss/train': 1.7303180694580078} -11/06/2021 22:10:15 - INFO - __main__ - Step 6565: {'lr': 0.0004988277023564685, 'samples': 1260480, 'steps': 6564, 'loss/train': 2.28778338432312} -11/06/2021 22:10:16 - INFO - __main__ - Step 6566: {'lr': 0.0004988271889872654, 'samples': 1260672, 'steps': 6565, 'loss/train': 2.138411045074463} -11/06/2021 22:10:16 - INFO - __main__ - Step 6567: {'lr': 0.0004988266755059444, 'samples': 1260864, 'steps': 6566, 'loss/train': 2.42995023727417} -11/06/2021 22:10:17 - INFO - __main__ - Step 6568: {'lr': 0.000498826161912506, 'samples': 1261056, 'steps': 6567, 'loss/train': 1.8563683032989502} -11/06/2021 22:10:17 - INFO - __main__ - Step 6569: {'lr': 0.0004988256482069505, 'samples': 1261248, 'steps': 6568, 'loss/train': 1.7521291971206665} -11/06/2021 22:10:18 - INFO - __main__ - Step 6570: {'lr': 0.0004988251343892779, 'samples': 1261440, 'steps': 6569, 'loss/train': 1.6020236015319824} -11/06/2021 22:10:18 - INFO - __main__ - Step 6571: {'lr': 0.0004988246204594885, 'samples': 1261632, 'steps': 6570, 'loss/train': 1.995780348777771} -11/06/2021 22:10:18 - INFO - __main__ - Step 6572: {'lr': 0.0004988241064175826, 'samples': 1261824, 'steps': 6571, 'loss/train': 2.2202649116516113} -11/06/2021 22:10:19 - INFO - __main__ - Step 6573: {'lr': 0.0004988235922635604, 'samples': 1262016, 'steps': 6572, 'loss/train': 2.3514225482940674} -11/06/2021 22:10:20 - INFO - __main__ - Step 6574: {'lr': 0.0004988230779974221, 'samples': 1262208, 'steps': 6573, 'loss/train': 1.9057080745697021} -11/06/2021 22:10:20 - INFO - __main__ - Step 6575: {'lr': 0.000498822563619168, 'samples': 1262400, 'steps': 6574, 'loss/train': 1.9137215614318848} -11/06/2021 22:10:21 - INFO - __main__ - Step 6576: {'lr': 0.0004988220491287983, 'samples': 1262592, 'steps': 6575, 'loss/train': 1.931260108947754} -11/06/2021 22:10:21 - INFO - __main__ - Step 6577: {'lr': 0.0004988215345263132, 'samples': 1262784, 'steps': 6576, 'loss/train': 1.774949550628662} -11/06/2021 22:10:21 - INFO - __main__ - Step 6578: {'lr': 0.0004988210198117129, 'samples': 1262976, 'steps': 6577, 'loss/train': 1.8798142671585083} -11/06/2021 22:10:22 - INFO - __main__ - Step 6579: {'lr': 0.0004988205049849978, 'samples': 1263168, 'steps': 6578, 'loss/train': 2.2597692012786865} -11/06/2021 22:10:23 - INFO - __main__ - Step 6580: {'lr': 0.0004988199900461679, 'samples': 1263360, 'steps': 6579, 'loss/train': 2.158470869064331} -11/06/2021 22:10:23 - INFO - __main__ - Step 6581: {'lr': 0.0004988194749952237, 'samples': 1263552, 'steps': 6580, 'loss/train': 1.9333513975143433} -11/06/2021 22:10:23 - INFO - __main__ - Step 6582: {'lr': 0.0004988189598321652, 'samples': 1263744, 'steps': 6581, 'loss/train': 2.1383774280548096} -11/06/2021 22:10:24 - INFO - __main__ - Step 6583: {'lr': 0.0004988184445569926, 'samples': 1263936, 'steps': 6582, 'loss/train': 2.0251195430755615} -11/06/2021 22:10:25 - INFO - __main__ - Step 6584: {'lr': 0.0004988179291697064, 'samples': 1264128, 'steps': 6583, 'loss/train': 1.354901671409607} -11/06/2021 22:10:25 - INFO - __main__ - Step 6585: {'lr': 0.0004988174136703066, 'samples': 1264320, 'steps': 6584, 'loss/train': 1.922788381576538} -11/06/2021 22:10:25 - INFO - __main__ - Step 6586: {'lr': 0.0004988168980587936, 'samples': 1264512, 'steps': 6585, 'loss/train': 1.8145787715911865} -11/06/2021 22:10:26 - INFO - __main__ - Step 6587: {'lr': 0.0004988163823351676, 'samples': 1264704, 'steps': 6586, 'loss/train': 1.9621999263763428} -11/06/2021 22:10:26 - INFO - __main__ - Step 6588: {'lr': 0.0004988158664994286, 'samples': 1264896, 'steps': 6587, 'loss/train': 1.8063040971755981} -11/06/2021 22:10:27 - INFO - __main__ - Step 6589: {'lr': 0.0004988153505515771, 'samples': 1265088, 'steps': 6588, 'loss/train': 2.8506147861480713} -11/06/2021 22:10:28 - INFO - __main__ - Step 6590: {'lr': 0.0004988148344916133, 'samples': 1265280, 'steps': 6589, 'loss/train': 1.649754524230957} -11/06/2021 22:10:28 - INFO - __main__ - Step 6591: {'lr': 0.0004988143183195373, 'samples': 1265472, 'steps': 6590, 'loss/train': 1.709517478942871} -11/06/2021 22:10:28 - INFO - __main__ - Step 6592: {'lr': 0.0004988138020353493, 'samples': 1265664, 'steps': 6591, 'loss/train': 1.7125308513641357} -11/06/2021 22:10:29 - INFO - __main__ - Step 6593: {'lr': 0.0004988132856390498, 'samples': 1265856, 'steps': 6592, 'loss/train': 1.3303931951522827} -11/06/2021 22:10:30 - INFO - __main__ - Step 6594: {'lr': 0.0004988127691306388, 'samples': 1266048, 'steps': 6593, 'loss/train': 2.029025077819824} -11/06/2021 22:10:30 - INFO - __main__ - Step 6595: {'lr': 0.0004988122525101166, 'samples': 1266240, 'steps': 6594, 'loss/train': 1.7039332389831543} -11/06/2021 22:10:30 - INFO - __main__ - Step 6596: {'lr': 0.0004988117357774835, 'samples': 1266432, 'steps': 6595, 'loss/train': 2.2546744346618652} -11/06/2021 22:10:31 - INFO - __main__ - Step 6597: {'lr': 0.0004988112189327397, 'samples': 1266624, 'steps': 6596, 'loss/train': 2.0449981689453125} -11/06/2021 22:10:31 - INFO - __main__ - Step 6598: {'lr': 0.0004988107019758853, 'samples': 1266816, 'steps': 6597, 'loss/train': 1.963868260383606} -11/06/2021 22:10:31 - INFO - __main__ - Step 6599: {'lr': 0.0004988101849069208, 'samples': 1267008, 'steps': 6598, 'loss/train': 1.7069015502929688} -11/06/2021 22:10:32 - INFO - __main__ - Step 6600: {'lr': 0.0004988096677258461, 'samples': 1267200, 'steps': 6599, 'loss/train': 2.1868088245391846} -11/06/2021 22:10:33 - INFO - __main__ - Step 6601: {'lr': 0.0004988091504326616, 'samples': 1267392, 'steps': 6600, 'loss/train': 1.8266377449035645} -11/06/2021 22:10:33 - INFO - __main__ - Step 6602: {'lr': 0.0004988086330273676, 'samples': 1267584, 'steps': 6601, 'loss/train': 1.2428114414215088} -11/06/2021 22:10:34 - INFO - __main__ - Step 6603: {'lr': 0.0004988081155099643, 'samples': 1267776, 'steps': 6602, 'loss/train': 1.4701017141342163} -11/06/2021 22:10:34 - INFO - __main__ - Step 6604: {'lr': 0.0004988075978804518, 'samples': 1267968, 'steps': 6603, 'loss/train': 1.7105156183242798} -11/06/2021 22:10:35 - INFO - __main__ - Step 6605: {'lr': 0.0004988070801388306, 'samples': 1268160, 'steps': 6604, 'loss/train': 0.2404092252254486} -11/06/2021 22:10:35 - INFO - __main__ - Step 6606: {'lr': 0.0004988065622851006, 'samples': 1268352, 'steps': 6605, 'loss/train': 1.55886709690094} -11/06/2021 22:10:36 - INFO - __main__ - Step 6607: {'lr': 0.0004988060443192623, 'samples': 1268544, 'steps': 6606, 'loss/train': 1.470017671585083} -11/06/2021 22:10:36 - INFO - __main__ - Step 6608: {'lr': 0.0004988055262413158, 'samples': 1268736, 'steps': 6607, 'loss/train': 1.6374818086624146} -11/06/2021 22:10:36 - INFO - __main__ - Step 6609: {'lr': 0.0004988050080512614, 'samples': 1268928, 'steps': 6608, 'loss/train': 1.785929799079895} -11/06/2021 22:10:37 - INFO - __main__ - Step 6610: {'lr': 0.0004988044897490993, 'samples': 1269120, 'steps': 6609, 'loss/train': 1.8489357233047485} -11/06/2021 22:10:38 - INFO - __main__ - Step 6611: {'lr': 0.0004988039713348297, 'samples': 1269312, 'steps': 6610, 'loss/train': 2.0114858150482178} -11/06/2021 22:10:38 - INFO - __main__ - Step 6612: {'lr': 0.0004988034528084529, 'samples': 1269504, 'steps': 6611, 'loss/train': 1.6072686910629272} -11/06/2021 22:10:38 - INFO - __main__ - Step 6613: {'lr': 0.000498802934169969, 'samples': 1269696, 'steps': 6612, 'loss/train': 2.4517900943756104} -11/06/2021 22:10:39 - INFO - __main__ - Step 6614: {'lr': 0.0004988024154193785, 'samples': 1269888, 'steps': 6613, 'loss/train': 2.244598627090454} -11/06/2021 22:10:40 - INFO - __main__ - Step 6615: {'lr': 0.0004988018965566814, 'samples': 1270080, 'steps': 6614, 'loss/train': 1.5164146423339844} -11/06/2021 22:10:40 - INFO - __main__ - Step 6616: {'lr': 0.000498801377581878, 'samples': 1270272, 'steps': 6615, 'loss/train': 1.9338390827178955} -11/06/2021 22:10:40 - INFO - __main__ - Step 6617: {'lr': 0.0004988008584949686, 'samples': 1270464, 'steps': 6616, 'loss/train': 0.2597677409648895} -11/06/2021 22:10:41 - INFO - __main__ - Step 6618: {'lr': 0.0004988003392959533, 'samples': 1270656, 'steps': 6617, 'loss/train': 2.182772397994995} -11/06/2021 22:10:41 - INFO - __main__ - Step 6619: {'lr': 0.0004987998199848324, 'samples': 1270848, 'steps': 6618, 'loss/train': 1.4753804206848145} -11/06/2021 22:10:42 - INFO - __main__ - Step 6620: {'lr': 0.0004987993005616061, 'samples': 1271040, 'steps': 6619, 'loss/train': 1.8077441453933716} -11/06/2021 22:10:43 - INFO - __main__ - Step 6621: {'lr': 0.0004987987810262747, 'samples': 1271232, 'steps': 6620, 'loss/train': 0.7256439328193665} -11/06/2021 22:10:43 - INFO - __main__ - Step 6622: {'lr': 0.0004987982613788384, 'samples': 1271424, 'steps': 6621, 'loss/train': 1.808817744255066} -11/06/2021 22:10:43 - INFO - __main__ - Step 6623: {'lr': 0.0004987977416192976, 'samples': 1271616, 'steps': 6622, 'loss/train': 2.2159342765808105} -11/06/2021 22:10:44 - INFO - __main__ - Step 6624: {'lr': 0.0004987972217476523, 'samples': 1271808, 'steps': 6623, 'loss/train': 2.1314337253570557} -11/06/2021 22:10:45 - INFO - __main__ - Step 6625: {'lr': 0.0004987967017639027, 'samples': 1272000, 'steps': 6624, 'loss/train': 1.8644086122512817} -11/06/2021 22:10:45 - INFO - __main__ - Step 6626: {'lr': 0.0004987961816680492, 'samples': 1272192, 'steps': 6625, 'loss/train': 1.5684220790863037} -11/06/2021 22:10:45 - INFO - __main__ - Step 6627: {'lr': 0.000498795661460092, 'samples': 1272384, 'steps': 6626, 'loss/train': 2.122796058654785} -11/06/2021 22:10:46 - INFO - __main__ - Step 6628: {'lr': 0.0004987951411400313, 'samples': 1272576, 'steps': 6627, 'loss/train': 1.8228185176849365} -11/06/2021 22:10:46 - INFO - __main__ - Step 6629: {'lr': 0.0004987946207078674, 'samples': 1272768, 'steps': 6628, 'loss/train': 1.77996826171875} -11/06/2021 22:10:47 - INFO - __main__ - Step 6630: {'lr': 0.0004987941001636004, 'samples': 1272960, 'steps': 6629, 'loss/train': 2.308150291442871} -11/06/2021 22:10:47 - INFO - __main__ - Step 6631: {'lr': 0.0004987935795072307, 'samples': 1273152, 'steps': 6630, 'loss/train': 1.8831443786621094} -11/06/2021 22:10:48 - INFO - __main__ - Step 6632: {'lr': 0.0004987930587387584, 'samples': 1273344, 'steps': 6631, 'loss/train': 2.2510716915130615} -11/06/2021 22:10:48 - INFO - __main__ - Step 6633: {'lr': 0.0004987925378581838, 'samples': 1273536, 'steps': 6632, 'loss/train': 1.590349793434143} -11/06/2021 22:10:48 - INFO - __main__ - Step 6634: {'lr': 0.0004987920168655071, 'samples': 1273728, 'steps': 6633, 'loss/train': 1.4046695232391357} -11/06/2021 22:10:49 - INFO - __main__ - Step 6635: {'lr': 0.0004987914957607286, 'samples': 1273920, 'steps': 6634, 'loss/train': 2.134047746658325} -11/06/2021 22:10:50 - INFO - __main__ - Step 6636: {'lr': 0.0004987909745438484, 'samples': 1274112, 'steps': 6635, 'loss/train': 1.8218518495559692} -11/06/2021 22:10:50 - INFO - __main__ - Step 6637: {'lr': 0.000498790453214867, 'samples': 1274304, 'steps': 6636, 'loss/train': 2.182149648666382} -11/06/2021 22:10:51 - INFO - __main__ - Step 6638: {'lr': 0.0004987899317737843, 'samples': 1274496, 'steps': 6637, 'loss/train': 2.091320753097534} -11/06/2021 22:10:51 - INFO - __main__ - Step 6639: {'lr': 0.0004987894102206008, 'samples': 1274688, 'steps': 6638, 'loss/train': 1.5049811601638794} -11/06/2021 22:10:51 - INFO - __main__ - Step 6640: {'lr': 0.0004987888885553166, 'samples': 1274880, 'steps': 6639, 'loss/train': 2.0964086055755615} -11/06/2021 22:10:52 - INFO - __main__ - Step 6641: {'lr': 0.0004987883667779319, 'samples': 1275072, 'steps': 6640, 'loss/train': 0.3089179992675781} -11/06/2021 22:10:53 - INFO - __main__ - Step 6642: {'lr': 0.0004987878448884471, 'samples': 1275264, 'steps': 6641, 'loss/train': 1.5907493829727173} -11/06/2021 22:10:53 - INFO - __main__ - Step 6643: {'lr': 0.0004987873228868622, 'samples': 1275456, 'steps': 6642, 'loss/train': 1.9820168018341064} -11/06/2021 22:10:53 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 1.0979185104370117} -11/06/2021 22:10:54 - INFO - __main__ - Step 6645: {'lr': 0.0004987862785473937, 'samples': 1275840, 'steps': 6644, 'loss/train': 1.9548885822296143} -11/06/2021 22:10:55 - INFO - __main__ - Step 6646: {'lr': 0.0004987857562095103, 'samples': 1276032, 'steps': 6645, 'loss/train': 1.8669013977050781} -11/06/2021 22:10:55 - INFO - __main__ - Step 6647: {'lr': 0.0004987852337595281, 'samples': 1276224, 'steps': 6646, 'loss/train': 1.6619402170181274} -11/06/2021 22:10:55 - INFO - __main__ - Step 6648: {'lr': 0.0004987847111974469, 'samples': 1276416, 'steps': 6647, 'loss/train': 1.4700028896331787} -11/06/2021 22:10:56 - INFO - __main__ - Step 6649: {'lr': 0.0004987841885232674, 'samples': 1276608, 'steps': 6648, 'loss/train': 1.8722918033599854} -11/06/2021 22:10:56 - INFO - __main__ - Step 6650: {'lr': 0.0004987836657369893, 'samples': 1276800, 'steps': 6649, 'loss/train': 2.425621271133423} -11/06/2021 22:10:57 - INFO - __main__ - Step 6651: {'lr': 0.0004987831428386133, 'samples': 1276992, 'steps': 6650, 'loss/train': 1.4940102100372314} -11/06/2021 22:10:58 - INFO - __main__ - Step 6652: {'lr': 0.0004987826198281394, 'samples': 1277184, 'steps': 6651, 'loss/train': 1.6286990642547607} -11/06/2021 22:10:58 - INFO - __main__ - Step 6653: {'lr': 0.0004987820967055678, 'samples': 1277376, 'steps': 6652, 'loss/train': 1.9754180908203125} -11/06/2021 22:10:58 - INFO - __main__ - Step 6654: {'lr': 0.000498781573470899, 'samples': 1277568, 'steps': 6653, 'loss/train': 2.209815502166748} -11/06/2021 22:10:59 - INFO - __main__ - Step 6655: {'lr': 0.000498781050124133, 'samples': 1277760, 'steps': 6654, 'loss/train': 2.132535934448242} -11/06/2021 22:11:00 - INFO - __main__ - Step 6656: {'lr': 0.0004987805266652701, 'samples': 1277952, 'steps': 6655, 'loss/train': 1.9133520126342773} -11/06/2021 22:11:00 - INFO - __main__ - Step 6657: {'lr': 0.0004987800030943105, 'samples': 1278144, 'steps': 6656, 'loss/train': 1.6376458406448364} -11/06/2021 22:11:00 - INFO - __main__ - Step 6658: {'lr': 0.0004987794794112545, 'samples': 1278336, 'steps': 6657, 'loss/train': 1.9937931299209595} -11/06/2021 22:11:01 - INFO - __main__ - Step 6659: {'lr': 0.0004987789556161022, 'samples': 1278528, 'steps': 6658, 'loss/train': 0.2782423198223114} -11/06/2021 22:11:01 - INFO - __main__ - Step 6660: {'lr': 0.0004987784317088541, 'samples': 1278720, 'steps': 6659, 'loss/train': 1.6906732320785522} -11/06/2021 22:11:02 - INFO - __main__ - Step 6661: {'lr': 0.0004987779076895102, 'samples': 1278912, 'steps': 6660, 'loss/train': 2.3083863258361816} -11/06/2021 22:11:03 - INFO - __main__ - Step 6662: {'lr': 0.0004987773835580708, 'samples': 1279104, 'steps': 6661, 'loss/train': 1.6070939302444458} -11/06/2021 22:11:03 - INFO - __main__ - Step 6663: {'lr': 0.0004987768593145362, 'samples': 1279296, 'steps': 6662, 'loss/train': 1.7183184623718262} -11/06/2021 22:11:03 - INFO - __main__ - Step 6664: {'lr': 0.0004987763349589065, 'samples': 1279488, 'steps': 6663, 'loss/train': 1.628963828086853} -11/06/2021 22:11:04 - INFO - __main__ - Step 6665: {'lr': 0.0004987758104911821, 'samples': 1279680, 'steps': 6664, 'loss/train': 1.9477825164794922} -11/06/2021 22:11:05 - INFO - __main__ - Step 6666: {'lr': 0.0004987752859113631, 'samples': 1279872, 'steps': 6665, 'loss/train': 1.3619539737701416} -11/06/2021 22:11:05 - INFO - __main__ - Step 6667: {'lr': 0.0004987747612194499, 'samples': 1280064, 'steps': 6666, 'loss/train': 1.2572715282440186} -11/06/2021 22:11:05 - INFO - __main__ - Step 6668: {'lr': 0.0004987742364154425, 'samples': 1280256, 'steps': 6667, 'loss/train': 2.365995407104492} -11/06/2021 22:11:06 - INFO - __main__ - Step 6669: {'lr': 0.0004987737114993413, 'samples': 1280448, 'steps': 6668, 'loss/train': 1.940123438835144} -11/06/2021 22:11:06 - INFO - __main__ - Step 6670: {'lr': 0.0004987731864711466, 'samples': 1280640, 'steps': 6669, 'loss/train': 1.1229156255722046} -11/06/2021 22:11:07 - INFO - __main__ - Step 6671: {'lr': 0.0004987726613308584, 'samples': 1280832, 'steps': 6670, 'loss/train': 1.7459203004837036} -11/06/2021 22:11:07 - INFO - __main__ - Step 6672: {'lr': 0.0004987721360784772, 'samples': 1281024, 'steps': 6671, 'loss/train': 1.6915955543518066} -11/06/2021 22:11:08 - INFO - __main__ - Step 6673: {'lr': 0.0004987716107140031, 'samples': 1281216, 'steps': 6672, 'loss/train': 2.0414986610412598} -11/06/2021 22:11:08 - INFO - __main__ - Step 6674: {'lr': 0.0004987710852374363, 'samples': 1281408, 'steps': 6673, 'loss/train': 2.4011054039001465} -11/06/2021 22:11:08 - INFO - __main__ - Step 6675: {'lr': 0.0004987705596487771, 'samples': 1281600, 'steps': 6674, 'loss/train': 1.3550761938095093} -11/06/2021 22:11:09 - INFO - __main__ - Step 6676: {'lr': 0.0004987700339480258, 'samples': 1281792, 'steps': 6675, 'loss/train': 1.6839749813079834} -11/06/2021 22:11:10 - INFO - __main__ - Step 6677: {'lr': 0.0004987695081351824, 'samples': 1281984, 'steps': 6676, 'loss/train': 2.2747011184692383} -11/06/2021 22:11:10 - INFO - __main__ - Step 6678: {'lr': 0.0004987689822102474, 'samples': 1282176, 'steps': 6677, 'loss/train': 1.934715747833252} -11/06/2021 22:11:10 - INFO - __main__ - Step 6679: {'lr': 0.000498768456173221, 'samples': 1282368, 'steps': 6678, 'loss/train': 1.7885398864746094} -11/06/2021 22:11:11 - INFO - __main__ - Step 6680: {'lr': 0.0004987679300241033, 'samples': 1282560, 'steps': 6679, 'loss/train': 1.533270239830017} -11/06/2021 22:11:11 - INFO - __main__ - Step 6681: {'lr': 0.0004987674037628945, 'samples': 1282752, 'steps': 6680, 'loss/train': 1.9293286800384521} -11/06/2021 22:11:12 - INFO - __main__ - Step 6682: {'lr': 0.0004987668773895951, 'samples': 1282944, 'steps': 6681, 'loss/train': 1.8046060800552368} -11/06/2021 22:11:13 - INFO - __main__ - Step 6683: {'lr': 0.0004987663509042052, 'samples': 1283136, 'steps': 6682, 'loss/train': 1.674709677696228} -11/06/2021 22:11:13 - INFO - __main__ - Step 6684: {'lr': 0.000498765824306725, 'samples': 1283328, 'steps': 6683, 'loss/train': 1.765952467918396} -11/06/2021 22:11:13 - INFO - __main__ - Step 6685: {'lr': 0.0004987652975971546, 'samples': 1283520, 'steps': 6684, 'loss/train': 2.027494192123413} -11/06/2021 22:11:14 - INFO - __main__ - Step 6686: {'lr': 0.0004987647707754945, 'samples': 1283712, 'steps': 6685, 'loss/train': 1.870924949645996} -11/06/2021 22:11:15 - INFO - __main__ - Step 6687: {'lr': 0.0004987642438417449, 'samples': 1283904, 'steps': 6686, 'loss/train': 1.476467490196228} -11/06/2021 22:11:15 - INFO - __main__ - Step 6688: {'lr': 0.0004987637167959059, 'samples': 1284096, 'steps': 6687, 'loss/train': 2.0917282104492188} -11/06/2021 22:11:15 - INFO - __main__ - Step 6689: {'lr': 0.0004987631896379779, 'samples': 1284288, 'steps': 6688, 'loss/train': 1.4638168811798096} -11/06/2021 22:11:16 - INFO - __main__ - Step 6690: {'lr': 0.0004987626623679609, 'samples': 1284480, 'steps': 6689, 'loss/train': 1.3137454986572266} -11/06/2021 22:11:16 - INFO - __main__ - Step 6691: {'lr': 0.0004987621349858553, 'samples': 1284672, 'steps': 6690, 'loss/train': 2.255805015563965} -11/06/2021 22:11:17 - INFO - __main__ - Step 6692: {'lr': 0.0004987616074916615, 'samples': 1284864, 'steps': 6691, 'loss/train': 1.9453632831573486} -11/06/2021 22:11:18 - INFO - __main__ - Step 6693: {'lr': 0.0004987610798853794, 'samples': 1285056, 'steps': 6692, 'loss/train': 1.9508827924728394} -11/06/2021 22:11:18 - INFO - __main__ - Step 6694: {'lr': 0.0004987605521670094, 'samples': 1285248, 'steps': 6693, 'loss/train': 1.6768591403961182} -11/06/2021 22:11:18 - INFO - __main__ - Step 6695: {'lr': 0.0004987600243365518, 'samples': 1285440, 'steps': 6694, 'loss/train': 1.7393834590911865} -11/06/2021 22:11:19 - INFO - __main__ - Step 6696: {'lr': 0.0004987594963940066, 'samples': 1285632, 'steps': 6695, 'loss/train': 1.7367832660675049} -11/06/2021 22:11:20 - INFO - __main__ - Step 6697: {'lr': 0.0004987589683393744, 'samples': 1285824, 'steps': 6696, 'loss/train': 2.0130209922790527} -11/06/2021 22:11:20 - INFO - __main__ - Step 6698: {'lr': 0.0004987584401726552, 'samples': 1286016, 'steps': 6697, 'loss/train': 2.1210427284240723} -11/06/2021 22:11:20 - INFO - __main__ - Step 6699: {'lr': 0.0004987579118938492, 'samples': 1286208, 'steps': 6698, 'loss/train': 1.9069485664367676} -11/06/2021 22:11:21 - INFO - __main__ - Step 6700: {'lr': 0.0004987573835029569, 'samples': 1286400, 'steps': 6699, 'loss/train': 2.1391384601593018} -11/06/2021 22:11:21 - INFO - __main__ - Step 6701: {'lr': 0.0004987568549999782, 'samples': 1286592, 'steps': 6700, 'loss/train': 1.8220481872558594} -11/06/2021 22:11:22 - INFO - __main__ - Step 6702: {'lr': 0.0004987563263849136, 'samples': 1286784, 'steps': 6701, 'loss/train': 2.194391965866089} -11/06/2021 22:11:22 - INFO - __main__ - Step 6703: {'lr': 0.0004987557976577632, 'samples': 1286976, 'steps': 6702, 'loss/train': 1.930019497871399} -11/06/2021 22:11:23 - INFO - __main__ - Step 6704: {'lr': 0.0004987552688185273, 'samples': 1287168, 'steps': 6703, 'loss/train': 2.2534563541412354} -11/06/2021 22:11:23 - INFO - __main__ - Step 6705: {'lr': 0.0004987547398672061, 'samples': 1287360, 'steps': 6704, 'loss/train': 1.8196769952774048} -11/06/2021 22:11:23 - INFO - __main__ - Step 6706: {'lr': 0.0004987542108037998, 'samples': 1287552, 'steps': 6705, 'loss/train': 2.2005743980407715} -11/06/2021 22:11:24 - INFO - __main__ - Step 6707: {'lr': 0.0004987536816283087, 'samples': 1287744, 'steps': 6706, 'loss/train': 1.494478702545166} -11/06/2021 22:11:25 - INFO - __main__ - Step 6708: {'lr': 0.0004987531523407331, 'samples': 1287936, 'steps': 6707, 'loss/train': 1.9010131359100342} -11/06/2021 22:11:25 - INFO - __main__ - Step 6709: {'lr': 0.0004987526229410732, 'samples': 1288128, 'steps': 6708, 'loss/train': 1.8058475255966187} -11/06/2021 22:11:25 - INFO - __main__ - Step 6710: {'lr': 0.000498752093429329, 'samples': 1288320, 'steps': 6709, 'loss/train': 1.8113231658935547} -11/06/2021 22:11:26 - INFO - __main__ - Step 6711: {'lr': 0.0004987515638055012, 'samples': 1288512, 'steps': 6710, 'loss/train': 1.8796414136886597} -11/06/2021 22:11:27 - INFO - __main__ - Step 6712: {'lr': 0.0004987510340695896, 'samples': 1288704, 'steps': 6711, 'loss/train': 2.1111533641815186} -11/06/2021 22:11:27 - INFO - __main__ - Step 6713: {'lr': 0.0004987505042215948, 'samples': 1288896, 'steps': 6712, 'loss/train': 2.0792810916900635} -11/06/2021 22:11:27 - INFO - __main__ - Step 6714: {'lr': 0.0004987499742615167, 'samples': 1289088, 'steps': 6713, 'loss/train': 1.8710038661956787} -11/06/2021 22:11:28 - INFO - __main__ - Step 6715: {'lr': 0.0004987494441893557, 'samples': 1289280, 'steps': 6714, 'loss/train': 2.19236421585083} -11/06/2021 22:11:28 - INFO - __main__ - Step 6716: {'lr': 0.0004987489140051121, 'samples': 1289472, 'steps': 6715, 'loss/train': 2.288778066635132} -11/06/2021 22:11:29 - INFO - __main__ - Step 6717: {'lr': 0.000498748383708786, 'samples': 1289664, 'steps': 6716, 'loss/train': 1.4987444877624512} -11/06/2021 22:11:30 - INFO - __main__ - Step 6718: {'lr': 0.0004987478533003779, 'samples': 1289856, 'steps': 6717, 'loss/train': 1.6623836755752563} -11/06/2021 22:11:30 - INFO - __main__ - Step 6719: {'lr': 0.0004987473227798877, 'samples': 1290048, 'steps': 6718, 'loss/train': 1.9826804399490356} -11/06/2021 22:11:30 - INFO - __main__ - Step 6720: {'lr': 0.0004987467921473157, 'samples': 1290240, 'steps': 6719, 'loss/train': 1.859378457069397} -11/06/2021 22:11:31 - INFO - __main__ - Step 6721: {'lr': 0.0004987462614026624, 'samples': 1290432, 'steps': 6720, 'loss/train': 1.4481638669967651} -11/06/2021 22:11:32 - INFO - __main__ - Step 6722: {'lr': 0.0004987457305459279, 'samples': 1290624, 'steps': 6721, 'loss/train': 1.673604965209961} -11/06/2021 22:11:32 - INFO - __main__ - Step 6723: {'lr': 0.0004987451995771124, 'samples': 1290816, 'steps': 6722, 'loss/train': 1.731692910194397} -11/06/2021 22:11:32 - INFO - __main__ - Step 6724: {'lr': 0.000498744668496216, 'samples': 1291008, 'steps': 6723, 'loss/train': 1.4091925621032715} -11/06/2021 22:11:33 - INFO - __main__ - Step 6725: {'lr': 0.0004987441373032393, 'samples': 1291200, 'steps': 6724, 'loss/train': 1.264276385307312} -11/06/2021 22:11:33 - INFO - __main__ - Step 6726: {'lr': 0.0004987436059981821, 'samples': 1291392, 'steps': 6725, 'loss/train': 1.7149850130081177} -11/06/2021 22:11:34 - INFO - __main__ - Step 6727: {'lr': 0.0004987430745810451, 'samples': 1291584, 'steps': 6726, 'loss/train': 1.8684431314468384} -11/06/2021 22:11:34 - INFO - __main__ - Step 6728: {'lr': 0.0004987425430518282, 'samples': 1291776, 'steps': 6727, 'loss/train': 1.2485170364379883} -11/06/2021 22:11:35 - INFO - __main__ - Step 6729: {'lr': 0.0004987420114105317, 'samples': 1291968, 'steps': 6728, 'loss/train': 1.7726978063583374} -11/06/2021 22:11:35 - INFO - __main__ - Step 6730: {'lr': 0.000498741479657156, 'samples': 1292160, 'steps': 6729, 'loss/train': 2.122650146484375} -11/06/2021 22:11:35 - INFO - __main__ - Step 6731: {'lr': 0.0004987409477917011, 'samples': 1292352, 'steps': 6730, 'loss/train': 2.2055673599243164} -11/06/2021 22:11:36 - INFO - __main__ - Step 6732: {'lr': 0.0004987404158141675, 'samples': 1292544, 'steps': 6731, 'loss/train': 1.7402311563491821} -11/06/2021 22:11:37 - INFO - __main__ - Step 6733: {'lr': 0.0004987398837245552, 'samples': 1292736, 'steps': 6732, 'loss/train': 2.053032159805298} -11/06/2021 22:11:37 - INFO - __main__ - Step 6734: {'lr': 0.0004987393515228646, 'samples': 1292928, 'steps': 6733, 'loss/train': 1.614290475845337} -11/06/2021 22:11:38 - INFO - __main__ - Step 6735: {'lr': 0.0004987388192090959, 'samples': 1293120, 'steps': 6734, 'loss/train': 1.5254181623458862} -11/06/2021 22:11:38 - INFO - __main__ - Step 6736: {'lr': 0.0004987382867832493, 'samples': 1293312, 'steps': 6735, 'loss/train': 2.606459379196167} -11/06/2021 22:11:38 - INFO - __main__ - Step 6737: {'lr': 0.0004987377542453251, 'samples': 1293504, 'steps': 6736, 'loss/train': 1.3655518293380737} -11/06/2021 22:11:39 - INFO - __main__ - Step 6738: {'lr': 0.0004987372215953234, 'samples': 1293696, 'steps': 6737, 'loss/train': 1.8274635076522827} -11/06/2021 22:11:40 - INFO - __main__ - Step 6739: {'lr': 0.0004987366888332446, 'samples': 1293888, 'steps': 6738, 'loss/train': 1.5153939723968506} -11/06/2021 22:11:40 - INFO - __main__ - Step 6740: {'lr': 0.0004987361559590889, 'samples': 1294080, 'steps': 6739, 'loss/train': 2.4495294094085693} -11/06/2021 22:11:40 - INFO - __main__ - Step 6741: {'lr': 0.0004987356229728566, 'samples': 1294272, 'steps': 6740, 'loss/train': 1.0965790748596191} -11/06/2021 22:11:41 - INFO - __main__ - Step 6742: {'lr': 0.0004987350898745477, 'samples': 1294464, 'steps': 6741, 'loss/train': 1.4959521293640137} -11/06/2021 22:11:42 - INFO - __main__ - Step 6743: {'lr': 0.0004987345566641628, 'samples': 1294656, 'steps': 6742, 'loss/train': 0.2513975501060486} -11/06/2021 22:11:42 - INFO - __main__ - Step 6744: {'lr': 0.0004987340233417019, 'samples': 1294848, 'steps': 6743, 'loss/train': 1.892668604850769} -11/06/2021 22:11:42 - INFO - __main__ - Step 6745: {'lr': 0.0004987334899071652, 'samples': 1295040, 'steps': 6744, 'loss/train': 3.132077217102051} -11/06/2021 22:11:43 - INFO - __main__ - Step 6746: {'lr': 0.000498732956360553, 'samples': 1295232, 'steps': 6745, 'loss/train': 2.2569050788879395} -11/06/2021 22:11:43 - INFO - __main__ - Step 6747: {'lr': 0.0004987324227018657, 'samples': 1295424, 'steps': 6746, 'loss/train': 2.1900782585144043} -11/06/2021 22:11:44 - INFO - __main__ - Step 6748: {'lr': 0.0004987318889311033, 'samples': 1295616, 'steps': 6747, 'loss/train': 2.0776844024658203} -11/06/2021 22:11:45 - INFO - __main__ - Step 6749: {'lr': 0.0004987313550482663, 'samples': 1295808, 'steps': 6748, 'loss/train': 2.524590253829956} -11/06/2021 22:11:45 - INFO - __main__ - Step 6750: {'lr': 0.0004987308210533546, 'samples': 1296000, 'steps': 6749, 'loss/train': 2.416774272918701} -11/06/2021 22:11:45 - INFO - __main__ - Step 6751: {'lr': 0.0004987302869463686, 'samples': 1296192, 'steps': 6750, 'loss/train': 1.5255533456802368} -11/06/2021 22:11:46 - INFO - __main__ - Step 6752: {'lr': 0.0004987297527273088, 'samples': 1296384, 'steps': 6751, 'loss/train': 1.5347144603729248} -11/06/2021 22:11:47 - INFO - __main__ - Step 6753: {'lr': 0.0004987292183961751, 'samples': 1296576, 'steps': 6752, 'loss/train': 1.8391497135162354} -11/06/2021 22:11:47 - INFO - __main__ - Step 6754: {'lr': 0.0004987286839529679, 'samples': 1296768, 'steps': 6753, 'loss/train': 1.9722280502319336} -11/06/2021 22:11:47 - INFO - __main__ - Step 6755: {'lr': 0.0004987281493976873, 'samples': 1296960, 'steps': 6754, 'loss/train': 1.6345213651657104} -11/06/2021 22:11:48 - INFO - __main__ - Step 6756: {'lr': 0.0004987276147303337, 'samples': 1297152, 'steps': 6755, 'loss/train': 1.5767613649368286} -11/06/2021 22:11:48 - INFO - __main__ - Step 6757: {'lr': 0.0004987270799509071, 'samples': 1297344, 'steps': 6756, 'loss/train': 1.8740566968917847} -11/06/2021 22:11:49 - INFO - __main__ - Step 6758: {'lr': 0.0004987265450594082, 'samples': 1297536, 'steps': 6757, 'loss/train': 1.6574358940124512} -11/06/2021 22:11:49 - INFO - __main__ - Step 6759: {'lr': 0.0004987260100558368, 'samples': 1297728, 'steps': 6758, 'loss/train': 2.1299595832824707} -11/06/2021 22:11:50 - INFO - __main__ - Step 6760: {'lr': 0.0004987254749401933, 'samples': 1297920, 'steps': 6759, 'loss/train': 1.5151968002319336} -11/06/2021 22:11:50 - INFO - __main__ - Step 6761: {'lr': 0.000498724939712478, 'samples': 1298112, 'steps': 6760, 'loss/train': 2.2985787391662598} -11/06/2021 22:11:51 - INFO - __main__ - Step 6762: {'lr': 0.000498724404372691, 'samples': 1298304, 'steps': 6761, 'loss/train': 2.6387453079223633} -11/06/2021 22:11:51 - INFO - __main__ - Step 6763: {'lr': 0.0004987238689208327, 'samples': 1298496, 'steps': 6762, 'loss/train': 1.8828072547912598} -11/06/2021 22:11:52 - INFO - __main__ - Step 6764: {'lr': 0.0004987233333569031, 'samples': 1298688, 'steps': 6763, 'loss/train': 2.250027894973755} -11/06/2021 22:11:52 - INFO - __main__ - Step 6765: {'lr': 0.0004987227976809028, 'samples': 1298880, 'steps': 6764, 'loss/train': 1.8417761325836182} -11/06/2021 22:11:53 - INFO - __main__ - Step 6766: {'lr': 0.0004987222618928318, 'samples': 1299072, 'steps': 6765, 'loss/train': 1.9207943677902222} -11/06/2021 22:11:53 - INFO - __main__ - Step 6767: {'lr': 0.0004987217259926904, 'samples': 1299264, 'steps': 6766, 'loss/train': 0.23178565502166748} -11/06/2021 22:11:53 - INFO - __main__ - Step 6768: {'lr': 0.0004987211899804788, 'samples': 1299456, 'steps': 6767, 'loss/train': 1.8414160013198853} -11/06/2021 22:11:55 - INFO - __main__ - Step 6769: {'lr': 0.0004987206538561972, 'samples': 1299648, 'steps': 6768, 'loss/train': 1.939680814743042} -11/06/2021 22:11:55 - INFO - __main__ - Step 6770: {'lr': 0.000498720117619846, 'samples': 1299840, 'steps': 6769, 'loss/train': 1.4610973596572876} -11/06/2021 22:11:55 - INFO - __main__ - Step 6771: {'lr': 0.0004987195812714252, 'samples': 1300032, 'steps': 6770, 'loss/train': 1.526523232460022} -11/06/2021 22:11:56 - INFO - __main__ - Step 6772: {'lr': 0.0004987190448109354, 'samples': 1300224, 'steps': 6771, 'loss/train': 2.2244198322296143} -11/06/2021 22:11:56 - INFO - __main__ - Step 6773: {'lr': 0.0004987185082383765, 'samples': 1300416, 'steps': 6772, 'loss/train': 1.7443127632141113} -11/06/2021 22:11:56 - INFO - __main__ - Step 6774: {'lr': 0.000498717971553749, 'samples': 1300608, 'steps': 6773, 'loss/train': 2.230355978012085} -11/06/2021 22:11:57 - INFO - __main__ - Step 6775: {'lr': 0.0004987174347570529, 'samples': 1300800, 'steps': 6774, 'loss/train': 0.42308324575424194} -11/06/2021 22:11:58 - INFO - __main__ - Step 6776: {'lr': 0.0004987168978482886, 'samples': 1300992, 'steps': 6775, 'loss/train': 1.6637697219848633} -11/06/2021 22:11:58 - INFO - __main__ - Step 6777: {'lr': 0.0004987163608274564, 'samples': 1301184, 'steps': 6776, 'loss/train': 1.6888412237167358} -11/06/2021 22:11:58 - INFO - __main__ - Step 6778: {'lr': 0.0004987158236945563, 'samples': 1301376, 'steps': 6777, 'loss/train': 1.6136714220046997} -11/06/2021 22:11:59 - INFO - __main__ - Step 6779: {'lr': 0.0004987152864495887, 'samples': 1301568, 'steps': 6778, 'loss/train': 2.1859946250915527} -11/06/2021 22:12:00 - INFO - __main__ - Step 6780: {'lr': 0.000498714749092554, 'samples': 1301760, 'steps': 6779, 'loss/train': 1.9430932998657227} -11/06/2021 22:12:00 - INFO - __main__ - Step 6781: {'lr': 0.0004987142116234521, 'samples': 1301952, 'steps': 6780, 'loss/train': 1.1831541061401367} -11/06/2021 22:12:00 - INFO - __main__ - Step 6782: {'lr': 0.0004987136740422835, 'samples': 1302144, 'steps': 6781, 'loss/train': 1.972415566444397} -11/06/2021 22:12:01 - INFO - __main__ - Step 6783: {'lr': 0.0004987131363490483, 'samples': 1302336, 'steps': 6782, 'loss/train': 1.6971096992492676} -11/06/2021 22:12:01 - INFO - __main__ - Step 6784: {'lr': 0.0004987125985437468, 'samples': 1302528, 'steps': 6783, 'loss/train': 2.15081524848938} -11/06/2021 22:12:02 - INFO - __main__ - Step 6785: {'lr': 0.0004987120606263794, 'samples': 1302720, 'steps': 6784, 'loss/train': 2.056392192840576} -11/06/2021 22:12:03 - INFO - __main__ - Step 6786: {'lr': 0.000498711522596946, 'samples': 1302912, 'steps': 6785, 'loss/train': 1.852485179901123} -11/06/2021 22:12:03 - INFO - __main__ - Step 6787: {'lr': 0.000498710984455447, 'samples': 1303104, 'steps': 6786, 'loss/train': 1.6676357984542847} -11/06/2021 22:12:03 - INFO - __main__ - Step 6788: {'lr': 0.0004987104462018828, 'samples': 1303296, 'steps': 6787, 'loss/train': 1.6238676309585571} -11/06/2021 22:12:04 - INFO - __main__ - Step 6789: {'lr': 0.0004987099078362534, 'samples': 1303488, 'steps': 6788, 'loss/train': 1.8077821731567383} -11/06/2021 22:12:05 - INFO - __main__ - Step 6790: {'lr': 0.0004987093693585591, 'samples': 1303680, 'steps': 6789, 'loss/train': 2.1676840782165527} -11/06/2021 22:12:05 - INFO - __main__ - Step 6791: {'lr': 0.0004987088307688004, 'samples': 1303872, 'steps': 6790, 'loss/train': 0.8062730431556702} -11/06/2021 22:12:05 - INFO - __main__ - Step 6792: {'lr': 0.0004987082920669772, 'samples': 1304064, 'steps': 6791, 'loss/train': 1.5815889835357666} -11/06/2021 22:12:06 - INFO - __main__ - Step 6793: {'lr': 0.0004987077532530899, 'samples': 1304256, 'steps': 6792, 'loss/train': 1.743523120880127} -11/06/2021 22:12:06 - INFO - __main__ - Step 6794: {'lr': 0.0004987072143271388, 'samples': 1304448, 'steps': 6793, 'loss/train': 1.1385010480880737} -11/06/2021 22:12:07 - INFO - __main__ - Step 6795: {'lr': 0.000498706675289124, 'samples': 1304640, 'steps': 6794, 'loss/train': 1.5993659496307373} -11/06/2021 22:12:07 - INFO - __main__ - Step 6796: {'lr': 0.0004987061361390458, 'samples': 1304832, 'steps': 6795, 'loss/train': 1.9786431789398193} -11/06/2021 22:12:08 - INFO - __main__ - Step 6797: {'lr': 0.0004987055968769045, 'samples': 1305024, 'steps': 6796, 'loss/train': 1.779247522354126} -11/06/2021 22:12:08 - INFO - __main__ - Step 6798: {'lr': 0.0004987050575027002, 'samples': 1305216, 'steps': 6797, 'loss/train': 1.8261228799819946} -11/06/2021 22:12:08 - INFO - __main__ - Step 6799: {'lr': 0.0004987045180164333, 'samples': 1305408, 'steps': 6798, 'loss/train': 1.5211654901504517} -11/06/2021 22:12:10 - INFO - __main__ - Step 6800: {'lr': 0.0004987039784181041, 'samples': 1305600, 'steps': 6799, 'loss/train': 0.9507125616073608} -11/06/2021 22:12:10 - INFO - __main__ - Step 6801: {'lr': 0.0004987034387077126, 'samples': 1305792, 'steps': 6800, 'loss/train': 1.7004783153533936} -11/06/2021 22:12:10 - INFO - __main__ - Step 6802: {'lr': 0.0004987028988852592, 'samples': 1305984, 'steps': 6801, 'loss/train': 2.2649049758911133} -11/06/2021 22:12:11 - INFO - __main__ - Step 6803: {'lr': 0.0004987023589507441, 'samples': 1306176, 'steps': 6802, 'loss/train': 1.9656171798706055} -11/06/2021 22:12:11 - INFO - __main__ - Step 6804: {'lr': 0.0004987018189041675, 'samples': 1306368, 'steps': 6803, 'loss/train': 1.7351499795913696} -11/06/2021 22:12:12 - INFO - __main__ - Step 6805: {'lr': 0.0004987012787455297, 'samples': 1306560, 'steps': 6804, 'loss/train': 1.2826176881790161} -11/06/2021 22:12:12 - INFO - __main__ - Step 6806: {'lr': 0.000498700738474831, 'samples': 1306752, 'steps': 6805, 'loss/train': 1.076385736465454} -11/06/2021 22:12:13 - INFO - __main__ - Step 6807: {'lr': 0.0004987001980920716, 'samples': 1306944, 'steps': 6806, 'loss/train': 1.8413560390472412} -11/06/2021 22:12:13 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 0.7521131038665771} -11/06/2021 22:12:13 - INFO - __main__ - Step 6809: {'lr': 0.0004986991169903716, 'samples': 1307328, 'steps': 6808, 'loss/train': 2.316514015197754} -11/06/2021 22:12:14 - INFO - __main__ - Step 6810: {'lr': 0.0004986985762714314, 'samples': 1307520, 'steps': 6809, 'loss/train': 2.3181118965148926} -11/06/2021 22:12:15 - INFO - __main__ - Step 6811: {'lr': 0.0004986980354404316, 'samples': 1307712, 'steps': 6810, 'loss/train': 1.841756820678711} -11/06/2021 22:12:15 - INFO - __main__ - Step 6812: {'lr': 0.0004986974944973723, 'samples': 1307904, 'steps': 6811, 'loss/train': 2.5697433948516846} -11/06/2021 22:12:16 - INFO - __main__ - Step 6813: {'lr': 0.0004986969534422537, 'samples': 1308096, 'steps': 6812, 'loss/train': 0.27386459708213806} -11/06/2021 22:12:16 - INFO - __main__ - Step 6814: {'lr': 0.000498696412275076, 'samples': 1308288, 'steps': 6813, 'loss/train': 1.9443211555480957} -11/06/2021 22:12:16 - INFO - __main__ - Step 6815: {'lr': 0.0004986958709958396, 'samples': 1308480, 'steps': 6814, 'loss/train': 1.8300877809524536} -11/06/2021 22:12:18 - INFO - __main__ - Step 6816: {'lr': 0.0004986953296045448, 'samples': 1308672, 'steps': 6815, 'loss/train': 1.716494083404541} -11/06/2021 22:12:18 - INFO - __main__ - Step 6817: {'lr': 0.0004986947881011917, 'samples': 1308864, 'steps': 6816, 'loss/train': 1.5828531980514526} -11/06/2021 22:12:18 - INFO - __main__ - Step 6818: {'lr': 0.0004986942464857804, 'samples': 1309056, 'steps': 6817, 'loss/train': 1.8163785934448242} -11/06/2021 22:12:19 - INFO - __main__ - Step 6819: {'lr': 0.0004986937047583114, 'samples': 1309248, 'steps': 6818, 'loss/train': 1.8825898170471191} -11/06/2021 22:12:19 - INFO - __main__ - Step 6820: {'lr': 0.0004986931629187848, 'samples': 1309440, 'steps': 6819, 'loss/train': 2.2714736461639404} -11/06/2021 22:12:20 - INFO - __main__ - Step 6821: {'lr': 0.0004986926209672011, 'samples': 1309632, 'steps': 6820, 'loss/train': 2.2257802486419678} -11/06/2021 22:12:20 - INFO - __main__ - Step 6822: {'lr': 0.0004986920789035601, 'samples': 1309824, 'steps': 6821, 'loss/train': 1.6289818286895752} -11/06/2021 22:12:21 - INFO - __main__ - Step 6823: {'lr': 0.0004986915367278623, 'samples': 1310016, 'steps': 6822, 'loss/train': 1.8991657495498657} -11/06/2021 22:12:21 - INFO - __main__ - Step 6824: {'lr': 0.0004986909944401082, 'samples': 1310208, 'steps': 6823, 'loss/train': 1.4807871580123901} -11/06/2021 22:12:21 - INFO - __main__ - Step 6825: {'lr': 0.0004986904520402975, 'samples': 1310400, 'steps': 6824, 'loss/train': 1.9092999696731567} -11/06/2021 22:12:23 - INFO - __main__ - Step 6826: {'lr': 0.0004986899095284308, 'samples': 1310592, 'steps': 6825, 'loss/train': 2.1994271278381348} -11/06/2021 22:12:23 - INFO - __main__ - Step 6827: {'lr': 0.0004986893669045083, 'samples': 1310784, 'steps': 6826, 'loss/train': 2.3838884830474854} -11/06/2021 22:12:23 - INFO - __main__ - Step 6828: {'lr': 0.0004986888241685301, 'samples': 1310976, 'steps': 6827, 'loss/train': 1.6222882270812988} -11/06/2021 22:12:24 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 2.6850411891937256} -11/06/2021 22:12:24 - INFO - __main__ - Step 6830: {'lr': 0.0004986877383604081, 'samples': 1311360, 'steps': 6829, 'loss/train': 1.8489203453063965} -11/06/2021 22:12:25 - INFO - __main__ - Step 6831: {'lr': 0.0004986871952882647, 'samples': 1311552, 'steps': 6830, 'loss/train': 1.933595061302185} -11/06/2021 22:12:25 - INFO - __main__ - Step 6832: {'lr': 0.0004986866521040666, 'samples': 1311744, 'steps': 6831, 'loss/train': 1.9676979780197144} -11/06/2021 22:12:26 - INFO - __main__ - Step 6833: {'lr': 0.0004986861088078142, 'samples': 1311936, 'steps': 6832, 'loss/train': 1.3297863006591797} -11/06/2021 22:12:26 - INFO - __main__ - Step 6834: {'lr': 0.0004986855653995077, 'samples': 1312128, 'steps': 6833, 'loss/train': 0.9145995378494263} -11/06/2021 22:12:26 - INFO - __main__ - Step 6835: {'lr': 0.0004986850218791474, 'samples': 1312320, 'steps': 6834, 'loss/train': 2.046581983566284} -11/06/2021 22:12:28 - INFO - __main__ - Step 6836: {'lr': 0.0004986844782467332, 'samples': 1312512, 'steps': 6835, 'loss/train': 1.6971626281738281} -11/06/2021 22:12:28 - INFO - __main__ - Step 6837: {'lr': 0.0004986839345022658, 'samples': 1312704, 'steps': 6836, 'loss/train': 1.80866539478302} -11/06/2021 22:12:29 - INFO - __main__ - Step 6838: {'lr': 0.0004986833906457453, 'samples': 1312896, 'steps': 6837, 'loss/train': 2.049255609512329} -11/06/2021 22:12:29 - INFO - __main__ - Step 6839: {'lr': 0.0004986828466771718, 'samples': 1313088, 'steps': 6838, 'loss/train': 2.1545591354370117} -11/06/2021 22:12:29 - INFO - __main__ - Step 6840: {'lr': 0.0004986823025965457, 'samples': 1313280, 'steps': 6839, 'loss/train': 1.8146533966064453} -11/06/2021 22:12:30 - INFO - __main__ - Step 6841: {'lr': 0.0004986817584038671, 'samples': 1313472, 'steps': 6840, 'loss/train': 1.6725200414657593} -11/06/2021 22:12:31 - INFO - __main__ - Step 6842: {'lr': 0.0004986812140991365, 'samples': 1313664, 'steps': 6841, 'loss/train': 2.010808229446411} -11/06/2021 22:12:31 - INFO - __main__ - Step 6843: {'lr': 0.0004986806696823538, 'samples': 1313856, 'steps': 6842, 'loss/train': 1.6977182626724243} -11/06/2021 22:12:31 - INFO - __main__ - Step 6844: {'lr': 0.0004986801251535195, 'samples': 1314048, 'steps': 6843, 'loss/train': 1.7137373685836792} -11/06/2021 22:12:32 - INFO - __main__ - Step 6845: {'lr': 0.0004986795805126339, 'samples': 1314240, 'steps': 6844, 'loss/train': 1.878450632095337} -11/06/2021 22:12:32 - INFO - __main__ - Step 6846: {'lr': 0.000498679035759697, 'samples': 1314432, 'steps': 6845, 'loss/train': 1.5944817066192627} -11/06/2021 22:12:33 - INFO - __main__ - Step 6847: {'lr': 0.0004986784908947091, 'samples': 1314624, 'steps': 6846, 'loss/train': 1.7078269720077515} -11/06/2021 22:12:34 - INFO - __main__ - Step 6848: {'lr': 0.0004986779459176706, 'samples': 1314816, 'steps': 6847, 'loss/train': 1.9563493728637695} -11/06/2021 22:12:34 - INFO - __main__ - Step 6849: {'lr': 0.0004986774008285816, 'samples': 1315008, 'steps': 6848, 'loss/train': 1.9744795560836792} -11/06/2021 22:12:34 - INFO - __main__ - Step 6850: {'lr': 0.0004986768556274425, 'samples': 1315200, 'steps': 6849, 'loss/train': 1.5663435459136963} -11/06/2021 22:12:35 - INFO - __main__ - Step 6851: {'lr': 0.0004986763103142533, 'samples': 1315392, 'steps': 6850, 'loss/train': 1.9012843370437622} -11/06/2021 22:12:36 - INFO - __main__ - Step 6852: {'lr': 0.0004986757648890145, 'samples': 1315584, 'steps': 6851, 'loss/train': 1.9131489992141724} -11/06/2021 22:12:36 - INFO - __main__ - Step 6853: {'lr': 0.0004986752193517262, 'samples': 1315776, 'steps': 6852, 'loss/train': 1.6437551975250244} -11/06/2021 22:12:36 - INFO - __main__ - Step 6854: {'lr': 0.0004986746737023887, 'samples': 1315968, 'steps': 6853, 'loss/train': 0.30247291922569275} -11/06/2021 22:12:37 - INFO - __main__ - Step 6855: {'lr': 0.0004986741279410023, 'samples': 1316160, 'steps': 6854, 'loss/train': 2.0035195350646973} -11/06/2021 22:12:37 - INFO - __main__ - Step 6856: {'lr': 0.000498673582067567, 'samples': 1316352, 'steps': 6855, 'loss/train': 1.685018539428711} -11/06/2021 22:12:38 - INFO - __main__ - Step 6857: {'lr': 0.0004986730360820833, 'samples': 1316544, 'steps': 6856, 'loss/train': 1.0697712898254395} -11/06/2021 22:12:39 - INFO - __main__ - Step 6858: {'lr': 0.0004986724899845514, 'samples': 1316736, 'steps': 6857, 'loss/train': 1.4516496658325195} -11/06/2021 22:12:39 - INFO - __main__ - Step 6859: {'lr': 0.0004986719437749716, 'samples': 1316928, 'steps': 6858, 'loss/train': 2.176100730895996} -11/06/2021 22:12:39 - INFO - __main__ - Step 6860: {'lr': 0.0004986713974533439, 'samples': 1317120, 'steps': 6859, 'loss/train': 1.1705691814422607} -11/06/2021 22:12:40 - INFO - __main__ - Step 6861: {'lr': 0.0004986708510196688, 'samples': 1317312, 'steps': 6860, 'loss/train': 1.852432131767273} -11/06/2021 22:12:40 - INFO - __main__ - Step 6862: {'lr': 0.0004986703044739464, 'samples': 1317504, 'steps': 6861, 'loss/train': 1.9012736082077026} -11/06/2021 22:12:41 - INFO - __main__ - Step 6863: {'lr': 0.000498669757816177, 'samples': 1317696, 'steps': 6862, 'loss/train': 2.041994333267212} -11/06/2021 22:12:41 - INFO - __main__ - Step 6864: {'lr': 0.0004986692110463609, 'samples': 1317888, 'steps': 6863, 'loss/train': 0.9249697327613831} -11/06/2021 22:12:42 - INFO - __main__ - Step 6865: {'lr': 0.0004986686641644982, 'samples': 1318080, 'steps': 6864, 'loss/train': 1.9790064096450806} -11/06/2021 22:12:42 - INFO - __main__ - Step 6866: {'lr': 0.0004986681171705893, 'samples': 1318272, 'steps': 6865, 'loss/train': 1.9213021993637085} -11/06/2021 22:12:42 - INFO - __main__ - Step 6867: {'lr': 0.0004986675700646343, 'samples': 1318464, 'steps': 6866, 'loss/train': 1.9628852605819702} -11/06/2021 22:12:43 - INFO - __main__ - Step 6868: {'lr': 0.0004986670228466337, 'samples': 1318656, 'steps': 6867, 'loss/train': 2.0977110862731934} -11/06/2021 22:12:44 - INFO - __main__ - Step 6869: {'lr': 0.0004986664755165874, 'samples': 1318848, 'steps': 6868, 'loss/train': 1.4509758949279785} -11/06/2021 22:12:44 - INFO - __main__ - Step 6870: {'lr': 0.000498665928074496, 'samples': 1319040, 'steps': 6869, 'loss/train': 1.9043452739715576} -11/06/2021 22:12:44 - INFO - __main__ - Step 6871: {'lr': 0.0004986653805203594, 'samples': 1319232, 'steps': 6870, 'loss/train': 1.188199520111084} -11/06/2021 22:12:45 - INFO - __main__ - Step 6872: {'lr': 0.0004986648328541781, 'samples': 1319424, 'steps': 6871, 'loss/train': 1.6279737949371338} -11/06/2021 22:12:46 - INFO - __main__ - Step 6873: {'lr': 0.0004986642850759522, 'samples': 1319616, 'steps': 6872, 'loss/train': 1.2891004085540771} -11/06/2021 22:12:46 - INFO - __main__ - Step 6874: {'lr': 0.0004986637371856822, 'samples': 1319808, 'steps': 6873, 'loss/train': 2.0982792377471924} -11/06/2021 22:12:47 - INFO - __main__ - Step 6875: {'lr': 0.000498663189183368, 'samples': 1320000, 'steps': 6874, 'loss/train': 1.6079758405685425} -11/06/2021 22:12:47 - INFO - __main__ - Step 6876: {'lr': 0.0004986626410690099, 'samples': 1320192, 'steps': 6875, 'loss/train': 1.3328086137771606} -11/06/2021 22:12:47 - INFO - __main__ - Step 6877: {'lr': 0.0004986620928426085, 'samples': 1320384, 'steps': 6876, 'loss/train': 1.9018620252609253} -11/06/2021 22:12:48 - INFO - __main__ - Step 6878: {'lr': 0.0004986615445041636, 'samples': 1320576, 'steps': 6877, 'loss/train': 1.5764297246932983} -11/06/2021 22:12:49 - INFO - __main__ - Step 6879: {'lr': 0.0004986609960536757, 'samples': 1320768, 'steps': 6878, 'loss/train': 1.831556797027588} -11/06/2021 22:12:49 - INFO - __main__ - Step 6880: {'lr': 0.000498660447491145, 'samples': 1320960, 'steps': 6879, 'loss/train': 1.3842569589614868} -11/06/2021 22:12:49 - INFO - __main__ - Step 6881: {'lr': 0.0004986598988165718, 'samples': 1321152, 'steps': 6880, 'loss/train': 2.5729262828826904} -11/06/2021 22:12:50 - INFO - __main__ - Step 6882: {'lr': 0.0004986593500299562, 'samples': 1321344, 'steps': 6881, 'loss/train': 2.3645272254943848} -11/06/2021 22:12:51 - INFO - __main__ - Step 6883: {'lr': 0.0004986588011312986, 'samples': 1321536, 'steps': 6882, 'loss/train': 1.524306058883667} -11/06/2021 22:12:51 - INFO - __main__ - Step 6884: {'lr': 0.0004986582521205992, 'samples': 1321728, 'steps': 6883, 'loss/train': 2.1317756175994873} -11/06/2021 22:12:51 - INFO - __main__ - Step 6885: {'lr': 0.0004986577029978581, 'samples': 1321920, 'steps': 6884, 'loss/train': 2.3129236698150635} -11/06/2021 22:12:52 - INFO - __main__ - Step 6886: {'lr': 0.0004986571537630757, 'samples': 1322112, 'steps': 6885, 'loss/train': 1.8439607620239258} -11/06/2021 22:12:52 - INFO - __main__ - Step 6887: {'lr': 0.0004986566044162523, 'samples': 1322304, 'steps': 6886, 'loss/train': 2.0930988788604736} -11/06/2021 22:12:53 - INFO - __main__ - Step 6888: {'lr': 0.0004986560549573881, 'samples': 1322496, 'steps': 6887, 'loss/train': 2.0430047512054443} -11/06/2021 22:12:53 - INFO - __main__ - Step 6889: {'lr': 0.0004986555053864833, 'samples': 1322688, 'steps': 6888, 'loss/train': 1.7372727394104004} -11/06/2021 22:12:54 - INFO - __main__ - Step 6890: {'lr': 0.0004986549557035381, 'samples': 1322880, 'steps': 6889, 'loss/train': 1.7419931888580322} -11/06/2021 22:12:54 - INFO - __main__ - Step 6891: {'lr': 0.0004986544059085528, 'samples': 1323072, 'steps': 6890, 'loss/train': 1.3079571723937988} -11/06/2021 22:12:55 - INFO - __main__ - Step 6892: {'lr': 0.0004986538560015277, 'samples': 1323264, 'steps': 6891, 'loss/train': 2.068556070327759} -11/06/2021 22:12:56 - INFO - __main__ - Step 6893: {'lr': 0.000498653305982463, 'samples': 1323456, 'steps': 6892, 'loss/train': 1.350880742073059} -11/06/2021 22:12:56 - INFO - __main__ - Step 6894: {'lr': 0.0004986527558513591, 'samples': 1323648, 'steps': 6893, 'loss/train': 1.4500173330307007} -11/06/2021 22:12:56 - INFO - __main__ - Step 6895: {'lr': 0.0004986522056082159, 'samples': 1323840, 'steps': 6894, 'loss/train': 2.146724224090576} -11/06/2021 22:12:57 - INFO - __main__ - Step 6896: {'lr': 0.0004986516552530339, 'samples': 1324032, 'steps': 6895, 'loss/train': 1.203369140625} -11/06/2021 22:12:57 - INFO - __main__ - Step 6897: {'lr': 0.0004986511047858134, 'samples': 1324224, 'steps': 6896, 'loss/train': 2.2133257389068604} -11/06/2021 22:12:57 - INFO - __main__ - Step 6898: {'lr': 0.0004986505542065545, 'samples': 1324416, 'steps': 6897, 'loss/train': 2.0129928588867188} -11/06/2021 22:12:58 - INFO - __main__ - Step 6899: {'lr': 0.0004986500035152574, 'samples': 1324608, 'steps': 6898, 'loss/train': 2.3049161434173584} -11/06/2021 22:12:59 - INFO - __main__ - Step 6900: {'lr': 0.0004986494527119226, 'samples': 1324800, 'steps': 6899, 'loss/train': 1.816585898399353} -11/06/2021 22:12:59 - INFO - __main__ - Step 6901: {'lr': 0.0004986489017965501, 'samples': 1324992, 'steps': 6900, 'loss/train': 1.263410210609436} -11/06/2021 22:12:59 - INFO - __main__ - Step 6902: {'lr': 0.0004986483507691403, 'samples': 1325184, 'steps': 6901, 'loss/train': 1.9309344291687012} -11/06/2021 22:13:00 - INFO - __main__ - Step 6903: {'lr': 0.0004986477996296934, 'samples': 1325376, 'steps': 6902, 'loss/train': 1.9613704681396484} -11/06/2021 22:13:01 - INFO - __main__ - Step 6904: {'lr': 0.0004986472483782096, 'samples': 1325568, 'steps': 6903, 'loss/train': 1.877648115158081} -11/06/2021 22:13:01 - INFO - __main__ - Step 6905: {'lr': 0.0004986466970146891, 'samples': 1325760, 'steps': 6904, 'loss/train': 1.900101900100708} -11/06/2021 22:13:01 - INFO - __main__ - Step 6906: {'lr': 0.0004986461455391323, 'samples': 1325952, 'steps': 6905, 'loss/train': 2.0257797241210938} -11/06/2021 22:13:02 - INFO - __main__ - Step 6907: {'lr': 0.0004986455939515395, 'samples': 1326144, 'steps': 6906, 'loss/train': 1.7874330282211304} -11/06/2021 22:13:02 - INFO - __main__ - Step 6908: {'lr': 0.0004986450422519107, 'samples': 1326336, 'steps': 6907, 'loss/train': 1.842711091041565} -11/06/2021 22:13:03 - INFO - __main__ - Step 6909: {'lr': 0.0004986444904402463, 'samples': 1326528, 'steps': 6908, 'loss/train': 2.1983108520507812} -11/06/2021 22:13:03 - INFO - __main__ - Step 6910: {'lr': 0.0004986439385165464, 'samples': 1326720, 'steps': 6909, 'loss/train': 1.821173906326294} -11/06/2021 22:13:04 - INFO - __main__ - Step 6911: {'lr': 0.0004986433864808115, 'samples': 1326912, 'steps': 6910, 'loss/train': 2.3128411769866943} -11/06/2021 22:13:04 - INFO - __main__ - Step 6912: {'lr': 0.0004986428343330418, 'samples': 1327104, 'steps': 6911, 'loss/train': 1.7972272634506226} -11/06/2021 22:13:05 - INFO - __main__ - Step 6913: {'lr': 0.0004986422820732375, 'samples': 1327296, 'steps': 6912, 'loss/train': 2.888493776321411} -11/06/2021 22:13:05 - INFO - __main__ - Step 6914: {'lr': 0.0004986417297013987, 'samples': 1327488, 'steps': 6913, 'loss/train': 1.6202863454818726} -11/06/2021 22:13:06 - INFO - __main__ - Step 6915: {'lr': 0.0004986411772175258, 'samples': 1327680, 'steps': 6914, 'loss/train': 1.704667329788208} -11/06/2021 22:13:06 - INFO - __main__ - Step 6916: {'lr': 0.000498640624621619, 'samples': 1327872, 'steps': 6915, 'loss/train': 1.571314811706543} -11/06/2021 22:13:07 - INFO - __main__ - Step 6917: {'lr': 0.0004986400719136786, 'samples': 1328064, 'steps': 6916, 'loss/train': 1.8842869997024536} -11/06/2021 22:13:07 - INFO - __main__ - Step 6918: {'lr': 0.0004986395190937048, 'samples': 1328256, 'steps': 6917, 'loss/train': 1.7865066528320312} -11/06/2021 22:13:08 - INFO - __main__ - Step 6919: {'lr': 0.000498638966161698, 'samples': 1328448, 'steps': 6918, 'loss/train': 1.9803627729415894} -11/06/2021 22:13:08 - INFO - __main__ - Step 6920: {'lr': 0.0004986384131176583, 'samples': 1328640, 'steps': 6919, 'loss/train': 2.02374529838562} -11/06/2021 22:13:09 - INFO - __main__ - Step 6921: {'lr': 0.0004986378599615858, 'samples': 1328832, 'steps': 6920, 'loss/train': 2.2463250160217285} -11/06/2021 22:13:09 - INFO - __main__ - Step 6922: {'lr': 0.000498637306693481, 'samples': 1329024, 'steps': 6921, 'loss/train': 1.9036977291107178} -11/06/2021 22:13:09 - INFO - __main__ - Step 6923: {'lr': 0.0004986367533133441, 'samples': 1329216, 'steps': 6922, 'loss/train': 1.8560709953308105} -11/06/2021 22:13:10 - INFO - __main__ - Step 6924: {'lr': 0.0004986361998211752, 'samples': 1329408, 'steps': 6923, 'loss/train': 1.860509991645813} -11/06/2021 22:13:11 - INFO - __main__ - Step 6925: {'lr': 0.0004986356462169748, 'samples': 1329600, 'steps': 6924, 'loss/train': 1.627434253692627} -11/06/2021 22:13:11 - INFO - __main__ - Step 6926: {'lr': 0.0004986350925007429, 'samples': 1329792, 'steps': 6925, 'loss/train': 1.9676358699798584} -11/06/2021 22:13:11 - INFO - __main__ - Step 6927: {'lr': 0.00049863453867248, 'samples': 1329984, 'steps': 6926, 'loss/train': 1.5846327543258667} -11/06/2021 22:13:12 - INFO - __main__ - Step 6928: {'lr': 0.0004986339847321862, 'samples': 1330176, 'steps': 6927, 'loss/train': 2.3178396224975586} -11/06/2021 22:13:13 - INFO - __main__ - Step 6929: {'lr': 0.0004986334306798616, 'samples': 1330368, 'steps': 6928, 'loss/train': 2.166189432144165} -11/06/2021 22:13:13 - INFO - __main__ - Step 6930: {'lr': 0.0004986328765155068, 'samples': 1330560, 'steps': 6929, 'loss/train': 2.235844373703003} -11/06/2021 22:13:13 - INFO - __main__ - Step 6931: {'lr': 0.0004986323222391217, 'samples': 1330752, 'steps': 6930, 'loss/train': 1.5991435050964355} -11/06/2021 22:13:14 - INFO - __main__ - Step 6932: {'lr': 0.0004986317678507069, 'samples': 1330944, 'steps': 6931, 'loss/train': 1.773486852645874} -11/06/2021 22:13:14 - INFO - __main__ - Step 6933: {'lr': 0.0004986312133502623, 'samples': 1331136, 'steps': 6932, 'loss/train': 0.26625779271125793} -11/06/2021 22:13:15 - INFO - __main__ - Step 6934: {'lr': 0.0004986306587377884, 'samples': 1331328, 'steps': 6933, 'loss/train': 1.767874836921692} -11/06/2021 22:13:16 - INFO - __main__ - Step 6935: {'lr': 0.0004986301040132853, 'samples': 1331520, 'steps': 6934, 'loss/train': 1.564034342765808} -11/06/2021 22:13:16 - INFO - __main__ - Step 6936: {'lr': 0.0004986295491767533, 'samples': 1331712, 'steps': 6935, 'loss/train': 1.7570186853408813} -11/06/2021 22:13:16 - INFO - __main__ - Step 6937: {'lr': 0.0004986289942281927, 'samples': 1331904, 'steps': 6936, 'loss/train': 1.7670789957046509} -11/06/2021 22:13:17 - INFO - __main__ - Step 6938: {'lr': 0.0004986284391676037, 'samples': 1332096, 'steps': 6937, 'loss/train': 2.3007538318634033} -11/06/2021 22:13:18 - INFO - __main__ - Step 6939: {'lr': 0.0004986278839949866, 'samples': 1332288, 'steps': 6938, 'loss/train': 2.0607035160064697} -11/06/2021 22:13:18 - INFO - __main__ - Step 6940: {'lr': 0.0004986273287103416, 'samples': 1332480, 'steps': 6939, 'loss/train': 2.072021484375} -11/06/2021 22:13:18 - INFO - __main__ - Step 6941: {'lr': 0.0004986267733136689, 'samples': 1332672, 'steps': 6940, 'loss/train': 1.5899384021759033} -11/06/2021 22:13:19 - INFO - __main__ - Step 6942: {'lr': 0.0004986262178049689, 'samples': 1332864, 'steps': 6941, 'loss/train': 2.349639415740967} -11/06/2021 22:13:19 - INFO - __main__ - Step 6943: {'lr': 0.0004986256621842417, 'samples': 1333056, 'steps': 6942, 'loss/train': 1.3075493574142456} -11/06/2021 22:13:20 - INFO - __main__ - Step 6944: {'lr': 0.0004986251064514878, 'samples': 1333248, 'steps': 6943, 'loss/train': 1.4353903532028198} -11/06/2021 22:13:21 - INFO - __main__ - Step 6945: {'lr': 0.000498624550606707, 'samples': 1333440, 'steps': 6944, 'loss/train': 2.1542229652404785} -11/06/2021 22:13:21 - INFO - __main__ - Step 6946: {'lr': 0.0004986239946498999, 'samples': 1333632, 'steps': 6945, 'loss/train': 1.9125726222991943} -11/06/2021 22:13:21 - INFO - __main__ - Step 6947: {'lr': 0.0004986234385810668, 'samples': 1333824, 'steps': 6946, 'loss/train': 1.9208937883377075} -11/06/2021 22:13:22 - INFO - __main__ - Step 6948: {'lr': 0.0004986228824002076, 'samples': 1334016, 'steps': 6947, 'loss/train': 1.7958143949508667} -11/06/2021 22:13:23 - INFO - __main__ - Step 6949: {'lr': 0.0004986223261073228, 'samples': 1334208, 'steps': 6948, 'loss/train': 2.022138833999634} -11/06/2021 22:13:23 - INFO - __main__ - Step 6950: {'lr': 0.0004986217697024128, 'samples': 1334400, 'steps': 6949, 'loss/train': 2.049771785736084} -11/06/2021 22:13:23 - INFO - __main__ - Step 6951: {'lr': 0.0004986212131854775, 'samples': 1334592, 'steps': 6950, 'loss/train': 1.7569395303726196} -11/06/2021 22:13:24 - INFO - __main__ - Step 6952: {'lr': 0.0004986206565565173, 'samples': 1334784, 'steps': 6951, 'loss/train': 1.6181141138076782} -11/06/2021 22:13:24 - INFO - __main__ - Step 6953: {'lr': 0.0004986200998155325, 'samples': 1334976, 'steps': 6952, 'loss/train': 2.3144214153289795} -11/06/2021 22:13:24 - INFO - __main__ - Step 6954: {'lr': 0.0004986195429625234, 'samples': 1335168, 'steps': 6953, 'loss/train': 1.8186416625976562} -11/06/2021 22:13:25 - INFO - __main__ - Step 6955: {'lr': 0.0004986189859974901, 'samples': 1335360, 'steps': 6954, 'loss/train': 1.4414639472961426} -11/06/2021 22:13:26 - INFO - __main__ - Step 6956: {'lr': 0.000498618428920433, 'samples': 1335552, 'steps': 6955, 'loss/train': 1.4519563913345337} -11/06/2021 22:13:26 - INFO - __main__ - Step 6957: {'lr': 0.0004986178717313522, 'samples': 1335744, 'steps': 6956, 'loss/train': 1.7825121879577637} -11/06/2021 22:13:26 - INFO - __main__ - Step 6958: {'lr': 0.000498617314430248, 'samples': 1335936, 'steps': 6957, 'loss/train': 2.2233121395111084} -11/06/2021 22:13:27 - INFO - __main__ - Step 6959: {'lr': 0.0004986167570171208, 'samples': 1336128, 'steps': 6958, 'loss/train': 2.0718345642089844} -11/06/2021 22:13:28 - INFO - __main__ - Step 6960: {'lr': 0.0004986161994919706, 'samples': 1336320, 'steps': 6959, 'loss/train': 1.547726035118103} -11/06/2021 22:13:28 - INFO - __main__ - Step 6961: {'lr': 0.0004986156418547978, 'samples': 1336512, 'steps': 6960, 'loss/train': 2.062274694442749} -11/06/2021 22:13:29 - INFO - __main__ - Step 6962: {'lr': 0.0004986150841056027, 'samples': 1336704, 'steps': 6961, 'loss/train': 2.067039966583252} -11/06/2021 22:13:29 - INFO - __main__ - Step 6963: {'lr': 0.0004986145262443854, 'samples': 1336896, 'steps': 6962, 'loss/train': 1.8536887168884277} -11/06/2021 22:13:29 - INFO - __main__ - Step 6964: {'lr': 0.0004986139682711463, 'samples': 1337088, 'steps': 6963, 'loss/train': 2.060143232345581} -11/06/2021 22:13:31 - INFO - __main__ - Step 6965: {'lr': 0.0004986134101858854, 'samples': 1337280, 'steps': 6964, 'loss/train': 1.9564449787139893} -11/06/2021 22:13:31 - INFO - __main__ - Step 6966: {'lr': 0.0004986128519886033, 'samples': 1337472, 'steps': 6965, 'loss/train': 2.0002098083496094} -11/06/2021 22:13:31 - INFO - __main__ - Step 6967: {'lr': 0.0004986122936793, 'samples': 1337664, 'steps': 6966, 'loss/train': 1.0394262075424194} -11/06/2021 22:13:32 - INFO - __main__ - Step 6968: {'lr': 0.000498611735257976, 'samples': 1337856, 'steps': 6967, 'loss/train': 1.8004080057144165} -11/06/2021 22:13:32 - INFO - __main__ - Step 6969: {'lr': 0.0004986111767246313, 'samples': 1338048, 'steps': 6968, 'loss/train': 1.8207870721817017} -11/06/2021 22:13:33 - INFO - __main__ - Step 6970: {'lr': 0.0004986106180792662, 'samples': 1338240, 'steps': 6969, 'loss/train': 2.2126078605651855} -11/06/2021 22:13:33 - INFO - __main__ - Step 6971: {'lr': 0.000498610059321881, 'samples': 1338432, 'steps': 6970, 'loss/train': 1.8455476760864258} -11/06/2021 22:13:34 - INFO - __main__ - Step 6972: {'lr': 0.000498609500452476, 'samples': 1338624, 'steps': 6971, 'loss/train': 1.8543205261230469} -11/06/2021 22:13:34 - INFO - __main__ - Step 6973: {'lr': 0.0004986089414710513, 'samples': 1338816, 'steps': 6972, 'loss/train': 2.0430335998535156} -11/06/2021 22:13:35 - INFO - __main__ - Step 6974: {'lr': 0.0004986083823776073, 'samples': 1339008, 'steps': 6973, 'loss/train': 1.9079920053482056} -11/06/2021 22:13:35 - INFO - __main__ - Step 6975: {'lr': 0.0004986078231721443, 'samples': 1339200, 'steps': 6974, 'loss/train': 0.6376028060913086} -11/06/2021 22:13:36 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.7745708227157593} -11/06/2021 22:13:36 - INFO - __main__ - Step 6977: {'lr': 0.0004986067044251617, 'samples': 1339584, 'steps': 6976, 'loss/train': 2.010833740234375} -11/06/2021 22:13:37 - INFO - __main__ - Step 6978: {'lr': 0.0004986061448836428, 'samples': 1339776, 'steps': 6977, 'loss/train': 1.629277229309082} -11/06/2021 22:13:37 - INFO - __main__ - Step 6979: {'lr': 0.0004986055852301058, 'samples': 1339968, 'steps': 6978, 'loss/train': 1.9664230346679688} -11/06/2021 22:13:39 - INFO - __main__ - Step 6980: {'lr': 0.000498605025464551, 'samples': 1340160, 'steps': 6979, 'loss/train': 1.915958046913147} -11/06/2021 22:13:39 - INFO - __main__ - Step 6981: {'lr': 0.0004986044655869786, 'samples': 1340352, 'steps': 6980, 'loss/train': 1.7974884510040283} -11/06/2021 22:13:40 - INFO - __main__ - Step 6982: {'lr': 0.0004986039055973889, 'samples': 1340544, 'steps': 6981, 'loss/train': 1.9128649234771729} -11/06/2021 22:13:40 - INFO - __main__ - Step 6983: {'lr': 0.000498603345495782, 'samples': 1340736, 'steps': 6982, 'loss/train': 1.8619794845581055} -11/06/2021 22:13:40 - INFO - __main__ - Step 6984: {'lr': 0.0004986027852821583, 'samples': 1340928, 'steps': 6983, 'loss/train': 1.3572192192077637} -11/06/2021 22:13:41 - INFO - __main__ - Step 6985: {'lr': 0.000498602224956518, 'samples': 1341120, 'steps': 6984, 'loss/train': 1.4499187469482422} -11/06/2021 22:13:41 - INFO - __main__ - Step 6986: {'lr': 0.0004986016645188615, 'samples': 1341312, 'steps': 6985, 'loss/train': 1.4657028913497925} -11/06/2021 22:13:41 - INFO - __main__ - Step 6987: {'lr': 0.0004986011039691889, 'samples': 1341504, 'steps': 6986, 'loss/train': 2.016274929046631} -11/06/2021 22:13:43 - INFO - __main__ - Step 6988: {'lr': 0.0004986005433075004, 'samples': 1341696, 'steps': 6987, 'loss/train': 2.058478355407715} -11/06/2021 22:13:43 - INFO - __main__ - Step 6989: {'lr': 0.0004985999825337964, 'samples': 1341888, 'steps': 6988, 'loss/train': 2.3388593196868896} -11/06/2021 22:13:43 - INFO - __main__ - Step 6990: {'lr': 0.000498599421648077, 'samples': 1342080, 'steps': 6989, 'loss/train': 1.34577214717865} -11/06/2021 22:13:44 - INFO - __main__ - Step 6991: {'lr': 0.0004985988606503426, 'samples': 1342272, 'steps': 6990, 'loss/train': 1.556723713874817} -11/06/2021 22:13:44 - INFO - __main__ - Step 6992: {'lr': 0.0004985982995405933, 'samples': 1342464, 'steps': 6991, 'loss/train': 1.9663342237472534} -11/06/2021 22:13:45 - INFO - __main__ - Step 6993: {'lr': 0.0004985977383188296, 'samples': 1342656, 'steps': 6992, 'loss/train': 1.9654285907745361} -11/06/2021 22:13:45 - INFO - __main__ - Step 6994: {'lr': 0.0004985971769850515, 'samples': 1342848, 'steps': 6993, 'loss/train': 1.9241557121276855} -11/06/2021 22:13:46 - INFO - __main__ - Step 6995: {'lr': 0.0004985966155392593, 'samples': 1343040, 'steps': 6994, 'loss/train': 2.185478687286377} -11/06/2021 22:13:46 - INFO - __main__ - Step 6996: {'lr': 0.0004985960539814534, 'samples': 1343232, 'steps': 6995, 'loss/train': 1.901774287223816} -11/06/2021 22:13:46 - INFO - __main__ - Step 6997: {'lr': 0.000498595492311634, 'samples': 1343424, 'steps': 6996, 'loss/train': 1.8927873373031616} -11/06/2021 22:13:47 - INFO - __main__ - Step 6998: {'lr': 0.0004985949305298012, 'samples': 1343616, 'steps': 6997, 'loss/train': 1.5036976337432861} -11/06/2021 22:13:48 - INFO - __main__ - Step 6999: {'lr': 0.0004985943686359554, 'samples': 1343808, 'steps': 6998, 'loss/train': 2.1838197708129883} -11/06/2021 22:13:48 - INFO - __main__ - Step 7000: {'lr': 0.0004985938066300968, 'samples': 1344000, 'steps': 6999, 'loss/train': 1.8023282289505005} -11/06/2021 22:13:48 - INFO - __main__ - Step 7001: {'lr': 0.0004985932445122257, 'samples': 1344192, 'steps': 7000, 'loss/train': 0.9377233982086182} -11/06/2021 22:13:49 - INFO - __main__ - Step 7002: {'lr': 0.0004985926822823422, 'samples': 1344384, 'steps': 7001, 'loss/train': 2.0790352821350098} -11/06/2021 22:13:49 - INFO - __main__ - Step 7003: {'lr': 0.0004985921199404467, 'samples': 1344576, 'steps': 7002, 'loss/train': 1.5738434791564941} -11/06/2021 22:13:50 - INFO - __main__ - Step 7004: {'lr': 0.0004985915574865395, 'samples': 1344768, 'steps': 7003, 'loss/train': 2.0488102436065674} -11/06/2021 22:13:50 - INFO - __main__ - Step 7005: {'lr': 0.0004985909949206209, 'samples': 1344960, 'steps': 7004, 'loss/train': 2.2131500244140625} -11/06/2021 22:13:51 - INFO - __main__ - Step 7006: {'lr': 0.0004985904322426909, 'samples': 1345152, 'steps': 7005, 'loss/train': 2.16741681098938} -11/06/2021 22:13:51 - INFO - __main__ - Step 7007: {'lr': 0.0004985898694527498, 'samples': 1345344, 'steps': 7006, 'loss/train': 1.9892717599868774} -11/06/2021 22:13:52 - INFO - __main__ - Step 7008: {'lr': 0.000498589306550798, 'samples': 1345536, 'steps': 7007, 'loss/train': 1.8207341432571411} -11/06/2021 22:13:53 - INFO - __main__ - Step 7009: {'lr': 0.0004985887435368357, 'samples': 1345728, 'steps': 7008, 'loss/train': 2.600703716278076} -11/06/2021 22:13:53 - INFO - __main__ - Step 7010: {'lr': 0.0004985881804108632, 'samples': 1345920, 'steps': 7009, 'loss/train': 1.830875277519226} -11/06/2021 22:13:53 - INFO - __main__ - Step 7011: {'lr': 0.0004985876171728807, 'samples': 1346112, 'steps': 7010, 'loss/train': 1.6429589986801147} -11/06/2021 22:13:54 - INFO - __main__ - Step 7012: {'lr': 0.0004985870538228884, 'samples': 1346304, 'steps': 7011, 'loss/train': 1.831001877784729} -11/06/2021 22:13:54 - INFO - __main__ - Step 7013: {'lr': 0.0004985864903608866, 'samples': 1346496, 'steps': 7012, 'loss/train': 1.9762578010559082} -11/06/2021 22:13:55 - INFO - __main__ - Step 7014: {'lr': 0.0004985859267868756, 'samples': 1346688, 'steps': 7013, 'loss/train': 2.1162519454956055} -11/06/2021 22:13:55 - INFO - __main__ - Step 7015: {'lr': 0.0004985853631008557, 'samples': 1346880, 'steps': 7014, 'loss/train': 1.9965474605560303} -11/06/2021 22:13:56 - INFO - __main__ - Step 7016: {'lr': 0.000498584799302827, 'samples': 1347072, 'steps': 7015, 'loss/train': 1.330285906791687} -11/06/2021 22:13:56 - INFO - __main__ - Step 7017: {'lr': 0.0004985842353927897, 'samples': 1347264, 'steps': 7016, 'loss/train': 1.870910406112671} -11/06/2021 22:13:57 - INFO - __main__ - Step 7018: {'lr': 0.0004985836713707443, 'samples': 1347456, 'steps': 7017, 'loss/train': 2.007260799407959} -11/06/2021 22:13:58 - INFO - __main__ - Step 7019: {'lr': 0.000498583107236691, 'samples': 1347648, 'steps': 7018, 'loss/train': 1.9178532361984253} -11/06/2021 22:13:58 - INFO - __main__ - Step 7020: {'lr': 0.0004985825429906299, 'samples': 1347840, 'steps': 7019, 'loss/train': 1.8477237224578857} -11/06/2021 22:13:58 - INFO - __main__ - Step 7021: {'lr': 0.0004985819786325614, 'samples': 1348032, 'steps': 7020, 'loss/train': 1.7012065649032593} -11/06/2021 22:13:59 - INFO - __main__ - Step 7022: {'lr': 0.0004985814141624856, 'samples': 1348224, 'steps': 7021, 'loss/train': 1.9966686964035034} -11/06/2021 22:13:59 - INFO - __main__ - Step 7023: {'lr': 0.000498580849580403, 'samples': 1348416, 'steps': 7022, 'loss/train': 1.7305803298950195} -11/06/2021 22:13:59 - INFO - __main__ - Step 7024: {'lr': 0.0004985802848863135, 'samples': 1348608, 'steps': 7023, 'loss/train': 2.0270166397094727} -11/06/2021 22:14:00 - INFO - __main__ - Step 7025: {'lr': 0.0004985797200802176, 'samples': 1348800, 'steps': 7024, 'loss/train': 2.123034715652466} -11/06/2021 22:14:01 - INFO - __main__ - Step 7026: {'lr': 0.0004985791551621158, 'samples': 1348992, 'steps': 7025, 'loss/train': 1.589381456375122} -11/06/2021 22:14:01 - INFO - __main__ - Step 7027: {'lr': 0.0004985785901320078, 'samples': 1349184, 'steps': 7026, 'loss/train': 1.8792399168014526} -11/06/2021 22:14:02 - INFO - __main__ - Step 7028: {'lr': 0.0004985780249898941, 'samples': 1349376, 'steps': 7027, 'loss/train': 1.8955899477005005} -11/06/2021 22:14:02 - INFO - __main__ - Step 7029: {'lr': 0.0004985774597357751, 'samples': 1349568, 'steps': 7028, 'loss/train': 2.0755574703216553} -11/06/2021 22:14:03 - INFO - __main__ - Step 7030: {'lr': 0.0004985768943696509, 'samples': 1349760, 'steps': 7029, 'loss/train': 1.896838903427124} -11/06/2021 22:14:03 - INFO - __main__ - Step 7031: {'lr': 0.0004985763288915217, 'samples': 1349952, 'steps': 7030, 'loss/train': 2.0868396759033203} -11/06/2021 22:14:04 - INFO - __main__ - Step 7032: {'lr': 0.0004985757633013879, 'samples': 1350144, 'steps': 7031, 'loss/train': 1.9611470699310303} -11/06/2021 22:14:04 - INFO - __main__ - Step 7033: {'lr': 0.0004985751975992497, 'samples': 1350336, 'steps': 7032, 'loss/train': 2.039046287536621} -11/06/2021 22:14:04 - INFO - __main__ - Step 7034: {'lr': 0.0004985746317851074, 'samples': 1350528, 'steps': 7033, 'loss/train': 2.1592774391174316} -11/06/2021 22:14:05 - INFO - __main__ - Step 7035: {'lr': 0.0004985740658589612, 'samples': 1350720, 'steps': 7034, 'loss/train': 1.7554975748062134} -11/06/2021 22:14:06 - INFO - __main__ - Step 7036: {'lr': 0.0004985734998208112, 'samples': 1350912, 'steps': 7035, 'loss/train': 1.64145028591156} -11/06/2021 22:14:06 - INFO - __main__ - Step 7037: {'lr': 0.000498572933670658, 'samples': 1351104, 'steps': 7036, 'loss/train': 1.8642250299453735} -11/06/2021 22:14:06 - INFO - __main__ - Step 7038: {'lr': 0.0004985723674085016, 'samples': 1351296, 'steps': 7037, 'loss/train': 1.789941430091858} -11/06/2021 22:14:07 - INFO - __main__ - Step 7039: {'lr': 0.0004985718010343424, 'samples': 1351488, 'steps': 7038, 'loss/train': 2.0578839778900146} -11/06/2021 22:14:08 - INFO - __main__ - Step 7040: {'lr': 0.0004985712345481805, 'samples': 1351680, 'steps': 7039, 'loss/train': 1.8973031044006348} -11/06/2021 22:14:08 - INFO - __main__ - Step 7041: {'lr': 0.0004985706679500163, 'samples': 1351872, 'steps': 7040, 'loss/train': 2.2261483669281006} -11/06/2021 22:14:08 - INFO - __main__ - Step 7042: {'lr': 0.0004985701012398499, 'samples': 1352064, 'steps': 7041, 'loss/train': 2.026362657546997} -11/06/2021 22:14:09 - INFO - __main__ - Step 7043: {'lr': 0.0004985695344176817, 'samples': 1352256, 'steps': 7042, 'loss/train': 2.370086669921875} -11/06/2021 22:14:09 - INFO - __main__ - Step 7044: {'lr': 0.0004985689674835119, 'samples': 1352448, 'steps': 7043, 'loss/train': 1.789720058441162} -11/06/2021 22:14:10 - INFO - __main__ - Step 7045: {'lr': 0.0004985684004373409, 'samples': 1352640, 'steps': 7044, 'loss/train': 1.5516489744186401} -11/06/2021 22:14:10 - INFO - __main__ - Step 7046: {'lr': 0.0004985678332791686, 'samples': 1352832, 'steps': 7045, 'loss/train': 1.1448746919631958} -11/06/2021 22:14:11 - INFO - __main__ - Step 7047: {'lr': 0.0004985672660089956, 'samples': 1353024, 'steps': 7046, 'loss/train': 1.9174386262893677} -11/06/2021 22:14:11 - INFO - __main__ - Step 7048: {'lr': 0.000498566698626822, 'samples': 1353216, 'steps': 7047, 'loss/train': 2.0857248306274414} -11/06/2021 22:14:12 - INFO - __main__ - Step 7049: {'lr': 0.000498566131132648, 'samples': 1353408, 'steps': 7048, 'loss/train': 1.5200681686401367} -11/06/2021 22:14:13 - INFO - __main__ - Step 7050: {'lr': 0.0004985655635264739, 'samples': 1353600, 'steps': 7049, 'loss/train': 2.0432159900665283} -11/06/2021 22:14:13 - INFO - __main__ - Step 7051: {'lr': 0.0004985649958083001, 'samples': 1353792, 'steps': 7050, 'loss/train': 2.034838914871216} -11/06/2021 22:14:13 - INFO - __main__ - Step 7052: {'lr': 0.0004985644279781268, 'samples': 1353984, 'steps': 7051, 'loss/train': 2.010187864303589} -11/06/2021 22:14:14 - INFO - __main__ - Step 7053: {'lr': 0.0004985638600359542, 'samples': 1354176, 'steps': 7052, 'loss/train': 2.2024543285369873} -11/06/2021 22:14:14 - INFO - __main__ - Step 7054: {'lr': 0.0004985632919817824, 'samples': 1354368, 'steps': 7053, 'loss/train': 2.1596481800079346} -11/06/2021 22:14:14 - INFO - __main__ - Step 7055: {'lr': 0.000498562723815612, 'samples': 1354560, 'steps': 7054, 'loss/train': 1.9444608688354492} -11/06/2021 22:14:15 - INFO - __main__ - Step 7056: {'lr': 0.000498562155537443, 'samples': 1354752, 'steps': 7055, 'loss/train': 1.5930293798446655} -11/06/2021 22:14:16 - INFO - __main__ - Step 7057: {'lr': 0.0004985615871472757, 'samples': 1354944, 'steps': 7056, 'loss/train': 2.356843948364258} -11/06/2021 22:14:16 - INFO - __main__ - Step 7058: {'lr': 0.0004985610186451104, 'samples': 1355136, 'steps': 7057, 'loss/train': 2.400442123413086} -11/06/2021 22:14:16 - INFO - __main__ - Step 7059: {'lr': 0.0004985604500309473, 'samples': 1355328, 'steps': 7058, 'loss/train': 1.9683334827423096} -11/06/2021 22:14:17 - INFO - __main__ - Step 7060: {'lr': 0.0004985598813047868, 'samples': 1355520, 'steps': 7059, 'loss/train': 2.3564374446868896} -11/06/2021 22:14:18 - INFO - __main__ - Step 7061: {'lr': 0.000498559312466629, 'samples': 1355712, 'steps': 7060, 'loss/train': 2.06729793548584} -11/06/2021 22:14:18 - INFO - __main__ - Step 7062: {'lr': 0.0004985587435164742, 'samples': 1355904, 'steps': 7061, 'loss/train': 2.2818222045898438} -11/06/2021 22:14:19 - INFO - __main__ - Step 7063: {'lr': 0.0004985581744543226, 'samples': 1356096, 'steps': 7062, 'loss/train': 2.8262219429016113} -11/06/2021 22:14:19 - INFO - __main__ - Step 7064: {'lr': 0.0004985576052801747, 'samples': 1356288, 'steps': 7063, 'loss/train': 2.252566337585449} -11/06/2021 22:14:19 - INFO - __main__ - Step 7065: {'lr': 0.0004985570359940304, 'samples': 1356480, 'steps': 7064, 'loss/train': 1.9672572612762451} -11/06/2021 22:14:20 - INFO - __main__ - Step 7066: {'lr': 0.0004985564665958901, 'samples': 1356672, 'steps': 7065, 'loss/train': 1.8801449537277222} -11/06/2021 22:14:21 - INFO - __main__ - Step 7067: {'lr': 0.0004985558970857543, 'samples': 1356864, 'steps': 7066, 'loss/train': 2.165799379348755} -11/06/2021 22:14:21 - INFO - __main__ - Step 7068: {'lr': 0.000498555327463623, 'samples': 1357056, 'steps': 7067, 'loss/train': 1.7966886758804321} -11/06/2021 22:14:21 - INFO - __main__ - Step 7069: {'lr': 0.0004985547577294963, 'samples': 1357248, 'steps': 7068, 'loss/train': 1.4728955030441284} -11/06/2021 22:14:22 - INFO - __main__ - Step 7070: {'lr': 0.0004985541878833749, 'samples': 1357440, 'steps': 7069, 'loss/train': 1.446349024772644} -11/06/2021 22:14:23 - INFO - __main__ - Step 7071: {'lr': 0.0004985536179252587, 'samples': 1357632, 'steps': 7070, 'loss/train': 1.8138748407363892} -11/06/2021 22:14:23 - INFO - __main__ - Step 7072: {'lr': 0.0004985530478551481, 'samples': 1357824, 'steps': 7071, 'loss/train': 1.72260582447052} -11/06/2021 22:14:23 - INFO - __main__ - Step 7073: {'lr': 0.0004985524776730434, 'samples': 1358016, 'steps': 7072, 'loss/train': 2.2067058086395264} -11/06/2021 22:14:24 - INFO - __main__ - Step 7074: {'lr': 0.0004985519073789447, 'samples': 1358208, 'steps': 7073, 'loss/train': 2.0647716522216797} -11/06/2021 22:14:24 - INFO - __main__ - Step 7075: {'lr': 0.0004985513369728524, 'samples': 1358400, 'steps': 7074, 'loss/train': 1.755244255065918} -11/06/2021 22:14:26 - INFO - __main__ - Step 7076: {'lr': 0.0004985507664547666, 'samples': 1358592, 'steps': 7075, 'loss/train': 2.965153455734253} -11/06/2021 22:14:26 - INFO - __main__ - Step 7077: {'lr': 0.0004985501958246878, 'samples': 1358784, 'steps': 7076, 'loss/train': 2.4291107654571533} -11/06/2021 22:14:26 - INFO - __main__ - Step 7078: {'lr': 0.000498549625082616, 'samples': 1358976, 'steps': 7077, 'loss/train': 1.5984909534454346} -11/06/2021 22:14:27 - INFO - __main__ - Step 7079: {'lr': 0.0004985490542285516, 'samples': 1359168, 'steps': 7078, 'loss/train': 2.098381519317627} -11/06/2021 22:14:27 - INFO - __main__ - Step 7080: {'lr': 0.0004985484832624949, 'samples': 1359360, 'steps': 7079, 'loss/train': 1.983779788017273} -11/06/2021 22:14:27 - INFO - __main__ - Step 7081: {'lr': 0.000498547912184446, 'samples': 1359552, 'steps': 7080, 'loss/train': 2.0644752979278564} -11/06/2021 22:14:28 - INFO - __main__ - Step 7082: {'lr': 0.0004985473409944054, 'samples': 1359744, 'steps': 7081, 'loss/train': 1.7944436073303223} -11/06/2021 22:14:29 - INFO - __main__ - Step 7083: {'lr': 0.000498546769692373, 'samples': 1359936, 'steps': 7082, 'loss/train': 2.2252354621887207} -11/06/2021 22:14:29 - INFO - __main__ - Step 7084: {'lr': 0.0004985461982783494, 'samples': 1360128, 'steps': 7083, 'loss/train': 1.653979778289795} -11/06/2021 22:14:30 - INFO - __main__ - Step 7085: {'lr': 0.0004985456267523346, 'samples': 1360320, 'steps': 7084, 'loss/train': 1.65984308719635} -11/06/2021 22:14:30 - INFO - __main__ - Step 7086: {'lr': 0.0004985450551143291, 'samples': 1360512, 'steps': 7085, 'loss/train': 2.264176607131958} -11/06/2021 22:14:31 - INFO - __main__ - Step 7087: {'lr': 0.000498544483364333, 'samples': 1360704, 'steps': 7086, 'loss/train': 2.1907835006713867} -11/06/2021 22:14:31 - INFO - __main__ - Step 7088: {'lr': 0.0004985439115023465, 'samples': 1360896, 'steps': 7087, 'loss/train': 1.8847299814224243} -11/06/2021 22:14:32 - INFO - __main__ - Step 7089: {'lr': 0.0004985433395283701, 'samples': 1361088, 'steps': 7088, 'loss/train': 1.9816615581512451} -11/06/2021 22:14:32 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 1.8997712135314941} -11/06/2021 22:14:32 - INFO - __main__ - Step 7091: {'lr': 0.000498542195244448, 'samples': 1361472, 'steps': 7090, 'loss/train': 1.139441967010498} -11/06/2021 22:14:33 - INFO - __main__ - Step 7092: {'lr': 0.0004985416229345029, 'samples': 1361664, 'steps': 7091, 'loss/train': 1.571520209312439} -11/06/2021 22:14:34 - INFO - __main__ - Step 7093: {'lr': 0.0004985410505125689, 'samples': 1361856, 'steps': 7092, 'loss/train': 2.138139486312866} -11/06/2021 22:14:34 - INFO - __main__ - Step 7094: {'lr': 0.0004985404779786459, 'samples': 1362048, 'steps': 7093, 'loss/train': 2.261357545852661} -11/06/2021 22:14:35 - INFO - __main__ - Step 7095: {'lr': 0.0004985399053327346, 'samples': 1362240, 'steps': 7094, 'loss/train': 1.7595309019088745} -11/06/2021 22:14:35 - INFO - __main__ - Step 7096: {'lr': 0.000498539332574835, 'samples': 1362432, 'steps': 7095, 'loss/train': 1.8926126956939697} -11/06/2021 22:14:35 - INFO - __main__ - Step 7097: {'lr': 0.0004985387597049474, 'samples': 1362624, 'steps': 7096, 'loss/train': 2.004615306854248} -11/06/2021 22:14:37 - INFO - __main__ - Step 7098: {'lr': 0.0004985381867230721, 'samples': 1362816, 'steps': 7097, 'loss/train': 1.6198385953903198} -11/06/2021 22:14:37 - INFO - __main__ - Step 7099: {'lr': 0.0004985376136292093, 'samples': 1363008, 'steps': 7098, 'loss/train': 1.9833897352218628} -11/06/2021 22:14:37 - INFO - __main__ - Step 7100: {'lr': 0.0004985370404233592, 'samples': 1363200, 'steps': 7099, 'loss/train': 1.9819221496582031} -11/06/2021 22:14:38 - INFO - __main__ - Step 7101: {'lr': 0.0004985364671055223, 'samples': 1363392, 'steps': 7100, 'loss/train': 2.0017964839935303} -11/06/2021 22:14:38 - INFO - __main__ - Step 7102: {'lr': 0.0004985358936756985, 'samples': 1363584, 'steps': 7101, 'loss/train': 1.8916939496994019} -11/06/2021 22:14:38 - INFO - __main__ - Step 7103: {'lr': 0.0004985353201338885, 'samples': 1363776, 'steps': 7102, 'loss/train': 1.6781333684921265} -11/06/2021 22:14:39 - INFO - __main__ - Step 7104: {'lr': 0.0004985347464800921, 'samples': 1363968, 'steps': 7103, 'loss/train': 0.41633597016334534} -11/06/2021 22:14:40 - INFO - __main__ - Step 7105: {'lr': 0.0004985341727143099, 'samples': 1364160, 'steps': 7104, 'loss/train': 1.5315263271331787} -11/06/2021 22:14:40 - INFO - __main__ - Step 7106: {'lr': 0.000498533598836542, 'samples': 1364352, 'steps': 7105, 'loss/train': 1.2057009935379028} -11/06/2021 22:14:40 - INFO - __main__ - Step 7107: {'lr': 0.0004985330248467888, 'samples': 1364544, 'steps': 7106, 'loss/train': 1.7681790590286255} -11/06/2021 22:14:41 - INFO - __main__ - Step 7108: {'lr': 0.0004985324507450504, 'samples': 1364736, 'steps': 7107, 'loss/train': 1.7636619806289673} -11/06/2021 22:14:42 - INFO - __main__ - Step 7109: {'lr': 0.000498531876531327, 'samples': 1364928, 'steps': 7108, 'loss/train': 1.970746397972107} -11/06/2021 22:14:42 - INFO - __main__ - Step 7110: {'lr': 0.0004985313022056191, 'samples': 1365120, 'steps': 7109, 'loss/train': 1.8806291818618774} -11/06/2021 22:14:43 - INFO - __main__ - Step 7111: {'lr': 0.0004985307277679267, 'samples': 1365312, 'steps': 7110, 'loss/train': 1.3008683919906616} -11/06/2021 22:14:43 - INFO - __main__ - Step 7112: {'lr': 0.0004985301532182503, 'samples': 1365504, 'steps': 7111, 'loss/train': 1.9515055418014526} -11/06/2021 22:14:43 - INFO - __main__ - Step 7113: {'lr': 0.0004985295785565901, 'samples': 1365696, 'steps': 7112, 'loss/train': 1.8485970497131348} -11/06/2021 22:14:44 - INFO - __main__ - Step 7114: {'lr': 0.0004985290037829462, 'samples': 1365888, 'steps': 7113, 'loss/train': 3.7923812866210938} -11/06/2021 22:14:45 - INFO - __main__ - Step 7115: {'lr': 0.000498528428897319, 'samples': 1366080, 'steps': 7114, 'loss/train': 1.5386725664138794} -11/06/2021 22:14:45 - INFO - __main__ - Step 7116: {'lr': 0.0004985278538997088, 'samples': 1366272, 'steps': 7115, 'loss/train': 2.0282657146453857} -11/06/2021 22:14:45 - INFO - __main__ - Step 7117: {'lr': 0.0004985272787901156, 'samples': 1366464, 'steps': 7116, 'loss/train': 2.3269381523132324} -11/06/2021 22:14:46 - INFO - __main__ - Step 7118: {'lr': 0.00049852670356854, 'samples': 1366656, 'steps': 7117, 'loss/train': 1.7581599950790405} -11/06/2021 22:14:47 - INFO - __main__ - Step 7119: {'lr': 0.000498526128234982, 'samples': 1366848, 'steps': 7118, 'loss/train': 2.1720402240753174} -11/06/2021 22:14:47 - INFO - __main__ - Step 7120: {'lr': 0.000498525552789442, 'samples': 1367040, 'steps': 7119, 'loss/train': 1.491886019706726} -11/06/2021 22:14:48 - INFO - __main__ - Step 7121: {'lr': 0.0004985249772319202, 'samples': 1367232, 'steps': 7120, 'loss/train': 2.0638139247894287} -11/06/2021 22:14:48 - INFO - __main__ - Step 7122: {'lr': 0.000498524401562417, 'samples': 1367424, 'steps': 7121, 'loss/train': 1.7350369691848755} -11/06/2021 22:14:48 - INFO - __main__ - Step 7123: {'lr': 0.0004985238257809325, 'samples': 1367616, 'steps': 7122, 'loss/train': 2.518477201461792} -11/06/2021 22:14:49 - INFO - __main__ - Step 7124: {'lr': 0.0004985232498874669, 'samples': 1367808, 'steps': 7123, 'loss/train': 1.7711327075958252} -11/06/2021 22:14:50 - INFO - __main__ - Step 7125: {'lr': 0.0004985226738820207, 'samples': 1368000, 'steps': 7124, 'loss/train': 1.2557427883148193} -11/06/2021 22:14:50 - INFO - __main__ - Step 7126: {'lr': 0.0004985220977645939, 'samples': 1368192, 'steps': 7125, 'loss/train': 2.177485942840576} -11/06/2021 22:14:50 - INFO - __main__ - Step 7127: {'lr': 0.0004985215215351869, 'samples': 1368384, 'steps': 7126, 'loss/train': 1.9587048292160034} -11/06/2021 22:14:51 - INFO - __main__ - Step 7128: {'lr': 0.0004985209451937999, 'samples': 1368576, 'steps': 7127, 'loss/train': 2.1263420581817627} -11/06/2021 22:14:51 - INFO - __main__ - Step 7129: {'lr': 0.0004985203687404333, 'samples': 1368768, 'steps': 7128, 'loss/train': 1.8560582399368286} -11/06/2021 22:14:52 - INFO - __main__ - Step 7130: {'lr': 0.0004985197921750871, 'samples': 1368960, 'steps': 7129, 'loss/train': 1.6565303802490234} -11/06/2021 22:14:52 - INFO - __main__ - Step 7131: {'lr': 0.0004985192154977619, 'samples': 1369152, 'steps': 7130, 'loss/train': 1.868842601776123} -11/06/2021 22:14:53 - INFO - __main__ - Step 7132: {'lr': 0.0004985186387084577, 'samples': 1369344, 'steps': 7131, 'loss/train': 1.80448317527771} -11/06/2021 22:14:53 - INFO - __main__ - Step 7133: {'lr': 0.0004985180618071748, 'samples': 1369536, 'steps': 7132, 'loss/train': 1.7268800735473633} -11/06/2021 22:14:53 - INFO - __main__ - Step 7134: {'lr': 0.0004985174847939135, 'samples': 1369728, 'steps': 7133, 'loss/train': 2.039775848388672} -11/06/2021 22:14:55 - INFO - __main__ - Step 7135: {'lr': 0.0004985169076686741, 'samples': 1369920, 'steps': 7134, 'loss/train': 1.5857948064804077} -11/06/2021 22:14:55 - INFO - __main__ - Step 7136: {'lr': 0.0004985163304314568, 'samples': 1370112, 'steps': 7135, 'loss/train': 1.8448445796966553} -11/06/2021 22:14:55 - INFO - __main__ - Step 7137: {'lr': 0.0004985157530822619, 'samples': 1370304, 'steps': 7136, 'loss/train': 1.450709342956543} -11/06/2021 22:14:56 - INFO - __main__ - Step 7138: {'lr': 0.0004985151756210897, 'samples': 1370496, 'steps': 7137, 'loss/train': 1.8486833572387695} -11/06/2021 22:14:56 - INFO - __main__ - Step 7139: {'lr': 0.0004985145980479402, 'samples': 1370688, 'steps': 7138, 'loss/train': 1.828140377998352} -11/06/2021 22:14:57 - INFO - __main__ - Step 7140: {'lr': 0.000498514020362814, 'samples': 1370880, 'steps': 7139, 'loss/train': 1.5421890020370483} -11/06/2021 22:14:57 - INFO - __main__ - Step 7141: {'lr': 0.0004985134425657111, 'samples': 1371072, 'steps': 7140, 'loss/train': 2.6949613094329834} -11/06/2021 22:14:58 - INFO - __main__ - Step 7142: {'lr': 0.000498512864656632, 'samples': 1371264, 'steps': 7141, 'loss/train': 1.5988658666610718} -11/06/2021 22:14:58 - INFO - __main__ - Step 7143: {'lr': 0.0004985122866355768, 'samples': 1371456, 'steps': 7142, 'loss/train': 2.1116602420806885} -11/06/2021 22:14:58 - INFO - __main__ - Step 7144: {'lr': 0.0004985117085025458, 'samples': 1371648, 'steps': 7143, 'loss/train': 2.3443734645843506} -11/06/2021 22:14:59 - INFO - __main__ - Step 7145: {'lr': 0.0004985111302575392, 'samples': 1371840, 'steps': 7144, 'loss/train': 1.9202158451080322} -11/06/2021 22:15:00 - INFO - __main__ - Step 7146: {'lr': 0.0004985105519005573, 'samples': 1372032, 'steps': 7145, 'loss/train': 1.7188575267791748} -11/06/2021 22:15:00 - INFO - __main__ - Step 7147: {'lr': 0.0004985099734316006, 'samples': 1372224, 'steps': 7146, 'loss/train': 1.5859005451202393} -11/06/2021 22:15:00 - INFO - __main__ - Step 7148: {'lr': 0.0004985093948506689, 'samples': 1372416, 'steps': 7147, 'loss/train': 1.5859280824661255} -11/06/2021 22:15:01 - INFO - __main__ - Step 7149: {'lr': 0.0004985088161577628, 'samples': 1372608, 'steps': 7148, 'loss/train': 1.8605209589004517} -11/06/2021 22:15:01 - INFO - __main__ - Step 7150: {'lr': 0.0004985082373528825, 'samples': 1372800, 'steps': 7149, 'loss/train': 2.1094627380371094} -11/06/2021 22:15:02 - INFO - __main__ - Step 7151: {'lr': 0.0004985076584360282, 'samples': 1372992, 'steps': 7150, 'loss/train': 2.0223774909973145} -11/06/2021 22:15:03 - INFO - __main__ - Step 7152: {'lr': 0.0004985070794072002, 'samples': 1373184, 'steps': 7151, 'loss/train': 2.0557656288146973} -11/06/2021 22:15:03 - INFO - __main__ - Step 7153: {'lr': 0.0004985065002663986, 'samples': 1373376, 'steps': 7152, 'loss/train': 1.9789502620697021} -11/06/2021 22:15:03 - INFO - __main__ - Step 7154: {'lr': 0.000498505921013624, 'samples': 1373568, 'steps': 7153, 'loss/train': 1.9508652687072754} -11/06/2021 22:15:04 - INFO - __main__ - Step 7155: {'lr': 0.0004985053416488764, 'samples': 1373760, 'steps': 7154, 'loss/train': 2.078094244003296} -11/06/2021 22:15:05 - INFO - __main__ - Step 7156: {'lr': 0.0004985047621721561, 'samples': 1373952, 'steps': 7155, 'loss/train': 0.8238686323165894} -11/06/2021 22:15:05 - INFO - __main__ - Step 7157: {'lr': 0.0004985041825834634, 'samples': 1374144, 'steps': 7156, 'loss/train': 1.8907822370529175} -11/06/2021 22:15:05 - INFO - __main__ - Step 7158: {'lr': 0.0004985036028827986, 'samples': 1374336, 'steps': 7157, 'loss/train': 2.6892762184143066} -11/06/2021 22:15:06 - INFO - __main__ - Step 7159: {'lr': 0.0004985030230701619, 'samples': 1374528, 'steps': 7158, 'loss/train': 2.3940746784210205} -11/06/2021 22:15:06 - INFO - __main__ - Step 7160: {'lr': 0.0004985024431455534, 'samples': 1374720, 'steps': 7159, 'loss/train': 1.8155590295791626} -11/06/2021 22:15:07 - INFO - __main__ - Step 7161: {'lr': 0.0004985018631089738, 'samples': 1374912, 'steps': 7160, 'loss/train': 2.003696918487549} -11/06/2021 22:15:07 - INFO - __main__ - Step 7162: {'lr': 0.0004985012829604228, 'samples': 1375104, 'steps': 7161, 'loss/train': 1.8686398267745972} -11/06/2021 22:15:08 - INFO - __main__ - Step 7163: {'lr': 0.0004985007026999011, 'samples': 1375296, 'steps': 7162, 'loss/train': 1.7682377099990845} -11/06/2021 22:15:08 - INFO - __main__ - Step 7164: {'lr': 0.0004985001223274089, 'samples': 1375488, 'steps': 7163, 'loss/train': 2.357848644256592} -11/06/2021 22:15:08 - INFO - __main__ - Step 7165: {'lr': 0.0004984995418429463, 'samples': 1375680, 'steps': 7164, 'loss/train': 2.2802202701568604} -11/06/2021 22:15:09 - INFO - __main__ - Step 7166: {'lr': 0.0004984989612465137, 'samples': 1375872, 'steps': 7165, 'loss/train': 2.0252628326416016} -11/06/2021 22:15:10 - INFO - __main__ - Step 7167: {'lr': 0.0004984983805381112, 'samples': 1376064, 'steps': 7166, 'loss/train': 1.8542309999465942} -11/06/2021 22:15:10 - INFO - __main__ - Step 7168: {'lr': 0.0004984977997177393, 'samples': 1376256, 'steps': 7167, 'loss/train': 1.5369564294815063} -11/06/2021 22:15:10 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 1.955859899520874} -11/06/2021 22:15:11 - INFO - __main__ - Step 7170: {'lr': 0.0004984966377410878, 'samples': 1376640, 'steps': 7169, 'loss/train': 2.5765957832336426} -11/06/2021 22:15:12 - INFO - __main__ - Step 7171: {'lr': 0.0004984960565848086, 'samples': 1376832, 'steps': 7170, 'loss/train': 2.264620304107666} -11/06/2021 22:15:12 - INFO - __main__ - Step 7172: {'lr': 0.0004984954753165612, 'samples': 1377024, 'steps': 7171, 'loss/train': 1.8249037265777588} -11/06/2021 22:15:13 - INFO - __main__ - Step 7173: {'lr': 0.0004984948939363455, 'samples': 1377216, 'steps': 7172, 'loss/train': 1.3821079730987549} -11/06/2021 22:15:13 - INFO - __main__ - Step 7174: {'lr': 0.0004984943124441617, 'samples': 1377408, 'steps': 7173, 'loss/train': 1.980968952178955} -11/06/2021 22:15:13 - INFO - __main__ - Step 7175: {'lr': 0.0004984937308400104, 'samples': 1377600, 'steps': 7174, 'loss/train': 1.0405446290969849} -11/06/2021 22:15:15 - INFO - __main__ - Step 7176: {'lr': 0.0004984931491238915, 'samples': 1377792, 'steps': 7175, 'loss/train': 2.0840656757354736} -11/06/2021 22:15:15 - INFO - __main__ - Step 7177: {'lr': 0.0004984925672958055, 'samples': 1377984, 'steps': 7176, 'loss/train': 1.7736377716064453} -11/06/2021 22:15:15 - INFO - __main__ - Step 7178: {'lr': 0.0004984919853557526, 'samples': 1378176, 'steps': 7177, 'loss/train': 2.2246837615966797} -11/06/2021 22:15:16 - INFO - __main__ - Step 7179: {'lr': 0.000498491403303733, 'samples': 1378368, 'steps': 7178, 'loss/train': 2.4547572135925293} -11/06/2021 22:15:16 - INFO - __main__ - Step 7180: {'lr': 0.000498490821139747, 'samples': 1378560, 'steps': 7179, 'loss/train': 1.4960209131240845} -11/06/2021 22:15:16 - INFO - __main__ - Step 7181: {'lr': 0.0004984902388637949, 'samples': 1378752, 'steps': 7180, 'loss/train': 1.8791706562042236} -11/06/2021 22:15:17 - INFO - __main__ - Step 7182: {'lr': 0.000498489656475877, 'samples': 1378944, 'steps': 7181, 'loss/train': 2.0455527305603027} -11/06/2021 22:15:18 - INFO - __main__ - Step 7183: {'lr': 0.0004984890739759934, 'samples': 1379136, 'steps': 7182, 'loss/train': 1.8560911417007446} -11/06/2021 22:15:18 - INFO - __main__ - Step 7184: {'lr': 0.0004984884913641444, 'samples': 1379328, 'steps': 7183, 'loss/train': 2.0507397651672363} -11/06/2021 22:15:18 - INFO - __main__ - Step 7185: {'lr': 0.0004984879086403304, 'samples': 1379520, 'steps': 7184, 'loss/train': 2.017399311065674} -11/06/2021 22:15:19 - INFO - __main__ - Step 7186: {'lr': 0.0004984873258045517, 'samples': 1379712, 'steps': 7185, 'loss/train': 1.7196428775787354} -11/06/2021 22:15:19 - INFO - __main__ - Step 7187: {'lr': 0.0004984867428568083, 'samples': 1379904, 'steps': 7186, 'loss/train': 1.79092276096344} -11/06/2021 22:15:20 - INFO - __main__ - Step 7188: {'lr': 0.0004984861597971006, 'samples': 1380096, 'steps': 7187, 'loss/train': 2.169832468032837} -11/06/2021 22:15:21 - INFO - __main__ - Step 7189: {'lr': 0.000498485576625429, 'samples': 1380288, 'steps': 7188, 'loss/train': 1.9039487838745117} -11/06/2021 22:15:21 - INFO - __main__ - Step 7190: {'lr': 0.0004984849933417935, 'samples': 1380480, 'steps': 7189, 'loss/train': 1.6038901805877686} -11/06/2021 22:15:21 - INFO - __main__ - Step 7191: {'lr': 0.0004984844099461945, 'samples': 1380672, 'steps': 7190, 'loss/train': 1.7970324754714966} -11/06/2021 22:15:22 - INFO - __main__ - Step 7192: {'lr': 0.0004984838264386322, 'samples': 1380864, 'steps': 7191, 'loss/train': 1.7720707654953003} -11/06/2021 22:15:23 - INFO - __main__ - Step 7193: {'lr': 0.000498483242819107, 'samples': 1381056, 'steps': 7192, 'loss/train': 1.6350319385528564} -11/06/2021 22:15:23 - INFO - __main__ - Step 7194: {'lr': 0.0004984826590876192, 'samples': 1381248, 'steps': 7193, 'loss/train': 1.857775092124939} -11/06/2021 22:15:23 - INFO - __main__ - Step 7195: {'lr': 0.0004984820752441688, 'samples': 1381440, 'steps': 7194, 'loss/train': 1.664402961730957} -11/06/2021 22:15:24 - INFO - __main__ - Step 7196: {'lr': 0.0004984814912887563, 'samples': 1381632, 'steps': 7195, 'loss/train': 2.1821253299713135} -11/06/2021 22:15:24 - INFO - __main__ - Step 7197: {'lr': 0.0004984809072213818, 'samples': 1381824, 'steps': 7196, 'loss/train': 1.2754813432693481} -11/06/2021 22:15:25 - INFO - __main__ - Step 7198: {'lr': 0.0004984803230420457, 'samples': 1382016, 'steps': 7197, 'loss/train': 1.7471867799758911} -11/06/2021 22:15:25 - INFO - __main__ - Step 7199: {'lr': 0.0004984797387507481, 'samples': 1382208, 'steps': 7198, 'loss/train': 1.889627456665039} -11/06/2021 22:15:26 - INFO - __main__ - Step 7200: {'lr': 0.0004984791543474896, 'samples': 1382400, 'steps': 7199, 'loss/train': 1.987942099571228} -11/06/2021 22:15:26 - INFO - __main__ - Step 7201: {'lr': 0.0004984785698322699, 'samples': 1382592, 'steps': 7200, 'loss/train': 1.3614236116409302} -11/06/2021 22:15:26 - INFO - __main__ - Step 7202: {'lr': 0.0004984779852050898, 'samples': 1382784, 'steps': 7201, 'loss/train': 1.576859712600708} -11/06/2021 22:15:28 - INFO - __main__ - Step 7203: {'lr': 0.0004984774004659493, 'samples': 1382976, 'steps': 7202, 'loss/train': 2.200059413909912} -11/06/2021 22:15:28 - INFO - __main__ - Step 7204: {'lr': 0.0004984768156148489, 'samples': 1383168, 'steps': 7203, 'loss/train': 2.1063573360443115} -11/06/2021 22:15:28 - INFO - __main__ - Step 7205: {'lr': 0.0004984762306517883, 'samples': 1383360, 'steps': 7204, 'loss/train': 2.0486106872558594} -11/06/2021 22:15:29 - INFO - __main__ - Step 7206: {'lr': 0.0004984756455767684, 'samples': 1383552, 'steps': 7205, 'loss/train': 1.8581416606903076} -11/06/2021 22:15:29 - INFO - __main__ - Step 7207: {'lr': 0.0004984750603897892, 'samples': 1383744, 'steps': 7206, 'loss/train': 1.1366732120513916} -11/06/2021 22:15:29 - INFO - __main__ - Step 7208: {'lr': 0.0004984744750908509, 'samples': 1383936, 'steps': 7207, 'loss/train': 1.8445619344711304} -11/06/2021 22:15:30 - INFO - __main__ - Step 7209: {'lr': 0.0004984738896799539, 'samples': 1384128, 'steps': 7208, 'loss/train': 2.4114151000976562} -11/06/2021 22:15:31 - INFO - __main__ - Step 7210: {'lr': 0.0004984733041570983, 'samples': 1384320, 'steps': 7209, 'loss/train': 1.8552770614624023} -11/06/2021 22:15:31 - INFO - __main__ - Step 7211: {'lr': 0.0004984727185222846, 'samples': 1384512, 'steps': 7210, 'loss/train': 2.154346466064453} -11/06/2021 22:15:31 - INFO - __main__ - Step 7212: {'lr': 0.0004984721327755128, 'samples': 1384704, 'steps': 7211, 'loss/train': 2.079803466796875} -11/06/2021 22:15:32 - INFO - __main__ - Step 7213: {'lr': 0.0004984715469167835, 'samples': 1384896, 'steps': 7212, 'loss/train': 1.798585295677185} -11/06/2021 22:15:33 - INFO - __main__ - Step 7214: {'lr': 0.0004984709609460966, 'samples': 1385088, 'steps': 7213, 'loss/train': 1.8755601644515991} -11/06/2021 22:15:33 - INFO - __main__ - Step 7215: {'lr': 0.0004984703748634524, 'samples': 1385280, 'steps': 7214, 'loss/train': 1.9229755401611328} -11/06/2021 22:15:33 - INFO - __main__ - Step 7216: {'lr': 0.0004984697886688514, 'samples': 1385472, 'steps': 7215, 'loss/train': 2.1766183376312256} -11/06/2021 22:15:34 - INFO - __main__ - Step 7217: {'lr': 0.0004984692023622938, 'samples': 1385664, 'steps': 7216, 'loss/train': 2.0930893421173096} -11/06/2021 22:15:34 - INFO - __main__ - Step 7218: {'lr': 0.0004984686159437798, 'samples': 1385856, 'steps': 7217, 'loss/train': 1.6894450187683105} -11/06/2021 22:15:35 - INFO - __main__ - Step 7219: {'lr': 0.0004984680294133096, 'samples': 1386048, 'steps': 7218, 'loss/train': 2.3785271644592285} -11/06/2021 22:15:35 - INFO - __main__ - Step 7220: {'lr': 0.0004984674427708836, 'samples': 1386240, 'steps': 7219, 'loss/train': 2.290306806564331} -11/06/2021 22:15:36 - INFO - __main__ - Step 7221: {'lr': 0.000498466856016502, 'samples': 1386432, 'steps': 7220, 'loss/train': 1.620937705039978} -11/06/2021 22:15:36 - INFO - __main__ - Step 7222: {'lr': 0.000498466269150165, 'samples': 1386624, 'steps': 7221, 'loss/train': 1.4030883312225342} -11/06/2021 22:15:36 - INFO - __main__ - Step 7223: {'lr': 0.000498465682171873, 'samples': 1386816, 'steps': 7222, 'loss/train': 2.2824783325195312} -11/06/2021 22:15:37 - INFO - __main__ - Step 7224: {'lr': 0.0004984650950816262, 'samples': 1387008, 'steps': 7223, 'loss/train': 2.3977138996124268} -11/06/2021 22:15:38 - INFO - __main__ - Step 7225: {'lr': 0.0004984645078794248, 'samples': 1387200, 'steps': 7224, 'loss/train': 1.694911241531372} -11/06/2021 22:15:38 - INFO - __main__ - Step 7226: {'lr': 0.0004984639205652692, 'samples': 1387392, 'steps': 7225, 'loss/train': 2.0143306255340576} -11/06/2021 22:15:39 - INFO - __main__ - Step 7227: {'lr': 0.0004984633331391596, 'samples': 1387584, 'steps': 7226, 'loss/train': 1.6768375635147095} -11/06/2021 22:15:39 - INFO - __main__ - Step 7228: {'lr': 0.0004984627456010962, 'samples': 1387776, 'steps': 7227, 'loss/train': 1.5799198150634766} -11/06/2021 22:15:39 - INFO - __main__ - Step 7229: {'lr': 0.0004984621579510794, 'samples': 1387968, 'steps': 7228, 'loss/train': 1.486791729927063} -11/06/2021 22:15:40 - INFO - __main__ - Step 7230: {'lr': 0.0004984615701891093, 'samples': 1388160, 'steps': 7229, 'loss/train': 3.868530035018921} -11/06/2021 22:15:41 - INFO - __main__ - Step 7231: {'lr': 0.0004984609823151863, 'samples': 1388352, 'steps': 7230, 'loss/train': 0.9350582957267761} -11/06/2021 22:15:41 - INFO - __main__ - Step 7232: {'lr': 0.0004984603943293106, 'samples': 1388544, 'steps': 7231, 'loss/train': 0.9871623516082764} -11/06/2021 22:15:41 - INFO - __main__ - Step 7233: {'lr': 0.0004984598062314824, 'samples': 1388736, 'steps': 7232, 'loss/train': 1.3852111101150513} -11/06/2021 22:15:42 - INFO - __main__ - Step 7234: {'lr': 0.0004984592180217022, 'samples': 1388928, 'steps': 7233, 'loss/train': 1.602423906326294} -11/06/2021 22:15:43 - INFO - __main__ - Step 7235: {'lr': 0.00049845862969997, 'samples': 1389120, 'steps': 7234, 'loss/train': 2.038180351257324} -11/06/2021 22:15:43 - INFO - __main__ - Step 7236: {'lr': 0.0004984580412662862, 'samples': 1389312, 'steps': 7235, 'loss/train': 2.45739483833313} -11/06/2021 22:15:44 - INFO - __main__ - Step 7237: {'lr': 0.000498457452720651, 'samples': 1389504, 'steps': 7236, 'loss/train': 2.169727087020874} -11/06/2021 22:15:44 - INFO - __main__ - Step 7238: {'lr': 0.0004984568640630648, 'samples': 1389696, 'steps': 7237, 'loss/train': 1.3969769477844238} -11/06/2021 22:15:44 - INFO - __main__ - Step 7239: {'lr': 0.0004984562752935278, 'samples': 1389888, 'steps': 7238, 'loss/train': 2.331590175628662} -11/06/2021 22:15:45 - INFO - __main__ - Step 7240: {'lr': 0.0004984556864120401, 'samples': 1390080, 'steps': 7239, 'loss/train': 1.9875437021255493} -11/06/2021 22:15:46 - INFO - __main__ - Step 7241: {'lr': 0.0004984550974186021, 'samples': 1390272, 'steps': 7240, 'loss/train': 2.1947824954986572} -11/06/2021 22:15:46 - INFO - __main__ - Step 7242: {'lr': 0.0004984545083132142, 'samples': 1390464, 'steps': 7241, 'loss/train': 1.9179041385650635} -11/06/2021 22:15:46 - INFO - __main__ - Step 7243: {'lr': 0.0004984539190958765, 'samples': 1390656, 'steps': 7242, 'loss/train': 2.117086887359619} -11/06/2021 22:15:47 - INFO - __main__ - Step 7244: {'lr': 0.0004984533297665892, 'samples': 1390848, 'steps': 7243, 'loss/train': 1.8736786842346191} -11/06/2021 22:15:48 - INFO - __main__ - Step 7245: {'lr': 0.0004984527403253527, 'samples': 1391040, 'steps': 7244, 'loss/train': 2.511869430541992} -11/06/2021 22:15:48 - INFO - __main__ - Step 7246: {'lr': 0.0004984521507721672, 'samples': 1391232, 'steps': 7245, 'loss/train': 2.5657119750976562} -11/06/2021 22:15:48 - INFO - __main__ - Step 7247: {'lr': 0.0004984515611070331, 'samples': 1391424, 'steps': 7246, 'loss/train': 1.9452552795410156} -11/06/2021 22:15:49 - INFO - __main__ - Step 7248: {'lr': 0.0004984509713299505, 'samples': 1391616, 'steps': 7247, 'loss/train': 1.7578961849212646} -11/06/2021 22:15:49 - INFO - __main__ - Step 7249: {'lr': 0.0004984503814409198, 'samples': 1391808, 'steps': 7248, 'loss/train': 1.7365186214447021} -11/06/2021 22:15:49 - INFO - __main__ - Step 7250: {'lr': 0.000498449791439941, 'samples': 1392000, 'steps': 7249, 'loss/train': 2.028444766998291} -11/06/2021 22:15:50 - INFO - __main__ - Step 7251: {'lr': 0.0004984492013270147, 'samples': 1392192, 'steps': 7250, 'loss/train': 1.9997104406356812} -11/06/2021 22:15:51 - INFO - __main__ - Step 7252: {'lr': 0.0004984486111021411, 'samples': 1392384, 'steps': 7251, 'loss/train': 1.7183914184570312} -11/06/2021 22:15:51 - INFO - __main__ - Step 7253: {'lr': 0.0004984480207653202, 'samples': 1392576, 'steps': 7252, 'loss/train': 1.8998106718063354} -11/06/2021 22:15:52 - INFO - __main__ - Step 7254: {'lr': 0.0004984474303165526, 'samples': 1392768, 'steps': 7253, 'loss/train': 1.8647713661193848} -11/06/2021 22:15:52 - INFO - __main__ - Step 7255: {'lr': 0.0004984468397558384, 'samples': 1392960, 'steps': 7254, 'loss/train': 1.3238756656646729} -11/06/2021 22:15:53 - INFO - __main__ - Step 7256: {'lr': 0.0004984462490831778, 'samples': 1393152, 'steps': 7255, 'loss/train': 2.027043104171753} -11/06/2021 22:15:53 - INFO - __main__ - Step 7257: {'lr': 0.0004984456582985713, 'samples': 1393344, 'steps': 7256, 'loss/train': 1.4800242185592651} -11/06/2021 22:15:54 - INFO - __main__ - Step 7258: {'lr': 0.0004984450674020189, 'samples': 1393536, 'steps': 7257, 'loss/train': 2.1049439907073975} -11/06/2021 22:15:54 - INFO - __main__ - Step 7259: {'lr': 0.000498444476393521, 'samples': 1393728, 'steps': 7258, 'loss/train': 2.349273920059204} -11/06/2021 22:15:54 - INFO - __main__ - Step 7260: {'lr': 0.0004984438852730779, 'samples': 1393920, 'steps': 7259, 'loss/train': 1.9256495237350464} -11/06/2021 22:15:55 - INFO - __main__ - Step 7261: {'lr': 0.0004984432940406898, 'samples': 1394112, 'steps': 7260, 'loss/train': 1.3321802616119385} -11/06/2021 22:15:56 - INFO - __main__ - Step 7262: {'lr': 0.0004984427026963569, 'samples': 1394304, 'steps': 7261, 'loss/train': 1.8123741149902344} -11/06/2021 22:15:56 - INFO - __main__ - Step 7263: {'lr': 0.0004984421112400796, 'samples': 1394496, 'steps': 7262, 'loss/train': 1.7774724960327148} -11/06/2021 22:15:56 - INFO - __main__ - Step 7264: {'lr': 0.0004984415196718582, 'samples': 1394688, 'steps': 7263, 'loss/train': 1.5477303266525269} -11/06/2021 22:15:57 - INFO - __main__ - Step 7265: {'lr': 0.0004984409279916929, 'samples': 1394880, 'steps': 7264, 'loss/train': 1.974310278892517} -11/06/2021 22:15:58 - INFO - __main__ - Step 7266: {'lr': 0.0004984403361995839, 'samples': 1395072, 'steps': 7265, 'loss/train': 1.740934133529663} -11/06/2021 22:15:58 - INFO - __main__ - Step 7267: {'lr': 0.0004984397442955315, 'samples': 1395264, 'steps': 7266, 'loss/train': 2.080972194671631} -11/06/2021 22:15:59 - INFO - __main__ - Step 7268: {'lr': 0.0004984391522795359, 'samples': 1395456, 'steps': 7267, 'loss/train': 1.868264079093933} -11/06/2021 22:15:59 - INFO - __main__ - Step 7269: {'lr': 0.0004984385601515977, 'samples': 1395648, 'steps': 7268, 'loss/train': 1.7006977796554565} -11/06/2021 22:15:59 - INFO - __main__ - Step 7270: {'lr': 0.0004984379679117166, 'samples': 1395840, 'steps': 7269, 'loss/train': 2.674793004989624} -11/06/2021 22:16:00 - INFO - __main__ - Step 7271: {'lr': 0.0004984373755598934, 'samples': 1396032, 'steps': 7270, 'loss/train': 1.7683382034301758} -11/06/2021 22:16:01 - INFO - __main__ - Step 7272: {'lr': 0.0004984367830961281, 'samples': 1396224, 'steps': 7271, 'loss/train': 2.167809247970581} -11/06/2021 22:16:01 - INFO - __main__ - Step 7273: {'lr': 0.0004984361905204209, 'samples': 1396416, 'steps': 7272, 'loss/train': 1.7610995769500732} -11/06/2021 22:16:01 - INFO - __main__ - Step 7274: {'lr': 0.0004984355978327724, 'samples': 1396608, 'steps': 7273, 'loss/train': 1.7615541219711304} -11/06/2021 22:16:02 - INFO - __main__ - Step 7275: {'lr': 0.0004984350050331826, 'samples': 1396800, 'steps': 7274, 'loss/train': 1.920972466468811} -11/06/2021 22:16:03 - INFO - __main__ - Step 7276: {'lr': 0.0004984344121216518, 'samples': 1396992, 'steps': 7275, 'loss/train': 1.9374135732650757} -11/06/2021 22:16:03 - INFO - __main__ - Step 7277: {'lr': 0.0004984338190981802, 'samples': 1397184, 'steps': 7276, 'loss/train': 1.6864734888076782} -11/06/2021 22:16:04 - INFO - __main__ - Step 7278: {'lr': 0.0004984332259627682, 'samples': 1397376, 'steps': 7277, 'loss/train': 1.0560840368270874} -11/06/2021 22:16:04 - INFO - __main__ - Step 7279: {'lr': 0.000498432632715416, 'samples': 1397568, 'steps': 7278, 'loss/train': 0.6851865649223328} -11/06/2021 22:16:04 - INFO - __main__ - Step 7280: {'lr': 0.000498432039356124, 'samples': 1397760, 'steps': 7279, 'loss/train': 1.729858160018921} -11/06/2021 22:16:05 - INFO - __main__ - Step 7281: {'lr': 0.0004984314458848923, 'samples': 1397952, 'steps': 7280, 'loss/train': 1.9476943016052246} -11/06/2021 22:16:06 - INFO - __main__ - Step 7282: {'lr': 0.0004984308523017212, 'samples': 1398144, 'steps': 7281, 'loss/train': 1.9683444499969482} -11/06/2021 22:16:06 - INFO - __main__ - Step 7283: {'lr': 0.000498430258606611, 'samples': 1398336, 'steps': 7282, 'loss/train': 2.0607752799987793} -11/06/2021 22:16:06 - INFO - __main__ - Step 7284: {'lr': 0.000498429664799562, 'samples': 1398528, 'steps': 7283, 'loss/train': 2.243265151977539} -11/06/2021 22:16:07 - INFO - __main__ - Step 7285: {'lr': 0.0004984290708805743, 'samples': 1398720, 'steps': 7284, 'loss/train': 1.7015665769577026} -11/06/2021 22:16:07 - INFO - __main__ - Step 7286: {'lr': 0.0004984284768496484, 'samples': 1398912, 'steps': 7285, 'loss/train': 2.0108847618103027} -11/06/2021 22:16:08 - INFO - __main__ - Step 7287: {'lr': 0.0004984278827067844, 'samples': 1399104, 'steps': 7286, 'loss/train': 5.661211967468262} -11/06/2021 22:16:08 - INFO - __main__ - Step 7288: {'lr': 0.0004984272884519827, 'samples': 1399296, 'steps': 7287, 'loss/train': 2.067732572555542} -11/06/2021 22:16:09 - INFO - __main__ - Step 7289: {'lr': 0.0004984266940852434, 'samples': 1399488, 'steps': 7288, 'loss/train': 2.0083210468292236} -11/06/2021 22:16:09 - INFO - __main__ - Step 7290: {'lr': 0.0004984260996065671, 'samples': 1399680, 'steps': 7289, 'loss/train': 1.771776795387268} -11/06/2021 22:16:10 - INFO - __main__ - Step 7291: {'lr': 0.0004984255050159536, 'samples': 1399872, 'steps': 7290, 'loss/train': 2.357623815536499} -11/06/2021 22:16:10 - INFO - __main__ - Step 7292: {'lr': 0.0004984249103134035, 'samples': 1400064, 'steps': 7291, 'loss/train': 1.8594292402267456} -11/06/2021 22:16:11 - INFO - __main__ - Step 7293: {'lr': 0.0004984243154989168, 'samples': 1400256, 'steps': 7292, 'loss/train': 1.5568764209747314} -11/06/2021 22:16:11 - INFO - __main__ - Step 7294: {'lr': 0.0004984237205724942, 'samples': 1400448, 'steps': 7293, 'loss/train': 2.0495903491973877} -11/06/2021 22:16:12 - INFO - __main__ - Step 7295: {'lr': 0.0004984231255341355, 'samples': 1400640, 'steps': 7294, 'loss/train': 1.9171841144561768} -11/06/2021 22:16:12 - INFO - __main__ - Step 7296: {'lr': 0.0004984225303838413, 'samples': 1400832, 'steps': 7295, 'loss/train': 2.2132482528686523} -11/06/2021 22:16:12 - INFO - __main__ - Step 7297: {'lr': 0.0004984219351216116, 'samples': 1401024, 'steps': 7296, 'loss/train': 2.4018189907073975} -11/06/2021 22:16:13 - INFO - __main__ - Step 7298: {'lr': 0.000498421339747447, 'samples': 1401216, 'steps': 7297, 'loss/train': 1.9810959100723267} -11/06/2021 22:16:14 - INFO - __main__ - Step 7299: {'lr': 0.0004984207442613474, 'samples': 1401408, 'steps': 7298, 'loss/train': 2.1550214290618896} -11/06/2021 22:16:14 - INFO - __main__ - Step 7300: {'lr': 0.0004984201486633134, 'samples': 1401600, 'steps': 7299, 'loss/train': 1.7208765745162964} -11/06/2021 22:16:14 - INFO - __main__ - Step 7301: {'lr': 0.0004984195529533451, 'samples': 1401792, 'steps': 7300, 'loss/train': 1.912482500076294} -11/06/2021 22:16:15 - INFO - __main__ - Step 7302: {'lr': 0.0004984189571314426, 'samples': 1401984, 'steps': 7301, 'loss/train': 2.2242941856384277} -11/06/2021 22:16:16 - INFO - __main__ - Step 7303: {'lr': 0.0004984183611976065, 'samples': 1402176, 'steps': 7302, 'loss/train': 1.918655276298523} -11/06/2021 22:16:16 - INFO - __main__ - Step 7304: {'lr': 0.0004984177651518369, 'samples': 1402368, 'steps': 7303, 'loss/train': 2.114764451980591} -11/06/2021 22:16:16 - INFO - __main__ - Step 7305: {'lr': 0.0004984171689941341, 'samples': 1402560, 'steps': 7304, 'loss/train': 1.9402523040771484} -11/06/2021 22:16:17 - INFO - __main__ - Step 7306: {'lr': 0.0004984165727244984, 'samples': 1402752, 'steps': 7305, 'loss/train': 1.6583056449890137} -11/06/2021 22:16:17 - INFO - __main__ - Step 7307: {'lr': 0.0004984159763429299, 'samples': 1402944, 'steps': 7306, 'loss/train': 1.5926767587661743} -11/06/2021 22:16:17 - INFO - __main__ - Step 7308: {'lr': 0.0004984153798494291, 'samples': 1403136, 'steps': 7307, 'loss/train': 1.6592446565628052} -11/06/2021 22:16:18 - INFO - __main__ - Step 7309: {'lr': 0.000498414783243996, 'samples': 1403328, 'steps': 7308, 'loss/train': 1.728884220123291} -11/06/2021 22:16:19 - INFO - __main__ - Step 7310: {'lr': 0.0004984141865266312, 'samples': 1403520, 'steps': 7309, 'loss/train': 0.43410855531692505} -11/06/2021 22:16:19 - INFO - __main__ - Step 7311: {'lr': 0.0004984135896973348, 'samples': 1403712, 'steps': 7310, 'loss/train': 2.0036983489990234} -11/06/2021 22:16:20 - INFO - __main__ - Step 7312: {'lr': 0.000498412992756107, 'samples': 1403904, 'steps': 7311, 'loss/train': 1.7266615629196167} -11/06/2021 22:16:20 - INFO - __main__ - Step 7313: {'lr': 0.0004984123957029482, 'samples': 1404096, 'steps': 7312, 'loss/train': 1.9898042678833008} -11/06/2021 22:16:21 - INFO - __main__ - Step 7314: {'lr': 0.0004984117985378586, 'samples': 1404288, 'steps': 7313, 'loss/train': 2.5833494663238525} -11/06/2021 22:16:21 - INFO - __main__ - Step 7315: {'lr': 0.0004984112012608384, 'samples': 1404480, 'steps': 7314, 'loss/train': 1.9153599739074707} -11/06/2021 22:16:22 - INFO - __main__ - Step 7316: {'lr': 0.000498410603871888, 'samples': 1404672, 'steps': 7315, 'loss/train': 1.9567968845367432} -11/06/2021 22:16:22 - INFO - __main__ - Step 7317: {'lr': 0.0004984100063710076, 'samples': 1404864, 'steps': 7316, 'loss/train': 1.922874927520752} -11/06/2021 22:16:22 - INFO - __main__ - Step 7318: {'lr': 0.0004984094087581975, 'samples': 1405056, 'steps': 7317, 'loss/train': 1.7780122756958008} -11/06/2021 22:16:23 - INFO - __main__ - Step 7319: {'lr': 0.0004984088110334579, 'samples': 1405248, 'steps': 7318, 'loss/train': 1.6674338579177856} -11/06/2021 22:16:24 - INFO - __main__ - Step 7320: {'lr': 0.0004984082131967892, 'samples': 1405440, 'steps': 7319, 'loss/train': 1.5355974435806274} -11/06/2021 22:16:24 - INFO - __main__ - Step 7321: {'lr': 0.0004984076152481916, 'samples': 1405632, 'steps': 7320, 'loss/train': 1.7139782905578613} -11/06/2021 22:16:24 - INFO - __main__ - Step 7322: {'lr': 0.0004984070171876653, 'samples': 1405824, 'steps': 7321, 'loss/train': 2.0687177181243896} -11/06/2021 22:16:25 - INFO - __main__ - Step 7323: {'lr': 0.0004984064190152106, 'samples': 1406016, 'steps': 7322, 'loss/train': 1.93816077709198} -11/06/2021 22:16:26 - INFO - __main__ - Step 7324: {'lr': 0.0004984058207308279, 'samples': 1406208, 'steps': 7323, 'loss/train': 1.9266688823699951} -11/06/2021 22:16:26 - INFO - __main__ - Step 7325: {'lr': 0.0004984052223345174, 'samples': 1406400, 'steps': 7324, 'loss/train': 1.676986575126648} -11/06/2021 22:16:27 - INFO - __main__ - Step 7326: {'lr': 0.0004984046238262792, 'samples': 1406592, 'steps': 7325, 'loss/train': 1.8388060331344604} -11/06/2021 22:16:27 - INFO - __main__ - Step 7327: {'lr': 0.0004984040252061137, 'samples': 1406784, 'steps': 7326, 'loss/train': 2.036705255508423} -11/06/2021 22:16:27 - INFO - __main__ - Step 7328: {'lr': 0.0004984034264740213, 'samples': 1406976, 'steps': 7327, 'loss/train': 1.4209593534469604} -11/06/2021 22:16:28 - INFO - __main__ - Step 7329: {'lr': 0.0004984028276300021, 'samples': 1407168, 'steps': 7328, 'loss/train': 1.2647329568862915} -11/06/2021 22:16:29 - INFO - __main__ - Step 7330: {'lr': 0.0004984022286740565, 'samples': 1407360, 'steps': 7329, 'loss/train': 1.7428815364837646} -11/06/2021 22:16:29 - INFO - __main__ - Step 7331: {'lr': 0.0004984016296061846, 'samples': 1407552, 'steps': 7330, 'loss/train': 1.4878357648849487} -11/06/2021 22:16:29 - INFO - __main__ - Step 7332: {'lr': 0.0004984010304263868, 'samples': 1407744, 'steps': 7331, 'loss/train': 1.8269178867340088} -11/06/2021 22:16:30 - INFO - __main__ - Step 7333: {'lr': 0.0004984004311346632, 'samples': 1407936, 'steps': 7332, 'loss/train': 1.686158299446106} -11/06/2021 22:16:31 - INFO - __main__ - Step 7334: {'lr': 0.0004983998317310143, 'samples': 1408128, 'steps': 7333, 'loss/train': 0.8892830610275269} -11/06/2021 22:16:31 - INFO - __main__ - Step 7335: {'lr': 0.0004983992322154403, 'samples': 1408320, 'steps': 7334, 'loss/train': 1.7509515285491943} -11/06/2021 22:16:31 - INFO - __main__ - Step 7336: {'lr': 0.0004983986325879414, 'samples': 1408512, 'steps': 7335, 'loss/train': 1.561832070350647} -11/06/2021 22:16:32 - INFO - __main__ - Step 7337: {'lr': 0.0004983980328485179, 'samples': 1408704, 'steps': 7336, 'loss/train': 1.7405585050582886} -11/06/2021 22:16:32 - INFO - __main__ - Step 7338: {'lr': 0.0004983974329971702, 'samples': 1408896, 'steps': 7337, 'loss/train': 1.8037465810775757} -11/06/2021 22:16:32 - INFO - __main__ - Step 7339: {'lr': 0.0004983968330338983, 'samples': 1409088, 'steps': 7338, 'loss/train': 1.8311342000961304} -11/06/2021 22:16:33 - INFO - __main__ - Step 7340: {'lr': 0.0004983962329587026, 'samples': 1409280, 'steps': 7339, 'loss/train': 1.649807333946228} -11/06/2021 22:16:34 - INFO - __main__ - Step 7341: {'lr': 0.0004983956327715835, 'samples': 1409472, 'steps': 7340, 'loss/train': 1.9435052871704102} -11/06/2021 22:16:34 - INFO - __main__ - Step 7342: {'lr': 0.000498395032472541, 'samples': 1409664, 'steps': 7341, 'loss/train': 1.9914734363555908} -11/06/2021 22:16:34 - INFO - __main__ - Step 7343: {'lr': 0.0004983944320615757, 'samples': 1409856, 'steps': 7342, 'loss/train': 2.154550552368164} -11/06/2021 22:16:35 - INFO - __main__ - Step 7344: {'lr': 0.0004983938315386877, 'samples': 1410048, 'steps': 7343, 'loss/train': 0.9631898403167725} -11/06/2021 22:16:36 - INFO - __main__ - Step 7345: {'lr': 0.0004983932309038773, 'samples': 1410240, 'steps': 7344, 'loss/train': 1.8528187274932861} -11/06/2021 22:16:36 - INFO - __main__ - Step 7346: {'lr': 0.0004983926301571445, 'samples': 1410432, 'steps': 7345, 'loss/train': 1.4792355298995972} -11/06/2021 22:16:36 - INFO - __main__ - Step 7347: {'lr': 0.00049839202929849, 'samples': 1410624, 'steps': 7346, 'loss/train': 2.132795572280884} -11/06/2021 22:16:37 - INFO - __main__ - Step 7348: {'lr': 0.0004983914283279139, 'samples': 1410816, 'steps': 7347, 'loss/train': 1.8769862651824951} -11/06/2021 22:16:37 - INFO - __main__ - Step 7349: {'lr': 0.0004983908272454164, 'samples': 1411008, 'steps': 7348, 'loss/train': 1.8160367012023926} -11/06/2021 22:16:38 - INFO - __main__ - Step 7350: {'lr': 0.0004983902260509978, 'samples': 1411200, 'steps': 7349, 'loss/train': 0.7067152857780457} -11/06/2021 22:16:38 - INFO - __main__ - Step 7351: {'lr': 0.0004983896247446585, 'samples': 1411392, 'steps': 7350, 'loss/train': 1.9250173568725586} -11/06/2021 22:16:39 - INFO - __main__ - Step 7352: {'lr': 0.0004983890233263986, 'samples': 1411584, 'steps': 7351, 'loss/train': 1.8521647453308105} -11/06/2021 22:16:39 - INFO - __main__ - Step 7353: {'lr': 0.0004983884217962185, 'samples': 1411776, 'steps': 7352, 'loss/train': 1.7597779035568237} -11/06/2021 22:16:40 - INFO - __main__ - Step 7354: {'lr': 0.0004983878201541183, 'samples': 1411968, 'steps': 7353, 'loss/train': 1.017517328262329} -11/06/2021 22:16:41 - INFO - __main__ - Step 7355: {'lr': 0.0004983872184000984, 'samples': 1412160, 'steps': 7354, 'loss/train': 2.1541800498962402} -11/06/2021 22:16:41 - INFO - __main__ - Step 7356: {'lr': 0.0004983866165341592, 'samples': 1412352, 'steps': 7355, 'loss/train': 2.184023380279541} -11/06/2021 22:16:41 - INFO - __main__ - Step 7357: {'lr': 0.0004983860145563006, 'samples': 1412544, 'steps': 7356, 'loss/train': 1.9269651174545288} -11/06/2021 22:16:42 - INFO - __main__ - Step 7358: {'lr': 0.0004983854124665232, 'samples': 1412736, 'steps': 7357, 'loss/train': 0.9575059413909912} -11/06/2021 22:16:42 - INFO - __main__ - Step 7359: {'lr': 0.0004983848102648273, 'samples': 1412928, 'steps': 7358, 'loss/train': 1.8082619905471802} -11/06/2021 22:16:43 - INFO - __main__ - Step 7360: {'lr': 0.0004983842079512128, 'samples': 1413120, 'steps': 7359, 'loss/train': 1.5754534006118774} -11/06/2021 22:16:43 - INFO - __main__ - Step 7361: {'lr': 0.0004983836055256804, 'samples': 1413312, 'steps': 7360, 'loss/train': 1.5222283601760864} -11/06/2021 22:16:44 - INFO - __main__ - Step 7362: {'lr': 0.0004983830029882301, 'samples': 1413504, 'steps': 7361, 'loss/train': 2.070965051651001} -11/06/2021 22:16:44 - INFO - __main__ - Step 7363: {'lr': 0.0004983824003388622, 'samples': 1413696, 'steps': 7362, 'loss/train': 1.8946985006332397} -11/06/2021 22:16:44 - INFO - __main__ - Step 7364: {'lr': 0.0004983817975775771, 'samples': 1413888, 'steps': 7363, 'loss/train': 1.666754126548767} -11/06/2021 22:16:45 - INFO - __main__ - Step 7365: {'lr': 0.000498381194704375, 'samples': 1414080, 'steps': 7364, 'loss/train': 1.879746675491333} -11/06/2021 22:16:46 - INFO - __main__ - Step 7366: {'lr': 0.000498380591719256, 'samples': 1414272, 'steps': 7365, 'loss/train': 1.6441892385482788} -11/06/2021 22:16:46 - INFO - __main__ - Step 7367: {'lr': 0.0004983799886222207, 'samples': 1414464, 'steps': 7366, 'loss/train': 2.2601382732391357} -11/06/2021 22:16:47 - INFO - __main__ - Step 7368: {'lr': 0.0004983793854132693, 'samples': 1414656, 'steps': 7367, 'loss/train': 1.803916335105896} -11/06/2021 22:16:47 - INFO - __main__ - Step 7369: {'lr': 0.0004983787820924019, 'samples': 1414848, 'steps': 7368, 'loss/train': 1.7164603471755981} -11/06/2021 22:16:48 - INFO - __main__ - Step 7370: {'lr': 0.0004983781786596187, 'samples': 1415040, 'steps': 7369, 'loss/train': 1.3875094652175903} -11/06/2021 22:16:48 - INFO - __main__ - Step 7371: {'lr': 0.0004983775751149204, 'samples': 1415232, 'steps': 7370, 'loss/train': 2.1840782165527344} -11/06/2021 22:16:49 - INFO - __main__ - Step 7372: {'lr': 0.0004983769714583067, 'samples': 1415424, 'steps': 7371, 'loss/train': 2.081000328063965} -11/06/2021 22:16:49 - INFO - __main__ - Step 7373: {'lr': 0.0004983763676897784, 'samples': 1415616, 'steps': 7372, 'loss/train': 1.749665379524231} -11/06/2021 22:16:49 - INFO - __main__ - Step 7374: {'lr': 0.0004983757638093355, 'samples': 1415808, 'steps': 7373, 'loss/train': 1.8339048624038696} -11/06/2021 22:16:50 - INFO - __main__ - Step 7375: {'lr': 0.0004983751598169781, 'samples': 1416000, 'steps': 7374, 'loss/train': 1.631373405456543} -11/06/2021 22:16:51 - INFO - __main__ - Step 7376: {'lr': 0.000498374555712707, 'samples': 1416192, 'steps': 7375, 'loss/train': 2.2265982627868652} -11/06/2021 22:16:51 - INFO - __main__ - Step 7377: {'lr': 0.000498373951496522, 'samples': 1416384, 'steps': 7376, 'loss/train': 2.2691292762756348} -11/06/2021 22:16:51 - INFO - __main__ - Step 7378: {'lr': 0.0004983733471684234, 'samples': 1416576, 'steps': 7377, 'loss/train': 2.114935874938965} -11/06/2021 22:16:52 - INFO - __main__ - Step 7379: {'lr': 0.0004983727427284118, 'samples': 1416768, 'steps': 7378, 'loss/train': 1.5053443908691406} -11/06/2021 22:16:52 - INFO - __main__ - Step 7380: {'lr': 0.0004983721381764873, 'samples': 1416960, 'steps': 7379, 'loss/train': 2.0003550052642822} -11/06/2021 22:16:53 - INFO - __main__ - Step 7381: {'lr': 0.00049837153351265, 'samples': 1417152, 'steps': 7380, 'loss/train': 1.6483396291732788} -11/06/2021 22:16:53 - INFO - __main__ - Step 7382: {'lr': 0.0004983709287369004, 'samples': 1417344, 'steps': 7381, 'loss/train': 1.4799424409866333} -11/06/2021 22:16:54 - INFO - __main__ - Step 7383: {'lr': 0.0004983703238492386, 'samples': 1417536, 'steps': 7382, 'loss/train': 1.8734862804412842} -11/06/2021 22:16:54 - INFO - __main__ - Step 7384: {'lr': 0.000498369718849665, 'samples': 1417728, 'steps': 7383, 'loss/train': 2.09423565864563} -11/06/2021 22:16:54 - INFO - __main__ - Step 7385: {'lr': 0.00049836911373818, 'samples': 1417920, 'steps': 7384, 'loss/train': 1.690798044204712} -11/06/2021 22:16:55 - INFO - __main__ - Step 7386: {'lr': 0.0004983685085147836, 'samples': 1418112, 'steps': 7385, 'loss/train': 1.6163359880447388} -11/06/2021 22:16:56 - INFO - __main__ - Step 7387: {'lr': 0.0004983679031794762, 'samples': 1418304, 'steps': 7386, 'loss/train': 1.860256552696228} -11/06/2021 22:16:56 - INFO - __main__ - Step 7388: {'lr': 0.000498367297732258, 'samples': 1418496, 'steps': 7387, 'loss/train': 1.9493474960327148} -11/06/2021 22:16:56 - INFO - __main__ - Step 7389: {'lr': 0.0004983666921731293, 'samples': 1418688, 'steps': 7388, 'loss/train': 1.6616744995117188} -11/06/2021 22:16:57 - INFO - __main__ - Step 7390: {'lr': 0.0004983660865020905, 'samples': 1418880, 'steps': 7389, 'loss/train': 1.901392936706543} -11/06/2021 22:16:58 - INFO - __main__ - Step 7391: {'lr': 0.0004983654807191418, 'samples': 1419072, 'steps': 7390, 'loss/train': 2.3318119049072266} -11/06/2021 22:16:58 - INFO - __main__ - Step 7392: {'lr': 0.0004983648748242833, 'samples': 1419264, 'steps': 7391, 'loss/train': 1.922995686531067} -11/06/2021 22:16:59 - INFO - __main__ - Step 7393: {'lr': 0.0004983642688175155, 'samples': 1419456, 'steps': 7392, 'loss/train': 1.9183114767074585} -11/06/2021 22:16:59 - INFO - __main__ - Step 7394: {'lr': 0.0004983636626988386, 'samples': 1419648, 'steps': 7393, 'loss/train': 2.0506041049957275} -11/06/2021 22:16:59 - INFO - __main__ - Step 7395: {'lr': 0.0004983630564682529, 'samples': 1419840, 'steps': 7394, 'loss/train': 1.6490904092788696} -11/06/2021 22:17:00 - INFO - __main__ - Step 7396: {'lr': 0.0004983624501257585, 'samples': 1420032, 'steps': 7395, 'loss/train': 2.0997846126556396} -11/06/2021 22:17:01 - INFO - __main__ - Step 7397: {'lr': 0.000498361843671356, 'samples': 1420224, 'steps': 7396, 'loss/train': 1.3421412706375122} -11/06/2021 22:17:01 - INFO - __main__ - Step 7398: {'lr': 0.0004983612371050453, 'samples': 1420416, 'steps': 7397, 'loss/train': 1.7991613149642944} -11/06/2021 22:17:01 - INFO - __main__ - Step 7399: {'lr': 0.000498360630426827, 'samples': 1420608, 'steps': 7398, 'loss/train': 2.0792791843414307} -11/06/2021 22:17:02 - INFO - __main__ - Step 7400: {'lr': 0.0004983600236367012, 'samples': 1420800, 'steps': 7399, 'loss/train': 3.388317346572876} -11/06/2021 22:17:03 - INFO - __main__ - Step 7401: {'lr': 0.0004983594167346681, 'samples': 1420992, 'steps': 7400, 'loss/train': 1.5198123455047607} -11/06/2021 22:17:03 - INFO - __main__ - Step 7402: {'lr': 0.0004983588097207283, 'samples': 1421184, 'steps': 7401, 'loss/train': 1.678063988685608} -11/06/2021 22:17:03 - INFO - __main__ - Step 7403: {'lr': 0.0004983582025948816, 'samples': 1421376, 'steps': 7402, 'loss/train': 1.8395053148269653} -11/06/2021 22:17:04 - INFO - __main__ - Step 7404: {'lr': 0.0004983575953571287, 'samples': 1421568, 'steps': 7403, 'loss/train': 0.9479645490646362} -11/06/2021 22:17:04 - INFO - __main__ - Step 7405: {'lr': 0.0004983569880074696, 'samples': 1421760, 'steps': 7404, 'loss/train': 1.9720947742462158} -11/06/2021 22:17:05 - INFO - __main__ - Step 7406: {'lr': 0.0004983563805459048, 'samples': 1421952, 'steps': 7405, 'loss/train': 1.7848727703094482} -11/06/2021 22:17:06 - INFO - __main__ - Step 7407: {'lr': 0.0004983557729724343, 'samples': 1422144, 'steps': 7406, 'loss/train': 1.2195593118667603} -11/06/2021 22:17:06 - INFO - __main__ - Step 7408: {'lr': 0.0004983551652870586, 'samples': 1422336, 'steps': 7407, 'loss/train': 1.9602643251419067} -11/06/2021 22:17:06 - INFO - __main__ - Step 7409: {'lr': 0.000498354557489778, 'samples': 1422528, 'steps': 7408, 'loss/train': 1.9274659156799316} -11/06/2021 22:17:07 - INFO - __main__ - Step 7410: {'lr': 0.0004983539495805925, 'samples': 1422720, 'steps': 7409, 'loss/train': 0.8858946561813354} -11/06/2021 22:17:07 - INFO - __main__ - Step 7411: {'lr': 0.0004983533415595026, 'samples': 1422912, 'steps': 7410, 'loss/train': 2.1833174228668213} -11/06/2021 22:17:08 - INFO - __main__ - Step 7412: {'lr': 0.0004983527334265085, 'samples': 1423104, 'steps': 7411, 'loss/train': 1.8606438636779785} -11/06/2021 22:17:08 - INFO - __main__ - Step 7413: {'lr': 0.0004983521251816105, 'samples': 1423296, 'steps': 7412, 'loss/train': 2.0643343925476074} -11/06/2021 22:17:09 - INFO - __main__ - Step 7414: {'lr': 0.0004983515168248088, 'samples': 1423488, 'steps': 7413, 'loss/train': 2.0445151329040527} -11/06/2021 22:17:09 - INFO - __main__ - Step 7415: {'lr': 0.0004983509083561038, 'samples': 1423680, 'steps': 7414, 'loss/train': 2.069981813430786} -11/06/2021 22:17:09 - INFO - __main__ - Step 7416: {'lr': 0.0004983502997754958, 'samples': 1423872, 'steps': 7415, 'loss/train': 1.200181245803833} -11/06/2021 22:17:11 - INFO - __main__ - Step 7417: {'lr': 0.0004983496910829849, 'samples': 1424064, 'steps': 7416, 'loss/train': 1.8883745670318604} -11/06/2021 22:17:11 - INFO - __main__ - Step 7418: {'lr': 0.0004983490822785715, 'samples': 1424256, 'steps': 7417, 'loss/train': 2.2220919132232666} -11/06/2021 22:17:11 - INFO - __main__ - Step 7419: {'lr': 0.0004983484733622558, 'samples': 1424448, 'steps': 7418, 'loss/train': 1.7355570793151855} -11/06/2021 22:17:12 - INFO - __main__ - Step 7420: {'lr': 0.0004983478643340382, 'samples': 1424640, 'steps': 7419, 'loss/train': 2.0675618648529053} -11/06/2021 22:17:12 - INFO - __main__ - Step 7421: {'lr': 0.0004983472551939186, 'samples': 1424832, 'steps': 7420, 'loss/train': 1.9630166292190552} -11/06/2021 22:17:13 - INFO - __main__ - Step 7422: {'lr': 0.0004983466459418978, 'samples': 1425024, 'steps': 7421, 'loss/train': 2.4349045753479004} -11/06/2021 22:17:13 - INFO - __main__ - Step 7423: {'lr': 0.0004983460365779759, 'samples': 1425216, 'steps': 7422, 'loss/train': 2.1964800357818604} -11/06/2021 22:17:14 - INFO - __main__ - Step 7424: {'lr': 0.0004983454271021529, 'samples': 1425408, 'steps': 7423, 'loss/train': 2.5369303226470947} -11/06/2021 22:17:14 - INFO - __main__ - Step 7425: {'lr': 0.0004983448175144294, 'samples': 1425600, 'steps': 7424, 'loss/train': 2.294490098953247} -11/06/2021 22:17:14 - INFO - __main__ - Step 7426: {'lr': 0.0004983442078148056, 'samples': 1425792, 'steps': 7425, 'loss/train': 1.7043726444244385} -11/06/2021 22:17:15 - INFO - __main__ - Step 7427: {'lr': 0.0004983435980032817, 'samples': 1425984, 'steps': 7426, 'loss/train': 1.0851516723632812} -11/06/2021 22:17:16 - INFO - __main__ - Step 7428: {'lr': 0.0004983429880798579, 'samples': 1426176, 'steps': 7427, 'loss/train': 1.8238978385925293} -11/06/2021 22:17:16 - INFO - __main__ - Step 7429: {'lr': 0.0004983423780445346, 'samples': 1426368, 'steps': 7428, 'loss/train': 2.179898977279663} -11/06/2021 22:17:16 - INFO - __main__ - Step 7430: {'lr': 0.0004983417678973123, 'samples': 1426560, 'steps': 7429, 'loss/train': 2.2200920581817627} -11/06/2021 22:17:17 - INFO - __main__ - Step 7431: {'lr': 0.0004983411576381907, 'samples': 1426752, 'steps': 7430, 'loss/train': 2.471855640411377} -11/06/2021 22:17:18 - INFO - __main__ - Step 7432: {'lr': 0.0004983405472671706, 'samples': 1426944, 'steps': 7431, 'loss/train': 1.9045939445495605} -11/06/2021 22:17:18 - INFO - __main__ - Step 7433: {'lr': 0.000498339936784252, 'samples': 1427136, 'steps': 7432, 'loss/train': 2.156907558441162} -11/06/2021 22:17:18 - INFO - __main__ - Step 7434: {'lr': 0.0004983393261894354, 'samples': 1427328, 'steps': 7433, 'loss/train': 2.357154130935669} -11/06/2021 22:17:19 - INFO - __main__ - Step 7435: {'lr': 0.0004983387154827208, 'samples': 1427520, 'steps': 7434, 'loss/train': 1.69056236743927} -11/06/2021 22:17:19 - INFO - __main__ - Step 7436: {'lr': 0.0004983381046641085, 'samples': 1427712, 'steps': 7435, 'loss/train': 1.9962103366851807} -11/06/2021 22:17:20 - INFO - __main__ - Step 7437: {'lr': 0.0004983374937335991, 'samples': 1427904, 'steps': 7436, 'loss/train': 1.3792200088500977} -11/06/2021 22:17:21 - INFO - __main__ - Step 7438: {'lr': 0.0004983368826911926, 'samples': 1428096, 'steps': 7437, 'loss/train': 1.7087842226028442} -11/06/2021 22:17:21 - INFO - __main__ - Step 7439: {'lr': 0.0004983362715368893, 'samples': 1428288, 'steps': 7438, 'loss/train': 1.5336834192276} -11/06/2021 22:17:21 - INFO - __main__ - Step 7440: {'lr': 0.0004983356602706895, 'samples': 1428480, 'steps': 7439, 'loss/train': 2.1194801330566406} -11/06/2021 22:17:22 - INFO - __main__ - Step 7441: {'lr': 0.0004983350488925936, 'samples': 1428672, 'steps': 7440, 'loss/train': 1.9883663654327393} -11/06/2021 22:17:22 - INFO - __main__ - Step 7442: {'lr': 0.0004983344374026016, 'samples': 1428864, 'steps': 7441, 'loss/train': 1.836441993713379} -11/06/2021 22:17:23 - INFO - __main__ - Step 7443: {'lr': 0.0004983338258007139, 'samples': 1429056, 'steps': 7442, 'loss/train': 1.3787864446640015} -11/06/2021 22:17:24 - INFO - __main__ - Step 7444: {'lr': 0.0004983332140869309, 'samples': 1429248, 'steps': 7443, 'loss/train': 1.911993384361267} -11/06/2021 22:17:24 - INFO - __main__ - Step 7445: {'lr': 0.0004983326022612528, 'samples': 1429440, 'steps': 7444, 'loss/train': 2.0019690990448} -11/06/2021 22:17:24 - INFO - __main__ - Step 7446: {'lr': 0.0004983319903236799, 'samples': 1429632, 'steps': 7445, 'loss/train': 2.305609941482544} -11/06/2021 22:17:25 - INFO - __main__ - Step 7447: {'lr': 0.0004983313782742124, 'samples': 1429824, 'steps': 7446, 'loss/train': 1.3778132200241089} -11/06/2021 22:17:26 - INFO - __main__ - Step 7448: {'lr': 0.0004983307661128505, 'samples': 1430016, 'steps': 7447, 'loss/train': 1.7583122253417969} -11/06/2021 22:17:26 - INFO - __main__ - Step 7449: {'lr': 0.0004983301538395948, 'samples': 1430208, 'steps': 7448, 'loss/train': 1.846149206161499} -11/06/2021 22:17:27 - INFO - __main__ - Step 7450: {'lr': 0.0004983295414544452, 'samples': 1430400, 'steps': 7449, 'loss/train': 1.9692158699035645} -11/06/2021 22:17:27 - INFO - __main__ - Step 7451: {'lr': 0.0004983289289574022, 'samples': 1430592, 'steps': 7450, 'loss/train': 1.7557963132858276} -11/06/2021 22:17:27 - INFO - __main__ - Step 7452: {'lr': 0.000498328316348466, 'samples': 1430784, 'steps': 7451, 'loss/train': 2.0076990127563477} -11/06/2021 22:17:28 - INFO - __main__ - Step 7453: {'lr': 0.0004983277036276369, 'samples': 1430976, 'steps': 7452, 'loss/train': 0.7926499843597412} -11/06/2021 22:17:29 - INFO - __main__ - Step 7454: {'lr': 0.0004983270907949152, 'samples': 1431168, 'steps': 7453, 'loss/train': 1.5046730041503906} -11/06/2021 22:17:29 - INFO - __main__ - Step 7455: {'lr': 0.0004983264778503011, 'samples': 1431360, 'steps': 7454, 'loss/train': 1.3215335607528687} -11/06/2021 22:17:29 - INFO - __main__ - Step 7456: {'lr': 0.0004983258647937949, 'samples': 1431552, 'steps': 7455, 'loss/train': 2.1020658016204834} -11/06/2021 22:17:30 - INFO - __main__ - Step 7457: {'lr': 0.0004983252516253969, 'samples': 1431744, 'steps': 7456, 'loss/train': 1.746657133102417} -11/06/2021 22:17:31 - INFO - __main__ - Step 7458: {'lr': 0.0004983246383451074, 'samples': 1431936, 'steps': 7457, 'loss/train': 2.16377329826355} -11/06/2021 22:17:31 - INFO - __main__ - Step 7459: {'lr': 0.0004983240249529267, 'samples': 1432128, 'steps': 7458, 'loss/train': 2.1467676162719727} -11/06/2021 22:17:31 - INFO - __main__ - Step 7460: {'lr': 0.000498323411448855, 'samples': 1432320, 'steps': 7459, 'loss/train': 1.7520476579666138} -11/06/2021 22:17:32 - INFO - __main__ - Step 7461: {'lr': 0.0004983227978328926, 'samples': 1432512, 'steps': 7460, 'loss/train': 2.5341601371765137} -11/06/2021 22:17:32 - INFO - __main__ - Step 7462: {'lr': 0.0004983221841050397, 'samples': 1432704, 'steps': 7461, 'loss/train': 2.3244829177856445} -11/06/2021 22:17:33 - INFO - __main__ - Step 7463: {'lr': 0.0004983215702652968, 'samples': 1432896, 'steps': 7462, 'loss/train': 1.8480935096740723} -11/06/2021 22:17:34 - INFO - __main__ - Step 7464: {'lr': 0.0004983209563136639, 'samples': 1433088, 'steps': 7463, 'loss/train': 1.939214825630188} -11/06/2021 22:17:34 - INFO - __main__ - Step 7465: {'lr': 0.0004983203422501414, 'samples': 1433280, 'steps': 7464, 'loss/train': 2.0819010734558105} -11/06/2021 22:17:34 - INFO - __main__ - Step 7466: {'lr': 0.0004983197280747297, 'samples': 1433472, 'steps': 7465, 'loss/train': 1.9236360788345337} -11/06/2021 22:17:35 - INFO - __main__ - Step 7467: {'lr': 0.0004983191137874289, 'samples': 1433664, 'steps': 7466, 'loss/train': 1.6283338069915771} -11/06/2021 22:17:35 - INFO - __main__ - Step 7468: {'lr': 0.0004983184993882394, 'samples': 1433856, 'steps': 7467, 'loss/train': 1.6667938232421875} -11/06/2021 22:17:36 - INFO - __main__ - Step 7469: {'lr': 0.0004983178848771613, 'samples': 1434048, 'steps': 7468, 'loss/train': 2.123434066772461} -11/06/2021 22:17:36 - INFO - __main__ - Step 7470: {'lr': 0.0004983172702541951, 'samples': 1434240, 'steps': 7469, 'loss/train': 1.7942487001419067} -11/06/2021 22:17:37 - INFO - __main__ - Step 7471: {'lr': 0.0004983166555193409, 'samples': 1434432, 'steps': 7470, 'loss/train': 2.0577187538146973} -11/06/2021 22:17:37 - INFO - __main__ - Step 7472: {'lr': 0.000498316040672599, 'samples': 1434624, 'steps': 7471, 'loss/train': 1.767512559890747} -11/06/2021 22:17:37 - INFO - __main__ - Step 7473: {'lr': 0.00049831542571397, 'samples': 1434816, 'steps': 7472, 'loss/train': 1.7135177850723267} -11/06/2021 22:17:38 - INFO - __main__ - Step 7474: {'lr': 0.0004983148106434536, 'samples': 1435008, 'steps': 7473, 'loss/train': 1.7563962936401367} -11/06/2021 22:17:39 - INFO - __main__ - Step 7475: {'lr': 0.0004983141954610505, 'samples': 1435200, 'steps': 7474, 'loss/train': 1.7334504127502441} -11/06/2021 22:17:39 - INFO - __main__ - Step 7476: {'lr': 0.0004983135801667608, 'samples': 1435392, 'steps': 7475, 'loss/train': 2.2196826934814453} -11/06/2021 22:17:39 - INFO - __main__ - Step 7477: {'lr': 0.0004983129647605849, 'samples': 1435584, 'steps': 7476, 'loss/train': 1.6023023128509521} -11/06/2021 22:17:40 - INFO - __main__ - Step 7478: {'lr': 0.0004983123492425229, 'samples': 1435776, 'steps': 7477, 'loss/train': 1.4602479934692383} -11/06/2021 22:17:41 - INFO - __main__ - Step 7479: {'lr': 0.0004983117336125753, 'samples': 1435968, 'steps': 7478, 'loss/train': 1.8138916492462158} -11/06/2021 22:17:41 - INFO - __main__ - Step 7480: {'lr': 0.0004983111178707422, 'samples': 1436160, 'steps': 7479, 'loss/train': 1.5433342456817627} -11/06/2021 22:17:41 - INFO - __main__ - Step 7481: {'lr': 0.0004983105020170239, 'samples': 1436352, 'steps': 7480, 'loss/train': 1.7849801778793335} -11/06/2021 22:17:42 - INFO - __main__ - Step 7482: {'lr': 0.0004983098860514209, 'samples': 1436544, 'steps': 7481, 'loss/train': 2.041818380355835} -11/06/2021 22:17:42 - INFO - __main__ - Step 7483: {'lr': 0.0004983092699739331, 'samples': 1436736, 'steps': 7482, 'loss/train': 1.6931136846542358} -11/06/2021 22:17:43 - INFO - __main__ - Step 7484: {'lr': 0.0004983086537845611, 'samples': 1436928, 'steps': 7483, 'loss/train': 1.9418973922729492} -11/06/2021 22:17:44 - INFO - __main__ - Step 7485: {'lr': 0.000498308037483305, 'samples': 1437120, 'steps': 7484, 'loss/train': 1.8237574100494385} -11/06/2021 22:17:44 - INFO - __main__ - Step 7486: {'lr': 0.0004983074210701651, 'samples': 1437312, 'steps': 7485, 'loss/train': 1.779268503189087} -11/06/2021 22:17:44 - INFO - __main__ - Step 7487: {'lr': 0.0004983068045451418, 'samples': 1437504, 'steps': 7486, 'loss/train': 2.059835433959961} -11/06/2021 22:17:45 - INFO - __main__ - Step 7488: {'lr': 0.0004983061879082352, 'samples': 1437696, 'steps': 7487, 'loss/train': 2.341383218765259} -11/06/2021 22:17:46 - INFO - __main__ - Step 7489: {'lr': 0.0004983055711594458, 'samples': 1437888, 'steps': 7488, 'loss/train': 1.6205718517303467} -11/06/2021 22:17:46 - INFO - __main__ - Step 7490: {'lr': 0.0004983049542987736, 'samples': 1438080, 'steps': 7489, 'loss/train': 1.5462263822555542} -11/06/2021 22:17:46 - INFO - __main__ - Step 7491: {'lr': 0.000498304337326219, 'samples': 1438272, 'steps': 7490, 'loss/train': 2.009598970413208} -11/06/2021 22:17:47 - INFO - __main__ - Step 7492: {'lr': 0.0004983037202417824, 'samples': 1438464, 'steps': 7491, 'loss/train': 1.6653988361358643} -11/06/2021 22:17:47 - INFO - __main__ - Step 7493: {'lr': 0.0004983031030454639, 'samples': 1438656, 'steps': 7492, 'loss/train': 1.2993390560150146} -11/06/2021 22:17:48 - INFO - __main__ - Step 7494: {'lr': 0.0004983024857372639, 'samples': 1438848, 'steps': 7493, 'loss/train': 1.8429198265075684} -11/06/2021 22:17:49 - INFO - __main__ - Step 7495: {'lr': 0.0004983018683171826, 'samples': 1439040, 'steps': 7494, 'loss/train': 1.9161350727081299} -11/06/2021 22:17:49 - INFO - __main__ - Step 7496: {'lr': 0.0004983012507852203, 'samples': 1439232, 'steps': 7495, 'loss/train': 1.8230706453323364} -11/06/2021 22:17:49 - INFO - __main__ - Step 7497: {'lr': 0.0004983006331413773, 'samples': 1439424, 'steps': 7496, 'loss/train': 1.6898235082626343} -11/06/2021 22:17:50 - INFO - __main__ - Step 7498: {'lr': 0.0004983000153856539, 'samples': 1439616, 'steps': 7497, 'loss/train': 1.4853415489196777} -11/06/2021 22:17:50 - INFO - __main__ - Step 7499: {'lr': 0.0004982993975180504, 'samples': 1439808, 'steps': 7498, 'loss/train': 2.2079527378082275} -11/06/2021 22:17:51 - INFO - __main__ - Step 7500: {'lr': 0.0004982987795385669, 'samples': 1440000, 'steps': 7499, 'loss/train': 2.117600440979004} -11/06/2021 22:17:51 - INFO - __main__ - Step 7501: {'lr': 0.0004982981614472039, 'samples': 1440192, 'steps': 7500, 'loss/train': 2.0123913288116455} -11/06/2021 22:17:52 - INFO - __main__ - Step 7502: {'lr': 0.0004982975432439615, 'samples': 1440384, 'steps': 7501, 'loss/train': 1.6575013399124146} -11/06/2021 22:17:52 - INFO - __main__ - Step 7503: {'lr': 0.0004982969249288401, 'samples': 1440576, 'steps': 7502, 'loss/train': 0.48864415287971497} -11/06/2021 22:17:53 - INFO - __main__ - Step 7504: {'lr': 0.0004982963065018399, 'samples': 1440768, 'steps': 7503, 'loss/train': 2.1326282024383545} -11/06/2021 22:17:54 - INFO - __main__ - Step 7505: {'lr': 0.0004982956879629612, 'samples': 1440960, 'steps': 7504, 'loss/train': 2.184455633163452} -11/06/2021 22:17:54 - INFO - __main__ - Step 7506: {'lr': 0.0004982950693122044, 'samples': 1441152, 'steps': 7505, 'loss/train': 1.8725202083587646} -11/06/2021 22:17:54 - INFO - __main__ - Step 7507: {'lr': 0.0004982944505495696, 'samples': 1441344, 'steps': 7506, 'loss/train': 1.6214361190795898} -11/06/2021 22:17:55 - INFO - __main__ - Step 7508: {'lr': 0.0004982938316750572, 'samples': 1441536, 'steps': 7507, 'loss/train': 2.0111021995544434} -11/06/2021 22:17:55 - INFO - __main__ - Step 7509: {'lr': 0.0004982932126886674, 'samples': 1441728, 'steps': 7508, 'loss/train': 1.670443058013916} -11/06/2021 22:17:56 - INFO - __main__ - Step 7510: {'lr': 0.0004982925935904004, 'samples': 1441920, 'steps': 7509, 'loss/train': 1.7598836421966553} -11/06/2021 22:17:56 - INFO - __main__ - Step 7511: {'lr': 0.0004982919743802567, 'samples': 1442112, 'steps': 7510, 'loss/train': 2.0992119312286377} -11/06/2021 22:17:57 - INFO - __main__ - Step 7512: {'lr': 0.0004982913550582364, 'samples': 1442304, 'steps': 7511, 'loss/train': 1.790313720703125} -11/06/2021 22:17:57 - INFO - __main__ - Step 7513: {'lr': 0.00049829073562434, 'samples': 1442496, 'steps': 7512, 'loss/train': 1.9669575691223145} -11/06/2021 22:17:57 - INFO - __main__ - Step 7514: {'lr': 0.0004982901160785675, 'samples': 1442688, 'steps': 7513, 'loss/train': 1.6649370193481445} -11/06/2021 22:17:58 - INFO - __main__ - Step 7515: {'lr': 0.0004982894964209193, 'samples': 1442880, 'steps': 7514, 'loss/train': 2.0550930500030518} -11/06/2021 22:17:59 - INFO - __main__ - Step 7516: {'lr': 0.0004982888766513957, 'samples': 1443072, 'steps': 7515, 'loss/train': 1.5787222385406494} -11/06/2021 22:17:59 - INFO - __main__ - Step 7517: {'lr': 0.000498288256769997, 'samples': 1443264, 'steps': 7516, 'loss/train': 1.9650318622589111} -11/06/2021 22:17:59 - INFO - __main__ - Step 7518: {'lr': 0.0004982876367767234, 'samples': 1443456, 'steps': 7517, 'loss/train': 2.108997106552124} -11/06/2021 22:18:00 - INFO - __main__ - Step 7519: {'lr': 0.0004982870166715753, 'samples': 1443648, 'steps': 7518, 'loss/train': 1.5011414289474487} -11/06/2021 22:18:01 - INFO - __main__ - Step 7520: {'lr': 0.0004982863964545529, 'samples': 1443840, 'steps': 7519, 'loss/train': 2.0259969234466553} -11/06/2021 22:18:01 - INFO - __main__ - Step 7521: {'lr': 0.0004982857761256564, 'samples': 1444032, 'steps': 7520, 'loss/train': 2.0949344635009766} -11/06/2021 22:18:01 - INFO - __main__ - Step 7522: {'lr': 0.0004982851556848861, 'samples': 1444224, 'steps': 7521, 'loss/train': 1.771378993988037} -11/06/2021 22:18:02 - INFO - __main__ - Step 7523: {'lr': 0.0004982845351322424, 'samples': 1444416, 'steps': 7522, 'loss/train': 1.6753596067428589} -11/06/2021 22:18:02 - INFO - __main__ - Step 7524: {'lr': 0.0004982839144677257, 'samples': 1444608, 'steps': 7523, 'loss/train': 0.8086962103843689} -11/06/2021 22:18:03 - INFO - __main__ - Step 7525: {'lr': 0.0004982832936913359, 'samples': 1444800, 'steps': 7524, 'loss/train': 1.749570608139038} -11/06/2021 22:18:04 - INFO - __main__ - Step 7526: {'lr': 0.0004982826728030735, 'samples': 1444992, 'steps': 7525, 'loss/train': 1.9992296695709229} -11/06/2021 22:18:04 - INFO - __main__ - Step 7527: {'lr': 0.0004982820518029387, 'samples': 1445184, 'steps': 7526, 'loss/train': 2.0168237686157227} -11/06/2021 22:18:04 - INFO - __main__ - Step 7528: {'lr': 0.000498281430690932, 'samples': 1445376, 'steps': 7527, 'loss/train': 1.9467054605484009} -11/06/2021 22:18:05 - INFO - __main__ - Step 7529: {'lr': 0.0004982808094670534, 'samples': 1445568, 'steps': 7528, 'loss/train': 1.8640716075897217} -11/06/2021 22:18:05 - INFO - __main__ - Step 7530: {'lr': 0.0004982801881313034, 'samples': 1445760, 'steps': 7529, 'loss/train': 1.9027869701385498} -11/06/2021 22:18:06 - INFO - __main__ - Step 7531: {'lr': 0.0004982795666836821, 'samples': 1445952, 'steps': 7530, 'loss/train': 1.8328138589859009} -11/06/2021 22:18:06 - INFO - __main__ - Step 7532: {'lr': 0.00049827894512419, 'samples': 1446144, 'steps': 7531, 'loss/train': 2.27284836769104} -11/06/2021 22:18:07 - INFO - __main__ - Step 7533: {'lr': 0.000498278323452827, 'samples': 1446336, 'steps': 7532, 'loss/train': 1.7987669706344604} -11/06/2021 22:18:07 - INFO - __main__ - Step 7534: {'lr': 0.0004982777016695937, 'samples': 1446528, 'steps': 7533, 'loss/train': 1.1510889530181885} -11/06/2021 22:18:08 - INFO - __main__ - Step 7535: {'lr': 0.0004982770797744904, 'samples': 1446720, 'steps': 7534, 'loss/train': 1.9908004999160767} -11/06/2021 22:18:09 - INFO - __main__ - Step 7536: {'lr': 0.0004982764577675172, 'samples': 1446912, 'steps': 7535, 'loss/train': 2.135575532913208} -11/06/2021 22:18:09 - INFO - __main__ - Step 7537: {'lr': 0.0004982758356486746, 'samples': 1447104, 'steps': 7536, 'loss/train': 1.4963163137435913} -11/06/2021 22:18:09 - INFO - __main__ - Step 7538: {'lr': 0.0004982752134179624, 'samples': 1447296, 'steps': 7537, 'loss/train': 2.040847063064575} -11/06/2021 22:18:10 - INFO - __main__ - Step 7539: {'lr': 0.0004982745910753815, 'samples': 1447488, 'steps': 7538, 'loss/train': 2.0529308319091797} -11/06/2021 22:18:10 - INFO - __main__ - Step 7540: {'lr': 0.0004982739686209319, 'samples': 1447680, 'steps': 7539, 'loss/train': 1.5102424621582031} -11/06/2021 22:18:10 - INFO - __main__ - Step 7541: {'lr': 0.0004982733460546138, 'samples': 1447872, 'steps': 7540, 'loss/train': 2.3759987354278564} -11/06/2021 22:18:11 - INFO - __main__ - Step 7542: {'lr': 0.0004982727233764276, 'samples': 1448064, 'steps': 7541, 'loss/train': 1.264660120010376} -11/06/2021 22:18:12 - INFO - __main__ - Step 7543: {'lr': 0.0004982721005863734, 'samples': 1448256, 'steps': 7542, 'loss/train': 2.076897621154785} -11/06/2021 22:18:12 - INFO - __main__ - Step 7544: {'lr': 0.0004982714776844518, 'samples': 1448448, 'steps': 7543, 'loss/train': 1.9812895059585571} -11/06/2021 22:18:13 - INFO - __main__ - Step 7545: {'lr': 0.0004982708546706628, 'samples': 1448640, 'steps': 7544, 'loss/train': 1.7536218166351318} -11/06/2021 22:18:13 - INFO - __main__ - Step 7546: {'lr': 0.0004982702315450068, 'samples': 1448832, 'steps': 7545, 'loss/train': 2.1761927604675293} -11/06/2021 22:18:14 - INFO - __main__ - Step 7547: {'lr': 0.0004982696083074841, 'samples': 1449024, 'steps': 7546, 'loss/train': 1.766358494758606} -11/06/2021 22:18:14 - INFO - __main__ - Step 7548: {'lr': 0.0004982689849580951, 'samples': 1449216, 'steps': 7547, 'loss/train': 0.7626532912254333} -11/06/2021 22:18:15 - INFO - __main__ - Step 7549: {'lr': 0.0004982683614968396, 'samples': 1449408, 'steps': 7548, 'loss/train': 1.5238088369369507} -11/06/2021 22:18:15 - INFO - __main__ - Step 7550: {'lr': 0.0004982677379237185, 'samples': 1449600, 'steps': 7549, 'loss/train': 1.834945797920227} -11/06/2021 22:18:15 - INFO - __main__ - Step 7551: {'lr': 0.0004982671142387316, 'samples': 1449792, 'steps': 7550, 'loss/train': 1.1642390489578247} -11/06/2021 22:18:17 - INFO - __main__ - Step 7552: {'lr': 0.0004982664904418794, 'samples': 1449984, 'steps': 7551, 'loss/train': 0.791139543056488} -11/06/2021 22:18:17 - INFO - __main__ - Step 7553: {'lr': 0.0004982658665331622, 'samples': 1450176, 'steps': 7552, 'loss/train': 2.0422914028167725} -11/06/2021 22:18:17 - INFO - __main__ - Step 7554: {'lr': 0.0004982652425125802, 'samples': 1450368, 'steps': 7553, 'loss/train': 2.1857669353485107} -11/06/2021 22:18:18 - INFO - __main__ - Step 7555: {'lr': 0.0004982646183801337, 'samples': 1450560, 'steps': 7554, 'loss/train': 2.560479164123535} -11/06/2021 22:18:18 - INFO - __main__ - Step 7556: {'lr': 0.000498263994135823, 'samples': 1450752, 'steps': 7555, 'loss/train': 2.5498902797698975} -11/06/2021 22:18:18 - INFO - __main__ - Step 7557: {'lr': 0.0004982633697796484, 'samples': 1450944, 'steps': 7556, 'loss/train': 2.1660470962524414} -11/06/2021 22:18:19 - INFO - __main__ - Step 7558: {'lr': 0.0004982627453116102, 'samples': 1451136, 'steps': 7557, 'loss/train': 1.7757936716079712} -11/06/2021 22:18:20 - INFO - __main__ - Step 7559: {'lr': 0.0004982621207317086, 'samples': 1451328, 'steps': 7558, 'loss/train': 1.7856800556182861} -11/06/2021 22:18:20 - INFO - __main__ - Step 7560: {'lr': 0.0004982614960399439, 'samples': 1451520, 'steps': 7559, 'loss/train': 1.483529806137085} -11/06/2021 22:18:20 - INFO - __main__ - Step 7561: {'lr': 0.0004982608712363163, 'samples': 1451712, 'steps': 7560, 'loss/train': 2.1394612789154053} -11/06/2021 22:18:21 - INFO - __main__ - Step 7562: {'lr': 0.0004982602463208263, 'samples': 1451904, 'steps': 7561, 'loss/train': 2.436344861984253} -11/06/2021 22:18:22 - INFO - __main__ - Step 7563: {'lr': 0.0004982596212934742, 'samples': 1452096, 'steps': 7562, 'loss/train': 2.3320164680480957} -11/06/2021 22:18:22 - INFO - __main__ - Step 7564: {'lr': 0.00049825899615426, 'samples': 1452288, 'steps': 7563, 'loss/train': 1.0937427282333374} -11/06/2021 22:18:22 - INFO - __main__ - Step 7565: {'lr': 0.000498258370903184, 'samples': 1452480, 'steps': 7564, 'loss/train': 1.8388676643371582} -11/06/2021 22:18:23 - INFO - __main__ - Step 7566: {'lr': 0.0004982577455402467, 'samples': 1452672, 'steps': 7565, 'loss/train': 1.7357767820358276} -11/06/2021 22:18:23 - INFO - __main__ - Step 7567: {'lr': 0.0004982571200654485, 'samples': 1452864, 'steps': 7566, 'loss/train': 1.5761942863464355} -11/06/2021 22:18:24 - INFO - __main__ - Step 7568: {'lr': 0.0004982564944787892, 'samples': 1453056, 'steps': 7567, 'loss/train': 2.1120853424072266} -11/06/2021 22:18:25 - INFO - __main__ - Step 7569: {'lr': 0.0004982558687802695, 'samples': 1453248, 'steps': 7568, 'loss/train': 2.013747453689575} -11/06/2021 22:18:25 - INFO - __main__ - Step 7570: {'lr': 0.0004982552429698894, 'samples': 1453440, 'steps': 7569, 'loss/train': 2.029210090637207} -11/06/2021 22:18:25 - INFO - __main__ - Step 7571: {'lr': 0.0004982546170476494, 'samples': 1453632, 'steps': 7570, 'loss/train': 1.5686355829238892} -11/06/2021 22:18:26 - INFO - __main__ - Step 7572: {'lr': 0.0004982539910135497, 'samples': 1453824, 'steps': 7571, 'loss/train': 1.8889784812927246} -11/06/2021 22:18:27 - INFO - __main__ - Step 7573: {'lr': 0.0004982533648675906, 'samples': 1454016, 'steps': 7572, 'loss/train': 2.56605863571167} -11/06/2021 22:18:27 - INFO - __main__ - Step 7574: {'lr': 0.0004982527386097723, 'samples': 1454208, 'steps': 7573, 'loss/train': 1.9748719930648804} -11/06/2021 22:18:27 - INFO - __main__ - Step 7575: {'lr': 0.0004982521122400953, 'samples': 1454400, 'steps': 7574, 'loss/train': 1.4213409423828125} -11/06/2021 22:18:28 - INFO - __main__ - Step 7576: {'lr': 0.0004982514857585596, 'samples': 1454592, 'steps': 7575, 'loss/train': 1.8690491914749146} -11/06/2021 22:18:28 - INFO - __main__ - Step 7577: {'lr': 0.0004982508591651657, 'samples': 1454784, 'steps': 7576, 'loss/train': 2.0668842792510986} -11/06/2021 22:18:29 - INFO - __main__ - Step 7578: {'lr': 0.0004982502324599137, 'samples': 1454976, 'steps': 7577, 'loss/train': 2.21287202835083} -11/06/2021 22:18:29 - INFO - __main__ - Step 7579: {'lr': 0.000498249605642804, 'samples': 1455168, 'steps': 7578, 'loss/train': 1.7789140939712524} -11/06/2021 22:18:30 - INFO - __main__ - Step 7580: {'lr': 0.0004982489787138369, 'samples': 1455360, 'steps': 7579, 'loss/train': 1.9952287673950195} -11/06/2021 22:18:30 - INFO - __main__ - Step 7581: {'lr': 0.0004982483516730126, 'samples': 1455552, 'steps': 7580, 'loss/train': 1.8334144353866577} -11/06/2021 22:18:30 - INFO - __main__ - Step 7582: {'lr': 0.0004982477245203314, 'samples': 1455744, 'steps': 7581, 'loss/train': 1.755232572555542} -11/06/2021 22:18:31 - INFO - __main__ - Step 7583: {'lr': 0.0004982470972557936, 'samples': 1455936, 'steps': 7582, 'loss/train': 2.4827017784118652} -11/06/2021 22:18:32 - INFO - __main__ - Step 7584: {'lr': 0.0004982464698793995, 'samples': 1456128, 'steps': 7583, 'loss/train': 1.831977128982544} -11/06/2021 22:18:32 - INFO - __main__ - Step 7585: {'lr': 0.0004982458423911495, 'samples': 1456320, 'steps': 7584, 'loss/train': 2.0919387340545654} -11/06/2021 22:18:32 - INFO - __main__ - Step 7586: {'lr': 0.0004982452147910437, 'samples': 1456512, 'steps': 7585, 'loss/train': 2.820591449737549} -11/06/2021 22:18:33 - INFO - __main__ - Step 7587: {'lr': 0.0004982445870790823, 'samples': 1456704, 'steps': 7586, 'loss/train': 1.7887145280838013} -11/06/2021 22:18:34 - INFO - __main__ - Step 7588: {'lr': 0.0004982439592552658, 'samples': 1456896, 'steps': 7587, 'loss/train': 1.2820543050765991} -11/06/2021 22:18:35 - INFO - __main__ - Step 7589: {'lr': 0.0004982433313195945, 'samples': 1457088, 'steps': 7588, 'loss/train': 2.508904218673706} -11/06/2021 22:18:35 - INFO - __main__ - Step 7590: {'lr': 0.0004982427032720685, 'samples': 1457280, 'steps': 7589, 'loss/train': 1.968804121017456} -11/06/2021 22:18:35 - INFO - __main__ - Step 7591: {'lr': 0.0004982420751126882, 'samples': 1457472, 'steps': 7590, 'loss/train': 2.2515952587127686} -11/06/2021 22:18:36 - INFO - __main__ - Step 7592: {'lr': 0.0004982414468414538, 'samples': 1457664, 'steps': 7591, 'loss/train': 2.3000688552856445} -11/06/2021 22:18:36 - INFO - __main__ - Step 7593: {'lr': 0.0004982408184583656, 'samples': 1457856, 'steps': 7592, 'loss/train': 1.6771053075790405} -11/06/2021 22:18:37 - INFO - __main__ - Step 7594: {'lr': 0.000498240189963424, 'samples': 1458048, 'steps': 7593, 'loss/train': 1.5368093252182007} -11/06/2021 22:18:37 - INFO - __main__ - Step 7595: {'lr': 0.0004982395613566291, 'samples': 1458240, 'steps': 7594, 'loss/train': 2.213350772857666} -11/06/2021 22:18:38 - INFO - __main__ - Step 7596: {'lr': 0.0004982389326379814, 'samples': 1458432, 'steps': 7595, 'loss/train': 1.887166142463684} -11/06/2021 22:18:38 - INFO - __main__ - Step 7597: {'lr': 0.000498238303807481, 'samples': 1458624, 'steps': 7596, 'loss/train': 2.0999624729156494} -11/06/2021 22:18:38 - INFO - __main__ - Step 7598: {'lr': 0.0004982376748651283, 'samples': 1458816, 'steps': 7597, 'loss/train': 1.3151088953018188} -11/06/2021 22:18:39 - INFO - __main__ - Step 7599: {'lr': 0.0004982370458109235, 'samples': 1459008, 'steps': 7598, 'loss/train': 1.5262982845306396} -11/06/2021 22:18:40 - INFO - __main__ - Step 7600: {'lr': 0.0004982364166448669, 'samples': 1459200, 'steps': 7599, 'loss/train': 1.9225597381591797} -11/06/2021 22:18:40 - INFO - __main__ - Step 7601: {'lr': 0.0004982357873669588, 'samples': 1459392, 'steps': 7600, 'loss/train': 1.6969056129455566} -11/06/2021 22:18:40 - INFO - __main__ - Step 7602: {'lr': 0.0004982351579771995, 'samples': 1459584, 'steps': 7601, 'loss/train': 1.8867172002792358} -11/06/2021 22:18:41 - INFO - __main__ - Step 7603: {'lr': 0.0004982345284755893, 'samples': 1459776, 'steps': 7602, 'loss/train': 2.111384868621826} -11/06/2021 22:18:41 - INFO - __main__ - Step 7604: {'lr': 0.0004982338988621284, 'samples': 1459968, 'steps': 7603, 'loss/train': 1.420168161392212} -11/06/2021 22:18:42 - INFO - __main__ - Step 7605: {'lr': 0.0004982332691368172, 'samples': 1460160, 'steps': 7604, 'loss/train': 2.9915659427642822} -11/06/2021 22:18:43 - INFO - __main__ - Step 7606: {'lr': 0.0004982326392996559, 'samples': 1460352, 'steps': 7605, 'loss/train': 1.3998850584030151} -11/06/2021 22:18:43 - INFO - __main__ - Step 7607: {'lr': 0.0004982320093506449, 'samples': 1460544, 'steps': 7606, 'loss/train': 1.5841953754425049} -11/06/2021 22:18:43 - INFO - __main__ - Step 7608: {'lr': 0.0004982313792897843, 'samples': 1460736, 'steps': 7607, 'loss/train': 1.2424761056900024} -11/06/2021 22:18:44 - INFO - __main__ - Step 7609: {'lr': 0.0004982307491170744, 'samples': 1460928, 'steps': 7608, 'loss/train': 2.063056707382202} -11/06/2021 22:18:45 - INFO - __main__ - Step 7610: {'lr': 0.0004982301188325156, 'samples': 1461120, 'steps': 7609, 'loss/train': 1.6519533395767212} -11/06/2021 22:18:45 - INFO - __main__ - Step 7611: {'lr': 0.0004982294884361081, 'samples': 1461312, 'steps': 7610, 'loss/train': 1.2619507312774658} -11/06/2021 22:18:45 - INFO - __main__ - Step 7612: {'lr': 0.0004982288579278522, 'samples': 1461504, 'steps': 7611, 'loss/train': 1.7545194625854492} -11/06/2021 22:18:46 - INFO - __main__ - Step 7613: {'lr': 0.0004982282273077483, 'samples': 1461696, 'steps': 7612, 'loss/train': 1.8897991180419922} -11/06/2021 22:18:46 - INFO - __main__ - Step 7614: {'lr': 0.0004982275965757965, 'samples': 1461888, 'steps': 7613, 'loss/train': 1.383413314819336} -11/06/2021 22:18:47 - INFO - __main__ - Step 7615: {'lr': 0.0004982269657319974, 'samples': 1462080, 'steps': 7614, 'loss/train': 1.955425500869751} -11/06/2021 22:18:47 - INFO - __main__ - Step 7616: {'lr': 0.0004982263347763508, 'samples': 1462272, 'steps': 7615, 'loss/train': 1.6622871160507202} -11/06/2021 22:18:48 - INFO - __main__ - Step 7617: {'lr': 0.0004982257037088574, 'samples': 1462464, 'steps': 7616, 'loss/train': 1.82854425907135} -11/06/2021 22:18:48 - INFO - __main__ - Step 7618: {'lr': 0.0004982250725295173, 'samples': 1462656, 'steps': 7617, 'loss/train': 2.0947282314300537} -11/06/2021 22:18:48 - INFO - __main__ - Step 7619: {'lr': 0.0004982244412383307, 'samples': 1462848, 'steps': 7618, 'loss/train': 1.5993701219558716} -11/06/2021 22:18:49 - INFO - __main__ - Step 7620: {'lr': 0.0004982238098352981, 'samples': 1463040, 'steps': 7619, 'loss/train': 2.0519866943359375} -11/06/2021 22:18:50 - INFO - __main__ - Step 7621: {'lr': 0.0004982231783204196, 'samples': 1463232, 'steps': 7620, 'loss/train': 1.768385887145996} -11/06/2021 22:18:50 - INFO - __main__ - Step 7622: {'lr': 0.0004982225466936957, 'samples': 1463424, 'steps': 7621, 'loss/train': 2.114351749420166} -11/06/2021 22:18:51 - INFO - __main__ - Step 7623: {'lr': 0.0004982219149551265, 'samples': 1463616, 'steps': 7622, 'loss/train': 2.196870803833008} -11/06/2021 22:18:51 - INFO - __main__ - Step 7624: {'lr': 0.0004982212831047123, 'samples': 1463808, 'steps': 7623, 'loss/train': 2.04628586769104} -11/06/2021 22:18:51 - INFO - __main__ - Step 7625: {'lr': 0.0004982206511424534, 'samples': 1464000, 'steps': 7624, 'loss/train': 1.2371141910552979} -11/06/2021 22:18:52 - INFO - __main__ - Step 7626: {'lr': 0.0004982200190683502, 'samples': 1464192, 'steps': 7625, 'loss/train': 1.4562172889709473} -11/06/2021 22:18:53 - INFO - __main__ - Step 7627: {'lr': 0.0004982193868824028, 'samples': 1464384, 'steps': 7626, 'loss/train': 1.9983298778533936} -11/06/2021 22:18:53 - INFO - __main__ - Step 7628: {'lr': 0.0004982187545846116, 'samples': 1464576, 'steps': 7627, 'loss/train': 2.135972261428833} -11/06/2021 22:18:53 - INFO - __main__ - Step 7629: {'lr': 0.0004982181221749769, 'samples': 1464768, 'steps': 7628, 'loss/train': 2.405860424041748} -11/06/2021 22:18:54 - INFO - __main__ - Step 7630: {'lr': 0.0004982174896534989, 'samples': 1464960, 'steps': 7629, 'loss/train': 1.3668652772903442} -11/06/2021 22:18:55 - INFO - __main__ - Step 7631: {'lr': 0.0004982168570201779, 'samples': 1465152, 'steps': 7630, 'loss/train': 1.261794924736023} -11/06/2021 22:18:55 - INFO - __main__ - Step 7632: {'lr': 0.0004982162242750143, 'samples': 1465344, 'steps': 7631, 'loss/train': 1.8205006122589111} -11/06/2021 22:18:55 - INFO - __main__ - Step 7633: {'lr': 0.0004982155914180082, 'samples': 1465536, 'steps': 7632, 'loss/train': 1.8356959819793701} -11/06/2021 22:18:56 - INFO - __main__ - Step 7634: {'lr': 0.0004982149584491601, 'samples': 1465728, 'steps': 7633, 'loss/train': 2.227440357208252} -11/06/2021 22:18:56 - INFO - __main__ - Step 7635: {'lr': 0.0004982143253684701, 'samples': 1465920, 'steps': 7634, 'loss/train': 1.8960446119308472} -11/06/2021 22:18:57 - INFO - __main__ - Step 7636: {'lr': 0.0004982136921759385, 'samples': 1466112, 'steps': 7635, 'loss/train': 1.77176833152771} -11/06/2021 22:18:57 - INFO - __main__ - Step 7637: {'lr': 0.0004982130588715657, 'samples': 1466304, 'steps': 7636, 'loss/train': 1.8046529293060303} -11/06/2021 22:18:58 - INFO - __main__ - Step 7638: {'lr': 0.000498212425455352, 'samples': 1466496, 'steps': 7637, 'loss/train': 1.6778465509414673} -11/06/2021 22:18:58 - INFO - __main__ - Step 7639: {'lr': 0.0004982117919272975, 'samples': 1466688, 'steps': 7638, 'loss/train': 1.662865400314331} -11/06/2021 22:18:59 - INFO - __main__ - Step 7640: {'lr': 0.0004982111582874026, 'samples': 1466880, 'steps': 7639, 'loss/train': 1.8962922096252441} -11/06/2021 22:18:59 - INFO - __main__ - Step 7641: {'lr': 0.0004982105245356676, 'samples': 1467072, 'steps': 7640, 'loss/train': 1.8994383811950684} -11/06/2021 22:19:00 - INFO - __main__ - Step 7642: {'lr': 0.0004982098906720928, 'samples': 1467264, 'steps': 7641, 'loss/train': 1.8286490440368652} -11/06/2021 22:19:00 - INFO - __main__ - Step 7643: {'lr': 0.0004982092566966785, 'samples': 1467456, 'steps': 7642, 'loss/train': 1.5329943895339966} -11/06/2021 22:19:01 - INFO - __main__ - Step 7644: {'lr': 0.0004982086226094248, 'samples': 1467648, 'steps': 7643, 'loss/train': 2.1548547744750977} -11/06/2021 22:19:01 - INFO - __main__ - Step 7645: {'lr': 0.0004982079884103322, 'samples': 1467840, 'steps': 7644, 'loss/train': 2.1634531021118164} -11/06/2021 22:19:02 - INFO - __main__ - Step 7646: {'lr': 0.0004982073540994009, 'samples': 1468032, 'steps': 7645, 'loss/train': 2.008009195327759} -11/06/2021 22:19:02 - INFO - __main__ - Step 7647: {'lr': 0.0004982067196766312, 'samples': 1468224, 'steps': 7646, 'loss/train': 1.8204351663589478} -11/06/2021 22:19:03 - INFO - __main__ - Step 7648: {'lr': 0.0004982060851420235, 'samples': 1468416, 'steps': 7647, 'loss/train': 2.1249916553497314} -11/06/2021 22:19:03 - INFO - __main__ - Step 7649: {'lr': 0.0004982054504955778, 'samples': 1468608, 'steps': 7648, 'loss/train': 1.6242306232452393} -11/06/2021 22:19:03 - INFO - __main__ - Step 7650: {'lr': 0.0004982048157372946, 'samples': 1468800, 'steps': 7649, 'loss/train': 1.693130612373352} -11/06/2021 22:19:04 - INFO - __main__ - Step 7651: {'lr': 0.0004982041808671741, 'samples': 1468992, 'steps': 7650, 'loss/train': 2.0973668098449707} -11/06/2021 22:19:05 - INFO - __main__ - Step 7652: {'lr': 0.0004982035458852168, 'samples': 1469184, 'steps': 7651, 'loss/train': 2.164299488067627} -11/06/2021 22:19:05 - INFO - __main__ - Step 7653: {'lr': 0.0004982029107914226, 'samples': 1469376, 'steps': 7652, 'loss/train': 2.062432289123535} -11/06/2021 22:19:05 - INFO - __main__ - Step 7654: {'lr': 0.0004982022755857921, 'samples': 1469568, 'steps': 7653, 'loss/train': 2.0671913623809814} -11/06/2021 22:19:06 - INFO - __main__ - Step 7655: {'lr': 0.0004982016402683255, 'samples': 1469760, 'steps': 7654, 'loss/train': 2.361668348312378} -11/06/2021 22:19:06 - INFO - __main__ - Step 7656: {'lr': 0.000498201004839023, 'samples': 1469952, 'steps': 7655, 'loss/train': 1.3417774438858032} -11/06/2021 22:19:07 - INFO - __main__ - Step 7657: {'lr': 0.000498200369297885, 'samples': 1470144, 'steps': 7656, 'loss/train': 1.8992770910263062} -11/06/2021 22:19:08 - INFO - __main__ - Step 7658: {'lr': 0.0004981997336449118, 'samples': 1470336, 'steps': 7657, 'loss/train': 1.9563990831375122} -11/06/2021 22:19:08 - INFO - __main__ - Step 7659: {'lr': 0.0004981990978801035, 'samples': 1470528, 'steps': 7658, 'loss/train': 2.046013593673706} -11/06/2021 22:19:08 - INFO - __main__ - Step 7660: {'lr': 0.0004981984620034606, 'samples': 1470720, 'steps': 7659, 'loss/train': 1.6640254259109497} -11/06/2021 22:19:09 - INFO - __main__ - Step 7661: {'lr': 0.0004981978260149833, 'samples': 1470912, 'steps': 7660, 'loss/train': 1.9074742794036865} -11/06/2021 22:19:10 - INFO - __main__ - Step 7662: {'lr': 0.0004981971899146719, 'samples': 1471104, 'steps': 7661, 'loss/train': 2.0889925956726074} -11/06/2021 22:19:10 - INFO - __main__ - Step 7663: {'lr': 0.0004981965537025267, 'samples': 1471296, 'steps': 7662, 'loss/train': 2.0140273571014404} -11/06/2021 22:19:10 - INFO - __main__ - Step 7664: {'lr': 0.000498195917378548, 'samples': 1471488, 'steps': 7663, 'loss/train': 1.5945501327514648} -11/06/2021 22:19:11 - INFO - __main__ - Step 7665: {'lr': 0.0004981952809427359, 'samples': 1471680, 'steps': 7664, 'loss/train': 1.7172966003417969} -11/06/2021 22:19:11 - INFO - __main__ - Step 7666: {'lr': 0.0004981946443950909, 'samples': 1471872, 'steps': 7665, 'loss/train': 1.3649691343307495} -11/06/2021 22:19:12 - INFO - __main__ - Step 7667: {'lr': 0.0004981940077356132, 'samples': 1472064, 'steps': 7666, 'loss/train': 0.8751164674758911} -11/06/2021 22:19:12 - INFO - __main__ - Step 7668: {'lr': 0.0004981933709643032, 'samples': 1472256, 'steps': 7667, 'loss/train': 1.916032314300537} -11/06/2021 22:19:13 - INFO - __main__ - Step 7669: {'lr': 0.000498192734081161, 'samples': 1472448, 'steps': 7668, 'loss/train': 1.9548919200897217} -11/06/2021 22:19:13 - INFO - __main__ - Step 7670: {'lr': 0.000498192097086187, 'samples': 1472640, 'steps': 7669, 'loss/train': 1.8466298580169678} -11/06/2021 22:19:13 - INFO - __main__ - Step 7671: {'lr': 0.0004981914599793816, 'samples': 1472832, 'steps': 7670, 'loss/train': 3.0567245483398438} -11/06/2021 22:19:14 - INFO - __main__ - Step 7672: {'lr': 0.0004981908227607448, 'samples': 1473024, 'steps': 7671, 'loss/train': 1.7764103412628174} -11/06/2021 22:19:15 - INFO - __main__ - Step 7673: {'lr': 0.0004981901854302771, 'samples': 1473216, 'steps': 7672, 'loss/train': 2.425710678100586} -11/06/2021 22:19:15 - INFO - __main__ - Step 7674: {'lr': 0.0004981895479879787, 'samples': 1473408, 'steps': 7673, 'loss/train': 1.5297969579696655} -11/06/2021 22:19:15 - INFO - __main__ - Step 7675: {'lr': 0.0004981889104338499, 'samples': 1473600, 'steps': 7674, 'loss/train': 1.673049807548523} -11/06/2021 22:19:16 - INFO - __main__ - Step 7676: {'lr': 0.0004981882727678912, 'samples': 1473792, 'steps': 7675, 'loss/train': 1.8792694807052612} -11/06/2021 22:19:17 - INFO - __main__ - Step 7677: {'lr': 0.0004981876349901025, 'samples': 1473984, 'steps': 7676, 'loss/train': 1.6450796127319336} -11/06/2021 22:19:17 - INFO - __main__ - Step 7678: {'lr': 0.0004981869971004843, 'samples': 1474176, 'steps': 7677, 'loss/train': 1.8612487316131592} -11/06/2021 22:19:18 - INFO - __main__ - Step 7679: {'lr': 0.0004981863590990369, 'samples': 1474368, 'steps': 7678, 'loss/train': 1.9628400802612305} -11/06/2021 22:19:18 - INFO - __main__ - Step 7680: {'lr': 0.0004981857209857605, 'samples': 1474560, 'steps': 7679, 'loss/train': 2.1773593425750732} -11/06/2021 22:19:18 - INFO - __main__ - Step 7681: {'lr': 0.0004981850827606556, 'samples': 1474752, 'steps': 7680, 'loss/train': 2.009646415710449} -11/06/2021 22:19:19 - INFO - __main__ - Step 7682: {'lr': 0.0004981844444237223, 'samples': 1474944, 'steps': 7681, 'loss/train': 1.6620737314224243} -11/06/2021 22:19:20 - INFO - __main__ - Step 7683: {'lr': 0.0004981838059749607, 'samples': 1475136, 'steps': 7682, 'loss/train': 1.8136749267578125} -11/06/2021 22:19:20 - INFO - __main__ - Step 7684: {'lr': 0.0004981831674143716, 'samples': 1475328, 'steps': 7683, 'loss/train': 2.1339547634124756} -11/06/2021 22:19:20 - INFO - __main__ - Step 7685: {'lr': 0.0004981825287419549, 'samples': 1475520, 'steps': 7684, 'loss/train': 1.375860571861267} -11/06/2021 22:19:21 - INFO - __main__ - Step 7686: {'lr': 0.0004981818899577108, 'samples': 1475712, 'steps': 7685, 'loss/train': 1.8953708410263062} -11/06/2021 22:19:21 - INFO - __main__ - Step 7687: {'lr': 0.0004981812510616399, 'samples': 1475904, 'steps': 7686, 'loss/train': 1.9942034482955933} -11/06/2021 22:19:22 - INFO - __main__ - Step 7688: {'lr': 0.0004981806120537424, 'samples': 1476096, 'steps': 7687, 'loss/train': 1.7413487434387207} -11/06/2021 22:19:22 - INFO - __main__ - Step 7689: {'lr': 0.0004981799729340185, 'samples': 1476288, 'steps': 7688, 'loss/train': 1.861914038658142} -11/06/2021 22:19:23 - INFO - __main__ - Step 7690: {'lr': 0.0004981793337024685, 'samples': 1476480, 'steps': 7689, 'loss/train': 1.644492745399475} -11/06/2021 22:19:23 - INFO - __main__ - Step 7691: {'lr': 0.0004981786943590928, 'samples': 1476672, 'steps': 7690, 'loss/train': 1.96816885471344} -11/06/2021 22:19:24 - INFO - __main__ - Step 7692: {'lr': 0.0004981780549038916, 'samples': 1476864, 'steps': 7691, 'loss/train': 1.6738519668579102} -11/06/2021 22:19:25 - INFO - __main__ - Step 7693: {'lr': 0.0004981774153368651, 'samples': 1477056, 'steps': 7692, 'loss/train': 1.7269313335418701} -11/06/2021 22:19:25 - INFO - __main__ - Step 7694: {'lr': 0.0004981767756580138, 'samples': 1477248, 'steps': 7693, 'loss/train': 1.7965588569641113} -11/06/2021 22:19:25 - INFO - __main__ - Step 7695: {'lr': 0.0004981761358673378, 'samples': 1477440, 'steps': 7694, 'loss/train': 2.0630042552948} -11/06/2021 22:19:26 - INFO - __main__ - Step 7696: {'lr': 0.0004981754959648376, 'samples': 1477632, 'steps': 7695, 'loss/train': 1.89278244972229} -11/06/2021 22:19:26 - INFO - __main__ - Step 7697: {'lr': 0.0004981748559505131, 'samples': 1477824, 'steps': 7696, 'loss/train': 1.7540265321731567} -11/06/2021 22:19:27 - INFO - __main__ - Step 7698: {'lr': 0.0004981742158243651, 'samples': 1478016, 'steps': 7697, 'loss/train': 1.4253634214401245} -11/06/2021 22:19:27 - INFO - __main__ - Step 7699: {'lr': 0.0004981735755863934, 'samples': 1478208, 'steps': 7698, 'loss/train': 2.059159517288208} -11/06/2021 22:19:28 - INFO - __main__ - Step 7700: {'lr': 0.0004981729352365986, 'samples': 1478400, 'steps': 7699, 'loss/train': 1.953817367553711} -11/06/2021 22:19:28 - INFO - __main__ - Step 7701: {'lr': 0.0004981722947749811, 'samples': 1478592, 'steps': 7700, 'loss/train': 1.9342195987701416} -11/06/2021 22:19:28 - INFO - __main__ - Step 7702: {'lr': 0.0004981716542015408, 'samples': 1478784, 'steps': 7701, 'loss/train': 1.841950535774231} -11/06/2021 22:19:29 - INFO - __main__ - Step 7703: {'lr': 0.0004981710135162781, 'samples': 1478976, 'steps': 7702, 'loss/train': 1.5683513879776} -11/06/2021 22:19:30 - INFO - __main__ - Step 7704: {'lr': 0.0004981703727191935, 'samples': 1479168, 'steps': 7703, 'loss/train': 1.7264535427093506} -11/06/2021 22:19:30 - INFO - __main__ - Step 7705: {'lr': 0.0004981697318102872, 'samples': 1479360, 'steps': 7704, 'loss/train': 2.026911973953247} -11/06/2021 22:19:31 - INFO - __main__ - Step 7706: {'lr': 0.0004981690907895594, 'samples': 1479552, 'steps': 7705, 'loss/train': 1.9870184659957886} -11/06/2021 22:19:31 - INFO - __main__ - Step 7707: {'lr': 0.0004981684496570104, 'samples': 1479744, 'steps': 7706, 'loss/train': 1.9878273010253906} -11/06/2021 22:19:31 - INFO - __main__ - Step 7708: {'lr': 0.0004981678084126405, 'samples': 1479936, 'steps': 7707, 'loss/train': 1.5540006160736084} -11/06/2021 22:19:32 - INFO - __main__ - Step 7709: {'lr': 0.0004981671670564502, 'samples': 1480128, 'steps': 7708, 'loss/train': 1.544403314590454} -11/06/2021 22:19:33 - INFO - __main__ - Step 7710: {'lr': 0.0004981665255884394, 'samples': 1480320, 'steps': 7709, 'loss/train': 2.273404598236084} -11/06/2021 22:19:33 - INFO - __main__ - Step 7711: {'lr': 0.0004981658840086087, 'samples': 1480512, 'steps': 7710, 'loss/train': 2.1462695598602295} -11/06/2021 22:19:33 - INFO - __main__ - Step 7712: {'lr': 0.0004981652423169582, 'samples': 1480704, 'steps': 7711, 'loss/train': 1.3098105192184448} -11/06/2021 22:19:34 - INFO - __main__ - Step 7713: {'lr': 0.0004981646005134884, 'samples': 1480896, 'steps': 7712, 'loss/train': 1.9249402284622192} -11/06/2021 22:19:35 - INFO - __main__ - Step 7714: {'lr': 0.0004981639585981993, 'samples': 1481088, 'steps': 7713, 'loss/train': 1.955265760421753} -11/06/2021 22:19:35 - INFO - __main__ - Step 7715: {'lr': 0.0004981633165710914, 'samples': 1481280, 'steps': 7714, 'loss/train': 2.254359722137451} -11/06/2021 22:19:35 - INFO - __main__ - Step 7716: {'lr': 0.000498162674432165, 'samples': 1481472, 'steps': 7715, 'loss/train': 1.0957801342010498} -11/06/2021 22:19:36 - INFO - __main__ - Step 7717: {'lr': 0.0004981620321814203, 'samples': 1481664, 'steps': 7716, 'loss/train': 1.9144853353500366} -11/06/2021 22:19:36 - INFO - __main__ - Step 7718: {'lr': 0.0004981613898188576, 'samples': 1481856, 'steps': 7717, 'loss/train': 1.7931559085845947} -11/06/2021 22:19:37 - INFO - __main__ - Step 7719: {'lr': 0.0004981607473444772, 'samples': 1482048, 'steps': 7718, 'loss/train': 1.8735288381576538} -11/06/2021 22:19:37 - INFO - __main__ - Step 7720: {'lr': 0.0004981601047582794, 'samples': 1482240, 'steps': 7719, 'loss/train': 1.727927327156067} -11/06/2021 22:19:38 - INFO - __main__ - Step 7721: {'lr': 0.0004981594620602645, 'samples': 1482432, 'steps': 7720, 'loss/train': 1.948897361755371} -11/06/2021 22:19:38 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 0.8639780879020691} -11/06/2021 22:19:38 - INFO - __main__ - Step 7723: {'lr': 0.0004981581763287845, 'samples': 1482816, 'steps': 7722, 'loss/train': 2.073319673538208} -11/06/2021 22:19:39 - INFO - __main__ - Step 7724: {'lr': 0.0004981575332953201, 'samples': 1483008, 'steps': 7723, 'loss/train': 1.5656884908676147} -11/06/2021 22:19:40 - INFO - __main__ - Step 7725: {'lr': 0.0004981568901500396, 'samples': 1483200, 'steps': 7724, 'loss/train': 1.949126124382019} -11/06/2021 22:19:40 - INFO - __main__ - Step 7726: {'lr': 0.0004981562468929435, 'samples': 1483392, 'steps': 7725, 'loss/train': 2.107515811920166} -11/06/2021 22:19:40 - INFO - __main__ - Step 7727: {'lr': 0.000498155603524032, 'samples': 1483584, 'steps': 7726, 'loss/train': 1.8496572971343994} -11/06/2021 22:19:41 - INFO - __main__ - Step 7728: {'lr': 0.0004981549600433054, 'samples': 1483776, 'steps': 7727, 'loss/train': 2.109135627746582} -11/06/2021 22:19:42 - INFO - __main__ - Step 7729: {'lr': 0.000498154316450764, 'samples': 1483968, 'steps': 7728, 'loss/train': 1.3323477506637573} -11/06/2021 22:19:43 - INFO - __main__ - Step 7730: {'lr': 0.0004981536727464082, 'samples': 1484160, 'steps': 7729, 'loss/train': 1.855273962020874} -11/06/2021 22:19:43 - INFO - __main__ - Step 7731: {'lr': 0.0004981530289302381, 'samples': 1484352, 'steps': 7730, 'loss/train': 0.4355550706386566} -11/06/2021 22:19:43 - INFO - __main__ - Step 7732: {'lr': 0.000498152385002254, 'samples': 1484544, 'steps': 7731, 'loss/train': 2.0949268341064453} -11/06/2021 22:19:44 - INFO - __main__ - Step 7733: {'lr': 0.0004981517409624564, 'samples': 1484736, 'steps': 7732, 'loss/train': 2.226652145385742} -11/06/2021 22:19:44 - INFO - __main__ - Step 7734: {'lr': 0.0004981510968108453, 'samples': 1484928, 'steps': 7733, 'loss/train': 2.1331582069396973} -11/06/2021 22:19:45 - INFO - __main__ - Step 7735: {'lr': 0.0004981504525474214, 'samples': 1485120, 'steps': 7734, 'loss/train': 1.9985811710357666} -11/06/2021 22:19:45 - INFO - __main__ - Step 7736: {'lr': 0.0004981498081721845, 'samples': 1485312, 'steps': 7735, 'loss/train': 2.0506227016448975} -11/06/2021 22:19:46 - INFO - __main__ - Step 7737: {'lr': 0.0004981491636851351, 'samples': 1485504, 'steps': 7736, 'loss/train': 1.7922340631484985} -11/06/2021 22:19:46 - INFO - __main__ - Step 7738: {'lr': 0.0004981485190862737, 'samples': 1485696, 'steps': 7737, 'loss/train': 1.6075444221496582} -11/06/2021 22:19:46 - INFO - __main__ - Step 7739: {'lr': 0.0004981478743756004, 'samples': 1485888, 'steps': 7738, 'loss/train': 1.6328068971633911} -11/06/2021 22:19:47 - INFO - __main__ - Step 7740: {'lr': 0.0004981472295531153, 'samples': 1486080, 'steps': 7739, 'loss/train': 2.0658867359161377} -11/06/2021 22:19:48 - INFO - __main__ - Step 7741: {'lr': 0.000498146584618819, 'samples': 1486272, 'steps': 7740, 'loss/train': 2.0356781482696533} -11/06/2021 22:19:48 - INFO - __main__ - Step 7742: {'lr': 0.0004981459395727117, 'samples': 1486464, 'steps': 7741, 'loss/train': 2.1248600482940674} -11/06/2021 22:19:49 - INFO - __main__ - Step 7743: {'lr': 0.0004981452944147937, 'samples': 1486656, 'steps': 7742, 'loss/train': 2.0457077026367188} -11/06/2021 22:19:49 - INFO - __main__ - Step 7744: {'lr': 0.0004981446491450652, 'samples': 1486848, 'steps': 7743, 'loss/train': 2.0596790313720703} -11/06/2021 22:19:50 - INFO - __main__ - Step 7745: {'lr': 0.0004981440037635266, 'samples': 1487040, 'steps': 7744, 'loss/train': 1.76706862449646} -11/06/2021 22:19:50 - INFO - __main__ - Step 7746: {'lr': 0.0004981433582701781, 'samples': 1487232, 'steps': 7745, 'loss/train': 1.9943227767944336} -11/06/2021 22:19:51 - INFO - __main__ - Step 7747: {'lr': 0.00049814271266502, 'samples': 1487424, 'steps': 7746, 'loss/train': 1.9205338954925537} -11/06/2021 22:19:51 - INFO - __main__ - Step 7748: {'lr': 0.0004981420669480526, 'samples': 1487616, 'steps': 7747, 'loss/train': 1.346489667892456} -11/06/2021 22:19:51 - INFO - __main__ - Step 7749: {'lr': 0.0004981414211192763, 'samples': 1487808, 'steps': 7748, 'loss/train': 2.3146755695343018} -11/06/2021 22:19:52 - INFO - __main__ - Step 7750: {'lr': 0.0004981407751786913, 'samples': 1488000, 'steps': 7749, 'loss/train': 1.654209852218628} -11/06/2021 22:19:53 - INFO - __main__ - Step 7751: {'lr': 0.0004981401291262979, 'samples': 1488192, 'steps': 7750, 'loss/train': 0.34622922539711} -11/06/2021 22:19:53 - INFO - __main__ - Step 7752: {'lr': 0.0004981394829620963, 'samples': 1488384, 'steps': 7751, 'loss/train': 1.7355235815048218} -11/06/2021 22:19:53 - INFO - __main__ - Step 7753: {'lr': 0.0004981388366860869, 'samples': 1488576, 'steps': 7752, 'loss/train': 1.484642744064331} -11/06/2021 22:19:54 - INFO - __main__ - Step 7754: {'lr': 0.0004981381902982702, 'samples': 1488768, 'steps': 7753, 'loss/train': 1.2855114936828613} -11/06/2021 22:19:54 - INFO - __main__ - Step 7755: {'lr': 0.0004981375437986459, 'samples': 1488960, 'steps': 7754, 'loss/train': 1.6895129680633545} -11/06/2021 22:19:55 - INFO - __main__ - Step 7756: {'lr': 0.0004981368971872149, 'samples': 1489152, 'steps': 7755, 'loss/train': 1.9353357553482056} -11/06/2021 22:19:55 - INFO - __main__ - Step 7757: {'lr': 0.0004981362504639772, 'samples': 1489344, 'steps': 7756, 'loss/train': 1.9244894981384277} -11/06/2021 22:19:56 - INFO - __main__ - Step 7758: {'lr': 0.0004981356036289331, 'samples': 1489536, 'steps': 7757, 'loss/train': 1.332854151725769} -11/06/2021 22:19:56 - INFO - __main__ - Step 7759: {'lr': 0.0004981349566820828, 'samples': 1489728, 'steps': 7758, 'loss/train': 1.9951647520065308} -11/06/2021 22:19:57 - INFO - __main__ - Step 7760: {'lr': 0.0004981343096234268, 'samples': 1489920, 'steps': 7759, 'loss/train': 1.7065505981445312} -11/06/2021 22:19:58 - INFO - __main__ - Step 7761: {'lr': 0.0004981336624529654, 'samples': 1490112, 'steps': 7760, 'loss/train': 1.5033037662506104} -11/06/2021 22:19:58 - INFO - __main__ - Step 7762: {'lr': 0.0004981330151706988, 'samples': 1490304, 'steps': 7761, 'loss/train': 1.2406482696533203} -11/06/2021 22:19:58 - INFO - __main__ - Step 7763: {'lr': 0.0004981323677766273, 'samples': 1490496, 'steps': 7762, 'loss/train': 2.313772678375244} -11/06/2021 22:19:59 - INFO - __main__ - Step 7764: {'lr': 0.000498131720270751, 'samples': 1490688, 'steps': 7763, 'loss/train': 1.9050623178482056} -11/06/2021 22:19:59 - INFO - __main__ - Step 7765: {'lr': 0.0004981310726530706, 'samples': 1490880, 'steps': 7764, 'loss/train': 1.5810691118240356} -11/06/2021 22:20:00 - INFO - __main__ - Step 7766: {'lr': 0.0004981304249235861, 'samples': 1491072, 'steps': 7765, 'loss/train': 1.6522554159164429} -11/06/2021 22:20:00 - INFO - __main__ - Step 7767: {'lr': 0.0004981297770822977, 'samples': 1491264, 'steps': 7766, 'loss/train': 2.1629531383514404} -11/06/2021 22:20:01 - INFO - __main__ - Step 7768: {'lr': 0.0004981291291292061, 'samples': 1491456, 'steps': 7767, 'loss/train': 2.0148024559020996} -11/06/2021 22:20:01 - INFO - __main__ - Step 7769: {'lr': 0.0004981284810643112, 'samples': 1491648, 'steps': 7768, 'loss/train': 1.8133976459503174} -11/06/2021 22:20:01 - INFO - __main__ - Step 7770: {'lr': 0.0004981278328876134, 'samples': 1491840, 'steps': 7769, 'loss/train': 1.844529151916504} -11/06/2021 22:20:02 - INFO - __main__ - Step 7771: {'lr': 0.0004981271845991131, 'samples': 1492032, 'steps': 7770, 'loss/train': 1.6602436304092407} -11/06/2021 22:20:03 - INFO - __main__ - Step 7772: {'lr': 0.0004981265361988105, 'samples': 1492224, 'steps': 7771, 'loss/train': 1.7457406520843506} -11/06/2021 22:20:03 - INFO - __main__ - Step 7773: {'lr': 0.000498125887686706, 'samples': 1492416, 'steps': 7772, 'loss/train': 1.8187391757965088} -11/06/2021 22:20:03 - INFO - __main__ - Step 7774: {'lr': 0.0004981252390627997, 'samples': 1492608, 'steps': 7773, 'loss/train': 2.382383108139038} -11/06/2021 22:20:04 - INFO - __main__ - Step 7775: {'lr': 0.000498124590327092, 'samples': 1492800, 'steps': 7774, 'loss/train': 2.054161310195923} -11/06/2021 22:20:05 - INFO - __main__ - Step 7776: {'lr': 0.0004981239414795832, 'samples': 1492992, 'steps': 7775, 'loss/train': 1.5990222692489624} -11/06/2021 22:20:05 - INFO - __main__ - Step 7777: {'lr': 0.0004981232925202736, 'samples': 1493184, 'steps': 7776, 'loss/train': 1.856432318687439} -11/06/2021 22:20:06 - INFO - __main__ - Step 7778: {'lr': 0.0004981226434491635, 'samples': 1493376, 'steps': 7777, 'loss/train': 1.7675282955169678} -11/06/2021 22:20:06 - INFO - __main__ - Step 7779: {'lr': 0.000498121994266253, 'samples': 1493568, 'steps': 7778, 'loss/train': 1.9787876605987549} -11/06/2021 22:20:07 - INFO - __main__ - Step 7780: {'lr': 0.0004981213449715427, 'samples': 1493760, 'steps': 7779, 'loss/train': 2.1368026733398438} -11/06/2021 22:20:07 - INFO - __main__ - Step 7781: {'lr': 0.0004981206955650328, 'samples': 1493952, 'steps': 7780, 'loss/train': 1.7741491794586182} -11/06/2021 22:20:08 - INFO - __main__ - Step 7782: {'lr': 0.0004981200460467234, 'samples': 1494144, 'steps': 7781, 'loss/train': 1.8448156118392944} -11/06/2021 22:20:08 - INFO - __main__ - Step 7783: {'lr': 0.0004981193964166151, 'samples': 1494336, 'steps': 7782, 'loss/train': 2.476020097732544} -11/06/2021 22:20:09 - INFO - __main__ - Step 7784: {'lr': 0.0004981187466747079, 'samples': 1494528, 'steps': 7783, 'loss/train': 1.604864478111267} -11/06/2021 22:20:09 - INFO - __main__ - Step 7785: {'lr': 0.0004981180968210023, 'samples': 1494720, 'steps': 7784, 'loss/train': 1.6935956478118896} -11/06/2021 22:20:09 - INFO - __main__ - Step 7786: {'lr': 0.0004981174468554984, 'samples': 1494912, 'steps': 7785, 'loss/train': 1.7149159908294678} -11/06/2021 22:20:10 - INFO - __main__ - Step 7787: {'lr': 0.0004981167967781968, 'samples': 1495104, 'steps': 7786, 'loss/train': 1.5972424745559692} -11/06/2021 22:20:11 - INFO - __main__ - Step 7788: {'lr': 0.0004981161465890975, 'samples': 1495296, 'steps': 7787, 'loss/train': 1.8924384117126465} -11/06/2021 22:20:11 - INFO - __main__ - Step 7789: {'lr': 0.0004981154962882008, 'samples': 1495488, 'steps': 7788, 'loss/train': 2.01082444190979} -11/06/2021 22:20:11 - INFO - __main__ - Step 7790: {'lr': 0.0004981148458755071, 'samples': 1495680, 'steps': 7789, 'loss/train': 2.0022146701812744} -11/06/2021 22:20:12 - INFO - __main__ - Step 7791: {'lr': 0.0004981141953510169, 'samples': 1495872, 'steps': 7790, 'loss/train': 1.9454317092895508} -11/06/2021 22:20:13 - INFO - __main__ - Step 7792: {'lr': 0.00049811354471473, 'samples': 1496064, 'steps': 7791, 'loss/train': 1.6417571306228638} -11/06/2021 22:20:13 - INFO - __main__ - Step 7793: {'lr': 0.0004981128939666471, 'samples': 1496256, 'steps': 7792, 'loss/train': 2.925060510635376} -11/06/2021 22:20:13 - INFO - __main__ - Step 7794: {'lr': 0.0004981122431067683, 'samples': 1496448, 'steps': 7793, 'loss/train': 2.0619399547576904} -11/06/2021 22:20:14 - INFO - __main__ - Step 7795: {'lr': 0.0004981115921350941, 'samples': 1496640, 'steps': 7794, 'loss/train': 1.3753095865249634} -11/06/2021 22:20:14 - INFO - __main__ - Step 7796: {'lr': 0.0004981109410516245, 'samples': 1496832, 'steps': 7795, 'loss/train': 1.4551738500595093} -11/06/2021 22:20:15 - INFO - __main__ - Step 7797: {'lr': 0.00049811028985636, 'samples': 1497024, 'steps': 7796, 'loss/train': 2.0298280715942383} -11/06/2021 22:20:15 - INFO - __main__ - Step 7798: {'lr': 0.0004981096385493007, 'samples': 1497216, 'steps': 7797, 'loss/train': 1.5669386386871338} -11/06/2021 22:20:16 - INFO - __main__ - Step 7799: {'lr': 0.0004981089871304472, 'samples': 1497408, 'steps': 7798, 'loss/train': 1.8886076211929321} -11/06/2021 22:20:16 - INFO - __main__ - Step 7800: {'lr': 0.0004981083355997995, 'samples': 1497600, 'steps': 7799, 'loss/train': 2.574296236038208} -11/06/2021 22:20:16 - INFO - __main__ - Step 7801: {'lr': 0.0004981076839573581, 'samples': 1497792, 'steps': 7800, 'loss/train': 0.9300814867019653} -11/06/2021 22:20:18 - INFO - __main__ - Step 7802: {'lr': 0.0004981070322031231, 'samples': 1497984, 'steps': 7801, 'loss/train': 1.7975281476974487} -11/06/2021 22:20:18 - INFO - __main__ - Step 7803: {'lr': 0.000498106380337095, 'samples': 1498176, 'steps': 7802, 'loss/train': 1.889115810394287} -11/06/2021 22:20:18 - INFO - __main__ - Step 7804: {'lr': 0.000498105728359274, 'samples': 1498368, 'steps': 7803, 'loss/train': 1.7939035892486572} -11/06/2021 22:20:19 - INFO - __main__ - Step 7805: {'lr': 0.0004981050762696604, 'samples': 1498560, 'steps': 7804, 'loss/train': 0.8266537189483643} -11/06/2021 22:20:19 - INFO - __main__ - Step 7806: {'lr': 0.0004981044240682544, 'samples': 1498752, 'steps': 7805, 'loss/train': 1.2602494955062866} -11/06/2021 22:20:19 - INFO - __main__ - Step 7807: {'lr': 0.0004981037717550564, 'samples': 1498944, 'steps': 7806, 'loss/train': 1.8031574487686157} -11/06/2021 22:20:20 - INFO - __main__ - Step 7808: {'lr': 0.0004981031193300667, 'samples': 1499136, 'steps': 7807, 'loss/train': 1.0529712438583374} -11/06/2021 22:20:21 - INFO - __main__ - Step 7809: {'lr': 0.0004981024667932855, 'samples': 1499328, 'steps': 7808, 'loss/train': 2.0406086444854736} -11/06/2021 22:20:21 - INFO - __main__ - Step 7810: {'lr': 0.0004981018141447133, 'samples': 1499520, 'steps': 7809, 'loss/train': 2.1355226039886475} -11/06/2021 22:20:21 - INFO - __main__ - Step 7811: {'lr': 0.00049810116138435, 'samples': 1499712, 'steps': 7810, 'loss/train': 1.709943413734436} -11/06/2021 22:20:22 - INFO - __main__ - Step 7812: {'lr': 0.0004981005085121963, 'samples': 1499904, 'steps': 7811, 'loss/train': 2.1915555000305176} -11/06/2021 22:20:23 - INFO - __main__ - Step 7813: {'lr': 0.0004980998555282524, 'samples': 1500096, 'steps': 7812, 'loss/train': 1.9955559968948364} -11/06/2021 22:20:23 - INFO - __main__ - Step 7814: {'lr': 0.0004980992024325185, 'samples': 1500288, 'steps': 7813, 'loss/train': 1.8444761037826538} -11/06/2021 22:20:24 - INFO - __main__ - Step 7815: {'lr': 0.0004980985492249949, 'samples': 1500480, 'steps': 7814, 'loss/train': 1.2955152988433838} -11/06/2021 22:20:24 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 2.804755926132202} -11/06/2021 22:20:24 - INFO - __main__ - Step 7817: {'lr': 0.0004980972424745798, 'samples': 1500864, 'steps': 7816, 'loss/train': 2.022976875305176} -11/06/2021 22:20:26 - INFO - __main__ - Step 7818: {'lr': 0.000498096588931689, 'samples': 1501056, 'steps': 7817, 'loss/train': 1.9922711849212646} -11/06/2021 22:20:26 - INFO - __main__ - Step 7819: {'lr': 0.0004980959352770095, 'samples': 1501248, 'steps': 7818, 'loss/train': 2.2206287384033203} -11/06/2021 22:20:27 - INFO - __main__ - Step 7820: {'lr': 0.000498095281510542, 'samples': 1501440, 'steps': 7819, 'loss/train': 2.107832908630371} -11/06/2021 22:20:27 - INFO - __main__ - Step 7821: {'lr': 0.0004980946276322866, 'samples': 1501632, 'steps': 7820, 'loss/train': 2.020620822906494} -11/06/2021 22:20:27 - INFO - __main__ - Step 7822: {'lr': 0.0004980939736422436, 'samples': 1501824, 'steps': 7821, 'loss/train': 1.574951410293579} -11/06/2021 22:20:28 - INFO - __main__ - Step 7823: {'lr': 0.0004980933195404131, 'samples': 1502016, 'steps': 7822, 'loss/train': 1.5748287439346313} -11/06/2021 22:20:29 - INFO - __main__ - Step 7824: {'lr': 0.0004980926653267957, 'samples': 1502208, 'steps': 7823, 'loss/train': 2.000244617462158} -11/06/2021 22:20:29 - INFO - __main__ - Step 7825: {'lr': 0.0004980920110013915, 'samples': 1502400, 'steps': 7824, 'loss/train': 1.830479383468628} -11/06/2021 22:20:29 - INFO - __main__ - Step 7826: {'lr': 0.000498091356564201, 'samples': 1502592, 'steps': 7825, 'loss/train': 2.059532880783081} -11/06/2021 22:20:30 - INFO - __main__ - Step 7827: {'lr': 0.0004980907020152242, 'samples': 1502784, 'steps': 7826, 'loss/train': 2.0572545528411865} -11/06/2021 22:20:30 - INFO - __main__ - Step 7828: {'lr': 0.0004980900473544617, 'samples': 1502976, 'steps': 7827, 'loss/train': 1.7238388061523438} -11/06/2021 22:20:31 - INFO - __main__ - Step 7829: {'lr': 0.0004980893925819137, 'samples': 1503168, 'steps': 7828, 'loss/train': 1.9951441287994385} -11/06/2021 22:20:31 - INFO - __main__ - Step 7830: {'lr': 0.0004980887376975804, 'samples': 1503360, 'steps': 7829, 'loss/train': 1.7326819896697998} -11/06/2021 22:20:32 - INFO - __main__ - Step 7831: {'lr': 0.000498088082701462, 'samples': 1503552, 'steps': 7830, 'loss/train': 2.2184314727783203} -11/06/2021 22:20:32 - INFO - __main__ - Step 7832: {'lr': 0.0004980874275935591, 'samples': 1503744, 'steps': 7831, 'loss/train': 0.8481667041778564} -11/06/2021 22:20:32 - INFO - __main__ - Step 7833: {'lr': 0.0004980867723738717, 'samples': 1503936, 'steps': 7832, 'loss/train': 1.9760394096374512} -11/06/2021 22:20:34 - INFO - __main__ - Step 7834: {'lr': 0.0004980861170424003, 'samples': 1504128, 'steps': 7833, 'loss/train': 2.106902837753296} -11/06/2021 22:20:34 - INFO - __main__ - Step 7835: {'lr': 0.0004980854615991452, 'samples': 1504320, 'steps': 7834, 'loss/train': 2.3520045280456543} -11/06/2021 22:20:34 - INFO - __main__ - Step 7836: {'lr': 0.0004980848060441064, 'samples': 1504512, 'steps': 7835, 'loss/train': 2.106365442276001} -11/06/2021 22:20:35 - INFO - __main__ - Step 7837: {'lr': 0.0004980841503772846, 'samples': 1504704, 'steps': 7836, 'loss/train': 1.764209270477295} -11/06/2021 22:20:35 - INFO - __main__ - Step 7838: {'lr': 0.0004980834945986799, 'samples': 1504896, 'steps': 7837, 'loss/train': 2.0532870292663574} -11/06/2021 22:20:37 - INFO - __main__ - Step 7839: {'lr': 0.0004980828387082925, 'samples': 1505088, 'steps': 7838, 'loss/train': 2.207231283187866} -11/06/2021 22:20:37 - INFO - __main__ - Step 7840: {'lr': 0.000498082182706123, 'samples': 1505280, 'steps': 7839, 'loss/train': 0.6530503034591675} -11/06/2021 22:20:37 - INFO - __main__ - Step 7841: {'lr': 0.0004980815265921713, 'samples': 1505472, 'steps': 7840, 'loss/train': 0.6378718614578247} -11/06/2021 22:20:38 - INFO - __main__ - Step 7842: {'lr': 0.000498080870366438, 'samples': 1505664, 'steps': 7841, 'loss/train': 1.529860258102417} -11/06/2021 22:20:38 - INFO - __main__ - Step 7843: {'lr': 0.0004980802140289232, 'samples': 1505856, 'steps': 7842, 'loss/train': 1.2913402318954468} -11/06/2021 22:20:39 - INFO - __main__ - Step 7844: {'lr': 0.0004980795575796273, 'samples': 1506048, 'steps': 7843, 'loss/train': 1.243632435798645} -11/06/2021 22:20:39 - INFO - __main__ - Step 7845: {'lr': 0.0004980789010185507, 'samples': 1506240, 'steps': 7844, 'loss/train': 1.593994379043579} -11/06/2021 22:20:40 - INFO - __main__ - Step 7846: {'lr': 0.0004980782443456935, 'samples': 1506432, 'steps': 7845, 'loss/train': 1.4024707078933716} -11/06/2021 22:20:40 - INFO - __main__ - Step 7847: {'lr': 0.000498077587561056, 'samples': 1506624, 'steps': 7846, 'loss/train': 1.6562167406082153} -11/06/2021 22:20:40 - INFO - __main__ - Step 7848: {'lr': 0.0004980769306646386, 'samples': 1506816, 'steps': 7847, 'loss/train': 1.7106425762176514} -11/06/2021 22:20:41 - INFO - __main__ - Step 7849: {'lr': 0.0004980762736564417, 'samples': 1507008, 'steps': 7848, 'loss/train': 2.013291358947754} -11/06/2021 22:20:42 - INFO - __main__ - Step 7850: {'lr': 0.0004980756165364653, 'samples': 1507200, 'steps': 7849, 'loss/train': 2.613538980484009} -11/06/2021 22:20:42 - INFO - __main__ - Step 7851: {'lr': 0.0004980749593047099, 'samples': 1507392, 'steps': 7850, 'loss/train': 1.5560020208358765} -11/06/2021 22:20:43 - INFO - __main__ - Step 7852: {'lr': 0.0004980743019611757, 'samples': 1507584, 'steps': 7851, 'loss/train': 1.659212589263916} -11/06/2021 22:20:43 - INFO - __main__ - Step 7853: {'lr': 0.0004980736445058631, 'samples': 1507776, 'steps': 7852, 'loss/train': 1.3701859712600708} -11/06/2021 22:20:43 - INFO - __main__ - Step 7854: {'lr': 0.0004980729869387724, 'samples': 1507968, 'steps': 7853, 'loss/train': 1.2803887128829956} -11/06/2021 22:20:44 - INFO - __main__ - Step 7855: {'lr': 0.0004980723292599037, 'samples': 1508160, 'steps': 7854, 'loss/train': 1.8908063173294067} -11/06/2021 22:20:45 - INFO - __main__ - Step 7856: {'lr': 0.0004980716714692576, 'samples': 1508352, 'steps': 7855, 'loss/train': 1.353319764137268} -11/06/2021 22:20:45 - INFO - __main__ - Step 7857: {'lr': 0.0004980710135668342, 'samples': 1508544, 'steps': 7856, 'loss/train': 1.9040857553482056} -11/06/2021 22:20:45 - INFO - __main__ - Step 7858: {'lr': 0.0004980703555526338, 'samples': 1508736, 'steps': 7857, 'loss/train': 1.8307812213897705} -11/06/2021 22:20:46 - INFO - __main__ - Step 7859: {'lr': 0.0004980696974266566, 'samples': 1508928, 'steps': 7858, 'loss/train': 1.9307920932769775} -11/06/2021 22:20:47 - INFO - __main__ - Step 7860: {'lr': 0.0004980690391889033, 'samples': 1509120, 'steps': 7859, 'loss/train': 1.5426441431045532} -11/06/2021 22:20:47 - INFO - __main__ - Step 7861: {'lr': 0.0004980683808393737, 'samples': 1509312, 'steps': 7860, 'loss/train': 2.0717623233795166} -11/06/2021 22:20:48 - INFO - __main__ - Step 7862: {'lr': 0.0004980677223780683, 'samples': 1509504, 'steps': 7861, 'loss/train': 1.8097648620605469} -11/06/2021 22:20:48 - INFO - __main__ - Step 7863: {'lr': 0.0004980670638049875, 'samples': 1509696, 'steps': 7862, 'loss/train': 2.1986732482910156} -11/06/2021 22:20:48 - INFO - __main__ - Step 7864: {'lr': 0.0004980664051201315, 'samples': 1509888, 'steps': 7863, 'loss/train': 1.8978809118270874} -11/06/2021 22:20:49 - INFO - __main__ - Step 7865: {'lr': 0.0004980657463235006, 'samples': 1510080, 'steps': 7864, 'loss/train': 2.399979829788208} -11/06/2021 22:20:50 - INFO - __main__ - Step 7866: {'lr': 0.0004980650874150951, 'samples': 1510272, 'steps': 7865, 'loss/train': 2.042692184448242} -11/06/2021 22:20:50 - INFO - __main__ - Step 7867: {'lr': 0.0004980644283949152, 'samples': 1510464, 'steps': 7866, 'loss/train': 1.8365942239761353} -11/06/2021 22:20:50 - INFO - __main__ - Step 7868: {'lr': 0.0004980637692629615, 'samples': 1510656, 'steps': 7867, 'loss/train': 1.6458255052566528} -11/06/2021 22:20:51 - INFO - __main__ - Step 7869: {'lr': 0.0004980631100192339, 'samples': 1510848, 'steps': 7868, 'loss/train': 1.41680908203125} -11/06/2021 22:20:52 - INFO - __main__ - Step 7870: {'lr': 0.000498062450663733, 'samples': 1511040, 'steps': 7869, 'loss/train': 1.9412450790405273} -11/06/2021 22:20:53 - INFO - __main__ - Step 7871: {'lr': 0.000498061791196459, 'samples': 1511232, 'steps': 7870, 'loss/train': 1.4640387296676636} -11/06/2021 22:20:53 - INFO - __main__ - Step 7872: {'lr': 0.0004980611316174122, 'samples': 1511424, 'steps': 7871, 'loss/train': 1.4650890827178955} -11/06/2021 22:20:53 - INFO - __main__ - Step 7873: {'lr': 0.0004980604719265928, 'samples': 1511616, 'steps': 7872, 'loss/train': 1.9281331300735474} -11/06/2021 22:20:54 - INFO - __main__ - Step 7874: {'lr': 0.0004980598121240012, 'samples': 1511808, 'steps': 7873, 'loss/train': 1.7270317077636719} -11/06/2021 22:20:54 - INFO - __main__ - Step 7875: {'lr': 0.0004980591522096377, 'samples': 1512000, 'steps': 7874, 'loss/train': 3.885760545730591} -11/06/2021 22:20:55 - INFO - __main__ - Step 7876: {'lr': 0.0004980584921835025, 'samples': 1512192, 'steps': 7875, 'loss/train': 1.878515362739563} -11/06/2021 22:20:56 - INFO - __main__ - Step 7877: {'lr': 0.000498057832045596, 'samples': 1512384, 'steps': 7876, 'loss/train': 2.0955753326416016} -11/06/2021 22:20:56 - INFO - __main__ - Step 7878: {'lr': 0.0004980571717959186, 'samples': 1512576, 'steps': 7877, 'loss/train': 1.7663307189941406} -11/06/2021 22:20:56 - INFO - __main__ - Step 7879: {'lr': 0.0004980565114344704, 'samples': 1512768, 'steps': 7878, 'loss/train': 2.003199577331543} -11/06/2021 22:20:57 - INFO - __main__ - Step 7880: {'lr': 0.0004980558509612516, 'samples': 1512960, 'steps': 7879, 'loss/train': 1.4468077421188354} -11/06/2021 22:20:58 - INFO - __main__ - Step 7881: {'lr': 0.0004980551903762629, 'samples': 1513152, 'steps': 7880, 'loss/train': 1.9286073446273804} -11/06/2021 22:20:58 - INFO - __main__ - Step 7882: {'lr': 0.0004980545296795043, 'samples': 1513344, 'steps': 7881, 'loss/train': 1.9439208507537842} -11/06/2021 22:20:58 - INFO - __main__ - Step 7883: {'lr': 0.0004980538688709761, 'samples': 1513536, 'steps': 7882, 'loss/train': 1.9707108736038208} -11/06/2021 22:20:59 - INFO - __main__ - Step 7884: {'lr': 0.0004980532079506786, 'samples': 1513728, 'steps': 7883, 'loss/train': 2.4057676792144775} -11/06/2021 22:20:59 - INFO - __main__ - Step 7885: {'lr': 0.0004980525469186122, 'samples': 1513920, 'steps': 7884, 'loss/train': 2.0141124725341797} -11/06/2021 22:20:59 - INFO - __main__ - Step 7886: {'lr': 0.0004980518857747772, 'samples': 1514112, 'steps': 7885, 'loss/train': 1.6964260339736938} -11/06/2021 22:21:00 - INFO - __main__ - Step 7887: {'lr': 0.0004980512245191738, 'samples': 1514304, 'steps': 7886, 'loss/train': 2.2796289920806885} -11/06/2021 22:21:01 - INFO - __main__ - Step 7888: {'lr': 0.0004980505631518023, 'samples': 1514496, 'steps': 7887, 'loss/train': 1.9760662317276} -11/06/2021 22:21:01 - INFO - __main__ - Step 7889: {'lr': 0.0004980499016726632, 'samples': 1514688, 'steps': 7888, 'loss/train': 1.9461336135864258} -11/06/2021 22:21:01 - INFO - __main__ - Step 7890: {'lr': 0.0004980492400817564, 'samples': 1514880, 'steps': 7889, 'loss/train': 1.913292407989502} -11/06/2021 22:21:02 - INFO - __main__ - Step 7891: {'lr': 0.0004980485783790827, 'samples': 1515072, 'steps': 7890, 'loss/train': 1.8750466108322144} -11/06/2021 22:21:03 - INFO - __main__ - Step 7892: {'lr': 0.0004980479165646419, 'samples': 1515264, 'steps': 7891, 'loss/train': 2.3821234703063965} -11/06/2021 22:21:04 - INFO - __main__ - Step 7893: {'lr': 0.0004980472546384347, 'samples': 1515456, 'steps': 7892, 'loss/train': 2.1186270713806152} -11/06/2021 22:21:04 - INFO - __main__ - Step 7894: {'lr': 0.0004980465926004613, 'samples': 1515648, 'steps': 7893, 'loss/train': 5.3973493576049805} -11/06/2021 22:21:04 - INFO - __main__ - Step 7895: {'lr': 0.0004980459304507218, 'samples': 1515840, 'steps': 7894, 'loss/train': 2.0702314376831055} -11/06/2021 22:21:05 - INFO - __main__ - Step 7896: {'lr': 0.0004980452681892166, 'samples': 1516032, 'steps': 7895, 'loss/train': 2.7855825424194336} -11/06/2021 22:21:05 - INFO - __main__ - Step 7897: {'lr': 0.0004980446058159461, 'samples': 1516224, 'steps': 7896, 'loss/train': 2.5757217407226562} -11/06/2021 22:21:06 - INFO - __main__ - Step 7898: {'lr': 0.0004980439433309106, 'samples': 1516416, 'steps': 7897, 'loss/train': 1.7188911437988281} -11/06/2021 22:21:06 - INFO - __main__ - Step 7899: {'lr': 0.0004980432807341102, 'samples': 1516608, 'steps': 7898, 'loss/train': 1.881008267402649} -11/06/2021 22:21:07 - INFO - __main__ - Step 7900: {'lr': 0.0004980426180255453, 'samples': 1516800, 'steps': 7899, 'loss/train': 2.025660514831543} -11/06/2021 22:21:07 - INFO - __main__ - Step 7901: {'lr': 0.0004980419552052163, 'samples': 1516992, 'steps': 7900, 'loss/train': 1.8244693279266357} -11/06/2021 22:21:07 - INFO - __main__ - Step 7902: {'lr': 0.0004980412922731234, 'samples': 1517184, 'steps': 7901, 'loss/train': 2.084381103515625} -11/06/2021 22:21:09 - INFO - __main__ - Step 7903: {'lr': 0.0004980406292292669, 'samples': 1517376, 'steps': 7902, 'loss/train': 1.546284556388855} -11/06/2021 22:21:09 - INFO - __main__ - Step 7904: {'lr': 0.0004980399660736472, 'samples': 1517568, 'steps': 7903, 'loss/train': 1.5335673093795776} -11/06/2021 22:21:09 - INFO - __main__ - Step 7905: {'lr': 0.0004980393028062646, 'samples': 1517760, 'steps': 7904, 'loss/train': 2.310431480407715} -11/06/2021 22:21:10 - INFO - __main__ - Step 7906: {'lr': 0.0004980386394271191, 'samples': 1517952, 'steps': 7905, 'loss/train': 1.9592478275299072} -11/06/2021 22:21:10 - INFO - __main__ - Step 7907: {'lr': 0.0004980379759362113, 'samples': 1518144, 'steps': 7906, 'loss/train': 2.000092029571533} -11/06/2021 22:21:11 - INFO - __main__ - Step 7908: {'lr': 0.0004980373123335414, 'samples': 1518336, 'steps': 7907, 'loss/train': 2.0210494995117188} -11/06/2021 22:21:11 - INFO - __main__ - Step 7909: {'lr': 0.0004980366486191098, 'samples': 1518528, 'steps': 7908, 'loss/train': 1.597767949104309} -11/06/2021 22:21:12 - INFO - __main__ - Step 7910: {'lr': 0.0004980359847929167, 'samples': 1518720, 'steps': 7909, 'loss/train': 1.6900368928909302} -11/06/2021 22:21:12 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 2.016561508178711} -11/06/2021 22:21:12 - INFO - __main__ - Step 7912: {'lr': 0.0004980346568052471, 'samples': 1519104, 'steps': 7911, 'loss/train': 1.868909478187561} -11/06/2021 22:21:14 - INFO - __main__ - Step 7913: {'lr': 0.0004980339926437713, 'samples': 1519296, 'steps': 7912, 'loss/train': 1.8896089792251587} -11/06/2021 22:21:14 - INFO - __main__ - Step 7914: {'lr': 0.0004980333283705351, 'samples': 1519488, 'steps': 7913, 'loss/train': 1.9207043647766113} -11/06/2021 22:21:14 - INFO - __main__ - Step 7915: {'lr': 0.000498032663985539, 'samples': 1519680, 'steps': 7914, 'loss/train': 1.3756333589553833} -11/06/2021 22:21:15 - INFO - __main__ - Step 7916: {'lr': 0.0004980319994887833, 'samples': 1519872, 'steps': 7915, 'loss/train': 1.878954291343689} -11/06/2021 22:21:15 - INFO - __main__ - Step 7917: {'lr': 0.0004980313348802681, 'samples': 1520064, 'steps': 7916, 'loss/train': 2.100268602371216} -11/06/2021 22:21:15 - INFO - __main__ - Step 7918: {'lr': 0.0004980306701599938, 'samples': 1520256, 'steps': 7917, 'loss/train': 2.110107421875} -11/06/2021 22:21:17 - INFO - __main__ - Step 7919: {'lr': 0.0004980300053279607, 'samples': 1520448, 'steps': 7918, 'loss/train': 2.0678465366363525} -11/06/2021 22:21:17 - INFO - __main__ - Step 7920: {'lr': 0.0004980293403841693, 'samples': 1520640, 'steps': 7919, 'loss/train': 2.0250751972198486} -11/06/2021 22:21:17 - INFO - __main__ - Step 7921: {'lr': 0.0004980286753286195, 'samples': 1520832, 'steps': 7920, 'loss/train': 0.41942548751831055} -11/06/2021 22:21:18 - INFO - __main__ - Step 7922: {'lr': 0.0004980280101613119, 'samples': 1521024, 'steps': 7921, 'loss/train': 2.067695379257202} -11/06/2021 22:21:18 - INFO - __main__ - Step 7923: {'lr': 0.0004980273448822466, 'samples': 1521216, 'steps': 7922, 'loss/train': 1.7907764911651611} -11/06/2021 22:21:19 - INFO - __main__ - Step 7924: {'lr': 0.000498026679491424, 'samples': 1521408, 'steps': 7923, 'loss/train': 1.5925756692886353} -11/06/2021 22:21:20 - INFO - __main__ - Step 7925: {'lr': 0.0004980260139888445, 'samples': 1521600, 'steps': 7924, 'loss/train': 1.906895637512207} -11/06/2021 22:21:20 - INFO - __main__ - Step 7926: {'lr': 0.0004980253483745083, 'samples': 1521792, 'steps': 7925, 'loss/train': 1.7573232650756836} -11/06/2021 22:21:20 - INFO - __main__ - Step 7927: {'lr': 0.0004980246826484157, 'samples': 1521984, 'steps': 7926, 'loss/train': 1.8057146072387695} -11/06/2021 22:21:21 - INFO - __main__ - Step 7928: {'lr': 0.000498024016810567, 'samples': 1522176, 'steps': 7927, 'loss/train': 0.6858081221580505} -11/06/2021 22:21:22 - INFO - __main__ - Step 7929: {'lr': 0.0004980233508609625, 'samples': 1522368, 'steps': 7928, 'loss/train': 1.501013994216919} -11/06/2021 22:21:22 - INFO - __main__ - Step 7930: {'lr': 0.0004980226847996025, 'samples': 1522560, 'steps': 7929, 'loss/train': 1.761657476425171} -11/06/2021 22:21:23 - INFO - __main__ - Step 7931: {'lr': 0.0004980220186264874, 'samples': 1522752, 'steps': 7930, 'loss/train': 1.874160885810852} -11/06/2021 22:21:23 - INFO - __main__ - Step 7932: {'lr': 0.0004980213523416172, 'samples': 1522944, 'steps': 7931, 'loss/train': 2.012180805206299} -11/06/2021 22:21:23 - INFO - __main__ - Step 7933: {'lr': 0.0004980206859449926, 'samples': 1523136, 'steps': 7932, 'loss/train': 2.158865213394165} -11/06/2021 22:21:24 - INFO - __main__ - Step 7934: {'lr': 0.0004980200194366136, 'samples': 1523328, 'steps': 7933, 'loss/train': 1.6870510578155518} -11/06/2021 22:21:25 - INFO - __main__ - Step 7935: {'lr': 0.0004980193528164806, 'samples': 1523520, 'steps': 7934, 'loss/train': 1.3986356258392334} -11/06/2021 22:21:25 - INFO - __main__ - Step 7936: {'lr': 0.0004980186860845939, 'samples': 1523712, 'steps': 7935, 'loss/train': 2.1106855869293213} -11/06/2021 22:21:25 - INFO - __main__ - Step 7937: {'lr': 0.0004980180192409539, 'samples': 1523904, 'steps': 7936, 'loss/train': 1.40969979763031} -11/06/2021 22:21:26 - INFO - __main__ - Step 7938: {'lr': 0.0004980173522855608, 'samples': 1524096, 'steps': 7937, 'loss/train': 1.793459415435791} -11/06/2021 22:21:26 - INFO - __main__ - Step 7939: {'lr': 0.0004980166852184148, 'samples': 1524288, 'steps': 7938, 'loss/train': 1.5917954444885254} -11/06/2021 22:21:27 - INFO - __main__ - Step 7940: {'lr': 0.0004980160180395164, 'samples': 1524480, 'steps': 7939, 'loss/train': 1.0192344188690186} -11/06/2021 22:21:27 - INFO - __main__ - Step 7941: {'lr': 0.0004980153507488657, 'samples': 1524672, 'steps': 7940, 'loss/train': 1.7049601078033447} -11/06/2021 22:21:28 - INFO - __main__ - Step 7942: {'lr': 0.0004980146833464633, 'samples': 1524864, 'steps': 7941, 'loss/train': 1.757932424545288} -11/06/2021 22:21:28 - INFO - __main__ - Step 7943: {'lr': 0.0004980140158323092, 'samples': 1525056, 'steps': 7942, 'loss/train': 1.4568382501602173} -11/06/2021 22:21:29 - INFO - __main__ - Step 7944: {'lr': 0.0004980133482064038, 'samples': 1525248, 'steps': 7943, 'loss/train': 2.041997194290161} -11/06/2021 22:21:30 - INFO - __main__ - Step 7945: {'lr': 0.0004980126804687474, 'samples': 1525440, 'steps': 7944, 'loss/train': 1.5531878471374512} -11/06/2021 22:21:30 - INFO - __main__ - Step 7946: {'lr': 0.0004980120126193403, 'samples': 1525632, 'steps': 7945, 'loss/train': 1.8834867477416992} -11/06/2021 22:21:30 - INFO - __main__ - Step 7947: {'lr': 0.0004980113446581829, 'samples': 1525824, 'steps': 7946, 'loss/train': 1.9784860610961914} -11/06/2021 22:21:31 - INFO - __main__ - Step 7948: {'lr': 0.0004980106765852753, 'samples': 1526016, 'steps': 7947, 'loss/train': 1.549972653388977} -11/06/2021 22:21:31 - INFO - __main__ - Step 7949: {'lr': 0.0004980100084006181, 'samples': 1526208, 'steps': 7948, 'loss/train': 1.9199172258377075} -11/06/2021 22:21:32 - INFO - __main__ - Step 7950: {'lr': 0.0004980093401042113, 'samples': 1526400, 'steps': 7949, 'loss/train': 1.6837117671966553} -11/06/2021 22:21:32 - INFO - __main__ - Step 7951: {'lr': 0.0004980086716960552, 'samples': 1526592, 'steps': 7950, 'loss/train': 2.027440071105957} -11/06/2021 22:21:33 - INFO - __main__ - Step 7952: {'lr': 0.0004980080031761504, 'samples': 1526784, 'steps': 7951, 'loss/train': 1.549945592880249} -11/06/2021 22:21:33 - INFO - __main__ - Step 7953: {'lr': 0.000498007334544497, 'samples': 1526976, 'steps': 7952, 'loss/train': 2.5235583782196045} -11/06/2021 22:21:33 - INFO - __main__ - Step 7954: {'lr': 0.0004980066658010952, 'samples': 1527168, 'steps': 7953, 'loss/train': 1.8120335340499878} -11/06/2021 22:21:34 - INFO - __main__ - Step 7955: {'lr': 0.0004980059969459455, 'samples': 1527360, 'steps': 7954, 'loss/train': 1.7081891298294067} -11/06/2021 22:21:35 - INFO - __main__ - Step 7956: {'lr': 0.0004980053279790481, 'samples': 1527552, 'steps': 7955, 'loss/train': 1.0960886478424072} -11/06/2021 22:21:35 - INFO - __main__ - Step 7957: {'lr': 0.0004980046589004034, 'samples': 1527744, 'steps': 7956, 'loss/train': 1.416310429573059} -11/06/2021 22:21:35 - INFO - __main__ - Step 7958: {'lr': 0.0004980039897100115, 'samples': 1527936, 'steps': 7957, 'loss/train': 2.159583568572998} -11/06/2021 22:21:36 - INFO - __main__ - Step 7959: {'lr': 0.000498003320407873, 'samples': 1528128, 'steps': 7958, 'loss/train': 2.172380208969116} -11/06/2021 22:21:36 - INFO - __main__ - Step 7960: {'lr': 0.000498002650993988, 'samples': 1528320, 'steps': 7959, 'loss/train': 1.913335919380188} -11/06/2021 22:21:37 - INFO - __main__ - Step 7961: {'lr': 0.0004980019814683568, 'samples': 1528512, 'steps': 7960, 'loss/train': 1.8780403137207031} -11/06/2021 22:21:38 - INFO - __main__ - Step 7962: {'lr': 0.0004980013118309796, 'samples': 1528704, 'steps': 7961, 'loss/train': 1.8526026010513306} -11/06/2021 22:21:38 - INFO - __main__ - Step 7963: {'lr': 0.000498000642081857, 'samples': 1528896, 'steps': 7962, 'loss/train': 1.8182376623153687} -11/06/2021 22:21:38 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 1.9147931337356567} -11/06/2021 22:21:39 - INFO - __main__ - Step 7965: {'lr': 0.0004979993022483762, 'samples': 1529280, 'steps': 7964, 'loss/train': 1.8008043766021729} -11/06/2021 22:21:40 - INFO - __main__ - Step 7966: {'lr': 0.0004979986321640187, 'samples': 1529472, 'steps': 7965, 'loss/train': 1.427006483078003} -11/06/2021 22:21:40 - INFO - __main__ - Step 7967: {'lr': 0.0004979979619679168, 'samples': 1529664, 'steps': 7966, 'loss/train': 1.8842092752456665} -11/06/2021 22:21:41 - INFO - __main__ - Step 7968: {'lr': 0.0004979972916600708, 'samples': 1529856, 'steps': 7967, 'loss/train': 2.3407888412475586} -11/06/2021 22:21:41 - INFO - __main__ - Step 7969: {'lr': 0.0004979966212404812, 'samples': 1530048, 'steps': 7968, 'loss/train': 1.6167200803756714} -11/06/2021 22:21:41 - INFO - __main__ - Step 7970: {'lr': 0.0004979959507091479, 'samples': 1530240, 'steps': 7969, 'loss/train': 1.8462982177734375} -11/06/2021 22:21:42 - INFO - __main__ - Step 7971: {'lr': 0.0004979952800660717, 'samples': 1530432, 'steps': 7970, 'loss/train': 2.2095303535461426} -11/06/2021 22:21:43 - INFO - __main__ - Step 7972: {'lr': 0.0004979946093112525, 'samples': 1530624, 'steps': 7971, 'loss/train': 2.2119836807250977} -11/06/2021 22:21:44 - INFO - __main__ - Step 7973: {'lr': 0.0004979939384446908, 'samples': 1530816, 'steps': 7972, 'loss/train': 1.7757575511932373} -11/06/2021 22:21:44 - INFO - __main__ - Step 7974: {'lr': 0.0004979932674663869, 'samples': 1531008, 'steps': 7973, 'loss/train': 1.04556405544281} -11/06/2021 22:21:44 - INFO - __main__ - Step 7975: {'lr': 0.000497992596376341, 'samples': 1531200, 'steps': 7974, 'loss/train': 1.6081430912017822} -11/06/2021 22:21:45 - INFO - __main__ - Step 7976: {'lr': 0.0004979919251745535, 'samples': 1531392, 'steps': 7975, 'loss/train': 2.162876844406128} -11/06/2021 22:21:46 - INFO - __main__ - Step 7977: {'lr': 0.0004979912538610247, 'samples': 1531584, 'steps': 7976, 'loss/train': 1.4090156555175781} -11/06/2021 22:21:46 - INFO - __main__ - Step 7978: {'lr': 0.0004979905824357548, 'samples': 1531776, 'steps': 7977, 'loss/train': 1.850123405456543} -11/06/2021 22:21:46 - INFO - __main__ - Step 7979: {'lr': 0.0004979899108987442, 'samples': 1531968, 'steps': 7978, 'loss/train': 2.130842685699463} -11/06/2021 22:21:47 - INFO - __main__ - Step 7980: {'lr': 0.0004979892392499932, 'samples': 1532160, 'steps': 7979, 'loss/train': 1.864031434059143} -11/06/2021 22:21:47 - INFO - __main__ - Step 7981: {'lr': 0.0004979885674895021, 'samples': 1532352, 'steps': 7980, 'loss/train': 1.6603336334228516} -11/06/2021 22:21:48 - INFO - __main__ - Step 7982: {'lr': 0.0004979878956172711, 'samples': 1532544, 'steps': 7981, 'loss/train': 1.4955323934555054} -11/06/2021 22:21:48 - INFO - __main__ - Step 7983: {'lr': 0.0004979872236333005, 'samples': 1532736, 'steps': 7982, 'loss/train': 2.017420530319214} -11/06/2021 22:21:49 - INFO - __main__ - Step 7984: {'lr': 0.0004979865515375908, 'samples': 1532928, 'steps': 7983, 'loss/train': 1.8274989128112793} -11/06/2021 22:21:49 - INFO - __main__ - Step 7985: {'lr': 0.0004979858793301422, 'samples': 1533120, 'steps': 7984, 'loss/train': 1.6632914543151855} -11/06/2021 22:21:49 - INFO - __main__ - Step 7986: {'lr': 0.000497985207010955, 'samples': 1533312, 'steps': 7985, 'loss/train': 1.2843949794769287} -11/06/2021 22:21:50 - INFO - __main__ - Step 7987: {'lr': 0.0004979845345800294, 'samples': 1533504, 'steps': 7986, 'loss/train': 1.5527995824813843} -11/06/2021 22:21:51 - INFO - __main__ - Step 7988: {'lr': 0.0004979838620373659, 'samples': 1533696, 'steps': 7987, 'loss/train': 1.7927266359329224} -11/06/2021 22:21:52 - INFO - __main__ - Step 7989: {'lr': 0.0004979831893829646, 'samples': 1533888, 'steps': 7988, 'loss/train': 0.755244791507721} -11/06/2021 22:21:52 - INFO - __main__ - Step 7990: {'lr': 0.0004979825166168259, 'samples': 1534080, 'steps': 7989, 'loss/train': 1.9054588079452515} -11/06/2021 22:21:52 - INFO - __main__ - Step 7991: {'lr': 0.0004979818437389502, 'samples': 1534272, 'steps': 7990, 'loss/train': 1.586555004119873} -11/06/2021 22:21:53 - INFO - __main__ - Step 7992: {'lr': 0.0004979811707493377, 'samples': 1534464, 'steps': 7991, 'loss/train': 2.3696506023406982} -11/06/2021 22:21:53 - INFO - __main__ - Step 7993: {'lr': 0.0004979804976479887, 'samples': 1534656, 'steps': 7992, 'loss/train': 2.9696648120880127} -11/06/2021 22:21:54 - INFO - __main__ - Step 7994: {'lr': 0.0004979798244349034, 'samples': 1534848, 'steps': 7993, 'loss/train': 0.5555250644683838} -11/06/2021 22:21:54 - INFO - __main__ - Step 7995: {'lr': 0.0004979791511100823, 'samples': 1535040, 'steps': 7994, 'loss/train': 2.1885805130004883} -11/06/2021 22:21:55 - INFO - __main__ - Step 7996: {'lr': 0.0004979784776735257, 'samples': 1535232, 'steps': 7995, 'loss/train': 2.107032060623169} -11/06/2021 22:21:55 - INFO - __main__ - Step 7997: {'lr': 0.0004979778041252338, 'samples': 1535424, 'steps': 7996, 'loss/train': 1.827415943145752} -11/06/2021 22:21:55 - INFO - __main__ - Step 7998: {'lr': 0.0004979771304652068, 'samples': 1535616, 'steps': 7997, 'loss/train': 1.842453122138977} -11/06/2021 22:21:56 - INFO - __main__ - Step 7999: {'lr': 0.0004979764566934452, 'samples': 1535808, 'steps': 7998, 'loss/train': 1.6808557510375977} -11/06/2021 22:21:57 - INFO - __main__ - Step 8000: {'lr': 0.0004979757828099492, 'samples': 1536000, 'steps': 7999, 'loss/train': 1.729453206062317} -11/06/2021 22:21:57 - INFO - __main__ - Step 8001: {'lr': 0.0004979751088147192, 'samples': 1536192, 'steps': 8000, 'loss/train': 1.9405218362808228} -11/06/2021 22:21:58 - INFO - __main__ - Step 8002: {'lr': 0.0004979744347077555, 'samples': 1536384, 'steps': 8001, 'loss/train': 1.666454553604126} -11/06/2021 22:21:58 - INFO - __main__ - Step 8003: {'lr': 0.0004979737604890582, 'samples': 1536576, 'steps': 8002, 'loss/train': 2.0916402339935303} -11/06/2021 22:22:00 - INFO - __main__ - Step 8004: {'lr': 0.0004979730861586278, 'samples': 1536768, 'steps': 8003, 'loss/train': 2.936959743499756} -11/06/2021 22:22:00 - INFO - __main__ - Step 8005: {'lr': 0.0004979724117164646, 'samples': 1536960, 'steps': 8004, 'loss/train': 2.1846797466278076} -11/06/2021 22:22:00 - INFO - __main__ - Step 8006: {'lr': 0.0004979717371625689, 'samples': 1537152, 'steps': 8005, 'loss/train': 1.4431344270706177} -11/06/2021 22:22:01 - INFO - __main__ - Step 8007: {'lr': 0.0004979710624969408, 'samples': 1537344, 'steps': 8006, 'loss/train': 1.6920371055603027} -11/06/2021 22:22:01 - INFO - __main__ - Step 8008: {'lr': 0.000497970387719581, 'samples': 1537536, 'steps': 8007, 'loss/train': 1.7911888360977173} -11/06/2021 22:22:01 - INFO - __main__ - Step 8009: {'lr': 0.0004979697128304893, 'samples': 1537728, 'steps': 8008, 'loss/train': 2.065598249435425} -11/06/2021 22:22:02 - INFO - __main__ - Step 8010: {'lr': 0.0004979690378296665, 'samples': 1537920, 'steps': 8009, 'loss/train': 1.9170726537704468} -11/06/2021 22:22:02 - INFO - __main__ - Step 8011: {'lr': 0.0004979683627171125, 'samples': 1538112, 'steps': 8010, 'loss/train': 2.038038730621338} -11/06/2021 22:22:03 - INFO - __main__ - Step 8012: {'lr': 0.0004979676874928278, 'samples': 1538304, 'steps': 8011, 'loss/train': 1.8985741138458252} -11/06/2021 22:22:04 - INFO - __main__ - Step 8013: {'lr': 0.0004979670121568129, 'samples': 1538496, 'steps': 8012, 'loss/train': 2.169818878173828} -11/06/2021 22:22:04 - INFO - __main__ - Step 8014: {'lr': 0.0004979663367090676, 'samples': 1538688, 'steps': 8013, 'loss/train': 2.037712335586548} -11/06/2021 22:22:04 - INFO - __main__ - Step 8015: {'lr': 0.0004979656611495927, 'samples': 1538880, 'steps': 8014, 'loss/train': 2.2237470149993896} -11/06/2021 22:22:05 - INFO - __main__ - Step 8016: {'lr': 0.0004979649854783883, 'samples': 1539072, 'steps': 8015, 'loss/train': 1.822688341140747} -11/06/2021 22:22:06 - INFO - __main__ - Step 8017: {'lr': 0.0004979643096954545, 'samples': 1539264, 'steps': 8016, 'loss/train': 2.502737283706665} -11/06/2021 22:22:06 - INFO - __main__ - Step 8018: {'lr': 0.000497963633800792, 'samples': 1539456, 'steps': 8017, 'loss/train': 1.937386393547058} -11/06/2021 22:22:06 - INFO - __main__ - Step 8019: {'lr': 0.0004979629577944009, 'samples': 1539648, 'steps': 8018, 'loss/train': 1.8304017782211304} -11/06/2021 22:22:07 - INFO - __main__ - Step 8020: {'lr': 0.0004979622816762815, 'samples': 1539840, 'steps': 8019, 'loss/train': 2.0212595462799072} -11/06/2021 22:22:07 - INFO - __main__ - Step 8021: {'lr': 0.0004979616054464341, 'samples': 1540032, 'steps': 8020, 'loss/train': 1.852665662765503} -11/06/2021 22:22:08 - INFO - __main__ - Step 8022: {'lr': 0.000497960929104859, 'samples': 1540224, 'steps': 8021, 'loss/train': 2.02396821975708} -11/06/2021 22:22:08 - INFO - __main__ - Step 8023: {'lr': 0.0004979602526515566, 'samples': 1540416, 'steps': 8022, 'loss/train': 2.089334726333618} -11/06/2021 22:22:09 - INFO - __main__ - Step 8024: {'lr': 0.0004979595760865271, 'samples': 1540608, 'steps': 8023, 'loss/train': 1.602588176727295} -11/06/2021 22:22:09 - INFO - __main__ - Step 8025: {'lr': 0.0004979588994097708, 'samples': 1540800, 'steps': 8024, 'loss/train': 1.3973878622055054} -11/06/2021 22:22:09 - INFO - __main__ - Step 8026: {'lr': 0.0004979582226212881, 'samples': 1540992, 'steps': 8025, 'loss/train': 1.1899759769439697} -11/06/2021 22:22:10 - INFO - __main__ - Step 8027: {'lr': 0.0004979575457210792, 'samples': 1541184, 'steps': 8026, 'loss/train': 1.6932975053787231} -11/06/2021 22:22:11 - INFO - __main__ - Step 8028: {'lr': 0.0004979568687091446, 'samples': 1541376, 'steps': 8027, 'loss/train': 1.7348906993865967} -11/06/2021 22:22:11 - INFO - __main__ - Step 8029: {'lr': 0.0004979561915854843, 'samples': 1541568, 'steps': 8028, 'loss/train': 1.5938066244125366} -11/06/2021 22:22:12 - INFO - __main__ - Step 8030: {'lr': 0.0004979555143500988, 'samples': 1541760, 'steps': 8029, 'loss/train': 2.0716259479522705} -11/06/2021 22:22:12 - INFO - __main__ - Step 8031: {'lr': 0.0004979548370029884, 'samples': 1541952, 'steps': 8030, 'loss/train': 1.7080976963043213} -11/06/2021 22:22:12 - INFO - __main__ - Step 8032: {'lr': 0.0004979541595441534, 'samples': 1542144, 'steps': 8031, 'loss/train': 1.9131830930709839} -11/06/2021 22:22:13 - INFO - __main__ - Step 8033: {'lr': 0.000497953481973594, 'samples': 1542336, 'steps': 8032, 'loss/train': 1.6197700500488281} -11/06/2021 22:22:14 - INFO - __main__ - Step 8034: {'lr': 0.0004979528042913106, 'samples': 1542528, 'steps': 8033, 'loss/train': 1.7297489643096924} -11/06/2021 22:22:14 - INFO - __main__ - Step 8035: {'lr': 0.0004979521264973036, 'samples': 1542720, 'steps': 8034, 'loss/train': 2.004364490509033} -11/06/2021 22:22:14 - INFO - __main__ - Step 8036: {'lr': 0.0004979514485915731, 'samples': 1542912, 'steps': 8035, 'loss/train': 1.4310439825057983} -11/06/2021 22:22:15 - INFO - __main__ - Step 8037: {'lr': 0.0004979507705741195, 'samples': 1543104, 'steps': 8036, 'loss/train': 1.9910510778427124} -11/06/2021 22:22:16 - INFO - __main__ - Step 8038: {'lr': 0.0004979500924449431, 'samples': 1543296, 'steps': 8037, 'loss/train': 1.46047043800354} -11/06/2021 22:22:16 - INFO - __main__ - Step 8039: {'lr': 0.0004979494142040444, 'samples': 1543488, 'steps': 8038, 'loss/train': 1.9380624294281006} -11/06/2021 22:22:16 - INFO - __main__ - Step 8040: {'lr': 0.0004979487358514233, 'samples': 1543680, 'steps': 8039, 'loss/train': 1.9118831157684326} -11/06/2021 22:22:17 - INFO - __main__ - Step 8041: {'lr': 0.0004979480573870803, 'samples': 1543872, 'steps': 8040, 'loss/train': 1.2592707872390747} -11/06/2021 22:22:17 - INFO - __main__ - Step 8042: {'lr': 0.000497947378811016, 'samples': 1544064, 'steps': 8041, 'loss/train': 2.1490068435668945} -11/06/2021 22:22:18 - INFO - __main__ - Step 8043: {'lr': 0.0004979467001232302, 'samples': 1544256, 'steps': 8042, 'loss/train': 1.6307603120803833} -11/06/2021 22:22:18 - INFO - __main__ - Step 8044: {'lr': 0.0004979460213237235, 'samples': 1544448, 'steps': 8043, 'loss/train': 1.8183969259262085} -11/06/2021 22:22:19 - INFO - __main__ - Step 8045: {'lr': 0.0004979453424124961, 'samples': 1544640, 'steps': 8044, 'loss/train': 1.2424389123916626} -11/06/2021 22:22:19 - INFO - __main__ - Step 8046: {'lr': 0.0004979446633895484, 'samples': 1544832, 'steps': 8045, 'loss/train': 1.352750301361084} -11/06/2021 22:22:20 - INFO - __main__ - Step 8047: {'lr': 0.0004979439842548808, 'samples': 1545024, 'steps': 8046, 'loss/train': 1.8693174123764038} -11/06/2021 22:22:20 - INFO - __main__ - Step 8048: {'lr': 0.0004979433050084933, 'samples': 1545216, 'steps': 8047, 'loss/train': 1.2310196161270142} -11/06/2021 22:22:21 - INFO - __main__ - Step 8049: {'lr': 0.0004979426256503863, 'samples': 1545408, 'steps': 8048, 'loss/train': 2.2753522396087646} -11/06/2021 22:22:21 - INFO - __main__ - Step 8050: {'lr': 0.0004979419461805603, 'samples': 1545600, 'steps': 8049, 'loss/train': 2.1069955825805664} -11/06/2021 22:22:22 - INFO - __main__ - Step 8051: {'lr': 0.0004979412665990156, 'samples': 1545792, 'steps': 8050, 'loss/train': 1.705078125} -11/06/2021 22:22:22 - INFO - __main__ - Step 8052: {'lr': 0.0004979405869057522, 'samples': 1545984, 'steps': 8051, 'loss/train': 1.9316350221633911} -11/06/2021 22:22:23 - INFO - __main__ - Step 8053: {'lr': 0.0004979399071007707, 'samples': 1546176, 'steps': 8052, 'loss/train': 2.099993944168091} -11/06/2021 22:22:23 - INFO - __main__ - Step 8054: {'lr': 0.0004979392271840712, 'samples': 1546368, 'steps': 8053, 'loss/train': 1.937470555305481} -11/06/2021 22:22:24 - INFO - __main__ - Step 8055: {'lr': 0.0004979385471556542, 'samples': 1546560, 'steps': 8054, 'loss/train': 2.03237247467041} -11/06/2021 22:22:24 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.7011387348175049} -11/06/2021 22:22:24 - INFO - __main__ - Step 8057: {'lr': 0.0004979371867636687, 'samples': 1546944, 'steps': 8056, 'loss/train': 1.647082805633545} -11/06/2021 22:22:25 - INFO - __main__ - Step 8058: {'lr': 0.0004979365064001007, 'samples': 1547136, 'steps': 8057, 'loss/train': 1.8520019054412842} -11/06/2021 22:22:26 - INFO - __main__ - Step 8059: {'lr': 0.0004979358259248164, 'samples': 1547328, 'steps': 8058, 'loss/train': 1.324270486831665} -11/06/2021 22:22:26 - INFO - __main__ - Step 8060: {'lr': 0.000497935145337816, 'samples': 1547520, 'steps': 8059, 'loss/train': 1.6463035345077515} -11/06/2021 22:22:27 - INFO - __main__ - Step 8061: {'lr': 0.0004979344646390999, 'samples': 1547712, 'steps': 8060, 'loss/train': 2.0036861896514893} -11/06/2021 22:22:27 - INFO - __main__ - Step 8062: {'lr': 0.0004979337838286684, 'samples': 1547904, 'steps': 8061, 'loss/train': 1.1817820072174072} -11/06/2021 22:22:27 - INFO - __main__ - Step 8063: {'lr': 0.0004979331029065216, 'samples': 1548096, 'steps': 8062, 'loss/train': 1.7082180976867676} -11/06/2021 22:22:28 - INFO - __main__ - Step 8064: {'lr': 0.00049793242187266, 'samples': 1548288, 'steps': 8063, 'loss/train': 1.778818964958191} -11/06/2021 22:22:29 - INFO - __main__ - Step 8065: {'lr': 0.000497931740727084, 'samples': 1548480, 'steps': 8064, 'loss/train': 6.108870983123779} -11/06/2021 22:22:29 - INFO - __main__ - Step 8066: {'lr': 0.0004979310594697937, 'samples': 1548672, 'steps': 8065, 'loss/train': 2.9927406311035156} -11/06/2021 22:22:30 - INFO - __main__ - Step 8067: {'lr': 0.0004979303781007896, 'samples': 1548864, 'steps': 8066, 'loss/train': 1.902443528175354} -11/06/2021 22:22:30 - INFO - __main__ - Step 8068: {'lr': 0.0004979296966200718, 'samples': 1549056, 'steps': 8067, 'loss/train': 1.7086400985717773} -11/06/2021 22:22:30 - INFO - __main__ - Step 8069: {'lr': 0.0004979290150276407, 'samples': 1549248, 'steps': 8068, 'loss/train': 1.9971203804016113} -11/06/2021 22:22:31 - INFO - __main__ - Step 8070: {'lr': 0.0004979283333234966, 'samples': 1549440, 'steps': 8069, 'loss/train': 1.9657219648361206} -11/06/2021 22:22:32 - INFO - __main__ - Step 8071: {'lr': 0.0004979276515076399, 'samples': 1549632, 'steps': 8070, 'loss/train': 1.041121482849121} -11/06/2021 22:22:32 - INFO - __main__ - Step 8072: {'lr': 0.0004979269695800707, 'samples': 1549824, 'steps': 8071, 'loss/train': 2.119021415710449} -11/06/2021 22:22:32 - INFO - __main__ - Step 8073: {'lr': 0.0004979262875407896, 'samples': 1550016, 'steps': 8072, 'loss/train': 1.3283685445785522} -11/06/2021 22:22:33 - INFO - __main__ - Step 8074: {'lr': 0.0004979256053897966, 'samples': 1550208, 'steps': 8073, 'loss/train': 2.044589042663574} -11/06/2021 22:22:35 - INFO - __main__ - Step 8075: {'lr': 0.0004979249231270923, 'samples': 1550400, 'steps': 8074, 'loss/train': 1.9413076639175415} -11/06/2021 22:22:35 - INFO - __main__ - Step 8076: {'lr': 0.0004979242407526766, 'samples': 1550592, 'steps': 8075, 'loss/train': 1.5758004188537598} -11/06/2021 22:22:35 - INFO - __main__ - Step 8077: {'lr': 0.0004979235582665503, 'samples': 1550784, 'steps': 8076, 'loss/train': 2.4612207412719727} -11/06/2021 22:22:36 - INFO - __main__ - Step 8078: {'lr': 0.0004979228756687135, 'samples': 1550976, 'steps': 8077, 'loss/train': 2.0157461166381836} -11/06/2021 22:22:36 - INFO - __main__ - Step 8079: {'lr': 0.0004979221929591663, 'samples': 1551168, 'steps': 8078, 'loss/train': 2.025535821914673} -11/06/2021 22:22:36 - INFO - __main__ - Step 8080: {'lr': 0.0004979215101379093, 'samples': 1551360, 'steps': 8079, 'loss/train': 1.8989232778549194} -11/06/2021 22:22:37 - INFO - __main__ - Step 8081: {'lr': 0.0004979208272049426, 'samples': 1551552, 'steps': 8080, 'loss/train': 1.8116631507873535} -11/06/2021 22:22:37 - INFO - __main__ - Step 8082: {'lr': 0.0004979201441602665, 'samples': 1551744, 'steps': 8081, 'loss/train': 1.6327272653579712} -11/06/2021 22:22:38 - INFO - __main__ - Step 8083: {'lr': 0.0004979194610038816, 'samples': 1551936, 'steps': 8082, 'loss/train': 2.1452510356903076} -11/06/2021 22:22:39 - INFO - __main__ - Step 8084: {'lr': 0.000497918777735788, 'samples': 1552128, 'steps': 8083, 'loss/train': 1.8749728202819824} -11/06/2021 22:22:39 - INFO - __main__ - Step 8085: {'lr': 0.000497918094355986, 'samples': 1552320, 'steps': 8084, 'loss/train': 1.904146671295166} -11/06/2021 22:22:39 - INFO - __main__ - Step 8086: {'lr': 0.000497917410864476, 'samples': 1552512, 'steps': 8085, 'loss/train': 1.7037712335586548} -11/06/2021 22:22:40 - INFO - __main__ - Step 8087: {'lr': 0.0004979167272612581, 'samples': 1552704, 'steps': 8086, 'loss/train': 1.7576018571853638} -11/06/2021 22:22:41 - INFO - __main__ - Step 8088: {'lr': 0.0004979160435463328, 'samples': 1552896, 'steps': 8087, 'loss/train': 1.7359386682510376} -11/06/2021 22:22:41 - INFO - __main__ - Step 8089: {'lr': 0.0004979153597197003, 'samples': 1553088, 'steps': 8088, 'loss/train': 1.035143256187439} -11/06/2021 22:22:41 - INFO - __main__ - Step 8090: {'lr': 0.0004979146757813611, 'samples': 1553280, 'steps': 8089, 'loss/train': 1.9019252061843872} -11/06/2021 22:22:42 - INFO - __main__ - Step 8091: {'lr': 0.0004979139917313153, 'samples': 1553472, 'steps': 8090, 'loss/train': 1.6100707054138184} -11/06/2021 22:22:42 - INFO - __main__ - Step 8092: {'lr': 0.0004979133075695634, 'samples': 1553664, 'steps': 8091, 'loss/train': 1.4543089866638184} -11/06/2021 22:22:43 - INFO - __main__ - Step 8093: {'lr': 0.0004979126232961054, 'samples': 1553856, 'steps': 8092, 'loss/train': 1.6169660091400146} -11/06/2021 22:22:43 - INFO - __main__ - Step 8094: {'lr': 0.0004979119389109419, 'samples': 1554048, 'steps': 8093, 'loss/train': 1.693862795829773} -11/06/2021 22:22:44 - INFO - __main__ - Step 8095: {'lr': 0.000497911254414073, 'samples': 1554240, 'steps': 8094, 'loss/train': 1.6328054666519165} -11/06/2021 22:22:44 - INFO - __main__ - Step 8096: {'lr': 0.0004979105698054992, 'samples': 1554432, 'steps': 8095, 'loss/train': 2.0879011154174805} -11/06/2021 22:22:44 - INFO - __main__ - Step 8097: {'lr': 0.0004979098850852208, 'samples': 1554624, 'steps': 8096, 'loss/train': 1.8429865837097168} -11/06/2021 22:22:46 - INFO - __main__ - Step 8098: {'lr': 0.0004979092002532379, 'samples': 1554816, 'steps': 8097, 'loss/train': 2.1915647983551025} -11/06/2021 22:22:46 - INFO - __main__ - Step 8099: {'lr': 0.0004979085153095509, 'samples': 1555008, 'steps': 8098, 'loss/train': 2.256697177886963} -11/06/2021 22:22:46 - INFO - __main__ - Step 8100: {'lr': 0.0004979078302541604, 'samples': 1555200, 'steps': 8099, 'loss/train': 1.6514664888381958} -11/06/2021 22:22:47 - INFO - __main__ - Step 8101: {'lr': 0.0004979071450870662, 'samples': 1555392, 'steps': 8100, 'loss/train': 1.7830842733383179} -11/06/2021 22:22:47 - INFO - __main__ - Step 8102: {'lr': 0.0004979064598082689, 'samples': 1555584, 'steps': 8101, 'loss/train': 2.325873851776123} -11/06/2021 22:22:48 - INFO - __main__ - Step 8103: {'lr': 0.0004979057744177689, 'samples': 1555776, 'steps': 8102, 'loss/train': 1.6292482614517212} -11/06/2021 22:22:48 - INFO - __main__ - Step 8104: {'lr': 0.0004979050889155663, 'samples': 1555968, 'steps': 8103, 'loss/train': 1.9589861631393433} -11/06/2021 22:22:49 - INFO - __main__ - Step 8105: {'lr': 0.0004979044033016616, 'samples': 1556160, 'steps': 8104, 'loss/train': 1.5695750713348389} -11/06/2021 22:22:49 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 2.045214891433716} -11/06/2021 22:22:49 - INFO - __main__ - Step 8107: {'lr': 0.0004979030317387466, 'samples': 1556544, 'steps': 8106, 'loss/train': 2.292895555496216} -11/06/2021 22:22:50 - INFO - __main__ - Step 8108: {'lr': 0.0004979023457897371, 'samples': 1556736, 'steps': 8107, 'loss/train': 2.0541205406188965} -11/06/2021 22:22:51 - INFO - __main__ - Step 8109: {'lr': 0.0004979016597290264, 'samples': 1556928, 'steps': 8108, 'loss/train': 2.090756893157959} -11/06/2021 22:22:51 - INFO - __main__ - Step 8110: {'lr': 0.0004979009735566152, 'samples': 1557120, 'steps': 8109, 'loss/train': 1.956437110900879} -11/06/2021 22:22:51 - INFO - __main__ - Step 8111: {'lr': 0.0004979002872725037, 'samples': 1557312, 'steps': 8110, 'loss/train': 0.9265539050102234} -11/06/2021 22:22:52 - INFO - __main__ - Step 8112: {'lr': 0.0004978996008766922, 'samples': 1557504, 'steps': 8111, 'loss/train': 1.8253365755081177} -11/06/2021 22:22:53 - INFO - __main__ - Step 8113: {'lr': 0.0004978989143691808, 'samples': 1557696, 'steps': 8112, 'loss/train': 2.0821549892425537} -11/06/2021 22:22:54 - INFO - __main__ - Step 8114: {'lr': 0.00049789822774997, 'samples': 1557888, 'steps': 8113, 'loss/train': 1.468117356300354} -11/06/2021 22:22:54 - INFO - __main__ - Step 8115: {'lr': 0.0004978975410190601, 'samples': 1558080, 'steps': 8114, 'loss/train': 2.1024975776672363} -11/06/2021 22:22:54 - INFO - __main__ - Step 8116: {'lr': 0.0004978968541764515, 'samples': 1558272, 'steps': 8115, 'loss/train': 2.9898436069488525} -11/06/2021 22:22:55 - INFO - __main__ - Step 8117: {'lr': 0.0004978961672221444, 'samples': 1558464, 'steps': 8116, 'loss/train': 2.3070497512817383} -11/06/2021 22:22:55 - INFO - __main__ - Step 8118: {'lr': 0.000497895480156139, 'samples': 1558656, 'steps': 8117, 'loss/train': 1.9509214162826538} -11/06/2021 22:22:56 - INFO - __main__ - Step 8119: {'lr': 0.0004978947929784358, 'samples': 1558848, 'steps': 8118, 'loss/train': 1.3840776681900024} -11/06/2021 22:22:57 - INFO - __main__ - Step 8120: {'lr': 0.0004978941056890349, 'samples': 1559040, 'steps': 8119, 'loss/train': 1.7440425157546997} -11/06/2021 22:22:57 - INFO - __main__ - Step 8121: {'lr': 0.0004978934182879369, 'samples': 1559232, 'steps': 8120, 'loss/train': 1.8195523023605347} -11/06/2021 22:22:57 - INFO - __main__ - Step 8122: {'lr': 0.0004978927307751419, 'samples': 1559424, 'steps': 8121, 'loss/train': 1.3453588485717773} -11/06/2021 22:22:58 - INFO - __main__ - Step 8123: {'lr': 0.0004978920431506501, 'samples': 1559616, 'steps': 8122, 'loss/train': 1.8378467559814453} -11/06/2021 22:22:58 - INFO - __main__ - Step 8124: {'lr': 0.0004978913554144623, 'samples': 1559808, 'steps': 8123, 'loss/train': 2.123873472213745} -11/06/2021 22:22:59 - INFO - __main__ - Step 8125: {'lr': 0.0004978906675665782, 'samples': 1560000, 'steps': 8124, 'loss/train': 2.085545063018799} -11/06/2021 22:22:59 - INFO - __main__ - Step 8126: {'lr': 0.0004978899796069985, 'samples': 1560192, 'steps': 8125, 'loss/train': 1.9374345541000366} -11/06/2021 22:23:00 - INFO - __main__ - Step 8127: {'lr': 0.0004978892915357234, 'samples': 1560384, 'steps': 8126, 'loss/train': 2.0188064575195312} -11/06/2021 22:23:00 - INFO - __main__ - Step 8128: {'lr': 0.0004978886033527532, 'samples': 1560576, 'steps': 8127, 'loss/train': 2.549909830093384} -11/06/2021 22:23:00 - INFO - __main__ - Step 8129: {'lr': 0.0004978879150580882, 'samples': 1560768, 'steps': 8128, 'loss/train': 1.8509951829910278} -11/06/2021 22:23:01 - INFO - __main__ - Step 8130: {'lr': 0.0004978872266517288, 'samples': 1560960, 'steps': 8129, 'loss/train': 1.873234748840332} -11/06/2021 22:23:02 - INFO - __main__ - Step 8131: {'lr': 0.0004978865381336752, 'samples': 1561152, 'steps': 8130, 'loss/train': 1.8826571702957153} -11/06/2021 22:23:03 - INFO - __main__ - Step 8132: {'lr': 0.0004978858495039277, 'samples': 1561344, 'steps': 8131, 'loss/train': 1.34197998046875} -11/06/2021 22:23:03 - INFO - __main__ - Step 8133: {'lr': 0.0004978851607624867, 'samples': 1561536, 'steps': 8132, 'loss/train': 3.694458484649658} -11/06/2021 22:23:03 - INFO - __main__ - Step 8134: {'lr': 0.0004978844719093525, 'samples': 1561728, 'steps': 8133, 'loss/train': 2.0985944271087646} -11/06/2021 22:23:04 - INFO - __main__ - Step 8135: {'lr': 0.0004978837829445254, 'samples': 1561920, 'steps': 8134, 'loss/train': 1.7875434160232544} -11/06/2021 22:23:04 - INFO - __main__ - Step 8136: {'lr': 0.0004978830938680056, 'samples': 1562112, 'steps': 8135, 'loss/train': 1.9818612337112427} -11/06/2021 22:23:05 - INFO - __main__ - Step 8137: {'lr': 0.0004978824046797935, 'samples': 1562304, 'steps': 8136, 'loss/train': 2.647218942642212} -11/06/2021 22:23:05 - INFO - __main__ - Step 8138: {'lr': 0.0004978817153798895, 'samples': 1562496, 'steps': 8137, 'loss/train': 1.852639079093933} -11/06/2021 22:23:06 - INFO - __main__ - Step 8139: {'lr': 0.0004978810259682939, 'samples': 1562688, 'steps': 8138, 'loss/train': 1.697789192199707} -11/06/2021 22:23:06 - INFO - __main__ - Step 8140: {'lr': 0.0004978803364450068, 'samples': 1562880, 'steps': 8139, 'loss/train': 1.768872618675232} -11/06/2021 22:23:06 - INFO - __main__ - Step 8141: {'lr': 0.0004978796468100286, 'samples': 1563072, 'steps': 8140, 'loss/train': 1.7271705865859985} -11/06/2021 22:23:07 - INFO - __main__ - Step 8142: {'lr': 0.0004978789570633598, 'samples': 1563264, 'steps': 8141, 'loss/train': 2.176313638687134} -11/06/2021 22:23:08 - INFO - __main__ - Step 8143: {'lr': 0.0004978782672050004, 'samples': 1563456, 'steps': 8142, 'loss/train': 2.180102586746216} -11/06/2021 22:23:08 - INFO - __main__ - Step 8144: {'lr': 0.000497877577234951, 'samples': 1563648, 'steps': 8143, 'loss/train': 2.109963893890381} -11/06/2021 22:23:08 - INFO - __main__ - Step 8145: {'lr': 0.0004978768871532117, 'samples': 1563840, 'steps': 8144, 'loss/train': 2.1114203929901123} -11/06/2021 22:23:09 - INFO - __main__ - Step 8146: {'lr': 0.0004978761969597831, 'samples': 1564032, 'steps': 8145, 'loss/train': 2.357698917388916} -11/06/2021 22:23:09 - INFO - __main__ - Step 8147: {'lr': 0.0004978755066546651, 'samples': 1564224, 'steps': 8146, 'loss/train': 1.9668238162994385} -11/06/2021 22:23:10 - INFO - __main__ - Step 8148: {'lr': 0.0004978748162378583, 'samples': 1564416, 'steps': 8147, 'loss/train': 1.837101936340332} -11/06/2021 22:23:11 - INFO - __main__ - Step 8149: {'lr': 0.0004978741257093629, 'samples': 1564608, 'steps': 8148, 'loss/train': 2.2903544902801514} -11/06/2021 22:23:11 - INFO - __main__ - Step 8150: {'lr': 0.0004978734350691793, 'samples': 1564800, 'steps': 8149, 'loss/train': 1.4162994623184204} -11/06/2021 22:23:11 - INFO - __main__ - Step 8151: {'lr': 0.0004978727443173077, 'samples': 1564992, 'steps': 8150, 'loss/train': 1.6277093887329102} -11/06/2021 22:23:12 - INFO - __main__ - Step 8152: {'lr': 0.0004978720534537485, 'samples': 1565184, 'steps': 8151, 'loss/train': 1.715814471244812} -11/06/2021 22:23:13 - INFO - __main__ - Step 8153: {'lr': 0.000497871362478502, 'samples': 1565376, 'steps': 8152, 'loss/train': 1.4183335304260254} -11/06/2021 22:23:13 - INFO - __main__ - Step 8154: {'lr': 0.0004978706713915684, 'samples': 1565568, 'steps': 8153, 'loss/train': 1.7779927253723145} -11/06/2021 22:23:13 - INFO - __main__ - Step 8155: {'lr': 0.0004978699801929481, 'samples': 1565760, 'steps': 8154, 'loss/train': 1.3929790258407593} -11/06/2021 22:23:14 - INFO - __main__ - Step 8156: {'lr': 0.0004978692888826415, 'samples': 1565952, 'steps': 8155, 'loss/train': 1.6693589687347412} -11/06/2021 22:23:14 - INFO - __main__ - Step 8157: {'lr': 0.0004978685974606488, 'samples': 1566144, 'steps': 8156, 'loss/train': 1.4203959703445435} -11/06/2021 22:23:15 - INFO - __main__ - Step 8158: {'lr': 0.0004978679059269704, 'samples': 1566336, 'steps': 8157, 'loss/train': 1.9157639741897583} -11/06/2021 22:23:16 - INFO - __main__ - Step 8159: {'lr': 0.0004978672142816064, 'samples': 1566528, 'steps': 8158, 'loss/train': 1.5440396070480347} -11/06/2021 22:23:16 - INFO - __main__ - Step 8160: {'lr': 0.0004978665225245573, 'samples': 1566720, 'steps': 8159, 'loss/train': 1.5769977569580078} -11/06/2021 22:23:16 - INFO - __main__ - Step 8161: {'lr': 0.0004978658306558234, 'samples': 1566912, 'steps': 8160, 'loss/train': 1.9604636430740356} -11/06/2021 22:23:17 - INFO - __main__ - Step 8162: {'lr': 0.000497865138675405, 'samples': 1567104, 'steps': 8161, 'loss/train': 1.6201629638671875} -11/06/2021 22:23:18 - INFO - __main__ - Step 8163: {'lr': 0.0004978644465833024, 'samples': 1567296, 'steps': 8162, 'loss/train': 1.5474094152450562} -11/06/2021 22:23:18 - INFO - __main__ - Step 8164: {'lr': 0.000497863754379516, 'samples': 1567488, 'steps': 8163, 'loss/train': 2.2988481521606445} -11/06/2021 22:23:18 - INFO - __main__ - Step 8165: {'lr': 0.0004978630620640458, 'samples': 1567680, 'steps': 8164, 'loss/train': 1.2239776849746704} -11/06/2021 22:23:19 - INFO - __main__ - Step 8166: {'lr': 0.0004978623696368924, 'samples': 1567872, 'steps': 8165, 'loss/train': 1.8691977262496948} -11/06/2021 22:23:19 - INFO - __main__ - Step 8167: {'lr': 0.0004978616770980561, 'samples': 1568064, 'steps': 8166, 'loss/train': 1.9919401407241821} -11/06/2021 22:23:19 - INFO - __main__ - Step 8168: {'lr': 0.0004978609844475371, 'samples': 1568256, 'steps': 8167, 'loss/train': 2.040534257888794} -11/06/2021 22:23:21 - INFO - __main__ - Step 8169: {'lr': 0.0004978602916853359, 'samples': 1568448, 'steps': 8168, 'loss/train': 1.9862347841262817} -11/06/2021 22:23:21 - INFO - __main__ - Step 8170: {'lr': 0.0004978595988114525, 'samples': 1568640, 'steps': 8169, 'loss/train': 1.8854844570159912} -11/06/2021 22:23:21 - INFO - __main__ - Step 8171: {'lr': 0.0004978589058258874, 'samples': 1568832, 'steps': 8170, 'loss/train': 1.8785438537597656} -11/06/2021 22:23:22 - INFO - __main__ - Step 8172: {'lr': 0.0004978582127286409, 'samples': 1569024, 'steps': 8171, 'loss/train': 2.3725521564483643} -11/06/2021 22:23:22 - INFO - __main__ - Step 8173: {'lr': 0.0004978575195197135, 'samples': 1569216, 'steps': 8172, 'loss/train': 2.0266950130462646} -11/06/2021 22:23:23 - INFO - __main__ - Step 8174: {'lr': 0.0004978568261991051, 'samples': 1569408, 'steps': 8173, 'loss/train': 1.6820038557052612} -11/06/2021 22:23:23 - INFO - __main__ - Step 8175: {'lr': 0.0004978561327668164, 'samples': 1569600, 'steps': 8174, 'loss/train': 1.5046055316925049} -11/06/2021 22:23:24 - INFO - __main__ - Step 8176: {'lr': 0.0004978554392228475, 'samples': 1569792, 'steps': 8175, 'loss/train': 1.718424916267395} -11/06/2021 22:23:24 - INFO - __main__ - Step 8177: {'lr': 0.0004978547455671986, 'samples': 1569984, 'steps': 8176, 'loss/train': 1.3242571353912354} -11/06/2021 22:23:24 - INFO - __main__ - Step 8178: {'lr': 0.0004978540517998704, 'samples': 1570176, 'steps': 8177, 'loss/train': 1.511248230934143} -11/06/2021 22:23:25 - INFO - __main__ - Step 8179: {'lr': 0.0004978533579208629, 'samples': 1570368, 'steps': 8178, 'loss/train': 1.66165292263031} -11/06/2021 22:23:26 - INFO - __main__ - Step 8180: {'lr': 0.0004978526639301766, 'samples': 1570560, 'steps': 8179, 'loss/train': 2.0218098163604736} -11/06/2021 22:23:26 - INFO - __main__ - Step 8181: {'lr': 0.0004978519698278116, 'samples': 1570752, 'steps': 8180, 'loss/train': 2.0883474349975586} -11/06/2021 22:23:26 - INFO - __main__ - Step 8182: {'lr': 0.0004978512756137684, 'samples': 1570944, 'steps': 8181, 'loss/train': 2.5265679359436035} -11/06/2021 22:23:27 - INFO - __main__ - Step 8183: {'lr': 0.0004978505812880472, 'samples': 1571136, 'steps': 8182, 'loss/train': 1.8759024143218994} -11/06/2021 22:23:28 - INFO - __main__ - Step 8184: {'lr': 0.0004978498868506483, 'samples': 1571328, 'steps': 8183, 'loss/train': 2.0600368976593018} -11/06/2021 22:23:28 - INFO - __main__ - Step 8185: {'lr': 0.0004978491923015721, 'samples': 1571520, 'steps': 8184, 'loss/train': 1.7194626331329346} -11/06/2021 22:23:28 - INFO - __main__ - Step 8186: {'lr': 0.0004978484976408189, 'samples': 1571712, 'steps': 8185, 'loss/train': 1.817257285118103} -11/06/2021 22:23:29 - INFO - __main__ - Step 8187: {'lr': 0.000497847802868389, 'samples': 1571904, 'steps': 8186, 'loss/train': 1.9279881715774536} -11/06/2021 22:23:29 - INFO - __main__ - Step 8188: {'lr': 0.0004978471079842827, 'samples': 1572096, 'steps': 8187, 'loss/train': 1.9306005239486694} -11/06/2021 22:23:30 - INFO - __main__ - Step 8189: {'lr': 0.0004978464129885003, 'samples': 1572288, 'steps': 8188, 'loss/train': 1.9209128618240356} -11/06/2021 22:23:31 - INFO - __main__ - Step 8190: {'lr': 0.0004978457178810422, 'samples': 1572480, 'steps': 8189, 'loss/train': 0.7898921966552734} -11/06/2021 22:23:31 - INFO - __main__ - Step 8191: {'lr': 0.0004978450226619085, 'samples': 1572672, 'steps': 8190, 'loss/train': 1.9690088033676147} -11/06/2021 22:23:31 - INFO - __main__ - Step 8192: {'lr': 0.0004978443273310997, 'samples': 1572864, 'steps': 8191, 'loss/train': 1.8891528844833374} -11/06/2021 22:23:32 - INFO - __main__ - Step 8193: {'lr': 0.0004978436318886162, 'samples': 1573056, 'steps': 8192, 'loss/train': 1.6559553146362305} -11/06/2021 22:23:32 - INFO - __main__ - Step 8194: {'lr': 0.0004978429363344581, 'samples': 1573248, 'steps': 8193, 'loss/train': 0.9482629299163818} -11/06/2021 22:23:33 - INFO - __main__ - Step 8195: {'lr': 0.0004978422406686257, 'samples': 1573440, 'steps': 8194, 'loss/train': 1.9039665460586548} -11/06/2021 22:23:33 - INFO - __main__ - Step 8196: {'lr': 0.0004978415448911196, 'samples': 1573632, 'steps': 8195, 'loss/train': 1.7499048709869385} -11/06/2021 22:23:34 - INFO - __main__ - Step 8197: {'lr': 0.0004978408490019398, 'samples': 1573824, 'steps': 8196, 'loss/train': 1.526663064956665} -11/06/2021 22:23:34 - INFO - __main__ - Step 8198: {'lr': 0.0004978401530010868, 'samples': 1574016, 'steps': 8197, 'loss/train': 2.0458552837371826} -11/06/2021 22:23:35 - INFO - __main__ - Step 8199: {'lr': 0.0004978394568885608, 'samples': 1574208, 'steps': 8198, 'loss/train': 1.7852051258087158} -11/06/2021 22:23:36 - INFO - __main__ - Step 8200: {'lr': 0.0004978387606643621, 'samples': 1574400, 'steps': 8199, 'loss/train': 1.7068928480148315} -11/06/2021 22:23:36 - INFO - __main__ - Step 8201: {'lr': 0.0004978380643284912, 'samples': 1574592, 'steps': 8200, 'loss/train': 1.7486140727996826} -11/06/2021 22:23:36 - INFO - __main__ - Step 8202: {'lr': 0.0004978373678809482, 'samples': 1574784, 'steps': 8201, 'loss/train': 6.046335220336914} -11/06/2021 22:23:37 - INFO - __main__ - Step 8203: {'lr': 0.0004978366713217336, 'samples': 1574976, 'steps': 8202, 'loss/train': 1.418635368347168} -11/06/2021 22:23:37 - INFO - __main__ - Step 8204: {'lr': 0.0004978359746508476, 'samples': 1575168, 'steps': 8203, 'loss/train': 2.039991855621338} -11/06/2021 22:23:38 - INFO - __main__ - Step 8205: {'lr': 0.0004978352778682905, 'samples': 1575360, 'steps': 8204, 'loss/train': 1.6890138387680054} -11/06/2021 22:23:38 - INFO - __main__ - Step 8206: {'lr': 0.0004978345809740626, 'samples': 1575552, 'steps': 8205, 'loss/train': 1.5831921100616455} -11/06/2021 22:23:39 - INFO - __main__ - Step 8207: {'lr': 0.0004978338839681644, 'samples': 1575744, 'steps': 8206, 'loss/train': 1.284598469734192} -11/06/2021 22:23:39 - INFO - __main__ - Step 8208: {'lr': 0.000497833186850596, 'samples': 1575936, 'steps': 8207, 'loss/train': 1.9825032949447632} -11/06/2021 22:23:39 - INFO - __main__ - Step 8209: {'lr': 0.0004978324896213577, 'samples': 1576128, 'steps': 8208, 'loss/train': 1.068908929824829} -11/06/2021 22:23:40 - INFO - __main__ - Step 8210: {'lr': 0.00049783179228045, 'samples': 1576320, 'steps': 8209, 'loss/train': 2.0612127780914307} -11/06/2021 22:23:41 - INFO - __main__ - Step 8211: {'lr': 0.0004978310948278731, 'samples': 1576512, 'steps': 8210, 'loss/train': 1.5374093055725098} -11/06/2021 22:23:41 - INFO - __main__ - Step 8212: {'lr': 0.0004978303972636275, 'samples': 1576704, 'steps': 8211, 'loss/train': 1.6517690420150757} -11/06/2021 22:23:41 - INFO - __main__ - Step 8213: {'lr': 0.0004978296995877132, 'samples': 1576896, 'steps': 8212, 'loss/train': 1.9710806608200073} -11/06/2021 22:23:42 - INFO - __main__ - Step 8214: {'lr': 0.0004978290018001306, 'samples': 1577088, 'steps': 8213, 'loss/train': 1.794217824935913} -11/06/2021 22:23:42 - INFO - __main__ - Step 8215: {'lr': 0.0004978283039008801, 'samples': 1577280, 'steps': 8214, 'loss/train': 2.031745433807373} -11/06/2021 22:23:43 - INFO - __main__ - Step 8216: {'lr': 0.000497827605889962, 'samples': 1577472, 'steps': 8215, 'loss/train': 1.8105554580688477} -11/06/2021 22:23:44 - INFO - __main__ - Step 8217: {'lr': 0.0004978269077673766, 'samples': 1577664, 'steps': 8216, 'loss/train': 1.3719156980514526} -11/06/2021 22:23:44 - INFO - __main__ - Step 8218: {'lr': 0.0004978262095331243, 'samples': 1577856, 'steps': 8217, 'loss/train': 1.7575129270553589} -11/06/2021 22:23:44 - INFO - __main__ - Step 8219: {'lr': 0.0004978255111872053, 'samples': 1578048, 'steps': 8218, 'loss/train': 1.9451090097427368} -11/06/2021 22:23:45 - INFO - __main__ - Step 8220: {'lr': 0.0004978248127296198, 'samples': 1578240, 'steps': 8219, 'loss/train': 2.2303905487060547} -11/06/2021 22:23:46 - INFO - __main__ - Step 8221: {'lr': 0.0004978241141603685, 'samples': 1578432, 'steps': 8220, 'loss/train': 2.1511523723602295} -11/06/2021 22:23:46 - INFO - __main__ - Step 8222: {'lr': 0.0004978234154794514, 'samples': 1578624, 'steps': 8221, 'loss/train': 1.9754325151443481} -11/06/2021 22:23:46 - INFO - __main__ - Step 8223: {'lr': 0.0004978227166868689, 'samples': 1578816, 'steps': 8222, 'loss/train': 1.4744144678115845} -11/06/2021 22:23:47 - INFO - __main__ - Step 8224: {'lr': 0.0004978220177826212, 'samples': 1579008, 'steps': 8223, 'loss/train': 1.977313756942749} -11/06/2021 22:23:47 - INFO - __main__ - Step 8225: {'lr': 0.0004978213187667087, 'samples': 1579200, 'steps': 8224, 'loss/train': 1.9514577388763428} -11/06/2021 22:23:48 - INFO - __main__ - Step 8226: {'lr': 0.0004978206196391319, 'samples': 1579392, 'steps': 8225, 'loss/train': 1.6040639877319336} -11/06/2021 22:23:48 - INFO - __main__ - Step 8227: {'lr': 0.0004978199203998909, 'samples': 1579584, 'steps': 8226, 'loss/train': 2.2450778484344482} -11/06/2021 22:23:49 - INFO - __main__ - Step 8228: {'lr': 0.0004978192210489861, 'samples': 1579776, 'steps': 8227, 'loss/train': 1.8342416286468506} -11/06/2021 22:23:49 - INFO - __main__ - Step 8229: {'lr': 0.0004978185215864177, 'samples': 1579968, 'steps': 8228, 'loss/train': 1.8177608251571655} -11/06/2021 22:23:50 - INFO - __main__ - Step 8230: {'lr': 0.0004978178220121862, 'samples': 1580160, 'steps': 8229, 'loss/train': 1.1857390403747559} -11/06/2021 22:23:50 - INFO - __main__ - Step 8231: {'lr': 0.0004978171223262917, 'samples': 1580352, 'steps': 8230, 'loss/train': 1.4002374410629272} -11/06/2021 22:23:51 - INFO - __main__ - Step 8232: {'lr': 0.0004978164225287346, 'samples': 1580544, 'steps': 8231, 'loss/train': 1.7684195041656494} -11/06/2021 22:23:51 - INFO - __main__ - Step 8233: {'lr': 0.0004978157226195153, 'samples': 1580736, 'steps': 8232, 'loss/train': 1.4781603813171387} -11/06/2021 22:23:52 - INFO - __main__ - Step 8234: {'lr': 0.0004978150225986342, 'samples': 1580928, 'steps': 8233, 'loss/train': 1.919776439666748} -11/06/2021 22:23:52 - INFO - __main__ - Step 8235: {'lr': 0.0004978143224660913, 'samples': 1581120, 'steps': 8234, 'loss/train': 2.3026692867279053} -11/06/2021 22:23:52 - INFO - __main__ - Step 8236: {'lr': 0.0004978136222218872, 'samples': 1581312, 'steps': 8235, 'loss/train': 1.9693598747253418} -11/06/2021 22:23:53 - INFO - __main__ - Step 8237: {'lr': 0.000497812921866022, 'samples': 1581504, 'steps': 8236, 'loss/train': 2.0580477714538574} -11/06/2021 22:23:54 - INFO - __main__ - Step 8238: {'lr': 0.0004978122213984961, 'samples': 1581696, 'steps': 8237, 'loss/train': 1.808411955833435} -11/06/2021 22:23:54 - INFO - __main__ - Step 8239: {'lr': 0.00049781152081931, 'samples': 1581888, 'steps': 8238, 'loss/train': 1.9752439260482788} -11/06/2021 22:23:54 - INFO - __main__ - Step 8240: {'lr': 0.0004978108201284638, 'samples': 1582080, 'steps': 8239, 'loss/train': 0.9977089166641235} -11/06/2021 22:23:55 - INFO - __main__ - Step 8241: {'lr': 0.0004978101193259578, 'samples': 1582272, 'steps': 8240, 'loss/train': 0.3795441687107086} -11/06/2021 22:23:56 - INFO - __main__ - Step 8242: {'lr': 0.0004978094184117924, 'samples': 1582464, 'steps': 8241, 'loss/train': 1.8929859399795532} -11/06/2021 22:23:56 - INFO - __main__ - Step 8243: {'lr': 0.0004978087173859679, 'samples': 1582656, 'steps': 8242, 'loss/train': 1.606785774230957} -11/06/2021 22:23:56 - INFO - __main__ - Step 8244: {'lr': 0.0004978080162484846, 'samples': 1582848, 'steps': 8243, 'loss/train': 2.046319007873535} -11/06/2021 22:23:57 - INFO - __main__ - Step 8245: {'lr': 0.000497807314999343, 'samples': 1583040, 'steps': 8244, 'loss/train': 1.9589273929595947} -11/06/2021 22:23:57 - INFO - __main__ - Step 8246: {'lr': 0.000497806613638543, 'samples': 1583232, 'steps': 8245, 'loss/train': 1.904953956604004} -11/06/2021 22:23:58 - INFO - __main__ - Step 8247: {'lr': 0.0004978059121660853, 'samples': 1583424, 'steps': 8246, 'loss/train': 1.978081226348877} -11/06/2021 22:23:59 - INFO - __main__ - Step 8248: {'lr': 0.0004978052105819701, 'samples': 1583616, 'steps': 8247, 'loss/train': 2.0313427448272705} -11/06/2021 22:23:59 - INFO - __main__ - Step 8249: {'lr': 0.0004978045088861976, 'samples': 1583808, 'steps': 8248, 'loss/train': 2.3198392391204834} -11/06/2021 22:23:59 - INFO - __main__ - Step 8250: {'lr': 0.0004978038070787683, 'samples': 1584000, 'steps': 8249, 'loss/train': 2.009343147277832} -11/06/2021 22:24:00 - INFO - __main__ - Step 8251: {'lr': 0.0004978031051596824, 'samples': 1584192, 'steps': 8250, 'loss/train': 1.775676965713501} -11/06/2021 22:24:01 - INFO - __main__ - Step 8252: {'lr': 0.0004978024031289402, 'samples': 1584384, 'steps': 8251, 'loss/train': 1.8589789867401123} -11/06/2021 22:24:01 - INFO - __main__ - Step 8253: {'lr': 0.0004978017009865421, 'samples': 1584576, 'steps': 8252, 'loss/train': 1.619974970817566} -11/06/2021 22:24:01 - INFO - __main__ - Step 8254: {'lr': 0.0004978009987324884, 'samples': 1584768, 'steps': 8253, 'loss/train': 1.9142787456512451} -11/06/2021 22:24:02 - INFO - __main__ - Step 8255: {'lr': 0.0004978002963667794, 'samples': 1584960, 'steps': 8254, 'loss/train': 1.2939250469207764} -11/06/2021 22:24:02 - INFO - __main__ - Step 8256: {'lr': 0.0004977995938894153, 'samples': 1585152, 'steps': 8255, 'loss/train': 2.2025363445281982} -11/06/2021 22:24:03 - INFO - __main__ - Step 8257: {'lr': 0.0004977988913003966, 'samples': 1585344, 'steps': 8256, 'loss/train': 2.0969882011413574} -11/06/2021 22:24:03 - INFO - __main__ - Step 8258: {'lr': 0.0004977981885997235, 'samples': 1585536, 'steps': 8257, 'loss/train': 1.3908742666244507} -11/06/2021 22:24:04 - INFO - __main__ - Step 8259: {'lr': 0.0004977974857873964, 'samples': 1585728, 'steps': 8258, 'loss/train': 1.7966902256011963} -11/06/2021 22:24:04 - INFO - __main__ - Step 8260: {'lr': 0.0004977967828634157, 'samples': 1585920, 'steps': 8259, 'loss/train': 1.8227860927581787} -11/06/2021 22:24:05 - INFO - __main__ - Step 8261: {'lr': 0.0004977960798277814, 'samples': 1586112, 'steps': 8260, 'loss/train': 1.9070138931274414} -11/06/2021 22:24:05 - INFO - __main__ - Step 8262: {'lr': 0.0004977953766804941, 'samples': 1586304, 'steps': 8261, 'loss/train': 1.7750216722488403} -11/06/2021 22:24:06 - INFO - __main__ - Step 8263: {'lr': 0.0004977946734215541, 'samples': 1586496, 'steps': 8262, 'loss/train': 1.3663748502731323} -11/06/2021 22:24:06 - INFO - __main__ - Step 8264: {'lr': 0.0004977939700509615, 'samples': 1586688, 'steps': 8263, 'loss/train': 2.318755626678467} -11/06/2021 22:24:07 - INFO - __main__ - Step 8265: {'lr': 0.0004977932665687168, 'samples': 1586880, 'steps': 8264, 'loss/train': 1.6168603897094727} -11/06/2021 22:24:07 - INFO - __main__ - Step 8266: {'lr': 0.0004977925629748203, 'samples': 1587072, 'steps': 8265, 'loss/train': 1.8348907232284546} -11/06/2021 22:24:07 - INFO - __main__ - Step 8267: {'lr': 0.0004977918592692723, 'samples': 1587264, 'steps': 8266, 'loss/train': 2.0127944946289062} -11/06/2021 22:24:08 - INFO - __main__ - Step 8268: {'lr': 0.0004977911554520731, 'samples': 1587456, 'steps': 8267, 'loss/train': 2.4717700481414795} -11/06/2021 22:24:09 - INFO - __main__ - Step 8269: {'lr': 0.000497790451523223, 'samples': 1587648, 'steps': 8268, 'loss/train': 1.848479151725769} -11/06/2021 22:24:09 - INFO - __main__ - Step 8270: {'lr': 0.0004977897474827224, 'samples': 1587840, 'steps': 8269, 'loss/train': 2.058631420135498} -11/06/2021 22:24:09 - INFO - __main__ - Step 8271: {'lr': 0.0004977890433305716, 'samples': 1588032, 'steps': 8270, 'loss/train': 2.1743407249450684} -11/06/2021 22:24:10 - INFO - __main__ - Step 8272: {'lr': 0.0004977883390667707, 'samples': 1588224, 'steps': 8271, 'loss/train': 1.7695982456207275} -11/06/2021 22:24:11 - INFO - __main__ - Step 8273: {'lr': 0.0004977876346913204, 'samples': 1588416, 'steps': 8272, 'loss/train': 1.5789722204208374} -11/06/2021 22:24:11 - INFO - __main__ - Step 8274: {'lr': 0.0004977869302042207, 'samples': 1588608, 'steps': 8273, 'loss/train': 1.8004614114761353} -11/06/2021 22:24:12 - INFO - __main__ - Step 8275: {'lr': 0.0004977862256054721, 'samples': 1588800, 'steps': 8274, 'loss/train': 1.8264741897583008} -11/06/2021 22:24:12 - INFO - __main__ - Step 8276: {'lr': 0.0004977855208950748, 'samples': 1588992, 'steps': 8275, 'loss/train': 1.8771971464157104} -11/06/2021 22:24:12 - INFO - __main__ - Step 8277: {'lr': 0.0004977848160730292, 'samples': 1589184, 'steps': 8276, 'loss/train': 1.6610857248306274} -11/06/2021 22:24:13 - INFO - __main__ - Step 8278: {'lr': 0.0004977841111393356, 'samples': 1589376, 'steps': 8277, 'loss/train': 1.7846906185150146} -11/06/2021 22:24:14 - INFO - __main__ - Step 8279: {'lr': 0.0004977834060939943, 'samples': 1589568, 'steps': 8278, 'loss/train': 1.6243547201156616} -11/06/2021 22:24:14 - INFO - __main__ - Step 8280: {'lr': 0.0004977827009370056, 'samples': 1589760, 'steps': 8279, 'loss/train': 1.42178475856781} -11/06/2021 22:24:14 - INFO - __main__ - Step 8281: {'lr': 0.0004977819956683698, 'samples': 1589952, 'steps': 8280, 'loss/train': 1.8669449090957642} -11/06/2021 22:24:15 - INFO - __main__ - Step 8282: {'lr': 0.0004977812902880873, 'samples': 1590144, 'steps': 8281, 'loss/train': 2.0661544799804688} -11/06/2021 22:24:15 - INFO - __main__ - Step 8283: {'lr': 0.0004977805847961584, 'samples': 1590336, 'steps': 8282, 'loss/train': 1.9494577646255493} -11/06/2021 22:24:16 - INFO - __main__ - Step 8284: {'lr': 0.0004977798791925834, 'samples': 1590528, 'steps': 8283, 'loss/train': 1.9344879388809204} -11/06/2021 22:24:16 - INFO - __main__ - Step 8285: {'lr': 0.0004977791734773624, 'samples': 1590720, 'steps': 8284, 'loss/train': 1.7498496770858765} -11/06/2021 22:24:17 - INFO - __main__ - Step 8286: {'lr': 0.0004977784676504962, 'samples': 1590912, 'steps': 8285, 'loss/train': 1.4974678754806519} -11/06/2021 22:24:17 - INFO - __main__ - Step 8287: {'lr': 0.0004977777617119847, 'samples': 1591104, 'steps': 8286, 'loss/train': 1.8675819635391235} -11/06/2021 22:24:18 - INFO - __main__ - Step 8288: {'lr': 0.0004977770556618284, 'samples': 1591296, 'steps': 8287, 'loss/train': 2.119424343109131} -11/06/2021 22:24:18 - INFO - __main__ - Step 8289: {'lr': 0.0004977763495000276, 'samples': 1591488, 'steps': 8288, 'loss/train': 1.7665525674819946} -11/06/2021 22:24:19 - INFO - __main__ - Step 8290: {'lr': 0.0004977756432265827, 'samples': 1591680, 'steps': 8289, 'loss/train': 1.5919955968856812} -11/06/2021 22:24:19 - INFO - __main__ - Step 8291: {'lr': 0.0004977749368414937, 'samples': 1591872, 'steps': 8290, 'loss/train': 1.6842032670974731} -11/06/2021 22:24:20 - INFO - __main__ - Step 8292: {'lr': 0.0004977742303447613, 'samples': 1592064, 'steps': 8291, 'loss/train': 2.4035115242004395} -11/06/2021 22:24:20 - INFO - __main__ - Step 8293: {'lr': 0.0004977735237363855, 'samples': 1592256, 'steps': 8292, 'loss/train': 1.7982686758041382} -11/06/2021 22:24:21 - INFO - __main__ - Step 8294: {'lr': 0.0004977728170163669, 'samples': 1592448, 'steps': 8293, 'loss/train': 2.0274014472961426} -11/06/2021 22:24:21 - INFO - __main__ - Step 8295: {'lr': 0.0004977721101847057, 'samples': 1592640, 'steps': 8294, 'loss/train': 2.058189868927002} -11/06/2021 22:24:22 - INFO - __main__ - Step 8296: {'lr': 0.0004977714032414021, 'samples': 1592832, 'steps': 8295, 'loss/train': 1.709094762802124} -11/06/2021 22:24:22 - INFO - __main__ - Step 8297: {'lr': 0.0004977706961864566, 'samples': 1593024, 'steps': 8296, 'loss/train': 2.004429578781128} -11/06/2021 22:24:22 - INFO - __main__ - Step 8298: {'lr': 0.0004977699890198695, 'samples': 1593216, 'steps': 8297, 'loss/train': 0.9048164486885071} -11/06/2021 22:24:23 - INFO - __main__ - Step 8299: {'lr': 0.0004977692817416411, 'samples': 1593408, 'steps': 8298, 'loss/train': 1.415739893913269} -11/06/2021 22:24:24 - INFO - __main__ - Step 8300: {'lr': 0.0004977685743517715, 'samples': 1593600, 'steps': 8299, 'loss/train': 1.8536925315856934} -11/06/2021 22:24:24 - INFO - __main__ - Step 8301: {'lr': 0.0004977678668502614, 'samples': 1593792, 'steps': 8300, 'loss/train': 2.0791187286376953} -11/06/2021 22:24:24 - INFO - __main__ - Step 8302: {'lr': 0.0004977671592371108, 'samples': 1593984, 'steps': 8301, 'loss/train': 0.7785729765892029} -11/06/2021 22:24:25 - INFO - __main__ - Step 8303: {'lr': 0.0004977664515123201, 'samples': 1594176, 'steps': 8302, 'loss/train': 1.8622348308563232} -11/06/2021 22:24:26 - INFO - __main__ - Step 8304: {'lr': 0.0004977657436758898, 'samples': 1594368, 'steps': 8303, 'loss/train': 1.9687023162841797} -11/06/2021 22:24:26 - INFO - __main__ - Step 8305: {'lr': 0.00049776503572782, 'samples': 1594560, 'steps': 8304, 'loss/train': 1.782356858253479} -11/06/2021 22:24:27 - INFO - __main__ - Step 8306: {'lr': 0.0004977643276681111, 'samples': 1594752, 'steps': 8305, 'loss/train': 1.6314135789871216} -11/06/2021 22:24:27 - INFO - __main__ - Step 8307: {'lr': 0.0004977636194967634, 'samples': 1594944, 'steps': 8306, 'loss/train': 2.114375591278076} -11/06/2021 22:24:27 - INFO - __main__ - Step 8308: {'lr': 0.0004977629112137773, 'samples': 1595136, 'steps': 8307, 'loss/train': 1.4448978900909424} -11/06/2021 22:24:28 - INFO - __main__ - Step 8309: {'lr': 0.000497762202819153, 'samples': 1595328, 'steps': 8308, 'loss/train': 2.2745602130889893} -11/06/2021 22:24:29 - INFO - __main__ - Step 8310: {'lr': 0.0004977614943128909, 'samples': 1595520, 'steps': 8309, 'loss/train': 2.14582896232605} -11/06/2021 22:24:29 - INFO - __main__ - Step 8311: {'lr': 0.0004977607856949913, 'samples': 1595712, 'steps': 8310, 'loss/train': 1.7548679113388062} -11/06/2021 22:24:29 - INFO - __main__ - Step 8312: {'lr': 0.0004977600769654545, 'samples': 1595904, 'steps': 8311, 'loss/train': 1.5743494033813477} -11/06/2021 22:24:30 - INFO - __main__ - Step 8313: {'lr': 0.0004977593681242808, 'samples': 1596096, 'steps': 8312, 'loss/train': 2.279632806777954} -11/06/2021 22:24:30 - INFO - __main__ - Step 8314: {'lr': 0.0004977586591714706, 'samples': 1596288, 'steps': 8313, 'loss/train': 2.477036714553833} -11/06/2021 22:24:31 - INFO - __main__ - Step 8315: {'lr': 0.0004977579501070241, 'samples': 1596480, 'steps': 8314, 'loss/train': 1.5748059749603271} -11/06/2021 22:24:31 - INFO - __main__ - Step 8316: {'lr': 0.0004977572409309418, 'samples': 1596672, 'steps': 8315, 'loss/train': 1.7749756574630737} -11/06/2021 22:24:32 - INFO - __main__ - Step 8317: {'lr': 0.0004977565316432238, 'samples': 1596864, 'steps': 8316, 'loss/train': 2.0671162605285645} -11/06/2021 22:24:32 - INFO - __main__ - Step 8318: {'lr': 0.0004977558222438707, 'samples': 1597056, 'steps': 8317, 'loss/train': 1.9523950815200806} -11/06/2021 22:24:33 - INFO - __main__ - Step 8319: {'lr': 0.0004977551127328824, 'samples': 1597248, 'steps': 8318, 'loss/train': 1.767422080039978} -11/06/2021 22:24:34 - INFO - __main__ - Step 8320: {'lr': 0.0004977544031102597, 'samples': 1597440, 'steps': 8319, 'loss/train': 1.7613978385925293} -11/06/2021 22:24:34 - INFO - __main__ - Step 8321: {'lr': 0.0004977536933760025, 'samples': 1597632, 'steps': 8320, 'loss/train': 1.8801629543304443} -11/06/2021 22:24:34 - INFO - __main__ - Step 8322: {'lr': 0.0004977529835301115, 'samples': 1597824, 'steps': 8321, 'loss/train': 1.653210163116455} -11/06/2021 22:24:35 - INFO - __main__ - Step 8323: {'lr': 0.0004977522735725866, 'samples': 1598016, 'steps': 8322, 'loss/train': 1.4604030847549438} -11/06/2021 22:24:35 - INFO - __main__ - Step 8324: {'lr': 0.0004977515635034285, 'samples': 1598208, 'steps': 8323, 'loss/train': 1.7190172672271729} -11/06/2021 22:24:36 - INFO - __main__ - Step 8325: {'lr': 0.0004977508533226374, 'samples': 1598400, 'steps': 8324, 'loss/train': 1.7144981622695923} -11/06/2021 22:24:36 - INFO - __main__ - Step 8326: {'lr': 0.0004977501430302136, 'samples': 1598592, 'steps': 8325, 'loss/train': 2.134070873260498} -11/06/2021 22:24:37 - INFO - __main__ - Step 8327: {'lr': 0.0004977494326261573, 'samples': 1598784, 'steps': 8326, 'loss/train': 2.0011684894561768} -11/06/2021 22:24:37 - INFO - __main__ - Step 8328: {'lr': 0.000497748722110469, 'samples': 1598976, 'steps': 8327, 'loss/train': 3.0373826026916504} -11/06/2021 22:24:38 - INFO - __main__ - Step 8329: {'lr': 0.0004977480114831489, 'samples': 1599168, 'steps': 8328, 'loss/train': 1.5927302837371826} -11/06/2021 22:24:38 - INFO - __main__ - Step 8330: {'lr': 0.0004977473007441973, 'samples': 1599360, 'steps': 8329, 'loss/train': 1.6622514724731445} -11/06/2021 22:24:39 - INFO - __main__ - Step 8331: {'lr': 0.0004977465898936147, 'samples': 1599552, 'steps': 8330, 'loss/train': 2.2087743282318115} -11/06/2021 22:24:39 - INFO - __main__ - Step 8332: {'lr': 0.0004977458789314014, 'samples': 1599744, 'steps': 8331, 'loss/train': 2.013927936553955} -11/06/2021 22:24:40 - INFO - __main__ - Step 8333: {'lr': 0.0004977451678575575, 'samples': 1599936, 'steps': 8332, 'loss/train': 1.207032561302185} -11/06/2021 22:24:40 - INFO - __main__ - Step 8334: {'lr': 0.0004977444566720834, 'samples': 1600128, 'steps': 8333, 'loss/train': 1.9208728075027466} -11/06/2021 22:24:40 - INFO - __main__ - Step 8335: {'lr': 0.0004977437453749795, 'samples': 1600320, 'steps': 8334, 'loss/train': 1.8534126281738281} -11/06/2021 22:24:42 - INFO - __main__ - Step 8336: {'lr': 0.0004977430339662462, 'samples': 1600512, 'steps': 8335, 'loss/train': 2.3053481578826904} -11/06/2021 22:24:42 - INFO - __main__ - Step 8337: {'lr': 0.0004977423224458837, 'samples': 1600704, 'steps': 8336, 'loss/train': 1.7347732782363892} -11/06/2021 22:24:42 - INFO - __main__ - Step 8338: {'lr': 0.0004977416108138922, 'samples': 1600896, 'steps': 8337, 'loss/train': 1.3853802680969238} -11/06/2021 22:24:43 - INFO - __main__ - Step 8339: {'lr': 0.0004977408990702722, 'samples': 1601088, 'steps': 8338, 'loss/train': 1.826993465423584} -11/06/2021 22:24:43 - INFO - __main__ - Step 8340: {'lr': 0.0004977401872150241, 'samples': 1601280, 'steps': 8339, 'loss/train': 1.857647180557251} -11/06/2021 22:24:44 - INFO - __main__ - Step 8341: {'lr': 0.000497739475248148, 'samples': 1601472, 'steps': 8340, 'loss/train': 1.9734106063842773} -11/06/2021 22:24:44 - INFO - __main__ - Step 8342: {'lr': 0.0004977387631696443, 'samples': 1601664, 'steps': 8341, 'loss/train': 1.5935910940170288} -11/06/2021 22:24:45 - INFO - __main__ - Step 8343: {'lr': 0.0004977380509795133, 'samples': 1601856, 'steps': 8342, 'loss/train': 1.8237578868865967} -11/06/2021 22:24:45 - INFO - __main__ - Step 8344: {'lr': 0.0004977373386777554, 'samples': 1602048, 'steps': 8343, 'loss/train': 2.0518319606781006} -11/06/2021 22:24:45 - INFO - __main__ - Step 8345: {'lr': 0.0004977366262643709, 'samples': 1602240, 'steps': 8344, 'loss/train': 2.2713077068328857} -11/06/2021 22:24:46 - INFO - __main__ - Step 8346: {'lr': 0.0004977359137393601, 'samples': 1602432, 'steps': 8345, 'loss/train': 1.824563980102539} -11/06/2021 22:24:47 - INFO - __main__ - Step 8347: {'lr': 0.0004977352011027233, 'samples': 1602624, 'steps': 8346, 'loss/train': 2.087007999420166} -11/06/2021 22:24:47 - INFO - __main__ - Step 8348: {'lr': 0.0004977344883544608, 'samples': 1602816, 'steps': 8347, 'loss/train': 1.990113615989685} -11/06/2021 22:24:47 - INFO - __main__ - Step 8349: {'lr': 0.0004977337754945731, 'samples': 1603008, 'steps': 8348, 'loss/train': 1.9418188333511353} -11/06/2021 22:24:48 - INFO - __main__ - Step 8350: {'lr': 0.0004977330625230603, 'samples': 1603200, 'steps': 8349, 'loss/train': 1.706646203994751} -11/06/2021 22:24:49 - INFO - __main__ - Step 8351: {'lr': 0.0004977323494399227, 'samples': 1603392, 'steps': 8350, 'loss/train': 2.1837000846862793} -11/06/2021 22:24:49 - INFO - __main__ - Step 8352: {'lr': 0.0004977316362451608, 'samples': 1603584, 'steps': 8351, 'loss/train': 1.3790884017944336} -11/06/2021 22:24:50 - INFO - __main__ - Step 8353: {'lr': 0.0004977309229387749, 'samples': 1603776, 'steps': 8352, 'loss/train': 2.0610451698303223} -11/06/2021 22:24:50 - INFO - __main__ - Step 8354: {'lr': 0.0004977302095207653, 'samples': 1603968, 'steps': 8353, 'loss/train': 1.990189552307129} -11/06/2021 22:24:50 - INFO - __main__ - Step 8355: {'lr': 0.0004977294959911322, 'samples': 1604160, 'steps': 8354, 'loss/train': 1.6748875379562378} -11/06/2021 22:24:51 - INFO - __main__ - Step 8356: {'lr': 0.0004977287823498761, 'samples': 1604352, 'steps': 8355, 'loss/train': 2.276111602783203} -11/06/2021 22:24:52 - INFO - __main__ - Step 8357: {'lr': 0.0004977280685969971, 'samples': 1604544, 'steps': 8356, 'loss/train': 2.2838523387908936} -11/06/2021 22:24:52 - INFO - __main__ - Step 8358: {'lr': 0.0004977273547324958, 'samples': 1604736, 'steps': 8357, 'loss/train': 2.2760424613952637} -11/06/2021 22:24:52 - INFO - __main__ - Step 8359: {'lr': 0.0004977266407563722, 'samples': 1604928, 'steps': 8358, 'loss/train': 3.90104079246521} -11/06/2021 22:24:53 - INFO - __main__ - Step 8360: {'lr': 0.0004977259266686269, 'samples': 1605120, 'steps': 8359, 'loss/train': 1.3751955032348633} -11/06/2021 22:24:54 - INFO - __main__ - Step 8361: {'lr': 0.0004977252124692601, 'samples': 1605312, 'steps': 8360, 'loss/train': 1.8619705438613892} -11/06/2021 22:24:54 - INFO - __main__ - Step 8362: {'lr': 0.0004977244981582723, 'samples': 1605504, 'steps': 8361, 'loss/train': 1.7409098148345947} -11/06/2021 22:24:54 - INFO - __main__ - Step 8363: {'lr': 0.0004977237837356634, 'samples': 1605696, 'steps': 8362, 'loss/train': 1.7340418100357056} -11/06/2021 22:24:55 - INFO - __main__ - Step 8364: {'lr': 0.0004977230692014341, 'samples': 1605888, 'steps': 8363, 'loss/train': 1.5807855129241943} -11/06/2021 22:24:55 - INFO - __main__ - Step 8365: {'lr': 0.0004977223545555847, 'samples': 1606080, 'steps': 8364, 'loss/train': 1.9046440124511719} -11/06/2021 22:24:56 - INFO - __main__ - Step 8366: {'lr': 0.0004977216397981153, 'samples': 1606272, 'steps': 8365, 'loss/train': 1.9120842218399048} -11/06/2021 22:24:56 - INFO - __main__ - Step 8367: {'lr': 0.0004977209249290264, 'samples': 1606464, 'steps': 8366, 'loss/train': 1.9572821855545044} -11/06/2021 22:24:57 - INFO - __main__ - Step 8368: {'lr': 0.0004977202099483184, 'samples': 1606656, 'steps': 8367, 'loss/train': 2.009401559829712} -11/06/2021 22:24:57 - INFO - __main__ - Step 8369: {'lr': 0.0004977194948559913, 'samples': 1606848, 'steps': 8368, 'loss/train': 1.6611480712890625} -11/06/2021 22:24:58 - INFO - __main__ - Step 8370: {'lr': 0.0004977187796520457, 'samples': 1607040, 'steps': 8369, 'loss/train': 1.6625375747680664} -11/06/2021 22:24:58 - INFO - __main__ - Step 8371: {'lr': 0.0004977180643364819, 'samples': 1607232, 'steps': 8370, 'loss/train': 1.967087984085083} -11/06/2021 22:24:59 - INFO - __main__ - Step 8372: {'lr': 0.0004977173489093, 'samples': 1607424, 'steps': 8371, 'loss/train': 1.945002555847168} -11/06/2021 22:24:59 - INFO - __main__ - Step 8373: {'lr': 0.0004977166333705005, 'samples': 1607616, 'steps': 8372, 'loss/train': 1.0230144262313843} -11/06/2021 22:25:00 - INFO - __main__ - Step 8374: {'lr': 0.0004977159177200839, 'samples': 1607808, 'steps': 8373, 'loss/train': 1.9832271337509155} -11/06/2021 22:25:00 - INFO - __main__ - Step 8375: {'lr': 0.0004977152019580502, 'samples': 1608000, 'steps': 8374, 'loss/train': 1.5450023412704468} -11/06/2021 22:25:00 - INFO - __main__ - Step 8376: {'lr': 0.0004977144860843998, 'samples': 1608192, 'steps': 8375, 'loss/train': 1.7388193607330322} -11/06/2021 22:25:01 - INFO - __main__ - Step 8377: {'lr': 0.0004977137700991332, 'samples': 1608384, 'steps': 8376, 'loss/train': 1.4530218839645386} -11/06/2021 22:25:02 - INFO - __main__ - Step 8378: {'lr': 0.0004977130540022506, 'samples': 1608576, 'steps': 8377, 'loss/train': 1.5566548109054565} -11/06/2021 22:25:02 - INFO - __main__ - Step 8379: {'lr': 0.0004977123377937523, 'samples': 1608768, 'steps': 8378, 'loss/train': 1.7430671453475952} -11/06/2021 22:25:02 - INFO - __main__ - Step 8380: {'lr': 0.0004977116214736385, 'samples': 1608960, 'steps': 8379, 'loss/train': 1.1904152631759644} -11/06/2021 22:25:03 - INFO - __main__ - Step 8381: {'lr': 0.0004977109050419097, 'samples': 1609152, 'steps': 8380, 'loss/train': 2.402639150619507} -11/06/2021 22:25:04 - INFO - __main__ - Step 8382: {'lr': 0.0004977101884985663, 'samples': 1609344, 'steps': 8381, 'loss/train': 1.059557557106018} -11/06/2021 22:25:04 - INFO - __main__ - Step 8383: {'lr': 0.0004977094718436085, 'samples': 1609536, 'steps': 8382, 'loss/train': 1.9162335395812988} -11/06/2021 22:25:04 - INFO - __main__ - Step 8384: {'lr': 0.0004977087550770366, 'samples': 1609728, 'steps': 8383, 'loss/train': 1.9313476085662842} -11/06/2021 22:25:05 - INFO - __main__ - Step 8385: {'lr': 0.000497708038198851, 'samples': 1609920, 'steps': 8384, 'loss/train': 1.6063017845153809} -11/06/2021 22:25:05 - INFO - __main__ - Step 8386: {'lr': 0.0004977073212090519, 'samples': 1610112, 'steps': 8385, 'loss/train': 1.8818663358688354} -11/06/2021 22:25:06 - INFO - __main__ - Step 8387: {'lr': 0.0004977066041076398, 'samples': 1610304, 'steps': 8386, 'loss/train': 1.9069045782089233} -11/06/2021 22:25:06 - INFO - __main__ - Step 8388: {'lr': 0.0004977058868946148, 'samples': 1610496, 'steps': 8387, 'loss/train': 2.062808036804199} -11/06/2021 22:25:07 - INFO - __main__ - Step 8389: {'lr': 0.0004977051695699775, 'samples': 1610688, 'steps': 8388, 'loss/train': 1.8666964769363403} -11/06/2021 22:25:07 - INFO - __main__ - Step 8390: {'lr': 0.000497704452133728, 'samples': 1610880, 'steps': 8389, 'loss/train': 2.0732336044311523} -11/06/2021 22:25:08 - INFO - __main__ - Step 8391: {'lr': 0.0004977037345858667, 'samples': 1611072, 'steps': 8390, 'loss/train': 2.5039222240448} -11/06/2021 22:25:09 - INFO - __main__ - Step 8392: {'lr': 0.0004977030169263938, 'samples': 1611264, 'steps': 8391, 'loss/train': 1.8938769102096558} -11/06/2021 22:25:09 - INFO - __main__ - Step 8393: {'lr': 0.0004977022991553099, 'samples': 1611456, 'steps': 8392, 'loss/train': 1.8383945226669312} -11/06/2021 22:25:09 - INFO - __main__ - Step 8394: {'lr': 0.0004977015812726151, 'samples': 1611648, 'steps': 8393, 'loss/train': 1.9845424890518188} -11/06/2021 22:25:10 - INFO - __main__ - Step 8395: {'lr': 0.0004977008632783098, 'samples': 1611840, 'steps': 8394, 'loss/train': 1.7527318000793457} -11/06/2021 22:25:10 - INFO - __main__ - Step 8396: {'lr': 0.0004977001451723944, 'samples': 1612032, 'steps': 8395, 'loss/train': 0.8850865364074707} -11/06/2021 22:25:10 - INFO - __main__ - Step 8397: {'lr': 0.000497699426954869, 'samples': 1612224, 'steps': 8396, 'loss/train': 1.9200553894042969} -11/06/2021 22:25:11 - INFO - __main__ - Step 8398: {'lr': 0.0004976987086257342, 'samples': 1612416, 'steps': 8397, 'loss/train': 1.0962588787078857} -11/06/2021 22:25:12 - INFO - __main__ - Step 8399: {'lr': 0.0004976979901849901, 'samples': 1612608, 'steps': 8398, 'loss/train': 1.736077070236206} -11/06/2021 22:25:12 - INFO - __main__ - Step 8400: {'lr': 0.000497697271632637, 'samples': 1612800, 'steps': 8399, 'loss/train': 1.651288390159607} -11/06/2021 22:25:12 - INFO - __main__ - Step 8401: {'lr': 0.0004976965529686756, 'samples': 1612992, 'steps': 8400, 'loss/train': 1.851194977760315} -11/06/2021 22:25:13 - INFO - __main__ - Step 8402: {'lr': 0.0004976958341931057, 'samples': 1613184, 'steps': 8401, 'loss/train': 1.0811164379119873} -11/06/2021 22:25:14 - INFO - __main__ - Step 8403: {'lr': 0.000497695115305928, 'samples': 1613376, 'steps': 8402, 'loss/train': 1.9029980897903442} -11/06/2021 22:25:14 - INFO - __main__ - Step 8404: {'lr': 0.0004976943963071426, 'samples': 1613568, 'steps': 8403, 'loss/train': 1.7651731967926025} -11/06/2021 22:25:15 - INFO - __main__ - Step 8405: {'lr': 0.0004976936771967501, 'samples': 1613760, 'steps': 8404, 'loss/train': 2.381589412689209} -11/06/2021 22:25:15 - INFO - __main__ - Step 8406: {'lr': 0.0004976929579747505, 'samples': 1613952, 'steps': 8405, 'loss/train': 1.7756294012069702} -11/06/2021 22:25:15 - INFO - __main__ - Step 8407: {'lr': 0.0004976922386411444, 'samples': 1614144, 'steps': 8406, 'loss/train': 2.137291669845581} -11/06/2021 22:25:16 - INFO - __main__ - Step 8408: {'lr': 0.0004976915191959319, 'samples': 1614336, 'steps': 8407, 'loss/train': 1.879096508026123} -11/06/2021 22:25:17 - INFO - __main__ - Step 8409: {'lr': 0.0004976907996391135, 'samples': 1614528, 'steps': 8408, 'loss/train': 1.870473861694336} -11/06/2021 22:25:17 - INFO - __main__ - Step 8410: {'lr': 0.0004976900799706894, 'samples': 1614720, 'steps': 8409, 'loss/train': 2.050117015838623} -11/06/2021 22:25:17 - INFO - __main__ - Step 8411: {'lr': 0.00049768936019066, 'samples': 1614912, 'steps': 8410, 'loss/train': 1.824702262878418} -11/06/2021 22:25:18 - INFO - __main__ - Step 8412: {'lr': 0.0004976886402990255, 'samples': 1615104, 'steps': 8411, 'loss/train': 1.77139413356781} -11/06/2021 22:25:19 - INFO - __main__ - Step 8413: {'lr': 0.0004976879202957864, 'samples': 1615296, 'steps': 8412, 'loss/train': 1.8707973957061768} -11/06/2021 22:25:19 - INFO - __main__ - Step 8414: {'lr': 0.000497687200180943, 'samples': 1615488, 'steps': 8413, 'loss/train': 1.7304356098175049} -11/06/2021 22:25:19 - INFO - __main__ - Step 8415: {'lr': 0.0004976864799544954, 'samples': 1615680, 'steps': 8414, 'loss/train': 1.8535863161087036} -11/06/2021 22:25:20 - INFO - __main__ - Step 8416: {'lr': 0.0004976857596164443, 'samples': 1615872, 'steps': 8415, 'loss/train': 1.761738896369934} -11/06/2021 22:25:20 - INFO - __main__ - Step 8417: {'lr': 0.0004976850391667897, 'samples': 1616064, 'steps': 8416, 'loss/train': 1.0257487297058105} -11/06/2021 22:25:21 - INFO - __main__ - Step 8418: {'lr': 0.0004976843186055321, 'samples': 1616256, 'steps': 8417, 'loss/train': 1.9058445692062378} -11/06/2021 22:25:21 - INFO - __main__ - Step 8419: {'lr': 0.0004976835979326718, 'samples': 1616448, 'steps': 8418, 'loss/train': 1.5903434753417969} -11/06/2021 22:25:22 - INFO - __main__ - Step 8420: {'lr': 0.0004976828771482089, 'samples': 1616640, 'steps': 8419, 'loss/train': 1.9769971370697021} -11/06/2021 22:25:22 - INFO - __main__ - Step 8421: {'lr': 0.0004976821562521441, 'samples': 1616832, 'steps': 8420, 'loss/train': 1.9733790159225464} -11/06/2021 22:25:22 - INFO - __main__ - Step 8422: {'lr': 0.0004976814352444775, 'samples': 1617024, 'steps': 8421, 'loss/train': 1.1663745641708374} -11/06/2021 22:25:24 - INFO - __main__ - Step 8423: {'lr': 0.0004976807141252094, 'samples': 1617216, 'steps': 8422, 'loss/train': 1.938113808631897} -11/06/2021 22:25:24 - INFO - __main__ - Step 8424: {'lr': 0.0004976799928943403, 'samples': 1617408, 'steps': 8423, 'loss/train': 0.9520623683929443} -11/06/2021 22:25:25 - INFO - __main__ - Step 8425: {'lr': 0.0004976792715518703, 'samples': 1617600, 'steps': 8424, 'loss/train': 2.006859302520752} -11/06/2021 22:25:25 - INFO - __main__ - Step 8426: {'lr': 0.0004976785500978, 'samples': 1617792, 'steps': 8425, 'loss/train': 1.5716438293457031} -11/06/2021 22:25:25 - INFO - __main__ - Step 8427: {'lr': 0.0004976778285321294, 'samples': 1617984, 'steps': 8426, 'loss/train': 1.7659454345703125} -11/06/2021 22:25:26 - INFO - __main__ - Step 8428: {'lr': 0.0004976771068548591, 'samples': 1618176, 'steps': 8427, 'loss/train': 2.2531676292419434} -11/06/2021 22:25:27 - INFO - __main__ - Step 8429: {'lr': 0.0004976763850659893, 'samples': 1618368, 'steps': 8428, 'loss/train': 0.3412085175514221} -11/06/2021 22:25:27 - INFO - __main__ - Step 8430: {'lr': 0.0004976756631655203, 'samples': 1618560, 'steps': 8429, 'loss/train': 1.789984941482544} -11/06/2021 22:25:27 - INFO - __main__ - Step 8431: {'lr': 0.0004976749411534525, 'samples': 1618752, 'steps': 8430, 'loss/train': 1.566307783126831} -11/06/2021 22:25:28 - INFO - __main__ - Step 8432: {'lr': 0.0004976742190297862, 'samples': 1618944, 'steps': 8431, 'loss/train': 2.2874772548675537} -11/06/2021 22:25:28 - INFO - __main__ - Step 8433: {'lr': 0.0004976734967945217, 'samples': 1619136, 'steps': 8432, 'loss/train': 1.724574327468872} -11/06/2021 22:25:29 - INFO - __main__ - Step 8434: {'lr': 0.0004976727744476593, 'samples': 1619328, 'steps': 8433, 'loss/train': 2.225064516067505} -11/06/2021 22:25:29 - INFO - __main__ - Step 8435: {'lr': 0.0004976720519891994, 'samples': 1619520, 'steps': 8434, 'loss/train': 1.7268136739730835} -11/06/2021 22:25:30 - INFO - __main__ - Step 8436: {'lr': 0.0004976713294191423, 'samples': 1619712, 'steps': 8435, 'loss/train': 1.76718270778656} -11/06/2021 22:25:30 - INFO - __main__ - Step 8437: {'lr': 0.0004976706067374885, 'samples': 1619904, 'steps': 8436, 'loss/train': 1.7768479585647583} -11/06/2021 22:25:31 - INFO - __main__ - Step 8438: {'lr': 0.0004976698839442379, 'samples': 1620096, 'steps': 8437, 'loss/train': 1.0732344388961792} -11/06/2021 22:25:31 - INFO - __main__ - Step 8439: {'lr': 0.0004976691610393911, 'samples': 1620288, 'steps': 8438, 'loss/train': 2.1499216556549072} -11/06/2021 22:25:32 - INFO - __main__ - Step 8440: {'lr': 0.0004976684380229485, 'samples': 1620480, 'steps': 8439, 'loss/train': 1.8291432857513428} -11/06/2021 22:25:32 - INFO - __main__ - Step 8441: {'lr': 0.0004976677148949102, 'samples': 1620672, 'steps': 8440, 'loss/train': 1.7826381921768188} -11/06/2021 22:25:33 - INFO - __main__ - Step 8442: {'lr': 0.0004976669916552768, 'samples': 1620864, 'steps': 8441, 'loss/train': 1.9281136989593506} -11/06/2021 22:25:33 - INFO - __main__ - Step 8443: {'lr': 0.0004976662683040484, 'samples': 1621056, 'steps': 8442, 'loss/train': 1.7835140228271484} -11/06/2021 22:25:33 - INFO - __main__ - Step 8444: {'lr': 0.0004976655448412254, 'samples': 1621248, 'steps': 8443, 'loss/train': 2.6480824947357178} -11/06/2021 22:25:34 - INFO - __main__ - Step 8445: {'lr': 0.0004976648212668081, 'samples': 1621440, 'steps': 8444, 'loss/train': 1.505518913269043} -11/06/2021 22:25:35 - INFO - __main__ - Step 8446: {'lr': 0.0004976640975807969, 'samples': 1621632, 'steps': 8445, 'loss/train': 1.532829761505127} -11/06/2021 22:25:35 - INFO - __main__ - Step 8447: {'lr': 0.0004976633737831921, 'samples': 1621824, 'steps': 8446, 'loss/train': 1.6985620260238647} -11/06/2021 22:25:35 - INFO - __main__ - Step 8448: {'lr': 0.000497662649873994, 'samples': 1622016, 'steps': 8447, 'loss/train': 1.2889354228973389} -11/06/2021 22:25:36 - INFO - __main__ - Step 8449: {'lr': 0.0004976619258532029, 'samples': 1622208, 'steps': 8448, 'loss/train': 1.8851784467697144} -11/06/2021 22:25:37 - INFO - __main__ - Step 8450: {'lr': 0.0004976612017208191, 'samples': 1622400, 'steps': 8449, 'loss/train': 2.305765151977539} -11/06/2021 22:25:37 - INFO - __main__ - Step 8451: {'lr': 0.000497660477476843, 'samples': 1622592, 'steps': 8450, 'loss/train': 1.9551142454147339} -11/06/2021 22:25:37 - INFO - __main__ - Step 8452: {'lr': 0.000497659753121275, 'samples': 1622784, 'steps': 8451, 'loss/train': 2.0676944255828857} -11/06/2021 22:25:38 - INFO - __main__ - Step 8453: {'lr': 0.0004976590286541152, 'samples': 1622976, 'steps': 8452, 'loss/train': 1.929355502128601} -11/06/2021 22:25:38 - INFO - __main__ - Step 8454: {'lr': 0.0004976583040753643, 'samples': 1623168, 'steps': 8453, 'loss/train': 1.959873080253601} -11/06/2021 22:25:39 - INFO - __main__ - Step 8455: {'lr': 0.0004976575793850223, 'samples': 1623360, 'steps': 8454, 'loss/train': 1.7598445415496826} -11/06/2021 22:25:40 - INFO - __main__ - Step 8456: {'lr': 0.0004976568545830894, 'samples': 1623552, 'steps': 8455, 'loss/train': 1.6411019563674927} -11/06/2021 22:25:40 - INFO - __main__ - Step 8457: {'lr': 0.0004976561296695663, 'samples': 1623744, 'steps': 8456, 'loss/train': 1.8063533306121826} -11/06/2021 22:25:40 - INFO - __main__ - Step 8458: {'lr': 0.0004976554046444532, 'samples': 1623936, 'steps': 8457, 'loss/train': 1.4065788984298706} -11/06/2021 22:25:41 - INFO - __main__ - Step 8459: {'lr': 0.0004976546795077503, 'samples': 1624128, 'steps': 8458, 'loss/train': 2.1664505004882812} -11/06/2021 22:25:42 - INFO - __main__ - Step 8460: {'lr': 0.0004976539542594582, 'samples': 1624320, 'steps': 8459, 'loss/train': 1.423108458518982} -11/06/2021 22:25:42 - INFO - __main__ - Step 8461: {'lr': 0.0004976532288995768, 'samples': 1624512, 'steps': 8460, 'loss/train': 1.727888822555542} -11/06/2021 22:25:42 - INFO - __main__ - Step 8462: {'lr': 0.0004976525034281069, 'samples': 1624704, 'steps': 8461, 'loss/train': 1.7131630182266235} -11/06/2021 22:25:43 - INFO - __main__ - Step 8463: {'lr': 0.0004976517778450486, 'samples': 1624896, 'steps': 8462, 'loss/train': 1.9994878768920898} -11/06/2021 22:25:43 - INFO - __main__ - Step 8464: {'lr': 0.000497651052150402, 'samples': 1625088, 'steps': 8463, 'loss/train': 1.3184614181518555} -11/06/2021 22:25:44 - INFO - __main__ - Step 8465: {'lr': 0.0004976503263441679, 'samples': 1625280, 'steps': 8464, 'loss/train': 1.885838270187378} -11/06/2021 22:25:44 - INFO - __main__ - Step 8466: {'lr': 0.0004976496004263463, 'samples': 1625472, 'steps': 8465, 'loss/train': 1.80532968044281} -11/06/2021 22:25:45 - INFO - __main__ - Step 8467: {'lr': 0.0004976488743969376, 'samples': 1625664, 'steps': 8466, 'loss/train': 1.5060994625091553} -11/06/2021 22:25:45 - INFO - __main__ - Step 8468: {'lr': 0.0004976481482559421, 'samples': 1625856, 'steps': 8467, 'loss/train': 1.5242974758148193} -11/06/2021 22:25:46 - INFO - __main__ - Step 8469: {'lr': 0.0004976474220033602, 'samples': 1626048, 'steps': 8468, 'loss/train': 1.838634729385376} -11/06/2021 22:25:46 - INFO - __main__ - Step 8470: {'lr': 0.0004976466956391922, 'samples': 1626240, 'steps': 8469, 'loss/train': 1.2237740755081177} -11/06/2021 22:25:47 - INFO - __main__ - Step 8471: {'lr': 0.0004976459691634384, 'samples': 1626432, 'steps': 8470, 'loss/train': 1.4460675716400146} -11/06/2021 22:25:47 - INFO - __main__ - Step 8472: {'lr': 0.0004976452425760992, 'samples': 1626624, 'steps': 8471, 'loss/train': 2.1150126457214355} -11/06/2021 22:25:48 - INFO - __main__ - Step 8473: {'lr': 0.0004976445158771748, 'samples': 1626816, 'steps': 8472, 'loss/train': 1.7219116687774658} -11/06/2021 22:25:48 - INFO - __main__ - Step 8474: {'lr': 0.0004976437890666657, 'samples': 1627008, 'steps': 8473, 'loss/train': 1.7514417171478271} -11/06/2021 22:25:48 - INFO - __main__ - Step 8475: {'lr': 0.0004976430621445721, 'samples': 1627200, 'steps': 8474, 'loss/train': 1.6506552696228027} -11/06/2021 22:25:50 - INFO - __main__ - Step 8476: {'lr': 0.0004976423351108943, 'samples': 1627392, 'steps': 8475, 'loss/train': 1.3242745399475098} -11/06/2021 22:25:50 - INFO - __main__ - Step 8477: {'lr': 0.0004976416079656328, 'samples': 1627584, 'steps': 8476, 'loss/train': 2.3073718547821045} -11/06/2021 22:25:50 - INFO - __main__ - Step 8478: {'lr': 0.0004976408807087876, 'samples': 1627776, 'steps': 8477, 'loss/train': 1.0934592485427856} -11/06/2021 22:25:51 - INFO - __main__ - Step 8479: {'lr': 0.0004976401533403594, 'samples': 1627968, 'steps': 8478, 'loss/train': 1.5833334922790527} -11/06/2021 22:25:51 - INFO - __main__ - Step 8480: {'lr': 0.0004976394258603484, 'samples': 1628160, 'steps': 8479, 'loss/train': 1.3912901878356934} -11/06/2021 22:25:52 - INFO - __main__ - Step 8481: {'lr': 0.0004976386982687549, 'samples': 1628352, 'steps': 8480, 'loss/train': 1.8894435167312622} -11/06/2021 22:25:52 - INFO - __main__ - Step 8482: {'lr': 0.0004976379705655791, 'samples': 1628544, 'steps': 8481, 'loss/train': 1.7393689155578613} -11/06/2021 22:25:53 - INFO - __main__ - Step 8483: {'lr': 0.0004976372427508215, 'samples': 1628736, 'steps': 8482, 'loss/train': 1.9663249254226685} -11/06/2021 22:25:53 - INFO - __main__ - Step 8484: {'lr': 0.0004976365148244824, 'samples': 1628928, 'steps': 8483, 'loss/train': 2.2855916023254395} -11/06/2021 22:25:53 - INFO - __main__ - Step 8485: {'lr': 0.0004976357867865621, 'samples': 1629120, 'steps': 8484, 'loss/train': 1.8762072324752808} -11/06/2021 22:25:54 - INFO - __main__ - Step 8486: {'lr': 0.0004976350586370609, 'samples': 1629312, 'steps': 8485, 'loss/train': 1.8550057411193848} -11/06/2021 22:25:55 - INFO - __main__ - Step 8487: {'lr': 0.0004976343303759792, 'samples': 1629504, 'steps': 8486, 'loss/train': 1.618645191192627} -11/06/2021 22:25:55 - INFO - __main__ - Step 8488: {'lr': 0.0004976336020033174, 'samples': 1629696, 'steps': 8487, 'loss/train': 1.672871470451355} -11/06/2021 22:25:55 - INFO - __main__ - Step 8489: {'lr': 0.0004976328735190755, 'samples': 1629888, 'steps': 8488, 'loss/train': 1.8050670623779297} -11/06/2021 22:25:56 - INFO - __main__ - Step 8490: {'lr': 0.0004976321449232542, 'samples': 1630080, 'steps': 8489, 'loss/train': 1.4703295230865479} -11/06/2021 22:25:56 - INFO - __main__ - Step 8491: {'lr': 0.0004976314162158536, 'samples': 1630272, 'steps': 8490, 'loss/train': 1.5319691896438599} -11/06/2021 22:25:57 - INFO - __main__ - Step 8492: {'lr': 0.0004976306873968741, 'samples': 1630464, 'steps': 8491, 'loss/train': 1.876915454864502} -11/06/2021 22:25:57 - INFO - __main__ - Step 8493: {'lr': 0.0004976299584663161, 'samples': 1630656, 'steps': 8492, 'loss/train': 1.787011981010437} -11/06/2021 22:25:58 - INFO - __main__ - Step 8494: {'lr': 0.0004976292294241798, 'samples': 1630848, 'steps': 8493, 'loss/train': 1.3954660892486572} -11/06/2021 22:25:58 - INFO - __main__ - Step 8495: {'lr': 0.0004976285002704656, 'samples': 1631040, 'steps': 8494, 'loss/train': 2.078723669052124} -11/06/2021 22:25:59 - INFO - __main__ - Step 8496: {'lr': 0.0004976277710051739, 'samples': 1631232, 'steps': 8495, 'loss/train': 2.3327043056488037} -11/06/2021 22:26:00 - INFO - __main__ - Step 8497: {'lr': 0.0004976270416283049, 'samples': 1631424, 'steps': 8496, 'loss/train': 1.9234745502471924} -11/06/2021 22:26:00 - INFO - __main__ - Step 8498: {'lr': 0.000497626312139859, 'samples': 1631616, 'steps': 8497, 'loss/train': 1.7845796346664429} -11/06/2021 22:26:00 - INFO - __main__ - Step 8499: {'lr': 0.0004976255825398365, 'samples': 1631808, 'steps': 8498, 'loss/train': 2.1495463848114014} -11/06/2021 22:26:01 - INFO - __main__ - Step 8500: {'lr': 0.0004976248528282376, 'samples': 1632000, 'steps': 8499, 'loss/train': 2.1509108543395996} -11/06/2021 22:26:01 - INFO - __main__ - Step 8501: {'lr': 0.000497624123005063, 'samples': 1632192, 'steps': 8500, 'loss/train': 1.78944993019104} -11/06/2021 22:26:02 - INFO - __main__ - Step 8502: {'lr': 0.0004976233930703126, 'samples': 1632384, 'steps': 8501, 'loss/train': 1.7581290006637573} -11/06/2021 22:26:02 - INFO - __main__ - Step 8503: {'lr': 0.000497622663023987, 'samples': 1632576, 'steps': 8502, 'loss/train': 1.6255358457565308} -11/06/2021 22:26:03 - INFO - __main__ - Step 8504: {'lr': 0.0004976219328660864, 'samples': 1632768, 'steps': 8503, 'loss/train': 1.977895975112915} -11/06/2021 22:26:03 - INFO - __main__ - Step 8505: {'lr': 0.0004976212025966112, 'samples': 1632960, 'steps': 8504, 'loss/train': 3.297560453414917} -11/06/2021 22:26:03 - INFO - __main__ - Step 8506: {'lr': 0.0004976204722155617, 'samples': 1633152, 'steps': 8505, 'loss/train': 1.7833354473114014} -11/06/2021 22:26:05 - INFO - __main__ - Step 8507: {'lr': 0.0004976197417229383, 'samples': 1633344, 'steps': 8506, 'loss/train': 1.4364817142486572} -11/06/2021 22:26:05 - INFO - __main__ - Step 8508: {'lr': 0.0004976190111187412, 'samples': 1633536, 'steps': 8507, 'loss/train': 2.1614036560058594} -11/06/2021 22:26:05 - INFO - __main__ - Step 8509: {'lr': 0.0004976182804029708, 'samples': 1633728, 'steps': 8508, 'loss/train': 1.8485922813415527} -11/06/2021 22:26:06 - INFO - __main__ - Step 8510: {'lr': 0.0004976175495756274, 'samples': 1633920, 'steps': 8509, 'loss/train': 1.9994100332260132} -11/06/2021 22:26:06 - INFO - __main__ - Step 8511: {'lr': 0.0004976168186367115, 'samples': 1634112, 'steps': 8510, 'loss/train': 1.4582551717758179} -11/06/2021 22:26:07 - INFO - __main__ - Step 8512: {'lr': 0.0004976160875862231, 'samples': 1634304, 'steps': 8511, 'loss/train': 1.6600501537322998} -11/06/2021 22:26:07 - INFO - __main__ - Step 8513: {'lr': 0.0004976153564241628, 'samples': 1634496, 'steps': 8512, 'loss/train': 1.6046333312988281} -11/06/2021 22:26:08 - INFO - __main__ - Step 8514: {'lr': 0.0004976146251505309, 'samples': 1634688, 'steps': 8513, 'loss/train': 2.3201334476470947} -11/06/2021 22:26:08 - INFO - __main__ - Step 8515: {'lr': 0.0004976138937653275, 'samples': 1634880, 'steps': 8514, 'loss/train': 1.6256712675094604} -11/06/2021 22:26:08 - INFO - __main__ - Step 8516: {'lr': 0.0004976131622685532, 'samples': 1635072, 'steps': 8515, 'loss/train': 1.8171868324279785} -11/06/2021 22:26:09 - INFO - __main__ - Step 8517: {'lr': 0.0004976124306602083, 'samples': 1635264, 'steps': 8516, 'loss/train': 1.7854278087615967} -11/06/2021 22:26:10 - INFO - __main__ - Step 8518: {'lr': 0.0004976116989402929, 'samples': 1635456, 'steps': 8517, 'loss/train': 1.7013543844223022} -11/06/2021 22:26:10 - INFO - __main__ - Step 8519: {'lr': 0.0004976109671088076, 'samples': 1635648, 'steps': 8518, 'loss/train': 1.9890172481536865} -11/06/2021 22:26:10 - INFO - __main__ - Step 8520: {'lr': 0.0004976102351657526, 'samples': 1635840, 'steps': 8519, 'loss/train': 1.8006373643875122} -11/06/2021 22:26:11 - INFO - __main__ - Step 8521: {'lr': 0.0004976095031111283, 'samples': 1636032, 'steps': 8520, 'loss/train': 1.9364084005355835} -11/06/2021 22:26:11 - INFO - __main__ - Step 8522: {'lr': 0.0004976087709449348, 'samples': 1636224, 'steps': 8521, 'loss/train': 1.6207133531570435} -11/06/2021 22:26:12 - INFO - __main__ - Step 8523: {'lr': 0.0004976080386671728, 'samples': 1636416, 'steps': 8522, 'loss/train': 2.250715732574463} -11/06/2021 22:26:13 - INFO - __main__ - Step 8524: {'lr': 0.0004976073062778423, 'samples': 1636608, 'steps': 8523, 'loss/train': 1.8443859815597534} -11/06/2021 22:26:13 - INFO - __main__ - Step 8525: {'lr': 0.0004976065737769439, 'samples': 1636800, 'steps': 8524, 'loss/train': 0.9607848525047302} -11/06/2021 22:26:13 - INFO - __main__ - Step 8526: {'lr': 0.0004976058411644777, 'samples': 1636992, 'steps': 8525, 'loss/train': 1.7340941429138184} -11/06/2021 22:26:14 - INFO - __main__ - Step 8527: {'lr': 0.0004976051084404443, 'samples': 1637184, 'steps': 8526, 'loss/train': 2.0823657512664795} -11/06/2021 22:26:15 - INFO - __main__ - Step 8528: {'lr': 0.0004976043756048436, 'samples': 1637376, 'steps': 8527, 'loss/train': 1.8343414068222046} -11/06/2021 22:26:15 - INFO - __main__ - Step 8529: {'lr': 0.0004976036426576763, 'samples': 1637568, 'steps': 8528, 'loss/train': 2.1914784908294678} -11/06/2021 22:26:15 - INFO - __main__ - Step 8530: {'lr': 0.0004976029095989427, 'samples': 1637760, 'steps': 8529, 'loss/train': 3.2090442180633545} -11/06/2021 22:26:16 - INFO - __main__ - Step 8531: {'lr': 0.000497602176428643, 'samples': 1637952, 'steps': 8530, 'loss/train': 2.355168342590332} -11/06/2021 22:26:16 - INFO - __main__ - Step 8532: {'lr': 0.0004976014431467775, 'samples': 1638144, 'steps': 8531, 'loss/train': 1.1861897706985474} -11/06/2021 22:26:17 - INFO - __main__ - Step 8533: {'lr': 0.0004976007097533467, 'samples': 1638336, 'steps': 8532, 'loss/train': 2.105987071990967} -11/06/2021 22:26:17 - INFO - __main__ - Step 8534: {'lr': 0.0004975999762483509, 'samples': 1638528, 'steps': 8533, 'loss/train': 1.797425389289856} -11/06/2021 22:26:18 - INFO - __main__ - Step 8535: {'lr': 0.0004975992426317902, 'samples': 1638720, 'steps': 8534, 'loss/train': 1.2677090167999268} -11/06/2021 22:26:18 - INFO - __main__ - Step 8536: {'lr': 0.0004975985089036652, 'samples': 1638912, 'steps': 8535, 'loss/train': 1.7440499067306519} -11/06/2021 22:26:18 - INFO - __main__ - Step 8537: {'lr': 0.0004975977750639761, 'samples': 1639104, 'steps': 8536, 'loss/train': 3.189857244491577} -11/06/2021 22:26:19 - INFO - __main__ - Step 8538: {'lr': 0.0004975970411127233, 'samples': 1639296, 'steps': 8537, 'loss/train': 1.8964868783950806} -11/06/2021 22:26:20 - INFO - __main__ - Step 8539: {'lr': 0.0004975963070499071, 'samples': 1639488, 'steps': 8538, 'loss/train': 2.1125876903533936} -11/06/2021 22:26:20 - INFO - __main__ - Step 8540: {'lr': 0.0004975955728755277, 'samples': 1639680, 'steps': 8539, 'loss/train': 1.6929922103881836} -11/06/2021 22:26:21 - INFO - __main__ - Step 8541: {'lr': 0.0004975948385895858, 'samples': 1639872, 'steps': 8540, 'loss/train': 1.6374714374542236} -11/06/2021 22:26:21 - INFO - __main__ - Step 8542: {'lr': 0.0004975941041920813, 'samples': 1640064, 'steps': 8541, 'loss/train': 2.006967067718506} -11/06/2021 22:26:22 - INFO - __main__ - Step 8543: {'lr': 0.0004975933696830147, 'samples': 1640256, 'steps': 8542, 'loss/train': 1.9213240146636963} -11/06/2021 22:26:22 - INFO - __main__ - Step 8544: {'lr': 0.0004975926350623864, 'samples': 1640448, 'steps': 8543, 'loss/train': 2.296802043914795} -11/06/2021 22:26:23 - INFO - __main__ - Step 8545: {'lr': 0.0004975919003301967, 'samples': 1640640, 'steps': 8544, 'loss/train': 1.7071173191070557} -11/06/2021 22:26:23 - INFO - __main__ - Step 8546: {'lr': 0.0004975911654864459, 'samples': 1640832, 'steps': 8545, 'loss/train': 2.5078957080841064} -11/06/2021 22:26:23 - INFO - __main__ - Step 8547: {'lr': 0.0004975904305311344, 'samples': 1641024, 'steps': 8546, 'loss/train': 2.413429021835327} -11/06/2021 22:26:25 - INFO - __main__ - Step 8548: {'lr': 0.0004975896954642623, 'samples': 1641216, 'steps': 8547, 'loss/train': 1.545986294746399} -11/06/2021 22:26:25 - INFO - __main__ - Step 8549: {'lr': 0.0004975889602858303, 'samples': 1641408, 'steps': 8548, 'loss/train': 1.858424425125122} -11/06/2021 22:26:26 - INFO - __main__ - Step 8550: {'lr': 0.0004975882249958385, 'samples': 1641600, 'steps': 8549, 'loss/train': 2.576998472213745} -11/06/2021 22:26:26 - INFO - __main__ - Step 8551: {'lr': 0.0004975874895942872, 'samples': 1641792, 'steps': 8550, 'loss/train': 1.2816332578659058} -11/06/2021 22:26:26 - INFO - __main__ - Step 8552: {'lr': 0.0004975867540811768, 'samples': 1641984, 'steps': 8551, 'loss/train': 1.6916189193725586} -11/06/2021 22:26:27 - INFO - __main__ - Step 8553: {'lr': 0.0004975860184565076, 'samples': 1642176, 'steps': 8552, 'loss/train': 1.8677070140838623} -11/06/2021 22:26:27 - INFO - __main__ - Step 8554: {'lr': 0.0004975852827202801, 'samples': 1642368, 'steps': 8553, 'loss/train': 1.7044568061828613} -11/06/2021 22:26:28 - INFO - __main__ - Step 8555: {'lr': 0.0004975845468724944, 'samples': 1642560, 'steps': 8554, 'loss/train': 1.236737847328186} -11/06/2021 22:26:29 - INFO - __main__ - Step 8556: {'lr': 0.0004975838109131509, 'samples': 1642752, 'steps': 8555, 'loss/train': 1.6801140308380127} -11/06/2021 22:26:29 - INFO - __main__ - Step 8557: {'lr': 0.0004975830748422499, 'samples': 1642944, 'steps': 8556, 'loss/train': 1.9419505596160889} -11/06/2021 22:26:29 - INFO - __main__ - Step 8558: {'lr': 0.0004975823386597918, 'samples': 1643136, 'steps': 8557, 'loss/train': 1.7988413572311401} -11/06/2021 22:26:30 - INFO - __main__ - Step 8559: {'lr': 0.000497581602365777, 'samples': 1643328, 'steps': 8558, 'loss/train': 2.347743511199951} -11/06/2021 22:26:30 - INFO - __main__ - Step 8560: {'lr': 0.0004975808659602058, 'samples': 1643520, 'steps': 8559, 'loss/train': 1.103050947189331} -11/06/2021 22:26:31 - INFO - __main__ - Step 8561: {'lr': 0.0004975801294430784, 'samples': 1643712, 'steps': 8560, 'loss/train': 2.005465030670166} -11/06/2021 22:26:31 - INFO - __main__ - Step 8562: {'lr': 0.0004975793928143952, 'samples': 1643904, 'steps': 8561, 'loss/train': 1.6958545446395874} -11/06/2021 22:26:32 - INFO - __main__ - Step 8563: {'lr': 0.0004975786560741566, 'samples': 1644096, 'steps': 8562, 'loss/train': 1.6469171047210693} -11/06/2021 22:26:32 - INFO - __main__ - Step 8564: {'lr': 0.0004975779192223629, 'samples': 1644288, 'steps': 8563, 'loss/train': 1.7488797903060913} -11/06/2021 22:26:32 - INFO - __main__ - Step 8565: {'lr': 0.0004975771822590143, 'samples': 1644480, 'steps': 8564, 'loss/train': 1.531661868095398} -11/06/2021 22:26:33 - INFO - __main__ - Step 8566: {'lr': 0.0004975764451841114, 'samples': 1644672, 'steps': 8565, 'loss/train': 1.9583240747451782} -11/06/2021 22:26:34 - INFO - __main__ - Step 8567: {'lr': 0.0004975757079976542, 'samples': 1644864, 'steps': 8566, 'loss/train': 2.6760129928588867} -11/06/2021 22:26:34 - INFO - __main__ - Step 8568: {'lr': 0.0004975749706996433, 'samples': 1645056, 'steps': 8567, 'loss/train': 1.9086993932724} -11/06/2021 22:26:34 - INFO - __main__ - Step 8569: {'lr': 0.0004975742332900789, 'samples': 1645248, 'steps': 8568, 'loss/train': 1.3222005367279053} -11/06/2021 22:26:35 - INFO - __main__ - Step 8570: {'lr': 0.0004975734957689614, 'samples': 1645440, 'steps': 8569, 'loss/train': 2.3594229221343994} -11/06/2021 22:26:36 - INFO - __main__ - Step 8571: {'lr': 0.0004975727581362911, 'samples': 1645632, 'steps': 8570, 'loss/train': 1.3136167526245117} -11/06/2021 22:26:36 - INFO - __main__ - Step 8572: {'lr': 0.0004975720203920683, 'samples': 1645824, 'steps': 8571, 'loss/train': 2.3485770225524902} -11/06/2021 22:26:36 - INFO - __main__ - Step 8573: {'lr': 0.0004975712825362934, 'samples': 1646016, 'steps': 8572, 'loss/train': 2.9186878204345703} -11/06/2021 22:26:37 - INFO - __main__ - Step 8574: {'lr': 0.0004975705445689668, 'samples': 1646208, 'steps': 8573, 'loss/train': 1.8523027896881104} -11/06/2021 22:26:37 - INFO - __main__ - Step 8575: {'lr': 0.0004975698064900886, 'samples': 1646400, 'steps': 8574, 'loss/train': 2.420170783996582} -11/06/2021 22:26:38 - INFO - __main__ - Step 8576: {'lr': 0.0004975690682996592, 'samples': 1646592, 'steps': 8575, 'loss/train': 1.9467846155166626} -11/06/2021 22:26:38 - INFO - __main__ - Step 8577: {'lr': 0.0004975683299976791, 'samples': 1646784, 'steps': 8576, 'loss/train': 1.946389079093933} -11/06/2021 22:26:39 - INFO - __main__ - Step 8578: {'lr': 0.0004975675915841485, 'samples': 1646976, 'steps': 8577, 'loss/train': 2.061795711517334} -11/06/2021 22:26:39 - INFO - __main__ - Step 8579: {'lr': 0.0004975668530590679, 'samples': 1647168, 'steps': 8578, 'loss/train': 2.067392110824585} -11/06/2021 22:26:40 - INFO - __main__ - Step 8580: {'lr': 0.0004975661144224374, 'samples': 1647360, 'steps': 8579, 'loss/train': 2.0112924575805664} -11/06/2021 22:26:41 - INFO - __main__ - Step 8581: {'lr': 0.0004975653756742574, 'samples': 1647552, 'steps': 8580, 'loss/train': 1.770460605621338} -11/06/2021 22:26:42 - INFO - __main__ - Step 8582: {'lr': 0.0004975646368145282, 'samples': 1647744, 'steps': 8581, 'loss/train': 2.0862138271331787} -11/06/2021 22:26:42 - INFO - __main__ - Step 8583: {'lr': 0.0004975638978432503, 'samples': 1647936, 'steps': 8582, 'loss/train': 1.6407994031906128} -11/06/2021 22:26:42 - INFO - __main__ - Step 8584: {'lr': 0.0004975631587604239, 'samples': 1648128, 'steps': 8583, 'loss/train': 1.8305928707122803} -11/06/2021 22:26:43 - INFO - __main__ - Step 8585: {'lr': 0.0004975624195660494, 'samples': 1648320, 'steps': 8584, 'loss/train': 1.8244094848632812} -11/06/2021 22:26:43 - INFO - __main__ - Step 8586: {'lr': 0.0004975616802601271, 'samples': 1648512, 'steps': 8585, 'loss/train': 1.8164951801300049} -11/06/2021 22:26:44 - INFO - __main__ - Step 8587: {'lr': 0.0004975609408426572, 'samples': 1648704, 'steps': 8586, 'loss/train': 1.84238600730896} -11/06/2021 22:26:45 - INFO - __main__ - Step 8588: {'lr': 0.0004975602013136403, 'samples': 1648896, 'steps': 8587, 'loss/train': 1.9760645627975464} -11/06/2021 22:26:45 - INFO - __main__ - Step 8589: {'lr': 0.0004975594616730766, 'samples': 1649088, 'steps': 8588, 'loss/train': 1.6991413831710815} -11/06/2021 22:26:45 - INFO - __main__ - Step 8590: {'lr': 0.0004975587219209663, 'samples': 1649280, 'steps': 8589, 'loss/train': 1.3211325407028198} -11/06/2021 22:26:46 - INFO - __main__ - Step 8591: {'lr': 0.0004975579820573099, 'samples': 1649472, 'steps': 8590, 'loss/train': 1.5335558652877808} -11/06/2021 22:26:46 - INFO - __main__ - Step 8592: {'lr': 0.0004975572420821078, 'samples': 1649664, 'steps': 8591, 'loss/train': 1.8905811309814453} -11/06/2021 22:26:47 - INFO - __main__ - Step 8593: {'lr': 0.0004975565019953601, 'samples': 1649856, 'steps': 8592, 'loss/train': 1.5297328233718872} -11/06/2021 22:26:47 - INFO - __main__ - Step 8594: {'lr': 0.0004975557617970673, 'samples': 1650048, 'steps': 8593, 'loss/train': 1.714114785194397} -11/06/2021 22:26:48 - INFO - __main__ - Step 8595: {'lr': 0.0004975550214872296, 'samples': 1650240, 'steps': 8594, 'loss/train': 1.8319971561431885} -11/06/2021 22:26:48 - INFO - __main__ - Step 8596: {'lr': 0.0004975542810658476, 'samples': 1650432, 'steps': 8595, 'loss/train': 1.850310206413269} -11/06/2021 22:26:48 - INFO - __main__ - Step 8597: {'lr': 0.0004975535405329213, 'samples': 1650624, 'steps': 8596, 'loss/train': 1.9651538133621216} -11/06/2021 22:26:49 - INFO - __main__ - Step 8598: {'lr': 0.0004975527998884513, 'samples': 1650816, 'steps': 8597, 'loss/train': 1.1798516511917114} -11/06/2021 22:26:50 - INFO - __main__ - Step 8599: {'lr': 0.0004975520591324378, 'samples': 1651008, 'steps': 8598, 'loss/train': 1.6260879039764404} -11/06/2021 22:26:51 - INFO - __main__ - Step 8600: {'lr': 0.0004975513182648812, 'samples': 1651200, 'steps': 8599, 'loss/train': 1.9237269163131714} -11/06/2021 22:26:51 - INFO - __main__ - Step 8601: {'lr': 0.0004975505772857818, 'samples': 1651392, 'steps': 8600, 'loss/train': 1.373760461807251} -11/06/2021 22:26:51 - INFO - __main__ - Step 8602: {'lr': 0.0004975498361951398, 'samples': 1651584, 'steps': 8601, 'loss/train': 1.5592304468154907} -11/06/2021 22:26:52 - INFO - __main__ - Step 8603: {'lr': 0.0004975490949929558, 'samples': 1651776, 'steps': 8602, 'loss/train': 1.782822608947754} -11/06/2021 22:26:53 - INFO - __main__ - Step 8604: {'lr': 0.00049754835367923, 'samples': 1651968, 'steps': 8603, 'loss/train': 1.2513318061828613} -11/06/2021 22:26:53 - INFO - __main__ - Step 8605: {'lr': 0.0004975476122539627, 'samples': 1652160, 'steps': 8604, 'loss/train': 1.4960685968399048} -11/06/2021 22:26:53 - INFO - __main__ - Step 8606: {'lr': 0.0004975468707171542, 'samples': 1652352, 'steps': 8605, 'loss/train': 1.4390000104904175} -11/06/2021 22:26:54 - INFO - __main__ - Step 8607: {'lr': 0.000497546129068805, 'samples': 1652544, 'steps': 8606, 'loss/train': 1.4670497179031372} -11/06/2021 22:26:54 - INFO - __main__ - Step 8608: {'lr': 0.0004975453873089153, 'samples': 1652736, 'steps': 8607, 'loss/train': 2.2388570308685303} -11/06/2021 22:26:55 - INFO - __main__ - Step 8609: {'lr': 0.0004975446454374854, 'samples': 1652928, 'steps': 8608, 'loss/train': 1.8201464414596558} -11/06/2021 22:26:55 - INFO - __main__ - Step 8610: {'lr': 0.0004975439034545158, 'samples': 1653120, 'steps': 8609, 'loss/train': 1.0466943979263306} -11/06/2021 22:26:56 - INFO - __main__ - Step 8611: {'lr': 0.0004975431613600067, 'samples': 1653312, 'steps': 8610, 'loss/train': 1.8127079010009766} -11/06/2021 22:26:56 - INFO - __main__ - Step 8612: {'lr': 0.0004975424191539585, 'samples': 1653504, 'steps': 8611, 'loss/train': 1.8894764184951782} -11/06/2021 22:26:57 - INFO - __main__ - Step 8613: {'lr': 0.0004975416768363715, 'samples': 1653696, 'steps': 8612, 'loss/train': 1.5986841917037964} -11/06/2021 22:26:57 - INFO - __main__ - Step 8614: {'lr': 0.0004975409344072459, 'samples': 1653888, 'steps': 8613, 'loss/train': 1.9542250633239746} -11/06/2021 22:26:58 - INFO - __main__ - Step 8615: {'lr': 0.0004975401918665823, 'samples': 1654080, 'steps': 8614, 'loss/train': 1.8345215320587158} -11/06/2021 22:26:58 - INFO - __main__ - Step 8616: {'lr': 0.0004975394492143808, 'samples': 1654272, 'steps': 8615, 'loss/train': 2.525263547897339} -11/06/2021 22:26:59 - INFO - __main__ - Step 8617: {'lr': 0.0004975387064506421, 'samples': 1654464, 'steps': 8616, 'loss/train': 1.956400752067566} -11/06/2021 22:26:59 - INFO - __main__ - Step 8618: {'lr': 0.000497537963575366, 'samples': 1654656, 'steps': 8617, 'loss/train': 1.734102725982666} -11/06/2021 22:26:59 - INFO - __main__ - Step 8619: {'lr': 0.0004975372205885533, 'samples': 1654848, 'steps': 8618, 'loss/train': 1.9009313583374023} -11/06/2021 22:27:00 - INFO - __main__ - Step 8620: {'lr': 0.0004975364774902041, 'samples': 1655040, 'steps': 8619, 'loss/train': 2.392646551132202} -11/06/2021 22:27:01 - INFO - __main__ - Step 8621: {'lr': 0.0004975357342803187, 'samples': 1655232, 'steps': 8620, 'loss/train': 1.483763575553894} -11/06/2021 22:27:01 - INFO - __main__ - Step 8622: {'lr': 0.0004975349909588976, 'samples': 1655424, 'steps': 8621, 'loss/train': 1.836098313331604} -11/06/2021 22:27:02 - INFO - __main__ - Step 8623: {'lr': 0.000497534247525941, 'samples': 1655616, 'steps': 8622, 'loss/train': 1.932421326637268} -11/06/2021 22:27:02 - INFO - __main__ - Step 8624: {'lr': 0.0004975335039814493, 'samples': 1655808, 'steps': 8623, 'loss/train': 1.0708638429641724} -11/06/2021 22:27:03 - INFO - __main__ - Step 8625: {'lr': 0.0004975327603254229, 'samples': 1656000, 'steps': 8624, 'loss/train': 1.1579554080963135} -11/06/2021 22:27:03 - INFO - __main__ - Step 8626: {'lr': 0.000497532016557862, 'samples': 1656192, 'steps': 8625, 'loss/train': 1.4248061180114746} -11/06/2021 22:27:04 - INFO - __main__ - Step 8627: {'lr': 0.0004975312726787671, 'samples': 1656384, 'steps': 8626, 'loss/train': 2.444399833679199} -11/06/2021 22:27:04 - INFO - __main__ - Step 8628: {'lr': 0.0004975305286881383, 'samples': 1656576, 'steps': 8627, 'loss/train': 1.7895426750183105} -11/06/2021 22:27:04 - INFO - __main__ - Step 8629: {'lr': 0.0004975297845859761, 'samples': 1656768, 'steps': 8628, 'loss/train': 1.8516370058059692} -11/06/2021 22:27:05 - INFO - __main__ - Step 8630: {'lr': 0.0004975290403722807, 'samples': 1656960, 'steps': 8629, 'loss/train': 1.1760151386260986} -11/06/2021 22:27:06 - INFO - __main__ - Step 8631: {'lr': 0.0004975282960470527, 'samples': 1657152, 'steps': 8630, 'loss/train': 0.9543409943580627} -11/06/2021 22:27:06 - INFO - __main__ - Step 8632: {'lr': 0.0004975275516102922, 'samples': 1657344, 'steps': 8631, 'loss/train': 1.7859746217727661} -11/06/2021 22:27:06 - INFO - __main__ - Step 8633: {'lr': 0.0004975268070619996, 'samples': 1657536, 'steps': 8632, 'loss/train': 1.8400938510894775} -11/06/2021 22:27:07 - INFO - __main__ - Step 8634: {'lr': 0.0004975260624021752, 'samples': 1657728, 'steps': 8633, 'loss/train': 1.3847429752349854} -11/06/2021 22:27:07 - INFO - __main__ - Step 8635: {'lr': 0.0004975253176308194, 'samples': 1657920, 'steps': 8634, 'loss/train': 1.8140875101089478} -11/06/2021 22:27:08 - INFO - __main__ - Step 8636: {'lr': 0.0004975245727479325, 'samples': 1658112, 'steps': 8635, 'loss/train': 1.8529094457626343} -11/06/2021 22:27:09 - INFO - __main__ - Step 8637: {'lr': 0.0004975238277535149, 'samples': 1658304, 'steps': 8636, 'loss/train': 1.9702752828598022} -11/06/2021 22:27:09 - INFO - __main__ - Step 8638: {'lr': 0.0004975230826475669, 'samples': 1658496, 'steps': 8637, 'loss/train': 1.9060972929000854} -11/06/2021 22:27:09 - INFO - __main__ - Step 8639: {'lr': 0.0004975223374300887, 'samples': 1658688, 'steps': 8638, 'loss/train': 2.0410006046295166} -11/06/2021 22:27:10 - INFO - __main__ - Step 8640: {'lr': 0.0004975215921010808, 'samples': 1658880, 'steps': 8639, 'loss/train': 1.9541411399841309} -11/06/2021 22:27:11 - INFO - __main__ - Step 8641: {'lr': 0.0004975208466605435, 'samples': 1659072, 'steps': 8640, 'loss/train': 1.7635051012039185} -11/06/2021 22:27:12 - INFO - __main__ - Step 8642: {'lr': 0.0004975201011084773, 'samples': 1659264, 'steps': 8641, 'loss/train': 1.650898814201355} -11/06/2021 22:27:12 - INFO - __main__ - Step 8643: {'lr': 0.0004975193554448821, 'samples': 1659456, 'steps': 8642, 'loss/train': 1.8950550556182861} -11/06/2021 22:27:12 - INFO - __main__ - Step 8644: {'lr': 0.0004975186096697585, 'samples': 1659648, 'steps': 8643, 'loss/train': 2.5472521781921387} -11/06/2021 22:27:13 - INFO - __main__ - Step 8645: {'lr': 0.000497517863783107, 'samples': 1659840, 'steps': 8644, 'loss/train': 1.438095211982727} -11/06/2021 22:27:13 - INFO - __main__ - Step 8646: {'lr': 0.0004975171177849277, 'samples': 1660032, 'steps': 8645, 'loss/train': 2.031336545944214} -11/06/2021 22:27:14 - INFO - __main__ - Step 8647: {'lr': 0.000497516371675221, 'samples': 1660224, 'steps': 8646, 'loss/train': 2.2316641807556152} -11/06/2021 22:27:15 - INFO - __main__ - Step 8648: {'lr': 0.0004975156254539873, 'samples': 1660416, 'steps': 8647, 'loss/train': 2.0939579010009766} -11/06/2021 22:27:15 - INFO - __main__ - Step 8649: {'lr': 0.0004975148791212269, 'samples': 1660608, 'steps': 8648, 'loss/train': 1.8442882299423218} -11/06/2021 22:27:15 - INFO - __main__ - Step 8650: {'lr': 0.00049751413267694, 'samples': 1660800, 'steps': 8649, 'loss/train': 2.065793752670288} -11/06/2021 22:27:16 - INFO - __main__ - Step 8651: {'lr': 0.000497513386121127, 'samples': 1660992, 'steps': 8650, 'loss/train': 1.510509729385376} -11/06/2021 22:27:17 - INFO - __main__ - Step 8652: {'lr': 0.0004975126394537884, 'samples': 1661184, 'steps': 8651, 'loss/train': 1.9904800653457642} -11/06/2021 22:27:17 - INFO - __main__ - Step 8653: {'lr': 0.0004975118926749245, 'samples': 1661376, 'steps': 8652, 'loss/train': 2.4816510677337646} -11/06/2021 22:27:17 - INFO - __main__ - Step 8654: {'lr': 0.0004975111457845354, 'samples': 1661568, 'steps': 8653, 'loss/train': 1.7848095893859863} -11/06/2021 22:27:18 - INFO - __main__ - Step 8655: {'lr': 0.0004975103987826217, 'samples': 1661760, 'steps': 8654, 'loss/train': 1.5138027667999268} -11/06/2021 22:27:18 - INFO - __main__ - Step 8656: {'lr': 0.0004975096516691836, 'samples': 1661952, 'steps': 8655, 'loss/train': 2.094496965408325} -11/06/2021 22:27:19 - INFO - __main__ - Step 8657: {'lr': 0.0004975089044442215, 'samples': 1662144, 'steps': 8656, 'loss/train': 2.499422073364258} -11/06/2021 22:27:19 - INFO - __main__ - Step 8658: {'lr': 0.0004975081571077357, 'samples': 1662336, 'steps': 8657, 'loss/train': 2.3265016078948975} -11/06/2021 22:27:20 - INFO - __main__ - Step 8659: {'lr': 0.0004975074096597265, 'samples': 1662528, 'steps': 8658, 'loss/train': 1.801966905593872} -11/06/2021 22:27:20 - INFO - __main__ - Step 8660: {'lr': 0.0004975066621001943, 'samples': 1662720, 'steps': 8659, 'loss/train': 1.1997767686843872} -11/06/2021 22:27:20 - INFO - __main__ - Step 8661: {'lr': 0.0004975059144291394, 'samples': 1662912, 'steps': 8660, 'loss/train': 1.4698797464370728} -11/06/2021 22:27:21 - INFO - __main__ - Step 8662: {'lr': 0.0004975051666465622, 'samples': 1663104, 'steps': 8661, 'loss/train': 2.032155990600586} -11/06/2021 22:27:22 - INFO - __main__ - Step 8663: {'lr': 0.0004975044187524629, 'samples': 1663296, 'steps': 8662, 'loss/train': 1.661537766456604} -11/06/2021 22:27:22 - INFO - __main__ - Step 8664: {'lr': 0.000497503670746842, 'samples': 1663488, 'steps': 8663, 'loss/train': 1.3858249187469482} -11/06/2021 22:27:23 - INFO - __main__ - Step 8665: {'lr': 0.0004975029226296998, 'samples': 1663680, 'steps': 8664, 'loss/train': 2.2269275188446045} -11/06/2021 22:27:23 - INFO - __main__ - Step 8666: {'lr': 0.0004975021744010365, 'samples': 1663872, 'steps': 8665, 'loss/train': 2.003019332885742} -11/06/2021 22:27:23 - INFO - __main__ - Step 8667: {'lr': 0.0004975014260608527, 'samples': 1664064, 'steps': 8666, 'loss/train': 1.5768145322799683} -11/06/2021 22:27:24 - INFO - __main__ - Step 8668: {'lr': 0.0004975006776091484, 'samples': 1664256, 'steps': 8667, 'loss/train': 1.9532525539398193} -11/06/2021 22:27:25 - INFO - __main__ - Step 8669: {'lr': 0.0004974999290459243, 'samples': 1664448, 'steps': 8668, 'loss/train': 1.587928295135498} -11/06/2021 22:27:25 - INFO - __main__ - Step 8670: {'lr': 0.0004974991803711803, 'samples': 1664640, 'steps': 8669, 'loss/train': 1.7508021593093872} -11/06/2021 22:27:25 - INFO - __main__ - Step 8671: {'lr': 0.0004974984315849172, 'samples': 1664832, 'steps': 8670, 'loss/train': 1.5539518594741821} -11/06/2021 22:27:26 - INFO - __main__ - Step 8672: {'lr': 0.000497497682687135, 'samples': 1665024, 'steps': 8671, 'loss/train': 1.5913190841674805} -11/06/2021 22:27:27 - INFO - __main__ - Step 8673: {'lr': 0.0004974969336778343, 'samples': 1665216, 'steps': 8672, 'loss/train': 1.3758063316345215} -11/06/2021 22:27:27 - INFO - __main__ - Step 8674: {'lr': 0.0004974961845570152, 'samples': 1665408, 'steps': 8673, 'loss/train': 1.925683856010437} -11/06/2021 22:27:27 - INFO - __main__ - Step 8675: {'lr': 0.0004974954353246781, 'samples': 1665600, 'steps': 8674, 'loss/train': 1.983332872390747} -11/06/2021 22:27:28 - INFO - __main__ - Step 8676: {'lr': 0.0004974946859808235, 'samples': 1665792, 'steps': 8675, 'loss/train': 1.5062406063079834} -11/06/2021 22:27:28 - INFO - __main__ - Step 8677: {'lr': 0.0004974939365254515, 'samples': 1665984, 'steps': 8676, 'loss/train': 1.4310129880905151} -11/06/2021 22:27:29 - INFO - __main__ - Step 8678: {'lr': 0.0004974931869585626, 'samples': 1666176, 'steps': 8677, 'loss/train': 1.1025075912475586} -11/06/2021 22:27:29 - INFO - __main__ - Step 8679: {'lr': 0.0004974924372801572, 'samples': 1666368, 'steps': 8678, 'loss/train': 1.5145713090896606} -11/06/2021 22:27:30 - INFO - __main__ - Step 8680: {'lr': 0.0004974916874902353, 'samples': 1666560, 'steps': 8679, 'loss/train': 1.819180965423584} -11/06/2021 22:27:30 - INFO - __main__ - Step 8681: {'lr': 0.0004974909375887976, 'samples': 1666752, 'steps': 8680, 'loss/train': 1.7356830835342407} -11/06/2021 22:27:31 - INFO - __main__ - Step 8682: {'lr': 0.0004974901875758444, 'samples': 1666944, 'steps': 8681, 'loss/train': 2.002690315246582} -11/06/2021 22:27:31 - INFO - __main__ - Step 8683: {'lr': 0.0004974894374513757, 'samples': 1667136, 'steps': 8682, 'loss/train': 2.2562174797058105} -11/06/2021 22:27:32 - INFO - __main__ - Step 8684: {'lr': 0.0004974886872153922, 'samples': 1667328, 'steps': 8683, 'loss/train': 1.799873948097229} -11/06/2021 22:27:32 - INFO - __main__ - Step 8685: {'lr': 0.0004974879368678942, 'samples': 1667520, 'steps': 8684, 'loss/train': 2.1796953678131104} -11/06/2021 22:27:32 - INFO - __main__ - Step 8686: {'lr': 0.0004974871864088818, 'samples': 1667712, 'steps': 8685, 'loss/train': 1.7284247875213623} -11/06/2021 22:27:33 - INFO - __main__ - Step 8687: {'lr': 0.0004974864358383555, 'samples': 1667904, 'steps': 8686, 'loss/train': 2.1161437034606934} -11/06/2021 22:27:34 - INFO - __main__ - Step 8688: {'lr': 0.0004974856851563158, 'samples': 1668096, 'steps': 8687, 'loss/train': 1.6163461208343506} -11/06/2021 22:27:34 - INFO - __main__ - Step 8689: {'lr': 0.0004974849343627628, 'samples': 1668288, 'steps': 8688, 'loss/train': 2.1865105628967285} -11/06/2021 22:27:35 - INFO - __main__ - Step 8690: {'lr': 0.0004974841834576968, 'samples': 1668480, 'steps': 8689, 'loss/train': 2.0201218128204346} -11/06/2021 22:27:35 - INFO - __main__ - Step 8691: {'lr': 0.0004974834324411183, 'samples': 1668672, 'steps': 8690, 'loss/train': 1.748487949371338} -11/06/2021 22:27:35 - INFO - __main__ - Step 8692: {'lr': 0.0004974826813130276, 'samples': 1668864, 'steps': 8691, 'loss/train': 1.8078097105026245} -11/06/2021 22:27:36 - INFO - __main__ - Step 8693: {'lr': 0.000497481930073425, 'samples': 1669056, 'steps': 8692, 'loss/train': 1.9291731119155884} -11/06/2021 22:27:37 - INFO - __main__ - Step 8694: {'lr': 0.000497481178722311, 'samples': 1669248, 'steps': 8693, 'loss/train': 1.6936627626419067} -11/06/2021 22:27:37 - INFO - __main__ - Step 8695: {'lr': 0.0004974804272596857, 'samples': 1669440, 'steps': 8694, 'loss/train': 1.6667145490646362} -11/06/2021 22:27:37 - INFO - __main__ - Step 8696: {'lr': 0.0004974796756855494, 'samples': 1669632, 'steps': 8695, 'loss/train': 1.6822011470794678} -11/06/2021 22:27:38 - INFO - __main__ - Step 8697: {'lr': 0.0004974789239999027, 'samples': 1669824, 'steps': 8696, 'loss/train': 1.7184191942214966} -11/06/2021 22:27:38 - INFO - __main__ - Step 8698: {'lr': 0.0004974781722027459, 'samples': 1670016, 'steps': 8697, 'loss/train': 1.8397278785705566} -11/06/2021 22:27:39 - INFO - __main__ - Step 8699: {'lr': 0.0004974774202940791, 'samples': 1670208, 'steps': 8698, 'loss/train': 1.9065308570861816} -11/06/2021 22:27:40 - INFO - __main__ - Step 8700: {'lr': 0.000497476668273903, 'samples': 1670400, 'steps': 8699, 'loss/train': 0.9457817673683167} -11/06/2021 22:27:40 - INFO - __main__ - Step 8701: {'lr': 0.0004974759161422175, 'samples': 1670592, 'steps': 8700, 'loss/train': 1.5651483535766602} -11/06/2021 22:27:40 - INFO - __main__ - Step 8702: {'lr': 0.0004974751638990233, 'samples': 1670784, 'steps': 8701, 'loss/train': 1.9571999311447144} -11/06/2021 22:27:41 - INFO - __main__ - Step 8703: {'lr': 0.0004974744115443206, 'samples': 1670976, 'steps': 8702, 'loss/train': 1.1419717073440552} -11/06/2021 22:27:42 - INFO - __main__ - Step 8704: {'lr': 0.0004974736590781097, 'samples': 1671168, 'steps': 8703, 'loss/train': 2.3399507999420166} -11/06/2021 22:27:42 - INFO - __main__ - Step 8705: {'lr': 0.000497472906500391, 'samples': 1671360, 'steps': 8704, 'loss/train': 1.9851784706115723} -11/06/2021 22:27:43 - INFO - __main__ - Step 8706: {'lr': 0.0004974721538111649, 'samples': 1671552, 'steps': 8705, 'loss/train': 1.7644202709197998} -11/06/2021 22:27:43 - INFO - __main__ - Step 8707: {'lr': 0.0004974714010104315, 'samples': 1671744, 'steps': 8706, 'loss/train': 2.234442949295044} -11/06/2021 22:27:43 - INFO - __main__ - Step 8708: {'lr': 0.0004974706480981914, 'samples': 1671936, 'steps': 8707, 'loss/train': 1.5944517850875854} -11/06/2021 22:27:44 - INFO - __main__ - Step 8709: {'lr': 0.0004974698950744449, 'samples': 1672128, 'steps': 8708, 'loss/train': 2.5472395420074463} -11/06/2021 22:27:45 - INFO - __main__ - Step 8710: {'lr': 0.0004974691419391922, 'samples': 1672320, 'steps': 8709, 'loss/train': 1.8900412321090698} -11/06/2021 22:27:45 - INFO - __main__ - Step 8711: {'lr': 0.0004974683886924339, 'samples': 1672512, 'steps': 8710, 'loss/train': 1.7456995248794556} -11/06/2021 22:27:45 - INFO - __main__ - Step 8712: {'lr': 0.00049746763533417, 'samples': 1672704, 'steps': 8711, 'loss/train': 2.188673257827759} -11/06/2021 22:27:46 - INFO - __main__ - Step 8713: {'lr': 0.000497466881864401, 'samples': 1672896, 'steps': 8712, 'loss/train': 1.39998459815979} -11/06/2021 22:27:46 - INFO - __main__ - Step 8714: {'lr': 0.0004974661282831272, 'samples': 1673088, 'steps': 8713, 'loss/train': 1.890992522239685} -11/06/2021 22:27:47 - INFO - __main__ - Step 8715: {'lr': 0.0004974653745903491, 'samples': 1673280, 'steps': 8714, 'loss/train': 1.2863065004348755} -11/06/2021 22:27:47 - INFO - __main__ - Step 8716: {'lr': 0.0004974646207860668, 'samples': 1673472, 'steps': 8715, 'loss/train': 2.333582878112793} -11/06/2021 22:27:48 - INFO - __main__ - Step 8717: {'lr': 0.0004974638668702809, 'samples': 1673664, 'steps': 8716, 'loss/train': 0.5336604714393616} -11/06/2021 22:27:48 - INFO - __main__ - Step 8718: {'lr': 0.0004974631128429915, 'samples': 1673856, 'steps': 8717, 'loss/train': 2.640268564224243} -11/06/2021 22:27:48 - INFO - __main__ - Step 8719: {'lr': 0.0004974623587041991, 'samples': 1674048, 'steps': 8718, 'loss/train': 2.1433913707733154} -11/06/2021 22:27:49 - INFO - __main__ - Step 8720: {'lr': 0.000497461604453904, 'samples': 1674240, 'steps': 8719, 'loss/train': 1.5393385887145996} -11/06/2021 22:27:50 - INFO - __main__ - Step 8721: {'lr': 0.0004974608500921064, 'samples': 1674432, 'steps': 8720, 'loss/train': 2.028142213821411} -11/06/2021 22:27:50 - INFO - __main__ - Step 8722: {'lr': 0.0004974600956188068, 'samples': 1674624, 'steps': 8721, 'loss/train': 1.8649543523788452} -11/06/2021 22:27:50 - INFO - __main__ - Step 8723: {'lr': 0.0004974593410340056, 'samples': 1674816, 'steps': 8722, 'loss/train': 1.037925124168396} -11/06/2021 22:27:51 - INFO - __main__ - Step 8724: {'lr': 0.000497458586337703, 'samples': 1675008, 'steps': 8723, 'loss/train': 1.7672851085662842} -11/06/2021 22:27:52 - INFO - __main__ - Step 8725: {'lr': 0.0004974578315298993, 'samples': 1675200, 'steps': 8724, 'loss/train': 1.966469407081604} -11/06/2021 22:27:52 - INFO - __main__ - Step 8726: {'lr': 0.000497457076610595, 'samples': 1675392, 'steps': 8725, 'loss/train': 1.7877483367919922} -11/06/2021 22:27:53 - INFO - __main__ - Step 8727: {'lr': 0.0004974563215797903, 'samples': 1675584, 'steps': 8726, 'loss/train': 1.3742201328277588} -11/06/2021 22:27:53 - INFO - __main__ - Step 8728: {'lr': 0.0004974555664374857, 'samples': 1675776, 'steps': 8727, 'loss/train': 2.265516757965088} -11/06/2021 22:27:53 - INFO - __main__ - Step 8729: {'lr': 0.0004974548111836812, 'samples': 1675968, 'steps': 8728, 'loss/train': 1.7990782260894775} -11/06/2021 22:27:54 - INFO - __main__ - Step 8730: {'lr': 0.0004974540558183776, 'samples': 1676160, 'steps': 8729, 'loss/train': 1.5700663328170776} -11/06/2021 22:27:55 - INFO - __main__ - Step 8731: {'lr': 0.0004974533003415751, 'samples': 1676352, 'steps': 8730, 'loss/train': 2.584472894668579} -11/06/2021 22:27:55 - INFO - __main__ - Step 8732: {'lr': 0.0004974525447532737, 'samples': 1676544, 'steps': 8731, 'loss/train': 0.7004466652870178} -11/06/2021 22:27:55 - INFO - __main__ - Step 8733: {'lr': 0.0004974517890534742, 'samples': 1676736, 'steps': 8732, 'loss/train': 2.029585361480713} -11/06/2021 22:27:56 - INFO - __main__ - Step 8734: {'lr': 0.0004974510332421767, 'samples': 1676928, 'steps': 8733, 'loss/train': 2.3354976177215576} -11/06/2021 22:27:57 - INFO - __main__ - Step 8735: {'lr': 0.0004974502773193815, 'samples': 1677120, 'steps': 8734, 'loss/train': 1.779792308807373} -11/06/2021 22:27:57 - INFO - __main__ - Step 8736: {'lr': 0.0004974495212850892, 'samples': 1677312, 'steps': 8735, 'loss/train': 1.7999184131622314} -11/06/2021 22:27:58 - INFO - __main__ - Step 8737: {'lr': 0.0004974487651392998, 'samples': 1677504, 'steps': 8736, 'loss/train': 2.0719504356384277} -11/06/2021 22:27:58 - INFO - __main__ - Step 8738: {'lr': 0.0004974480088820139, 'samples': 1677696, 'steps': 8737, 'loss/train': 1.93135666847229} -11/06/2021 22:27:59 - INFO - __main__ - Step 8739: {'lr': 0.0004974472525132316, 'samples': 1677888, 'steps': 8738, 'loss/train': 2.191235303878784} -11/06/2021 22:27:59 - INFO - __main__ - Step 8740: {'lr': 0.0004974464960329536, 'samples': 1678080, 'steps': 8739, 'loss/train': 1.711877465248108} -11/06/2021 22:28:00 - INFO - __main__ - Step 8741: {'lr': 0.0004974457394411798, 'samples': 1678272, 'steps': 8740, 'loss/train': 1.1441311836242676} -11/06/2021 22:28:00 - INFO - __main__ - Step 8742: {'lr': 0.0004974449827379109, 'samples': 1678464, 'steps': 8741, 'loss/train': 2.325981616973877} -11/06/2021 22:28:01 - INFO - __main__ - Step 8743: {'lr': 0.000497444225923147, 'samples': 1678656, 'steps': 8742, 'loss/train': 1.826312780380249} -11/06/2021 22:28:01 - INFO - __main__ - Step 8744: {'lr': 0.0004974434689968887, 'samples': 1678848, 'steps': 8743, 'loss/train': 2.2900896072387695} -11/06/2021 22:28:01 - INFO - __main__ - Step 8745: {'lr': 0.0004974427119591361, 'samples': 1679040, 'steps': 8744, 'loss/train': 2.352595090866089} -11/06/2021 22:28:02 - INFO - __main__ - Step 8746: {'lr': 0.0004974419548098897, 'samples': 1679232, 'steps': 8745, 'loss/train': 1.2469137907028198} -11/06/2021 22:28:03 - INFO - __main__ - Step 8747: {'lr': 0.0004974411975491498, 'samples': 1679424, 'steps': 8746, 'loss/train': 1.8148316144943237} -11/06/2021 22:28:03 - INFO - __main__ - Step 8748: {'lr': 0.0004974404401769167, 'samples': 1679616, 'steps': 8747, 'loss/train': 2.2442069053649902} -11/06/2021 22:28:03 - INFO - __main__ - Step 8749: {'lr': 0.0004974396826931906, 'samples': 1679808, 'steps': 8748, 'loss/train': 2.0725631713867188} -11/06/2021 22:28:04 - INFO - __main__ - Step 8750: {'lr': 0.0004974389250979722, 'samples': 1680000, 'steps': 8749, 'loss/train': 1.7763142585754395} -11/06/2021 22:28:05 - INFO - __main__ - Step 8751: {'lr': 0.0004974381673912614, 'samples': 1680192, 'steps': 8750, 'loss/train': 2.2424070835113525} -11/06/2021 22:28:05 - INFO - __main__ - Step 8752: {'lr': 0.000497437409573059, 'samples': 1680384, 'steps': 8751, 'loss/train': 1.8414136171340942} -11/06/2021 22:28:05 - INFO - __main__ - Step 8753: {'lr': 0.000497436651643365, 'samples': 1680576, 'steps': 8752, 'loss/train': 1.7458195686340332} -11/06/2021 22:28:06 - INFO - __main__ - Step 8754: {'lr': 0.00049743589360218, 'samples': 1680768, 'steps': 8753, 'loss/train': 2.1746933460235596} -11/06/2021 22:28:06 - INFO - __main__ - Step 8755: {'lr': 0.0004974351354495041, 'samples': 1680960, 'steps': 8754, 'loss/train': 1.9091649055480957} -11/06/2021 22:28:07 - INFO - __main__ - Step 8756: {'lr': 0.0004974343771853377, 'samples': 1681152, 'steps': 8755, 'loss/train': 1.7813023328781128} -11/06/2021 22:28:07 - INFO - __main__ - Step 8757: {'lr': 0.0004974336188096813, 'samples': 1681344, 'steps': 8756, 'loss/train': 1.627087116241455} -11/06/2021 22:28:08 - INFO - __main__ - Step 8758: {'lr': 0.0004974328603225351, 'samples': 1681536, 'steps': 8757, 'loss/train': 1.492101788520813} -11/06/2021 22:28:08 - INFO - __main__ - Step 8759: {'lr': 0.0004974321017238994, 'samples': 1681728, 'steps': 8758, 'loss/train': 1.5569329261779785} -11/06/2021 22:28:09 - INFO - __main__ - Step 8760: {'lr': 0.0004974313430137747, 'samples': 1681920, 'steps': 8759, 'loss/train': 1.9305700063705444} -11/06/2021 22:28:10 - INFO - __main__ - Step 8761: {'lr': 0.0004974305841921612, 'samples': 1682112, 'steps': 8760, 'loss/train': 1.7186388969421387} -11/06/2021 22:28:10 - INFO - __main__ - Step 8762: {'lr': 0.0004974298252590593, 'samples': 1682304, 'steps': 8761, 'loss/train': 1.9467127323150635} -11/06/2021 22:28:10 - INFO - __main__ - Step 8763: {'lr': 0.0004974290662144694, 'samples': 1682496, 'steps': 8762, 'loss/train': 1.675337791442871} -11/06/2021 22:28:11 - INFO - __main__ - Step 8764: {'lr': 0.0004974283070583917, 'samples': 1682688, 'steps': 8763, 'loss/train': 1.5082322359085083} -11/06/2021 22:28:11 - INFO - __main__ - Step 8765: {'lr': 0.0004974275477908266, 'samples': 1682880, 'steps': 8764, 'loss/train': 2.1924538612365723} -11/06/2021 22:28:12 - INFO - __main__ - Step 8766: {'lr': 0.0004974267884117746, 'samples': 1683072, 'steps': 8765, 'loss/train': 0.8508917093276978} -11/06/2021 22:28:12 - INFO - __main__ - Step 8767: {'lr': 0.0004974260289212358, 'samples': 1683264, 'steps': 8766, 'loss/train': 1.8229551315307617} -11/06/2021 22:28:13 - INFO - __main__ - Step 8768: {'lr': 0.0004974252693192106, 'samples': 1683456, 'steps': 8767, 'loss/train': 1.7984812259674072} -11/06/2021 22:28:13 - INFO - __main__ - Step 8769: {'lr': 0.0004974245096056995, 'samples': 1683648, 'steps': 8768, 'loss/train': 1.664389729499817} -11/06/2021 22:28:13 - INFO - __main__ - Step 8770: {'lr': 0.0004974237497807027, 'samples': 1683840, 'steps': 8769, 'loss/train': 0.3073934018611908} -11/06/2021 22:28:14 - INFO - __main__ - Step 8771: {'lr': 0.0004974229898442207, 'samples': 1684032, 'steps': 8770, 'loss/train': 1.7521414756774902} -11/06/2021 22:28:15 - INFO - __main__ - Step 8772: {'lr': 0.0004974222297962535, 'samples': 1684224, 'steps': 8771, 'loss/train': 1.6954983472824097} -11/06/2021 22:28:15 - INFO - __main__ - Step 8773: {'lr': 0.0004974214696368017, 'samples': 1684416, 'steps': 8772, 'loss/train': 1.7648489475250244} -11/06/2021 22:28:15 - INFO - __main__ - Step 8774: {'lr': 0.0004974207093658657, 'samples': 1684608, 'steps': 8773, 'loss/train': 1.5386720895767212} -11/06/2021 22:28:16 - INFO - __main__ - Step 8775: {'lr': 0.0004974199489834457, 'samples': 1684800, 'steps': 8774, 'loss/train': 1.757877230644226} -11/06/2021 22:28:17 - INFO - __main__ - Step 8776: {'lr': 0.0004974191884895421, 'samples': 1684992, 'steps': 8775, 'loss/train': 1.9185556173324585} -11/06/2021 22:28:17 - INFO - __main__ - Step 8777: {'lr': 0.0004974184278841552, 'samples': 1685184, 'steps': 8776, 'loss/train': 2.359382152557373} -11/06/2021 22:28:18 - INFO - __main__ - Step 8778: {'lr': 0.0004974176671672854, 'samples': 1685376, 'steps': 8777, 'loss/train': 1.3928838968276978} -11/06/2021 22:28:18 - INFO - __main__ - Step 8779: {'lr': 0.000497416906338933, 'samples': 1685568, 'steps': 8778, 'loss/train': 2.1888182163238525} -11/06/2021 22:28:18 - INFO - __main__ - Step 8780: {'lr': 0.0004974161453990985, 'samples': 1685760, 'steps': 8779, 'loss/train': 1.9797148704528809} -11/06/2021 22:28:19 - INFO - __main__ - Step 8781: {'lr': 0.0004974153843477819, 'samples': 1685952, 'steps': 8780, 'loss/train': 1.6259188652038574} -11/06/2021 22:28:20 - INFO - __main__ - Step 8782: {'lr': 0.0004974146231849838, 'samples': 1686144, 'steps': 8781, 'loss/train': 1.612627387046814} -11/06/2021 22:28:20 - INFO - __main__ - Step 8783: {'lr': 0.0004974138619107046, 'samples': 1686336, 'steps': 8782, 'loss/train': 1.9349783658981323} -11/06/2021 22:28:20 - INFO - __main__ - Step 8784: {'lr': 0.0004974131005249444, 'samples': 1686528, 'steps': 8783, 'loss/train': 1.3217498064041138} -11/06/2021 22:28:21 - INFO - __main__ - Step 8785: {'lr': 0.0004974123390277037, 'samples': 1686720, 'steps': 8784, 'loss/train': 0.9705907702445984} -11/06/2021 22:28:21 - INFO - __main__ - Step 8786: {'lr': 0.0004974115774189829, 'samples': 1686912, 'steps': 8785, 'loss/train': 1.2650182247161865} -11/06/2021 22:28:22 - INFO - __main__ - Step 8787: {'lr': 0.0004974108156987822, 'samples': 1687104, 'steps': 8786, 'loss/train': 1.8180323839187622} -11/06/2021 22:28:23 - INFO - __main__ - Step 8788: {'lr': 0.000497410053867102, 'samples': 1687296, 'steps': 8787, 'loss/train': 2.028273105621338} -11/06/2021 22:28:23 - INFO - __main__ - Step 8789: {'lr': 0.0004974092919239427, 'samples': 1687488, 'steps': 8788, 'loss/train': 1.8566056489944458} -11/06/2021 22:28:23 - INFO - __main__ - Step 8790: {'lr': 0.0004974085298693045, 'samples': 1687680, 'steps': 8789, 'loss/train': 1.7841997146606445} -11/06/2021 22:28:24 - INFO - __main__ - Step 8791: {'lr': 0.0004974077677031879, 'samples': 1687872, 'steps': 8790, 'loss/train': 1.7749842405319214} -11/06/2021 22:28:25 - INFO - __main__ - Step 8792: {'lr': 0.0004974070054255932, 'samples': 1688064, 'steps': 8791, 'loss/train': 1.3394575119018555} -11/06/2021 22:28:25 - INFO - __main__ - Step 8793: {'lr': 0.0004974062430365206, 'samples': 1688256, 'steps': 8792, 'loss/train': 2.017791509628296} -11/06/2021 22:28:25 - INFO - __main__ - Step 8794: {'lr': 0.0004974054805359706, 'samples': 1688448, 'steps': 8793, 'loss/train': 1.5951640605926514} -11/06/2021 22:28:26 - INFO - __main__ - Step 8795: {'lr': 0.0004974047179239436, 'samples': 1688640, 'steps': 8794, 'loss/train': 1.9513581991195679} -11/06/2021 22:28:26 - INFO - __main__ - Step 8796: {'lr': 0.0004974039552004398, 'samples': 1688832, 'steps': 8795, 'loss/train': 1.227823257446289} -11/06/2021 22:28:27 - INFO - __main__ - Step 8797: {'lr': 0.0004974031923654596, 'samples': 1689024, 'steps': 8796, 'loss/train': 1.9323481321334839} -11/06/2021 22:28:27 - INFO - __main__ - Step 8798: {'lr': 0.0004974024294190034, 'samples': 1689216, 'steps': 8797, 'loss/train': 1.6938538551330566} -11/06/2021 22:28:28 - INFO - __main__ - Step 8799: {'lr': 0.0004974016663610713, 'samples': 1689408, 'steps': 8798, 'loss/train': 1.885172724723816} -11/06/2021 22:28:28 - INFO - __main__ - Step 8800: {'lr': 0.000497400903191664, 'samples': 1689600, 'steps': 8799, 'loss/train': 1.5480501651763916} -11/06/2021 22:28:28 - INFO - __main__ - Step 8801: {'lr': 0.0004974001399107816, 'samples': 1689792, 'steps': 8800, 'loss/train': 2.519402265548706} -11/06/2021 22:28:29 - INFO - __main__ - Step 8802: {'lr': 0.0004973993765184246, 'samples': 1689984, 'steps': 8801, 'loss/train': 1.6957279443740845} -11/06/2021 22:28:30 - INFO - __main__ - Step 8803: {'lr': 0.0004973986130145931, 'samples': 1690176, 'steps': 8802, 'loss/train': 1.698414921760559} -11/06/2021 22:28:30 - INFO - __main__ - Step 8804: {'lr': 0.0004973978493992877, 'samples': 1690368, 'steps': 8803, 'loss/train': 1.4111169576644897} -11/06/2021 22:28:30 - INFO - __main__ - Step 8805: {'lr': 0.0004973970856725086, 'samples': 1690560, 'steps': 8804, 'loss/train': 1.862740159034729} -11/06/2021 22:28:31 - INFO - __main__ - Step 8806: {'lr': 0.0004973963218342563, 'samples': 1690752, 'steps': 8805, 'loss/train': 1.8943990468978882} -11/06/2021 22:28:32 - INFO - __main__ - Step 8807: {'lr': 0.000497395557884531, 'samples': 1690944, 'steps': 8806, 'loss/train': 2.2840816974639893} -11/06/2021 22:28:32 - INFO - __main__ - Step 8808: {'lr': 0.000497394793823333, 'samples': 1691136, 'steps': 8807, 'loss/train': 1.346774697303772} -11/06/2021 22:28:33 - INFO - __main__ - Step 8809: {'lr': 0.0004973940296506627, 'samples': 1691328, 'steps': 8808, 'loss/train': 1.4218136072158813} -11/06/2021 22:28:33 - INFO - __main__ - Step 8810: {'lr': 0.0004973932653665206, 'samples': 1691520, 'steps': 8809, 'loss/train': 0.507257878780365} -11/06/2021 22:28:33 - INFO - __main__ - Step 8811: {'lr': 0.0004973925009709068, 'samples': 1691712, 'steps': 8810, 'loss/train': 1.9113545417785645} -11/06/2021 22:28:34 - INFO - __main__ - Step 8812: {'lr': 0.0004973917364638218, 'samples': 1691904, 'steps': 8811, 'loss/train': 1.7712737321853638} -11/06/2021 22:28:34 - INFO - __main__ - Step 8813: {'lr': 0.0004973909718452659, 'samples': 1692096, 'steps': 8812, 'loss/train': 2.098034381866455} -11/06/2021 22:28:35 - INFO - __main__ - Step 8814: {'lr': 0.0004973902071152396, 'samples': 1692288, 'steps': 8813, 'loss/train': 1.7307425737380981} -11/06/2021 22:28:35 - INFO - __main__ - Step 8815: {'lr': 0.0004973894422737428, 'samples': 1692480, 'steps': 8814, 'loss/train': 1.682647466659546} -11/06/2021 22:28:36 - INFO - __main__ - Step 8816: {'lr': 0.0004973886773207763, 'samples': 1692672, 'steps': 8815, 'loss/train': 1.6713685989379883} -11/06/2021 22:28:37 - INFO - __main__ - Step 8817: {'lr': 0.0004973879122563403, 'samples': 1692864, 'steps': 8816, 'loss/train': 2.685642957687378} -11/06/2021 22:28:37 - INFO - __main__ - Step 8818: {'lr': 0.000497387147080435, 'samples': 1693056, 'steps': 8817, 'loss/train': 1.6026307344436646} -11/06/2021 22:28:37 - INFO - __main__ - Step 8819: {'lr': 0.000497386381793061, 'samples': 1693248, 'steps': 8818, 'loss/train': 1.8597676753997803} -11/06/2021 22:28:38 - INFO - __main__ - Step 8820: {'lr': 0.0004973856163942185, 'samples': 1693440, 'steps': 8819, 'loss/train': 1.8286590576171875} -11/06/2021 22:28:38 - INFO - __main__ - Step 8821: {'lr': 0.0004973848508839077, 'samples': 1693632, 'steps': 8820, 'loss/train': 1.868646264076233} -11/06/2021 22:28:38 - INFO - __main__ - Step 8822: {'lr': 0.0004973840852621293, 'samples': 1693824, 'steps': 8821, 'loss/train': 1.4488940238952637} -11/06/2021 22:28:39 - INFO - __main__ - Step 8823: {'lr': 0.0004973833195288834, 'samples': 1694016, 'steps': 8822, 'loss/train': 1.7625603675842285} -11/06/2021 22:28:40 - INFO - __main__ - Step 8824: {'lr': 0.0004973825536841703, 'samples': 1694208, 'steps': 8823, 'loss/train': 1.8687225580215454} -11/06/2021 22:28:40 - INFO - __main__ - Step 8825: {'lr': 0.0004973817877279906, 'samples': 1694400, 'steps': 8824, 'loss/train': 1.4771027565002441} -11/06/2021 22:28:41 - INFO - __main__ - Step 8826: {'lr': 0.0004973810216603443, 'samples': 1694592, 'steps': 8825, 'loss/train': 0.3064444959163666} -11/06/2021 22:28:41 - INFO - __main__ - Step 8827: {'lr': 0.000497380255481232, 'samples': 1694784, 'steps': 8826, 'loss/train': 1.9688664674758911} -11/06/2021 22:28:42 - INFO - __main__ - Step 8828: {'lr': 0.000497379489190654, 'samples': 1694976, 'steps': 8827, 'loss/train': 1.279405117034912} -11/06/2021 22:28:42 - INFO - __main__ - Step 8829: {'lr': 0.0004973787227886106, 'samples': 1695168, 'steps': 8828, 'loss/train': 1.0162687301635742} -11/06/2021 22:28:43 - INFO - __main__ - Step 8830: {'lr': 0.0004973779562751022, 'samples': 1695360, 'steps': 8829, 'loss/train': 1.7933107614517212} -11/06/2021 22:28:43 - INFO - __main__ - Step 8831: {'lr': 0.0004973771896501292, 'samples': 1695552, 'steps': 8830, 'loss/train': 2.0314056873321533} -11/06/2021 22:28:43 - INFO - __main__ - Step 8832: {'lr': 0.0004973764229136917, 'samples': 1695744, 'steps': 8831, 'loss/train': 1.8036915063858032} -11/06/2021 22:28:44 - INFO - __main__ - Step 8833: {'lr': 0.0004973756560657901, 'samples': 1695936, 'steps': 8832, 'loss/train': 1.417937994003296} -11/06/2021 22:28:45 - INFO - __main__ - Step 8834: {'lr': 0.0004973748891064251, 'samples': 1696128, 'steps': 8833, 'loss/train': 1.0796078443527222} -11/06/2021 22:28:45 - INFO - __main__ - Step 8835: {'lr': 0.0004973741220355967, 'samples': 1696320, 'steps': 8834, 'loss/train': 1.756775975227356} -11/06/2021 22:28:45 - INFO - __main__ - Step 8836: {'lr': 0.0004973733548533052, 'samples': 1696512, 'steps': 8835, 'loss/train': 1.7436381578445435} -11/06/2021 22:28:46 - INFO - __main__ - Step 8837: {'lr': 0.0004973725875595513, 'samples': 1696704, 'steps': 8836, 'loss/train': 2.336061716079712} -11/06/2021 22:28:47 - INFO - __main__ - Step 8838: {'lr': 0.000497371820154335, 'samples': 1696896, 'steps': 8837, 'loss/train': 1.9740123748779297} -11/06/2021 22:28:47 - INFO - __main__ - Step 8839: {'lr': 0.0004973710526376569, 'samples': 1697088, 'steps': 8838, 'loss/train': 0.7141327261924744} -11/06/2021 22:28:47 - INFO - __main__ - Step 8840: {'lr': 0.000497370285009517, 'samples': 1697280, 'steps': 8839, 'loss/train': 1.4266327619552612} -11/06/2021 22:28:48 - INFO - __main__ - Step 8841: {'lr': 0.000497369517269916, 'samples': 1697472, 'steps': 8840, 'loss/train': 2.1014244556427} -11/06/2021 22:28:48 - INFO - __main__ - Step 8842: {'lr': 0.0004973687494188541, 'samples': 1697664, 'steps': 8841, 'loss/train': 1.9083147048950195} -11/06/2021 22:28:49 - INFO - __main__ - Step 8843: {'lr': 0.0004973679814563318, 'samples': 1697856, 'steps': 8842, 'loss/train': 1.9293524026870728} -11/06/2021 22:28:50 - INFO - __main__ - Step 8844: {'lr': 0.0004973672133823491, 'samples': 1698048, 'steps': 8843, 'loss/train': 1.9651559591293335} -11/06/2021 22:28:50 - INFO - __main__ - Step 8845: {'lr': 0.0004973664451969066, 'samples': 1698240, 'steps': 8844, 'loss/train': 2.337369203567505} -11/06/2021 22:28:50 - INFO - __main__ - Step 8846: {'lr': 0.0004973656769000046, 'samples': 1698432, 'steps': 8845, 'loss/train': 1.0025054216384888} -11/06/2021 22:28:51 - INFO - __main__ - Step 8847: {'lr': 0.0004973649084916435, 'samples': 1698624, 'steps': 8846, 'loss/train': 2.6142988204956055} -11/06/2021 22:28:52 - INFO - __main__ - Step 8848: {'lr': 0.0004973641399718236, 'samples': 1698816, 'steps': 8847, 'loss/train': 2.0085182189941406} -11/06/2021 22:28:52 - INFO - __main__ - Step 8849: {'lr': 0.0004973633713405451, 'samples': 1699008, 'steps': 8848, 'loss/train': 1.4306745529174805} -11/06/2021 22:28:53 - INFO - __main__ - Step 8850: {'lr': 0.0004973626025978086, 'samples': 1699200, 'steps': 8849, 'loss/train': 1.551592469215393} -11/06/2021 22:28:53 - INFO - __main__ - Step 8851: {'lr': 0.0004973618337436143, 'samples': 1699392, 'steps': 8850, 'loss/train': 1.7350374460220337} -11/06/2021 22:28:53 - INFO - __main__ - Step 8852: {'lr': 0.0004973610647779626, 'samples': 1699584, 'steps': 8851, 'loss/train': 1.860516905784607} -11/06/2021 22:28:54 - INFO - __main__ - Step 8853: {'lr': 0.0004973602957008537, 'samples': 1699776, 'steps': 8852, 'loss/train': 1.765555739402771} -11/06/2021 22:28:55 - INFO - __main__ - Step 8854: {'lr': 0.0004973595265122883, 'samples': 1699968, 'steps': 8853, 'loss/train': 2.4081969261169434} -11/06/2021 22:28:55 - INFO - __main__ - Step 8855: {'lr': 0.0004973587572122663, 'samples': 1700160, 'steps': 8854, 'loss/train': 1.8850605487823486} -11/06/2021 22:28:55 - INFO - __main__ - Step 8856: {'lr': 0.0004973579878007884, 'samples': 1700352, 'steps': 8855, 'loss/train': 1.608045220375061} -11/06/2021 22:28:56 - INFO - __main__ - Step 8857: {'lr': 0.0004973572182778546, 'samples': 1700544, 'steps': 8856, 'loss/train': 1.670106291770935} -11/06/2021 22:28:56 - INFO - __main__ - Step 8858: {'lr': 0.0004973564486434656, 'samples': 1700736, 'steps': 8857, 'loss/train': 1.6520261764526367} -11/06/2021 22:28:57 - INFO - __main__ - Step 8859: {'lr': 0.0004973556788976217, 'samples': 1700928, 'steps': 8858, 'loss/train': 1.5881348848342896} -11/06/2021 22:28:57 - INFO - __main__ - Step 8860: {'lr': 0.000497354909040323, 'samples': 1701120, 'steps': 8859, 'loss/train': 1.7174054384231567} -11/06/2021 22:28:58 - INFO - __main__ - Step 8861: {'lr': 0.00049735413907157, 'samples': 1701312, 'steps': 8860, 'loss/train': 1.8992524147033691} -11/06/2021 22:28:58 - INFO - __main__ - Step 8862: {'lr': 0.0004973533689913631, 'samples': 1701504, 'steps': 8861, 'loss/train': 1.570049524307251} -11/06/2021 22:28:58 - INFO - __main__ - Step 8863: {'lr': 0.0004973525987997026, 'samples': 1701696, 'steps': 8862, 'loss/train': 2.445530891418457} -11/06/2021 22:28:59 - INFO - __main__ - Step 8864: {'lr': 0.0004973518284965888, 'samples': 1701888, 'steps': 8863, 'loss/train': 1.9217685461044312} -11/06/2021 22:29:00 - INFO - __main__ - Step 8865: {'lr': 0.0004973510580820221, 'samples': 1702080, 'steps': 8864, 'loss/train': 1.8503520488739014} -11/06/2021 22:29:00 - INFO - __main__ - Step 8866: {'lr': 0.0004973502875560028, 'samples': 1702272, 'steps': 8865, 'loss/train': 1.635284185409546} -11/06/2021 22:29:01 - INFO - __main__ - Step 8867: {'lr': 0.0004973495169185313, 'samples': 1702464, 'steps': 8866, 'loss/train': 1.2922062873840332} -11/06/2021 22:29:01 - INFO - __main__ - Step 8868: {'lr': 0.0004973487461696079, 'samples': 1702656, 'steps': 8867, 'loss/train': 1.878747820854187} -11/06/2021 22:29:02 - INFO - __main__ - Step 8869: {'lr': 0.000497347975309233, 'samples': 1702848, 'steps': 8868, 'loss/train': 1.7777513265609741} -11/06/2021 22:29:02 - INFO - __main__ - Step 8870: {'lr': 0.0004973472043374069, 'samples': 1703040, 'steps': 8869, 'loss/train': 1.8679721355438232} -11/06/2021 22:29:03 - INFO - __main__ - Step 8871: {'lr': 0.00049734643325413, 'samples': 1703232, 'steps': 8870, 'loss/train': 1.7162529230117798} -11/06/2021 22:29:03 - INFO - __main__ - Step 8872: {'lr': 0.0004973456620594026, 'samples': 1703424, 'steps': 8871, 'loss/train': 1.8824801445007324} -11/06/2021 22:29:03 - INFO - __main__ - Step 8873: {'lr': 0.0004973448907532251, 'samples': 1703616, 'steps': 8872, 'loss/train': 1.3267327547073364} -11/06/2021 22:29:04 - INFO - __main__ - Step 8874: {'lr': 0.0004973441193355978, 'samples': 1703808, 'steps': 8873, 'loss/train': 2.032459259033203} -11/06/2021 22:29:05 - INFO - __main__ - Step 8875: {'lr': 0.0004973433478065209, 'samples': 1704000, 'steps': 8874, 'loss/train': 1.6638219356536865} -11/06/2021 22:29:05 - INFO - __main__ - Step 8876: {'lr': 0.0004973425761659951, 'samples': 1704192, 'steps': 8875, 'loss/train': 1.3877533674240112} -11/06/2021 22:29:05 - INFO - __main__ - Step 8877: {'lr': 0.0004973418044140204, 'samples': 1704384, 'steps': 8876, 'loss/train': 1.6968107223510742} -11/06/2021 22:29:06 - INFO - __main__ - Step 8878: {'lr': 0.0004973410325505974, 'samples': 1704576, 'steps': 8877, 'loss/train': 0.47580868005752563} -11/06/2021 22:29:07 - INFO - __main__ - Step 8879: {'lr': 0.0004973402605757263, 'samples': 1704768, 'steps': 8878, 'loss/train': 1.8513538837432861} -11/06/2021 22:29:07 - INFO - __main__ - Step 8880: {'lr': 0.0004973394884894075, 'samples': 1704960, 'steps': 8879, 'loss/train': 1.8675156831741333} -11/06/2021 22:29:08 - INFO - __main__ - Step 8881: {'lr': 0.0004973387162916415, 'samples': 1705152, 'steps': 8880, 'loss/train': 1.1261378526687622} -11/06/2021 22:29:08 - INFO - __main__ - Step 8882: {'lr': 0.0004973379439824283, 'samples': 1705344, 'steps': 8881, 'loss/train': 2.2020576000213623} -11/06/2021 22:29:09 - INFO - __main__ - Step 8883: {'lr': 0.0004973371715617685, 'samples': 1705536, 'steps': 8882, 'loss/train': 1.241743803024292} -11/06/2021 22:29:09 - INFO - __main__ - Step 8884: {'lr': 0.0004973363990296624, 'samples': 1705728, 'steps': 8883, 'loss/train': 1.7667030096054077} -11/06/2021 22:29:10 - INFO - __main__ - Step 8885: {'lr': 0.0004973356263861103, 'samples': 1705920, 'steps': 8884, 'loss/train': 1.5185878276824951} -11/06/2021 22:29:10 - INFO - __main__ - Step 8886: {'lr': 0.0004973348536311126, 'samples': 1706112, 'steps': 8885, 'loss/train': 2.001230001449585} -11/06/2021 22:29:11 - INFO - __main__ - Step 8887: {'lr': 0.0004973340807646696, 'samples': 1706304, 'steps': 8886, 'loss/train': 2.3790831565856934} -11/06/2021 22:29:11 - INFO - __main__ - Step 8888: {'lr': 0.0004973333077867817, 'samples': 1706496, 'steps': 8887, 'loss/train': 1.9295786619186401} -11/06/2021 22:29:11 - INFO - __main__ - Step 8889: {'lr': 0.0004973325346974493, 'samples': 1706688, 'steps': 8888, 'loss/train': 1.372741937637329} -11/06/2021 22:29:13 - INFO - __main__ - Step 8890: {'lr': 0.0004973317614966726, 'samples': 1706880, 'steps': 8889, 'loss/train': 2.034008502960205} -11/06/2021 22:29:13 - INFO - __main__ - Step 8891: {'lr': 0.000497330988184452, 'samples': 1707072, 'steps': 8890, 'loss/train': 1.9604440927505493} -11/06/2021 22:29:13 - INFO - __main__ - Step 8892: {'lr': 0.000497330214760788, 'samples': 1707264, 'steps': 8891, 'loss/train': 0.9298360347747803} -11/06/2021 22:29:14 - INFO - __main__ - Step 8893: {'lr': 0.0004973294412256807, 'samples': 1707456, 'steps': 8892, 'loss/train': 1.6712414026260376} -11/06/2021 22:29:14 - INFO - __main__ - Step 8894: {'lr': 0.0004973286675791305, 'samples': 1707648, 'steps': 8893, 'loss/train': 1.9249519109725952} -11/06/2021 22:29:15 - INFO - __main__ - Step 8895: {'lr': 0.000497327893821138, 'samples': 1707840, 'steps': 8894, 'loss/train': 1.5401326417922974} -11/06/2021 22:29:15 - INFO - __main__ - Step 8896: {'lr': 0.0004973271199517033, 'samples': 1708032, 'steps': 8895, 'loss/train': 1.5258654356002808} -11/06/2021 22:29:16 - INFO - __main__ - Step 8897: {'lr': 0.0004973263459708268, 'samples': 1708224, 'steps': 8896, 'loss/train': 1.3488224744796753} -11/06/2021 22:29:16 - INFO - __main__ - Step 8898: {'lr': 0.0004973255718785088, 'samples': 1708416, 'steps': 8897, 'loss/train': 1.7817871570587158} -11/06/2021 22:29:16 - INFO - __main__ - Step 8899: {'lr': 0.0004973247976747499, 'samples': 1708608, 'steps': 8898, 'loss/train': 1.7609913349151611} -11/06/2021 22:29:17 - INFO - __main__ - Step 8900: {'lr': 0.00049732402335955, 'samples': 1708800, 'steps': 8899, 'loss/train': 1.659672737121582} -11/06/2021 22:29:18 - INFO - __main__ - Step 8901: {'lr': 0.0004973232489329099, 'samples': 1708992, 'steps': 8900, 'loss/train': 1.438830852508545} -11/06/2021 22:29:18 - INFO - __main__ - Step 8902: {'lr': 0.0004973224743948298, 'samples': 1709184, 'steps': 8901, 'loss/train': 2.05006742477417} -11/06/2021 22:29:18 - INFO - __main__ - Step 8903: {'lr': 0.00049732169974531, 'samples': 1709376, 'steps': 8902, 'loss/train': 1.8295646905899048} -11/06/2021 22:29:19 - INFO - __main__ - Step 8904: {'lr': 0.0004973209249843507, 'samples': 1709568, 'steps': 8903, 'loss/train': 1.4633625745773315} -11/06/2021 22:29:19 - INFO - __main__ - Step 8905: {'lr': 0.0004973201501119525, 'samples': 1709760, 'steps': 8904, 'loss/train': 1.7192811965942383} -11/06/2021 22:29:20 - INFO - __main__ - Step 8906: {'lr': 0.0004973193751281156, 'samples': 1709952, 'steps': 8905, 'loss/train': 1.834681510925293} -11/06/2021 22:29:20 - INFO - __main__ - Step 8907: {'lr': 0.0004973186000328405, 'samples': 1710144, 'steps': 8906, 'loss/train': 1.5164721012115479} -11/06/2021 22:29:21 - INFO - __main__ - Step 8908: {'lr': 0.0004973178248261274, 'samples': 1710336, 'steps': 8907, 'loss/train': 2.1482808589935303} -11/06/2021 22:29:21 - INFO - __main__ - Step 8909: {'lr': 0.0004973170495079768, 'samples': 1710528, 'steps': 8908, 'loss/train': 2.774986505508423} -11/06/2021 22:29:22 - INFO - __main__ - Step 8910: {'lr': 0.0004973162740783888, 'samples': 1710720, 'steps': 8909, 'loss/train': 1.804287075996399} -11/06/2021 22:29:23 - INFO - __main__ - Step 8911: {'lr': 0.000497315498537364, 'samples': 1710912, 'steps': 8910, 'loss/train': 1.4533205032348633} -11/06/2021 22:29:23 - INFO - __main__ - Step 8912: {'lr': 0.0004973147228849027, 'samples': 1711104, 'steps': 8911, 'loss/train': 1.924820065498352} -11/06/2021 22:29:23 - INFO - __main__ - Step 8913: {'lr': 0.0004973139471210051, 'samples': 1711296, 'steps': 8912, 'loss/train': 1.9860786199569702} -11/06/2021 22:29:24 - INFO - __main__ - Step 8914: {'lr': 0.0004973131712456717, 'samples': 1711488, 'steps': 8913, 'loss/train': 1.800611972808838} -11/06/2021 22:29:24 - INFO - __main__ - Step 8915: {'lr': 0.0004973123952589027, 'samples': 1711680, 'steps': 8914, 'loss/train': 2.1335561275482178} -11/06/2021 22:29:25 - INFO - __main__ - Step 8916: {'lr': 0.0004973116191606987, 'samples': 1711872, 'steps': 8915, 'loss/train': 2.246720552444458} -11/06/2021 22:29:25 - INFO - __main__ - Step 8917: {'lr': 0.0004973108429510598, 'samples': 1712064, 'steps': 8916, 'loss/train': 1.5170209407806396} -11/06/2021 22:29:26 - INFO - __main__ - Step 8918: {'lr': 0.0004973100666299864, 'samples': 1712256, 'steps': 8917, 'loss/train': 1.8479684591293335} -11/06/2021 22:29:26 - INFO - __main__ - Step 8919: {'lr': 0.000497309290197479, 'samples': 1712448, 'steps': 8918, 'loss/train': 1.6200121641159058} -11/06/2021 22:29:27 - INFO - __main__ - Step 8920: {'lr': 0.0004973085136535379, 'samples': 1712640, 'steps': 8919, 'loss/train': 1.8492422103881836} -11/06/2021 22:29:27 - INFO - __main__ - Step 8921: {'lr': 0.0004973077369981633, 'samples': 1712832, 'steps': 8920, 'loss/train': 1.80856192111969} -11/06/2021 22:29:28 - INFO - __main__ - Step 8922: {'lr': 0.0004973069602313557, 'samples': 1713024, 'steps': 8921, 'loss/train': 2.0224783420562744} -11/06/2021 22:29:28 - INFO - __main__ - Step 8923: {'lr': 0.0004973061833531154, 'samples': 1713216, 'steps': 8922, 'loss/train': 1.5250040292739868} -11/06/2021 22:29:28 - INFO - __main__ - Step 8924: {'lr': 0.0004973054063634428, 'samples': 1713408, 'steps': 8923, 'loss/train': 1.9554498195648193} -11/06/2021 22:29:29 - INFO - __main__ - Step 8925: {'lr': 0.0004973046292623382, 'samples': 1713600, 'steps': 8924, 'loss/train': 1.6448603868484497} -11/06/2021 22:29:30 - INFO - __main__ - Step 8926: {'lr': 0.0004973038520498017, 'samples': 1713792, 'steps': 8925, 'loss/train': 1.983763575553894} -11/06/2021 22:29:30 - INFO - __main__ - Step 8927: {'lr': 0.0004973030747258342, 'samples': 1713984, 'steps': 8926, 'loss/train': 1.5370417833328247} -11/06/2021 22:29:31 - INFO - __main__ - Step 8928: {'lr': 0.0004973022972904356, 'samples': 1714176, 'steps': 8927, 'loss/train': 2.2001898288726807} -11/06/2021 22:29:31 - INFO - __main__ - Step 8929: {'lr': 0.0004973015197436063, 'samples': 1714368, 'steps': 8928, 'loss/train': 3.589097023010254} -11/06/2021 22:29:31 - INFO - __main__ - Step 8930: {'lr': 0.0004973007420853471, 'samples': 1714560, 'steps': 8929, 'loss/train': 1.7380764484405518} -11/06/2021 22:29:32 - INFO - __main__ - Step 8931: {'lr': 0.0004972999643156577, 'samples': 1714752, 'steps': 8930, 'loss/train': 1.9435979127883911} -11/06/2021 22:29:33 - INFO - __main__ - Step 8932: {'lr': 0.0004972991864345389, 'samples': 1714944, 'steps': 8931, 'loss/train': 1.745599627494812} -11/06/2021 22:29:33 - INFO - __main__ - Step 8933: {'lr': 0.0004972984084419908, 'samples': 1715136, 'steps': 8932, 'loss/train': 1.9273251295089722} -11/06/2021 22:29:34 - INFO - __main__ - Step 8934: {'lr': 0.0004972976303380139, 'samples': 1715328, 'steps': 8933, 'loss/train': 1.3530958890914917} -11/06/2021 22:29:34 - INFO - __main__ - Step 8935: {'lr': 0.0004972968521226085, 'samples': 1715520, 'steps': 8934, 'loss/train': 2.121579885482788} -11/06/2021 22:29:34 - INFO - __main__ - Step 8936: {'lr': 0.0004972960737957749, 'samples': 1715712, 'steps': 8935, 'loss/train': 1.9268077611923218} -11/06/2021 22:29:35 - INFO - __main__ - Step 8937: {'lr': 0.0004972952953575136, 'samples': 1715904, 'steps': 8936, 'loss/train': 1.8524378538131714} -11/06/2021 22:29:36 - INFO - __main__ - Step 8938: {'lr': 0.0004972945168078248, 'samples': 1716096, 'steps': 8937, 'loss/train': 0.22625112533569336} -11/06/2021 22:29:36 - INFO - __main__ - Step 8939: {'lr': 0.000497293738146709, 'samples': 1716288, 'steps': 8938, 'loss/train': 1.5457402467727661} -11/06/2021 22:29:36 - INFO - __main__ - Step 8940: {'lr': 0.0004972929593741662, 'samples': 1716480, 'steps': 8939, 'loss/train': 1.9634605646133423} -11/06/2021 22:29:37 - INFO - __main__ - Step 8941: {'lr': 0.0004972921804901973, 'samples': 1716672, 'steps': 8940, 'loss/train': 1.6684246063232422} -11/06/2021 22:29:38 - INFO - __main__ - Step 8942: {'lr': 0.0004972914014948023, 'samples': 1716864, 'steps': 8941, 'loss/train': 2.112210512161255} -11/06/2021 22:29:38 - INFO - __main__ - Step 8943: {'lr': 0.0004972906223879815, 'samples': 1717056, 'steps': 8942, 'loss/train': 2.020785331726074} -11/06/2021 22:29:39 - INFO - __main__ - Step 8944: {'lr': 0.0004972898431697355, 'samples': 1717248, 'steps': 8943, 'loss/train': 1.4316191673278809} -11/06/2021 22:29:39 - INFO - __main__ - Step 8945: {'lr': 0.0004972890638400644, 'samples': 1717440, 'steps': 8944, 'loss/train': 3.3050966262817383} -11/06/2021 22:29:39 - INFO - __main__ - Step 8946: {'lr': 0.0004972882843989687, 'samples': 1717632, 'steps': 8945, 'loss/train': 1.6966694593429565} -11/06/2021 22:29:40 - INFO - __main__ - Step 8947: {'lr': 0.0004972875048464487, 'samples': 1717824, 'steps': 8946, 'loss/train': 1.5771774053573608} -11/06/2021 22:29:41 - INFO - __main__ - Step 8948: {'lr': 0.0004972867251825048, 'samples': 1718016, 'steps': 8947, 'loss/train': 2.001603841781616} -11/06/2021 22:29:41 - INFO - __main__ - Step 8949: {'lr': 0.0004972859454071373, 'samples': 1718208, 'steps': 8948, 'loss/train': 1.704656720161438} -11/06/2021 22:29:41 - INFO - __main__ - Step 8950: {'lr': 0.0004972851655203465, 'samples': 1718400, 'steps': 8949, 'loss/train': 2.2928240299224854} -11/06/2021 22:29:42 - INFO - __main__ - Step 8951: {'lr': 0.000497284385522133, 'samples': 1718592, 'steps': 8950, 'loss/train': 2.0876405239105225} -11/06/2021 22:29:42 - INFO - __main__ - Step 8952: {'lr': 0.0004972836054124968, 'samples': 1718784, 'steps': 8951, 'loss/train': 1.9462846517562866} -11/06/2021 22:29:43 - INFO - __main__ - Step 8953: {'lr': 0.0004972828251914384, 'samples': 1718976, 'steps': 8952, 'loss/train': 1.3022961616516113} -11/06/2021 22:29:43 - INFO - __main__ - Step 8954: {'lr': 0.0004972820448589584, 'samples': 1719168, 'steps': 8953, 'loss/train': 1.0215758085250854} -11/06/2021 22:29:44 - INFO - __main__ - Step 8955: {'lr': 0.0004972812644150567, 'samples': 1719360, 'steps': 8954, 'loss/train': 1.7224310636520386} -11/06/2021 22:29:44 - INFO - __main__ - Step 8956: {'lr': 0.000497280483859734, 'samples': 1719552, 'steps': 8955, 'loss/train': 1.3424328565597534} -11/06/2021 22:29:45 - INFO - __main__ - Step 8957: {'lr': 0.0004972797031929904, 'samples': 1719744, 'steps': 8956, 'loss/train': 1.9782111644744873} -11/06/2021 22:29:45 - INFO - __main__ - Step 8958: {'lr': 0.0004972789224148266, 'samples': 1719936, 'steps': 8957, 'loss/train': 2.0518736839294434} -11/06/2021 22:29:46 - INFO - __main__ - Step 8959: {'lr': 0.0004972781415252426, 'samples': 1720128, 'steps': 8958, 'loss/train': 2.4421885013580322} -11/06/2021 22:29:46 - INFO - __main__ - Step 8960: {'lr': 0.0004972773605242388, 'samples': 1720320, 'steps': 8959, 'loss/train': 1.4392913579940796} -11/06/2021 22:29:47 - INFO - __main__ - Step 8961: {'lr': 0.0004972765794118158, 'samples': 1720512, 'steps': 8960, 'loss/train': 1.1508708000183105} -11/06/2021 22:29:47 - INFO - __main__ - Step 8962: {'lr': 0.0004972757981879737, 'samples': 1720704, 'steps': 8961, 'loss/train': 1.7767452001571655} -11/06/2021 22:29:48 - INFO - __main__ - Step 8963: {'lr': 0.000497275016852713, 'samples': 1720896, 'steps': 8962, 'loss/train': 2.000983953475952} -11/06/2021 22:29:48 - INFO - __main__ - Step 8964: {'lr': 0.0004972742354060339, 'samples': 1721088, 'steps': 8963, 'loss/train': 1.6095494031906128} -11/06/2021 22:29:49 - INFO - __main__ - Step 8965: {'lr': 0.0004972734538479369, 'samples': 1721280, 'steps': 8964, 'loss/train': 2.106870174407959} -11/06/2021 22:29:49 - INFO - __main__ - Step 8966: {'lr': 0.0004972726721784223, 'samples': 1721472, 'steps': 8965, 'loss/train': 1.3510915040969849} -11/06/2021 22:29:49 - INFO - __main__ - Step 8967: {'lr': 0.0004972718903974904, 'samples': 1721664, 'steps': 8966, 'loss/train': 2.6114096641540527} -11/06/2021 22:29:50 - INFO - __main__ - Step 8968: {'lr': 0.0004972711085051417, 'samples': 1721856, 'steps': 8967, 'loss/train': 1.257983922958374} -11/06/2021 22:29:51 - INFO - __main__ - Step 8969: {'lr': 0.0004972703265013764, 'samples': 1722048, 'steps': 8968, 'loss/train': 1.7631484270095825} -11/06/2021 22:29:51 - INFO - __main__ - Step 8970: {'lr': 0.0004972695443861949, 'samples': 1722240, 'steps': 8969, 'loss/train': 1.826780080795288} -11/06/2021 22:29:51 - INFO - __main__ - Step 8971: {'lr': 0.0004972687621595975, 'samples': 1722432, 'steps': 8970, 'loss/train': 1.8841552734375} -11/06/2021 22:29:52 - INFO - __main__ - Step 8972: {'lr': 0.0004972679798215847, 'samples': 1722624, 'steps': 8971, 'loss/train': 1.433433175086975} -11/06/2021 22:29:53 - INFO - __main__ - Step 8973: {'lr': 0.0004972671973721567, 'samples': 1722816, 'steps': 8972, 'loss/train': 1.9559110403060913} -11/06/2021 22:29:53 - INFO - __main__ - Step 8974: {'lr': 0.000497266414811314, 'samples': 1723008, 'steps': 8973, 'loss/train': 2.148409605026245} -11/06/2021 22:29:54 - INFO - __main__ - Step 8975: {'lr': 0.0004972656321390568, 'samples': 1723200, 'steps': 8974, 'loss/train': 1.603281855583191} -11/06/2021 22:29:54 - INFO - __main__ - Step 8976: {'lr': 0.0004972648493553856, 'samples': 1723392, 'steps': 8975, 'loss/train': 1.3855030536651611} -11/06/2021 22:29:54 - INFO - __main__ - Step 8977: {'lr': 0.0004972640664603006, 'samples': 1723584, 'steps': 8976, 'loss/train': 1.4343771934509277} -11/06/2021 22:29:55 - INFO - __main__ - Step 8978: {'lr': 0.0004972632834538023, 'samples': 1723776, 'steps': 8977, 'loss/train': 1.4176015853881836} -11/06/2021 22:29:56 - INFO - __main__ - Step 8979: {'lr': 0.0004972625003358908, 'samples': 1723968, 'steps': 8978, 'loss/train': 1.4474366903305054} -11/06/2021 22:29:56 - INFO - __main__ - Step 8980: {'lr': 0.0004972617171065668, 'samples': 1724160, 'steps': 8979, 'loss/train': 0.7004616260528564} -11/06/2021 22:29:56 - INFO - __main__ - Step 8981: {'lr': 0.0004972609337658305, 'samples': 1724352, 'steps': 8980, 'loss/train': 1.7616783380508423} -11/06/2021 22:29:57 - INFO - __main__ - Step 8982: {'lr': 0.0004972601503136822, 'samples': 1724544, 'steps': 8981, 'loss/train': 1.6659023761749268} -11/06/2021 22:29:57 - INFO - __main__ - Step 8983: {'lr': 0.0004972593667501222, 'samples': 1724736, 'steps': 8982, 'loss/train': 1.7344557046890259} -11/06/2021 22:29:58 - INFO - __main__ - Step 8984: {'lr': 0.0004972585830751511, 'samples': 1724928, 'steps': 8983, 'loss/train': 1.725408673286438} -11/06/2021 22:29:59 - INFO - __main__ - Step 8985: {'lr': 0.0004972577992887689, 'samples': 1725120, 'steps': 8984, 'loss/train': 1.803905725479126} -11/06/2021 22:29:59 - INFO - __main__ - Step 8986: {'lr': 0.0004972570153909763, 'samples': 1725312, 'steps': 8985, 'loss/train': 2.232513427734375} -11/06/2021 22:29:59 - INFO - __main__ - Step 8987: {'lr': 0.0004972562313817735, 'samples': 1725504, 'steps': 8986, 'loss/train': 0.8127360343933105} -11/06/2021 22:30:00 - INFO - __main__ - Step 8988: {'lr': 0.0004972554472611609, 'samples': 1725696, 'steps': 8987, 'loss/train': 2.031003713607788} -11/06/2021 22:30:01 - INFO - __main__ - Step 8989: {'lr': 0.0004972546630291387, 'samples': 1725888, 'steps': 8988, 'loss/train': 1.9944013357162476} -11/06/2021 22:30:01 - INFO - __main__ - Step 8990: {'lr': 0.0004972538786857073, 'samples': 1726080, 'steps': 8989, 'loss/train': 2.087233781814575} -11/06/2021 22:30:01 - INFO - __main__ - Step 8991: {'lr': 0.0004972530942308673, 'samples': 1726272, 'steps': 8990, 'loss/train': 2.0797486305236816} -11/06/2021 22:30:02 - INFO - __main__ - Step 8992: {'lr': 0.0004972523096646188, 'samples': 1726464, 'steps': 8991, 'loss/train': 1.4353597164154053} -11/06/2021 22:30:02 - INFO - __main__ - Step 8993: {'lr': 0.0004972515249869622, 'samples': 1726656, 'steps': 8992, 'loss/train': 1.706042766571045} -11/06/2021 22:30:03 - INFO - __main__ - Step 8994: {'lr': 0.000497250740197898, 'samples': 1726848, 'steps': 8993, 'loss/train': 1.5139485597610474} -11/06/2021 22:30:04 - INFO - __main__ - Step 8995: {'lr': 0.0004972499552974263, 'samples': 1727040, 'steps': 8994, 'loss/train': 1.8484820127487183} -11/06/2021 22:30:04 - INFO - __main__ - Step 8996: {'lr': 0.0004972491702855477, 'samples': 1727232, 'steps': 8995, 'loss/train': 1.559495210647583} -11/06/2021 22:30:04 - INFO - __main__ - Step 8997: {'lr': 0.0004972483851622623, 'samples': 1727424, 'steps': 8996, 'loss/train': 2.627495527267456} -11/06/2021 22:30:05 - INFO - __main__ - Step 8998: {'lr': 0.0004972475999275707, 'samples': 1727616, 'steps': 8997, 'loss/train': 1.676787257194519} -11/06/2021 22:30:06 - INFO - __main__ - Step 8999: {'lr': 0.0004972468145814729, 'samples': 1727808, 'steps': 8998, 'loss/train': 1.9144270420074463} -11/06/2021 22:30:06 - INFO - __main__ - Step 9000: {'lr': 0.0004972460291239697, 'samples': 1728000, 'steps': 8999, 'loss/train': 2.2997002601623535} -11/06/2021 22:30:06 - INFO - __main__ - Step 9001: {'lr': 0.0004972452435550613, 'samples': 1728192, 'steps': 9000, 'loss/train': 1.8456697463989258} -11/06/2021 22:30:07 - INFO - __main__ - Step 9002: {'lr': 0.000497244457874748, 'samples': 1728384, 'steps': 9001, 'loss/train': 1.736275315284729} -11/06/2021 22:30:07 - INFO - __main__ - Step 9003: {'lr': 0.0004972436720830301, 'samples': 1728576, 'steps': 9002, 'loss/train': 1.504355549812317} -11/06/2021 22:30:08 - INFO - __main__ - Step 9004: {'lr': 0.000497242886179908, 'samples': 1728768, 'steps': 9003, 'loss/train': 1.5996493101119995} -11/06/2021 22:30:08 - INFO - __main__ - Step 9005: {'lr': 0.0004972421001653822, 'samples': 1728960, 'steps': 9004, 'loss/train': 1.5102970600128174} -11/06/2021 22:30:09 - INFO - __main__ - Step 9006: {'lr': 0.0004972413140394528, 'samples': 1729152, 'steps': 9005, 'loss/train': 2.118058204650879} -11/06/2021 22:30:09 - INFO - __main__ - Step 9007: {'lr': 0.0004972405278021203, 'samples': 1729344, 'steps': 9006, 'loss/train': 2.190336227416992} -11/06/2021 22:30:09 - INFO - __main__ - Step 9008: {'lr': 0.000497239741453385, 'samples': 1729536, 'steps': 9007, 'loss/train': 1.8450963497161865} -11/06/2021 22:30:10 - INFO - __main__ - Step 9009: {'lr': 0.0004972389549932473, 'samples': 1729728, 'steps': 9008, 'loss/train': 2.0399389266967773} -11/06/2021 22:30:11 - INFO - __main__ - Step 9010: {'lr': 0.0004972381684217077, 'samples': 1729920, 'steps': 9009, 'loss/train': 1.8316234350204468} -11/06/2021 22:30:11 - INFO - __main__ - Step 9011: {'lr': 0.0004972373817387662, 'samples': 1730112, 'steps': 9010, 'loss/train': 0.9349846839904785} -11/06/2021 22:30:11 - INFO - __main__ - Step 9012: {'lr': 0.0004972365949444234, 'samples': 1730304, 'steps': 9011, 'loss/train': 1.6661643981933594} -11/06/2021 22:30:12 - INFO - __main__ - Step 9013: {'lr': 0.0004972358080386796, 'samples': 1730496, 'steps': 9012, 'loss/train': 1.3828058242797852} -11/06/2021 22:30:12 - INFO - __main__ - Step 9014: {'lr': 0.0004972350210215353, 'samples': 1730688, 'steps': 9013, 'loss/train': 1.3896691799163818} -11/06/2021 22:30:13 - INFO - __main__ - Step 9015: {'lr': 0.0004972342338929906, 'samples': 1730880, 'steps': 9014, 'loss/train': 1.6471271514892578} -11/06/2021 22:30:13 - INFO - __main__ - Step 9016: {'lr': 0.000497233446653046, 'samples': 1731072, 'steps': 9015, 'loss/train': 1.893143892288208} -11/06/2021 22:30:14 - INFO - __main__ - Step 9017: {'lr': 0.0004972326593017017, 'samples': 1731264, 'steps': 9016, 'loss/train': 1.5417567491531372} -11/06/2021 22:30:14 - INFO - __main__ - Step 9018: {'lr': 0.0004972318718389583, 'samples': 1731456, 'steps': 9017, 'loss/train': 2.1753854751586914} -11/06/2021 22:30:14 - INFO - __main__ - Step 9019: {'lr': 0.000497231084264816, 'samples': 1731648, 'steps': 9018, 'loss/train': 1.7801073789596558} -11/06/2021 22:30:16 - INFO - __main__ - Step 9020: {'lr': 0.0004972302965792752, 'samples': 1731840, 'steps': 9019, 'loss/train': 1.927689790725708} -11/06/2021 22:30:16 - INFO - __main__ - Step 9021: {'lr': 0.0004972295087823362, 'samples': 1732032, 'steps': 9020, 'loss/train': 1.54207444190979} -11/06/2021 22:30:16 - INFO - __main__ - Step 9022: {'lr': 0.0004972287208739995, 'samples': 1732224, 'steps': 9021, 'loss/train': 1.5854400396347046} -11/06/2021 22:30:17 - INFO - __main__ - Step 9023: {'lr': 0.0004972279328542652, 'samples': 1732416, 'steps': 9022, 'loss/train': 2.2019128799438477} -11/06/2021 22:30:17 - INFO - __main__ - Step 9024: {'lr': 0.000497227144723134, 'samples': 1732608, 'steps': 9023, 'loss/train': 1.814888596534729} -11/06/2021 22:30:18 - INFO - __main__ - Step 9025: {'lr': 0.0004972263564806059, 'samples': 1732800, 'steps': 9024, 'loss/train': 2.2460262775421143} -11/06/2021 22:30:18 - INFO - __main__ - Step 9026: {'lr': 0.0004972255681266816, 'samples': 1732992, 'steps': 9025, 'loss/train': 2.0175039768218994} -11/06/2021 22:30:19 - INFO - __main__ - Step 9027: {'lr': 0.0004972247796613611, 'samples': 1733184, 'steps': 9026, 'loss/train': 1.2223052978515625} -11/06/2021 22:30:19 - INFO - __main__ - Step 9028: {'lr': 0.000497223991084645, 'samples': 1733376, 'steps': 9027, 'loss/train': 1.550275206565857} -11/06/2021 22:30:19 - INFO - __main__ - Step 9029: {'lr': 0.0004972232023965335, 'samples': 1733568, 'steps': 9028, 'loss/train': 1.8038307428359985} -11/06/2021 22:30:20 - INFO - __main__ - Step 9030: {'lr': 0.0004972224135970271, 'samples': 1733760, 'steps': 9029, 'loss/train': 1.7093403339385986} -11/06/2021 22:30:21 - INFO - __main__ - Step 9031: {'lr': 0.0004972216246861262, 'samples': 1733952, 'steps': 9030, 'loss/train': 2.1160690784454346} -11/06/2021 22:30:21 - INFO - __main__ - Step 9032: {'lr': 0.0004972208356638309, 'samples': 1734144, 'steps': 9031, 'loss/train': 0.9576528072357178} -11/06/2021 22:30:21 - INFO - __main__ - Step 9033: {'lr': 0.0004972200465301418, 'samples': 1734336, 'steps': 9032, 'loss/train': 2.587282657623291} -11/06/2021 22:30:22 - INFO - __main__ - Step 9034: {'lr': 0.0004972192572850592, 'samples': 1734528, 'steps': 9033, 'loss/train': 1.5511127710342407} -11/06/2021 22:30:22 - INFO - __main__ - Step 9035: {'lr': 0.0004972184679285833, 'samples': 1734720, 'steps': 9034, 'loss/train': 1.6166201829910278} -11/06/2021 22:30:23 - INFO - __main__ - Step 9036: {'lr': 0.0004972176784607146, 'samples': 1734912, 'steps': 9035, 'loss/train': 1.4050244092941284} -11/06/2021 22:30:24 - INFO - __main__ - Step 9037: {'lr': 0.0004972168888814533, 'samples': 1735104, 'steps': 9036, 'loss/train': 2.019019842147827} -11/06/2021 22:30:24 - INFO - __main__ - Step 9038: {'lr': 0.0004972160991908001, 'samples': 1735296, 'steps': 9037, 'loss/train': 1.9093737602233887} -11/06/2021 22:30:24 - INFO - __main__ - Step 9039: {'lr': 0.0004972153093887551, 'samples': 1735488, 'steps': 9038, 'loss/train': 1.671932578086853} -11/06/2021 22:30:25 - INFO - __main__ - Step 9040: {'lr': 0.0004972145194753186, 'samples': 1735680, 'steps': 9039, 'loss/train': 1.3389232158660889} -11/06/2021 22:30:26 - INFO - __main__ - Step 9041: {'lr': 0.0004972137294504912, 'samples': 1735872, 'steps': 9040, 'loss/train': 2.4330387115478516} -11/06/2021 22:30:26 - INFO - __main__ - Step 9042: {'lr': 0.000497212939314273, 'samples': 1736064, 'steps': 9041, 'loss/train': 1.3045024871826172} -11/06/2021 22:30:26 - INFO - __main__ - Step 9043: {'lr': 0.0004972121490666644, 'samples': 1736256, 'steps': 9042, 'loss/train': 1.6939752101898193} -11/06/2021 22:30:27 - INFO - __main__ - Step 9044: {'lr': 0.000497211358707666, 'samples': 1736448, 'steps': 9043, 'loss/train': 1.862133502960205} -11/06/2021 22:30:27 - INFO - __main__ - Step 9045: {'lr': 0.0004972105682372779, 'samples': 1736640, 'steps': 9044, 'loss/train': 2.044528007507324} -11/06/2021 22:30:29 - INFO - __main__ - Step 9046: {'lr': 0.0004972097776555005, 'samples': 1736832, 'steps': 9045, 'loss/train': 1.8090245723724365} -11/06/2021 22:30:29 - INFO - __main__ - Step 9047: {'lr': 0.0004972089869623342, 'samples': 1737024, 'steps': 9046, 'loss/train': 1.5942614078521729} -11/06/2021 22:30:29 - INFO - __main__ - Step 9048: {'lr': 0.0004972081961577793, 'samples': 1737216, 'steps': 9047, 'loss/train': 2.0264124870300293} -11/06/2021 22:30:30 - INFO - __main__ - Step 9049: {'lr': 0.0004972074052418363, 'samples': 1737408, 'steps': 9048, 'loss/train': 1.723054051399231} -11/06/2021 22:30:30 - INFO - __main__ - Step 9050: {'lr': 0.0004972066142145055, 'samples': 1737600, 'steps': 9049, 'loss/train': 1.216286540031433} -11/06/2021 22:30:30 - INFO - __main__ - Step 9051: {'lr': 0.0004972058230757871, 'samples': 1737792, 'steps': 9050, 'loss/train': 1.870058536529541} -11/06/2021 22:30:31 - INFO - __main__ - Step 9052: {'lr': 0.0004972050318256815, 'samples': 1737984, 'steps': 9051, 'loss/train': 0.3041784465312958} -11/06/2021 22:30:32 - INFO - __main__ - Step 9053: {'lr': 0.0004972042404641893, 'samples': 1738176, 'steps': 9052, 'loss/train': 1.6829752922058105} -11/06/2021 22:30:32 - INFO - __main__ - Step 9054: {'lr': 0.0004972034489913106, 'samples': 1738368, 'steps': 9053, 'loss/train': 1.7771741151809692} -11/06/2021 22:30:32 - INFO - __main__ - Step 9055: {'lr': 0.0004972026574070459, 'samples': 1738560, 'steps': 9054, 'loss/train': 2.233604907989502} -11/06/2021 22:30:33 - INFO - __main__ - Step 9056: {'lr': 0.0004972018657113953, 'samples': 1738752, 'steps': 9055, 'loss/train': 2.35441517829895} -11/06/2021 22:30:34 - INFO - __main__ - Step 9057: {'lr': 0.0004972010739043596, 'samples': 1738944, 'steps': 9056, 'loss/train': 1.8315443992614746} -11/06/2021 22:30:34 - INFO - __main__ - Step 9058: {'lr': 0.0004972002819859388, 'samples': 1739136, 'steps': 9057, 'loss/train': 1.4996757507324219} -11/06/2021 22:30:34 - INFO - __main__ - Step 9059: {'lr': 0.0004971994899561334, 'samples': 1739328, 'steps': 9058, 'loss/train': 2.07483172416687} -11/06/2021 22:30:35 - INFO - __main__ - Step 9060: {'lr': 0.0004971986978149437, 'samples': 1739520, 'steps': 9059, 'loss/train': 1.568691372871399} -11/06/2021 22:30:35 - INFO - __main__ - Step 9061: {'lr': 0.0004971979055623701, 'samples': 1739712, 'steps': 9060, 'loss/train': 1.295201063156128} -11/06/2021 22:30:36 - INFO - __main__ - Step 9062: {'lr': 0.0004971971131984129, 'samples': 1739904, 'steps': 9061, 'loss/train': 2.6647539138793945} -11/06/2021 22:30:37 - INFO - __main__ - Step 9063: {'lr': 0.0004971963207230725, 'samples': 1740096, 'steps': 9062, 'loss/train': 1.6942551136016846} -11/06/2021 22:30:37 - INFO - __main__ - Step 9064: {'lr': 0.0004971955281363493, 'samples': 1740288, 'steps': 9063, 'loss/train': 1.9272085428237915} -11/06/2021 22:30:37 - INFO - __main__ - Step 9065: {'lr': 0.0004971947354382436, 'samples': 1740480, 'steps': 9064, 'loss/train': 1.482258677482605} -11/06/2021 22:30:38 - INFO - __main__ - Step 9066: {'lr': 0.0004971939426287557, 'samples': 1740672, 'steps': 9065, 'loss/train': 2.1765670776367188} -11/06/2021 22:30:39 - INFO - __main__ - Step 9067: {'lr': 0.0004971931497078861, 'samples': 1740864, 'steps': 9066, 'loss/train': 1.9422248601913452} -11/06/2021 22:30:39 - INFO - __main__ - Step 9068: {'lr': 0.000497192356675635, 'samples': 1741056, 'steps': 9067, 'loss/train': 0.8091076612472534} -11/06/2021 22:30:39 - INFO - __main__ - Step 9069: {'lr': 0.0004971915635320029, 'samples': 1741248, 'steps': 9068, 'loss/train': 2.0615551471710205} -11/06/2021 22:30:40 - INFO - __main__ - Step 9070: {'lr': 0.0004971907702769901, 'samples': 1741440, 'steps': 9069, 'loss/train': 1.8505113124847412} -11/06/2021 22:30:40 - INFO - __main__ - Step 9071: {'lr': 0.000497189976910597, 'samples': 1741632, 'steps': 9070, 'loss/train': 2.2380783557891846} -11/06/2021 22:30:41 - INFO - __main__ - Step 9072: {'lr': 0.0004971891834328238, 'samples': 1741824, 'steps': 9071, 'loss/train': 0.3026748597621918} -11/06/2021 22:30:41 - INFO - __main__ - Step 9073: {'lr': 0.000497188389843671, 'samples': 1742016, 'steps': 9072, 'loss/train': 1.1784673929214478} -11/06/2021 22:30:42 - INFO - __main__ - Step 9074: {'lr': 0.0004971875961431389, 'samples': 1742208, 'steps': 9073, 'loss/train': 1.7177537679672241} -11/06/2021 22:30:42 - INFO - __main__ - Step 9075: {'lr': 0.000497186802331228, 'samples': 1742400, 'steps': 9074, 'loss/train': 2.291787624359131} -11/06/2021 22:30:43 - INFO - __main__ - Step 9076: {'lr': 0.0004971860084079385, 'samples': 1742592, 'steps': 9075, 'loss/train': 1.1271553039550781} -11/06/2021 22:30:43 - INFO - __main__ - Step 9077: {'lr': 0.0004971852143732707, 'samples': 1742784, 'steps': 9076, 'loss/train': 1.6700618267059326} -11/06/2021 22:30:44 - INFO - __main__ - Step 9078: {'lr': 0.0004971844202272251, 'samples': 1742976, 'steps': 9077, 'loss/train': 1.7252506017684937} -11/06/2021 22:30:44 - INFO - __main__ - Step 9079: {'lr': 0.000497183625969802, 'samples': 1743168, 'steps': 9078, 'loss/train': 1.921452283859253} -11/06/2021 22:30:45 - INFO - __main__ - Step 9080: {'lr': 0.0004971828316010019, 'samples': 1743360, 'steps': 9079, 'loss/train': 1.8389270305633545} -11/06/2021 22:30:45 - INFO - __main__ - Step 9081: {'lr': 0.0004971820371208248, 'samples': 1743552, 'steps': 9080, 'loss/train': 1.7379286289215088} -11/06/2021 22:30:45 - INFO - __main__ - Step 9082: {'lr': 0.0004971812425292716, 'samples': 1743744, 'steps': 9081, 'loss/train': 2.1627986431121826} -11/06/2021 22:30:46 - INFO - __main__ - Step 9083: {'lr': 0.000497180447826342, 'samples': 1743936, 'steps': 9082, 'loss/train': 1.5003117322921753} -11/06/2021 22:30:47 - INFO - __main__ - Step 9084: {'lr': 0.0004971796530120371, 'samples': 1744128, 'steps': 9083, 'loss/train': 1.885785460472107} -11/06/2021 22:30:47 - INFO - __main__ - Step 9085: {'lr': 0.0004971788580863566, 'samples': 1744320, 'steps': 9084, 'loss/train': 1.6980434656143188} -11/06/2021 22:30:47 - INFO - __main__ - Step 9086: {'lr': 0.0004971780630493012, 'samples': 1744512, 'steps': 9085, 'loss/train': 1.8362492322921753} -11/06/2021 22:30:48 - INFO - __main__ - Step 9087: {'lr': 0.000497177267900871, 'samples': 1744704, 'steps': 9086, 'loss/train': 1.9315646886825562} -11/06/2021 22:30:49 - INFO - __main__ - Step 9088: {'lr': 0.0004971764726410668, 'samples': 1744896, 'steps': 9087, 'loss/train': 1.8160526752471924} -11/06/2021 22:30:49 - INFO - __main__ - Step 9089: {'lr': 0.0004971756772698886, 'samples': 1745088, 'steps': 9088, 'loss/train': 1.7330033779144287} -11/06/2021 22:30:50 - INFO - __main__ - Step 9090: {'lr': 0.0004971748817873367, 'samples': 1745280, 'steps': 9089, 'loss/train': 1.8694642782211304} -11/06/2021 22:30:50 - INFO - __main__ - Step 9091: {'lr': 0.0004971740861934117, 'samples': 1745472, 'steps': 9090, 'loss/train': 1.788362741470337} -11/06/2021 22:30:50 - INFO - __main__ - Step 9092: {'lr': 0.000497173290488114, 'samples': 1745664, 'steps': 9091, 'loss/train': 1.6177334785461426} -11/06/2021 22:30:52 - INFO - __main__ - Step 9093: {'lr': 0.0004971724946714437, 'samples': 1745856, 'steps': 9092, 'loss/train': 1.626973032951355} -11/06/2021 22:30:52 - INFO - __main__ - Step 9094: {'lr': 0.0004971716987434014, 'samples': 1746048, 'steps': 9093, 'loss/train': 1.3091498613357544} -11/06/2021 22:30:52 - INFO - __main__ - Step 9095: {'lr': 0.0004971709027039872, 'samples': 1746240, 'steps': 9094, 'loss/train': 1.3420382738113403} -11/06/2021 22:30:53 - INFO - __main__ - Step 9096: {'lr': 0.0004971701065532017, 'samples': 1746432, 'steps': 9095, 'loss/train': 1.4940237998962402} -11/06/2021 22:30:53 - INFO - __main__ - Step 9097: {'lr': 0.0004971693102910451, 'samples': 1746624, 'steps': 9096, 'loss/train': 2.1180343627929688} -11/06/2021 22:30:53 - INFO - __main__ - Step 9098: {'lr': 0.0004971685139175179, 'samples': 1746816, 'steps': 9097, 'loss/train': 2.4166030883789062} -11/06/2021 22:30:54 - INFO - __main__ - Step 9099: {'lr': 0.0004971677174326204, 'samples': 1747008, 'steps': 9098, 'loss/train': 5.840542316436768} -11/06/2021 22:30:55 - INFO - __main__ - Step 9100: {'lr': 0.0004971669208363529, 'samples': 1747200, 'steps': 9099, 'loss/train': 5.970412731170654} -11/06/2021 22:30:55 - INFO - __main__ - Step 9101: {'lr': 0.0004971661241287157, 'samples': 1747392, 'steps': 9100, 'loss/train': 2.0452849864959717} -11/06/2021 22:30:55 - INFO - __main__ - Step 9102: {'lr': 0.0004971653273097094, 'samples': 1747584, 'steps': 9101, 'loss/train': 1.074893593788147} -11/06/2021 22:30:56 - INFO - __main__ - Step 9103: {'lr': 0.0004971645303793342, 'samples': 1747776, 'steps': 9102, 'loss/train': 1.511845588684082} -11/06/2021 22:30:56 - INFO - __main__ - Step 9104: {'lr': 0.0004971637333375904, 'samples': 1747968, 'steps': 9103, 'loss/train': 1.4513171911239624} -11/06/2021 22:30:57 - INFO - __main__ - Step 9105: {'lr': 0.0004971629361844785, 'samples': 1748160, 'steps': 9104, 'loss/train': 1.3599135875701904} -11/06/2021 22:30:58 - INFO - __main__ - Step 9106: {'lr': 0.0004971621389199988, 'samples': 1748352, 'steps': 9105, 'loss/train': 1.6643626689910889} -11/06/2021 22:30:58 - INFO - __main__ - Step 9107: {'lr': 0.0004971613415441516, 'samples': 1748544, 'steps': 9106, 'loss/train': 1.0446491241455078} -11/06/2021 22:30:58 - INFO - __main__ - Step 9108: {'lr': 0.0004971605440569374, 'samples': 1748736, 'steps': 9107, 'loss/train': 1.783698558807373} -11/06/2021 22:30:59 - INFO - __main__ - Step 9109: {'lr': 0.0004971597464583563, 'samples': 1748928, 'steps': 9108, 'loss/train': 1.7281625270843506} -11/06/2021 22:31:00 - INFO - __main__ - Step 9110: {'lr': 0.0004971589487484091, 'samples': 1749120, 'steps': 9109, 'loss/train': 1.642425537109375} -11/06/2021 22:31:00 - INFO - __main__ - Step 9111: {'lr': 0.0004971581509270956, 'samples': 1749312, 'steps': 9110, 'loss/train': 1.2902659177780151} -11/06/2021 22:31:01 - INFO - __main__ - Step 9112: {'lr': 0.0004971573529944167, 'samples': 1749504, 'steps': 9111, 'loss/train': 2.028707981109619} -11/06/2021 22:31:01 - INFO - __main__ - Step 9113: {'lr': 0.0004971565549503723, 'samples': 1749696, 'steps': 9112, 'loss/train': 2.295679807662964} -11/06/2021 22:31:01 - INFO - __main__ - Step 9114: {'lr': 0.0004971557567949631, 'samples': 1749888, 'steps': 9113, 'loss/train': 1.6835025548934937} -11/06/2021 22:31:02 - INFO - __main__ - Step 9115: {'lr': 0.0004971549585281893, 'samples': 1750080, 'steps': 9114, 'loss/train': 1.3464192152023315} -11/06/2021 22:31:03 - INFO - __main__ - Step 9116: {'lr': 0.0004971541601500513, 'samples': 1750272, 'steps': 9115, 'loss/train': 1.7078288793563843} -11/06/2021 22:31:03 - INFO - __main__ - Step 9117: {'lr': 0.0004971533616605495, 'samples': 1750464, 'steps': 9116, 'loss/train': 1.4062687158584595} -11/06/2021 22:31:03 - INFO - __main__ - Step 9118: {'lr': 0.0004971525630596841, 'samples': 1750656, 'steps': 9117, 'loss/train': 1.889479637145996} -11/06/2021 22:31:04 - INFO - __main__ - Step 9119: {'lr': 0.0004971517643474556, 'samples': 1750848, 'steps': 9118, 'loss/train': 2.2042081356048584} -11/06/2021 22:31:04 - INFO - __main__ - Step 9120: {'lr': 0.0004971509655238643, 'samples': 1751040, 'steps': 9119, 'loss/train': 1.9173781871795654} -11/06/2021 22:31:05 - INFO - __main__ - Step 9121: {'lr': 0.0004971501665889107, 'samples': 1751232, 'steps': 9120, 'loss/train': 1.5485329627990723} -11/06/2021 22:31:05 - INFO - __main__ - Step 9122: {'lr': 0.000497149367542595, 'samples': 1751424, 'steps': 9121, 'loss/train': 2.2474119663238525} -11/06/2021 22:31:06 - INFO - __main__ - Step 9123: {'lr': 0.0004971485683849176, 'samples': 1751616, 'steps': 9122, 'loss/train': 1.9738703966140747} -11/06/2021 22:31:06 - INFO - __main__ - Step 9124: {'lr': 0.0004971477691158788, 'samples': 1751808, 'steps': 9123, 'loss/train': 1.9322994947433472} -11/06/2021 22:31:06 - INFO - __main__ - Step 9125: {'lr': 0.0004971469697354792, 'samples': 1752000, 'steps': 9124, 'loss/train': 2.1170740127563477} -11/06/2021 22:31:08 - INFO - __main__ - Step 9126: {'lr': 0.0004971461702437188, 'samples': 1752192, 'steps': 9125, 'loss/train': 1.9848999977111816} -11/06/2021 22:31:08 - INFO - __main__ - Step 9127: {'lr': 0.0004971453706405981, 'samples': 1752384, 'steps': 9126, 'loss/train': 1.6258814334869385} -11/06/2021 22:31:08 - INFO - __main__ - Step 9128: {'lr': 0.0004971445709261177, 'samples': 1752576, 'steps': 9127, 'loss/train': 1.3074932098388672} -11/06/2021 22:31:09 - INFO - __main__ - Step 9129: {'lr': 0.0004971437711002777, 'samples': 1752768, 'steps': 9128, 'loss/train': 1.880787968635559} -11/06/2021 22:31:09 - INFO - __main__ - Step 9130: {'lr': 0.0004971429711630786, 'samples': 1752960, 'steps': 9129, 'loss/train': 1.60108482837677} -11/06/2021 22:31:10 - INFO - __main__ - Step 9131: {'lr': 0.0004971421711145207, 'samples': 1753152, 'steps': 9130, 'loss/train': 1.9594632387161255} -11/06/2021 22:31:10 - INFO - __main__ - Step 9132: {'lr': 0.0004971413709546043, 'samples': 1753344, 'steps': 9131, 'loss/train': 1.4151302576065063} -11/06/2021 22:31:11 - INFO - __main__ - Step 9133: {'lr': 0.0004971405706833297, 'samples': 1753536, 'steps': 9132, 'loss/train': 2.054569721221924} -11/06/2021 22:31:11 - INFO - __main__ - Step 9134: {'lr': 0.0004971397703006974, 'samples': 1753728, 'steps': 9133, 'loss/train': 2.073517322540283} -11/06/2021 22:31:11 - INFO - __main__ - Step 9135: {'lr': 0.0004971389698067079, 'samples': 1753920, 'steps': 9134, 'loss/train': 2.4211151599884033} -11/06/2021 22:31:12 - INFO - __main__ - Step 9136: {'lr': 0.0004971381692013612, 'samples': 1754112, 'steps': 9135, 'loss/train': 1.4416491985321045} -11/06/2021 22:31:13 - INFO - __main__ - Step 9137: {'lr': 0.000497137368484658, 'samples': 1754304, 'steps': 9136, 'loss/train': 1.7312275171279907} -11/06/2021 22:31:13 - INFO - __main__ - Step 9138: {'lr': 0.0004971365676565984, 'samples': 1754496, 'steps': 9137, 'loss/train': 1.9141130447387695} -11/06/2021 22:31:13 - INFO - __main__ - Step 9139: {'lr': 0.000497135766717183, 'samples': 1754688, 'steps': 9138, 'loss/train': 1.8034145832061768} -11/06/2021 22:31:14 - INFO - __main__ - Step 9140: {'lr': 0.000497134965666412, 'samples': 1754880, 'steps': 9139, 'loss/train': 1.8870742321014404} -11/06/2021 22:31:14 - INFO - __main__ - Step 9141: {'lr': 0.0004971341645042857, 'samples': 1755072, 'steps': 9140, 'loss/train': 1.999513030052185} -11/06/2021 22:31:15 - INFO - __main__ - Step 9142: {'lr': 0.0004971333632308047, 'samples': 1755264, 'steps': 9141, 'loss/train': 2.0353739261627197} -11/06/2021 22:31:15 - INFO - __main__ - Step 9143: {'lr': 0.0004971325618459691, 'samples': 1755456, 'steps': 9142, 'loss/train': 2.1731367111206055} -11/06/2021 22:31:16 - INFO - __main__ - Step 9144: {'lr': 0.0004971317603497795, 'samples': 1755648, 'steps': 9143, 'loss/train': 1.4460906982421875} -11/06/2021 22:31:16 - INFO - __main__ - Step 9145: {'lr': 0.000497130958742236, 'samples': 1755840, 'steps': 9144, 'loss/train': 1.5800894498825073} -11/06/2021 22:31:17 - INFO - __main__ - Step 9146: {'lr': 0.0004971301570233392, 'samples': 1756032, 'steps': 9145, 'loss/train': 2.155123472213745} -11/06/2021 22:31:18 - INFO - __main__ - Step 9147: {'lr': 0.0004971293551930894, 'samples': 1756224, 'steps': 9146, 'loss/train': 1.0763784646987915} -11/06/2021 22:31:18 - INFO - __main__ - Step 9148: {'lr': 0.0004971285532514868, 'samples': 1756416, 'steps': 9147, 'loss/train': 1.7974958419799805} -11/06/2021 22:31:18 - INFO - __main__ - Step 9149: {'lr': 0.000497127751198532, 'samples': 1756608, 'steps': 9148, 'loss/train': 1.7774125337600708} -11/06/2021 22:31:19 - INFO - __main__ - Step 9150: {'lr': 0.0004971269490342252, 'samples': 1756800, 'steps': 9149, 'loss/train': 1.6433255672454834} -11/06/2021 22:31:19 - INFO - __main__ - Step 9151: {'lr': 0.0004971261467585669, 'samples': 1756992, 'steps': 9150, 'loss/train': 2.028750419616699} -11/06/2021 22:31:20 - INFO - __main__ - Step 9152: {'lr': 0.0004971253443715572, 'samples': 1757184, 'steps': 9151, 'loss/train': 1.2226204872131348} -11/06/2021 22:31:20 - INFO - __main__ - Step 9153: {'lr': 0.0004971245418731966, 'samples': 1757376, 'steps': 9152, 'loss/train': 2.202749490737915} -11/06/2021 22:31:21 - INFO - __main__ - Step 9154: {'lr': 0.0004971237392634857, 'samples': 1757568, 'steps': 9153, 'loss/train': 1.7844159603118896} -11/06/2021 22:31:21 - INFO - __main__ - Step 9155: {'lr': 0.0004971229365424246, 'samples': 1757760, 'steps': 9154, 'loss/train': 1.973191738128662} -11/06/2021 22:31:21 - INFO - __main__ - Step 9156: {'lr': 0.0004971221337100137, 'samples': 1757952, 'steps': 9155, 'loss/train': 1.785252332687378} -11/06/2021 22:31:23 - INFO - __main__ - Step 9157: {'lr': 0.0004971213307662534, 'samples': 1758144, 'steps': 9156, 'loss/train': 2.1560020446777344} -11/06/2021 22:31:23 - INFO - __main__ - Step 9158: {'lr': 0.000497120527711144, 'samples': 1758336, 'steps': 9157, 'loss/train': 1.1199406385421753} -11/06/2021 22:31:23 - INFO - __main__ - Step 9159: {'lr': 0.0004971197245446859, 'samples': 1758528, 'steps': 9158, 'loss/train': 2.273866891860962} -11/06/2021 22:31:24 - INFO - __main__ - Step 9160: {'lr': 0.0004971189212668794, 'samples': 1758720, 'steps': 9159, 'loss/train': 2.1585633754730225} -11/06/2021 22:31:24 - INFO - __main__ - Step 9161: {'lr': 0.0004971181178777251, 'samples': 1758912, 'steps': 9160, 'loss/train': 2.7556064128875732} -11/06/2021 22:31:24 - INFO - __main__ - Step 9162: {'lr': 0.0004971173143772231, 'samples': 1759104, 'steps': 9161, 'loss/train': 1.7603553533554077} -11/06/2021 22:31:25 - INFO - __main__ - Step 9163: {'lr': 0.0004971165107653738, 'samples': 1759296, 'steps': 9162, 'loss/train': 1.7750883102416992} -11/06/2021 22:31:26 - INFO - __main__ - Step 9164: {'lr': 0.0004971157070421776, 'samples': 1759488, 'steps': 9163, 'loss/train': 2.1838340759277344} -11/06/2021 22:31:26 - INFO - __main__ - Step 9165: {'lr': 0.000497114903207635, 'samples': 1759680, 'steps': 9164, 'loss/train': 2.311770439147949} -11/06/2021 22:31:26 - INFO - __main__ - Step 9166: {'lr': 0.0004971140992617462, 'samples': 1759872, 'steps': 9165, 'loss/train': 1.977513074874878} -11/06/2021 22:31:27 - INFO - __main__ - Step 9167: {'lr': 0.0004971132952045115, 'samples': 1760064, 'steps': 9166, 'loss/train': 1.9859895706176758} -11/06/2021 22:31:28 - INFO - __main__ - Step 9168: {'lr': 0.0004971124910359315, 'samples': 1760256, 'steps': 9167, 'loss/train': 1.7666734457015991} -11/06/2021 22:31:28 - INFO - __main__ - Step 9169: {'lr': 0.0004971116867560064, 'samples': 1760448, 'steps': 9168, 'loss/train': 1.7961926460266113} -11/06/2021 22:31:28 - INFO - __main__ - Step 9170: {'lr': 0.0004971108823647365, 'samples': 1760640, 'steps': 9169, 'loss/train': 1.904386281967163} -11/06/2021 22:31:29 - INFO - __main__ - Step 9171: {'lr': 0.0004971100778621223, 'samples': 1760832, 'steps': 9170, 'loss/train': 1.477123498916626} -11/06/2021 22:31:29 - INFO - __main__ - Step 9172: {'lr': 0.0004971092732481641, 'samples': 1761024, 'steps': 9171, 'loss/train': 1.5037059783935547} -11/06/2021 22:31:30 - INFO - __main__ - Step 9173: {'lr': 0.0004971084685228623, 'samples': 1761216, 'steps': 9172, 'loss/train': 1.8202991485595703} -11/06/2021 22:31:30 - INFO - __main__ - Step 9174: {'lr': 0.0004971076636862172, 'samples': 1761408, 'steps': 9173, 'loss/train': 1.7181813716888428} -11/06/2021 22:31:31 - INFO - __main__ - Step 9175: {'lr': 0.0004971068587382293, 'samples': 1761600, 'steps': 9174, 'loss/train': 1.4500627517700195} -11/06/2021 22:31:31 - INFO - __main__ - Step 9176: {'lr': 0.0004971060536788988, 'samples': 1761792, 'steps': 9175, 'loss/train': 1.9381426572799683} -11/06/2021 22:31:31 - INFO - __main__ - Step 9177: {'lr': 0.000497105248508226, 'samples': 1761984, 'steps': 9176, 'loss/train': 1.841038465499878} -11/06/2021 22:31:33 - INFO - __main__ - Step 9178: {'lr': 0.0004971044432262115, 'samples': 1762176, 'steps': 9177, 'loss/train': 1.351794958114624} -11/06/2021 22:31:33 - INFO - __main__ - Step 9179: {'lr': 0.0004971036378328556, 'samples': 1762368, 'steps': 9178, 'loss/train': 1.7219154834747314} -11/06/2021 22:31:33 - INFO - __main__ - Step 9180: {'lr': 0.0004971028323281586, 'samples': 1762560, 'steps': 9179, 'loss/train': 2.6767475605010986} -11/06/2021 22:31:34 - INFO - __main__ - Step 9181: {'lr': 0.0004971020267121208, 'samples': 1762752, 'steps': 9180, 'loss/train': 2.2747514247894287} -11/06/2021 22:31:34 - INFO - __main__ - Step 9182: {'lr': 0.0004971012209847427, 'samples': 1762944, 'steps': 9181, 'loss/train': 1.0986586809158325} -11/06/2021 22:31:35 - INFO - __main__ - Step 9183: {'lr': 0.0004971004151460245, 'samples': 1763136, 'steps': 9182, 'loss/train': 1.2503761053085327} -11/06/2021 22:31:35 - INFO - __main__ - Step 9184: {'lr': 0.0004970996091959668, 'samples': 1763328, 'steps': 9183, 'loss/train': 1.487623691558838} -11/06/2021 22:31:36 - INFO - __main__ - Step 9185: {'lr': 0.0004970988031345698, 'samples': 1763520, 'steps': 9184, 'loss/train': 1.718331217765808} -11/06/2021 22:31:36 - INFO - __main__ - Step 9186: {'lr': 0.0004970979969618338, 'samples': 1763712, 'steps': 9185, 'loss/train': 1.1969623565673828} -11/06/2021 22:31:36 - INFO - __main__ - Step 9187: {'lr': 0.0004970971906777593, 'samples': 1763904, 'steps': 9186, 'loss/train': 1.9592634439468384} -11/06/2021 22:31:37 - INFO - __main__ - Step 9188: {'lr': 0.0004970963842823468, 'samples': 1764096, 'steps': 9187, 'loss/train': 1.1920486688613892} -11/06/2021 22:31:38 - INFO - __main__ - Step 9189: {'lr': 0.0004970955777755963, 'samples': 1764288, 'steps': 9188, 'loss/train': 1.6599271297454834} -11/06/2021 22:31:39 - INFO - __main__ - Step 9190: {'lr': 0.0004970947711575083, 'samples': 1764480, 'steps': 9189, 'loss/train': 1.8432694673538208} -11/06/2021 22:31:39 - INFO - __main__ - Step 9191: {'lr': 0.0004970939644280833, 'samples': 1764672, 'steps': 9190, 'loss/train': 1.6999132633209229} -11/06/2021 22:31:39 - INFO - __main__ - Step 9192: {'lr': 0.0004970931575873215, 'samples': 1764864, 'steps': 9191, 'loss/train': 1.533847451210022} -11/06/2021 22:31:40 - INFO - __main__ - Step 9193: {'lr': 0.0004970923506352234, 'samples': 1765056, 'steps': 9192, 'loss/train': 1.8772602081298828} -11/06/2021 22:31:40 - INFO - __main__ - Step 9194: {'lr': 0.0004970915435717893, 'samples': 1765248, 'steps': 9193, 'loss/train': 1.8430668115615845} -11/06/2021 22:31:41 - INFO - __main__ - Step 9195: {'lr': 0.0004970907363970196, 'samples': 1765440, 'steps': 9194, 'loss/train': 1.7536627054214478} -11/06/2021 22:31:41 - INFO - __main__ - Step 9196: {'lr': 0.0004970899291109145, 'samples': 1765632, 'steps': 9195, 'loss/train': 1.858238697052002} -11/06/2021 22:31:42 - INFO - __main__ - Step 9197: {'lr': 0.0004970891217134746, 'samples': 1765824, 'steps': 9196, 'loss/train': 2.1001169681549072} -11/06/2021 22:31:42 - INFO - __main__ - Step 9198: {'lr': 0.0004970883142047001, 'samples': 1766016, 'steps': 9197, 'loss/train': 2.0097129344940186} -11/06/2021 22:31:43 - INFO - __main__ - Step 9199: {'lr': 0.0004970875065845914, 'samples': 1766208, 'steps': 9198, 'loss/train': 2.0182600021362305} -11/06/2021 22:31:44 - INFO - __main__ - Step 9200: {'lr': 0.000497086698853149, 'samples': 1766400, 'steps': 9199, 'loss/train': 1.785837173461914} -11/06/2021 22:31:44 - INFO - __main__ - Step 9201: {'lr': 0.0004970858910103731, 'samples': 1766592, 'steps': 9200, 'loss/train': 1.773368000984192} -11/06/2021 22:31:44 - INFO - __main__ - Step 9202: {'lr': 0.0004970850830562641, 'samples': 1766784, 'steps': 9201, 'loss/train': 2.1283977031707764} -11/06/2021 22:31:45 - INFO - __main__ - Step 9203: {'lr': 0.0004970842749908223, 'samples': 1766976, 'steps': 9202, 'loss/train': 1.710228443145752} -11/06/2021 22:31:45 - INFO - __main__ - Step 9204: {'lr': 0.0004970834668140482, 'samples': 1767168, 'steps': 9203, 'loss/train': 1.6465903520584106} -11/06/2021 22:31:46 - INFO - __main__ - Step 9205: {'lr': 0.0004970826585259421, 'samples': 1767360, 'steps': 9204, 'loss/train': 1.8432360887527466} -11/06/2021 22:31:46 - INFO - __main__ - Step 9206: {'lr': 0.0004970818501265044, 'samples': 1767552, 'steps': 9205, 'loss/train': 1.9140604734420776} -11/06/2021 22:31:47 - INFO - __main__ - Step 9207: {'lr': 0.0004970810416157354, 'samples': 1767744, 'steps': 9206, 'loss/train': 1.4957774877548218} -11/06/2021 22:31:47 - INFO - __main__ - Step 9208: {'lr': 0.0004970802329936355, 'samples': 1767936, 'steps': 9207, 'loss/train': 1.110896110534668} -11/06/2021 22:31:47 - INFO - __main__ - Step 9209: {'lr': 0.000497079424260205, 'samples': 1768128, 'steps': 9208, 'loss/train': 2.041264057159424} -11/06/2021 22:31:48 - INFO - __main__ - Step 9210: {'lr': 0.0004970786154154444, 'samples': 1768320, 'steps': 9209, 'loss/train': 1.8915854692459106} -11/06/2021 22:31:49 - INFO - __main__ - Step 9211: {'lr': 0.000497077806459354, 'samples': 1768512, 'steps': 9210, 'loss/train': 1.495437502861023} -11/06/2021 22:31:49 - INFO - __main__ - Step 9212: {'lr': 0.0004970769973919341, 'samples': 1768704, 'steps': 9211, 'loss/train': 1.2148029804229736} -11/06/2021 22:31:50 - INFO - __main__ - Step 9213: {'lr': 0.0004970761882131851, 'samples': 1768896, 'steps': 9212, 'loss/train': 3.2807438373565674} -11/06/2021 22:31:50 - INFO - __main__ - Step 9214: {'lr': 0.0004970753789231074, 'samples': 1769088, 'steps': 9213, 'loss/train': 1.3468689918518066} -11/06/2021 22:31:50 - INFO - __main__ - Step 9215: {'lr': 0.0004970745695217014, 'samples': 1769280, 'steps': 9214, 'loss/train': 2.1012730598449707} -11/06/2021 22:31:51 - INFO - __main__ - Step 9216: {'lr': 0.0004970737600089673, 'samples': 1769472, 'steps': 9215, 'loss/train': 2.018321990966797} -11/06/2021 22:31:52 - INFO - __main__ - Step 9217: {'lr': 0.0004970729503849057, 'samples': 1769664, 'steps': 9216, 'loss/train': 0.4318278431892395} -11/06/2021 22:31:52 - INFO - __main__ - Step 9218: {'lr': 0.0004970721406495168, 'samples': 1769856, 'steps': 9217, 'loss/train': 1.8669426441192627} -11/06/2021 22:31:53 - INFO - __main__ - Step 9219: {'lr': 0.000497071330802801, 'samples': 1770048, 'steps': 9218, 'loss/train': 1.9158834218978882} -11/06/2021 22:31:53 - INFO - __main__ - Step 9220: {'lr': 0.0004970705208447587, 'samples': 1770240, 'steps': 9219, 'loss/train': 1.9058424234390259} -11/06/2021 22:31:53 - INFO - __main__ - Step 9221: {'lr': 0.0004970697107753902, 'samples': 1770432, 'steps': 9220, 'loss/train': 2.554187059402466} -11/06/2021 22:31:54 - INFO - __main__ - Step 9222: {'lr': 0.0004970689005946959, 'samples': 1770624, 'steps': 9221, 'loss/train': 1.937746286392212} -11/06/2021 22:31:55 - INFO - __main__ - Step 9223: {'lr': 0.0004970680903026762, 'samples': 1770816, 'steps': 9222, 'loss/train': 1.8598175048828125} -11/06/2021 22:31:55 - INFO - __main__ - Step 9224: {'lr': 0.0004970672798993313, 'samples': 1771008, 'steps': 9223, 'loss/train': 1.6042256355285645} -11/06/2021 22:31:55 - INFO - __main__ - Step 9225: {'lr': 0.0004970664693846618, 'samples': 1771200, 'steps': 9224, 'loss/train': 1.7904118299484253} -11/06/2021 22:31:56 - INFO - __main__ - Step 9226: {'lr': 0.000497065658758668, 'samples': 1771392, 'steps': 9225, 'loss/train': 1.8984659910202026} -11/06/2021 22:31:57 - INFO - __main__ - Step 9227: {'lr': 0.0004970648480213502, 'samples': 1771584, 'steps': 9226, 'loss/train': 2.082733631134033} -11/06/2021 22:31:57 - INFO - __main__ - Step 9228: {'lr': 0.0004970640371727088, 'samples': 1771776, 'steps': 9227, 'loss/train': 1.6446478366851807} -11/06/2021 22:31:57 - INFO - __main__ - Step 9229: {'lr': 0.0004970632262127441, 'samples': 1771968, 'steps': 9228, 'loss/train': 1.608752965927124} -11/06/2021 22:31:58 - INFO - __main__ - Step 9230: {'lr': 0.0004970624151414565, 'samples': 1772160, 'steps': 9229, 'loss/train': 1.8369768857955933} -11/06/2021 22:31:58 - INFO - __main__ - Step 9231: {'lr': 0.0004970616039588465, 'samples': 1772352, 'steps': 9230, 'loss/train': 1.8356631994247437} -11/06/2021 22:31:59 - INFO - __main__ - Step 9232: {'lr': 0.0004970607926649143, 'samples': 1772544, 'steps': 9231, 'loss/train': 1.8199883699417114} -11/06/2021 22:31:59 - INFO - __main__ - Step 9233: {'lr': 0.0004970599812596603, 'samples': 1772736, 'steps': 9232, 'loss/train': 1.2998876571655273} -11/06/2021 22:32:00 - INFO - __main__ - Step 9234: {'lr': 0.0004970591697430849, 'samples': 1772928, 'steps': 9233, 'loss/train': 1.8944025039672852} -11/06/2021 22:32:00 - INFO - __main__ - Step 9235: {'lr': 0.0004970583581151885, 'samples': 1773120, 'steps': 9234, 'loss/train': 1.8377676010131836} -11/06/2021 22:32:00 - INFO - __main__ - Step 9236: {'lr': 0.0004970575463759713, 'samples': 1773312, 'steps': 9235, 'loss/train': 1.6329200267791748} -11/06/2021 22:32:02 - INFO - __main__ - Step 9237: {'lr': 0.0004970567345254339, 'samples': 1773504, 'steps': 9236, 'loss/train': 1.544152021408081} -11/06/2021 22:32:02 - INFO - __main__ - Step 9238: {'lr': 0.0004970559225635765, 'samples': 1773696, 'steps': 9237, 'loss/train': 1.5652451515197754} -11/06/2021 22:32:02 - INFO - __main__ - Step 9239: {'lr': 0.0004970551104903995, 'samples': 1773888, 'steps': 9238, 'loss/train': 2.267305374145508} -11/06/2021 22:32:03 - INFO - __main__ - Step 9240: {'lr': 0.0004970542983059033, 'samples': 1774080, 'steps': 9239, 'loss/train': 1.8805835247039795} -11/06/2021 22:32:03 - INFO - __main__ - Step 9241: {'lr': 0.0004970534860100883, 'samples': 1774272, 'steps': 9240, 'loss/train': 1.7890807390213013} -11/06/2021 22:32:04 - INFO - __main__ - Step 9242: {'lr': 0.0004970526736029547, 'samples': 1774464, 'steps': 9241, 'loss/train': 1.4509460926055908} -11/06/2021 22:32:04 - INFO - __main__ - Step 9243: {'lr': 0.000497051861084503, 'samples': 1774656, 'steps': 9242, 'loss/train': 1.3258929252624512} -11/06/2021 22:32:05 - INFO - __main__ - Step 9244: {'lr': 0.0004970510484547336, 'samples': 1774848, 'steps': 9243, 'loss/train': 1.9906156063079834} -11/06/2021 22:32:05 - INFO - __main__ - Step 9245: {'lr': 0.0004970502357136468, 'samples': 1775040, 'steps': 9244, 'loss/train': 1.9643011093139648} -11/06/2021 22:32:05 - INFO - __main__ - Step 9246: {'lr': 0.0004970494228612429, 'samples': 1775232, 'steps': 9245, 'loss/train': 1.9511194229125977} -11/06/2021 22:32:06 - INFO - __main__ - Step 9247: {'lr': 0.0004970486098975224, 'samples': 1775424, 'steps': 9246, 'loss/train': 1.7946999073028564} -11/06/2021 22:32:07 - INFO - __main__ - Step 9248: {'lr': 0.0004970477968224856, 'samples': 1775616, 'steps': 9247, 'loss/train': 1.9336384534835815} -11/06/2021 22:32:07 - INFO - __main__ - Step 9249: {'lr': 0.000497046983636133, 'samples': 1775808, 'steps': 9248, 'loss/train': 1.3553489446640015} -11/06/2021 22:32:07 - INFO - __main__ - Step 9250: {'lr': 0.0004970461703384647, 'samples': 1776000, 'steps': 9249, 'loss/train': 1.9446792602539062} -11/06/2021 22:32:08 - INFO - __main__ - Step 9251: {'lr': 0.0004970453569294812, 'samples': 1776192, 'steps': 9250, 'loss/train': 1.8456064462661743} -11/06/2021 22:32:08 - INFO - __main__ - Step 9252: {'lr': 0.000497044543409183, 'samples': 1776384, 'steps': 9251, 'loss/train': 1.9062843322753906} -11/06/2021 22:32:09 - INFO - __main__ - Step 9253: {'lr': 0.0004970437297775702, 'samples': 1776576, 'steps': 9252, 'loss/train': 1.9113454818725586} -11/06/2021 22:32:10 - INFO - __main__ - Step 9254: {'lr': 0.0004970429160346433, 'samples': 1776768, 'steps': 9253, 'loss/train': 1.5249048471450806} -11/06/2021 22:32:10 - INFO - __main__ - Step 9255: {'lr': 0.0004970421021804027, 'samples': 1776960, 'steps': 9254, 'loss/train': 2.172207832336426} -11/06/2021 22:32:10 - INFO - __main__ - Step 9256: {'lr': 0.0004970412882148488, 'samples': 1777152, 'steps': 9255, 'loss/train': 1.1907613277435303} -11/06/2021 22:32:11 - INFO - __main__ - Step 9257: {'lr': 0.0004970404741379818, 'samples': 1777344, 'steps': 9256, 'loss/train': 1.6788753271102905} -11/06/2021 22:32:12 - INFO - __main__ - Step 9258: {'lr': 0.0004970396599498023, 'samples': 1777536, 'steps': 9257, 'loss/train': 1.072892189025879} -11/06/2021 22:32:12 - INFO - __main__ - Step 9259: {'lr': 0.0004970388456503105, 'samples': 1777728, 'steps': 9258, 'loss/train': 1.4916554689407349} -11/06/2021 22:32:13 - INFO - __main__ - Step 9260: {'lr': 0.0004970380312395069, 'samples': 1777920, 'steps': 9259, 'loss/train': 1.7013155221939087} -11/06/2021 22:32:13 - INFO - __main__ - Step 9261: {'lr': 0.0004970372167173915, 'samples': 1778112, 'steps': 9260, 'loss/train': 2.010669708251953} -11/06/2021 22:32:13 - INFO - __main__ - Step 9262: {'lr': 0.0004970364020839652, 'samples': 1778304, 'steps': 9261, 'loss/train': 1.8238394260406494} -11/06/2021 22:32:14 - INFO - __main__ - Step 9263: {'lr': 0.0004970355873392281, 'samples': 1778496, 'steps': 9262, 'loss/train': 1.3550951480865479} -11/06/2021 22:32:15 - INFO - __main__ - Step 9264: {'lr': 0.0004970347724831804, 'samples': 1778688, 'steps': 9263, 'loss/train': 1.880463719367981} -11/06/2021 22:32:15 - INFO - __main__ - Step 9265: {'lr': 0.0004970339575158228, 'samples': 1778880, 'steps': 9264, 'loss/train': 1.692347764968872} -11/06/2021 22:32:15 - INFO - __main__ - Step 9266: {'lr': 0.0004970331424371555, 'samples': 1779072, 'steps': 9265, 'loss/train': 1.760794997215271} -11/06/2021 22:32:16 - INFO - __main__ - Step 9267: {'lr': 0.0004970323272471788, 'samples': 1779264, 'steps': 9266, 'loss/train': 1.9668833017349243} -11/06/2021 22:32:16 - INFO - __main__ - Step 9268: {'lr': 0.0004970315119458931, 'samples': 1779456, 'steps': 9267, 'loss/train': 1.905427098274231} -11/06/2021 22:32:17 - INFO - __main__ - Step 9269: {'lr': 0.000497030696533299, 'samples': 1779648, 'steps': 9268, 'loss/train': 1.6687836647033691} -11/06/2021 22:32:17 - INFO - __main__ - Step 9270: {'lr': 0.0004970298810093965, 'samples': 1779840, 'steps': 9269, 'loss/train': 1.7328218221664429} -11/06/2021 22:32:18 - INFO - __main__ - Step 9271: {'lr': 0.0004970290653741863, 'samples': 1780032, 'steps': 9270, 'loss/train': 1.6917048692703247} -11/06/2021 22:32:18 - INFO - __main__ - Step 9272: {'lr': 0.0004970282496276684, 'samples': 1780224, 'steps': 9271, 'loss/train': 1.8625608682632446} -11/06/2021 22:32:19 - INFO - __main__ - Step 9273: {'lr': 0.0004970274337698436, 'samples': 1780416, 'steps': 9272, 'loss/train': 1.789774775505066} -11/06/2021 22:32:19 - INFO - __main__ - Step 9274: {'lr': 0.000497026617800712, 'samples': 1780608, 'steps': 9273, 'loss/train': 1.5155421495437622} -11/06/2021 22:32:20 - INFO - __main__ - Step 9275: {'lr': 0.000497025801720274, 'samples': 1780800, 'steps': 9274, 'loss/train': 1.8197972774505615} -11/06/2021 22:32:20 - INFO - __main__ - Step 9276: {'lr': 0.00049702498552853, 'samples': 1780992, 'steps': 9275, 'loss/train': 2.1639773845672607} -11/06/2021 22:32:21 - INFO - __main__ - Step 9277: {'lr': 0.0004970241692254803, 'samples': 1781184, 'steps': 9276, 'loss/train': 1.6572617292404175} -11/06/2021 22:32:21 - INFO - __main__ - Step 9278: {'lr': 0.0004970233528111253, 'samples': 1781376, 'steps': 9277, 'loss/train': 1.9275052547454834} -11/06/2021 22:32:22 - INFO - __main__ - Step 9279: {'lr': 0.0004970225362854654, 'samples': 1781568, 'steps': 9278, 'loss/train': 1.4207885265350342} -11/06/2021 22:32:22 - INFO - __main__ - Step 9280: {'lr': 0.0004970217196485011, 'samples': 1781760, 'steps': 9279, 'loss/train': 1.7480263710021973} -11/06/2021 22:32:23 - INFO - __main__ - Step 9281: {'lr': 0.0004970209029002325, 'samples': 1781952, 'steps': 9280, 'loss/train': 2.001077890396118} -11/06/2021 22:32:23 - INFO - __main__ - Step 9282: {'lr': 0.0004970200860406601, 'samples': 1782144, 'steps': 9281, 'loss/train': 1.4385563135147095} -11/06/2021 22:32:23 - INFO - __main__ - Step 9283: {'lr': 0.0004970192690697843, 'samples': 1782336, 'steps': 9282, 'loss/train': 1.1170109510421753} -11/06/2021 22:32:24 - INFO - __main__ - Step 9284: {'lr': 0.0004970184519876053, 'samples': 1782528, 'steps': 9283, 'loss/train': 1.6639217138290405} -11/06/2021 22:32:25 - INFO - __main__ - Step 9285: {'lr': 0.0004970176347941237, 'samples': 1782720, 'steps': 9284, 'loss/train': 1.5901360511779785} -11/06/2021 22:32:25 - INFO - __main__ - Step 9286: {'lr': 0.0004970168174893398, 'samples': 1782912, 'steps': 9285, 'loss/train': 2.016771078109741} -11/06/2021 22:32:25 - INFO - __main__ - Step 9287: {'lr': 0.0004970160000732539, 'samples': 1783104, 'steps': 9286, 'loss/train': 1.7004362344741821} -11/06/2021 22:32:26 - INFO - __main__ - Step 9288: {'lr': 0.0004970151825458664, 'samples': 1783296, 'steps': 9287, 'loss/train': 2.1699607372283936} -11/06/2021 22:32:27 - INFO - __main__ - Step 9289: {'lr': 0.0004970143649071777, 'samples': 1783488, 'steps': 9288, 'loss/train': 1.9318630695343018} -11/06/2021 22:32:27 - INFO - __main__ - Step 9290: {'lr': 0.0004970135471571881, 'samples': 1783680, 'steps': 9289, 'loss/train': 1.4492002725601196} -11/06/2021 22:32:28 - INFO - __main__ - Step 9291: {'lr': 0.000497012729295898, 'samples': 1783872, 'steps': 9290, 'loss/train': 1.6423429250717163} -11/06/2021 22:32:28 - INFO - __main__ - Step 9292: {'lr': 0.0004970119113233078, 'samples': 1784064, 'steps': 9291, 'loss/train': 1.7522389888763428} -11/06/2021 22:32:28 - INFO - __main__ - Step 9293: {'lr': 0.0004970110932394178, 'samples': 1784256, 'steps': 9292, 'loss/train': 1.4317411184310913} -11/06/2021 22:32:29 - INFO - __main__ - Step 9294: {'lr': 0.0004970102750442285, 'samples': 1784448, 'steps': 9293, 'loss/train': 2.1833393573760986} -11/06/2021 22:32:30 - INFO - __main__ - Step 9295: {'lr': 0.0004970094567377402, 'samples': 1784640, 'steps': 9294, 'loss/train': 0.5875868797302246} -11/06/2021 22:32:30 - INFO - __main__ - Step 9296: {'lr': 0.0004970086383199532, 'samples': 1784832, 'steps': 9295, 'loss/train': 2.128361701965332} -11/06/2021 22:32:30 - INFO - __main__ - Step 9297: {'lr': 0.0004970078197908678, 'samples': 1785024, 'steps': 9296, 'loss/train': 1.418079137802124} -11/06/2021 22:32:31 - INFO - __main__ - Step 9298: {'lr': 0.0004970070011504846, 'samples': 1785216, 'steps': 9297, 'loss/train': 1.8061836957931519} -11/06/2021 22:32:31 - INFO - __main__ - Step 9299: {'lr': 0.0004970061823988038, 'samples': 1785408, 'steps': 9298, 'loss/train': 1.9081430435180664} -11/06/2021 22:32:32 - INFO - __main__ - Step 9300: {'lr': 0.0004970053635358259, 'samples': 1785600, 'steps': 9299, 'loss/train': 1.5807913541793823} -11/06/2021 22:32:33 - INFO - __main__ - Step 9301: {'lr': 0.0004970045445615512, 'samples': 1785792, 'steps': 9300, 'loss/train': 1.5762659311294556} -11/06/2021 22:32:33 - INFO - __main__ - Step 9302: {'lr': 0.00049700372547598, 'samples': 1785984, 'steps': 9301, 'loss/train': 1.5313711166381836} -11/06/2021 22:32:33 - INFO - __main__ - Step 9303: {'lr': 0.0004970029062791128, 'samples': 1786176, 'steps': 9302, 'loss/train': 1.933624505996704} -11/06/2021 22:32:34 - INFO - __main__ - Step 9304: {'lr': 0.0004970020869709498, 'samples': 1786368, 'steps': 9303, 'loss/train': 1.6305302381515503} -11/06/2021 22:32:35 - INFO - __main__ - Step 9305: {'lr': 0.0004970012675514915, 'samples': 1786560, 'steps': 9304, 'loss/train': 1.5275381803512573} -11/06/2021 22:32:35 - INFO - __main__ - Step 9306: {'lr': 0.0004970004480207384, 'samples': 1786752, 'steps': 9305, 'loss/train': 1.6243155002593994} -11/06/2021 22:32:35 - INFO - __main__ - Step 9307: {'lr': 0.0004969996283786905, 'samples': 1786944, 'steps': 9306, 'loss/train': 1.8101203441619873} -11/06/2021 22:32:36 - INFO - __main__ - Step 9308: {'lr': 0.0004969988086253486, 'samples': 1787136, 'steps': 9307, 'loss/train': 1.9703173637390137} -11/06/2021 22:32:36 - INFO - __main__ - Step 9309: {'lr': 0.0004969979887607125, 'samples': 1787328, 'steps': 9308, 'loss/train': 1.6925435066223145} -11/06/2021 22:32:37 - INFO - __main__ - Step 9310: {'lr': 0.0004969971687847832, 'samples': 1787520, 'steps': 9309, 'loss/train': 2.585664749145508} -11/06/2021 22:32:37 - INFO - __main__ - Step 9311: {'lr': 0.0004969963486975607, 'samples': 1787712, 'steps': 9310, 'loss/train': 1.2041494846343994} -11/06/2021 22:32:38 - INFO - __main__ - Step 9312: {'lr': 0.0004969955284990455, 'samples': 1787904, 'steps': 9311, 'loss/train': 1.6597546339035034} -11/06/2021 22:32:38 - INFO - __main__ - Step 9313: {'lr': 0.0004969947081892379, 'samples': 1788096, 'steps': 9312, 'loss/train': 1.6976758241653442} -11/06/2021 22:32:38 - INFO - __main__ - Step 9314: {'lr': 0.0004969938877681383, 'samples': 1788288, 'steps': 9313, 'loss/train': 1.9452763795852661} -11/06/2021 22:32:39 - INFO - __main__ - Step 9315: {'lr': 0.0004969930672357471, 'samples': 1788480, 'steps': 9314, 'loss/train': 2.183551788330078} -11/06/2021 22:32:40 - INFO - __main__ - Step 9316: {'lr': 0.0004969922465920645, 'samples': 1788672, 'steps': 9315, 'loss/train': 2.362039089202881} -11/06/2021 22:32:40 - INFO - __main__ - Step 9317: {'lr': 0.0004969914258370912, 'samples': 1788864, 'steps': 9316, 'loss/train': 2.2192182540893555} -11/06/2021 22:32:41 - INFO - __main__ - Step 9318: {'lr': 0.0004969906049708272, 'samples': 1789056, 'steps': 9317, 'loss/train': 1.708990454673767} -11/06/2021 22:32:41 - INFO - __main__ - Step 9319: {'lr': 0.0004969897839932732, 'samples': 1789248, 'steps': 9318, 'loss/train': 1.988546371459961} -11/06/2021 22:32:41 - INFO - __main__ - Step 9320: {'lr': 0.0004969889629044293, 'samples': 1789440, 'steps': 9319, 'loss/train': 1.3980268239974976} -11/06/2021 22:32:42 - INFO - __main__ - Step 9321: {'lr': 0.000496988141704296, 'samples': 1789632, 'steps': 9320, 'loss/train': 6.165026664733887} -11/06/2021 22:32:43 - INFO - __main__ - Step 9322: {'lr': 0.0004969873203928737, 'samples': 1789824, 'steps': 9321, 'loss/train': 1.2539154291152954} -11/06/2021 22:32:43 - INFO - __main__ - Step 9323: {'lr': 0.0004969864989701626, 'samples': 1790016, 'steps': 9322, 'loss/train': 1.7540534734725952} -11/06/2021 22:32:43 - INFO - __main__ - Step 9324: {'lr': 0.0004969856774361634, 'samples': 1790208, 'steps': 9323, 'loss/train': 1.9644792079925537} -11/06/2021 22:32:44 - INFO - __main__ - Step 9325: {'lr': 0.0004969848557908761, 'samples': 1790400, 'steps': 9324, 'loss/train': 1.722193717956543} -11/06/2021 22:32:44 - INFO - __main__ - Step 9326: {'lr': 0.0004969840340343013, 'samples': 1790592, 'steps': 9325, 'loss/train': 2.381248712539673} -11/06/2021 22:32:45 - INFO - __main__ - Step 9327: {'lr': 0.0004969832121664394, 'samples': 1790784, 'steps': 9326, 'loss/train': 1.3223377466201782} -11/06/2021 22:32:46 - INFO - __main__ - Step 9328: {'lr': 0.0004969823901872906, 'samples': 1790976, 'steps': 9327, 'loss/train': 2.1059629917144775} -11/06/2021 22:32:46 - INFO - __main__ - Step 9329: {'lr': 0.0004969815680968552, 'samples': 1791168, 'steps': 9328, 'loss/train': 1.7567250728607178} -11/06/2021 22:32:46 - INFO - __main__ - Step 9330: {'lr': 0.0004969807458951339, 'samples': 1791360, 'steps': 9329, 'loss/train': 1.10848867893219} -11/06/2021 22:32:47 - INFO - __main__ - Step 9331: {'lr': 0.0004969799235821268, 'samples': 1791552, 'steps': 9330, 'loss/train': 1.527244210243225} -11/06/2021 22:32:48 - INFO - __main__ - Step 9332: {'lr': 0.0004969791011578344, 'samples': 1791744, 'steps': 9331, 'loss/train': 1.9717392921447754} -11/06/2021 22:32:48 - INFO - __main__ - Step 9333: {'lr': 0.000496978278622257, 'samples': 1791936, 'steps': 9332, 'loss/train': 1.1061983108520508} -11/06/2021 22:32:48 - INFO - __main__ - Step 9334: {'lr': 0.000496977455975395, 'samples': 1792128, 'steps': 9333, 'loss/train': 1.6116451025009155} -11/06/2021 22:32:49 - INFO - __main__ - Step 9335: {'lr': 0.0004969766332172488, 'samples': 1792320, 'steps': 9334, 'loss/train': 2.009783983230591} -11/06/2021 22:32:49 - INFO - __main__ - Step 9336: {'lr': 0.0004969758103478187, 'samples': 1792512, 'steps': 9335, 'loss/train': 1.6776036024093628} -11/06/2021 22:32:50 - INFO - __main__ - Step 9337: {'lr': 0.0004969749873671051, 'samples': 1792704, 'steps': 9336, 'loss/train': 1.6824532747268677} -11/06/2021 22:32:50 - INFO - __main__ - Step 9338: {'lr': 0.0004969741642751085, 'samples': 1792896, 'steps': 9337, 'loss/train': 1.9121274948120117} -11/06/2021 22:32:51 - INFO - __main__ - Step 9339: {'lr': 0.000496973341071829, 'samples': 1793088, 'steps': 9338, 'loss/train': 1.8858976364135742} -11/06/2021 22:32:51 - INFO - __main__ - Step 9340: {'lr': 0.0004969725177572672, 'samples': 1793280, 'steps': 9339, 'loss/train': 1.5066814422607422} -11/06/2021 22:32:51 - INFO - __main__ - Step 9341: {'lr': 0.0004969716943314234, 'samples': 1793472, 'steps': 9340, 'loss/train': 1.8776342868804932} -11/06/2021 22:32:52 - INFO - __main__ - Step 9342: {'lr': 0.0004969708707942979, 'samples': 1793664, 'steps': 9341, 'loss/train': 2.180288314819336} -11/06/2021 22:32:53 - INFO - __main__ - Step 9343: {'lr': 0.0004969700471458913, 'samples': 1793856, 'steps': 9342, 'loss/train': 1.4142295122146606} -11/06/2021 22:32:53 - INFO - __main__ - Step 9344: {'lr': 0.0004969692233862036, 'samples': 1794048, 'steps': 9343, 'loss/train': 1.8621501922607422} -11/06/2021 22:32:53 - INFO - __main__ - Step 9345: {'lr': 0.0004969683995152355, 'samples': 1794240, 'steps': 9344, 'loss/train': 3.186241626739502} -11/06/2021 22:32:54 - INFO - __main__ - Step 9346: {'lr': 0.0004969675755329872, 'samples': 1794432, 'steps': 9345, 'loss/train': 1.875054121017456} -11/06/2021 22:32:55 - INFO - __main__ - Step 9347: {'lr': 0.0004969667514394592, 'samples': 1794624, 'steps': 9346, 'loss/train': 2.312483072280884} -11/06/2021 22:32:55 - INFO - __main__ - Step 9348: {'lr': 0.0004969659272346517, 'samples': 1794816, 'steps': 9347, 'loss/train': 1.7761608362197876} -11/06/2021 22:32:56 - INFO - __main__ - Step 9349: {'lr': 0.0004969651029185652, 'samples': 1795008, 'steps': 9348, 'loss/train': 1.646713137626648} -11/06/2021 22:32:56 - INFO - __main__ - Step 9350: {'lr': 0.0004969642784912001, 'samples': 1795200, 'steps': 9349, 'loss/train': 3.636963367462158} -11/06/2021 22:32:57 - INFO - __main__ - Step 9351: {'lr': 0.0004969634539525566, 'samples': 1795392, 'steps': 9350, 'loss/train': 2.115077495574951} -11/06/2021 22:32:57 - INFO - __main__ - Step 9352: {'lr': 0.0004969626293026353, 'samples': 1795584, 'steps': 9351, 'loss/train': 1.7228342294692993} -11/06/2021 22:32:58 - INFO - __main__ - Step 9353: {'lr': 0.0004969618045414363, 'samples': 1795776, 'steps': 9352, 'loss/train': 1.540665626525879} -11/06/2021 22:32:58 - INFO - __main__ - Step 9354: {'lr': 0.0004969609796689602, 'samples': 1795968, 'steps': 9353, 'loss/train': 1.7847797870635986} -11/06/2021 22:32:59 - INFO - __main__ - Step 9355: {'lr': 0.0004969601546852073, 'samples': 1796160, 'steps': 9354, 'loss/train': 1.4905754327774048} -11/06/2021 22:32:59 - INFO - __main__ - Step 9356: {'lr': 0.0004969593295901779, 'samples': 1796352, 'steps': 9355, 'loss/train': 1.998396873474121} -11/06/2021 22:32:59 - INFO - __main__ - Step 9357: {'lr': 0.0004969585043838725, 'samples': 1796544, 'steps': 9356, 'loss/train': 2.060382127761841} -11/06/2021 22:33:00 - INFO - __main__ - Step 9358: {'lr': 0.0004969576790662914, 'samples': 1796736, 'steps': 9357, 'loss/train': 1.823445200920105} -11/06/2021 22:33:01 - INFO - __main__ - Step 9359: {'lr': 0.0004969568536374349, 'samples': 1796928, 'steps': 9358, 'loss/train': 1.6767795085906982} -11/06/2021 22:33:01 - INFO - __main__ - Step 9360: {'lr': 0.0004969560280973036, 'samples': 1797120, 'steps': 9359, 'loss/train': 2.0261526107788086} -11/06/2021 22:33:01 - INFO - __main__ - Step 9361: {'lr': 0.0004969552024458976, 'samples': 1797312, 'steps': 9360, 'loss/train': 1.6986967325210571} -11/06/2021 22:33:02 - INFO - __main__ - Step 9362: {'lr': 0.0004969543766832176, 'samples': 1797504, 'steps': 9361, 'loss/train': 1.3113603591918945} -11/06/2021 22:33:03 - INFO - __main__ - Step 9363: {'lr': 0.0004969535508092635, 'samples': 1797696, 'steps': 9362, 'loss/train': 1.4548332691192627} -11/06/2021 22:33:03 - INFO - __main__ - Step 9364: {'lr': 0.0004969527248240361, 'samples': 1797888, 'steps': 9363, 'loss/train': 2.1433870792388916} -11/06/2021 22:33:03 - INFO - __main__ - Step 9365: {'lr': 0.0004969518987275356, 'samples': 1798080, 'steps': 9364, 'loss/train': 1.7857718467712402} -11/06/2021 22:33:04 - INFO - __main__ - Step 9366: {'lr': 0.0004969510725197624, 'samples': 1798272, 'steps': 9365, 'loss/train': 1.3735690116882324} -11/06/2021 22:33:04 - INFO - __main__ - Step 9367: {'lr': 0.0004969502462007167, 'samples': 1798464, 'steps': 9366, 'loss/train': 2.3249306678771973} -11/06/2021 22:33:05 - INFO - __main__ - Step 9368: {'lr': 0.0004969494197703992, 'samples': 1798656, 'steps': 9367, 'loss/train': 1.9111498594284058} -11/06/2021 22:33:05 - INFO - __main__ - Step 9369: {'lr': 0.00049694859322881, 'samples': 1798848, 'steps': 9368, 'loss/train': 1.7562119960784912} -11/06/2021 22:33:06 - INFO - __main__ - Step 9370: {'lr': 0.0004969477665759496, 'samples': 1799040, 'steps': 9369, 'loss/train': 1.8081409931182861} -11/06/2021 22:33:06 - INFO - __main__ - Step 9371: {'lr': 0.0004969469398118184, 'samples': 1799232, 'steps': 9370, 'loss/train': 1.3036324977874756} -11/06/2021 22:33:07 - INFO - __main__ - Step 9372: {'lr': 0.0004969461129364167, 'samples': 1799424, 'steps': 9371, 'loss/train': 1.8562147617340088} -11/06/2021 22:33:08 - INFO - __main__ - Step 9373: {'lr': 0.0004969452859497449, 'samples': 1799616, 'steps': 9372, 'loss/train': 1.927634596824646} -11/06/2021 22:33:08 - INFO - __main__ - Step 9374: {'lr': 0.0004969444588518034, 'samples': 1799808, 'steps': 9373, 'loss/train': 2.170872449874878} -11/06/2021 22:33:08 - INFO - __main__ - Step 9375: {'lr': 0.0004969436316425924, 'samples': 1800000, 'steps': 9374, 'loss/train': 1.852042317390442} -11/06/2021 22:33:09 - INFO - __main__ - Step 9376: {'lr': 0.0004969428043221125, 'samples': 1800192, 'steps': 9375, 'loss/train': 1.5770512819290161} -11/06/2021 22:33:09 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 1.6627328395843506} -11/06/2021 22:33:09 - INFO - __main__ - Step 9378: {'lr': 0.0004969411493473472, 'samples': 1800576, 'steps': 9377, 'loss/train': 1.592746376991272} -11/06/2021 22:33:11 - INFO - __main__ - Step 9379: {'lr': 0.0004969403216930626, 'samples': 1800768, 'steps': 9378, 'loss/train': 1.5629326105117798} -11/06/2021 22:33:11 - INFO - __main__ - Step 9380: {'lr': 0.0004969394939275105, 'samples': 1800960, 'steps': 9379, 'loss/train': 1.9716914892196655} -11/06/2021 22:33:11 - INFO - __main__ - Step 9381: {'lr': 0.0004969386660506912, 'samples': 1801152, 'steps': 9380, 'loss/train': 1.612454891204834} -11/06/2021 22:33:12 - INFO - __main__ - Step 9382: {'lr': 0.0004969378380626051, 'samples': 1801344, 'steps': 9381, 'loss/train': 1.764012336730957} -11/06/2021 22:33:12 - INFO - __main__ - Step 9383: {'lr': 0.0004969370099632528, 'samples': 1801536, 'steps': 9382, 'loss/train': 1.9213483333587646} -11/06/2021 22:33:13 - INFO - __main__ - Step 9384: {'lr': 0.0004969361817526343, 'samples': 1801728, 'steps': 9383, 'loss/train': 1.2012592554092407} -11/06/2021 22:33:14 - INFO - __main__ - Step 9385: {'lr': 0.0004969353534307504, 'samples': 1801920, 'steps': 9384, 'loss/train': 2.151750087738037} -11/06/2021 22:33:14 - INFO - __main__ - Step 9386: {'lr': 0.000496934524997601, 'samples': 1802112, 'steps': 9385, 'loss/train': 0.9660016894340515} -11/06/2021 22:33:14 - INFO - __main__ - Step 9387: {'lr': 0.0004969336964531869, 'samples': 1802304, 'steps': 9386, 'loss/train': 1.7892236709594727} -11/06/2021 22:33:15 - INFO - __main__ - Step 9388: {'lr': 0.0004969328677975083, 'samples': 1802496, 'steps': 9387, 'loss/train': 1.6319315433502197} -11/06/2021 22:33:15 - INFO - __main__ - Step 9389: {'lr': 0.0004969320390305654, 'samples': 1802688, 'steps': 9388, 'loss/train': 2.0772619247436523} -11/06/2021 22:33:16 - INFO - __main__ - Step 9390: {'lr': 0.0004969312101523588, 'samples': 1802880, 'steps': 9389, 'loss/train': 1.8143119812011719} -11/06/2021 22:33:17 - INFO - __main__ - Step 9391: {'lr': 0.0004969303811628888, 'samples': 1803072, 'steps': 9390, 'loss/train': 1.7659382820129395} -11/06/2021 22:33:17 - INFO - __main__ - Step 9392: {'lr': 0.0004969295520621558, 'samples': 1803264, 'steps': 9391, 'loss/train': 2.3056082725524902} -11/06/2021 22:33:17 - INFO - __main__ - Step 9393: {'lr': 0.0004969287228501602, 'samples': 1803456, 'steps': 9392, 'loss/train': 1.8238893747329712} -11/06/2021 22:33:18 - INFO - __main__ - Step 9394: {'lr': 0.0004969278935269022, 'samples': 1803648, 'steps': 9393, 'loss/train': 0.7025987505912781} -11/06/2021 22:33:19 - INFO - __main__ - Step 9395: {'lr': 0.0004969270640923823, 'samples': 1803840, 'steps': 9394, 'loss/train': 1.8956180810928345} -11/06/2021 22:33:19 - INFO - __main__ - Step 9396: {'lr': 0.0004969262345466011, 'samples': 1804032, 'steps': 9395, 'loss/train': 1.8042242527008057} -11/06/2021 22:33:19 - INFO - __main__ - Step 9397: {'lr': 0.0004969254048895585, 'samples': 1804224, 'steps': 9396, 'loss/train': 1.8003126382827759} -11/06/2021 22:33:20 - INFO - __main__ - Step 9398: {'lr': 0.0004969245751212552, 'samples': 1804416, 'steps': 9397, 'loss/train': 1.8957905769348145} -11/06/2021 22:33:20 - INFO - __main__ - Step 9399: {'lr': 0.0004969237452416915, 'samples': 1804608, 'steps': 9398, 'loss/train': 1.0701171159744263} -11/06/2021 22:33:21 - INFO - __main__ - Step 9400: {'lr': 0.0004969229152508678, 'samples': 1804800, 'steps': 9399, 'loss/train': 1.8020981550216675} -11/06/2021 22:33:22 - INFO - __main__ - Step 9401: {'lr': 0.0004969220851487844, 'samples': 1804992, 'steps': 9400, 'loss/train': 0.40175554156303406} -11/06/2021 22:33:22 - INFO - __main__ - Step 9402: {'lr': 0.0004969212549354418, 'samples': 1805184, 'steps': 9401, 'loss/train': 1.8108609914779663} -11/06/2021 22:33:22 - INFO - __main__ - Step 9403: {'lr': 0.0004969204246108402, 'samples': 1805376, 'steps': 9402, 'loss/train': 1.1330207586288452} -11/06/2021 22:33:23 - INFO - __main__ - Step 9404: {'lr': 0.0004969195941749801, 'samples': 1805568, 'steps': 9403, 'loss/train': 1.2011972665786743} -11/06/2021 22:33:23 - INFO - __main__ - Step 9405: {'lr': 0.000496918763627862, 'samples': 1805760, 'steps': 9404, 'loss/train': 1.7720991373062134} -11/06/2021 22:33:24 - INFO - __main__ - Step 9406: {'lr': 0.0004969179329694859, 'samples': 1805952, 'steps': 9405, 'loss/train': 1.7720216512680054} -11/06/2021 22:33:24 - INFO - __main__ - Step 9407: {'lr': 0.0004969171021998525, 'samples': 1806144, 'steps': 9406, 'loss/train': 1.1517207622528076} -11/06/2021 22:33:25 - INFO - __main__ - Step 9408: {'lr': 0.0004969162713189619, 'samples': 1806336, 'steps': 9407, 'loss/train': 1.5206893682479858} -11/06/2021 22:33:25 - INFO - __main__ - Step 9409: {'lr': 0.0004969154403268148, 'samples': 1806528, 'steps': 9408, 'loss/train': 1.8082882165908813} -11/06/2021 22:33:25 - INFO - __main__ - Step 9410: {'lr': 0.0004969146092234114, 'samples': 1806720, 'steps': 9409, 'loss/train': 1.3360158205032349} -11/06/2021 22:33:26 - INFO - __main__ - Step 9411: {'lr': 0.000496913778008752, 'samples': 1806912, 'steps': 9410, 'loss/train': 2.1113593578338623} -11/06/2021 22:33:27 - INFO - __main__ - Step 9412: {'lr': 0.0004969129466828371, 'samples': 1807104, 'steps': 9411, 'loss/train': 2.4222865104675293} -11/06/2021 22:33:27 - INFO - __main__ - Step 9413: {'lr': 0.0004969121152456671, 'samples': 1807296, 'steps': 9412, 'loss/train': 1.631757378578186} -11/06/2021 22:33:27 - INFO - __main__ - Step 9414: {'lr': 0.0004969112836972423, 'samples': 1807488, 'steps': 9413, 'loss/train': 1.678197979927063} -11/06/2021 22:33:28 - INFO - __main__ - Step 9415: {'lr': 0.000496910452037563, 'samples': 1807680, 'steps': 9414, 'loss/train': 2.7772085666656494} -11/06/2021 22:33:29 - INFO - __main__ - Step 9416: {'lr': 0.0004969096202666297, 'samples': 1807872, 'steps': 9415, 'loss/train': 1.9640326499938965} -11/06/2021 22:33:29 - INFO - __main__ - Step 9417: {'lr': 0.0004969087883844428, 'samples': 1808064, 'steps': 9416, 'loss/train': 1.4064429998397827} -11/06/2021 22:33:30 - INFO - __main__ - Step 9418: {'lr': 0.0004969079563910025, 'samples': 1808256, 'steps': 9417, 'loss/train': 1.8658392429351807} -11/06/2021 22:33:30 - INFO - __main__ - Step 9419: {'lr': 0.0004969071242863093, 'samples': 1808448, 'steps': 9418, 'loss/train': 2.186412811279297} -11/06/2021 22:33:30 - INFO - __main__ - Step 9420: {'lr': 0.0004969062920703636, 'samples': 1808640, 'steps': 9419, 'loss/train': 1.6242451667785645} -11/06/2021 22:33:31 - INFO - __main__ - Step 9421: {'lr': 0.0004969054597431658, 'samples': 1808832, 'steps': 9420, 'loss/train': 2.4329140186309814} -11/06/2021 22:33:32 - INFO - __main__ - Step 9422: {'lr': 0.0004969046273047161, 'samples': 1809024, 'steps': 9421, 'loss/train': 1.61650812625885} -11/06/2021 22:33:32 - INFO - __main__ - Step 9423: {'lr': 0.0004969037947550151, 'samples': 1809216, 'steps': 9422, 'loss/train': 1.550029993057251} -11/06/2021 22:33:32 - INFO - __main__ - Step 9424: {'lr': 0.000496902962094063, 'samples': 1809408, 'steps': 9423, 'loss/train': 1.670718789100647} -11/06/2021 22:33:33 - INFO - __main__ - Step 9425: {'lr': 0.0004969021293218602, 'samples': 1809600, 'steps': 9424, 'loss/train': 1.6841366291046143} -11/06/2021 22:33:34 - INFO - __main__ - Step 9426: {'lr': 0.0004969012964384071, 'samples': 1809792, 'steps': 9425, 'loss/train': 2.19000244140625} -11/06/2021 22:33:34 - INFO - __main__ - Step 9427: {'lr': 0.0004969004634437042, 'samples': 1809984, 'steps': 9426, 'loss/train': 1.5909390449523926} -11/06/2021 22:33:34 - INFO - __main__ - Step 9428: {'lr': 0.0004968996303377517, 'samples': 1810176, 'steps': 9427, 'loss/train': 2.3377866744995117} -11/06/2021 22:33:35 - INFO - __main__ - Step 9429: {'lr': 0.00049689879712055, 'samples': 1810368, 'steps': 9428, 'loss/train': 1.959466576576233} -11/06/2021 22:33:35 - INFO - __main__ - Step 9430: {'lr': 0.0004968979637920995, 'samples': 1810560, 'steps': 9429, 'loss/train': 2.1791741847991943} -11/06/2021 22:33:35 - INFO - __main__ - Step 9431: {'lr': 0.0004968971303524007, 'samples': 1810752, 'steps': 9430, 'loss/train': 1.2849524021148682} -11/06/2021 22:33:36 - INFO - __main__ - Step 9432: {'lr': 0.0004968962968014537, 'samples': 1810944, 'steps': 9431, 'loss/train': 1.7930939197540283} -11/06/2021 22:33:37 - INFO - __main__ - Step 9433: {'lr': 0.0004968954631392592, 'samples': 1811136, 'steps': 9432, 'loss/train': 1.8857711553573608} -11/06/2021 22:33:37 - INFO - __main__ - Step 9434: {'lr': 0.0004968946293658173, 'samples': 1811328, 'steps': 9433, 'loss/train': 1.6014503240585327} -11/06/2021 22:33:37 - INFO - __main__ - Step 9435: {'lr': 0.0004968937954811284, 'samples': 1811520, 'steps': 9434, 'loss/train': 1.701316237449646} -11/06/2021 22:33:38 - INFO - __main__ - Step 9436: {'lr': 0.0004968929614851932, 'samples': 1811712, 'steps': 9435, 'loss/train': 1.106537938117981} -11/06/2021 22:33:39 - INFO - __main__ - Step 9437: {'lr': 0.0004968921273780118, 'samples': 1811904, 'steps': 9436, 'loss/train': 1.812904715538025} -11/06/2021 22:33:39 - INFO - __main__ - Step 9438: {'lr': 0.0004968912931595845, 'samples': 1812096, 'steps': 9437, 'loss/train': 1.294390082359314} -11/06/2021 22:33:39 - INFO - __main__ - Step 9439: {'lr': 0.0004968904588299118, 'samples': 1812288, 'steps': 9438, 'loss/train': 1.2054589986801147} -11/06/2021 22:33:40 - INFO - __main__ - Step 9440: {'lr': 0.0004968896243889941, 'samples': 1812480, 'steps': 9439, 'loss/train': 1.6848827600479126} -11/06/2021 22:33:40 - INFO - __main__ - Step 9441: {'lr': 0.0004968887898368318, 'samples': 1812672, 'steps': 9440, 'loss/train': 2.0966432094573975} -11/06/2021 22:33:41 - INFO - __main__ - Step 9442: {'lr': 0.0004968879551734252, 'samples': 1812864, 'steps': 9441, 'loss/train': 1.6406598091125488} -11/06/2021 22:33:42 - INFO - __main__ - Step 9443: {'lr': 0.0004968871203987746, 'samples': 1813056, 'steps': 9442, 'loss/train': 1.871316909790039} -11/06/2021 22:33:42 - INFO - __main__ - Step 9444: {'lr': 0.0004968862855128806, 'samples': 1813248, 'steps': 9443, 'loss/train': 1.394817590713501} -11/06/2021 22:33:42 - INFO - __main__ - Step 9445: {'lr': 0.0004968854505157434, 'samples': 1813440, 'steps': 9444, 'loss/train': 1.726036787033081} -11/06/2021 22:33:43 - INFO - __main__ - Step 9446: {'lr': 0.0004968846154073634, 'samples': 1813632, 'steps': 9445, 'loss/train': 0.7175917625427246} -11/06/2021 22:33:44 - INFO - __main__ - Step 9447: {'lr': 0.0004968837801877411, 'samples': 1813824, 'steps': 9446, 'loss/train': 1.9097816944122314} -11/06/2021 22:33:44 - INFO - __main__ - Step 9448: {'lr': 0.0004968829448568766, 'samples': 1814016, 'steps': 9447, 'loss/train': 1.6947396993637085} -11/06/2021 22:33:44 - INFO - __main__ - Step 9449: {'lr': 0.0004968821094147706, 'samples': 1814208, 'steps': 9448, 'loss/train': 1.652908205986023} -11/06/2021 22:33:45 - INFO - __main__ - Step 9450: {'lr': 0.0004968812738614232, 'samples': 1814400, 'steps': 9449, 'loss/train': 1.8884683847427368} -11/06/2021 22:33:45 - INFO - __main__ - Step 9451: {'lr': 0.000496880438196835, 'samples': 1814592, 'steps': 9450, 'loss/train': 1.878915786743164} -11/06/2021 22:33:46 - INFO - __main__ - Step 9452: {'lr': 0.0004968796024210064, 'samples': 1814784, 'steps': 9451, 'loss/train': 1.934395670890808} -11/06/2021 22:33:46 - INFO - __main__ - Step 9453: {'lr': 0.0004968787665339375, 'samples': 1814976, 'steps': 9452, 'loss/train': 1.7748756408691406} -11/06/2021 22:33:47 - INFO - __main__ - Step 9454: {'lr': 0.0004968779305356289, 'samples': 1815168, 'steps': 9453, 'loss/train': 1.8355199098587036} -11/06/2021 22:33:47 - INFO - __main__ - Step 9455: {'lr': 0.0004968770944260808, 'samples': 1815360, 'steps': 9454, 'loss/train': 1.931564450263977} -11/06/2021 22:33:47 - INFO - __main__ - Step 9456: {'lr': 0.0004968762582052938, 'samples': 1815552, 'steps': 9455, 'loss/train': 1.959632396697998} -11/06/2021 22:33:48 - INFO - __main__ - Step 9457: {'lr': 0.0004968754218732682, 'samples': 1815744, 'steps': 9456, 'loss/train': 1.8338159322738647} -11/06/2021 22:33:49 - INFO - __main__ - Step 9458: {'lr': 0.0004968745854300043, 'samples': 1815936, 'steps': 9457, 'loss/train': 1.7420405149459839} -11/06/2021 22:33:49 - INFO - __main__ - Step 9459: {'lr': 0.0004968737488755025, 'samples': 1816128, 'steps': 9458, 'loss/train': 1.8314000368118286} -11/06/2021 22:33:49 - INFO - __main__ - Step 9460: {'lr': 0.0004968729122097632, 'samples': 1816320, 'steps': 9459, 'loss/train': 1.9877064228057861} -11/06/2021 22:33:50 - INFO - __main__ - Step 9461: {'lr': 0.0004968720754327867, 'samples': 1816512, 'steps': 9460, 'loss/train': 1.5283275842666626} -11/06/2021 22:33:51 - INFO - __main__ - Step 9462: {'lr': 0.0004968712385445737, 'samples': 1816704, 'steps': 9461, 'loss/train': 1.5519593954086304} -11/06/2021 22:33:51 - INFO - __main__ - Step 9463: {'lr': 0.0004968704015451241, 'samples': 1816896, 'steps': 9462, 'loss/train': 2.173038959503174} -11/06/2021 22:33:51 - INFO - __main__ - Step 9464: {'lr': 0.0004968695644344387, 'samples': 1817088, 'steps': 9463, 'loss/train': 2.0512888431549072} -11/06/2021 22:33:52 - INFO - __main__ - Step 9465: {'lr': 0.0004968687272125174, 'samples': 1817280, 'steps': 9464, 'loss/train': 1.5592188835144043} -11/06/2021 22:33:52 - INFO - __main__ - Step 9466: {'lr': 0.0004968678898793611, 'samples': 1817472, 'steps': 9465, 'loss/train': 1.7354072332382202} -11/06/2021 22:33:53 - INFO - __main__ - Step 9467: {'lr': 0.0004968670524349699, 'samples': 1817664, 'steps': 9466, 'loss/train': 1.9592326879501343} -11/06/2021 22:33:54 - INFO - __main__ - Step 9468: {'lr': 0.0004968662148793441, 'samples': 1817856, 'steps': 9467, 'loss/train': 1.6401126384735107} -11/06/2021 22:33:54 - INFO - __main__ - Step 9469: {'lr': 0.0004968653772124843, 'samples': 1818048, 'steps': 9468, 'loss/train': 1.6802074909210205} -11/06/2021 22:33:54 - INFO - __main__ - Step 9470: {'lr': 0.0004968645394343908, 'samples': 1818240, 'steps': 9469, 'loss/train': 1.5846213102340698} -11/06/2021 22:33:55 - INFO - __main__ - Step 9471: {'lr': 0.0004968637015450639, 'samples': 1818432, 'steps': 9470, 'loss/train': 1.8173738718032837} -11/06/2021 22:33:55 - INFO - __main__ - Step 9472: {'lr': 0.000496862863544504, 'samples': 1818624, 'steps': 9471, 'loss/train': 1.4764689207077026} -11/06/2021 22:33:56 - INFO - __main__ - Step 9473: {'lr': 0.0004968620254327114, 'samples': 1818816, 'steps': 9472, 'loss/train': 1.9476569890975952} -11/06/2021 22:33:56 - INFO - __main__ - Step 9474: {'lr': 0.0004968611872096868, 'samples': 1819008, 'steps': 9473, 'loss/train': 1.7643886804580688} -11/06/2021 22:33:57 - INFO - __main__ - Step 9475: {'lr': 0.0004968603488754302, 'samples': 1819200, 'steps': 9474, 'loss/train': 1.442833423614502} -11/06/2021 22:33:57 - INFO - __main__ - Step 9476: {'lr': 0.0004968595104299422, 'samples': 1819392, 'steps': 9475, 'loss/train': 2.2946574687957764} -11/06/2021 22:33:57 - INFO - __main__ - Step 9477: {'lr': 0.000496858671873223, 'samples': 1819584, 'steps': 9476, 'loss/train': 2.2401070594787598} -11/06/2021 22:33:58 - INFO - __main__ - Step 9478: {'lr': 0.0004968578332052733, 'samples': 1819776, 'steps': 9477, 'loss/train': 1.696811556816101} -11/06/2021 22:33:59 - INFO - __main__ - Step 9479: {'lr': 0.0004968569944260932, 'samples': 1819968, 'steps': 9478, 'loss/train': 2.2511560916900635} -11/06/2021 22:33:59 - INFO - __main__ - Step 9480: {'lr': 0.0004968561555356831, 'samples': 1820160, 'steps': 9479, 'loss/train': 1.6641721725463867} -11/06/2021 22:33:59 - INFO - __main__ - Step 9481: {'lr': 0.0004968553165340435, 'samples': 1820352, 'steps': 9480, 'loss/train': 1.7705086469650269} -11/06/2021 22:34:00 - INFO - __main__ - Step 9482: {'lr': 0.0004968544774211746, 'samples': 1820544, 'steps': 9481, 'loss/train': 1.7317209243774414} -11/06/2021 22:34:01 - INFO - __main__ - Step 9483: {'lr': 0.0004968536381970769, 'samples': 1820736, 'steps': 9482, 'loss/train': 1.7108385562896729} -11/06/2021 22:34:01 - INFO - __main__ - Step 9484: {'lr': 0.0004968527988617508, 'samples': 1820928, 'steps': 9483, 'loss/train': 1.9148114919662476} -11/06/2021 22:34:02 - INFO - __main__ - Step 9485: {'lr': 0.0004968519594151966, 'samples': 1821120, 'steps': 9484, 'loss/train': 2.120004653930664} -11/06/2021 22:34:02 - INFO - __main__ - Step 9486: {'lr': 0.0004968511198574147, 'samples': 1821312, 'steps': 9485, 'loss/train': 2.175170660018921} -11/06/2021 22:34:02 - INFO - __main__ - Step 9487: {'lr': 0.0004968502801884056, 'samples': 1821504, 'steps': 9486, 'loss/train': 1.964535117149353} -11/06/2021 22:34:03 - INFO - __main__ - Step 9488: {'lr': 0.0004968494404081695, 'samples': 1821696, 'steps': 9487, 'loss/train': 1.3058781623840332} -11/06/2021 22:34:04 - INFO - __main__ - Step 9489: {'lr': 0.0004968486005167069, 'samples': 1821888, 'steps': 9488, 'loss/train': 1.7480806112289429} -11/06/2021 22:34:04 - INFO - __main__ - Step 9490: {'lr': 0.000496847760514018, 'samples': 1822080, 'steps': 9489, 'loss/train': 1.46340012550354} -11/06/2021 22:34:04 - INFO - __main__ - Step 9491: {'lr': 0.0004968469204001035, 'samples': 1822272, 'steps': 9490, 'loss/train': 2.2288196086883545} -11/06/2021 22:34:05 - INFO - __main__ - Step 9492: {'lr': 0.0004968460801749635, 'samples': 1822464, 'steps': 9491, 'loss/train': 1.707292914390564} -11/06/2021 22:34:05 - INFO - __main__ - Step 9493: {'lr': 0.0004968452398385984, 'samples': 1822656, 'steps': 9492, 'loss/train': 1.734236240386963} -11/06/2021 22:34:06 - INFO - __main__ - Step 9494: {'lr': 0.0004968443993910086, 'samples': 1822848, 'steps': 9493, 'loss/train': 1.8103415966033936} -11/06/2021 22:34:07 - INFO - __main__ - Step 9495: {'lr': 0.0004968435588321947, 'samples': 1823040, 'steps': 9494, 'loss/train': 1.4598149061203003} -11/06/2021 22:34:07 - INFO - __main__ - Step 9496: {'lr': 0.0004968427181621567, 'samples': 1823232, 'steps': 9495, 'loss/train': 1.8984959125518799} -11/06/2021 22:34:07 - INFO - __main__ - Step 9497: {'lr': 0.0004968418773808954, 'samples': 1823424, 'steps': 9496, 'loss/train': 1.705300211906433} -11/06/2021 22:34:08 - INFO - __main__ - Step 9498: {'lr': 0.0004968410364884109, 'samples': 1823616, 'steps': 9497, 'loss/train': 1.6887762546539307} -11/06/2021 22:34:09 - INFO - __main__ - Step 9499: {'lr': 0.0004968401954847035, 'samples': 1823808, 'steps': 9498, 'loss/train': 1.4879417419433594} -11/06/2021 22:34:09 - INFO - __main__ - Step 9500: {'lr': 0.0004968393543697739, 'samples': 1824000, 'steps': 9499, 'loss/train': 1.49965238571167} -11/06/2021 22:34:09 - INFO - __main__ - Step 9501: {'lr': 0.0004968385131436222, 'samples': 1824192, 'steps': 9500, 'loss/train': 1.9283766746520996} -11/06/2021 22:34:10 - INFO - __main__ - Step 9502: {'lr': 0.0004968376718062488, 'samples': 1824384, 'steps': 9501, 'loss/train': 1.9032224416732788} -11/06/2021 22:34:10 - INFO - __main__ - Step 9503: {'lr': 0.0004968368303576542, 'samples': 1824576, 'steps': 9502, 'loss/train': 2.1025607585906982} -11/06/2021 22:34:11 - INFO - __main__ - Step 9504: {'lr': 0.0004968359887978389, 'samples': 1824768, 'steps': 9503, 'loss/train': 0.9440047144889832} -11/06/2021 22:34:11 - INFO - __main__ - Step 9505: {'lr': 0.0004968351471268029, 'samples': 1824960, 'steps': 9504, 'loss/train': 2.4170825481414795} -11/06/2021 22:34:12 - INFO - __main__ - Step 9506: {'lr': 0.0004968343053445469, 'samples': 1825152, 'steps': 9505, 'loss/train': 1.723289132118225} -11/06/2021 22:34:12 - INFO - __main__ - Step 9507: {'lr': 0.0004968334634510712, 'samples': 1825344, 'steps': 9506, 'loss/train': 2.1578383445739746} -11/06/2021 22:34:13 - INFO - __main__ - Step 9508: {'lr': 0.000496832621446376, 'samples': 1825536, 'steps': 9507, 'loss/train': 1.3967469930648804} -11/06/2021 22:34:13 - INFO - __main__ - Step 9509: {'lr': 0.000496831779330462, 'samples': 1825728, 'steps': 9508, 'loss/train': 1.5260154008865356} -11/06/2021 22:34:14 - INFO - __main__ - Step 9510: {'lr': 0.0004968309371033293, 'samples': 1825920, 'steps': 9509, 'loss/train': 1.9803547859191895} -11/06/2021 22:34:14 - INFO - __main__ - Step 9511: {'lr': 0.0004968300947649784, 'samples': 1826112, 'steps': 9510, 'loss/train': 1.811102271080017} -11/06/2021 22:34:15 - INFO - __main__ - Step 9512: {'lr': 0.0004968292523154096, 'samples': 1826304, 'steps': 9511, 'loss/train': 1.6655768156051636} -11/06/2021 22:34:15 - INFO - __main__ - Step 9513: {'lr': 0.0004968284097546235, 'samples': 1826496, 'steps': 9512, 'loss/train': 1.665718913078308} -11/06/2021 22:34:15 - INFO - __main__ - Step 9514: {'lr': 0.0004968275670826204, 'samples': 1826688, 'steps': 9513, 'loss/train': 1.7052531242370605} -11/06/2021 22:34:16 - INFO - __main__ - Step 9515: {'lr': 0.0004968267242994003, 'samples': 1826880, 'steps': 9514, 'loss/train': 1.3750792741775513} -11/06/2021 22:34:17 - INFO - __main__ - Step 9516: {'lr': 0.0004968258814049641, 'samples': 1827072, 'steps': 9515, 'loss/train': 1.3806614875793457} -11/06/2021 22:34:17 - INFO - __main__ - Step 9517: {'lr': 0.0004968250383993119, 'samples': 1827264, 'steps': 9516, 'loss/train': 2.3476414680480957} -11/06/2021 22:34:17 - INFO - __main__ - Step 9518: {'lr': 0.0004968241952824442, 'samples': 1827456, 'steps': 9517, 'loss/train': 1.6158838272094727} -11/06/2021 22:34:18 - INFO - __main__ - Step 9519: {'lr': 0.0004968233520543613, 'samples': 1827648, 'steps': 9518, 'loss/train': 2.4204187393188477} -11/06/2021 22:34:19 - INFO - __main__ - Step 9520: {'lr': 0.0004968225087150636, 'samples': 1827840, 'steps': 9519, 'loss/train': 1.876865267753601} -11/06/2021 22:34:19 - INFO - __main__ - Step 9521: {'lr': 0.0004968216652645515, 'samples': 1828032, 'steps': 9520, 'loss/train': 2.089869737625122} -11/06/2021 22:34:20 - INFO - __main__ - Step 9522: {'lr': 0.0004968208217028254, 'samples': 1828224, 'steps': 9521, 'loss/train': 1.1889524459838867} -11/06/2021 22:34:20 - INFO - __main__ - Step 9523: {'lr': 0.0004968199780298855, 'samples': 1828416, 'steps': 9522, 'loss/train': 1.8859481811523438} -11/06/2021 22:34:20 - INFO - __main__ - Step 9524: {'lr': 0.0004968191342457325, 'samples': 1828608, 'steps': 9523, 'loss/train': 1.6368975639343262} -11/06/2021 22:34:22 - INFO - __main__ - Step 9525: {'lr': 0.0004968182903503665, 'samples': 1828800, 'steps': 9524, 'loss/train': 1.5924121141433716} -11/06/2021 22:34:22 - INFO - __main__ - Step 9526: {'lr': 0.0004968174463437881, 'samples': 1828992, 'steps': 9525, 'loss/train': 1.3622881174087524} -11/06/2021 22:34:22 - INFO - __main__ - Step 9527: {'lr': 0.0004968166022259974, 'samples': 1829184, 'steps': 9526, 'loss/train': 1.6611684560775757} -11/06/2021 22:34:23 - INFO - __main__ - Step 9528: {'lr': 0.0004968157579969951, 'samples': 1829376, 'steps': 9527, 'loss/train': 1.8583652973175049} -11/06/2021 22:34:23 - INFO - __main__ - Step 9529: {'lr': 0.0004968149136567814, 'samples': 1829568, 'steps': 9528, 'loss/train': 1.5691323280334473} -11/06/2021 22:34:23 - INFO - __main__ - Step 9530: {'lr': 0.0004968140692053567, 'samples': 1829760, 'steps': 9529, 'loss/train': 1.7236870527267456} -11/06/2021 22:34:24 - INFO - __main__ - Step 9531: {'lr': 0.0004968132246427212, 'samples': 1829952, 'steps': 9530, 'loss/train': 2.275637149810791} -11/06/2021 22:34:25 - INFO - __main__ - Step 9532: {'lr': 0.0004968123799688757, 'samples': 1830144, 'steps': 9531, 'loss/train': 1.7203338146209717} -11/06/2021 22:34:25 - INFO - __main__ - Step 9533: {'lr': 0.0004968115351838203, 'samples': 1830336, 'steps': 9532, 'loss/train': 2.002017021179199} -11/06/2021 22:34:26 - INFO - __main__ - Step 9534: {'lr': 0.0004968106902875554, 'samples': 1830528, 'steps': 9533, 'loss/train': 1.5515137910842896} -11/06/2021 22:34:26 - INFO - __main__ - Step 9535: {'lr': 0.0004968098452800815, 'samples': 1830720, 'steps': 9534, 'loss/train': 1.9174106121063232} -11/06/2021 22:34:26 - INFO - __main__ - Step 9536: {'lr': 0.0004968090001613987, 'samples': 1830912, 'steps': 9535, 'loss/train': 1.4403159618377686} -11/06/2021 22:34:27 - INFO - __main__ - Step 9537: {'lr': 0.0004968081549315078, 'samples': 1831104, 'steps': 9536, 'loss/train': 1.640446662902832} -11/06/2021 22:34:28 - INFO - __main__ - Step 9538: {'lr': 0.0004968073095904088, 'samples': 1831296, 'steps': 9537, 'loss/train': 1.7125294208526611} -11/06/2021 22:34:28 - INFO - __main__ - Step 9539: {'lr': 0.0004968064641381022, 'samples': 1831488, 'steps': 9538, 'loss/train': 2.010976552963257} -11/06/2021 22:34:28 - INFO - __main__ - Step 9540: {'lr': 0.0004968056185745886, 'samples': 1831680, 'steps': 9539, 'loss/train': 2.09594464302063} -11/06/2021 22:34:29 - INFO - __main__ - Step 9541: {'lr': 0.000496804772899868, 'samples': 1831872, 'steps': 9540, 'loss/train': 1.843455195426941} -11/06/2021 22:34:30 - INFO - __main__ - Step 9542: {'lr': 0.0004968039271139412, 'samples': 1832064, 'steps': 9541, 'loss/train': 2.009514331817627} -11/06/2021 22:34:30 - INFO - __main__ - Step 9543: {'lr': 0.0004968030812168082, 'samples': 1832256, 'steps': 9542, 'loss/train': 1.7577793598175049} -11/06/2021 22:34:30 - INFO - __main__ - Step 9544: {'lr': 0.0004968022352084695, 'samples': 1832448, 'steps': 9543, 'loss/train': 2.0828323364257812} -11/06/2021 22:34:31 - INFO - __main__ - Step 9545: {'lr': 0.0004968013890889256, 'samples': 1832640, 'steps': 9544, 'loss/train': 1.7458568811416626} -11/06/2021 22:34:31 - INFO - __main__ - Step 9546: {'lr': 0.0004968005428581767, 'samples': 1832832, 'steps': 9545, 'loss/train': 2.1240222454071045} -11/06/2021 22:34:32 - INFO - __main__ - Step 9547: {'lr': 0.0004967996965162235, 'samples': 1833024, 'steps': 9546, 'loss/train': 1.8390196561813354} -11/06/2021 22:34:32 - INFO - __main__ - Step 9548: {'lr': 0.0004967988500630661, 'samples': 1833216, 'steps': 9547, 'loss/train': 1.910079836845398} -11/06/2021 22:34:33 - INFO - __main__ - Step 9549: {'lr': 0.0004967980034987048, 'samples': 1833408, 'steps': 9548, 'loss/train': 2.003260374069214} -11/06/2021 22:34:33 - INFO - __main__ - Step 9550: {'lr': 0.0004967971568231402, 'samples': 1833600, 'steps': 9549, 'loss/train': 1.5235668420791626} -11/06/2021 22:34:33 - INFO - __main__ - Step 9551: {'lr': 0.0004967963100363726, 'samples': 1833792, 'steps': 9550, 'loss/train': 1.7840920686721802} -11/06/2021 22:34:35 - INFO - __main__ - Step 9552: {'lr': 0.0004967954631384025, 'samples': 1833984, 'steps': 9551, 'loss/train': 1.2505114078521729} -11/06/2021 22:34:35 - INFO - __main__ - Step 9553: {'lr': 0.00049679461612923, 'samples': 1834176, 'steps': 9552, 'loss/train': 1.4225518703460693} -11/06/2021 22:34:36 - INFO - __main__ - Step 9554: {'lr': 0.0004967937690088558, 'samples': 1834368, 'steps': 9553, 'loss/train': 2.004608154296875} -11/06/2021 22:34:36 - INFO - __main__ - Step 9555: {'lr': 0.0004967929217772801, 'samples': 1834560, 'steps': 9554, 'loss/train': 2.0895955562591553} -11/06/2021 22:34:36 - INFO - __main__ - Step 9556: {'lr': 0.0004967920744345033, 'samples': 1834752, 'steps': 9555, 'loss/train': 0.44858700037002563} -11/06/2021 22:34:37 - INFO - __main__ - Step 9557: {'lr': 0.0004967912269805257, 'samples': 1834944, 'steps': 9556, 'loss/train': 2.1345250606536865} -11/06/2021 22:34:38 - INFO - __main__ - Step 9558: {'lr': 0.000496790379415348, 'samples': 1835136, 'steps': 9557, 'loss/train': 1.6229137182235718} -11/06/2021 22:34:38 - INFO - __main__ - Step 9559: {'lr': 0.0004967895317389702, 'samples': 1835328, 'steps': 9558, 'loss/train': 1.6342477798461914} -11/06/2021 22:34:38 - INFO - __main__ - Step 9560: {'lr': 0.0004967886839513929, 'samples': 1835520, 'steps': 9559, 'loss/train': 1.9332375526428223} -11/06/2021 22:34:39 - INFO - __main__ - Step 9561: {'lr': 0.0004967878360526163, 'samples': 1835712, 'steps': 9560, 'loss/train': 1.733110785484314} -11/06/2021 22:34:39 - INFO - __main__ - Step 9562: {'lr': 0.0004967869880426411, 'samples': 1835904, 'steps': 9561, 'loss/train': 1.7204447984695435} -11/06/2021 22:34:40 - INFO - __main__ - Step 9563: {'lr': 0.0004967861399214674, 'samples': 1836096, 'steps': 9562, 'loss/train': 1.7751929759979248} -11/06/2021 22:34:40 - INFO - __main__ - Step 9564: {'lr': 0.0004967852916890958, 'samples': 1836288, 'steps': 9563, 'loss/train': 1.7982103824615479} -11/06/2021 22:34:41 - INFO - __main__ - Step 9565: {'lr': 0.0004967844433455263, 'samples': 1836480, 'steps': 9564, 'loss/train': 2.2210209369659424} -11/06/2021 22:34:41 - INFO - __main__ - Step 9566: {'lr': 0.0004967835948907598, 'samples': 1836672, 'steps': 9565, 'loss/train': 1.8117777109146118} -11/06/2021 22:34:41 - INFO - __main__ - Step 9567: {'lr': 0.0004967827463247962, 'samples': 1836864, 'steps': 9566, 'loss/train': 1.7700427770614624} -11/06/2021 22:34:42 - INFO - __main__ - Step 9568: {'lr': 0.0004967818976476363, 'samples': 1837056, 'steps': 9567, 'loss/train': 1.9625296592712402} -11/06/2021 22:34:43 - INFO - __main__ - Step 9569: {'lr': 0.0004967810488592801, 'samples': 1837248, 'steps': 9568, 'loss/train': 1.7147427797317505} -11/06/2021 22:34:43 - INFO - __main__ - Step 9570: {'lr': 0.0004967801999597283, 'samples': 1837440, 'steps': 9569, 'loss/train': 1.954040765762329} -11/06/2021 22:34:43 - INFO - __main__ - Step 9571: {'lr': 0.0004967793509489811, 'samples': 1837632, 'steps': 9570, 'loss/train': 2.0516250133514404} -11/06/2021 22:34:44 - INFO - __main__ - Step 9572: {'lr': 0.0004967785018270389, 'samples': 1837824, 'steps': 9571, 'loss/train': 1.2908155918121338} -11/06/2021 22:34:45 - INFO - __main__ - Step 9573: {'lr': 0.0004967776525939022, 'samples': 1838016, 'steps': 9572, 'loss/train': 1.586142897605896} -11/06/2021 22:34:45 - INFO - __main__ - Step 9574: {'lr': 0.0004967768032495712, 'samples': 1838208, 'steps': 9573, 'loss/train': 1.9211750030517578} -11/06/2021 22:34:46 - INFO - __main__ - Step 9575: {'lr': 0.0004967759537940464, 'samples': 1838400, 'steps': 9574, 'loss/train': 6.170900821685791} -11/06/2021 22:34:46 - INFO - __main__ - Step 9576: {'lr': 0.0004967751042273282, 'samples': 1838592, 'steps': 9575, 'loss/train': 2.606065273284912} -11/06/2021 22:34:46 - INFO - __main__ - Step 9577: {'lr': 0.000496774254549417, 'samples': 1838784, 'steps': 9576, 'loss/train': 1.8838642835617065} -11/06/2021 22:34:47 - INFO - __main__ - Step 9578: {'lr': 0.0004967734047603131, 'samples': 1838976, 'steps': 9577, 'loss/train': 1.8725879192352295} -11/06/2021 22:34:48 - INFO - __main__ - Step 9579: {'lr': 0.0004967725548600168, 'samples': 1839168, 'steps': 9578, 'loss/train': 1.7218821048736572} -11/06/2021 22:34:48 - INFO - __main__ - Step 9580: {'lr': 0.0004967717048485287, 'samples': 1839360, 'steps': 9579, 'loss/train': 2.031545400619507} -11/06/2021 22:34:48 - INFO - __main__ - Step 9581: {'lr': 0.000496770854725849, 'samples': 1839552, 'steps': 9580, 'loss/train': 1.9540653228759766} -11/06/2021 22:34:49 - INFO - __main__ - Step 9582: {'lr': 0.0004967700044919783, 'samples': 1839744, 'steps': 9581, 'loss/train': 2.139894485473633} -11/06/2021 22:34:49 - INFO - __main__ - Step 9583: {'lr': 0.0004967691541469167, 'samples': 1839936, 'steps': 9582, 'loss/train': 1.7633771896362305} -11/06/2021 22:34:50 - INFO - __main__ - Step 9584: {'lr': 0.0004967683036906648, 'samples': 1840128, 'steps': 9583, 'loss/train': 2.204907178878784} -11/06/2021 22:34:50 - INFO - __main__ - Step 9585: {'lr': 0.0004967674531232229, 'samples': 1840320, 'steps': 9584, 'loss/train': 1.9411033391952515} -11/06/2021 22:34:51 - INFO - __main__ - Step 9586: {'lr': 0.0004967666024445913, 'samples': 1840512, 'steps': 9585, 'loss/train': 1.1677578687667847} -11/06/2021 22:34:51 - INFO - __main__ - Step 9587: {'lr': 0.0004967657516547707, 'samples': 1840704, 'steps': 9586, 'loss/train': 1.5230824947357178} -11/06/2021 22:34:51 - INFO - __main__ - Step 9588: {'lr': 0.0004967649007537611, 'samples': 1840896, 'steps': 9587, 'loss/train': 1.3074101209640503} -11/06/2021 22:34:52 - INFO - __main__ - Step 9589: {'lr': 0.0004967640497415631, 'samples': 1841088, 'steps': 9588, 'loss/train': 2.527937412261963} -11/06/2021 22:34:53 - INFO - __main__ - Step 9590: {'lr': 0.000496763198618177, 'samples': 1841280, 'steps': 9589, 'loss/train': 2.1263439655303955} -11/06/2021 22:34:53 - INFO - __main__ - Step 9591: {'lr': 0.0004967623473836032, 'samples': 1841472, 'steps': 9590, 'loss/train': 1.8565070629119873} -11/06/2021 22:34:53 - INFO - __main__ - Step 9592: {'lr': 0.0004967614960378421, 'samples': 1841664, 'steps': 9591, 'loss/train': 2.0305135250091553} -11/06/2021 22:34:54 - INFO - __main__ - Step 9593: {'lr': 0.000496760644580894, 'samples': 1841856, 'steps': 9592, 'loss/train': 1.905313491821289} -11/06/2021 22:34:55 - INFO - __main__ - Step 9594: {'lr': 0.0004967597930127595, 'samples': 1842048, 'steps': 9593, 'loss/train': 2.1325924396514893} -11/06/2021 22:34:55 - INFO - __main__ - Step 9595: {'lr': 0.0004967589413334387, 'samples': 1842240, 'steps': 9594, 'loss/train': 1.6247498989105225} -11/06/2021 22:34:56 - INFO - __main__ - Step 9596: {'lr': 0.0004967580895429322, 'samples': 1842432, 'steps': 9595, 'loss/train': 1.7681033611297607} -11/06/2021 22:34:56 - INFO - __main__ - Step 9597: {'lr': 0.0004967572376412405, 'samples': 1842624, 'steps': 9596, 'loss/train': 1.8701852560043335} -11/06/2021 22:34:56 - INFO - __main__ - Step 9598: {'lr': 0.0004967563856283636, 'samples': 1842816, 'steps': 9597, 'loss/train': 1.6864864826202393} -11/06/2021 22:34:58 - INFO - __main__ - Step 9599: {'lr': 0.000496755533504302, 'samples': 1843008, 'steps': 9598, 'loss/train': 1.842852234840393} -11/06/2021 22:34:58 - INFO - __main__ - Step 9600: {'lr': 0.0004967546812690563, 'samples': 1843200, 'steps': 9599, 'loss/train': 1.65439772605896} -11/06/2021 22:34:58 - INFO - __main__ - Step 9601: {'lr': 0.0004967538289226267, 'samples': 1843392, 'steps': 9600, 'loss/train': 1.5017353296279907} -11/06/2021 22:34:59 - INFO - __main__ - Step 9602: {'lr': 0.0004967529764650137, 'samples': 1843584, 'steps': 9601, 'loss/train': 1.895011067390442} -11/06/2021 22:34:59 - INFO - __main__ - Step 9603: {'lr': 0.0004967521238962175, 'samples': 1843776, 'steps': 9602, 'loss/train': 1.7376617193222046} -11/06/2021 22:34:59 - INFO - __main__ - Step 9604: {'lr': 0.0004967512712162387, 'samples': 1843968, 'steps': 9603, 'loss/train': 1.7263696193695068} -11/06/2021 22:35:00 - INFO - __main__ - Step 9605: {'lr': 0.0004967504184250775, 'samples': 1844160, 'steps': 9604, 'loss/train': 2.917311906814575} -11/06/2021 22:35:01 - INFO - __main__ - Step 9606: {'lr': 0.0004967495655227344, 'samples': 1844352, 'steps': 9605, 'loss/train': 2.3843181133270264} -11/06/2021 22:35:01 - INFO - __main__ - Step 9607: {'lr': 0.0004967487125092098, 'samples': 1844544, 'steps': 9606, 'loss/train': 1.349475622177124} -11/06/2021 22:35:02 - INFO - __main__ - Step 9608: {'lr': 0.0004967478593845041, 'samples': 1844736, 'steps': 9607, 'loss/train': 1.40731942653656} -11/06/2021 22:35:02 - INFO - __main__ - Step 9609: {'lr': 0.0004967470061486175, 'samples': 1844928, 'steps': 9608, 'loss/train': 1.621782660484314} -11/06/2021 22:35:02 - INFO - __main__ - Step 9610: {'lr': 0.0004967461528015506, 'samples': 1845120, 'steps': 9609, 'loss/train': 1.7241379022598267} -11/06/2021 22:35:03 - INFO - __main__ - Step 9611: {'lr': 0.0004967452993433036, 'samples': 1845312, 'steps': 9610, 'loss/train': 1.7397297620773315} -11/06/2021 22:35:04 - INFO - __main__ - Step 9612: {'lr': 0.0004967444457738769, 'samples': 1845504, 'steps': 9611, 'loss/train': 1.5325270891189575} -11/06/2021 22:35:04 - INFO - __main__ - Step 9613: {'lr': 0.0004967435920932711, 'samples': 1845696, 'steps': 9612, 'loss/train': 1.8796131610870361} -11/06/2021 22:35:04 - INFO - __main__ - Step 9614: {'lr': 0.0004967427383014865, 'samples': 1845888, 'steps': 9613, 'loss/train': 2.0587081909179688} -11/06/2021 22:35:05 - INFO - __main__ - Step 9615: {'lr': 0.0004967418843985233, 'samples': 1846080, 'steps': 9614, 'loss/train': 1.6247023344039917} -11/06/2021 22:35:06 - INFO - __main__ - Step 9616: {'lr': 0.0004967410303843821, 'samples': 1846272, 'steps': 9615, 'loss/train': 2.14107346534729} -11/06/2021 22:35:06 - INFO - __main__ - Step 9617: {'lr': 0.0004967401762590631, 'samples': 1846464, 'steps': 9616, 'loss/train': 1.674919605255127} -11/06/2021 22:35:06 - INFO - __main__ - Step 9618: {'lr': 0.0004967393220225668, 'samples': 1846656, 'steps': 9617, 'loss/train': 1.9346179962158203} -11/06/2021 22:35:07 - INFO - __main__ - Step 9619: {'lr': 0.0004967384676748936, 'samples': 1846848, 'steps': 9618, 'loss/train': 1.5423815250396729} -11/06/2021 22:35:07 - INFO - __main__ - Step 9620: {'lr': 0.0004967376132160438, 'samples': 1847040, 'steps': 9619, 'loss/train': 2.3580563068389893} -11/06/2021 22:35:08 - INFO - __main__ - Step 9621: {'lr': 0.000496736758646018, 'samples': 1847232, 'steps': 9620, 'loss/train': 1.7103986740112305} -11/06/2021 22:35:09 - INFO - __main__ - Step 9622: {'lr': 0.0004967359039648163, 'samples': 1847424, 'steps': 9621, 'loss/train': 1.5623164176940918} -11/06/2021 22:35:09 - INFO - __main__ - Step 9623: {'lr': 0.0004967350491724392, 'samples': 1847616, 'steps': 9622, 'loss/train': 1.5282793045043945} -11/06/2021 22:35:09 - INFO - __main__ - Step 9624: {'lr': 0.0004967341942688872, 'samples': 1847808, 'steps': 9623, 'loss/train': 1.75148344039917} -11/06/2021 22:35:10 - INFO - __main__ - Step 9625: {'lr': 0.0004967333392541604, 'samples': 1848000, 'steps': 9624, 'loss/train': 1.2734038829803467} -11/06/2021 22:35:11 - INFO - __main__ - Step 9626: {'lr': 0.0004967324841282596, 'samples': 1848192, 'steps': 9625, 'loss/train': 1.7880160808563232} -11/06/2021 22:35:11 - INFO - __main__ - Step 9627: {'lr': 0.0004967316288911847, 'samples': 1848384, 'steps': 9626, 'loss/train': 1.675197958946228} -11/06/2021 22:35:11 - INFO - __main__ - Step 9628: {'lr': 0.0004967307735429365, 'samples': 1848576, 'steps': 9627, 'loss/train': 2.0006182193756104} -11/06/2021 22:35:12 - INFO - __main__ - Step 9629: {'lr': 0.0004967299180835153, 'samples': 1848768, 'steps': 9628, 'loss/train': 1.4124494791030884} -11/06/2021 22:35:12 - INFO - __main__ - Step 9630: {'lr': 0.0004967290625129212, 'samples': 1848960, 'steps': 9629, 'loss/train': 1.5025792121887207} -11/06/2021 22:35:12 - INFO - __main__ - Step 9631: {'lr': 0.0004967282068311548, 'samples': 1849152, 'steps': 9630, 'loss/train': 2.0721802711486816} -11/06/2021 22:35:14 - INFO - __main__ - Step 9632: {'lr': 0.0004967273510382166, 'samples': 1849344, 'steps': 9631, 'loss/train': 1.781577229499817} -11/06/2021 22:35:14 - INFO - __main__ - Step 9633: {'lr': 0.0004967264951341069, 'samples': 1849536, 'steps': 9632, 'loss/train': 1.7446000576019287} -11/06/2021 22:35:14 - INFO - __main__ - Step 9634: {'lr': 0.0004967256391188258, 'samples': 1849728, 'steps': 9633, 'loss/train': 1.9075095653533936} -11/06/2021 22:35:15 - INFO - __main__ - Step 9635: {'lr': 0.0004967247829923742, 'samples': 1849920, 'steps': 9634, 'loss/train': 2.3468635082244873} -11/06/2021 22:35:15 - INFO - __main__ - Step 9636: {'lr': 0.0004967239267547521, 'samples': 1850112, 'steps': 9635, 'loss/train': 1.420114278793335} -11/06/2021 22:35:16 - INFO - __main__ - Step 9637: {'lr': 0.00049672307040596, 'samples': 1850304, 'steps': 9636, 'loss/train': 1.8249211311340332} -11/06/2021 22:35:17 - INFO - __main__ - Step 9638: {'lr': 0.0004967222139459983, 'samples': 1850496, 'steps': 9637, 'loss/train': 0.8801685571670532} -11/06/2021 22:35:17 - INFO - __main__ - Step 9639: {'lr': 0.0004967213573748674, 'samples': 1850688, 'steps': 9638, 'loss/train': 1.8244924545288086} -11/06/2021 22:35:17 - INFO - __main__ - Step 9640: {'lr': 0.0004967205006925677, 'samples': 1850880, 'steps': 9639, 'loss/train': 1.8652440309524536} -11/06/2021 22:35:18 - INFO - __main__ - Step 9641: {'lr': 0.0004967196438990995, 'samples': 1851072, 'steps': 9640, 'loss/train': 1.3965966701507568} -11/06/2021 22:35:18 - INFO - __main__ - Step 9642: {'lr': 0.0004967187869944632, 'samples': 1851264, 'steps': 9641, 'loss/train': 2.0054564476013184} -11/06/2021 22:35:19 - INFO - __main__ - Step 9643: {'lr': 0.0004967179299786593, 'samples': 1851456, 'steps': 9642, 'loss/train': 0.7685950994491577} -11/06/2021 22:35:19 - INFO - __main__ - Step 9644: {'lr': 0.000496717072851688, 'samples': 1851648, 'steps': 9643, 'loss/train': 1.9576327800750732} -11/06/2021 22:35:20 - INFO - __main__ - Step 9645: {'lr': 0.0004967162156135499, 'samples': 1851840, 'steps': 9644, 'loss/train': 1.0496654510498047} -11/06/2021 22:35:20 - INFO - __main__ - Step 9646: {'lr': 0.0004967153582642452, 'samples': 1852032, 'steps': 9645, 'loss/train': 5.934883117675781} -11/06/2021 22:35:21 - INFO - __main__ - Step 9647: {'lr': 0.0004967145008037744, 'samples': 1852224, 'steps': 9646, 'loss/train': 1.2428544759750366} -11/06/2021 22:35:21 - INFO - __main__ - Step 9648: {'lr': 0.000496713643232138, 'samples': 1852416, 'steps': 9647, 'loss/train': 1.7407283782958984} -11/06/2021 22:35:22 - INFO - __main__ - Step 9649: {'lr': 0.000496712785549336, 'samples': 1852608, 'steps': 9648, 'loss/train': 1.9216516017913818} -11/06/2021 22:35:22 - INFO - __main__ - Step 9650: {'lr': 0.0004967119277553692, 'samples': 1852800, 'steps': 9649, 'loss/train': 1.5039646625518799} -11/06/2021 22:35:23 - INFO - __main__ - Step 9651: {'lr': 0.0004967110698502377, 'samples': 1852992, 'steps': 9650, 'loss/train': 1.7824867963790894} -11/06/2021 22:35:23 - INFO - __main__ - Step 9652: {'lr': 0.000496710211833942, 'samples': 1853184, 'steps': 9651, 'loss/train': 1.6737051010131836} -11/06/2021 22:35:24 - INFO - __main__ - Step 9653: {'lr': 0.0004967093537064825, 'samples': 1853376, 'steps': 9652, 'loss/train': 2.1513617038726807} -11/06/2021 22:35:24 - INFO - __main__ - Step 9654: {'lr': 0.0004967084954678597, 'samples': 1853568, 'steps': 9653, 'loss/train': 2.3092923164367676} -11/06/2021 22:35:25 - INFO - __main__ - Step 9655: {'lr': 0.0004967076371180738, 'samples': 1853760, 'steps': 9654, 'loss/train': 1.796209454536438} -11/06/2021 22:35:25 - INFO - __main__ - Step 9656: {'lr': 0.0004967067786571251, 'samples': 1853952, 'steps': 9655, 'loss/train': 1.7951509952545166} -11/06/2021 22:35:25 - INFO - __main__ - Step 9657: {'lr': 0.0004967059200850142, 'samples': 1854144, 'steps': 9656, 'loss/train': 1.7078092098236084} -11/06/2021 22:35:26 - INFO - __main__ - Step 9658: {'lr': 0.0004967050614017415, 'samples': 1854336, 'steps': 9657, 'loss/train': 2.276421546936035} -11/06/2021 22:35:27 - INFO - __main__ - Step 9659: {'lr': 0.0004967042026073073, 'samples': 1854528, 'steps': 9658, 'loss/train': 2.434033155441284} -11/06/2021 22:35:27 - INFO - __main__ - Step 9660: {'lr': 0.000496703343701712, 'samples': 1854720, 'steps': 9659, 'loss/train': 2.1363980770111084} -11/06/2021 22:35:28 - INFO - __main__ - Step 9661: {'lr': 0.0004967024846849558, 'samples': 1854912, 'steps': 9660, 'loss/train': 1.4073458909988403} -11/06/2021 22:35:28 - INFO - __main__ - Step 9662: {'lr': 0.0004967016255570394, 'samples': 1855104, 'steps': 9661, 'loss/train': 1.8968331813812256} -11/06/2021 22:35:28 - INFO - __main__ - Step 9663: {'lr': 0.0004967007663179632, 'samples': 1855296, 'steps': 9662, 'loss/train': 1.9019638299942017} -11/06/2021 22:35:29 - INFO - __main__ - Step 9664: {'lr': 0.0004966999069677272, 'samples': 1855488, 'steps': 9663, 'loss/train': 1.987317681312561} -11/06/2021 22:35:30 - INFO - __main__ - Step 9665: {'lr': 0.0004966990475063321, 'samples': 1855680, 'steps': 9664, 'loss/train': 1.3810869455337524} -11/06/2021 22:35:30 - INFO - __main__ - Step 9666: {'lr': 0.0004966981879337783, 'samples': 1855872, 'steps': 9665, 'loss/train': 1.1948487758636475} -11/06/2021 22:35:30 - INFO - __main__ - Step 9667: {'lr': 0.0004966973282500661, 'samples': 1856064, 'steps': 9666, 'loss/train': 1.8805911540985107} -11/06/2021 22:35:31 - INFO - __main__ - Step 9668: {'lr': 0.0004966964684551958, 'samples': 1856256, 'steps': 9667, 'loss/train': 1.9904563426971436} -11/06/2021 22:35:32 - INFO - __main__ - Step 9669: {'lr': 0.0004966956085491679, 'samples': 1856448, 'steps': 9668, 'loss/train': 1.7589201927185059} -11/06/2021 22:35:32 - INFO - __main__ - Step 9670: {'lr': 0.0004966947485319828, 'samples': 1856640, 'steps': 9669, 'loss/train': 2.156191825866699} -11/06/2021 22:35:32 - INFO - __main__ - Step 9671: {'lr': 0.0004966938884036408, 'samples': 1856832, 'steps': 9670, 'loss/train': 1.8533520698547363} -11/06/2021 22:35:33 - INFO - __main__ - Step 9672: {'lr': 0.0004966930281641423, 'samples': 1857024, 'steps': 9671, 'loss/train': 2.1764333248138428} -11/06/2021 22:35:33 - INFO - __main__ - Step 9673: {'lr': 0.0004966921678134879, 'samples': 1857216, 'steps': 9672, 'loss/train': 2.0473735332489014} -11/06/2021 22:35:34 - INFO - __main__ - Step 9674: {'lr': 0.0004966913073516777, 'samples': 1857408, 'steps': 9673, 'loss/train': 2.0089006423950195} -11/06/2021 22:35:35 - INFO - __main__ - Step 9675: {'lr': 0.0004966904467787123, 'samples': 1857600, 'steps': 9674, 'loss/train': 1.5391348600387573} -11/06/2021 22:35:35 - INFO - __main__ - Step 9676: {'lr': 0.0004966895860945918, 'samples': 1857792, 'steps': 9675, 'loss/train': 0.35723814368247986} -11/06/2021 22:35:35 - INFO - __main__ - Step 9677: {'lr': 0.0004966887252993169, 'samples': 1857984, 'steps': 9676, 'loss/train': 1.9116827249526978} -11/06/2021 22:35:36 - INFO - __main__ - Step 9678: {'lr': 0.0004966878643928879, 'samples': 1858176, 'steps': 9677, 'loss/train': 2.0364251136779785} -11/06/2021 22:35:37 - INFO - __main__ - Step 9679: {'lr': 0.0004966870033753051, 'samples': 1858368, 'steps': 9678, 'loss/train': 2.400313138961792} -11/06/2021 22:35:37 - INFO - __main__ - Step 9680: {'lr': 0.0004966861422465689, 'samples': 1858560, 'steps': 9679, 'loss/train': 1.7770127058029175} -11/06/2021 22:35:37 - INFO - __main__ - Step 9681: {'lr': 0.0004966852810066798, 'samples': 1858752, 'steps': 9680, 'loss/train': 1.5626760721206665} -11/06/2021 22:35:38 - INFO - __main__ - Step 9682: {'lr': 0.0004966844196556382, 'samples': 1858944, 'steps': 9681, 'loss/train': 1.113672137260437} -11/06/2021 22:35:38 - INFO - __main__ - Step 9683: {'lr': 0.0004966835581934442, 'samples': 1859136, 'steps': 9682, 'loss/train': 1.9191310405731201} -11/06/2021 22:35:39 - INFO - __main__ - Step 9684: {'lr': 0.0004966826966200985, 'samples': 1859328, 'steps': 9683, 'loss/train': 1.801482915878296} -11/06/2021 22:35:40 - INFO - __main__ - Step 9685: {'lr': 0.0004966818349356015, 'samples': 1859520, 'steps': 9684, 'loss/train': 2.271620273590088} -11/06/2021 22:35:40 - INFO - __main__ - Step 9686: {'lr': 0.0004966809731399533, 'samples': 1859712, 'steps': 9685, 'loss/train': 1.5356147289276123} -11/06/2021 22:35:40 - INFO - __main__ - Step 9687: {'lr': 0.0004966801112331545, 'samples': 1859904, 'steps': 9686, 'loss/train': 1.8079742193222046} -11/06/2021 22:35:41 - INFO - __main__ - Step 9688: {'lr': 0.0004966792492152054, 'samples': 1860096, 'steps': 9687, 'loss/train': 1.7540109157562256} -11/06/2021 22:35:41 - INFO - __main__ - Step 9689: {'lr': 0.0004966783870861066, 'samples': 1860288, 'steps': 9688, 'loss/train': 1.8654999732971191} -11/06/2021 22:35:42 - INFO - __main__ - Step 9690: {'lr': 0.0004966775248458582, 'samples': 1860480, 'steps': 9689, 'loss/train': 1.8638839721679688} -11/06/2021 22:35:42 - INFO - __main__ - Step 9691: {'lr': 0.0004966766624944607, 'samples': 1860672, 'steps': 9690, 'loss/train': 1.839411735534668} -11/06/2021 22:35:43 - INFO - __main__ - Step 9692: {'lr': 0.0004966758000319147, 'samples': 1860864, 'steps': 9691, 'loss/train': 1.5078877210617065} -11/06/2021 22:35:43 - INFO - __main__ - Step 9693: {'lr': 0.0004966749374582202, 'samples': 1861056, 'steps': 9692, 'loss/train': 2.1486093997955322} -11/06/2021 22:35:43 - INFO - __main__ - Step 9694: {'lr': 0.0004966740747733778, 'samples': 1861248, 'steps': 9693, 'loss/train': 2.061601161956787} -11/06/2021 22:35:44 - INFO - __main__ - Step 9695: {'lr': 0.0004966732119773879, 'samples': 1861440, 'steps': 9694, 'loss/train': 1.997467279434204} -11/06/2021 22:35:45 - INFO - __main__ - Step 9696: {'lr': 0.0004966723490702509, 'samples': 1861632, 'steps': 9695, 'loss/train': 1.515207052230835} -11/06/2021 22:35:45 - INFO - __main__ - Step 9697: {'lr': 0.000496671486051967, 'samples': 1861824, 'steps': 9696, 'loss/train': 1.542418122291565} -11/06/2021 22:35:45 - INFO - __main__ - Step 9698: {'lr': 0.0004966706229225368, 'samples': 1862016, 'steps': 9697, 'loss/train': 1.7097152471542358} -11/06/2021 22:35:46 - INFO - __main__ - Step 9699: {'lr': 0.0004966697596819607, 'samples': 1862208, 'steps': 9698, 'loss/train': 1.9859890937805176} -11/06/2021 22:35:47 - INFO - __main__ - Step 9700: {'lr': 0.0004966688963302389, 'samples': 1862400, 'steps': 9699, 'loss/train': 1.6902731657028198} -11/06/2021 22:35:47 - INFO - __main__ - Step 9701: {'lr': 0.000496668032867372, 'samples': 1862592, 'steps': 9700, 'loss/train': 2.2249433994293213} -11/06/2021 22:35:48 - INFO - __main__ - Step 9702: {'lr': 0.0004966671692933603, 'samples': 1862784, 'steps': 9701, 'loss/train': 2.1209845542907715} -11/06/2021 22:35:48 - INFO - __main__ - Step 9703: {'lr': 0.0004966663056082041, 'samples': 1862976, 'steps': 9702, 'loss/train': 2.0231058597564697} -11/06/2021 22:35:48 - INFO - __main__ - Step 9704: {'lr': 0.0004966654418119039, 'samples': 1863168, 'steps': 9703, 'loss/train': 1.7849528789520264} -11/06/2021 22:35:49 - INFO - __main__ - Step 9705: {'lr': 0.00049666457790446, 'samples': 1863360, 'steps': 9704, 'loss/train': 1.677087664604187} -11/06/2021 22:35:49 - INFO - __main__ - Step 9706: {'lr': 0.000496663713885873, 'samples': 1863552, 'steps': 9705, 'loss/train': 1.6094074249267578} -11/06/2021 22:35:50 - INFO - __main__ - Step 9707: {'lr': 0.0004966628497561431, 'samples': 1863744, 'steps': 9706, 'loss/train': 1.4655191898345947} -11/06/2021 22:35:50 - INFO - __main__ - Step 9708: {'lr': 0.0004966619855152706, 'samples': 1863936, 'steps': 9707, 'loss/train': 1.6858545541763306} -11/06/2021 22:35:51 - INFO - __main__ - Step 9709: {'lr': 0.0004966611211632561, 'samples': 1864128, 'steps': 9708, 'loss/train': 2.7526583671569824} -11/06/2021 22:35:51 - INFO - __main__ - Step 9710: {'lr': 0.0004966602567000999, 'samples': 1864320, 'steps': 9709, 'loss/train': 1.8276556730270386} -11/06/2021 22:35:52 - INFO - __main__ - Step 9711: {'lr': 0.0004966593921258023, 'samples': 1864512, 'steps': 9710, 'loss/train': 2.059382677078247} -11/06/2021 22:35:52 - INFO - __main__ - Step 9712: {'lr': 0.000496658527440364, 'samples': 1864704, 'steps': 9711, 'loss/train': 1.3967629671096802} -11/06/2021 22:35:53 - INFO - __main__ - Step 9713: {'lr': 0.000496657662643785, 'samples': 1864896, 'steps': 9712, 'loss/train': 1.2711286544799805} -11/06/2021 22:35:53 - INFO - __main__ - Step 9714: {'lr': 0.000496656797736066, 'samples': 1865088, 'steps': 9713, 'loss/train': 1.6706697940826416} -11/06/2021 22:35:53 - INFO - __main__ - Step 9715: {'lr': 0.0004966559327172071, 'samples': 1865280, 'steps': 9714, 'loss/train': 1.8991764783859253} -11/06/2021 22:35:54 - INFO - __main__ - Step 9716: {'lr': 0.0004966550675872089, 'samples': 1865472, 'steps': 9715, 'loss/train': 0.8012776970863342} -11/06/2021 22:35:55 - INFO - __main__ - Step 9717: {'lr': 0.0004966542023460718, 'samples': 1865664, 'steps': 9716, 'loss/train': 1.5615832805633545} -11/06/2021 22:35:55 - INFO - __main__ - Step 9718: {'lr': 0.000496653336993796, 'samples': 1865856, 'steps': 9717, 'loss/train': 1.8252805471420288} -11/06/2021 22:35:55 - INFO - __main__ - Step 9719: {'lr': 0.0004966524715303821, 'samples': 1866048, 'steps': 9718, 'loss/train': 1.7340925931930542} -11/06/2021 22:35:56 - INFO - __main__ - Step 9720: {'lr': 0.0004966516059558304, 'samples': 1866240, 'steps': 9719, 'loss/train': 1.9591999053955078} -11/06/2021 22:35:57 - INFO - __main__ - Step 9721: {'lr': 0.0004966507402701413, 'samples': 1866432, 'steps': 9720, 'loss/train': 1.574877142906189} -11/06/2021 22:35:57 - INFO - __main__ - Step 9722: {'lr': 0.0004966498744733151, 'samples': 1866624, 'steps': 9721, 'loss/train': 1.7162398099899292} -11/06/2021 22:35:58 - INFO - __main__ - Step 9723: {'lr': 0.0004966490085653523, 'samples': 1866816, 'steps': 9722, 'loss/train': 1.3233344554901123} -11/06/2021 22:35:58 - INFO - __main__ - Step 9724: {'lr': 0.0004966481425462533, 'samples': 1867008, 'steps': 9723, 'loss/train': 2.0228872299194336} -11/06/2021 22:35:58 - INFO - __main__ - Step 9725: {'lr': 0.0004966472764160183, 'samples': 1867200, 'steps': 9724, 'loss/train': 2.029508590698242} -11/06/2021 22:35:59 - INFO - __main__ - Step 9726: {'lr': 0.000496646410174648, 'samples': 1867392, 'steps': 9725, 'loss/train': 2.0226128101348877} -11/06/2021 22:36:00 - INFO - __main__ - Step 9727: {'lr': 0.0004966455438221427, 'samples': 1867584, 'steps': 9726, 'loss/train': 1.7145023345947266} -11/06/2021 22:36:00 - INFO - __main__ - Step 9728: {'lr': 0.0004966446773585026, 'samples': 1867776, 'steps': 9727, 'loss/train': 1.7100311517715454} -11/06/2021 22:36:00 - INFO - __main__ - Step 9729: {'lr': 0.0004966438107837283, 'samples': 1867968, 'steps': 9728, 'loss/train': 1.7535374164581299} -11/06/2021 22:36:01 - INFO - __main__ - Step 9730: {'lr': 0.00049664294409782, 'samples': 1868160, 'steps': 9729, 'loss/train': 1.442859172821045} -11/06/2021 22:36:01 - INFO - __main__ - Step 9731: {'lr': 0.0004966420773007782, 'samples': 1868352, 'steps': 9730, 'loss/train': 1.5532867908477783} -11/06/2021 22:36:02 - INFO - __main__ - Step 9732: {'lr': 0.0004966412103926034, 'samples': 1868544, 'steps': 9731, 'loss/train': 1.9052324295043945} -11/06/2021 22:36:02 - INFO - __main__ - Step 9733: {'lr': 0.0004966403433732958, 'samples': 1868736, 'steps': 9732, 'loss/train': 1.7569751739501953} -11/06/2021 22:36:03 - INFO - __main__ - Step 9734: {'lr': 0.0004966394762428559, 'samples': 1868928, 'steps': 9733, 'loss/train': 1.3910471200942993} -11/06/2021 22:36:03 - INFO - __main__ - Step 9735: {'lr': 0.0004966386090012841, 'samples': 1869120, 'steps': 9734, 'loss/train': 1.8945108652114868} -11/06/2021 22:36:03 - INFO - __main__ - Step 9736: {'lr': 0.0004966377416485806, 'samples': 1869312, 'steps': 9735, 'loss/train': 2.4226298332214355} -11/06/2021 22:36:05 - INFO - __main__ - Step 9737: {'lr': 0.0004966368741847461, 'samples': 1869504, 'steps': 9736, 'loss/train': 1.5357730388641357} -11/06/2021 22:36:05 - INFO - __main__ - Step 9738: {'lr': 0.0004966360066097807, 'samples': 1869696, 'steps': 9737, 'loss/train': 1.4675438404083252} -11/06/2021 22:36:05 - INFO - __main__ - Step 9739: {'lr': 0.0004966351389236851, 'samples': 1869888, 'steps': 9738, 'loss/train': 1.7604131698608398} -11/06/2021 22:36:06 - INFO - __main__ - Step 9740: {'lr': 0.0004966342711264593, 'samples': 1870080, 'steps': 9739, 'loss/train': 2.1939752101898193} -11/06/2021 22:36:06 - INFO - __main__ - Step 9741: {'lr': 0.000496633403218104, 'samples': 1870272, 'steps': 9740, 'loss/train': 1.855295181274414} -11/06/2021 22:36:07 - INFO - __main__ - Step 9742: {'lr': 0.0004966325351986195, 'samples': 1870464, 'steps': 9741, 'loss/train': 2.2889838218688965} -11/06/2021 22:36:07 - INFO - __main__ - Step 9743: {'lr': 0.0004966316670680062, 'samples': 1870656, 'steps': 9742, 'loss/train': 1.9611015319824219} -11/06/2021 22:36:08 - INFO - __main__ - Step 9744: {'lr': 0.0004966307988262644, 'samples': 1870848, 'steps': 9743, 'loss/train': 1.9820667505264282} -11/06/2021 22:36:08 - INFO - __main__ - Step 9745: {'lr': 0.0004966299304733947, 'samples': 1871040, 'steps': 9744, 'loss/train': 1.8761732578277588} -11/06/2021 22:36:08 - INFO - __main__ - Step 9746: {'lr': 0.0004966290620093972, 'samples': 1871232, 'steps': 9745, 'loss/train': 1.9568790197372437} -11/06/2021 22:36:09 - INFO - __main__ - Step 9747: {'lr': 0.0004966281934342725, 'samples': 1871424, 'steps': 9746, 'loss/train': 1.7533879280090332} -11/06/2021 22:36:10 - INFO - __main__ - Step 9748: {'lr': 0.000496627324748021, 'samples': 1871616, 'steps': 9747, 'loss/train': 2.03949236869812} -11/06/2021 22:36:10 - INFO - __main__ - Step 9749: {'lr': 0.000496626455950643, 'samples': 1871808, 'steps': 9748, 'loss/train': 2.50878643989563} -11/06/2021 22:36:10 - INFO - __main__ - Step 9750: {'lr': 0.000496625587042139, 'samples': 1872000, 'steps': 9749, 'loss/train': 1.5603324174880981} -11/06/2021 22:36:11 - INFO - __main__ - Step 9751: {'lr': 0.0004966247180225092, 'samples': 1872192, 'steps': 9750, 'loss/train': 1.700454592704773} -11/06/2021 22:36:11 - INFO - __main__ - Step 9752: {'lr': 0.0004966238488917542, 'samples': 1872384, 'steps': 9751, 'loss/train': 0.7267507910728455} -11/06/2021 22:36:12 - INFO - __main__ - Step 9753: {'lr': 0.0004966229796498742, 'samples': 1872576, 'steps': 9752, 'loss/train': 1.431842565536499} -11/06/2021 22:36:13 - INFO - __main__ - Step 9754: {'lr': 0.0004966221102968698, 'samples': 1872768, 'steps': 9753, 'loss/train': 1.7751144170761108} -11/06/2021 22:36:13 - INFO - __main__ - Step 9755: {'lr': 0.0004966212408327412, 'samples': 1872960, 'steps': 9754, 'loss/train': 1.7627856731414795} -11/06/2021 22:36:13 - INFO - __main__ - Step 9756: {'lr': 0.0004966203712574889, 'samples': 1873152, 'steps': 9755, 'loss/train': 2.068781852722168} -11/06/2021 22:36:14 - INFO - __main__ - Step 9757: {'lr': 0.0004966195015711132, 'samples': 1873344, 'steps': 9756, 'loss/train': 1.8314954042434692} -11/06/2021 22:36:15 - INFO - __main__ - Step 9758: {'lr': 0.0004966186317736146, 'samples': 1873536, 'steps': 9757, 'loss/train': 1.5385262966156006} -11/06/2021 22:36:15 - INFO - __main__ - Step 9759: {'lr': 0.0004966177618649935, 'samples': 1873728, 'steps': 9758, 'loss/train': 2.23832106590271} -11/06/2021 22:36:15 - INFO - __main__ - Step 9760: {'lr': 0.0004966168918452503, 'samples': 1873920, 'steps': 9759, 'loss/train': 2.2789201736450195} -11/06/2021 22:36:16 - INFO - __main__ - Step 9761: {'lr': 0.0004966160217143852, 'samples': 1874112, 'steps': 9760, 'loss/train': 1.4507635831832886} -11/06/2021 22:36:16 - INFO - __main__ - Step 9762: {'lr': 0.0004966151514723988, 'samples': 1874304, 'steps': 9761, 'loss/train': 1.7444387674331665} -11/06/2021 22:36:17 - INFO - __main__ - Step 9763: {'lr': 0.0004966142811192914, 'samples': 1874496, 'steps': 9762, 'loss/train': 2.5484769344329834} -11/06/2021 22:36:17 - INFO - __main__ - Step 9764: {'lr': 0.0004966134106550634, 'samples': 1874688, 'steps': 9763, 'loss/train': 2.3604612350463867} -11/06/2021 22:36:18 - INFO - __main__ - Step 9765: {'lr': 0.0004966125400797152, 'samples': 1874880, 'steps': 9764, 'loss/train': 1.8499844074249268} -11/06/2021 22:36:18 - INFO - __main__ - Step 9766: {'lr': 0.0004966116693932472, 'samples': 1875072, 'steps': 9765, 'loss/train': 2.1143555641174316} -11/06/2021 22:36:18 - INFO - __main__ - Step 9767: {'lr': 0.0004966107985956598, 'samples': 1875264, 'steps': 9766, 'loss/train': 1.2633049488067627} -11/06/2021 22:36:19 - INFO - __main__ - Step 9768: {'lr': 0.0004966099276869534, 'samples': 1875456, 'steps': 9767, 'loss/train': 1.519136667251587} -11/06/2021 22:36:20 - INFO - __main__ - Step 9769: {'lr': 0.0004966090566671283, 'samples': 1875648, 'steps': 9768, 'loss/train': 1.8271578550338745} -11/06/2021 22:36:20 - INFO - __main__ - Step 9770: {'lr': 0.000496608185536185, 'samples': 1875840, 'steps': 9769, 'loss/train': 1.837522268295288} -11/06/2021 22:36:20 - INFO - __main__ - Step 9771: {'lr': 0.0004966073142941239, 'samples': 1876032, 'steps': 9770, 'loss/train': 2.2010583877563477} -11/06/2021 22:36:21 - INFO - __main__ - Step 9772: {'lr': 0.0004966064429409452, 'samples': 1876224, 'steps': 9771, 'loss/train': 1.9248576164245605} -11/06/2021 22:36:22 - INFO - __main__ - Step 9773: {'lr': 0.0004966055714766496, 'samples': 1876416, 'steps': 9772, 'loss/train': 2.22214412689209} -11/06/2021 22:36:22 - INFO - __main__ - Step 9774: {'lr': 0.0004966046999012373, 'samples': 1876608, 'steps': 9773, 'loss/train': 1.0785945653915405} -11/06/2021 22:36:22 - INFO - __main__ - Step 9775: {'lr': 0.0004966038282147087, 'samples': 1876800, 'steps': 9774, 'loss/train': 1.5319066047668457} -11/06/2021 22:36:23 - INFO - __main__ - Step 9776: {'lr': 0.0004966029564170643, 'samples': 1876992, 'steps': 9775, 'loss/train': 1.8373252153396606} -11/06/2021 22:36:23 - INFO - __main__ - Step 9777: {'lr': 0.0004966020845083044, 'samples': 1877184, 'steps': 9776, 'loss/train': 1.9333018064498901} -11/06/2021 22:36:24 - INFO - __main__ - Step 9778: {'lr': 0.0004966012124884292, 'samples': 1877376, 'steps': 9777, 'loss/train': 1.7784291505813599} -11/06/2021 22:36:24 - INFO - __main__ - Step 9779: {'lr': 0.0004966003403574395, 'samples': 1877568, 'steps': 9778, 'loss/train': 2.0057530403137207} -11/06/2021 22:36:25 - INFO - __main__ - Step 9780: {'lr': 0.0004965994681153355, 'samples': 1877760, 'steps': 9779, 'loss/train': 1.3653117418289185} -11/06/2021 22:36:25 - INFO - __main__ - Step 9781: {'lr': 0.0004965985957621175, 'samples': 1877952, 'steps': 9780, 'loss/train': 1.5184459686279297} -11/06/2021 22:36:26 - INFO - __main__ - Step 9782: {'lr': 0.0004965977232977861, 'samples': 1878144, 'steps': 9781, 'loss/train': 1.0429720878601074} -11/06/2021 22:36:26 - INFO - __main__ - Step 9783: {'lr': 0.0004965968507223414, 'samples': 1878336, 'steps': 9782, 'loss/train': 1.5216965675354004} -11/06/2021 22:36:27 - INFO - __main__ - Step 9784: {'lr': 0.000496595978035784, 'samples': 1878528, 'steps': 9783, 'loss/train': 1.9085612297058105} -11/06/2021 22:36:27 - INFO - __main__ - Step 9785: {'lr': 0.0004965951052381144, 'samples': 1878720, 'steps': 9784, 'loss/train': 1.6528103351593018} -11/06/2021 22:36:28 - INFO - __main__ - Step 9786: {'lr': 0.0004965942323293328, 'samples': 1878912, 'steps': 9785, 'loss/train': 1.703324317932129} -11/06/2021 22:36:28 - INFO - __main__ - Step 9787: {'lr': 0.0004965933593094395, 'samples': 1879104, 'steps': 9786, 'loss/train': 1.8389208316802979} -11/06/2021 22:36:28 - INFO - __main__ - Step 9788: {'lr': 0.0004965924861784352, 'samples': 1879296, 'steps': 9787, 'loss/train': 2.069736957550049} -11/06/2021 22:36:29 - INFO - __main__ - Step 9789: {'lr': 0.0004965916129363201, 'samples': 1879488, 'steps': 9788, 'loss/train': 1.9471229314804077} -11/06/2021 22:36:30 - INFO - __main__ - Step 9790: {'lr': 0.0004965907395830945, 'samples': 1879680, 'steps': 9789, 'loss/train': 1.7488764524459839} -11/06/2021 22:36:30 - INFO - __main__ - Step 9791: {'lr': 0.000496589866118759, 'samples': 1879872, 'steps': 9790, 'loss/train': 2.344801902770996} -11/06/2021 22:36:30 - INFO - __main__ - Step 9792: {'lr': 0.000496588992543314, 'samples': 1880064, 'steps': 9791, 'loss/train': 1.8304022550582886} -11/06/2021 22:36:31 - INFO - __main__ - Step 9793: {'lr': 0.0004965881188567597, 'samples': 1880256, 'steps': 9792, 'loss/train': 1.6867663860321045} -11/06/2021 22:36:32 - INFO - __main__ - Step 9794: {'lr': 0.0004965872450590965, 'samples': 1880448, 'steps': 9793, 'loss/train': 1.4658312797546387} -11/06/2021 22:36:32 - INFO - __main__ - Step 9795: {'lr': 0.0004965863711503251, 'samples': 1880640, 'steps': 9794, 'loss/train': 2.786965847015381} -11/06/2021 22:36:33 - INFO - __main__ - Step 9796: {'lr': 0.0004965854971304457, 'samples': 1880832, 'steps': 9795, 'loss/train': 1.9178855419158936} -11/06/2021 22:36:33 - INFO - __main__ - Step 9797: {'lr': 0.0004965846229994586, 'samples': 1881024, 'steps': 9796, 'loss/train': 1.2724156379699707} -11/06/2021 22:36:34 - INFO - __main__ - Step 9798: {'lr': 0.0004965837487573641, 'samples': 1881216, 'steps': 9797, 'loss/train': 2.09515380859375} -11/06/2021 22:36:35 - INFO - __main__ - Step 9799: {'lr': 0.000496582874404163, 'samples': 1881408, 'steps': 9798, 'loss/train': 0.2936389148235321} -11/06/2021 22:36:35 - INFO - __main__ - Step 9800: {'lr': 0.0004965819999398554, 'samples': 1881600, 'steps': 9799, 'loss/train': 1.556630253791809} -11/06/2021 22:36:35 - INFO - __main__ - Step 9801: {'lr': 0.0004965811253644418, 'samples': 1881792, 'steps': 9800, 'loss/train': 1.5148653984069824} -11/06/2021 22:36:36 - INFO - __main__ - Step 9802: {'lr': 0.0004965802506779225, 'samples': 1881984, 'steps': 9801, 'loss/train': 1.8393759727478027} -11/06/2021 22:36:36 - INFO - __main__ - Step 9803: {'lr': 0.0004965793758802978, 'samples': 1882176, 'steps': 9802, 'loss/train': 1.732246994972229} -11/06/2021 22:36:37 - INFO - __main__ - Step 9804: {'lr': 0.0004965785009715684, 'samples': 1882368, 'steps': 9803, 'loss/train': 1.4041547775268555} -11/06/2021 22:36:37 - INFO - __main__ - Step 9805: {'lr': 0.0004965776259517345, 'samples': 1882560, 'steps': 9804, 'loss/train': 1.8803133964538574} -11/06/2021 22:36:38 - INFO - __main__ - Step 9806: {'lr': 0.0004965767508207966, 'samples': 1882752, 'steps': 9805, 'loss/train': 1.2590349912643433} -11/06/2021 22:36:38 - INFO - __main__ - Step 9807: {'lr': 0.000496575875578755, 'samples': 1882944, 'steps': 9806, 'loss/train': 2.212789535522461} -11/06/2021 22:36:38 - INFO - __main__ - Step 9808: {'lr': 0.00049657500022561, 'samples': 1883136, 'steps': 9807, 'loss/train': 1.9373009204864502} -11/06/2021 22:36:39 - INFO - __main__ - Step 9809: {'lr': 0.0004965741247613622, 'samples': 1883328, 'steps': 9808, 'loss/train': 0.9651688933372498} -11/06/2021 22:36:40 - INFO - __main__ - Step 9810: {'lr': 0.0004965732491860119, 'samples': 1883520, 'steps': 9809, 'loss/train': 2.099937915802002} -11/06/2021 22:36:40 - INFO - __main__ - Step 9811: {'lr': 0.0004965723734995594, 'samples': 1883712, 'steps': 9810, 'loss/train': 1.7372392416000366} -11/06/2021 22:36:40 - INFO - __main__ - Step 9812: {'lr': 0.0004965714977020053, 'samples': 1883904, 'steps': 9811, 'loss/train': 1.6284079551696777} -11/06/2021 22:36:41 - INFO - __main__ - Step 9813: {'lr': 0.0004965706217933499, 'samples': 1884096, 'steps': 9812, 'loss/train': 1.849391222000122} -11/06/2021 22:36:41 - INFO - __main__ - Step 9814: {'lr': 0.0004965697457735936, 'samples': 1884288, 'steps': 9813, 'loss/train': 1.648018717765808} -11/06/2021 22:36:42 - INFO - __main__ - Step 9815: {'lr': 0.0004965688696427366, 'samples': 1884480, 'steps': 9814, 'loss/train': 1.7322882413864136} -11/06/2021 22:36:42 - INFO - __main__ - Step 9816: {'lr': 0.0004965679934007797, 'samples': 1884672, 'steps': 9815, 'loss/train': 1.7675822973251343} -11/06/2021 22:36:43 - INFO - __main__ - Step 9817: {'lr': 0.0004965671170477229, 'samples': 1884864, 'steps': 9816, 'loss/train': 1.9023000001907349} -11/06/2021 22:36:43 - INFO - __main__ - Step 9818: {'lr': 0.0004965662405835668, 'samples': 1885056, 'steps': 9817, 'loss/train': 1.9403313398361206} -11/06/2021 22:36:43 - INFO - __main__ - Step 9819: {'lr': 0.0004965653640083118, 'samples': 1885248, 'steps': 9818, 'loss/train': 0.30051112174987793} -11/06/2021 22:36:45 - INFO - __main__ - Step 9820: {'lr': 0.0004965644873219583, 'samples': 1885440, 'steps': 9819, 'loss/train': 1.5804340839385986} -11/06/2021 22:36:45 - INFO - __main__ - Step 9821: {'lr': 0.0004965636105245066, 'samples': 1885632, 'steps': 9820, 'loss/train': 3.80881404876709} -11/06/2021 22:36:45 - INFO - __main__ - Step 9822: {'lr': 0.000496562733615957, 'samples': 1885824, 'steps': 9821, 'loss/train': 1.808201551437378} -11/06/2021 22:36:46 - INFO - __main__ - Step 9823: {'lr': 0.0004965618565963102, 'samples': 1886016, 'steps': 9822, 'loss/train': 1.3552080392837524} -11/06/2021 22:36:46 - INFO - __main__ - Step 9824: {'lr': 0.0004965609794655664, 'samples': 1886208, 'steps': 9823, 'loss/train': 1.8378883600234985} -11/06/2021 22:36:47 - INFO - __main__ - Step 9825: {'lr': 0.0004965601022237261, 'samples': 1886400, 'steps': 9824, 'loss/train': 1.9869000911712646} -11/06/2021 22:36:47 - INFO - __main__ - Step 9826: {'lr': 0.0004965592248707895, 'samples': 1886592, 'steps': 9825, 'loss/train': 1.6496671438217163} -11/06/2021 22:36:48 - INFO - __main__ - Step 9827: {'lr': 0.0004965583474067571, 'samples': 1886784, 'steps': 9826, 'loss/train': 1.5552690029144287} -11/06/2021 22:36:48 - INFO - __main__ - Step 9828: {'lr': 0.0004965574698316294, 'samples': 1886976, 'steps': 9827, 'loss/train': 1.9440776109695435} -11/06/2021 22:36:48 - INFO - __main__ - Step 9829: {'lr': 0.0004965565921454067, 'samples': 1887168, 'steps': 9828, 'loss/train': 1.336730718612671} -11/06/2021 22:36:49 - INFO - __main__ - Step 9830: {'lr': 0.0004965557143480893, 'samples': 1887360, 'steps': 9829, 'loss/train': 0.4165128171443939} -11/06/2021 22:36:50 - INFO - __main__ - Step 9831: {'lr': 0.0004965548364396779, 'samples': 1887552, 'steps': 9830, 'loss/train': 1.5435590744018555} -11/06/2021 22:36:50 - INFO - __main__ - Step 9832: {'lr': 0.0004965539584201725, 'samples': 1887744, 'steps': 9831, 'loss/train': 1.4158097505569458} -11/06/2021 22:36:50 - INFO - __main__ - Step 9833: {'lr': 0.0004965530802895738, 'samples': 1887936, 'steps': 9832, 'loss/train': 1.8684687614440918} -11/06/2021 22:36:51 - INFO - __main__ - Step 9834: {'lr': 0.000496552202047882, 'samples': 1888128, 'steps': 9833, 'loss/train': 2.1222503185272217} -11/06/2021 22:36:52 - INFO - __main__ - Step 9835: {'lr': 0.0004965513236950977, 'samples': 1888320, 'steps': 9834, 'loss/train': 1.6643342971801758} -11/06/2021 22:36:52 - INFO - __main__ - Step 9836: {'lr': 0.0004965504452312211, 'samples': 1888512, 'steps': 9835, 'loss/train': 1.892832636833191} -11/06/2021 22:36:53 - INFO - __main__ - Step 9837: {'lr': 0.0004965495666562527, 'samples': 1888704, 'steps': 9836, 'loss/train': 1.7342534065246582} -11/06/2021 22:36:53 - INFO - __main__ - Step 9838: {'lr': 0.0004965486879701928, 'samples': 1888896, 'steps': 9837, 'loss/train': 1.782392978668213} -11/06/2021 22:36:53 - INFO - __main__ - Step 9839: {'lr': 0.000496547809173042, 'samples': 1889088, 'steps': 9838, 'loss/train': 5.928685665130615} -11/06/2021 22:36:54 - INFO - __main__ - Step 9840: {'lr': 0.0004965469302648005, 'samples': 1889280, 'steps': 9839, 'loss/train': 2.1997225284576416} -11/06/2021 22:36:55 - INFO - __main__ - Step 9841: {'lr': 0.0004965460512454688, 'samples': 1889472, 'steps': 9840, 'loss/train': 1.9922882318496704} -11/06/2021 22:36:55 - INFO - __main__ - Step 9842: {'lr': 0.0004965451721150471, 'samples': 1889664, 'steps': 9841, 'loss/train': 1.385520100593567} -11/06/2021 22:36:55 - INFO - __main__ - Step 9843: {'lr': 0.0004965442928735361, 'samples': 1889856, 'steps': 9842, 'loss/train': 1.5797951221466064} -11/06/2021 22:36:56 - INFO - __main__ - Step 9844: {'lr': 0.000496543413520936, 'samples': 1890048, 'steps': 9843, 'loss/train': 1.9805771112442017} -11/06/2021 22:36:56 - INFO - __main__ - Step 9845: {'lr': 0.0004965425340572472, 'samples': 1890240, 'steps': 9844, 'loss/train': 2.120030403137207} -11/06/2021 22:36:57 - INFO - __main__ - Step 9846: {'lr': 0.0004965416544824703, 'samples': 1890432, 'steps': 9845, 'loss/train': 1.6327179670333862} -11/06/2021 22:36:58 - INFO - __main__ - Step 9847: {'lr': 0.0004965407747966053, 'samples': 1890624, 'steps': 9846, 'loss/train': 1.7754491567611694} -11/06/2021 22:36:58 - INFO - __main__ - Step 9848: {'lr': 0.000496539894999653, 'samples': 1890816, 'steps': 9847, 'loss/train': 1.8676059246063232} -11/06/2021 22:36:59 - INFO - __main__ - Step 9849: {'lr': 0.0004965390150916136, 'samples': 1891008, 'steps': 9848, 'loss/train': 1.9253339767456055} -11/06/2021 22:36:59 - INFO - __main__ - Step 9850: {'lr': 0.0004965381350724874, 'samples': 1891200, 'steps': 9849, 'loss/train': 1.7396340370178223} -11/06/2021 22:36:59 - INFO - __main__ - Step 9851: {'lr': 0.000496537254942275, 'samples': 1891392, 'steps': 9850, 'loss/train': 1.8926670551300049} -11/06/2021 22:37:00 - INFO - __main__ - Step 9852: {'lr': 0.0004965363747009767, 'samples': 1891584, 'steps': 9851, 'loss/train': 1.3262872695922852} -11/06/2021 22:37:01 - INFO - __main__ - Step 9853: {'lr': 0.000496535494348593, 'samples': 1891776, 'steps': 9852, 'loss/train': 1.9677116870880127} -11/06/2021 22:37:01 - INFO - __main__ - Step 9854: {'lr': 0.0004965346138851241, 'samples': 1891968, 'steps': 9853, 'loss/train': 1.1874512434005737} -11/06/2021 22:37:01 - INFO - __main__ - Step 9855: {'lr': 0.0004965337333105706, 'samples': 1892160, 'steps': 9854, 'loss/train': 2.6719613075256348} -11/06/2021 22:37:02 - INFO - __main__ - Step 9856: {'lr': 0.0004965328526249328, 'samples': 1892352, 'steps': 9855, 'loss/train': 1.6148555278778076} -11/06/2021 22:37:03 - INFO - __main__ - Step 9857: {'lr': 0.000496531971828211, 'samples': 1892544, 'steps': 9856, 'loss/train': 1.9275423288345337} -11/06/2021 22:37:03 - INFO - __main__ - Step 9858: {'lr': 0.0004965310909204058, 'samples': 1892736, 'steps': 9857, 'loss/train': 2.38356876373291} -11/06/2021 22:37:03 - INFO - __main__ - Step 9859: {'lr': 0.0004965302099015175, 'samples': 1892928, 'steps': 9858, 'loss/train': 1.5586031675338745} -11/06/2021 22:37:04 - INFO - __main__ - Step 9860: {'lr': 0.0004965293287715464, 'samples': 1893120, 'steps': 9859, 'loss/train': 1.8850369453430176} -11/06/2021 22:37:04 - INFO - __main__ - Step 9861: {'lr': 0.0004965284475304931, 'samples': 1893312, 'steps': 9860, 'loss/train': 2.069514274597168} -11/06/2021 22:37:06 - INFO - __main__ - Step 9862: {'lr': 0.0004965275661783579, 'samples': 1893504, 'steps': 9861, 'loss/train': 2.3399882316589355} -11/06/2021 22:37:06 - INFO - __main__ - Step 9863: {'lr': 0.0004965266847151411, 'samples': 1893696, 'steps': 9862, 'loss/train': 1.8240324258804321} -11/06/2021 22:37:07 - INFO - __main__ - Step 9864: {'lr': 0.0004965258031408432, 'samples': 1893888, 'steps': 9863, 'loss/train': 1.4843631982803345} -11/06/2021 22:37:07 - INFO - __main__ - Step 9865: {'lr': 0.0004965249214554645, 'samples': 1894080, 'steps': 9864, 'loss/train': 1.9368473291397095} -11/06/2021 22:37:07 - INFO - __main__ - Step 9866: {'lr': 0.0004965240396590055, 'samples': 1894272, 'steps': 9865, 'loss/train': 1.9536662101745605} -11/06/2021 22:37:08 - INFO - __main__ - Step 9867: {'lr': 0.0004965231577514666, 'samples': 1894464, 'steps': 9866, 'loss/train': 2.018059253692627} -11/06/2021 22:37:08 - INFO - __main__ - Step 9868: {'lr': 0.0004965222757328482, 'samples': 1894656, 'steps': 9867, 'loss/train': 2.956916093826294} -11/06/2021 22:37:09 - INFO - __main__ - Step 9869: {'lr': 0.0004965213936031507, 'samples': 1894848, 'steps': 9868, 'loss/train': 2.127044677734375} -11/06/2021 22:37:09 - INFO - __main__ - Step 9870: {'lr': 0.0004965205113623744, 'samples': 1895040, 'steps': 9869, 'loss/train': 1.807254433631897} -11/06/2021 22:37:10 - INFO - __main__ - Step 9871: {'lr': 0.0004965196290105197, 'samples': 1895232, 'steps': 9870, 'loss/train': 1.9776854515075684} -11/06/2021 22:37:10 - INFO - __main__ - Step 9872: {'lr': 0.0004965187465475873, 'samples': 1895424, 'steps': 9871, 'loss/train': 1.997361660003662} -11/06/2021 22:37:11 - INFO - __main__ - Step 9873: {'lr': 0.0004965178639735772, 'samples': 1895616, 'steps': 9872, 'loss/train': 1.981247067451477} -11/06/2021 22:37:11 - INFO - __main__ - Step 9874: {'lr': 0.0004965169812884898, 'samples': 1895808, 'steps': 9873, 'loss/train': 1.2999768257141113} -11/06/2021 22:37:12 - INFO - __main__ - Step 9875: {'lr': 0.0004965160984923259, 'samples': 1896000, 'steps': 9874, 'loss/train': 2.367384433746338} -11/06/2021 22:37:12 - INFO - __main__ - Step 9876: {'lr': 0.0004965152155850855, 'samples': 1896192, 'steps': 9875, 'loss/train': 1.639930248260498} -11/06/2021 22:37:13 - INFO - __main__ - Step 9877: {'lr': 0.0004965143325667692, 'samples': 1896384, 'steps': 9876, 'loss/train': 2.1641268730163574} -11/06/2021 22:37:13 - INFO - __main__ - Step 9878: {'lr': 0.0004965134494373773, 'samples': 1896576, 'steps': 9877, 'loss/train': 1.5240188837051392} -11/06/2021 22:37:13 - INFO - __main__ - Step 9879: {'lr': 0.0004965125661969103, 'samples': 1896768, 'steps': 9878, 'loss/train': 1.7663499116897583} -11/06/2021 22:37:14 - INFO - __main__ - Step 9880: {'lr': 0.0004965116828453685, 'samples': 1896960, 'steps': 9879, 'loss/train': 1.9683094024658203} -11/06/2021 22:37:15 - INFO - __main__ - Step 9881: {'lr': 0.0004965107993827524, 'samples': 1897152, 'steps': 9880, 'loss/train': 1.8044612407684326} -11/06/2021 22:37:15 - INFO - __main__ - Step 9882: {'lr': 0.0004965099158090624, 'samples': 1897344, 'steps': 9881, 'loss/train': 1.7531816959381104} -11/06/2021 22:37:15 - INFO - __main__ - Step 9883: {'lr': 0.0004965090321242987, 'samples': 1897536, 'steps': 9882, 'loss/train': 1.9520115852355957} -11/06/2021 22:37:16 - INFO - __main__ - Step 9884: {'lr': 0.0004965081483284618, 'samples': 1897728, 'steps': 9883, 'loss/train': 2.066235065460205} -11/06/2021 22:37:17 - INFO - __main__ - Step 9885: {'lr': 0.0004965072644215522, 'samples': 1897920, 'steps': 9884, 'loss/train': 1.9941020011901855} -11/06/2021 22:37:17 - INFO - __main__ - Step 9886: {'lr': 0.0004965063804035703, 'samples': 1898112, 'steps': 9885, 'loss/train': 1.8429374694824219} -11/06/2021 22:37:17 - INFO - __main__ - Step 9887: {'lr': 0.0004965054962745163, 'samples': 1898304, 'steps': 9886, 'loss/train': 2.1564157009124756} -11/06/2021 22:37:18 - INFO - __main__ - Step 9888: {'lr': 0.0004965046120343908, 'samples': 1898496, 'steps': 9887, 'loss/train': 1.4476630687713623} -11/06/2021 22:37:18 - INFO - __main__ - Step 9889: {'lr': 0.0004965037276831942, 'samples': 1898688, 'steps': 9888, 'loss/train': 1.0114924907684326} -11/06/2021 22:37:19 - INFO - __main__ - Step 9890: {'lr': 0.0004965028432209267, 'samples': 1898880, 'steps': 9889, 'loss/train': 1.0621055364608765} -11/06/2021 22:37:19 - INFO - __main__ - Step 9891: {'lr': 0.0004965019586475888, 'samples': 1899072, 'steps': 9890, 'loss/train': 1.3111342191696167} -11/06/2021 22:37:20 - INFO - __main__ - Step 9892: {'lr': 0.000496501073963181, 'samples': 1899264, 'steps': 9891, 'loss/train': 1.5163756608963013} -11/06/2021 22:37:20 - INFO - __main__ - Step 9893: {'lr': 0.0004965001891677037, 'samples': 1899456, 'steps': 9892, 'loss/train': 1.4711591005325317} -11/06/2021 22:37:21 - INFO - __main__ - Step 9894: {'lr': 0.000496499304261157, 'samples': 1899648, 'steps': 9893, 'loss/train': 2.3137621879577637} -11/06/2021 22:37:22 - INFO - __main__ - Step 9895: {'lr': 0.0004964984192435417, 'samples': 1899840, 'steps': 9894, 'loss/train': 1.8023244142532349} -11/06/2021 22:37:22 - INFO - __main__ - Step 9896: {'lr': 0.000496497534114858, 'samples': 1900032, 'steps': 9895, 'loss/train': 1.5675020217895508} -11/06/2021 22:37:23 - INFO - __main__ - Step 9897: {'lr': 0.0004964966488751062, 'samples': 1900224, 'steps': 9896, 'loss/train': 1.4843635559082031} -11/06/2021 22:37:23 - INFO - __main__ - Step 9898: {'lr': 0.000496495763524287, 'samples': 1900416, 'steps': 9897, 'loss/train': 2.4118194580078125} -11/06/2021 22:37:24 - INFO - __main__ - Step 9899: {'lr': 0.0004964948780624005, 'samples': 1900608, 'steps': 9898, 'loss/train': 1.6140505075454712} -11/06/2021 22:37:24 - INFO - __main__ - Step 9900: {'lr': 0.0004964939924894472, 'samples': 1900800, 'steps': 9899, 'loss/train': 1.5659464597702026} -11/06/2021 22:37:24 - INFO - __main__ - Step 9901: {'lr': 0.0004964931068054274, 'samples': 1900992, 'steps': 9900, 'loss/train': 0.7185819149017334} -11/06/2021 22:37:25 - INFO - __main__ - Step 9902: {'lr': 0.0004964922210103418, 'samples': 1901184, 'steps': 9901, 'loss/train': 0.6721516251564026} -11/06/2021 22:37:26 - INFO - __main__ - Step 9903: {'lr': 0.0004964913351041905, 'samples': 1901376, 'steps': 9902, 'loss/train': 2.110550880432129} -11/06/2021 22:37:26 - INFO - __main__ - Step 9904: {'lr': 0.000496490449086974, 'samples': 1901568, 'steps': 9903, 'loss/train': 2.038620948791504} -11/06/2021 22:37:26 - INFO - __main__ - Step 9905: {'lr': 0.0004964895629586928, 'samples': 1901760, 'steps': 9904, 'loss/train': 2.2174274921417236} -11/06/2021 22:37:27 - INFO - __main__ - Step 9906: {'lr': 0.0004964886767193471, 'samples': 1901952, 'steps': 9905, 'loss/train': 1.2710689306259155} -11/06/2021 22:37:27 - INFO - __main__ - Step 9907: {'lr': 0.0004964877903689375, 'samples': 1902144, 'steps': 9906, 'loss/train': 1.9977413415908813} -11/06/2021 22:37:28 - INFO - __main__ - Step 9908: {'lr': 0.0004964869039074643, 'samples': 1902336, 'steps': 9907, 'loss/train': 1.3191601037979126} -11/06/2021 22:37:29 - INFO - __main__ - Step 9909: {'lr': 0.000496486017334928, 'samples': 1902528, 'steps': 9908, 'loss/train': 2.083883047103882} -11/06/2021 22:37:29 - INFO - __main__ - Step 9910: {'lr': 0.0004964851306513287, 'samples': 1902720, 'steps': 9909, 'loss/train': 0.8083091974258423} -11/06/2021 22:37:29 - INFO - __main__ - Step 9911: {'lr': 0.0004964842438566671, 'samples': 1902912, 'steps': 9910, 'loss/train': 1.8291444778442383} -11/06/2021 22:37:30 - INFO - __main__ - Step 9912: {'lr': 0.0004964833569509434, 'samples': 1903104, 'steps': 9911, 'loss/train': 1.752215027809143} -11/06/2021 22:37:31 - INFO - __main__ - Step 9913: {'lr': 0.0004964824699341582, 'samples': 1903296, 'steps': 9912, 'loss/train': 1.807940125465393} -11/06/2021 22:37:31 - INFO - __main__ - Step 9914: {'lr': 0.0004964815828063118, 'samples': 1903488, 'steps': 9913, 'loss/train': 1.4366697072982788} -11/06/2021 22:37:31 - INFO - __main__ - Step 9915: {'lr': 0.0004964806955674046, 'samples': 1903680, 'steps': 9914, 'loss/train': 2.080610752105713} -11/06/2021 22:37:32 - INFO - __main__ - Step 9916: {'lr': 0.0004964798082174371, 'samples': 1903872, 'steps': 9915, 'loss/train': 1.5181411504745483} -11/06/2021 22:37:32 - INFO - __main__ - Step 9917: {'lr': 0.0004964789207564094, 'samples': 1904064, 'steps': 9916, 'loss/train': 1.8686342239379883} -11/06/2021 22:37:33 - INFO - __main__ - Step 9918: {'lr': 0.0004964780331843223, 'samples': 1904256, 'steps': 9917, 'loss/train': 2.0889878273010254} -11/06/2021 22:37:33 - INFO - __main__ - Step 9919: {'lr': 0.0004964771455011758, 'samples': 1904448, 'steps': 9918, 'loss/train': 1.7543959617614746} -11/06/2021 22:37:34 - INFO - __main__ - Step 9920: {'lr': 0.0004964762577069707, 'samples': 1904640, 'steps': 9919, 'loss/train': 1.4055709838867188} -11/06/2021 22:37:34 - INFO - __main__ - Step 9921: {'lr': 0.0004964753698017071, 'samples': 1904832, 'steps': 9920, 'loss/train': 1.6933525800704956} -11/06/2021 22:37:34 - INFO - __main__ - Step 9922: {'lr': 0.0004964744817853855, 'samples': 1905024, 'steps': 9921, 'loss/train': 1.261832356452942} -11/06/2021 22:37:35 - INFO - __main__ - Step 9923: {'lr': 0.0004964735936580063, 'samples': 1905216, 'steps': 9922, 'loss/train': 2.1547069549560547} -11/06/2021 22:37:36 - INFO - __main__ - Step 9924: {'lr': 0.00049647270541957, 'samples': 1905408, 'steps': 9923, 'loss/train': 1.4039684534072876} -11/06/2021 22:37:36 - INFO - __main__ - Step 9925: {'lr': 0.0004964718170700767, 'samples': 1905600, 'steps': 9924, 'loss/train': 1.7743269205093384} -11/06/2021 22:37:37 - INFO - __main__ - Step 9926: {'lr': 0.0004964709286095271, 'samples': 1905792, 'steps': 9925, 'loss/train': 1.6846635341644287} -11/06/2021 22:37:37 - INFO - __main__ - Step 9927: {'lr': 0.0004964700400379215, 'samples': 1905984, 'steps': 9926, 'loss/train': 1.7219330072402954} -11/06/2021 22:37:37 - INFO - __main__ - Step 9928: {'lr': 0.0004964691513552604, 'samples': 1906176, 'steps': 9927, 'loss/train': 1.6441329717636108} -11/06/2021 22:37:38 - INFO - __main__ - Step 9929: {'lr': 0.000496468262561544, 'samples': 1906368, 'steps': 9928, 'loss/train': 1.6577142477035522} -11/06/2021 22:37:38 - INFO - __main__ - Step 9930: {'lr': 0.0004964673736567728, 'samples': 1906560, 'steps': 9929, 'loss/train': 1.7367271184921265} -11/06/2021 22:37:39 - INFO - __main__ - Step 9931: {'lr': 0.0004964664846409473, 'samples': 1906752, 'steps': 9930, 'loss/train': 1.7608524560928345} -11/06/2021 22:37:39 - INFO - __main__ - Step 9932: {'lr': 0.0004964655955140677, 'samples': 1906944, 'steps': 9931, 'loss/train': 1.8868800401687622} -11/06/2021 22:37:40 - INFO - __main__ - Step 9933: {'lr': 0.0004964647062761345, 'samples': 1907136, 'steps': 9932, 'loss/train': 2.024883270263672} -11/06/2021 22:37:41 - INFO - __main__ - Step 9934: {'lr': 0.0004964638169271482, 'samples': 1907328, 'steps': 9933, 'loss/train': 1.661513328552246} -11/06/2021 22:37:41 - INFO - __main__ - Step 9935: {'lr': 0.0004964629274671091, 'samples': 1907520, 'steps': 9934, 'loss/train': 1.6273504495620728} -11/06/2021 22:37:42 - INFO - __main__ - Step 9936: {'lr': 0.0004964620378960175, 'samples': 1907712, 'steps': 9935, 'loss/train': 1.556241750717163} -11/06/2021 22:37:42 - INFO - __main__ - Step 9937: {'lr': 0.000496461148213874, 'samples': 1907904, 'steps': 9936, 'loss/train': 2.6705877780914307} -11/06/2021 22:37:42 - INFO - __main__ - Step 9938: {'lr': 0.0004964602584206788, 'samples': 1908096, 'steps': 9937, 'loss/train': 1.8545628786087036} -11/06/2021 22:37:43 - INFO - __main__ - Step 9939: {'lr': 0.0004964593685164326, 'samples': 1908288, 'steps': 9938, 'loss/train': 1.645344614982605} -11/06/2021 22:37:44 - INFO - __main__ - Step 9940: {'lr': 0.0004964584785011355, 'samples': 1908480, 'steps': 9939, 'loss/train': 1.6063035726547241} -11/06/2021 22:37:44 - INFO - __main__ - Step 9941: {'lr': 0.000496457588374788, 'samples': 1908672, 'steps': 9940, 'loss/train': 0.9683166146278381} -11/06/2021 22:37:44 - INFO - __main__ - Step 9942: {'lr': 0.0004964566981373905, 'samples': 1908864, 'steps': 9941, 'loss/train': 1.5615383386611938} -11/06/2021 22:37:45 - INFO - __main__ - Step 9943: {'lr': 0.0004964558077889435, 'samples': 1909056, 'steps': 9942, 'loss/train': 1.4332380294799805} -11/06/2021 22:37:45 - INFO - __main__ - Step 9944: {'lr': 0.0004964549173294472, 'samples': 1909248, 'steps': 9943, 'loss/train': 1.4659695625305176} -11/06/2021 22:37:46 - INFO - __main__ - Step 9945: {'lr': 0.0004964540267589023, 'samples': 1909440, 'steps': 9944, 'loss/train': 1.1614114046096802} -11/06/2021 22:37:46 - INFO - __main__ - Step 9946: {'lr': 0.0004964531360773088, 'samples': 1909632, 'steps': 9945, 'loss/train': 1.5709928274154663} -11/06/2021 22:37:47 - INFO - __main__ - Step 9947: {'lr': 0.0004964522452846675, 'samples': 1909824, 'steps': 9946, 'loss/train': 1.8149683475494385} -11/06/2021 22:37:47 - INFO - __main__ - Step 9948: {'lr': 0.0004964513543809785, 'samples': 1910016, 'steps': 9947, 'loss/train': 1.0438923835754395} -11/06/2021 22:37:48 - INFO - __main__ - Step 9949: {'lr': 0.0004964504633662424, 'samples': 1910208, 'steps': 9948, 'loss/train': 0.8558833599090576} -11/06/2021 22:37:49 - INFO - __main__ - Step 9950: {'lr': 0.0004964495722404595, 'samples': 1910400, 'steps': 9949, 'loss/train': 1.9778287410736084} -11/06/2021 22:37:49 - INFO - __main__ - Step 9951: {'lr': 0.0004964486810036301, 'samples': 1910592, 'steps': 9950, 'loss/train': 2.1700186729431152} -11/06/2021 22:37:49 - INFO - __main__ - Step 9952: {'lr': 0.000496447789655755, 'samples': 1910784, 'steps': 9951, 'loss/train': 1.5003530979156494} -11/06/2021 22:37:50 - INFO - __main__ - Step 9953: {'lr': 0.0004964468981968341, 'samples': 1910976, 'steps': 9952, 'loss/train': 1.8400135040283203} -11/06/2021 22:37:50 - INFO - __main__ - Step 9954: {'lr': 0.0004964460066268681, 'samples': 1911168, 'steps': 9953, 'loss/train': 1.9778108596801758} -11/06/2021 22:37:51 - INFO - __main__ - Step 9955: {'lr': 0.0004964451149458573, 'samples': 1911360, 'steps': 9954, 'loss/train': 1.6574676036834717} -11/06/2021 22:37:51 - INFO - __main__ - Step 9956: {'lr': 0.0004964442231538023, 'samples': 1911552, 'steps': 9955, 'loss/train': 1.1613150835037231} -11/06/2021 22:37:52 - INFO - __main__ - Step 9957: {'lr': 0.000496443331250703, 'samples': 1911744, 'steps': 9956, 'loss/train': 1.88170325756073} -11/06/2021 22:37:52 - INFO - __main__ - Step 9958: {'lr': 0.0004964424392365604, 'samples': 1911936, 'steps': 9957, 'loss/train': 2.3807883262634277} -11/06/2021 22:37:52 - INFO - __main__ - Step 9959: {'lr': 0.0004964415471113747, 'samples': 1912128, 'steps': 9958, 'loss/train': 2.4166524410247803} -11/06/2021 22:37:53 - INFO - __main__ - Step 9960: {'lr': 0.0004964406548751461, 'samples': 1912320, 'steps': 9959, 'loss/train': 2.397183656692505} -11/06/2021 22:37:54 - INFO - __main__ - Step 9961: {'lr': 0.0004964397625278751, 'samples': 1912512, 'steps': 9960, 'loss/train': 1.7461156845092773} -11/06/2021 22:37:54 - INFO - __main__ - Step 9962: {'lr': 0.0004964388700695623, 'samples': 1912704, 'steps': 9961, 'loss/train': 1.654305100440979} -11/06/2021 22:37:55 - INFO - __main__ - Step 9963: {'lr': 0.0004964379775002078, 'samples': 1912896, 'steps': 9962, 'loss/train': 2.360861301422119} -11/06/2021 22:37:55 - INFO - __main__ - Step 9964: {'lr': 0.0004964370848198122, 'samples': 1913088, 'steps': 9963, 'loss/train': 2.1414263248443604} -11/06/2021 22:37:55 - INFO - __main__ - Step 9965: {'lr': 0.0004964361920283759, 'samples': 1913280, 'steps': 9964, 'loss/train': 1.4624086618423462} -11/06/2021 22:37:56 - INFO - __main__ - Step 9966: {'lr': 0.0004964352991258992, 'samples': 1913472, 'steps': 9965, 'loss/train': 1.942596435546875} -11/06/2021 22:37:57 - INFO - __main__ - Step 9967: {'lr': 0.0004964344061123826, 'samples': 1913664, 'steps': 9966, 'loss/train': 1.6361198425292969} -11/06/2021 22:37:57 - INFO - __main__ - Step 9968: {'lr': 0.0004964335129878264, 'samples': 1913856, 'steps': 9967, 'loss/train': 1.1940803527832031} -11/06/2021 22:37:57 - INFO - __main__ - Step 9969: {'lr': 0.0004964326197522311, 'samples': 1914048, 'steps': 9968, 'loss/train': 1.8905918598175049} -11/06/2021 22:37:58 - INFO - __main__ - Step 9970: {'lr': 0.0004964317264055971, 'samples': 1914240, 'steps': 9969, 'loss/train': 1.6931695938110352} -11/06/2021 22:37:59 - INFO - __main__ - Step 9971: {'lr': 0.0004964308329479247, 'samples': 1914432, 'steps': 9970, 'loss/train': 2.065845489501953} -11/06/2021 22:37:59 - INFO - __main__ - Step 9972: {'lr': 0.0004964299393792143, 'samples': 1914624, 'steps': 9971, 'loss/train': 2.043527603149414} -11/06/2021 22:37:59 - INFO - __main__ - Step 9973: {'lr': 0.0004964290456994666, 'samples': 1914816, 'steps': 9972, 'loss/train': 1.4954372644424438} -11/06/2021 22:38:00 - INFO - __main__ - Step 9974: {'lr': 0.0004964281519086816, 'samples': 1915008, 'steps': 9973, 'loss/train': 2.400644302368164} -11/06/2021 22:38:00 - INFO - __main__ - Step 9975: {'lr': 0.0004964272580068599, 'samples': 1915200, 'steps': 9974, 'loss/train': 1.6218897104263306} -11/06/2021 22:38:01 - INFO - __main__ - Step 9976: {'lr': 0.0004964263639940018, 'samples': 1915392, 'steps': 9975, 'loss/train': 2.0930655002593994} -11/06/2021 22:38:02 - INFO - __main__ - Step 9977: {'lr': 0.000496425469870108, 'samples': 1915584, 'steps': 9976, 'loss/train': 1.391600251197815} -11/06/2021 22:38:02 - INFO - __main__ - Step 9978: {'lr': 0.0004964245756351786, 'samples': 1915776, 'steps': 9977, 'loss/train': 1.8200713396072388} -11/06/2021 22:38:02 - INFO - __main__ - Step 9979: {'lr': 0.000496423681289214, 'samples': 1915968, 'steps': 9978, 'loss/train': 1.7776697874069214} -11/06/2021 22:38:03 - INFO - __main__ - Step 9980: {'lr': 0.0004964227868322148, 'samples': 1916160, 'steps': 9979, 'loss/train': 1.082550287246704} -11/06/2021 22:38:04 - INFO - __main__ - Step 9981: {'lr': 0.0004964218922641812, 'samples': 1916352, 'steps': 9980, 'loss/train': 1.5953223705291748} -11/06/2021 22:38:04 - INFO - __main__ - Step 9982: {'lr': 0.0004964209975851137, 'samples': 1916544, 'steps': 9981, 'loss/train': 1.3076783418655396} -11/06/2021 22:38:04 - INFO - __main__ - Step 9983: {'lr': 0.0004964201027950129, 'samples': 1916736, 'steps': 9982, 'loss/train': 1.7255864143371582} -11/06/2021 22:38:05 - INFO - __main__ - Step 9984: {'lr': 0.0004964192078938788, 'samples': 1916928, 'steps': 9983, 'loss/train': 2.1289093494415283} -11/06/2021 22:38:05 - INFO - __main__ - Step 9985: {'lr': 0.0004964183128817121, 'samples': 1917120, 'steps': 9984, 'loss/train': 1.9382929801940918} -11/06/2021 22:38:06 - INFO - __main__ - Step 9986: {'lr': 0.000496417417758513, 'samples': 1917312, 'steps': 9985, 'loss/train': 1.6477100849151611} -11/06/2021 22:38:06 - INFO - __main__ - Step 9987: {'lr': 0.000496416522524282, 'samples': 1917504, 'steps': 9986, 'loss/train': 1.6857631206512451} -11/06/2021 22:38:07 - INFO - __main__ - Step 9988: {'lr': 0.0004964156271790197, 'samples': 1917696, 'steps': 9987, 'loss/train': 1.4530490636825562} -11/06/2021 22:38:07 - INFO - __main__ - Step 9989: {'lr': 0.0004964147317227262, 'samples': 1917888, 'steps': 9988, 'loss/train': 1.7035175561904907} -11/06/2021 22:38:07 - INFO - __main__ - Step 9990: {'lr': 0.000496413836155402, 'samples': 1918080, 'steps': 9989, 'loss/train': 1.9417301416397095} -11/06/2021 22:38:09 - INFO - __main__ - Step 9991: {'lr': 0.0004964129404770476, 'samples': 1918272, 'steps': 9990, 'loss/train': 1.67684006690979} -11/06/2021 22:38:09 - INFO - __main__ - Step 9992: {'lr': 0.0004964120446876633, 'samples': 1918464, 'steps': 9991, 'loss/train': 1.8245000839233398} -11/06/2021 22:38:09 - INFO - __main__ - Step 9993: {'lr': 0.0004964111487872495, 'samples': 1918656, 'steps': 9992, 'loss/train': 1.7816718816757202} -11/06/2021 22:38:10 - INFO - __main__ - Step 9994: {'lr': 0.0004964102527758067, 'samples': 1918848, 'steps': 9993, 'loss/train': 1.7993488311767578} -11/06/2021 22:38:10 - INFO - __main__ - Step 9995: {'lr': 0.0004964093566533352, 'samples': 1919040, 'steps': 9994, 'loss/train': 1.1521903276443481} -11/06/2021 22:38:11 - INFO - __main__ - Step 9996: {'lr': 0.0004964084604198354, 'samples': 1919232, 'steps': 9995, 'loss/train': 1.9137816429138184} -11/06/2021 22:38:11 - INFO - __main__ - Step 9997: {'lr': 0.0004964075640753079, 'samples': 1919424, 'steps': 9996, 'loss/train': 1.5610769987106323} -11/06/2021 22:38:12 - INFO - __main__ - Step 9998: {'lr': 0.0004964066676197528, 'samples': 1919616, 'steps': 9997, 'loss/train': 1.6594487428665161} -11/06/2021 22:38:12 - INFO - __main__ - Step 9999: {'lr': 0.0004964057710531707, 'samples': 1919808, 'steps': 9998, 'loss/train': 1.531420111656189} -11/06/2021 22:38:12 - INFO - __main__ - Step 10000: {'lr': 0.0004964048743755621, 'samples': 1920000, 'steps': 9999, 'loss/train': 1.2586203813552856} -11/06/2021 22:38:13 - INFO - __main__ - Step 10001: {'lr': 0.0004964039775869272, 'samples': 1920192, 'steps': 10000, 'loss/train': 1.3523963689804077} -11/06/2021 22:38:14 - INFO - __main__ - Step 10002: {'lr': 0.0004964030806872664, 'samples': 1920384, 'steps': 10001, 'loss/train': 1.9878268241882324} -11/06/2021 22:38:14 - INFO - __main__ - Step 10003: {'lr': 0.0004964021836765802, 'samples': 1920576, 'steps': 10002, 'loss/train': 1.8906978368759155} -11/06/2021 22:38:14 - INFO - __main__ - Step 10004: {'lr': 0.000496401286554869, 'samples': 1920768, 'steps': 10003, 'loss/train': 1.310309648513794} -11/06/2021 22:38:15 - INFO - __main__ - Step 10005: {'lr': 0.000496400389322133, 'samples': 1920960, 'steps': 10004, 'loss/train': 1.6377642154693604} -11/06/2021 22:38:15 - INFO - __main__ - Step 10006: {'lr': 0.000496399491978373, 'samples': 1921152, 'steps': 10005, 'loss/train': 2.1881837844848633} -11/06/2021 22:38:16 - INFO - __main__ - Step 10007: {'lr': 0.0004963985945235891, 'samples': 1921344, 'steps': 10006, 'loss/train': 1.2533279657363892} -11/06/2021 22:38:16 - INFO - __main__ - Step 10008: {'lr': 0.0004963976969577819, 'samples': 1921536, 'steps': 10007, 'loss/train': 1.3222609758377075} -11/06/2021 22:38:17 - INFO - __main__ - Step 10009: {'lr': 0.0004963967992809516, 'samples': 1921728, 'steps': 10008, 'loss/train': 1.7431193590164185} -11/06/2021 22:38:17 - INFO - __main__ - Step 10010: {'lr': 0.0004963959014930988, 'samples': 1921920, 'steps': 10009, 'loss/train': 2.0606842041015625} -11/06/2021 22:38:17 - INFO - __main__ - Step 10011: {'lr': 0.0004963950035942237, 'samples': 1922112, 'steps': 10010, 'loss/train': 1.9937307834625244} -11/06/2021 22:38:19 - INFO - __main__ - Step 10012: {'lr': 0.0004963941055843268, 'samples': 1922304, 'steps': 10011, 'loss/train': 1.7773168087005615} -11/06/2021 22:38:19 - INFO - __main__ - Step 10013: {'lr': 0.0004963932074634087, 'samples': 1922496, 'steps': 10012, 'loss/train': 1.3404390811920166} -11/06/2021 22:38:19 - INFO - __main__ - Step 10014: {'lr': 0.0004963923092314694, 'samples': 1922688, 'steps': 10013, 'loss/train': 1.3710219860076904} -11/06/2021 22:38:20 - INFO - __main__ - Step 10015: {'lr': 0.0004963914108885097, 'samples': 1922880, 'steps': 10014, 'loss/train': 1.7717443704605103} -11/06/2021 22:38:20 - INFO - __main__ - Step 10016: {'lr': 0.0004963905124345297, 'samples': 1923072, 'steps': 10015, 'loss/train': 1.6650587320327759} -11/06/2021 22:38:21 - INFO - __main__ - Step 10017: {'lr': 0.00049638961386953, 'samples': 1923264, 'steps': 10016, 'loss/train': 1.4850966930389404} -11/06/2021 22:38:21 - INFO - __main__ - Step 10018: {'lr': 0.000496388715193511, 'samples': 1923456, 'steps': 10017, 'loss/train': 1.0550109148025513} -11/06/2021 22:38:22 - INFO - __main__ - Step 10019: {'lr': 0.000496387816406473, 'samples': 1923648, 'steps': 10018, 'loss/train': 1.6358630657196045} -11/06/2021 22:38:22 - INFO - __main__ - Step 10020: {'lr': 0.0004963869175084164, 'samples': 1923840, 'steps': 10019, 'loss/train': 1.7765165567398071} -11/06/2021 22:38:22 - INFO - __main__ - Step 10021: {'lr': 0.0004963860184993416, 'samples': 1924032, 'steps': 10020, 'loss/train': 1.717958688735962} -11/06/2021 22:38:23 - INFO - __main__ - Step 10022: {'lr': 0.0004963851193792492, 'samples': 1924224, 'steps': 10021, 'loss/train': 1.7283834218978882} -11/06/2021 22:38:24 - INFO - __main__ - Step 10023: {'lr': 0.0004963842201481394, 'samples': 1924416, 'steps': 10022, 'loss/train': 1.514644742012024} -11/06/2021 22:38:24 - INFO - __main__ - Step 10024: {'lr': 0.0004963833208060128, 'samples': 1924608, 'steps': 10023, 'loss/train': 1.3506485223770142} -11/06/2021 22:38:24 - INFO - __main__ - Step 10025: {'lr': 0.0004963824213528696, 'samples': 1924800, 'steps': 10024, 'loss/train': 1.9384859800338745} -11/06/2021 22:38:25 - INFO - __main__ - Step 10026: {'lr': 0.0004963815217887102, 'samples': 1924992, 'steps': 10025, 'loss/train': 2.230543851852417} -11/06/2021 22:38:26 - INFO - __main__ - Step 10027: {'lr': 0.0004963806221135351, 'samples': 1925184, 'steps': 10026, 'loss/train': 1.5828680992126465} -11/06/2021 22:38:26 - INFO - __main__ - Step 10028: {'lr': 0.0004963797223273448, 'samples': 1925376, 'steps': 10027, 'loss/train': 2.0957136154174805} -11/06/2021 22:38:27 - INFO - __main__ - Step 10029: {'lr': 0.0004963788224301395, 'samples': 1925568, 'steps': 10028, 'loss/train': 2.020629405975342} -11/06/2021 22:38:27 - INFO - __main__ - Step 10030: {'lr': 0.0004963779224219197, 'samples': 1925760, 'steps': 10029, 'loss/train': 1.7997504472732544} -11/06/2021 22:38:27 - INFO - __main__ - Step 10031: {'lr': 0.0004963770223026858, 'samples': 1925952, 'steps': 10030, 'loss/train': 1.9878836870193481} -11/06/2021 22:38:28 - INFO - __main__ - Step 10032: {'lr': 0.0004963761220724384, 'samples': 1926144, 'steps': 10031, 'loss/train': 1.9155443906784058} -11/06/2021 22:38:29 - INFO - __main__ - Step 10033: {'lr': 0.0004963752217311775, 'samples': 1926336, 'steps': 10032, 'loss/train': 1.7525060176849365} -11/06/2021 22:38:29 - INFO - __main__ - Step 10034: {'lr': 0.0004963743212789038, 'samples': 1926528, 'steps': 10033, 'loss/train': 2.0401864051818848} -11/06/2021 22:38:29 - INFO - __main__ - Step 10035: {'lr': 0.0004963734207156178, 'samples': 1926720, 'steps': 10034, 'loss/train': 1.524163007736206} -11/06/2021 22:38:30 - INFO - __main__ - Step 10036: {'lr': 0.0004963725200413195, 'samples': 1926912, 'steps': 10035, 'loss/train': 1.768740177154541} -11/06/2021 22:38:30 - INFO - __main__ - Step 10037: {'lr': 0.0004963716192560097, 'samples': 1927104, 'steps': 10036, 'loss/train': 0.7059550285339355} -11/06/2021 22:38:31 - INFO - __main__ - Step 10038: {'lr': 0.0004963707183596885, 'samples': 1927296, 'steps': 10037, 'loss/train': 1.979498267173767} -11/06/2021 22:38:32 - INFO - __main__ - Step 10039: {'lr': 0.0004963698173523566, 'samples': 1927488, 'steps': 10038, 'loss/train': 1.3461339473724365} -11/06/2021 22:38:32 - INFO - __main__ - Step 10040: {'lr': 0.0004963689162340142, 'samples': 1927680, 'steps': 10039, 'loss/train': 1.8551632165908813} -11/06/2021 22:38:32 - INFO - __main__ - Step 10041: {'lr': 0.0004963680150046618, 'samples': 1927872, 'steps': 10040, 'loss/train': 1.8479679822921753} -11/06/2021 22:38:33 - INFO - __main__ - Step 10042: {'lr': 0.0004963671136642997, 'samples': 1928064, 'steps': 10041, 'loss/train': 1.8179422616958618} -11/06/2021 22:38:34 - INFO - __main__ - Step 10043: {'lr': 0.0004963662122129284, 'samples': 1928256, 'steps': 10042, 'loss/train': 1.5947130918502808} -11/06/2021 22:38:34 - INFO - __main__ - Step 10044: {'lr': 0.0004963653106505483, 'samples': 1928448, 'steps': 10043, 'loss/train': 2.2334413528442383} -11/06/2021 22:38:34 - INFO - __main__ - Step 10045: {'lr': 0.0004963644089771598, 'samples': 1928640, 'steps': 10044, 'loss/train': 1.9353092908859253} -11/06/2021 22:38:35 - INFO - __main__ - Step 10046: {'lr': 0.0004963635071927633, 'samples': 1928832, 'steps': 10045, 'loss/train': 1.261295199394226} -11/06/2021 22:38:35 - INFO - __main__ - Step 10047: {'lr': 0.0004963626052973592, 'samples': 1929024, 'steps': 10046, 'loss/train': 1.8938654661178589} -11/06/2021 22:38:36 - INFO - __main__ - Step 10048: {'lr': 0.0004963617032909479, 'samples': 1929216, 'steps': 10047, 'loss/train': 1.5131046772003174} -11/06/2021 22:38:36 - INFO - __main__ - Step 10049: {'lr': 0.0004963608011735298, 'samples': 1929408, 'steps': 10048, 'loss/train': 1.5676438808441162} -11/06/2021 22:38:37 - INFO - __main__ - Step 10050: {'lr': 0.0004963598989451053, 'samples': 1929600, 'steps': 10049, 'loss/train': 1.8830301761627197} -11/06/2021 22:38:37 - INFO - __main__ - Step 10051: {'lr': 0.000496358996605675, 'samples': 1929792, 'steps': 10050, 'loss/train': 1.9643739461898804} -11/06/2021 22:38:37 - INFO - __main__ - Step 10052: {'lr': 0.0004963580941552391, 'samples': 1929984, 'steps': 10051, 'loss/train': 1.7612366676330566} -11/06/2021 22:38:38 - INFO - __main__ - Step 10053: {'lr': 0.0004963571915937979, 'samples': 1930176, 'steps': 10052, 'loss/train': 1.8770025968551636} -11/06/2021 22:38:39 - INFO - __main__ - Step 10054: {'lr': 0.000496356288921352, 'samples': 1930368, 'steps': 10053, 'loss/train': 1.7088673114776611} -11/06/2021 22:38:39 - INFO - __main__ - Step 10055: {'lr': 0.0004963553861379018, 'samples': 1930560, 'steps': 10054, 'loss/train': 2.023212194442749} -11/06/2021 22:38:39 - INFO - __main__ - Step 10056: {'lr': 0.0004963544832434476, 'samples': 1930752, 'steps': 10055, 'loss/train': 1.9566535949707031} -11/06/2021 22:38:40 - INFO - __main__ - Step 10057: {'lr': 0.00049635358023799, 'samples': 1930944, 'steps': 10056, 'loss/train': 1.7718608379364014} -11/06/2021 22:38:41 - INFO - __main__ - Step 10058: {'lr': 0.0004963526771215291, 'samples': 1931136, 'steps': 10057, 'loss/train': 1.9035671949386597} -11/06/2021 22:38:41 - INFO - __main__ - Step 10059: {'lr': 0.0004963517738940656, 'samples': 1931328, 'steps': 10058, 'loss/train': 1.7526215314865112} -11/06/2021 22:38:41 - INFO - __main__ - Step 10060: {'lr': 0.0004963508705555998, 'samples': 1931520, 'steps': 10059, 'loss/train': 1.9995636940002441} -11/06/2021 22:38:42 - INFO - __main__ - Step 10061: {'lr': 0.000496349967106132, 'samples': 1931712, 'steps': 10060, 'loss/train': 1.6497392654418945} -11/06/2021 22:38:42 - INFO - __main__ - Step 10062: {'lr': 0.0004963490635456629, 'samples': 1931904, 'steps': 10061, 'loss/train': 1.680986762046814} -11/06/2021 22:38:42 - INFO - __main__ - Step 10063: {'lr': 0.0004963481598741925, 'samples': 1932096, 'steps': 10062, 'loss/train': 1.8724141120910645} -11/06/2021 22:38:43 - INFO - __main__ - Step 10064: {'lr': 0.0004963472560917216, 'samples': 1932288, 'steps': 10063, 'loss/train': 1.6809192895889282} -11/06/2021 22:38:44 - INFO - __main__ - Step 10065: {'lr': 0.0004963463521982503, 'samples': 1932480, 'steps': 10064, 'loss/train': 1.8800909519195557} -11/06/2021 22:38:44 - INFO - __main__ - Step 10066: {'lr': 0.0004963454481937791, 'samples': 1932672, 'steps': 10065, 'loss/train': 1.9918426275253296} -11/06/2021 22:38:45 - INFO - __main__ - Step 10067: {'lr': 0.0004963445440783086, 'samples': 1932864, 'steps': 10066, 'loss/train': 1.8763664960861206} -11/06/2021 22:38:45 - INFO - __main__ - Step 10068: {'lr': 0.0004963436398518389, 'samples': 1933056, 'steps': 10067, 'loss/train': 1.3873255252838135} -11/06/2021 22:38:46 - INFO - __main__ - Step 10069: {'lr': 0.0004963427355143706, 'samples': 1933248, 'steps': 10068, 'loss/train': 1.4686658382415771} -11/06/2021 22:38:46 - INFO - __main__ - Step 10070: {'lr': 0.0004963418310659041, 'samples': 1933440, 'steps': 10069, 'loss/train': 1.890317440032959} -11/06/2021 22:38:47 - INFO - __main__ - Step 10071: {'lr': 0.0004963409265064398, 'samples': 1933632, 'steps': 10070, 'loss/train': 1.8712046146392822} -11/06/2021 22:38:47 - INFO - __main__ - Step 10072: {'lr': 0.0004963400218359781, 'samples': 1933824, 'steps': 10071, 'loss/train': 1.9994356632232666} -11/06/2021 22:38:47 - INFO - __main__ - Step 10073: {'lr': 0.0004963391170545193, 'samples': 1934016, 'steps': 10072, 'loss/train': 1.4278088808059692} -11/06/2021 22:38:48 - INFO - __main__ - Step 10074: {'lr': 0.0004963382121620639, 'samples': 1934208, 'steps': 10073, 'loss/train': 1.821343183517456} -11/06/2021 22:38:49 - INFO - __main__ - Step 10075: {'lr': 0.0004963373071586123, 'samples': 1934400, 'steps': 10074, 'loss/train': 2.091646909713745} -11/06/2021 22:38:49 - INFO - __main__ - Step 10076: {'lr': 0.000496336402044165, 'samples': 1934592, 'steps': 10075, 'loss/train': 1.838132619857788} -11/06/2021 22:38:49 - INFO - __main__ - Step 10077: {'lr': 0.0004963354968187222, 'samples': 1934784, 'steps': 10076, 'loss/train': 1.6847151517868042} -11/06/2021 22:38:50 - INFO - __main__ - Step 10078: {'lr': 0.0004963345914822845, 'samples': 1934976, 'steps': 10077, 'loss/train': 1.5948516130447388} -11/06/2021 22:38:51 - INFO - __main__ - Step 10079: {'lr': 0.0004963336860348521, 'samples': 1935168, 'steps': 10078, 'loss/train': 1.8252551555633545} -11/06/2021 22:38:51 - INFO - __main__ - Step 10080: {'lr': 0.0004963327804764257, 'samples': 1935360, 'steps': 10079, 'loss/train': 1.9088850021362305} -11/06/2021 22:38:52 - INFO - __main__ - Step 10081: {'lr': 0.0004963318748070056, 'samples': 1935552, 'steps': 10080, 'loss/train': 1.7089757919311523} -11/06/2021 22:38:52 - INFO - __main__ - Step 10082: {'lr': 0.0004963309690265921, 'samples': 1935744, 'steps': 10081, 'loss/train': 1.9372551441192627} -11/06/2021 22:38:52 - INFO - __main__ - Step 10083: {'lr': 0.0004963300631351856, 'samples': 1935936, 'steps': 10082, 'loss/train': 1.6880172491073608} -11/06/2021 22:38:53 - INFO - __main__ - Step 10084: {'lr': 0.0004963291571327866, 'samples': 1936128, 'steps': 10083, 'loss/train': 1.8040343523025513} -11/06/2021 22:38:54 - INFO - __main__ - Step 10085: {'lr': 0.0004963282510193955, 'samples': 1936320, 'steps': 10084, 'loss/train': 1.7773646116256714} -11/06/2021 22:38:54 - INFO - __main__ - Step 10086: {'lr': 0.0004963273447950126, 'samples': 1936512, 'steps': 10085, 'loss/train': 1.7499951124191284} -11/06/2021 22:38:54 - INFO - __main__ - Step 10087: {'lr': 0.0004963264384596386, 'samples': 1936704, 'steps': 10086, 'loss/train': 1.3979496955871582} -11/06/2021 22:38:55 - INFO - __main__ - Step 10088: {'lr': 0.0004963255320132735, 'samples': 1936896, 'steps': 10087, 'loss/train': 2.1118416786193848} -11/06/2021 22:38:55 - INFO - __main__ - Step 10089: {'lr': 0.0004963246254559181, 'samples': 1937088, 'steps': 10088, 'loss/train': 1.7357311248779297} -11/06/2021 22:38:56 - INFO - __main__ - Step 10090: {'lr': 0.0004963237187875724, 'samples': 1937280, 'steps': 10089, 'loss/train': 1.6976773738861084} -11/06/2021 22:38:56 - INFO - __main__ - Step 10091: {'lr': 0.0004963228120082372, 'samples': 1937472, 'steps': 10090, 'loss/train': 2.041823148727417} -11/06/2021 22:38:57 - INFO - __main__ - Step 10092: {'lr': 0.0004963219051179127, 'samples': 1937664, 'steps': 10091, 'loss/train': 1.77364182472229} -11/06/2021 22:38:57 - INFO - __main__ - Step 10093: {'lr': 0.0004963209981165993, 'samples': 1937856, 'steps': 10092, 'loss/train': 2.122255802154541} -11/06/2021 22:38:57 - INFO - __main__ - Step 10094: {'lr': 0.0004963200910042976, 'samples': 1938048, 'steps': 10093, 'loss/train': 1.8102829456329346} -11/06/2021 22:38:59 - INFO - __main__ - Step 10095: {'lr': 0.0004963191837810077, 'samples': 1938240, 'steps': 10094, 'loss/train': 1.7681382894515991} -11/06/2021 22:38:59 - INFO - __main__ - Step 10096: {'lr': 0.0004963182764467303, 'samples': 1938432, 'steps': 10095, 'loss/train': 1.8665366172790527} -11/06/2021 22:38:59 - INFO - __main__ - Step 10097: {'lr': 0.0004963173690014656, 'samples': 1938624, 'steps': 10096, 'loss/train': 2.1923022270202637} -11/06/2021 22:39:00 - INFO - __main__ - Step 10098: {'lr': 0.0004963164614452142, 'samples': 1938816, 'steps': 10097, 'loss/train': 1.7837992906570435} -11/06/2021 22:39:00 - INFO - __main__ - Step 10099: {'lr': 0.0004963155537779764, 'samples': 1939008, 'steps': 10098, 'loss/train': 1.7613967657089233} -11/06/2021 22:39:01 - INFO - __main__ - Step 10100: {'lr': 0.0004963146459997525, 'samples': 1939200, 'steps': 10099, 'loss/train': 0.7903871536254883} -11/06/2021 22:39:01 - INFO - __main__ - Step 10101: {'lr': 0.0004963137381105431, 'samples': 1939392, 'steps': 10100, 'loss/train': 2.0459229946136475} -11/06/2021 22:39:02 - INFO - __main__ - Step 10102: {'lr': 0.0004963128301103485, 'samples': 1939584, 'steps': 10101, 'loss/train': 1.6579885482788086} -11/06/2021 22:39:02 - INFO - __main__ - Step 10103: {'lr': 0.0004963119219991691, 'samples': 1939776, 'steps': 10102, 'loss/train': 1.9690332412719727} -11/06/2021 22:39:02 - INFO - __main__ - Step 10104: {'lr': 0.0004963110137770054, 'samples': 1939968, 'steps': 10103, 'loss/train': 1.717148780822754} -11/06/2021 22:39:04 - INFO - __main__ - Step 10105: {'lr': 0.0004963101054438578, 'samples': 1940160, 'steps': 10104, 'loss/train': 2.5613667964935303} -11/06/2021 22:39:04 - INFO - __main__ - Step 10106: {'lr': 0.0004963091969997265, 'samples': 1940352, 'steps': 10105, 'loss/train': 1.79701566696167} -11/06/2021 22:39:05 - INFO - __main__ - Step 10107: {'lr': 0.0004963082884446123, 'samples': 1940544, 'steps': 10106, 'loss/train': 1.8763283491134644} -11/06/2021 22:39:05 - INFO - __main__ - Step 10108: {'lr': 0.0004963073797785153, 'samples': 1940736, 'steps': 10107, 'loss/train': 1.9007415771484375} -11/06/2021 22:39:06 - INFO - __main__ - Step 10109: {'lr': 0.000496306471001436, 'samples': 1940928, 'steps': 10108, 'loss/train': 0.9993707537651062} -11/06/2021 22:39:06 - INFO - __main__ - Step 10110: {'lr': 0.0004963055621133748, 'samples': 1941120, 'steps': 10109, 'loss/train': 1.6748651266098022} -11/06/2021 22:39:06 - INFO - __main__ - Step 10111: {'lr': 0.0004963046531143321, 'samples': 1941312, 'steps': 10110, 'loss/train': 1.998529076576233} -11/06/2021 22:39:07 - INFO - __main__ - Step 10112: {'lr': 0.0004963037440043083, 'samples': 1941504, 'steps': 10111, 'loss/train': 1.8323516845703125} -11/06/2021 22:39:08 - INFO - __main__ - Step 10113: {'lr': 0.0004963028347833038, 'samples': 1941696, 'steps': 10112, 'loss/train': 2.443237066268921} -11/06/2021 22:39:08 - INFO - __main__ - Step 10114: {'lr': 0.0004963019254513191, 'samples': 1941888, 'steps': 10113, 'loss/train': 1.495759129524231} -11/06/2021 22:39:08 - INFO - __main__ - Step 10115: {'lr': 0.0004963010160083546, 'samples': 1942080, 'steps': 10114, 'loss/train': 1.9651312828063965} -11/06/2021 22:39:09 - INFO - __main__ - Step 10116: {'lr': 0.0004963001064544106, 'samples': 1942272, 'steps': 10115, 'loss/train': 1.4049568176269531} -11/06/2021 22:39:10 - INFO - __main__ - Step 10117: {'lr': 0.0004962991967894876, 'samples': 1942464, 'steps': 10116, 'loss/train': 1.3363804817199707} -11/06/2021 22:39:10 - INFO - __main__ - Step 10118: {'lr': 0.0004962982870135859, 'samples': 1942656, 'steps': 10117, 'loss/train': 1.6501933336257935} -11/06/2021 22:39:11 - INFO - __main__ - Step 10119: {'lr': 0.0004962973771267061, 'samples': 1942848, 'steps': 10118, 'loss/train': 1.7426259517669678} -11/06/2021 22:39:11 - INFO - __main__ - Step 10120: {'lr': 0.0004962964671288484, 'samples': 1943040, 'steps': 10119, 'loss/train': 1.8889999389648438} -11/06/2021 22:39:11 - INFO - __main__ - Step 10121: {'lr': 0.0004962955570200135, 'samples': 1943232, 'steps': 10120, 'loss/train': 1.7648907899856567} -11/06/2021 22:39:12 - INFO - __main__ - Step 10122: {'lr': 0.0004962946468002014, 'samples': 1943424, 'steps': 10121, 'loss/train': 2.164283514022827} -11/06/2021 22:39:13 - INFO - __main__ - Step 10123: {'lr': 0.0004962937364694129, 'samples': 1943616, 'steps': 10122, 'loss/train': 2.0995631217956543} -11/06/2021 22:39:13 - INFO - __main__ - Step 10124: {'lr': 0.0004962928260276481, 'samples': 1943808, 'steps': 10123, 'loss/train': 0.9570446014404297} -11/06/2021 22:39:13 - INFO - __main__ - Step 10125: {'lr': 0.0004962919154749077, 'samples': 1944000, 'steps': 10124, 'loss/train': 1.9521758556365967} -11/06/2021 22:39:14 - INFO - __main__ - Step 10126: {'lr': 0.0004962910048111919, 'samples': 1944192, 'steps': 10125, 'loss/train': 1.8387959003448486} -11/06/2021 22:39:14 - INFO - __main__ - Step 10127: {'lr': 0.0004962900940365012, 'samples': 1944384, 'steps': 10126, 'loss/train': 1.178709864616394} -11/06/2021 22:39:15 - INFO - __main__ - Step 10128: {'lr': 0.0004962891831508359, 'samples': 1944576, 'steps': 10127, 'loss/train': 1.920640230178833} -11/06/2021 22:39:15 - INFO - __main__ - Step 10129: {'lr': 0.0004962882721541965, 'samples': 1944768, 'steps': 10128, 'loss/train': 1.703497290611267} -11/06/2021 22:39:16 - INFO - __main__ - Step 10130: {'lr': 0.0004962873610465835, 'samples': 1944960, 'steps': 10129, 'loss/train': 1.4937912225723267} -11/06/2021 22:39:16 - INFO - __main__ - Step 10131: {'lr': 0.0004962864498279972, 'samples': 1945152, 'steps': 10130, 'loss/train': 1.5674489736557007} -11/06/2021 22:39:17 - INFO - __main__ - Step 10132: {'lr': 0.000496285538498438, 'samples': 1945344, 'steps': 10131, 'loss/train': 1.649821162223816} -11/06/2021 22:39:18 - INFO - __main__ - Step 10133: {'lr': 0.0004962846270579062, 'samples': 1945536, 'steps': 10132, 'loss/train': 1.809035062789917} -11/06/2021 22:39:18 - INFO - __main__ - Step 10134: {'lr': 0.0004962837155064025, 'samples': 1945728, 'steps': 10133, 'loss/train': 1.8651890754699707} -11/06/2021 22:39:18 - INFO - __main__ - Step 10135: {'lr': 0.0004962828038439272, 'samples': 1945920, 'steps': 10134, 'loss/train': 1.8161650896072388} -11/06/2021 22:39:19 - INFO - __main__ - Step 10136: {'lr': 0.0004962818920704805, 'samples': 1946112, 'steps': 10135, 'loss/train': 2.1492648124694824} -11/06/2021 22:39:19 - INFO - __main__ - Step 10137: {'lr': 0.0004962809801860632, 'samples': 1946304, 'steps': 10136, 'loss/train': 1.2017062902450562} -11/06/2021 22:39:20 - INFO - __main__ - Step 10138: {'lr': 0.0004962800681906753, 'samples': 1946496, 'steps': 10137, 'loss/train': 1.8302303552627563} -11/06/2021 22:39:20 - INFO - __main__ - Step 10139: {'lr': 0.0004962791560843175, 'samples': 1946688, 'steps': 10138, 'loss/train': 1.9001319408416748} -11/06/2021 22:39:21 - INFO - __main__ - Step 10140: {'lr': 0.00049627824386699, 'samples': 1946880, 'steps': 10139, 'loss/train': 1.766602873802185} -11/06/2021 22:39:21 - INFO - __main__ - Step 10141: {'lr': 0.0004962773315386935, 'samples': 1947072, 'steps': 10140, 'loss/train': 2.360720157623291} -11/06/2021 22:39:21 - INFO - __main__ - Step 10142: {'lr': 0.0004962764190994282, 'samples': 1947264, 'steps': 10141, 'loss/train': 1.9311211109161377} -11/06/2021 22:39:22 - INFO - __main__ - Step 10143: {'lr': 0.0004962755065491944, 'samples': 1947456, 'steps': 10142, 'loss/train': 1.6629748344421387} -11/06/2021 22:39:23 - INFO - __main__ - Step 10144: {'lr': 0.0004962745938879928, 'samples': 1947648, 'steps': 10143, 'loss/train': 2.1842613220214844} -11/06/2021 22:39:23 - INFO - __main__ - Step 10145: {'lr': 0.0004962736811158236, 'samples': 1947840, 'steps': 10144, 'loss/train': 1.8755285739898682} -11/06/2021 22:39:23 - INFO - __main__ - Step 10146: {'lr': 0.0004962727682326873, 'samples': 1948032, 'steps': 10145, 'loss/train': 1.2577018737792969} -11/06/2021 22:39:24 - INFO - __main__ - Step 10147: {'lr': 0.0004962718552385843, 'samples': 1948224, 'steps': 10146, 'loss/train': 1.5316803455352783} -11/06/2021 22:39:25 - INFO - __main__ - Step 10148: {'lr': 0.000496270942133515, 'samples': 1948416, 'steps': 10147, 'loss/train': 2.5291173458099365} -11/06/2021 22:39:25 - INFO - __main__ - Step 10149: {'lr': 0.0004962700289174798, 'samples': 1948608, 'steps': 10148, 'loss/train': 1.7601622343063354} -11/06/2021 22:39:26 - INFO - __main__ - Step 10150: {'lr': 0.0004962691155904791, 'samples': 1948800, 'steps': 10149, 'loss/train': 1.9934760332107544} -11/06/2021 22:39:26 - INFO - __main__ - Step 10151: {'lr': 0.0004962682021525134, 'samples': 1948992, 'steps': 10150, 'loss/train': 1.820966124534607} -11/06/2021 22:39:26 - INFO - __main__ - Step 10152: {'lr': 0.000496267288603583, 'samples': 1949184, 'steps': 10151, 'loss/train': 1.7241519689559937} -11/06/2021 22:39:27 - INFO - __main__ - Step 10153: {'lr': 0.0004962663749436883, 'samples': 1949376, 'steps': 10152, 'loss/train': 1.250434160232544} -11/06/2021 22:39:28 - INFO - __main__ - Step 10154: {'lr': 0.0004962654611728299, 'samples': 1949568, 'steps': 10153, 'loss/train': 1.601660966873169} -11/06/2021 22:39:28 - INFO - __main__ - Step 10155: {'lr': 0.000496264547291008, 'samples': 1949760, 'steps': 10154, 'loss/train': 1.6472324132919312} -11/06/2021 22:39:28 - INFO - __main__ - Step 10156: {'lr': 0.0004962636332982232, 'samples': 1949952, 'steps': 10155, 'loss/train': 0.9378107786178589} -11/06/2021 22:39:29 - INFO - __main__ - Step 10157: {'lr': 0.0004962627191944756, 'samples': 1950144, 'steps': 10156, 'loss/train': 1.7389650344848633} -11/06/2021 22:39:29 - INFO - __main__ - Step 10158: {'lr': 0.000496261804979766, 'samples': 1950336, 'steps': 10157, 'loss/train': 1.7131973505020142} -11/06/2021 22:39:30 - INFO - __main__ - Step 10159: {'lr': 0.0004962608906540946, 'samples': 1950528, 'steps': 10158, 'loss/train': 1.5908807516098022} -11/06/2021 22:39:30 - INFO - __main__ - Step 10160: {'lr': 0.0004962599762174618, 'samples': 1950720, 'steps': 10159, 'loss/train': 1.8197942972183228} -11/06/2021 22:39:31 - INFO - __main__ - Step 10161: {'lr': 0.0004962590616698681, 'samples': 1950912, 'steps': 10160, 'loss/train': 1.3586111068725586} -11/06/2021 22:39:31 - INFO - __main__ - Step 10162: {'lr': 0.0004962581470113138, 'samples': 1951104, 'steps': 10161, 'loss/train': 1.4758445024490356} -11/06/2021 22:39:31 - INFO - __main__ - Step 10163: {'lr': 0.0004962572322417994, 'samples': 1951296, 'steps': 10162, 'loss/train': 2.033109426498413} -11/06/2021 22:39:33 - INFO - __main__ - Step 10164: {'lr': 0.0004962563173613254, 'samples': 1951488, 'steps': 10163, 'loss/train': 2.092374324798584} -11/06/2021 22:39:33 - INFO - __main__ - Step 10165: {'lr': 0.000496255402369892, 'samples': 1951680, 'steps': 10164, 'loss/train': 1.1480693817138672} -11/06/2021 22:39:33 - INFO - __main__ - Step 10166: {'lr': 0.0004962544872674997, 'samples': 1951872, 'steps': 10165, 'loss/train': 1.6419637203216553} -11/06/2021 22:39:34 - INFO - __main__ - Step 10167: {'lr': 0.000496253572054149, 'samples': 1952064, 'steps': 10166, 'loss/train': 2.001441240310669} -11/06/2021 22:39:34 - INFO - __main__ - Step 10168: {'lr': 0.0004962526567298402, 'samples': 1952256, 'steps': 10167, 'loss/train': 0.8515803217887878} -11/06/2021 22:39:35 - INFO - __main__ - Step 10169: {'lr': 0.0004962517412945738, 'samples': 1952448, 'steps': 10168, 'loss/train': 1.8724167346954346} -11/06/2021 22:39:35 - INFO - __main__ - Step 10170: {'lr': 0.00049625082574835, 'samples': 1952640, 'steps': 10169, 'loss/train': 1.8901619911193848} -11/06/2021 22:39:36 - INFO - __main__ - Step 10171: {'lr': 0.0004962499100911696, 'samples': 1952832, 'steps': 10170, 'loss/train': 1.726631999015808} -11/06/2021 22:39:36 - INFO - __main__ - Step 10172: {'lr': 0.0004962489943230326, 'samples': 1953024, 'steps': 10171, 'loss/train': 1.2755616903305054} -11/06/2021 22:39:36 - INFO - __main__ - Step 10173: {'lr': 0.0004962480784439397, 'samples': 1953216, 'steps': 10172, 'loss/train': 1.9039602279663086} -11/06/2021 22:39:38 - INFO - __main__ - Step 10174: {'lr': 0.0004962471624538913, 'samples': 1953408, 'steps': 10173, 'loss/train': 2.694628953933716} -11/06/2021 22:39:38 - INFO - __main__ - Step 10175: {'lr': 0.0004962462463528875, 'samples': 1953600, 'steps': 10174, 'loss/train': 1.5455642938613892} -11/06/2021 22:39:38 - INFO - __main__ - Step 10176: {'lr': 0.0004962453301409291, 'samples': 1953792, 'steps': 10175, 'loss/train': 2.612506866455078} -11/06/2021 22:39:39 - INFO - __main__ - Step 10177: {'lr': 0.0004962444138180164, 'samples': 1953984, 'steps': 10176, 'loss/train': 1.5094280242919922} -11/06/2021 22:39:39 - INFO - __main__ - Step 10178: {'lr': 0.0004962434973841497, 'samples': 1954176, 'steps': 10177, 'loss/train': 1.740395426750183} -11/06/2021 22:39:39 - INFO - __main__ - Step 10179: {'lr': 0.0004962425808393295, 'samples': 1954368, 'steps': 10178, 'loss/train': 1.4363911151885986} -11/06/2021 22:39:40 - INFO - __main__ - Step 10180: {'lr': 0.000496241664183556, 'samples': 1954560, 'steps': 10179, 'loss/train': 1.8234004974365234} -11/06/2021 22:39:41 - INFO - __main__ - Step 10181: {'lr': 0.0004962407474168301, 'samples': 1954752, 'steps': 10180, 'loss/train': 2.219465970993042} -11/06/2021 22:39:41 - INFO - __main__ - Step 10182: {'lr': 0.0004962398305391518, 'samples': 1954944, 'steps': 10181, 'loss/train': 1.733228087425232} -11/06/2021 22:39:41 - INFO - __main__ - Step 10183: {'lr': 0.0004962389135505217, 'samples': 1955136, 'steps': 10182, 'loss/train': 1.9149515628814697} -11/06/2021 22:39:42 - INFO - __main__ - Step 10184: {'lr': 0.00049623799645094, 'samples': 1955328, 'steps': 10183, 'loss/train': 1.2486367225646973} -11/06/2021 22:39:43 - INFO - __main__ - Step 10185: {'lr': 0.0004962370792404073, 'samples': 1955520, 'steps': 10184, 'loss/train': 1.7573951482772827} -11/06/2021 22:39:43 - INFO - __main__ - Step 10186: {'lr': 0.000496236161918924, 'samples': 1955712, 'steps': 10185, 'loss/train': 2.166736125946045} -11/06/2021 22:39:43 - INFO - __main__ - Step 10187: {'lr': 0.0004962352444864904, 'samples': 1955904, 'steps': 10186, 'loss/train': 1.8243874311447144} -11/06/2021 22:39:44 - INFO - __main__ - Step 10188: {'lr': 0.0004962343269431072, 'samples': 1956096, 'steps': 10187, 'loss/train': 1.3378742933273315} -11/06/2021 22:39:44 - INFO - __main__ - Step 10189: {'lr': 0.0004962334092887744, 'samples': 1956288, 'steps': 10188, 'loss/train': 1.5770504474639893} -11/06/2021 22:39:45 - INFO - __main__ - Step 10190: {'lr': 0.0004962324915234928, 'samples': 1956480, 'steps': 10189, 'loss/train': 1.703421711921692} -11/06/2021 22:39:46 - INFO - __main__ - Step 10191: {'lr': 0.0004962315736472626, 'samples': 1956672, 'steps': 10190, 'loss/train': 1.7759064435958862} -11/06/2021 22:39:46 - INFO - __main__ - Step 10192: {'lr': 0.0004962306556600842, 'samples': 1956864, 'steps': 10191, 'loss/train': 1.7851485013961792} -11/06/2021 22:39:46 - INFO - __main__ - Step 10193: {'lr': 0.0004962297375619581, 'samples': 1957056, 'steps': 10192, 'loss/train': 1.8357267379760742} -11/06/2021 22:39:47 - INFO - __main__ - Step 10194: {'lr': 0.0004962288193528846, 'samples': 1957248, 'steps': 10193, 'loss/train': 1.8837649822235107} -11/06/2021 22:39:48 - INFO - __main__ - Step 10195: {'lr': 0.0004962279010328642, 'samples': 1957440, 'steps': 10194, 'loss/train': 1.5941526889801025} -11/06/2021 22:39:48 - INFO - __main__ - Step 10196: {'lr': 0.0004962269826018974, 'samples': 1957632, 'steps': 10195, 'loss/train': 1.2281931638717651} -11/06/2021 22:39:48 - INFO - __main__ - Step 10197: {'lr': 0.0004962260640599845, 'samples': 1957824, 'steps': 10196, 'loss/train': 1.6017422676086426} -11/06/2021 22:39:49 - INFO - __main__ - Step 10198: {'lr': 0.0004962251454071259, 'samples': 1958016, 'steps': 10197, 'loss/train': 1.4461283683776855} -11/06/2021 22:39:49 - INFO - __main__ - Step 10199: {'lr': 0.0004962242266433221, 'samples': 1958208, 'steps': 10198, 'loss/train': 1.918282151222229} -11/06/2021 22:39:51 - INFO - __main__ - Step 10200: {'lr': 0.0004962233077685734, 'samples': 1958400, 'steps': 10199, 'loss/train': 1.5870373249053955} -11/06/2021 22:39:51 - INFO - __main__ - Step 10201: {'lr': 0.0004962223887828803, 'samples': 1958592, 'steps': 10200, 'loss/train': 1.9776827096939087} -11/06/2021 22:39:52 - INFO - __main__ - Step 10202: {'lr': 0.0004962214696862432, 'samples': 1958784, 'steps': 10201, 'loss/train': 1.859332799911499} -11/06/2021 22:39:52 - INFO - __main__ - Step 10203: {'lr': 0.0004962205504786626, 'samples': 1958976, 'steps': 10202, 'loss/train': 1.5587915182113647} -11/06/2021 22:39:52 - INFO - __main__ - Step 10204: {'lr': 0.0004962196311601386, 'samples': 1959168, 'steps': 10203, 'loss/train': 2.007300615310669} -11/06/2021 22:39:53 - INFO - __main__ - Step 10205: {'lr': 0.000496218711730672, 'samples': 1959360, 'steps': 10204, 'loss/train': 1.5240142345428467} -11/06/2021 22:39:53 - INFO - __main__ - Step 10206: {'lr': 0.000496217792190263, 'samples': 1959552, 'steps': 10205, 'loss/train': 1.8262863159179688} -11/06/2021 22:39:54 - INFO - __main__ - Step 10207: {'lr': 0.0004962168725389121, 'samples': 1959744, 'steps': 10206, 'loss/train': 1.8134788274765015} -11/06/2021 22:39:54 - INFO - __main__ - Step 10208: {'lr': 0.0004962159527766196, 'samples': 1959936, 'steps': 10207, 'loss/train': 1.8182828426361084} -11/06/2021 22:39:55 - INFO - __main__ - Step 10209: {'lr': 0.000496215032903386, 'samples': 1960128, 'steps': 10208, 'loss/train': 2.6121604442596436} -11/06/2021 22:39:55 - INFO - __main__ - Step 10210: {'lr': 0.0004962141129192118, 'samples': 1960320, 'steps': 10209, 'loss/train': 1.8937207460403442} -11/06/2021 22:39:56 - INFO - __main__ - Step 10211: {'lr': 0.0004962131928240972, 'samples': 1960512, 'steps': 10210, 'loss/train': 2.1297640800476074} -11/06/2021 22:39:56 - INFO - __main__ - Step 10212: {'lr': 0.0004962122726180428, 'samples': 1960704, 'steps': 10211, 'loss/train': 1.8525015115737915} -11/06/2021 22:39:57 - INFO - __main__ - Step 10213: {'lr': 0.000496211352301049, 'samples': 1960896, 'steps': 10212, 'loss/train': 2.0309906005859375} -11/06/2021 22:39:57 - INFO - __main__ - Step 10214: {'lr': 0.0004962104318731161, 'samples': 1961088, 'steps': 10213, 'loss/train': 1.6677395105361938} -11/06/2021 22:39:58 - INFO - __main__ - Step 10215: {'lr': 0.0004962095113342445, 'samples': 1961280, 'steps': 10214, 'loss/train': 1.9678434133529663} -11/06/2021 22:39:58 - INFO - __main__ - Step 10216: {'lr': 0.0004962085906844348, 'samples': 1961472, 'steps': 10215, 'loss/train': 1.773742437362671} -11/06/2021 22:39:58 - INFO - __main__ - Step 10217: {'lr': 0.0004962076699236873, 'samples': 1961664, 'steps': 10216, 'loss/train': 1.3391557931900024} -11/06/2021 22:39:59 - INFO - __main__ - Step 10218: {'lr': 0.0004962067490520024, 'samples': 1961856, 'steps': 10217, 'loss/train': 1.5753556489944458} -11/06/2021 22:40:00 - INFO - __main__ - Step 10219: {'lr': 0.0004962058280693805, 'samples': 1962048, 'steps': 10218, 'loss/train': 1.1909321546554565} -11/06/2021 22:40:00 - INFO - __main__ - Step 10220: {'lr': 0.0004962049069758221, 'samples': 1962240, 'steps': 10219, 'loss/train': 2.3441052436828613} -11/06/2021 22:40:00 - INFO - __main__ - Step 10221: {'lr': 0.0004962039857713276, 'samples': 1962432, 'steps': 10220, 'loss/train': 2.0248935222625732} -11/06/2021 22:40:01 - INFO - __main__ - Step 10222: {'lr': 0.0004962030644558974, 'samples': 1962624, 'steps': 10221, 'loss/train': 2.0207021236419678} -11/06/2021 22:40:02 - INFO - __main__ - Step 10223: {'lr': 0.0004962021430295319, 'samples': 1962816, 'steps': 10222, 'loss/train': 2.0765750408172607} -11/06/2021 22:40:02 - INFO - __main__ - Step 10224: {'lr': 0.0004962012214922314, 'samples': 1963008, 'steps': 10223, 'loss/train': 1.82279372215271} -11/06/2021 22:40:02 - INFO - __main__ - Step 10225: {'lr': 0.0004962002998439966, 'samples': 1963200, 'steps': 10224, 'loss/train': 2.235682725906372} -11/06/2021 22:40:03 - INFO - __main__ - Step 10226: {'lr': 0.0004961993780848276, 'samples': 1963392, 'steps': 10225, 'loss/train': 1.372536301612854} -11/06/2021 22:40:03 - INFO - __main__ - Step 10227: {'lr': 0.000496198456214725, 'samples': 1963584, 'steps': 10226, 'loss/train': 2.1596105098724365} -11/06/2021 22:40:04 - INFO - __main__ - Step 10228: {'lr': 0.0004961975342336891, 'samples': 1963776, 'steps': 10227, 'loss/train': 1.9234440326690674} -11/06/2021 22:40:05 - INFO - __main__ - Step 10229: {'lr': 0.0004961966121417204, 'samples': 1963968, 'steps': 10228, 'loss/train': 1.7350918054580688} -11/06/2021 22:40:05 - INFO - __main__ - Step 10230: {'lr': 0.0004961956899388195, 'samples': 1964160, 'steps': 10229, 'loss/train': 1.6040425300598145} -11/06/2021 22:40:05 - INFO - __main__ - Step 10231: {'lr': 0.0004961947676249864, 'samples': 1964352, 'steps': 10230, 'loss/train': 1.6913650035858154} -11/06/2021 22:40:06 - INFO - __main__ - Step 10232: {'lr': 0.0004961938452002218, 'samples': 1964544, 'steps': 10231, 'loss/train': 1.3374961614608765} -11/06/2021 22:40:06 - INFO - __main__ - Step 10233: {'lr': 0.0004961929226645261, 'samples': 1964736, 'steps': 10232, 'loss/train': 1.7283188104629517} -11/06/2021 22:40:07 - INFO - __main__ - Step 10234: {'lr': 0.0004961920000178996, 'samples': 1964928, 'steps': 10233, 'loss/train': 1.5170456171035767} -11/06/2021 22:40:07 - INFO - __main__ - Step 10235: {'lr': 0.0004961910772603429, 'samples': 1965120, 'steps': 10234, 'loss/train': 1.6485928297042847} -11/06/2021 22:40:08 - INFO - __main__ - Step 10236: {'lr': 0.0004961901543918563, 'samples': 1965312, 'steps': 10235, 'loss/train': 1.1824220418930054} -11/06/2021 22:40:08 - INFO - __main__ - Step 10237: {'lr': 0.0004961892314124401, 'samples': 1965504, 'steps': 10236, 'loss/train': 1.3500611782073975} -11/06/2021 22:40:08 - INFO - __main__ - Step 10238: {'lr': 0.0004961883083220948, 'samples': 1965696, 'steps': 10237, 'loss/train': 1.5080724954605103} -11/06/2021 22:40:09 - INFO - __main__ - Step 10239: {'lr': 0.0004961873851208209, 'samples': 1965888, 'steps': 10238, 'loss/train': 1.8465136289596558} -11/06/2021 22:40:10 - INFO - __main__ - Step 10240: {'lr': 0.0004961864618086188, 'samples': 1966080, 'steps': 10239, 'loss/train': 1.8443377017974854} -11/06/2021 22:40:10 - INFO - __main__ - Step 10241: {'lr': 0.0004961855383854889, 'samples': 1966272, 'steps': 10240, 'loss/train': 1.4369864463806152} -11/06/2021 22:40:10 - INFO - __main__ - Step 10242: {'lr': 0.0004961846148514315, 'samples': 1966464, 'steps': 10241, 'loss/train': 1.790596842765808} -11/06/2021 22:40:11 - INFO - __main__ - Step 10243: {'lr': 0.0004961836912064472, 'samples': 1966656, 'steps': 10242, 'loss/train': 1.661517858505249} -11/06/2021 22:40:12 - INFO - __main__ - Step 10244: {'lr': 0.0004961827674505363, 'samples': 1966848, 'steps': 10243, 'loss/train': 0.9283877015113831} -11/06/2021 22:40:12 - INFO - __main__ - Step 10245: {'lr': 0.0004961818435836993, 'samples': 1967040, 'steps': 10244, 'loss/train': 2.5082814693450928} -11/06/2021 22:40:13 - INFO - __main__ - Step 10246: {'lr': 0.0004961809196059365, 'samples': 1967232, 'steps': 10245, 'loss/train': 0.8113244771957397} -11/06/2021 22:40:13 - INFO - __main__ - Step 10247: {'lr': 0.0004961799955172483, 'samples': 1967424, 'steps': 10246, 'loss/train': 1.7437840700149536} -11/06/2021 22:40:13 - INFO - __main__ - Step 10248: {'lr': 0.0004961790713176353, 'samples': 1967616, 'steps': 10247, 'loss/train': 1.9482618570327759} -11/06/2021 22:40:14 - INFO - __main__ - Step 10249: {'lr': 0.0004961781470070978, 'samples': 1967808, 'steps': 10248, 'loss/train': 1.7293133735656738} -11/06/2021 22:40:15 - INFO - __main__ - Step 10250: {'lr': 0.0004961772225856362, 'samples': 1968000, 'steps': 10249, 'loss/train': 1.6525590419769287} -11/06/2021 22:40:15 - INFO - __main__ - Step 10251: {'lr': 0.0004961762980532509, 'samples': 1968192, 'steps': 10250, 'loss/train': 1.758000135421753} -11/06/2021 22:40:15 - INFO - __main__ - Step 10252: {'lr': 0.0004961753734099425, 'samples': 1968384, 'steps': 10251, 'loss/train': 1.3765827417373657} -11/06/2021 22:40:16 - INFO - __main__ - Step 10253: {'lr': 0.0004961744486557112, 'samples': 1968576, 'steps': 10252, 'loss/train': 1.9734203815460205} -11/06/2021 22:40:17 - INFO - __main__ - Step 10254: {'lr': 0.0004961735237905574, 'samples': 1968768, 'steps': 10253, 'loss/train': 1.5639272928237915} -11/06/2021 22:40:17 - INFO - __main__ - Step 10255: {'lr': 0.0004961725988144816, 'samples': 1968960, 'steps': 10254, 'loss/train': 1.7732101678848267} -11/06/2021 22:40:17 - INFO - __main__ - Step 10256: {'lr': 0.0004961716737274844, 'samples': 1969152, 'steps': 10255, 'loss/train': 1.2973039150238037} -11/06/2021 22:40:18 - INFO - __main__ - Step 10257: {'lr': 0.0004961707485295659, 'samples': 1969344, 'steps': 10256, 'loss/train': 1.6465765237808228} -11/06/2021 22:40:18 - INFO - __main__ - Step 10258: {'lr': 0.0004961698232207268, 'samples': 1969536, 'steps': 10257, 'loss/train': 1.0470538139343262} -11/06/2021 22:40:18 - INFO - __main__ - Step 10259: {'lr': 0.0004961688978009672, 'samples': 1969728, 'steps': 10258, 'loss/train': 1.853024959564209} -11/06/2021 22:40:19 - INFO - __main__ - Step 10260: {'lr': 0.0004961679722702879, 'samples': 1969920, 'steps': 10259, 'loss/train': 1.3597272634506226} -11/06/2021 22:40:20 - INFO - __main__ - Step 10261: {'lr': 0.0004961670466286889, 'samples': 1970112, 'steps': 10260, 'loss/train': 1.9587664604187012} -11/06/2021 22:40:20 - INFO - __main__ - Step 10262: {'lr': 0.000496166120876171, 'samples': 1970304, 'steps': 10261, 'loss/train': 1.988135814666748} -11/06/2021 22:40:21 - INFO - __main__ - Step 10263: {'lr': 0.0004961651950127343, 'samples': 1970496, 'steps': 10262, 'loss/train': 1.9414300918579102} -11/06/2021 22:40:21 - INFO - __main__ - Step 10264: {'lr': 0.0004961642690383794, 'samples': 1970688, 'steps': 10263, 'loss/train': 1.9191449880599976} -11/06/2021 22:40:22 - INFO - __main__ - Step 10265: {'lr': 0.0004961633429531068, 'samples': 1970880, 'steps': 10264, 'loss/train': 2.015342950820923} -11/06/2021 22:40:22 - INFO - __main__ - Step 10266: {'lr': 0.0004961624167569166, 'samples': 1971072, 'steps': 10265, 'loss/train': 1.3776711225509644} -11/06/2021 22:40:23 - INFO - __main__ - Step 10267: {'lr': 0.0004961614904498095, 'samples': 1971264, 'steps': 10266, 'loss/train': 2.4013566970825195} -11/06/2021 22:40:23 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 1.6062275171279907} -11/06/2021 22:40:23 - INFO - __main__ - Step 10269: {'lr': 0.0004961596375028461, 'samples': 1971648, 'steps': 10268, 'loss/train': 1.3712677955627441} -11/06/2021 22:40:24 - INFO - __main__ - Step 10270: {'lr': 0.0004961587108629906, 'samples': 1971840, 'steps': 10269, 'loss/train': 1.1406784057617188} -11/06/2021 22:40:25 - INFO - __main__ - Step 10271: {'lr': 0.0004961577841122197, 'samples': 1972032, 'steps': 10270, 'loss/train': 1.5826045274734497} -11/06/2021 22:40:25 - INFO - __main__ - Step 10272: {'lr': 0.000496156857250534, 'samples': 1972224, 'steps': 10271, 'loss/train': 1.612403154373169} -11/06/2021 22:40:25 - INFO - __main__ - Step 10273: {'lr': 0.0004961559302779338, 'samples': 1972416, 'steps': 10272, 'loss/train': 1.9364298582077026} -11/06/2021 22:40:26 - INFO - __main__ - Step 10274: {'lr': 0.0004961550031944194, 'samples': 1972608, 'steps': 10273, 'loss/train': 1.6951217651367188} -11/06/2021 22:40:27 - INFO - __main__ - Step 10275: {'lr': 0.0004961540759999914, 'samples': 1972800, 'steps': 10274, 'loss/train': 2.1520490646362305} -11/06/2021 22:40:27 - INFO - __main__ - Step 10276: {'lr': 0.0004961531486946502, 'samples': 1972992, 'steps': 10275, 'loss/train': 1.9737766981124878} -11/06/2021 22:40:28 - INFO - __main__ - Step 10277: {'lr': 0.0004961522212783962, 'samples': 1973184, 'steps': 10276, 'loss/train': 1.5989540815353394} -11/06/2021 22:40:28 - INFO - __main__ - Step 10278: {'lr': 0.00049615129375123, 'samples': 1973376, 'steps': 10277, 'loss/train': 0.26742538809776306} -11/06/2021 22:40:29 - INFO - __main__ - Step 10279: {'lr': 0.0004961503661131515, 'samples': 1973568, 'steps': 10278, 'loss/train': 1.548420786857605} -11/06/2021 22:40:30 - INFO - __main__ - Step 10280: {'lr': 0.0004961494383641616, 'samples': 1973760, 'steps': 10279, 'loss/train': 1.5787936449050903} -11/06/2021 22:40:30 - INFO - __main__ - Step 10281: {'lr': 0.0004961485105042606, 'samples': 1973952, 'steps': 10280, 'loss/train': 2.117009401321411} -11/06/2021 22:40:30 - INFO - __main__ - Step 10282: {'lr': 0.0004961475825334488, 'samples': 1974144, 'steps': 10281, 'loss/train': 1.2511065006256104} -11/06/2021 22:40:31 - INFO - __main__ - Step 10283: {'lr': 0.0004961466544517267, 'samples': 1974336, 'steps': 10282, 'loss/train': 2.109795570373535} -11/06/2021 22:40:31 - INFO - __main__ - Step 10284: {'lr': 0.0004961457262590948, 'samples': 1974528, 'steps': 10283, 'loss/train': 1.5047543048858643} -11/06/2021 22:40:31 - INFO - __main__ - Step 10285: {'lr': 0.0004961447979555533, 'samples': 1974720, 'steps': 10284, 'loss/train': 1.6194933652877808} -11/06/2021 22:40:32 - INFO - __main__ - Step 10286: {'lr': 0.000496143869541103, 'samples': 1974912, 'steps': 10285, 'loss/train': 1.41692054271698} -11/06/2021 22:40:33 - INFO - __main__ - Step 10287: {'lr': 0.0004961429410157437, 'samples': 1975104, 'steps': 10286, 'loss/train': 1.688002586364746} -11/06/2021 22:40:33 - INFO - __main__ - Step 10288: {'lr': 0.0004961420123794764, 'samples': 1975296, 'steps': 10287, 'loss/train': 1.7760323286056519} -11/06/2021 22:40:34 - INFO - __main__ - Step 10289: {'lr': 0.0004961410836323014, 'samples': 1975488, 'steps': 10288, 'loss/train': 1.8118081092834473} -11/06/2021 22:40:34 - INFO - __main__ - Step 10290: {'lr': 0.0004961401547742189, 'samples': 1975680, 'steps': 10289, 'loss/train': 1.0009771585464478} -11/06/2021 22:40:35 - INFO - __main__ - Step 10291: {'lr': 0.0004961392258052294, 'samples': 1975872, 'steps': 10290, 'loss/train': 1.9054882526397705} -11/06/2021 22:40:35 - INFO - __main__ - Step 10292: {'lr': 0.0004961382967253335, 'samples': 1976064, 'steps': 10291, 'loss/train': 1.815101981163025} -11/06/2021 22:40:36 - INFO - __main__ - Step 10293: {'lr': 0.0004961373675345315, 'samples': 1976256, 'steps': 10292, 'loss/train': 1.6685025691986084} -11/06/2021 22:40:36 - INFO - __main__ - Step 10294: {'lr': 0.0004961364382328236, 'samples': 1976448, 'steps': 10293, 'loss/train': 1.8122519254684448} -11/06/2021 22:40:36 - INFO - __main__ - Step 10295: {'lr': 0.0004961355088202106, 'samples': 1976640, 'steps': 10294, 'loss/train': 1.760857105255127} -11/06/2021 22:40:37 - INFO - __main__ - Step 10296: {'lr': 0.0004961345792966926, 'samples': 1976832, 'steps': 10295, 'loss/train': 2.0797855854034424} -11/06/2021 22:40:38 - INFO - __main__ - Step 10297: {'lr': 0.0004961336496622702, 'samples': 1977024, 'steps': 10296, 'loss/train': 0.4716089367866516} -11/06/2021 22:40:38 - INFO - __main__ - Step 10298: {'lr': 0.0004961327199169438, 'samples': 1977216, 'steps': 10297, 'loss/train': 1.8852925300598145} -11/06/2021 22:40:39 - INFO - __main__ - Step 10299: {'lr': 0.0004961317900607138, 'samples': 1977408, 'steps': 10298, 'loss/train': 2.788236141204834} -11/06/2021 22:40:39 - INFO - __main__ - Step 10300: {'lr': 0.0004961308600935807, 'samples': 1977600, 'steps': 10299, 'loss/train': 1.8009984493255615} -11/06/2021 22:40:39 - INFO - __main__ - Step 10301: {'lr': 0.0004961299300155446, 'samples': 1977792, 'steps': 10300, 'loss/train': 1.9995626211166382} -11/06/2021 22:40:40 - INFO - __main__ - Step 10302: {'lr': 0.0004961289998266064, 'samples': 1977984, 'steps': 10301, 'loss/train': 1.1890935897827148} -11/06/2021 22:40:41 - INFO - __main__ - Step 10303: {'lr': 0.0004961280695267662, 'samples': 1978176, 'steps': 10302, 'loss/train': 1.4275264739990234} -11/06/2021 22:40:41 - INFO - __main__ - Step 10304: {'lr': 0.0004961271391160243, 'samples': 1978368, 'steps': 10303, 'loss/train': 1.8430927991867065} -11/06/2021 22:40:41 - INFO - __main__ - Step 10305: {'lr': 0.0004961262085943815, 'samples': 1978560, 'steps': 10304, 'loss/train': 1.3772211074829102} -11/06/2021 22:40:42 - INFO - __main__ - Step 10306: {'lr': 0.000496125277961838, 'samples': 1978752, 'steps': 10305, 'loss/train': 1.3290560245513916} -11/06/2021 22:40:43 - INFO - __main__ - Step 10307: {'lr': 0.0004961243472183942, 'samples': 1978944, 'steps': 10306, 'loss/train': 1.4642337560653687} -11/06/2021 22:40:43 - INFO - __main__ - Step 10308: {'lr': 0.0004961234163640507, 'samples': 1979136, 'steps': 10307, 'loss/train': 1.9507293701171875} -11/06/2021 22:40:43 - INFO - __main__ - Step 10309: {'lr': 0.0004961224853988076, 'samples': 1979328, 'steps': 10308, 'loss/train': 2.0494842529296875} -11/06/2021 22:40:44 - INFO - __main__ - Step 10310: {'lr': 0.0004961215543226657, 'samples': 1979520, 'steps': 10309, 'loss/train': 1.839885950088501} -11/06/2021 22:40:44 - INFO - __main__ - Step 10311: {'lr': 0.0004961206231356251, 'samples': 1979712, 'steps': 10310, 'loss/train': 1.5155304670333862} -11/06/2021 22:40:45 - INFO - __main__ - Step 10312: {'lr': 0.0004961196918376864, 'samples': 1979904, 'steps': 10311, 'loss/train': 1.361377239227295} -11/06/2021 22:40:46 - INFO - __main__ - Step 10313: {'lr': 0.0004961187604288498, 'samples': 1980096, 'steps': 10312, 'loss/train': 1.2928553819656372} -11/06/2021 22:40:46 - INFO - __main__ - Step 10314: {'lr': 0.0004961178289091161, 'samples': 1980288, 'steps': 10313, 'loss/train': 1.8654111623764038} -11/06/2021 22:40:46 - INFO - __main__ - Step 10315: {'lr': 0.0004961168972784855, 'samples': 1980480, 'steps': 10314, 'loss/train': 1.5969183444976807} -11/06/2021 22:40:47 - INFO - __main__ - Step 10316: {'lr': 0.0004961159655369582, 'samples': 1980672, 'steps': 10315, 'loss/train': 1.5698388814926147} -11/06/2021 22:40:48 - INFO - __main__ - Step 10317: {'lr': 0.0004961150336845351, 'samples': 1980864, 'steps': 10316, 'loss/train': 1.988451600074768} -11/06/2021 22:40:48 - INFO - __main__ - Step 10318: {'lr': 0.0004961141017212162, 'samples': 1981056, 'steps': 10317, 'loss/train': 1.8295103311538696} -11/06/2021 22:40:48 - INFO - __main__ - Step 10319: {'lr': 0.0004961131696470021, 'samples': 1981248, 'steps': 10318, 'loss/train': 1.9807548522949219} -11/06/2021 22:40:49 - INFO - __main__ - Step 10320: {'lr': 0.0004961122374618933, 'samples': 1981440, 'steps': 10319, 'loss/train': 1.6604183912277222} -11/06/2021 22:40:49 - INFO - __main__ - Step 10321: {'lr': 0.00049611130516589, 'samples': 1981632, 'steps': 10320, 'loss/train': 1.369404911994934} -11/06/2021 22:40:49 - INFO - __main__ - Step 10322: {'lr': 0.0004961103727589929, 'samples': 1981824, 'steps': 10321, 'loss/train': 1.0568779706954956} -11/06/2021 22:40:50 - INFO - __main__ - Step 10323: {'lr': 0.0004961094402412021, 'samples': 1982016, 'steps': 10322, 'loss/train': 1.5058151483535767} -11/06/2021 22:40:51 - INFO - __main__ - Step 10324: {'lr': 0.0004961085076125182, 'samples': 1982208, 'steps': 10323, 'loss/train': 1.933563470840454} -11/06/2021 22:40:51 - INFO - __main__ - Step 10325: {'lr': 0.0004961075748729418, 'samples': 1982400, 'steps': 10324, 'loss/train': 1.765858769416809} -11/06/2021 22:40:51 - INFO - __main__ - Step 10326: {'lr': 0.0004961066420224729, 'samples': 1982592, 'steps': 10325, 'loss/train': 1.309130072593689} -11/06/2021 22:40:52 - INFO - __main__ - Step 10327: {'lr': 0.0004961057090611123, 'samples': 1982784, 'steps': 10326, 'loss/train': 1.8366987705230713} -11/06/2021 22:40:53 - INFO - __main__ - Step 10328: {'lr': 0.0004961047759888601, 'samples': 1982976, 'steps': 10327, 'loss/train': 1.7899473905563354} -11/06/2021 22:40:53 - INFO - __main__ - Step 10329: {'lr': 0.000496103842805717, 'samples': 1983168, 'steps': 10328, 'loss/train': 1.4649665355682373} -11/06/2021 22:40:54 - INFO - __main__ - Step 10330: {'lr': 0.0004961029095116833, 'samples': 1983360, 'steps': 10329, 'loss/train': 2.0712430477142334} -11/06/2021 22:40:54 - INFO - __main__ - Step 10331: {'lr': 0.0004961019761067594, 'samples': 1983552, 'steps': 10330, 'loss/train': 2.5029542446136475} -11/06/2021 22:40:54 - INFO - __main__ - Step 10332: {'lr': 0.0004961010425909458, 'samples': 1983744, 'steps': 10331, 'loss/train': 2.1280171871185303} -11/06/2021 22:40:55 - INFO - __main__ - Step 10333: {'lr': 0.0004961001089642428, 'samples': 1983936, 'steps': 10332, 'loss/train': 1.8614065647125244} -11/06/2021 22:40:56 - INFO - __main__ - Step 10334: {'lr': 0.000496099175226651, 'samples': 1984128, 'steps': 10333, 'loss/train': 2.124863862991333} -11/06/2021 22:40:56 - INFO - __main__ - Step 10335: {'lr': 0.0004960982413781705, 'samples': 1984320, 'steps': 10334, 'loss/train': 1.0853912830352783} -11/06/2021 22:40:56 - INFO - __main__ - Step 10336: {'lr': 0.0004960973074188021, 'samples': 1984512, 'steps': 10335, 'loss/train': 1.535399317741394} -11/06/2021 22:40:57 - INFO - __main__ - Step 10337: {'lr': 0.000496096373348546, 'samples': 1984704, 'steps': 10336, 'loss/train': 1.792807936668396} -11/06/2021 22:40:58 - INFO - __main__ - Step 10338: {'lr': 0.0004960954391674026, 'samples': 1984896, 'steps': 10337, 'loss/train': 1.693973183631897} -11/06/2021 22:40:58 - INFO - __main__ - Step 10339: {'lr': 0.0004960945048753725, 'samples': 1985088, 'steps': 10338, 'loss/train': 2.293344020843506} -11/06/2021 22:40:58 - INFO - __main__ - Step 10340: {'lr': 0.000496093570472456, 'samples': 1985280, 'steps': 10339, 'loss/train': 1.3442373275756836} -11/06/2021 22:40:59 - INFO - __main__ - Step 10341: {'lr': 0.0004960926359586535, 'samples': 1985472, 'steps': 10340, 'loss/train': 1.554911732673645} -11/06/2021 22:40:59 - INFO - __main__ - Step 10342: {'lr': 0.0004960917013339656, 'samples': 1985664, 'steps': 10341, 'loss/train': 2.2928225994110107} -11/06/2021 22:41:00 - INFO - __main__ - Step 10343: {'lr': 0.0004960907665983923, 'samples': 1985856, 'steps': 10342, 'loss/train': 1.8382941484451294} -11/06/2021 22:41:00 - INFO - __main__ - Step 10344: {'lr': 0.0004960898317519345, 'samples': 1986048, 'steps': 10343, 'loss/train': 1.9304149150848389} -11/06/2021 22:41:01 - INFO - __main__ - Step 10345: {'lr': 0.0004960888967945924, 'samples': 1986240, 'steps': 10344, 'loss/train': 1.7264574766159058} -11/06/2021 22:41:01 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.2233792543411255} -11/06/2021 22:41:02 - INFO - __main__ - Step 10347: {'lr': 0.000496087026547257, 'samples': 1986624, 'steps': 10346, 'loss/train': 1.9374359846115112} -11/06/2021 22:41:02 - INFO - __main__ - Step 10348: {'lr': 0.0004960860912572645, 'samples': 1986816, 'steps': 10347, 'loss/train': 1.7407712936401367} -11/06/2021 22:41:03 - INFO - __main__ - Step 10349: {'lr': 0.0004960851558563895, 'samples': 1987008, 'steps': 10348, 'loss/train': 1.7582014799118042} -11/06/2021 22:41:04 - INFO - __main__ - Step 10350: {'lr': 0.0004960842203446322, 'samples': 1987200, 'steps': 10349, 'loss/train': 0.7253603935241699} -11/06/2021 22:41:04 - INFO - __main__ - Step 10351: {'lr': 0.0004960832847219933, 'samples': 1987392, 'steps': 10350, 'loss/train': 1.7652232646942139} -11/06/2021 22:41:04 - INFO - __main__ - Step 10352: {'lr': 0.000496082348988473, 'samples': 1987584, 'steps': 10351, 'loss/train': 1.9226405620574951} -11/06/2021 22:41:05 - INFO - __main__ - Step 10353: {'lr': 0.0004960814131440717, 'samples': 1987776, 'steps': 10352, 'loss/train': 2.1182456016540527} -11/06/2021 22:41:06 - INFO - __main__ - Step 10354: {'lr': 0.0004960804771887901, 'samples': 1987968, 'steps': 10353, 'loss/train': 1.939481496810913} -11/06/2021 22:41:06 - INFO - __main__ - Step 10355: {'lr': 0.0004960795411226283, 'samples': 1988160, 'steps': 10354, 'loss/train': 2.0060768127441406} -11/06/2021 22:41:06 - INFO - __main__ - Step 10356: {'lr': 0.0004960786049455868, 'samples': 1988352, 'steps': 10355, 'loss/train': 1.5645967721939087} -11/06/2021 22:41:07 - INFO - __main__ - Step 10357: {'lr': 0.0004960776686576663, 'samples': 1988544, 'steps': 10356, 'loss/train': 1.7053444385528564} -11/06/2021 22:41:07 - INFO - __main__ - Step 10358: {'lr': 0.0004960767322588668, 'samples': 1988736, 'steps': 10357, 'loss/train': 1.8968679904937744} -11/06/2021 22:41:08 - INFO - __main__ - Step 10359: {'lr': 0.000496075795749189, 'samples': 1988928, 'steps': 10358, 'loss/train': 1.6383986473083496} -11/06/2021 22:41:08 - INFO - __main__ - Step 10360: {'lr': 0.0004960748591286332, 'samples': 1989120, 'steps': 10359, 'loss/train': 2.3410348892211914} -11/06/2021 22:41:09 - INFO - __main__ - Step 10361: {'lr': 0.0004960739223971999, 'samples': 1989312, 'steps': 10360, 'loss/train': 2.367793560028076} -11/06/2021 22:41:09 - INFO - __main__ - Step 10362: {'lr': 0.0004960729855548895, 'samples': 1989504, 'steps': 10361, 'loss/train': 1.650147795677185} -11/06/2021 22:41:10 - INFO - __main__ - Step 10363: {'lr': 0.0004960720486017025, 'samples': 1989696, 'steps': 10362, 'loss/train': 0.8240565657615662} -11/06/2021 22:41:11 - INFO - __main__ - Step 10364: {'lr': 0.0004960711115376391, 'samples': 1989888, 'steps': 10363, 'loss/train': 2.253253698348999} -11/06/2021 22:41:11 - INFO - __main__ - Step 10365: {'lr': 0.0004960701743626999, 'samples': 1990080, 'steps': 10364, 'loss/train': 1.3892946243286133} -11/06/2021 22:41:11 - INFO - __main__ - Step 10366: {'lr': 0.0004960692370768853, 'samples': 1990272, 'steps': 10365, 'loss/train': 1.6433247327804565} -11/06/2021 22:41:12 - INFO - __main__ - Step 10367: {'lr': 0.0004960682996801956, 'samples': 1990464, 'steps': 10366, 'loss/train': 1.6244982481002808} -11/06/2021 22:41:12 - INFO - __main__ - Step 10368: {'lr': 0.0004960673621726314, 'samples': 1990656, 'steps': 10367, 'loss/train': 1.839497685432434} -11/06/2021 22:41:13 - INFO - __main__ - Step 10369: {'lr': 0.000496066424554193, 'samples': 1990848, 'steps': 10368, 'loss/train': 1.401164174079895} -11/06/2021 22:41:14 - INFO - __main__ - Step 10370: {'lr': 0.0004960654868248809, 'samples': 1991040, 'steps': 10369, 'loss/train': 2.057040214538574} -11/06/2021 22:41:14 - INFO - __main__ - Step 10371: {'lr': 0.0004960645489846955, 'samples': 1991232, 'steps': 10370, 'loss/train': 2.0657546520233154} -11/06/2021 22:41:14 - INFO - __main__ - Step 10372: {'lr': 0.0004960636110336371, 'samples': 1991424, 'steps': 10371, 'loss/train': 1.8819034099578857} -11/06/2021 22:41:15 - INFO - __main__ - Step 10373: {'lr': 0.0004960626729717064, 'samples': 1991616, 'steps': 10372, 'loss/train': 1.3991193771362305} -11/06/2021 22:41:15 - INFO - __main__ - Step 10374: {'lr': 0.0004960617347989036, 'samples': 1991808, 'steps': 10373, 'loss/train': 1.9511737823486328} -11/06/2021 22:41:17 - INFO - __main__ - Step 10375: {'lr': 0.0004960607965152292, 'samples': 1992000, 'steps': 10374, 'loss/train': 1.4117087125778198} -11/06/2021 22:41:17 - INFO - __main__ - Step 10376: {'lr': 0.0004960598581206835, 'samples': 1992192, 'steps': 10375, 'loss/train': 1.0104448795318604} -11/06/2021 22:41:18 - INFO - __main__ - Step 10377: {'lr': 0.000496058919615267, 'samples': 1992384, 'steps': 10376, 'loss/train': 1.3164684772491455} -11/06/2021 22:41:18 - INFO - __main__ - Step 10378: {'lr': 0.0004960579809989803, 'samples': 1992576, 'steps': 10377, 'loss/train': 1.1793992519378662} -11/06/2021 22:41:19 - INFO - __main__ - Step 10379: {'lr': 0.0004960570422718237, 'samples': 1992768, 'steps': 10378, 'loss/train': 0.8159379959106445} -11/06/2021 22:41:19 - INFO - __main__ - Step 10380: {'lr': 0.0004960561034337975, 'samples': 1992960, 'steps': 10379, 'loss/train': 2.050475835800171} -11/06/2021 22:41:19 - INFO - __main__ - Step 10381: {'lr': 0.0004960551644849022, 'samples': 1993152, 'steps': 10380, 'loss/train': 1.5734912157058716} -11/06/2021 22:41:20 - INFO - __main__ - Step 10382: {'lr': 0.0004960542254251382, 'samples': 1993344, 'steps': 10381, 'loss/train': 1.4547319412231445} -11/06/2021 22:41:21 - INFO - __main__ - Step 10383: {'lr': 0.0004960532862545061, 'samples': 1993536, 'steps': 10382, 'loss/train': 1.9347224235534668} -11/06/2021 22:41:21 - INFO - __main__ - Step 10384: {'lr': 0.0004960523469730061, 'samples': 1993728, 'steps': 10383, 'loss/train': 1.8350725173950195} -11/06/2021 22:41:21 - INFO - __main__ - Step 10385: {'lr': 0.0004960514075806387, 'samples': 1993920, 'steps': 10384, 'loss/train': 2.118435859680176} -11/06/2021 22:41:22 - INFO - __main__ - Step 10386: {'lr': 0.0004960504680774043, 'samples': 1994112, 'steps': 10385, 'loss/train': 1.8689095973968506} -11/06/2021 22:41:23 - INFO - __main__ - Step 10387: {'lr': 0.0004960495284633034, 'samples': 1994304, 'steps': 10386, 'loss/train': 0.7011041045188904} -11/06/2021 22:41:23 - INFO - __main__ - Step 10388: {'lr': 0.0004960485887383363, 'samples': 1994496, 'steps': 10387, 'loss/train': 1.9033364057540894} -11/06/2021 22:41:23 - INFO - __main__ - Step 10389: {'lr': 0.0004960476489025037, 'samples': 1994688, 'steps': 10388, 'loss/train': 1.7955809831619263} -11/06/2021 22:41:24 - INFO - __main__ - Step 10390: {'lr': 0.0004960467089558057, 'samples': 1994880, 'steps': 10389, 'loss/train': 1.9313750267028809} -11/06/2021 22:41:24 - INFO - __main__ - Step 10391: {'lr': 0.0004960457688982428, 'samples': 1995072, 'steps': 10390, 'loss/train': 1.3544516563415527} -11/06/2021 22:41:25 - INFO - __main__ - Step 10392: {'lr': 0.0004960448287298156, 'samples': 1995264, 'steps': 10391, 'loss/train': 1.409073829650879} -11/06/2021 22:41:26 - INFO - __main__ - Step 10393: {'lr': 0.0004960438884505242, 'samples': 1995456, 'steps': 10392, 'loss/train': 1.8170816898345947} -11/06/2021 22:41:26 - INFO - __main__ - Step 10394: {'lr': 0.0004960429480603694, 'samples': 1995648, 'steps': 10393, 'loss/train': 1.6994777917861938} -11/06/2021 22:41:26 - INFO - __main__ - Step 10395: {'lr': 0.0004960420075593515, 'samples': 1995840, 'steps': 10394, 'loss/train': 1.7487272024154663} -11/06/2021 22:41:27 - INFO - __main__ - Step 10396: {'lr': 0.0004960410669474708, 'samples': 1996032, 'steps': 10395, 'loss/train': 1.8390122652053833} -11/06/2021 22:41:28 - INFO - __main__ - Step 10397: {'lr': 0.0004960401262247277, 'samples': 1996224, 'steps': 10396, 'loss/train': 1.0365424156188965} -11/06/2021 22:41:28 - INFO - __main__ - Step 10398: {'lr': 0.0004960391853911228, 'samples': 1996416, 'steps': 10397, 'loss/train': 1.6385880708694458} -11/06/2021 22:41:29 - INFO - __main__ - Step 10399: {'lr': 0.0004960382444466564, 'samples': 1996608, 'steps': 10398, 'loss/train': 1.1302746534347534} -11/06/2021 22:41:29 - INFO - __main__ - Step 10400: {'lr': 0.0004960373033913289, 'samples': 1996800, 'steps': 10399, 'loss/train': 1.6192007064819336} -11/06/2021 22:41:29 - INFO - __main__ - Step 10401: {'lr': 0.0004960363622251409, 'samples': 1996992, 'steps': 10400, 'loss/train': 1.7356743812561035} -11/06/2021 22:41:30 - INFO - __main__ - Step 10402: {'lr': 0.0004960354209480927, 'samples': 1997184, 'steps': 10401, 'loss/train': 1.772154688835144} -11/06/2021 22:41:31 - INFO - __main__ - Step 10403: {'lr': 0.0004960344795601847, 'samples': 1997376, 'steps': 10402, 'loss/train': 2.327993869781494} -11/06/2021 22:41:31 - INFO - __main__ - Step 10404: {'lr': 0.0004960335380614174, 'samples': 1997568, 'steps': 10403, 'loss/train': 1.9825865030288696} -11/06/2021 22:41:31 - INFO - __main__ - Step 10405: {'lr': 0.0004960325964517912, 'samples': 1997760, 'steps': 10404, 'loss/train': 1.8894060850143433} -11/06/2021 22:41:32 - INFO - __main__ - Step 10406: {'lr': 0.0004960316547313064, 'samples': 1997952, 'steps': 10405, 'loss/train': 1.8726656436920166} -11/06/2021 22:41:33 - INFO - __main__ - Step 10407: {'lr': 0.0004960307128999636, 'samples': 1998144, 'steps': 10406, 'loss/train': 1.447789192199707} -11/06/2021 22:41:33 - INFO - __main__ - Step 10408: {'lr': 0.0004960297709577632, 'samples': 1998336, 'steps': 10407, 'loss/train': 2.224510431289673} -11/06/2021 22:41:34 - INFO - __main__ - Step 10409: {'lr': 0.0004960288289047054, 'samples': 1998528, 'steps': 10408, 'loss/train': 1.373806118965149} -11/06/2021 22:41:34 - INFO - __main__ - Step 10410: {'lr': 0.000496027886740791, 'samples': 1998720, 'steps': 10409, 'loss/train': 1.4621202945709229} -11/06/2021 22:41:34 - INFO - __main__ - Step 10411: {'lr': 0.0004960269444660201, 'samples': 1998912, 'steps': 10410, 'loss/train': 1.9223895072937012} -11/06/2021 22:41:35 - INFO - __main__ - Step 10412: {'lr': 0.0004960260020803934, 'samples': 1999104, 'steps': 10411, 'loss/train': 1.9031519889831543} -11/06/2021 22:41:36 - INFO - __main__ - Step 10413: {'lr': 0.0004960250595839111, 'samples': 1999296, 'steps': 10412, 'loss/train': 1.6633156538009644} -11/06/2021 22:41:36 - INFO - __main__ - Step 10414: {'lr': 0.0004960241169765737, 'samples': 1999488, 'steps': 10413, 'loss/train': 1.947817087173462} -11/06/2021 22:41:36 - INFO - __main__ - Step 10415: {'lr': 0.0004960231742583817, 'samples': 1999680, 'steps': 10414, 'loss/train': 1.6474344730377197} -11/06/2021 22:41:37 - INFO - __main__ - Step 10416: {'lr': 0.0004960222314293354, 'samples': 1999872, 'steps': 10415, 'loss/train': 1.6221576929092407} -11/06/2021 22:41:37 - INFO - __main__ - Step 10417: {'lr': 0.0004960212884894353, 'samples': 2000064, 'steps': 10416, 'loss/train': 1.5149108171463013} -11/06/2021 22:41:38 - INFO - __main__ - Step 10418: {'lr': 0.0004960203454386817, 'samples': 2000256, 'steps': 10417, 'loss/train': 0.9100244641304016} -11/06/2021 22:41:38 - INFO - __main__ - Step 10419: {'lr': 0.0004960194022770753, 'samples': 2000448, 'steps': 10418, 'loss/train': 1.549153447151184} -11/06/2021 22:41:39 - INFO - __main__ - Step 10420: {'lr': 0.0004960184590046162, 'samples': 2000640, 'steps': 10419, 'loss/train': 1.8034104108810425} -11/06/2021 22:41:39 - INFO - __main__ - Step 10421: {'lr': 0.0004960175156213051, 'samples': 2000832, 'steps': 10420, 'loss/train': 0.9687737226486206} -11/06/2021 22:41:39 - INFO - __main__ - Step 10422: {'lr': 0.0004960165721271422, 'samples': 2001024, 'steps': 10421, 'loss/train': 1.8846495151519775} -11/06/2021 22:41:41 - INFO - __main__ - Step 10423: {'lr': 0.000496015628522128, 'samples': 2001216, 'steps': 10422, 'loss/train': 1.9125192165374756} -11/06/2021 22:41:41 - INFO - __main__ - Step 10424: {'lr': 0.000496014684806263, 'samples': 2001408, 'steps': 10423, 'loss/train': 1.8119043111801147} -11/06/2021 22:41:41 - INFO - __main__ - Step 10425: {'lr': 0.0004960137409795477, 'samples': 2001600, 'steps': 10424, 'loss/train': 2.1726603507995605} -11/06/2021 22:41:42 - INFO - __main__ - Step 10426: {'lr': 0.0004960127970419822, 'samples': 2001792, 'steps': 10425, 'loss/train': 1.9231642484664917} -11/06/2021 22:41:42 - INFO - __main__ - Step 10427: {'lr': 0.0004960118529935674, 'samples': 2001984, 'steps': 10426, 'loss/train': 2.1175436973571777} -11/06/2021 22:41:43 - INFO - __main__ - Step 10428: {'lr': 0.0004960109088343032, 'samples': 2002176, 'steps': 10427, 'loss/train': 2.0986135005950928} -11/06/2021 22:41:43 - INFO - __main__ - Step 10429: {'lr': 0.0004960099645641903, 'samples': 2002368, 'steps': 10428, 'loss/train': 1.7129641771316528} -11/06/2021 22:41:44 - INFO - __main__ - Step 10430: {'lr': 0.0004960090201832293, 'samples': 2002560, 'steps': 10429, 'loss/train': 1.1784454584121704} -11/06/2021 22:41:44 - INFO - __main__ - Step 10431: {'lr': 0.0004960080756914203, 'samples': 2002752, 'steps': 10430, 'loss/train': 1.253516674041748} -11/06/2021 22:41:44 - INFO - __main__ - Step 10432: {'lr': 0.0004960071310887638, 'samples': 2002944, 'steps': 10431, 'loss/train': 1.8971530199050903} -11/06/2021 22:41:45 - INFO - __main__ - Step 10433: {'lr': 0.0004960061863752604, 'samples': 2003136, 'steps': 10432, 'loss/train': 2.065613031387329} -11/06/2021 22:41:46 - INFO - __main__ - Step 10434: {'lr': 0.0004960052415509103, 'samples': 2003328, 'steps': 10433, 'loss/train': 1.7110601663589478} -11/06/2021 22:41:46 - INFO - __main__ - Step 10435: {'lr': 0.0004960042966157141, 'samples': 2003520, 'steps': 10434, 'loss/train': 1.3858282566070557} -11/06/2021 22:41:47 - INFO - __main__ - Step 10436: {'lr': 0.0004960033515696722, 'samples': 2003712, 'steps': 10435, 'loss/train': 1.303482174873352} -11/06/2021 22:41:47 - INFO - __main__ - Step 10437: {'lr': 0.0004960024064127849, 'samples': 2003904, 'steps': 10436, 'loss/train': 1.2062408924102783} -11/06/2021 22:41:47 - INFO - __main__ - Step 10438: {'lr': 0.0004960014611450527, 'samples': 2004096, 'steps': 10437, 'loss/train': 1.7718604803085327} -11/06/2021 22:41:48 - INFO - __main__ - Step 10439: {'lr': 0.0004960005157664762, 'samples': 2004288, 'steps': 10438, 'loss/train': 1.6597301959991455} -11/06/2021 22:41:49 - INFO - __main__ - Step 10440: {'lr': 0.0004959995702770555, 'samples': 2004480, 'steps': 10439, 'loss/train': 1.9467318058013916} -11/06/2021 22:41:49 - INFO - __main__ - Step 10441: {'lr': 0.0004959986246767913, 'samples': 2004672, 'steps': 10440, 'loss/train': 2.24183988571167} -11/06/2021 22:41:49 - INFO - __main__ - Step 10442: {'lr': 0.0004959976789656838, 'samples': 2004864, 'steps': 10441, 'loss/train': 1.8617457151412964} -11/06/2021 22:41:50 - INFO - __main__ - Step 10443: {'lr': 0.0004959967331437336, 'samples': 2005056, 'steps': 10442, 'loss/train': 2.394559621810913} -11/06/2021 22:41:51 - INFO - __main__ - Step 10444: {'lr': 0.0004959957872109411, 'samples': 2005248, 'steps': 10443, 'loss/train': 2.127652168273926} -11/06/2021 22:41:51 - INFO - __main__ - Step 10445: {'lr': 0.0004959948411673066, 'samples': 2005440, 'steps': 10444, 'loss/train': 1.733871579170227} -11/06/2021 22:41:51 - INFO - __main__ - Step 10446: {'lr': 0.0004959938950128308, 'samples': 2005632, 'steps': 10445, 'loss/train': 1.8825232982635498} -11/06/2021 22:41:52 - INFO - __main__ - Step 10447: {'lr': 0.0004959929487475138, 'samples': 2005824, 'steps': 10446, 'loss/train': 1.3970377445220947} -11/06/2021 22:41:52 - INFO - __main__ - Step 10448: {'lr': 0.0004959920023713563, 'samples': 2006016, 'steps': 10447, 'loss/train': 1.3850414752960205} -11/06/2021 22:41:52 - INFO - __main__ - Step 10449: {'lr': 0.0004959910558843584, 'samples': 2006208, 'steps': 10448, 'loss/train': 1.893357753753662} -11/06/2021 22:41:54 - INFO - __main__ - Step 10450: {'lr': 0.0004959901092865208, 'samples': 2006400, 'steps': 10449, 'loss/train': 1.3027065992355347} -11/06/2021 22:41:54 - INFO - __main__ - Step 10451: {'lr': 0.0004959891625778438, 'samples': 2006592, 'steps': 10450, 'loss/train': 2.1753814220428467} -11/06/2021 22:41:54 - INFO - __main__ - Step 10452: {'lr': 0.0004959882157583281, 'samples': 2006784, 'steps': 10451, 'loss/train': 1.65367591381073} -11/06/2021 22:41:55 - INFO - __main__ - Step 10453: {'lr': 0.0004959872688279737, 'samples': 2006976, 'steps': 10452, 'loss/train': 1.8160592317581177} -11/06/2021 22:41:55 - INFO - __main__ - Step 10454: {'lr': 0.0004959863217867814, 'samples': 2007168, 'steps': 10453, 'loss/train': 1.6027116775512695} -11/06/2021 22:41:56 - INFO - __main__ - Step 10455: {'lr': 0.0004959853746347513, 'samples': 2007360, 'steps': 10454, 'loss/train': 1.9197403192520142} -11/06/2021 22:41:57 - INFO - __main__ - Step 10456: {'lr': 0.0004959844273718841, 'samples': 2007552, 'steps': 10455, 'loss/train': 1.6267117261886597} -11/06/2021 22:41:57 - INFO - __main__ - Step 10457: {'lr': 0.00049598347999818, 'samples': 2007744, 'steps': 10456, 'loss/train': 1.6874116659164429} -11/06/2021 22:41:58 - INFO - __main__ - Step 10458: {'lr': 0.0004959825325136396, 'samples': 2007936, 'steps': 10457, 'loss/train': 1.9572356939315796} -11/06/2021 22:41:58 - INFO - __main__ - Step 10459: {'lr': 0.0004959815849182633, 'samples': 2008128, 'steps': 10458, 'loss/train': 1.2736876010894775} -11/06/2021 22:41:58 - INFO - __main__ - Step 10460: {'lr': 0.0004959806372120515, 'samples': 2008320, 'steps': 10459, 'loss/train': 1.9439113140106201} -11/06/2021 22:41:59 - INFO - __main__ - Step 10461: {'lr': 0.0004959796893950045, 'samples': 2008512, 'steps': 10460, 'loss/train': 2.2238245010375977} -11/06/2021 22:42:00 - INFO - __main__ - Step 10462: {'lr': 0.0004959787414671229, 'samples': 2008704, 'steps': 10461, 'loss/train': 1.8460416793823242} -11/06/2021 22:42:00 - INFO - __main__ - Step 10463: {'lr': 0.000495977793428407, 'samples': 2008896, 'steps': 10462, 'loss/train': 1.9288679361343384} -11/06/2021 22:42:00 - INFO - __main__ - Step 10464: {'lr': 0.0004959768452788575, 'samples': 2009088, 'steps': 10463, 'loss/train': 1.7732502222061157} -11/06/2021 22:42:01 - INFO - __main__ - Step 10465: {'lr': 0.0004959758970184745, 'samples': 2009280, 'steps': 10464, 'loss/train': 2.398732900619507} -11/06/2021 22:42:02 - INFO - __main__ - Step 10466: {'lr': 0.0004959749486472587, 'samples': 2009472, 'steps': 10465, 'loss/train': 1.7253568172454834} -11/06/2021 22:42:02 - INFO - __main__ - Step 10467: {'lr': 0.0004959740001652102, 'samples': 2009664, 'steps': 10466, 'loss/train': 1.70595121383667} -11/06/2021 22:42:02 - INFO - __main__ - Step 10468: {'lr': 0.0004959730515723298, 'samples': 2009856, 'steps': 10467, 'loss/train': 1.9712741374969482} -11/06/2021 22:42:03 - INFO - __main__ - Step 10469: {'lr': 0.0004959721028686175, 'samples': 2010048, 'steps': 10468, 'loss/train': 1.4620518684387207} -11/06/2021 22:42:03 - INFO - __main__ - Step 10470: {'lr': 0.0004959711540540741, 'samples': 2010240, 'steps': 10469, 'loss/train': 1.9116092920303345} -11/06/2021 22:42:04 - INFO - __main__ - Step 10471: {'lr': 0.0004959702051286999, 'samples': 2010432, 'steps': 10470, 'loss/train': 2.0080511569976807} -11/06/2021 22:42:04 - INFO - __main__ - Step 10472: {'lr': 0.0004959692560924954, 'samples': 2010624, 'steps': 10471, 'loss/train': 1.8201708793640137} -11/06/2021 22:42:05 - INFO - __main__ - Step 10473: {'lr': 0.0004959683069454608, 'samples': 2010816, 'steps': 10472, 'loss/train': 1.4937697649002075} -11/06/2021 22:42:05 - INFO - __main__ - Step 10474: {'lr': 0.0004959673576875967, 'samples': 2011008, 'steps': 10473, 'loss/train': 1.4996908903121948} -11/06/2021 22:42:06 - INFO - __main__ - Step 10475: {'lr': 0.0004959664083189035, 'samples': 2011200, 'steps': 10474, 'loss/train': 1.8766359090805054} -11/06/2021 22:42:07 - INFO - __main__ - Step 10476: {'lr': 0.0004959654588393818, 'samples': 2011392, 'steps': 10475, 'loss/train': 2.539846181869507} -11/06/2021 22:42:07 - INFO - __main__ - Step 10477: {'lr': 0.0004959645092490316, 'samples': 2011584, 'steps': 10476, 'loss/train': 2.0664992332458496} -11/06/2021 22:42:07 - INFO - __main__ - Step 10478: {'lr': 0.0004959635595478537, 'samples': 2011776, 'steps': 10477, 'loss/train': 2.1357581615448} -11/06/2021 22:42:08 - INFO - __main__ - Step 10479: {'lr': 0.0004959626097358485, 'samples': 2011968, 'steps': 10478, 'loss/train': 1.7041106224060059} -11/06/2021 22:42:08 - INFO - __main__ - Step 10480: {'lr': 0.0004959616598130162, 'samples': 2012160, 'steps': 10479, 'loss/train': 1.5367162227630615} -11/06/2021 22:42:09 - INFO - __main__ - Step 10481: {'lr': 0.0004959607097793575, 'samples': 2012352, 'steps': 10480, 'loss/train': 0.8361077904701233} -11/06/2021 22:42:09 - INFO - __main__ - Step 10482: {'lr': 0.0004959597596348726, 'samples': 2012544, 'steps': 10481, 'loss/train': 1.425622582435608} -11/06/2021 22:42:10 - INFO - __main__ - Step 10483: {'lr': 0.0004959588093795621, 'samples': 2012736, 'steps': 10482, 'loss/train': 1.8034032583236694} -11/06/2021 22:42:10 - INFO - __main__ - Step 10484: {'lr': 0.0004959578590134262, 'samples': 2012928, 'steps': 10483, 'loss/train': 1.7551143169403076} -11/06/2021 22:42:10 - INFO - __main__ - Step 10485: {'lr': 0.0004959569085364657, 'samples': 2013120, 'steps': 10484, 'loss/train': 1.8540403842926025} -11/06/2021 22:42:11 - INFO - __main__ - Step 10486: {'lr': 0.0004959559579486807, 'samples': 2013312, 'steps': 10485, 'loss/train': 1.9935126304626465} -11/06/2021 22:42:12 - INFO - __main__ - Step 10487: {'lr': 0.0004959550072500718, 'samples': 2013504, 'steps': 10486, 'loss/train': 1.6862492561340332} -11/06/2021 22:42:12 - INFO - __main__ - Step 10488: {'lr': 0.0004959540564406393, 'samples': 2013696, 'steps': 10487, 'loss/train': 1.781096339225769} -11/06/2021 22:42:12 - INFO - __main__ - Step 10489: {'lr': 0.0004959531055203837, 'samples': 2013888, 'steps': 10488, 'loss/train': 1.8593416213989258} -11/06/2021 22:42:13 - INFO - __main__ - Step 10490: {'lr': 0.0004959521544893055, 'samples': 2014080, 'steps': 10489, 'loss/train': 1.739823579788208} -11/06/2021 22:42:13 - INFO - __main__ - Step 10491: {'lr': 0.000495951203347405, 'samples': 2014272, 'steps': 10490, 'loss/train': 1.9146326780319214} -11/06/2021 22:42:14 - INFO - __main__ - Step 10492: {'lr': 0.0004959502520946827, 'samples': 2014464, 'steps': 10491, 'loss/train': 2.1610023975372314} -11/06/2021 22:42:14 - INFO - __main__ - Step 10493: {'lr': 0.000495949300731139, 'samples': 2014656, 'steps': 10492, 'loss/train': 1.6168802976608276} -11/06/2021 22:42:15 - INFO - __main__ - Step 10494: {'lr': 0.0004959483492567744, 'samples': 2014848, 'steps': 10493, 'loss/train': 1.6835715770721436} -11/06/2021 22:42:15 - INFO - __main__ - Step 10495: {'lr': 0.0004959473976715892, 'samples': 2015040, 'steps': 10494, 'loss/train': 1.6348047256469727} -11/06/2021 22:42:15 - INFO - __main__ - Step 10496: {'lr': 0.0004959464459755839, 'samples': 2015232, 'steps': 10495, 'loss/train': 1.2869349718093872} -11/06/2021 22:42:17 - INFO - __main__ - Step 10497: {'lr': 0.0004959454941687589, 'samples': 2015424, 'steps': 10496, 'loss/train': 1.733815312385559} -11/06/2021 22:42:17 - INFO - __main__ - Step 10498: {'lr': 0.0004959445422511148, 'samples': 2015616, 'steps': 10497, 'loss/train': 1.9846241474151611} -11/06/2021 22:42:17 - INFO - __main__ - Step 10499: {'lr': 0.0004959435902226517, 'samples': 2015808, 'steps': 10498, 'loss/train': 0.9969847202301025} -11/06/2021 22:42:18 - INFO - __main__ - Step 10500: {'lr': 0.0004959426380833703, 'samples': 2016000, 'steps': 10499, 'loss/train': 1.6832598447799683} -11/06/2021 22:42:18 - INFO - __main__ - Step 10501: {'lr': 0.0004959416858332709, 'samples': 2016192, 'steps': 10500, 'loss/train': 1.6795216798782349} -11/06/2021 22:42:19 - INFO - __main__ - Step 10502: {'lr': 0.000495940733472354, 'samples': 2016384, 'steps': 10501, 'loss/train': 2.3554139137268066} -11/06/2021 22:42:19 - INFO - __main__ - Step 10503: {'lr': 0.00049593978100062, 'samples': 2016576, 'steps': 10502, 'loss/train': 1.8953803777694702} -11/06/2021 22:42:20 - INFO - __main__ - Step 10504: {'lr': 0.0004959388284180694, 'samples': 2016768, 'steps': 10503, 'loss/train': 2.1253671646118164} -11/06/2021 22:42:20 - INFO - __main__ - Step 10505: {'lr': 0.0004959378757247024, 'samples': 2016960, 'steps': 10504, 'loss/train': 1.8000476360321045} -11/06/2021 22:42:20 - INFO - __main__ - Step 10506: {'lr': 0.0004959369229205197, 'samples': 2017152, 'steps': 10505, 'loss/train': 0.36025920510292053} -11/06/2021 22:42:21 - INFO - __main__ - Step 10507: {'lr': 0.0004959359700055216, 'samples': 2017344, 'steps': 10506, 'loss/train': 1.7624599933624268} -11/06/2021 22:42:22 - INFO - __main__ - Step 10508: {'lr': 0.0004959350169797085, 'samples': 2017536, 'steps': 10507, 'loss/train': 1.786071538925171} -11/06/2021 22:42:22 - INFO - __main__ - Step 10509: {'lr': 0.000495934063843081, 'samples': 2017728, 'steps': 10508, 'loss/train': 2.0693178176879883} -11/06/2021 22:42:23 - INFO - __main__ - Step 10510: {'lr': 0.0004959331105956393, 'samples': 2017920, 'steps': 10509, 'loss/train': 1.65921950340271} -11/06/2021 22:42:23 - INFO - __main__ - Step 10511: {'lr': 0.000495932157237384, 'samples': 2018112, 'steps': 10510, 'loss/train': 1.9849227666854858} -11/06/2021 22:42:23 - INFO - __main__ - Step 10512: {'lr': 0.0004959312037683154, 'samples': 2018304, 'steps': 10511, 'loss/train': 1.6077988147735596} -11/06/2021 22:42:24 - INFO - __main__ - Step 10513: {'lr': 0.0004959302501884341, 'samples': 2018496, 'steps': 10512, 'loss/train': 1.6553412675857544} -11/06/2021 22:42:25 - INFO - __main__ - Step 10514: {'lr': 0.0004959292964977403, 'samples': 2018688, 'steps': 10513, 'loss/train': 1.3393796682357788} -11/06/2021 22:42:25 - INFO - __main__ - Step 10515: {'lr': 0.0004959283426962345, 'samples': 2018880, 'steps': 10514, 'loss/train': 1.1275650262832642} -11/06/2021 22:42:25 - INFO - __main__ - Step 10516: {'lr': 0.0004959273887839175, 'samples': 2019072, 'steps': 10515, 'loss/train': 1.4780120849609375} -11/06/2021 22:42:26 - INFO - __main__ - Step 10517: {'lr': 0.000495926434760789, 'samples': 2019264, 'steps': 10516, 'loss/train': 1.8599119186401367} -11/06/2021 22:42:27 - INFO - __main__ - Step 10518: {'lr': 0.0004959254806268501, 'samples': 2019456, 'steps': 10517, 'loss/train': 1.910403847694397} -11/06/2021 22:42:27 - INFO - __main__ - Step 10519: {'lr': 0.0004959245263821009, 'samples': 2019648, 'steps': 10518, 'loss/train': 1.8654783964157104} -11/06/2021 22:42:27 - INFO - __main__ - Step 10520: {'lr': 0.0004959235720265419, 'samples': 2019840, 'steps': 10519, 'loss/train': 1.3041726350784302} -11/06/2021 22:42:28 - INFO - __main__ - Step 10521: {'lr': 0.0004959226175601736, 'samples': 2020032, 'steps': 10520, 'loss/train': 1.7402362823486328} -11/06/2021 22:42:28 - INFO - __main__ - Step 10522: {'lr': 0.0004959216629829964, 'samples': 2020224, 'steps': 10521, 'loss/train': 1.8779191970825195} -11/06/2021 22:42:29 - INFO - __main__ - Step 10523: {'lr': 0.0004959207082950105, 'samples': 2020416, 'steps': 10522, 'loss/train': 1.9938749074935913} -11/06/2021 22:42:29 - INFO - __main__ - Step 10524: {'lr': 0.0004959197534962166, 'samples': 2020608, 'steps': 10523, 'loss/train': 1.7240444421768188} -11/06/2021 22:42:30 - INFO - __main__ - Step 10525: {'lr': 0.0004959187985866152, 'samples': 2020800, 'steps': 10524, 'loss/train': 1.3333297967910767} -11/06/2021 22:42:30 - INFO - __main__ - Step 10526: {'lr': 0.0004959178435662064, 'samples': 2020992, 'steps': 10525, 'loss/train': 3.172778606414795} -11/06/2021 22:42:30 - INFO - __main__ - Step 10527: {'lr': 0.0004959168884349909, 'samples': 2021184, 'steps': 10526, 'loss/train': 2.005765438079834} -11/06/2021 22:42:32 - INFO - __main__ - Step 10528: {'lr': 0.0004959159331929691, 'samples': 2021376, 'steps': 10527, 'loss/train': 1.9616241455078125} -11/06/2021 22:42:32 - INFO - __main__ - Step 10529: {'lr': 0.0004959149778401412, 'samples': 2021568, 'steps': 10528, 'loss/train': 0.44385576248168945} -11/06/2021 22:42:32 - INFO - __main__ - Step 10530: {'lr': 0.000495914022376508, 'samples': 2021760, 'steps': 10529, 'loss/train': 1.7894715070724487} -11/06/2021 22:42:33 - INFO - __main__ - Step 10531: {'lr': 0.0004959130668020696, 'samples': 2021952, 'steps': 10530, 'loss/train': 1.43883216381073} -11/06/2021 22:42:33 - INFO - __main__ - Step 10532: {'lr': 0.0004959121111168266, 'samples': 2022144, 'steps': 10531, 'loss/train': 1.801062822341919} -11/06/2021 22:42:34 - INFO - __main__ - Step 10533: {'lr': 0.0004959111553207794, 'samples': 2022336, 'steps': 10532, 'loss/train': 1.905466914176941} -11/06/2021 22:42:34 - INFO - __main__ - Step 10534: {'lr': 0.0004959101994139284, 'samples': 2022528, 'steps': 10533, 'loss/train': 1.9462462663650513} -11/06/2021 22:42:35 - INFO - __main__ - Step 10535: {'lr': 0.0004959092433962742, 'samples': 2022720, 'steps': 10534, 'loss/train': 1.9173693656921387} -11/06/2021 22:42:35 - INFO - __main__ - Step 10536: {'lr': 0.0004959082872678169, 'samples': 2022912, 'steps': 10535, 'loss/train': 0.9070050716400146} -11/06/2021 22:42:35 - INFO - __main__ - Step 10537: {'lr': 0.0004959073310285572, 'samples': 2023104, 'steps': 10536, 'loss/train': 1.65950345993042} -11/06/2021 22:42:37 - INFO - __main__ - Step 10538: {'lr': 0.0004959063746784955, 'samples': 2023296, 'steps': 10537, 'loss/train': 1.9055320024490356} -11/06/2021 22:42:37 - INFO - __main__ - Step 10539: {'lr': 0.0004959054182176321, 'samples': 2023488, 'steps': 10538, 'loss/train': 1.639905333518982} -11/06/2021 22:42:38 - INFO - __main__ - Step 10540: {'lr': 0.0004959044616459676, 'samples': 2023680, 'steps': 10539, 'loss/train': 1.4272217750549316} -11/06/2021 22:42:38 - INFO - __main__ - Step 10541: {'lr': 0.0004959035049635023, 'samples': 2023872, 'steps': 10540, 'loss/train': 0.9154389500617981} -11/06/2021 22:42:38 - INFO - __main__ - Step 10542: {'lr': 0.0004959025481702366, 'samples': 2024064, 'steps': 10541, 'loss/train': 1.519034504890442} -11/06/2021 22:42:39 - INFO - __main__ - Step 10543: {'lr': 0.0004959015912661712, 'samples': 2024256, 'steps': 10542, 'loss/train': 1.571833848953247} -11/06/2021 22:42:40 - INFO - __main__ - Step 10544: {'lr': 0.0004959006342513062, 'samples': 2024448, 'steps': 10543, 'loss/train': 0.902131974697113} -11/06/2021 22:42:40 - INFO - __main__ - Step 10545: {'lr': 0.0004958996771256422, 'samples': 2024640, 'steps': 10544, 'loss/train': 1.765254259109497} -11/06/2021 22:42:40 - INFO - __main__ - Step 10546: {'lr': 0.0004958987198891796, 'samples': 2024832, 'steps': 10545, 'loss/train': 1.8613026142120361} -11/06/2021 22:42:41 - INFO - __main__ - Step 10547: {'lr': 0.0004958977625419187, 'samples': 2025024, 'steps': 10546, 'loss/train': 1.9227455854415894} -11/06/2021 22:42:41 - INFO - __main__ - Step 10548: {'lr': 0.0004958968050838603, 'samples': 2025216, 'steps': 10547, 'loss/train': 1.920836091041565} -11/06/2021 22:42:42 - INFO - __main__ - Step 10549: {'lr': 0.0004958958475150044, 'samples': 2025408, 'steps': 10548, 'loss/train': 1.9864680767059326} -11/06/2021 22:42:43 - INFO - __main__ - Step 10550: {'lr': 0.0004958948898353516, 'samples': 2025600, 'steps': 10549, 'loss/train': 1.8649414777755737} -11/06/2021 22:42:43 - INFO - __main__ - Step 10551: {'lr': 0.0004958939320449026, 'samples': 2025792, 'steps': 10550, 'loss/train': 2.0411078929901123} -11/06/2021 22:42:43 - INFO - __main__ - Step 10552: {'lr': 0.0004958929741436574, 'samples': 2025984, 'steps': 10551, 'loss/train': 1.3231031894683838} -11/06/2021 22:42:44 - INFO - __main__ - Step 10553: {'lr': 0.0004958920161316167, 'samples': 2026176, 'steps': 10552, 'loss/train': 1.855413556098938} -11/06/2021 22:42:45 - INFO - __main__ - Step 10554: {'lr': 0.0004958910580087808, 'samples': 2026368, 'steps': 10553, 'loss/train': 2.308320999145508} -11/06/2021 22:42:45 - INFO - __main__ - Step 10555: {'lr': 0.0004958900997751502, 'samples': 2026560, 'steps': 10554, 'loss/train': 1.9437730312347412} -11/06/2021 22:42:45 - INFO - __main__ - Step 10556: {'lr': 0.0004958891414307253, 'samples': 2026752, 'steps': 10555, 'loss/train': 2.246142864227295} -11/06/2021 22:42:46 - INFO - __main__ - Step 10557: {'lr': 0.0004958881829755066, 'samples': 2026944, 'steps': 10556, 'loss/train': 2.26411771774292} -11/06/2021 22:42:46 - INFO - __main__ - Step 10558: {'lr': 0.0004958872244094944, 'samples': 2027136, 'steps': 10557, 'loss/train': 1.6010162830352783} -11/06/2021 22:42:46 - INFO - __main__ - Step 10559: {'lr': 0.0004958862657326893, 'samples': 2027328, 'steps': 10558, 'loss/train': 1.5600662231445312} -11/06/2021 22:42:48 - INFO - __main__ - Step 10560: {'lr': 0.0004958853069450916, 'samples': 2027520, 'steps': 10559, 'loss/train': 1.8983862400054932} -11/06/2021 22:42:48 - INFO - __main__ - Step 10561: {'lr': 0.0004958843480467017, 'samples': 2027712, 'steps': 10560, 'loss/train': 0.7014676332473755} -11/06/2021 22:42:48 - INFO - __main__ - Step 10562: {'lr': 0.0004958833890375202, 'samples': 2027904, 'steps': 10561, 'loss/train': 1.9279460906982422} -11/06/2021 22:42:49 - INFO - __main__ - Step 10563: {'lr': 0.0004958824299175474, 'samples': 2028096, 'steps': 10562, 'loss/train': 1.799846887588501} -11/06/2021 22:42:49 - INFO - __main__ - Step 10564: {'lr': 0.0004958814706867838, 'samples': 2028288, 'steps': 10563, 'loss/train': 1.8568742275238037} -11/06/2021 22:42:50 - INFO - __main__ - Step 10565: {'lr': 0.0004958805113452298, 'samples': 2028480, 'steps': 10564, 'loss/train': 1.6105812788009644} -11/06/2021 22:42:50 - INFO - __main__ - Step 10566: {'lr': 0.0004958795518928858, 'samples': 2028672, 'steps': 10565, 'loss/train': 1.1961236000061035} -11/06/2021 22:42:51 - INFO - __main__ - Step 10567: {'lr': 0.0004958785923297522, 'samples': 2028864, 'steps': 10566, 'loss/train': 1.8169901371002197} -11/06/2021 22:42:51 - INFO - __main__ - Step 10568: {'lr': 0.0004958776326558298, 'samples': 2029056, 'steps': 10567, 'loss/train': 1.83092200756073} -11/06/2021 22:42:51 - INFO - __main__ - Step 10569: {'lr': 0.0004958766728711184, 'samples': 2029248, 'steps': 10568, 'loss/train': 1.380372166633606} -11/06/2021 22:42:52 - INFO - __main__ - Step 10570: {'lr': 0.000495875712975619, 'samples': 2029440, 'steps': 10569, 'loss/train': 1.897265076637268} -11/06/2021 22:42:53 - INFO - __main__ - Step 10571: {'lr': 0.0004958747529693316, 'samples': 2029632, 'steps': 10570, 'loss/train': 1.3889024257659912} -11/06/2021 22:42:53 - INFO - __main__ - Step 10572: {'lr': 0.000495873792852257, 'samples': 2029824, 'steps': 10571, 'loss/train': 1.0971200466156006} -11/06/2021 22:42:53 - INFO - __main__ - Step 10573: {'lr': 0.0004958728326243954, 'samples': 2030016, 'steps': 10572, 'loss/train': 1.5941991806030273} -11/06/2021 22:42:54 - INFO - __main__ - Step 10574: {'lr': 0.0004958718722857473, 'samples': 2030208, 'steps': 10573, 'loss/train': 1.6007957458496094} -11/06/2021 22:42:55 - INFO - __main__ - Step 10575: {'lr': 0.0004958709118363131, 'samples': 2030400, 'steps': 10574, 'loss/train': 1.9947025775909424} -11/06/2021 22:42:55 - INFO - __main__ - Step 10576: {'lr': 0.0004958699512760933, 'samples': 2030592, 'steps': 10575, 'loss/train': 1.9763280153274536} -11/06/2021 22:42:55 - INFO - __main__ - Step 10577: {'lr': 0.0004958689906050882, 'samples': 2030784, 'steps': 10576, 'loss/train': 1.577843189239502} -11/06/2021 22:42:56 - INFO - __main__ - Step 10578: {'lr': 0.0004958680298232983, 'samples': 2030976, 'steps': 10577, 'loss/train': 1.4245156049728394} -11/06/2021 22:42:56 - INFO - __main__ - Step 10579: {'lr': 0.0004958670689307242, 'samples': 2031168, 'steps': 10578, 'loss/train': 2.1011838912963867} -11/06/2021 22:42:57 - INFO - __main__ - Step 10580: {'lr': 0.0004958661079273662, 'samples': 2031360, 'steps': 10579, 'loss/train': 1.68887197971344} -11/06/2021 22:42:58 - INFO - __main__ - Step 10581: {'lr': 0.0004958651468132246, 'samples': 2031552, 'steps': 10580, 'loss/train': 1.6149951219558716} -11/06/2021 22:42:58 - INFO - __main__ - Step 10582: {'lr': 0.0004958641855883001, 'samples': 2031744, 'steps': 10581, 'loss/train': 1.577684760093689} -11/06/2021 22:42:58 - INFO - __main__ - Step 10583: {'lr': 0.0004958632242525929, 'samples': 2031936, 'steps': 10582, 'loss/train': 1.9628639221191406} -11/06/2021 22:42:59 - INFO - __main__ - Step 10584: {'lr': 0.0004958622628061035, 'samples': 2032128, 'steps': 10583, 'loss/train': 1.6041213274002075} -11/06/2021 22:42:59 - INFO - __main__ - Step 10585: {'lr': 0.0004958613012488324, 'samples': 2032320, 'steps': 10584, 'loss/train': 0.9554458856582642} -11/06/2021 22:43:00 - INFO - __main__ - Step 10586: {'lr': 0.00049586033958078, 'samples': 2032512, 'steps': 10585, 'loss/train': 2.0318799018859863} -11/06/2021 22:43:00 - INFO - __main__ - Step 10587: {'lr': 0.0004958593778019468, 'samples': 2032704, 'steps': 10586, 'loss/train': 1.9779229164123535} -11/06/2021 22:43:01 - INFO - __main__ - Step 10588: {'lr': 0.0004958584159123331, 'samples': 2032896, 'steps': 10587, 'loss/train': 2.021127939224243} -11/06/2021 22:43:01 - INFO - __main__ - Step 10589: {'lr': 0.0004958574539119392, 'samples': 2033088, 'steps': 10588, 'loss/train': 1.864471435546875} -11/06/2021 22:43:01 - INFO - __main__ - Step 10590: {'lr': 0.0004958564918007659, 'samples': 2033280, 'steps': 10589, 'loss/train': 0.6293484568595886} -11/06/2021 22:43:03 - INFO - __main__ - Step 10591: {'lr': 0.0004958555295788135, 'samples': 2033472, 'steps': 10590, 'loss/train': 1.892540454864502} -11/06/2021 22:43:03 - INFO - __main__ - Step 10592: {'lr': 0.0004958545672460824, 'samples': 2033664, 'steps': 10591, 'loss/train': 2.0386414527893066} -11/06/2021 22:43:03 - INFO - __main__ - Step 10593: {'lr': 0.0004958536048025729, 'samples': 2033856, 'steps': 10592, 'loss/train': 2.018533706665039} -11/06/2021 22:43:04 - INFO - __main__ - Step 10594: {'lr': 0.0004958526422482857, 'samples': 2034048, 'steps': 10593, 'loss/train': 1.8704800605773926} -11/06/2021 22:43:04 - INFO - __main__ - Step 10595: {'lr': 0.000495851679583221, 'samples': 2034240, 'steps': 10594, 'loss/train': 1.2096422910690308} -11/06/2021 22:43:05 - INFO - __main__ - Step 10596: {'lr': 0.0004958507168073793, 'samples': 2034432, 'steps': 10595, 'loss/train': 1.69189453125} -11/06/2021 22:43:05 - INFO - __main__ - Step 10597: {'lr': 0.0004958497539207611, 'samples': 2034624, 'steps': 10596, 'loss/train': 1.6835681200027466} -11/06/2021 22:43:06 - INFO - __main__ - Step 10598: {'lr': 0.0004958487909233669, 'samples': 2034816, 'steps': 10597, 'loss/train': 1.550663948059082} -11/06/2021 22:43:06 - INFO - __main__ - Step 10599: {'lr': 0.0004958478278151969, 'samples': 2035008, 'steps': 10598, 'loss/train': 1.3910499811172485} -11/06/2021 22:43:06 - INFO - __main__ - Step 10600: {'lr': 0.0004958468645962517, 'samples': 2035200, 'steps': 10599, 'loss/train': 0.5436376333236694} -11/06/2021 22:43:08 - INFO - __main__ - Step 10601: {'lr': 0.0004958459012665317, 'samples': 2035392, 'steps': 10600, 'loss/train': 1.8061374425888062} -11/06/2021 22:43:08 - INFO - __main__ - Step 10602: {'lr': 0.0004958449378260374, 'samples': 2035584, 'steps': 10601, 'loss/train': 1.4709066152572632} -11/06/2021 22:43:08 - INFO - __main__ - Step 10603: {'lr': 0.000495843974274769, 'samples': 2035776, 'steps': 10602, 'loss/train': 1.4589587450027466} -11/06/2021 22:43:09 - INFO - __main__ - Step 10604: {'lr': 0.0004958430106127272, 'samples': 2035968, 'steps': 10603, 'loss/train': 2.1720454692840576} -11/06/2021 22:43:09 - INFO - __main__ - Step 10605: {'lr': 0.0004958420468399123, 'samples': 2036160, 'steps': 10604, 'loss/train': 1.612654209136963} -11/06/2021 22:43:10 - INFO - __main__ - Step 10606: {'lr': 0.0004958410829563248, 'samples': 2036352, 'steps': 10605, 'loss/train': 1.6653211116790771} -11/06/2021 22:43:10 - INFO - __main__ - Step 10607: {'lr': 0.0004958401189619652, 'samples': 2036544, 'steps': 10606, 'loss/train': 1.9401401281356812} -11/06/2021 22:43:11 - INFO - __main__ - Step 10608: {'lr': 0.0004958391548568336, 'samples': 2036736, 'steps': 10607, 'loss/train': 2.150745391845703} -11/06/2021 22:43:11 - INFO - __main__ - Step 10609: {'lr': 0.0004958381906409308, 'samples': 2036928, 'steps': 10608, 'loss/train': 1.7484651803970337} -11/06/2021 22:43:11 - INFO - __main__ - Step 10610: {'lr': 0.0004958372263142571, 'samples': 2037120, 'steps': 10609, 'loss/train': 1.8919156789779663} -11/06/2021 22:43:12 - INFO - __main__ - Step 10611: {'lr': 0.0004958362618768129, 'samples': 2037312, 'steps': 10610, 'loss/train': 1.3154926300048828} -11/06/2021 22:43:14 - INFO - __main__ - Step 10612: {'lr': 0.0004958352973285987, 'samples': 2037504, 'steps': 10611, 'loss/train': 1.8000268936157227} -11/06/2021 22:43:14 - INFO - __main__ - Step 10613: {'lr': 0.000495834332669615, 'samples': 2037696, 'steps': 10612, 'loss/train': 0.241807758808136} -11/06/2021 22:43:15 - INFO - __main__ - Step 10614: {'lr': 0.0004958333678998622, 'samples': 2037888, 'steps': 10613, 'loss/train': 1.521072268486023} -11/06/2021 22:43:15 - INFO - __main__ - Step 10615: {'lr': 0.0004958324030193404, 'samples': 2038080, 'steps': 10614, 'loss/train': 1.6696323156356812} -11/06/2021 22:43:15 - INFO - __main__ - Step 10616: {'lr': 0.0004958314380280504, 'samples': 2038272, 'steps': 10615, 'loss/train': 1.4865412712097168} -11/06/2021 22:43:16 - INFO - __main__ - Step 10617: {'lr': 0.0004958304729259927, 'samples': 2038464, 'steps': 10616, 'loss/train': 1.9140490293502808} -11/06/2021 22:43:16 - INFO - __main__ - Step 10618: {'lr': 0.0004958295077131674, 'samples': 2038656, 'steps': 10617, 'loss/train': 1.3753329515457153} -11/06/2021 22:43:17 - INFO - __main__ - Step 10619: {'lr': 0.0004958285423895752, 'samples': 2038848, 'steps': 10618, 'loss/train': 1.8530157804489136} -11/06/2021 22:43:18 - INFO - __main__ - Step 10620: {'lr': 0.0004958275769552165, 'samples': 2039040, 'steps': 10619, 'loss/train': 1.2794376611709595} -11/06/2021 22:43:18 - INFO - __main__ - Step 10621: {'lr': 0.0004958266114100917, 'samples': 2039232, 'steps': 10620, 'loss/train': 1.9506590366363525} -11/06/2021 22:43:18 - INFO - __main__ - Step 10622: {'lr': 0.0004958256457542011, 'samples': 2039424, 'steps': 10621, 'loss/train': 1.7138190269470215} -11/06/2021 22:43:19 - INFO - __main__ - Step 10623: {'lr': 0.0004958246799875453, 'samples': 2039616, 'steps': 10622, 'loss/train': 1.564102292060852} -11/06/2021 22:43:19 - INFO - __main__ - Step 10624: {'lr': 0.0004958237141101247, 'samples': 2039808, 'steps': 10623, 'loss/train': 0.428017258644104} -11/06/2021 22:43:19 - INFO - __main__ - Step 10625: {'lr': 0.0004958227481219399, 'samples': 2040000, 'steps': 10624, 'loss/train': 1.5035067796707153} -11/06/2021 22:43:21 - INFO - __main__ - Step 10626: {'lr': 0.0004958217820229909, 'samples': 2040192, 'steps': 10625, 'loss/train': 1.7794239521026611} -11/06/2021 22:43:21 - INFO - __main__ - Step 10627: {'lr': 0.0004958208158132785, 'samples': 2040384, 'steps': 10626, 'loss/train': 1.4251916408538818} -11/06/2021 22:43:21 - INFO - __main__ - Step 10628: {'lr': 0.000495819849492803, 'samples': 2040576, 'steps': 10627, 'loss/train': 1.7260355949401855} -11/06/2021 22:43:22 - INFO - __main__ - Step 10629: {'lr': 0.0004958188830615649, 'samples': 2040768, 'steps': 10628, 'loss/train': 2.004051446914673} -11/06/2021 22:43:22 - INFO - __main__ - Step 10630: {'lr': 0.0004958179165195646, 'samples': 2040960, 'steps': 10629, 'loss/train': 1.7460932731628418} -11/06/2021 22:43:23 - INFO - __main__ - Step 10631: {'lr': 0.0004958169498668026, 'samples': 2041152, 'steps': 10630, 'loss/train': 1.8938854932785034} -11/06/2021 22:43:23 - INFO - __main__ - Step 10632: {'lr': 0.0004958159831032793, 'samples': 2041344, 'steps': 10631, 'loss/train': 1.446541428565979} -11/06/2021 22:43:24 - INFO - __main__ - Step 10633: {'lr': 0.000495815016228995, 'samples': 2041536, 'steps': 10632, 'loss/train': 1.7085440158843994} -11/06/2021 22:43:24 - INFO - __main__ - Step 10634: {'lr': 0.0004958140492439502, 'samples': 2041728, 'steps': 10633, 'loss/train': 1.8917224407196045} -11/06/2021 22:43:24 - INFO - __main__ - Step 10635: {'lr': 0.0004958130821481455, 'samples': 2041920, 'steps': 10634, 'loss/train': 1.9071261882781982} -11/06/2021 22:43:25 - INFO - __main__ - Step 10636: {'lr': 0.0004958121149415812, 'samples': 2042112, 'steps': 10635, 'loss/train': 1.352231502532959} -11/06/2021 22:43:26 - INFO - __main__ - Step 10637: {'lr': 0.0004958111476242577, 'samples': 2042304, 'steps': 10636, 'loss/train': 1.8399983644485474} -11/06/2021 22:43:26 - INFO - __main__ - Step 10638: {'lr': 0.0004958101801961755, 'samples': 2042496, 'steps': 10637, 'loss/train': 2.4199862480163574} -11/06/2021 22:43:26 - INFO - __main__ - Step 10639: {'lr': 0.0004958092126573352, 'samples': 2042688, 'steps': 10638, 'loss/train': 1.832000970840454} -11/06/2021 22:43:27 - INFO - __main__ - Step 10640: {'lr': 0.0004958082450077369, 'samples': 2042880, 'steps': 10639, 'loss/train': 2.0270063877105713} -11/06/2021 22:43:28 - INFO - __main__ - Step 10641: {'lr': 0.0004958072772473812, 'samples': 2043072, 'steps': 10640, 'loss/train': 1.655840277671814} -11/06/2021 22:43:28 - INFO - __main__ - Step 10642: {'lr': 0.0004958063093762684, 'samples': 2043264, 'steps': 10641, 'loss/train': 2.09566330909729} -11/06/2021 22:43:29 - INFO - __main__ - Step 10643: {'lr': 0.0004958053413943993, 'samples': 2043456, 'steps': 10642, 'loss/train': 1.8067339658737183} -11/06/2021 22:43:29 - INFO - __main__ - Step 10644: {'lr': 0.0004958043733017741, 'samples': 2043648, 'steps': 10643, 'loss/train': 1.5341635942459106} -11/06/2021 22:43:29 - INFO - __main__ - Step 10645: {'lr': 0.0004958034050983932, 'samples': 2043840, 'steps': 10644, 'loss/train': 1.7686036825180054} -11/06/2021 22:43:30 - INFO - __main__ - Step 10646: {'lr': 0.0004958024367842569, 'samples': 2044032, 'steps': 10645, 'loss/train': 1.8402926921844482} -11/06/2021 22:43:31 - INFO - __main__ - Step 10647: {'lr': 0.000495801468359366, 'samples': 2044224, 'steps': 10646, 'loss/train': 1.6536637544631958} -11/06/2021 22:43:31 - INFO - __main__ - Step 10648: {'lr': 0.0004958004998237207, 'samples': 2044416, 'steps': 10647, 'loss/train': 2.0047109127044678} -11/06/2021 22:43:31 - INFO - __main__ - Step 10649: {'lr': 0.0004957995311773215, 'samples': 2044608, 'steps': 10648, 'loss/train': 1.8218034505844116} -11/06/2021 22:43:32 - INFO - __main__ - Step 10650: {'lr': 0.0004957985624201688, 'samples': 2044800, 'steps': 10649, 'loss/train': 1.3269506692886353} -11/06/2021 22:43:32 - INFO - __main__ - Step 10651: {'lr': 0.0004957975935522632, 'samples': 2044992, 'steps': 10650, 'loss/train': 1.8232018947601318} -11/06/2021 22:43:33 - INFO - __main__ - Step 10652: {'lr': 0.0004957966245736048, 'samples': 2045184, 'steps': 10651, 'loss/train': 1.26266348361969} -11/06/2021 22:43:34 - INFO - __main__ - Step 10653: {'lr': 0.0004957956554841943, 'samples': 2045376, 'steps': 10652, 'loss/train': 1.7997419834136963} -11/06/2021 22:43:34 - INFO - __main__ - Step 10654: {'lr': 0.0004957946862840321, 'samples': 2045568, 'steps': 10653, 'loss/train': 1.7390581369400024} -11/06/2021 22:43:34 - INFO - __main__ - Step 10655: {'lr': 0.0004957937169731186, 'samples': 2045760, 'steps': 10654, 'loss/train': 1.672598958015442} -11/06/2021 22:43:35 - INFO - __main__ - Step 10656: {'lr': 0.0004957927475514542, 'samples': 2045952, 'steps': 10655, 'loss/train': 1.358737826347351} -11/06/2021 22:43:36 - INFO - __main__ - Step 10657: {'lr': 0.0004957917780190395, 'samples': 2046144, 'steps': 10656, 'loss/train': 1.9060399532318115} -11/06/2021 22:43:36 - INFO - __main__ - Step 10658: {'lr': 0.0004957908083758747, 'samples': 2046336, 'steps': 10657, 'loss/train': 1.6999403238296509} -11/06/2021 22:43:36 - INFO - __main__ - Step 10659: {'lr': 0.0004957898386219603, 'samples': 2046528, 'steps': 10658, 'loss/train': 1.6076505184173584} -11/06/2021 22:43:37 - INFO - __main__ - Step 10660: {'lr': 0.000495788868757297, 'samples': 2046720, 'steps': 10659, 'loss/train': 1.7159380912780762} -11/06/2021 22:43:37 - INFO - __main__ - Step 10661: {'lr': 0.0004957878987818849, 'samples': 2046912, 'steps': 10660, 'loss/train': 1.4848712682724} -11/06/2021 22:43:39 - INFO - __main__ - Step 10662: {'lr': 0.0004957869286957246, 'samples': 2047104, 'steps': 10661, 'loss/train': 1.9166350364685059} -11/06/2021 22:43:39 - INFO - __main__ - Step 10663: {'lr': 0.0004957859584988164, 'samples': 2047296, 'steps': 10662, 'loss/train': 1.3673206567764282} -11/06/2021 22:43:39 - INFO - __main__ - Step 10664: {'lr': 0.0004957849881911609, 'samples': 2047488, 'steps': 10663, 'loss/train': 1.7530118227005005} -11/06/2021 22:43:40 - INFO - __main__ - Step 10665: {'lr': 0.0004957840177727585, 'samples': 2047680, 'steps': 10664, 'loss/train': 1.5396183729171753} -11/06/2021 22:43:40 - INFO - __main__ - Step 10666: {'lr': 0.0004957830472436097, 'samples': 2047872, 'steps': 10665, 'loss/train': 2.27144718170166} -11/06/2021 22:43:40 - INFO - __main__ - Step 10667: {'lr': 0.0004957820766037147, 'samples': 2048064, 'steps': 10666, 'loss/train': 2.53610897064209} -11/06/2021 22:43:41 - INFO - __main__ - Step 10668: {'lr': 0.0004957811058530742, 'samples': 2048256, 'steps': 10667, 'loss/train': 2.2089219093322754} -11/06/2021 22:43:42 - INFO - __main__ - Step 10669: {'lr': 0.0004957801349916884, 'samples': 2048448, 'steps': 10668, 'loss/train': 2.4702768325805664} -11/06/2021 22:43:42 - INFO - __main__ - Step 10670: {'lr': 0.000495779164019558, 'samples': 2048640, 'steps': 10669, 'loss/train': 0.2976198196411133} -11/06/2021 22:43:42 - INFO - __main__ - Step 10671: {'lr': 0.0004957781929366832, 'samples': 2048832, 'steps': 10670, 'loss/train': 2.503723382949829} -11/06/2021 22:43:43 - INFO - __main__ - Step 10672: {'lr': 0.0004957772217430646, 'samples': 2049024, 'steps': 10671, 'loss/train': 1.338193416595459} -11/06/2021 22:43:44 - INFO - __main__ - Step 10673: {'lr': 0.0004957762504387025, 'samples': 2049216, 'steps': 10672, 'loss/train': 1.5494346618652344} -11/06/2021 22:43:45 - INFO - __main__ - Step 10674: {'lr': 0.0004957752790235976, 'samples': 2049408, 'steps': 10673, 'loss/train': 2.082453489303589} -11/06/2021 22:43:45 - INFO - __main__ - Step 10675: {'lr': 0.00049577430749775, 'samples': 2049600, 'steps': 10674, 'loss/train': 1.9406588077545166} -11/06/2021 22:43:45 - INFO - __main__ - Step 10676: {'lr': 0.0004957733358611602, 'samples': 2049792, 'steps': 10675, 'loss/train': 1.727967381477356} -11/06/2021 22:43:46 - INFO - __main__ - Step 10677: {'lr': 0.0004957723641138289, 'samples': 2049984, 'steps': 10676, 'loss/train': 1.9043892621994019} -11/06/2021 22:43:47 - INFO - __main__ - Step 10678: {'lr': 0.0004957713922557563, 'samples': 2050176, 'steps': 10677, 'loss/train': 1.6342339515686035} -11/06/2021 22:43:47 - INFO - __main__ - Step 10679: {'lr': 0.0004957704202869429, 'samples': 2050368, 'steps': 10678, 'loss/train': 2.188232898712158} -11/06/2021 22:43:47 - INFO - __main__ - Step 10680: {'lr': 0.0004957694482073891, 'samples': 2050560, 'steps': 10679, 'loss/train': 2.068922758102417} -11/06/2021 22:43:48 - INFO - __main__ - Step 10681: {'lr': 0.0004957684760170955, 'samples': 2050752, 'steps': 10680, 'loss/train': 1.8861031532287598} -11/06/2021 22:43:48 - INFO - __main__ - Step 10682: {'lr': 0.0004957675037160624, 'samples': 2050944, 'steps': 10681, 'loss/train': 1.979127049446106} -11/06/2021 22:43:49 - INFO - __main__ - Step 10683: {'lr': 0.0004957665313042902, 'samples': 2051136, 'steps': 10682, 'loss/train': 1.728943109512329} -11/06/2021 22:43:49 - INFO - __main__ - Step 10684: {'lr': 0.0004957655587817793, 'samples': 2051328, 'steps': 10683, 'loss/train': 1.295758605003357} -11/06/2021 22:43:50 - INFO - __main__ - Step 10685: {'lr': 0.0004957645861485304, 'samples': 2051520, 'steps': 10684, 'loss/train': 1.4567430019378662} -11/06/2021 22:43:50 - INFO - __main__ - Step 10686: {'lr': 0.0004957636134045437, 'samples': 2051712, 'steps': 10685, 'loss/train': 1.5401474237442017} -11/06/2021 22:43:50 - INFO - __main__ - Step 10687: {'lr': 0.0004957626405498196, 'samples': 2051904, 'steps': 10686, 'loss/train': 2.0036814212799072} -11/06/2021 22:43:51 - INFO - __main__ - Step 10688: {'lr': 0.0004957616675843588, 'samples': 2052096, 'steps': 10687, 'loss/train': 1.8221772909164429} -11/06/2021 22:43:52 - INFO - __main__ - Step 10689: {'lr': 0.0004957606945081615, 'samples': 2052288, 'steps': 10688, 'loss/train': 1.658942461013794} -11/06/2021 22:43:52 - INFO - __main__ - Step 10690: {'lr': 0.0004957597213212284, 'samples': 2052480, 'steps': 10689, 'loss/train': 1.7910033464431763} -11/06/2021 22:43:52 - INFO - __main__ - Step 10691: {'lr': 0.0004957587480235595, 'samples': 2052672, 'steps': 10690, 'loss/train': 1.7230714559555054} -11/06/2021 22:43:53 - INFO - __main__ - Step 10692: {'lr': 0.0004957577746151556, 'samples': 2052864, 'steps': 10691, 'loss/train': 1.9783008098602295} -11/06/2021 22:43:54 - INFO - __main__ - Step 10693: {'lr': 0.0004957568010960171, 'samples': 2053056, 'steps': 10692, 'loss/train': 1.6153764724731445} -11/06/2021 22:43:54 - INFO - __main__ - Step 10694: {'lr': 0.0004957558274661444, 'samples': 2053248, 'steps': 10693, 'loss/train': 1.5456531047821045} -11/06/2021 22:43:55 - INFO - __main__ - Step 10695: {'lr': 0.0004957548537255378, 'samples': 2053440, 'steps': 10694, 'loss/train': 2.194444417953491} -11/06/2021 22:43:55 - INFO - __main__ - Step 10696: {'lr': 0.000495753879874198, 'samples': 2053632, 'steps': 10695, 'loss/train': 1.8297362327575684} -11/06/2021 22:43:55 - INFO - __main__ - Step 10697: {'lr': 0.0004957529059121251, 'samples': 2053824, 'steps': 10696, 'loss/train': 2.081062078475952} -11/06/2021 22:43:56 - INFO - __main__ - Step 10698: {'lr': 0.0004957519318393199, 'samples': 2054016, 'steps': 10697, 'loss/train': 1.8401142358779907} -11/06/2021 22:43:57 - INFO - __main__ - Step 10699: {'lr': 0.0004957509576557826, 'samples': 2054208, 'steps': 10698, 'loss/train': 1.7377288341522217} -11/06/2021 22:43:57 - INFO - __main__ - Step 10700: {'lr': 0.0004957499833615137, 'samples': 2054400, 'steps': 10699, 'loss/train': 2.147418260574341} -11/06/2021 22:43:57 - INFO - __main__ - Step 10701: {'lr': 0.0004957490089565137, 'samples': 2054592, 'steps': 10700, 'loss/train': 1.7337613105773926} -11/06/2021 22:43:58 - INFO - __main__ - Step 10702: {'lr': 0.0004957480344407829, 'samples': 2054784, 'steps': 10701, 'loss/train': 1.7109180688858032} -11/06/2021 22:43:58 - INFO - __main__ - Step 10703: {'lr': 0.0004957470598143218, 'samples': 2054976, 'steps': 10702, 'loss/train': 1.4152930974960327} -11/06/2021 22:43:59 - INFO - __main__ - Step 10704: {'lr': 0.000495746085077131, 'samples': 2055168, 'steps': 10703, 'loss/train': 1.6608555316925049} -11/06/2021 22:44:00 - INFO - __main__ - Step 10705: {'lr': 0.0004957451102292108, 'samples': 2055360, 'steps': 10704, 'loss/train': 1.8776973485946655} -11/06/2021 22:44:00 - INFO - __main__ - Step 10706: {'lr': 0.0004957441352705616, 'samples': 2055552, 'steps': 10705, 'loss/train': 1.9885625839233398} -11/06/2021 22:44:00 - INFO - __main__ - Step 10707: {'lr': 0.0004957431602011839, 'samples': 2055744, 'steps': 10706, 'loss/train': 1.5255722999572754} -11/06/2021 22:44:01 - INFO - __main__ - Step 10708: {'lr': 0.0004957421850210781, 'samples': 2055936, 'steps': 10707, 'loss/train': 1.827954649925232} -11/06/2021 22:44:02 - INFO - __main__ - Step 10709: {'lr': 0.0004957412097302446, 'samples': 2056128, 'steps': 10708, 'loss/train': 2.0723941326141357} -11/06/2021 22:44:02 - INFO - __main__ - Step 10710: {'lr': 0.000495740234328684, 'samples': 2056320, 'steps': 10709, 'loss/train': 2.509693145751953} -11/06/2021 22:44:02 - INFO - __main__ - Step 10711: {'lr': 0.0004957392588163967, 'samples': 2056512, 'steps': 10710, 'loss/train': 1.9670145511627197} -11/06/2021 22:44:03 - INFO - __main__ - Step 10712: {'lr': 0.000495738283193383, 'samples': 2056704, 'steps': 10711, 'loss/train': 1.6758942604064941} -11/06/2021 22:44:03 - INFO - __main__ - Step 10713: {'lr': 0.0004957373074596434, 'samples': 2056896, 'steps': 10712, 'loss/train': 1.8210440874099731} -11/06/2021 22:44:04 - INFO - __main__ - Step 10714: {'lr': 0.0004957363316151784, 'samples': 2057088, 'steps': 10713, 'loss/train': 1.4150325059890747} -11/06/2021 22:44:04 - INFO - __main__ - Step 10715: {'lr': 0.0004957353556599884, 'samples': 2057280, 'steps': 10714, 'loss/train': 1.9680533409118652} -11/06/2021 22:44:05 - INFO - __main__ - Step 10716: {'lr': 0.0004957343795940738, 'samples': 2057472, 'steps': 10715, 'loss/train': 2.222113847732544} -11/06/2021 22:44:05 - INFO - __main__ - Step 10717: {'lr': 0.0004957334034174351, 'samples': 2057664, 'steps': 10716, 'loss/train': 1.4754172563552856} -11/06/2021 22:44:06 - INFO - __main__ - Step 10718: {'lr': 0.0004957324271300728, 'samples': 2057856, 'steps': 10717, 'loss/train': 1.6506346464157104} -11/06/2021 22:44:07 - INFO - __main__ - Step 10719: {'lr': 0.0004957314507319871, 'samples': 2058048, 'steps': 10718, 'loss/train': 1.6497141122817993} -11/06/2021 22:44:07 - INFO - __main__ - Step 10720: {'lr': 0.0004957304742231787, 'samples': 2058240, 'steps': 10719, 'loss/train': 1.7145750522613525} -11/06/2021 22:44:07 - INFO - __main__ - Step 10721: {'lr': 0.0004957294976036479, 'samples': 2058432, 'steps': 10720, 'loss/train': 1.7986055612564087} -11/06/2021 22:44:08 - INFO - __main__ - Step 10722: {'lr': 0.0004957285208733953, 'samples': 2058624, 'steps': 10721, 'loss/train': 1.592078447341919} -11/06/2021 22:44:08 - INFO - __main__ - Step 10723: {'lr': 0.0004957275440324211, 'samples': 2058816, 'steps': 10722, 'loss/train': 1.7179454565048218} -11/06/2021 22:44:09 - INFO - __main__ - Step 10724: {'lr': 0.0004957265670807258, 'samples': 2059008, 'steps': 10723, 'loss/train': 1.8023722171783447} -11/06/2021 22:44:09 - INFO - __main__ - Step 10725: {'lr': 0.0004957255900183101, 'samples': 2059200, 'steps': 10724, 'loss/train': 2.032273292541504} -11/06/2021 22:44:10 - INFO - __main__ - Step 10726: {'lr': 0.000495724612845174, 'samples': 2059392, 'steps': 10725, 'loss/train': 1.7515367269515991} -11/06/2021 22:44:10 - INFO - __main__ - Step 10727: {'lr': 0.0004957236355613184, 'samples': 2059584, 'steps': 10726, 'loss/train': 1.7511495351791382} -11/06/2021 22:44:10 - INFO - __main__ - Step 10728: {'lr': 0.0004957226581667434, 'samples': 2059776, 'steps': 10727, 'loss/train': 2.232154369354248} -11/06/2021 22:44:11 - INFO - __main__ - Step 10729: {'lr': 0.0004957216806614496, 'samples': 2059968, 'steps': 10728, 'loss/train': 2.1359822750091553} -11/06/2021 22:44:12 - INFO - __main__ - Step 10730: {'lr': 0.0004957207030454374, 'samples': 2060160, 'steps': 10729, 'loss/train': 2.018582582473755} -11/06/2021 22:44:12 - INFO - __main__ - Step 10731: {'lr': 0.0004957197253187073, 'samples': 2060352, 'steps': 10730, 'loss/train': 1.6088690757751465} -11/06/2021 22:44:12 - INFO - __main__ - Step 10732: {'lr': 0.0004957187474812595, 'samples': 2060544, 'steps': 10731, 'loss/train': 1.1297942399978638} -11/06/2021 22:44:13 - INFO - __main__ - Step 10733: {'lr': 0.0004957177695330948, 'samples': 2060736, 'steps': 10732, 'loss/train': 1.5375380516052246} -11/06/2021 22:44:13 - INFO - __main__ - Step 10734: {'lr': 0.0004957167914742134, 'samples': 2060928, 'steps': 10733, 'loss/train': 1.797157883644104} -11/06/2021 22:44:14 - INFO - __main__ - Step 10735: {'lr': 0.0004957158133046158, 'samples': 2061120, 'steps': 10734, 'loss/train': 2.323326587677002} -11/06/2021 22:44:15 - INFO - __main__ - Step 10736: {'lr': 0.0004957148350243025, 'samples': 2061312, 'steps': 10735, 'loss/train': 2.2027082443237305} -11/06/2021 22:44:15 - INFO - __main__ - Step 10737: {'lr': 0.0004957138566332738, 'samples': 2061504, 'steps': 10736, 'loss/train': 1.9741092920303345} -11/06/2021 22:44:15 - INFO - __main__ - Step 10738: {'lr': 0.0004957128781315303, 'samples': 2061696, 'steps': 10737, 'loss/train': 1.5470525026321411} -11/06/2021 22:44:16 - INFO - __main__ - Step 10739: {'lr': 0.0004957118995190723, 'samples': 2061888, 'steps': 10738, 'loss/train': 1.9221845865249634} -11/06/2021 22:44:17 - INFO - __main__ - Step 10740: {'lr': 0.0004957109207959004, 'samples': 2062080, 'steps': 10739, 'loss/train': 1.5594979524612427} -11/06/2021 22:44:17 - INFO - __main__ - Step 10741: {'lr': 0.0004957099419620149, 'samples': 2062272, 'steps': 10740, 'loss/train': 1.0245342254638672} -11/06/2021 22:44:17 - INFO - __main__ - Step 10742: {'lr': 0.0004957089630174163, 'samples': 2062464, 'steps': 10741, 'loss/train': 1.913503885269165} -11/06/2021 22:44:18 - INFO - __main__ - Step 10743: {'lr': 0.0004957079839621051, 'samples': 2062656, 'steps': 10742, 'loss/train': 2.051661968231201} -11/06/2021 22:44:18 - INFO - __main__ - Step 10744: {'lr': 0.0004957070047960816, 'samples': 2062848, 'steps': 10743, 'loss/train': 2.0730690956115723} -11/06/2021 22:44:19 - INFO - __main__ - Step 10745: {'lr': 0.0004957060255193462, 'samples': 2063040, 'steps': 10744, 'loss/train': 2.2329344749450684} -11/06/2021 22:44:19 - INFO - __main__ - Step 10746: {'lr': 0.0004957050461318997, 'samples': 2063232, 'steps': 10745, 'loss/train': 1.7052743434906006} -11/06/2021 22:44:20 - INFO - __main__ - Step 10747: {'lr': 0.0004957040666337422, 'samples': 2063424, 'steps': 10746, 'loss/train': 1.7934210300445557} -11/06/2021 22:44:20 - INFO - __main__ - Step 10748: {'lr': 0.0004957030870248742, 'samples': 2063616, 'steps': 10747, 'loss/train': 1.2029649019241333} -11/06/2021 22:44:21 - INFO - __main__ - Step 10749: {'lr': 0.0004957021073052962, 'samples': 2063808, 'steps': 10748, 'loss/train': 1.534114122390747} -11/06/2021 22:44:21 - INFO - __main__ - Step 10750: {'lr': 0.0004957011274750086, 'samples': 2064000, 'steps': 10749, 'loss/train': 0.9407898783683777} -11/06/2021 22:44:22 - INFO - __main__ - Step 10751: {'lr': 0.0004957001475340119, 'samples': 2064192, 'steps': 10750, 'loss/train': 1.5393911600112915} -11/06/2021 22:44:22 - INFO - __main__ - Step 10752: {'lr': 0.0004956991674823065, 'samples': 2064384, 'steps': 10751, 'loss/train': 1.8228400945663452} -11/06/2021 22:44:23 - INFO - __main__ - Step 10753: {'lr': 0.0004956981873198928, 'samples': 2064576, 'steps': 10752, 'loss/train': 1.507121205329895} -11/06/2021 22:44:23 - INFO - __main__ - Step 10754: {'lr': 0.0004956972070467712, 'samples': 2064768, 'steps': 10753, 'loss/train': 1.64657461643219} -11/06/2021 22:44:23 - INFO - __main__ - Step 10755: {'lr': 0.0004956962266629424, 'samples': 2064960, 'steps': 10754, 'loss/train': 1.6212588548660278} -11/06/2021 22:44:24 - INFO - __main__ - Step 10756: {'lr': 0.0004956952461684066, 'samples': 2065152, 'steps': 10755, 'loss/train': 2.1202139854431152} -11/06/2021 22:44:25 - INFO - __main__ - Step 10757: {'lr': 0.0004956942655631644, 'samples': 2065344, 'steps': 10756, 'loss/train': 1.5507880449295044} -11/06/2021 22:44:25 - INFO - __main__ - Step 10758: {'lr': 0.0004956932848472161, 'samples': 2065536, 'steps': 10757, 'loss/train': 1.8729193210601807} -11/06/2021 22:44:25 - INFO - __main__ - Step 10759: {'lr': 0.0004956923040205622, 'samples': 2065728, 'steps': 10758, 'loss/train': 1.7279722690582275} -11/06/2021 22:44:26 - INFO - __main__ - Step 10760: {'lr': 0.0004956913230832031, 'samples': 2065920, 'steps': 10759, 'loss/train': 2.134770154953003} -11/06/2021 22:44:27 - INFO - __main__ - Step 10761: {'lr': 0.0004956903420351393, 'samples': 2066112, 'steps': 10760, 'loss/train': 1.6158196926116943} -11/06/2021 22:44:28 - INFO - __main__ - Step 10762: {'lr': 0.0004956893608763713, 'samples': 2066304, 'steps': 10761, 'loss/train': 1.8567177057266235} -11/06/2021 22:44:28 - INFO - __main__ - Step 10763: {'lr': 0.0004956883796068993, 'samples': 2066496, 'steps': 10762, 'loss/train': 1.9238213300704956} -11/06/2021 22:44:28 - INFO - __main__ - Step 10764: {'lr': 0.000495687398226724, 'samples': 2066688, 'steps': 10763, 'loss/train': 1.661841869354248} -11/06/2021 22:44:29 - INFO - __main__ - Step 10765: {'lr': 0.0004956864167358458, 'samples': 2066880, 'steps': 10764, 'loss/train': 1.6980998516082764} -11/06/2021 22:44:29 - INFO - __main__ - Step 10766: {'lr': 0.000495685435134265, 'samples': 2067072, 'steps': 10765, 'loss/train': 1.7710494995117188} -11/06/2021 22:44:30 - INFO - __main__ - Step 10767: {'lr': 0.0004956844534219822, 'samples': 2067264, 'steps': 10766, 'loss/train': 1.8926702737808228} -11/06/2021 22:44:31 - INFO - __main__ - Step 10768: {'lr': 0.0004956834715989977, 'samples': 2067456, 'steps': 10767, 'loss/train': 1.8057781457901} -11/06/2021 22:44:31 - INFO - __main__ - Step 10769: {'lr': 0.0004956824896653122, 'samples': 2067648, 'steps': 10768, 'loss/train': 1.9344799518585205} -11/06/2021 22:44:31 - INFO - __main__ - Step 10770: {'lr': 0.0004956815076209257, 'samples': 2067840, 'steps': 10769, 'loss/train': 1.7666970491409302} -11/06/2021 22:44:32 - INFO - __main__ - Step 10771: {'lr': 0.0004956805254658391, 'samples': 2068032, 'steps': 10770, 'loss/train': 1.9876887798309326} -11/06/2021 22:44:32 - INFO - __main__ - Step 10772: {'lr': 0.0004956795432000526, 'samples': 2068224, 'steps': 10771, 'loss/train': 1.9097800254821777} -11/06/2021 22:44:33 - INFO - __main__ - Step 10773: {'lr': 0.0004956785608235667, 'samples': 2068416, 'steps': 10772, 'loss/train': 1.9691766500473022} -11/06/2021 22:44:33 - INFO - __main__ - Step 10774: {'lr': 0.0004956775783363817, 'samples': 2068608, 'steps': 10773, 'loss/train': 1.7181099653244019} -11/06/2021 22:44:34 - INFO - __main__ - Step 10775: {'lr': 0.0004956765957384984, 'samples': 2068800, 'steps': 10774, 'loss/train': 1.4132951498031616} -11/06/2021 22:44:34 - INFO - __main__ - Step 10776: {'lr': 0.0004956756130299169, 'samples': 2068992, 'steps': 10775, 'loss/train': 1.20347261428833} -11/06/2021 22:44:34 - INFO - __main__ - Step 10777: {'lr': 0.0004956746302106378, 'samples': 2069184, 'steps': 10776, 'loss/train': 1.4337294101715088} -11/06/2021 22:44:35 - INFO - __main__ - Step 10778: {'lr': 0.0004956736472806614, 'samples': 2069376, 'steps': 10777, 'loss/train': 1.8119988441467285} -11/06/2021 22:44:36 - INFO - __main__ - Step 10779: {'lr': 0.0004956726642399883, 'samples': 2069568, 'steps': 10778, 'loss/train': 1.28266179561615} -11/06/2021 22:44:36 - INFO - __main__ - Step 10780: {'lr': 0.0004956716810886189, 'samples': 2069760, 'steps': 10779, 'loss/train': 1.9151232242584229} -11/06/2021 22:44:36 - INFO - __main__ - Step 10781: {'lr': 0.0004956706978265536, 'samples': 2069952, 'steps': 10780, 'loss/train': 1.7361626625061035} -11/06/2021 22:44:37 - INFO - __main__ - Step 10782: {'lr': 0.0004956697144537929, 'samples': 2070144, 'steps': 10781, 'loss/train': 1.9696669578552246} -11/06/2021 22:44:38 - INFO - __main__ - Step 10783: {'lr': 0.0004956687309703372, 'samples': 2070336, 'steps': 10782, 'loss/train': 2.0651187896728516} -11/06/2021 22:44:38 - INFO - __main__ - Step 10784: {'lr': 0.0004956677473761871, 'samples': 2070528, 'steps': 10783, 'loss/train': 1.8574343919754028} -11/06/2021 22:44:38 - INFO - __main__ - Step 10785: {'lr': 0.0004956667636713427, 'samples': 2070720, 'steps': 10784, 'loss/train': 1.5868165493011475} -11/06/2021 22:44:39 - INFO - __main__ - Step 10786: {'lr': 0.0004956657798558047, 'samples': 2070912, 'steps': 10785, 'loss/train': 1.4748395681381226} -11/06/2021 22:44:39 - INFO - __main__ - Step 10787: {'lr': 0.0004956647959295735, 'samples': 2071104, 'steps': 10786, 'loss/train': 1.701545000076294} -11/06/2021 22:44:40 - INFO - __main__ - Step 10788: {'lr': 0.0004956638118926495, 'samples': 2071296, 'steps': 10787, 'loss/train': 1.976759910583496} -11/06/2021 22:44:40 - INFO - __main__ - Step 10789: {'lr': 0.0004956628277450333, 'samples': 2071488, 'steps': 10788, 'loss/train': 2.1454813480377197} -11/06/2021 22:44:41 - INFO - __main__ - Step 10790: {'lr': 0.0004956618434867251, 'samples': 2071680, 'steps': 10789, 'loss/train': 1.5759694576263428} -11/06/2021 22:44:41 - INFO - __main__ - Step 10791: {'lr': 0.0004956608591177256, 'samples': 2071872, 'steps': 10790, 'loss/train': 1.8092042207717896} -11/06/2021 22:44:41 - INFO - __main__ - Step 10792: {'lr': 0.0004956598746380349, 'samples': 2072064, 'steps': 10791, 'loss/train': 1.6778979301452637} -11/06/2021 22:44:43 - INFO - __main__ - Step 10793: {'lr': 0.0004956588900476538, 'samples': 2072256, 'steps': 10792, 'loss/train': 1.459761381149292} -11/06/2021 22:44:43 - INFO - __main__ - Step 10794: {'lr': 0.0004956579053465826, 'samples': 2072448, 'steps': 10793, 'loss/train': 1.5399609804153442} -11/06/2021 22:44:43 - INFO - __main__ - Step 10795: {'lr': 0.0004956569205348217, 'samples': 2072640, 'steps': 10794, 'loss/train': 1.4473868608474731} -11/06/2021 22:44:44 - INFO - __main__ - Step 10796: {'lr': 0.0004956559356123717, 'samples': 2072832, 'steps': 10795, 'loss/train': 1.825037956237793} -11/06/2021 22:44:44 - INFO - __main__ - Step 10797: {'lr': 0.0004956549505792327, 'samples': 2073024, 'steps': 10796, 'loss/train': 2.264521360397339} -11/06/2021 22:44:45 - INFO - __main__ - Step 10798: {'lr': 0.0004956539654354055, 'samples': 2073216, 'steps': 10797, 'loss/train': 1.450287938117981} -11/06/2021 22:44:45 - INFO - __main__ - Step 10799: {'lr': 0.0004956529801808904, 'samples': 2073408, 'steps': 10798, 'loss/train': 1.9415364265441895} -11/06/2021 22:44:46 - INFO - __main__ - Step 10800: {'lr': 0.0004956519948156879, 'samples': 2073600, 'steps': 10799, 'loss/train': 1.7281900644302368} -11/06/2021 22:44:46 - INFO - __main__ - Step 10801: {'lr': 0.0004956510093397983, 'samples': 2073792, 'steps': 10800, 'loss/train': 1.6848071813583374} -11/06/2021 22:44:46 - INFO - __main__ - Step 10802: {'lr': 0.0004956500237532222, 'samples': 2073984, 'steps': 10801, 'loss/train': 2.119485855102539} -11/06/2021 22:44:47 - INFO - __main__ - Step 10803: {'lr': 0.0004956490380559601, 'samples': 2074176, 'steps': 10802, 'loss/train': 1.7440723180770874} -11/06/2021 22:44:48 - INFO - __main__ - Step 10804: {'lr': 0.0004956480522480121, 'samples': 2074368, 'steps': 10803, 'loss/train': 1.6248648166656494} -11/06/2021 22:44:48 - INFO - __main__ - Step 10805: {'lr': 0.000495647066329379, 'samples': 2074560, 'steps': 10804, 'loss/train': 2.111401081085205} -11/06/2021 22:44:49 - INFO - __main__ - Step 10806: {'lr': 0.0004956460803000612, 'samples': 2074752, 'steps': 10805, 'loss/train': 2.2455363273620605} -11/06/2021 22:44:49 - INFO - __main__ - Step 10807: {'lr': 0.0004956450941600589, 'samples': 2074944, 'steps': 10806, 'loss/train': 4.325562477111816} -11/06/2021 22:44:49 - INFO - __main__ - Step 10808: {'lr': 0.0004956441079093729, 'samples': 2075136, 'steps': 10807, 'loss/train': 1.592270851135254} -11/06/2021 22:44:50 - INFO - __main__ - Step 10809: {'lr': 0.0004956431215480034, 'samples': 2075328, 'steps': 10808, 'loss/train': 1.865347981452942} -11/06/2021 22:44:51 - INFO - __main__ - Step 10810: {'lr': 0.0004956421350759508, 'samples': 2075520, 'steps': 10809, 'loss/train': 1.3117084503173828} -11/06/2021 22:44:51 - INFO - __main__ - Step 10811: {'lr': 0.0004956411484932158, 'samples': 2075712, 'steps': 10810, 'loss/train': 1.8176014423370361} -11/06/2021 22:44:51 - INFO - __main__ - Step 10812: {'lr': 0.0004956401617997985, 'samples': 2075904, 'steps': 10811, 'loss/train': 1.2668240070343018} -11/06/2021 22:44:52 - INFO - __main__ - Step 10813: {'lr': 0.0004956391749956997, 'samples': 2076096, 'steps': 10812, 'loss/train': 2.1930673122406006} -11/06/2021 22:44:53 - INFO - __main__ - Step 10814: {'lr': 0.0004956381880809195, 'samples': 2076288, 'steps': 10813, 'loss/train': 2.0894155502319336} -11/06/2021 22:44:53 - INFO - __main__ - Step 10815: {'lr': 0.0004956372010554587, 'samples': 2076480, 'steps': 10814, 'loss/train': 1.8282910585403442} -11/06/2021 22:44:54 - INFO - __main__ - Step 10816: {'lr': 0.0004956362139193174, 'samples': 2076672, 'steps': 10815, 'loss/train': 2.062333345413208} -11/06/2021 22:44:54 - INFO - __main__ - Step 10817: {'lr': 0.0004956352266724964, 'samples': 2076864, 'steps': 10816, 'loss/train': 1.4473098516464233} -11/06/2021 22:44:54 - INFO - __main__ - Step 10818: {'lr': 0.0004956342393149959, 'samples': 2077056, 'steps': 10817, 'loss/train': 1.7274878025054932} -11/06/2021 22:44:56 - INFO - __main__ - Step 10819: {'lr': 0.0004956332518468163, 'samples': 2077248, 'steps': 10818, 'loss/train': 1.570633053779602} -11/06/2021 22:44:56 - INFO - __main__ - Step 10820: {'lr': 0.0004956322642679583, 'samples': 2077440, 'steps': 10819, 'loss/train': 1.7297214269638062} -11/06/2021 22:44:56 - INFO - __main__ - Step 10821: {'lr': 0.000495631276578422, 'samples': 2077632, 'steps': 10820, 'loss/train': 4.519792079925537} -11/06/2021 22:44:57 - INFO - __main__ - Step 10822: {'lr': 0.0004956302887782082, 'samples': 2077824, 'steps': 10821, 'loss/train': 1.0446696281433105} -11/06/2021 22:44:57 - INFO - __main__ - Step 10823: {'lr': 0.0004956293008673172, 'samples': 2078016, 'steps': 10822, 'loss/train': 0.5035202503204346} -11/06/2021 22:44:57 - INFO - __main__ - Step 10824: {'lr': 0.0004956283128457493, 'samples': 2078208, 'steps': 10823, 'loss/train': 0.34573525190353394} -11/06/2021 22:44:58 - INFO - __main__ - Step 10825: {'lr': 0.0004956273247135051, 'samples': 2078400, 'steps': 10824, 'loss/train': 1.6415156126022339} -11/06/2021 22:44:59 - INFO - __main__ - Step 10826: {'lr': 0.0004956263364705851, 'samples': 2078592, 'steps': 10825, 'loss/train': 1.6332308053970337} -11/06/2021 22:44:59 - INFO - __main__ - Step 10827: {'lr': 0.0004956253481169895, 'samples': 2078784, 'steps': 10826, 'loss/train': 2.319352865219116} -11/06/2021 22:44:59 - INFO - __main__ - Step 10828: {'lr': 0.0004956243596527191, 'samples': 2078976, 'steps': 10827, 'loss/train': 1.773661494255066} -11/06/2021 22:45:00 - INFO - __main__ - Step 10829: {'lr': 0.000495623371077774, 'samples': 2079168, 'steps': 10828, 'loss/train': 1.8046337366104126} -11/06/2021 22:45:01 - INFO - __main__ - Step 10830: {'lr': 0.000495622382392155, 'samples': 2079360, 'steps': 10829, 'loss/train': 1.06633460521698} -11/06/2021 22:45:01 - INFO - __main__ - Step 10831: {'lr': 0.0004956213935958621, 'samples': 2079552, 'steps': 10830, 'loss/train': 1.7313029766082764} -11/06/2021 22:45:02 - INFO - __main__ - Step 10832: {'lr': 0.0004956204046888961, 'samples': 2079744, 'steps': 10831, 'loss/train': 1.655548095703125} -11/06/2021 22:45:02 - INFO - __main__ - Step 10833: {'lr': 0.0004956194156712574, 'samples': 2079936, 'steps': 10832, 'loss/train': 2.0152714252471924} -11/06/2021 22:45:02 - INFO - __main__ - Step 10834: {'lr': 0.0004956184265429463, 'samples': 2080128, 'steps': 10833, 'loss/train': 2.010787010192871} -11/06/2021 22:45:03 - INFO - __main__ - Step 10835: {'lr': 0.0004956174373039634, 'samples': 2080320, 'steps': 10834, 'loss/train': 1.838008999824524} -11/06/2021 22:45:04 - INFO - __main__ - Step 10836: {'lr': 0.0004956164479543089, 'samples': 2080512, 'steps': 10835, 'loss/train': 1.985622525215149} -11/06/2021 22:45:04 - INFO - __main__ - Step 10837: {'lr': 0.0004956154584939836, 'samples': 2080704, 'steps': 10836, 'loss/train': 1.8421908617019653} -11/06/2021 22:45:04 - INFO - __main__ - Step 10838: {'lr': 0.0004956144689229877, 'samples': 2080896, 'steps': 10837, 'loss/train': 2.1746902465820312} -11/06/2021 22:45:05 - INFO - __main__ - Step 10839: {'lr': 0.0004956134792413218, 'samples': 2081088, 'steps': 10838, 'loss/train': 1.700150966644287} -11/06/2021 22:45:05 - INFO - __main__ - Step 10840: {'lr': 0.0004956124894489861, 'samples': 2081280, 'steps': 10839, 'loss/train': 2.058382749557495} -11/06/2021 22:45:06 - INFO - __main__ - Step 10841: {'lr': 0.0004956114995459813, 'samples': 2081472, 'steps': 10840, 'loss/train': 6.1868720054626465} -11/06/2021 22:45:06 - INFO - __main__ - Step 10842: {'lr': 0.0004956105095323077, 'samples': 2081664, 'steps': 10841, 'loss/train': 1.7854186296463013} -11/06/2021 22:45:07 - INFO - __main__ - Step 10843: {'lr': 0.0004956095194079658, 'samples': 2081856, 'steps': 10842, 'loss/train': 1.8103166818618774} -11/06/2021 22:45:07 - INFO - __main__ - Step 10844: {'lr': 0.000495608529172956, 'samples': 2082048, 'steps': 10843, 'loss/train': 1.3330121040344238} -11/06/2021 22:45:08 - INFO - __main__ - Step 10845: {'lr': 0.0004956075388272789, 'samples': 2082240, 'steps': 10844, 'loss/train': 1.5644762516021729} -11/06/2021 22:45:09 - INFO - __main__ - Step 10846: {'lr': 0.0004956065483709348, 'samples': 2082432, 'steps': 10845, 'loss/train': 1.6880342960357666} -11/06/2021 22:45:09 - INFO - __main__ - Step 10847: {'lr': 0.0004956055578039241, 'samples': 2082624, 'steps': 10846, 'loss/train': 1.727042317390442} -11/06/2021 22:45:09 - INFO - __main__ - Step 10848: {'lr': 0.0004956045671262475, 'samples': 2082816, 'steps': 10847, 'loss/train': 1.3795113563537598} -11/06/2021 22:45:10 - INFO - __main__ - Step 10849: {'lr': 0.0004956035763379051, 'samples': 2083008, 'steps': 10848, 'loss/train': 1.9024347066879272} -11/06/2021 22:45:10 - INFO - __main__ - Step 10850: {'lr': 0.0004956025854388976, 'samples': 2083200, 'steps': 10849, 'loss/train': 0.8960413336753845} -11/06/2021 22:45:11 - INFO - __main__ - Step 10851: {'lr': 0.0004956015944292253, 'samples': 2083392, 'steps': 10850, 'loss/train': 2.1259398460388184} -11/06/2021 22:45:11 - INFO - __main__ - Step 10852: {'lr': 0.0004956006033088888, 'samples': 2083584, 'steps': 10851, 'loss/train': 1.9654005765914917} -11/06/2021 22:45:12 - INFO - __main__ - Step 10853: {'lr': 0.0004955996120778884, 'samples': 2083776, 'steps': 10852, 'loss/train': 1.8148349523544312} -11/06/2021 22:45:12 - INFO - __main__ - Step 10854: {'lr': 0.0004955986207362246, 'samples': 2083968, 'steps': 10853, 'loss/train': 0.7852979898452759} -11/06/2021 22:45:12 - INFO - __main__ - Step 10855: {'lr': 0.0004955976292838979, 'samples': 2084160, 'steps': 10854, 'loss/train': 1.4349844455718994} -11/06/2021 22:45:14 - INFO - __main__ - Step 10856: {'lr': 0.0004955966377209086, 'samples': 2084352, 'steps': 10855, 'loss/train': 1.8268946409225464} -11/06/2021 22:45:14 - INFO - __main__ - Step 10857: {'lr': 0.0004955956460472573, 'samples': 2084544, 'steps': 10856, 'loss/train': 2.225966453552246} -11/06/2021 22:45:14 - INFO - __main__ - Step 10858: {'lr': 0.0004955946542629444, 'samples': 2084736, 'steps': 10857, 'loss/train': 1.7703862190246582} -11/06/2021 22:45:15 - INFO - __main__ - Step 10859: {'lr': 0.0004955936623679703, 'samples': 2084928, 'steps': 10858, 'loss/train': 2.2991316318511963} -11/06/2021 22:45:15 - INFO - __main__ - Step 10860: {'lr': 0.0004955926703623356, 'samples': 2085120, 'steps': 10859, 'loss/train': 2.4180328845977783} -11/06/2021 22:45:15 - INFO - __main__ - Step 10861: {'lr': 0.0004955916782460405, 'samples': 2085312, 'steps': 10860, 'loss/train': 2.1252551078796387} -11/06/2021 22:45:16 - INFO - __main__ - Step 10862: {'lr': 0.0004955906860190857, 'samples': 2085504, 'steps': 10861, 'loss/train': 1.9650782346725464} -11/06/2021 22:45:17 - INFO - __main__ - Step 10863: {'lr': 0.0004955896936814714, 'samples': 2085696, 'steps': 10862, 'loss/train': 1.8924416303634644} -11/06/2021 22:45:17 - INFO - __main__ - Step 10864: {'lr': 0.0004955887012331982, 'samples': 2085888, 'steps': 10863, 'loss/train': 1.7115322351455688} -11/06/2021 22:45:17 - INFO - __main__ - Step 10865: {'lr': 0.0004955877086742666, 'samples': 2086080, 'steps': 10864, 'loss/train': 1.3016084432601929} -11/06/2021 22:45:18 - INFO - __main__ - Step 10866: {'lr': 0.0004955867160046769, 'samples': 2086272, 'steps': 10865, 'loss/train': 1.6526113748550415} -11/06/2021 22:45:19 - INFO - __main__ - Step 10867: {'lr': 0.0004955857232244297, 'samples': 2086464, 'steps': 10866, 'loss/train': 1.5143797397613525} -11/06/2021 22:45:19 - INFO - __main__ - Step 10868: {'lr': 0.0004955847303335253, 'samples': 2086656, 'steps': 10867, 'loss/train': 1.8986718654632568} -11/06/2021 22:45:19 - INFO - __main__ - Step 10869: {'lr': 0.0004955837373319641, 'samples': 2086848, 'steps': 10868, 'loss/train': 1.6956390142440796} -11/06/2021 22:45:20 - INFO - __main__ - Step 10870: {'lr': 0.0004955827442197468, 'samples': 2087040, 'steps': 10869, 'loss/train': 1.9190312623977661} -11/06/2021 22:45:20 - INFO - __main__ - Step 10871: {'lr': 0.0004955817509968737, 'samples': 2087232, 'steps': 10870, 'loss/train': 1.3590363264083862} -11/06/2021 22:45:21 - INFO - __main__ - Step 10872: {'lr': 0.0004955807576633452, 'samples': 2087424, 'steps': 10871, 'loss/train': 1.7737996578216553} -11/06/2021 22:45:22 - INFO - __main__ - Step 10873: {'lr': 0.0004955797642191618, 'samples': 2087616, 'steps': 10872, 'loss/train': 1.8622442483901978} -11/06/2021 22:45:22 - INFO - __main__ - Step 10874: {'lr': 0.000495578770664324, 'samples': 2087808, 'steps': 10873, 'loss/train': 1.9006373882293701} -11/06/2021 22:45:22 - INFO - __main__ - Step 10875: {'lr': 0.0004955777769988322, 'samples': 2088000, 'steps': 10874, 'loss/train': 2.0556890964508057} -11/06/2021 22:45:23 - INFO - __main__ - Step 10876: {'lr': 0.0004955767832226868, 'samples': 2088192, 'steps': 10875, 'loss/train': 1.6354632377624512} -11/06/2021 22:45:24 - INFO - __main__ - Step 10877: {'lr': 0.0004955757893358884, 'samples': 2088384, 'steps': 10876, 'loss/train': 1.777341365814209} -11/06/2021 22:45:24 - INFO - __main__ - Step 10878: {'lr': 0.0004955747953384372, 'samples': 2088576, 'steps': 10877, 'loss/train': 1.4678032398223877} -11/06/2021 22:45:25 - INFO - __main__ - Step 10879: {'lr': 0.0004955738012303338, 'samples': 2088768, 'steps': 10878, 'loss/train': 2.07291579246521} -11/06/2021 22:45:25 - INFO - __main__ - Step 10880: {'lr': 0.0004955728070115787, 'samples': 2088960, 'steps': 10879, 'loss/train': 1.9695255756378174} -11/06/2021 22:45:25 - INFO - __main__ - Step 10881: {'lr': 0.0004955718126821722, 'samples': 2089152, 'steps': 10880, 'loss/train': 2.657900094985962} -11/06/2021 22:45:26 - INFO - __main__ - Step 10882: {'lr': 0.0004955708182421149, 'samples': 2089344, 'steps': 10881, 'loss/train': 1.587023377418518} -11/06/2021 22:45:26 - INFO - __main__ - Step 10883: {'lr': 0.0004955698236914071, 'samples': 2089536, 'steps': 10882, 'loss/train': 1.4646183252334595} -11/06/2021 22:45:27 - INFO - __main__ - Step 10884: {'lr': 0.0004955688290300494, 'samples': 2089728, 'steps': 10883, 'loss/train': 2.305067539215088} -11/06/2021 22:45:27 - INFO - __main__ - Step 10885: {'lr': 0.0004955678342580421, 'samples': 2089920, 'steps': 10884, 'loss/train': 2.04618501663208} -11/06/2021 22:45:28 - INFO - __main__ - Step 10886: {'lr': 0.0004955668393753858, 'samples': 2090112, 'steps': 10885, 'loss/train': 1.8852858543395996} -11/06/2021 22:45:28 - INFO - __main__ - Step 10887: {'lr': 0.0004955658443820809, 'samples': 2090304, 'steps': 10886, 'loss/train': 1.9681472778320312} -11/06/2021 22:45:28 - INFO - __main__ - Step 10888: {'lr': 0.0004955648492781277, 'samples': 2090496, 'steps': 10887, 'loss/train': 2.0879921913146973} -11/06/2021 22:45:30 - INFO - __main__ - Step 10889: {'lr': 0.0004955638540635269, 'samples': 2090688, 'steps': 10888, 'loss/train': 1.7729140520095825} -11/06/2021 22:45:30 - INFO - __main__ - Step 10890: {'lr': 0.0004955628587382788, 'samples': 2090880, 'steps': 10889, 'loss/train': 1.8550975322723389} -11/06/2021 22:45:30 - INFO - __main__ - Step 10891: {'lr': 0.0004955618633023837, 'samples': 2091072, 'steps': 10890, 'loss/train': 1.8905608654022217} -11/06/2021 22:45:31 - INFO - __main__ - Step 10892: {'lr': 0.0004955608677558424, 'samples': 2091264, 'steps': 10891, 'loss/train': 1.5222508907318115} -11/06/2021 22:45:31 - INFO - __main__ - Step 10893: {'lr': 0.0004955598720986551, 'samples': 2091456, 'steps': 10892, 'loss/train': 1.770163655281067} -11/06/2021 22:45:32 - INFO - __main__ - Step 10894: {'lr': 0.0004955588763308223, 'samples': 2091648, 'steps': 10893, 'loss/train': 1.9412416219711304} -11/06/2021 22:45:32 - INFO - __main__ - Step 10895: {'lr': 0.0004955578804523445, 'samples': 2091840, 'steps': 10894, 'loss/train': 1.9182251691818237} -11/06/2021 22:45:33 - INFO - __main__ - Step 10896: {'lr': 0.000495556884463222, 'samples': 2092032, 'steps': 10895, 'loss/train': 1.7548394203186035} -11/06/2021 22:45:33 - INFO - __main__ - Step 10897: {'lr': 0.0004955558883634555, 'samples': 2092224, 'steps': 10896, 'loss/train': 2.1378374099731445} -11/06/2021 22:45:33 - INFO - __main__ - Step 10898: {'lr': 0.0004955548921530452, 'samples': 2092416, 'steps': 10897, 'loss/train': 1.4862196445465088} -11/06/2021 22:45:34 - INFO - __main__ - Step 10899: {'lr': 0.0004955538958319917, 'samples': 2092608, 'steps': 10898, 'loss/train': 1.4818750619888306} -11/06/2021 22:45:35 - INFO - __main__ - Step 10900: {'lr': 0.0004955528994002954, 'samples': 2092800, 'steps': 10899, 'loss/train': 2.25352144241333} -11/06/2021 22:45:35 - INFO - __main__ - Step 10901: {'lr': 0.0004955519028579568, 'samples': 2092992, 'steps': 10900, 'loss/train': 1.904826045036316} -11/06/2021 22:45:35 - INFO - __main__ - Step 10902: {'lr': 0.0004955509062049763, 'samples': 2093184, 'steps': 10901, 'loss/train': 2.2646710872650146} -11/06/2021 22:45:36 - INFO - __main__ - Step 10903: {'lr': 0.0004955499094413542, 'samples': 2093376, 'steps': 10902, 'loss/train': 1.8453540802001953} -11/06/2021 22:45:37 - INFO - __main__ - Step 10904: {'lr': 0.0004955489125670912, 'samples': 2093568, 'steps': 10903, 'loss/train': 1.2901415824890137} -11/06/2021 22:45:37 - INFO - __main__ - Step 10905: {'lr': 0.0004955479155821877, 'samples': 2093760, 'steps': 10904, 'loss/train': 1.7908188104629517} -11/06/2021 22:45:37 - INFO - __main__ - Step 10906: {'lr': 0.000495546918486644, 'samples': 2093952, 'steps': 10905, 'loss/train': 1.9787135124206543} -11/06/2021 22:45:38 - INFO - __main__ - Step 10907: {'lr': 0.0004955459212804607, 'samples': 2094144, 'steps': 10906, 'loss/train': 0.762311577796936} -11/06/2021 22:45:38 - INFO - __main__ - Step 10908: {'lr': 0.0004955449239636382, 'samples': 2094336, 'steps': 10907, 'loss/train': 1.5875378847122192} -11/06/2021 22:45:38 - INFO - __main__ - Step 10909: {'lr': 0.000495543926536177, 'samples': 2094528, 'steps': 10908, 'loss/train': 1.9852023124694824} -11/06/2021 22:45:39 - INFO - __main__ - Step 10910: {'lr': 0.0004955429289980774, 'samples': 2094720, 'steps': 10909, 'loss/train': 1.7083479166030884} -11/06/2021 22:45:40 - INFO - __main__ - Step 10911: {'lr': 0.00049554193134934, 'samples': 2094912, 'steps': 10910, 'loss/train': 2.226473808288574} -11/06/2021 22:45:40 - INFO - __main__ - Step 10912: {'lr': 0.0004955409335899651, 'samples': 2095104, 'steps': 10911, 'loss/train': 1.7257845401763916} -11/06/2021 22:45:40 - INFO - __main__ - Step 10913: {'lr': 0.0004955399357199534, 'samples': 2095296, 'steps': 10912, 'loss/train': 1.5614092350006104} -11/06/2021 22:45:41 - INFO - __main__ - Step 10914: {'lr': 0.0004955389377393051, 'samples': 2095488, 'steps': 10913, 'loss/train': 1.6544125080108643} -11/06/2021 22:45:42 - INFO - __main__ - Step 10915: {'lr': 0.0004955379396480207, 'samples': 2095680, 'steps': 10914, 'loss/train': 2.452582836151123} -11/06/2021 22:45:42 - INFO - __main__ - Step 10916: {'lr': 0.0004955369414461007, 'samples': 2095872, 'steps': 10915, 'loss/train': 1.0178364515304565} -11/06/2021 22:45:43 - INFO - __main__ - Step 10917: {'lr': 0.0004955359431335456, 'samples': 2096064, 'steps': 10916, 'loss/train': 0.8691990375518799} -11/06/2021 22:45:43 - INFO - __main__ - Step 10918: {'lr': 0.0004955349447103559, 'samples': 2096256, 'steps': 10917, 'loss/train': 1.4804587364196777} -11/06/2021 22:45:43 - INFO - __main__ - Step 10919: {'lr': 0.0004955339461765318, 'samples': 2096448, 'steps': 10918, 'loss/train': 1.8954075574874878} -11/06/2021 22:45:44 - INFO - __main__ - Step 10920: {'lr': 0.0004955329475320739, 'samples': 2096640, 'steps': 10919, 'loss/train': 1.3000982999801636} -11/06/2021 22:45:45 - INFO - __main__ - Step 10921: {'lr': 0.0004955319487769827, 'samples': 2096832, 'steps': 10920, 'loss/train': 1.6396160125732422} -11/06/2021 22:45:45 - INFO - __main__ - Step 10922: {'lr': 0.0004955309499112586, 'samples': 2097024, 'steps': 10921, 'loss/train': 1.534606695175171} -11/06/2021 22:45:45 - INFO - __main__ - Step 10923: {'lr': 0.000495529950934902, 'samples': 2097216, 'steps': 10922, 'loss/train': 1.6064701080322266} -11/06/2021 22:45:46 - INFO - __main__ - Step 10924: {'lr': 0.0004955289518479134, 'samples': 2097408, 'steps': 10923, 'loss/train': 1.5156863927841187} -11/06/2021 22:45:47 - INFO - __main__ - Step 10925: {'lr': 0.0004955279526502931, 'samples': 2097600, 'steps': 10924, 'loss/train': 1.9213401079177856} -11/06/2021 22:45:47 - INFO - __main__ - Step 10926: {'lr': 0.0004955269533420419, 'samples': 2097792, 'steps': 10925, 'loss/train': 1.5095373392105103} -11/06/2021 22:45:47 - INFO - __main__ - Step 10927: {'lr': 0.00049552595392316, 'samples': 2097984, 'steps': 10926, 'loss/train': 1.9724854230880737} -11/06/2021 22:45:48 - INFO - __main__ - Step 10928: {'lr': 0.0004955249543936479, 'samples': 2098176, 'steps': 10927, 'loss/train': 1.7889426946640015} -11/06/2021 22:45:48 - INFO - __main__ - Step 10929: {'lr': 0.000495523954753506, 'samples': 2098368, 'steps': 10928, 'loss/train': 2.7239041328430176} -11/06/2021 22:45:49 - INFO - __main__ - Step 10930: {'lr': 0.0004955229550027347, 'samples': 2098560, 'steps': 10929, 'loss/train': 1.7207810878753662} -11/06/2021 22:45:49 - INFO - __main__ - Step 10931: {'lr': 0.0004955219551413347, 'samples': 2098752, 'steps': 10930, 'loss/train': 1.4292515516281128} -11/06/2021 22:45:50 - INFO - __main__ - Step 10932: {'lr': 0.0004955209551693063, 'samples': 2098944, 'steps': 10931, 'loss/train': 2.1134376525878906} -11/06/2021 22:45:50 - INFO - __main__ - Step 10933: {'lr': 0.0004955199550866498, 'samples': 2099136, 'steps': 10932, 'loss/train': 1.5380351543426514} -11/06/2021 22:45:51 - INFO - __main__ - Step 10934: {'lr': 0.000495518954893366, 'samples': 2099328, 'steps': 10933, 'loss/train': 1.7026230096817017} -11/06/2021 22:45:51 - INFO - __main__ - Step 10935: {'lr': 0.000495517954589455, 'samples': 2099520, 'steps': 10934, 'loss/train': 1.979361891746521} -11/06/2021 22:45:52 - INFO - __main__ - Step 10936: {'lr': 0.0004955169541749173, 'samples': 2099712, 'steps': 10935, 'loss/train': 1.7494332790374756} -11/06/2021 22:45:52 - INFO - __main__ - Step 10937: {'lr': 0.0004955159536497536, 'samples': 2099904, 'steps': 10936, 'loss/train': 1.8730812072753906} -11/06/2021 22:45:53 - INFO - __main__ - Step 10938: {'lr': 0.0004955149530139643, 'samples': 2100096, 'steps': 10937, 'loss/train': 1.707970142364502} -11/06/2021 22:45:53 - INFO - __main__ - Step 10939: {'lr': 0.0004955139522675496, 'samples': 2100288, 'steps': 10938, 'loss/train': 2.6687307357788086} -11/06/2021 22:45:53 - INFO - __main__ - Step 10940: {'lr': 0.0004955129514105101, 'samples': 2100480, 'steps': 10939, 'loss/train': 2.0217690467834473} -11/06/2021 22:45:54 - INFO - __main__ - Step 10941: {'lr': 0.0004955119504428464, 'samples': 2100672, 'steps': 10940, 'loss/train': 1.6573915481567383} -11/06/2021 22:45:55 - INFO - __main__ - Step 10942: {'lr': 0.0004955109493645587, 'samples': 2100864, 'steps': 10941, 'loss/train': 1.8716685771942139} -11/06/2021 22:45:55 - INFO - __main__ - Step 10943: {'lr': 0.0004955099481756475, 'samples': 2101056, 'steps': 10942, 'loss/train': 2.186129331588745} -11/06/2021 22:45:55 - INFO - __main__ - Step 10944: {'lr': 0.0004955089468761133, 'samples': 2101248, 'steps': 10943, 'loss/train': 2.171231985092163} -11/06/2021 22:45:56 - INFO - __main__ - Step 10945: {'lr': 0.0004955079454659567, 'samples': 2101440, 'steps': 10944, 'loss/train': 1.6056174039840698} -11/06/2021 22:45:57 - INFO - __main__ - Step 10946: {'lr': 0.0004955069439451778, 'samples': 2101632, 'steps': 10945, 'loss/train': 1.8130086660385132} -11/06/2021 22:45:57 - INFO - __main__ - Step 10947: {'lr': 0.0004955059423137774, 'samples': 2101824, 'steps': 10946, 'loss/train': 1.8952678442001343} -11/06/2021 22:45:57 - INFO - __main__ - Step 10948: {'lr': 0.0004955049405717558, 'samples': 2102016, 'steps': 10947, 'loss/train': 1.9916630983352661} -11/06/2021 22:45:58 - INFO - __main__ - Step 10949: {'lr': 0.0004955039387191135, 'samples': 2102208, 'steps': 10948, 'loss/train': 1.791800618171692} -11/06/2021 22:45:58 - INFO - __main__ - Step 10950: {'lr': 0.0004955029367558508, 'samples': 2102400, 'steps': 10949, 'loss/train': 1.4076131582260132} -11/06/2021 22:45:59 - INFO - __main__ - Step 10951: {'lr': 0.0004955019346819684, 'samples': 2102592, 'steps': 10950, 'loss/train': 1.7060812711715698} -11/06/2021 22:45:59 - INFO - __main__ - Step 10952: {'lr': 0.0004955009324974666, 'samples': 2102784, 'steps': 10951, 'loss/train': 1.271490216255188} -11/06/2021 22:46:00 - INFO - __main__ - Step 10953: {'lr': 0.0004954999302023458, 'samples': 2102976, 'steps': 10952, 'loss/train': 2.104248046875} -11/06/2021 22:46:00 - INFO - __main__ - Step 10954: {'lr': 0.0004954989277966064, 'samples': 2103168, 'steps': 10953, 'loss/train': 1.4961109161376953} -11/06/2021 22:46:01 - INFO - __main__ - Step 10955: {'lr': 0.0004954979252802491, 'samples': 2103360, 'steps': 10954, 'loss/train': 1.854745626449585} -11/06/2021 22:46:02 - INFO - __main__ - Step 10956: {'lr': 0.0004954969226532743, 'samples': 2103552, 'steps': 10955, 'loss/train': 1.7922343015670776} -11/06/2021 22:46:02 - INFO - __main__ - Step 10957: {'lr': 0.0004954959199156824, 'samples': 2103744, 'steps': 10956, 'loss/train': 2.0796141624450684} -11/06/2021 22:46:02 - INFO - __main__ - Step 10958: {'lr': 0.0004954949170674736, 'samples': 2103936, 'steps': 10957, 'loss/train': 2.0407614707946777} -11/06/2021 22:46:03 - INFO - __main__ - Step 10959: {'lr': 0.0004954939141086488, 'samples': 2104128, 'steps': 10958, 'loss/train': 1.2875730991363525} -11/06/2021 22:46:03 - INFO - __main__ - Step 10960: {'lr': 0.0004954929110392081, 'samples': 2104320, 'steps': 10959, 'loss/train': 1.918273687362671} -11/06/2021 22:46:04 - INFO - __main__ - Step 10961: {'lr': 0.0004954919078591521, 'samples': 2104512, 'steps': 10960, 'loss/train': 1.7532039880752563} -11/06/2021 22:46:05 - INFO - __main__ - Step 10962: {'lr': 0.0004954909045684812, 'samples': 2104704, 'steps': 10961, 'loss/train': 1.595262050628662} -11/06/2021 22:46:05 - INFO - __main__ - Step 10963: {'lr': 0.000495489901167196, 'samples': 2104896, 'steps': 10962, 'loss/train': 1.8555185794830322} -11/06/2021 22:46:05 - INFO - __main__ - Step 10964: {'lr': 0.0004954888976552968, 'samples': 2105088, 'steps': 10963, 'loss/train': 1.559324026107788} -11/06/2021 22:46:06 - INFO - __main__ - Step 10965: {'lr': 0.0004954878940327841, 'samples': 2105280, 'steps': 10964, 'loss/train': 1.616891860961914} -11/06/2021 22:46:07 - INFO - __main__ - Step 10966: {'lr': 0.0004954868902996582, 'samples': 2105472, 'steps': 10965, 'loss/train': 1.9043447971343994} -11/06/2021 22:46:07 - INFO - __main__ - Step 10967: {'lr': 0.0004954858864559199, 'samples': 2105664, 'steps': 10966, 'loss/train': 2.002821922302246} -11/06/2021 22:46:07 - INFO - __main__ - Step 10968: {'lr': 0.0004954848825015694, 'samples': 2105856, 'steps': 10967, 'loss/train': 1.3038442134857178} -11/06/2021 22:46:08 - INFO - __main__ - Step 10969: {'lr': 0.0004954838784366071, 'samples': 2106048, 'steps': 10968, 'loss/train': 1.6041873693466187} -11/06/2021 22:46:08 - INFO - __main__ - Step 10970: {'lr': 0.0004954828742610336, 'samples': 2106240, 'steps': 10969, 'loss/train': 2.28267502784729} -11/06/2021 22:46:09 - INFO - __main__ - Step 10971: {'lr': 0.0004954818699748493, 'samples': 2106432, 'steps': 10970, 'loss/train': 1.9312834739685059} -11/06/2021 22:46:09 - INFO - __main__ - Step 10972: {'lr': 0.0004954808655780546, 'samples': 2106624, 'steps': 10971, 'loss/train': 1.7641648054122925} -11/06/2021 22:46:10 - INFO - __main__ - Step 10973: {'lr': 0.0004954798610706502, 'samples': 2106816, 'steps': 10972, 'loss/train': 1.8444775342941284} -11/06/2021 22:46:10 - INFO - __main__ - Step 10974: {'lr': 0.0004954788564526362, 'samples': 2107008, 'steps': 10973, 'loss/train': 1.9866970777511597} -11/06/2021 22:46:10 - INFO - __main__ - Step 10975: {'lr': 0.0004954778517240133, 'samples': 2107200, 'steps': 10974, 'loss/train': 1.7459683418273926} -11/06/2021 22:46:11 - INFO - __main__ - Step 10976: {'lr': 0.0004954768468847818, 'samples': 2107392, 'steps': 10975, 'loss/train': 3.977201223373413} -11/06/2021 22:46:12 - INFO - __main__ - Step 10977: {'lr': 0.0004954758419349422, 'samples': 2107584, 'steps': 10976, 'loss/train': 1.9195420742034912} -11/06/2021 22:46:12 - INFO - __main__ - Step 10978: {'lr': 0.000495474836874495, 'samples': 2107776, 'steps': 10977, 'loss/train': 1.9030547142028809} -11/06/2021 22:46:12 - INFO - __main__ - Step 10979: {'lr': 0.0004954738317034408, 'samples': 2107968, 'steps': 10978, 'loss/train': 1.9866000413894653} -11/06/2021 22:46:13 - INFO - __main__ - Step 10980: {'lr': 0.0004954728264217796, 'samples': 2108160, 'steps': 10979, 'loss/train': 1.738264560699463} -11/06/2021 22:46:13 - INFO - __main__ - Step 10981: {'lr': 0.0004954718210295123, 'samples': 2108352, 'steps': 10980, 'loss/train': 1.8209415674209595} -11/06/2021 22:46:14 - INFO - __main__ - Step 10982: {'lr': 0.0004954708155266392, 'samples': 2108544, 'steps': 10981, 'loss/train': 1.931311011314392} -11/06/2021 22:46:15 - INFO - __main__ - Step 10983: {'lr': 0.0004954698099131606, 'samples': 2108736, 'steps': 10982, 'loss/train': 2.182440996170044} -11/06/2021 22:46:15 - INFO - __main__ - Step 10984: {'lr': 0.0004954688041890772, 'samples': 2108928, 'steps': 10983, 'loss/train': 1.8009920120239258} -11/06/2021 22:46:15 - INFO - __main__ - Step 10985: {'lr': 0.0004954677983543893, 'samples': 2109120, 'steps': 10984, 'loss/train': 1.65086829662323} -11/06/2021 22:46:16 - INFO - __main__ - Step 10986: {'lr': 0.0004954667924090974, 'samples': 2109312, 'steps': 10985, 'loss/train': 2.294792413711548} -11/06/2021 22:46:17 - INFO - __main__ - Step 10987: {'lr': 0.000495465786353202, 'samples': 2109504, 'steps': 10986, 'loss/train': 1.9113411903381348} -11/06/2021 22:46:17 - INFO - __main__ - Step 10988: {'lr': 0.0004954647801867035, 'samples': 2109696, 'steps': 10987, 'loss/train': 1.2942930459976196} -11/06/2021 22:46:17 - INFO - __main__ - Step 10989: {'lr': 0.0004954637739096023, 'samples': 2109888, 'steps': 10988, 'loss/train': 2.1266255378723145} -11/06/2021 22:46:18 - INFO - __main__ - Step 10990: {'lr': 0.0004954627675218989, 'samples': 2110080, 'steps': 10989, 'loss/train': 1.2343058586120605} -11/06/2021 22:46:18 - INFO - __main__ - Step 10991: {'lr': 0.0004954617610235939, 'samples': 2110272, 'steps': 10990, 'loss/train': 1.7390135526657104} -11/06/2021 22:46:18 - INFO - __main__ - Step 10992: {'lr': 0.0004954607544146875, 'samples': 2110464, 'steps': 10991, 'loss/train': 1.8976117372512817} -11/06/2021 22:46:20 - INFO - __main__ - Step 10993: {'lr': 0.0004954597476951804, 'samples': 2110656, 'steps': 10992, 'loss/train': 1.9760702848434448} -11/06/2021 22:46:20 - INFO - __main__ - Step 10994: {'lr': 0.0004954587408650727, 'samples': 2110848, 'steps': 10993, 'loss/train': 2.1973133087158203} -11/06/2021 22:46:21 - INFO - __main__ - Step 10995: {'lr': 0.0004954577339243652, 'samples': 2111040, 'steps': 10994, 'loss/train': 1.842615008354187} -11/06/2021 22:46:21 - INFO - __main__ - Step 10996: {'lr': 0.0004954567268730582, 'samples': 2111232, 'steps': 10995, 'loss/train': 1.7507246732711792} -11/06/2021 22:46:21 - INFO - __main__ - Step 10997: {'lr': 0.0004954557197111522, 'samples': 2111424, 'steps': 10996, 'loss/train': 4.712644577026367} -11/06/2021 22:46:22 - INFO - __main__ - Step 10998: {'lr': 0.0004954547124386477, 'samples': 2111616, 'steps': 10997, 'loss/train': 2.954491138458252} -11/06/2021 22:46:23 - INFO - __main__ - Step 10999: {'lr': 0.0004954537050555451, 'samples': 2111808, 'steps': 10998, 'loss/train': 1.7333556413650513} -11/06/2021 22:46:23 - INFO - __main__ - Step 11000: {'lr': 0.0004954526975618447, 'samples': 2112000, 'steps': 10999, 'loss/train': 1.7559417486190796} -11/06/2021 22:46:23 - INFO - __main__ - Step 11001: {'lr': 0.0004954516899575473, 'samples': 2112192, 'steps': 11000, 'loss/train': 1.4720401763916016} -11/06/2021 22:46:24 - INFO - __main__ - Step 11002: {'lr': 0.000495450682242653, 'samples': 2112384, 'steps': 11001, 'loss/train': 1.7932754755020142} -11/06/2021 22:46:24 - INFO - __main__ - Step 11003: {'lr': 0.0004954496744171624, 'samples': 2112576, 'steps': 11002, 'loss/train': 2.697819232940674} -11/06/2021 22:46:25 - INFO - __main__ - Step 11004: {'lr': 0.0004954486664810762, 'samples': 2112768, 'steps': 11003, 'loss/train': 1.973361849784851} -11/06/2021 22:46:25 - INFO - __main__ - Step 11005: {'lr': 0.0004954476584343945, 'samples': 2112960, 'steps': 11004, 'loss/train': 1.4034092426300049} -11/06/2021 22:46:26 - INFO - __main__ - Step 11006: {'lr': 0.0004954466502771178, 'samples': 2113152, 'steps': 11005, 'loss/train': 1.6337881088256836} -11/06/2021 22:46:26 - INFO - __main__ - Step 11007: {'lr': 0.0004954456420092466, 'samples': 2113344, 'steps': 11006, 'loss/train': 1.6302669048309326} -11/06/2021 22:46:27 - INFO - __main__ - Step 11008: {'lr': 0.0004954446336307814, 'samples': 2113536, 'steps': 11007, 'loss/train': 1.5346612930297852} -11/06/2021 22:46:28 - INFO - __main__ - Step 11009: {'lr': 0.0004954436251417227, 'samples': 2113728, 'steps': 11008, 'loss/train': 1.931561827659607} -11/06/2021 22:46:29 - INFO - __main__ - Step 11010: {'lr': 0.0004954426165420709, 'samples': 2113920, 'steps': 11009, 'loss/train': 2.0047390460968018} -11/06/2021 22:46:29 - INFO - __main__ - Step 11011: {'lr': 0.0004954416078318263, 'samples': 2114112, 'steps': 11010, 'loss/train': 1.6063743829727173} -11/06/2021 22:46:29 - INFO - __main__ - Step 11012: {'lr': 0.0004954405990109897, 'samples': 2114304, 'steps': 11011, 'loss/train': 1.1053050756454468} -11/06/2021 22:46:30 - INFO - __main__ - Step 11013: {'lr': 0.0004954395900795611, 'samples': 2114496, 'steps': 11012, 'loss/train': 1.6776947975158691} -11/06/2021 22:46:30 - INFO - __main__ - Step 11014: {'lr': 0.0004954385810375415, 'samples': 2114688, 'steps': 11013, 'loss/train': 0.4628012776374817} -11/06/2021 22:46:31 - INFO - __main__ - Step 11015: {'lr': 0.0004954375718849308, 'samples': 2114880, 'steps': 11014, 'loss/train': 1.808875560760498} -11/06/2021 22:46:31 - INFO - __main__ - Step 11016: {'lr': 0.0004954365626217299, 'samples': 2115072, 'steps': 11015, 'loss/train': 1.8625273704528809} -11/06/2021 22:46:32 - INFO - __main__ - Step 11017: {'lr': 0.0004954355532479391, 'samples': 2115264, 'steps': 11016, 'loss/train': 1.388060450553894} -11/06/2021 22:46:32 - INFO - __main__ - Step 11018: {'lr': 0.0004954345437635587, 'samples': 2115456, 'steps': 11017, 'loss/train': 1.43634033203125} -11/06/2021 22:46:32 - INFO - __main__ - Step 11019: {'lr': 0.0004954335341685893, 'samples': 2115648, 'steps': 11018, 'loss/train': 1.6223043203353882} -11/06/2021 22:46:33 - INFO - __main__ - Step 11020: {'lr': 0.0004954325244630315, 'samples': 2115840, 'steps': 11019, 'loss/train': 1.9205574989318848} -11/06/2021 22:46:34 - INFO - __main__ - Step 11021: {'lr': 0.0004954315146468854, 'samples': 2116032, 'steps': 11020, 'loss/train': 2.2265076637268066} -11/06/2021 22:46:34 - INFO - __main__ - Step 11022: {'lr': 0.0004954305047201517, 'samples': 2116224, 'steps': 11021, 'loss/train': 1.7414882183074951} -11/06/2021 22:46:34 - INFO - __main__ - Step 11023: {'lr': 0.0004954294946828308, 'samples': 2116416, 'steps': 11022, 'loss/train': 2.187809944152832} -11/06/2021 22:46:35 - INFO - __main__ - Step 11024: {'lr': 0.0004954284845349232, 'samples': 2116608, 'steps': 11023, 'loss/train': 1.778928279876709} -11/06/2021 22:46:35 - INFO - __main__ - Step 11025: {'lr': 0.0004954274742764292, 'samples': 2116800, 'steps': 11024, 'loss/train': 1.018846869468689} -11/06/2021 22:46:36 - INFO - __main__ - Step 11026: {'lr': 0.0004954264639073495, 'samples': 2116992, 'steps': 11025, 'loss/train': 4.848390579223633} -11/06/2021 22:46:37 - INFO - __main__ - Step 11027: {'lr': 0.0004954254534276843, 'samples': 2117184, 'steps': 11026, 'loss/train': 1.92079496383667} -11/06/2021 22:46:37 - INFO - __main__ - Step 11028: {'lr': 0.0004954244428374343, 'samples': 2117376, 'steps': 11027, 'loss/train': 1.617121934890747} -11/06/2021 22:46:37 - INFO - __main__ - Step 11029: {'lr': 0.0004954234321365998, 'samples': 2117568, 'steps': 11028, 'loss/train': 2.104278087615967} -11/06/2021 22:46:38 - INFO - __main__ - Step 11030: {'lr': 0.0004954224213251813, 'samples': 2117760, 'steps': 11029, 'loss/train': 1.8662179708480835} -11/06/2021 22:46:39 - INFO - __main__ - Step 11031: {'lr': 0.0004954214104031791, 'samples': 2117952, 'steps': 11030, 'loss/train': 1.559154748916626} -11/06/2021 22:46:39 - INFO - __main__ - Step 11032: {'lr': 0.0004954203993705939, 'samples': 2118144, 'steps': 11031, 'loss/train': 1.7694008350372314} -11/06/2021 22:46:39 - INFO - __main__ - Step 11033: {'lr': 0.0004954193882274261, 'samples': 2118336, 'steps': 11032, 'loss/train': 1.8850313425064087} -11/06/2021 22:46:40 - INFO - __main__ - Step 11034: {'lr': 0.000495418376973676, 'samples': 2118528, 'steps': 11033, 'loss/train': 1.6931498050689697} -11/06/2021 22:46:40 - INFO - __main__ - Step 11035: {'lr': 0.0004954173656093443, 'samples': 2118720, 'steps': 11034, 'loss/train': 1.525468111038208} -11/06/2021 22:46:41 - INFO - __main__ - Step 11036: {'lr': 0.0004954163541344312, 'samples': 2118912, 'steps': 11035, 'loss/train': 1.5203142166137695} -11/06/2021 22:46:41 - INFO - __main__ - Step 11037: {'lr': 0.0004954153425489374, 'samples': 2119104, 'steps': 11036, 'loss/train': 1.7933595180511475} -11/06/2021 22:46:42 - INFO - __main__ - Step 11038: {'lr': 0.0004954143308528631, 'samples': 2119296, 'steps': 11037, 'loss/train': 1.0918980836868286} -11/06/2021 22:46:42 - INFO - __main__ - Step 11039: {'lr': 0.000495413319046209, 'samples': 2119488, 'steps': 11038, 'loss/train': 2.03767728805542} -11/06/2021 22:46:42 - INFO - __main__ - Step 11040: {'lr': 0.0004954123071289754, 'samples': 2119680, 'steps': 11039, 'loss/train': 1.9475619792938232} -11/06/2021 22:46:43 - INFO - __main__ - Step 11041: {'lr': 0.0004954112951011628, 'samples': 2119872, 'steps': 11040, 'loss/train': 1.5636467933654785} -11/06/2021 22:46:44 - INFO - __main__ - Step 11042: {'lr': 0.0004954102829627717, 'samples': 2120064, 'steps': 11041, 'loss/train': 2.0013155937194824} -11/06/2021 22:46:44 - INFO - __main__ - Step 11043: {'lr': 0.0004954092707138024, 'samples': 2120256, 'steps': 11042, 'loss/train': 1.427595853805542} -11/06/2021 22:46:44 - INFO - __main__ - Step 11044: {'lr': 0.0004954082583542557, 'samples': 2120448, 'steps': 11043, 'loss/train': 1.2948354482650757} -11/06/2021 22:46:45 - INFO - __main__ - Step 11045: {'lr': 0.0004954072458841315, 'samples': 2120640, 'steps': 11044, 'loss/train': 1.7006868124008179} -11/06/2021 22:46:46 - INFO - __main__ - Step 11046: {'lr': 0.0004954062333034308, 'samples': 2120832, 'steps': 11045, 'loss/train': 1.9174220561981201} -11/06/2021 22:46:46 - INFO - __main__ - Step 11047: {'lr': 0.0004954052206121538, 'samples': 2121024, 'steps': 11046, 'loss/train': 2.2105274200439453} -11/06/2021 22:46:47 - INFO - __main__ - Step 11048: {'lr': 0.000495404207810301, 'samples': 2121216, 'steps': 11047, 'loss/train': 1.7449531555175781} -11/06/2021 22:46:47 - INFO - __main__ - Step 11049: {'lr': 0.0004954031948978729, 'samples': 2121408, 'steps': 11048, 'loss/train': 1.3999689817428589} -11/06/2021 22:46:47 - INFO - __main__ - Step 11050: {'lr': 0.0004954021818748698, 'samples': 2121600, 'steps': 11049, 'loss/train': 2.2191524505615234} -11/06/2021 22:46:48 - INFO - __main__ - Step 11051: {'lr': 0.0004954011687412923, 'samples': 2121792, 'steps': 11050, 'loss/train': 1.5955177545547485} -11/06/2021 22:46:49 - INFO - __main__ - Step 11052: {'lr': 0.0004954001554971409, 'samples': 2121984, 'steps': 11051, 'loss/train': 1.4700356721878052} -11/06/2021 22:46:49 - INFO - __main__ - Step 11053: {'lr': 0.0004953991421424159, 'samples': 2122176, 'steps': 11052, 'loss/train': 1.7988489866256714} -11/06/2021 22:46:49 - INFO - __main__ - Step 11054: {'lr': 0.0004953981286771178, 'samples': 2122368, 'steps': 11053, 'loss/train': 0.8524397015571594} -11/06/2021 22:46:50 - INFO - __main__ - Step 11055: {'lr': 0.0004953971151012471, 'samples': 2122560, 'steps': 11054, 'loss/train': 1.956466794013977} -11/06/2021 22:46:51 - INFO - __main__ - Step 11056: {'lr': 0.0004953961014148043, 'samples': 2122752, 'steps': 11055, 'loss/train': 1.7897028923034668} -11/06/2021 22:46:51 - INFO - __main__ - Step 11057: {'lr': 0.0004953950876177897, 'samples': 2122944, 'steps': 11056, 'loss/train': 2.5609962940216064} -11/06/2021 22:46:51 - INFO - __main__ - Step 11058: {'lr': 0.000495394073710204, 'samples': 2123136, 'steps': 11057, 'loss/train': 1.6628973484039307} -11/06/2021 22:46:52 - INFO - __main__ - Step 11059: {'lr': 0.0004953930596920474, 'samples': 2123328, 'steps': 11058, 'loss/train': 0.9463735222816467} -11/06/2021 22:46:52 - INFO - __main__ - Step 11060: {'lr': 0.0004953920455633206, 'samples': 2123520, 'steps': 11059, 'loss/train': 1.7199558019638062} -11/06/2021 22:46:53 - INFO - __main__ - Step 11061: {'lr': 0.0004953910313240239, 'samples': 2123712, 'steps': 11060, 'loss/train': 2.0685226917266846} -11/06/2021 22:46:53 - INFO - __main__ - Step 11062: {'lr': 0.0004953900169741577, 'samples': 2123904, 'steps': 11061, 'loss/train': 1.852885127067566} -11/06/2021 22:46:54 - INFO - __main__ - Step 11063: {'lr': 0.0004953890025137226, 'samples': 2124096, 'steps': 11062, 'loss/train': 1.0211209058761597} -11/06/2021 22:46:54 - INFO - __main__ - Step 11064: {'lr': 0.000495387987942719, 'samples': 2124288, 'steps': 11063, 'loss/train': 1.8901044130325317} -11/06/2021 22:46:55 - INFO - __main__ - Step 11065: {'lr': 0.0004953869732611474, 'samples': 2124480, 'steps': 11064, 'loss/train': 1.3837004899978638} -11/06/2021 22:46:56 - INFO - __main__ - Step 11066: {'lr': 0.0004953859584690081, 'samples': 2124672, 'steps': 11065, 'loss/train': 1.3166968822479248} -11/06/2021 22:46:56 - INFO - __main__ - Step 11067: {'lr': 0.0004953849435663018, 'samples': 2124864, 'steps': 11066, 'loss/train': 1.1097654104232788} -11/06/2021 22:46:56 - INFO - __main__ - Step 11068: {'lr': 0.0004953839285530287, 'samples': 2125056, 'steps': 11067, 'loss/train': 1.8698753118515015} -11/06/2021 22:46:57 - INFO - __main__ - Step 11069: {'lr': 0.0004953829134291895, 'samples': 2125248, 'steps': 11068, 'loss/train': 2.0392954349517822} -11/06/2021 22:46:57 - INFO - __main__ - Step 11070: {'lr': 0.0004953818981947845, 'samples': 2125440, 'steps': 11069, 'loss/train': 1.821742057800293} -11/06/2021 22:46:58 - INFO - __main__ - Step 11071: {'lr': 0.0004953808828498142, 'samples': 2125632, 'steps': 11070, 'loss/train': 1.4613873958587646} -11/06/2021 22:46:58 - INFO - __main__ - Step 11072: {'lr': 0.0004953798673942791, 'samples': 2125824, 'steps': 11071, 'loss/train': 1.947845220565796} -11/06/2021 22:46:59 - INFO - __main__ - Step 11073: {'lr': 0.0004953788518281796, 'samples': 2126016, 'steps': 11072, 'loss/train': 2.3288230895996094} -11/06/2021 22:46:59 - INFO - __main__ - Step 11074: {'lr': 0.0004953778361515163, 'samples': 2126208, 'steps': 11073, 'loss/train': 1.7177420854568481} -11/06/2021 22:46:59 - INFO - __main__ - Step 11075: {'lr': 0.0004953768203642893, 'samples': 2126400, 'steps': 11074, 'loss/train': 1.5442180633544922} -11/06/2021 22:47:00 - INFO - __main__ - Step 11076: {'lr': 0.0004953758044664994, 'samples': 2126592, 'steps': 11075, 'loss/train': 2.2615766525268555} -11/06/2021 22:47:01 - INFO - __main__ - Step 11077: {'lr': 0.0004953747884581469, 'samples': 2126784, 'steps': 11076, 'loss/train': 2.156431198120117} -11/06/2021 22:47:01 - INFO - __main__ - Step 11078: {'lr': 0.0004953737723392324, 'samples': 2126976, 'steps': 11077, 'loss/train': 2.2842390537261963} -11/06/2021 22:47:01 - INFO - __main__ - Step 11079: {'lr': 0.0004953727561097562, 'samples': 2127168, 'steps': 11078, 'loss/train': 1.461220383644104} -11/06/2021 22:47:02 - INFO - __main__ - Step 11080: {'lr': 0.0004953717397697189, 'samples': 2127360, 'steps': 11079, 'loss/train': 1.6877996921539307} -11/06/2021 22:47:02 - INFO - __main__ - Step 11081: {'lr': 0.0004953707233191207, 'samples': 2127552, 'steps': 11080, 'loss/train': 1.1885510683059692} -11/06/2021 22:47:03 - INFO - __main__ - Step 11082: {'lr': 0.0004953697067579624, 'samples': 2127744, 'steps': 11081, 'loss/train': 1.5058166980743408} -11/06/2021 22:47:03 - INFO - __main__ - Step 11083: {'lr': 0.0004953686900862442, 'samples': 2127936, 'steps': 11082, 'loss/train': 1.6675527095794678} -11/06/2021 22:47:04 - INFO - __main__ - Step 11084: {'lr': 0.0004953676733039668, 'samples': 2128128, 'steps': 11083, 'loss/train': 1.9385559558868408} -11/06/2021 22:47:04 - INFO - __main__ - Step 11085: {'lr': 0.0004953666564111303, 'samples': 2128320, 'steps': 11084, 'loss/train': 1.6214722394943237} -11/06/2021 22:47:05 - INFO - __main__ - Step 11086: {'lr': 0.0004953656394077355, 'samples': 2128512, 'steps': 11085, 'loss/train': 1.1860450506210327} -11/06/2021 22:47:06 - INFO - __main__ - Step 11087: {'lr': 0.0004953646222937828, 'samples': 2128704, 'steps': 11086, 'loss/train': 1.8663421869277954} -11/06/2021 22:47:06 - INFO - __main__ - Step 11088: {'lr': 0.0004953636050692724, 'samples': 2128896, 'steps': 11087, 'loss/train': 1.5686103105545044} -11/06/2021 22:47:06 - INFO - __main__ - Step 11089: {'lr': 0.0004953625877342051, 'samples': 2129088, 'steps': 11088, 'loss/train': 1.8276753425598145} -11/06/2021 22:47:07 - INFO - __main__ - Step 11090: {'lr': 0.0004953615702885812, 'samples': 2129280, 'steps': 11089, 'loss/train': 1.5646089315414429} -11/06/2021 22:47:07 - INFO - __main__ - Step 11091: {'lr': 0.0004953605527324011, 'samples': 2129472, 'steps': 11090, 'loss/train': 1.7502714395523071} -11/06/2021 22:47:08 - INFO - __main__ - Step 11092: {'lr': 0.0004953595350656653, 'samples': 2129664, 'steps': 11091, 'loss/train': 1.3079643249511719} -11/06/2021 22:47:08 - INFO - __main__ - Step 11093: {'lr': 0.0004953585172883743, 'samples': 2129856, 'steps': 11092, 'loss/train': 1.8320194482803345} -11/06/2021 22:47:09 - INFO - __main__ - Step 11094: {'lr': 0.0004953574994005286, 'samples': 2130048, 'steps': 11093, 'loss/train': 1.7098597288131714} -11/06/2021 22:47:09 - INFO - __main__ - Step 11095: {'lr': 0.0004953564814021285, 'samples': 2130240, 'steps': 11094, 'loss/train': 1.9974864721298218} -11/06/2021 22:47:09 - INFO - __main__ - Step 11096: {'lr': 0.0004953554632931746, 'samples': 2130432, 'steps': 11095, 'loss/train': 1.8548189401626587} -11/06/2021 22:47:10 - INFO - __main__ - Step 11097: {'lr': 0.0004953544450736674, 'samples': 2130624, 'steps': 11096, 'loss/train': 1.8645987510681152} -11/06/2021 22:47:11 - INFO - __main__ - Step 11098: {'lr': 0.0004953534267436072, 'samples': 2130816, 'steps': 11097, 'loss/train': 2.160127878189087} -11/06/2021 22:47:11 - INFO - __main__ - Step 11099: {'lr': 0.0004953524083029945, 'samples': 2131008, 'steps': 11098, 'loss/train': 2.143897533416748} -11/06/2021 22:47:11 - INFO - __main__ - Step 11100: {'lr': 0.0004953513897518298, 'samples': 2131200, 'steps': 11099, 'loss/train': 1.7265970706939697} -11/06/2021 22:47:12 - INFO - __main__ - Step 11101: {'lr': 0.0004953503710901136, 'samples': 2131392, 'steps': 11100, 'loss/train': 1.6248968839645386} -11/06/2021 22:47:13 - INFO - __main__ - Step 11102: {'lr': 0.0004953493523178463, 'samples': 2131584, 'steps': 11101, 'loss/train': 1.7727121114730835} -11/06/2021 22:47:13 - INFO - __main__ - Step 11103: {'lr': 0.0004953483334350283, 'samples': 2131776, 'steps': 11102, 'loss/train': 1.5690078735351562} -11/06/2021 22:47:13 - INFO - __main__ - Step 11104: {'lr': 0.0004953473144416602, 'samples': 2131968, 'steps': 11103, 'loss/train': 1.7810686826705933} -11/06/2021 22:47:14 - INFO - __main__ - Step 11105: {'lr': 0.0004953462953377424, 'samples': 2132160, 'steps': 11104, 'loss/train': 1.8869816064834595} -11/06/2021 22:47:14 - INFO - __main__ - Step 11106: {'lr': 0.0004953452761232753, 'samples': 2132352, 'steps': 11105, 'loss/train': 2.1093719005584717} -11/06/2021 22:47:15 - INFO - __main__ - Step 11107: {'lr': 0.0004953442567982593, 'samples': 2132544, 'steps': 11106, 'loss/train': 1.606833815574646} -11/06/2021 22:47:15 - INFO - __main__ - Step 11108: {'lr': 0.0004953432373626951, 'samples': 2132736, 'steps': 11107, 'loss/train': 1.9414929151535034} -11/06/2021 22:47:16 - INFO - __main__ - Step 11109: {'lr': 0.0004953422178165831, 'samples': 2132928, 'steps': 11108, 'loss/train': 1.8882904052734375} -11/06/2021 22:47:16 - INFO - __main__ - Step 11110: {'lr': 0.0004953411981599235, 'samples': 2133120, 'steps': 11109, 'loss/train': 1.7762526273727417} -11/06/2021 22:47:17 - INFO - __main__ - Step 11111: {'lr': 0.0004953401783927171, 'samples': 2133312, 'steps': 11110, 'loss/train': 1.9979164600372314} -11/06/2021 22:47:17 - INFO - __main__ - Step 11112: {'lr': 0.000495339158514964, 'samples': 2133504, 'steps': 11111, 'loss/train': 1.818439245223999} -11/06/2021 22:47:18 - INFO - __main__ - Step 11113: {'lr': 0.0004953381385266651, 'samples': 2133696, 'steps': 11112, 'loss/train': 1.8462194204330444} -11/06/2021 22:47:18 - INFO - __main__ - Step 11114: {'lr': 0.0004953371184278205, 'samples': 2133888, 'steps': 11113, 'loss/train': 1.7984886169433594} -11/06/2021 22:47:19 - INFO - __main__ - Step 11115: {'lr': 0.0004953360982184308, 'samples': 2134080, 'steps': 11114, 'loss/train': 2.2713496685028076} -11/06/2021 22:47:19 - INFO - __main__ - Step 11116: {'lr': 0.0004953350778984963, 'samples': 2134272, 'steps': 11115, 'loss/train': 1.8427363634109497} -11/06/2021 22:47:19 - INFO - __main__ - Step 11117: {'lr': 0.0004953340574680177, 'samples': 2134464, 'steps': 11116, 'loss/train': 1.2288328409194946} -11/06/2021 22:47:20 - INFO - __main__ - Step 11118: {'lr': 0.0004953330369269955, 'samples': 2134656, 'steps': 11117, 'loss/train': 1.9006093740463257} -11/06/2021 22:47:21 - INFO - __main__ - Step 11119: {'lr': 0.0004953320162754298, 'samples': 2134848, 'steps': 11118, 'loss/train': 1.618245244026184} -11/06/2021 22:47:21 - INFO - __main__ - Step 11120: {'lr': 0.0004953309955133214, 'samples': 2135040, 'steps': 11119, 'loss/train': 1.8152966499328613} -11/06/2021 22:47:22 - INFO - __main__ - Step 11121: {'lr': 0.0004953299746406707, 'samples': 2135232, 'steps': 11120, 'loss/train': 1.3982417583465576} -11/06/2021 22:47:22 - INFO - __main__ - Step 11122: {'lr': 0.000495328953657478, 'samples': 2135424, 'steps': 11121, 'loss/train': 1.8065004348754883} -11/06/2021 22:47:23 - INFO - __main__ - Step 11123: {'lr': 0.0004953279325637438, 'samples': 2135616, 'steps': 11122, 'loss/train': 1.807936191558838} -11/06/2021 22:47:23 - INFO - __main__ - Step 11124: {'lr': 0.0004953269113594687, 'samples': 2135808, 'steps': 11123, 'loss/train': 1.684847116470337} -11/06/2021 22:47:24 - INFO - __main__ - Step 11125: {'lr': 0.0004953258900446531, 'samples': 2136000, 'steps': 11124, 'loss/train': 1.3972996473312378} -11/06/2021 22:47:24 - INFO - __main__ - Step 11126: {'lr': 0.0004953248686192975, 'samples': 2136192, 'steps': 11125, 'loss/train': 1.6219148635864258} -11/06/2021 22:47:24 - INFO - __main__ - Step 11127: {'lr': 0.0004953238470834022, 'samples': 2136384, 'steps': 11126, 'loss/train': 0.5669246912002563} -11/06/2021 22:47:25 - INFO - __main__ - Step 11128: {'lr': 0.0004953228254369677, 'samples': 2136576, 'steps': 11127, 'loss/train': 1.5386314392089844} -11/06/2021 22:47:26 - INFO - __main__ - Step 11129: {'lr': 0.0004953218036799946, 'samples': 2136768, 'steps': 11128, 'loss/train': 1.7558674812316895} -11/06/2021 22:47:26 - INFO - __main__ - Step 11130: {'lr': 0.0004953207818124833, 'samples': 2136960, 'steps': 11129, 'loss/train': 1.2307705879211426} -11/06/2021 22:47:26 - INFO - __main__ - Step 11131: {'lr': 0.0004953197598344342, 'samples': 2137152, 'steps': 11130, 'loss/train': 2.116920232772827} -11/06/2021 22:47:27 - INFO - __main__ - Step 11132: {'lr': 0.0004953187377458478, 'samples': 2137344, 'steps': 11131, 'loss/train': 2.0362181663513184} -11/06/2021 22:47:28 - INFO - __main__ - Step 11133: {'lr': 0.0004953177155467246, 'samples': 2137536, 'steps': 11132, 'loss/train': 1.7032719850540161} -11/06/2021 22:47:28 - INFO - __main__ - Step 11134: {'lr': 0.0004953166932370651, 'samples': 2137728, 'steps': 11133, 'loss/train': 1.8138678073883057} -11/06/2021 22:47:28 - INFO - __main__ - Step 11135: {'lr': 0.0004953156708168695, 'samples': 2137920, 'steps': 11134, 'loss/train': 1.8151832818984985} -11/06/2021 22:47:29 - INFO - __main__ - Step 11136: {'lr': 0.0004953146482861385, 'samples': 2138112, 'steps': 11135, 'loss/train': 1.7565672397613525} -11/06/2021 22:47:29 - INFO - __main__ - Step 11137: {'lr': 0.0004953136256448725, 'samples': 2138304, 'steps': 11136, 'loss/train': 1.687888741493225} -11/06/2021 22:47:29 - INFO - __main__ - Step 11138: {'lr': 0.0004953126028930721, 'samples': 2138496, 'steps': 11137, 'loss/train': 1.2880886793136597} -11/06/2021 22:47:31 - INFO - __main__ - Step 11139: {'lr': 0.0004953115800307375, 'samples': 2138688, 'steps': 11138, 'loss/train': 1.8301455974578857} -11/06/2021 22:47:31 - INFO - __main__ - Step 11140: {'lr': 0.0004953105570578693, 'samples': 2138880, 'steps': 11139, 'loss/train': 1.5267943143844604} -11/06/2021 22:47:31 - INFO - __main__ - Step 11141: {'lr': 0.000495309533974468, 'samples': 2139072, 'steps': 11140, 'loss/train': 1.7597218751907349} -11/06/2021 22:47:32 - INFO - __main__ - Step 11142: {'lr': 0.0004953085107805339, 'samples': 2139264, 'steps': 11141, 'loss/train': 0.6988817453384399} -11/06/2021 22:47:32 - INFO - __main__ - Step 11143: {'lr': 0.0004953074874760677, 'samples': 2139456, 'steps': 11142, 'loss/train': 1.4152743816375732} -11/06/2021 22:47:33 - INFO - __main__ - Step 11144: {'lr': 0.0004953064640610697, 'samples': 2139648, 'steps': 11143, 'loss/train': 1.5432703495025635} -11/06/2021 22:47:33 - INFO - __main__ - Step 11145: {'lr': 0.0004953054405355404, 'samples': 2139840, 'steps': 11144, 'loss/train': 2.103456735610962} -11/06/2021 22:47:34 - INFO - __main__ - Step 11146: {'lr': 0.0004953044168994802, 'samples': 2140032, 'steps': 11145, 'loss/train': 1.8357820510864258} -11/06/2021 22:47:34 - INFO - __main__ - Step 11147: {'lr': 0.0004953033931528897, 'samples': 2140224, 'steps': 11146, 'loss/train': 1.426553726196289} -11/06/2021 22:47:34 - INFO - __main__ - Step 11148: {'lr': 0.0004953023692957691, 'samples': 2140416, 'steps': 11147, 'loss/train': 0.9832262992858887} -11/06/2021 22:47:35 - INFO - __main__ - Step 11149: {'lr': 0.0004953013453281193, 'samples': 2140608, 'steps': 11148, 'loss/train': 2.1371872425079346} -11/06/2021 22:47:36 - INFO - __main__ - Step 11150: {'lr': 0.0004953003212499403, 'samples': 2140800, 'steps': 11149, 'loss/train': 2.0583853721618652} -11/06/2021 22:47:36 - INFO - __main__ - Step 11151: {'lr': 0.0004952992970612328, 'samples': 2140992, 'steps': 11150, 'loss/train': 1.6691161394119263} -11/06/2021 22:47:36 - INFO - __main__ - Step 11152: {'lr': 0.0004952982727619973, 'samples': 2141184, 'steps': 11151, 'loss/train': 1.672674298286438} -11/06/2021 22:47:37 - INFO - __main__ - Step 11153: {'lr': 0.000495297248352234, 'samples': 2141376, 'steps': 11152, 'loss/train': 0.8161516785621643} -11/06/2021 22:47:38 - INFO - __main__ - Step 11154: {'lr': 0.0004952962238319436, 'samples': 2141568, 'steps': 11153, 'loss/train': 1.0644028186798096} -11/06/2021 22:47:38 - INFO - __main__ - Step 11155: {'lr': 0.0004952951992011266, 'samples': 2141760, 'steps': 11154, 'loss/train': 1.5536161661148071} -11/06/2021 22:47:39 - INFO - __main__ - Step 11156: {'lr': 0.0004952941744597834, 'samples': 2141952, 'steps': 11155, 'loss/train': 1.6991686820983887} -11/06/2021 22:47:39 - INFO - __main__ - Step 11157: {'lr': 0.0004952931496079143, 'samples': 2142144, 'steps': 11156, 'loss/train': 1.9701721668243408} -11/06/2021 22:47:39 - INFO - __main__ - Step 11158: {'lr': 0.00049529212464552, 'samples': 2142336, 'steps': 11157, 'loss/train': 1.5034873485565186} -11/06/2021 22:47:40 - INFO - __main__ - Step 11159: {'lr': 0.0004952910995726008, 'samples': 2142528, 'steps': 11158, 'loss/train': 1.8932499885559082} -11/06/2021 22:47:41 - INFO - __main__ - Step 11160: {'lr': 0.0004952900743891573, 'samples': 2142720, 'steps': 11159, 'loss/train': 1.5492379665374756} -11/06/2021 22:47:41 - INFO - __main__ - Step 11161: {'lr': 0.0004952890490951898, 'samples': 2142912, 'steps': 11160, 'loss/train': 1.9090741872787476} -11/06/2021 22:47:41 - INFO - __main__ - Step 11162: {'lr': 0.0004952880236906988, 'samples': 2143104, 'steps': 11161, 'loss/train': 1.2465680837631226} -11/06/2021 22:47:42 - INFO - __main__ - Step 11163: {'lr': 0.0004952869981756848, 'samples': 2143296, 'steps': 11162, 'loss/train': 1.629738450050354} -11/06/2021 22:47:42 - INFO - __main__ - Step 11164: {'lr': 0.0004952859725501484, 'samples': 2143488, 'steps': 11163, 'loss/train': 1.934152364730835} -11/06/2021 22:47:43 - INFO - __main__ - Step 11165: {'lr': 0.0004952849468140898, 'samples': 2143680, 'steps': 11164, 'loss/train': 1.5853830575942993} -11/06/2021 22:47:43 - INFO - __main__ - Step 11166: {'lr': 0.0004952839209675096, 'samples': 2143872, 'steps': 11165, 'loss/train': 1.383769154548645} -11/06/2021 22:47:44 - INFO - __main__ - Step 11167: {'lr': 0.0004952828950104083, 'samples': 2144064, 'steps': 11166, 'loss/train': 1.3340117931365967} -11/06/2021 22:47:44 - INFO - __main__ - Step 11168: {'lr': 0.0004952818689427863, 'samples': 2144256, 'steps': 11167, 'loss/train': 1.787481665611267} -11/06/2021 22:47:44 - INFO - __main__ - Step 11169: {'lr': 0.0004952808427646441, 'samples': 2144448, 'steps': 11168, 'loss/train': 1.6143748760223389} -11/06/2021 22:47:45 - INFO - __main__ - Step 11170: {'lr': 0.000495279816475982, 'samples': 2144640, 'steps': 11169, 'loss/train': 1.741720199584961} -11/06/2021 22:47:46 - INFO - __main__ - Step 11171: {'lr': 0.0004952787900768008, 'samples': 2144832, 'steps': 11170, 'loss/train': 1.8251887559890747} -11/06/2021 22:47:46 - INFO - __main__ - Step 11172: {'lr': 0.0004952777635671006, 'samples': 2145024, 'steps': 11171, 'loss/train': 2.326918125152588} -11/06/2021 22:47:46 - INFO - __main__ - Step 11173: {'lr': 0.0004952767369468821, 'samples': 2145216, 'steps': 11172, 'loss/train': 1.6599018573760986} -11/06/2021 22:47:47 - INFO - __main__ - Step 11174: {'lr': 0.0004952757102161457, 'samples': 2145408, 'steps': 11173, 'loss/train': 1.3439342975616455} -11/06/2021 22:47:48 - INFO - __main__ - Step 11175: {'lr': 0.0004952746833748918, 'samples': 2145600, 'steps': 11174, 'loss/train': 1.5779838562011719} -11/06/2021 22:47:48 - INFO - __main__ - Step 11176: {'lr': 0.0004952736564231209, 'samples': 2145792, 'steps': 11175, 'loss/train': 1.711625099182129} -11/06/2021 22:47:49 - INFO - __main__ - Step 11177: {'lr': 0.0004952726293608335, 'samples': 2145984, 'steps': 11176, 'loss/train': 1.7261056900024414} -11/06/2021 22:47:49 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 2.207341194152832} -11/06/2021 22:47:49 - INFO - __main__ - Step 11179: {'lr': 0.0004952705749047111, 'samples': 2146368, 'steps': 11178, 'loss/train': 1.6642247438430786} -11/06/2021 22:47:50 - INFO - __main__ - Step 11180: {'lr': 0.0004952695475108768, 'samples': 2146560, 'steps': 11179, 'loss/train': 1.309320092201233} -11/06/2021 22:47:51 - INFO - __main__ - Step 11181: {'lr': 0.000495268520006528, 'samples': 2146752, 'steps': 11180, 'loss/train': 1.2601646184921265} -11/06/2021 22:47:51 - INFO - __main__ - Step 11182: {'lr': 0.000495267492391665, 'samples': 2146944, 'steps': 11181, 'loss/train': 1.730563759803772} -11/06/2021 22:47:52 - INFO - __main__ - Step 11183: {'lr': 0.0004952664646662882, 'samples': 2147136, 'steps': 11182, 'loss/train': 1.8496640920639038} -11/06/2021 22:47:52 - INFO - __main__ - Step 11184: {'lr': 0.000495265436830398, 'samples': 2147328, 'steps': 11183, 'loss/train': 1.282710075378418} -11/06/2021 22:47:52 - INFO - __main__ - Step 11185: {'lr': 0.0004952644088839951, 'samples': 2147520, 'steps': 11184, 'loss/train': 0.9519102573394775} -11/06/2021 22:47:54 - INFO - __main__ - Step 11186: {'lr': 0.0004952633808270797, 'samples': 2147712, 'steps': 11185, 'loss/train': 2.1716973781585693} -11/06/2021 22:47:54 - INFO - __main__ - Step 11187: {'lr': 0.0004952623526596526, 'samples': 2147904, 'steps': 11186, 'loss/train': 1.5648038387298584} -11/06/2021 22:47:54 - INFO - __main__ - Step 11188: {'lr': 0.000495261324381714, 'samples': 2148096, 'steps': 11187, 'loss/train': 1.8554600477218628} -11/06/2021 22:47:55 - INFO - __main__ - Step 11189: {'lr': 0.0004952602959932644, 'samples': 2148288, 'steps': 11188, 'loss/train': 0.2998165488243103} -11/06/2021 22:47:55 - INFO - __main__ - Step 11190: {'lr': 0.0004952592674943043, 'samples': 2148480, 'steps': 11189, 'loss/train': 1.513887882232666} -11/06/2021 22:47:56 - INFO - __main__ - Step 11191: {'lr': 0.0004952582388848343, 'samples': 2148672, 'steps': 11190, 'loss/train': 1.61158287525177} -11/06/2021 22:47:56 - INFO - __main__ - Step 11192: {'lr': 0.0004952572101648545, 'samples': 2148864, 'steps': 11191, 'loss/train': 1.4567087888717651} -11/06/2021 22:47:57 - INFO - __main__ - Step 11193: {'lr': 0.0004952561813343657, 'samples': 2149056, 'steps': 11192, 'loss/train': 1.598156452178955} -11/06/2021 22:47:57 - INFO - __main__ - Step 11194: {'lr': 0.0004952551523933682, 'samples': 2149248, 'steps': 11193, 'loss/train': 2.243593692779541} -11/06/2021 22:47:58 - INFO - __main__ - Step 11195: {'lr': 0.0004952541233418626, 'samples': 2149440, 'steps': 11194, 'loss/train': 1.6861417293548584} -11/06/2021 22:47:59 - INFO - __main__ - Step 11196: {'lr': 0.0004952530941798492, 'samples': 2149632, 'steps': 11195, 'loss/train': 1.3837568759918213} -11/06/2021 22:47:59 - INFO - __main__ - Step 11197: {'lr': 0.0004952520649073286, 'samples': 2149824, 'steps': 11196, 'loss/train': 1.8483117818832397} -11/06/2021 22:47:59 - INFO - __main__ - Step 11198: {'lr': 0.0004952510355243012, 'samples': 2150016, 'steps': 11197, 'loss/train': 1.94416081905365} -11/06/2021 22:48:00 - INFO - __main__ - Step 11199: {'lr': 0.0004952500060307674, 'samples': 2150208, 'steps': 11198, 'loss/train': 1.9236924648284912} -11/06/2021 22:48:00 - INFO - __main__ - Step 11200: {'lr': 0.0004952489764267278, 'samples': 2150400, 'steps': 11199, 'loss/train': 2.271418333053589} -11/06/2021 22:48:01 - INFO - __main__ - Step 11201: {'lr': 0.0004952479467121827, 'samples': 2150592, 'steps': 11200, 'loss/train': 1.6901092529296875} -11/06/2021 22:48:01 - INFO - __main__ - Step 11202: {'lr': 0.0004952469168871327, 'samples': 2150784, 'steps': 11201, 'loss/train': 1.9666694402694702} -11/06/2021 22:48:02 - INFO - __main__ - Step 11203: {'lr': 0.0004952458869515782, 'samples': 2150976, 'steps': 11202, 'loss/train': 1.9771145582199097} -11/06/2021 22:48:02 - INFO - __main__ - Step 11204: {'lr': 0.0004952448569055198, 'samples': 2151168, 'steps': 11203, 'loss/train': 1.4397884607315063} -11/06/2021 22:48:02 - INFO - __main__ - Step 11205: {'lr': 0.0004952438267489578, 'samples': 2151360, 'steps': 11204, 'loss/train': 1.73050856590271} -11/06/2021 22:48:03 - INFO - __main__ - Step 11206: {'lr': 0.0004952427964818927, 'samples': 2151552, 'steps': 11205, 'loss/train': 1.7064839601516724} -11/06/2021 22:48:04 - INFO - __main__ - Step 11207: {'lr': 0.0004952417661043249, 'samples': 2151744, 'steps': 11206, 'loss/train': 1.7774326801300049} -11/06/2021 22:48:04 - INFO - __main__ - Step 11208: {'lr': 0.0004952407356162551, 'samples': 2151936, 'steps': 11207, 'loss/train': 1.5006650686264038} -11/06/2021 22:48:04 - INFO - __main__ - Step 11209: {'lr': 0.0004952397050176835, 'samples': 2152128, 'steps': 11208, 'loss/train': 1.9831914901733398} -11/06/2021 22:48:05 - INFO - __main__ - Step 11210: {'lr': 0.0004952386743086107, 'samples': 2152320, 'steps': 11209, 'loss/train': 1.5023480653762817} -11/06/2021 22:48:05 - INFO - __main__ - Step 11211: {'lr': 0.0004952376434890372, 'samples': 2152512, 'steps': 11210, 'loss/train': 1.4154393672943115} -11/06/2021 22:48:06 - INFO - __main__ - Step 11212: {'lr': 0.0004952366125589633, 'samples': 2152704, 'steps': 11211, 'loss/train': 1.498394250869751} -11/06/2021 22:48:07 - INFO - __main__ - Step 11213: {'lr': 0.0004952355815183897, 'samples': 2152896, 'steps': 11212, 'loss/train': 1.85457444190979} -11/06/2021 22:48:07 - INFO - __main__ - Step 11214: {'lr': 0.0004952345503673166, 'samples': 2153088, 'steps': 11213, 'loss/train': 1.908733606338501} -11/06/2021 22:48:07 - INFO - __main__ - Step 11215: {'lr': 0.0004952335191057447, 'samples': 2153280, 'steps': 11214, 'loss/train': 1.707075834274292} -11/06/2021 22:48:08 - INFO - __main__ - Step 11216: {'lr': 0.0004952324877336743, 'samples': 2153472, 'steps': 11215, 'loss/train': 1.5228673219680786} -11/06/2021 22:48:09 - INFO - __main__ - Step 11217: {'lr': 0.0004952314562511059, 'samples': 2153664, 'steps': 11216, 'loss/train': 2.17525053024292} -11/06/2021 22:48:09 - INFO - __main__ - Step 11218: {'lr': 0.00049523042465804, 'samples': 2153856, 'steps': 11217, 'loss/train': 1.8961803913116455} -11/06/2021 22:48:09 - INFO - __main__ - Step 11219: {'lr': 0.0004952293929544771, 'samples': 2154048, 'steps': 11218, 'loss/train': 1.9099823236465454} -11/06/2021 22:48:10 - INFO - __main__ - Step 11220: {'lr': 0.0004952283611404176, 'samples': 2154240, 'steps': 11219, 'loss/train': 1.5863221883773804} -11/06/2021 22:48:10 - INFO - __main__ - Step 11221: {'lr': 0.0004952273292158619, 'samples': 2154432, 'steps': 11220, 'loss/train': 1.5212019681930542} -11/06/2021 22:48:11 - INFO - __main__ - Step 11222: {'lr': 0.0004952262971808106, 'samples': 2154624, 'steps': 11221, 'loss/train': 1.0951485633850098} -11/06/2021 22:48:11 - INFO - __main__ - Step 11223: {'lr': 0.0004952252650352642, 'samples': 2154816, 'steps': 11222, 'loss/train': 1.8635188341140747} -11/06/2021 22:48:12 - INFO - __main__ - Step 11224: {'lr': 0.000495224232779223, 'samples': 2155008, 'steps': 11223, 'loss/train': 1.7595049142837524} -11/06/2021 22:48:12 - INFO - __main__ - Step 11225: {'lr': 0.0004952232004126876, 'samples': 2155200, 'steps': 11224, 'loss/train': 1.5507785081863403} -11/06/2021 22:48:12 - INFO - __main__ - Step 11226: {'lr': 0.0004952221679356583, 'samples': 2155392, 'steps': 11225, 'loss/train': 1.63408625125885} -11/06/2021 22:48:13 - INFO - __main__ - Step 11227: {'lr': 0.0004952211353481358, 'samples': 2155584, 'steps': 11226, 'loss/train': 1.6727948188781738} -11/06/2021 22:48:14 - INFO - __main__ - Step 11228: {'lr': 0.0004952201026501204, 'samples': 2155776, 'steps': 11227, 'loss/train': 1.2963249683380127} -11/06/2021 22:48:14 - INFO - __main__ - Step 11229: {'lr': 0.0004952190698416126, 'samples': 2155968, 'steps': 11228, 'loss/train': 1.5582791566848755} -11/06/2021 22:48:14 - INFO - __main__ - Step 11230: {'lr': 0.0004952180369226129, 'samples': 2156160, 'steps': 11229, 'loss/train': 2.1736087799072266} -11/06/2021 22:48:15 - INFO - __main__ - Step 11231: {'lr': 0.0004952170038931217, 'samples': 2156352, 'steps': 11230, 'loss/train': 1.376936912536621} -11/06/2021 22:48:15 - INFO - __main__ - Step 11232: {'lr': 0.0004952159707531395, 'samples': 2156544, 'steps': 11231, 'loss/train': 1.1369280815124512} -11/06/2021 22:48:17 - INFO - __main__ - Step 11233: {'lr': 0.0004952149375026668, 'samples': 2156736, 'steps': 11232, 'loss/train': 1.7504469156265259} -11/06/2021 22:48:17 - INFO - __main__ - Step 11234: {'lr': 0.000495213904141704, 'samples': 2156928, 'steps': 11233, 'loss/train': 1.4631931781768799} -11/06/2021 22:48:17 - INFO - __main__ - Step 11235: {'lr': 0.0004952128706702516, 'samples': 2157120, 'steps': 11234, 'loss/train': 2.062126636505127} -11/06/2021 22:48:18 - INFO - __main__ - Step 11236: {'lr': 0.0004952118370883101, 'samples': 2157312, 'steps': 11235, 'loss/train': 2.1615216732025146} -11/06/2021 22:48:18 - INFO - __main__ - Step 11237: {'lr': 0.0004952108033958798, 'samples': 2157504, 'steps': 11236, 'loss/train': 2.1354172229766846} -11/06/2021 22:48:19 - INFO - __main__ - Step 11238: {'lr': 0.0004952097695929614, 'samples': 2157696, 'steps': 11237, 'loss/train': 1.028824806213379} -11/06/2021 22:48:19 - INFO - __main__ - Step 11239: {'lr': 0.0004952087356795553, 'samples': 2157888, 'steps': 11238, 'loss/train': 1.6951218843460083} -11/06/2021 22:48:20 - INFO - __main__ - Step 11240: {'lr': 0.0004952077016556619, 'samples': 2158080, 'steps': 11239, 'loss/train': 1.766661524772644} -11/06/2021 22:48:20 - INFO - __main__ - Step 11241: {'lr': 0.0004952066675212816, 'samples': 2158272, 'steps': 11240, 'loss/train': 1.3343703746795654} -11/06/2021 22:48:20 - INFO - __main__ - Step 11242: {'lr': 0.0004952056332764151, 'samples': 2158464, 'steps': 11241, 'loss/train': 1.303107500076294} -11/06/2021 22:48:21 - INFO - __main__ - Step 11243: {'lr': 0.0004952045989210627, 'samples': 2158656, 'steps': 11242, 'loss/train': 1.767581820487976} -11/06/2021 22:48:22 - INFO - __main__ - Step 11244: {'lr': 0.0004952035644552249, 'samples': 2158848, 'steps': 11243, 'loss/train': 1.4197368621826172} -11/06/2021 22:48:22 - INFO - __main__ - Step 11245: {'lr': 0.000495202529878902, 'samples': 2159040, 'steps': 11244, 'loss/train': 1.4061685800552368} -11/06/2021 22:48:22 - INFO - __main__ - Step 11246: {'lr': 0.0004952014951920948, 'samples': 2159232, 'steps': 11245, 'loss/train': 2.45194673538208} -11/06/2021 22:48:23 - INFO - __main__ - Step 11247: {'lr': 0.0004952004603948034, 'samples': 2159424, 'steps': 11246, 'loss/train': 2.113942861557007} -11/06/2021 22:48:24 - INFO - __main__ - Step 11248: {'lr': 0.0004951994254870286, 'samples': 2159616, 'steps': 11247, 'loss/train': 1.3976362943649292} -11/06/2021 22:48:24 - INFO - __main__ - Step 11249: {'lr': 0.0004951983904687708, 'samples': 2159808, 'steps': 11248, 'loss/train': 1.9836783409118652} -11/06/2021 22:48:24 - INFO - __main__ - Step 11250: {'lr': 0.0004951973553400303, 'samples': 2160000, 'steps': 11249, 'loss/train': 2.1718714237213135} -11/06/2021 22:48:25 - INFO - __main__ - Step 11251: {'lr': 0.0004951963201008077, 'samples': 2160192, 'steps': 11250, 'loss/train': 1.9737859964370728} -11/06/2021 22:48:25 - INFO - __main__ - Step 11252: {'lr': 0.0004951952847511033, 'samples': 2160384, 'steps': 11251, 'loss/train': 1.3120644092559814} -11/06/2021 22:48:25 - INFO - __main__ - Step 11253: {'lr': 0.0004951942492909177, 'samples': 2160576, 'steps': 11252, 'loss/train': 1.7218273878097534} -11/06/2021 22:48:26 - INFO - __main__ - Step 11254: {'lr': 0.0004951932137202515, 'samples': 2160768, 'steps': 11253, 'loss/train': 1.8016955852508545} -11/06/2021 22:48:27 - INFO - __main__ - Step 11255: {'lr': 0.0004951921780391049, 'samples': 2160960, 'steps': 11254, 'loss/train': 1.4004523754119873} -11/06/2021 22:48:27 - INFO - __main__ - Step 11256: {'lr': 0.0004951911422474785, 'samples': 2161152, 'steps': 11255, 'loss/train': 1.1996997594833374} -11/06/2021 22:48:28 - INFO - __main__ - Step 11257: {'lr': 0.0004951901063453728, 'samples': 2161344, 'steps': 11256, 'loss/train': 1.6938501596450806} -11/06/2021 22:48:28 - INFO - __main__ - Step 11258: {'lr': 0.0004951890703327883, 'samples': 2161536, 'steps': 11257, 'loss/train': 1.6818426847457886} -11/06/2021 22:48:29 - INFO - __main__ - Step 11259: {'lr': 0.0004951880342097251, 'samples': 2161728, 'steps': 11258, 'loss/train': 1.2888652086257935} -11/06/2021 22:48:29 - INFO - __main__ - Step 11260: {'lr': 0.0004951869979761842, 'samples': 2161920, 'steps': 11259, 'loss/train': 1.692081332206726} -11/06/2021 22:48:30 - INFO - __main__ - Step 11261: {'lr': 0.0004951859616321658, 'samples': 2162112, 'steps': 11260, 'loss/train': 1.8977314233779907} -11/06/2021 22:48:30 - INFO - __main__ - Step 11262: {'lr': 0.0004951849251776703, 'samples': 2162304, 'steps': 11261, 'loss/train': 3.5356547832489014} -11/06/2021 22:48:30 - INFO - __main__ - Step 11263: {'lr': 0.0004951838886126983, 'samples': 2162496, 'steps': 11262, 'loss/train': 1.3212937116622925} -11/06/2021 22:48:31 - INFO - __main__ - Step 11264: {'lr': 0.0004951828519372503, 'samples': 2162688, 'steps': 11263, 'loss/train': 1.470284104347229} -11/06/2021 22:48:32 - INFO - __main__ - Step 11265: {'lr': 0.0004951818151513267, 'samples': 2162880, 'steps': 11264, 'loss/train': 1.6359577178955078} -11/06/2021 22:48:32 - INFO - __main__ - Step 11266: {'lr': 0.0004951807782549277, 'samples': 2163072, 'steps': 11265, 'loss/train': 1.4494744539260864} -11/06/2021 22:48:32 - INFO - __main__ - Step 11267: {'lr': 0.0004951797412480544, 'samples': 2163264, 'steps': 11266, 'loss/train': 1.7457062005996704} -11/06/2021 22:48:33 - INFO - __main__ - Step 11268: {'lr': 0.0004951787041307066, 'samples': 2163456, 'steps': 11267, 'loss/train': 1.7130874395370483} -11/06/2021 22:48:34 - INFO - __main__ - Step 11269: {'lr': 0.0004951776669028851, 'samples': 2163648, 'steps': 11268, 'loss/train': 1.1853411197662354} -11/06/2021 22:48:34 - INFO - __main__ - Step 11270: {'lr': 0.0004951766295645904, 'samples': 2163840, 'steps': 11269, 'loss/train': 0.6745047569274902} -11/06/2021 22:48:34 - INFO - __main__ - Step 11271: {'lr': 0.000495175592115823, 'samples': 2164032, 'steps': 11270, 'loss/train': 2.009004592895508} -11/06/2021 22:48:35 - INFO - __main__ - Step 11272: {'lr': 0.0004951745545565831, 'samples': 2164224, 'steps': 11271, 'loss/train': 1.5138862133026123} -11/06/2021 22:48:35 - INFO - __main__ - Step 11273: {'lr': 0.0004951735168868713, 'samples': 2164416, 'steps': 11272, 'loss/train': 1.8810991048812866} -11/06/2021 22:48:36 - INFO - __main__ - Step 11274: {'lr': 0.0004951724791066881, 'samples': 2164608, 'steps': 11273, 'loss/train': 1.8236666917800903} -11/06/2021 22:48:37 - INFO - __main__ - Step 11275: {'lr': 0.0004951714412160342, 'samples': 2164800, 'steps': 11274, 'loss/train': 1.84593665599823} -11/06/2021 22:48:37 - INFO - __main__ - Step 11276: {'lr': 0.0004951704032149096, 'samples': 2164992, 'steps': 11275, 'loss/train': 1.9748361110687256} -11/06/2021 22:48:37 - INFO - __main__ - Step 11277: {'lr': 0.000495169365103315, 'samples': 2165184, 'steps': 11276, 'loss/train': 1.7609519958496094} -11/06/2021 22:48:38 - INFO - __main__ - Step 11278: {'lr': 0.0004951683268812511, 'samples': 2165376, 'steps': 11277, 'loss/train': 2.1392531394958496} -11/06/2021 22:48:38 - INFO - __main__ - Step 11279: {'lr': 0.0004951672885487178, 'samples': 2165568, 'steps': 11278, 'loss/train': 1.3590013980865479} -11/06/2021 22:48:39 - INFO - __main__ - Step 11280: {'lr': 0.0004951662501057161, 'samples': 2165760, 'steps': 11279, 'loss/train': 1.762505054473877} -11/06/2021 22:48:39 - INFO - __main__ - Step 11281: {'lr': 0.0004951652115522462, 'samples': 2165952, 'steps': 11280, 'loss/train': 1.7629950046539307} -11/06/2021 22:48:40 - INFO - __main__ - Step 11282: {'lr': 0.0004951641728883087, 'samples': 2166144, 'steps': 11281, 'loss/train': 2.0722081661224365} -11/06/2021 22:48:40 - INFO - __main__ - Step 11283: {'lr': 0.000495163134113904, 'samples': 2166336, 'steps': 11282, 'loss/train': 1.4518979787826538} -11/06/2021 22:48:40 - INFO - __main__ - Step 11284: {'lr': 0.0004951620952290325, 'samples': 2166528, 'steps': 11283, 'loss/train': 1.5402740240097046} -11/06/2021 22:48:41 - INFO - __main__ - Step 11285: {'lr': 0.0004951610562336949, 'samples': 2166720, 'steps': 11284, 'loss/train': 1.6244908571243286} -11/06/2021 22:48:42 - INFO - __main__ - Step 11286: {'lr': 0.0004951600171278914, 'samples': 2166912, 'steps': 11285, 'loss/train': 1.898524522781372} -11/06/2021 22:48:42 - INFO - __main__ - Step 11287: {'lr': 0.0004951589779116225, 'samples': 2167104, 'steps': 11286, 'loss/train': 1.5938304662704468} -11/06/2021 22:48:42 - INFO - __main__ - Step 11288: {'lr': 0.0004951579385848889, 'samples': 2167296, 'steps': 11287, 'loss/train': 1.7559034824371338} -11/06/2021 22:48:43 - INFO - __main__ - Step 11289: {'lr': 0.0004951568991476908, 'samples': 2167488, 'steps': 11288, 'loss/train': 1.3978345394134521} -11/06/2021 22:48:44 - INFO - __main__ - Step 11290: {'lr': 0.0004951558596000289, 'samples': 2167680, 'steps': 11289, 'loss/train': 2.016148328781128} -11/06/2021 22:48:44 - INFO - __main__ - Step 11291: {'lr': 0.0004951548199419035, 'samples': 2167872, 'steps': 11290, 'loss/train': 1.7956223487854004} -11/06/2021 22:48:45 - INFO - __main__ - Step 11292: {'lr': 0.0004951537801733152, 'samples': 2168064, 'steps': 11291, 'loss/train': 2.4459264278411865} -11/06/2021 22:48:45 - INFO - __main__ - Step 11293: {'lr': 0.0004951527402942643, 'samples': 2168256, 'steps': 11292, 'loss/train': 1.4760860204696655} -11/06/2021 22:48:45 - INFO - __main__ - Step 11294: {'lr': 0.0004951517003047512, 'samples': 2168448, 'steps': 11293, 'loss/train': 1.7521895170211792} -11/06/2021 22:48:46 - INFO - __main__ - Step 11295: {'lr': 0.0004951506602047767, 'samples': 2168640, 'steps': 11294, 'loss/train': 1.6032721996307373} -11/06/2021 22:48:47 - INFO - __main__ - Step 11296: {'lr': 0.0004951496199943412, 'samples': 2168832, 'steps': 11295, 'loss/train': 1.7261722087860107} -11/06/2021 22:48:47 - INFO - __main__ - Step 11297: {'lr': 0.0004951485796734448, 'samples': 2169024, 'steps': 11296, 'loss/train': 1.5861694812774658} -11/06/2021 22:48:47 - INFO - __main__ - Step 11298: {'lr': 0.0004951475392420884, 'samples': 2169216, 'steps': 11297, 'loss/train': 2.0938913822174072} -11/06/2021 22:48:48 - INFO - __main__ - Step 11299: {'lr': 0.0004951464987002724, 'samples': 2169408, 'steps': 11298, 'loss/train': 1.6789658069610596} -11/06/2021 22:48:49 - INFO - __main__ - Step 11300: {'lr': 0.000495145458047997, 'samples': 2169600, 'steps': 11299, 'loss/train': 1.7498912811279297} -11/06/2021 22:48:49 - INFO - __main__ - Step 11301: {'lr': 0.0004951444172852629, 'samples': 2169792, 'steps': 11300, 'loss/train': 1.6389604806900024} -11/06/2021 22:48:50 - INFO - __main__ - Step 11302: {'lr': 0.0004951433764120705, 'samples': 2169984, 'steps': 11301, 'loss/train': 1.9538257122039795} -11/06/2021 22:48:50 - INFO - __main__ - Step 11303: {'lr': 0.0004951423354284202, 'samples': 2170176, 'steps': 11302, 'loss/train': 1.9088263511657715} -11/06/2021 22:48:50 - INFO - __main__ - Step 11304: {'lr': 0.0004951412943343126, 'samples': 2170368, 'steps': 11303, 'loss/train': 1.584460735321045} -11/06/2021 22:48:51 - INFO - __main__ - Step 11305: {'lr': 0.0004951402531297482, 'samples': 2170560, 'steps': 11304, 'loss/train': 2.0329270362854004} -11/06/2021 22:48:52 - INFO - __main__ - Step 11306: {'lr': 0.0004951392118147273, 'samples': 2170752, 'steps': 11305, 'loss/train': 1.8602527379989624} -11/06/2021 22:48:52 - INFO - __main__ - Step 11307: {'lr': 0.0004951381703892506, 'samples': 2170944, 'steps': 11306, 'loss/train': 2.025909185409546} -11/06/2021 22:48:52 - INFO - __main__ - Step 11308: {'lr': 0.0004951371288533182, 'samples': 2171136, 'steps': 11307, 'loss/train': 2.1841092109680176} -11/06/2021 22:48:53 - INFO - __main__ - Step 11309: {'lr': 0.0004951360872069309, 'samples': 2171328, 'steps': 11308, 'loss/train': 1.3344480991363525} -11/06/2021 22:48:53 - INFO - __main__ - Step 11310: {'lr': 0.0004951350454500891, 'samples': 2171520, 'steps': 11309, 'loss/train': 1.7531185150146484} -11/06/2021 22:48:54 - INFO - __main__ - Step 11311: {'lr': 0.0004951340035827932, 'samples': 2171712, 'steps': 11310, 'loss/train': 1.6113486289978027} -11/06/2021 22:48:54 - INFO - __main__ - Step 11312: {'lr': 0.0004951329616050437, 'samples': 2171904, 'steps': 11311, 'loss/train': 1.9962801933288574} -11/06/2021 22:48:55 - INFO - __main__ - Step 11313: {'lr': 0.000495131919516841, 'samples': 2172096, 'steps': 11312, 'loss/train': 1.5207346677780151} -11/06/2021 22:48:55 - INFO - __main__ - Step 11314: {'lr': 0.0004951308773181856, 'samples': 2172288, 'steps': 11313, 'loss/train': 2.1913249492645264} -11/06/2021 22:48:55 - INFO - __main__ - Step 11315: {'lr': 0.0004951298350090782, 'samples': 2172480, 'steps': 11314, 'loss/train': 1.2448691129684448} -11/06/2021 22:48:56 - INFO - __main__ - Step 11316: {'lr': 0.000495128792589519, 'samples': 2172672, 'steps': 11315, 'loss/train': 2.215278387069702} -11/06/2021 22:48:57 - INFO - __main__ - Step 11317: {'lr': 0.0004951277500595085, 'samples': 2172864, 'steps': 11316, 'loss/train': 1.4738010168075562} -11/06/2021 22:48:57 - INFO - __main__ - Step 11318: {'lr': 0.0004951267074190473, 'samples': 2173056, 'steps': 11317, 'loss/train': 1.4282978773117065} -11/06/2021 22:48:58 - INFO - __main__ - Step 11319: {'lr': 0.0004951256646681356, 'samples': 2173248, 'steps': 11318, 'loss/train': 1.662163496017456} -11/06/2021 22:48:58 - INFO - __main__ - Step 11320: {'lr': 0.0004951246218067744, 'samples': 2173440, 'steps': 11319, 'loss/train': 1.9382797479629517} -11/06/2021 22:48:59 - INFO - __main__ - Step 11321: {'lr': 0.0004951235788349636, 'samples': 2173632, 'steps': 11320, 'loss/train': 3.9597983360290527} -11/06/2021 22:48:59 - INFO - __main__ - Step 11322: {'lr': 0.0004951225357527038, 'samples': 2173824, 'steps': 11321, 'loss/train': 1.7996548414230347} -11/06/2021 22:49:00 - INFO - __main__ - Step 11323: {'lr': 0.0004951214925599957, 'samples': 2174016, 'steps': 11322, 'loss/train': 1.6424283981323242} -11/06/2021 22:49:00 - INFO - __main__ - Step 11324: {'lr': 0.0004951204492568397, 'samples': 2174208, 'steps': 11323, 'loss/train': 1.757283329963684} -11/06/2021 22:49:00 - INFO - __main__ - Step 11325: {'lr': 0.0004951194058432361, 'samples': 2174400, 'steps': 11324, 'loss/train': 1.688281774520874} -11/06/2021 22:49:01 - INFO - __main__ - Step 11326: {'lr': 0.0004951183623191855, 'samples': 2174592, 'steps': 11325, 'loss/train': 1.493397831916809} -11/06/2021 22:49:02 - INFO - __main__ - Step 11327: {'lr': 0.0004951173186846884, 'samples': 2174784, 'steps': 11326, 'loss/train': 3.6629881858825684} -11/06/2021 22:49:02 - INFO - __main__ - Step 11328: {'lr': 0.0004951162749397452, 'samples': 2174976, 'steps': 11327, 'loss/train': 3.2852323055267334} -11/06/2021 22:49:03 - INFO - __main__ - Step 11329: {'lr': 0.0004951152310843564, 'samples': 2175168, 'steps': 11328, 'loss/train': 1.8344948291778564} -11/06/2021 22:49:03 - INFO - __main__ - Step 11330: {'lr': 0.0004951141871185224, 'samples': 2175360, 'steps': 11329, 'loss/train': 2.280247449874878} -11/06/2021 22:49:03 - INFO - __main__ - Step 11331: {'lr': 0.0004951131430422438, 'samples': 2175552, 'steps': 11330, 'loss/train': 1.4350394010543823} -11/06/2021 22:49:05 - INFO - __main__ - Step 11332: {'lr': 0.0004951120988555209, 'samples': 2175744, 'steps': 11331, 'loss/train': 2.2273924350738525} -11/06/2021 22:49:05 - INFO - __main__ - Step 11333: {'lr': 0.0004951110545583543, 'samples': 2175936, 'steps': 11332, 'loss/train': 1.8531851768493652} -11/06/2021 22:49:05 - INFO - __main__ - Step 11334: {'lr': 0.0004951100101507445, 'samples': 2176128, 'steps': 11333, 'loss/train': 1.8258116245269775} -11/06/2021 22:49:06 - INFO - __main__ - Step 11335: {'lr': 0.0004951089656326919, 'samples': 2176320, 'steps': 11334, 'loss/train': 0.3128710389137268} -11/06/2021 22:49:06 - INFO - __main__ - Step 11336: {'lr': 0.0004951079210041969, 'samples': 2176512, 'steps': 11335, 'loss/train': 1.8034968376159668} -11/06/2021 22:49:06 - INFO - __main__ - Step 11337: {'lr': 0.0004951068762652602, 'samples': 2176704, 'steps': 11336, 'loss/train': 1.5365264415740967} -11/06/2021 22:49:07 - INFO - __main__ - Step 11338: {'lr': 0.000495105831415882, 'samples': 2176896, 'steps': 11337, 'loss/train': 1.9638972282409668} -11/06/2021 22:49:08 - INFO - __main__ - Step 11339: {'lr': 0.0004951047864560629, 'samples': 2177088, 'steps': 11338, 'loss/train': 1.64912748336792} -11/06/2021 22:49:08 - INFO - __main__ - Step 11340: {'lr': 0.0004951037413858034, 'samples': 2177280, 'steps': 11339, 'loss/train': 1.4875028133392334} -11/06/2021 22:49:08 - INFO - __main__ - Step 11341: {'lr': 0.000495102696205104, 'samples': 2177472, 'steps': 11340, 'loss/train': 1.8226743936538696} -11/06/2021 22:49:09 - INFO - __main__ - Step 11342: {'lr': 0.000495101650913965, 'samples': 2177664, 'steps': 11341, 'loss/train': 1.8261113166809082} -11/06/2021 22:49:10 - INFO - __main__ - Step 11343: {'lr': 0.000495100605512387, 'samples': 2177856, 'steps': 11342, 'loss/train': 1.8620246648788452} -11/06/2021 22:49:10 - INFO - __main__ - Step 11344: {'lr': 0.0004950995600003705, 'samples': 2178048, 'steps': 11343, 'loss/train': 1.7309132814407349} -11/06/2021 22:49:10 - INFO - __main__ - Step 11345: {'lr': 0.0004950985143779159, 'samples': 2178240, 'steps': 11344, 'loss/train': 1.5737980604171753} -11/06/2021 22:49:11 - INFO - __main__ - Step 11346: {'lr': 0.0004950974686450237, 'samples': 2178432, 'steps': 11345, 'loss/train': 1.4471863508224487} -11/06/2021 22:49:11 - INFO - __main__ - Step 11347: {'lr': 0.0004950964228016944, 'samples': 2178624, 'steps': 11346, 'loss/train': 1.8836588859558105} -11/06/2021 22:49:12 - INFO - __main__ - Step 11348: {'lr': 0.0004950953768479284, 'samples': 2178816, 'steps': 11347, 'loss/train': 1.526648998260498} -11/06/2021 22:49:12 - INFO - __main__ - Step 11349: {'lr': 0.0004950943307837261, 'samples': 2179008, 'steps': 11348, 'loss/train': 1.9713560342788696} -11/06/2021 22:49:13 - INFO - __main__ - Step 11350: {'lr': 0.0004950932846090882, 'samples': 2179200, 'steps': 11349, 'loss/train': 1.60298490524292} -11/06/2021 22:49:13 - INFO - __main__ - Step 11351: {'lr': 0.000495092238324015, 'samples': 2179392, 'steps': 11350, 'loss/train': 1.1730953454971313} -11/06/2021 22:49:13 - INFO - __main__ - Step 11352: {'lr': 0.0004950911919285071, 'samples': 2179584, 'steps': 11351, 'loss/train': 1.5877281427383423} -11/06/2021 22:49:15 - INFO - __main__ - Step 11353: {'lr': 0.0004950901454225647, 'samples': 2179776, 'steps': 11352, 'loss/train': 1.8872724771499634} -11/06/2021 22:49:15 - INFO - __main__ - Step 11354: {'lr': 0.0004950890988061886, 'samples': 2179968, 'steps': 11353, 'loss/train': 2.0779507160186768} -11/06/2021 22:49:15 - INFO - __main__ - Step 11355: {'lr': 0.0004950880520793791, 'samples': 2180160, 'steps': 11354, 'loss/train': 1.030417561531067} -11/06/2021 22:49:16 - INFO - __main__ - Step 11356: {'lr': 0.0004950870052421368, 'samples': 2180352, 'steps': 11355, 'loss/train': 1.806678295135498} -11/06/2021 22:49:16 - INFO - __main__ - Step 11357: {'lr': 0.000495085958294462, 'samples': 2180544, 'steps': 11356, 'loss/train': 1.621626377105713} -11/06/2021 22:49:17 - INFO - __main__ - Step 11358: {'lr': 0.0004950849112363553, 'samples': 2180736, 'steps': 11357, 'loss/train': 0.5637978911399841} -11/06/2021 22:49:17 - INFO - __main__ - Step 11359: {'lr': 0.000495083864067817, 'samples': 2180928, 'steps': 11358, 'loss/train': 1.728484869003296} -11/06/2021 22:49:18 - INFO - __main__ - Step 11360: {'lr': 0.0004950828167888478, 'samples': 2181120, 'steps': 11359, 'loss/train': 1.9310498237609863} -11/06/2021 22:49:18 - INFO - __main__ - Step 11361: {'lr': 0.0004950817693994481, 'samples': 2181312, 'steps': 11360, 'loss/train': 1.8141530752182007} -11/06/2021 22:49:18 - INFO - __main__ - Step 11362: {'lr': 0.0004950807218996182, 'samples': 2181504, 'steps': 11361, 'loss/train': 2.154552936553955} -11/06/2021 22:49:19 - INFO - __main__ - Step 11363: {'lr': 0.0004950796742893588, 'samples': 2181696, 'steps': 11362, 'loss/train': 1.7956241369247437} -11/06/2021 22:49:20 - INFO - __main__ - Step 11364: {'lr': 0.0004950786265686702, 'samples': 2181888, 'steps': 11363, 'loss/train': 1.6461005210876465} -11/06/2021 22:49:20 - INFO - __main__ - Step 11365: {'lr': 0.000495077578737553, 'samples': 2182080, 'steps': 11364, 'loss/train': 1.5644863843917847} -11/06/2021 22:49:20 - INFO - __main__ - Step 11366: {'lr': 0.0004950765307960076, 'samples': 2182272, 'steps': 11365, 'loss/train': 1.4656745195388794} -11/06/2021 22:49:21 - INFO - __main__ - Step 11367: {'lr': 0.0004950754827440346, 'samples': 2182464, 'steps': 11366, 'loss/train': 1.9674415588378906} -11/06/2021 22:49:21 - INFO - __main__ - Step 11368: {'lr': 0.0004950744345816342, 'samples': 2182656, 'steps': 11367, 'loss/train': 1.2006498575210571} -11/06/2021 22:49:22 - INFO - __main__ - Step 11369: {'lr': 0.0004950733863088072, 'samples': 2182848, 'steps': 11368, 'loss/train': 2.536311388015747} -11/06/2021 22:49:22 - INFO - __main__ - Step 11370: {'lr': 0.0004950723379255538, 'samples': 2183040, 'steps': 11369, 'loss/train': 1.9103096723556519} -11/06/2021 22:49:23 - INFO - __main__ - Step 11371: {'lr': 0.0004950712894318748, 'samples': 2183232, 'steps': 11370, 'loss/train': 1.7062427997589111} -11/06/2021 22:49:23 - INFO - __main__ - Step 11372: {'lr': 0.0004950702408277702, 'samples': 2183424, 'steps': 11371, 'loss/train': 1.4938647747039795} -11/06/2021 22:49:23 - INFO - __main__ - Step 11373: {'lr': 0.0004950691921132409, 'samples': 2183616, 'steps': 11372, 'loss/train': 1.9969819784164429} -11/06/2021 22:49:24 - INFO - __main__ - Step 11374: {'lr': 0.000495068143288287, 'samples': 2183808, 'steps': 11373, 'loss/train': 1.8315733671188354} -11/06/2021 22:49:25 - INFO - __main__ - Step 11375: {'lr': 0.0004950670943529094, 'samples': 2184000, 'steps': 11374, 'loss/train': 0.9384849071502686} -11/06/2021 22:49:25 - INFO - __main__ - Step 11376: {'lr': 0.0004950660453071082, 'samples': 2184192, 'steps': 11375, 'loss/train': 1.814307689666748} -11/06/2021 22:49:25 - INFO - __main__ - Step 11377: {'lr': 0.0004950649961508841, 'samples': 2184384, 'steps': 11376, 'loss/train': 2.194822311401367} -11/06/2021 22:49:26 - INFO - __main__ - Step 11378: {'lr': 0.0004950639468842375, 'samples': 2184576, 'steps': 11377, 'loss/train': 2.181577205657959} -11/06/2021 22:49:27 - INFO - __main__ - Step 11379: {'lr': 0.0004950628975071688, 'samples': 2184768, 'steps': 11378, 'loss/train': 1.6916229724884033} -11/06/2021 22:49:27 - INFO - __main__ - Step 11380: {'lr': 0.0004950618480196785, 'samples': 2184960, 'steps': 11379, 'loss/train': 1.5891834497451782} -11/06/2021 22:49:28 - INFO - __main__ - Step 11381: {'lr': 0.0004950607984217674, 'samples': 2185152, 'steps': 11380, 'loss/train': 1.64052414894104} -11/06/2021 22:49:28 - INFO - __main__ - Step 11382: {'lr': 0.0004950597487134354, 'samples': 2185344, 'steps': 11381, 'loss/train': 2.620680570602417} -11/06/2021 22:49:28 - INFO - __main__ - Step 11383: {'lr': 0.0004950586988946834, 'samples': 2185536, 'steps': 11382, 'loss/train': 1.9298031330108643} -11/06/2021 22:49:29 - INFO - __main__ - Step 11384: {'lr': 0.0004950576489655116, 'samples': 2185728, 'steps': 11383, 'loss/train': 1.8474303483963013} -11/06/2021 22:49:30 - INFO - __main__ - Step 11385: {'lr': 0.0004950565989259207, 'samples': 2185920, 'steps': 11384, 'loss/train': 1.4204002618789673} -11/06/2021 22:49:30 - INFO - __main__ - Step 11386: {'lr': 0.000495055548775911, 'samples': 2186112, 'steps': 11385, 'loss/train': 1.618093729019165} -11/06/2021 22:49:30 - INFO - __main__ - Step 11387: {'lr': 0.0004950544985154831, 'samples': 2186304, 'steps': 11386, 'loss/train': 2.119515895843506} -11/06/2021 22:49:31 - INFO - __main__ - Step 11388: {'lr': 0.0004950534481446375, 'samples': 2186496, 'steps': 11387, 'loss/train': 2.0047428607940674} -11/06/2021 22:49:31 - INFO - __main__ - Step 11389: {'lr': 0.0004950523976633745, 'samples': 2186688, 'steps': 11388, 'loss/train': 1.9979164600372314} -11/06/2021 22:49:32 - INFO - __main__ - Step 11390: {'lr': 0.0004950513470716947, 'samples': 2186880, 'steps': 11389, 'loss/train': 1.188913345336914} -11/06/2021 22:49:32 - INFO - __main__ - Step 11391: {'lr': 0.0004950502963695985, 'samples': 2187072, 'steps': 11390, 'loss/train': 1.6476091146469116} -11/06/2021 22:49:33 - INFO - __main__ - Step 11392: {'lr': 0.0004950492455570865, 'samples': 2187264, 'steps': 11391, 'loss/train': 7.051599502563477} -11/06/2021 22:49:33 - INFO - __main__ - Step 11393: {'lr': 0.000495048194634159, 'samples': 2187456, 'steps': 11392, 'loss/train': 1.676889419555664} -11/06/2021 22:49:33 - INFO - __main__ - Step 11394: {'lr': 0.0004950471436008167, 'samples': 2187648, 'steps': 11393, 'loss/train': 1.9109240770339966} -11/06/2021 22:49:35 - INFO - __main__ - Step 11395: {'lr': 0.0004950460924570598, 'samples': 2187840, 'steps': 11394, 'loss/train': 1.9026075601577759} -11/06/2021 22:49:35 - INFO - __main__ - Step 11396: {'lr': 0.0004950450412028889, 'samples': 2188032, 'steps': 11395, 'loss/train': 1.8585050106048584} -11/06/2021 22:49:35 - INFO - __main__ - Step 11397: {'lr': 0.0004950439898383047, 'samples': 2188224, 'steps': 11396, 'loss/train': 2.125458002090454} -11/06/2021 22:49:36 - INFO - __main__ - Step 11398: {'lr': 0.0004950429383633073, 'samples': 2188416, 'steps': 11397, 'loss/train': 1.5339622497558594} -11/06/2021 22:49:36 - INFO - __main__ - Step 11399: {'lr': 0.0004950418867778973, 'samples': 2188608, 'steps': 11398, 'loss/train': 1.875319480895996} -11/06/2021 22:49:37 - INFO - __main__ - Step 11400: {'lr': 0.0004950408350820752, 'samples': 2188800, 'steps': 11399, 'loss/train': 1.5913536548614502} -11/06/2021 22:49:37 - INFO - __main__ - Step 11401: {'lr': 0.0004950397832758415, 'samples': 2188992, 'steps': 11400, 'loss/train': 1.3669840097427368} -11/06/2021 22:49:38 - INFO - __main__ - Step 11402: {'lr': 0.0004950387313591968, 'samples': 2189184, 'steps': 11401, 'loss/train': 1.8628370761871338} -11/06/2021 22:49:38 - INFO - __main__ - Step 11403: {'lr': 0.0004950376793321413, 'samples': 2189376, 'steps': 11402, 'loss/train': 1.7271697521209717} -11/06/2021 22:49:38 - INFO - __main__ - Step 11404: {'lr': 0.0004950366271946756, 'samples': 2189568, 'steps': 11403, 'loss/train': 2.1682770252227783} -11/06/2021 22:49:39 - INFO - __main__ - Step 11405: {'lr': 0.0004950355749468001, 'samples': 2189760, 'steps': 11404, 'loss/train': 1.8250188827514648} -11/06/2021 22:49:40 - INFO - __main__ - Step 11406: {'lr': 0.0004950345225885155, 'samples': 2189952, 'steps': 11405, 'loss/train': 1.594653844833374} -11/06/2021 22:49:40 - INFO - __main__ - Step 11407: {'lr': 0.0004950334701198222, 'samples': 2190144, 'steps': 11406, 'loss/train': 1.9516605138778687} -11/06/2021 22:49:40 - INFO - __main__ - Step 11408: {'lr': 0.0004950324175407204, 'samples': 2190336, 'steps': 11407, 'loss/train': 1.3681046962738037} -11/06/2021 22:49:41 - INFO - __main__ - Step 11409: {'lr': 0.0004950313648512108, 'samples': 2190528, 'steps': 11408, 'loss/train': 1.6536760330200195} -11/06/2021 22:49:42 - INFO - __main__ - Step 11410: {'lr': 0.0004950303120512939, 'samples': 2190720, 'steps': 11409, 'loss/train': 1.9302911758422852} -11/06/2021 22:49:42 - INFO - __main__ - Step 11411: {'lr': 0.0004950292591409701, 'samples': 2190912, 'steps': 11410, 'loss/train': 2.0202114582061768} -11/06/2021 22:49:42 - INFO - __main__ - Step 11412: {'lr': 0.0004950282061202399, 'samples': 2191104, 'steps': 11411, 'loss/train': 1.8923609256744385} -11/06/2021 22:49:43 - INFO - __main__ - Step 11413: {'lr': 0.0004950271529891038, 'samples': 2191296, 'steps': 11412, 'loss/train': 1.6358274221420288} -11/06/2021 22:49:43 - INFO - __main__ - Step 11414: {'lr': 0.0004950260997475623, 'samples': 2191488, 'steps': 11413, 'loss/train': 1.7055529356002808} -11/06/2021 22:49:43 - INFO - __main__ - Step 11415: {'lr': 0.0004950250463956157, 'samples': 2191680, 'steps': 11414, 'loss/train': 1.4822801351547241} -11/06/2021 22:49:44 - INFO - __main__ - Step 11416: {'lr': 0.0004950239929332646, 'samples': 2191872, 'steps': 11415, 'loss/train': 1.7098220586776733} -11/06/2021 22:49:45 - INFO - __main__ - Step 11417: {'lr': 0.0004950229393605095, 'samples': 2192064, 'steps': 11416, 'loss/train': 1.437166690826416} -11/06/2021 22:49:45 - INFO - __main__ - Step 11418: {'lr': 0.0004950218856773509, 'samples': 2192256, 'steps': 11417, 'loss/train': 1.7919132709503174} -11/06/2021 22:49:46 - INFO - __main__ - Step 11419: {'lr': 0.0004950208318837892, 'samples': 2192448, 'steps': 11418, 'loss/train': 1.5548012256622314} -11/06/2021 22:49:46 - INFO - __main__ - Step 11420: {'lr': 0.0004950197779798248, 'samples': 2192640, 'steps': 11419, 'loss/train': 1.615087628364563} -11/06/2021 22:49:47 - INFO - __main__ - Step 11421: {'lr': 0.0004950187239654584, 'samples': 2192832, 'steps': 11420, 'loss/train': 1.5422042608261108} -11/06/2021 22:49:47 - INFO - __main__ - Step 11422: {'lr': 0.0004950176698406903, 'samples': 2193024, 'steps': 11421, 'loss/train': 1.7497607469558716} -11/06/2021 22:49:48 - INFO - __main__ - Step 11423: {'lr': 0.000495016615605521, 'samples': 2193216, 'steps': 11422, 'loss/train': 1.8676695823669434} -11/06/2021 22:49:48 - INFO - __main__ - Step 11424: {'lr': 0.0004950155612599511, 'samples': 2193408, 'steps': 11423, 'loss/train': 1.7228354215621948} -11/06/2021 22:49:48 - INFO - __main__ - Step 11425: {'lr': 0.0004950145068039808, 'samples': 2193600, 'steps': 11424, 'loss/train': 2.0538418292999268} -11/06/2021 22:49:50 - INFO - __main__ - Step 11426: {'lr': 0.0004950134522376108, 'samples': 2193792, 'steps': 11425, 'loss/train': 2.0715749263763428} -11/06/2021 22:49:50 - INFO - __main__ - Step 11427: {'lr': 0.0004950123975608415, 'samples': 2193984, 'steps': 11426, 'loss/train': 1.7007184028625488} -11/06/2021 22:49:50 - INFO - __main__ - Step 11428: {'lr': 0.0004950113427736734, 'samples': 2194176, 'steps': 11427, 'loss/train': 3.19921612739563} -11/06/2021 22:49:51 - INFO - __main__ - Step 11429: {'lr': 0.000495010287876107, 'samples': 2194368, 'steps': 11428, 'loss/train': 1.4021397829055786} -11/06/2021 22:49:51 - INFO - __main__ - Step 11430: {'lr': 0.0004950092328681428, 'samples': 2194560, 'steps': 11429, 'loss/train': 1.3537622690200806} -11/06/2021 22:49:52 - INFO - __main__ - Step 11431: {'lr': 0.0004950081777497812, 'samples': 2194752, 'steps': 11430, 'loss/train': 2.075549840927124} -11/06/2021 22:49:52 - INFO - __main__ - Step 11432: {'lr': 0.0004950071225210226, 'samples': 2194944, 'steps': 11431, 'loss/train': 2.2437236309051514} -11/06/2021 22:49:53 - INFO - __main__ - Step 11433: {'lr': 0.0004950060671818676, 'samples': 2195136, 'steps': 11432, 'loss/train': 1.8015081882476807} -11/06/2021 22:49:53 - INFO - __main__ - Step 11434: {'lr': 0.0004950050117323167, 'samples': 2195328, 'steps': 11433, 'loss/train': 1.7495261430740356} -11/06/2021 22:49:54 - INFO - __main__ - Step 11435: {'lr': 0.0004950039561723703, 'samples': 2195520, 'steps': 11434, 'loss/train': 2.0817348957061768} -11/06/2021 22:49:54 - INFO - __main__ - Step 11436: {'lr': 0.0004950029005020289, 'samples': 2195712, 'steps': 11435, 'loss/train': 1.7753431797027588} -11/06/2021 22:49:55 - INFO - __main__ - Step 11437: {'lr': 0.0004950018447212929, 'samples': 2195904, 'steps': 11436, 'loss/train': 2.0094332695007324} -11/06/2021 22:49:55 - INFO - __main__ - Step 11438: {'lr': 0.000495000788830163, 'samples': 2196096, 'steps': 11437, 'loss/train': 1.0826306343078613} -11/06/2021 22:49:56 - INFO - __main__ - Step 11439: {'lr': 0.0004949997328286394, 'samples': 2196288, 'steps': 11438, 'loss/train': 1.5447814464569092} -11/06/2021 22:49:56 - INFO - __main__ - Step 11440: {'lr': 0.0004949986767167228, 'samples': 2196480, 'steps': 11439, 'loss/train': 1.7402944564819336} -11/06/2021 22:49:56 - INFO - __main__ - Step 11441: {'lr': 0.0004949976204944135, 'samples': 2196672, 'steps': 11440, 'loss/train': 1.6975988149642944} -11/06/2021 22:49:57 - INFO - __main__ - Step 11442: {'lr': 0.0004949965641617121, 'samples': 2196864, 'steps': 11441, 'loss/train': 1.6777021884918213} -11/06/2021 22:49:58 - INFO - __main__ - Step 11443: {'lr': 0.000494995507718619, 'samples': 2197056, 'steps': 11442, 'loss/train': 1.3952085971832275} -11/06/2021 22:49:58 - INFO - __main__ - Step 11444: {'lr': 0.0004949944511651347, 'samples': 2197248, 'steps': 11443, 'loss/train': 1.7834969758987427} -11/06/2021 22:49:58 - INFO - __main__ - Step 11445: {'lr': 0.0004949933945012597, 'samples': 2197440, 'steps': 11444, 'loss/train': 1.753387212753296} -11/06/2021 22:49:59 - INFO - __main__ - Step 11446: {'lr': 0.0004949923377269945, 'samples': 2197632, 'steps': 11445, 'loss/train': 2.039705753326416} -11/06/2021 22:49:59 - INFO - __main__ - Step 11447: {'lr': 0.0004949912808423394, 'samples': 2197824, 'steps': 11446, 'loss/train': 1.4728835821151733} -11/06/2021 22:50:01 - INFO - __main__ - Step 11448: {'lr': 0.000494990223847295, 'samples': 2198016, 'steps': 11447, 'loss/train': 1.628504991531372} -11/06/2021 22:50:01 - INFO - __main__ - Step 11449: {'lr': 0.000494989166741862, 'samples': 2198208, 'steps': 11448, 'loss/train': 2.0440473556518555} -11/06/2021 22:50:01 - INFO - __main__ - Step 11450: {'lr': 0.0004949881095260405, 'samples': 2198400, 'steps': 11449, 'loss/train': 1.660749912261963} -11/06/2021 22:50:02 - INFO - __main__ - Step 11451: {'lr': 0.0004949870521998312, 'samples': 2198592, 'steps': 11450, 'loss/train': 1.8337377309799194} -11/06/2021 22:50:02 - INFO - __main__ - Step 11452: {'lr': 0.0004949859947632344, 'samples': 2198784, 'steps': 11451, 'loss/train': 1.8013213872909546} -11/06/2021 22:50:03 - INFO - __main__ - Step 11453: {'lr': 0.0004949849372162509, 'samples': 2198976, 'steps': 11452, 'loss/train': 1.1063177585601807} -11/06/2021 22:50:03 - INFO - __main__ - Step 11454: {'lr': 0.0004949838795588808, 'samples': 2199168, 'steps': 11453, 'loss/train': 1.6007579565048218} -11/06/2021 22:50:04 - INFO - __main__ - Step 11455: {'lr': 0.0004949828217911248, 'samples': 2199360, 'steps': 11454, 'loss/train': 1.6126108169555664} -11/06/2021 22:50:04 - INFO - __main__ - Step 11456: {'lr': 0.0004949817639129832, 'samples': 2199552, 'steps': 11455, 'loss/train': 1.85826575756073} -11/06/2021 22:50:04 - INFO - __main__ - Step 11457: {'lr': 0.0004949807059244568, 'samples': 2199744, 'steps': 11456, 'loss/train': 1.6572095155715942} -11/06/2021 22:50:05 - INFO - __main__ - Step 11458: {'lr': 0.0004949796478255458, 'samples': 2199936, 'steps': 11457, 'loss/train': 1.5031503438949585} -11/06/2021 22:50:06 - INFO - __main__ - Step 11459: {'lr': 0.0004949785896162507, 'samples': 2200128, 'steps': 11458, 'loss/train': 1.6806023120880127} -11/06/2021 22:50:06 - INFO - __main__ - Step 11460: {'lr': 0.0004949775312965721, 'samples': 2200320, 'steps': 11459, 'loss/train': 1.5449903011322021} -11/06/2021 22:50:06 - INFO - __main__ - Step 11461: {'lr': 0.0004949764728665103, 'samples': 2200512, 'steps': 11460, 'loss/train': 1.651967167854309} -11/06/2021 22:50:07 - INFO - __main__ - Step 11462: {'lr': 0.000494975414326066, 'samples': 2200704, 'steps': 11461, 'loss/train': 1.8669898509979248} -11/06/2021 22:50:07 - INFO - __main__ - Step 11463: {'lr': 0.0004949743556752395, 'samples': 2200896, 'steps': 11462, 'loss/train': 1.9016015529632568} -11/06/2021 22:50:08 - INFO - __main__ - Step 11464: {'lr': 0.0004949732969140313, 'samples': 2201088, 'steps': 11463, 'loss/train': 1.5884931087493896} -11/06/2021 22:50:09 - INFO - __main__ - Step 11465: {'lr': 0.000494972238042442, 'samples': 2201280, 'steps': 11464, 'loss/train': 1.8496793508529663} -11/06/2021 22:50:09 - INFO - __main__ - Step 11466: {'lr': 0.0004949711790604719, 'samples': 2201472, 'steps': 11465, 'loss/train': 1.83021879196167} -11/06/2021 22:50:09 - INFO - __main__ - Step 11467: {'lr': 0.0004949701199681217, 'samples': 2201664, 'steps': 11466, 'loss/train': 1.7761445045471191} -11/06/2021 22:50:10 - INFO - __main__ - Step 11468: {'lr': 0.0004949690607653916, 'samples': 2201856, 'steps': 11467, 'loss/train': 1.5645625591278076} -11/06/2021 22:50:10 - INFO - __main__ - Step 11469: {'lr': 0.0004949680014522822, 'samples': 2202048, 'steps': 11468, 'loss/train': 1.7550435066223145} -11/06/2021 22:50:11 - INFO - __main__ - Step 11470: {'lr': 0.0004949669420287941, 'samples': 2202240, 'steps': 11469, 'loss/train': 1.595177412033081} -11/06/2021 22:50:11 - INFO - __main__ - Step 11471: {'lr': 0.0004949658824949277, 'samples': 2202432, 'steps': 11470, 'loss/train': 1.6120365858078003} -11/06/2021 22:50:12 - INFO - __main__ - Step 11472: {'lr': 0.0004949648228506834, 'samples': 2202624, 'steps': 11471, 'loss/train': 1.6954563856124878} -11/06/2021 22:50:12 - INFO - __main__ - Step 11473: {'lr': 0.0004949637630960618, 'samples': 2202816, 'steps': 11472, 'loss/train': 1.4135258197784424} -11/06/2021 22:50:13 - INFO - __main__ - Step 11474: {'lr': 0.0004949627032310632, 'samples': 2203008, 'steps': 11473, 'loss/train': 1.074235200881958} -11/06/2021 22:50:13 - INFO - __main__ - Step 11475: {'lr': 0.0004949616432556882, 'samples': 2203200, 'steps': 11474, 'loss/train': 2.001767635345459} -11/06/2021 22:50:14 - INFO - __main__ - Step 11476: {'lr': 0.0004949605831699373, 'samples': 2203392, 'steps': 11475, 'loss/train': 1.4366241693496704} -11/06/2021 22:50:14 - INFO - __main__ - Step 11477: {'lr': 0.000494959522973811, 'samples': 2203584, 'steps': 11476, 'loss/train': 1.5947993993759155} -11/06/2021 22:50:14 - INFO - __main__ - Step 11478: {'lr': 0.0004949584626673096, 'samples': 2203776, 'steps': 11477, 'loss/train': 1.586674451828003} -11/06/2021 22:50:15 - INFO - __main__ - Step 11479: {'lr': 0.0004949574022504338, 'samples': 2203968, 'steps': 11478, 'loss/train': 1.7831062078475952} -11/06/2021 22:50:16 - INFO - __main__ - Step 11480: {'lr': 0.0004949563417231838, 'samples': 2204160, 'steps': 11479, 'loss/train': 2.0792524814605713} -11/06/2021 22:50:16 - INFO - __main__ - Step 11481: {'lr': 0.0004949552810855605, 'samples': 2204352, 'steps': 11480, 'loss/train': 1.7512733936309814} -11/06/2021 22:50:16 - INFO - __main__ - Step 11482: {'lr': 0.000494954220337564, 'samples': 2204544, 'steps': 11481, 'loss/train': 1.9360369443893433} -11/06/2021 22:50:17 - INFO - __main__ - Step 11483: {'lr': 0.0004949531594791948, 'samples': 2204736, 'steps': 11482, 'loss/train': 0.5724799633026123} -11/06/2021 22:50:18 - INFO - __main__ - Step 11484: {'lr': 0.0004949520985104536, 'samples': 2204928, 'steps': 11483, 'loss/train': 1.9736790657043457} -11/06/2021 22:50:18 - INFO - __main__ - Step 11485: {'lr': 0.0004949510374313409, 'samples': 2205120, 'steps': 11484, 'loss/train': 1.3778972625732422} -11/06/2021 22:50:18 - INFO - __main__ - Step 11486: {'lr': 0.0004949499762418568, 'samples': 2205312, 'steps': 11485, 'loss/train': 1.658096194267273} -11/06/2021 22:50:19 - INFO - __main__ - Step 11487: {'lr': 0.0004949489149420021, 'samples': 2205504, 'steps': 11486, 'loss/train': 1.9003406763076782} -11/06/2021 22:50:19 - INFO - __main__ - Step 11488: {'lr': 0.0004949478535317773, 'samples': 2205696, 'steps': 11487, 'loss/train': 1.31734299659729} -11/06/2021 22:50:20 - INFO - __main__ - Step 11489: {'lr': 0.0004949467920111827, 'samples': 2205888, 'steps': 11488, 'loss/train': 2.2677342891693115} -11/06/2021 22:50:21 - INFO - __main__ - Step 11490: {'lr': 0.0004949457303802189, 'samples': 2206080, 'steps': 11489, 'loss/train': 1.4590067863464355} -11/06/2021 22:50:21 - INFO - __main__ - Step 11491: {'lr': 0.0004949446686388862, 'samples': 2206272, 'steps': 11490, 'loss/train': 1.8408727645874023} -11/06/2021 22:50:21 - INFO - __main__ - Step 11492: {'lr': 0.0004949436067871854, 'samples': 2206464, 'steps': 11491, 'loss/train': 2.519899845123291} -11/06/2021 22:50:22 - INFO - __main__ - Step 11493: {'lr': 0.0004949425448251166, 'samples': 2206656, 'steps': 11492, 'loss/train': 1.598381757736206} -11/06/2021 22:50:22 - INFO - __main__ - Step 11494: {'lr': 0.0004949414827526805, 'samples': 2206848, 'steps': 11493, 'loss/train': 1.779862642288208} -11/06/2021 22:50:23 - INFO - __main__ - Step 11495: {'lr': 0.0004949404205698777, 'samples': 2207040, 'steps': 11494, 'loss/train': 1.9242050647735596} -11/06/2021 22:50:23 - INFO - __main__ - Step 11496: {'lr': 0.0004949393582767084, 'samples': 2207232, 'steps': 11495, 'loss/train': 1.6788808107376099} -11/06/2021 22:50:24 - INFO - __main__ - Step 11497: {'lr': 0.0004949382958731733, 'samples': 2207424, 'steps': 11496, 'loss/train': 1.5965083837509155} -11/06/2021 22:50:24 - INFO - __main__ - Step 11498: {'lr': 0.0004949372333592728, 'samples': 2207616, 'steps': 11497, 'loss/train': 2.236138105392456} -11/06/2021 22:50:24 - INFO - __main__ - Step 11499: {'lr': 0.0004949361707350072, 'samples': 2207808, 'steps': 11498, 'loss/train': 1.7686853408813477} -11/06/2021 22:50:25 - INFO - __main__ - Step 11500: {'lr': 0.0004949351080003773, 'samples': 2208000, 'steps': 11499, 'loss/train': 1.9962258338928223} -11/06/2021 22:50:26 - INFO - __main__ - Step 11501: {'lr': 0.0004949340451553833, 'samples': 2208192, 'steps': 11500, 'loss/train': 1.7358423471450806} -11/06/2021 22:50:26 - INFO - __main__ - Step 11502: {'lr': 0.0004949329822000259, 'samples': 2208384, 'steps': 11501, 'loss/train': 1.7392240762710571} -11/06/2021 22:50:26 - INFO - __main__ - Step 11503: {'lr': 0.0004949319191343053, 'samples': 2208576, 'steps': 11502, 'loss/train': 2.329840660095215} -11/06/2021 22:50:27 - INFO - __main__ - Step 11504: {'lr': 0.0004949308559582224, 'samples': 2208768, 'steps': 11503, 'loss/train': 1.5851150751113892} -11/06/2021 22:50:28 - INFO - __main__ - Step 11505: {'lr': 0.0004949297926717772, 'samples': 2208960, 'steps': 11504, 'loss/train': 1.932198166847229} -11/06/2021 22:50:28 - INFO - __main__ - Step 11506: {'lr': 0.0004949287292749705, 'samples': 2209152, 'steps': 11505, 'loss/train': 1.7171591520309448} -11/06/2021 22:50:29 - INFO - __main__ - Step 11507: {'lr': 0.0004949276657678028, 'samples': 2209344, 'steps': 11506, 'loss/train': 2.190236806869507} -11/06/2021 22:50:29 - INFO - __main__ - Step 11508: {'lr': 0.0004949266021502744, 'samples': 2209536, 'steps': 11507, 'loss/train': 1.2840288877487183} -11/06/2021 22:50:29 - INFO - __main__ - Step 11509: {'lr': 0.0004949255384223859, 'samples': 2209728, 'steps': 11508, 'loss/train': 0.29179802536964417} -11/06/2021 22:50:30 - INFO - __main__ - Step 11510: {'lr': 0.0004949244745841377, 'samples': 2209920, 'steps': 11509, 'loss/train': 1.3277264833450317} -11/06/2021 22:50:31 - INFO - __main__ - Step 11511: {'lr': 0.0004949234106355302, 'samples': 2210112, 'steps': 11510, 'loss/train': 2.052576780319214} -11/06/2021 22:50:31 - INFO - __main__ - Step 11512: {'lr': 0.0004949223465765642, 'samples': 2210304, 'steps': 11511, 'loss/train': 1.9434692859649658} -11/06/2021 22:50:32 - INFO - __main__ - Step 11513: {'lr': 0.0004949212824072398, 'samples': 2210496, 'steps': 11512, 'loss/train': 2.3121955394744873} -11/06/2021 22:50:32 - INFO - __main__ - Step 11514: {'lr': 0.0004949202181275577, 'samples': 2210688, 'steps': 11513, 'loss/train': 1.9893686771392822} -11/06/2021 22:50:32 - INFO - __main__ - Step 11515: {'lr': 0.0004949191537375184, 'samples': 2210880, 'steps': 11514, 'loss/train': 1.3614085912704468} -11/06/2021 22:50:33 - INFO - __main__ - Step 11516: {'lr': 0.0004949180892371223, 'samples': 2211072, 'steps': 11515, 'loss/train': 1.9664455652236938} -11/06/2021 22:50:34 - INFO - __main__ - Step 11517: {'lr': 0.0004949170246263697, 'samples': 2211264, 'steps': 11516, 'loss/train': 2.041748046875} -11/06/2021 22:50:34 - INFO - __main__ - Step 11518: {'lr': 0.0004949159599052614, 'samples': 2211456, 'steps': 11517, 'loss/train': 1.993459939956665} -11/06/2021 22:50:34 - INFO - __main__ - Step 11519: {'lr': 0.0004949148950737978, 'samples': 2211648, 'steps': 11518, 'loss/train': 1.6282458305358887} -11/06/2021 22:50:35 - INFO - __main__ - Step 11520: {'lr': 0.0004949138301319793, 'samples': 2211840, 'steps': 11519, 'loss/train': 1.2587100267410278} -11/06/2021 22:50:35 - INFO - __main__ - Step 11521: {'lr': 0.0004949127650798063, 'samples': 2212032, 'steps': 11520, 'loss/train': 1.619840145111084} -11/06/2021 22:50:36 - INFO - __main__ - Step 11522: {'lr': 0.0004949116999172795, 'samples': 2212224, 'steps': 11521, 'loss/train': 1.572475790977478} -11/06/2021 22:50:36 - INFO - __main__ - Step 11523: {'lr': 0.0004949106346443992, 'samples': 2212416, 'steps': 11522, 'loss/train': 1.6941105127334595} -11/06/2021 22:50:37 - INFO - __main__ - Step 11524: {'lr': 0.0004949095692611661, 'samples': 2212608, 'steps': 11523, 'loss/train': 1.9662777185440063} -11/06/2021 22:50:37 - INFO - __main__ - Step 11525: {'lr': 0.0004949085037675803, 'samples': 2212800, 'steps': 11524, 'loss/train': 1.7247838973999023} -11/06/2021 22:50:37 - INFO - __main__ - Step 11526: {'lr': 0.0004949074381636427, 'samples': 2212992, 'steps': 11525, 'loss/train': 1.9012329578399658} -11/06/2021 22:50:38 - INFO - __main__ - Step 11527: {'lr': 0.0004949063724493534, 'samples': 2213184, 'steps': 11526, 'loss/train': 1.9752020835876465} -11/06/2021 22:50:39 - INFO - __main__ - Step 11528: {'lr': 0.0004949053066247133, 'samples': 2213376, 'steps': 11527, 'loss/train': 1.4446111917495728} -11/06/2021 22:50:39 - INFO - __main__ - Step 11529: {'lr': 0.0004949042406897225, 'samples': 2213568, 'steps': 11528, 'loss/train': 1.739598274230957} -11/06/2021 22:50:40 - INFO - __main__ - Step 11530: {'lr': 0.0004949031746443816, 'samples': 2213760, 'steps': 11529, 'loss/train': 1.8068318367004395} -11/06/2021 22:50:40 - INFO - __main__ - Step 11531: {'lr': 0.0004949021084886912, 'samples': 2213952, 'steps': 11530, 'loss/train': 1.7446298599243164} -11/06/2021 22:50:41 - INFO - __main__ - Step 11532: {'lr': 0.0004949010422226517, 'samples': 2214144, 'steps': 11531, 'loss/train': 1.2922008037567139} -11/06/2021 22:50:41 - INFO - __main__ - Step 11533: {'lr': 0.0004948999758462634, 'samples': 2214336, 'steps': 11532, 'loss/train': 2.062342882156372} -11/06/2021 22:50:42 - INFO - __main__ - Step 11534: {'lr': 0.000494898909359527, 'samples': 2214528, 'steps': 11533, 'loss/train': 1.4486849308013916} -11/06/2021 22:50:42 - INFO - __main__ - Step 11535: {'lr': 0.0004948978427624431, 'samples': 2214720, 'steps': 11534, 'loss/train': 1.7897515296936035} -11/06/2021 22:50:42 - INFO - __main__ - Step 11536: {'lr': 0.0004948967760550119, 'samples': 2214912, 'steps': 11535, 'loss/train': 1.818204402923584} -11/06/2021 22:50:43 - INFO - __main__ - Step 11537: {'lr': 0.000494895709237234, 'samples': 2215104, 'steps': 11536, 'loss/train': 1.166475534439087} -11/06/2021 22:50:44 - INFO - __main__ - Step 11538: {'lr': 0.0004948946423091099, 'samples': 2215296, 'steps': 11537, 'loss/train': 1.8267381191253662} -11/06/2021 22:50:44 - INFO - __main__ - Step 11539: {'lr': 0.0004948935752706401, 'samples': 2215488, 'steps': 11538, 'loss/train': 2.1393001079559326} -11/06/2021 22:50:44 - INFO - __main__ - Step 11540: {'lr': 0.0004948925081218248, 'samples': 2215680, 'steps': 11539, 'loss/train': 1.0833170413970947} -11/06/2021 22:50:45 - INFO - __main__ - Step 11541: {'lr': 0.000494891440862665, 'samples': 2215872, 'steps': 11540, 'loss/train': 1.8711026906967163} -11/06/2021 22:50:46 - INFO - __main__ - Step 11542: {'lr': 0.0004948903734931608, 'samples': 2216064, 'steps': 11541, 'loss/train': 1.5871480703353882} -11/06/2021 22:50:46 - INFO - __main__ - Step 11543: {'lr': 0.0004948893060133128, 'samples': 2216256, 'steps': 11542, 'loss/train': 1.5107953548431396} -11/06/2021 22:50:47 - INFO - __main__ - Step 11544: {'lr': 0.0004948882384231213, 'samples': 2216448, 'steps': 11543, 'loss/train': 1.1852807998657227} -11/06/2021 22:50:47 - INFO - __main__ - Step 11545: {'lr': 0.0004948871707225871, 'samples': 2216640, 'steps': 11544, 'loss/train': 1.8642654418945312} -11/06/2021 22:50:47 - INFO - __main__ - Step 11546: {'lr': 0.0004948861029117104, 'samples': 2216832, 'steps': 11545, 'loss/train': 1.524583339691162} -11/06/2021 22:50:48 - INFO - __main__ - Step 11547: {'lr': 0.0004948850349904919, 'samples': 2217024, 'steps': 11546, 'loss/train': 1.7309693098068237} -11/06/2021 22:50:49 - INFO - __main__ - Step 11548: {'lr': 0.0004948839669589319, 'samples': 2217216, 'steps': 11547, 'loss/train': 1.4048861265182495} -11/06/2021 22:50:49 - INFO - __main__ - Step 11549: {'lr': 0.000494882898817031, 'samples': 2217408, 'steps': 11548, 'loss/train': 1.8817989826202393} -11/06/2021 22:50:49 - INFO - __main__ - Step 11550: {'lr': 0.0004948818305647897, 'samples': 2217600, 'steps': 11549, 'loss/train': 1.4648607969284058} -11/06/2021 22:50:50 - INFO - __main__ - Step 11551: {'lr': 0.0004948807622022083, 'samples': 2217792, 'steps': 11550, 'loss/train': 2.3621954917907715} -11/06/2021 22:50:50 - INFO - __main__ - Step 11552: {'lr': 0.0004948796937292875, 'samples': 2217984, 'steps': 11551, 'loss/train': 1.87119722366333} -11/06/2021 22:50:51 - INFO - __main__ - Step 11553: {'lr': 0.0004948786251460277, 'samples': 2218176, 'steps': 11552, 'loss/train': 2.0248570442199707} -11/06/2021 22:50:51 - INFO - __main__ - Step 11554: {'lr': 0.0004948775564524294, 'samples': 2218368, 'steps': 11553, 'loss/train': 2.0253686904907227} -11/06/2021 22:50:52 - INFO - __main__ - Step 11555: {'lr': 0.000494876487648493, 'samples': 2218560, 'steps': 11554, 'loss/train': 1.359278917312622} -11/06/2021 22:50:52 - INFO - __main__ - Step 11556: {'lr': 0.0004948754187342189, 'samples': 2218752, 'steps': 11555, 'loss/train': 2.02559757232666} -11/06/2021 22:50:52 - INFO - __main__ - Step 11557: {'lr': 0.0004948743497096079, 'samples': 2218944, 'steps': 11556, 'loss/train': 1.019589900970459} -11/06/2021 22:50:54 - INFO - __main__ - Step 11558: {'lr': 0.0004948732805746604, 'samples': 2219136, 'steps': 11557, 'loss/train': 1.860040545463562} -11/06/2021 22:50:54 - INFO - __main__ - Step 11559: {'lr': 0.0004948722113293766, 'samples': 2219328, 'steps': 11558, 'loss/train': 1.786012053489685} -11/06/2021 22:50:54 - INFO - __main__ - Step 11560: {'lr': 0.000494871141973757, 'samples': 2219520, 'steps': 11559, 'loss/train': 1.9296960830688477} -11/06/2021 22:50:55 - INFO - __main__ - Step 11561: {'lr': 0.0004948700725078025, 'samples': 2219712, 'steps': 11560, 'loss/train': 1.883889079093933} -11/06/2021 22:50:55 - INFO - __main__ - Step 11562: {'lr': 0.0004948690029315133, 'samples': 2219904, 'steps': 11561, 'loss/train': 1.7466262578964233} -11/06/2021 22:50:56 - INFO - __main__ - Step 11563: {'lr': 0.0004948679332448899, 'samples': 2220096, 'steps': 11562, 'loss/train': 1.7426663637161255} -11/06/2021 22:50:57 - INFO - __main__ - Step 11564: {'lr': 0.0004948668634479327, 'samples': 2220288, 'steps': 11563, 'loss/train': 2.0808141231536865} -11/06/2021 22:50:57 - INFO - __main__ - Step 11565: {'lr': 0.0004948657935406423, 'samples': 2220480, 'steps': 11564, 'loss/train': 1.635694980621338} -11/06/2021 22:50:57 - INFO - __main__ - Step 11566: {'lr': 0.0004948647235230192, 'samples': 2220672, 'steps': 11565, 'loss/train': 1.6016157865524292} -11/06/2021 22:50:58 - INFO - __main__ - Step 11567: {'lr': 0.0004948636533950638, 'samples': 2220864, 'steps': 11566, 'loss/train': 1.8231465816497803} -11/06/2021 22:50:59 - INFO - __main__ - Step 11568: {'lr': 0.0004948625831567766, 'samples': 2221056, 'steps': 11567, 'loss/train': 1.6762038469314575} -11/06/2021 22:50:59 - INFO - __main__ - Step 11569: {'lr': 0.000494861512808158, 'samples': 2221248, 'steps': 11568, 'loss/train': 1.9984252452850342} -11/06/2021 22:50:59 - INFO - __main__ - Step 11570: {'lr': 0.0004948604423492088, 'samples': 2221440, 'steps': 11569, 'loss/train': 1.8539700508117676} -11/06/2021 22:51:00 - INFO - __main__ - Step 11571: {'lr': 0.0004948593717799292, 'samples': 2221632, 'steps': 11570, 'loss/train': 1.6391667127609253} -11/06/2021 22:51:00 - INFO - __main__ - Step 11572: {'lr': 0.0004948583011003196, 'samples': 2221824, 'steps': 11571, 'loss/train': 1.7608556747436523} -11/06/2021 22:51:00 - INFO - __main__ - Step 11573: {'lr': 0.0004948572303103808, 'samples': 2222016, 'steps': 11572, 'loss/train': 1.8692219257354736} -11/06/2021 22:51:01 - INFO - __main__ - Step 11574: {'lr': 0.0004948561594101129, 'samples': 2222208, 'steps': 11573, 'loss/train': 1.743513584136963} -11/06/2021 22:51:02 - INFO - __main__ - Step 11575: {'lr': 0.0004948550883995168, 'samples': 2222400, 'steps': 11574, 'loss/train': 1.3404990434646606} -11/06/2021 22:51:02 - INFO - __main__ - Step 11576: {'lr': 0.0004948540172785927, 'samples': 2222592, 'steps': 11575, 'loss/train': 1.5622731447219849} -11/06/2021 22:51:02 - INFO - __main__ - Step 11577: {'lr': 0.0004948529460473412, 'samples': 2222784, 'steps': 11576, 'loss/train': 1.3603805303573608} -11/06/2021 22:51:03 - INFO - __main__ - Step 11578: {'lr': 0.0004948518747057626, 'samples': 2222976, 'steps': 11577, 'loss/train': 1.4765523672103882} -11/06/2021 22:51:04 - INFO - __main__ - Step 11579: {'lr': 0.0004948508032538578, 'samples': 2223168, 'steps': 11578, 'loss/train': 1.918787956237793} -11/06/2021 22:51:04 - INFO - __main__ - Step 11580: {'lr': 0.0004948497316916267, 'samples': 2223360, 'steps': 11579, 'loss/train': 2.0067150592803955} -11/06/2021 22:51:04 - INFO - __main__ - Step 11581: {'lr': 0.0004948486600190702, 'samples': 2223552, 'steps': 11580, 'loss/train': 1.6319156885147095} -11/06/2021 22:51:05 - INFO - __main__ - Step 11582: {'lr': 0.0004948475882361888, 'samples': 2223744, 'steps': 11581, 'loss/train': 1.4225183725357056} -11/06/2021 22:51:05 - INFO - __main__ - Step 11583: {'lr': 0.0004948465163429828, 'samples': 2223936, 'steps': 11582, 'loss/train': 1.5520676374435425} -11/06/2021 22:51:06 - INFO - __main__ - Step 11584: {'lr': 0.0004948454443394527, 'samples': 2224128, 'steps': 11583, 'loss/train': 1.5501137971878052} -11/06/2021 22:51:07 - INFO - __main__ - Step 11585: {'lr': 0.000494844372225599, 'samples': 2224320, 'steps': 11584, 'loss/train': 1.650390625} -11/06/2021 22:51:07 - INFO - __main__ - Step 11586: {'lr': 0.0004948433000014222, 'samples': 2224512, 'steps': 11585, 'loss/train': 1.4051388502120972} -11/06/2021 22:51:07 - INFO - __main__ - Step 11587: {'lr': 0.0004948422276669228, 'samples': 2224704, 'steps': 11586, 'loss/train': 1.91586434841156} -11/06/2021 22:51:08 - INFO - __main__ - Step 11588: {'lr': 0.0004948411552221012, 'samples': 2224896, 'steps': 11587, 'loss/train': 2.1239876747131348} -11/06/2021 22:51:09 - INFO - __main__ - Step 11589: {'lr': 0.000494840082666958, 'samples': 2225088, 'steps': 11588, 'loss/train': 1.9688409566879272} -11/06/2021 22:51:09 - INFO - __main__ - Step 11590: {'lr': 0.0004948390100014937, 'samples': 2225280, 'steps': 11589, 'loss/train': 1.567671775817871} -11/06/2021 22:51:09 - INFO - __main__ - Step 11591: {'lr': 0.0004948379372257086, 'samples': 2225472, 'steps': 11590, 'loss/train': 1.2471174001693726} -11/06/2021 22:51:10 - INFO - __main__ - Step 11592: {'lr': 0.0004948368643396035, 'samples': 2225664, 'steps': 11591, 'loss/train': 1.732541799545288} -11/06/2021 22:51:10 - INFO - __main__ - Step 11593: {'lr': 0.0004948357913431786, 'samples': 2225856, 'steps': 11592, 'loss/train': 1.8311717510223389} -11/06/2021 22:51:11 - INFO - __main__ - Step 11594: {'lr': 0.0004948347182364344, 'samples': 2226048, 'steps': 11593, 'loss/train': 2.0419249534606934} -11/06/2021 22:51:11 - INFO - __main__ - Step 11595: {'lr': 0.0004948336450193715, 'samples': 2226240, 'steps': 11594, 'loss/train': 0.42051059007644653} -11/06/2021 22:51:12 - INFO - __main__ - Step 11596: {'lr': 0.0004948325716919904, 'samples': 2226432, 'steps': 11595, 'loss/train': 2.2684004306793213} -11/06/2021 22:51:12 - INFO - __main__ - Step 11597: {'lr': 0.0004948314982542914, 'samples': 2226624, 'steps': 11596, 'loss/train': 1.7309365272521973} -11/06/2021 22:51:13 - INFO - __main__ - Step 11598: {'lr': 0.0004948304247062752, 'samples': 2226816, 'steps': 11597, 'loss/train': 1.4194977283477783} -11/06/2021 22:51:14 - INFO - __main__ - Step 11599: {'lr': 0.0004948293510479421, 'samples': 2227008, 'steps': 11598, 'loss/train': 0.8019549250602722} -11/06/2021 22:51:14 - INFO - __main__ - Step 11600: {'lr': 0.0004948282772792927, 'samples': 2227200, 'steps': 11599, 'loss/train': 1.8629350662231445} -11/06/2021 22:51:14 - INFO - __main__ - Step 11601: {'lr': 0.0004948272034003275, 'samples': 2227392, 'steps': 11600, 'loss/train': 1.8861653804779053} -11/06/2021 22:51:15 - INFO - __main__ - Step 11602: {'lr': 0.000494826129411047, 'samples': 2227584, 'steps': 11601, 'loss/train': 1.1293734312057495} -11/06/2021 22:51:15 - INFO - __main__ - Step 11603: {'lr': 0.0004948250553114516, 'samples': 2227776, 'steps': 11602, 'loss/train': 1.6663720607757568} -11/06/2021 22:51:15 - INFO - __main__ - Step 11604: {'lr': 0.0004948239811015416, 'samples': 2227968, 'steps': 11603, 'loss/train': 1.6033754348754883} -11/06/2021 22:51:16 - INFO - __main__ - Step 11605: {'lr': 0.0004948229067813179, 'samples': 2228160, 'steps': 11604, 'loss/train': 1.3643414974212646} -11/06/2021 22:51:17 - INFO - __main__ - Step 11606: {'lr': 0.0004948218323507807, 'samples': 2228352, 'steps': 11605, 'loss/train': 2.118734836578369} -11/06/2021 22:51:17 - INFO - __main__ - Step 11607: {'lr': 0.0004948207578099306, 'samples': 2228544, 'steps': 11606, 'loss/train': 1.5554416179656982} -11/06/2021 22:51:17 - INFO - __main__ - Step 11608: {'lr': 0.000494819683158768, 'samples': 2228736, 'steps': 11607, 'loss/train': 1.433336615562439} -11/06/2021 22:51:18 - INFO - __main__ - Step 11609: {'lr': 0.0004948186083972934, 'samples': 2228928, 'steps': 11608, 'loss/train': 1.552068829536438} -11/06/2021 22:51:19 - INFO - __main__ - Step 11610: {'lr': 0.0004948175335255075, 'samples': 2229120, 'steps': 11609, 'loss/train': 1.240715503692627} -11/06/2021 22:51:19 - INFO - __main__ - Step 11611: {'lr': 0.0004948164585434104, 'samples': 2229312, 'steps': 11610, 'loss/train': 1.7166132926940918} -11/06/2021 22:51:20 - INFO - __main__ - Step 11612: {'lr': 0.0004948153834510028, 'samples': 2229504, 'steps': 11611, 'loss/train': 1.7382307052612305} -11/06/2021 22:51:20 - INFO - __main__ - Step 11613: {'lr': 0.0004948143082482852, 'samples': 2229696, 'steps': 11612, 'loss/train': 1.9601466655731201} -11/06/2021 22:51:20 - INFO - __main__ - Step 11614: {'lr': 0.0004948132329352582, 'samples': 2229888, 'steps': 11613, 'loss/train': 1.7500718832015991} -11/06/2021 22:51:21 - INFO - __main__ - Step 11615: {'lr': 0.0004948121575119219, 'samples': 2230080, 'steps': 11614, 'loss/train': 5.872844696044922} -11/06/2021 22:51:22 - INFO - __main__ - Step 11616: {'lr': 0.0004948110819782771, 'samples': 2230272, 'steps': 11615, 'loss/train': 1.6911870241165161} -11/06/2021 22:51:22 - INFO - __main__ - Step 11617: {'lr': 0.0004948100063343243, 'samples': 2230464, 'steps': 11616, 'loss/train': 1.594088077545166} -11/06/2021 22:51:22 - INFO - __main__ - Step 11618: {'lr': 0.0004948089305800638, 'samples': 2230656, 'steps': 11617, 'loss/train': 1.9734327793121338} -11/06/2021 22:51:23 - INFO - __main__ - Step 11619: {'lr': 0.0004948078547154962, 'samples': 2230848, 'steps': 11618, 'loss/train': 1.6274333000183105} -11/06/2021 22:51:24 - INFO - __main__ - Step 11620: {'lr': 0.0004948067787406219, 'samples': 2231040, 'steps': 11619, 'loss/train': 2.051081418991089} -11/06/2021 22:51:24 - INFO - __main__ - Step 11621: {'lr': 0.0004948057026554415, 'samples': 2231232, 'steps': 11620, 'loss/train': 1.4982271194458008} -11/06/2021 22:51:24 - INFO - __main__ - Step 11622: {'lr': 0.0004948046264599554, 'samples': 2231424, 'steps': 11621, 'loss/train': 1.4409050941467285} -11/06/2021 22:51:25 - INFO - __main__ - Step 11623: {'lr': 0.0004948035501541641, 'samples': 2231616, 'steps': 11622, 'loss/train': 2.061194658279419} -11/06/2021 22:51:25 - INFO - __main__ - Step 11624: {'lr': 0.0004948024737380681, 'samples': 2231808, 'steps': 11623, 'loss/train': 1.7897642850875854} -11/06/2021 22:51:26 - INFO - __main__ - Step 11625: {'lr': 0.000494801397211668, 'samples': 2232000, 'steps': 11624, 'loss/train': 1.5584590435028076} -11/06/2021 22:51:27 - INFO - __main__ - Step 11626: {'lr': 0.000494800320574964, 'samples': 2232192, 'steps': 11625, 'loss/train': 1.4107680320739746} -11/06/2021 22:51:27 - INFO - __main__ - Step 11627: {'lr': 0.0004947992438279568, 'samples': 2232384, 'steps': 11626, 'loss/train': 1.7100175619125366} -11/06/2021 22:51:27 - INFO - __main__ - Step 11628: {'lr': 0.0004947981669706469, 'samples': 2232576, 'steps': 11627, 'loss/train': 1.3465707302093506} -11/06/2021 22:51:28 - INFO - __main__ - Step 11629: {'lr': 0.0004947970900030346, 'samples': 2232768, 'steps': 11628, 'loss/train': 1.6569414138793945} -11/06/2021 22:51:28 - INFO - __main__ - Step 11630: {'lr': 0.0004947960129251206, 'samples': 2232960, 'steps': 11629, 'loss/train': 1.8013361692428589} -11/06/2021 22:51:29 - INFO - __main__ - Step 11631: {'lr': 0.0004947949357369054, 'samples': 2233152, 'steps': 11630, 'loss/train': 1.4865167140960693} -11/06/2021 22:51:29 - INFO - __main__ - Step 11632: {'lr': 0.0004947938584383892, 'samples': 2233344, 'steps': 11631, 'loss/train': 2.1401309967041016} -11/06/2021 22:51:30 - INFO - __main__ - Step 11633: {'lr': 0.0004947927810295728, 'samples': 2233536, 'steps': 11632, 'loss/train': 1.6527354717254639} -11/06/2021 22:51:30 - INFO - __main__ - Step 11634: {'lr': 0.0004947917035104564, 'samples': 2233728, 'steps': 11633, 'loss/train': 1.9105935096740723} -11/06/2021 22:51:30 - INFO - __main__ - Step 11635: {'lr': 0.0004947906258810407, 'samples': 2233920, 'steps': 11634, 'loss/train': 1.906631350517273} -11/06/2021 22:51:31 - INFO - __main__ - Step 11636: {'lr': 0.0004947895481413262, 'samples': 2234112, 'steps': 11635, 'loss/train': 2.1798081398010254} -11/06/2021 22:51:32 - INFO - __main__ - Step 11637: {'lr': 0.0004947884702913133, 'samples': 2234304, 'steps': 11636, 'loss/train': 1.9816797971725464} -11/06/2021 22:51:32 - INFO - __main__ - Step 11638: {'lr': 0.0004947873923310024, 'samples': 2234496, 'steps': 11637, 'loss/train': 1.7533513307571411} -11/06/2021 22:51:32 - INFO - __main__ - Step 11639: {'lr': 0.0004947863142603941, 'samples': 2234688, 'steps': 11638, 'loss/train': 1.5233229398727417} -11/06/2021 22:51:33 - INFO - __main__ - Step 11640: {'lr': 0.0004947852360794889, 'samples': 2234880, 'steps': 11639, 'loss/train': 1.628521203994751} -11/06/2021 22:51:34 - INFO - __main__ - Step 11641: {'lr': 0.0004947841577882873, 'samples': 2235072, 'steps': 11640, 'loss/train': 1.8481824398040771} -11/06/2021 22:51:34 - INFO - __main__ - Step 11642: {'lr': 0.0004947830793867896, 'samples': 2235264, 'steps': 11641, 'loss/train': 2.2054293155670166} -11/06/2021 22:51:34 - INFO - __main__ - Step 11643: {'lr': 0.0004947820008749965, 'samples': 2235456, 'steps': 11642, 'loss/train': 1.8366459608078003} -11/06/2021 22:51:35 - INFO - __main__ - Step 11644: {'lr': 0.0004947809222529084, 'samples': 2235648, 'steps': 11643, 'loss/train': 1.237697720527649} -11/06/2021 22:51:35 - INFO - __main__ - Step 11645: {'lr': 0.0004947798435205258, 'samples': 2235840, 'steps': 11644, 'loss/train': 1.8298448324203491} -11/06/2021 22:51:36 - INFO - __main__ - Step 11646: {'lr': 0.0004947787646778491, 'samples': 2236032, 'steps': 11645, 'loss/train': 1.7138854265213013} -11/06/2021 22:51:36 - INFO - __main__ - Step 11647: {'lr': 0.0004947776857248791, 'samples': 2236224, 'steps': 11646, 'loss/train': 1.7913033962249756} -11/06/2021 22:51:37 - INFO - __main__ - Step 11648: {'lr': 0.0004947766066616157, 'samples': 2236416, 'steps': 11647, 'loss/train': 1.7357981204986572} -11/06/2021 22:51:37 - INFO - __main__ - Step 11649: {'lr': 0.00049477552748806, 'samples': 2236608, 'steps': 11648, 'loss/train': 1.6491725444793701} -11/06/2021 22:51:38 - INFO - __main__ - Step 11650: {'lr': 0.0004947744482042122, 'samples': 2236800, 'steps': 11649, 'loss/train': 1.3429278135299683} -11/06/2021 22:51:38 - INFO - __main__ - Step 11651: {'lr': 0.0004947733688100728, 'samples': 2236992, 'steps': 11650, 'loss/train': 1.4097791910171509} -11/06/2021 22:51:39 - INFO - __main__ - Step 11652: {'lr': 0.0004947722893056423, 'samples': 2237184, 'steps': 11651, 'loss/train': 1.9435794353485107} -11/06/2021 22:51:39 - INFO - __main__ - Step 11653: {'lr': 0.0004947712096909211, 'samples': 2237376, 'steps': 11652, 'loss/train': 1.272664189338684} -11/06/2021 22:51:40 - INFO - __main__ - Step 11654: {'lr': 0.0004947701299659097, 'samples': 2237568, 'steps': 11653, 'loss/train': 1.6220483779907227} -11/06/2021 22:51:40 - INFO - __main__ - Step 11655: {'lr': 0.0004947690501306088, 'samples': 2237760, 'steps': 11654, 'loss/train': 2.2113709449768066} -11/06/2021 22:51:40 - INFO - __main__ - Step 11656: {'lr': 0.0004947679701850187, 'samples': 2237952, 'steps': 11655, 'loss/train': 1.6100585460662842} -11/06/2021 22:51:41 - INFO - __main__ - Step 11657: {'lr': 0.00049476689012914, 'samples': 2238144, 'steps': 11656, 'loss/train': 1.5602444410324097} -11/06/2021 22:51:42 - INFO - __main__ - Step 11658: {'lr': 0.0004947658099629731, 'samples': 2238336, 'steps': 11657, 'loss/train': 1.4081251621246338} -11/06/2021 22:51:42 - INFO - __main__ - Step 11659: {'lr': 0.0004947647296865184, 'samples': 2238528, 'steps': 11658, 'loss/train': 1.445473074913025} -11/06/2021 22:51:42 - INFO - __main__ - Step 11660: {'lr': 0.0004947636492997765, 'samples': 2238720, 'steps': 11659, 'loss/train': 1.6339030265808105} -11/06/2021 22:51:43 - INFO - __main__ - Step 11661: {'lr': 0.0004947625688027479, 'samples': 2238912, 'steps': 11660, 'loss/train': 1.8317729234695435} -11/06/2021 22:51:44 - INFO - __main__ - Step 11662: {'lr': 0.0004947614881954332, 'samples': 2239104, 'steps': 11661, 'loss/train': 1.262568712234497} -11/06/2021 22:51:44 - INFO - __main__ - Step 11663: {'lr': 0.0004947604074778325, 'samples': 2239296, 'steps': 11662, 'loss/train': 1.5094019174575806} -11/06/2021 22:51:45 - INFO - __main__ - Step 11664: {'lr': 0.0004947593266499468, 'samples': 2239488, 'steps': 11663, 'loss/train': 1.4688637256622314} -11/06/2021 22:51:45 - INFO - __main__ - Step 11665: {'lr': 0.0004947582457117762, 'samples': 2239680, 'steps': 11664, 'loss/train': 2.3043243885040283} -11/06/2021 22:51:45 - INFO - __main__ - Step 11666: {'lr': 0.0004947571646633214, 'samples': 2239872, 'steps': 11665, 'loss/train': 1.4841505289077759} -11/06/2021 22:51:46 - INFO - __main__ - Step 11667: {'lr': 0.0004947560835045826, 'samples': 2240064, 'steps': 11666, 'loss/train': 1.7168904542922974} -11/06/2021 22:51:47 - INFO - __main__ - Step 11668: {'lr': 0.0004947550022355606, 'samples': 2240256, 'steps': 11667, 'loss/train': 1.6431477069854736} -11/06/2021 22:51:47 - INFO - __main__ - Step 11669: {'lr': 0.0004947539208562558, 'samples': 2240448, 'steps': 11668, 'loss/train': 0.3917955160140991} -11/06/2021 22:51:47 - INFO - __main__ - Step 11670: {'lr': 0.0004947528393666686, 'samples': 2240640, 'steps': 11669, 'loss/train': 1.4626667499542236} -11/06/2021 22:51:48 - INFO - __main__ - Step 11671: {'lr': 0.0004947517577667996, 'samples': 2240832, 'steps': 11670, 'loss/train': 1.9244534969329834} -11/06/2021 22:51:48 - INFO - __main__ - Step 11672: {'lr': 0.0004947506760566492, 'samples': 2241024, 'steps': 11671, 'loss/train': 1.6915565729141235} -11/06/2021 22:51:49 - INFO - __main__ - Step 11673: {'lr': 0.0004947495942362179, 'samples': 2241216, 'steps': 11672, 'loss/train': 1.8372933864593506} -11/06/2021 22:51:49 - INFO - __main__ - Step 11674: {'lr': 0.0004947485123055063, 'samples': 2241408, 'steps': 11673, 'loss/train': 1.7340296506881714} -11/06/2021 22:51:50 - INFO - __main__ - Step 11675: {'lr': 0.0004947474302645147, 'samples': 2241600, 'steps': 11674, 'loss/train': 2.306028127670288} -11/06/2021 22:51:50 - INFO - __main__ - Step 11676: {'lr': 0.0004947463481132438, 'samples': 2241792, 'steps': 11675, 'loss/train': 1.5373907089233398} -11/06/2021 22:51:50 - INFO - __main__ - Step 11677: {'lr': 0.0004947452658516938, 'samples': 2241984, 'steps': 11676, 'loss/train': 1.0355230569839478} -11/06/2021 22:51:52 - INFO - __main__ - Step 11678: {'lr': 0.0004947441834798655, 'samples': 2242176, 'steps': 11677, 'loss/train': 1.9624687433242798} -11/06/2021 22:51:52 - INFO - __main__ - Step 11679: {'lr': 0.0004947431009977592, 'samples': 2242368, 'steps': 11678, 'loss/train': 2.2089884281158447} -11/06/2021 22:51:52 - INFO - __main__ - Step 11680: {'lr': 0.0004947420184053755, 'samples': 2242560, 'steps': 11679, 'loss/train': 1.4249625205993652} -11/06/2021 22:51:53 - INFO - __main__ - Step 11681: {'lr': 0.0004947409357027148, 'samples': 2242752, 'steps': 11680, 'loss/train': 1.3146612644195557} -11/06/2021 22:51:53 - INFO - __main__ - Step 11682: {'lr': 0.0004947398528897775, 'samples': 2242944, 'steps': 11681, 'loss/train': 1.6115343570709229} -11/06/2021 22:51:53 - INFO - __main__ - Step 11683: {'lr': 0.0004947387699665643, 'samples': 2243136, 'steps': 11682, 'loss/train': 2.1556644439697266} -11/06/2021 22:51:54 - INFO - __main__ - Step 11684: {'lr': 0.0004947376869330755, 'samples': 2243328, 'steps': 11683, 'loss/train': 2.4655892848968506} -11/06/2021 22:51:55 - INFO - __main__ - Step 11685: {'lr': 0.0004947366037893118, 'samples': 2243520, 'steps': 11684, 'loss/train': 1.4725700616836548} -11/06/2021 22:51:55 - INFO - __main__ - Step 11686: {'lr': 0.0004947355205352735, 'samples': 2243712, 'steps': 11685, 'loss/train': 1.7428011894226074} -11/06/2021 22:51:55 - INFO - __main__ - Step 11687: {'lr': 0.0004947344371709611, 'samples': 2243904, 'steps': 11686, 'loss/train': 1.42606520652771} -11/06/2021 22:51:56 - INFO - __main__ - Step 11688: {'lr': 0.0004947333536963753, 'samples': 2244096, 'steps': 11687, 'loss/train': 1.7653391361236572} -11/06/2021 22:51:57 - INFO - __main__ - Step 11689: {'lr': 0.0004947322701115163, 'samples': 2244288, 'steps': 11688, 'loss/train': 2.0010745525360107} -11/06/2021 22:51:57 - INFO - __main__ - Step 11690: {'lr': 0.0004947311864163847, 'samples': 2244480, 'steps': 11689, 'loss/train': 1.4831074476242065} -11/06/2021 22:51:58 - INFO - __main__ - Step 11691: {'lr': 0.000494730102610981, 'samples': 2244672, 'steps': 11690, 'loss/train': 1.9865690469741821} -11/06/2021 22:51:58 - INFO - __main__ - Step 11692: {'lr': 0.0004947290186953057, 'samples': 2244864, 'steps': 11691, 'loss/train': 1.3742139339447021} -11/06/2021 22:51:58 - INFO - __main__ - Step 11693: {'lr': 0.0004947279346693594, 'samples': 2245056, 'steps': 11692, 'loss/train': 1.701667308807373} -11/06/2021 22:51:59 - INFO - __main__ - Step 11694: {'lr': 0.0004947268505331424, 'samples': 2245248, 'steps': 11693, 'loss/train': 1.9292877912521362} -11/06/2021 22:52:00 - INFO - __main__ - Step 11695: {'lr': 0.0004947257662866551, 'samples': 2245440, 'steps': 11694, 'loss/train': 2.0025382041931152} -11/06/2021 22:52:00 - INFO - __main__ - Step 11696: {'lr': 0.0004947246819298984, 'samples': 2245632, 'steps': 11695, 'loss/train': 1.10530424118042} -11/06/2021 22:52:00 - INFO - __main__ - Step 11697: {'lr': 0.0004947235974628723, 'samples': 2245824, 'steps': 11696, 'loss/train': 1.703428864479065} -11/06/2021 22:52:01 - INFO - __main__ - Step 11698: {'lr': 0.0004947225128855777, 'samples': 2246016, 'steps': 11697, 'loss/train': 1.4115582704544067} -11/06/2021 22:52:02 - INFO - __main__ - Step 11699: {'lr': 0.0004947214281980149, 'samples': 2246208, 'steps': 11698, 'loss/train': 1.6013803482055664} -11/06/2021 22:52:02 - INFO - __main__ - Step 11700: {'lr': 0.0004947203434001843, 'samples': 2246400, 'steps': 11699, 'loss/train': 0.8683410882949829} -11/06/2021 22:52:02 - INFO - __main__ - Step 11701: {'lr': 0.0004947192584920866, 'samples': 2246592, 'steps': 11700, 'loss/train': 1.931963324546814} -11/06/2021 22:52:03 - INFO - __main__ - Step 11702: {'lr': 0.000494718173473722, 'samples': 2246784, 'steps': 11701, 'loss/train': 1.411441683769226} -11/06/2021 22:52:03 - INFO - __main__ - Step 11703: {'lr': 0.0004947170883450913, 'samples': 2246976, 'steps': 11702, 'loss/train': 1.5308102369308472} -11/06/2021 22:52:04 - INFO - __main__ - Step 11704: {'lr': 0.000494716003106195, 'samples': 2247168, 'steps': 11703, 'loss/train': 2.047659158706665} -11/06/2021 22:52:05 - INFO - __main__ - Step 11705: {'lr': 0.0004947149177570332, 'samples': 2247360, 'steps': 11704, 'loss/train': 1.6442228555679321} -11/06/2021 22:52:05 - INFO - __main__ - Step 11706: {'lr': 0.0004947138322976067, 'samples': 2247552, 'steps': 11705, 'loss/train': 1.791576623916626} -11/06/2021 22:52:05 - INFO - __main__ - Step 11707: {'lr': 0.000494712746727916, 'samples': 2247744, 'steps': 11706, 'loss/train': 1.8355753421783447} -11/06/2021 22:52:06 - INFO - __main__ - Step 11708: {'lr': 0.0004947116610479614, 'samples': 2247936, 'steps': 11707, 'loss/train': 1.7016065120697021} -11/06/2021 22:52:06 - INFO - __main__ - Step 11709: {'lr': 0.0004947105752577436, 'samples': 2248128, 'steps': 11708, 'loss/train': 1.3050994873046875} -11/06/2021 22:52:07 - INFO - __main__ - Step 11710: {'lr': 0.0004947094893572629, 'samples': 2248320, 'steps': 11709, 'loss/train': 1.8479158878326416} -11/06/2021 22:52:08 - INFO - __main__ - Step 11711: {'lr': 0.00049470840334652, 'samples': 2248512, 'steps': 11710, 'loss/train': 1.892972707748413} -11/06/2021 22:52:08 - INFO - __main__ - Step 11712: {'lr': 0.0004947073172255151, 'samples': 2248704, 'steps': 11711, 'loss/train': 2.1024181842803955} -11/06/2021 22:52:08 - INFO - __main__ - Step 11713: {'lr': 0.000494706230994249, 'samples': 2248896, 'steps': 11712, 'loss/train': 1.7337501049041748} -11/06/2021 22:52:09 - INFO - __main__ - Step 11714: {'lr': 0.000494705144652722, 'samples': 2249088, 'steps': 11713, 'loss/train': 2.053222894668579} -11/06/2021 22:52:10 - INFO - __main__ - Step 11715: {'lr': 0.0004947040582009346, 'samples': 2249280, 'steps': 11714, 'loss/train': 1.5705617666244507} -11/06/2021 22:52:10 - INFO - __main__ - Step 11716: {'lr': 0.0004947029716388875, 'samples': 2249472, 'steps': 11715, 'loss/train': 1.1817337274551392} -11/06/2021 22:52:11 - INFO - __main__ - Step 11717: {'lr': 0.0004947018849665809, 'samples': 2249664, 'steps': 11716, 'loss/train': 1.7236446142196655} -11/06/2021 22:52:11 - INFO - __main__ - Step 11718: {'lr': 0.0004947007981840153, 'samples': 2249856, 'steps': 11717, 'loss/train': 1.561780571937561} -11/06/2021 22:52:11 - INFO - __main__ - Step 11719: {'lr': 0.0004946997112911914, 'samples': 2250048, 'steps': 11718, 'loss/train': 1.9812180995941162} -11/06/2021 22:52:12 - INFO - __main__ - Step 11720: {'lr': 0.0004946986242881096, 'samples': 2250240, 'steps': 11719, 'loss/train': 2.1320106983184814} -11/06/2021 22:52:13 - INFO - __main__ - Step 11721: {'lr': 0.0004946975371747704, 'samples': 2250432, 'steps': 11720, 'loss/train': 2.156588315963745} -11/06/2021 22:52:13 - INFO - __main__ - Step 11722: {'lr': 0.0004946964499511742, 'samples': 2250624, 'steps': 11721, 'loss/train': 1.9945005178451538} -11/06/2021 22:52:13 - INFO - __main__ - Step 11723: {'lr': 0.0004946953626173216, 'samples': 2250816, 'steps': 11722, 'loss/train': 1.00374174118042} -11/06/2021 22:52:14 - INFO - __main__ - Step 11724: {'lr': 0.0004946942751732129, 'samples': 2251008, 'steps': 11723, 'loss/train': 1.2549642324447632} -11/06/2021 22:52:14 - INFO - __main__ - Step 11725: {'lr': 0.000494693187618849, 'samples': 2251200, 'steps': 11724, 'loss/train': 1.6982334852218628} -11/06/2021 22:52:15 - INFO - __main__ - Step 11726: {'lr': 0.0004946920999542299, 'samples': 2251392, 'steps': 11725, 'loss/train': 5.76206636428833} -11/06/2021 22:52:15 - INFO - __main__ - Step 11727: {'lr': 0.0004946910121793564, 'samples': 2251584, 'steps': 11726, 'loss/train': 1.8769844770431519} -11/06/2021 22:52:16 - INFO - __main__ - Step 11728: {'lr': 0.0004946899242942289, 'samples': 2251776, 'steps': 11727, 'loss/train': 1.1642225980758667} -11/06/2021 22:52:16 - INFO - __main__ - Step 11729: {'lr': 0.000494688836298848, 'samples': 2251968, 'steps': 11728, 'loss/train': 1.9926396608352661} -11/06/2021 22:52:16 - INFO - __main__ - Step 11730: {'lr': 0.0004946877481932139, 'samples': 2252160, 'steps': 11729, 'loss/train': 1.9353605508804321} -11/06/2021 22:52:17 - INFO - __main__ - Step 11731: {'lr': 0.0004946866599773274, 'samples': 2252352, 'steps': 11730, 'loss/train': 1.884238839149475} -11/06/2021 22:52:18 - INFO - __main__ - Step 11732: {'lr': 0.0004946855716511888, 'samples': 2252544, 'steps': 11731, 'loss/train': 2.3865725994110107} -11/06/2021 22:52:18 - INFO - __main__ - Step 11733: {'lr': 0.0004946844832147987, 'samples': 2252736, 'steps': 11732, 'loss/train': 1.7648876905441284} -11/06/2021 22:52:18 - INFO - __main__ - Step 11734: {'lr': 0.0004946833946681575, 'samples': 2252928, 'steps': 11733, 'loss/train': 1.9588221311569214} -11/06/2021 22:52:19 - INFO - __main__ - Step 11735: {'lr': 0.0004946823060112658, 'samples': 2253120, 'steps': 11734, 'loss/train': 1.0032458305358887} -11/06/2021 22:52:20 - INFO - __main__ - Step 11736: {'lr': 0.000494681217244124, 'samples': 2253312, 'steps': 11735, 'loss/train': 1.9610958099365234} -11/06/2021 22:52:20 - INFO - __main__ - Step 11737: {'lr': 0.0004946801283667326, 'samples': 2253504, 'steps': 11736, 'loss/train': 1.6213114261627197} -11/06/2021 22:52:21 - INFO - __main__ - Step 11738: {'lr': 0.0004946790393790921, 'samples': 2253696, 'steps': 11737, 'loss/train': 1.8059797286987305} -11/06/2021 22:52:21 - INFO - __main__ - Step 11739: {'lr': 0.0004946779502812031, 'samples': 2253888, 'steps': 11738, 'loss/train': 2.2257320880889893} -11/06/2021 22:52:21 - INFO - __main__ - Step 11740: {'lr': 0.0004946768610730659, 'samples': 2254080, 'steps': 11739, 'loss/train': 1.6921347379684448} -11/06/2021 22:52:22 - INFO - __main__ - Step 11741: {'lr': 0.0004946757717546812, 'samples': 2254272, 'steps': 11740, 'loss/train': 1.7304112911224365} -11/06/2021 22:52:23 - INFO - __main__ - Step 11742: {'lr': 0.0004946746823260491, 'samples': 2254464, 'steps': 11741, 'loss/train': 0.8344317078590393} -11/06/2021 22:52:23 - INFO - __main__ - Step 11743: {'lr': 0.0004946735927871706, 'samples': 2254656, 'steps': 11742, 'loss/train': 1.438720941543579} -11/06/2021 22:52:23 - INFO - __main__ - Step 11744: {'lr': 0.0004946725031380459, 'samples': 2254848, 'steps': 11743, 'loss/train': 2.020857572555542} -11/06/2021 22:52:24 - INFO - __main__ - Step 11745: {'lr': 0.0004946714133786756, 'samples': 2255040, 'steps': 11744, 'loss/train': 1.5829726457595825} -11/06/2021 22:52:24 - INFO - __main__ - Step 11746: {'lr': 0.00049467032350906, 'samples': 2255232, 'steps': 11745, 'loss/train': 1.7040636539459229} -11/06/2021 22:52:25 - INFO - __main__ - Step 11747: {'lr': 0.0004946692335291999, 'samples': 2255424, 'steps': 11746, 'loss/train': 1.7753183841705322} -11/06/2021 22:52:26 - INFO - __main__ - Step 11748: {'lr': 0.0004946681434390955, 'samples': 2255616, 'steps': 11747, 'loss/train': 2.8313393592834473} -11/06/2021 22:52:26 - INFO - __main__ - Step 11749: {'lr': 0.0004946670532387474, 'samples': 2255808, 'steps': 11748, 'loss/train': 1.4932595491409302} -11/06/2021 22:52:26 - INFO - __main__ - Step 11750: {'lr': 0.0004946659629281561, 'samples': 2256000, 'steps': 11749, 'loss/train': 1.6414493322372437} -11/06/2021 22:52:27 - INFO - __main__ - Step 11751: {'lr': 0.0004946648725073222, 'samples': 2256192, 'steps': 11750, 'loss/train': 1.8771973848342896} -11/06/2021 22:52:27 - INFO - __main__ - Step 11752: {'lr': 0.0004946637819762459, 'samples': 2256384, 'steps': 11751, 'loss/train': 1.819173812866211} -11/06/2021 22:52:28 - INFO - __main__ - Step 11753: {'lr': 0.000494662691334928, 'samples': 2256576, 'steps': 11752, 'loss/train': 1.7248607873916626} -11/06/2021 22:52:29 - INFO - __main__ - Step 11754: {'lr': 0.0004946616005833689, 'samples': 2256768, 'steps': 11753, 'loss/train': 1.390769362449646} -11/06/2021 22:52:29 - INFO - __main__ - Step 11755: {'lr': 0.0004946605097215691, 'samples': 2256960, 'steps': 11754, 'loss/train': 1.4197173118591309} -11/06/2021 22:52:29 - INFO - __main__ - Step 11756: {'lr': 0.0004946594187495289, 'samples': 2257152, 'steps': 11755, 'loss/train': 1.846717357635498} -11/06/2021 22:52:30 - INFO - __main__ - Step 11757: {'lr': 0.0004946583276672489, 'samples': 2257344, 'steps': 11756, 'loss/train': 1.6870449781417847} -11/06/2021 22:52:31 - INFO - __main__ - Step 11758: {'lr': 0.0004946572364747298, 'samples': 2257536, 'steps': 11757, 'loss/train': 1.6424260139465332} -11/06/2021 22:52:31 - INFO - __main__ - Step 11759: {'lr': 0.0004946561451719719, 'samples': 2257728, 'steps': 11758, 'loss/train': 1.8925001621246338} -11/06/2021 22:52:32 - INFO - __main__ - Step 11760: {'lr': 0.0004946550537589757, 'samples': 2257920, 'steps': 11759, 'loss/train': 1.6655386686325073} -11/06/2021 22:52:32 - INFO - __main__ - Step 11761: {'lr': 0.0004946539622357417, 'samples': 2258112, 'steps': 11760, 'loss/train': 1.9449368715286255} -11/06/2021 22:52:32 - INFO - __main__ - Step 11762: {'lr': 0.0004946528706022703, 'samples': 2258304, 'steps': 11761, 'loss/train': 2.078275442123413} -11/06/2021 22:52:33 - INFO - __main__ - Step 11763: {'lr': 0.0004946517788585622, 'samples': 2258496, 'steps': 11762, 'loss/train': 1.4620633125305176} -11/06/2021 22:52:34 - INFO - __main__ - Step 11764: {'lr': 0.0004946506870046178, 'samples': 2258688, 'steps': 11763, 'loss/train': 1.66291344165802} -11/06/2021 22:52:34 - INFO - __main__ - Step 11765: {'lr': 0.0004946495950404375, 'samples': 2258880, 'steps': 11764, 'loss/train': 1.7311233282089233} -11/06/2021 22:52:34 - INFO - __main__ - Step 11766: {'lr': 0.0004946485029660219, 'samples': 2259072, 'steps': 11765, 'loss/train': 1.9496246576309204} -11/06/2021 22:52:35 - INFO - __main__ - Step 11767: {'lr': 0.0004946474107813715, 'samples': 2259264, 'steps': 11766, 'loss/train': 1.842336654663086} -11/06/2021 22:52:35 - INFO - __main__ - Step 11768: {'lr': 0.0004946463184864867, 'samples': 2259456, 'steps': 11767, 'loss/train': 1.8693801164627075} -11/06/2021 22:52:36 - INFO - __main__ - Step 11769: {'lr': 0.000494645226081368, 'samples': 2259648, 'steps': 11768, 'loss/train': 1.6797724962234497} -11/06/2021 22:52:36 - INFO - __main__ - Step 11770: {'lr': 0.000494644133566016, 'samples': 2259840, 'steps': 11769, 'loss/train': 1.4810084104537964} -11/06/2021 22:52:37 - INFO - __main__ - Step 11771: {'lr': 0.0004946430409404311, 'samples': 2260032, 'steps': 11770, 'loss/train': 1.5809372663497925} -11/06/2021 22:52:37 - INFO - __main__ - Step 11772: {'lr': 0.0004946419482046139, 'samples': 2260224, 'steps': 11771, 'loss/train': 1.3877747058868408} -11/06/2021 22:52:38 - INFO - __main__ - Step 11773: {'lr': 0.0004946408553585648, 'samples': 2260416, 'steps': 11772, 'loss/train': 1.1509099006652832} -11/06/2021 22:52:38 - INFO - __main__ - Step 11774: {'lr': 0.0004946397624022843, 'samples': 2260608, 'steps': 11773, 'loss/train': 2.2780723571777344} -11/06/2021 22:52:39 - INFO - __main__ - Step 11775: {'lr': 0.0004946386693357728, 'samples': 2260800, 'steps': 11774, 'loss/train': 1.5526584386825562} -11/06/2021 22:52:39 - INFO - __main__ - Step 11776: {'lr': 0.0004946375761590309, 'samples': 2260992, 'steps': 11775, 'loss/train': 2.048732280731201} -11/06/2021 22:52:39 - INFO - __main__ - Step 11777: {'lr': 0.0004946364828720592, 'samples': 2261184, 'steps': 11776, 'loss/train': 1.518662929534912} -11/06/2021 22:52:40 - INFO - __main__ - Step 11778: {'lr': 0.000494635389474858, 'samples': 2261376, 'steps': 11777, 'loss/train': 2.078202962875366} -11/06/2021 22:52:41 - INFO - __main__ - Step 11779: {'lr': 0.0004946342959674278, 'samples': 2261568, 'steps': 11778, 'loss/train': 1.6700574159622192} -11/06/2021 22:52:41 - INFO - __main__ - Step 11780: {'lr': 0.0004946332023497693, 'samples': 2261760, 'steps': 11779, 'loss/train': 2.0931074619293213} -11/06/2021 22:52:42 - INFO - __main__ - Step 11781: {'lr': 0.0004946321086218828, 'samples': 2261952, 'steps': 11780, 'loss/train': 1.8575305938720703} -11/06/2021 22:52:42 - INFO - __main__ - Step 11782: {'lr': 0.0004946310147837689, 'samples': 2262144, 'steps': 11781, 'loss/train': 1.1181639432907104} -11/06/2021 22:52:42 - INFO - __main__ - Step 11783: {'lr': 0.0004946299208354279, 'samples': 2262336, 'steps': 11782, 'loss/train': 1.7613064050674438} -11/06/2021 22:52:43 - INFO - __main__ - Step 11784: {'lr': 0.0004946288267768605, 'samples': 2262528, 'steps': 11783, 'loss/train': 1.5127317905426025} -11/06/2021 22:52:44 - INFO - __main__ - Step 11785: {'lr': 0.0004946277326080672, 'samples': 2262720, 'steps': 11784, 'loss/train': 1.9431092739105225} -11/06/2021 22:52:44 - INFO - __main__ - Step 11786: {'lr': 0.0004946266383290483, 'samples': 2262912, 'steps': 11785, 'loss/train': 2.022489547729492} -11/06/2021 22:52:44 - INFO - __main__ - Step 11787: {'lr': 0.0004946255439398045, 'samples': 2263104, 'steps': 11786, 'loss/train': 1.829660177230835} -11/06/2021 22:52:45 - INFO - __main__ - Step 11788: {'lr': 0.0004946244494403361, 'samples': 2263296, 'steps': 11787, 'loss/train': 1.7674616575241089} -11/06/2021 22:52:45 - INFO - __main__ - Step 11789: {'lr': 0.0004946233548306438, 'samples': 2263488, 'steps': 11788, 'loss/train': 1.8133692741394043} -11/06/2021 22:52:46 - INFO - __main__ - Step 11790: {'lr': 0.000494622260110728, 'samples': 2263680, 'steps': 11789, 'loss/train': 1.611851453781128} -11/06/2021 22:52:46 - INFO - __main__ - Step 11791: {'lr': 0.0004946211652805891, 'samples': 2263872, 'steps': 11790, 'loss/train': 1.1969035863876343} -11/06/2021 22:52:47 - INFO - __main__ - Step 11792: {'lr': 0.0004946200703402278, 'samples': 2264064, 'steps': 11791, 'loss/train': 2.1586251258850098} -11/06/2021 22:52:47 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 1.361173152923584} -11/06/2021 22:52:47 - INFO - __main__ - Step 11794: {'lr': 0.0004946178801288394, 'samples': 2264448, 'steps': 11793, 'loss/train': 1.3458670377731323} -11/06/2021 22:52:48 - INFO - __main__ - Step 11795: {'lr': 0.0004946167848578134, 'samples': 2264640, 'steps': 11794, 'loss/train': 1.4906079769134521} -11/06/2021 22:52:49 - INFO - __main__ - Step 11796: {'lr': 0.0004946156894765669, 'samples': 2264832, 'steps': 11795, 'loss/train': 1.776194453239441} -11/06/2021 22:52:49 - INFO - __main__ - Step 11797: {'lr': 0.0004946145939851004, 'samples': 2265024, 'steps': 11796, 'loss/train': 1.1889792680740356} -11/06/2021 22:52:49 - INFO - __main__ - Step 11798: {'lr': 0.0004946134983834142, 'samples': 2265216, 'steps': 11797, 'loss/train': 1.3798962831497192} -11/06/2021 22:52:50 - INFO - __main__ - Step 11799: {'lr': 0.0004946124026715089, 'samples': 2265408, 'steps': 11798, 'loss/train': 1.1393816471099854} -11/06/2021 22:52:51 - INFO - __main__ - Step 11800: {'lr': 0.0004946113068493851, 'samples': 2265600, 'steps': 11799, 'loss/train': 1.938144326210022} -11/06/2021 22:52:51 - INFO - __main__ - Step 11801: {'lr': 0.0004946102109170433, 'samples': 2265792, 'steps': 11800, 'loss/train': 1.085551381111145} -11/06/2021 22:52:52 - INFO - __main__ - Step 11802: {'lr': 0.0004946091148744838, 'samples': 2265984, 'steps': 11801, 'loss/train': 1.9782894849777222} -11/06/2021 22:52:52 - INFO - __main__ - Step 11803: {'lr': 0.0004946080187217072, 'samples': 2266176, 'steps': 11802, 'loss/train': 1.8065892457962036} -11/06/2021 22:52:52 - INFO - __main__ - Step 11804: {'lr': 0.0004946069224587141, 'samples': 2266368, 'steps': 11803, 'loss/train': 1.8885177373886108} -11/06/2021 22:52:53 - INFO - __main__ - Step 11805: {'lr': 0.0004946058260855049, 'samples': 2266560, 'steps': 11804, 'loss/train': 1.6581742763519287} -11/06/2021 22:52:54 - INFO - __main__ - Step 11806: {'lr': 0.00049460472960208, 'samples': 2266752, 'steps': 11805, 'loss/train': 1.8669217824935913} -11/06/2021 22:52:54 - INFO - __main__ - Step 11807: {'lr': 0.00049460363300844, 'samples': 2266944, 'steps': 11806, 'loss/train': 1.47137451171875} -11/06/2021 22:52:54 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 1.8952033519744873} -11/06/2021 22:52:55 - INFO - __main__ - Step 11809: {'lr': 0.0004946014394905167, 'samples': 2267328, 'steps': 11808, 'loss/train': 1.2856425046920776} -11/06/2021 22:52:56 - INFO - __main__ - Step 11810: {'lr': 0.0004946003425662343, 'samples': 2267520, 'steps': 11809, 'loss/train': 2.00896954536438} -11/06/2021 22:52:56 - INFO - __main__ - Step 11811: {'lr': 0.0004945992455317389, 'samples': 2267712, 'steps': 11810, 'loss/train': 1.724480390548706} -11/06/2021 22:52:56 - INFO - __main__ - Step 11812: {'lr': 0.0004945981483870307, 'samples': 2267904, 'steps': 11811, 'loss/train': 1.5671536922454834} -11/06/2021 22:52:57 - INFO - __main__ - Step 11813: {'lr': 0.0004945970511321104, 'samples': 2268096, 'steps': 11812, 'loss/train': 2.0063626766204834} -11/06/2021 22:52:57 - INFO - __main__ - Step 11814: {'lr': 0.0004945959537669784, 'samples': 2268288, 'steps': 11813, 'loss/train': 1.2561020851135254} -11/06/2021 22:52:57 - INFO - __main__ - Step 11815: {'lr': 0.0004945948562916353, 'samples': 2268480, 'steps': 11814, 'loss/train': 1.8354805707931519} -11/06/2021 22:52:59 - INFO - __main__ - Step 11816: {'lr': 0.0004945937587060815, 'samples': 2268672, 'steps': 11815, 'loss/train': 1.270841360092163} -11/06/2021 22:53:00 - INFO - __main__ - Step 11817: {'lr': 0.0004945926610103175, 'samples': 2268864, 'steps': 11816, 'loss/train': 1.2347999811172485} -11/06/2021 22:53:00 - INFO - __main__ - Step 11818: {'lr': 0.0004945915632043439, 'samples': 2269056, 'steps': 11817, 'loss/train': 1.340549349784851} -11/06/2021 22:53:00 - INFO - __main__ - Step 11819: {'lr': 0.0004945904652881611, 'samples': 2269248, 'steps': 11818, 'loss/train': 1.905003547668457} -11/06/2021 22:53:01 - INFO - __main__ - Step 11820: {'lr': 0.0004945893672617695, 'samples': 2269440, 'steps': 11819, 'loss/train': 1.818457841873169} -11/06/2021 22:53:01 - INFO - __main__ - Step 11821: {'lr': 0.0004945882691251699, 'samples': 2269632, 'steps': 11820, 'loss/train': 1.8213856220245361} -11/06/2021 22:53:02 - INFO - __main__ - Step 11822: {'lr': 0.0004945871708783625, 'samples': 2269824, 'steps': 11821, 'loss/train': 1.8481453657150269} -11/06/2021 22:53:02 - INFO - __main__ - Step 11823: {'lr': 0.0004945860725213477, 'samples': 2270016, 'steps': 11822, 'loss/train': 1.7589327096939087} -11/06/2021 22:53:03 - INFO - __main__ - Step 11824: {'lr': 0.0004945849740541265, 'samples': 2270208, 'steps': 11823, 'loss/train': 1.8017772436141968} -11/06/2021 22:53:03 - INFO - __main__ - Step 11825: {'lr': 0.000494583875476699, 'samples': 2270400, 'steps': 11824, 'loss/train': 1.8388363122940063} -11/06/2021 22:53:03 - INFO - __main__ - Step 11826: {'lr': 0.0004945827767890657, 'samples': 2270592, 'steps': 11825, 'loss/train': 1.1017407178878784} -11/06/2021 22:53:04 - INFO - __main__ - Step 11827: {'lr': 0.0004945816779912272, 'samples': 2270784, 'steps': 11826, 'loss/train': 1.1215801239013672} -11/06/2021 22:53:05 - INFO - __main__ - Step 11828: {'lr': 0.000494580579083184, 'samples': 2270976, 'steps': 11827, 'loss/train': 1.8502867221832275} -11/06/2021 22:53:05 - INFO - __main__ - Step 11829: {'lr': 0.0004945794800649366, 'samples': 2271168, 'steps': 11828, 'loss/train': 1.7619470357894897} -11/06/2021 22:53:06 - INFO - __main__ - Step 11830: {'lr': 0.0004945783809364853, 'samples': 2271360, 'steps': 11829, 'loss/train': 1.7739301919937134} -11/06/2021 22:53:06 - INFO - __main__ - Step 11831: {'lr': 0.0004945772816978309, 'samples': 2271552, 'steps': 11830, 'loss/train': 1.8250958919525146} -11/06/2021 22:53:06 - INFO - __main__ - Step 11832: {'lr': 0.0004945761823489737, 'samples': 2271744, 'steps': 11831, 'loss/train': 2.298485040664673} -11/06/2021 22:53:07 - INFO - __main__ - Step 11833: {'lr': 0.0004945750828899144, 'samples': 2271936, 'steps': 11832, 'loss/train': 1.6959924697875977} -11/06/2021 22:53:08 - INFO - __main__ - Step 11834: {'lr': 0.0004945739833206531, 'samples': 2272128, 'steps': 11833, 'loss/train': 1.4420230388641357} -11/06/2021 22:53:08 - INFO - __main__ - Step 11835: {'lr': 0.0004945728836411907, 'samples': 2272320, 'steps': 11834, 'loss/train': 1.9085041284561157} -11/06/2021 22:53:08 - INFO - __main__ - Step 11836: {'lr': 0.0004945717838515275, 'samples': 2272512, 'steps': 11835, 'loss/train': 1.7910774946212769} -11/06/2021 22:53:09 - INFO - __main__ - Step 11837: {'lr': 0.0004945706839516639, 'samples': 2272704, 'steps': 11836, 'loss/train': 0.9751549363136292} -11/06/2021 22:53:10 - INFO - __main__ - Step 11838: {'lr': 0.0004945695839416006, 'samples': 2272896, 'steps': 11837, 'loss/train': 1.1652768850326538} -11/06/2021 22:53:10 - INFO - __main__ - Step 11839: {'lr': 0.0004945684838213382, 'samples': 2273088, 'steps': 11838, 'loss/train': 2.4562861919403076} -11/06/2021 22:53:10 - INFO - __main__ - Step 11840: {'lr': 0.0004945673835908767, 'samples': 2273280, 'steps': 11839, 'loss/train': 1.785056233406067} -11/06/2021 22:53:11 - INFO - __main__ - Step 11841: {'lr': 0.0004945662832502171, 'samples': 2273472, 'steps': 11840, 'loss/train': 1.478073000907898} -11/06/2021 22:53:11 - INFO - __main__ - Step 11842: {'lr': 0.0004945651827993597, 'samples': 2273664, 'steps': 11841, 'loss/train': 1.5558642148971558} -11/06/2021 22:53:11 - INFO - __main__ - Step 11843: {'lr': 0.000494564082238305, 'samples': 2273856, 'steps': 11842, 'loss/train': 1.5626791715621948} -11/06/2021 22:53:13 - INFO - __main__ - Step 11844: {'lr': 0.0004945629815670535, 'samples': 2274048, 'steps': 11843, 'loss/train': 1.923411250114441} -11/06/2021 22:53:13 - INFO - __main__ - Step 11845: {'lr': 0.0004945618807856056, 'samples': 2274240, 'steps': 11844, 'loss/train': 1.2191367149353027} -11/06/2021 22:53:13 - INFO - __main__ - Step 11846: {'lr': 0.000494560779893962, 'samples': 2274432, 'steps': 11845, 'loss/train': 1.695072054862976} -11/06/2021 22:53:14 - INFO - __main__ - Step 11847: {'lr': 0.0004945596788921231, 'samples': 2274624, 'steps': 11846, 'loss/train': 1.8576159477233887} -11/06/2021 22:53:14 - INFO - __main__ - Step 11848: {'lr': 0.0004945585777800893, 'samples': 2274816, 'steps': 11847, 'loss/train': 1.8127880096435547} -11/06/2021 22:53:15 - INFO - __main__ - Step 11849: {'lr': 0.0004945574765578612, 'samples': 2275008, 'steps': 11848, 'loss/train': 1.4972808361053467} -11/06/2021 22:53:15 - INFO - __main__ - Step 11850: {'lr': 0.0004945563752254393, 'samples': 2275200, 'steps': 11849, 'loss/train': 1.7864632606506348} -11/06/2021 22:53:16 - INFO - __main__ - Step 11851: {'lr': 0.000494555273782824, 'samples': 2275392, 'steps': 11850, 'loss/train': 1.0610276460647583} -11/06/2021 22:53:16 - INFO - __main__ - Step 11852: {'lr': 0.000494554172230016, 'samples': 2275584, 'steps': 11851, 'loss/train': 1.3797191381454468} -11/06/2021 22:53:16 - INFO - __main__ - Step 11853: {'lr': 0.0004945530705670156, 'samples': 2275776, 'steps': 11852, 'loss/train': 1.7779545783996582} -11/06/2021 22:53:18 - INFO - __main__ - Step 11854: {'lr': 0.0004945519687938234, 'samples': 2275968, 'steps': 11853, 'loss/train': 1.6782175302505493} -11/06/2021 22:53:18 - INFO - __main__ - Step 11855: {'lr': 0.0004945508669104397, 'samples': 2276160, 'steps': 11854, 'loss/train': 2.7653017044067383} -11/06/2021 22:53:18 - INFO - __main__ - Step 11856: {'lr': 0.0004945497649168654, 'samples': 2276352, 'steps': 11855, 'loss/train': 1.727919340133667} -11/06/2021 22:53:19 - INFO - __main__ - Step 11857: {'lr': 0.0004945486628131006, 'samples': 2276544, 'steps': 11856, 'loss/train': 1.342666506767273} -11/06/2021 22:53:19 - INFO - __main__ - Step 11858: {'lr': 0.0004945475605991459, 'samples': 2276736, 'steps': 11857, 'loss/train': 0.3159283399581909} -11/06/2021 22:53:20 - INFO - __main__ - Step 11859: {'lr': 0.0004945464582750019, 'samples': 2276928, 'steps': 11858, 'loss/train': 1.7237508296966553} -11/06/2021 22:53:20 - INFO - __main__ - Step 11860: {'lr': 0.000494545355840669, 'samples': 2277120, 'steps': 11859, 'loss/train': 1.4004329442977905} -11/06/2021 22:53:21 - INFO - __main__ - Step 11861: {'lr': 0.0004945442532961478, 'samples': 2277312, 'steps': 11860, 'loss/train': 1.3610728979110718} -11/06/2021 22:53:21 - INFO - __main__ - Step 11862: {'lr': 0.0004945431506414386, 'samples': 2277504, 'steps': 11861, 'loss/train': 2.1039764881134033} -11/06/2021 22:53:21 - INFO - __main__ - Step 11863: {'lr': 0.0004945420478765422, 'samples': 2277696, 'steps': 11862, 'loss/train': 2.395843505859375} -11/06/2021 22:53:22 - INFO - __main__ - Step 11864: {'lr': 0.0004945409450014588, 'samples': 2277888, 'steps': 11863, 'loss/train': 1.4284261465072632} -11/06/2021 22:53:23 - INFO - __main__ - Step 11865: {'lr': 0.0004945398420161892, 'samples': 2278080, 'steps': 11864, 'loss/train': 1.9594630002975464} -11/06/2021 22:53:23 - INFO - __main__ - Step 11866: {'lr': 0.0004945387389207335, 'samples': 2278272, 'steps': 11865, 'loss/train': 1.446509599685669} -11/06/2021 22:53:23 - INFO - __main__ - Step 11867: {'lr': 0.0004945376357150926, 'samples': 2278464, 'steps': 11866, 'loss/train': 1.6203410625457764} -11/06/2021 22:53:24 - INFO - __main__ - Step 11868: {'lr': 0.0004945365323992668, 'samples': 2278656, 'steps': 11867, 'loss/train': 1.354360818862915} -11/06/2021 22:53:24 - INFO - __main__ - Step 11869: {'lr': 0.0004945354289732565, 'samples': 2278848, 'steps': 11868, 'loss/train': 1.6801567077636719} -11/06/2021 22:53:25 - INFO - __main__ - Step 11870: {'lr': 0.0004945343254370623, 'samples': 2279040, 'steps': 11869, 'loss/train': 1.8512502908706665} -11/06/2021 22:53:26 - INFO - __main__ - Step 11871: {'lr': 0.0004945332217906848, 'samples': 2279232, 'steps': 11870, 'loss/train': 1.6721792221069336} -11/06/2021 22:53:26 - INFO - __main__ - Step 11872: {'lr': 0.0004945321180341244, 'samples': 2279424, 'steps': 11871, 'loss/train': 1.7960259914398193} -11/06/2021 22:53:26 - INFO - __main__ - Step 11873: {'lr': 0.0004945310141673816, 'samples': 2279616, 'steps': 11872, 'loss/train': 1.7067826986312866} -11/06/2021 22:53:27 - INFO - __main__ - Step 11874: {'lr': 0.0004945299101904568, 'samples': 2279808, 'steps': 11873, 'loss/train': 1.8478683233261108} -11/06/2021 22:53:28 - INFO - __main__ - Step 11875: {'lr': 0.0004945288061033507, 'samples': 2280000, 'steps': 11874, 'loss/train': 1.8449006080627441} -11/06/2021 22:53:28 - INFO - __main__ - Step 11876: {'lr': 0.0004945277019060637, 'samples': 2280192, 'steps': 11875, 'loss/train': 1.7363343238830566} -11/06/2021 22:53:28 - INFO - __main__ - Step 11877: {'lr': 0.0004945265975985962, 'samples': 2280384, 'steps': 11876, 'loss/train': 1.287642478942871} -11/06/2021 22:53:29 - INFO - __main__ - Step 11878: {'lr': 0.0004945254931809489, 'samples': 2280576, 'steps': 11877, 'loss/train': 1.5857558250427246} -11/06/2021 22:53:29 - INFO - __main__ - Step 11879: {'lr': 0.000494524388653122, 'samples': 2280768, 'steps': 11878, 'loss/train': 1.3704111576080322} -11/06/2021 22:53:30 - INFO - __main__ - Step 11880: {'lr': 0.0004945232840151164, 'samples': 2280960, 'steps': 11879, 'loss/train': 1.9039316177368164} -11/06/2021 22:53:31 - INFO - __main__ - Step 11881: {'lr': 0.0004945221792669322, 'samples': 2281152, 'steps': 11880, 'loss/train': 1.6828198432922363} -11/06/2021 22:53:31 - INFO - __main__ - Step 11882: {'lr': 0.0004945210744085702, 'samples': 2281344, 'steps': 11881, 'loss/train': 2.2412431240081787} -11/06/2021 22:53:31 - INFO - __main__ - Step 11883: {'lr': 0.0004945199694400308, 'samples': 2281536, 'steps': 11882, 'loss/train': 1.4356671571731567} -11/06/2021 22:53:32 - INFO - __main__ - Step 11884: {'lr': 0.0004945188643613144, 'samples': 2281728, 'steps': 11883, 'loss/train': 1.609714388847351} -11/06/2021 22:53:33 - INFO - __main__ - Step 11885: {'lr': 0.0004945177591724216, 'samples': 2281920, 'steps': 11884, 'loss/train': 1.3597244024276733} -11/06/2021 22:53:33 - INFO - __main__ - Step 11886: {'lr': 0.0004945166538733529, 'samples': 2282112, 'steps': 11885, 'loss/train': 1.8882817029953003} -11/06/2021 22:53:33 - INFO - __main__ - Step 11887: {'lr': 0.0004945155484641087, 'samples': 2282304, 'steps': 11886, 'loss/train': 1.242563009262085} -11/06/2021 22:53:34 - INFO - __main__ - Step 11888: {'lr': 0.0004945144429446897, 'samples': 2282496, 'steps': 11887, 'loss/train': 1.8521512746810913} -11/06/2021 22:53:34 - INFO - __main__ - Step 11889: {'lr': 0.000494513337315096, 'samples': 2282688, 'steps': 11888, 'loss/train': 1.7061456441879272} -11/06/2021 22:53:35 - INFO - __main__ - Step 11890: {'lr': 0.0004945122315753286, 'samples': 2282880, 'steps': 11889, 'loss/train': 1.742601990699768} -11/06/2021 22:53:35 - INFO - __main__ - Step 11891: {'lr': 0.0004945111257253877, 'samples': 2283072, 'steps': 11890, 'loss/train': 1.7886587381362915} -11/06/2021 22:53:36 - INFO - __main__ - Step 11892: {'lr': 0.0004945100197652738, 'samples': 2283264, 'steps': 11891, 'loss/train': 2.3092379570007324} -11/06/2021 22:53:36 - INFO - __main__ - Step 11893: {'lr': 0.0004945089136949876, 'samples': 2283456, 'steps': 11892, 'loss/train': 1.7748466730117798} -11/06/2021 22:53:37 - INFO - __main__ - Step 11894: {'lr': 0.0004945078075145292, 'samples': 2283648, 'steps': 11893, 'loss/train': 2.0001227855682373} -11/06/2021 22:53:37 - INFO - __main__ - Step 11895: {'lr': 0.0004945067012238996, 'samples': 2283840, 'steps': 11894, 'loss/train': 1.475651502609253} -11/06/2021 22:53:38 - INFO - __main__ - Step 11896: {'lr': 0.000494505594823099, 'samples': 2284032, 'steps': 11895, 'loss/train': 0.5591633915901184} -11/06/2021 22:53:38 - INFO - __main__ - Step 11897: {'lr': 0.0004945044883121279, 'samples': 2284224, 'steps': 11896, 'loss/train': 1.6657626628875732} -11/06/2021 22:53:39 - INFO - __main__ - Step 11898: {'lr': 0.0004945033816909868, 'samples': 2284416, 'steps': 11897, 'loss/train': 1.5739197731018066} -11/06/2021 22:53:39 - INFO - __main__ - Step 11899: {'lr': 0.0004945022749596764, 'samples': 2284608, 'steps': 11898, 'loss/train': 1.6990892887115479} -11/06/2021 22:53:39 - INFO - __main__ - Step 11900: {'lr': 0.000494501168118197, 'samples': 2284800, 'steps': 11899, 'loss/train': 1.785287618637085} -11/06/2021 22:53:40 - INFO - __main__ - Step 11901: {'lr': 0.0004945000611665491, 'samples': 2284992, 'steps': 11900, 'loss/train': 1.6788626909255981} -11/06/2021 22:53:41 - INFO - __main__ - Step 11902: {'lr': 0.0004944989541047333, 'samples': 2285184, 'steps': 11901, 'loss/train': 1.9078575372695923} -11/06/2021 22:53:41 - INFO - __main__ - Step 11903: {'lr': 0.0004944978469327499, 'samples': 2285376, 'steps': 11902, 'loss/train': 1.8978601694107056} -11/06/2021 22:53:41 - INFO - __main__ - Step 11904: {'lr': 0.0004944967396505998, 'samples': 2285568, 'steps': 11903, 'loss/train': 1.5183367729187012} -11/06/2021 22:53:42 - INFO - __main__ - Step 11905: {'lr': 0.000494495632258283, 'samples': 2285760, 'steps': 11904, 'loss/train': 1.6283320188522339} -11/06/2021 22:53:43 - INFO - __main__ - Step 11906: {'lr': 0.0004944945247558004, 'samples': 2285952, 'steps': 11905, 'loss/train': 1.0076183080673218} -11/06/2021 22:53:43 - INFO - __main__ - Step 11907: {'lr': 0.0004944934171431522, 'samples': 2286144, 'steps': 11906, 'loss/train': 1.794429898262024} -11/06/2021 22:53:43 - INFO - __main__ - Step 11908: {'lr': 0.0004944923094203391, 'samples': 2286336, 'steps': 11907, 'loss/train': 1.9065196514129639} -11/06/2021 22:53:44 - INFO - __main__ - Step 11909: {'lr': 0.0004944912015873616, 'samples': 2286528, 'steps': 11908, 'loss/train': 1.092329740524292} -11/06/2021 22:53:44 - INFO - __main__ - Step 11910: {'lr': 0.0004944900936442201, 'samples': 2286720, 'steps': 11909, 'loss/train': 1.7471907138824463} -11/06/2021 22:53:45 - INFO - __main__ - Step 11911: {'lr': 0.000494488985590915, 'samples': 2286912, 'steps': 11910, 'loss/train': 2.4433507919311523} -11/06/2021 22:53:46 - INFO - __main__ - Step 11912: {'lr': 0.0004944878774274472, 'samples': 2287104, 'steps': 11911, 'loss/train': 1.9557836055755615} -11/06/2021 22:53:46 - INFO - __main__ - Step 11913: {'lr': 0.0004944867691538167, 'samples': 2287296, 'steps': 11912, 'loss/train': 1.8252263069152832} -11/06/2021 22:53:46 - INFO - __main__ - Step 11914: {'lr': 0.0004944856607700243, 'samples': 2287488, 'steps': 11913, 'loss/train': 1.3514317274093628} -11/06/2021 22:53:47 - INFO - __main__ - Step 11915: {'lr': 0.0004944845522760706, 'samples': 2287680, 'steps': 11914, 'loss/train': 1.4288444519042969} -11/06/2021 22:53:47 - INFO - __main__ - Step 11916: {'lr': 0.0004944834436719557, 'samples': 2287872, 'steps': 11915, 'loss/train': 1.7817126512527466} -11/06/2021 22:53:48 - INFO - __main__ - Step 11917: {'lr': 0.0004944823349576805, 'samples': 2288064, 'steps': 11916, 'loss/train': 0.9959566593170166} -11/06/2021 22:53:48 - INFO - __main__ - Step 11918: {'lr': 0.0004944812261332452, 'samples': 2288256, 'steps': 11917, 'loss/train': 1.2782503366470337} -11/06/2021 22:53:49 - INFO - __main__ - Step 11919: {'lr': 0.0004944801171986505, 'samples': 2288448, 'steps': 11918, 'loss/train': 1.4812965393066406} -11/06/2021 22:53:49 - INFO - __main__ - Step 11920: {'lr': 0.0004944790081538969, 'samples': 2288640, 'steps': 11919, 'loss/train': 1.7780016660690308} -11/06/2021 22:53:49 - INFO - __main__ - Step 11921: {'lr': 0.0004944778989989847, 'samples': 2288832, 'steps': 11920, 'loss/train': 2.459728240966797} -11/06/2021 22:53:50 - INFO - __main__ - Step 11922: {'lr': 0.0004944767897339146, 'samples': 2289024, 'steps': 11921, 'loss/train': 1.5695812702178955} -11/06/2021 22:53:51 - INFO - __main__ - Step 11923: {'lr': 0.000494475680358687, 'samples': 2289216, 'steps': 11922, 'loss/train': 1.9413129091262817} -11/06/2021 22:53:51 - INFO - __main__ - Step 11924: {'lr': 0.0004944745708733025, 'samples': 2289408, 'steps': 11923, 'loss/train': 2.0285587310791016} -11/06/2021 22:53:52 - INFO - __main__ - Step 11925: {'lr': 0.0004944734612777615, 'samples': 2289600, 'steps': 11924, 'loss/train': 1.9409503936767578} -11/06/2021 22:53:52 - INFO - __main__ - Step 11926: {'lr': 0.0004944723515720645, 'samples': 2289792, 'steps': 11925, 'loss/train': 1.747592806816101} -11/06/2021 22:53:53 - INFO - __main__ - Step 11927: {'lr': 0.000494471241756212, 'samples': 2289984, 'steps': 11926, 'loss/train': 1.674291729927063} -11/06/2021 22:53:53 - INFO - __main__ - Step 11928: {'lr': 0.0004944701318302046, 'samples': 2290176, 'steps': 11927, 'loss/train': 1.5972325801849365} -11/06/2021 22:53:54 - INFO - __main__ - Step 11929: {'lr': 0.0004944690217940427, 'samples': 2290368, 'steps': 11928, 'loss/train': 1.5960736274719238} -11/06/2021 22:53:54 - INFO - __main__ - Step 11930: {'lr': 0.0004944679116477269, 'samples': 2290560, 'steps': 11929, 'loss/train': 1.5236477851867676} -11/06/2021 22:53:54 - INFO - __main__ - Step 11931: {'lr': 0.0004944668013912575, 'samples': 2290752, 'steps': 11930, 'loss/train': 1.5838426351547241} -11/06/2021 22:53:55 - INFO - __main__ - Step 11932: {'lr': 0.0004944656910246352, 'samples': 2290944, 'steps': 11931, 'loss/train': 1.651598572731018} -11/06/2021 22:53:56 - INFO - __main__ - Step 11933: {'lr': 0.0004944645805478605, 'samples': 2291136, 'steps': 11932, 'loss/train': 1.3770673274993896} -11/06/2021 22:53:56 - INFO - __main__ - Step 11934: {'lr': 0.0004944634699609338, 'samples': 2291328, 'steps': 11933, 'loss/train': 2.044022560119629} -11/06/2021 22:53:56 - INFO - __main__ - Step 11935: {'lr': 0.0004944623592638555, 'samples': 2291520, 'steps': 11934, 'loss/train': 1.4433174133300781} -11/06/2021 22:53:57 - INFO - __main__ - Step 11936: {'lr': 0.0004944612484566263, 'samples': 2291712, 'steps': 11935, 'loss/train': 1.43559730052948} -11/06/2021 22:53:57 - INFO - __main__ - Step 11937: {'lr': 0.0004944601375392467, 'samples': 2291904, 'steps': 11936, 'loss/train': 2.0127391815185547} -11/06/2021 22:53:58 - INFO - __main__ - Step 11938: {'lr': 0.000494459026511717, 'samples': 2292096, 'steps': 11937, 'loss/train': 1.7522636651992798} -11/06/2021 22:53:59 - INFO - __main__ - Step 11939: {'lr': 0.000494457915374038, 'samples': 2292288, 'steps': 11938, 'loss/train': 1.910089373588562} -11/06/2021 22:53:59 - INFO - __main__ - Step 11940: {'lr': 0.00049445680412621, 'samples': 2292480, 'steps': 11939, 'loss/train': 1.6067532300949097} -11/06/2021 22:53:59 - INFO - __main__ - Step 11941: {'lr': 0.0004944556927682335, 'samples': 2292672, 'steps': 11940, 'loss/train': 1.7804417610168457} -11/06/2021 22:54:00 - INFO - __main__ - Step 11942: {'lr': 0.000494454581300109, 'samples': 2292864, 'steps': 11941, 'loss/train': 1.387055516242981} -11/06/2021 22:54:00 - INFO - __main__ - Step 11943: {'lr': 0.0004944534697218371, 'samples': 2293056, 'steps': 11942, 'loss/train': 1.4685114622116089} -11/06/2021 22:54:01 - INFO - __main__ - Step 11944: {'lr': 0.0004944523580334183, 'samples': 2293248, 'steps': 11943, 'loss/train': 0.5896292924880981} -11/06/2021 22:54:01 - INFO - __main__ - Step 11945: {'lr': 0.0004944512462348528, 'samples': 2293440, 'steps': 11944, 'loss/train': 1.9006822109222412} -11/06/2021 22:54:02 - INFO - __main__ - Step 11946: {'lr': 0.0004944501343261416, 'samples': 2293632, 'steps': 11945, 'loss/train': 1.7416223287582397} -11/06/2021 22:54:02 - INFO - __main__ - Step 11947: {'lr': 0.0004944490223072848, 'samples': 2293824, 'steps': 11946, 'loss/train': 0.48262572288513184} -11/06/2021 22:54:03 - INFO - __main__ - Step 11948: {'lr': 0.0004944479101782831, 'samples': 2294016, 'steps': 11947, 'loss/train': 1.9362751245498657} -11/06/2021 22:54:03 - INFO - __main__ - Step 11949: {'lr': 0.0004944467979391369, 'samples': 2294208, 'steps': 11948, 'loss/train': 1.4246046543121338} -11/06/2021 22:54:04 - INFO - __main__ - Step 11950: {'lr': 0.0004944456855898469, 'samples': 2294400, 'steps': 11949, 'loss/train': 1.5375300645828247} -11/06/2021 22:54:04 - INFO - __main__ - Step 11951: {'lr': 0.0004944445731304133, 'samples': 2294592, 'steps': 11950, 'loss/train': 2.0238983631134033} -11/06/2021 22:54:04 - INFO - __main__ - Step 11952: {'lr': 0.0004944434605608367, 'samples': 2294784, 'steps': 11951, 'loss/train': 1.2838270664215088} -11/06/2021 22:54:05 - INFO - __main__ - Step 11953: {'lr': 0.0004944423478811177, 'samples': 2294976, 'steps': 11952, 'loss/train': 1.7840559482574463} -11/06/2021 22:54:06 - INFO - __main__ - Step 11954: {'lr': 0.0004944412350912567, 'samples': 2295168, 'steps': 11953, 'loss/train': 1.7490830421447754} -11/06/2021 22:54:06 - INFO - __main__ - Step 11955: {'lr': 0.0004944401221912544, 'samples': 2295360, 'steps': 11954, 'loss/train': 1.8949376344680786} -11/06/2021 22:54:06 - INFO - __main__ - Step 11956: {'lr': 0.0004944390091811111, 'samples': 2295552, 'steps': 11955, 'loss/train': 1.7346197366714478} -11/06/2021 22:54:07 - INFO - __main__ - Step 11957: {'lr': 0.0004944378960608272, 'samples': 2295744, 'steps': 11956, 'loss/train': 1.9037965536117554} -11/06/2021 22:54:07 - INFO - __main__ - Step 11958: {'lr': 0.0004944367828304035, 'samples': 2295936, 'steps': 11957, 'loss/train': 1.8399511575698853} -11/06/2021 22:54:08 - INFO - __main__ - Step 11959: {'lr': 0.0004944356694898404, 'samples': 2296128, 'steps': 11958, 'loss/train': 0.14074699580669403} -11/06/2021 22:54:09 - INFO - __main__ - Step 11960: {'lr': 0.0004944345560391382, 'samples': 2296320, 'steps': 11959, 'loss/train': 1.9995806217193604} -11/06/2021 22:54:09 - INFO - __main__ - Step 11961: {'lr': 0.0004944334424782977, 'samples': 2296512, 'steps': 11960, 'loss/train': 1.5391980409622192} -11/06/2021 22:54:09 - INFO - __main__ - Step 11962: {'lr': 0.0004944323288073192, 'samples': 2296704, 'steps': 11961, 'loss/train': 1.4151784181594849} -11/06/2021 22:54:10 - INFO - __main__ - Step 11963: {'lr': 0.0004944312150262033, 'samples': 2296896, 'steps': 11962, 'loss/train': 1.0756903886795044} -11/06/2021 22:54:11 - INFO - __main__ - Step 11964: {'lr': 0.0004944301011349505, 'samples': 2297088, 'steps': 11963, 'loss/train': 1.644909143447876} -11/06/2021 22:54:11 - INFO - __main__ - Step 11965: {'lr': 0.0004944289871335612, 'samples': 2297280, 'steps': 11964, 'loss/train': 2.0946547985076904} -11/06/2021 22:54:11 - INFO - __main__ - Step 11966: {'lr': 0.0004944278730220359, 'samples': 2297472, 'steps': 11965, 'loss/train': 1.4997888803482056} -11/06/2021 22:54:12 - INFO - __main__ - Step 11967: {'lr': 0.0004944267588003754, 'samples': 2297664, 'steps': 11966, 'loss/train': 1.587903618812561} -11/06/2021 22:54:12 - INFO - __main__ - Step 11968: {'lr': 0.0004944256444685798, 'samples': 2297856, 'steps': 11967, 'loss/train': 1.6351916790008545} -11/06/2021 22:54:13 - INFO - __main__ - Step 11969: {'lr': 0.0004944245300266498, 'samples': 2298048, 'steps': 11968, 'loss/train': 1.4442037343978882} -11/06/2021 22:54:13 - INFO - __main__ - Step 11970: {'lr': 0.0004944234154745859, 'samples': 2298240, 'steps': 11969, 'loss/train': 1.8854682445526123} -11/06/2021 22:54:14 - INFO - __main__ - Step 11971: {'lr': 0.0004944223008123886, 'samples': 2298432, 'steps': 11970, 'loss/train': 1.832446813583374} -11/06/2021 22:54:14 - INFO - __main__ - Step 11972: {'lr': 0.0004944211860400582, 'samples': 2298624, 'steps': 11971, 'loss/train': 1.448323130607605} -11/06/2021 22:54:15 - INFO - __main__ - Step 11973: {'lr': 0.0004944200711575956, 'samples': 2298816, 'steps': 11972, 'loss/train': 1.9672355651855469} -11/06/2021 22:54:16 - INFO - __main__ - Step 11974: {'lr': 0.0004944189561650011, 'samples': 2299008, 'steps': 11973, 'loss/train': 1.4000511169433594} -11/06/2021 22:54:16 - INFO - __main__ - Step 11975: {'lr': 0.0004944178410622751, 'samples': 2299200, 'steps': 11974, 'loss/train': 1.234156847000122} -11/06/2021 22:54:17 - INFO - __main__ - Step 11976: {'lr': 0.0004944167258494181, 'samples': 2299392, 'steps': 11975, 'loss/train': 1.449386477470398} -11/06/2021 22:54:17 - INFO - __main__ - Step 11977: {'lr': 0.0004944156105264308, 'samples': 2299584, 'steps': 11976, 'loss/train': 0.3471572995185852} -11/06/2021 22:54:17 - INFO - __main__ - Step 11978: {'lr': 0.0004944144950933137, 'samples': 2299776, 'steps': 11977, 'loss/train': 1.291796088218689} -11/06/2021 22:54:18 - INFO - __main__ - Step 11979: {'lr': 0.000494413379550067, 'samples': 2299968, 'steps': 11978, 'loss/train': 1.4064840078353882} -11/06/2021 22:54:19 - INFO - __main__ - Step 11980: {'lr': 0.0004944122638966916, 'samples': 2300160, 'steps': 11979, 'loss/train': 2.1589348316192627} -11/06/2021 22:54:19 - INFO - __main__ - Step 11981: {'lr': 0.0004944111481331876, 'samples': 2300352, 'steps': 11980, 'loss/train': 2.178071975708008} -11/06/2021 22:54:19 - INFO - __main__ - Step 11982: {'lr': 0.0004944100322595558, 'samples': 2300544, 'steps': 11981, 'loss/train': 1.5777186155319214} -11/06/2021 22:54:20 - INFO - __main__ - Step 11983: {'lr': 0.0004944089162757968, 'samples': 2300736, 'steps': 11982, 'loss/train': 1.8397846221923828} -11/06/2021 22:54:21 - INFO - __main__ - Step 11984: {'lr': 0.0004944078001819106, 'samples': 2300928, 'steps': 11983, 'loss/train': 1.9047267436981201} -11/06/2021 22:54:21 - INFO - __main__ - Step 11985: {'lr': 0.0004944066839778983, 'samples': 2301120, 'steps': 11984, 'loss/train': 1.7153035402297974} -11/06/2021 22:54:21 - INFO - __main__ - Step 11986: {'lr': 0.0004944055676637599, 'samples': 2301312, 'steps': 11985, 'loss/train': 1.4917117357254028} -11/06/2021 22:54:22 - INFO - __main__ - Step 11987: {'lr': 0.0004944044512394962, 'samples': 2301504, 'steps': 11986, 'loss/train': 1.906925916671753} -11/06/2021 22:54:22 - INFO - __main__ - Step 11988: {'lr': 0.0004944033347051076, 'samples': 2301696, 'steps': 11987, 'loss/train': 1.9712414741516113} -11/06/2021 22:54:23 - INFO - __main__ - Step 11989: {'lr': 0.0004944022180605947, 'samples': 2301888, 'steps': 11988, 'loss/train': 1.898970127105713} -11/06/2021 22:54:24 - INFO - __main__ - Step 11990: {'lr': 0.0004944011013059579, 'samples': 2302080, 'steps': 11989, 'loss/train': 1.1535645723342896} -11/06/2021 22:54:24 - INFO - __main__ - Step 11991: {'lr': 0.0004943999844411977, 'samples': 2302272, 'steps': 11990, 'loss/train': 1.2547049522399902} -11/06/2021 22:54:24 - INFO - __main__ - Step 11992: {'lr': 0.0004943988674663147, 'samples': 2302464, 'steps': 11991, 'loss/train': 1.8330069780349731} -11/06/2021 22:54:25 - INFO - __main__ - Step 11993: {'lr': 0.0004943977503813092, 'samples': 2302656, 'steps': 11992, 'loss/train': 1.3840059041976929} -11/06/2021 22:54:25 - INFO - __main__ - Step 11994: {'lr': 0.000494396633186182, 'samples': 2302848, 'steps': 11993, 'loss/train': 2.0180881023406982} -11/06/2021 22:54:26 - INFO - __main__ - Step 11995: {'lr': 0.0004943955158809334, 'samples': 2303040, 'steps': 11994, 'loss/train': 1.7665796279907227} -11/06/2021 22:54:26 - INFO - __main__ - Step 11996: {'lr': 0.0004943943984655639, 'samples': 2303232, 'steps': 11995, 'loss/train': 1.3726966381072998} -11/06/2021 22:54:27 - INFO - __main__ - Step 11997: {'lr': 0.0004943932809400741, 'samples': 2303424, 'steps': 11996, 'loss/train': 1.9251682758331299} -11/06/2021 22:54:27 - INFO - __main__ - Step 11998: {'lr': 0.0004943921633044644, 'samples': 2303616, 'steps': 11997, 'loss/train': 1.752882480621338} -11/06/2021 22:54:27 - INFO - __main__ - Step 11999: {'lr': 0.0004943910455587354, 'samples': 2303808, 'steps': 11998, 'loss/train': 1.246006727218628} -11/06/2021 22:54:28 - INFO - __main__ - Step 12000: {'lr': 0.0004943899277028877, 'samples': 2304000, 'steps': 11999, 'loss/train': 1.6304447650909424} -11/06/2021 22:54:29 - INFO - __main__ - Step 12001: {'lr': 0.0004943888097369216, 'samples': 2304192, 'steps': 12000, 'loss/train': 1.6695126295089722} -11/06/2021 22:54:29 - INFO - __main__ - Step 12002: {'lr': 0.0004943876916608375, 'samples': 2304384, 'steps': 12001, 'loss/train': 1.794386625289917} -11/06/2021 22:54:29 - INFO - __main__ - Step 12003: {'lr': 0.0004943865734746364, 'samples': 2304576, 'steps': 12002, 'loss/train': 1.8876904249191284} -11/06/2021 22:54:30 - INFO - __main__ - Step 12004: {'lr': 0.0004943854551783182, 'samples': 2304768, 'steps': 12003, 'loss/train': 1.6697297096252441} -11/06/2021 22:54:31 - INFO - __main__ - Step 12005: {'lr': 0.0004943843367718838, 'samples': 2304960, 'steps': 12004, 'loss/train': 1.6420907974243164} -11/06/2021 22:54:31 - INFO - __main__ - Step 12006: {'lr': 0.0004943832182553336, 'samples': 2305152, 'steps': 12005, 'loss/train': 1.553113341331482} -11/06/2021 22:54:32 - INFO - __main__ - Step 12007: {'lr': 0.000494382099628668, 'samples': 2305344, 'steps': 12006, 'loss/train': 2.0208699703216553} -11/06/2021 22:54:32 - INFO - __main__ - Step 12008: {'lr': 0.0004943809808918877, 'samples': 2305536, 'steps': 12007, 'loss/train': 1.575126051902771} -11/06/2021 22:54:32 - INFO - __main__ - Step 12009: {'lr': 0.000494379862044993, 'samples': 2305728, 'steps': 12008, 'loss/train': 1.9213340282440186} -11/06/2021 22:54:33 - INFO - __main__ - Step 12010: {'lr': 0.0004943787430879846, 'samples': 2305920, 'steps': 12009, 'loss/train': 1.99528169631958} -11/06/2021 22:54:34 - INFO - __main__ - Step 12011: {'lr': 0.0004943776240208628, 'samples': 2306112, 'steps': 12010, 'loss/train': 1.7493822574615479} -11/06/2021 22:54:34 - INFO - __main__ - Step 12012: {'lr': 0.0004943765048436283, 'samples': 2306304, 'steps': 12011, 'loss/train': 1.5333633422851562} -11/06/2021 22:54:34 - INFO - __main__ - Step 12013: {'lr': 0.0004943753855562815, 'samples': 2306496, 'steps': 12012, 'loss/train': 1.6219375133514404} -11/06/2021 22:54:35 - INFO - __main__ - Step 12014: {'lr': 0.000494374266158823, 'samples': 2306688, 'steps': 12013, 'loss/train': 1.9051744937896729} -11/06/2021 22:54:36 - INFO - __main__ - Step 12015: {'lr': 0.0004943731466512531, 'samples': 2306880, 'steps': 12014, 'loss/train': 1.5404677391052246} -11/06/2021 22:54:37 - INFO - __main__ - Step 12016: {'lr': 0.0004943720270335724, 'samples': 2307072, 'steps': 12015, 'loss/train': 1.5498056411743164} -11/06/2021 22:54:37 - INFO - __main__ - Step 12017: {'lr': 0.0004943709073057816, 'samples': 2307264, 'steps': 12016, 'loss/train': 1.53780198097229} -11/06/2021 22:54:37 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 1.328963041305542} -11/06/2021 22:54:38 - INFO - __main__ - Step 12019: {'lr': 0.000494368667519871, 'samples': 2307648, 'steps': 12018, 'loss/train': 1.014737844467163} -11/06/2021 22:54:38 - INFO - __main__ - Step 12020: {'lr': 0.0004943675474617524, 'samples': 2307840, 'steps': 12019, 'loss/train': 1.956551432609558} -11/06/2021 22:54:39 - INFO - __main__ - Step 12021: {'lr': 0.0004943664272935255, 'samples': 2308032, 'steps': 12020, 'loss/train': 1.9309561252593994} -11/06/2021 22:54:39 - INFO - __main__ - Step 12022: {'lr': 0.0004943653070151909, 'samples': 2308224, 'steps': 12021, 'loss/train': 1.6873791217803955} -11/06/2021 22:54:40 - INFO - __main__ - Step 12023: {'lr': 0.000494364186626749, 'samples': 2308416, 'steps': 12022, 'loss/train': 0.8956676125526428} -11/06/2021 22:54:40 - INFO - __main__ - Step 12024: {'lr': 0.0004943630661282004, 'samples': 2308608, 'steps': 12023, 'loss/train': 1.492911696434021} -11/06/2021 22:54:40 - INFO - __main__ - Step 12025: {'lr': 0.0004943619455195456, 'samples': 2308800, 'steps': 12024, 'loss/train': 2.243229627609253} -11/06/2021 22:54:41 - INFO - __main__ - Step 12026: {'lr': 0.000494360824800785, 'samples': 2308992, 'steps': 12025, 'loss/train': 2.4765336513519287} -11/06/2021 22:54:42 - INFO - __main__ - Step 12027: {'lr': 0.0004943597039719192, 'samples': 2309184, 'steps': 12026, 'loss/train': 2.0413081645965576} -11/06/2021 22:54:42 - INFO - __main__ - Step 12028: {'lr': 0.0004943585830329487, 'samples': 2309376, 'steps': 12027, 'loss/train': 1.6951693296432495} -11/06/2021 22:54:42 - INFO - __main__ - Step 12029: {'lr': 0.0004943574619838741, 'samples': 2309568, 'steps': 12028, 'loss/train': 1.7877787351608276} -11/06/2021 22:54:43 - INFO - __main__ - Step 12030: {'lr': 0.0004943563408246957, 'samples': 2309760, 'steps': 12029, 'loss/train': 2.547342300415039} -11/06/2021 22:54:44 - INFO - __main__ - Step 12031: {'lr': 0.000494355219555414, 'samples': 2309952, 'steps': 12030, 'loss/train': 1.9224157333374023} -11/06/2021 22:54:44 - INFO - __main__ - Step 12032: {'lr': 0.0004943540981760298, 'samples': 2310144, 'steps': 12031, 'loss/train': 1.732265591621399} -11/06/2021 22:54:45 - INFO - __main__ - Step 12033: {'lr': 0.0004943529766865434, 'samples': 2310336, 'steps': 12032, 'loss/train': 1.4456995725631714} -11/06/2021 22:54:45 - INFO - __main__ - Step 12034: {'lr': 0.0004943518550869552, 'samples': 2310528, 'steps': 12033, 'loss/train': 1.0278202295303345} -11/06/2021 22:54:45 - INFO - __main__ - Step 12035: {'lr': 0.0004943507333772659, 'samples': 2310720, 'steps': 12034, 'loss/train': 1.7194404602050781} -11/06/2021 22:54:46 - INFO - __main__ - Step 12036: {'lr': 0.0004943496115574758, 'samples': 2310912, 'steps': 12035, 'loss/train': 1.838610053062439} -11/06/2021 22:54:47 - INFO - __main__ - Step 12037: {'lr': 0.0004943484896275857, 'samples': 2311104, 'steps': 12036, 'loss/train': 1.8748886585235596} -11/06/2021 22:54:47 - INFO - __main__ - Step 12038: {'lr': 0.0004943473675875959, 'samples': 2311296, 'steps': 12037, 'loss/train': 1.785986304283142} -11/06/2021 22:54:47 - INFO - __main__ - Step 12039: {'lr': 0.0004943462454375069, 'samples': 2311488, 'steps': 12038, 'loss/train': 1.6484863758087158} -11/06/2021 22:54:48 - INFO - __main__ - Step 12040: {'lr': 0.0004943451231773192, 'samples': 2311680, 'steps': 12039, 'loss/train': 1.8287440538406372} -11/06/2021 22:54:48 - INFO - __main__ - Step 12041: {'lr': 0.0004943440008070336, 'samples': 2311872, 'steps': 12040, 'loss/train': 1.2634427547454834} -11/06/2021 22:54:49 - INFO - __main__ - Step 12042: {'lr': 0.0004943428783266502, 'samples': 2312064, 'steps': 12041, 'loss/train': 1.7805235385894775} -11/06/2021 22:54:49 - INFO - __main__ - Step 12043: {'lr': 0.0004943417557361696, 'samples': 2312256, 'steps': 12042, 'loss/train': 1.758927583694458} -11/06/2021 22:54:50 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 1.159117341041565} -11/06/2021 22:54:50 - INFO - __main__ - Step 12045: {'lr': 0.0004943395102249192, 'samples': 2312640, 'steps': 12044, 'loss/train': 1.8468574285507202} -11/06/2021 22:54:51 - INFO - __main__ - Step 12046: {'lr': 0.0004943383873041503, 'samples': 2312832, 'steps': 12045, 'loss/train': 1.8814785480499268} -11/06/2021 22:54:51 - INFO - __main__ - Step 12047: {'lr': 0.0004943372642732864, 'samples': 2313024, 'steps': 12046, 'loss/train': 2.093292236328125} -11/06/2021 22:54:52 - INFO - __main__ - Step 12048: {'lr': 0.0004943361411323277, 'samples': 2313216, 'steps': 12047, 'loss/train': 1.5713038444519043} -11/06/2021 22:54:52 - INFO - __main__ - Step 12049: {'lr': 0.0004943350178812751, 'samples': 2313408, 'steps': 12048, 'loss/train': 1.8695523738861084} -11/06/2021 22:54:52 - INFO - __main__ - Step 12050: {'lr': 0.0004943338945201288, 'samples': 2313600, 'steps': 12049, 'loss/train': 1.4861245155334473} -11/06/2021 22:54:53 - INFO - __main__ - Step 12051: {'lr': 0.0004943327710488894, 'samples': 2313792, 'steps': 12050, 'loss/train': 1.4577797651290894} -11/06/2021 22:54:54 - INFO - __main__ - Step 12052: {'lr': 0.0004943316474675575, 'samples': 2313984, 'steps': 12051, 'loss/train': 1.26167631149292} -11/06/2021 22:54:54 - INFO - __main__ - Step 12053: {'lr': 0.0004943305237761335, 'samples': 2314176, 'steps': 12052, 'loss/train': 1.674010157585144} -11/06/2021 22:54:54 - INFO - __main__ - Step 12054: {'lr': 0.0004943293999746179, 'samples': 2314368, 'steps': 12053, 'loss/train': 1.585003137588501} -11/06/2021 22:54:55 - INFO - __main__ - Step 12055: {'lr': 0.0004943282760630114, 'samples': 2314560, 'steps': 12054, 'loss/train': 1.8338981866836548} -11/06/2021 22:54:56 - INFO - __main__ - Step 12056: {'lr': 0.0004943271520413141, 'samples': 2314752, 'steps': 12055, 'loss/train': 1.6926106214523315} -11/06/2021 22:54:56 - INFO - __main__ - Step 12057: {'lr': 0.0004943260279095269, 'samples': 2314944, 'steps': 12056, 'loss/train': 1.6934748888015747} -11/06/2021 22:54:57 - INFO - __main__ - Step 12058: {'lr': 0.0004943249036676501, 'samples': 2315136, 'steps': 12057, 'loss/train': 1.7814065217971802} -11/06/2021 22:54:57 - INFO - __main__ - Step 12059: {'lr': 0.0004943237793156844, 'samples': 2315328, 'steps': 12058, 'loss/train': 2.4570651054382324} -11/06/2021 22:54:57 - INFO - __main__ - Step 12060: {'lr': 0.00049432265485363, 'samples': 2315520, 'steps': 12059, 'loss/train': 1.1607862710952759} -11/06/2021 22:54:58 - INFO - __main__ - Step 12061: {'lr': 0.0004943215302814877, 'samples': 2315712, 'steps': 12060, 'loss/train': 1.2177666425704956} -11/06/2021 22:54:59 - INFO - __main__ - Step 12062: {'lr': 0.0004943204055992579, 'samples': 2315904, 'steps': 12061, 'loss/train': 1.5392464399337769} -11/06/2021 22:54:59 - INFO - __main__ - Step 12063: {'lr': 0.0004943192808069411, 'samples': 2316096, 'steps': 12062, 'loss/train': 1.2292014360427856} -11/06/2021 22:54:59 - INFO - __main__ - Step 12064: {'lr': 0.0004943181559045378, 'samples': 2316288, 'steps': 12063, 'loss/train': 1.9744259119033813} -11/06/2021 22:55:00 - INFO - __main__ - Step 12065: {'lr': 0.0004943170308920483, 'samples': 2316480, 'steps': 12064, 'loss/train': 1.6766237020492554} -11/06/2021 22:55:00 - INFO - __main__ - Step 12066: {'lr': 0.0004943159057694736, 'samples': 2316672, 'steps': 12065, 'loss/train': 1.6280395984649658} -11/06/2021 22:55:02 - INFO - __main__ - Step 12067: {'lr': 0.0004943147805368138, 'samples': 2316864, 'steps': 12066, 'loss/train': 1.6543623208999634} -11/06/2021 22:55:02 - INFO - __main__ - Step 12068: {'lr': 0.0004943136551940695, 'samples': 2317056, 'steps': 12067, 'loss/train': 1.1795415878295898} -11/06/2021 22:55:02 - INFO - __main__ - Step 12069: {'lr': 0.0004943125297412413, 'samples': 2317248, 'steps': 12068, 'loss/train': 1.8180369138717651} -11/06/2021 22:55:03 - INFO - __main__ - Step 12070: {'lr': 0.0004943114041783296, 'samples': 2317440, 'steps': 12069, 'loss/train': 1.788710355758667} -11/06/2021 22:55:03 - INFO - __main__ - Step 12071: {'lr': 0.000494310278505335, 'samples': 2317632, 'steps': 12070, 'loss/train': 1.761925458908081} -11/06/2021 22:55:03 - INFO - __main__ - Step 12072: {'lr': 0.0004943091527222579, 'samples': 2317824, 'steps': 12071, 'loss/train': 1.7475976943969727} -11/06/2021 22:55:04 - INFO - __main__ - Step 12073: {'lr': 0.0004943080268290989, 'samples': 2318016, 'steps': 12072, 'loss/train': 1.6183298826217651} -11/06/2021 22:55:05 - INFO - __main__ - Step 12074: {'lr': 0.0004943069008258584, 'samples': 2318208, 'steps': 12073, 'loss/train': 1.4593292474746704} -11/06/2021 22:55:05 - INFO - __main__ - Step 12075: {'lr': 0.0004943057747125371, 'samples': 2318400, 'steps': 12074, 'loss/train': 1.8841195106506348} -11/06/2021 22:55:06 - INFO - __main__ - Step 12076: {'lr': 0.0004943046484891352, 'samples': 2318592, 'steps': 12075, 'loss/train': 1.3961201906204224} -11/06/2021 22:55:06 - INFO - __main__ - Step 12077: {'lr': 0.0004943035221556536, 'samples': 2318784, 'steps': 12076, 'loss/train': 1.4814202785491943} -11/06/2021 22:55:07 - INFO - __main__ - Step 12078: {'lr': 0.0004943023957120926, 'samples': 2318976, 'steps': 12077, 'loss/train': 1.8115047216415405} -11/06/2021 22:55:07 - INFO - __main__ - Step 12079: {'lr': 0.0004943012691584526, 'samples': 2319168, 'steps': 12078, 'loss/train': 1.6468000411987305} -11/06/2021 22:55:08 - INFO - __main__ - Step 12080: {'lr': 0.0004943001424947343, 'samples': 2319360, 'steps': 12079, 'loss/train': 2.1361162662506104} -11/06/2021 22:55:08 - INFO - __main__ - Step 12081: {'lr': 0.000494299015720938, 'samples': 2319552, 'steps': 12080, 'loss/train': 1.2885714769363403} -11/06/2021 22:55:08 - INFO - __main__ - Step 12082: {'lr': 0.0004942978888370645, 'samples': 2319744, 'steps': 12081, 'loss/train': 2.0774118900299072} -11/06/2021 22:55:10 - INFO - __main__ - Step 12083: {'lr': 0.000494296761843114, 'samples': 2319936, 'steps': 12082, 'loss/train': 1.5701794624328613} -11/06/2021 22:55:10 - INFO - __main__ - Step 12084: {'lr': 0.0004942956347390872, 'samples': 2320128, 'steps': 12083, 'loss/train': 1.1753841638565063} -11/06/2021 22:55:11 - INFO - __main__ - Step 12085: {'lr': 0.0004942945075249845, 'samples': 2320320, 'steps': 12084, 'loss/train': 1.6543172597885132} -11/06/2021 22:55:11 - INFO - __main__ - Step 12086: {'lr': 0.0004942933802008066, 'samples': 2320512, 'steps': 12085, 'loss/train': 2.0663843154907227} -11/06/2021 22:55:12 - INFO - __main__ - Step 12087: {'lr': 0.0004942922527665538, 'samples': 2320704, 'steps': 12086, 'loss/train': 1.5923895835876465} -11/06/2021 22:55:12 - INFO - __main__ - Step 12088: {'lr': 0.0004942911252222267, 'samples': 2320896, 'steps': 12087, 'loss/train': 0.7742838263511658} -11/06/2021 22:55:12 - INFO - __main__ - Step 12089: {'lr': 0.0004942899975678257, 'samples': 2321088, 'steps': 12088, 'loss/train': 1.9447110891342163} -11/06/2021 22:55:13 - INFO - __main__ - Step 12090: {'lr': 0.0004942888698033515, 'samples': 2321280, 'steps': 12089, 'loss/train': 1.889116883277893} -11/06/2021 22:55:14 - INFO - __main__ - Step 12091: {'lr': 0.0004942877419288045, 'samples': 2321472, 'steps': 12090, 'loss/train': 1.8266593217849731} -11/06/2021 22:55:14 - INFO - __main__ - Step 12092: {'lr': 0.0004942866139441851, 'samples': 2321664, 'steps': 12091, 'loss/train': 1.2201491594314575} -11/06/2021 22:55:14 - INFO - __main__ - Step 12093: {'lr': 0.0004942854858494941, 'samples': 2321856, 'steps': 12092, 'loss/train': 1.8048791885375977} -11/06/2021 22:55:15 - INFO - __main__ - Step 12094: {'lr': 0.0004942843576447316, 'samples': 2322048, 'steps': 12093, 'loss/train': 1.6451750993728638} -11/06/2021 22:55:15 - INFO - __main__ - Step 12095: {'lr': 0.0004942832293298986, 'samples': 2322240, 'steps': 12094, 'loss/train': 1.459704041481018} -11/06/2021 22:55:16 - INFO - __main__ - Step 12096: {'lr': 0.0004942821009049952, 'samples': 2322432, 'steps': 12095, 'loss/train': 2.0811355113983154} -11/06/2021 22:55:16 - INFO - __main__ - Step 12097: {'lr': 0.0004942809723700221, 'samples': 2322624, 'steps': 12096, 'loss/train': 1.5584614276885986} -11/06/2021 22:55:17 - INFO - __main__ - Step 12098: {'lr': 0.0004942798437249797, 'samples': 2322816, 'steps': 12097, 'loss/train': 1.5112113952636719} -11/06/2021 22:55:17 - INFO - __main__ - Step 12099: {'lr': 0.0004942787149698687, 'samples': 2323008, 'steps': 12098, 'loss/train': 1.9871211051940918} -11/06/2021 22:55:17 - INFO - __main__ - Step 12100: {'lr': 0.0004942775861046893, 'samples': 2323200, 'steps': 12099, 'loss/train': 2.562870740890503} -11/06/2021 22:55:18 - INFO - __main__ - Step 12101: {'lr': 0.0004942764571294422, 'samples': 2323392, 'steps': 12100, 'loss/train': 1.39982008934021} -11/06/2021 22:55:19 - INFO - __main__ - Step 12102: {'lr': 0.0004942753280441281, 'samples': 2323584, 'steps': 12101, 'loss/train': 2.016968250274658} -11/06/2021 22:55:19 - INFO - __main__ - Step 12103: {'lr': 0.0004942741988487471, 'samples': 2323776, 'steps': 12102, 'loss/train': 1.8526740074157715} -11/06/2021 22:55:19 - INFO - __main__ - Step 12104: {'lr': 0.0004942730695433001, 'samples': 2323968, 'steps': 12103, 'loss/train': 1.4173227548599243} -11/06/2021 22:55:20 - INFO - __main__ - Step 12105: {'lr': 0.0004942719401277873, 'samples': 2324160, 'steps': 12104, 'loss/train': 1.0924817323684692} -11/06/2021 22:55:21 - INFO - __main__ - Step 12106: {'lr': 0.0004942708106022094, 'samples': 2324352, 'steps': 12105, 'loss/train': 1.5277026891708374} -11/06/2021 22:55:21 - INFO - __main__ - Step 12107: {'lr': 0.0004942696809665668, 'samples': 2324544, 'steps': 12106, 'loss/train': 1.9903008937835693} -11/06/2021 22:55:21 - INFO - __main__ - Step 12108: {'lr': 0.0004942685512208599, 'samples': 2324736, 'steps': 12107, 'loss/train': 1.1875405311584473} -11/06/2021 22:55:22 - INFO - __main__ - Step 12109: {'lr': 0.0004942674213650896, 'samples': 2324928, 'steps': 12108, 'loss/train': 1.4761584997177124} -11/06/2021 22:55:22 - INFO - __main__ - Step 12110: {'lr': 0.000494266291399256, 'samples': 2325120, 'steps': 12109, 'loss/train': 1.6016489267349243} -11/06/2021 22:55:23 - INFO - __main__ - Step 12111: {'lr': 0.0004942651613233599, 'samples': 2325312, 'steps': 12110, 'loss/train': 1.8227951526641846} -11/06/2021 22:55:24 - INFO - __main__ - Step 12112: {'lr': 0.0004942640311374017, 'samples': 2325504, 'steps': 12111, 'loss/train': 1.8934657573699951} -11/06/2021 22:55:24 - INFO - __main__ - Step 12113: {'lr': 0.0004942629008413818, 'samples': 2325696, 'steps': 12112, 'loss/train': 1.4961217641830444} -11/06/2021 22:55:24 - INFO - __main__ - Step 12114: {'lr': 0.0004942617704353008, 'samples': 2325888, 'steps': 12113, 'loss/train': 1.5559004545211792} -11/06/2021 22:55:25 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 1.4733009338378906} -11/06/2021 22:55:25 - INFO - __main__ - Step 12116: {'lr': 0.0004942595092929577, 'samples': 2326272, 'steps': 12115, 'loss/train': 1.756181240081787} -11/06/2021 22:55:27 - INFO - __main__ - Step 12117: {'lr': 0.0004942583785566965, 'samples': 2326464, 'steps': 12116, 'loss/train': 1.810673475265503} -11/06/2021 22:55:27 - INFO - __main__ - Step 12118: {'lr': 0.0004942572477103763, 'samples': 2326656, 'steps': 12117, 'loss/train': 1.341216802597046} -11/06/2021 22:55:27 - INFO - __main__ - Step 12119: {'lr': 0.0004942561167539975, 'samples': 2326848, 'steps': 12118, 'loss/train': 1.2394644021987915} -11/06/2021 22:55:28 - INFO - __main__ - Step 12120: {'lr': 0.0004942549856875606, 'samples': 2327040, 'steps': 12119, 'loss/train': 1.7882914543151855} -11/06/2021 22:55:28 - INFO - __main__ - Step 12121: {'lr': 0.0004942538545110663, 'samples': 2327232, 'steps': 12120, 'loss/train': 1.967432975769043} -11/06/2021 22:55:29 - INFO - __main__ - Step 12122: {'lr': 0.0004942527232245149, 'samples': 2327424, 'steps': 12121, 'loss/train': 2.7210159301757812} -11/06/2021 22:55:30 - INFO - __main__ - Step 12123: {'lr': 0.0004942515918279071, 'samples': 2327616, 'steps': 12122, 'loss/train': 1.1575158834457397} -11/06/2021 22:55:30 - INFO - __main__ - Step 12124: {'lr': 0.0004942504603212433, 'samples': 2327808, 'steps': 12123, 'loss/train': 1.8473913669586182} -11/06/2021 22:55:30 - INFO - __main__ - Step 12125: {'lr': 0.0004942493287045239, 'samples': 2328000, 'steps': 12124, 'loss/train': 1.3073318004608154} -11/06/2021 22:55:31 - INFO - __main__ - Step 12126: {'lr': 0.0004942481969777495, 'samples': 2328192, 'steps': 12125, 'loss/train': 2.258380889892578} -11/06/2021 22:55:31 - INFO - __main__ - Step 12127: {'lr': 0.0004942470651409207, 'samples': 2328384, 'steps': 12126, 'loss/train': 1.8729878664016724} -11/06/2021 22:55:32 - INFO - __main__ - Step 12128: {'lr': 0.000494245933194038, 'samples': 2328576, 'steps': 12127, 'loss/train': 1.1568888425827026} -11/06/2021 22:55:33 - INFO - __main__ - Step 12129: {'lr': 0.0004942448011371018, 'samples': 2328768, 'steps': 12128, 'loss/train': 1.8721987009048462} -11/06/2021 22:55:33 - INFO - __main__ - Step 12130: {'lr': 0.0004942436689701126, 'samples': 2328960, 'steps': 12129, 'loss/train': 1.7959274053573608} -11/06/2021 22:55:33 - INFO - __main__ - Step 12131: {'lr': 0.000494242536693071, 'samples': 2329152, 'steps': 12130, 'loss/train': 1.718927264213562} -11/06/2021 22:55:34 - INFO - __main__ - Step 12132: {'lr': 0.0004942414043059776, 'samples': 2329344, 'steps': 12131, 'loss/train': 1.8697373867034912} -11/06/2021 22:55:35 - INFO - __main__ - Step 12133: {'lr': 0.0004942402718088326, 'samples': 2329536, 'steps': 12132, 'loss/train': 1.8126624822616577} -11/06/2021 22:55:35 - INFO - __main__ - Step 12134: {'lr': 0.0004942391392016368, 'samples': 2329728, 'steps': 12133, 'loss/train': 1.6488497257232666} -11/06/2021 22:55:35 - INFO - __main__ - Step 12135: {'lr': 0.0004942380064843906, 'samples': 2329920, 'steps': 12134, 'loss/train': 1.8256616592407227} -11/06/2021 22:55:36 - INFO - __main__ - Step 12136: {'lr': 0.0004942368736570946, 'samples': 2330112, 'steps': 12135, 'loss/train': 1.4627264738082886} -11/06/2021 22:55:36 - INFO - __main__ - Step 12137: {'lr': 0.0004942357407197491, 'samples': 2330304, 'steps': 12136, 'loss/train': 1.6289029121398926} -11/06/2021 22:55:37 - INFO - __main__ - Step 12138: {'lr': 0.0004942346076723548, 'samples': 2330496, 'steps': 12137, 'loss/train': 1.9620447158813477} -11/06/2021 22:55:38 - INFO - __main__ - Step 12139: {'lr': 0.0004942334745149122, 'samples': 2330688, 'steps': 12138, 'loss/train': 2.0332870483398438} -11/06/2021 22:55:38 - INFO - __main__ - Step 12140: {'lr': 0.0004942323412474218, 'samples': 2330880, 'steps': 12139, 'loss/train': 1.301571249961853} -11/06/2021 22:55:38 - INFO - __main__ - Step 12141: {'lr': 0.000494231207869884, 'samples': 2331072, 'steps': 12140, 'loss/train': 1.325974941253662} -11/06/2021 22:55:39 - INFO - __main__ - Step 12142: {'lr': 0.0004942300743822993, 'samples': 2331264, 'steps': 12141, 'loss/train': 1.419464111328125} -11/06/2021 22:55:40 - INFO - __main__ - Step 12143: {'lr': 0.0004942289407846684, 'samples': 2331456, 'steps': 12142, 'loss/train': 0.5399057865142822} -11/06/2021 22:55:40 - INFO - __main__ - Step 12144: {'lr': 0.0004942278070769917, 'samples': 2331648, 'steps': 12143, 'loss/train': 1.7828236818313599} -11/06/2021 22:55:40 - INFO - __main__ - Step 12145: {'lr': 0.0004942266732592697, 'samples': 2331840, 'steps': 12144, 'loss/train': 1.8341064453125} -11/06/2021 22:55:41 - INFO - __main__ - Step 12146: {'lr': 0.0004942255393315029, 'samples': 2332032, 'steps': 12145, 'loss/train': 1.1581087112426758} -11/06/2021 22:55:41 - INFO - __main__ - Step 12147: {'lr': 0.000494224405293692, 'samples': 2332224, 'steps': 12146, 'loss/train': 1.870377779006958} -11/06/2021 22:55:41 - INFO - __main__ - Step 12148: {'lr': 0.0004942232711458372, 'samples': 2332416, 'steps': 12147, 'loss/train': 1.5845227241516113} -11/06/2021 22:55:42 - INFO - __main__ - Step 12149: {'lr': 0.0004942221368879391, 'samples': 2332608, 'steps': 12148, 'loss/train': 1.2885611057281494} -11/06/2021 22:55:43 - INFO - __main__ - Step 12150: {'lr': 0.0004942210025199985, 'samples': 2332800, 'steps': 12149, 'loss/train': 1.941924810409546} -11/06/2021 22:55:43 - INFO - __main__ - Step 12151: {'lr': 0.0004942198680420155, 'samples': 2332992, 'steps': 12150, 'loss/train': 1.2128046751022339} -11/06/2021 22:55:43 - INFO - __main__ - Step 12152: {'lr': 0.0004942187334539908, 'samples': 2333184, 'steps': 12151, 'loss/train': 1.949316382408142} -11/06/2021 22:55:44 - INFO - __main__ - Step 12153: {'lr': 0.0004942175987559251, 'samples': 2333376, 'steps': 12152, 'loss/train': 3.1983020305633545} -11/06/2021 22:55:45 - INFO - __main__ - Step 12154: {'lr': 0.0004942164639478185, 'samples': 2333568, 'steps': 12153, 'loss/train': 2.0099000930786133} -11/06/2021 22:55:45 - INFO - __main__ - Step 12155: {'lr': 0.0004942153290296718, 'samples': 2333760, 'steps': 12154, 'loss/train': 2.0011119842529297} -11/06/2021 22:55:45 - INFO - __main__ - Step 12156: {'lr': 0.0004942141940014854, 'samples': 2333952, 'steps': 12155, 'loss/train': 1.7409350872039795} -11/06/2021 22:55:46 - INFO - __main__ - Step 12157: {'lr': 0.0004942130588632599, 'samples': 2334144, 'steps': 12156, 'loss/train': 2.0252602100372314} -11/06/2021 22:55:46 - INFO - __main__ - Step 12158: {'lr': 0.0004942119236149958, 'samples': 2334336, 'steps': 12157, 'loss/train': 1.6826229095458984} -11/06/2021 22:55:47 - INFO - __main__ - Step 12159: {'lr': 0.0004942107882566936, 'samples': 2334528, 'steps': 12158, 'loss/train': 1.7889363765716553} -11/06/2021 22:55:47 - INFO - __main__ - Step 12160: {'lr': 0.0004942096527883538, 'samples': 2334720, 'steps': 12159, 'loss/train': 1.4643501043319702} -11/06/2021 22:55:48 - INFO - __main__ - Step 12161: {'lr': 0.0004942085172099768, 'samples': 2334912, 'steps': 12160, 'loss/train': 1.5718570947647095} -11/06/2021 22:55:48 - INFO - __main__ - Step 12162: {'lr': 0.0004942073815215632, 'samples': 2335104, 'steps': 12161, 'loss/train': 1.6668059825897217} -11/06/2021 22:55:49 - INFO - __main__ - Step 12163: {'lr': 0.0004942062457231136, 'samples': 2335296, 'steps': 12162, 'loss/train': 1.9814776182174683} -11/06/2021 22:55:50 - INFO - __main__ - Step 12164: {'lr': 0.0004942051098146284, 'samples': 2335488, 'steps': 12163, 'loss/train': 1.9286428689956665} -11/06/2021 22:55:50 - INFO - __main__ - Step 12165: {'lr': 0.0004942039737961081, 'samples': 2335680, 'steps': 12164, 'loss/train': 1.8754050731658936} -11/06/2021 22:55:50 - INFO - __main__ - Step 12166: {'lr': 0.0004942028376675533, 'samples': 2335872, 'steps': 12165, 'loss/train': 1.3288780450820923} -11/06/2021 22:55:51 - INFO - __main__ - Step 12167: {'lr': 0.0004942017014289645, 'samples': 2336064, 'steps': 12166, 'loss/train': 1.694525957107544} -11/06/2021 22:55:51 - INFO - __main__ - Step 12168: {'lr': 0.0004942005650803421, 'samples': 2336256, 'steps': 12167, 'loss/train': 1.5838422775268555} -11/06/2021 22:55:51 - INFO - __main__ - Step 12169: {'lr': 0.0004941994286216867, 'samples': 2336448, 'steps': 12168, 'loss/train': 1.7149986028671265} -11/06/2021 22:55:52 - INFO - __main__ - Step 12170: {'lr': 0.0004941982920529989, 'samples': 2336640, 'steps': 12169, 'loss/train': 1.529640793800354} -11/06/2021 22:55:53 - INFO - __main__ - Step 12171: {'lr': 0.0004941971553742791, 'samples': 2336832, 'steps': 12170, 'loss/train': 1.0539520978927612} -11/06/2021 22:55:53 - INFO - __main__ - Step 12172: {'lr': 0.0004941960185855278, 'samples': 2337024, 'steps': 12171, 'loss/train': 2.0904853343963623} -11/06/2021 22:55:53 - INFO - __main__ - Step 12173: {'lr': 0.0004941948816867455, 'samples': 2337216, 'steps': 12172, 'loss/train': 1.5987201929092407} -11/06/2021 22:55:54 - INFO - __main__ - Step 12174: {'lr': 0.0004941937446779328, 'samples': 2337408, 'steps': 12173, 'loss/train': 1.9558372497558594} -11/06/2021 22:55:55 - INFO - __main__ - Step 12175: {'lr': 0.0004941926075590901, 'samples': 2337600, 'steps': 12174, 'loss/train': 1.9326342344284058} -11/06/2021 22:55:55 - INFO - __main__ - Step 12176: {'lr': 0.0004941914703302181, 'samples': 2337792, 'steps': 12175, 'loss/train': 1.5912054777145386} -11/06/2021 22:55:55 - INFO - __main__ - Step 12177: {'lr': 0.0004941903329913172, 'samples': 2337984, 'steps': 12176, 'loss/train': 1.657957911491394} -11/06/2021 22:55:56 - INFO - __main__ - Step 12178: {'lr': 0.0004941891955423878, 'samples': 2338176, 'steps': 12177, 'loss/train': 2.281742811203003} -11/06/2021 22:55:56 - INFO - __main__ - Step 12179: {'lr': 0.0004941880579834306, 'samples': 2338368, 'steps': 12178, 'loss/train': 1.9655019044876099} -11/06/2021 22:55:57 - INFO - __main__ - Step 12180: {'lr': 0.0004941869203144459, 'samples': 2338560, 'steps': 12179, 'loss/train': 0.7616149187088013} -11/06/2021 22:55:58 - INFO - __main__ - Step 12181: {'lr': 0.0004941857825354344, 'samples': 2338752, 'steps': 12180, 'loss/train': 1.607176423072815} -11/06/2021 22:55:58 - INFO - __main__ - Step 12182: {'lr': 0.0004941846446463966, 'samples': 2338944, 'steps': 12181, 'loss/train': 1.9033536911010742} -11/06/2021 22:55:58 - INFO - __main__ - Step 12183: {'lr': 0.000494183506647333, 'samples': 2339136, 'steps': 12182, 'loss/train': 1.972430944442749} -11/06/2021 22:55:59 - INFO - __main__ - Step 12184: {'lr': 0.000494182368538244, 'samples': 2339328, 'steps': 12183, 'loss/train': 1.4964816570281982} -11/06/2021 22:56:00 - INFO - __main__ - Step 12185: {'lr': 0.0004941812303191302, 'samples': 2339520, 'steps': 12184, 'loss/train': 1.8058403730392456} -11/06/2021 22:56:00 - INFO - __main__ - Step 12186: {'lr': 0.0004941800919899921, 'samples': 2339712, 'steps': 12185, 'loss/train': 1.9677493572235107} -11/06/2021 22:56:00 - INFO - __main__ - Step 12187: {'lr': 0.0004941789535508303, 'samples': 2339904, 'steps': 12186, 'loss/train': 1.774878978729248} -11/06/2021 22:56:01 - INFO - __main__ - Step 12188: {'lr': 0.0004941778150016451, 'samples': 2340096, 'steps': 12187, 'loss/train': 1.5408471822738647} -11/06/2021 22:56:01 - INFO - __main__ - Step 12189: {'lr': 0.0004941766763424373, 'samples': 2340288, 'steps': 12188, 'loss/train': 1.433286190032959} -11/06/2021 22:56:02 - INFO - __main__ - Step 12190: {'lr': 0.0004941755375732071, 'samples': 2340480, 'steps': 12189, 'loss/train': 1.7328075170516968} -11/06/2021 22:56:02 - INFO - __main__ - Step 12191: {'lr': 0.0004941743986939553, 'samples': 2340672, 'steps': 12190, 'loss/train': 1.647670030593872} -11/06/2021 22:56:03 - INFO - __main__ - Step 12192: {'lr': 0.0004941732597046822, 'samples': 2340864, 'steps': 12191, 'loss/train': 1.4415473937988281} -11/06/2021 22:56:03 - INFO - __main__ - Step 12193: {'lr': 0.0004941721206053885, 'samples': 2341056, 'steps': 12192, 'loss/train': 3.6256818771362305} -11/06/2021 22:56:04 - INFO - __main__ - Step 12194: {'lr': 0.0004941709813960745, 'samples': 2341248, 'steps': 12193, 'loss/train': 1.5252056121826172} -11/06/2021 22:56:05 - INFO - __main__ - Step 12195: {'lr': 0.0004941698420767408, 'samples': 2341440, 'steps': 12194, 'loss/train': 1.3925776481628418} -11/06/2021 22:56:05 - INFO - __main__ - Step 12196: {'lr': 0.0004941687026473881, 'samples': 2341632, 'steps': 12195, 'loss/train': 0.3151058852672577} -11/06/2021 22:56:05 - INFO - __main__ - Step 12197: {'lr': 0.0004941675631080166, 'samples': 2341824, 'steps': 12196, 'loss/train': 2.0778465270996094} -11/06/2021 22:56:06 - INFO - __main__ - Step 12198: {'lr': 0.000494166423458627, 'samples': 2342016, 'steps': 12197, 'loss/train': 2.043381929397583} -11/06/2021 22:56:06 - INFO - __main__ - Step 12199: {'lr': 0.0004941652836992198, 'samples': 2342208, 'steps': 12198, 'loss/train': 1.0915753841400146} -11/06/2021 22:56:06 - INFO - __main__ - Step 12200: {'lr': 0.0004941641438297955, 'samples': 2342400, 'steps': 12199, 'loss/train': 1.6756670475006104} -11/06/2021 22:56:07 - INFO - __main__ - Step 12201: {'lr': 0.0004941630038503545, 'samples': 2342592, 'steps': 12200, 'loss/train': 1.9415992498397827} -11/06/2021 22:56:08 - INFO - __main__ - Step 12202: {'lr': 0.0004941618637608976, 'samples': 2342784, 'steps': 12201, 'loss/train': 2.4285848140716553} -11/06/2021 22:56:08 - INFO - __main__ - Step 12203: {'lr': 0.000494160723561425, 'samples': 2342976, 'steps': 12202, 'loss/train': 0.7406458854675293} -11/06/2021 22:56:08 - INFO - __main__ - Step 12204: {'lr': 0.0004941595832519374, 'samples': 2343168, 'steps': 12203, 'loss/train': 1.799933910369873} -11/06/2021 22:56:09 - INFO - __main__ - Step 12205: {'lr': 0.0004941584428324352, 'samples': 2343360, 'steps': 12204, 'loss/train': 1.6155633926391602} -11/06/2021 22:56:10 - INFO - __main__ - Step 12206: {'lr': 0.000494157302302919, 'samples': 2343552, 'steps': 12205, 'loss/train': 1.4476592540740967} -11/06/2021 22:56:10 - INFO - __main__ - Step 12207: {'lr': 0.0004941561616633893, 'samples': 2343744, 'steps': 12206, 'loss/train': 1.3193042278289795} -11/06/2021 22:56:11 - INFO - __main__ - Step 12208: {'lr': 0.0004941550209138466, 'samples': 2343936, 'steps': 12207, 'loss/train': 0.9178276062011719} -11/06/2021 22:56:11 - INFO - __main__ - Step 12209: {'lr': 0.0004941538800542915, 'samples': 2344128, 'steps': 12208, 'loss/train': 2.1289122104644775} -11/06/2021 22:56:11 - INFO - __main__ - Step 12210: {'lr': 0.0004941527390847243, 'samples': 2344320, 'steps': 12209, 'loss/train': 1.1334985494613647} -11/06/2021 22:56:12 - INFO - __main__ - Step 12211: {'lr': 0.0004941515980051457, 'samples': 2344512, 'steps': 12210, 'loss/train': 1.8072400093078613} -11/06/2021 22:56:13 - INFO - __main__ - Step 12212: {'lr': 0.0004941504568155561, 'samples': 2344704, 'steps': 12211, 'loss/train': 2.0195960998535156} -11/06/2021 22:56:13 - INFO - __main__ - Step 12213: {'lr': 0.0004941493155159562, 'samples': 2344896, 'steps': 12212, 'loss/train': 1.8710730075836182} -11/06/2021 22:56:13 - INFO - __main__ - Step 12214: {'lr': 0.0004941481741063462, 'samples': 2345088, 'steps': 12213, 'loss/train': 6.926916599273682} -11/06/2021 22:56:14 - INFO - __main__ - Step 12215: {'lr': 0.000494147032586727, 'samples': 2345280, 'steps': 12214, 'loss/train': 1.6592782735824585} -11/06/2021 22:56:14 - INFO - __main__ - Step 12216: {'lr': 0.0004941458909570988, 'samples': 2345472, 'steps': 12215, 'loss/train': 2.1829493045806885} -11/06/2021 22:56:14 - INFO - __main__ - Step 12217: {'lr': 0.0004941447492174622, 'samples': 2345664, 'steps': 12216, 'loss/train': 1.9610031843185425} -11/06/2021 22:56:15 - INFO - __main__ - Step 12218: {'lr': 0.0004941436073678179, 'samples': 2345856, 'steps': 12217, 'loss/train': 1.678484320640564} -11/06/2021 22:56:16 - INFO - __main__ - Step 12219: {'lr': 0.0004941424654081661, 'samples': 2346048, 'steps': 12218, 'loss/train': 1.9036375284194946} -11/06/2021 22:56:16 - INFO - __main__ - Step 12220: {'lr': 0.0004941413233385075, 'samples': 2346240, 'steps': 12219, 'loss/train': 1.5224061012268066} -11/06/2021 22:56:16 - INFO - __main__ - Step 12221: {'lr': 0.0004941401811588426, 'samples': 2346432, 'steps': 12220, 'loss/train': 1.5389779806137085} -11/06/2021 22:56:17 - INFO - __main__ - Step 12222: {'lr': 0.0004941390388691719, 'samples': 2346624, 'steps': 12221, 'loss/train': 1.6822108030319214} -11/06/2021 22:56:18 - INFO - __main__ - Step 12223: {'lr': 0.0004941378964694959, 'samples': 2346816, 'steps': 12222, 'loss/train': 1.6283819675445557} -11/06/2021 22:56:18 - INFO - __main__ - Step 12224: {'lr': 0.0004941367539598152, 'samples': 2347008, 'steps': 12223, 'loss/train': 2.0302186012268066} -11/06/2021 22:56:19 - INFO - __main__ - Step 12225: {'lr': 0.0004941356113401301, 'samples': 2347200, 'steps': 12224, 'loss/train': 1.9460519552230835} -11/06/2021 22:56:19 - INFO - __main__ - Step 12226: {'lr': 0.0004941344686104414, 'samples': 2347392, 'steps': 12225, 'loss/train': 1.5134607553482056} -11/06/2021 22:56:19 - INFO - __main__ - Step 12227: {'lr': 0.0004941333257707495, 'samples': 2347584, 'steps': 12226, 'loss/train': 1.468488097190857} -11/06/2021 22:56:20 - INFO - __main__ - Step 12228: {'lr': 0.0004941321828210548, 'samples': 2347776, 'steps': 12227, 'loss/train': 1.6733677387237549} -11/06/2021 22:56:21 - INFO - __main__ - Step 12229: {'lr': 0.000494131039761358, 'samples': 2347968, 'steps': 12228, 'loss/train': 1.7591148614883423} -11/06/2021 22:56:21 - INFO - __main__ - Step 12230: {'lr': 0.0004941298965916594, 'samples': 2348160, 'steps': 12229, 'loss/train': 7.689951419830322} -11/06/2021 22:56:21 - INFO - __main__ - Step 12231: {'lr': 0.0004941287533119597, 'samples': 2348352, 'steps': 12230, 'loss/train': 1.1296072006225586} -11/06/2021 22:56:22 - INFO - __main__ - Step 12232: {'lr': 0.0004941276099222593, 'samples': 2348544, 'steps': 12231, 'loss/train': 1.8858994245529175} -11/06/2021 22:56:22 - INFO - __main__ - Step 12233: {'lr': 0.0004941264664225589, 'samples': 2348736, 'steps': 12232, 'loss/train': 1.4118883609771729} -11/06/2021 22:56:23 - INFO - __main__ - Step 12234: {'lr': 0.0004941253228128588, 'samples': 2348928, 'steps': 12233, 'loss/train': 2.075518846511841} -11/06/2021 22:56:24 - INFO - __main__ - Step 12235: {'lr': 0.0004941241790931595, 'samples': 2349120, 'steps': 12234, 'loss/train': 1.6000714302062988} -11/06/2021 22:56:24 - INFO - __main__ - Step 12236: {'lr': 0.0004941230352634617, 'samples': 2349312, 'steps': 12235, 'loss/train': 1.9275367259979248} -11/06/2021 22:56:24 - INFO - __main__ - Step 12237: {'lr': 0.0004941218913237658, 'samples': 2349504, 'steps': 12236, 'loss/train': 2.1970300674438477} -11/06/2021 22:56:25 - INFO - __main__ - Step 12238: {'lr': 0.0004941207472740724, 'samples': 2349696, 'steps': 12237, 'loss/train': 1.9084161520004272} -11/06/2021 22:56:26 - INFO - __main__ - Step 12239: {'lr': 0.000494119603114382, 'samples': 2349888, 'steps': 12238, 'loss/train': 2.308227062225342} -11/06/2021 22:56:26 - INFO - __main__ - Step 12240: {'lr': 0.000494118458844695, 'samples': 2350080, 'steps': 12239, 'loss/train': 2.078315019607544} -11/06/2021 22:56:26 - INFO - __main__ - Step 12241: {'lr': 0.0004941173144650119, 'samples': 2350272, 'steps': 12240, 'loss/train': 1.4600110054016113} -11/06/2021 22:56:27 - INFO - __main__ - Step 12242: {'lr': 0.0004941161699753335, 'samples': 2350464, 'steps': 12241, 'loss/train': 2.5496790409088135} -11/06/2021 22:56:27 - INFO - __main__ - Step 12243: {'lr': 0.00049411502537566, 'samples': 2350656, 'steps': 12242, 'loss/train': 1.7416751384735107} -11/06/2021 22:56:28 - INFO - __main__ - Step 12244: {'lr': 0.0004941138806659921, 'samples': 2350848, 'steps': 12243, 'loss/train': 1.8958357572555542} -11/06/2021 22:56:29 - INFO - __main__ - Step 12245: {'lr': 0.00049411273584633, 'samples': 2351040, 'steps': 12244, 'loss/train': 1.8675121068954468} -11/06/2021 22:56:29 - INFO - __main__ - Step 12246: {'lr': 0.0004941115909166748, 'samples': 2351232, 'steps': 12245, 'loss/train': 1.8117626905441284} -11/06/2021 22:56:29 - INFO - __main__ - Step 12247: {'lr': 0.0004941104458770266, 'samples': 2351424, 'steps': 12246, 'loss/train': 1.715092420578003} -11/06/2021 22:56:30 - INFO - __main__ - Step 12248: {'lr': 0.0004941093007273859, 'samples': 2351616, 'steps': 12247, 'loss/train': 2.001997470855713} -11/06/2021 22:56:30 - INFO - __main__ - Step 12249: {'lr': 0.0004941081554677534, 'samples': 2351808, 'steps': 12248, 'loss/train': 1.8709745407104492} -11/06/2021 22:56:31 - INFO - __main__ - Step 12250: {'lr': 0.0004941070100981295, 'samples': 2352000, 'steps': 12249, 'loss/train': 2.0071144104003906} -11/06/2021 22:56:32 - INFO - __main__ - Step 12251: {'lr': 0.0004941058646185148, 'samples': 2352192, 'steps': 12250, 'loss/train': 1.7076789140701294} -11/06/2021 22:56:32 - INFO - __main__ - Step 12252: {'lr': 0.0004941047190289096, 'samples': 2352384, 'steps': 12251, 'loss/train': 2.314211845397949} -11/06/2021 22:56:32 - INFO - __main__ - Step 12253: {'lr': 0.0004941035733293148, 'samples': 2352576, 'steps': 12252, 'loss/train': 2.0742650032043457} -11/06/2021 22:56:33 - INFO - __main__ - Step 12254: {'lr': 0.0004941024275197305, 'samples': 2352768, 'steps': 12253, 'loss/train': 1.7907441854476929} -11/06/2021 22:56:34 - INFO - __main__ - Step 12255: {'lr': 0.0004941012816001575, 'samples': 2352960, 'steps': 12254, 'loss/train': 1.6902923583984375} -11/06/2021 22:56:34 - INFO - __main__ - Step 12256: {'lr': 0.0004941001355705963, 'samples': 2353152, 'steps': 12255, 'loss/train': 1.4194196462631226} -11/06/2021 22:56:34 - INFO - __main__ - Step 12257: {'lr': 0.0004940989894310473, 'samples': 2353344, 'steps': 12256, 'loss/train': 2.029238224029541} -11/06/2021 22:56:35 - INFO - __main__ - Step 12258: {'lr': 0.000494097843181511, 'samples': 2353536, 'steps': 12257, 'loss/train': 1.5298515558242798} -11/06/2021 22:56:35 - INFO - __main__ - Step 12259: {'lr': 0.0004940966968219881, 'samples': 2353728, 'steps': 12258, 'loss/train': 1.807405948638916} -11/06/2021 22:56:35 - INFO - __main__ - Step 12260: {'lr': 0.0004940955503524789, 'samples': 2353920, 'steps': 12259, 'loss/train': 1.857525110244751} -11/06/2021 22:56:36 - INFO - __main__ - Step 12261: {'lr': 0.000494094403772984, 'samples': 2354112, 'steps': 12260, 'loss/train': 1.2936711311340332} -11/06/2021 22:56:37 - INFO - __main__ - Step 12262: {'lr': 0.0004940932570835039, 'samples': 2354304, 'steps': 12261, 'loss/train': 1.5933314561843872} -11/06/2021 22:56:37 - INFO - __main__ - Step 12263: {'lr': 0.0004940921102840393, 'samples': 2354496, 'steps': 12262, 'loss/train': 1.8495118618011475} -11/06/2021 22:56:37 - INFO - __main__ - Step 12264: {'lr': 0.0004940909633745905, 'samples': 2354688, 'steps': 12263, 'loss/train': 1.749647617340088} -11/06/2021 22:56:38 - INFO - __main__ - Step 12265: {'lr': 0.000494089816355158, 'samples': 2354880, 'steps': 12264, 'loss/train': 1.2525612115859985} -11/06/2021 22:56:39 - INFO - __main__ - Step 12266: {'lr': 0.0004940886692257424, 'samples': 2355072, 'steps': 12265, 'loss/train': 1.6700724363327026} -11/06/2021 22:56:40 - INFO - __main__ - Step 12267: {'lr': 0.0004940875219863443, 'samples': 2355264, 'steps': 12266, 'loss/train': 1.503882646560669} -11/06/2021 22:56:40 - INFO - __main__ - Step 12268: {'lr': 0.0004940863746369641, 'samples': 2355456, 'steps': 12267, 'loss/train': 1.7664172649383545} -11/06/2021 22:56:40 - INFO - __main__ - Step 12269: {'lr': 0.0004940852271776023, 'samples': 2355648, 'steps': 12268, 'loss/train': 1.7359364032745361} -11/06/2021 22:56:41 - INFO - __main__ - Step 12270: {'lr': 0.0004940840796082594, 'samples': 2355840, 'steps': 12269, 'loss/train': 1.848609447479248} -11/06/2021 22:56:41 - INFO - __main__ - Step 12271: {'lr': 0.0004940829319289361, 'samples': 2356032, 'steps': 12270, 'loss/train': 1.8408467769622803} -11/06/2021 22:56:42 - INFO - __main__ - Step 12272: {'lr': 0.0004940817841396327, 'samples': 2356224, 'steps': 12271, 'loss/train': 1.7952295541763306} -11/06/2021 22:56:42 - INFO - __main__ - Step 12273: {'lr': 0.0004940806362403499, 'samples': 2356416, 'steps': 12272, 'loss/train': 2.3083720207214355} -11/06/2021 22:56:43 - INFO - __main__ - Step 12274: {'lr': 0.0004940794882310882, 'samples': 2356608, 'steps': 12273, 'loss/train': 1.8015666007995605} -11/06/2021 22:56:43 - INFO - __main__ - Step 12275: {'lr': 0.000494078340111848, 'samples': 2356800, 'steps': 12274, 'loss/train': 1.8969393968582153} -11/06/2021 22:56:43 - INFO - __main__ - Step 12276: {'lr': 0.0004940771918826298, 'samples': 2356992, 'steps': 12275, 'loss/train': 1.4344086647033691} -11/06/2021 22:56:44 - INFO - __main__ - Step 12277: {'lr': 0.0004940760435434341, 'samples': 2357184, 'steps': 12276, 'loss/train': 1.9090864658355713} -11/06/2021 22:56:45 - INFO - __main__ - Step 12278: {'lr': 0.0004940748950942618, 'samples': 2357376, 'steps': 12277, 'loss/train': 1.6862670183181763} -11/06/2021 22:56:45 - INFO - __main__ - Step 12279: {'lr': 0.0004940737465351128, 'samples': 2357568, 'steps': 12278, 'loss/train': 1.9722408056259155} -11/06/2021 22:56:45 - INFO - __main__ - Step 12280: {'lr': 0.0004940725978659881, 'samples': 2357760, 'steps': 12279, 'loss/train': 1.9200348854064941} -11/06/2021 22:56:46 - INFO - __main__ - Step 12281: {'lr': 0.000494071449086888, 'samples': 2357952, 'steps': 12280, 'loss/train': 1.9199883937835693} -11/06/2021 22:56:47 - INFO - __main__ - Step 12282: {'lr': 0.0004940703001978131, 'samples': 2358144, 'steps': 12281, 'loss/train': 1.2483066320419312} -11/06/2021 22:56:47 - INFO - __main__ - Step 12283: {'lr': 0.0004940691511987639, 'samples': 2358336, 'steps': 12282, 'loss/train': 1.7513079643249512} -11/06/2021 22:56:47 - INFO - __main__ - Step 12284: {'lr': 0.0004940680020897409, 'samples': 2358528, 'steps': 12283, 'loss/train': 5.813735485076904} -11/06/2021 22:56:48 - INFO - __main__ - Step 12285: {'lr': 0.0004940668528707446, 'samples': 2358720, 'steps': 12284, 'loss/train': 1.4615005254745483} -11/06/2021 22:56:48 - INFO - __main__ - Step 12286: {'lr': 0.0004940657035417755, 'samples': 2358912, 'steps': 12285, 'loss/train': 2.1803793907165527} -11/06/2021 22:56:49 - INFO - __main__ - Step 12287: {'lr': 0.0004940645541028343, 'samples': 2359104, 'steps': 12286, 'loss/train': 3.126666307449341} -11/06/2021 22:56:50 - INFO - __main__ - Step 12288: {'lr': 0.0004940634045539213, 'samples': 2359296, 'steps': 12287, 'loss/train': 1.47324800491333} -11/06/2021 22:56:50 - INFO - __main__ - Step 12289: {'lr': 0.000494062254895037, 'samples': 2359488, 'steps': 12288, 'loss/train': 1.7035387754440308} -11/06/2021 22:56:50 - INFO - __main__ - Step 12290: {'lr': 0.0004940611051261822, 'samples': 2359680, 'steps': 12289, 'loss/train': 1.6604784727096558} -11/06/2021 22:56:51 - INFO - __main__ - Step 12291: {'lr': 0.000494059955247357, 'samples': 2359872, 'steps': 12290, 'loss/train': 1.833449125289917} -11/06/2021 22:56:51 - INFO - __main__ - Step 12292: {'lr': 0.0004940588052585624, 'samples': 2360064, 'steps': 12291, 'loss/train': 1.7617274522781372} -11/06/2021 22:56:52 - INFO - __main__ - Step 12293: {'lr': 0.0004940576551597985, 'samples': 2360256, 'steps': 12292, 'loss/train': 1.5269970893859863} -11/06/2021 22:56:52 - INFO - __main__ - Step 12294: {'lr': 0.000494056504951066, 'samples': 2360448, 'steps': 12293, 'loss/train': 0.993115246295929} -11/06/2021 22:56:53 - INFO - __main__ - Step 12295: {'lr': 0.0004940553546323655, 'samples': 2360640, 'steps': 12294, 'loss/train': 1.4290341138839722} -11/06/2021 22:56:53 - INFO - __main__ - Step 12296: {'lr': 0.0004940542042036974, 'samples': 2360832, 'steps': 12295, 'loss/train': 1.7313815355300903} -11/06/2021 22:56:53 - INFO - __main__ - Step 12297: {'lr': 0.0004940530536650621, 'samples': 2361024, 'steps': 12296, 'loss/train': 1.907927393913269} -11/06/2021 22:56:54 - INFO - __main__ - Step 12298: {'lr': 0.0004940519030164605, 'samples': 2361216, 'steps': 12297, 'loss/train': 1.4239506721496582} -11/06/2021 22:56:55 - INFO - __main__ - Step 12299: {'lr': 0.0004940507522578927, 'samples': 2361408, 'steps': 12298, 'loss/train': 2.017463207244873} -11/06/2021 22:56:55 - INFO - __main__ - Step 12300: {'lr': 0.0004940496013893594, 'samples': 2361600, 'steps': 12299, 'loss/train': 1.8298779726028442} -11/06/2021 22:56:55 - INFO - __main__ - Step 12301: {'lr': 0.0004940484504108612, 'samples': 2361792, 'steps': 12300, 'loss/train': 1.4371073246002197} -11/06/2021 22:56:56 - INFO - __main__ - Step 12302: {'lr': 0.0004940472993223985, 'samples': 2361984, 'steps': 12301, 'loss/train': 1.8154419660568237} -11/06/2021 22:56:56 - INFO - __main__ - Step 12303: {'lr': 0.0004940461481239719, 'samples': 2362176, 'steps': 12302, 'loss/train': 1.6027586460113525} -11/06/2021 22:56:57 - INFO - __main__ - Step 12304: {'lr': 0.0004940449968155818, 'samples': 2362368, 'steps': 12303, 'loss/train': 2.39496111869812} -11/06/2021 22:56:58 - INFO - __main__ - Step 12305: {'lr': 0.0004940438453972288, 'samples': 2362560, 'steps': 12304, 'loss/train': 1.6671775579452515} -11/06/2021 22:56:58 - INFO - __main__ - Step 12306: {'lr': 0.0004940426938689135, 'samples': 2362752, 'steps': 12305, 'loss/train': 1.91392183303833} -11/06/2021 22:56:58 - INFO - __main__ - Step 12307: {'lr': 0.0004940415422306361, 'samples': 2362944, 'steps': 12306, 'loss/train': 1.1845285892486572} -11/06/2021 22:56:59 - INFO - __main__ - Step 12308: {'lr': 0.0004940403904823976, 'samples': 2363136, 'steps': 12307, 'loss/train': 1.8613651990890503} -11/06/2021 22:57:00 - INFO - __main__ - Step 12309: {'lr': 0.0004940392386241981, 'samples': 2363328, 'steps': 12308, 'loss/train': 2.2593603134155273} -11/06/2021 22:57:00 - INFO - __main__ - Step 12310: {'lr': 0.0004940380866560384, 'samples': 2363520, 'steps': 12309, 'loss/train': 1.829590916633606} -11/06/2021 22:57:00 - INFO - __main__ - Step 12311: {'lr': 0.0004940369345779187, 'samples': 2363712, 'steps': 12310, 'loss/train': 1.535210371017456} -11/06/2021 22:57:01 - INFO - __main__ - Step 12312: {'lr': 0.00049403578238984, 'samples': 2363904, 'steps': 12311, 'loss/train': 1.498138189315796} -11/06/2021 22:57:01 - INFO - __main__ - Step 12313: {'lr': 0.0004940346300918024, 'samples': 2364096, 'steps': 12312, 'loss/train': 1.6373891830444336} -11/06/2021 22:57:02 - INFO - __main__ - Step 12314: {'lr': 0.0004940334776838065, 'samples': 2364288, 'steps': 12313, 'loss/train': 2.0152111053466797} -11/06/2021 22:57:02 - INFO - __main__ - Step 12315: {'lr': 0.000494032325165853, 'samples': 2364480, 'steps': 12314, 'loss/train': 1.4806876182556152} -11/06/2021 22:57:03 - INFO - __main__ - Step 12316: {'lr': 0.0004940311725379423, 'samples': 2364672, 'steps': 12315, 'loss/train': 1.7899569272994995} -11/06/2021 22:57:03 - INFO - __main__ - Step 12317: {'lr': 0.0004940300198000748, 'samples': 2364864, 'steps': 12316, 'loss/train': 1.8684685230255127} -11/06/2021 22:57:03 - INFO - __main__ - Step 12318: {'lr': 0.0004940288669522513, 'samples': 2365056, 'steps': 12317, 'loss/train': 1.5197453498840332} -11/06/2021 22:57:05 - INFO - __main__ - Step 12319: {'lr': 0.000494027713994472, 'samples': 2365248, 'steps': 12318, 'loss/train': 1.7379388809204102} -11/06/2021 22:57:05 - INFO - __main__ - Step 12320: {'lr': 0.0004940265609267377, 'samples': 2365440, 'steps': 12319, 'loss/train': 1.384351372718811} -11/06/2021 22:57:05 - INFO - __main__ - Step 12321: {'lr': 0.0004940254077490487, 'samples': 2365632, 'steps': 12320, 'loss/train': 2.0284841060638428} -11/06/2021 22:57:06 - INFO - __main__ - Step 12322: {'lr': 0.0004940242544614056, 'samples': 2365824, 'steps': 12321, 'loss/train': 1.541722297668457} -11/06/2021 22:57:06 - INFO - __main__ - Step 12323: {'lr': 0.0004940231010638091, 'samples': 2366016, 'steps': 12322, 'loss/train': 1.9831137657165527} -11/06/2021 22:57:07 - INFO - __main__ - Step 12324: {'lr': 0.0004940219475562593, 'samples': 2366208, 'steps': 12323, 'loss/train': 0.3079480528831482} -11/06/2021 22:57:08 - INFO - __main__ - Step 12325: {'lr': 0.0004940207939387573, 'samples': 2366400, 'steps': 12324, 'loss/train': 1.5259820222854614} -11/06/2021 22:57:08 - INFO - __main__ - Step 12326: {'lr': 0.0004940196402113031, 'samples': 2366592, 'steps': 12325, 'loss/train': 1.683254361152649} -11/06/2021 22:57:08 - INFO - __main__ - Step 12327: {'lr': 0.0004940184863738975, 'samples': 2366784, 'steps': 12326, 'loss/train': 1.8076988458633423} -11/06/2021 22:57:09 - INFO - __main__ - Step 12328: {'lr': 0.0004940173324265407, 'samples': 2366976, 'steps': 12327, 'loss/train': 1.4422165155410767} -11/06/2021 22:57:10 - INFO - __main__ - Step 12329: {'lr': 0.0004940161783692338, 'samples': 2367168, 'steps': 12328, 'loss/train': 1.9659552574157715} -11/06/2021 22:57:10 - INFO - __main__ - Step 12330: {'lr': 0.0004940150242019768, 'samples': 2367360, 'steps': 12329, 'loss/train': 1.24222731590271} -11/06/2021 22:57:11 - INFO - __main__ - Step 12331: {'lr': 0.0004940138699247704, 'samples': 2367552, 'steps': 12330, 'loss/train': 2.182091474533081} -11/06/2021 22:57:11 - INFO - __main__ - Step 12332: {'lr': 0.0004940127155376151, 'samples': 2367744, 'steps': 12331, 'loss/train': 1.8635755777359009} -11/06/2021 22:57:11 - INFO - __main__ - Step 12333: {'lr': 0.0004940115610405114, 'samples': 2367936, 'steps': 12332, 'loss/train': 1.9940561056137085} -11/06/2021 22:57:12 - INFO - __main__ - Step 12334: {'lr': 0.0004940104064334599, 'samples': 2368128, 'steps': 12333, 'loss/train': 1.4782226085662842} -11/06/2021 22:57:12 - INFO - __main__ - Step 12335: {'lr': 0.0004940092517164612, 'samples': 2368320, 'steps': 12334, 'loss/train': 1.205909252166748} -11/06/2021 22:57:13 - INFO - __main__ - Step 12336: {'lr': 0.0004940080968895155, 'samples': 2368512, 'steps': 12335, 'loss/train': 2.1496191024780273} -11/06/2021 22:57:13 - INFO - __main__ - Step 12337: {'lr': 0.0004940069419526236, 'samples': 2368704, 'steps': 12336, 'loss/train': 1.5507055521011353} -11/06/2021 22:57:14 - INFO - __main__ - Step 12338: {'lr': 0.0004940057869057859, 'samples': 2368896, 'steps': 12337, 'loss/train': 0.8827195763587952} -11/06/2021 22:57:14 - INFO - __main__ - Step 12339: {'lr': 0.000494004631749003, 'samples': 2369088, 'steps': 12338, 'loss/train': 1.7027802467346191} -11/06/2021 22:57:14 - INFO - __main__ - Step 12340: {'lr': 0.0004940034764822754, 'samples': 2369280, 'steps': 12339, 'loss/train': 1.6618696451187134} -11/06/2021 22:57:15 - INFO - __main__ - Step 12341: {'lr': 0.0004940023211056036, 'samples': 2369472, 'steps': 12340, 'loss/train': 1.9544622898101807} -11/06/2021 22:57:16 - INFO - __main__ - Step 12342: {'lr': 0.0004940011656189881, 'samples': 2369664, 'steps': 12341, 'loss/train': 1.8119089603424072} -11/06/2021 22:57:16 - INFO - __main__ - Step 12343: {'lr': 0.0004940000100224295, 'samples': 2369856, 'steps': 12342, 'loss/train': 1.2512726783752441} -11/06/2021 22:57:17 - INFO - __main__ - Step 12344: {'lr': 0.0004939988543159282, 'samples': 2370048, 'steps': 12343, 'loss/train': 1.5961833000183105} -11/06/2021 22:57:17 - INFO - __main__ - Step 12345: {'lr': 0.0004939976984994847, 'samples': 2370240, 'steps': 12344, 'loss/train': 1.501064419746399} -11/06/2021 22:57:18 - INFO - __main__ - Step 12346: {'lr': 0.0004939965425730996, 'samples': 2370432, 'steps': 12345, 'loss/train': 1.6873294115066528} -11/06/2021 22:57:18 - INFO - __main__ - Step 12347: {'lr': 0.0004939953865367735, 'samples': 2370624, 'steps': 12346, 'loss/train': 1.1613168716430664} -11/06/2021 22:57:19 - INFO - __main__ - Step 12348: {'lr': 0.0004939942303905069, 'samples': 2370816, 'steps': 12347, 'loss/train': 1.5683062076568604} -11/06/2021 22:57:19 - INFO - __main__ - Step 12349: {'lr': 0.0004939930741343002, 'samples': 2371008, 'steps': 12348, 'loss/train': 1.0350655317306519} -11/06/2021 22:57:19 - INFO - __main__ - Step 12350: {'lr': 0.000493991917768154, 'samples': 2371200, 'steps': 12349, 'loss/train': 1.5559569597244263} -11/06/2021 22:57:20 - INFO - __main__ - Step 12351: {'lr': 0.0004939907612920688, 'samples': 2371392, 'steps': 12350, 'loss/train': 1.799564003944397} -11/06/2021 22:57:21 - INFO - __main__ - Step 12352: {'lr': 0.0004939896047060451, 'samples': 2371584, 'steps': 12351, 'loss/train': 1.0660388469696045} -11/06/2021 22:57:21 - INFO - __main__ - Step 12353: {'lr': 0.0004939884480100836, 'samples': 2371776, 'steps': 12352, 'loss/train': 1.4161072969436646} -11/06/2021 22:57:21 - INFO - __main__ - Step 12354: {'lr': 0.0004939872912041844, 'samples': 2371968, 'steps': 12353, 'loss/train': 1.7622441053390503} -11/06/2021 22:57:22 - INFO - __main__ - Step 12355: {'lr': 0.0004939861342883485, 'samples': 2372160, 'steps': 12354, 'loss/train': 1.4472774267196655} -11/06/2021 22:57:22 - INFO - __main__ - Step 12356: {'lr': 0.0004939849772625761, 'samples': 2372352, 'steps': 12355, 'loss/train': 1.7829986810684204} -11/06/2021 22:57:23 - INFO - __main__ - Step 12357: {'lr': 0.0004939838201268679, 'samples': 2372544, 'steps': 12356, 'loss/train': 2.1662769317626953} -11/06/2021 22:57:24 - INFO - __main__ - Step 12358: {'lr': 0.0004939826628812244, 'samples': 2372736, 'steps': 12357, 'loss/train': 1.5202739238739014} -11/06/2021 22:57:24 - INFO - __main__ - Step 12359: {'lr': 0.000493981505525646, 'samples': 2372928, 'steps': 12358, 'loss/train': 1.9102394580841064} -11/06/2021 22:57:24 - INFO - __main__ - Step 12360: {'lr': 0.0004939803480601333, 'samples': 2373120, 'steps': 12359, 'loss/train': 1.4958027601242065} -11/06/2021 22:57:25 - INFO - __main__ - Step 12361: {'lr': 0.0004939791904846869, 'samples': 2373312, 'steps': 12360, 'loss/train': 1.0917266607284546} -11/06/2021 22:57:26 - INFO - __main__ - Step 12362: {'lr': 0.0004939780327993072, 'samples': 2373504, 'steps': 12361, 'loss/train': 1.7016918659210205} -11/06/2021 22:57:26 - INFO - __main__ - Step 12363: {'lr': 0.0004939768750039946, 'samples': 2373696, 'steps': 12362, 'loss/train': 1.3413039445877075} -11/06/2021 22:57:26 - INFO - __main__ - Step 12364: {'lr': 0.00049397571709875, 'samples': 2373888, 'steps': 12363, 'loss/train': 2.0355639457702637} -11/06/2021 22:57:27 - INFO - __main__ - Step 12365: {'lr': 0.0004939745590835736, 'samples': 2374080, 'steps': 12364, 'loss/train': 2.2837467193603516} -11/06/2021 22:57:27 - INFO - __main__ - Step 12366: {'lr': 0.0004939734009584661, 'samples': 2374272, 'steps': 12365, 'loss/train': 2.075040578842163} -11/06/2021 22:57:28 - INFO - __main__ - Step 12367: {'lr': 0.0004939722427234279, 'samples': 2374464, 'steps': 12366, 'loss/train': 1.9329279661178589} -11/06/2021 22:57:28 - INFO - __main__ - Step 12368: {'lr': 0.0004939710843784596, 'samples': 2374656, 'steps': 12367, 'loss/train': 1.624833106994629} -11/06/2021 22:57:29 - INFO - __main__ - Step 12369: {'lr': 0.0004939699259235617, 'samples': 2374848, 'steps': 12368, 'loss/train': 1.8931273221969604} -11/06/2021 22:57:29 - INFO - __main__ - Step 12370: {'lr': 0.0004939687673587346, 'samples': 2375040, 'steps': 12369, 'loss/train': 1.79799222946167} -11/06/2021 22:57:29 - INFO - __main__ - Step 12371: {'lr': 0.0004939676086839791, 'samples': 2375232, 'steps': 12370, 'loss/train': 1.7580457925796509} -11/06/2021 22:57:30 - INFO - __main__ - Step 12372: {'lr': 0.0004939664498992955, 'samples': 2375424, 'steps': 12371, 'loss/train': 1.5857473611831665} -11/06/2021 22:57:31 - INFO - __main__ - Step 12373: {'lr': 0.0004939652910046844, 'samples': 2375616, 'steps': 12372, 'loss/train': 1.6514397859573364} -11/06/2021 22:57:31 - INFO - __main__ - Step 12374: {'lr': 0.0004939641320001462, 'samples': 2375808, 'steps': 12373, 'loss/train': 1.8684816360473633} -11/06/2021 22:57:31 - INFO - __main__ - Step 12375: {'lr': 0.0004939629728856817, 'samples': 2376000, 'steps': 12374, 'loss/train': 1.2412973642349243} -11/06/2021 22:57:32 - INFO - __main__ - Step 12376: {'lr': 0.0004939618136612911, 'samples': 2376192, 'steps': 12375, 'loss/train': 1.7167083024978638} -11/06/2021 22:57:33 - INFO - __main__ - Step 12377: {'lr': 0.0004939606543269751, 'samples': 2376384, 'steps': 12376, 'loss/train': 1.4133563041687012} -11/06/2021 22:57:33 - INFO - __main__ - Step 12378: {'lr': 0.0004939594948827343, 'samples': 2376576, 'steps': 12377, 'loss/train': 1.8891206979751587} -11/06/2021 22:57:34 - INFO - __main__ - Step 12379: {'lr': 0.000493958335328569, 'samples': 2376768, 'steps': 12378, 'loss/train': 1.7850967645645142} -11/06/2021 22:57:34 - INFO - __main__ - Step 12380: {'lr': 0.0004939571756644799, 'samples': 2376960, 'steps': 12379, 'loss/train': 1.6386349201202393} -11/06/2021 22:57:34 - INFO - __main__ - Step 12381: {'lr': 0.0004939560158904675, 'samples': 2377152, 'steps': 12380, 'loss/train': 0.9704276323318481} -11/06/2021 22:57:36 - INFO - __main__ - Step 12382: {'lr': 0.0004939548560065322, 'samples': 2377344, 'steps': 12381, 'loss/train': 1.7817976474761963} -11/06/2021 22:57:36 - INFO - __main__ - Step 12383: {'lr': 0.0004939536960126746, 'samples': 2377536, 'steps': 12382, 'loss/train': 1.5621471405029297} -11/06/2021 22:57:37 - INFO - __main__ - Step 12384: {'lr': 0.0004939525359088953, 'samples': 2377728, 'steps': 12383, 'loss/train': 1.8215516805648804} -11/06/2021 22:57:37 - INFO - __main__ - Step 12385: {'lr': 0.0004939513756951946, 'samples': 2377920, 'steps': 12384, 'loss/train': 1.7546138763427734} -11/06/2021 22:57:37 - INFO - __main__ - Step 12386: {'lr': 0.0004939502153715733, 'samples': 2378112, 'steps': 12385, 'loss/train': 1.881219744682312} -11/06/2021 22:57:38 - INFO - __main__ - Step 12387: {'lr': 0.0004939490549380318, 'samples': 2378304, 'steps': 12386, 'loss/train': 2.4455485343933105} -11/06/2021 22:57:38 - INFO - __main__ - Step 12388: {'lr': 0.0004939478943945706, 'samples': 2378496, 'steps': 12387, 'loss/train': 1.8239833116531372} -11/06/2021 22:57:39 - INFO - __main__ - Step 12389: {'lr': 0.0004939467337411903, 'samples': 2378688, 'steps': 12388, 'loss/train': 1.7355788946151733} -11/06/2021 22:57:39 - INFO - __main__ - Step 12390: {'lr': 0.0004939455729778912, 'samples': 2378880, 'steps': 12389, 'loss/train': 1.7384986877441406} -11/06/2021 22:57:40 - INFO - __main__ - Step 12391: {'lr': 0.0004939444121046741, 'samples': 2379072, 'steps': 12390, 'loss/train': 1.171319603919983} -11/06/2021 22:57:40 - INFO - __main__ - Step 12392: {'lr': 0.0004939432511215395, 'samples': 2379264, 'steps': 12391, 'loss/train': 1.6471529006958008} -11/06/2021 22:57:40 - INFO - __main__ - Step 12393: {'lr': 0.0004939420900284876, 'samples': 2379456, 'steps': 12392, 'loss/train': 1.4227564334869385} -11/06/2021 22:57:41 - INFO - __main__ - Step 12394: {'lr': 0.0004939409288255194, 'samples': 2379648, 'steps': 12393, 'loss/train': 1.9644057750701904} -11/06/2021 22:57:42 - INFO - __main__ - Step 12395: {'lr': 0.000493939767512635, 'samples': 2379840, 'steps': 12394, 'loss/train': 1.767325758934021} -11/06/2021 22:57:42 - INFO - __main__ - Step 12396: {'lr': 0.0004939386060898353, 'samples': 2380032, 'steps': 12395, 'loss/train': 2.075618267059326} -11/06/2021 22:57:42 - INFO - __main__ - Step 12397: {'lr': 0.0004939374445571206, 'samples': 2380224, 'steps': 12396, 'loss/train': 1.4473564624786377} -11/06/2021 22:57:43 - INFO - __main__ - Step 12398: {'lr': 0.0004939362829144913, 'samples': 2380416, 'steps': 12397, 'loss/train': 1.165976643562317} -11/06/2021 22:57:44 - INFO - __main__ - Step 12399: {'lr': 0.0004939351211619481, 'samples': 2380608, 'steps': 12398, 'loss/train': 2.2611637115478516} -11/06/2021 22:57:44 - INFO - __main__ - Step 12400: {'lr': 0.0004939339592994916, 'samples': 2380800, 'steps': 12399, 'loss/train': 2.222313165664673} -11/06/2021 22:57:45 - INFO - __main__ - Step 12401: {'lr': 0.0004939327973271222, 'samples': 2380992, 'steps': 12400, 'loss/train': 1.8177175521850586} -11/06/2021 22:57:45 - INFO - __main__ - Step 12402: {'lr': 0.0004939316352448403, 'samples': 2381184, 'steps': 12401, 'loss/train': 1.0791970491409302} -11/06/2021 22:57:45 - INFO - __main__ - Step 12403: {'lr': 0.0004939304730526467, 'samples': 2381376, 'steps': 12402, 'loss/train': 1.8736491203308105} -11/06/2021 22:57:46 - INFO - __main__ - Step 12404: {'lr': 0.0004939293107505418, 'samples': 2381568, 'steps': 12403, 'loss/train': 2.0087807178497314} -11/06/2021 22:57:47 - INFO - __main__ - Step 12405: {'lr': 0.0004939281483385261, 'samples': 2381760, 'steps': 12404, 'loss/train': 1.4684945344924927} -11/06/2021 22:57:47 - INFO - __main__ - Step 12406: {'lr': 0.0004939269858166001, 'samples': 2381952, 'steps': 12405, 'loss/train': 1.8479887247085571} -11/06/2021 22:57:47 - INFO - __main__ - Step 12407: {'lr': 0.0004939258231847644, 'samples': 2382144, 'steps': 12406, 'loss/train': 1.5185550451278687} -11/06/2021 22:57:48 - INFO - __main__ - Step 12408: {'lr': 0.0004939246604430195, 'samples': 2382336, 'steps': 12407, 'loss/train': 1.8069547414779663} -11/06/2021 22:57:48 - INFO - __main__ - Step 12409: {'lr': 0.0004939234975913659, 'samples': 2382528, 'steps': 12408, 'loss/train': 1.5137650966644287} -11/06/2021 22:57:49 - INFO - __main__ - Step 12410: {'lr': 0.0004939223346298042, 'samples': 2382720, 'steps': 12409, 'loss/train': 0.2782944142818451} -11/06/2021 22:57:50 - INFO - __main__ - Step 12411: {'lr': 0.0004939211715583347, 'samples': 2382912, 'steps': 12410, 'loss/train': 1.9376318454742432} -11/06/2021 22:57:50 - INFO - __main__ - Step 12412: {'lr': 0.0004939200083769582, 'samples': 2383104, 'steps': 12411, 'loss/train': 1.265969157218933} -11/06/2021 22:57:50 - INFO - __main__ - Step 12413: {'lr': 0.000493918845085675, 'samples': 2383296, 'steps': 12412, 'loss/train': 1.7577980756759644} -11/06/2021 22:57:51 - INFO - __main__ - Step 12414: {'lr': 0.000493917681684486, 'samples': 2383488, 'steps': 12413, 'loss/train': 0.3489714562892914} -11/06/2021 22:57:52 - INFO - __main__ - Step 12415: {'lr': 0.0004939165181733911, 'samples': 2383680, 'steps': 12414, 'loss/train': 1.9580268859863281} -11/06/2021 22:57:52 - INFO - __main__ - Step 12416: {'lr': 0.0004939153545523914, 'samples': 2383872, 'steps': 12415, 'loss/train': 1.4286139011383057} -11/06/2021 22:57:52 - INFO - __main__ - Step 12417: {'lr': 0.0004939141908214871, 'samples': 2384064, 'steps': 12416, 'loss/train': 1.9150186777114868} -11/06/2021 22:57:53 - INFO - __main__ - Step 12418: {'lr': 0.000493913026980679, 'samples': 2384256, 'steps': 12417, 'loss/train': 1.4130078554153442} -11/06/2021 22:57:53 - INFO - __main__ - Step 12419: {'lr': 0.0004939118630299672, 'samples': 2384448, 'steps': 12418, 'loss/train': 1.799317479133606} -11/06/2021 22:57:54 - INFO - __main__ - Step 12420: {'lr': 0.0004939106989693527, 'samples': 2384640, 'steps': 12419, 'loss/train': 2.154881477355957} -11/06/2021 22:57:55 - INFO - __main__ - Step 12421: {'lr': 0.0004939095347988357, 'samples': 2384832, 'steps': 12420, 'loss/train': 1.9314367771148682} -11/06/2021 22:57:55 - INFO - __main__ - Step 12422: {'lr': 0.0004939083705184169, 'samples': 2385024, 'steps': 12421, 'loss/train': 1.7732396125793457} -11/06/2021 22:57:55 - INFO - __main__ - Step 12423: {'lr': 0.0004939072061280967, 'samples': 2385216, 'steps': 12422, 'loss/train': 1.4663667678833008} -11/06/2021 22:57:56 - INFO - __main__ - Step 12424: {'lr': 0.0004939060416278756, 'samples': 2385408, 'steps': 12423, 'loss/train': 1.8774303197860718} -11/06/2021 22:57:57 - INFO - __main__ - Step 12425: {'lr': 0.0004939048770177543, 'samples': 2385600, 'steps': 12424, 'loss/train': 1.5539430379867554} -11/06/2021 22:57:57 - INFO - __main__ - Step 12426: {'lr': 0.0004939037122977332, 'samples': 2385792, 'steps': 12425, 'loss/train': 1.527437448501587} -11/06/2021 22:57:57 - INFO - __main__ - Step 12427: {'lr': 0.0004939025474678129, 'samples': 2385984, 'steps': 12426, 'loss/train': 1.8269412517547607} -11/06/2021 22:57:58 - INFO - __main__ - Step 12428: {'lr': 0.0004939013825279939, 'samples': 2386176, 'steps': 12427, 'loss/train': 1.5649765729904175} -11/06/2021 22:57:58 - INFO - __main__ - Step 12429: {'lr': 0.0004939002174782766, 'samples': 2386368, 'steps': 12428, 'loss/train': 0.8925514221191406} -11/06/2021 22:57:59 - INFO - __main__ - Step 12430: {'lr': 0.0004938990523186616, 'samples': 2386560, 'steps': 12429, 'loss/train': 0.6605421304702759} -11/06/2021 22:57:59 - INFO - __main__ - Step 12431: {'lr': 0.0004938978870491495, 'samples': 2386752, 'steps': 12430, 'loss/train': 1.8025730848312378} -11/06/2021 22:58:00 - INFO - __main__ - Step 12432: {'lr': 0.0004938967216697409, 'samples': 2386944, 'steps': 12431, 'loss/train': 1.7200829982757568} -11/06/2021 22:58:00 - INFO - __main__ - Step 12433: {'lr': 0.0004938955561804361, 'samples': 2387136, 'steps': 12432, 'loss/train': 1.6927978992462158} -11/06/2021 22:58:00 - INFO - __main__ - Step 12434: {'lr': 0.0004938943905812357, 'samples': 2387328, 'steps': 12433, 'loss/train': 1.6915475130081177} -11/06/2021 22:58:02 - INFO - __main__ - Step 12435: {'lr': 0.0004938932248721401, 'samples': 2387520, 'steps': 12434, 'loss/train': 1.565805196762085} -11/06/2021 22:58:02 - INFO - __main__ - Step 12436: {'lr': 0.0004938920590531503, 'samples': 2387712, 'steps': 12435, 'loss/train': 1.8280435800552368} -11/06/2021 22:58:02 - INFO - __main__ - Step 12437: {'lr': 0.0004938908931242663, 'samples': 2387904, 'steps': 12436, 'loss/train': 1.499329924583435} -11/06/2021 22:58:03 - INFO - __main__ - Step 12438: {'lr': 0.0004938897270854889, 'samples': 2388096, 'steps': 12437, 'loss/train': 0.8522184491157532} -11/06/2021 22:58:03 - INFO - __main__ - Step 12439: {'lr': 0.0004938885609368184, 'samples': 2388288, 'steps': 12438, 'loss/train': 1.0399724245071411} -11/06/2021 22:58:03 - INFO - __main__ - Step 12440: {'lr': 0.0004938873946782557, 'samples': 2388480, 'steps': 12439, 'loss/train': 1.3930256366729736} -11/06/2021 22:58:04 - INFO - __main__ - Step 12441: {'lr': 0.000493886228309801, 'samples': 2388672, 'steps': 12440, 'loss/train': 2.077786922454834} -11/06/2021 22:58:05 - INFO - __main__ - Step 12442: {'lr': 0.0004938850618314549, 'samples': 2388864, 'steps': 12441, 'loss/train': 1.7731544971466064} -11/06/2021 22:58:05 - INFO - __main__ - Step 12443: {'lr': 0.000493883895243218, 'samples': 2389056, 'steps': 12442, 'loss/train': 1.930917501449585} -11/06/2021 22:58:05 - INFO - __main__ - Step 12444: {'lr': 0.0004938827285450908, 'samples': 2389248, 'steps': 12443, 'loss/train': 1.6230531930923462} -11/06/2021 22:58:06 - INFO - __main__ - Step 12445: {'lr': 0.0004938815617370737, 'samples': 2389440, 'steps': 12444, 'loss/train': 1.7806710004806519} -11/06/2021 22:58:07 - INFO - __main__ - Step 12446: {'lr': 0.0004938803948191674, 'samples': 2389632, 'steps': 12445, 'loss/train': 1.8226611614227295} -11/06/2021 22:58:07 - INFO - __main__ - Step 12447: {'lr': 0.0004938792277913724, 'samples': 2389824, 'steps': 12446, 'loss/train': 1.6907552480697632} -11/06/2021 22:58:07 - INFO - __main__ - Step 12448: {'lr': 0.0004938780606536891, 'samples': 2390016, 'steps': 12447, 'loss/train': 1.9399850368499756} -11/06/2021 22:58:08 - INFO - __main__ - Step 12449: {'lr': 0.0004938768934061182, 'samples': 2390208, 'steps': 12448, 'loss/train': 1.9037350416183472} -11/06/2021 22:58:08 - INFO - __main__ - Step 12450: {'lr': 0.0004938757260486601, 'samples': 2390400, 'steps': 12449, 'loss/train': 1.6695767641067505} -11/06/2021 22:58:09 - INFO - __main__ - Step 12451: {'lr': 0.0004938745585813153, 'samples': 2390592, 'steps': 12450, 'loss/train': 1.9863166809082031} -11/06/2021 22:58:09 - INFO - __main__ - Step 12452: {'lr': 0.0004938733910040845, 'samples': 2390784, 'steps': 12451, 'loss/train': 1.697218418121338} -11/06/2021 22:58:10 - INFO - __main__ - Step 12453: {'lr': 0.000493872223316968, 'samples': 2390976, 'steps': 12452, 'loss/train': 1.4199427366256714} -11/06/2021 22:58:10 - INFO - __main__ - Step 12454: {'lr': 0.0004938710555199664, 'samples': 2391168, 'steps': 12453, 'loss/train': 1.2885547876358032} -11/06/2021 22:58:10 - INFO - __main__ - Step 12455: {'lr': 0.0004938698876130804, 'samples': 2391360, 'steps': 12454, 'loss/train': 1.8421812057495117} -11/06/2021 22:58:12 - INFO - __main__ - Step 12456: {'lr': 0.0004938687195963104, 'samples': 2391552, 'steps': 12455, 'loss/train': 1.8967642784118652} -11/06/2021 22:58:12 - INFO - __main__ - Step 12457: {'lr': 0.0004938675514696569, 'samples': 2391744, 'steps': 12456, 'loss/train': 0.5866230726242065} -11/06/2021 22:58:12 - INFO - __main__ - Step 12458: {'lr': 0.0004938663832331204, 'samples': 2391936, 'steps': 12457, 'loss/train': 1.3953553438186646} -11/06/2021 22:58:13 - INFO - __main__ - Step 12459: {'lr': 0.0004938652148867014, 'samples': 2392128, 'steps': 12458, 'loss/train': 0.3347637355327606} -11/06/2021 22:58:13 - INFO - __main__ - Step 12460: {'lr': 0.0004938640464304006, 'samples': 2392320, 'steps': 12459, 'loss/train': 1.7510279417037964} -11/06/2021 22:58:14 - INFO - __main__ - Step 12461: {'lr': 0.0004938628778642185, 'samples': 2392512, 'steps': 12460, 'loss/train': 1.7119464874267578} -11/06/2021 22:58:15 - INFO - __main__ - Step 12462: {'lr': 0.0004938617091881554, 'samples': 2392704, 'steps': 12461, 'loss/train': 1.8808752298355103} -11/06/2021 22:58:15 - INFO - __main__ - Step 12463: {'lr': 0.000493860540402212, 'samples': 2392896, 'steps': 12462, 'loss/train': 1.534140706062317} -11/06/2021 22:58:15 - INFO - __main__ - Step 12464: {'lr': 0.0004938593715063888, 'samples': 2393088, 'steps': 12463, 'loss/train': 1.430334448814392} -11/06/2021 22:58:16 - INFO - __main__ - Step 12465: {'lr': 0.0004938582025006864, 'samples': 2393280, 'steps': 12464, 'loss/train': 1.060693621635437} -11/06/2021 22:58:16 - INFO - __main__ - Step 12466: {'lr': 0.0004938570333851052, 'samples': 2393472, 'steps': 12465, 'loss/train': 1.7933906316757202} -11/06/2021 22:58:17 - INFO - __main__ - Step 12467: {'lr': 0.0004938558641596458, 'samples': 2393664, 'steps': 12466, 'loss/train': 0.8866246938705444} -11/06/2021 22:58:18 - INFO - __main__ - Step 12468: {'lr': 0.0004938546948243087, 'samples': 2393856, 'steps': 12467, 'loss/train': 1.1550602912902832} -11/06/2021 22:58:18 - INFO - __main__ - Step 12469: {'lr': 0.0004938535253790944, 'samples': 2394048, 'steps': 12468, 'loss/train': 1.569968342781067} -11/06/2021 22:58:18 - INFO - __main__ - Step 12470: {'lr': 0.0004938523558240035, 'samples': 2394240, 'steps': 12469, 'loss/train': 1.5518238544464111} -11/06/2021 22:58:19 - INFO - __main__ - Step 12471: {'lr': 0.0004938511861590365, 'samples': 2394432, 'steps': 12470, 'loss/train': 1.680008053779602} -11/06/2021 22:58:20 - INFO - __main__ - Step 12472: {'lr': 0.000493850016384194, 'samples': 2394624, 'steps': 12471, 'loss/train': 1.5120447874069214} -11/06/2021 22:58:20 - INFO - __main__ - Step 12473: {'lr': 0.0004938488464994764, 'samples': 2394816, 'steps': 12472, 'loss/train': 1.2448487281799316} -11/06/2021 22:58:20 - INFO - __main__ - Step 12474: {'lr': 0.0004938476765048842, 'samples': 2395008, 'steps': 12473, 'loss/train': 1.75505530834198} -11/06/2021 22:58:21 - INFO - __main__ - Step 12475: {'lr': 0.0004938465064004181, 'samples': 2395200, 'steps': 12474, 'loss/train': 1.4993715286254883} -11/06/2021 22:58:21 - INFO - __main__ - Step 12476: {'lr': 0.0004938453361860785, 'samples': 2395392, 'steps': 12475, 'loss/train': 1.6002764701843262} -11/06/2021 22:58:22 - INFO - __main__ - Step 12477: {'lr': 0.0004938441658618659, 'samples': 2395584, 'steps': 12476, 'loss/train': 1.6196297407150269} -11/06/2021 22:58:22 - INFO - __main__ - Step 12478: {'lr': 0.0004938429954277809, 'samples': 2395776, 'steps': 12477, 'loss/train': 1.990778923034668} -11/06/2021 22:58:23 - INFO - __main__ - Step 12479: {'lr': 0.000493841824883824, 'samples': 2395968, 'steps': 12478, 'loss/train': 1.7635631561279297} -11/06/2021 22:58:23 - INFO - __main__ - Step 12480: {'lr': 0.0004938406542299956, 'samples': 2396160, 'steps': 12479, 'loss/train': 1.3563812971115112} -11/06/2021 22:58:23 - INFO - __main__ - Step 12481: {'lr': 0.0004938394834662966, 'samples': 2396352, 'steps': 12480, 'loss/train': 0.9850826859474182} -11/06/2021 22:58:24 - INFO - __main__ - Step 12482: {'lr': 0.0004938383125927272, 'samples': 2396544, 'steps': 12481, 'loss/train': 1.9261223077774048} -11/06/2021 22:58:25 - INFO - __main__ - Step 12483: {'lr': 0.0004938371416092881, 'samples': 2396736, 'steps': 12482, 'loss/train': 1.8350012302398682} -11/06/2021 22:58:25 - INFO - __main__ - Step 12484: {'lr': 0.0004938359705159796, 'samples': 2396928, 'steps': 12483, 'loss/train': 1.5597666501998901} -11/06/2021 22:58:25 - INFO - __main__ - Step 12485: {'lr': 0.0004938347993128025, 'samples': 2397120, 'steps': 12484, 'loss/train': 1.588280439376831} -11/06/2021 22:58:26 - INFO - __main__ - Step 12486: {'lr': 0.0004938336279997571, 'samples': 2397312, 'steps': 12485, 'loss/train': 1.8706063032150269} -11/06/2021 22:58:27 - INFO - __main__ - Step 12487: {'lr': 0.0004938324565768441, 'samples': 2397504, 'steps': 12486, 'loss/train': 1.8012641668319702} -11/06/2021 22:58:27 - INFO - __main__ - Step 12488: {'lr': 0.0004938312850440639, 'samples': 2397696, 'steps': 12487, 'loss/train': 0.9766202569007874} -11/06/2021 22:58:28 - INFO - __main__ - Step 12489: {'lr': 0.0004938301134014172, 'samples': 2397888, 'steps': 12488, 'loss/train': 1.6374305486679077} -11/06/2021 22:58:28 - INFO - __main__ - Step 12490: {'lr': 0.0004938289416489042, 'samples': 2398080, 'steps': 12489, 'loss/train': 2.0924293994903564} -11/06/2021 22:58:28 - INFO - __main__ - Step 12491: {'lr': 0.0004938277697865259, 'samples': 2398272, 'steps': 12490, 'loss/train': 1.4682444334030151} -11/06/2021 22:58:29 - INFO - __main__ - Step 12492: {'lr': 0.0004938265978142824, 'samples': 2398464, 'steps': 12491, 'loss/train': 2.014890193939209} -11/06/2021 22:58:30 - INFO - __main__ - Step 12493: {'lr': 0.0004938254257321745, 'samples': 2398656, 'steps': 12492, 'loss/train': 1.3816254138946533} -11/06/2021 22:58:30 - INFO - __main__ - Step 12494: {'lr': 0.0004938242535402025, 'samples': 2398848, 'steps': 12493, 'loss/train': 1.4478893280029297} -11/06/2021 22:58:30 - INFO - __main__ - Step 12495: {'lr': 0.0004938230812383672, 'samples': 2399040, 'steps': 12494, 'loss/train': 4.631295680999756} -11/06/2021 22:58:31 - INFO - __main__ - Step 12496: {'lr': 0.0004938219088266688, 'samples': 2399232, 'steps': 12495, 'loss/train': 1.651924729347229} -11/06/2021 22:58:31 - INFO - __main__ - Step 12497: {'lr': 0.0004938207363051082, 'samples': 2399424, 'steps': 12496, 'loss/train': 1.7738444805145264} -11/06/2021 22:58:32 - INFO - __main__ - Step 12498: {'lr': 0.0004938195636736857, 'samples': 2399616, 'steps': 12497, 'loss/train': 1.413539171218872} -11/06/2021 22:58:33 - INFO - __main__ - Step 12499: {'lr': 0.0004938183909324017, 'samples': 2399808, 'steps': 12498, 'loss/train': 1.9373109340667725} -11/06/2021 22:58:33 - INFO - __main__ - Step 12500: {'lr': 0.0004938172180812571, 'samples': 2400000, 'steps': 12499, 'loss/train': 2.0888149738311768} -11/06/2021 22:58:34 - INFO - __main__ - Step 12501: {'lr': 0.000493816045120252, 'samples': 2400192, 'steps': 12500, 'loss/train': 1.6998056173324585} -11/06/2021 22:58:34 - INFO - __main__ - Step 12502: {'lr': 0.0004938148720493873, 'samples': 2400384, 'steps': 12501, 'loss/train': 1.5378485918045044} -11/06/2021 22:58:35 - INFO - __main__ - Step 12503: {'lr': 0.0004938136988686634, 'samples': 2400576, 'steps': 12502, 'loss/train': 0.36686891317367554} -11/06/2021 22:58:35 - INFO - __main__ - Step 12504: {'lr': 0.0004938125255780808, 'samples': 2400768, 'steps': 12503, 'loss/train': 1.6974081993103027} -11/06/2021 22:58:36 - INFO - __main__ - Step 12505: {'lr': 0.0004938113521776401, 'samples': 2400960, 'steps': 12504, 'loss/train': 1.7452573776245117} -11/06/2021 22:58:36 - INFO - __main__ - Step 12506: {'lr': 0.0004938101786673416, 'samples': 2401152, 'steps': 12505, 'loss/train': 1.861094355583191} -11/06/2021 22:58:36 - INFO - __main__ - Step 12507: {'lr': 0.0004938090050471861, 'samples': 2401344, 'steps': 12506, 'loss/train': 1.3893704414367676} -11/06/2021 22:58:37 - INFO - __main__ - Step 12508: {'lr': 0.000493807831317174, 'samples': 2401536, 'steps': 12507, 'loss/train': 1.7757277488708496} -11/06/2021 22:58:38 - INFO - __main__ - Step 12509: {'lr': 0.0004938066574773058, 'samples': 2401728, 'steps': 12508, 'loss/train': 2.139897346496582} -11/06/2021 22:58:38 - INFO - __main__ - Step 12510: {'lr': 0.0004938054835275822, 'samples': 2401920, 'steps': 12509, 'loss/train': 1.3797563314437866} -11/06/2021 22:58:38 - INFO - __main__ - Step 12511: {'lr': 0.0004938043094680036, 'samples': 2402112, 'steps': 12510, 'loss/train': 1.6733269691467285} -11/06/2021 22:58:39 - INFO - __main__ - Step 12512: {'lr': 0.0004938031352985704, 'samples': 2402304, 'steps': 12511, 'loss/train': 1.8873792886734009} -11/06/2021 22:58:40 - INFO - __main__ - Step 12513: {'lr': 0.0004938019610192835, 'samples': 2402496, 'steps': 12512, 'loss/train': 2.266671657562256} -11/06/2021 22:58:40 - INFO - __main__ - Step 12514: {'lr': 0.0004938007866301429, 'samples': 2402688, 'steps': 12513, 'loss/train': 1.8477656841278076} -11/06/2021 22:58:40 - INFO - __main__ - Step 12515: {'lr': 0.0004937996121311496, 'samples': 2402880, 'steps': 12514, 'loss/train': 1.2845678329467773} -11/06/2021 22:58:41 - INFO - __main__ - Step 12516: {'lr': 0.000493798437522304, 'samples': 2403072, 'steps': 12515, 'loss/train': 1.3590694665908813} -11/06/2021 22:58:41 - INFO - __main__ - Step 12517: {'lr': 0.0004937972628036065, 'samples': 2403264, 'steps': 12516, 'loss/train': 1.4171817302703857} -11/06/2021 22:58:42 - INFO - __main__ - Step 12518: {'lr': 0.0004937960879750578, 'samples': 2403456, 'steps': 12517, 'loss/train': 1.5596864223480225} -11/06/2021 22:58:43 - INFO - __main__ - Step 12519: {'lr': 0.0004937949130366582, 'samples': 2403648, 'steps': 12518, 'loss/train': 1.6341605186462402} -11/06/2021 22:58:43 - INFO - __main__ - Step 12520: {'lr': 0.0004937937379884085, 'samples': 2403840, 'steps': 12519, 'loss/train': 1.1687759160995483} -11/06/2021 22:58:43 - INFO - __main__ - Step 12521: {'lr': 0.0004937925628303091, 'samples': 2404032, 'steps': 12520, 'loss/train': 1.7421510219573975} -11/06/2021 22:58:44 - INFO - __main__ - Step 12522: {'lr': 0.0004937913875623605, 'samples': 2404224, 'steps': 12521, 'loss/train': 1.12235426902771} -11/06/2021 22:58:44 - INFO - __main__ - Step 12523: {'lr': 0.0004937902121845633, 'samples': 2404416, 'steps': 12522, 'loss/train': 1.6094740629196167} -11/06/2021 22:58:45 - INFO - __main__ - Step 12524: {'lr': 0.000493789036696918, 'samples': 2404608, 'steps': 12523, 'loss/train': 1.749121069908142} -11/06/2021 22:58:45 - INFO - __main__ - Step 12525: {'lr': 0.000493787861099425, 'samples': 2404800, 'steps': 12524, 'loss/train': 1.0136215686798096} -11/06/2021 22:58:46 - INFO - __main__ - Step 12526: {'lr': 0.0004937866853920851, 'samples': 2404992, 'steps': 12525, 'loss/train': 1.7210983037948608} -11/06/2021 22:58:46 - INFO - __main__ - Step 12527: {'lr': 0.0004937855095748985, 'samples': 2405184, 'steps': 12526, 'loss/train': 1.8808726072311401} -11/06/2021 22:58:46 - INFO - __main__ - Step 12528: {'lr': 0.0004937843336478661, 'samples': 2405376, 'steps': 12527, 'loss/train': 1.6538246870040894} -11/06/2021 22:58:48 - INFO - __main__ - Step 12529: {'lr': 0.0004937831576109881, 'samples': 2405568, 'steps': 12528, 'loss/train': 1.4507884979248047} -11/06/2021 22:58:48 - INFO - __main__ - Step 12530: {'lr': 0.0004937819814642653, 'samples': 2405760, 'steps': 12529, 'loss/train': 1.7369753122329712} -11/06/2021 22:58:49 - INFO - __main__ - Step 12531: {'lr': 0.000493780805207698, 'samples': 2405952, 'steps': 12530, 'loss/train': 1.33586585521698} -11/06/2021 22:58:49 - INFO - __main__ - Step 12532: {'lr': 0.000493779628841287, 'samples': 2406144, 'steps': 12531, 'loss/train': 2.222987413406372} -11/06/2021 22:58:49 - INFO - __main__ - Step 12533: {'lr': 0.0004937784523650324, 'samples': 2406336, 'steps': 12532, 'loss/train': 0.8576833605766296} -11/06/2021 22:58:50 - INFO - __main__ - Step 12534: {'lr': 0.0004937772757789352, 'samples': 2406528, 'steps': 12533, 'loss/train': 0.9707418084144592} -11/06/2021 22:58:51 - INFO - __main__ - Step 12535: {'lr': 0.0004937760990829956, 'samples': 2406720, 'steps': 12534, 'loss/train': 1.9520204067230225} -11/06/2021 22:58:51 - INFO - __main__ - Step 12536: {'lr': 0.0004937749222772143, 'samples': 2406912, 'steps': 12535, 'loss/train': 1.7065337896347046} -11/06/2021 22:58:51 - INFO - __main__ - Step 12537: {'lr': 0.0004937737453615918, 'samples': 2407104, 'steps': 12536, 'loss/train': 1.8596389293670654} -11/06/2021 22:58:52 - INFO - __main__ - Step 12538: {'lr': 0.0004937725683361286, 'samples': 2407296, 'steps': 12537, 'loss/train': 1.6391980648040771} -11/06/2021 22:58:52 - INFO - __main__ - Step 12539: {'lr': 0.0004937713912008252, 'samples': 2407488, 'steps': 12538, 'loss/train': 0.9928711652755737} -11/06/2021 22:58:53 - INFO - __main__ - Step 12540: {'lr': 0.0004937702139556822, 'samples': 2407680, 'steps': 12539, 'loss/train': 2.0436432361602783} -11/06/2021 22:58:54 - INFO - __main__ - Step 12541: {'lr': 0.0004937690366007, 'samples': 2407872, 'steps': 12540, 'loss/train': 1.766875982284546} -11/06/2021 22:58:54 - INFO - __main__ - Step 12542: {'lr': 0.0004937678591358794, 'samples': 2408064, 'steps': 12541, 'loss/train': 1.9210069179534912} -11/06/2021 22:58:54 - INFO - __main__ - Step 12543: {'lr': 0.0004937666815612207, 'samples': 2408256, 'steps': 12542, 'loss/train': 1.523587703704834} -11/06/2021 22:58:55 - INFO - __main__ - Step 12544: {'lr': 0.0004937655038767245, 'samples': 2408448, 'steps': 12543, 'loss/train': 1.4020729064941406} -11/06/2021 22:58:56 - INFO - __main__ - Step 12545: {'lr': 0.0004937643260823914, 'samples': 2408640, 'steps': 12544, 'loss/train': 1.2543262243270874} -11/06/2021 22:58:56 - INFO - __main__ - Step 12546: {'lr': 0.0004937631481782218, 'samples': 2408832, 'steps': 12545, 'loss/train': 1.850257396697998} -11/06/2021 22:58:56 - INFO - __main__ - Step 12547: {'lr': 0.0004937619701642162, 'samples': 2409024, 'steps': 12546, 'loss/train': 2.321528434753418} -11/06/2021 22:58:57 - INFO - __main__ - Step 12548: {'lr': 0.0004937607920403752, 'samples': 2409216, 'steps': 12547, 'loss/train': 2.2833588123321533} -11/06/2021 22:58:57 - INFO - __main__ - Step 12549: {'lr': 0.0004937596138066996, 'samples': 2409408, 'steps': 12548, 'loss/train': 1.803352952003479} -11/06/2021 22:58:58 - INFO - __main__ - Step 12550: {'lr': 0.0004937584354631894, 'samples': 2409600, 'steps': 12549, 'loss/train': 2.182974100112915} -11/06/2021 22:58:58 - INFO - __main__ - Step 12551: {'lr': 0.0004937572570098455, 'samples': 2409792, 'steps': 12550, 'loss/train': 1.5153863430023193} -11/06/2021 22:58:59 - INFO - __main__ - Step 12552: {'lr': 0.0004937560784466685, 'samples': 2409984, 'steps': 12551, 'loss/train': 1.986527681350708} -11/06/2021 22:58:59 - INFO - __main__ - Step 12553: {'lr': 0.0004937548997736586, 'samples': 2410176, 'steps': 12552, 'loss/train': 1.3949472904205322} -11/06/2021 22:58:59 - INFO - __main__ - Step 12554: {'lr': 0.0004937537209908165, 'samples': 2410368, 'steps': 12553, 'loss/train': 1.5035032033920288} -11/06/2021 22:59:00 - INFO - __main__ - Step 12555: {'lr': 0.0004937525420981428, 'samples': 2410560, 'steps': 12554, 'loss/train': 2.261537790298462} -11/06/2021 22:59:01 - INFO - __main__ - Step 12556: {'lr': 0.0004937513630956379, 'samples': 2410752, 'steps': 12555, 'loss/train': 3.3203577995300293} -11/06/2021 22:59:01 - INFO - __main__ - Step 12557: {'lr': 0.0004937501839833024, 'samples': 2410944, 'steps': 12556, 'loss/train': 1.5435712337493896} -11/06/2021 22:59:01 - INFO - __main__ - Step 12558: {'lr': 0.0004937490047611369, 'samples': 2411136, 'steps': 12557, 'loss/train': 1.9833227396011353} -11/06/2021 22:59:02 - INFO - __main__ - Step 12559: {'lr': 0.0004937478254291418, 'samples': 2411328, 'steps': 12558, 'loss/train': 1.6904947757720947} -11/06/2021 22:59:02 - INFO - __main__ - Step 12560: {'lr': 0.0004937466459873178, 'samples': 2411520, 'steps': 12559, 'loss/train': 1.6554052829742432} -11/06/2021 22:59:03 - INFO - __main__ - Step 12561: {'lr': 0.0004937454664356652, 'samples': 2411712, 'steps': 12560, 'loss/train': 1.7198843955993652} -11/06/2021 22:59:04 - INFO - __main__ - Step 12562: {'lr': 0.0004937442867741848, 'samples': 2411904, 'steps': 12561, 'loss/train': 1.9236637353897095} -11/06/2021 22:59:04 - INFO - __main__ - Step 12563: {'lr': 0.0004937431070028768, 'samples': 2412096, 'steps': 12562, 'loss/train': 1.9572961330413818} -11/06/2021 22:59:04 - INFO - __main__ - Step 12564: {'lr': 0.0004937419271217419, 'samples': 2412288, 'steps': 12563, 'loss/train': 5.857589244842529} -11/06/2021 22:59:05 - INFO - __main__ - Step 12565: {'lr': 0.0004937407471307807, 'samples': 2412480, 'steps': 12564, 'loss/train': 1.5907723903656006} -11/06/2021 22:59:05 - INFO - __main__ - Step 12566: {'lr': 0.0004937395670299938, 'samples': 2412672, 'steps': 12565, 'loss/train': 1.3296524286270142} -11/06/2021 22:59:06 - INFO - __main__ - Step 12567: {'lr': 0.0004937383868193815, 'samples': 2412864, 'steps': 12566, 'loss/train': 1.7416648864746094} -11/06/2021 22:59:06 - INFO - __main__ - Step 12568: {'lr': 0.0004937372064989445, 'samples': 2413056, 'steps': 12567, 'loss/train': 1.3068746328353882} -11/06/2021 22:59:07 - INFO - __main__ - Step 12569: {'lr': 0.0004937360260686833, 'samples': 2413248, 'steps': 12568, 'loss/train': 1.8562533855438232} -11/06/2021 22:59:07 - INFO - __main__ - Step 12570: {'lr': 0.0004937348455285983, 'samples': 2413440, 'steps': 12569, 'loss/train': 1.5558427572250366} -11/06/2021 22:59:08 - INFO - __main__ - Step 12571: {'lr': 0.0004937336648786903, 'samples': 2413632, 'steps': 12570, 'loss/train': 1.8795865774154663} -11/06/2021 22:59:08 - INFO - __main__ - Step 12572: {'lr': 0.0004937324841189595, 'samples': 2413824, 'steps': 12571, 'loss/train': 1.9527837038040161} -11/06/2021 22:59:09 - INFO - __main__ - Step 12573: {'lr': 0.0004937313032494068, 'samples': 2414016, 'steps': 12572, 'loss/train': 1.613889217376709} -11/06/2021 22:59:09 - INFO - __main__ - Step 12574: {'lr': 0.0004937301222700324, 'samples': 2414208, 'steps': 12573, 'loss/train': 1.2357040643692017} -11/06/2021 22:59:10 - INFO - __main__ - Step 12575: {'lr': 0.0004937289411808369, 'samples': 2414400, 'steps': 12574, 'loss/train': 2.0651497840881348} -11/06/2021 22:59:10 - INFO - __main__ - Step 12576: {'lr': 0.000493727759981821, 'samples': 2414592, 'steps': 12575, 'loss/train': 1.5525745153427124} -11/06/2021 22:59:11 - INFO - __main__ - Step 12577: {'lr': 0.0004937265786729851, 'samples': 2414784, 'steps': 12576, 'loss/train': 0.8309584856033325} -11/06/2021 22:59:11 - INFO - __main__ - Step 12578: {'lr': 0.0004937253972543298, 'samples': 2414976, 'steps': 12577, 'loss/train': 2.5759201049804688} -11/06/2021 22:59:12 - INFO - __main__ - Step 12579: {'lr': 0.0004937242157258555, 'samples': 2415168, 'steps': 12578, 'loss/train': 2.0868546962738037} -11/06/2021 22:59:12 - INFO - __main__ - Step 12580: {'lr': 0.000493723034087563, 'samples': 2415360, 'steps': 12579, 'loss/train': 0.8102706074714661} -11/06/2021 22:59:12 - INFO - __main__ - Step 12581: {'lr': 0.0004937218523394525, 'samples': 2415552, 'steps': 12580, 'loss/train': 1.7701175212860107} -11/06/2021 22:59:13 - INFO - __main__ - Step 12582: {'lr': 0.0004937206704815248, 'samples': 2415744, 'steps': 12581, 'loss/train': 1.8174623250961304} -11/06/2021 22:59:14 - INFO - __main__ - Step 12583: {'lr': 0.0004937194885137803, 'samples': 2415936, 'steps': 12582, 'loss/train': 1.7041975259780884} -11/06/2021 22:59:14 - INFO - __main__ - Step 12584: {'lr': 0.0004937183064362196, 'samples': 2416128, 'steps': 12583, 'loss/train': 1.7389198541641235} -11/06/2021 22:59:14 - INFO - __main__ - Step 12585: {'lr': 0.0004937171242488431, 'samples': 2416320, 'steps': 12584, 'loss/train': 2.084197521209717} -11/06/2021 22:59:15 - INFO - __main__ - Step 12586: {'lr': 0.0004937159419516515, 'samples': 2416512, 'steps': 12585, 'loss/train': 1.9468644857406616} -11/06/2021 22:59:15 - INFO - __main__ - Step 12587: {'lr': 0.0004937147595446452, 'samples': 2416704, 'steps': 12586, 'loss/train': 1.4281747341156006} -11/06/2021 22:59:16 - INFO - __main__ - Step 12588: {'lr': 0.0004937135770278248, 'samples': 2416896, 'steps': 12587, 'loss/train': 1.688107967376709} -11/06/2021 22:59:17 - INFO - __main__ - Step 12589: {'lr': 0.0004937123944011908, 'samples': 2417088, 'steps': 12588, 'loss/train': 1.6565439701080322} -11/06/2021 22:59:17 - INFO - __main__ - Step 12590: {'lr': 0.0004937112116647439, 'samples': 2417280, 'steps': 12589, 'loss/train': 1.904050588607788} -11/06/2021 22:59:17 - INFO - __main__ - Step 12591: {'lr': 0.0004937100288184843, 'samples': 2417472, 'steps': 12590, 'loss/train': 1.9118624925613403} -11/06/2021 22:59:18 - INFO - __main__ - Step 12592: {'lr': 0.0004937088458624128, 'samples': 2417664, 'steps': 12591, 'loss/train': 1.8203307390213013} -11/06/2021 22:59:19 - INFO - __main__ - Step 12593: {'lr': 0.0004937076627965299, 'samples': 2417856, 'steps': 12592, 'loss/train': 2.2025625705718994} -11/06/2021 22:59:19 - INFO - __main__ - Step 12594: {'lr': 0.000493706479620836, 'samples': 2418048, 'steps': 12593, 'loss/train': 1.668437123298645} -11/06/2021 22:59:19 - INFO - __main__ - Step 12595: {'lr': 0.0004937052963353318, 'samples': 2418240, 'steps': 12594, 'loss/train': 0.7377382516860962} -11/06/2021 22:59:20 - INFO - __main__ - Step 12596: {'lr': 0.0004937041129400177, 'samples': 2418432, 'steps': 12595, 'loss/train': 2.0309805870056152} -11/06/2021 22:59:20 - INFO - __main__ - Step 12597: {'lr': 0.0004937029294348943, 'samples': 2418624, 'steps': 12596, 'loss/train': 2.111126661300659} -11/06/2021 22:59:21 - INFO - __main__ - Step 12598: {'lr': 0.0004937017458199621, 'samples': 2418816, 'steps': 12597, 'loss/train': 1.5420552492141724} -11/06/2021 22:59:21 - INFO - __main__ - Step 12599: {'lr': 0.0004937005620952217, 'samples': 2419008, 'steps': 12598, 'loss/train': 1.6897568702697754} -11/06/2021 22:59:22 - INFO - __main__ - Step 12600: {'lr': 0.0004936993782606735, 'samples': 2419200, 'steps': 12599, 'loss/train': 2.092362880706787} -11/06/2021 22:59:22 - INFO - __main__ - Step 12601: {'lr': 0.0004936981943163182, 'samples': 2419392, 'steps': 12600, 'loss/train': 1.7093287706375122} -11/06/2021 22:59:22 - INFO - __main__ - Step 12602: {'lr': 0.0004936970102621563, 'samples': 2419584, 'steps': 12601, 'loss/train': 1.4950854778289795} -11/06/2021 22:59:23 - INFO - __main__ - Step 12603: {'lr': 0.0004936958260981883, 'samples': 2419776, 'steps': 12602, 'loss/train': 1.867283582687378} -11/06/2021 22:59:24 - INFO - __main__ - Step 12604: {'lr': 0.0004936946418244146, 'samples': 2419968, 'steps': 12603, 'loss/train': 1.928859829902649} -11/06/2021 22:59:24 - INFO - __main__ - Step 12605: {'lr': 0.000493693457440836, 'samples': 2420160, 'steps': 12604, 'loss/train': 2.0806899070739746} -11/06/2021 22:59:25 - INFO - __main__ - Step 12606: {'lr': 0.0004936922729474526, 'samples': 2420352, 'steps': 12605, 'loss/train': 1.991079330444336} -11/06/2021 22:59:25 - INFO - __main__ - Step 12607: {'lr': 0.0004936910883442655, 'samples': 2420544, 'steps': 12606, 'loss/train': 1.499205231666565} -11/06/2021 22:59:25 - INFO - __main__ - Step 12608: {'lr': 0.0004936899036312749, 'samples': 2420736, 'steps': 12607, 'loss/train': 1.6349520683288574} -11/06/2021 22:59:26 - INFO - __main__ - Step 12609: {'lr': 0.0004936887188084813, 'samples': 2420928, 'steps': 12608, 'loss/train': 1.5434484481811523} -11/06/2021 22:59:27 - INFO - __main__ - Step 12610: {'lr': 0.0004936875338758855, 'samples': 2421120, 'steps': 12609, 'loss/train': 1.8176034688949585} -11/06/2021 22:59:27 - INFO - __main__ - Step 12611: {'lr': 0.0004936863488334877, 'samples': 2421312, 'steps': 12610, 'loss/train': 1.5530451536178589} -11/06/2021 22:59:27 - INFO - __main__ - Step 12612: {'lr': 0.0004936851636812886, 'samples': 2421504, 'steps': 12611, 'loss/train': 1.6083686351776123} -11/06/2021 22:59:28 - INFO - __main__ - Step 12613: {'lr': 0.0004936839784192888, 'samples': 2421696, 'steps': 12612, 'loss/train': 1.6676959991455078} -11/06/2021 22:59:29 - INFO - __main__ - Step 12614: {'lr': 0.0004936827930474887, 'samples': 2421888, 'steps': 12613, 'loss/train': 1.6996138095855713} -11/06/2021 22:59:29 - INFO - __main__ - Step 12615: {'lr': 0.0004936816075658889, 'samples': 2422080, 'steps': 12614, 'loss/train': 1.4866139888763428} -11/06/2021 22:59:30 - INFO - __main__ - Step 12616: {'lr': 0.00049368042197449, 'samples': 2422272, 'steps': 12615, 'loss/train': 1.4212651252746582} -11/06/2021 22:59:30 - INFO - __main__ - Step 12617: {'lr': 0.0004936792362732924, 'samples': 2422464, 'steps': 12616, 'loss/train': 1.7673671245574951} -11/06/2021 22:59:30 - INFO - __main__ - Step 12618: {'lr': 0.0004936780504622967, 'samples': 2422656, 'steps': 12617, 'loss/train': 0.7368472218513489} -11/06/2021 22:59:31 - INFO - __main__ - Step 12619: {'lr': 0.0004936768645415033, 'samples': 2422848, 'steps': 12618, 'loss/train': 1.724778652191162} -11/06/2021 22:59:32 - INFO - __main__ - Step 12620: {'lr': 0.0004936756785109131, 'samples': 2423040, 'steps': 12619, 'loss/train': 2.020928382873535} -11/06/2021 22:59:32 - INFO - __main__ - Step 12621: {'lr': 0.0004936744923705263, 'samples': 2423232, 'steps': 12620, 'loss/train': 1.8747974634170532} -11/06/2021 22:59:32 - INFO - __main__ - Step 12622: {'lr': 0.0004936733061203435, 'samples': 2423424, 'steps': 12621, 'loss/train': 1.8702856302261353} -11/06/2021 22:59:33 - INFO - __main__ - Step 12623: {'lr': 0.0004936721197603653, 'samples': 2423616, 'steps': 12622, 'loss/train': 2.058539628982544} -11/06/2021 22:59:34 - INFO - __main__ - Step 12624: {'lr': 0.0004936709332905923, 'samples': 2423808, 'steps': 12623, 'loss/train': 1.5451576709747314} -11/06/2021 22:59:34 - INFO - __main__ - Step 12625: {'lr': 0.0004936697467110248, 'samples': 2424000, 'steps': 12624, 'loss/train': 1.5256503820419312} -11/06/2021 22:59:34 - INFO - __main__ - Step 12626: {'lr': 0.0004936685600216635, 'samples': 2424192, 'steps': 12625, 'loss/train': 1.8777118921279907} -11/06/2021 22:59:35 - INFO - __main__ - Step 12627: {'lr': 0.0004936673732225088, 'samples': 2424384, 'steps': 12626, 'loss/train': 1.737566590309143} -11/06/2021 22:59:35 - INFO - __main__ - Step 12628: {'lr': 0.0004936661863135615, 'samples': 2424576, 'steps': 12627, 'loss/train': 1.7391878366470337} -11/06/2021 22:59:35 - INFO - __main__ - Step 12629: {'lr': 0.000493664999294822, 'samples': 2424768, 'steps': 12628, 'loss/train': 1.8638137578964233} -11/06/2021 22:59:37 - INFO - __main__ - Step 12630: {'lr': 0.0004936638121662908, 'samples': 2424960, 'steps': 12629, 'loss/train': 0.9604647159576416} -11/06/2021 22:59:37 - INFO - __main__ - Step 12631: {'lr': 0.0004936626249279683, 'samples': 2425152, 'steps': 12630, 'loss/train': 1.9379112720489502} -11/06/2021 22:59:37 - INFO - __main__ - Step 12632: {'lr': 0.0004936614375798553, 'samples': 2425344, 'steps': 12631, 'loss/train': 0.7208963632583618} -11/06/2021 22:59:38 - INFO - __main__ - Step 12633: {'lr': 0.0004936602501219522, 'samples': 2425536, 'steps': 12632, 'loss/train': 1.7763961553573608} -11/06/2021 22:59:38 - INFO - __main__ - Step 12634: {'lr': 0.0004936590625542595, 'samples': 2425728, 'steps': 12633, 'loss/train': 1.4927427768707275} -11/06/2021 22:59:39 - INFO - __main__ - Step 12635: {'lr': 0.0004936578748767779, 'samples': 2425920, 'steps': 12634, 'loss/train': 1.5714725255966187} -11/06/2021 22:59:40 - INFO - __main__ - Step 12636: {'lr': 0.0004936566870895078, 'samples': 2426112, 'steps': 12635, 'loss/train': 1.6926263570785522} -11/06/2021 22:59:40 - INFO - __main__ - Step 12637: {'lr': 0.0004936554991924496, 'samples': 2426304, 'steps': 12636, 'loss/train': 0.9753442406654358} -11/06/2021 22:59:40 - INFO - __main__ - Step 12638: {'lr': 0.0004936543111856041, 'samples': 2426496, 'steps': 12637, 'loss/train': 1.6684590578079224} -11/06/2021 22:59:41 - INFO - __main__ - Step 12639: {'lr': 0.0004936531230689717, 'samples': 2426688, 'steps': 12638, 'loss/train': 1.6691287755966187} -11/06/2021 22:59:42 - INFO - __main__ - Step 12640: {'lr': 0.000493651934842553, 'samples': 2426880, 'steps': 12639, 'loss/train': 1.628665566444397} -11/06/2021 22:59:42 - INFO - __main__ - Step 12641: {'lr': 0.0004936507465063486, 'samples': 2427072, 'steps': 12640, 'loss/train': 1.266121745109558} -11/06/2021 22:59:42 - INFO - __main__ - Step 12642: {'lr': 0.0004936495580603588, 'samples': 2427264, 'steps': 12641, 'loss/train': 1.7384616136550903} -11/06/2021 22:59:43 - INFO - __main__ - Step 12643: {'lr': 0.0004936483695045842, 'samples': 2427456, 'steps': 12642, 'loss/train': 1.6067787408828735} -11/06/2021 22:59:43 - INFO - __main__ - Step 12644: {'lr': 0.0004936471808390254, 'samples': 2427648, 'steps': 12643, 'loss/train': 1.7227269411087036} -11/06/2021 22:59:44 - INFO - __main__ - Step 12645: {'lr': 0.0004936459920636832, 'samples': 2427840, 'steps': 12644, 'loss/train': 1.4939666986465454} -11/06/2021 22:59:44 - INFO - __main__ - Step 12646: {'lr': 0.0004936448031785576, 'samples': 2428032, 'steps': 12645, 'loss/train': 1.5351349115371704} -11/06/2021 22:59:45 - INFO - __main__ - Step 12647: {'lr': 0.0004936436141836496, 'samples': 2428224, 'steps': 12646, 'loss/train': 1.6882507801055908} -11/06/2021 22:59:45 - INFO - __main__ - Step 12648: {'lr': 0.0004936424250789594, 'samples': 2428416, 'steps': 12647, 'loss/train': 2.1467108726501465} -11/06/2021 22:59:45 - INFO - __main__ - Step 12649: {'lr': 0.0004936412358644878, 'samples': 2428608, 'steps': 12648, 'loss/train': 1.2412645816802979} -11/06/2021 22:59:47 - INFO - __main__ - Step 12650: {'lr': 0.0004936400465402351, 'samples': 2428800, 'steps': 12649, 'loss/train': 1.8610800504684448} -11/06/2021 22:59:47 - INFO - __main__ - Step 12651: {'lr': 0.0004936388571062021, 'samples': 2428992, 'steps': 12650, 'loss/train': 0.7149181365966797} -11/06/2021 22:59:47 - INFO - __main__ - Step 12652: {'lr': 0.0004936376675623892, 'samples': 2429184, 'steps': 12651, 'loss/train': 1.40529203414917} -11/06/2021 22:59:48 - INFO - __main__ - Step 12653: {'lr': 0.0004936364779087967, 'samples': 2429376, 'steps': 12652, 'loss/train': 1.6117287874221802} -11/06/2021 22:59:48 - INFO - __main__ - Step 12654: {'lr': 0.0004936352881454256, 'samples': 2429568, 'steps': 12653, 'loss/train': 1.6259452104568481} -11/06/2021 22:59:49 - INFO - __main__ - Step 12655: {'lr': 0.000493634098272276, 'samples': 2429760, 'steps': 12654, 'loss/train': 0.9939618706703186} -11/06/2021 22:59:49 - INFO - __main__ - Step 12656: {'lr': 0.0004936329082893488, 'samples': 2429952, 'steps': 12655, 'loss/train': 1.6605446338653564} -11/06/2021 22:59:50 - INFO - __main__ - Step 12657: {'lr': 0.0004936317181966443, 'samples': 2430144, 'steps': 12656, 'loss/train': 1.8564437627792358} -11/06/2021 22:59:50 - INFO - __main__ - Step 12658: {'lr': 0.000493630527994163, 'samples': 2430336, 'steps': 12657, 'loss/train': 1.9009116888046265} -11/06/2021 22:59:50 - INFO - __main__ - Step 12659: {'lr': 0.0004936293376819058, 'samples': 2430528, 'steps': 12658, 'loss/train': 1.7733248472213745} -11/06/2021 22:59:52 - INFO - __main__ - Step 12660: {'lr': 0.0004936281472598728, 'samples': 2430720, 'steps': 12659, 'loss/train': 1.9527031183242798} -11/06/2021 22:59:52 - INFO - __main__ - Step 12661: {'lr': 0.0004936269567280648, 'samples': 2430912, 'steps': 12660, 'loss/train': 1.9170464277267456} -11/06/2021 22:59:52 - INFO - __main__ - Step 12662: {'lr': 0.0004936257660864822, 'samples': 2431104, 'steps': 12661, 'loss/train': 1.2196903228759766} -11/06/2021 22:59:53 - INFO - __main__ - Step 12663: {'lr': 0.0004936245753351256, 'samples': 2431296, 'steps': 12662, 'loss/train': 1.9647890329360962} -11/06/2021 22:59:53 - INFO - __main__ - Step 12664: {'lr': 0.0004936233844739955, 'samples': 2431488, 'steps': 12663, 'loss/train': 1.9114571809768677} -11/06/2021 22:59:54 - INFO - __main__ - Step 12665: {'lr': 0.0004936221935030924, 'samples': 2431680, 'steps': 12664, 'loss/train': 1.2946553230285645} -11/06/2021 22:59:54 - INFO - __main__ - Step 12666: {'lr': 0.000493621002422417, 'samples': 2431872, 'steps': 12665, 'loss/train': 1.6806825399398804} -11/06/2021 22:59:55 - INFO - __main__ - Step 12667: {'lr': 0.0004936198112319698, 'samples': 2432064, 'steps': 12666, 'loss/train': 1.6497493982315063} -11/06/2021 22:59:55 - INFO - __main__ - Step 12668: {'lr': 0.0004936186199317511, 'samples': 2432256, 'steps': 12667, 'loss/train': 0.71175217628479} -11/06/2021 22:59:55 - INFO - __main__ - Step 12669: {'lr': 0.0004936174285217618, 'samples': 2432448, 'steps': 12668, 'loss/train': 2.324061393737793} -11/06/2021 22:59:56 - INFO - __main__ - Step 12670: {'lr': 0.0004936162370020021, 'samples': 2432640, 'steps': 12669, 'loss/train': 1.2230273485183716} -11/06/2021 22:59:57 - INFO - __main__ - Step 12671: {'lr': 0.0004936150453724727, 'samples': 2432832, 'steps': 12670, 'loss/train': 1.6716129779815674} -11/06/2021 22:59:57 - INFO - __main__ - Step 12672: {'lr': 0.0004936138536331742, 'samples': 2433024, 'steps': 12671, 'loss/train': 1.5442752838134766} -11/06/2021 22:59:58 - INFO - __main__ - Step 12673: {'lr': 0.000493612661784107, 'samples': 2433216, 'steps': 12672, 'loss/train': 1.818224310874939} -11/06/2021 22:59:58 - INFO - __main__ - Step 12674: {'lr': 0.0004936114698252717, 'samples': 2433408, 'steps': 12673, 'loss/train': 1.5145035982131958} -11/06/2021 22:59:58 - INFO - __main__ - Step 12675: {'lr': 0.0004936102777566688, 'samples': 2433600, 'steps': 12674, 'loss/train': 0.6831874847412109} -11/06/2021 22:59:59 - INFO - __main__ - Step 12676: {'lr': 0.0004936090855782989, 'samples': 2433792, 'steps': 12675, 'loss/train': 1.201375961303711} -11/06/2021 23:00:00 - INFO - __main__ - Step 12677: {'lr': 0.0004936078932901625, 'samples': 2433984, 'steps': 12676, 'loss/train': 1.8787459135055542} -11/06/2021 23:00:00 - INFO - __main__ - Step 12678: {'lr': 0.0004936067008922602, 'samples': 2434176, 'steps': 12677, 'loss/train': 2.3367536067962646} -11/06/2021 23:00:00 - INFO - __main__ - Step 12679: {'lr': 0.0004936055083845924, 'samples': 2434368, 'steps': 12678, 'loss/train': 1.7321808338165283} -11/06/2021 23:00:01 - INFO - __main__ - Step 12680: {'lr': 0.0004936043157671597, 'samples': 2434560, 'steps': 12679, 'loss/train': 1.1493476629257202} -11/06/2021 23:00:02 - INFO - __main__ - Step 12681: {'lr': 0.0004936031230399628, 'samples': 2434752, 'steps': 12680, 'loss/train': 1.7847900390625} -11/06/2021 23:00:02 - INFO - __main__ - Step 12682: {'lr': 0.000493601930203002, 'samples': 2434944, 'steps': 12681, 'loss/train': 1.8895950317382812} -11/06/2021 23:00:03 - INFO - __main__ - Step 12683: {'lr': 0.0004936007372562778, 'samples': 2435136, 'steps': 12682, 'loss/train': 1.703395128250122} -11/06/2021 23:00:03 - INFO - __main__ - Step 12684: {'lr': 0.0004935995441997911, 'samples': 2435328, 'steps': 12683, 'loss/train': 1.5084177255630493} -11/06/2021 23:00:03 - INFO - __main__ - Step 12685: {'lr': 0.000493598351033542, 'samples': 2435520, 'steps': 12684, 'loss/train': 1.2693252563476562} -11/06/2021 23:00:04 - INFO - __main__ - Step 12686: {'lr': 0.0004935971577575313, 'samples': 2435712, 'steps': 12685, 'loss/train': 1.772753357887268} -11/06/2021 23:00:05 - INFO - __main__ - Step 12687: {'lr': 0.0004935959643717595, 'samples': 2435904, 'steps': 12686, 'loss/train': 1.3232539892196655} -11/06/2021 23:00:05 - INFO - __main__ - Step 12688: {'lr': 0.0004935947708762272, 'samples': 2436096, 'steps': 12687, 'loss/train': 1.1217036247253418} -11/06/2021 23:00:05 - INFO - __main__ - Step 12689: {'lr': 0.0004935935772709348, 'samples': 2436288, 'steps': 12688, 'loss/train': 2.837244987487793} -11/06/2021 23:00:06 - INFO - __main__ - Step 12690: {'lr': 0.0004935923835558829, 'samples': 2436480, 'steps': 12689, 'loss/train': 1.7220159769058228} -11/06/2021 23:00:07 - INFO - __main__ - Step 12691: {'lr': 0.0004935911897310719, 'samples': 2436672, 'steps': 12690, 'loss/train': 1.8013556003570557} -11/06/2021 23:00:07 - INFO - __main__ - Step 12692: {'lr': 0.0004935899957965027, 'samples': 2436864, 'steps': 12691, 'loss/train': 1.6648582220077515} -11/06/2021 23:00:07 - INFO - __main__ - Step 12693: {'lr': 0.0004935888017521754, 'samples': 2437056, 'steps': 12692, 'loss/train': 2.0813040733337402} -11/06/2021 23:00:08 - INFO - __main__ - Step 12694: {'lr': 0.0004935876075980908, 'samples': 2437248, 'steps': 12693, 'loss/train': 1.7684749364852905} -11/06/2021 23:00:08 - INFO - __main__ - Step 12695: {'lr': 0.0004935864133342495, 'samples': 2437440, 'steps': 12694, 'loss/train': 1.6431411504745483} -11/06/2021 23:00:09 - INFO - __main__ - Step 12696: {'lr': 0.0004935852189606517, 'samples': 2437632, 'steps': 12695, 'loss/train': 1.6132627725601196} -11/06/2021 23:00:09 - INFO - __main__ - Step 12697: {'lr': 0.0004935840244772984, 'samples': 2437824, 'steps': 12696, 'loss/train': 1.5991240739822388} -11/06/2021 23:00:10 - INFO - __main__ - Step 12698: {'lr': 0.0004935828298841898, 'samples': 2438016, 'steps': 12697, 'loss/train': 1.5647183656692505} -11/06/2021 23:00:10 - INFO - __main__ - Step 12699: {'lr': 0.0004935816351813265, 'samples': 2438208, 'steps': 12698, 'loss/train': 1.92881441116333} -11/06/2021 23:00:11 - INFO - __main__ - Step 12700: {'lr': 0.0004935804403687091, 'samples': 2438400, 'steps': 12699, 'loss/train': 1.8408360481262207} -11/06/2021 23:00:11 - INFO - __main__ - Step 12701: {'lr': 0.0004935792454463381, 'samples': 2438592, 'steps': 12700, 'loss/train': 1.49015212059021} -11/06/2021 23:00:12 - INFO - __main__ - Step 12702: {'lr': 0.000493578050414214, 'samples': 2438784, 'steps': 12701, 'loss/train': 1.8693770170211792} -11/06/2021 23:00:12 - INFO - __main__ - Step 12703: {'lr': 0.0004935768552723375, 'samples': 2438976, 'steps': 12702, 'loss/train': 1.6412677764892578} -11/06/2021 23:00:13 - INFO - __main__ - Step 12704: {'lr': 0.000493575660020709, 'samples': 2439168, 'steps': 12703, 'loss/train': 1.6965235471725464} -11/06/2021 23:00:13 - INFO - __main__ - Step 12705: {'lr': 0.000493574464659329, 'samples': 2439360, 'steps': 12704, 'loss/train': 1.4000598192214966} -11/06/2021 23:00:13 - INFO - __main__ - Step 12706: {'lr': 0.0004935732691881981, 'samples': 2439552, 'steps': 12705, 'loss/train': 1.8921767473220825} -11/06/2021 23:00:14 - INFO - __main__ - Step 12707: {'lr': 0.0004935720736073169, 'samples': 2439744, 'steps': 12706, 'loss/train': 1.973684310913086} -11/06/2021 23:00:15 - INFO - __main__ - Step 12708: {'lr': 0.0004935708779166859, 'samples': 2439936, 'steps': 12707, 'loss/train': 1.2805671691894531} -11/06/2021 23:00:15 - INFO - __main__ - Step 12709: {'lr': 0.0004935696821163056, 'samples': 2440128, 'steps': 12708, 'loss/train': 1.9279905557632446} -11/06/2021 23:00:15 - INFO - __main__ - Step 12710: {'lr': 0.0004935684862061766, 'samples': 2440320, 'steps': 12709, 'loss/train': 1.654013991355896} -11/06/2021 23:00:16 - INFO - __main__ - Step 12711: {'lr': 0.0004935672901862993, 'samples': 2440512, 'steps': 12710, 'loss/train': 1.4374395608901978} -11/06/2021 23:00:17 - INFO - __main__ - Step 12712: {'lr': 0.0004935660940566744, 'samples': 2440704, 'steps': 12711, 'loss/train': 1.640486240386963} -11/06/2021 23:00:17 - INFO - __main__ - Step 12713: {'lr': 0.0004935648978173024, 'samples': 2440896, 'steps': 12712, 'loss/train': 1.7238794565200806} -11/06/2021 23:00:17 - INFO - __main__ - Step 12714: {'lr': 0.0004935637014681837, 'samples': 2441088, 'steps': 12713, 'loss/train': 1.8015981912612915} -11/06/2021 23:00:18 - INFO - __main__ - Step 12715: {'lr': 0.0004935625050093191, 'samples': 2441280, 'steps': 12714, 'loss/train': 1.7736315727233887} -11/06/2021 23:00:18 - INFO - __main__ - Step 12716: {'lr': 0.000493561308440709, 'samples': 2441472, 'steps': 12715, 'loss/train': 1.336901068687439} -11/06/2021 23:00:19 - INFO - __main__ - Step 12717: {'lr': 0.0004935601117623538, 'samples': 2441664, 'steps': 12716, 'loss/train': 1.488775610923767} -11/06/2021 23:00:19 - INFO - __main__ - Step 12718: {'lr': 0.0004935589149742542, 'samples': 2441856, 'steps': 12717, 'loss/train': 2.1799232959747314} -11/06/2021 23:00:20 - INFO - __main__ - Step 12719: {'lr': 0.0004935577180764108, 'samples': 2442048, 'steps': 12718, 'loss/train': 1.3624755144119263} -11/06/2021 23:00:20 - INFO - __main__ - Step 12720: {'lr': 0.000493556521068824, 'samples': 2442240, 'steps': 12719, 'loss/train': 1.883273720741272} -11/06/2021 23:00:21 - INFO - __main__ - Step 12721: {'lr': 0.0004935553239514943, 'samples': 2442432, 'steps': 12720, 'loss/train': 1.8159416913986206} -11/06/2021 23:00:22 - INFO - __main__ - Step 12722: {'lr': 0.0004935541267244225, 'samples': 2442624, 'steps': 12721, 'loss/train': 1.7805633544921875} -11/06/2021 23:00:22 - INFO - __main__ - Step 12723: {'lr': 0.0004935529293876088, 'samples': 2442816, 'steps': 12722, 'loss/train': 1.8284835815429688} -11/06/2021 23:00:22 - INFO - __main__ - Step 12724: {'lr': 0.000493551731941054, 'samples': 2443008, 'steps': 12723, 'loss/train': 1.8245835304260254} -11/06/2021 23:00:23 - INFO - __main__ - Step 12725: {'lr': 0.0004935505343847586, 'samples': 2443200, 'steps': 12724, 'loss/train': 1.665300965309143} -11/06/2021 23:00:23 - INFO - __main__ - Step 12726: {'lr': 0.000493549336718723, 'samples': 2443392, 'steps': 12725, 'loss/train': 1.5313256978988647} -11/06/2021 23:00:23 - INFO - __main__ - Step 12727: {'lr': 0.0004935481389429479, 'samples': 2443584, 'steps': 12726, 'loss/train': 1.2466456890106201} -11/06/2021 23:00:24 - INFO - __main__ - Step 12728: {'lr': 0.0004935469410574337, 'samples': 2443776, 'steps': 12727, 'loss/train': 1.5720294713974} -11/06/2021 23:00:25 - INFO - __main__ - Step 12729: {'lr': 0.000493545743062181, 'samples': 2443968, 'steps': 12728, 'loss/train': 1.831040382385254} -11/06/2021 23:00:25 - INFO - __main__ - Step 12730: {'lr': 0.0004935445449571903, 'samples': 2444160, 'steps': 12729, 'loss/train': 1.5608617067337036} -11/06/2021 23:00:26 - INFO - __main__ - Step 12731: {'lr': 0.0004935433467424624, 'samples': 2444352, 'steps': 12730, 'loss/train': 1.843248963356018} -11/06/2021 23:00:26 - INFO - __main__ - Step 12732: {'lr': 0.0004935421484179974, 'samples': 2444544, 'steps': 12731, 'loss/train': 1.858343243598938} -11/06/2021 23:00:27 - INFO - __main__ - Step 12733: {'lr': 0.0004935409499837962, 'samples': 2444736, 'steps': 12732, 'loss/train': 2.449708938598633} -11/06/2021 23:00:27 - INFO - __main__ - Step 12734: {'lr': 0.0004935397514398591, 'samples': 2444928, 'steps': 12733, 'loss/train': 1.2555254697799683} -11/06/2021 23:00:27 - INFO - __main__ - Step 12735: {'lr': 0.0004935385527861869, 'samples': 2445120, 'steps': 12734, 'loss/train': 1.8298964500427246} -11/06/2021 23:00:28 - INFO - __main__ - Step 12736: {'lr': 0.0004935373540227798, 'samples': 2445312, 'steps': 12735, 'loss/train': 1.8937606811523438} -11/06/2021 23:00:28 - INFO - __main__ - Step 12737: {'lr': 0.0004935361551496387, 'samples': 2445504, 'steps': 12736, 'loss/train': 1.5406252145767212} -11/06/2021 23:00:29 - INFO - __main__ - Step 12738: {'lr': 0.0004935349561667638, 'samples': 2445696, 'steps': 12737, 'loss/train': 1.3331429958343506} -11/06/2021 23:00:30 - INFO - __main__ - Step 12739: {'lr': 0.000493533757074156, 'samples': 2445888, 'steps': 12738, 'loss/train': 1.462608814239502} -11/06/2021 23:00:30 - INFO - __main__ - Step 12740: {'lr': 0.0004935325578718155, 'samples': 2446080, 'steps': 12739, 'loss/train': 1.7719459533691406} -11/06/2021 23:00:30 - INFO - __main__ - Step 12741: {'lr': 0.000493531358559743, 'samples': 2446272, 'steps': 12740, 'loss/train': 1.849948525428772} -11/06/2021 23:00:31 - INFO - __main__ - Step 12742: {'lr': 0.0004935301591379391, 'samples': 2446464, 'steps': 12741, 'loss/train': 2.125699520111084} -11/06/2021 23:00:32 - INFO - __main__ - Step 12743: {'lr': 0.0004935289596064042, 'samples': 2446656, 'steps': 12742, 'loss/train': 1.4492217302322388} -11/06/2021 23:00:32 - INFO - __main__ - Step 12744: {'lr': 0.0004935277599651389, 'samples': 2446848, 'steps': 12743, 'loss/train': 1.4659162759780884} -11/06/2021 23:00:32 - INFO - __main__ - Step 12745: {'lr': 0.0004935265602141437, 'samples': 2447040, 'steps': 12744, 'loss/train': 2.072901964187622} -11/06/2021 23:00:33 - INFO - __main__ - Step 12746: {'lr': 0.0004935253603534193, 'samples': 2447232, 'steps': 12745, 'loss/train': 1.745668649673462} -11/06/2021 23:00:33 - INFO - __main__ - Step 12747: {'lr': 0.0004935241603829661, 'samples': 2447424, 'steps': 12746, 'loss/train': 1.9850726127624512} -11/06/2021 23:00:34 - INFO - __main__ - Step 12748: {'lr': 0.0004935229603027847, 'samples': 2447616, 'steps': 12747, 'loss/train': 1.3477630615234375} -11/06/2021 23:00:34 - INFO - __main__ - Step 12749: {'lr': 0.0004935217601128755, 'samples': 2447808, 'steps': 12748, 'loss/train': 1.7236028909683228} -11/06/2021 23:00:35 - INFO - __main__ - Step 12750: {'lr': 0.0004935205598132393, 'samples': 2448000, 'steps': 12749, 'loss/train': 1.637121319770813} -11/06/2021 23:00:35 - INFO - __main__ - Step 12751: {'lr': 0.0004935193594038764, 'samples': 2448192, 'steps': 12750, 'loss/train': 1.4060014486312866} -11/06/2021 23:00:35 - INFO - __main__ - Step 12752: {'lr': 0.0004935181588847876, 'samples': 2448384, 'steps': 12751, 'loss/train': 1.7447482347488403} -11/06/2021 23:00:36 - INFO - __main__ - Step 12753: {'lr': 0.0004935169582559731, 'samples': 2448576, 'steps': 12752, 'loss/train': 2.0324788093566895} -11/06/2021 23:00:37 - INFO - __main__ - Step 12754: {'lr': 0.0004935157575174336, 'samples': 2448768, 'steps': 12753, 'loss/train': 1.7007369995117188} -11/06/2021 23:00:37 - INFO - __main__ - Step 12755: {'lr': 0.0004935145566691698, 'samples': 2448960, 'steps': 12754, 'loss/train': 1.9936100244522095} -11/06/2021 23:00:37 - INFO - __main__ - Step 12756: {'lr': 0.000493513355711182, 'samples': 2449152, 'steps': 12755, 'loss/train': 1.6351784467697144} -11/06/2021 23:00:38 - INFO - __main__ - Step 12757: {'lr': 0.0004935121546434708, 'samples': 2449344, 'steps': 12756, 'loss/train': 1.7019697427749634} -11/06/2021 23:00:39 - INFO - __main__ - Step 12758: {'lr': 0.0004935109534660368, 'samples': 2449536, 'steps': 12757, 'loss/train': 1.8127813339233398} -11/06/2021 23:00:39 - INFO - __main__ - Step 12759: {'lr': 0.0004935097521788805, 'samples': 2449728, 'steps': 12758, 'loss/train': 0.67855304479599} -11/06/2021 23:00:40 - INFO - __main__ - Step 12760: {'lr': 0.0004935085507820026, 'samples': 2449920, 'steps': 12759, 'loss/train': 2.1449859142303467} -11/06/2021 23:00:40 - INFO - __main__ - Step 12761: {'lr': 0.0004935073492754034, 'samples': 2450112, 'steps': 12760, 'loss/train': 1.3522168397903442} -11/06/2021 23:00:40 - INFO - __main__ - Step 12762: {'lr': 0.0004935061476590835, 'samples': 2450304, 'steps': 12761, 'loss/train': 0.9896982908248901} -11/06/2021 23:00:41 - INFO - __main__ - Step 12763: {'lr': 0.0004935049459330437, 'samples': 2450496, 'steps': 12762, 'loss/train': 1.8502204418182373} -11/06/2021 23:00:42 - INFO - __main__ - Step 12764: {'lr': 0.0004935037440972841, 'samples': 2450688, 'steps': 12763, 'loss/train': 2.6931633949279785} -11/06/2021 23:00:42 - INFO - __main__ - Step 12765: {'lr': 0.0004935025421518056, 'samples': 2450880, 'steps': 12764, 'loss/train': 1.5279968976974487} -11/06/2021 23:00:42 - INFO - __main__ - Step 12766: {'lr': 0.0004935013400966086, 'samples': 2451072, 'steps': 12765, 'loss/train': 1.7780354022979736} -11/06/2021 23:00:43 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.5596141815185547} -11/06/2021 23:00:43 - INFO - __main__ - Step 12768: {'lr': 0.0004934989356570611, 'samples': 2451456, 'steps': 12767, 'loss/train': 1.7943576574325562} -11/06/2021 23:00:44 - INFO - __main__ - Step 12769: {'lr': 0.0004934977332727118, 'samples': 2451648, 'steps': 12768, 'loss/train': 1.703242301940918} -11/06/2021 23:00:44 - INFO - __main__ - Step 12770: {'lr': 0.0004934965307786464, 'samples': 2451840, 'steps': 12769, 'loss/train': 1.6350740194320679} -11/06/2021 23:00:45 - INFO - __main__ - Step 12771: {'lr': 0.0004934953281748649, 'samples': 2452032, 'steps': 12770, 'loss/train': 1.350691318511963} -11/06/2021 23:00:45 - INFO - __main__ - Step 12772: {'lr': 0.0004934941254613684, 'samples': 2452224, 'steps': 12771, 'loss/train': 1.6434681415557861} -11/06/2021 23:00:45 - INFO - __main__ - Step 12773: {'lr': 0.0004934929226381572, 'samples': 2452416, 'steps': 12772, 'loss/train': 1.567505121231079} -11/06/2021 23:00:47 - INFO - __main__ - Step 12774: {'lr': 0.0004934917197052317, 'samples': 2452608, 'steps': 12773, 'loss/train': 1.6525659561157227} -11/06/2021 23:00:47 - INFO - __main__ - Step 12775: {'lr': 0.0004934905166625926, 'samples': 2452800, 'steps': 12774, 'loss/train': 1.8389402627944946} -11/06/2021 23:00:48 - INFO - __main__ - Step 12776: {'lr': 0.0004934893135102405, 'samples': 2452992, 'steps': 12775, 'loss/train': 0.4809941351413727} -11/06/2021 23:00:48 - INFO - __main__ - Step 12777: {'lr': 0.0004934881102481759, 'samples': 2453184, 'steps': 12776, 'loss/train': 1.6852707862854004} -11/06/2021 23:00:48 - INFO - __main__ - Step 12778: {'lr': 0.0004934869068763992, 'samples': 2453376, 'steps': 12777, 'loss/train': 1.8732150793075562} -11/06/2021 23:00:49 - INFO - __main__ - Step 12779: {'lr': 0.0004934857033949112, 'samples': 2453568, 'steps': 12778, 'loss/train': 1.4058620929718018} -11/06/2021 23:00:49 - INFO - __main__ - Step 12780: {'lr': 0.0004934844998037122, 'samples': 2453760, 'steps': 12779, 'loss/train': 1.6926714181900024} -11/06/2021 23:00:50 - INFO - __main__ - Step 12781: {'lr': 0.0004934832961028028, 'samples': 2453952, 'steps': 12780, 'loss/train': 1.8323222398757935} -11/06/2021 23:00:50 - INFO - __main__ - Step 12782: {'lr': 0.0004934820922921836, 'samples': 2454144, 'steps': 12781, 'loss/train': 1.9833849668502808} -11/06/2021 23:00:51 - INFO - __main__ - Step 12783: {'lr': 0.0004934808883718553, 'samples': 2454336, 'steps': 12782, 'loss/train': 1.3475416898727417} -11/06/2021 23:00:52 - INFO - __main__ - Step 12784: {'lr': 0.0004934796843418181, 'samples': 2454528, 'steps': 12783, 'loss/train': 1.8701623678207397} -11/06/2021 23:00:52 - INFO - __main__ - Step 12785: {'lr': 0.0004934784802020728, 'samples': 2454720, 'steps': 12784, 'loss/train': 1.69837486743927} -11/06/2021 23:00:52 - INFO - __main__ - Step 12786: {'lr': 0.0004934772759526198, 'samples': 2454912, 'steps': 12785, 'loss/train': 1.8089841604232788} -11/06/2021 23:00:53 - INFO - __main__ - Step 12787: {'lr': 0.0004934760715934597, 'samples': 2455104, 'steps': 12786, 'loss/train': 1.5334937572479248} -11/06/2021 23:00:53 - INFO - __main__ - Step 12788: {'lr': 0.0004934748671245931, 'samples': 2455296, 'steps': 12787, 'loss/train': 1.691651463508606} -11/06/2021 23:00:54 - INFO - __main__ - Step 12789: {'lr': 0.0004934736625460203, 'samples': 2455488, 'steps': 12788, 'loss/train': 1.8990588188171387} -11/06/2021 23:00:54 - INFO - __main__ - Step 12790: {'lr': 0.0004934724578577422, 'samples': 2455680, 'steps': 12789, 'loss/train': 1.2063190937042236} -11/06/2021 23:00:55 - INFO - __main__ - Step 12791: {'lr': 0.0004934712530597591, 'samples': 2455872, 'steps': 12790, 'loss/train': 1.6075855493545532} -11/06/2021 23:00:55 - INFO - __main__ - Step 12792: {'lr': 0.0004934700481520717, 'samples': 2456064, 'steps': 12791, 'loss/train': 1.9511923789978027} -11/06/2021 23:00:55 - INFO - __main__ - Step 12793: {'lr': 0.0004934688431346804, 'samples': 2456256, 'steps': 12792, 'loss/train': 1.5929433107376099} -11/06/2021 23:00:56 - INFO - __main__ - Step 12794: {'lr': 0.0004934676380075857, 'samples': 2456448, 'steps': 12793, 'loss/train': 1.243303894996643} -11/06/2021 23:00:57 - INFO - __main__ - Step 12795: {'lr': 0.0004934664327707884, 'samples': 2456640, 'steps': 12794, 'loss/train': 2.0900375843048096} -11/06/2021 23:00:57 - INFO - __main__ - Step 12796: {'lr': 0.0004934652274242888, 'samples': 2456832, 'steps': 12795, 'loss/train': 1.7989342212677002} -11/06/2021 23:00:58 - INFO - __main__ - Step 12797: {'lr': 0.0004934640219680875, 'samples': 2457024, 'steps': 12796, 'loss/train': 0.9342484474182129} -11/06/2021 23:00:58 - INFO - __main__ - Step 12798: {'lr': 0.0004934628164021851, 'samples': 2457216, 'steps': 12797, 'loss/train': 0.24721074104309082} -11/06/2021 23:00:59 - INFO - __main__ - Step 12799: {'lr': 0.0004934616107265821, 'samples': 2457408, 'steps': 12798, 'loss/train': 2.198434591293335} -11/06/2021 23:00:59 - INFO - __main__ - Step 12800: {'lr': 0.0004934604049412791, 'samples': 2457600, 'steps': 12799, 'loss/train': 1.550801157951355} -11/06/2021 23:01:00 - INFO - __main__ - Step 12801: {'lr': 0.0004934591990462766, 'samples': 2457792, 'steps': 12800, 'loss/train': 1.3108569383621216} -11/06/2021 23:01:00 - INFO - __main__ - Step 12802: {'lr': 0.0004934579930415751, 'samples': 2457984, 'steps': 12801, 'loss/train': 1.9333668947219849} -11/06/2021 23:01:00 - INFO - __main__ - Step 12803: {'lr': 0.0004934567869271751, 'samples': 2458176, 'steps': 12802, 'loss/train': 1.9801455736160278} -11/06/2021 23:01:01 - INFO - __main__ - Step 12804: {'lr': 0.0004934555807030774, 'samples': 2458368, 'steps': 12803, 'loss/train': 1.053701400756836} -11/06/2021 23:01:02 - INFO - __main__ - Step 12805: {'lr': 0.0004934543743692822, 'samples': 2458560, 'steps': 12804, 'loss/train': 1.4716850519180298} -11/06/2021 23:01:02 - INFO - __main__ - Step 12806: {'lr': 0.0004934531679257903, 'samples': 2458752, 'steps': 12805, 'loss/train': 1.5304038524627686} -11/06/2021 23:01:03 - INFO - __main__ - Step 12807: {'lr': 0.0004934519613726022, 'samples': 2458944, 'steps': 12806, 'loss/train': 1.6712217330932617} -11/06/2021 23:01:03 - INFO - __main__ - Step 12808: {'lr': 0.0004934507547097183, 'samples': 2459136, 'steps': 12807, 'loss/train': 1.6593072414398193} -11/06/2021 23:01:03 - INFO - __main__ - Step 12809: {'lr': 0.0004934495479371393, 'samples': 2459328, 'steps': 12808, 'loss/train': 4.7572102546691895} -11/06/2021 23:01:04 - INFO - __main__ - Step 12810: {'lr': 0.0004934483410548658, 'samples': 2459520, 'steps': 12809, 'loss/train': 0.9556400775909424} -11/06/2021 23:01:05 - INFO - __main__ - Step 12811: {'lr': 0.0004934471340628981, 'samples': 2459712, 'steps': 12810, 'loss/train': 0.8056848049163818} -11/06/2021 23:01:05 - INFO - __main__ - Step 12812: {'lr': 0.000493445926961237, 'samples': 2459904, 'steps': 12811, 'loss/train': 1.6957072019577026} -11/06/2021 23:01:05 - INFO - __main__ - Step 12813: {'lr': 0.0004934447197498828, 'samples': 2460096, 'steps': 12812, 'loss/train': 1.9989805221557617} -11/06/2021 23:01:06 - INFO - __main__ - Step 12814: {'lr': 0.0004934435124288362, 'samples': 2460288, 'steps': 12813, 'loss/train': 2.132337808609009} -11/06/2021 23:01:07 - INFO - __main__ - Step 12815: {'lr': 0.0004934423049980977, 'samples': 2460480, 'steps': 12814, 'loss/train': 1.7412266731262207} -11/06/2021 23:01:07 - INFO - __main__ - Step 12816: {'lr': 0.0004934410974576679, 'samples': 2460672, 'steps': 12815, 'loss/train': 1.9368259906768799} -11/06/2021 23:01:07 - INFO - __main__ - Step 12817: {'lr': 0.0004934398898075472, 'samples': 2460864, 'steps': 12816, 'loss/train': 1.8307538032531738} -11/06/2021 23:01:08 - INFO - __main__ - Step 12818: {'lr': 0.0004934386820477363, 'samples': 2461056, 'steps': 12817, 'loss/train': 1.4713562726974487} -11/06/2021 23:01:08 - INFO - __main__ - Step 12819: {'lr': 0.0004934374741782357, 'samples': 2461248, 'steps': 12818, 'loss/train': 1.4008110761642456} -11/06/2021 23:01:09 - INFO - __main__ - Step 12820: {'lr': 0.000493436266199046, 'samples': 2461440, 'steps': 12819, 'loss/train': 1.4729948043823242} -11/06/2021 23:01:09 - INFO - __main__ - Step 12821: {'lr': 0.0004934350581101676, 'samples': 2461632, 'steps': 12820, 'loss/train': 1.7127310037612915} -11/06/2021 23:01:10 - INFO - __main__ - Step 12822: {'lr': 0.0004934338499116011, 'samples': 2461824, 'steps': 12821, 'loss/train': 1.610058307647705} -11/06/2021 23:01:10 - INFO - __main__ - Step 12823: {'lr': 0.0004934326416033471, 'samples': 2462016, 'steps': 12822, 'loss/train': 1.9114627838134766} -11/06/2021 23:01:10 - INFO - __main__ - Step 12824: {'lr': 0.0004934314331854061, 'samples': 2462208, 'steps': 12823, 'loss/train': 1.826889157295227} -11/06/2021 23:01:12 - INFO - __main__ - Step 12825: {'lr': 0.0004934302246577786, 'samples': 2462400, 'steps': 12824, 'loss/train': 1.7399663925170898} -11/06/2021 23:01:12 - INFO - __main__ - Step 12826: {'lr': 0.0004934290160204652, 'samples': 2462592, 'steps': 12825, 'loss/train': 1.5818183422088623} -11/06/2021 23:01:12 - INFO - __main__ - Step 12827: {'lr': 0.0004934278072734666, 'samples': 2462784, 'steps': 12826, 'loss/train': 1.4330865144729614} -11/06/2021 23:01:13 - INFO - __main__ - Step 12828: {'lr': 0.000493426598416783, 'samples': 2462976, 'steps': 12827, 'loss/train': 1.77826988697052} -11/06/2021 23:01:13 - INFO - __main__ - Step 12829: {'lr': 0.0004934253894504152, 'samples': 2463168, 'steps': 12828, 'loss/train': 1.1493207216262817} -11/06/2021 23:01:14 - INFO - __main__ - Step 12830: {'lr': 0.0004934241803743637, 'samples': 2463360, 'steps': 12829, 'loss/train': 1.8719111680984497} -11/06/2021 23:01:14 - INFO - __main__ - Step 12831: {'lr': 0.000493422971188629, 'samples': 2463552, 'steps': 12830, 'loss/train': 1.228978157043457} -11/06/2021 23:01:15 - INFO - __main__ - Step 12832: {'lr': 0.0004934217618932117, 'samples': 2463744, 'steps': 12831, 'loss/train': 1.8399741649627686} -11/06/2021 23:01:15 - INFO - __main__ - Step 12833: {'lr': 0.0004934205524881123, 'samples': 2463936, 'steps': 12832, 'loss/train': 1.9681713581085205} -11/06/2021 23:01:15 - INFO - __main__ - Step 12834: {'lr': 0.0004934193429733312, 'samples': 2464128, 'steps': 12833, 'loss/train': 0.9652214050292969} -11/06/2021 23:01:17 - INFO - __main__ - Step 12835: {'lr': 0.0004934181333488693, 'samples': 2464320, 'steps': 12834, 'loss/train': 1.6454654932022095} -11/06/2021 23:01:18 - INFO - __main__ - Step 12836: {'lr': 0.0004934169236147268, 'samples': 2464512, 'steps': 12835, 'loss/train': 1.410776138305664} -11/06/2021 23:01:18 - INFO - __main__ - Step 12837: {'lr': 0.0004934157137709044, 'samples': 2464704, 'steps': 12836, 'loss/train': 1.5523715019226074} -11/06/2021 23:01:18 - INFO - __main__ - Step 12838: {'lr': 0.0004934145038174028, 'samples': 2464896, 'steps': 12837, 'loss/train': 1.6767199039459229} -11/06/2021 23:01:19 - INFO - __main__ - Step 12839: {'lr': 0.0004934132937542223, 'samples': 2465088, 'steps': 12838, 'loss/train': 1.64377760887146} -11/06/2021 23:01:19 - INFO - __main__ - Step 12840: {'lr': 0.0004934120835813634, 'samples': 2465280, 'steps': 12839, 'loss/train': 5.639301776885986} -11/06/2021 23:01:19 - INFO - __main__ - Step 12841: {'lr': 0.0004934108732988269, 'samples': 2465472, 'steps': 12840, 'loss/train': 5.523209095001221} -11/06/2021 23:01:20 - INFO - __main__ - Step 12842: {'lr': 0.0004934096629066133, 'samples': 2465664, 'steps': 12841, 'loss/train': 5.597353458404541} -11/06/2021 23:01:21 - INFO - __main__ - Step 12843: {'lr': 0.0004934084524047229, 'samples': 2465856, 'steps': 12842, 'loss/train': 2.109654188156128} -11/06/2021 23:01:21 - INFO - __main__ - Step 12844: {'lr': 0.0004934072417931564, 'samples': 2466048, 'steps': 12843, 'loss/train': 1.7585923671722412} -11/06/2021 23:01:22 - INFO - __main__ - Step 12845: {'lr': 0.0004934060310719145, 'samples': 2466240, 'steps': 12844, 'loss/train': 1.6276121139526367} -11/06/2021 23:01:22 - INFO - __main__ - Step 12846: {'lr': 0.0004934048202409974, 'samples': 2466432, 'steps': 12845, 'loss/train': 1.8930996656417847} -11/06/2021 23:01:22 - INFO - __main__ - Step 12847: {'lr': 0.000493403609300406, 'samples': 2466624, 'steps': 12846, 'loss/train': 1.744299054145813} -11/06/2021 23:01:23 - INFO - __main__ - Step 12848: {'lr': 0.0004934023982501406, 'samples': 2466816, 'steps': 12847, 'loss/train': 1.2807785272598267} -11/06/2021 23:01:24 - INFO - __main__ - Step 12849: {'lr': 0.000493401187090202, 'samples': 2467008, 'steps': 12848, 'loss/train': 1.8994098901748657} -11/06/2021 23:01:24 - INFO - __main__ - Step 12850: {'lr': 0.0004933999758205904, 'samples': 2467200, 'steps': 12849, 'loss/train': 1.5451972484588623} -11/06/2021 23:01:24 - INFO - __main__ - Step 12851: {'lr': 0.0004933987644413066, 'samples': 2467392, 'steps': 12850, 'loss/train': 1.0521020889282227} -11/06/2021 23:01:25 - INFO - __main__ - Step 12852: {'lr': 0.0004933975529523511, 'samples': 2467584, 'steps': 12851, 'loss/train': 1.6571444272994995} -11/06/2021 23:01:26 - INFO - __main__ - Step 12853: {'lr': 0.0004933963413537244, 'samples': 2467776, 'steps': 12852, 'loss/train': 1.570617437362671} -11/06/2021 23:01:26 - INFO - __main__ - Step 12854: {'lr': 0.000493395129645427, 'samples': 2467968, 'steps': 12853, 'loss/train': 0.8766611218452454} -11/06/2021 23:01:26 - INFO - __main__ - Step 12855: {'lr': 0.0004933939178274596, 'samples': 2468160, 'steps': 12854, 'loss/train': 1.5354561805725098} -11/06/2021 23:01:27 - INFO - __main__ - Step 12856: {'lr': 0.0004933927058998226, 'samples': 2468352, 'steps': 12855, 'loss/train': 1.74991774559021} -11/06/2021 23:01:27 - INFO - __main__ - Step 12857: {'lr': 0.0004933914938625166, 'samples': 2468544, 'steps': 12856, 'loss/train': 1.6767778396606445} -11/06/2021 23:01:28 - INFO - __main__ - Step 12858: {'lr': 0.0004933902817155422, 'samples': 2468736, 'steps': 12857, 'loss/train': 1.899521827697754} -11/06/2021 23:01:29 - INFO - __main__ - Step 12859: {'lr': 0.0004933890694588998, 'samples': 2468928, 'steps': 12858, 'loss/train': 1.837016224861145} -11/06/2021 23:01:29 - INFO - __main__ - Step 12860: {'lr': 0.0004933878570925901, 'samples': 2469120, 'steps': 12859, 'loss/train': 1.6478303670883179} -11/06/2021 23:01:29 - INFO - __main__ - Step 12861: {'lr': 0.0004933866446166136, 'samples': 2469312, 'steps': 12860, 'loss/train': 1.84537935256958} -11/06/2021 23:01:30 - INFO - __main__ - Step 12862: {'lr': 0.0004933854320309708, 'samples': 2469504, 'steps': 12861, 'loss/train': 2.0039706230163574} -11/06/2021 23:01:31 - INFO - __main__ - Step 12863: {'lr': 0.0004933842193356624, 'samples': 2469696, 'steps': 12862, 'loss/train': 2.835719585418701} -11/06/2021 23:01:31 - INFO - __main__ - Step 12864: {'lr': 0.0004933830065306887, 'samples': 2469888, 'steps': 12863, 'loss/train': 2.0461788177490234} -11/06/2021 23:01:31 - INFO - __main__ - Step 12865: {'lr': 0.0004933817936160504, 'samples': 2470080, 'steps': 12864, 'loss/train': 1.4113506078720093} -11/06/2021 23:01:32 - INFO - __main__ - Step 12866: {'lr': 0.0004933805805917479, 'samples': 2470272, 'steps': 12865, 'loss/train': 1.4473645687103271} -11/06/2021 23:01:32 - INFO - __main__ - Step 12867: {'lr': 0.000493379367457782, 'samples': 2470464, 'steps': 12866, 'loss/train': 1.7717403173446655} -11/06/2021 23:01:32 - INFO - __main__ - Step 12868: {'lr': 0.0004933781542141532, 'samples': 2470656, 'steps': 12867, 'loss/train': 1.985740303993225} -11/06/2021 23:01:34 - INFO - __main__ - Step 12869: {'lr': 0.0004933769408608618, 'samples': 2470848, 'steps': 12868, 'loss/train': 1.6742669343948364} -11/06/2021 23:01:34 - INFO - __main__ - Step 12870: {'lr': 0.0004933757273979086, 'samples': 2471040, 'steps': 12869, 'loss/train': 0.415326327085495} -11/06/2021 23:01:34 - INFO - __main__ - Step 12871: {'lr': 0.0004933745138252939, 'samples': 2471232, 'steps': 12870, 'loss/train': 1.893794298171997} -11/06/2021 23:01:35 - INFO - __main__ - Step 12872: {'lr': 0.0004933733001430186, 'samples': 2471424, 'steps': 12871, 'loss/train': 1.7198106050491333} -11/06/2021 23:01:35 - INFO - __main__ - Step 12873: {'lr': 0.000493372086351083, 'samples': 2471616, 'steps': 12872, 'loss/train': 2.0763978958129883} -11/06/2021 23:01:36 - INFO - __main__ - Step 12874: {'lr': 0.0004933708724494877, 'samples': 2471808, 'steps': 12873, 'loss/train': 1.426766276359558} -11/06/2021 23:01:36 - INFO - __main__ - Step 12875: {'lr': 0.0004933696584382331, 'samples': 2472000, 'steps': 12874, 'loss/train': 1.5616261959075928} -11/06/2021 23:01:37 - INFO - __main__ - Step 12876: {'lr': 0.00049336844431732, 'samples': 2472192, 'steps': 12875, 'loss/train': 1.1413694620132446} -11/06/2021 23:01:37 - INFO - __main__ - Step 12877: {'lr': 0.0004933672300867488, 'samples': 2472384, 'steps': 12876, 'loss/train': 1.5705578327178955} -11/06/2021 23:01:37 - INFO - __main__ - Step 12878: {'lr': 0.0004933660157465202, 'samples': 2472576, 'steps': 12877, 'loss/train': 1.6181583404541016} -11/06/2021 23:01:39 - INFO - __main__ - Step 12879: {'lr': 0.0004933648012966344, 'samples': 2472768, 'steps': 12878, 'loss/train': 2.557011842727661} -11/06/2021 23:01:39 - INFO - __main__ - Step 12880: {'lr': 0.0004933635867370923, 'samples': 2472960, 'steps': 12879, 'loss/train': 1.745104193687439} -11/06/2021 23:01:39 - INFO - __main__ - Step 12881: {'lr': 0.0004933623720678944, 'samples': 2473152, 'steps': 12880, 'loss/train': 1.816332459449768} -11/06/2021 23:01:40 - INFO - __main__ - Step 12882: {'lr': 0.000493361157289041, 'samples': 2473344, 'steps': 12881, 'loss/train': 1.7329145669937134} -11/06/2021 23:01:40 - INFO - __main__ - Step 12883: {'lr': 0.000493359942400533, 'samples': 2473536, 'steps': 12882, 'loss/train': 1.764685034751892} -11/06/2021 23:01:41 - INFO - __main__ - Step 12884: {'lr': 0.0004933587274023706, 'samples': 2473728, 'steps': 12883, 'loss/train': 1.9591374397277832} -11/06/2021 23:01:41 - INFO - __main__ - Step 12885: {'lr': 0.0004933575122945547, 'samples': 2473920, 'steps': 12884, 'loss/train': 1.8801758289337158} -11/06/2021 23:01:42 - INFO - __main__ - Step 12886: {'lr': 0.0004933562970770855, 'samples': 2474112, 'steps': 12885, 'loss/train': 1.7536741495132446} -11/06/2021 23:01:42 - INFO - __main__ - Step 12887: {'lr': 0.0004933550817499638, 'samples': 2474304, 'steps': 12886, 'loss/train': 1.2631752490997314} -11/06/2021 23:01:42 - INFO - __main__ - Step 12888: {'lr': 0.00049335386631319, 'samples': 2474496, 'steps': 12887, 'loss/train': 2.017979621887207} -11/06/2021 23:01:43 - INFO - __main__ - Step 12889: {'lr': 0.0004933526507667648, 'samples': 2474688, 'steps': 12888, 'loss/train': 2.223954200744629} -11/06/2021 23:01:44 - INFO - __main__ - Step 12890: {'lr': 0.0004933514351106885, 'samples': 2474880, 'steps': 12889, 'loss/train': 1.3178850412368774} -11/06/2021 23:01:44 - INFO - __main__ - Step 12891: {'lr': 0.0004933502193449618, 'samples': 2475072, 'steps': 12890, 'loss/train': 1.6767654418945312} -11/06/2021 23:01:44 - INFO - __main__ - Step 12892: {'lr': 0.0004933490034695853, 'samples': 2475264, 'steps': 12891, 'loss/train': 1.598570466041565} -11/06/2021 23:01:45 - INFO - __main__ - Step 12893: {'lr': 0.0004933477874845595, 'samples': 2475456, 'steps': 12892, 'loss/train': 1.9039117097854614} -11/06/2021 23:01:46 - INFO - __main__ - Step 12894: {'lr': 0.000493346571389885, 'samples': 2475648, 'steps': 12893, 'loss/train': 1.4883739948272705} -11/06/2021 23:01:46 - INFO - __main__ - Step 12895: {'lr': 0.0004933453551855622, 'samples': 2475840, 'steps': 12894, 'loss/train': 1.6035698652267456} -11/06/2021 23:01:47 - INFO - __main__ - Step 12896: {'lr': 0.0004933441388715919, 'samples': 2476032, 'steps': 12895, 'loss/train': 1.7423779964447021} -11/06/2021 23:01:47 - INFO - __main__ - Step 12897: {'lr': 0.0004933429224479743, 'samples': 2476224, 'steps': 12896, 'loss/train': 1.6877235174179077} -11/06/2021 23:01:48 - INFO - __main__ - Step 12898: {'lr': 0.0004933417059147102, 'samples': 2476416, 'steps': 12897, 'loss/train': 1.5222456455230713} -11/06/2021 23:01:48 - INFO - __main__ - Step 12899: {'lr': 0.0004933404892718, 'samples': 2476608, 'steps': 12898, 'loss/train': 0.5296525955200195} -11/06/2021 23:01:50 - INFO - __main__ - Step 12900: {'lr': 0.0004933392725192444, 'samples': 2476800, 'steps': 12899, 'loss/train': 2.3114047050476074} -11/06/2021 23:01:50 - INFO - __main__ - Step 12901: {'lr': 0.000493338055657044, 'samples': 2476992, 'steps': 12900, 'loss/train': 1.6073651313781738} -11/06/2021 23:01:50 - INFO - __main__ - Step 12902: {'lr': 0.0004933368386851991, 'samples': 2477184, 'steps': 12901, 'loss/train': 0.23120321333408356} -11/06/2021 23:01:51 - INFO - __main__ - Step 12903: {'lr': 0.0004933356216037104, 'samples': 2477376, 'steps': 12902, 'loss/train': 1.398972749710083} -11/06/2021 23:01:51 - INFO - __main__ - Step 12904: {'lr': 0.0004933344044125784, 'samples': 2477568, 'steps': 12903, 'loss/train': 1.585076093673706} -11/06/2021 23:01:52 - INFO - __main__ - Step 12905: {'lr': 0.0004933331871118037, 'samples': 2477760, 'steps': 12904, 'loss/train': 1.9329192638397217} -11/06/2021 23:01:52 - INFO - __main__ - Step 12906: {'lr': 0.0004933319697013869, 'samples': 2477952, 'steps': 12905, 'loss/train': 1.082170844078064} -11/06/2021 23:01:53 - INFO - __main__ - Step 12907: {'lr': 0.0004933307521813282, 'samples': 2478144, 'steps': 12906, 'loss/train': 1.3846449851989746} -11/06/2021 23:01:53 - INFO - __main__ - Step 12908: {'lr': 0.0004933295345516287, 'samples': 2478336, 'steps': 12907, 'loss/train': 1.5094048976898193} -11/06/2021 23:01:53 - INFO - __main__ - Step 12909: {'lr': 0.0004933283168122886, 'samples': 2478528, 'steps': 12908, 'loss/train': 1.7825679779052734} -11/06/2021 23:01:54 - INFO - __main__ - Step 12910: {'lr': 0.0004933270989633084, 'samples': 2478720, 'steps': 12909, 'loss/train': 2.0155463218688965} -11/06/2021 23:01:55 - INFO - __main__ - Step 12911: {'lr': 0.0004933258810046889, 'samples': 2478912, 'steps': 12910, 'loss/train': 1.8153250217437744} -11/06/2021 23:01:55 - INFO - __main__ - Step 12912: {'lr': 0.0004933246629364304, 'samples': 2479104, 'steps': 12911, 'loss/train': 1.8701039552688599} -11/06/2021 23:01:55 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.6900960206985474} -11/06/2021 23:01:56 - INFO - __main__ - Step 12914: {'lr': 0.0004933222264709991, 'samples': 2479488, 'steps': 12913, 'loss/train': 1.2670124769210815} -11/06/2021 23:01:57 - INFO - __main__ - Step 12915: {'lr': 0.0004933210080738273, 'samples': 2479680, 'steps': 12914, 'loss/train': 1.0174174308776855} -11/06/2021 23:01:57 - INFO - __main__ - Step 12916: {'lr': 0.0004933197895670187, 'samples': 2479872, 'steps': 12915, 'loss/train': 1.1427866220474243} -11/06/2021 23:01:58 - INFO - __main__ - Step 12917: {'lr': 0.0004933185709505741, 'samples': 2480064, 'steps': 12916, 'loss/train': 1.5414581298828125} -11/06/2021 23:01:58 - INFO - __main__ - Step 12918: {'lr': 0.0004933173522244939, 'samples': 2480256, 'steps': 12917, 'loss/train': 1.7401179075241089} -11/06/2021 23:01:58 - INFO - __main__ - Step 12919: {'lr': 0.0004933161333887786, 'samples': 2480448, 'steps': 12918, 'loss/train': 0.29492583870887756} -11/06/2021 23:02:00 - INFO - __main__ - Step 12920: {'lr': 0.0004933149144434288, 'samples': 2480640, 'steps': 12919, 'loss/train': 1.3319393396377563} -11/06/2021 23:02:00 - INFO - __main__ - Step 12921: {'lr': 0.0004933136953884451, 'samples': 2480832, 'steps': 12920, 'loss/train': 1.2883689403533936} -11/06/2021 23:02:00 - INFO - __main__ - Step 12922: {'lr': 0.0004933124762238279, 'samples': 2481024, 'steps': 12921, 'loss/train': 1.720632791519165} -11/06/2021 23:02:01 - INFO - __main__ - Step 12923: {'lr': 0.000493311256949578, 'samples': 2481216, 'steps': 12922, 'loss/train': 1.5766397714614868} -11/06/2021 23:02:01 - INFO - __main__ - Step 12924: {'lr': 0.0004933100375656957, 'samples': 2481408, 'steps': 12923, 'loss/train': 1.3622182607650757} -11/06/2021 23:02:02 - INFO - __main__ - Step 12925: {'lr': 0.0004933088180721817, 'samples': 2481600, 'steps': 12924, 'loss/train': 1.876354694366455} -11/06/2021 23:02:02 - INFO - __main__ - Step 12926: {'lr': 0.0004933075984690365, 'samples': 2481792, 'steps': 12925, 'loss/train': 1.9899784326553345} -11/06/2021 23:02:03 - INFO - __main__ - Step 12927: {'lr': 0.0004933063787562606, 'samples': 2481984, 'steps': 12926, 'loss/train': 1.0341933965682983} -11/06/2021 23:02:03 - INFO - __main__ - Step 12928: {'lr': 0.0004933051589338547, 'samples': 2482176, 'steps': 12927, 'loss/train': 1.815047025680542} -11/06/2021 23:02:03 - INFO - __main__ - Step 12929: {'lr': 0.0004933039390018192, 'samples': 2482368, 'steps': 12928, 'loss/train': 1.346707820892334} -11/06/2021 23:02:04 - INFO - __main__ - Step 12930: {'lr': 0.0004933027189601547, 'samples': 2482560, 'steps': 12929, 'loss/train': 1.6749612092971802} -11/06/2021 23:02:05 - INFO - __main__ - Step 12931: {'lr': 0.0004933014988088616, 'samples': 2482752, 'steps': 12930, 'loss/train': 1.7851786613464355} -11/06/2021 23:02:05 - INFO - __main__ - Step 12932: {'lr': 0.0004933002785479408, 'samples': 2482944, 'steps': 12931, 'loss/train': 1.2040504217147827} -11/06/2021 23:02:06 - INFO - __main__ - Step 12933: {'lr': 0.0004932990581773926, 'samples': 2483136, 'steps': 12932, 'loss/train': 1.582513451576233} -11/06/2021 23:02:06 - INFO - __main__ - Step 12934: {'lr': 0.0004932978376972175, 'samples': 2483328, 'steps': 12933, 'loss/train': 0.32476386427879333} -11/06/2021 23:02:06 - INFO - __main__ - Step 12935: {'lr': 0.0004932966171074163, 'samples': 2483520, 'steps': 12934, 'loss/train': 1.2251867055892944} -11/06/2021 23:02:07 - INFO - __main__ - Step 12936: {'lr': 0.0004932953964079893, 'samples': 2483712, 'steps': 12935, 'loss/train': 1.569036841392517} -11/06/2021 23:02:08 - INFO - __main__ - Step 12937: {'lr': 0.0004932941755989372, 'samples': 2483904, 'steps': 12936, 'loss/train': 1.9879359006881714} -11/06/2021 23:02:08 - INFO - __main__ - Step 12938: {'lr': 0.0004932929546802605, 'samples': 2484096, 'steps': 12937, 'loss/train': 1.4933514595031738} -11/06/2021 23:02:08 - INFO - __main__ - Step 12939: {'lr': 0.0004932917336519597, 'samples': 2484288, 'steps': 12938, 'loss/train': 1.2084016799926758} -11/06/2021 23:02:09 - INFO - __main__ - Step 12940: {'lr': 0.0004932905125140354, 'samples': 2484480, 'steps': 12939, 'loss/train': 1.5175234079360962} -11/06/2021 23:02:10 - INFO - __main__ - Step 12941: {'lr': 0.0004932892912664882, 'samples': 2484672, 'steps': 12940, 'loss/train': 1.7356916666030884} -11/06/2021 23:02:10 - INFO - __main__ - Step 12942: {'lr': 0.0004932880699093186, 'samples': 2484864, 'steps': 12941, 'loss/train': 1.6481016874313354} -11/06/2021 23:02:10 - INFO - __main__ - Step 12943: {'lr': 0.0004932868484425271, 'samples': 2485056, 'steps': 12942, 'loss/train': 1.8215060234069824} -11/06/2021 23:02:11 - INFO - __main__ - Step 12944: {'lr': 0.0004932856268661143, 'samples': 2485248, 'steps': 12943, 'loss/train': 1.5122387409210205} -11/06/2021 23:02:11 - INFO - __main__ - Step 12945: {'lr': 0.0004932844051800808, 'samples': 2485440, 'steps': 12944, 'loss/train': 1.9089007377624512} -11/06/2021 23:02:12 - INFO - __main__ - Step 12946: {'lr': 0.000493283183384427, 'samples': 2485632, 'steps': 12945, 'loss/train': 1.1102064847946167} -11/06/2021 23:02:13 - INFO - __main__ - Step 12947: {'lr': 0.0004932819614791537, 'samples': 2485824, 'steps': 12946, 'loss/train': 1.6587165594100952} -11/06/2021 23:02:13 - INFO - __main__ - Step 12948: {'lr': 0.0004932807394642612, 'samples': 2486016, 'steps': 12947, 'loss/train': 1.7909165620803833} -11/06/2021 23:02:13 - INFO - __main__ - Step 12949: {'lr': 0.0004932795173397501, 'samples': 2486208, 'steps': 12948, 'loss/train': 2.574796199798584} -11/06/2021 23:02:14 - INFO - __main__ - Step 12950: {'lr': 0.0004932782951056211, 'samples': 2486400, 'steps': 12949, 'loss/train': 2.0372557640075684} -11/06/2021 23:02:15 - INFO - __main__ - Step 12951: {'lr': 0.0004932770727618747, 'samples': 2486592, 'steps': 12950, 'loss/train': 3.691620349884033} -11/06/2021 23:02:15 - INFO - __main__ - Step 12952: {'lr': 0.0004932758503085114, 'samples': 2486784, 'steps': 12951, 'loss/train': 1.6988760232925415} -11/06/2021 23:02:15 - INFO - __main__ - Step 12953: {'lr': 0.0004932746277455317, 'samples': 2486976, 'steps': 12952, 'loss/train': 1.674808382987976} -11/06/2021 23:02:16 - INFO - __main__ - Step 12954: {'lr': 0.0004932734050729362, 'samples': 2487168, 'steps': 12953, 'loss/train': 1.2582000494003296} -11/06/2021 23:02:16 - INFO - __main__ - Step 12955: {'lr': 0.0004932721822907255, 'samples': 2487360, 'steps': 12954, 'loss/train': 1.9092744588851929} -11/06/2021 23:02:17 - INFO - __main__ - Step 12956: {'lr': 0.0004932709593989, 'samples': 2487552, 'steps': 12955, 'loss/train': 0.7507480978965759} -11/06/2021 23:02:17 - INFO - __main__ - Step 12957: {'lr': 0.0004932697363974604, 'samples': 2487744, 'steps': 12956, 'loss/train': 1.7332943677902222} -11/06/2021 23:02:18 - INFO - __main__ - Step 12958: {'lr': 0.0004932685132864072, 'samples': 2487936, 'steps': 12957, 'loss/train': 1.3571699857711792} -11/06/2021 23:02:18 - INFO - __main__ - Step 12959: {'lr': 0.0004932672900657411, 'samples': 2488128, 'steps': 12958, 'loss/train': 1.7823020219802856} -11/06/2021 23:02:18 - INFO - __main__ - Step 12960: {'lr': 0.0004932660667354623, 'samples': 2488320, 'steps': 12959, 'loss/train': 1.8756752014160156} -11/06/2021 23:02:20 - INFO - __main__ - Step 12961: {'lr': 0.0004932648432955717, 'samples': 2488512, 'steps': 12960, 'loss/train': 1.2283211946487427} -11/06/2021 23:02:20 - INFO - __main__ - Step 12962: {'lr': 0.0004932636197460698, 'samples': 2488704, 'steps': 12961, 'loss/train': 1.6361844539642334} -11/06/2021 23:02:20 - INFO - __main__ - Step 12963: {'lr': 0.0004932623960869569, 'samples': 2488896, 'steps': 12962, 'loss/train': 2.1100404262542725} -11/06/2021 23:02:21 - INFO - __main__ - Step 12964: {'lr': 0.0004932611723182338, 'samples': 2489088, 'steps': 12963, 'loss/train': 2.5909249782562256} -11/06/2021 23:02:21 - INFO - __main__ - Step 12965: {'lr': 0.000493259948439901, 'samples': 2489280, 'steps': 12964, 'loss/train': 1.8154479265213013} -11/06/2021 23:02:21 - INFO - __main__ - Step 12966: {'lr': 0.0004932587244519589, 'samples': 2489472, 'steps': 12965, 'loss/train': 1.5690723657608032} -11/06/2021 23:02:22 - INFO - __main__ - Step 12967: {'lr': 0.0004932575003544083, 'samples': 2489664, 'steps': 12966, 'loss/train': 1.8327417373657227} -11/06/2021 23:02:23 - INFO - __main__ - Step 12968: {'lr': 0.0004932562761472496, 'samples': 2489856, 'steps': 12967, 'loss/train': 1.6555702686309814} -11/06/2021 23:02:23 - INFO - __main__ - Step 12969: {'lr': 0.0004932550518304833, 'samples': 2490048, 'steps': 12968, 'loss/train': 1.708749532699585} -11/06/2021 23:02:23 - INFO - __main__ - Step 12970: {'lr': 0.0004932538274041101, 'samples': 2490240, 'steps': 12969, 'loss/train': 1.741576910018921} -11/06/2021 23:02:24 - INFO - __main__ - Step 12971: {'lr': 0.0004932526028681304, 'samples': 2490432, 'steps': 12970, 'loss/train': 1.9435254335403442} -11/06/2021 23:02:25 - INFO - __main__ - Step 12972: {'lr': 0.0004932513782225449, 'samples': 2490624, 'steps': 12971, 'loss/train': 1.1495224237442017} -11/06/2021 23:02:26 - INFO - __main__ - Step 12973: {'lr': 0.000493250153467354, 'samples': 2490816, 'steps': 12972, 'loss/train': 1.953014850616455} -11/06/2021 23:02:26 - INFO - __main__ - Step 12974: {'lr': 0.0004932489286025584, 'samples': 2491008, 'steps': 12973, 'loss/train': 1.809768557548523} -11/06/2021 23:02:26 - INFO - __main__ - Step 12975: {'lr': 0.0004932477036281586, 'samples': 2491200, 'steps': 12974, 'loss/train': 1.7049349546432495} -11/06/2021 23:02:27 - INFO - __main__ - Step 12976: {'lr': 0.0004932464785441552, 'samples': 2491392, 'steps': 12975, 'loss/train': 1.7377121448516846} -11/06/2021 23:02:27 - INFO - __main__ - Step 12977: {'lr': 0.0004932452533505486, 'samples': 2491584, 'steps': 12976, 'loss/train': 1.471701979637146} -11/06/2021 23:02:27 - INFO - __main__ - Step 12978: {'lr': 0.0004932440280473395, 'samples': 2491776, 'steps': 12977, 'loss/train': 1.8254519701004028} -11/06/2021 23:02:28 - INFO - __main__ - Step 12979: {'lr': 0.0004932428026345282, 'samples': 2491968, 'steps': 12978, 'loss/train': 1.869467854499817} -11/06/2021 23:02:29 - INFO - __main__ - Step 12980: {'lr': 0.0004932415771121157, 'samples': 2492160, 'steps': 12979, 'loss/train': 2.1289100646972656} -11/06/2021 23:02:29 - INFO - __main__ - Step 12981: {'lr': 0.0004932403514801021, 'samples': 2492352, 'steps': 12980, 'loss/train': 1.9706026315689087} -11/06/2021 23:02:29 - INFO - __main__ - Step 12982: {'lr': 0.0004932391257384883, 'samples': 2492544, 'steps': 12981, 'loss/train': 1.9861183166503906} -11/06/2021 23:02:30 - INFO - __main__ - Step 12983: {'lr': 0.0004932378998872746, 'samples': 2492736, 'steps': 12982, 'loss/train': 2.142361640930176} -11/06/2021 23:02:31 - INFO - __main__ - Step 12984: {'lr': 0.0004932366739264618, 'samples': 2492928, 'steps': 12983, 'loss/train': 0.2792867422103882} -11/06/2021 23:02:31 - INFO - __main__ - Step 12985: {'lr': 0.0004932354478560502, 'samples': 2493120, 'steps': 12984, 'loss/train': 1.9411041736602783} -11/06/2021 23:02:31 - INFO - __main__ - Step 12986: {'lr': 0.0004932342216760405, 'samples': 2493312, 'steps': 12985, 'loss/train': 1.882585883140564} -11/06/2021 23:02:32 - INFO - __main__ - Step 12987: {'lr': 0.0004932329953864331, 'samples': 2493504, 'steps': 12986, 'loss/train': 1.9840530157089233} -11/06/2021 23:02:32 - INFO - __main__ - Step 12988: {'lr': 0.0004932317689872287, 'samples': 2493696, 'steps': 12987, 'loss/train': 1.5482817888259888} -11/06/2021 23:02:33 - INFO - __main__ - Step 12989: {'lr': 0.000493230542478428, 'samples': 2493888, 'steps': 12988, 'loss/train': 1.229072093963623} -11/06/2021 23:02:34 - INFO - __main__ - Step 12990: {'lr': 0.0004932293158600312, 'samples': 2494080, 'steps': 12989, 'loss/train': 2.037853717803955} -11/06/2021 23:02:34 - INFO - __main__ - Step 12991: {'lr': 0.0004932280891320391, 'samples': 2494272, 'steps': 12990, 'loss/train': 1.9727879762649536} -11/06/2021 23:02:34 - INFO - __main__ - Step 12992: {'lr': 0.0004932268622944521, 'samples': 2494464, 'steps': 12991, 'loss/train': 2.1666083335876465} -11/06/2021 23:02:35 - INFO - __main__ - Step 12993: {'lr': 0.0004932256353472709, 'samples': 2494656, 'steps': 12992, 'loss/train': 1.4905357360839844} -11/06/2021 23:02:36 - INFO - __main__ - Step 12994: {'lr': 0.0004932244082904959, 'samples': 2494848, 'steps': 12993, 'loss/train': 1.4867180585861206} -11/06/2021 23:02:36 - INFO - __main__ - Step 12995: {'lr': 0.0004932231811241278, 'samples': 2495040, 'steps': 12994, 'loss/train': 0.779282808303833} -11/06/2021 23:02:36 - INFO - __main__ - Step 12996: {'lr': 0.0004932219538481672, 'samples': 2495232, 'steps': 12995, 'loss/train': 1.931758165359497} -11/06/2021 23:02:37 - INFO - __main__ - Step 12997: {'lr': 0.0004932207264626143, 'samples': 2495424, 'steps': 12996, 'loss/train': 1.4099301099777222} -11/06/2021 23:02:37 - INFO - __main__ - Step 12998: {'lr': 0.00049321949896747, 'samples': 2495616, 'steps': 12997, 'loss/train': 1.4822603464126587} -11/06/2021 23:02:39 - INFO - __main__ - Step 12999: {'lr': 0.0004932182713627348, 'samples': 2495808, 'steps': 12998, 'loss/train': 1.0354619026184082} -11/06/2021 23:02:39 - INFO - __main__ - Step 13000: {'lr': 0.0004932170436484091, 'samples': 2496000, 'steps': 12999, 'loss/train': 0.504642903804779} -11/06/2021 23:02:39 - INFO - __main__ - Step 13001: {'lr': 0.0004932158158244937, 'samples': 2496192, 'steps': 13000, 'loss/train': 0.3501379191875458} -11/06/2021 23:02:40 - INFO - __main__ - Step 13002: {'lr': 0.0004932145878909889, 'samples': 2496384, 'steps': 13001, 'loss/train': 1.9297839403152466} -11/06/2021 23:02:40 - INFO - __main__ - Step 13003: {'lr': 0.0004932133598478953, 'samples': 2496576, 'steps': 13002, 'loss/train': 1.891198754310608} -11/06/2021 23:02:41 - INFO - __main__ - Step 13004: {'lr': 0.0004932121316952136, 'samples': 2496768, 'steps': 13003, 'loss/train': 1.5406192541122437} -11/06/2021 23:02:41 - INFO - __main__ - Step 13005: {'lr': 0.0004932109034329442, 'samples': 2496960, 'steps': 13004, 'loss/train': 1.6352239847183228} -11/06/2021 23:02:42 - INFO - __main__ - Step 13006: {'lr': 0.0004932096750610879, 'samples': 2497152, 'steps': 13005, 'loss/train': 1.8479753732681274} -11/06/2021 23:02:42 - INFO - __main__ - Step 13007: {'lr': 0.0004932084465796449, 'samples': 2497344, 'steps': 13006, 'loss/train': 1.7984743118286133} -11/06/2021 23:02:43 - INFO - __main__ - Step 13008: {'lr': 0.000493207217988616, 'samples': 2497536, 'steps': 13007, 'loss/train': 1.575510025024414} -11/06/2021 23:02:44 - INFO - __main__ - Step 13009: {'lr': 0.0004932059892880016, 'samples': 2497728, 'steps': 13008, 'loss/train': 1.1041618585586548} -11/06/2021 23:02:44 - INFO - __main__ - Step 13010: {'lr': 0.0004932047604778025, 'samples': 2497920, 'steps': 13009, 'loss/train': 0.6211431622505188} -11/06/2021 23:02:45 - INFO - __main__ - Step 13011: {'lr': 0.0004932035315580188, 'samples': 2498112, 'steps': 13010, 'loss/train': 2.066260576248169} -11/06/2021 23:02:45 - INFO - __main__ - Step 13012: {'lr': 0.0004932023025286516, 'samples': 2498304, 'steps': 13011, 'loss/train': 1.6674903631210327} -11/06/2021 23:02:45 - INFO - __main__ - Step 13013: {'lr': 0.0004932010733897012, 'samples': 2498496, 'steps': 13012, 'loss/train': 1.5579228401184082} -11/06/2021 23:02:46 - INFO - __main__ - Step 13014: {'lr': 0.000493199844141168, 'samples': 2498688, 'steps': 13013, 'loss/train': 1.8701536655426025} -11/06/2021 23:02:47 - INFO - __main__ - Step 13015: {'lr': 0.0004931986147830527, 'samples': 2498880, 'steps': 13014, 'loss/train': 1.726219654083252} -11/06/2021 23:02:47 - INFO - __main__ - Step 13016: {'lr': 0.000493197385315356, 'samples': 2499072, 'steps': 13015, 'loss/train': 1.4233412742614746} -11/06/2021 23:02:47 - INFO - __main__ - Step 13017: {'lr': 0.0004931961557380782, 'samples': 2499264, 'steps': 13016, 'loss/train': 1.2359046936035156} -11/06/2021 23:02:48 - INFO - __main__ - Step 13018: {'lr': 0.00049319492605122, 'samples': 2499456, 'steps': 13017, 'loss/train': 1.8722537755966187} -11/06/2021 23:02:48 - INFO - __main__ - Step 13019: {'lr': 0.000493193696254782, 'samples': 2499648, 'steps': 13018, 'loss/train': 1.5985851287841797} -11/06/2021 23:02:49 - INFO - __main__ - Step 13020: {'lr': 0.0004931924663487646, 'samples': 2499840, 'steps': 13019, 'loss/train': 1.6530154943466187} -11/06/2021 23:02:50 - INFO - __main__ - Step 13021: {'lr': 0.0004931912363331683, 'samples': 2500032, 'steps': 13020, 'loss/train': 1.8538419008255005} -11/06/2021 23:02:50 - INFO - __main__ - Step 13022: {'lr': 0.000493190006207994, 'samples': 2500224, 'steps': 13021, 'loss/train': 1.3083375692367554} -11/06/2021 23:02:50 - INFO - __main__ - Step 13023: {'lr': 0.0004931887759732419, 'samples': 2500416, 'steps': 13022, 'loss/train': 1.6392176151275635} -11/06/2021 23:02:51 - INFO - __main__ - Step 13024: {'lr': 0.0004931875456289128, 'samples': 2500608, 'steps': 13023, 'loss/train': 1.1660975217819214} -11/06/2021 23:02:52 - INFO - __main__ - Step 13025: {'lr': 0.000493186315175007, 'samples': 2500800, 'steps': 13024, 'loss/train': 1.6558512449264526} -11/06/2021 23:02:52 - INFO - __main__ - Step 13026: {'lr': 0.0004931850846115253, 'samples': 2500992, 'steps': 13025, 'loss/train': 1.7009488344192505} -11/06/2021 23:02:52 - INFO - __main__ - Step 13027: {'lr': 0.0004931838539384681, 'samples': 2501184, 'steps': 13026, 'loss/train': 1.87421452999115} -11/06/2021 23:02:53 - INFO - __main__ - Step 13028: {'lr': 0.0004931826231558361, 'samples': 2501376, 'steps': 13027, 'loss/train': 1.698980450630188} -11/06/2021 23:02:53 - INFO - __main__ - Step 13029: {'lr': 0.0004931813922636297, 'samples': 2501568, 'steps': 13028, 'loss/train': 2.1995387077331543} -11/06/2021 23:02:53 - INFO - __main__ - Step 13030: {'lr': 0.0004931801612618494, 'samples': 2501760, 'steps': 13029, 'loss/train': 0.9826458692550659} -11/06/2021 23:02:54 - INFO - __main__ - Step 13031: {'lr': 0.0004931789301504961, 'samples': 2501952, 'steps': 13030, 'loss/train': 1.9155287742614746} -11/06/2021 23:02:55 - INFO - __main__ - Step 13032: {'lr': 0.00049317769892957, 'samples': 2502144, 'steps': 13031, 'loss/train': 2.2658934593200684} -11/06/2021 23:02:55 - INFO - __main__ - Step 13033: {'lr': 0.0004931764675990718, 'samples': 2502336, 'steps': 13032, 'loss/train': 1.7716729640960693} -11/06/2021 23:02:56 - INFO - __main__ - Step 13034: {'lr': 0.000493175236159002, 'samples': 2502528, 'steps': 13033, 'loss/train': 2.120985269546509} -11/06/2021 23:02:56 - INFO - __main__ - Step 13035: {'lr': 0.0004931740046093612, 'samples': 2502720, 'steps': 13034, 'loss/train': 1.8945417404174805} -11/06/2021 23:02:57 - INFO - __main__ - Step 13036: {'lr': 0.0004931727729501499, 'samples': 2502912, 'steps': 13035, 'loss/train': 1.613181471824646} -11/06/2021 23:02:57 - INFO - __main__ - Step 13037: {'lr': 0.0004931715411813689, 'samples': 2503104, 'steps': 13036, 'loss/train': 1.5703870058059692} -11/06/2021 23:02:58 - INFO - __main__ - Step 13038: {'lr': 0.0004931703093030183, 'samples': 2503296, 'steps': 13037, 'loss/train': 1.6445674896240234} -11/06/2021 23:02:58 - INFO - __main__ - Step 13039: {'lr': 0.0004931690773150991, 'samples': 2503488, 'steps': 13038, 'loss/train': 1.3863145112991333} -11/06/2021 23:02:58 - INFO - __main__ - Step 13040: {'lr': 0.0004931678452176116, 'samples': 2503680, 'steps': 13039, 'loss/train': 1.5152404308319092} -11/06/2021 23:02:59 - INFO - __main__ - Step 13041: {'lr': 0.0004931666130105563, 'samples': 2503872, 'steps': 13040, 'loss/train': 1.6495338678359985} -11/06/2021 23:03:00 - INFO - __main__ - Step 13042: {'lr': 0.0004931653806939341, 'samples': 2504064, 'steps': 13041, 'loss/train': 1.6312777996063232} -11/06/2021 23:03:00 - INFO - __main__ - Step 13043: {'lr': 0.0004931641482677452, 'samples': 2504256, 'steps': 13042, 'loss/train': 1.6087427139282227} -11/06/2021 23:03:01 - INFO - __main__ - Step 13044: {'lr': 0.0004931629157319904, 'samples': 2504448, 'steps': 13043, 'loss/train': 1.2086093425750732} -11/06/2021 23:03:01 - INFO - __main__ - Step 13045: {'lr': 0.00049316168308667, 'samples': 2504640, 'steps': 13044, 'loss/train': 0.33910736441612244} -11/06/2021 23:03:02 - INFO - __main__ - Step 13046: {'lr': 0.0004931604503317846, 'samples': 2504832, 'steps': 13045, 'loss/train': 1.6171785593032837} -11/06/2021 23:03:02 - INFO - __main__ - Step 13047: {'lr': 0.0004931592174673351, 'samples': 2505024, 'steps': 13046, 'loss/train': 1.6778055429458618} -11/06/2021 23:03:03 - INFO - __main__ - Step 13048: {'lr': 0.0004931579844933218, 'samples': 2505216, 'steps': 13047, 'loss/train': 1.8838071823120117} -11/06/2021 23:03:03 - INFO - __main__ - Step 13049: {'lr': 0.0004931567514097451, 'samples': 2505408, 'steps': 13048, 'loss/train': 1.89003586769104} -11/06/2021 23:03:03 - INFO - __main__ - Step 13050: {'lr': 0.0004931555182166059, 'samples': 2505600, 'steps': 13049, 'loss/train': 1.5584383010864258} -11/06/2021 23:03:04 - INFO - __main__ - Step 13051: {'lr': 0.0004931542849139044, 'samples': 2505792, 'steps': 13050, 'loss/train': 2.8212499618530273} -11/06/2021 23:03:05 - INFO - __main__ - Step 13052: {'lr': 0.0004931530515016415, 'samples': 2505984, 'steps': 13051, 'loss/train': 1.6236906051635742} -11/06/2021 23:03:05 - INFO - __main__ - Step 13053: {'lr': 0.0004931518179798175, 'samples': 2506176, 'steps': 13052, 'loss/train': 1.8090659379959106} -11/06/2021 23:03:05 - INFO - __main__ - Step 13054: {'lr': 0.000493150584348433, 'samples': 2506368, 'steps': 13053, 'loss/train': 1.5024513006210327} -11/06/2021 23:03:06 - INFO - __main__ - Step 13055: {'lr': 0.0004931493506074886, 'samples': 2506560, 'steps': 13054, 'loss/train': 1.271149754524231} -11/06/2021 23:03:07 - INFO - __main__ - Step 13056: {'lr': 0.0004931481167569849, 'samples': 2506752, 'steps': 13055, 'loss/train': 1.1166818141937256} -11/06/2021 23:03:07 - INFO - __main__ - Step 13057: {'lr': 0.0004931468827969223, 'samples': 2506944, 'steps': 13056, 'loss/train': 1.8440206050872803} -11/06/2021 23:03:08 - INFO - __main__ - Step 13058: {'lr': 0.0004931456487273017, 'samples': 2507136, 'steps': 13057, 'loss/train': 1.7418556213378906} -11/06/2021 23:03:08 - INFO - __main__ - Step 13059: {'lr': 0.0004931444145481233, 'samples': 2507328, 'steps': 13058, 'loss/train': 1.3444815874099731} -11/06/2021 23:03:08 - INFO - __main__ - Step 13060: {'lr': 0.0004931431802593877, 'samples': 2507520, 'steps': 13059, 'loss/train': 2.082310438156128} -11/06/2021 23:03:09 - INFO - __main__ - Step 13061: {'lr': 0.0004931419458610956, 'samples': 2507712, 'steps': 13060, 'loss/train': 0.22066687047481537} -11/06/2021 23:03:10 - INFO - __main__ - Step 13062: {'lr': 0.0004931407113532476, 'samples': 2507904, 'steps': 13061, 'loss/train': 1.8766014575958252} -11/06/2021 23:03:10 - INFO - __main__ - Step 13063: {'lr': 0.000493139476735844, 'samples': 2508096, 'steps': 13062, 'loss/train': 2.6808207035064697} -11/06/2021 23:03:10 - INFO - __main__ - Step 13064: {'lr': 0.0004931382420088855, 'samples': 2508288, 'steps': 13063, 'loss/train': 1.8290174007415771} -11/06/2021 23:03:11 - INFO - __main__ - Step 13065: {'lr': 0.0004931370071723728, 'samples': 2508480, 'steps': 13064, 'loss/train': 1.6822478771209717} -11/06/2021 23:03:11 - INFO - __main__ - Step 13066: {'lr': 0.0004931357722263061, 'samples': 2508672, 'steps': 13065, 'loss/train': 1.7262883186340332} -11/06/2021 23:03:12 - INFO - __main__ - Step 13067: {'lr': 0.0004931345371706863, 'samples': 2508864, 'steps': 13066, 'loss/train': 1.8077123165130615} -11/06/2021 23:03:13 - INFO - __main__ - Step 13068: {'lr': 0.0004931333020055139, 'samples': 2509056, 'steps': 13067, 'loss/train': 1.600835919380188} -11/06/2021 23:03:13 - INFO - __main__ - Step 13069: {'lr': 0.0004931320667307893, 'samples': 2509248, 'steps': 13068, 'loss/train': 2.081484794616699} -11/06/2021 23:03:13 - INFO - __main__ - Step 13070: {'lr': 0.0004931308313465132, 'samples': 2509440, 'steps': 13069, 'loss/train': 1.9141942262649536} -11/06/2021 23:03:14 - INFO - __main__ - Step 13071: {'lr': 0.000493129595852686, 'samples': 2509632, 'steps': 13070, 'loss/train': 3.5768423080444336} -11/06/2021 23:03:15 - INFO - __main__ - Step 13072: {'lr': 0.0004931283602493084, 'samples': 2509824, 'steps': 13071, 'loss/train': 1.5225051641464233} -11/06/2021 23:03:15 - INFO - __main__ - Step 13073: {'lr': 0.0004931271245363809, 'samples': 2510016, 'steps': 13072, 'loss/train': 1.574705958366394} -11/06/2021 23:03:15 - INFO - __main__ - Step 13074: {'lr': 0.0004931258887139041, 'samples': 2510208, 'steps': 13073, 'loss/train': 1.5260777473449707} -11/06/2021 23:03:16 - INFO - __main__ - Step 13075: {'lr': 0.0004931246527818785, 'samples': 2510400, 'steps': 13074, 'loss/train': 1.26536226272583} -11/06/2021 23:03:16 - INFO - __main__ - Step 13076: {'lr': 0.0004931234167403047, 'samples': 2510592, 'steps': 13075, 'loss/train': 1.4206626415252686} -11/06/2021 23:03:17 - INFO - __main__ - Step 13077: {'lr': 0.0004931221805891833, 'samples': 2510784, 'steps': 13076, 'loss/train': 1.6260327100753784} -11/06/2021 23:03:17 - INFO - __main__ - Step 13078: {'lr': 0.0004931209443285147, 'samples': 2510976, 'steps': 13077, 'loss/train': 1.759495735168457} -11/06/2021 23:03:18 - INFO - __main__ - Step 13079: {'lr': 0.0004931197079582996, 'samples': 2511168, 'steps': 13078, 'loss/train': 1.1801636219024658} -11/06/2021 23:03:18 - INFO - __main__ - Step 13080: {'lr': 0.0004931184714785385, 'samples': 2511360, 'steps': 13079, 'loss/train': 1.9777021408081055} -11/06/2021 23:03:18 - INFO - __main__ - Step 13081: {'lr': 0.000493117234889232, 'samples': 2511552, 'steps': 13080, 'loss/train': 1.551526665687561} -11/06/2021 23:03:20 - INFO - __main__ - Step 13082: {'lr': 0.0004931159981903805, 'samples': 2511744, 'steps': 13081, 'loss/train': 1.3697116374969482} -11/06/2021 23:03:20 - INFO - __main__ - Step 13083: {'lr': 0.0004931147613819848, 'samples': 2511936, 'steps': 13082, 'loss/train': 1.5000561475753784} -11/06/2021 23:03:20 - INFO - __main__ - Step 13084: {'lr': 0.0004931135244640453, 'samples': 2512128, 'steps': 13083, 'loss/train': 1.6628344058990479} -11/06/2021 23:03:21 - INFO - __main__ - Step 13085: {'lr': 0.0004931122874365627, 'samples': 2512320, 'steps': 13084, 'loss/train': 1.448068618774414} -11/06/2021 23:03:21 - INFO - __main__ - Step 13086: {'lr': 0.0004931110502995374, 'samples': 2512512, 'steps': 13085, 'loss/train': 1.518585443496704} -11/06/2021 23:03:22 - INFO - __main__ - Step 13087: {'lr': 0.0004931098130529699, 'samples': 2512704, 'steps': 13086, 'loss/train': 2.025705099105835} -11/06/2021 23:03:22 - INFO - __main__ - Step 13088: {'lr': 0.000493108575696861, 'samples': 2512896, 'steps': 13087, 'loss/train': 1.6481513977050781} -11/06/2021 23:03:23 - INFO - __main__ - Step 13089: {'lr': 0.0004931073382312111, 'samples': 2513088, 'steps': 13088, 'loss/train': 1.394457221031189} -11/06/2021 23:03:23 - INFO - __main__ - Step 13090: {'lr': 0.0004931061006560207, 'samples': 2513280, 'steps': 13089, 'loss/train': 1.560387134552002} -11/06/2021 23:03:23 - INFO - __main__ - Step 13091: {'lr': 0.0004931048629712905, 'samples': 2513472, 'steps': 13090, 'loss/train': 1.8698866367340088} -11/06/2021 23:03:24 - INFO - __main__ - Step 13092: {'lr': 0.000493103625177021, 'samples': 2513664, 'steps': 13091, 'loss/train': 2.115483522415161} -11/06/2021 23:03:25 - INFO - __main__ - Step 13093: {'lr': 0.0004931023872732128, 'samples': 2513856, 'steps': 13092, 'loss/train': 1.7177084684371948} -11/06/2021 23:03:25 - INFO - __main__ - Step 13094: {'lr': 0.0004931011492598664, 'samples': 2514048, 'steps': 13093, 'loss/train': 0.9922665953636169} -11/06/2021 23:03:25 - INFO - __main__ - Step 13095: {'lr': 0.0004930999111369824, 'samples': 2514240, 'steps': 13094, 'loss/train': 1.6571738719940186} -11/06/2021 23:03:26 - INFO - __main__ - Step 13096: {'lr': 0.0004930986729045613, 'samples': 2514432, 'steps': 13095, 'loss/train': 1.8621472120285034} -11/06/2021 23:03:26 - INFO - __main__ - Step 13097: {'lr': 0.0004930974345626036, 'samples': 2514624, 'steps': 13096, 'loss/train': 1.177014708518982} -11/06/2021 23:03:27 - INFO - __main__ - Step 13098: {'lr': 0.00049309619611111, 'samples': 2514816, 'steps': 13097, 'loss/train': 1.6075189113616943} -11/06/2021 23:03:28 - INFO - __main__ - Step 13099: {'lr': 0.000493094957550081, 'samples': 2515008, 'steps': 13098, 'loss/train': 1.3369756937026978} -11/06/2021 23:03:28 - INFO - __main__ - Step 13100: {'lr': 0.0004930937188795172, 'samples': 2515200, 'steps': 13099, 'loss/train': 1.7597624063491821} -11/06/2021 23:03:28 - INFO - __main__ - Step 13101: {'lr': 0.0004930924800994192, 'samples': 2515392, 'steps': 13100, 'loss/train': 1.1955498456954956} -11/06/2021 23:03:29 - INFO - __main__ - Step 13102: {'lr': 0.0004930912412097874, 'samples': 2515584, 'steps': 13101, 'loss/train': 2.0432753562927246} -11/06/2021 23:03:30 - INFO - __main__ - Step 13103: {'lr': 0.0004930900022106224, 'samples': 2515776, 'steps': 13102, 'loss/train': 1.897919774055481} -11/06/2021 23:03:30 - INFO - __main__ - Step 13104: {'lr': 0.0004930887631019248, 'samples': 2515968, 'steps': 13103, 'loss/train': 1.3024754524230957} -11/06/2021 23:03:30 - INFO - __main__ - Step 13105: {'lr': 0.0004930875238836951, 'samples': 2516160, 'steps': 13104, 'loss/train': 1.7677634954452515} -11/06/2021 23:03:31 - INFO - __main__ - Step 13106: {'lr': 0.000493086284555934, 'samples': 2516352, 'steps': 13105, 'loss/train': 2.061279773712158} -11/06/2021 23:03:31 - INFO - __main__ - Step 13107: {'lr': 0.0004930850451186421, 'samples': 2516544, 'steps': 13106, 'loss/train': 1.8709264993667603} -11/06/2021 23:03:32 - INFO - __main__ - Step 13108: {'lr': 0.0004930838055718196, 'samples': 2516736, 'steps': 13107, 'loss/train': 1.6638407707214355} -11/06/2021 23:03:32 - INFO - __main__ - Step 13109: {'lr': 0.0004930825659154674, 'samples': 2516928, 'steps': 13108, 'loss/train': 0.959062397480011} -11/06/2021 23:03:33 - INFO - __main__ - Step 13110: {'lr': 0.000493081326149586, 'samples': 2517120, 'steps': 13109, 'loss/train': 1.8210927248001099} -11/06/2021 23:03:33 - INFO - __main__ - Step 13111: {'lr': 0.0004930800862741758, 'samples': 2517312, 'steps': 13110, 'loss/train': 1.239546775817871} -11/06/2021 23:03:33 - INFO - __main__ - Step 13112: {'lr': 0.0004930788462892375, 'samples': 2517504, 'steps': 13111, 'loss/train': 1.4559482336044312} -11/06/2021 23:03:34 - INFO - __main__ - Step 13113: {'lr': 0.0004930776061947716, 'samples': 2517696, 'steps': 13112, 'loss/train': 1.6347291469573975} -11/06/2021 23:03:35 - INFO - __main__ - Step 13114: {'lr': 0.0004930763659907788, 'samples': 2517888, 'steps': 13113, 'loss/train': 1.7659398317337036} -11/06/2021 23:03:35 - INFO - __main__ - Step 13115: {'lr': 0.0004930751256772593, 'samples': 2518080, 'steps': 13114, 'loss/train': 1.8895224332809448} -11/06/2021 23:03:35 - INFO - __main__ - Step 13116: {'lr': 0.0004930738852542141, 'samples': 2518272, 'steps': 13115, 'loss/train': 1.4143397808074951} -11/06/2021 23:03:36 - INFO - __main__ - Step 13117: {'lr': 0.0004930726447216435, 'samples': 2518464, 'steps': 13116, 'loss/train': 2.018646240234375} -11/06/2021 23:03:37 - INFO - __main__ - Step 13118: {'lr': 0.0004930714040795481, 'samples': 2518656, 'steps': 13117, 'loss/train': 1.5822020769119263} -11/06/2021 23:03:37 - INFO - __main__ - Step 13119: {'lr': 0.0004930701633279285, 'samples': 2518848, 'steps': 13118, 'loss/train': 1.5482772588729858} -11/06/2021 23:03:38 - INFO - __main__ - Step 13120: {'lr': 0.0004930689224667853, 'samples': 2519040, 'steps': 13119, 'loss/train': 1.1191784143447876} -11/06/2021 23:03:38 - INFO - __main__ - Step 13121: {'lr': 0.0004930676814961189, 'samples': 2519232, 'steps': 13120, 'loss/train': 1.5763609409332275} -11/06/2021 23:03:38 - INFO - __main__ - Step 13122: {'lr': 0.00049306644041593, 'samples': 2519424, 'steps': 13121, 'loss/train': 1.3790456056594849} -11/06/2021 23:03:40 - INFO - __main__ - Step 13123: {'lr': 0.0004930651992262191, 'samples': 2519616, 'steps': 13122, 'loss/train': 1.3503462076187134} -11/06/2021 23:03:40 - INFO - __main__ - Step 13124: {'lr': 0.0004930639579269866, 'samples': 2519808, 'steps': 13123, 'loss/train': 1.4450675249099731} -11/06/2021 23:03:41 - INFO - __main__ - Step 13125: {'lr': 0.0004930627165182335, 'samples': 2520000, 'steps': 13124, 'loss/train': 1.5567551851272583} -11/06/2021 23:03:41 - INFO - __main__ - Step 13126: {'lr': 0.00049306147499996, 'samples': 2520192, 'steps': 13125, 'loss/train': 1.7951613664627075} -11/06/2021 23:03:42 - INFO - __main__ - Step 13127: {'lr': 0.0004930602333721667, 'samples': 2520384, 'steps': 13126, 'loss/train': 1.6020070314407349} -11/06/2021 23:03:42 - INFO - __main__ - Step 13128: {'lr': 0.0004930589916348542, 'samples': 2520576, 'steps': 13127, 'loss/train': 1.8576689958572388} -11/06/2021 23:03:42 - INFO - __main__ - Step 13129: {'lr': 0.0004930577497880231, 'samples': 2520768, 'steps': 13128, 'loss/train': 1.8128331899642944} -11/06/2021 23:03:43 - INFO - __main__ - Step 13130: {'lr': 0.000493056507831674, 'samples': 2520960, 'steps': 13129, 'loss/train': 1.8191680908203125} -11/06/2021 23:03:44 - INFO - __main__ - Step 13131: {'lr': 0.0004930552657658073, 'samples': 2521152, 'steps': 13130, 'loss/train': 1.0424447059631348} -11/06/2021 23:03:44 - INFO - __main__ - Step 13132: {'lr': 0.0004930540235904237, 'samples': 2521344, 'steps': 13131, 'loss/train': 0.9502253532409668} -11/06/2021 23:03:44 - INFO - __main__ - Step 13133: {'lr': 0.0004930527813055237, 'samples': 2521536, 'steps': 13132, 'loss/train': 2.1043529510498047} -11/06/2021 23:03:45 - INFO - __main__ - Step 13134: {'lr': 0.0004930515389111078, 'samples': 2521728, 'steps': 13133, 'loss/train': 1.6203279495239258} -11/06/2021 23:03:46 - INFO - __main__ - Step 13135: {'lr': 0.0004930502964071767, 'samples': 2521920, 'steps': 13134, 'loss/train': 1.872376561164856} -11/06/2021 23:03:46 - INFO - __main__ - Step 13136: {'lr': 0.0004930490537937309, 'samples': 2522112, 'steps': 13135, 'loss/train': 1.530863881111145} -11/06/2021 23:03:46 - INFO - __main__ - Step 13137: {'lr': 0.0004930478110707709, 'samples': 2522304, 'steps': 13136, 'loss/train': 1.446254014968872} -11/06/2021 23:03:47 - INFO - __main__ - Step 13138: {'lr': 0.0004930465682382973, 'samples': 2522496, 'steps': 13137, 'loss/train': 2.3736038208007812} -11/06/2021 23:03:47 - INFO - __main__ - Step 13139: {'lr': 0.0004930453252963107, 'samples': 2522688, 'steps': 13138, 'loss/train': 1.7954354286193848} -11/06/2021 23:03:48 - INFO - __main__ - Step 13140: {'lr': 0.0004930440822448115, 'samples': 2522880, 'steps': 13139, 'loss/train': 1.4115676879882812} -11/06/2021 23:03:48 - INFO - __main__ - Step 13141: {'lr': 0.0004930428390838006, 'samples': 2523072, 'steps': 13140, 'loss/train': 1.7960898876190186} -11/06/2021 23:03:49 - INFO - __main__ - Step 13142: {'lr': 0.0004930415958132782, 'samples': 2523264, 'steps': 13141, 'loss/train': 1.5703538656234741} -11/06/2021 23:03:49 - INFO - __main__ - Step 13143: {'lr': 0.0004930403524332451, 'samples': 2523456, 'steps': 13142, 'loss/train': 1.3508336544036865} -11/06/2021 23:03:50 - INFO - __main__ - Step 13144: {'lr': 0.0004930391089437017, 'samples': 2523648, 'steps': 13143, 'loss/train': 1.7475541830062866} -11/06/2021 23:03:51 - INFO - __main__ - Step 13145: {'lr': 0.0004930378653446487, 'samples': 2523840, 'steps': 13144, 'loss/train': 1.8159362077713013} -11/06/2021 23:03:51 - INFO - __main__ - Step 13146: {'lr': 0.0004930366216360865, 'samples': 2524032, 'steps': 13145, 'loss/train': 1.6725317239761353} -11/06/2021 23:03:51 - INFO - __main__ - Step 13147: {'lr': 0.0004930353778180158, 'samples': 2524224, 'steps': 13146, 'loss/train': 1.5883946418762207} -11/06/2021 23:03:52 - INFO - __main__ - Step 13148: {'lr': 0.0004930341338904371, 'samples': 2524416, 'steps': 13147, 'loss/train': 1.889960765838623} -11/06/2021 23:03:52 - INFO - __main__ - Step 13149: {'lr': 0.000493032889853351, 'samples': 2524608, 'steps': 13148, 'loss/train': 1.9227193593978882} -11/06/2021 23:03:53 - INFO - __main__ - Step 13150: {'lr': 0.0004930316457067579, 'samples': 2524800, 'steps': 13149, 'loss/train': 1.51223886013031} -11/06/2021 23:03:53 - INFO - __main__ - Step 13151: {'lr': 0.0004930304014506586, 'samples': 2524992, 'steps': 13150, 'loss/train': 1.603259801864624} -11/06/2021 23:03:54 - INFO - __main__ - Step 13152: {'lr': 0.0004930291570850536, 'samples': 2525184, 'steps': 13151, 'loss/train': 1.576635479927063} -11/06/2021 23:03:54 - INFO - __main__ - Step 13153: {'lr': 0.0004930279126099433, 'samples': 2525376, 'steps': 13152, 'loss/train': 1.0832215547561646} -11/06/2021 23:03:54 - INFO - __main__ - Step 13154: {'lr': 0.0004930266680253284, 'samples': 2525568, 'steps': 13153, 'loss/train': 1.7394440174102783} -11/06/2021 23:03:55 - INFO - __main__ - Step 13155: {'lr': 0.0004930254233312095, 'samples': 2525760, 'steps': 13154, 'loss/train': 1.2529510259628296} -11/06/2021 23:03:56 - INFO - __main__ - Step 13156: {'lr': 0.000493024178527587, 'samples': 2525952, 'steps': 13155, 'loss/train': 2.2869997024536133} -11/06/2021 23:03:56 - INFO - __main__ - Step 13157: {'lr': 0.0004930229336144616, 'samples': 2526144, 'steps': 13156, 'loss/train': 1.7819799184799194} -11/06/2021 23:03:56 - INFO - __main__ - Step 13158: {'lr': 0.0004930216885918339, 'samples': 2526336, 'steps': 13157, 'loss/train': 1.7473498582839966} -11/06/2021 23:03:57 - INFO - __main__ - Step 13159: {'lr': 0.0004930204434597042, 'samples': 2526528, 'steps': 13158, 'loss/train': 1.48399019241333} -11/06/2021 23:03:57 - INFO - __main__ - Step 13160: {'lr': 0.0004930191982180734, 'samples': 2526720, 'steps': 13159, 'loss/train': 1.5737640857696533} -11/06/2021 23:03:58 - INFO - __main__ - Step 13161: {'lr': 0.0004930179528669418, 'samples': 2526912, 'steps': 13160, 'loss/train': 2.018446683883667} -11/06/2021 23:03:59 - INFO - __main__ - Step 13162: {'lr': 0.0004930167074063101, 'samples': 2527104, 'steps': 13161, 'loss/train': 1.7737540006637573} -11/06/2021 23:03:59 - INFO - __main__ - Step 13163: {'lr': 0.0004930154618361789, 'samples': 2527296, 'steps': 13162, 'loss/train': 1.867935299873352} -11/06/2021 23:03:59 - INFO - __main__ - Step 13164: {'lr': 0.0004930142161565486, 'samples': 2527488, 'steps': 13163, 'loss/train': 2.0381977558135986} -11/06/2021 23:04:00 - INFO - __main__ - Step 13165: {'lr': 0.0004930129703674198, 'samples': 2527680, 'steps': 13164, 'loss/train': 1.8840910196304321} -11/06/2021 23:04:01 - INFO - __main__ - Step 13166: {'lr': 0.0004930117244687931, 'samples': 2527872, 'steps': 13165, 'loss/train': 1.4074156284332275} -11/06/2021 23:04:01 - INFO - __main__ - Step 13167: {'lr': 0.0004930104784606692, 'samples': 2528064, 'steps': 13166, 'loss/train': 2.063450813293457} -11/06/2021 23:04:01 - INFO - __main__ - Step 13168: {'lr': 0.0004930092323430484, 'samples': 2528256, 'steps': 13167, 'loss/train': 2.0765469074249268} -11/06/2021 23:04:02 - INFO - __main__ - Step 13169: {'lr': 0.0004930079861159315, 'samples': 2528448, 'steps': 13168, 'loss/train': 1.3868030309677124} -11/06/2021 23:04:02 - INFO - __main__ - Step 13170: {'lr': 0.0004930067397793188, 'samples': 2528640, 'steps': 13169, 'loss/train': 1.732783317565918} -11/06/2021 23:04:03 - INFO - __main__ - Step 13171: {'lr': 0.0004930054933332111, 'samples': 2528832, 'steps': 13170, 'loss/train': 1.683578610420227} -11/06/2021 23:04:03 - INFO - __main__ - Step 13172: {'lr': 0.0004930042467776089, 'samples': 2529024, 'steps': 13171, 'loss/train': 1.720359206199646} -11/06/2021 23:04:04 - INFO - __main__ - Step 13173: {'lr': 0.0004930030001125128, 'samples': 2529216, 'steps': 13172, 'loss/train': 1.2218900918960571} -11/06/2021 23:04:04 - INFO - __main__ - Step 13174: {'lr': 0.000493001753337923, 'samples': 2529408, 'steps': 13173, 'loss/train': 1.542048692703247} -11/06/2021 23:04:04 - INFO - __main__ - Step 13175: {'lr': 0.0004930005064538406, 'samples': 2529600, 'steps': 13174, 'loss/train': 1.7872868776321411} -11/06/2021 23:04:05 - INFO - __main__ - Step 13176: {'lr': 0.0004929992594602659, 'samples': 2529792, 'steps': 13175, 'loss/train': 1.104972243309021} -11/06/2021 23:04:06 - INFO - __main__ - Step 13177: {'lr': 0.0004929980123571995, 'samples': 2529984, 'steps': 13176, 'loss/train': 1.122475504875183} -11/06/2021 23:04:06 - INFO - __main__ - Step 13178: {'lr': 0.000492996765144642, 'samples': 2530176, 'steps': 13177, 'loss/train': 1.7249083518981934} -11/06/2021 23:04:07 - INFO - __main__ - Step 13179: {'lr': 0.0004929955178225938, 'samples': 2530368, 'steps': 13178, 'loss/train': 1.1565667390823364} -11/06/2021 23:04:07 - INFO - __main__ - Step 13180: {'lr': 0.0004929942703910556, 'samples': 2530560, 'steps': 13179, 'loss/train': 2.3176705837249756} -11/06/2021 23:04:07 - INFO - __main__ - Step 13181: {'lr': 0.0004929930228500279, 'samples': 2530752, 'steps': 13180, 'loss/train': 1.5887360572814941} -11/06/2021 23:04:09 - INFO - __main__ - Step 13182: {'lr': 0.0004929917751995114, 'samples': 2530944, 'steps': 13181, 'loss/train': 1.8893414735794067} -11/06/2021 23:04:09 - INFO - __main__ - Step 13183: {'lr': 0.0004929905274395064, 'samples': 2531136, 'steps': 13182, 'loss/train': 1.7040241956710815} -11/06/2021 23:04:09 - INFO - __main__ - Step 13184: {'lr': 0.0004929892795700137, 'samples': 2531328, 'steps': 13183, 'loss/train': 1.8834102153778076} -11/06/2021 23:04:10 - INFO - __main__ - Step 13185: {'lr': 0.0004929880315910338, 'samples': 2531520, 'steps': 13184, 'loss/train': 0.39340120553970337} -11/06/2021 23:04:10 - INFO - __main__ - Step 13186: {'lr': 0.0004929867835025672, 'samples': 2531712, 'steps': 13185, 'loss/train': 0.29085573554039} -11/06/2021 23:04:10 - INFO - __main__ - Step 13187: {'lr': 0.0004929855353046145, 'samples': 2531904, 'steps': 13186, 'loss/train': 1.7704241275787354} -11/06/2021 23:04:11 - INFO - __main__ - Step 13188: {'lr': 0.0004929842869971763, 'samples': 2532096, 'steps': 13187, 'loss/train': 1.63791024684906} -11/06/2021 23:04:12 - INFO - __main__ - Step 13189: {'lr': 0.000492983038580253, 'samples': 2532288, 'steps': 13188, 'loss/train': 0.9975517392158508} -11/06/2021 23:04:12 - INFO - __main__ - Step 13190: {'lr': 0.0004929817900538455, 'samples': 2532480, 'steps': 13189, 'loss/train': 1.4178115129470825} -11/06/2021 23:04:12 - INFO - __main__ - Step 13191: {'lr': 0.000492980541417954, 'samples': 2532672, 'steps': 13190, 'loss/train': 1.3342525959014893} -11/06/2021 23:04:13 - INFO - __main__ - Step 13192: {'lr': 0.0004929792926725794, 'samples': 2532864, 'steps': 13191, 'loss/train': 1.589043140411377} -11/06/2021 23:04:14 - INFO - __main__ - Step 13193: {'lr': 0.000492978043817722, 'samples': 2533056, 'steps': 13192, 'loss/train': 1.7581723928451538} -11/06/2021 23:04:14 - INFO - __main__ - Step 13194: {'lr': 0.0004929767948533823, 'samples': 2533248, 'steps': 13193, 'loss/train': 1.6882779598236084} -11/06/2021 23:04:15 - INFO - __main__ - Step 13195: {'lr': 0.0004929755457795612, 'samples': 2533440, 'steps': 13194, 'loss/train': 1.444657802581787} -11/06/2021 23:04:15 - INFO - __main__ - Step 13196: {'lr': 0.0004929742965962589, 'samples': 2533632, 'steps': 13195, 'loss/train': 1.9157907962799072} -11/06/2021 23:04:15 - INFO - __main__ - Step 13197: {'lr': 0.0004929730473034763, 'samples': 2533824, 'steps': 13196, 'loss/train': 1.561155915260315} -11/06/2021 23:04:16 - INFO - __main__ - Step 13198: {'lr': 0.0004929717979012136, 'samples': 2534016, 'steps': 13197, 'loss/train': 1.3841657638549805} -11/06/2021 23:04:17 - INFO - __main__ - Step 13199: {'lr': 0.0004929705483894717, 'samples': 2534208, 'steps': 13198, 'loss/train': 1.5719326734542847} -11/06/2021 23:04:17 - INFO - __main__ - Step 13200: {'lr': 0.000492969298768251, 'samples': 2534400, 'steps': 13199, 'loss/train': 1.4586410522460938} -11/06/2021 23:04:17 - INFO - __main__ - Step 13201: {'lr': 0.000492968049037552, 'samples': 2534592, 'steps': 13200, 'loss/train': 1.2632533311843872} -11/06/2021 23:04:18 - INFO - __main__ - Step 13202: {'lr': 0.0004929667991973754, 'samples': 2534784, 'steps': 13201, 'loss/train': 1.835030436515808} -11/06/2021 23:04:19 - INFO - __main__ - Step 13203: {'lr': 0.0004929655492477218, 'samples': 2534976, 'steps': 13202, 'loss/train': 2.025620937347412} -11/06/2021 23:04:19 - INFO - __main__ - Step 13204: {'lr': 0.0004929642991885916, 'samples': 2535168, 'steps': 13203, 'loss/train': 1.8089247941970825} -11/06/2021 23:04:20 - INFO - __main__ - Step 13205: {'lr': 0.0004929630490199854, 'samples': 2535360, 'steps': 13204, 'loss/train': 1.419128656387329} -11/06/2021 23:04:20 - INFO - __main__ - Step 13206: {'lr': 0.0004929617987419039, 'samples': 2535552, 'steps': 13205, 'loss/train': 1.9509419202804565} -11/06/2021 23:04:20 - INFO - __main__ - Step 13207: {'lr': 0.0004929605483543474, 'samples': 2535744, 'steps': 13206, 'loss/train': 1.7414957284927368} -11/06/2021 23:04:21 - INFO - __main__ - Step 13208: {'lr': 0.0004929592978573168, 'samples': 2535936, 'steps': 13207, 'loss/train': 1.3497000932693481} -11/06/2021 23:04:22 - INFO - __main__ - Step 13209: {'lr': 0.0004929580472508124, 'samples': 2536128, 'steps': 13208, 'loss/train': 1.4849274158477783} -11/06/2021 23:04:22 - INFO - __main__ - Step 13210: {'lr': 0.0004929567965348347, 'samples': 2536320, 'steps': 13209, 'loss/train': 1.7661024332046509} -11/06/2021 23:04:22 - INFO - __main__ - Step 13211: {'lr': 0.0004929555457093847, 'samples': 2536512, 'steps': 13210, 'loss/train': 1.7493226528167725} -11/06/2021 23:04:23 - INFO - __main__ - Step 13212: {'lr': 0.0004929542947744625, 'samples': 2536704, 'steps': 13211, 'loss/train': 1.1652683019638062} -11/06/2021 23:04:23 - INFO - __main__ - Step 13213: {'lr': 0.0004929530437300689, 'samples': 2536896, 'steps': 13212, 'loss/train': 1.901105284690857} -11/06/2021 23:04:24 - INFO - __main__ - Step 13214: {'lr': 0.0004929517925762045, 'samples': 2537088, 'steps': 13213, 'loss/train': 1.7152559757232666} -11/06/2021 23:04:24 - INFO - __main__ - Step 13215: {'lr': 0.0004929505413128696, 'samples': 2537280, 'steps': 13214, 'loss/train': 1.5080220699310303} -11/06/2021 23:04:25 - INFO - __main__ - Step 13216: {'lr': 0.000492949289940065, 'samples': 2537472, 'steps': 13215, 'loss/train': 1.7063556909561157} -11/06/2021 23:04:25 - INFO - __main__ - Step 13217: {'lr': 0.0004929480384577912, 'samples': 2537664, 'steps': 13216, 'loss/train': 1.8721396923065186} -11/06/2021 23:04:25 - INFO - __main__ - Step 13218: {'lr': 0.0004929467868660487, 'samples': 2537856, 'steps': 13217, 'loss/train': 1.3065961599349976} -11/06/2021 23:04:27 - INFO - __main__ - Step 13219: {'lr': 0.0004929455351648383, 'samples': 2538048, 'steps': 13218, 'loss/train': 1.533849835395813} -11/06/2021 23:04:27 - INFO - __main__ - Step 13220: {'lr': 0.0004929442833541603, 'samples': 2538240, 'steps': 13219, 'loss/train': 1.7814805507659912} -11/06/2021 23:04:27 - INFO - __main__ - Step 13221: {'lr': 0.0004929430314340154, 'samples': 2538432, 'steps': 13220, 'loss/train': 1.5206717252731323} -11/06/2021 23:04:28 - INFO - __main__ - Step 13222: {'lr': 0.000492941779404404, 'samples': 2538624, 'steps': 13221, 'loss/train': 1.3217058181762695} -11/06/2021 23:04:28 - INFO - __main__ - Step 13223: {'lr': 0.0004929405272653269, 'samples': 2538816, 'steps': 13222, 'loss/train': 1.758650302886963} -11/06/2021 23:04:29 - INFO - __main__ - Step 13224: {'lr': 0.0004929392750167845, 'samples': 2539008, 'steps': 13223, 'loss/train': 0.7512359023094177} -11/06/2021 23:04:29 - INFO - __main__ - Step 13225: {'lr': 0.0004929380226587774, 'samples': 2539200, 'steps': 13224, 'loss/train': 1.9796491861343384} -11/06/2021 23:04:30 - INFO - __main__ - Step 13226: {'lr': 0.0004929367701913062, 'samples': 2539392, 'steps': 13225, 'loss/train': 0.7901928424835205} -11/06/2021 23:04:30 - INFO - __main__ - Step 13227: {'lr': 0.0004929355176143714, 'samples': 2539584, 'steps': 13226, 'loss/train': 1.6296266317367554} -11/06/2021 23:04:30 - INFO - __main__ - Step 13228: {'lr': 0.0004929342649279736, 'samples': 2539776, 'steps': 13227, 'loss/train': 2.2642016410827637} -11/06/2021 23:04:31 - INFO - __main__ - Step 13229: {'lr': 0.0004929330121321134, 'samples': 2539968, 'steps': 13228, 'loss/train': 1.9576764106750488} -11/06/2021 23:04:32 - INFO - __main__ - Step 13230: {'lr': 0.0004929317592267913, 'samples': 2540160, 'steps': 13229, 'loss/train': 1.3771681785583496} -11/06/2021 23:04:32 - INFO - __main__ - Step 13231: {'lr': 0.000492930506212008, 'samples': 2540352, 'steps': 13230, 'loss/train': 1.4580309391021729} -11/06/2021 23:04:32 - INFO - __main__ - Step 13232: {'lr': 0.0004929292530877638, 'samples': 2540544, 'steps': 13231, 'loss/train': 1.5122207403182983} -11/06/2021 23:04:33 - INFO - __main__ - Step 13233: {'lr': 0.0004929279998540596, 'samples': 2540736, 'steps': 13232, 'loss/train': 1.770660400390625} -11/06/2021 23:04:34 - INFO - __main__ - Step 13234: {'lr': 0.0004929267465108956, 'samples': 2540928, 'steps': 13233, 'loss/train': 0.6602691411972046} -11/06/2021 23:04:34 - INFO - __main__ - Step 13235: {'lr': 0.0004929254930582728, 'samples': 2541120, 'steps': 13234, 'loss/train': 1.746626853942871} -11/06/2021 23:04:35 - INFO - __main__ - Step 13236: {'lr': 0.0004929242394961914, 'samples': 2541312, 'steps': 13235, 'loss/train': 1.5053402185440063} -11/06/2021 23:04:35 - INFO - __main__ - Step 13237: {'lr': 0.000492922985824652, 'samples': 2541504, 'steps': 13236, 'loss/train': 1.3967210054397583} -11/06/2021 23:04:35 - INFO - __main__ - Step 13238: {'lr': 0.0004929217320436553, 'samples': 2541696, 'steps': 13237, 'loss/train': 1.8607147932052612} -11/06/2021 23:04:36 - INFO - __main__ - Step 13239: {'lr': 0.0004929204781532018, 'samples': 2541888, 'steps': 13238, 'loss/train': 1.915743112564087} -11/06/2021 23:04:37 - INFO - __main__ - Step 13240: {'lr': 0.0004929192241532921, 'samples': 2542080, 'steps': 13239, 'loss/train': 1.5825774669647217} -11/06/2021 23:04:37 - INFO - __main__ - Step 13241: {'lr': 0.0004929179700439269, 'samples': 2542272, 'steps': 13240, 'loss/train': 0.8731245994567871} -11/06/2021 23:04:37 - INFO - __main__ - Step 13242: {'lr': 0.0004929167158251065, 'samples': 2542464, 'steps': 13241, 'loss/train': 1.7549324035644531} -11/06/2021 23:04:38 - INFO - __main__ - Step 13243: {'lr': 0.0004929154614968315, 'samples': 2542656, 'steps': 13242, 'loss/train': 0.5492236614227295} -11/06/2021 23:04:39 - INFO - __main__ - Step 13244: {'lr': 0.0004929142070591026, 'samples': 2542848, 'steps': 13243, 'loss/train': 1.614729404449463} -11/06/2021 23:04:39 - INFO - __main__ - Step 13245: {'lr': 0.0004929129525119203, 'samples': 2543040, 'steps': 13244, 'loss/train': 1.537818193435669} -11/06/2021 23:04:40 - INFO - __main__ - Step 13246: {'lr': 0.0004929116978552851, 'samples': 2543232, 'steps': 13245, 'loss/train': 1.7951061725616455} -11/06/2021 23:04:40 - INFO - __main__ - Step 13247: {'lr': 0.0004929104430891978, 'samples': 2543424, 'steps': 13246, 'loss/train': 1.5061917304992676} -11/06/2021 23:04:40 - INFO - __main__ - Step 13248: {'lr': 0.0004929091882136587, 'samples': 2543616, 'steps': 13247, 'loss/train': 1.6849573850631714} -11/06/2021 23:04:41 - INFO - __main__ - Step 13249: {'lr': 0.0004929079332286685, 'samples': 2543808, 'steps': 13248, 'loss/train': 1.7223663330078125} -11/06/2021 23:04:42 - INFO - __main__ - Step 13250: {'lr': 0.0004929066781342277, 'samples': 2544000, 'steps': 13249, 'loss/train': 1.109410285949707} -11/06/2021 23:04:42 - INFO - __main__ - Step 13251: {'lr': 0.0004929054229303369, 'samples': 2544192, 'steps': 13250, 'loss/train': 1.5786045789718628} -11/06/2021 23:04:42 - INFO - __main__ - Step 13252: {'lr': 0.0004929041676169967, 'samples': 2544384, 'steps': 13251, 'loss/train': 1.4510022401809692} -11/06/2021 23:04:43 - INFO - __main__ - Step 13253: {'lr': 0.0004929029121942077, 'samples': 2544576, 'steps': 13252, 'loss/train': 1.5690830945968628} -11/06/2021 23:04:43 - INFO - __main__ - Step 13254: {'lr': 0.0004929016566619703, 'samples': 2544768, 'steps': 13253, 'loss/train': 1.475024938583374} -11/06/2021 23:04:44 - INFO - __main__ - Step 13255: {'lr': 0.0004929004010202851, 'samples': 2544960, 'steps': 13254, 'loss/train': 1.462422490119934} -11/06/2021 23:04:44 - INFO - __main__ - Step 13256: {'lr': 0.0004928991452691528, 'samples': 2545152, 'steps': 13255, 'loss/train': 1.8692861795425415} -11/06/2021 23:04:45 - INFO - __main__ - Step 13257: {'lr': 0.0004928978894085739, 'samples': 2545344, 'steps': 13256, 'loss/train': 1.8582710027694702} -11/06/2021 23:04:45 - INFO - __main__ - Step 13258: {'lr': 0.000492896633438549, 'samples': 2545536, 'steps': 13257, 'loss/train': 2.016894578933716} -11/06/2021 23:04:46 - INFO - __main__ - Step 13259: {'lr': 0.0004928953773590785, 'samples': 2545728, 'steps': 13258, 'loss/train': 1.6744557619094849} -11/06/2021 23:04:47 - INFO - __main__ - Step 13260: {'lr': 0.0004928941211701632, 'samples': 2545920, 'steps': 13259, 'loss/train': 0.2616555988788605} -11/06/2021 23:04:47 - INFO - __main__ - Step 13261: {'lr': 0.0004928928648718035, 'samples': 2546112, 'steps': 13260, 'loss/train': 1.6083446741104126} -11/06/2021 23:04:47 - INFO - __main__ - Step 13262: {'lr': 0.0004928916084640001, 'samples': 2546304, 'steps': 13261, 'loss/train': 1.1888530254364014} -11/06/2021 23:04:48 - INFO - __main__ - Step 13263: {'lr': 0.0004928903519467534, 'samples': 2546496, 'steps': 13262, 'loss/train': 2.4009814262390137} -11/06/2021 23:04:48 - INFO - __main__ - Step 13264: {'lr': 0.0004928890953200641, 'samples': 2546688, 'steps': 13263, 'loss/train': 1.301665186882019} -11/06/2021 23:04:49 - INFO - __main__ - Step 13265: {'lr': 0.0004928878385839327, 'samples': 2546880, 'steps': 13264, 'loss/train': 1.293091058731079} -11/06/2021 23:04:49 - INFO - __main__ - Step 13266: {'lr': 0.0004928865817383597, 'samples': 2547072, 'steps': 13265, 'loss/train': 1.251847267150879} -11/06/2021 23:04:50 - INFO - __main__ - Step 13267: {'lr': 0.0004928853247833459, 'samples': 2547264, 'steps': 13266, 'loss/train': 1.894822120666504} -11/06/2021 23:04:50 - INFO - __main__ - Step 13268: {'lr': 0.0004928840677188918, 'samples': 2547456, 'steps': 13267, 'loss/train': 1.5503804683685303} -11/06/2021 23:04:50 - INFO - __main__ - Step 13269: {'lr': 0.0004928828105449977, 'samples': 2547648, 'steps': 13268, 'loss/train': 1.885050892829895} -11/06/2021 23:04:52 - INFO - __main__ - Step 13270: {'lr': 0.0004928815532616644, 'samples': 2547840, 'steps': 13269, 'loss/train': 1.5068950653076172} -11/06/2021 23:04:52 - INFO - __main__ - Step 13271: {'lr': 0.0004928802958688924, 'samples': 2548032, 'steps': 13270, 'loss/train': 1.590198040008545} -11/06/2021 23:04:52 - INFO - __main__ - Step 13272: {'lr': 0.0004928790383666823, 'samples': 2548224, 'steps': 13271, 'loss/train': 1.786717176437378} -11/06/2021 23:04:53 - INFO - __main__ - Step 13273: {'lr': 0.0004928777807550348, 'samples': 2548416, 'steps': 13272, 'loss/train': 1.5326136350631714} -11/06/2021 23:04:53 - INFO - __main__ - Step 13274: {'lr': 0.0004928765230339502, 'samples': 2548608, 'steps': 13273, 'loss/train': 2.4051101207733154} -11/06/2021 23:04:54 - INFO - __main__ - Step 13275: {'lr': 0.000492875265203429, 'samples': 2548800, 'steps': 13274, 'loss/train': 2.304696559906006} -11/06/2021 23:04:54 - INFO - __main__ - Step 13276: {'lr': 0.0004928740072634722, 'samples': 2548992, 'steps': 13275, 'loss/train': 2.0685250759124756} -11/06/2021 23:04:55 - INFO - __main__ - Step 13277: {'lr': 0.0004928727492140801, 'samples': 2549184, 'steps': 13276, 'loss/train': 1.733903408050537} -11/06/2021 23:04:55 - INFO - __main__ - Step 13278: {'lr': 0.0004928714910552533, 'samples': 2549376, 'steps': 13277, 'loss/train': 1.8066354990005493} -11/06/2021 23:04:55 - INFO - __main__ - Step 13279: {'lr': 0.0004928702327869922, 'samples': 2549568, 'steps': 13278, 'loss/train': 1.9759420156478882} -11/06/2021 23:04:56 - INFO - __main__ - Step 13280: {'lr': 0.0004928689744092976, 'samples': 2549760, 'steps': 13279, 'loss/train': 1.8017091751098633} -11/06/2021 23:04:57 - INFO - __main__ - Step 13281: {'lr': 0.0004928677159221701, 'samples': 2549952, 'steps': 13280, 'loss/train': 1.4251042604446411} -11/06/2021 23:04:57 - INFO - __main__ - Step 13282: {'lr': 0.00049286645732561, 'samples': 2550144, 'steps': 13281, 'loss/train': 1.3295786380767822} -11/06/2021 23:04:57 - INFO - __main__ - Step 13283: {'lr': 0.0004928651986196181, 'samples': 2550336, 'steps': 13282, 'loss/train': 1.1968010663986206} -11/06/2021 23:04:58 - INFO - __main__ - Step 13284: {'lr': 0.0004928639398041948, 'samples': 2550528, 'steps': 13283, 'loss/train': 1.974739670753479} -11/06/2021 23:04:59 - INFO - __main__ - Step 13285: {'lr': 0.0004928626808793409, 'samples': 2550720, 'steps': 13284, 'loss/train': 1.5590357780456543} -11/06/2021 23:04:59 - INFO - __main__ - Step 13286: {'lr': 0.0004928614218450568, 'samples': 2550912, 'steps': 13285, 'loss/train': 1.4196864366531372} -11/06/2021 23:05:00 - INFO - __main__ - Step 13287: {'lr': 0.000492860162701343, 'samples': 2551104, 'steps': 13286, 'loss/train': 1.4201176166534424} -11/06/2021 23:05:00 - INFO - __main__ - Step 13288: {'lr': 0.0004928589034482001, 'samples': 2551296, 'steps': 13287, 'loss/train': 1.8625463247299194} -11/06/2021 23:05:00 - INFO - __main__ - Step 13289: {'lr': 0.000492857644085629, 'samples': 2551488, 'steps': 13288, 'loss/train': 1.8042540550231934} -11/06/2021 23:05:01 - INFO - __main__ - Step 13290: {'lr': 0.0004928563846136296, 'samples': 2551680, 'steps': 13289, 'loss/train': 1.6024283170700073} -11/06/2021 23:05:02 - INFO - __main__ - Step 13291: {'lr': 0.0004928551250322032, 'samples': 2551872, 'steps': 13290, 'loss/train': 1.5354256629943848} -11/06/2021 23:05:02 - INFO - __main__ - Step 13292: {'lr': 0.0004928538653413499, 'samples': 2552064, 'steps': 13291, 'loss/train': 2.1231536865234375} -11/06/2021 23:05:02 - INFO - __main__ - Step 13293: {'lr': 0.0004928526055410704, 'samples': 2552256, 'steps': 13292, 'loss/train': 1.7034943103790283} -11/06/2021 23:05:03 - INFO - __main__ - Step 13294: {'lr': 0.0004928513456313653, 'samples': 2552448, 'steps': 13293, 'loss/train': 1.6685292720794678} -11/06/2021 23:05:03 - INFO - __main__ - Step 13295: {'lr': 0.000492850085612235, 'samples': 2552640, 'steps': 13294, 'loss/train': 1.6578960418701172} -11/06/2021 23:05:04 - INFO - __main__ - Step 13296: {'lr': 0.0004928488254836804, 'samples': 2552832, 'steps': 13295, 'loss/train': 1.1260663270950317} -11/06/2021 23:05:04 - INFO - __main__ - Step 13297: {'lr': 0.0004928475652457017, 'samples': 2553024, 'steps': 13296, 'loss/train': 1.738349199295044} -11/06/2021 23:05:05 - INFO - __main__ - Step 13298: {'lr': 0.0004928463048982998, 'samples': 2553216, 'steps': 13297, 'loss/train': 1.6107333898544312} -11/06/2021 23:05:05 - INFO - __main__ - Step 13299: {'lr': 0.0004928450444414749, 'samples': 2553408, 'steps': 13298, 'loss/train': 2.0628111362457275} -11/06/2021 23:05:06 - INFO - __main__ - Step 13300: {'lr': 0.0004928437838752278, 'samples': 2553600, 'steps': 13299, 'loss/train': 1.5923441648483276} -11/06/2021 23:05:07 - INFO - __main__ - Step 13301: {'lr': 0.0004928425231995593, 'samples': 2553792, 'steps': 13300, 'loss/train': 1.7554380893707275} -11/06/2021 23:05:07 - INFO - __main__ - Step 13302: {'lr': 0.0004928412624144694, 'samples': 2553984, 'steps': 13301, 'loss/train': 1.8865063190460205} -11/06/2021 23:05:07 - INFO - __main__ - Step 13303: {'lr': 0.0004928400015199591, 'samples': 2554176, 'steps': 13302, 'loss/train': 1.7683358192443848} -11/06/2021 23:05:08 - INFO - __main__ - Step 13304: {'lr': 0.0004928387405160288, 'samples': 2554368, 'steps': 13303, 'loss/train': 1.6909922361373901} -11/06/2021 23:05:08 - INFO - __main__ - Step 13305: {'lr': 0.0004928374794026792, 'samples': 2554560, 'steps': 13304, 'loss/train': 1.3994184732437134} -11/06/2021 23:05:09 - INFO - __main__ - Step 13306: {'lr': 0.0004928362181799107, 'samples': 2554752, 'steps': 13305, 'loss/train': 1.705430030822754} -11/06/2021 23:05:09 - INFO - __main__ - Step 13307: {'lr': 0.0004928349568477239, 'samples': 2554944, 'steps': 13306, 'loss/train': 1.6792200803756714} -11/06/2021 23:05:10 - INFO - __main__ - Step 13308: {'lr': 0.0004928336954061195, 'samples': 2555136, 'steps': 13307, 'loss/train': 1.2497096061706543} -11/06/2021 23:05:10 - INFO - __main__ - Step 13309: {'lr': 0.000492832433855098, 'samples': 2555328, 'steps': 13308, 'loss/train': 1.3893240690231323} -11/06/2021 23:05:10 - INFO - __main__ - Step 13310: {'lr': 0.0004928311721946599, 'samples': 2555520, 'steps': 13309, 'loss/train': 1.5529297590255737} -11/06/2021 23:05:11 - INFO - __main__ - Step 13311: {'lr': 0.0004928299104248059, 'samples': 2555712, 'steps': 13310, 'loss/train': 1.6530280113220215} -11/06/2021 23:05:12 - INFO - __main__ - Step 13312: {'lr': 0.0004928286485455365, 'samples': 2555904, 'steps': 13311, 'loss/train': 1.1228559017181396} -11/06/2021 23:05:12 - INFO - __main__ - Step 13313: {'lr': 0.0004928273865568521, 'samples': 2556096, 'steps': 13312, 'loss/train': 1.5058236122131348} -11/06/2021 23:05:13 - INFO - __main__ - Step 13314: {'lr': 0.0004928261244587536, 'samples': 2556288, 'steps': 13313, 'loss/train': 1.8624576330184937} -11/06/2021 23:05:13 - INFO - __main__ - Step 13315: {'lr': 0.0004928248622512412, 'samples': 2556480, 'steps': 13314, 'loss/train': 1.4049829244613647} -11/06/2021 23:05:14 - INFO - __main__ - Step 13316: {'lr': 0.0004928235999343159, 'samples': 2556672, 'steps': 13315, 'loss/train': 1.9419476985931396} -11/06/2021 23:05:14 - INFO - __main__ - Step 13317: {'lr': 0.0004928223375079778, 'samples': 2556864, 'steps': 13316, 'loss/train': 1.7618058919906616} -11/06/2021 23:05:14 - INFO - __main__ - Step 13318: {'lr': 0.0004928210749722278, 'samples': 2557056, 'steps': 13317, 'loss/train': 1.606778621673584} -11/06/2021 23:05:15 - INFO - __main__ - Step 13319: {'lr': 0.0004928198123270664, 'samples': 2557248, 'steps': 13318, 'loss/train': 1.5688247680664062} -11/06/2021 23:05:15 - INFO - __main__ - Step 13320: {'lr': 0.0004928185495724942, 'samples': 2557440, 'steps': 13319, 'loss/train': 1.9147883653640747} -11/06/2021 23:05:16 - INFO - __main__ - Step 13321: {'lr': 0.0004928172867085115, 'samples': 2557632, 'steps': 13320, 'loss/train': 1.3374717235565186} -11/06/2021 23:05:17 - INFO - __main__ - Step 13322: {'lr': 0.0004928160237351192, 'samples': 2557824, 'steps': 13321, 'loss/train': 1.7408499717712402} -11/06/2021 23:05:17 - INFO - __main__ - Step 13323: {'lr': 0.0004928147606523179, 'samples': 2558016, 'steps': 13322, 'loss/train': 1.20220947265625} -11/06/2021 23:05:17 - INFO - __main__ - Step 13324: {'lr': 0.0004928134974601078, 'samples': 2558208, 'steps': 13323, 'loss/train': 1.730553388595581} -11/06/2021 23:05:18 - INFO - __main__ - Step 13325: {'lr': 0.0004928122341584897, 'samples': 2558400, 'steps': 13324, 'loss/train': 1.704958200454712} -11/06/2021 23:05:18 - INFO - __main__ - Step 13326: {'lr': 0.0004928109707474643, 'samples': 2558592, 'steps': 13325, 'loss/train': 1.6393741369247437} -11/06/2021 23:05:19 - INFO - __main__ - Step 13327: {'lr': 0.0004928097072270319, 'samples': 2558784, 'steps': 13326, 'loss/train': 1.696864366531372} -11/06/2021 23:05:19 - INFO - __main__ - Step 13328: {'lr': 0.0004928084435971932, 'samples': 2558976, 'steps': 13327, 'loss/train': 1.6887147426605225} -11/06/2021 23:05:20 - INFO - __main__ - Step 13329: {'lr': 0.0004928071798579488, 'samples': 2559168, 'steps': 13328, 'loss/train': 1.7880932092666626} -11/06/2021 23:05:20 - INFO - __main__ - Step 13330: {'lr': 0.0004928059160092993, 'samples': 2559360, 'steps': 13329, 'loss/train': 1.7646552324295044} -11/06/2021 23:05:20 - INFO - __main__ - Step 13331: {'lr': 0.000492804652051245, 'samples': 2559552, 'steps': 13330, 'loss/train': 1.588904857635498} -11/06/2021 23:05:22 - INFO - __main__ - Step 13332: {'lr': 0.0004928033879837868, 'samples': 2559744, 'steps': 13331, 'loss/train': 1.295880675315857} -11/06/2021 23:05:22 - INFO - __main__ - Step 13333: {'lr': 0.0004928021238069251, 'samples': 2559936, 'steps': 13332, 'loss/train': 1.5167969465255737} -11/06/2021 23:05:22 - INFO - __main__ - Step 13334: {'lr': 0.0004928008595206605, 'samples': 2560128, 'steps': 13333, 'loss/train': 0.6749269366264343} -11/06/2021 23:05:23 - INFO - __main__ - Step 13335: {'lr': 0.0004927995951249937, 'samples': 2560320, 'steps': 13334, 'loss/train': 1.3417226076126099} -11/06/2021 23:05:23 - INFO - __main__ - Step 13336: {'lr': 0.0004927983306199251, 'samples': 2560512, 'steps': 13335, 'loss/train': 0.18615388870239258} -11/06/2021 23:05:24 - INFO - __main__ - Step 13337: {'lr': 0.0004927970660054552, 'samples': 2560704, 'steps': 13336, 'loss/train': 1.5057356357574463} -11/06/2021 23:05:25 - INFO - __main__ - Step 13338: {'lr': 0.0004927958012815849, 'samples': 2560896, 'steps': 13337, 'loss/train': 1.761964201927185} -11/06/2021 23:05:25 - INFO - __main__ - Step 13339: {'lr': 0.0004927945364483144, 'samples': 2561088, 'steps': 13338, 'loss/train': 1.5232926607131958} -11/06/2021 23:05:25 - INFO - __main__ - Step 13340: {'lr': 0.0004927932715056444, 'samples': 2561280, 'steps': 13339, 'loss/train': 1.5843162536621094} -11/06/2021 23:05:26 - INFO - __main__ - Step 13341: {'lr': 0.0004927920064535756, 'samples': 2561472, 'steps': 13340, 'loss/train': 1.808425784111023} -11/06/2021 23:05:27 - INFO - __main__ - Step 13342: {'lr': 0.0004927907412921084, 'samples': 2561664, 'steps': 13341, 'loss/train': 1.7012680768966675} -11/06/2021 23:05:27 - INFO - __main__ - Step 13343: {'lr': 0.0004927894760212435, 'samples': 2561856, 'steps': 13342, 'loss/train': 1.866380214691162} -11/06/2021 23:05:27 - INFO - __main__ - Step 13344: {'lr': 0.0004927882106409813, 'samples': 2562048, 'steps': 13343, 'loss/train': 0.6757373213768005} -11/06/2021 23:05:28 - INFO - __main__ - Step 13345: {'lr': 0.0004927869451513226, 'samples': 2562240, 'steps': 13344, 'loss/train': 1.5792934894561768} -11/06/2021 23:05:28 - INFO - __main__ - Step 13346: {'lr': 0.0004927856795522678, 'samples': 2562432, 'steps': 13345, 'loss/train': 1.1496813297271729} -11/06/2021 23:05:29 - INFO - __main__ - Step 13347: {'lr': 0.0004927844138438175, 'samples': 2562624, 'steps': 13346, 'loss/train': 1.646971344947815} -11/06/2021 23:05:29 - INFO - __main__ - Step 13348: {'lr': 0.0004927831480259723, 'samples': 2562816, 'steps': 13347, 'loss/train': 1.720847725868225} -11/06/2021 23:05:30 - INFO - __main__ - Step 13349: {'lr': 0.0004927818820987328, 'samples': 2563008, 'steps': 13348, 'loss/train': 1.679519534111023} -11/06/2021 23:05:30 - INFO - __main__ - Step 13350: {'lr': 0.0004927806160620995, 'samples': 2563200, 'steps': 13349, 'loss/train': 2.182821750640869} -11/06/2021 23:05:30 - INFO - __main__ - Step 13351: {'lr': 0.0004927793499160729, 'samples': 2563392, 'steps': 13350, 'loss/train': 2.1079049110412598} -11/06/2021 23:05:31 - INFO - __main__ - Step 13352: {'lr': 0.000492778083660654, 'samples': 2563584, 'steps': 13351, 'loss/train': 1.3878504037857056} -11/06/2021 23:05:32 - INFO - __main__ - Step 13353: {'lr': 0.0004927768172958427, 'samples': 2563776, 'steps': 13352, 'loss/train': 1.9145451784133911} -11/06/2021 23:05:32 - INFO - __main__ - Step 13354: {'lr': 0.00049277555082164, 'samples': 2563968, 'steps': 13353, 'loss/train': 1.463181495666504} -11/06/2021 23:05:33 - INFO - __main__ - Step 13355: {'lr': 0.0004927742842380465, 'samples': 2564160, 'steps': 13354, 'loss/train': 2.1269948482513428} -11/06/2021 23:05:33 - INFO - __main__ - Step 13356: {'lr': 0.0004927730175450626, 'samples': 2564352, 'steps': 13355, 'loss/train': 1.5894335508346558} -11/06/2021 23:05:34 - INFO - __main__ - Step 13357: {'lr': 0.0004927717507426887, 'samples': 2564544, 'steps': 13356, 'loss/train': 1.5174648761749268} -11/06/2021 23:05:34 - INFO - __main__ - Step 13358: {'lr': 0.0004927704838309259, 'samples': 2564736, 'steps': 13357, 'loss/train': 1.6864207983016968} -11/06/2021 23:05:35 - INFO - __main__ - Step 13359: {'lr': 0.0004927692168097743, 'samples': 2564928, 'steps': 13358, 'loss/train': 1.3122807741165161} -11/06/2021 23:05:35 - INFO - __main__ - Step 13360: {'lr': 0.0004927679496792347, 'samples': 2565120, 'steps': 13359, 'loss/train': 1.738892674446106} -11/06/2021 23:05:35 - INFO - __main__ - Step 13361: {'lr': 0.0004927666824393076, 'samples': 2565312, 'steps': 13360, 'loss/train': 0.4052657186985016} -11/06/2021 23:05:36 - INFO - __main__ - Step 13362: {'lr': 0.0004927654150899937, 'samples': 2565504, 'steps': 13361, 'loss/train': 2.3916163444519043} -11/06/2021 23:05:37 - INFO - __main__ - Step 13363: {'lr': 0.0004927641476312932, 'samples': 2565696, 'steps': 13362, 'loss/train': 1.5969182252883911} -11/06/2021 23:05:37 - INFO - __main__ - Step 13364: {'lr': 0.000492762880063207, 'samples': 2565888, 'steps': 13363, 'loss/train': 1.332525610923767} -11/06/2021 23:05:37 - INFO - __main__ - Step 13365: {'lr': 0.0004927616123857357, 'samples': 2566080, 'steps': 13364, 'loss/train': 1.9494463205337524} -11/06/2021 23:05:38 - INFO - __main__ - Step 13366: {'lr': 0.0004927603445988797, 'samples': 2566272, 'steps': 13365, 'loss/train': 1.918675422668457} -11/06/2021 23:05:39 - INFO - __main__ - Step 13367: {'lr': 0.0004927590767026396, 'samples': 2566464, 'steps': 13366, 'loss/train': 2.5392587184906006} -11/06/2021 23:05:39 - INFO - __main__ - Step 13368: {'lr': 0.0004927578086970161, 'samples': 2566656, 'steps': 13367, 'loss/train': 1.7140586376190186} -11/06/2021 23:05:39 - INFO - __main__ - Step 13369: {'lr': 0.0004927565405820096, 'samples': 2566848, 'steps': 13368, 'loss/train': 1.7201263904571533} -11/06/2021 23:05:40 - INFO - __main__ - Step 13370: {'lr': 0.0004927552723576207, 'samples': 2567040, 'steps': 13369, 'loss/train': 1.939740777015686} -11/06/2021 23:05:40 - INFO - __main__ - Step 13371: {'lr': 0.0004927540040238501, 'samples': 2567232, 'steps': 13370, 'loss/train': 1.2085801362991333} -11/06/2021 23:05:41 - INFO - __main__ - Step 13372: {'lr': 0.0004927527355806983, 'samples': 2567424, 'steps': 13371, 'loss/train': 1.3057010173797607} -11/06/2021 23:05:41 - INFO - __main__ - Step 13373: {'lr': 0.0004927514670281659, 'samples': 2567616, 'steps': 13372, 'loss/train': 1.3879728317260742} -11/06/2021 23:05:42 - INFO - __main__ - Step 13374: {'lr': 0.0004927501983662534, 'samples': 2567808, 'steps': 13373, 'loss/train': 2.229905128479004} -11/06/2021 23:05:42 - INFO - __main__ - Step 13375: {'lr': 0.0004927489295949613, 'samples': 2568000, 'steps': 13374, 'loss/train': 1.403855562210083} -11/06/2021 23:05:43 - INFO - __main__ - Step 13376: {'lr': 0.0004927476607142904, 'samples': 2568192, 'steps': 13375, 'loss/train': 1.8529839515686035} -11/06/2021 23:05:44 - INFO - __main__ - Step 13377: {'lr': 0.0004927463917242411, 'samples': 2568384, 'steps': 13376, 'loss/train': 1.6956440210342407} -11/06/2021 23:05:44 - INFO - __main__ - Step 13378: {'lr': 0.0004927451226248141, 'samples': 2568576, 'steps': 13377, 'loss/train': 1.5961147546768188} -11/06/2021 23:05:44 - INFO - __main__ - Step 13379: {'lr': 0.0004927438534160098, 'samples': 2568768, 'steps': 13378, 'loss/train': 1.2757984399795532} -11/06/2021 23:05:45 - INFO - __main__ - Step 13380: {'lr': 0.0004927425840978289, 'samples': 2568960, 'steps': 13379, 'loss/train': 1.361778736114502} -11/06/2021 23:05:45 - INFO - __main__ - Step 13381: {'lr': 0.0004927413146702719, 'samples': 2569152, 'steps': 13380, 'loss/train': 1.2567278146743774} -11/06/2021 23:05:45 - INFO - __main__ - Step 13382: {'lr': 0.0004927400451333394, 'samples': 2569344, 'steps': 13381, 'loss/train': 1.9279859066009521} -11/06/2021 23:05:46 - INFO - __main__ - Step 13383: {'lr': 0.0004927387754870321, 'samples': 2569536, 'steps': 13382, 'loss/train': 0.35177692770957947} -11/06/2021 23:05:47 - INFO - __main__ - Step 13384: {'lr': 0.0004927375057313504, 'samples': 2569728, 'steps': 13383, 'loss/train': 2.1717875003814697} -11/06/2021 23:05:47 - INFO - __main__ - Step 13385: {'lr': 0.0004927362358662948, 'samples': 2569920, 'steps': 13384, 'loss/train': 1.7761980295181274} -11/06/2021 23:05:47 - INFO - __main__ - Step 13386: {'lr': 0.0004927349658918662, 'samples': 2570112, 'steps': 13385, 'loss/train': 1.3248966932296753} -11/06/2021 23:05:48 - INFO - __main__ - Step 13387: {'lr': 0.0004927336958080648, 'samples': 2570304, 'steps': 13386, 'loss/train': 1.88877272605896} -11/06/2021 23:05:49 - INFO - __main__ - Step 13388: {'lr': 0.0004927324256148914, 'samples': 2570496, 'steps': 13387, 'loss/train': 1.2974435091018677} -11/06/2021 23:05:49 - INFO - __main__ - Step 13389: {'lr': 0.0004927311553123465, 'samples': 2570688, 'steps': 13388, 'loss/train': 1.5624191761016846} -11/06/2021 23:05:50 - INFO - __main__ - Step 13390: {'lr': 0.0004927298849004307, 'samples': 2570880, 'steps': 13389, 'loss/train': 1.5980331897735596} -11/06/2021 23:05:50 - INFO - __main__ - Step 13391: {'lr': 0.0004927286143791447, 'samples': 2571072, 'steps': 13390, 'loss/train': 2.0183682441711426} -11/06/2021 23:05:50 - INFO - __main__ - Step 13392: {'lr': 0.0004927273437484888, 'samples': 2571264, 'steps': 13391, 'loss/train': 1.7328522205352783} -11/06/2021 23:05:51 - INFO - __main__ - Step 13393: {'lr': 0.0004927260730084636, 'samples': 2571456, 'steps': 13392, 'loss/train': 1.669248342514038} -11/06/2021 23:05:52 - INFO - __main__ - Step 13394: {'lr': 0.0004927248021590699, 'samples': 2571648, 'steps': 13393, 'loss/train': 2.133970022201538} -11/06/2021 23:05:52 - INFO - __main__ - Step 13395: {'lr': 0.0004927235312003082, 'samples': 2571840, 'steps': 13394, 'loss/train': 1.0649173259735107} -11/06/2021 23:05:52 - INFO - __main__ - Step 13396: {'lr': 0.0004927222601321789, 'samples': 2572032, 'steps': 13395, 'loss/train': 2.6536405086517334} -11/06/2021 23:05:53 - INFO - __main__ - Step 13397: {'lr': 0.0004927209889546828, 'samples': 2572224, 'steps': 13396, 'loss/train': 1.37748122215271} -11/06/2021 23:05:54 - INFO - __main__ - Step 13398: {'lr': 0.0004927197176678203, 'samples': 2572416, 'steps': 13397, 'loss/train': 1.8754839897155762} -11/06/2021 23:05:54 - INFO - __main__ - Step 13399: {'lr': 0.000492718446271592, 'samples': 2572608, 'steps': 13398, 'loss/train': 1.372225284576416} -11/06/2021 23:05:55 - INFO - __main__ - Step 13400: {'lr': 0.0004927171747659986, 'samples': 2572800, 'steps': 13399, 'loss/train': 1.8654577732086182} -11/06/2021 23:05:55 - INFO - __main__ - Step 13401: {'lr': 0.0004927159031510405, 'samples': 2572992, 'steps': 13400, 'loss/train': 0.6154890060424805} -11/06/2021 23:05:55 - INFO - __main__ - Step 13402: {'lr': 0.0004927146314267184, 'samples': 2573184, 'steps': 13401, 'loss/train': 1.4731422662734985} -11/06/2021 23:05:57 - INFO - __main__ - Step 13403: {'lr': 0.000492713359593033, 'samples': 2573376, 'steps': 13402, 'loss/train': 1.8210397958755493} -11/06/2021 23:05:57 - INFO - __main__ - Step 13404: {'lr': 0.0004927120876499846, 'samples': 2573568, 'steps': 13403, 'loss/train': 2.1863057613372803} -11/06/2021 23:05:57 - INFO - __main__ - Step 13405: {'lr': 0.0004927108155975738, 'samples': 2573760, 'steps': 13404, 'loss/train': 1.5386931896209717} -11/06/2021 23:05:58 - INFO - __main__ - Step 13406: {'lr': 0.0004927095434358012, 'samples': 2573952, 'steps': 13405, 'loss/train': 2.4172680377960205} -11/06/2021 23:05:58 - INFO - __main__ - Step 13407: {'lr': 0.0004927082711646676, 'samples': 2574144, 'steps': 13406, 'loss/train': 1.7488776445388794} -11/06/2021 23:05:58 - INFO - __main__ - Step 13408: {'lr': 0.0004927069987841733, 'samples': 2574336, 'steps': 13407, 'loss/train': 2.008625030517578} -11/06/2021 23:05:59 - INFO - __main__ - Step 13409: {'lr': 0.0004927057262943189, 'samples': 2574528, 'steps': 13408, 'loss/train': 1.6773982048034668} -11/06/2021 23:06:00 - INFO - __main__ - Step 13410: {'lr': 0.0004927044536951052, 'samples': 2574720, 'steps': 13409, 'loss/train': 2.1111257076263428} -11/06/2021 23:06:00 - INFO - __main__ - Step 13411: {'lr': 0.0004927031809865324, 'samples': 2574912, 'steps': 13410, 'loss/train': 1.8370585441589355} -11/06/2021 23:06:00 - INFO - __main__ - Step 13412: {'lr': 0.0004927019081686015, 'samples': 2575104, 'steps': 13411, 'loss/train': 1.4143866300582886} -11/06/2021 23:06:01 - INFO - __main__ - Step 13413: {'lr': 0.0004927006352413128, 'samples': 2575296, 'steps': 13412, 'loss/train': 1.1940877437591553} -11/06/2021 23:06:02 - INFO - __main__ - Step 13414: {'lr': 0.000492699362204667, 'samples': 2575488, 'steps': 13413, 'loss/train': 1.8130630254745483} -11/06/2021 23:06:02 - INFO - __main__ - Step 13415: {'lr': 0.0004926980890586645, 'samples': 2575680, 'steps': 13414, 'loss/train': 1.6337990760803223} -11/06/2021 23:06:02 - INFO - __main__ - Step 13416: {'lr': 0.000492696815803306, 'samples': 2575872, 'steps': 13415, 'loss/train': 1.7381833791732788} -11/06/2021 23:06:03 - INFO - __main__ - Step 13417: {'lr': 0.0004926955424385921, 'samples': 2576064, 'steps': 13416, 'loss/train': 1.8581897020339966} -11/06/2021 23:06:03 - INFO - __main__ - Step 13418: {'lr': 0.0004926942689645234, 'samples': 2576256, 'steps': 13417, 'loss/train': 0.9027330875396729} -11/06/2021 23:06:04 - INFO - __main__ - Step 13419: {'lr': 0.0004926929953811003, 'samples': 2576448, 'steps': 13418, 'loss/train': 1.8112411499023438} -11/06/2021 23:06:05 - INFO - __main__ - Step 13420: {'lr': 0.0004926917216883235, 'samples': 2576640, 'steps': 13419, 'loss/train': 1.7219598293304443} -11/06/2021 23:06:05 - INFO - __main__ - Step 13421: {'lr': 0.0004926904478861937, 'samples': 2576832, 'steps': 13420, 'loss/train': 1.8902779817581177} -11/06/2021 23:06:05 - INFO - __main__ - Step 13422: {'lr': 0.0004926891739747111, 'samples': 2577024, 'steps': 13421, 'loss/train': 1.9297341108322144} -11/06/2021 23:06:06 - INFO - __main__ - Step 13423: {'lr': 0.0004926878999538766, 'samples': 2577216, 'steps': 13422, 'loss/train': 1.187242865562439} -11/06/2021 23:06:07 - INFO - __main__ - Step 13424: {'lr': 0.0004926866258236907, 'samples': 2577408, 'steps': 13423, 'loss/train': 2.304779529571533} -11/06/2021 23:06:07 - INFO - __main__ - Step 13425: {'lr': 0.000492685351584154, 'samples': 2577600, 'steps': 13424, 'loss/train': 2.2769415378570557} -11/06/2021 23:06:07 - INFO - __main__ - Step 13426: {'lr': 0.000492684077235267, 'samples': 2577792, 'steps': 13425, 'loss/train': 0.9876941442489624} -11/06/2021 23:06:08 - INFO - __main__ - Step 13427: {'lr': 0.0004926828027770302, 'samples': 2577984, 'steps': 13426, 'loss/train': 1.4643722772598267} -11/06/2021 23:06:08 - INFO - __main__ - Step 13428: {'lr': 0.0004926815282094443, 'samples': 2578176, 'steps': 13427, 'loss/train': 2.2351608276367188} -11/06/2021 23:06:09 - INFO - __main__ - Step 13429: {'lr': 0.00049268025353251, 'samples': 2578368, 'steps': 13428, 'loss/train': 1.725936770439148} -11/06/2021 23:06:09 - INFO - __main__ - Step 13430: {'lr': 0.0004926789787462276, 'samples': 2578560, 'steps': 13429, 'loss/train': 1.8152636289596558} -11/06/2021 23:06:10 - INFO - __main__ - Step 13431: {'lr': 0.0004926777038505978, 'samples': 2578752, 'steps': 13430, 'loss/train': 1.673268437385559} -11/06/2021 23:06:10 - INFO - __main__ - Step 13432: {'lr': 0.0004926764288456212, 'samples': 2578944, 'steps': 13431, 'loss/train': 1.6883317232131958} -11/06/2021 23:06:10 - INFO - __main__ - Step 13433: {'lr': 0.0004926751537312982, 'samples': 2579136, 'steps': 13432, 'loss/train': 1.6265524625778198} -11/06/2021 23:06:11 - INFO - __main__ - Step 13434: {'lr': 0.0004926738785076297, 'samples': 2579328, 'steps': 13433, 'loss/train': 1.6185946464538574} -11/06/2021 23:06:12 - INFO - __main__ - Step 13435: {'lr': 0.000492672603174616, 'samples': 2579520, 'steps': 13434, 'loss/train': 1.6138404607772827} -11/06/2021 23:06:12 - INFO - __main__ - Step 13436: {'lr': 0.0004926713277322579, 'samples': 2579712, 'steps': 13435, 'loss/train': 1.8457807302474976} -11/06/2021 23:06:13 - INFO - __main__ - Step 13437: {'lr': 0.0004926700521805557, 'samples': 2579904, 'steps': 13436, 'loss/train': 1.5972094535827637} -11/06/2021 23:06:13 - INFO - __main__ - Step 13438: {'lr': 0.0004926687765195102, 'samples': 2580096, 'steps': 13437, 'loss/train': 1.67529296875} -11/06/2021 23:06:14 - INFO - __main__ - Step 13439: {'lr': 0.0004926675007491218, 'samples': 2580288, 'steps': 13438, 'loss/train': 1.481308937072754} -11/06/2021 23:06:14 - INFO - __main__ - Step 13440: {'lr': 0.0004926662248693912, 'samples': 2580480, 'steps': 13439, 'loss/train': 1.9427311420440674} -11/06/2021 23:06:15 - INFO - __main__ - Step 13441: {'lr': 0.000492664948880319, 'samples': 2580672, 'steps': 13440, 'loss/train': 1.513269305229187} -11/06/2021 23:06:15 - INFO - __main__ - Step 13442: {'lr': 0.0004926636727819057, 'samples': 2580864, 'steps': 13441, 'loss/train': 2.367624282836914} -11/06/2021 23:06:15 - INFO - __main__ - Step 13443: {'lr': 0.0004926623965741519, 'samples': 2581056, 'steps': 13442, 'loss/train': 1.679581880569458} -11/06/2021 23:06:16 - INFO - __main__ - Step 13444: {'lr': 0.0004926611202570582, 'samples': 2581248, 'steps': 13443, 'loss/train': 1.8118009567260742} -11/06/2021 23:06:17 - INFO - __main__ - Step 13445: {'lr': 0.0004926598438306252, 'samples': 2581440, 'steps': 13444, 'loss/train': 1.1700359582901} -11/06/2021 23:06:17 - INFO - __main__ - Step 13446: {'lr': 0.0004926585672948532, 'samples': 2581632, 'steps': 13445, 'loss/train': 1.750053882598877} -11/06/2021 23:06:17 - INFO - __main__ - Step 13447: {'lr': 0.0004926572906497432, 'samples': 2581824, 'steps': 13446, 'loss/train': 1.81050705909729} -11/06/2021 23:06:18 - INFO - __main__ - Step 13448: {'lr': 0.0004926560138952955, 'samples': 2582016, 'steps': 13447, 'loss/train': 1.7286831140518188} -11/06/2021 23:06:19 - INFO - __main__ - Step 13449: {'lr': 0.0004926547370315106, 'samples': 2582208, 'steps': 13448, 'loss/train': 1.6813172101974487} -11/06/2021 23:06:19 - INFO - __main__ - Step 13450: {'lr': 0.0004926534600583894, 'samples': 2582400, 'steps': 13449, 'loss/train': 3.3553547859191895} -11/06/2021 23:06:20 - INFO - __main__ - Step 13451: {'lr': 0.0004926521829759323, 'samples': 2582592, 'steps': 13450, 'loss/train': 2.9841389656066895} -11/06/2021 23:06:20 - INFO - __main__ - Step 13452: {'lr': 0.0004926509057841397, 'samples': 2582784, 'steps': 13451, 'loss/train': 2.232959032058716} -11/06/2021 23:06:20 - INFO - __main__ - Step 13453: {'lr': 0.0004926496284830125, 'samples': 2582976, 'steps': 13452, 'loss/train': 0.9120754599571228} -11/06/2021 23:06:21 - INFO - __main__ - Step 13454: {'lr': 0.0004926483510725511, 'samples': 2583168, 'steps': 13453, 'loss/train': 0.20907138288021088} -11/06/2021 23:06:22 - INFO - __main__ - Step 13455: {'lr': 0.000492647073552756, 'samples': 2583360, 'steps': 13454, 'loss/train': 0.17836831510066986} -11/06/2021 23:06:22 - INFO - __main__ - Step 13456: {'lr': 0.000492645795923628, 'samples': 2583552, 'steps': 13455, 'loss/train': 1.9313207864761353} -11/06/2021 23:06:23 - INFO - __main__ - Step 13457: {'lr': 0.0004926445181851675, 'samples': 2583744, 'steps': 13456, 'loss/train': 1.514086365699768} -11/06/2021 23:06:23 - INFO - __main__ - Step 13458: {'lr': 0.0004926432403373752, 'samples': 2583936, 'steps': 13457, 'loss/train': 2.219507932662964} -11/06/2021 23:06:23 - INFO - __main__ - Step 13459: {'lr': 0.0004926419623802515, 'samples': 2584128, 'steps': 13458, 'loss/train': 1.9155421257019043} -11/06/2021 23:06:24 - INFO - __main__ - Step 13460: {'lr': 0.0004926406843137971, 'samples': 2584320, 'steps': 13459, 'loss/train': 1.7302833795547485} -11/06/2021 23:06:25 - INFO - __main__ - Step 13461: {'lr': 0.0004926394061380126, 'samples': 2584512, 'steps': 13460, 'loss/train': 1.796723484992981} -11/06/2021 23:06:25 - INFO - __main__ - Step 13462: {'lr': 0.0004926381278528984, 'samples': 2584704, 'steps': 13461, 'loss/train': 1.6994954347610474} -11/06/2021 23:06:25 - INFO - __main__ - Step 13463: {'lr': 0.0004926368494584553, 'samples': 2584896, 'steps': 13462, 'loss/train': 0.4757920205593109} -11/06/2021 23:06:26 - INFO - __main__ - Step 13464: {'lr': 0.0004926355709546838, 'samples': 2585088, 'steps': 13463, 'loss/train': 1.7972795963287354} -11/06/2021 23:06:26 - INFO - __main__ - Step 13465: {'lr': 0.0004926342923415844, 'samples': 2585280, 'steps': 13464, 'loss/train': 1.8750228881835938} -11/06/2021 23:06:27 - INFO - __main__ - Step 13466: {'lr': 0.0004926330136191577, 'samples': 2585472, 'steps': 13465, 'loss/train': 2.082622766494751} -11/06/2021 23:06:28 - INFO - __main__ - Step 13467: {'lr': 0.0004926317347874044, 'samples': 2585664, 'steps': 13466, 'loss/train': 1.9300429821014404} -11/06/2021 23:06:28 - INFO - __main__ - Step 13468: {'lr': 0.000492630455846325, 'samples': 2585856, 'steps': 13467, 'loss/train': 1.32011079788208} -11/06/2021 23:06:28 - INFO - __main__ - Step 13469: {'lr': 0.0004926291767959199, 'samples': 2586048, 'steps': 13468, 'loss/train': 3.767948865890503} -11/06/2021 23:06:29 - INFO - __main__ - Step 13470: {'lr': 0.00049262789763619, 'samples': 2586240, 'steps': 13469, 'loss/train': 1.0086846351623535} -11/06/2021 23:06:30 - INFO - __main__ - Step 13471: {'lr': 0.0004926266183671356, 'samples': 2586432, 'steps': 13470, 'loss/train': 1.8389583826065063} -11/06/2021 23:06:30 - INFO - __main__ - Step 13472: {'lr': 0.0004926253389887575, 'samples': 2586624, 'steps': 13471, 'loss/train': 1.7652056217193604} -11/06/2021 23:06:31 - INFO - __main__ - Step 13473: {'lr': 0.0004926240595010561, 'samples': 2586816, 'steps': 13472, 'loss/train': 1.13629949092865} -11/06/2021 23:06:31 - INFO - __main__ - Step 13474: {'lr': 0.000492622779904032, 'samples': 2587008, 'steps': 13473, 'loss/train': 1.531381368637085} -11/06/2021 23:06:31 - INFO - __main__ - Step 13475: {'lr': 0.000492621500197686, 'samples': 2587200, 'steps': 13474, 'loss/train': 1.4940797090530396} -11/06/2021 23:06:32 - INFO - __main__ - Step 13476: {'lr': 0.0004926202203820182, 'samples': 2587392, 'steps': 13475, 'loss/train': 1.8899670839309692} -11/06/2021 23:06:33 - INFO - __main__ - Step 13477: {'lr': 0.0004926189404570297, 'samples': 2587584, 'steps': 13476, 'loss/train': 1.735036015510559} -11/06/2021 23:06:33 - INFO - __main__ - Step 13478: {'lr': 0.0004926176604227208, 'samples': 2587776, 'steps': 13477, 'loss/train': 1.7047059535980225} -11/06/2021 23:06:33 - INFO - __main__ - Step 13479: {'lr': 0.0004926163802790922, 'samples': 2587968, 'steps': 13478, 'loss/train': 2.1699039936065674} -11/06/2021 23:06:34 - INFO - __main__ - Step 13480: {'lr': 0.0004926151000261442, 'samples': 2588160, 'steps': 13479, 'loss/train': 1.8087481260299683} -11/06/2021 23:06:34 - INFO - __main__ - Step 13481: {'lr': 0.0004926138196638777, 'samples': 2588352, 'steps': 13480, 'loss/train': 1.056817889213562} -11/06/2021 23:06:35 - INFO - __main__ - Step 13482: {'lr': 0.0004926125391922932, 'samples': 2588544, 'steps': 13481, 'loss/train': 1.3383749723434448} -11/06/2021 23:06:36 - INFO - __main__ - Step 13483: {'lr': 0.0004926112586113912, 'samples': 2588736, 'steps': 13482, 'loss/train': 1.4926176071166992} -11/06/2021 23:06:36 - INFO - __main__ - Step 13484: {'lr': 0.0004926099779211723, 'samples': 2588928, 'steps': 13483, 'loss/train': 1.5623829364776611} -11/06/2021 23:06:36 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.7945960760116577} -11/06/2021 23:06:37 - INFO - __main__ - Step 13486: {'lr': 0.0004926074162127862, 'samples': 2589312, 'steps': 13485, 'loss/train': 1.6965285539627075} -11/06/2021 23:06:38 - INFO - __main__ - Step 13487: {'lr': 0.0004926061351946201, 'samples': 2589504, 'steps': 13486, 'loss/train': 2.568559169769287} -11/06/2021 23:06:39 - INFO - __main__ - Step 13488: {'lr': 0.0004926048540671394, 'samples': 2589696, 'steps': 13487, 'loss/train': 0.929760754108429} -11/06/2021 23:06:39 - INFO - __main__ - Step 13489: {'lr': 0.0004926035728303447, 'samples': 2589888, 'steps': 13488, 'loss/train': 1.9634153842926025} -11/06/2021 23:06:39 - INFO - __main__ - Step 13490: {'lr': 0.0004926022914842366, 'samples': 2590080, 'steps': 13489, 'loss/train': 0.19946490228176117} -11/06/2021 23:06:40 - INFO - __main__ - Step 13491: {'lr': 0.0004926010100288156, 'samples': 2590272, 'steps': 13490, 'loss/train': 1.7599334716796875} -11/06/2021 23:06:41 - INFO - __main__ - Step 13492: {'lr': 0.0004925997284640823, 'samples': 2590464, 'steps': 13491, 'loss/train': 1.668752908706665} -11/06/2021 23:06:41 - INFO - __main__ - Step 13493: {'lr': 0.0004925984467900374, 'samples': 2590656, 'steps': 13492, 'loss/train': 1.4135771989822388} -11/06/2021 23:06:41 - INFO - __main__ - Step 13494: {'lr': 0.0004925971650066814, 'samples': 2590848, 'steps': 13493, 'loss/train': 2.2493417263031006} -11/06/2021 23:06:42 - INFO - __main__ - Step 13495: {'lr': 0.0004925958831140147, 'samples': 2591040, 'steps': 13494, 'loss/train': 1.576822280883789} -11/06/2021 23:06:42 - INFO - __main__ - Step 13496: {'lr': 0.0004925946011120382, 'samples': 2591232, 'steps': 13495, 'loss/train': 2.3239166736602783} -11/06/2021 23:06:43 - INFO - __main__ - Step 13497: {'lr': 0.0004925933190007523, 'samples': 2591424, 'steps': 13496, 'loss/train': 1.5112223625183105} -11/06/2021 23:06:44 - INFO - __main__ - Step 13498: {'lr': 0.0004925920367801575, 'samples': 2591616, 'steps': 13497, 'loss/train': 1.7464356422424316} -11/06/2021 23:06:44 - INFO - __main__ - Step 13499: {'lr': 0.0004925907544502545, 'samples': 2591808, 'steps': 13498, 'loss/train': 1.7748905420303345} -11/06/2021 23:06:44 - INFO - __main__ - Step 13500: {'lr': 0.000492589472011044, 'samples': 2592000, 'steps': 13499, 'loss/train': 2.0992441177368164} -11/06/2021 23:06:45 - INFO - __main__ - Step 13501: {'lr': 0.0004925881894625263, 'samples': 2592192, 'steps': 13500, 'loss/train': 1.2124189138412476} -11/06/2021 23:06:46 - INFO - __main__ - Step 13502: {'lr': 0.0004925869068047021, 'samples': 2592384, 'steps': 13501, 'loss/train': 1.7404388189315796} -11/06/2021 23:06:46 - INFO - __main__ - Step 13503: {'lr': 0.000492585624037572, 'samples': 2592576, 'steps': 13502, 'loss/train': 1.5108038187026978} -11/06/2021 23:06:46 - INFO - __main__ - Step 13504: {'lr': 0.0004925843411611366, 'samples': 2592768, 'steps': 13503, 'loss/train': 1.60819673538208} -11/06/2021 23:06:47 - INFO - __main__ - Step 13505: {'lr': 0.0004925830581753964, 'samples': 2592960, 'steps': 13504, 'loss/train': 2.066511631011963} -11/06/2021 23:06:47 - INFO - __main__ - Step 13506: {'lr': 0.000492581775080352, 'samples': 2593152, 'steps': 13505, 'loss/train': 1.5650289058685303} -11/06/2021 23:06:48 - INFO - __main__ - Step 13507: {'lr': 0.000492580491876004, 'samples': 2593344, 'steps': 13506, 'loss/train': 1.7949551343917847} -11/06/2021 23:06:48 - INFO - __main__ - Step 13508: {'lr': 0.000492579208562353, 'samples': 2593536, 'steps': 13507, 'loss/train': 1.567403793334961} -11/06/2021 23:06:49 - INFO - __main__ - Step 13509: {'lr': 0.0004925779251393995, 'samples': 2593728, 'steps': 13508, 'loss/train': 2.0398895740509033} -11/06/2021 23:06:49 - INFO - __main__ - Step 13510: {'lr': 0.0004925766416071441, 'samples': 2593920, 'steps': 13509, 'loss/train': 1.7081353664398193} -11/06/2021 23:06:49 - INFO - __main__ - Step 13511: {'lr': 0.0004925753579655876, 'samples': 2594112, 'steps': 13510, 'loss/train': 1.5593316555023193} -11/06/2021 23:06:51 - INFO - __main__ - Step 13512: {'lr': 0.0004925740742147302, 'samples': 2594304, 'steps': 13511, 'loss/train': 1.8523802757263184} -11/06/2021 23:06:51 - INFO - __main__ - Step 13513: {'lr': 0.0004925727903545727, 'samples': 2594496, 'steps': 13512, 'loss/train': 1.662975788116455} -11/06/2021 23:06:51 - INFO - __main__ - Step 13514: {'lr': 0.0004925715063851157, 'samples': 2594688, 'steps': 13513, 'loss/train': 1.6688578128814697} -11/06/2021 23:06:52 - INFO - __main__ - Step 13515: {'lr': 0.0004925702223063597, 'samples': 2594880, 'steps': 13514, 'loss/train': 0.6073575019836426} -11/06/2021 23:06:52 - INFO - __main__ - Step 13516: {'lr': 0.0004925689381183052, 'samples': 2595072, 'steps': 13515, 'loss/train': 1.6856118440628052} -11/06/2021 23:06:52 - INFO - __main__ - Step 13517: {'lr': 0.0004925676538209531, 'samples': 2595264, 'steps': 13516, 'loss/train': 2.147181510925293} -11/06/2021 23:06:53 - INFO - __main__ - Step 13518: {'lr': 0.0004925663694143036, 'samples': 2595456, 'steps': 13517, 'loss/train': 1.5106788873672485} -11/06/2021 23:06:54 - INFO - __main__ - Step 13519: {'lr': 0.0004925650848983575, 'samples': 2595648, 'steps': 13518, 'loss/train': 1.8200280666351318} -11/06/2021 23:06:54 - INFO - __main__ - Step 13520: {'lr': 0.0004925638002731153, 'samples': 2595840, 'steps': 13519, 'loss/train': 1.5269951820373535} -11/06/2021 23:06:54 - INFO - __main__ - Step 13521: {'lr': 0.0004925625155385775, 'samples': 2596032, 'steps': 13520, 'loss/train': 1.926583170890808} -11/06/2021 23:06:55 - INFO - __main__ - Step 13522: {'lr': 0.0004925612306947449, 'samples': 2596224, 'steps': 13521, 'loss/train': 1.5432051420211792} -11/06/2021 23:06:56 - INFO - __main__ - Step 13523: {'lr': 0.0004925599457416179, 'samples': 2596416, 'steps': 13522, 'loss/train': 1.8082655668258667} -11/06/2021 23:06:56 - INFO - __main__ - Step 13524: {'lr': 0.0004925586606791972, 'samples': 2596608, 'steps': 13523, 'loss/train': 1.771362543106079} -11/06/2021 23:06:56 - INFO - __main__ - Step 13525: {'lr': 0.0004925573755074832, 'samples': 2596800, 'steps': 13524, 'loss/train': 1.9710201025009155} -11/06/2021 23:06:57 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.8510551452636719} -11/06/2021 23:06:57 - INFO - __main__ - Step 13527: {'lr': 0.000492554804836178, 'samples': 2597184, 'steps': 13526, 'loss/train': 1.7917557954788208} -11/06/2021 23:06:59 - INFO - __main__ - Step 13528: {'lr': 0.000492553519336588, 'samples': 2597376, 'steps': 13527, 'loss/train': 1.3388181924819946} -11/06/2021 23:06:59 - INFO - __main__ - Step 13529: {'lr': 0.000492552233727707, 'samples': 2597568, 'steps': 13528, 'loss/train': 1.9206374883651733} -11/06/2021 23:07:00 - INFO - __main__ - Step 13530: {'lr': 0.0004925509480095358, 'samples': 2597760, 'steps': 13529, 'loss/train': 1.7673835754394531} -11/06/2021 23:07:00 - INFO - __main__ - Step 13531: {'lr': 0.0004925496621820749, 'samples': 2597952, 'steps': 13530, 'loss/train': 1.4747488498687744} -11/06/2021 23:07:00 - INFO - __main__ - Step 13532: {'lr': 0.0004925483762453249, 'samples': 2598144, 'steps': 13531, 'loss/train': 0.7193357944488525} -11/06/2021 23:07:01 - INFO - __main__ - Step 13533: {'lr': 0.0004925470901992863, 'samples': 2598336, 'steps': 13532, 'loss/train': 1.6905871629714966} -11/06/2021 23:07:02 - INFO - __main__ - Step 13534: {'lr': 0.0004925458040439596, 'samples': 2598528, 'steps': 13533, 'loss/train': 1.825111985206604} -11/06/2021 23:07:02 - INFO - __main__ - Step 13535: {'lr': 0.0004925445177793457, 'samples': 2598720, 'steps': 13534, 'loss/train': 1.879388689994812} -11/06/2021 23:07:02 - INFO - __main__ - Step 13536: {'lr': 0.0004925432314054448, 'samples': 2598912, 'steps': 13535, 'loss/train': 1.898144006729126} -11/06/2021 23:07:03 - INFO - __main__ - Step 13537: {'lr': 0.0004925419449222578, 'samples': 2599104, 'steps': 13536, 'loss/train': 2.1349470615386963} -11/06/2021 23:07:04 - INFO - __main__ - Step 13538: {'lr': 0.0004925406583297851, 'samples': 2599296, 'steps': 13537, 'loss/train': 1.8483484983444214} -11/06/2021 23:07:04 - INFO - __main__ - Step 13539: {'lr': 0.0004925393716280274, 'samples': 2599488, 'steps': 13538, 'loss/train': 1.1511164903640747} -11/06/2021 23:07:04 - INFO - __main__ - Step 13540: {'lr': 0.0004925380848169851, 'samples': 2599680, 'steps': 13539, 'loss/train': 1.4362045526504517} -11/06/2021 23:07:05 - INFO - __main__ - Step 13541: {'lr': 0.0004925367978966588, 'samples': 2599872, 'steps': 13540, 'loss/train': 2.184403419494629} -11/06/2021 23:07:05 - INFO - __main__ - Step 13542: {'lr': 0.0004925355108670493, 'samples': 2600064, 'steps': 13541, 'loss/train': 1.5568304061889648} -11/06/2021 23:07:06 - INFO - __main__ - Step 13543: {'lr': 0.0004925342237281571, 'samples': 2600256, 'steps': 13542, 'loss/train': 1.6341681480407715} -11/06/2021 23:07:06 - INFO - __main__ - Step 13544: {'lr': 0.0004925329364799825, 'samples': 2600448, 'steps': 13543, 'loss/train': 1.4727433919906616} -11/06/2021 23:07:07 - INFO - __main__ - Step 13545: {'lr': 0.0004925316491225265, 'samples': 2600640, 'steps': 13544, 'loss/train': 1.715566873550415} -11/06/2021 23:07:07 - INFO - __main__ - Step 13546: {'lr': 0.0004925303616557893, 'samples': 2600832, 'steps': 13545, 'loss/train': 1.6563913822174072} -11/06/2021 23:07:08 - INFO - __main__ - Step 13547: {'lr': 0.0004925290740797718, 'samples': 2601024, 'steps': 13546, 'loss/train': 1.9867644309997559} -11/06/2021 23:07:08 - INFO - __main__ - Step 13548: {'lr': 0.0004925277863944745, 'samples': 2601216, 'steps': 13547, 'loss/train': 2.0575523376464844} -11/06/2021 23:07:09 - INFO - __main__ - Step 13549: {'lr': 0.0004925264985998978, 'samples': 2601408, 'steps': 13548, 'loss/train': 1.7261626720428467} -11/06/2021 23:07:09 - INFO - __main__ - Step 13550: {'lr': 0.0004925252106960425, 'samples': 2601600, 'steps': 13549, 'loss/train': 1.596949577331543} -11/06/2021 23:07:10 - INFO - __main__ - Step 13551: {'lr': 0.000492523922682909, 'samples': 2601792, 'steps': 13550, 'loss/train': 1.3621716499328613} -11/06/2021 23:07:10 - INFO - __main__ - Step 13552: {'lr': 0.0004925226345604979, 'samples': 2601984, 'steps': 13551, 'loss/train': 1.458478569984436} -11/06/2021 23:07:10 - INFO - __main__ - Step 13553: {'lr': 0.0004925213463288099, 'samples': 2602176, 'steps': 13552, 'loss/train': 1.587988257408142} -11/06/2021 23:07:11 - INFO - __main__ - Step 13554: {'lr': 0.0004925200579878456, 'samples': 2602368, 'steps': 13553, 'loss/train': 1.3299733400344849} -11/06/2021 23:07:12 - INFO - __main__ - Step 13555: {'lr': 0.0004925187695376055, 'samples': 2602560, 'steps': 13554, 'loss/train': 1.4566415548324585} -11/06/2021 23:07:12 - INFO - __main__ - Step 13556: {'lr': 0.0004925174809780901, 'samples': 2602752, 'steps': 13555, 'loss/train': 1.6076452732086182} -11/06/2021 23:07:12 - INFO - __main__ - Step 13557: {'lr': 0.0004925161923093001, 'samples': 2602944, 'steps': 13556, 'loss/train': 1.5300875902175903} -11/06/2021 23:07:13 - INFO - __main__ - Step 13558: {'lr': 0.000492514903531236, 'samples': 2603136, 'steps': 13557, 'loss/train': 1.9013261795043945} -11/06/2021 23:07:14 - INFO - __main__ - Step 13559: {'lr': 0.0004925136146438986, 'samples': 2603328, 'steps': 13558, 'loss/train': 1.5588353872299194} -11/06/2021 23:07:14 - INFO - __main__ - Step 13560: {'lr': 0.0004925123256472881, 'samples': 2603520, 'steps': 13559, 'loss/train': 1.529636263847351} -11/06/2021 23:07:14 - INFO - __main__ - Step 13561: {'lr': 0.0004925110365414054, 'samples': 2603712, 'steps': 13560, 'loss/train': 1.6311484575271606} -11/06/2021 23:07:15 - INFO - __main__ - Step 13562: {'lr': 0.0004925097473262509, 'samples': 2603904, 'steps': 13561, 'loss/train': 1.773667573928833} -11/06/2021 23:07:15 - INFO - __main__ - Step 13563: {'lr': 0.0004925084580018253, 'samples': 2604096, 'steps': 13562, 'loss/train': 1.412859559059143} -11/06/2021 23:07:16 - INFO - __main__ - Step 13564: {'lr': 0.0004925071685681292, 'samples': 2604288, 'steps': 13563, 'loss/train': 2.0537023544311523} -11/06/2021 23:07:16 - INFO - __main__ - Step 13565: {'lr': 0.000492505879025163, 'samples': 2604480, 'steps': 13564, 'loss/train': 1.4484230279922485} -11/06/2021 23:07:17 - INFO - __main__ - Step 13566: {'lr': 0.0004925045893729274, 'samples': 2604672, 'steps': 13565, 'loss/train': 1.8159236907958984} -11/06/2021 23:07:17 - INFO - __main__ - Step 13567: {'lr': 0.000492503299611423, 'samples': 2604864, 'steps': 13566, 'loss/train': 1.2261930704116821} -11/06/2021 23:07:18 - INFO - __main__ - Step 13568: {'lr': 0.0004925020097406504, 'samples': 2605056, 'steps': 13567, 'loss/train': 1.8330031633377075} -11/06/2021 23:07:19 - INFO - __main__ - Step 13569: {'lr': 0.00049250071976061, 'samples': 2605248, 'steps': 13568, 'loss/train': 1.5868868827819824} -11/06/2021 23:07:19 - INFO - __main__ - Step 13570: {'lr': 0.0004924994296713026, 'samples': 2605440, 'steps': 13569, 'loss/train': 1.7566038370132446} -11/06/2021 23:07:19 - INFO - __main__ - Step 13571: {'lr': 0.0004924981394727288, 'samples': 2605632, 'steps': 13570, 'loss/train': 1.4361501932144165} -11/06/2021 23:07:20 - INFO - __main__ - Step 13572: {'lr': 0.0004924968491648889, 'samples': 2605824, 'steps': 13571, 'loss/train': 1.6027421951293945} -11/06/2021 23:07:20 - INFO - __main__ - Step 13573: {'lr': 0.0004924955587477837, 'samples': 2606016, 'steps': 13572, 'loss/train': 1.6203863620758057} -11/06/2021 23:07:21 - INFO - __main__ - Step 13574: {'lr': 0.0004924942682214138, 'samples': 2606208, 'steps': 13573, 'loss/train': 1.7938021421432495} -11/06/2021 23:07:21 - INFO - __main__ - Step 13575: {'lr': 0.0004924929775857798, 'samples': 2606400, 'steps': 13574, 'loss/train': 0.9622952938079834} -11/06/2021 23:07:22 - INFO - __main__ - Step 13576: {'lr': 0.0004924916868408821, 'samples': 2606592, 'steps': 13575, 'loss/train': 1.0422208309173584} -11/06/2021 23:07:22 - INFO - __main__ - Step 13577: {'lr': 0.0004924903959867214, 'samples': 2606784, 'steps': 13576, 'loss/train': 1.6397504806518555} -11/06/2021 23:07:22 - INFO - __main__ - Step 13578: {'lr': 0.0004924891050232984, 'samples': 2606976, 'steps': 13577, 'loss/train': 1.8606226444244385} -11/06/2021 23:07:23 - INFO - __main__ - Step 13579: {'lr': 0.0004924878139506134, 'samples': 2607168, 'steps': 13578, 'loss/train': 1.482366681098938} -11/06/2021 23:07:24 - INFO - __main__ - Step 13580: {'lr': 0.0004924865227686671, 'samples': 2607360, 'steps': 13579, 'loss/train': 1.4506975412368774} -11/06/2021 23:07:25 - INFO - __main__ - Step 13581: {'lr': 0.0004924852314774602, 'samples': 2607552, 'steps': 13580, 'loss/train': 2.16103196144104} -11/06/2021 23:07:25 - INFO - __main__ - Step 13582: {'lr': 0.0004924839400769932, 'samples': 2607744, 'steps': 13581, 'loss/train': 1.665818452835083} -11/06/2021 23:07:25 - INFO - __main__ - Step 13583: {'lr': 0.0004924826485672667, 'samples': 2607936, 'steps': 13582, 'loss/train': 0.9627843499183655} -11/06/2021 23:07:26 - INFO - __main__ - Step 13584: {'lr': 0.0004924813569482812, 'samples': 2608128, 'steps': 13583, 'loss/train': 1.1385881900787354} -11/06/2021 23:07:27 - INFO - __main__ - Step 13585: {'lr': 0.0004924800652200373, 'samples': 2608320, 'steps': 13584, 'loss/train': 1.7369372844696045} -11/06/2021 23:07:27 - INFO - __main__ - Step 13586: {'lr': 0.0004924787733825357, 'samples': 2608512, 'steps': 13585, 'loss/train': 2.386915922164917} -11/06/2021 23:07:27 - INFO - __main__ - Step 13587: {'lr': 0.0004924774814357768, 'samples': 2608704, 'steps': 13586, 'loss/train': 1.7782405614852905} -11/06/2021 23:07:28 - INFO - __main__ - Step 13588: {'lr': 0.0004924761893797615, 'samples': 2608896, 'steps': 13587, 'loss/train': 1.8888113498687744} -11/06/2021 23:07:28 - INFO - __main__ - Step 13589: {'lr': 0.00049247489721449, 'samples': 2609088, 'steps': 13588, 'loss/train': 5.811814785003662} -11/06/2021 23:07:29 - INFO - __main__ - Step 13590: {'lr': 0.0004924736049399631, 'samples': 2609280, 'steps': 13589, 'loss/train': 1.3031723499298096} -11/06/2021 23:07:29 - INFO - __main__ - Step 13591: {'lr': 0.0004924723125561813, 'samples': 2609472, 'steps': 13590, 'loss/train': 1.8062859773635864} -11/06/2021 23:07:30 - INFO - __main__ - Step 13592: {'lr': 0.0004924710200631453, 'samples': 2609664, 'steps': 13591, 'loss/train': 1.475710153579712} -11/06/2021 23:07:30 - INFO - __main__ - Step 13593: {'lr': 0.0004924697274608556, 'samples': 2609856, 'steps': 13592, 'loss/train': 1.6289951801300049} -11/06/2021 23:07:31 - INFO - __main__ - Step 13594: {'lr': 0.0004924684347493126, 'samples': 2610048, 'steps': 13593, 'loss/train': 1.741284966468811} -11/06/2021 23:07:32 - INFO - __main__ - Step 13595: {'lr': 0.0004924671419285172, 'samples': 2610240, 'steps': 13594, 'loss/train': 1.871199369430542} -11/06/2021 23:07:32 - INFO - __main__ - Step 13596: {'lr': 0.0004924658489984699, 'samples': 2610432, 'steps': 13595, 'loss/train': 1.5763531923294067} -11/06/2021 23:07:32 - INFO - __main__ - Step 13597: {'lr': 0.0004924645559591712, 'samples': 2610624, 'steps': 13596, 'loss/train': 1.8481301069259644} -11/06/2021 23:07:33 - INFO - __main__ - Step 13598: {'lr': 0.0004924632628106217, 'samples': 2610816, 'steps': 13597, 'loss/train': 1.9725139141082764} -11/06/2021 23:07:33 - INFO - __main__ - Step 13599: {'lr': 0.000492461969552822, 'samples': 2611008, 'steps': 13598, 'loss/train': 1.4551993608474731} -11/06/2021 23:07:33 - INFO - __main__ - Step 13600: {'lr': 0.0004924606761857726, 'samples': 2611200, 'steps': 13599, 'loss/train': 1.2987780570983887} -11/06/2021 23:07:34 - INFO - __main__ - Step 13601: {'lr': 0.0004924593827094744, 'samples': 2611392, 'steps': 13600, 'loss/train': 1.725089430809021} -11/06/2021 23:07:35 - INFO - __main__ - Step 13602: {'lr': 0.0004924580891239274, 'samples': 2611584, 'steps': 13601, 'loss/train': 1.9037177562713623} -11/06/2021 23:07:35 - INFO - __main__ - Step 13603: {'lr': 0.0004924567954291328, 'samples': 2611776, 'steps': 13602, 'loss/train': 1.6505497694015503} -11/06/2021 23:07:35 - INFO - __main__ - Step 13604: {'lr': 0.0004924555016250908, 'samples': 2611968, 'steps': 13603, 'loss/train': 1.9242398738861084} -11/06/2021 23:07:36 - INFO - __main__ - Step 13605: {'lr': 0.0004924542077118021, 'samples': 2612160, 'steps': 13604, 'loss/train': 1.6586657762527466} -11/06/2021 23:07:38 - INFO - __main__ - Step 13606: {'lr': 0.0004924529136892673, 'samples': 2612352, 'steps': 13605, 'loss/train': 1.6785545349121094} -11/06/2021 23:07:38 - INFO - __main__ - Step 13607: {'lr': 0.0004924516195574869, 'samples': 2612544, 'steps': 13606, 'loss/train': 0.57390958070755} -11/06/2021 23:07:39 - INFO - __main__ - Step 13608: {'lr': 0.0004924503253164614, 'samples': 2612736, 'steps': 13607, 'loss/train': 1.4627878665924072} -11/06/2021 23:07:39 - INFO - __main__ - Step 13609: {'lr': 0.0004924490309661918, 'samples': 2612928, 'steps': 13608, 'loss/train': 0.6431192755699158} -11/06/2021 23:07:39 - INFO - __main__ - Step 13610: {'lr': 0.0004924477365066783, 'samples': 2613120, 'steps': 13609, 'loss/train': 1.783947229385376} -11/06/2021 23:07:40 - INFO - __main__ - Step 13611: {'lr': 0.0004924464419379217, 'samples': 2613312, 'steps': 13610, 'loss/train': 1.6398215293884277} -11/06/2021 23:07:41 - INFO - __main__ - Step 13612: {'lr': 0.0004924451472599222, 'samples': 2613504, 'steps': 13611, 'loss/train': 0.23156870901584625} -11/06/2021 23:07:41 - INFO - __main__ - Step 13613: {'lr': 0.000492443852472681, 'samples': 2613696, 'steps': 13612, 'loss/train': 1.843045711517334} -11/06/2021 23:07:41 - INFO - __main__ - Step 13614: {'lr': 0.000492442557576198, 'samples': 2613888, 'steps': 13613, 'loss/train': 1.7973626852035522} -11/06/2021 23:07:42 - INFO - __main__ - Step 13615: {'lr': 0.0004924412625704744, 'samples': 2614080, 'steps': 13614, 'loss/train': 2.342195749282837} -11/06/2021 23:07:42 - INFO - __main__ - Step 13616: {'lr': 0.0004924399674555103, 'samples': 2614272, 'steps': 13615, 'loss/train': 1.5847399234771729} -11/06/2021 23:07:42 - INFO - __main__ - Step 13617: {'lr': 0.0004924386722313066, 'samples': 2614464, 'steps': 13616, 'loss/train': 1.906503438949585} -11/06/2021 23:07:43 - INFO - __main__ - Step 13618: {'lr': 0.0004924373768978638, 'samples': 2614656, 'steps': 13617, 'loss/train': 2.0704801082611084} -11/06/2021 23:07:44 - INFO - __main__ - Step 13619: {'lr': 0.0004924360814551825, 'samples': 2614848, 'steps': 13618, 'loss/train': 1.9433788061141968} -11/06/2021 23:07:44 - INFO - __main__ - Step 13620: {'lr': 0.0004924347859032631, 'samples': 2615040, 'steps': 13619, 'loss/train': 1.7289719581604004} -11/06/2021 23:07:44 - INFO - __main__ - Step 13621: {'lr': 0.0004924334902421065, 'samples': 2615232, 'steps': 13620, 'loss/train': 2.022456407546997} -11/06/2021 23:07:45 - INFO - __main__ - Step 13622: {'lr': 0.0004924321944717129, 'samples': 2615424, 'steps': 13621, 'loss/train': 1.9337289333343506} -11/06/2021 23:07:46 - INFO - __main__ - Step 13623: {'lr': 0.0004924308985920832, 'samples': 2615616, 'steps': 13622, 'loss/train': 2.2961039543151855} -11/06/2021 23:07:46 - INFO - __main__ - Step 13624: {'lr': 0.0004924296026032179, 'samples': 2615808, 'steps': 13623, 'loss/train': 1.2842239141464233} -11/06/2021 23:07:46 - INFO - __main__ - Step 13625: {'lr': 0.0004924283065051176, 'samples': 2616000, 'steps': 13624, 'loss/train': 1.8332487344741821} -11/06/2021 23:07:47 - INFO - __main__ - Step 13626: {'lr': 0.0004924270102977827, 'samples': 2616192, 'steps': 13625, 'loss/train': 2.1077988147735596} -11/06/2021 23:07:47 - INFO - __main__ - Step 13627: {'lr': 0.0004924257139812141, 'samples': 2616384, 'steps': 13626, 'loss/train': 1.8396973609924316} -11/06/2021 23:07:49 - INFO - __main__ - Step 13628: {'lr': 0.0004924244175554121, 'samples': 2616576, 'steps': 13627, 'loss/train': 1.9551353454589844} -11/06/2021 23:07:49 - INFO - __main__ - Step 13629: {'lr': 0.0004924231210203775, 'samples': 2616768, 'steps': 13628, 'loss/train': 1.9722517728805542} -11/06/2021 23:07:49 - INFO - __main__ - Step 13630: {'lr': 0.0004924218243761106, 'samples': 2616960, 'steps': 13629, 'loss/train': 1.3070924282073975} -11/06/2021 23:07:50 - INFO - __main__ - Step 13631: {'lr': 0.0004924205276226123, 'samples': 2617152, 'steps': 13630, 'loss/train': 1.8307408094406128} -11/06/2021 23:07:50 - INFO - __main__ - Step 13632: {'lr': 0.000492419230759883, 'samples': 2617344, 'steps': 13631, 'loss/train': 1.8106156587600708} -11/06/2021 23:07:50 - INFO - __main__ - Step 13633: {'lr': 0.0004924179337879234, 'samples': 2617536, 'steps': 13632, 'loss/train': 1.3615984916687012} -11/06/2021 23:07:51 - INFO - __main__ - Step 13634: {'lr': 0.000492416636706734, 'samples': 2617728, 'steps': 13633, 'loss/train': 1.84334397315979} -11/06/2021 23:07:52 - INFO - __main__ - Step 13635: {'lr': 0.0004924153395163153, 'samples': 2617920, 'steps': 13634, 'loss/train': 1.8057781457901} -11/06/2021 23:07:52 - INFO - __main__ - Step 13636: {'lr': 0.0004924140422166681, 'samples': 2618112, 'steps': 13635, 'loss/train': 1.1118844747543335} -11/06/2021 23:07:52 - INFO - __main__ - Step 13637: {'lr': 0.0004924127448077929, 'samples': 2618304, 'steps': 13636, 'loss/train': 1.283229112625122} -11/06/2021 23:07:53 - INFO - __main__ - Step 13638: {'lr': 0.0004924114472896902, 'samples': 2618496, 'steps': 13637, 'loss/train': 1.547655701637268} -11/06/2021 23:07:54 - INFO - __main__ - Step 13639: {'lr': 0.0004924101496623606, 'samples': 2618688, 'steps': 13638, 'loss/train': 1.6274465322494507} -11/06/2021 23:07:54 - INFO - __main__ - Step 13640: {'lr': 0.0004924088519258049, 'samples': 2618880, 'steps': 13639, 'loss/train': 1.567894697189331} -11/06/2021 23:07:55 - INFO - __main__ - Step 13641: {'lr': 0.0004924075540800233, 'samples': 2619072, 'steps': 13640, 'loss/train': 1.5722965002059937} -11/06/2021 23:07:55 - INFO - __main__ - Step 13642: {'lr': 0.0004924062561250167, 'samples': 2619264, 'steps': 13641, 'loss/train': 1.4436631202697754} -11/06/2021 23:07:55 - INFO - __main__ - Step 13643: {'lr': 0.0004924049580607855, 'samples': 2619456, 'steps': 13642, 'loss/train': 1.4802452325820923} -11/06/2021 23:07:56 - INFO - __main__ - Step 13644: {'lr': 0.0004924036598873305, 'samples': 2619648, 'steps': 13643, 'loss/train': 1.4207649230957031} -11/06/2021 23:07:57 - INFO - __main__ - Step 13645: {'lr': 0.0004924023616046521, 'samples': 2619840, 'steps': 13644, 'loss/train': 0.14849276840686798} -11/06/2021 23:07:57 - INFO - __main__ - Step 13646: {'lr': 0.000492401063212751, 'samples': 2620032, 'steps': 13645, 'loss/train': 1.5605554580688477} -11/06/2021 23:07:57 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 0.61855548620224} -11/06/2021 23:07:58 - INFO - __main__ - Step 13648: {'lr': 0.0004923984661012827, 'samples': 2620416, 'steps': 13647, 'loss/train': 1.0472122430801392} -11/06/2021 23:07:58 - INFO - __main__ - Step 13649: {'lr': 0.0004923971673817167, 'samples': 2620608, 'steps': 13648, 'loss/train': 2.2823336124420166} -11/06/2021 23:07:59 - INFO - __main__ - Step 13650: {'lr': 0.0004923958685529303, 'samples': 2620800, 'steps': 13649, 'loss/train': 1.8961249589920044} -11/06/2021 23:07:59 - INFO - __main__ - Step 13651: {'lr': 0.0004923945696149241, 'samples': 2620992, 'steps': 13650, 'loss/train': 1.9037821292877197} -11/06/2021 23:08:00 - INFO - __main__ - Step 13652: {'lr': 0.0004923932705676986, 'samples': 2621184, 'steps': 13651, 'loss/train': 1.549149990081787} -11/06/2021 23:08:00 - INFO - __main__ - Step 13653: {'lr': 0.0004923919714112545, 'samples': 2621376, 'steps': 13652, 'loss/train': 1.5010502338409424} -11/06/2021 23:08:01 - INFO - __main__ - Step 13654: {'lr': 0.0004923906721455922, 'samples': 2621568, 'steps': 13653, 'loss/train': 1.2696095705032349} -11/06/2021 23:08:01 - INFO - __main__ - Step 13655: {'lr': 0.0004923893727707125, 'samples': 2621760, 'steps': 13654, 'loss/train': 2.0763657093048096} -11/06/2021 23:08:02 - INFO - __main__ - Step 13656: {'lr': 0.0004923880732866159, 'samples': 2621952, 'steps': 13655, 'loss/train': 1.3228414058685303} -11/06/2021 23:08:02 - INFO - __main__ - Step 13657: {'lr': 0.0004923867736933029, 'samples': 2622144, 'steps': 13656, 'loss/train': 1.621604323387146} -11/06/2021 23:08:02 - INFO - __main__ - Step 13658: {'lr': 0.0004923854739907743, 'samples': 2622336, 'steps': 13657, 'loss/train': 1.2240080833435059} -11/06/2021 23:08:03 - INFO - __main__ - Step 13659: {'lr': 0.0004923841741790304, 'samples': 2622528, 'steps': 13658, 'loss/train': 1.7025880813598633} -11/06/2021 23:08:04 - INFO - __main__ - Step 13660: {'lr': 0.0004923828742580719, 'samples': 2622720, 'steps': 13659, 'loss/train': 0.8166983723640442} -11/06/2021 23:08:04 - INFO - __main__ - Step 13661: {'lr': 0.0004923815742278996, 'samples': 2622912, 'steps': 13660, 'loss/train': 1.8481582403182983} -11/06/2021 23:08:05 - INFO - __main__ - Step 13662: {'lr': 0.0004923802740885139, 'samples': 2623104, 'steps': 13661, 'loss/train': 1.9549199342727661} -11/06/2021 23:08:05 - INFO - __main__ - Step 13663: {'lr': 0.0004923789738399152, 'samples': 2623296, 'steps': 13662, 'loss/train': 1.5047688484191895} -11/06/2021 23:08:05 - INFO - __main__ - Step 13664: {'lr': 0.0004923776734821044, 'samples': 2623488, 'steps': 13663, 'loss/train': 1.784568190574646} -11/06/2021 23:08:07 - INFO - __main__ - Step 13665: {'lr': 0.0004923763730150819, 'samples': 2623680, 'steps': 13664, 'loss/train': 1.6027264595031738} -11/06/2021 23:08:07 - INFO - __main__ - Step 13666: {'lr': 0.0004923750724388483, 'samples': 2623872, 'steps': 13665, 'loss/train': 1.826322078704834} -11/06/2021 23:08:07 - INFO - __main__ - Step 13667: {'lr': 0.0004923737717534044, 'samples': 2624064, 'steps': 13666, 'loss/train': 1.9176068305969238} -11/06/2021 23:08:08 - INFO - __main__ - Step 13668: {'lr': 0.0004923724709587504, 'samples': 2624256, 'steps': 13667, 'loss/train': 2.2338030338287354} -11/06/2021 23:08:08 - INFO - __main__ - Step 13669: {'lr': 0.0004923711700548873, 'samples': 2624448, 'steps': 13668, 'loss/train': 1.8430683612823486} -11/06/2021 23:08:09 - INFO - __main__ - Step 13670: {'lr': 0.0004923698690418154, 'samples': 2624640, 'steps': 13669, 'loss/train': 0.9396169781684875} -11/06/2021 23:08:09 - INFO - __main__ - Step 13671: {'lr': 0.0004923685679195355, 'samples': 2624832, 'steps': 13670, 'loss/train': 1.6337071657180786} -11/06/2021 23:08:10 - INFO - __main__ - Step 13672: {'lr': 0.0004923672666880479, 'samples': 2625024, 'steps': 13671, 'loss/train': 1.3676971197128296} -11/06/2021 23:08:10 - INFO - __main__ - Step 13673: {'lr': 0.0004923659653473533, 'samples': 2625216, 'steps': 13672, 'loss/train': 1.6104556322097778} -11/06/2021 23:08:10 - INFO - __main__ - Step 13674: {'lr': 0.0004923646638974524, 'samples': 2625408, 'steps': 13673, 'loss/train': 1.3942358493804932} -11/06/2021 23:08:11 - INFO - __main__ - Step 13675: {'lr': 0.0004923633623383459, 'samples': 2625600, 'steps': 13674, 'loss/train': 1.8581507205963135} -11/06/2021 23:08:12 - INFO - __main__ - Step 13676: {'lr': 0.0004923620606700341, 'samples': 2625792, 'steps': 13675, 'loss/train': 1.0747668743133545} -11/06/2021 23:08:12 - INFO - __main__ - Step 13677: {'lr': 0.0004923607588925177, 'samples': 2625984, 'steps': 13676, 'loss/train': 1.7954381704330444} -11/06/2021 23:08:13 - INFO - __main__ - Step 13678: {'lr': 0.0004923594570057972, 'samples': 2626176, 'steps': 13677, 'loss/train': 1.8228819370269775} -11/06/2021 23:08:13 - INFO - __main__ - Step 13679: {'lr': 0.0004923581550098733, 'samples': 2626368, 'steps': 13678, 'loss/train': 1.6954731941223145} -11/06/2021 23:08:13 - INFO - __main__ - Step 13680: {'lr': 0.0004923568529047466, 'samples': 2626560, 'steps': 13679, 'loss/train': 1.7315030097961426} -11/06/2021 23:08:14 - INFO - __main__ - Step 13681: {'lr': 0.0004923555506904176, 'samples': 2626752, 'steps': 13680, 'loss/train': 1.701892614364624} -11/06/2021 23:08:15 - INFO - __main__ - Step 13682: {'lr': 0.0004923542483668869, 'samples': 2626944, 'steps': 13681, 'loss/train': 1.860314130783081} -11/06/2021 23:08:15 - INFO - __main__ - Step 13683: {'lr': 0.0004923529459341553, 'samples': 2627136, 'steps': 13682, 'loss/train': 1.5771002769470215} -11/06/2021 23:08:15 - INFO - __main__ - Step 13684: {'lr': 0.000492351643392223, 'samples': 2627328, 'steps': 13683, 'loss/train': 2.214824914932251} -11/06/2021 23:08:16 - INFO - __main__ - Step 13685: {'lr': 0.0004923503407410908, 'samples': 2627520, 'steps': 13684, 'loss/train': 1.6392228603363037} -11/06/2021 23:08:17 - INFO - __main__ - Step 13686: {'lr': 0.0004923490379807594, 'samples': 2627712, 'steps': 13685, 'loss/train': 1.5940680503845215} -11/06/2021 23:08:17 - INFO - __main__ - Step 13687: {'lr': 0.0004923477351112291, 'samples': 2627904, 'steps': 13686, 'loss/train': 1.3699396848678589} -11/06/2021 23:08:17 - INFO - __main__ - Step 13688: {'lr': 0.0004923464321325008, 'samples': 2628096, 'steps': 13687, 'loss/train': 2.2057156562805176} -11/06/2021 23:08:18 - INFO - __main__ - Step 13689: {'lr': 0.0004923451290445749, 'samples': 2628288, 'steps': 13688, 'loss/train': 1.5960655212402344} -11/06/2021 23:08:18 - INFO - __main__ - Step 13690: {'lr': 0.000492343825847452, 'samples': 2628480, 'steps': 13689, 'loss/train': 2.2023274898529053} -11/06/2021 23:08:19 - INFO - __main__ - Step 13691: {'lr': 0.0004923425225411328, 'samples': 2628672, 'steps': 13690, 'loss/train': 1.8006644248962402} -11/06/2021 23:08:19 - INFO - __main__ - Step 13692: {'lr': 0.0004923412191256176, 'samples': 2628864, 'steps': 13691, 'loss/train': 1.6855508089065552} -11/06/2021 23:08:20 - INFO - __main__ - Step 13693: {'lr': 0.0004923399156009073, 'samples': 2629056, 'steps': 13692, 'loss/train': 1.91086745262146} -11/06/2021 23:08:20 - INFO - __main__ - Step 13694: {'lr': 0.0004923386119670024, 'samples': 2629248, 'steps': 13693, 'loss/train': 2.243964910507202} -11/06/2021 23:08:20 - INFO - __main__ - Step 13695: {'lr': 0.0004923373082239035, 'samples': 2629440, 'steps': 13694, 'loss/train': 1.8091576099395752} -11/06/2021 23:08:21 - INFO - __main__ - Step 13696: {'lr': 0.000492336004371611, 'samples': 2629632, 'steps': 13695, 'loss/train': 1.891566276550293} -11/06/2021 23:08:22 - INFO - __main__ - Step 13697: {'lr': 0.0004923347004101257, 'samples': 2629824, 'steps': 13696, 'loss/train': 1.8870787620544434} -11/06/2021 23:08:22 - INFO - __main__ - Step 13698: {'lr': 0.0004923333963394482, 'samples': 2630016, 'steps': 13697, 'loss/train': 1.609986424446106} -11/06/2021 23:08:22 - INFO - __main__ - Step 13699: {'lr': 0.000492332092159579, 'samples': 2630208, 'steps': 13698, 'loss/train': 1.5685456991195679} -11/06/2021 23:08:23 - INFO - __main__ - Step 13700: {'lr': 0.0004923307878705186, 'samples': 2630400, 'steps': 13699, 'loss/train': 1.4887804985046387} -11/06/2021 23:08:24 - INFO - __main__ - Step 13701: {'lr': 0.0004923294834722678, 'samples': 2630592, 'steps': 13700, 'loss/train': 1.6135252714157104} -11/06/2021 23:08:24 - INFO - __main__ - Step 13702: {'lr': 0.000492328178964827, 'samples': 2630784, 'steps': 13701, 'loss/train': 1.7054436206817627} -11/06/2021 23:08:25 - INFO - __main__ - Step 13703: {'lr': 0.0004923268743481969, 'samples': 2630976, 'steps': 13702, 'loss/train': 1.3338326215744019} -11/06/2021 23:08:25 - INFO - __main__ - Step 13704: {'lr': 0.000492325569622378, 'samples': 2631168, 'steps': 13703, 'loss/train': 1.5167887210845947} -11/06/2021 23:08:25 - INFO - __main__ - Step 13705: {'lr': 0.0004923242647873709, 'samples': 2631360, 'steps': 13704, 'loss/train': 1.7764374017715454} -11/06/2021 23:08:27 - INFO - __main__ - Step 13706: {'lr': 0.0004923229598431763, 'samples': 2631552, 'steps': 13705, 'loss/train': 1.981156349182129} -11/06/2021 23:08:27 - INFO - __main__ - Step 13707: {'lr': 0.0004923216547897948, 'samples': 2631744, 'steps': 13706, 'loss/train': 1.6128805875778198} -11/06/2021 23:08:27 - INFO - __main__ - Step 13708: {'lr': 0.0004923203496272267, 'samples': 2631936, 'steps': 13707, 'loss/train': 1.7675461769104004} -11/06/2021 23:08:28 - INFO - __main__ - Step 13709: {'lr': 0.0004923190443554729, 'samples': 2632128, 'steps': 13708, 'loss/train': 1.66963529586792} -11/06/2021 23:08:28 - INFO - __main__ - Step 13710: {'lr': 0.0004923177389745339, 'samples': 2632320, 'steps': 13709, 'loss/train': 0.4389937222003937} -11/06/2021 23:08:29 - INFO - __main__ - Step 13711: {'lr': 0.0004923164334844103, 'samples': 2632512, 'steps': 13710, 'loss/train': 1.7726091146469116} -11/06/2021 23:08:29 - INFO - __main__ - Step 13712: {'lr': 0.0004923151278851025, 'samples': 2632704, 'steps': 13711, 'loss/train': 0.9735046029090881} -11/06/2021 23:08:30 - INFO - __main__ - Step 13713: {'lr': 0.0004923138221766114, 'samples': 2632896, 'steps': 13712, 'loss/train': 1.4027715921401978} -11/06/2021 23:08:30 - INFO - __main__ - Step 13714: {'lr': 0.0004923125163589373, 'samples': 2633088, 'steps': 13713, 'loss/train': 1.875281572341919} -11/06/2021 23:08:30 - INFO - __main__ - Step 13715: {'lr': 0.0004923112104320811, 'samples': 2633280, 'steps': 13714, 'loss/train': 1.6900665760040283} -11/06/2021 23:08:32 - INFO - __main__ - Step 13716: {'lr': 0.000492309904396043, 'samples': 2633472, 'steps': 13715, 'loss/train': 1.1452865600585938} -11/06/2021 23:08:32 - INFO - __main__ - Step 13717: {'lr': 0.0004923085982508239, 'samples': 2633664, 'steps': 13716, 'loss/train': 1.9100697040557861} -11/06/2021 23:08:32 - INFO - __main__ - Step 13718: {'lr': 0.0004923072919964243, 'samples': 2633856, 'steps': 13717, 'loss/train': 4.524446964263916} -11/06/2021 23:08:33 - INFO - __main__ - Step 13719: {'lr': 0.0004923059856328447, 'samples': 2634048, 'steps': 13718, 'loss/train': 1.5310945510864258} -11/06/2021 23:08:33 - INFO - __main__ - Step 13720: {'lr': 0.0004923046791600859, 'samples': 2634240, 'steps': 13719, 'loss/train': 1.5483694076538086} -11/06/2021 23:08:34 - INFO - __main__ - Step 13721: {'lr': 0.0004923033725781482, 'samples': 2634432, 'steps': 13720, 'loss/train': 1.6037310361862183} -11/06/2021 23:08:34 - INFO - __main__ - Step 13722: {'lr': 0.0004923020658870324, 'samples': 2634624, 'steps': 13721, 'loss/train': 1.3916311264038086} -11/06/2021 23:08:35 - INFO - __main__ - Step 13723: {'lr': 0.000492300759086739, 'samples': 2634816, 'steps': 13722, 'loss/train': 0.19058111310005188} -11/06/2021 23:08:35 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 1.856695532798767} -11/06/2021 23:08:35 - INFO - __main__ - Step 13725: {'lr': 0.000492298145158622, 'samples': 2635200, 'steps': 13724, 'loss/train': 1.6110961437225342} -11/06/2021 23:08:36 - INFO - __main__ - Step 13726: {'lr': 0.0004922968380307994, 'samples': 2635392, 'steps': 13725, 'loss/train': 2.1884765625} -11/06/2021 23:08:37 - INFO - __main__ - Step 13727: {'lr': 0.0004922955307938016, 'samples': 2635584, 'steps': 13726, 'loss/train': 1.4792718887329102} -11/06/2021 23:08:37 - INFO - __main__ - Step 13728: {'lr': 0.0004922942234476292, 'samples': 2635776, 'steps': 13727, 'loss/train': 0.9615477323532104} -11/06/2021 23:08:38 - INFO - __main__ - Step 13729: {'lr': 0.0004922929159922828, 'samples': 2635968, 'steps': 13728, 'loss/train': 1.467282772064209} -11/06/2021 23:08:38 - INFO - __main__ - Step 13730: {'lr': 0.0004922916084277629, 'samples': 2636160, 'steps': 13729, 'loss/train': 1.4172507524490356} -11/06/2021 23:08:38 - INFO - __main__ - Step 13731: {'lr': 0.0004922903007540701, 'samples': 2636352, 'steps': 13730, 'loss/train': 1.9334453344345093} -11/06/2021 23:08:40 - INFO - __main__ - Step 13732: {'lr': 0.0004922889929712051, 'samples': 2636544, 'steps': 13731, 'loss/train': 1.7975131273269653} -11/06/2021 23:08:40 - INFO - __main__ - Step 13733: {'lr': 0.0004922876850791684, 'samples': 2636736, 'steps': 13732, 'loss/train': 1.5812453031539917} -11/06/2021 23:08:40 - INFO - __main__ - Step 13734: {'lr': 0.0004922863770779606, 'samples': 2636928, 'steps': 13733, 'loss/train': 1.761626124382019} -11/06/2021 23:08:41 - INFO - __main__ - Step 13735: {'lr': 0.0004922850689675823, 'samples': 2637120, 'steps': 13734, 'loss/train': 0.9880645275115967} -11/06/2021 23:08:41 - INFO - __main__ - Step 13736: {'lr': 0.0004922837607480341, 'samples': 2637312, 'steps': 13735, 'loss/train': 1.812021255493164} -11/06/2021 23:08:41 - INFO - __main__ - Step 13737: {'lr': 0.0004922824524193166, 'samples': 2637504, 'steps': 13736, 'loss/train': 1.655940055847168} -11/06/2021 23:08:42 - INFO - __main__ - Step 13738: {'lr': 0.0004922811439814303, 'samples': 2637696, 'steps': 13737, 'loss/train': 3.0965065956115723} -11/06/2021 23:08:43 - INFO - __main__ - Step 13739: {'lr': 0.0004922798354343758, 'samples': 2637888, 'steps': 13738, 'loss/train': 1.1980981826782227} -11/06/2021 23:08:43 - INFO - __main__ - Step 13740: {'lr': 0.0004922785267781539, 'samples': 2638080, 'steps': 13739, 'loss/train': 1.4556937217712402} -11/06/2021 23:08:43 - INFO - __main__ - Step 13741: {'lr': 0.000492277218012765, 'samples': 2638272, 'steps': 13740, 'loss/train': 1.6142842769622803} -11/06/2021 23:08:44 - INFO - __main__ - Step 13742: {'lr': 0.0004922759091382097, 'samples': 2638464, 'steps': 13741, 'loss/train': 2.2603096961975098} -11/06/2021 23:08:45 - INFO - __main__ - Step 13743: {'lr': 0.0004922746001544885, 'samples': 2638656, 'steps': 13742, 'loss/train': 1.3596349954605103} -11/06/2021 23:08:45 - INFO - __main__ - Step 13744: {'lr': 0.0004922732910616023, 'samples': 2638848, 'steps': 13743, 'loss/train': 1.9842960834503174} -11/06/2021 23:08:46 - INFO - __main__ - Step 13745: {'lr': 0.0004922719818595514, 'samples': 2639040, 'steps': 13744, 'loss/train': 2.0623526573181152} -11/06/2021 23:08:46 - INFO - __main__ - Step 13746: {'lr': 0.0004922706725483364, 'samples': 2639232, 'steps': 13745, 'loss/train': 1.9149062633514404} -11/06/2021 23:08:46 - INFO - __main__ - Step 13747: {'lr': 0.0004922693631279581, 'samples': 2639424, 'steps': 13746, 'loss/train': 2.0381317138671875} -11/06/2021 23:08:47 - INFO - __main__ - Step 13748: {'lr': 0.000492268053598417, 'samples': 2639616, 'steps': 13747, 'loss/train': 2.627610445022583} -11/06/2021 23:08:48 - INFO - __main__ - Step 13749: {'lr': 0.0004922667439597136, 'samples': 2639808, 'steps': 13748, 'loss/train': 1.306639552116394} -11/06/2021 23:08:48 - INFO - __main__ - Step 13750: {'lr': 0.0004922654342118484, 'samples': 2640000, 'steps': 13749, 'loss/train': 1.3434464931488037} -11/06/2021 23:08:48 - INFO - __main__ - Step 13751: {'lr': 0.0004922641243548223, 'samples': 2640192, 'steps': 13750, 'loss/train': 2.0326554775238037} -11/06/2021 23:08:49 - INFO - __main__ - Step 13752: {'lr': 0.0004922628143886358, 'samples': 2640384, 'steps': 13751, 'loss/train': 2.049717903137207} -11/06/2021 23:08:49 - INFO - __main__ - Step 13753: {'lr': 0.0004922615043132892, 'samples': 2640576, 'steps': 13752, 'loss/train': 1.6888577938079834} -11/06/2021 23:08:50 - INFO - __main__ - Step 13754: {'lr': 0.0004922601941287835, 'samples': 2640768, 'steps': 13753, 'loss/train': 0.9408217668533325} -11/06/2021 23:08:50 - INFO - __main__ - Step 13755: {'lr': 0.0004922588838351189, 'samples': 2640960, 'steps': 13754, 'loss/train': 1.6507468223571777} -11/06/2021 23:08:51 - INFO - __main__ - Step 13756: {'lr': 0.0004922575734322963, 'samples': 2641152, 'steps': 13755, 'loss/train': 1.7679812908172607} -11/06/2021 23:08:51 - INFO - __main__ - Step 13757: {'lr': 0.0004922562629203161, 'samples': 2641344, 'steps': 13756, 'loss/train': 1.271485447883606} -11/06/2021 23:08:51 - INFO - __main__ - Step 13758: {'lr': 0.0004922549522991791, 'samples': 2641536, 'steps': 13757, 'loss/train': 1.955517053604126} -11/06/2021 23:08:53 - INFO - __main__ - Step 13759: {'lr': 0.0004922536415688856, 'samples': 2641728, 'steps': 13758, 'loss/train': 2.06683349609375} -11/06/2021 23:08:53 - INFO - __main__ - Step 13760: {'lr': 0.0004922523307294364, 'samples': 2641920, 'steps': 13759, 'loss/train': 1.354589581489563} -11/06/2021 23:08:53 - INFO - __main__ - Step 13761: {'lr': 0.0004922510197808321, 'samples': 2642112, 'steps': 13760, 'loss/train': 1.9096133708953857} -11/06/2021 23:08:54 - INFO - __main__ - Step 13762: {'lr': 0.0004922497087230732, 'samples': 2642304, 'steps': 13761, 'loss/train': 1.9483925104141235} -11/06/2021 23:08:54 - INFO - __main__ - Step 13763: {'lr': 0.0004922483975561603, 'samples': 2642496, 'steps': 13762, 'loss/train': 2.073777437210083} -11/06/2021 23:08:55 - INFO - __main__ - Step 13764: {'lr': 0.000492247086280094, 'samples': 2642688, 'steps': 13763, 'loss/train': 1.6551817655563354} -11/06/2021 23:08:55 - INFO - __main__ - Step 13765: {'lr': 0.0004922457748948749, 'samples': 2642880, 'steps': 13764, 'loss/train': 1.7662451267242432} -11/06/2021 23:08:56 - INFO - __main__ - Step 13766: {'lr': 0.0004922444634005037, 'samples': 2643072, 'steps': 13765, 'loss/train': 1.595479965209961} -11/06/2021 23:08:56 - INFO - __main__ - Step 13767: {'lr': 0.0004922431517969808, 'samples': 2643264, 'steps': 13766, 'loss/train': 1.6051268577575684} -11/06/2021 23:08:57 - INFO - __main__ - Step 13768: {'lr': 0.0004922418400843068, 'samples': 2643456, 'steps': 13767, 'loss/train': 0.942782461643219} -11/06/2021 23:08:58 - INFO - __main__ - Step 13769: {'lr': 0.0004922405282624825, 'samples': 2643648, 'steps': 13768, 'loss/train': 0.8302810788154602} -11/06/2021 23:08:58 - INFO - __main__ - Step 13770: {'lr': 0.0004922392163315083, 'samples': 2643840, 'steps': 13769, 'loss/train': 2.0029447078704834} -11/06/2021 23:08:58 - INFO - __main__ - Step 13771: {'lr': 0.0004922379042913848, 'samples': 2644032, 'steps': 13770, 'loss/train': 1.7818113565444946} -11/06/2021 23:08:59 - INFO - __main__ - Step 13772: {'lr': 0.0004922365921421126, 'samples': 2644224, 'steps': 13771, 'loss/train': 2.0600786209106445} -11/06/2021 23:08:59 - INFO - __main__ - Step 13773: {'lr': 0.0004922352798836924, 'samples': 2644416, 'steps': 13772, 'loss/train': 2.0496914386749268} -11/06/2021 23:09:00 - INFO - __main__ - Step 13774: {'lr': 0.0004922339675161248, 'samples': 2644608, 'steps': 13773, 'loss/train': 1.9038617610931396} -11/06/2021 23:09:00 - INFO - __main__ - Step 13775: {'lr': 0.0004922326550394102, 'samples': 2644800, 'steps': 13774, 'loss/train': 1.3252359628677368} -11/06/2021 23:09:01 - INFO - __main__ - Step 13776: {'lr': 0.0004922313424535494, 'samples': 2644992, 'steps': 13775, 'loss/train': 1.8318666219711304} -11/06/2021 23:09:01 - INFO - __main__ - Step 13777: {'lr': 0.0004922300297585428, 'samples': 2645184, 'steps': 13776, 'loss/train': 2.127047061920166} -11/06/2021 23:09:01 - INFO - __main__ - Step 13778: {'lr': 0.0004922287169543911, 'samples': 2645376, 'steps': 13777, 'loss/train': 1.2675795555114746} -11/06/2021 23:09:02 - INFO - __main__ - Step 13779: {'lr': 0.0004922274040410949, 'samples': 2645568, 'steps': 13778, 'loss/train': 1.7878961563110352} -11/06/2021 23:09:03 - INFO - __main__ - Step 13780: {'lr': 0.0004922260910186548, 'samples': 2645760, 'steps': 13779, 'loss/train': 1.97649085521698} -11/06/2021 23:09:03 - INFO - __main__ - Step 13781: {'lr': 0.0004922247778870714, 'samples': 2645952, 'steps': 13780, 'loss/train': 1.6250098943710327} -11/06/2021 23:09:04 - INFO - __main__ - Step 13782: {'lr': 0.0004922234646463451, 'samples': 2646144, 'steps': 13781, 'loss/train': 1.9466784000396729} -11/06/2021 23:09:04 - INFO - __main__ - Step 13783: {'lr': 0.0004922221512964767, 'samples': 2646336, 'steps': 13782, 'loss/train': 1.1106783151626587} -11/06/2021 23:09:04 - INFO - __main__ - Step 13784: {'lr': 0.0004922208378374668, 'samples': 2646528, 'steps': 13783, 'loss/train': 2.0252909660339355} -11/06/2021 23:09:05 - INFO - __main__ - Step 13785: {'lr': 0.0004922195242693159, 'samples': 2646720, 'steps': 13784, 'loss/train': 1.6497094631195068} -11/06/2021 23:09:06 - INFO - __main__ - Step 13786: {'lr': 0.0004922182105920246, 'samples': 2646912, 'steps': 13785, 'loss/train': 1.4474611282348633} -11/06/2021 23:09:06 - INFO - __main__ - Step 13787: {'lr': 0.0004922168968055935, 'samples': 2647104, 'steps': 13786, 'loss/train': 2.291621446609497} -11/06/2021 23:09:06 - INFO - __main__ - Step 13788: {'lr': 0.0004922155829100233, 'samples': 2647296, 'steps': 13787, 'loss/train': 2.148526668548584} -11/06/2021 23:09:07 - INFO - __main__ - Step 13789: {'lr': 0.0004922142689053144, 'samples': 2647488, 'steps': 13788, 'loss/train': 1.9192496538162231} -11/06/2021 23:09:08 - INFO - __main__ - Step 13790: {'lr': 0.0004922129547914675, 'samples': 2647680, 'steps': 13789, 'loss/train': 2.097891330718994} -11/06/2021 23:09:08 - INFO - __main__ - Step 13791: {'lr': 0.0004922116405684832, 'samples': 2647872, 'steps': 13790, 'loss/train': 1.7721515893936157} -11/06/2021 23:09:08 - INFO - __main__ - Step 13792: {'lr': 0.0004922103262363621, 'samples': 2648064, 'steps': 13791, 'loss/train': 1.5414934158325195} -11/06/2021 23:09:09 - INFO - __main__ - Step 13793: {'lr': 0.0004922090117951047, 'samples': 2648256, 'steps': 13792, 'loss/train': 2.323873519897461} -11/06/2021 23:09:09 - INFO - __main__ - Step 13794: {'lr': 0.0004922076972447117, 'samples': 2648448, 'steps': 13793, 'loss/train': 1.157942533493042} -11/06/2021 23:09:10 - INFO - __main__ - Step 13795: {'lr': 0.0004922063825851836, 'samples': 2648640, 'steps': 13794, 'loss/train': 1.609661340713501} -11/06/2021 23:09:10 - INFO - __main__ - Step 13796: {'lr': 0.0004922050678165211, 'samples': 2648832, 'steps': 13795, 'loss/train': 0.9388356804847717} -11/06/2021 23:09:11 - INFO - __main__ - Step 13797: {'lr': 0.0004922037529387247, 'samples': 2649024, 'steps': 13796, 'loss/train': 1.7672147750854492} -11/06/2021 23:09:11 - INFO - __main__ - Step 13798: {'lr': 0.000492202437951795, 'samples': 2649216, 'steps': 13797, 'loss/train': 1.639959454536438} -11/06/2021 23:09:11 - INFO - __main__ - Step 13799: {'lr': 0.0004922011228557327, 'samples': 2649408, 'steps': 13798, 'loss/train': 1.4303568601608276} -11/06/2021 23:09:13 - INFO - __main__ - Step 13800: {'lr': 0.0004921998076505383, 'samples': 2649600, 'steps': 13799, 'loss/train': 1.8134762048721313} -11/06/2021 23:09:13 - INFO - __main__ - Step 13801: {'lr': 0.0004921984923362124, 'samples': 2649792, 'steps': 13800, 'loss/train': 1.5940922498703003} -11/06/2021 23:09:13 - INFO - __main__ - Step 13802: {'lr': 0.0004921971769127555, 'samples': 2649984, 'steps': 13801, 'loss/train': 1.1051990985870361} -11/06/2021 23:09:14 - INFO - __main__ - Step 13803: {'lr': 0.0004921958613801683, 'samples': 2650176, 'steps': 13802, 'loss/train': 1.5847387313842773} -11/06/2021 23:09:14 - INFO - __main__ - Step 13804: {'lr': 0.0004921945457384516, 'samples': 2650368, 'steps': 13803, 'loss/train': 1.840270757675171} -11/06/2021 23:09:15 - INFO - __main__ - Step 13805: {'lr': 0.0004921932299876055, 'samples': 2650560, 'steps': 13804, 'loss/train': 1.712327241897583} -11/06/2021 23:09:15 - INFO - __main__ - Step 13806: {'lr': 0.000492191914127631, 'samples': 2650752, 'steps': 13805, 'loss/train': 2.4084267616271973} -11/06/2021 23:09:16 - INFO - __main__ - Step 13807: {'lr': 0.0004921905981585286, 'samples': 2650944, 'steps': 13806, 'loss/train': 1.3894824981689453} -11/06/2021 23:09:16 - INFO - __main__ - Step 13808: {'lr': 0.0004921892820802988, 'samples': 2651136, 'steps': 13807, 'loss/train': 1.7391257286071777} -11/06/2021 23:09:16 - INFO - __main__ - Step 13809: {'lr': 0.0004921879658929422, 'samples': 2651328, 'steps': 13808, 'loss/train': 4.748656272888184} -11/06/2021 23:09:17 - INFO - __main__ - Step 13810: {'lr': 0.0004921866495964594, 'samples': 2651520, 'steps': 13809, 'loss/train': 1.1638247966766357} -11/06/2021 23:09:18 - INFO - __main__ - Step 13811: {'lr': 0.0004921853331908512, 'samples': 2651712, 'steps': 13810, 'loss/train': 1.9072991609573364} -11/06/2021 23:09:18 - INFO - __main__ - Step 13812: {'lr': 0.000492184016676118, 'samples': 2651904, 'steps': 13811, 'loss/train': 2.309782028198242} -11/06/2021 23:09:18 - INFO - __main__ - Step 13813: {'lr': 0.0004921827000522603, 'samples': 2652096, 'steps': 13812, 'loss/train': 1.5911425352096558} -11/06/2021 23:09:19 - INFO - __main__ - Step 13814: {'lr': 0.0004921813833192788, 'samples': 2652288, 'steps': 13813, 'loss/train': 1.9693739414215088} -11/06/2021 23:09:19 - INFO - __main__ - Step 13815: {'lr': 0.0004921800664771743, 'samples': 2652480, 'steps': 13814, 'loss/train': 1.7779452800750732} -11/06/2021 23:09:20 - INFO - __main__ - Step 13816: {'lr': 0.0004921787495259471, 'samples': 2652672, 'steps': 13815, 'loss/train': 1.5039100646972656} -11/06/2021 23:09:21 - INFO - __main__ - Step 13817: {'lr': 0.0004921774324655978, 'samples': 2652864, 'steps': 13816, 'loss/train': 1.054052472114563} -11/06/2021 23:09:21 - INFO - __main__ - Step 13818: {'lr': 0.0004921761152961271, 'samples': 2653056, 'steps': 13817, 'loss/train': 2.0499536991119385} -11/06/2021 23:09:21 - INFO - __main__ - Step 13819: {'lr': 0.0004921747980175357, 'samples': 2653248, 'steps': 13818, 'loss/train': 1.8573100566864014} -11/06/2021 23:09:22 - INFO - __main__ - Step 13820: {'lr': 0.0004921734806298241, 'samples': 2653440, 'steps': 13819, 'loss/train': 1.531470775604248} -11/06/2021 23:09:23 - INFO - __main__ - Step 13821: {'lr': 0.0004921721631329927, 'samples': 2653632, 'steps': 13820, 'loss/train': 3.0055086612701416} -11/06/2021 23:09:23 - INFO - __main__ - Step 13822: {'lr': 0.0004921708455270424, 'samples': 2653824, 'steps': 13821, 'loss/train': 1.5940738916397095} -11/06/2021 23:09:23 - INFO - __main__ - Step 13823: {'lr': 0.0004921695278119736, 'samples': 2654016, 'steps': 13822, 'loss/train': 2.001136541366577} -11/06/2021 23:09:24 - INFO - __main__ - Step 13824: {'lr': 0.0004921682099877869, 'samples': 2654208, 'steps': 13823, 'loss/train': 1.7149298191070557} -11/06/2021 23:09:24 - INFO - __main__ - Step 13825: {'lr': 0.000492166892054483, 'samples': 2654400, 'steps': 13824, 'loss/train': 1.6777122020721436} -11/06/2021 23:09:25 - INFO - __main__ - Step 13826: {'lr': 0.0004921655740120623, 'samples': 2654592, 'steps': 13825, 'loss/train': 1.5764762163162231} -11/06/2021 23:09:25 - INFO - __main__ - Step 13827: {'lr': 0.0004921642558605257, 'samples': 2654784, 'steps': 13826, 'loss/train': 1.0914108753204346} -11/06/2021 23:09:26 - INFO - __main__ - Step 13828: {'lr': 0.0004921629375998736, 'samples': 2654976, 'steps': 13827, 'loss/train': 1.5501351356506348} -11/06/2021 23:09:26 - INFO - __main__ - Step 13829: {'lr': 0.0004921616192301065, 'samples': 2655168, 'steps': 13828, 'loss/train': 0.7807660102844238} -11/06/2021 23:09:26 - INFO - __main__ - Step 13830: {'lr': 0.0004921603007512253, 'samples': 2655360, 'steps': 13829, 'loss/train': 1.8146405220031738} -11/06/2021 23:09:28 - INFO - __main__ - Step 13831: {'lr': 0.0004921589821632302, 'samples': 2655552, 'steps': 13830, 'loss/train': 1.731347680091858} -11/06/2021 23:09:28 - INFO - __main__ - Step 13832: {'lr': 0.0004921576634661221, 'samples': 2655744, 'steps': 13831, 'loss/train': 1.670548439025879} -11/06/2021 23:09:28 - INFO - __main__ - Step 13833: {'lr': 0.0004921563446599015, 'samples': 2655936, 'steps': 13832, 'loss/train': 1.5320069789886475} -11/06/2021 23:09:29 - INFO - __main__ - Step 13834: {'lr': 0.000492155025744569, 'samples': 2656128, 'steps': 13833, 'loss/train': 1.0628443956375122} -11/06/2021 23:09:29 - INFO - __main__ - Step 13835: {'lr': 0.0004921537067201252, 'samples': 2656320, 'steps': 13834, 'loss/train': 2.1405911445617676} -11/06/2021 23:09:30 - INFO - __main__ - Step 13836: {'lr': 0.0004921523875865706, 'samples': 2656512, 'steps': 13835, 'loss/train': 1.0246696472167969} -11/06/2021 23:09:30 - INFO - __main__ - Step 13837: {'lr': 0.000492151068343906, 'samples': 2656704, 'steps': 13836, 'loss/train': 1.8948359489440918} -11/06/2021 23:09:31 - INFO - __main__ - Step 13838: {'lr': 0.0004921497489921318, 'samples': 2656896, 'steps': 13837, 'loss/train': 1.7364670038223267} -11/06/2021 23:09:31 - INFO - __main__ - Step 13839: {'lr': 0.0004921484295312485, 'samples': 2657088, 'steps': 13838, 'loss/train': 1.4942817687988281} -11/06/2021 23:09:31 - INFO - __main__ - Step 13840: {'lr': 0.0004921471099612571, 'samples': 2657280, 'steps': 13839, 'loss/train': 1.2678571939468384} -11/06/2021 23:09:32 - INFO - __main__ - Step 13841: {'lr': 0.0004921457902821578, 'samples': 2657472, 'steps': 13840, 'loss/train': 1.7979927062988281} -11/06/2021 23:09:33 - INFO - __main__ - Step 13842: {'lr': 0.0004921444704939514, 'samples': 2657664, 'steps': 13841, 'loss/train': 1.2086461782455444} -11/06/2021 23:09:33 - INFO - __main__ - Step 13843: {'lr': 0.0004921431505966384, 'samples': 2657856, 'steps': 13842, 'loss/train': 2.1114842891693115} -11/06/2021 23:09:33 - INFO - __main__ - Step 13844: {'lr': 0.0004921418305902194, 'samples': 2658048, 'steps': 13843, 'loss/train': 1.7268887758255005} -11/06/2021 23:09:34 - INFO - __main__ - Step 13845: {'lr': 0.0004921405104746951, 'samples': 2658240, 'steps': 13844, 'loss/train': 1.4159009456634521} -11/06/2021 23:09:35 - INFO - __main__ - Step 13846: {'lr': 0.0004921391902500661, 'samples': 2658432, 'steps': 13845, 'loss/train': 0.772130012512207} -11/06/2021 23:09:35 - INFO - __main__ - Step 13847: {'lr': 0.0004921378699163328, 'samples': 2658624, 'steps': 13846, 'loss/train': 1.6413114070892334} -11/06/2021 23:09:35 - INFO - __main__ - Step 13848: {'lr': 0.0004921365494734959, 'samples': 2658816, 'steps': 13847, 'loss/train': 2.0871777534484863} -11/06/2021 23:09:36 - INFO - __main__ - Step 13849: {'lr': 0.0004921352289215561, 'samples': 2659008, 'steps': 13848, 'loss/train': 1.6378384828567505} -11/06/2021 23:09:36 - INFO - __main__ - Step 13850: {'lr': 0.0004921339082605137, 'samples': 2659200, 'steps': 13849, 'loss/train': 1.849760890007019} -11/06/2021 23:09:37 - INFO - __main__ - Step 13851: {'lr': 0.0004921325874903697, 'samples': 2659392, 'steps': 13850, 'loss/train': 1.766753077507019} -11/06/2021 23:09:38 - INFO - __main__ - Step 13852: {'lr': 0.0004921312666111245, 'samples': 2659584, 'steps': 13851, 'loss/train': 1.397715449333191} -11/06/2021 23:09:38 - INFO - __main__ - Step 13853: {'lr': 0.0004921299456227785, 'samples': 2659776, 'steps': 13852, 'loss/train': 1.6967663764953613} -11/06/2021 23:09:38 - INFO - __main__ - Step 13854: {'lr': 0.0004921286245253327, 'samples': 2659968, 'steps': 13853, 'loss/train': 1.3301624059677124} -11/06/2021 23:09:39 - INFO - __main__ - Step 13855: {'lr': 0.0004921273033187874, 'samples': 2660160, 'steps': 13854, 'loss/train': 2.2361197471618652} -11/06/2021 23:09:39 - INFO - __main__ - Step 13856: {'lr': 0.0004921259820031431, 'samples': 2660352, 'steps': 13855, 'loss/train': 1.5160555839538574} -11/06/2021 23:09:40 - INFO - __main__ - Step 13857: {'lr': 0.0004921246605784008, 'samples': 2660544, 'steps': 13856, 'loss/train': 1.797963261604309} -11/06/2021 23:09:40 - INFO - __main__ - Step 13858: {'lr': 0.0004921233390445608, 'samples': 2660736, 'steps': 13857, 'loss/train': 1.6788036823272705} -11/06/2021 23:09:41 - INFO - __main__ - Step 13859: {'lr': 0.0004921220174016238, 'samples': 2660928, 'steps': 13858, 'loss/train': 1.196427345275879} -11/06/2021 23:09:41 - INFO - __main__ - Step 13860: {'lr': 0.0004921206956495903, 'samples': 2661120, 'steps': 13859, 'loss/train': 0.5547469854354858} -11/06/2021 23:09:42 - INFO - __main__ - Step 13861: {'lr': 0.000492119373788461, 'samples': 2661312, 'steps': 13860, 'loss/train': 1.9061776399612427} -11/06/2021 23:09:42 - INFO - __main__ - Step 13862: {'lr': 0.0004921180518182363, 'samples': 2661504, 'steps': 13861, 'loss/train': 1.7613266706466675} -11/06/2021 23:09:43 - INFO - __main__ - Step 13863: {'lr': 0.0004921167297389171, 'samples': 2661696, 'steps': 13862, 'loss/train': 1.3482214212417603} -11/06/2021 23:09:43 - INFO - __main__ - Step 13864: {'lr': 0.0004921154075505038, 'samples': 2661888, 'steps': 13863, 'loss/train': 1.8354885578155518} -11/06/2021 23:09:44 - INFO - __main__ - Step 13865: {'lr': 0.0004921140852529969, 'samples': 2662080, 'steps': 13864, 'loss/train': 1.8951635360717773} -11/06/2021 23:09:44 - INFO - __main__ - Step 13866: {'lr': 0.0004921127628463972, 'samples': 2662272, 'steps': 13865, 'loss/train': 1.8773669004440308} -11/06/2021 23:09:44 - INFO - __main__ - Step 13867: {'lr': 0.0004921114403307053, 'samples': 2662464, 'steps': 13866, 'loss/train': 1.8073745965957642} -11/06/2021 23:09:45 - INFO - __main__ - Step 13868: {'lr': 0.0004921101177059218, 'samples': 2662656, 'steps': 13867, 'loss/train': 2.099315881729126} -11/06/2021 23:09:46 - INFO - __main__ - Step 13869: {'lr': 0.0004921087949720471, 'samples': 2662848, 'steps': 13868, 'loss/train': 1.927840232849121} -11/06/2021 23:09:46 - INFO - __main__ - Step 13870: {'lr': 0.0004921074721290819, 'samples': 2663040, 'steps': 13869, 'loss/train': 1.8711230754852295} -11/06/2021 23:09:46 - INFO - __main__ - Step 13871: {'lr': 0.0004921061491770268, 'samples': 2663232, 'steps': 13870, 'loss/train': 1.5287330150604248} -11/06/2021 23:09:47 - INFO - __main__ - Step 13872: {'lr': 0.0004921048261158825, 'samples': 2663424, 'steps': 13871, 'loss/train': 1.6624870300292969} -11/06/2021 23:09:48 - INFO - __main__ - Step 13873: {'lr': 0.0004921035029456493, 'samples': 2663616, 'steps': 13872, 'loss/train': 1.8428698778152466} -11/06/2021 23:09:48 - INFO - __main__ - Step 13874: {'lr': 0.0004921021796663282, 'samples': 2663808, 'steps': 13873, 'loss/train': 1.4383753538131714} -11/06/2021 23:09:49 - INFO - __main__ - Step 13875: {'lr': 0.0004921008562779195, 'samples': 2664000, 'steps': 13874, 'loss/train': 1.4360547065734863} -11/06/2021 23:09:49 - INFO - __main__ - Step 13876: {'lr': 0.0004920995327804239, 'samples': 2664192, 'steps': 13875, 'loss/train': 1.6160893440246582} -11/06/2021 23:09:49 - INFO - __main__ - Step 13877: {'lr': 0.000492098209173842, 'samples': 2664384, 'steps': 13876, 'loss/train': 1.0459492206573486} -11/06/2021 23:09:50 - INFO - __main__ - Step 13878: {'lr': 0.0004920968854581745, 'samples': 2664576, 'steps': 13877, 'loss/train': 1.7214491367340088} -11/06/2021 23:09:51 - INFO - __main__ - Step 13879: {'lr': 0.0004920955616334216, 'samples': 2664768, 'steps': 13878, 'loss/train': 1.4879608154296875} -11/06/2021 23:09:51 - INFO - __main__ - Step 13880: {'lr': 0.0004920942376995844, 'samples': 2664960, 'steps': 13879, 'loss/train': 1.7275727987289429} -11/06/2021 23:09:51 - INFO - __main__ - Step 13881: {'lr': 0.0004920929136566632, 'samples': 2665152, 'steps': 13880, 'loss/train': 1.556997299194336} -11/06/2021 23:09:52 - INFO - __main__ - Step 13882: {'lr': 0.0004920915895046587, 'samples': 2665344, 'steps': 13881, 'loss/train': 1.629291296005249} -11/06/2021 23:09:52 - INFO - __main__ - Step 13883: {'lr': 0.0004920902652435715, 'samples': 2665536, 'steps': 13882, 'loss/train': 2.0257277488708496} -11/06/2021 23:09:53 - INFO - __main__ - Step 13884: {'lr': 0.0004920889408734021, 'samples': 2665728, 'steps': 13883, 'loss/train': 1.8871136903762817} -11/06/2021 23:09:53 - INFO - __main__ - Step 13885: {'lr': 0.0004920876163941511, 'samples': 2665920, 'steps': 13884, 'loss/train': 1.1255569458007812} -11/06/2021 23:09:54 - INFO - __main__ - Step 13886: {'lr': 0.0004920862918058192, 'samples': 2666112, 'steps': 13885, 'loss/train': 1.7489358186721802} -11/06/2021 23:09:54 - INFO - __main__ - Step 13887: {'lr': 0.000492084967108407, 'samples': 2666304, 'steps': 13886, 'loss/train': 2.234173536300659} -11/06/2021 23:09:54 - INFO - __main__ - Step 13888: {'lr': 0.000492083642301915, 'samples': 2666496, 'steps': 13887, 'loss/train': 1.7307212352752686} -11/06/2021 23:09:56 - INFO - __main__ - Step 13889: {'lr': 0.0004920823173863439, 'samples': 2666688, 'steps': 13888, 'loss/train': 1.4370955228805542} -11/06/2021 23:09:56 - INFO - __main__ - Step 13890: {'lr': 0.0004920809923616942, 'samples': 2666880, 'steps': 13889, 'loss/train': 1.8873080015182495} -11/06/2021 23:09:56 - INFO - __main__ - Step 13891: {'lr': 0.0004920796672279666, 'samples': 2667072, 'steps': 13890, 'loss/train': 1.8920522928237915} -11/06/2021 23:09:57 - INFO - __main__ - Step 13892: {'lr': 0.0004920783419851615, 'samples': 2667264, 'steps': 13891, 'loss/train': 5.647333145141602} -11/06/2021 23:09:57 - INFO - __main__ - Step 13893: {'lr': 0.0004920770166332798, 'samples': 2667456, 'steps': 13892, 'loss/train': 1.972109317779541} -11/06/2021 23:09:57 - INFO - __main__ - Step 13894: {'lr': 0.0004920756911723219, 'samples': 2667648, 'steps': 13893, 'loss/train': 2.5524847507476807} -11/06/2021 23:09:59 - INFO - __main__ - Step 13895: {'lr': 0.0004920743656022884, 'samples': 2667840, 'steps': 13894, 'loss/train': 1.815747618675232} -11/06/2021 23:09:59 - INFO - __main__ - Step 13896: {'lr': 0.0004920730399231799, 'samples': 2668032, 'steps': 13895, 'loss/train': 1.4550343751907349} -11/06/2021 23:09:59 - INFO - __main__ - Step 13897: {'lr': 0.000492071714134997, 'samples': 2668224, 'steps': 13896, 'loss/train': 1.4864250421524048} -11/06/2021 23:10:00 - INFO - __main__ - Step 13898: {'lr': 0.0004920703882377403, 'samples': 2668416, 'steps': 13897, 'loss/train': 1.741361141204834} -11/06/2021 23:10:00 - INFO - __main__ - Step 13899: {'lr': 0.0004920690622314105, 'samples': 2668608, 'steps': 13898, 'loss/train': 2.994898796081543} -11/06/2021 23:10:01 - INFO - __main__ - Step 13900: {'lr': 0.0004920677361160081, 'samples': 2668800, 'steps': 13899, 'loss/train': 1.8634357452392578} -11/06/2021 23:10:01 - INFO - __main__ - Step 13901: {'lr': 0.0004920664098915337, 'samples': 2668992, 'steps': 13900, 'loss/train': 1.6608809232711792} -11/06/2021 23:10:02 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.932618260383606} -11/06/2021 23:10:02 - INFO - __main__ - Step 13903: {'lr': 0.0004920637571153713, 'samples': 2669376, 'steps': 13902, 'loss/train': 1.4454110860824585} -11/06/2021 23:10:02 - INFO - __main__ - Step 13904: {'lr': 0.0004920624305636846, 'samples': 2669568, 'steps': 13903, 'loss/train': 1.8593177795410156} -11/06/2021 23:10:03 - INFO - __main__ - Step 13905: {'lr': 0.0004920611039029283, 'samples': 2669760, 'steps': 13904, 'loss/train': 1.7864686250686646} -11/06/2021 23:10:05 - INFO - __main__ - Step 13906: {'lr': 0.0004920597771331029, 'samples': 2669952, 'steps': 13905, 'loss/train': 2.002392292022705} -11/06/2021 23:10:05 - INFO - __main__ - Step 13907: {'lr': 0.0004920584502542091, 'samples': 2670144, 'steps': 13906, 'loss/train': 0.30893194675445557} -11/06/2021 23:10:06 - INFO - __main__ - Step 13908: {'lr': 0.0004920571232662475, 'samples': 2670336, 'steps': 13907, 'loss/train': 1.9505276679992676} -11/06/2021 23:10:06 - INFO - __main__ - Step 13909: {'lr': 0.0004920557961692188, 'samples': 2670528, 'steps': 13908, 'loss/train': 1.9398505687713623} -11/06/2021 23:10:06 - INFO - __main__ - Step 13910: {'lr': 0.0004920544689631233, 'samples': 2670720, 'steps': 13909, 'loss/train': 2.0230226516723633} -11/06/2021 23:10:07 - INFO - __main__ - Step 13911: {'lr': 0.000492053141647962, 'samples': 2670912, 'steps': 13910, 'loss/train': 1.8889321088790894} -11/06/2021 23:10:07 - INFO - __main__ - Step 13912: {'lr': 0.0004920518142237352, 'samples': 2671104, 'steps': 13911, 'loss/train': 1.33417809009552} -11/06/2021 23:10:07 - INFO - __main__ - Step 13913: {'lr': 0.0004920504866904436, 'samples': 2671296, 'steps': 13912, 'loss/train': 1.29556143283844} -11/06/2021 23:10:09 - INFO - __main__ - Step 13914: {'lr': 0.0004920491590480878, 'samples': 2671488, 'steps': 13913, 'loss/train': 1.9679369926452637} -11/06/2021 23:10:09 - INFO - __main__ - Step 13915: {'lr': 0.0004920478312966683, 'samples': 2671680, 'steps': 13914, 'loss/train': 1.3328757286071777} -11/06/2021 23:10:09 - INFO - __main__ - Step 13916: {'lr': 0.0004920465034361859, 'samples': 2671872, 'steps': 13915, 'loss/train': 1.5501303672790527} -11/06/2021 23:10:10 - INFO - __main__ - Step 13917: {'lr': 0.000492045175466641, 'samples': 2672064, 'steps': 13916, 'loss/train': 1.871131181716919} -11/06/2021 23:10:10 - INFO - __main__ - Step 13918: {'lr': 0.0004920438473880344, 'samples': 2672256, 'steps': 13917, 'loss/train': 2.702326536178589} -11/06/2021 23:10:11 - INFO - __main__ - Step 13919: {'lr': 0.0004920425192003663, 'samples': 2672448, 'steps': 13918, 'loss/train': 1.7303717136383057} -11/06/2021 23:10:11 - INFO - __main__ - Step 13920: {'lr': 0.0004920411909036379, 'samples': 2672640, 'steps': 13919, 'loss/train': 1.9704726934432983} -11/06/2021 23:10:12 - INFO - __main__ - Step 13921: {'lr': 0.0004920398624978493, 'samples': 2672832, 'steps': 13920, 'loss/train': 1.4717364311218262} -11/06/2021 23:10:12 - INFO - __main__ - Step 13922: {'lr': 0.0004920385339830012, 'samples': 2673024, 'steps': 13921, 'loss/train': 1.7774920463562012} -11/06/2021 23:10:12 - INFO - __main__ - Step 13923: {'lr': 0.0004920372053590945, 'samples': 2673216, 'steps': 13922, 'loss/train': 1.853239893913269} -11/06/2021 23:10:13 - INFO - __main__ - Step 13924: {'lr': 0.0004920358766261294, 'samples': 2673408, 'steps': 13923, 'loss/train': 1.9390660524368286} -11/06/2021 23:10:14 - INFO - __main__ - Step 13925: {'lr': 0.0004920345477841067, 'samples': 2673600, 'steps': 13924, 'loss/train': 2.0693888664245605} -11/06/2021 23:10:14 - INFO - __main__ - Step 13926: {'lr': 0.000492033218833027, 'samples': 2673792, 'steps': 13925, 'loss/train': 1.8519387245178223} -11/06/2021 23:10:14 - INFO - __main__ - Step 13927: {'lr': 0.0004920318897728909, 'samples': 2673984, 'steps': 13926, 'loss/train': 1.803276538848877} -11/06/2021 23:10:15 - INFO - __main__ - Step 13928: {'lr': 0.0004920305606036988, 'samples': 2674176, 'steps': 13927, 'loss/train': 1.768867015838623} -11/06/2021 23:10:16 - INFO - __main__ - Step 13929: {'lr': 0.0004920292313254516, 'samples': 2674368, 'steps': 13928, 'loss/train': 2.1696088314056396} -11/06/2021 23:10:16 - INFO - __main__ - Step 13930: {'lr': 0.0004920279019381497, 'samples': 2674560, 'steps': 13929, 'loss/train': 2.3505563735961914} -11/06/2021 23:10:16 - INFO - __main__ - Step 13931: {'lr': 0.0004920265724417938, 'samples': 2674752, 'steps': 13930, 'loss/train': 0.4778132736682892} -11/06/2021 23:10:17 - INFO - __main__ - Step 13932: {'lr': 0.0004920252428363845, 'samples': 2674944, 'steps': 13931, 'loss/train': 1.7751408815383911} -11/06/2021 23:10:17 - INFO - __main__ - Step 13933: {'lr': 0.0004920239131219223, 'samples': 2675136, 'steps': 13932, 'loss/train': 0.7648064494132996} -11/06/2021 23:10:18 - INFO - __main__ - Step 13934: {'lr': 0.0004920225832984079, 'samples': 2675328, 'steps': 13933, 'loss/train': 1.5931404829025269} -11/06/2021 23:10:18 - INFO - __main__ - Step 13935: {'lr': 0.0004920212533658419, 'samples': 2675520, 'steps': 13934, 'loss/train': 2.218579053878784} -11/06/2021 23:10:19 - INFO - __main__ - Step 13936: {'lr': 0.0004920199233242247, 'samples': 2675712, 'steps': 13935, 'loss/train': 1.7814935445785522} -11/06/2021 23:10:19 - INFO - __main__ - Step 13937: {'lr': 0.0004920185931735572, 'samples': 2675904, 'steps': 13936, 'loss/train': 1.8334205150604248} -11/06/2021 23:10:20 - INFO - __main__ - Step 13938: {'lr': 0.0004920172629138399, 'samples': 2676096, 'steps': 13937, 'loss/train': 1.7788243293762207} -11/06/2021 23:10:20 - INFO - __main__ - Step 13939: {'lr': 0.0004920159325450731, 'samples': 2676288, 'steps': 13938, 'loss/train': 1.6450157165527344} -11/06/2021 23:10:21 - INFO - __main__ - Step 13940: {'lr': 0.0004920146020672578, 'samples': 2676480, 'steps': 13939, 'loss/train': 1.6414921283721924} -11/06/2021 23:10:21 - INFO - __main__ - Step 13941: {'lr': 0.0004920132714803946, 'samples': 2676672, 'steps': 13940, 'loss/train': 1.8297538757324219} -11/06/2021 23:10:22 - INFO - __main__ - Step 13942: {'lr': 0.0004920119407844838, 'samples': 2676864, 'steps': 13941, 'loss/train': 1.148298978805542} -11/06/2021 23:10:22 - INFO - __main__ - Step 13943: {'lr': 0.0004920106099795262, 'samples': 2677056, 'steps': 13942, 'loss/train': 2.2544357776641846} -11/06/2021 23:10:22 - INFO - __main__ - Step 13944: {'lr': 0.0004920092790655224, 'samples': 2677248, 'steps': 13943, 'loss/train': 2.0402214527130127} -11/06/2021 23:10:24 - INFO - __main__ - Step 13945: {'lr': 0.0004920079480424728, 'samples': 2677440, 'steps': 13944, 'loss/train': 1.6051249504089355} -11/06/2021 23:10:24 - INFO - __main__ - Step 13946: {'lr': 0.0004920066169103783, 'samples': 2677632, 'steps': 13945, 'loss/train': 1.0051872730255127} -11/06/2021 23:10:24 - INFO - __main__ - Step 13947: {'lr': 0.0004920052856692394, 'samples': 2677824, 'steps': 13946, 'loss/train': 1.7988791465759277} -11/06/2021 23:10:25 - INFO - __main__ - Step 13948: {'lr': 0.0004920039543190565, 'samples': 2678016, 'steps': 13947, 'loss/train': 1.3910020589828491} -11/06/2021 23:10:25 - INFO - __main__ - Step 13949: {'lr': 0.0004920026228598303, 'samples': 2678208, 'steps': 13948, 'loss/train': 1.5859302282333374} -11/06/2021 23:10:26 - INFO - __main__ - Step 13950: {'lr': 0.0004920012912915616, 'samples': 2678400, 'steps': 13949, 'loss/train': 1.9164284467697144} -11/06/2021 23:10:26 - INFO - __main__ - Step 13951: {'lr': 0.0004919999596142508, 'samples': 2678592, 'steps': 13950, 'loss/train': 1.7975435256958008} -11/06/2021 23:10:27 - INFO - __main__ - Step 13952: {'lr': 0.0004919986278278986, 'samples': 2678784, 'steps': 13951, 'loss/train': 1.8759640455245972} -11/06/2021 23:10:27 - INFO - __main__ - Step 13953: {'lr': 0.0004919972959325055, 'samples': 2678976, 'steps': 13952, 'loss/train': 2.344235420227051} -11/06/2021 23:10:27 - INFO - __main__ - Step 13954: {'lr': 0.0004919959639280722, 'samples': 2679168, 'steps': 13953, 'loss/train': 3.453373432159424} -11/06/2021 23:10:28 - INFO - __main__ - Step 13955: {'lr': 0.0004919946318145992, 'samples': 2679360, 'steps': 13954, 'loss/train': 2.145124673843384} -11/06/2021 23:10:29 - INFO - __main__ - Step 13956: {'lr': 0.0004919932995920872, 'samples': 2679552, 'steps': 13955, 'loss/train': 1.7001293897628784} -11/06/2021 23:10:29 - INFO - __main__ - Step 13957: {'lr': 0.0004919919672605366, 'samples': 2679744, 'steps': 13956, 'loss/train': 1.792694330215454} -11/06/2021 23:10:29 - INFO - __main__ - Step 13958: {'lr': 0.0004919906348199483, 'samples': 2679936, 'steps': 13957, 'loss/train': 1.8448896408081055} -11/06/2021 23:10:30 - INFO - __main__ - Step 13959: {'lr': 0.0004919893022703228, 'samples': 2680128, 'steps': 13958, 'loss/train': 1.7649340629577637} -11/06/2021 23:10:31 - INFO - __main__ - Step 13960: {'lr': 0.0004919879696116605, 'samples': 2680320, 'steps': 13959, 'loss/train': 1.3440182209014893} -11/06/2021 23:10:31 - INFO - __main__ - Step 13961: {'lr': 0.0004919866368439624, 'samples': 2680512, 'steps': 13960, 'loss/train': 2.0946123600006104} -11/06/2021 23:10:31 - INFO - __main__ - Step 13962: {'lr': 0.0004919853039672287, 'samples': 2680704, 'steps': 13961, 'loss/train': 1.806232213973999} -11/06/2021 23:10:32 - INFO - __main__ - Step 13963: {'lr': 0.00049198397098146, 'samples': 2680896, 'steps': 13962, 'loss/train': 2.475085496902466} -11/06/2021 23:10:32 - INFO - __main__ - Step 13964: {'lr': 0.0004919826378866573, 'samples': 2681088, 'steps': 13963, 'loss/train': 1.6275722980499268} -11/06/2021 23:10:33 - INFO - __main__ - Step 13965: {'lr': 0.0004919813046828209, 'samples': 2681280, 'steps': 13964, 'loss/train': 1.4893933534622192} -11/06/2021 23:10:34 - INFO - __main__ - Step 13966: {'lr': 0.0004919799713699514, 'samples': 2681472, 'steps': 13965, 'loss/train': 1.8989421129226685} -11/06/2021 23:10:34 - INFO - __main__ - Step 13967: {'lr': 0.0004919786379480494, 'samples': 2681664, 'steps': 13966, 'loss/train': 2.0461950302124023} -11/06/2021 23:10:34 - INFO - __main__ - Step 13968: {'lr': 0.0004919773044171158, 'samples': 2681856, 'steps': 13967, 'loss/train': 1.7117947340011597} -11/06/2021 23:10:35 - INFO - __main__ - Step 13969: {'lr': 0.0004919759707771507, 'samples': 2682048, 'steps': 13968, 'loss/train': 1.7647126913070679} -11/06/2021 23:10:35 - INFO - __main__ - Step 13970: {'lr': 0.0004919746370281551, 'samples': 2682240, 'steps': 13969, 'loss/train': 1.784766435623169} -11/06/2021 23:10:36 - INFO - __main__ - Step 13971: {'lr': 0.0004919733031701295, 'samples': 2682432, 'steps': 13970, 'loss/train': 1.7901809215545654} -11/06/2021 23:10:37 - INFO - __main__ - Step 13972: {'lr': 0.0004919719692030743, 'samples': 2682624, 'steps': 13971, 'loss/train': 1.4720513820648193} -11/06/2021 23:10:37 - INFO - __main__ - Step 13973: {'lr': 0.0004919706351269904, 'samples': 2682816, 'steps': 13972, 'loss/train': 1.9798334836959839} -11/06/2021 23:10:37 - INFO - __main__ - Step 13974: {'lr': 0.0004919693009418782, 'samples': 2683008, 'steps': 13973, 'loss/train': 2.224214553833008} -11/06/2021 23:10:38 - INFO - __main__ - Step 13975: {'lr': 0.0004919679666477384, 'samples': 2683200, 'steps': 13974, 'loss/train': 1.7048498392105103} -11/06/2021 23:10:39 - INFO - __main__ - Step 13976: {'lr': 0.0004919666322445715, 'samples': 2683392, 'steps': 13975, 'loss/train': 1.784834384918213} -11/06/2021 23:10:39 - INFO - __main__ - Step 13977: {'lr': 0.0004919652977323783, 'samples': 2683584, 'steps': 13976, 'loss/train': 1.4972141981124878} -11/06/2021 23:10:39 - INFO - __main__ - Step 13978: {'lr': 0.0004919639631111592, 'samples': 2683776, 'steps': 13977, 'loss/train': 1.7331345081329346} -11/06/2021 23:10:40 - INFO - __main__ - Step 13979: {'lr': 0.0004919626283809149, 'samples': 2683968, 'steps': 13978, 'loss/train': 1.7867261171340942} -11/06/2021 23:10:40 - INFO - __main__ - Step 13980: {'lr': 0.0004919612935416459, 'samples': 2684160, 'steps': 13979, 'loss/train': 1.5536366701126099} -11/06/2021 23:10:41 - INFO - __main__ - Step 13981: {'lr': 0.000491959958593353, 'samples': 2684352, 'steps': 13980, 'loss/train': 1.6696289777755737} -11/06/2021 23:10:41 - INFO - __main__ - Step 13982: {'lr': 0.0004919586235360365, 'samples': 2684544, 'steps': 13981, 'loss/train': 1.6226602792739868} -11/06/2021 23:10:42 - INFO - __main__ - Step 13983: {'lr': 0.0004919572883696974, 'samples': 2684736, 'steps': 13982, 'loss/train': 1.9969899654388428} -11/06/2021 23:10:42 - INFO - __main__ - Step 13984: {'lr': 0.0004919559530943359, 'samples': 2684928, 'steps': 13983, 'loss/train': 1.8502788543701172} -11/06/2021 23:10:43 - INFO - __main__ - Step 13985: {'lr': 0.0004919546177099528, 'samples': 2685120, 'steps': 13984, 'loss/train': 2.2144908905029297} -11/06/2021 23:10:44 - INFO - __main__ - Step 13986: {'lr': 0.0004919532822165487, 'samples': 2685312, 'steps': 13985, 'loss/train': 1.7305831909179688} -11/06/2021 23:10:44 - INFO - __main__ - Step 13987: {'lr': 0.0004919519466141242, 'samples': 2685504, 'steps': 13986, 'loss/train': 2.206554889678955} -11/06/2021 23:10:44 - INFO - __main__ - Step 13988: {'lr': 0.0004919506109026799, 'samples': 2685696, 'steps': 13987, 'loss/train': 2.002794027328491} -11/06/2021 23:10:45 - INFO - __main__ - Step 13989: {'lr': 0.0004919492750822163, 'samples': 2685888, 'steps': 13988, 'loss/train': 1.8074073791503906} -11/06/2021 23:10:45 - INFO - __main__ - Step 13990: {'lr': 0.0004919479391527343, 'samples': 2686080, 'steps': 13989, 'loss/train': 1.7749497890472412} -11/06/2021 23:10:45 - INFO - __main__ - Step 13991: {'lr': 0.0004919466031142342, 'samples': 2686272, 'steps': 13990, 'loss/train': 1.2076705694198608} -11/06/2021 23:10:46 - INFO - __main__ - Step 13992: {'lr': 0.0004919452669667166, 'samples': 2686464, 'steps': 13991, 'loss/train': 3.3132309913635254} -11/06/2021 23:10:47 - INFO - __main__ - Step 13993: {'lr': 0.0004919439307101822, 'samples': 2686656, 'steps': 13992, 'loss/train': 3.050110101699829} -11/06/2021 23:10:47 - INFO - __main__ - Step 13994: {'lr': 0.0004919425943446317, 'samples': 2686848, 'steps': 13993, 'loss/train': 1.7559268474578857} -11/06/2021 23:10:48 - INFO - __main__ - Step 13995: {'lr': 0.0004919412578700654, 'samples': 2687040, 'steps': 13994, 'loss/train': 1.2231806516647339} -11/06/2021 23:10:48 - INFO - __main__ - Step 13996: {'lr': 0.0004919399212864843, 'samples': 2687232, 'steps': 13995, 'loss/train': 1.859178066253662} -11/06/2021 23:10:48 - INFO - __main__ - Step 13997: {'lr': 0.0004919385845938888, 'samples': 2687424, 'steps': 13996, 'loss/train': 1.9321575164794922} -11/06/2021 23:10:49 - INFO - __main__ - Step 13998: {'lr': 0.0004919372477922794, 'samples': 2687616, 'steps': 13997, 'loss/train': 1.7246944904327393} -11/06/2021 23:10:50 - INFO - __main__ - Step 13999: {'lr': 0.0004919359108816569, 'samples': 2687808, 'steps': 13998, 'loss/train': 2.0384068489074707} -11/06/2021 23:10:50 - INFO - __main__ - Step 14000: {'lr': 0.0004919345738620218, 'samples': 2688000, 'steps': 13999, 'loss/train': 1.2765216827392578} -11/06/2021 23:10:50 - INFO - __main__ - Step 14001: {'lr': 0.0004919332367333747, 'samples': 2688192, 'steps': 14000, 'loss/train': 1.9448779821395874} -11/06/2021 23:10:51 - INFO - __main__ - Step 14002: {'lr': 0.0004919318994957162, 'samples': 2688384, 'steps': 14001, 'loss/train': 1.9251288175582886} -11/06/2021 23:10:52 - INFO - __main__ - Step 14003: {'lr': 0.0004919305621490469, 'samples': 2688576, 'steps': 14002, 'loss/train': 2.482295274734497} -11/06/2021 23:10:52 - INFO - __main__ - Step 14004: {'lr': 0.0004919292246933675, 'samples': 2688768, 'steps': 14003, 'loss/train': 1.9574697017669678} -11/06/2021 23:10:52 - INFO - __main__ - Step 14005: {'lr': 0.0004919278871286785, 'samples': 2688960, 'steps': 14004, 'loss/train': 1.896154761314392} -11/06/2021 23:10:53 - INFO - __main__ - Step 14006: {'lr': 0.0004919265494549805, 'samples': 2689152, 'steps': 14005, 'loss/train': 1.633683681488037} -11/06/2021 23:10:53 - INFO - __main__ - Step 14007: {'lr': 0.0004919252116722742, 'samples': 2689344, 'steps': 14006, 'loss/train': 1.4971553087234497} -11/06/2021 23:10:54 - INFO - __main__ - Step 14008: {'lr': 0.0004919238737805601, 'samples': 2689536, 'steps': 14007, 'loss/train': 1.8007830381393433} -11/06/2021 23:10:55 - INFO - __main__ - Step 14009: {'lr': 0.0004919225357798387, 'samples': 2689728, 'steps': 14008, 'loss/train': 1.9640558958053589} -11/06/2021 23:10:55 - INFO - __main__ - Step 14010: {'lr': 0.000491921197670111, 'samples': 2689920, 'steps': 14009, 'loss/train': 1.3045183420181274} -11/06/2021 23:10:55 - INFO - __main__ - Step 14011: {'lr': 0.0004919198594513771, 'samples': 2690112, 'steps': 14010, 'loss/train': 1.3401371240615845} -11/06/2021 23:10:56 - INFO - __main__ - Step 14012: {'lr': 0.0004919185211236379, 'samples': 2690304, 'steps': 14011, 'loss/train': 1.836495280265808} -11/06/2021 23:10:57 - INFO - __main__ - Step 14013: {'lr': 0.000491917182686894, 'samples': 2690496, 'steps': 14012, 'loss/train': 1.7330890893936157} -11/06/2021 23:10:57 - INFO - __main__ - Step 14014: {'lr': 0.0004919158441411459, 'samples': 2690688, 'steps': 14013, 'loss/train': 1.8115290403366089} -11/06/2021 23:10:57 - INFO - __main__ - Step 14015: {'lr': 0.0004919145054863943, 'samples': 2690880, 'steps': 14014, 'loss/train': 1.6873303651809692} -11/06/2021 23:10:58 - INFO - __main__ - Step 14016: {'lr': 0.0004919131667226398, 'samples': 2691072, 'steps': 14015, 'loss/train': 1.5199148654937744} -11/06/2021 23:10:58 - INFO - __main__ - Step 14017: {'lr': 0.0004919118278498828, 'samples': 2691264, 'steps': 14016, 'loss/train': 1.7640634775161743} -11/06/2021 23:10:58 - INFO - __main__ - Step 14018: {'lr': 0.0004919104888681242, 'samples': 2691456, 'steps': 14017, 'loss/train': 2.0215377807617188} -11/06/2021 23:10:59 - INFO - __main__ - Step 14019: {'lr': 0.0004919091497773643, 'samples': 2691648, 'steps': 14018, 'loss/train': 1.64264976978302} -11/06/2021 23:11:00 - INFO - __main__ - Step 14020: {'lr': 0.0004919078105776041, 'samples': 2691840, 'steps': 14019, 'loss/train': 1.904662013053894} -11/06/2021 23:11:00 - INFO - __main__ - Step 14021: {'lr': 0.0004919064712688439, 'samples': 2692032, 'steps': 14020, 'loss/train': 1.8053239583969116} -11/06/2021 23:11:00 - INFO - __main__ - Step 14022: {'lr': 0.0004919051318510844, 'samples': 2692224, 'steps': 14021, 'loss/train': 2.048910617828369} -11/06/2021 23:11:01 - INFO - __main__ - Step 14023: {'lr': 0.0004919037923243261, 'samples': 2692416, 'steps': 14022, 'loss/train': 1.2819080352783203} -11/06/2021 23:11:02 - INFO - __main__ - Step 14024: {'lr': 0.0004919024526885697, 'samples': 2692608, 'steps': 14023, 'loss/train': 1.1374632120132446} -11/06/2021 23:11:02 - INFO - __main__ - Step 14025: {'lr': 0.0004919011129438158, 'samples': 2692800, 'steps': 14024, 'loss/train': 1.4526000022888184} -11/06/2021 23:11:03 - INFO - __main__ - Step 14026: {'lr': 0.0004918997730900649, 'samples': 2692992, 'steps': 14025, 'loss/train': 1.2924232482910156} -11/06/2021 23:11:03 - INFO - __main__ - Step 14027: {'lr': 0.0004918984331273178, 'samples': 2693184, 'steps': 14026, 'loss/train': 2.08219313621521} -11/06/2021 23:11:03 - INFO - __main__ - Step 14028: {'lr': 0.0004918970930555751, 'samples': 2693376, 'steps': 14027, 'loss/train': 1.7137112617492676} -11/06/2021 23:11:04 - INFO - __main__ - Step 14029: {'lr': 0.0004918957528748371, 'samples': 2693568, 'steps': 14028, 'loss/train': 1.5124090909957886} -11/06/2021 23:11:05 - INFO - __main__ - Step 14030: {'lr': 0.0004918944125851047, 'samples': 2693760, 'steps': 14029, 'loss/train': 1.7956403493881226} -11/06/2021 23:11:05 - INFO - __main__ - Step 14031: {'lr': 0.0004918930721863784, 'samples': 2693952, 'steps': 14030, 'loss/train': 0.82200026512146} -11/06/2021 23:11:05 - INFO - __main__ - Step 14032: {'lr': 0.0004918917316786589, 'samples': 2694144, 'steps': 14031, 'loss/train': 1.9360613822937012} -11/06/2021 23:11:06 - INFO - __main__ - Step 14033: {'lr': 0.0004918903910619465, 'samples': 2694336, 'steps': 14032, 'loss/train': 1.157104253768921} -11/06/2021 23:11:07 - INFO - __main__ - Step 14034: {'lr': 0.0004918890503362422, 'samples': 2694528, 'steps': 14033, 'loss/train': 1.9156838655471802} -11/06/2021 23:11:07 - INFO - __main__ - Step 14035: {'lr': 0.0004918877095015465, 'samples': 2694720, 'steps': 14034, 'loss/train': 2.019812822341919} -11/06/2021 23:11:07 - INFO - __main__ - Step 14036: {'lr': 0.0004918863685578598, 'samples': 2694912, 'steps': 14035, 'loss/train': 1.6677758693695068} -11/06/2021 23:11:08 - INFO - __main__ - Step 14037: {'lr': 0.0004918850275051829, 'samples': 2695104, 'steps': 14036, 'loss/train': 2.457850217819214} -11/06/2021 23:11:08 - INFO - __main__ - Step 14038: {'lr': 0.0004918836863435162, 'samples': 2695296, 'steps': 14037, 'loss/train': 2.003868341445923} -11/06/2021 23:11:09 - INFO - __main__ - Step 14039: {'lr': 0.0004918823450728606, 'samples': 2695488, 'steps': 14038, 'loss/train': 1.5999841690063477} -11/06/2021 23:11:10 - INFO - __main__ - Step 14040: {'lr': 0.0004918810036932164, 'samples': 2695680, 'steps': 14039, 'loss/train': 1.710452675819397} -11/06/2021 23:11:10 - INFO - __main__ - Step 14041: {'lr': 0.0004918796622045844, 'samples': 2695872, 'steps': 14040, 'loss/train': 1.9019668102264404} -11/06/2021 23:11:10 - INFO - __main__ - Step 14042: {'lr': 0.0004918783206069652, 'samples': 2696064, 'steps': 14041, 'loss/train': 1.7770543098449707} -11/06/2021 23:11:11 - INFO - __main__ - Step 14043: {'lr': 0.0004918769789003593, 'samples': 2696256, 'steps': 14042, 'loss/train': 1.4025808572769165} -11/06/2021 23:11:11 - INFO - __main__ - Step 14044: {'lr': 0.0004918756370847674, 'samples': 2696448, 'steps': 14043, 'loss/train': 1.5960426330566406} -11/06/2021 23:11:12 - INFO - __main__ - Step 14045: {'lr': 0.0004918742951601902, 'samples': 2696640, 'steps': 14044, 'loss/train': 1.9002901315689087} -11/06/2021 23:11:12 - INFO - __main__ - Step 14046: {'lr': 0.000491872953126628, 'samples': 2696832, 'steps': 14045, 'loss/train': 1.677998661994934} -11/06/2021 23:11:13 - INFO - __main__ - Step 14047: {'lr': 0.0004918716109840817, 'samples': 2697024, 'steps': 14046, 'loss/train': 1.461251139640808} -11/06/2021 23:11:13 - INFO - __main__ - Step 14048: {'lr': 0.0004918702687325517, 'samples': 2697216, 'steps': 14047, 'loss/train': 1.8989447355270386} -11/06/2021 23:11:13 - INFO - __main__ - Step 14049: {'lr': 0.0004918689263720388, 'samples': 2697408, 'steps': 14048, 'loss/train': 1.1831153631210327} -11/06/2021 23:11:14 - INFO - __main__ - Step 14050: {'lr': 0.0004918675839025434, 'samples': 2697600, 'steps': 14049, 'loss/train': 1.7708138227462769} -11/06/2021 23:11:15 - INFO - __main__ - Step 14051: {'lr': 0.0004918662413240662, 'samples': 2697792, 'steps': 14050, 'loss/train': 1.32278311252594} -11/06/2021 23:11:15 - INFO - __main__ - Step 14052: {'lr': 0.0004918648986366078, 'samples': 2697984, 'steps': 14051, 'loss/train': 1.6384484767913818} -11/06/2021 23:11:15 - INFO - __main__ - Step 14053: {'lr': 0.0004918635558401687, 'samples': 2698176, 'steps': 14052, 'loss/train': 2.0729172229766846} -11/06/2021 23:11:16 - INFO - __main__ - Step 14054: {'lr': 0.0004918622129347498, 'samples': 2698368, 'steps': 14053, 'loss/train': 1.6105602979660034} -11/06/2021 23:11:17 - INFO - __main__ - Step 14055: {'lr': 0.0004918608699203515, 'samples': 2698560, 'steps': 14054, 'loss/train': 2.5296216011047363} -11/06/2021 23:11:17 - INFO - __main__ - Step 14056: {'lr': 0.0004918595267969744, 'samples': 2698752, 'steps': 14055, 'loss/train': 1.7558401823043823} -11/06/2021 23:11:18 - INFO - __main__ - Step 14057: {'lr': 0.0004918581835646191, 'samples': 2698944, 'steps': 14056, 'loss/train': 5.832611083984375} -11/06/2021 23:11:18 - INFO - __main__ - Step 14058: {'lr': 0.0004918568402232863, 'samples': 2699136, 'steps': 14057, 'loss/train': 1.5368565320968628} -11/06/2021 23:11:18 - INFO - __main__ - Step 14059: {'lr': 0.0004918554967729764, 'samples': 2699328, 'steps': 14058, 'loss/train': 2.169316291809082} -11/06/2021 23:11:19 - INFO - __main__ - Step 14060: {'lr': 0.0004918541532136902, 'samples': 2699520, 'steps': 14059, 'loss/train': 2.3635847568511963} -11/06/2021 23:11:20 - INFO - __main__ - Step 14061: {'lr': 0.0004918528095454283, 'samples': 2699712, 'steps': 14060, 'loss/train': 1.7770613431930542} -11/06/2021 23:11:20 - INFO - __main__ - Step 14062: {'lr': 0.0004918514657681913, 'samples': 2699904, 'steps': 14061, 'loss/train': 1.688179850578308} -11/06/2021 23:11:20 - INFO - __main__ - Step 14063: {'lr': 0.0004918501218819796, 'samples': 2700096, 'steps': 14062, 'loss/train': 1.860587239265442} -11/06/2021 23:11:21 - INFO - __main__ - Step 14064: {'lr': 0.0004918487778867941, 'samples': 2700288, 'steps': 14063, 'loss/train': 1.8392343521118164} -11/06/2021 23:11:21 - INFO - __main__ - Step 14065: {'lr': 0.0004918474337826353, 'samples': 2700480, 'steps': 14064, 'loss/train': 1.5922415256500244} -11/06/2021 23:11:22 - INFO - __main__ - Step 14066: {'lr': 0.0004918460895695037, 'samples': 2700672, 'steps': 14065, 'loss/train': 1.585329294204712} -11/06/2021 23:11:23 - INFO - __main__ - Step 14067: {'lr': 0.0004918447452474, 'samples': 2700864, 'steps': 14066, 'loss/train': 3.7865922451019287} -11/06/2021 23:11:23 - INFO - __main__ - Step 14068: {'lr': 0.0004918434008163247, 'samples': 2701056, 'steps': 14067, 'loss/train': 1.2407586574554443} -11/06/2021 23:11:23 - INFO - __main__ - Step 14069: {'lr': 0.0004918420562762786, 'samples': 2701248, 'steps': 14068, 'loss/train': 1.7555322647094727} -11/06/2021 23:11:24 - INFO - __main__ - Step 14070: {'lr': 0.0004918407116272622, 'samples': 2701440, 'steps': 14069, 'loss/train': 1.0781822204589844} -11/06/2021 23:11:24 - INFO - __main__ - Step 14071: {'lr': 0.000491839366869276, 'samples': 2701632, 'steps': 14070, 'loss/train': 2.1765549182891846} -11/06/2021 23:11:25 - INFO - __main__ - Step 14072: {'lr': 0.000491838022002321, 'samples': 2701824, 'steps': 14071, 'loss/train': 1.3922725915908813} -11/06/2021 23:11:25 - INFO - __main__ - Step 14073: {'lr': 0.0004918366770263972, 'samples': 2702016, 'steps': 14072, 'loss/train': 1.583871603012085} -11/06/2021 23:11:26 - INFO - __main__ - Step 14074: {'lr': 0.0004918353319415057, 'samples': 2702208, 'steps': 14073, 'loss/train': 1.4345612525939941} -11/06/2021 23:11:26 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.5994923114776611} -11/06/2021 23:11:26 - INFO - __main__ - Step 14076: {'lr': 0.0004918326414448214, 'samples': 2702592, 'steps': 14075, 'loss/train': 2.2489395141601562} -11/06/2021 23:11:28 - INFO - __main__ - Step 14077: {'lr': 0.0004918312960330299, 'samples': 2702784, 'steps': 14076, 'loss/train': 1.737290382385254} -11/06/2021 23:11:28 - INFO - __main__ - Step 14078: {'lr': 0.0004918299505122729, 'samples': 2702976, 'steps': 14077, 'loss/train': 1.7684190273284912} -11/06/2021 23:11:28 - INFO - __main__ - Step 14079: {'lr': 0.000491828604882551, 'samples': 2703168, 'steps': 14078, 'loss/train': 1.933387279510498} -11/06/2021 23:11:29 - INFO - __main__ - Step 14080: {'lr': 0.0004918272591438649, 'samples': 2703360, 'steps': 14079, 'loss/train': 2.6290011405944824} -11/06/2021 23:11:29 - INFO - __main__ - Step 14081: {'lr': 0.0004918259132962153, 'samples': 2703552, 'steps': 14080, 'loss/train': 1.1858018636703491} -11/06/2021 23:11:29 - INFO - __main__ - Step 14082: {'lr': 0.0004918245673396025, 'samples': 2703744, 'steps': 14081, 'loss/train': 1.8530510663986206} -11/06/2021 23:11:31 - INFO - __main__ - Step 14083: {'lr': 0.0004918232212740274, 'samples': 2703936, 'steps': 14082, 'loss/train': 0.8487131595611572} -11/06/2021 23:11:31 - INFO - __main__ - Step 14084: {'lr': 0.0004918218750994904, 'samples': 2704128, 'steps': 14083, 'loss/train': 2.605128288269043} -11/06/2021 23:11:32 - INFO - __main__ - Step 14085: {'lr': 0.0004918205288159923, 'samples': 2704320, 'steps': 14084, 'loss/train': 1.6674420833587646} -11/06/2021 23:11:32 - INFO - __main__ - Step 14086: {'lr': 0.0004918191824235335, 'samples': 2704512, 'steps': 14085, 'loss/train': 1.54026198387146} -11/06/2021 23:11:32 - INFO - __main__ - Step 14087: {'lr': 0.0004918178359221147, 'samples': 2704704, 'steps': 14086, 'loss/train': 2.31728196144104} -11/06/2021 23:11:33 - INFO - __main__ - Step 14088: {'lr': 0.0004918164893117366, 'samples': 2704896, 'steps': 14087, 'loss/train': 1.713340401649475} -11/06/2021 23:11:34 - INFO - __main__ - Step 14089: {'lr': 0.0004918151425923996, 'samples': 2705088, 'steps': 14088, 'loss/train': 1.4485218524932861} -11/06/2021 23:11:34 - INFO - __main__ - Step 14090: {'lr': 0.0004918137957641046, 'samples': 2705280, 'steps': 14089, 'loss/train': 1.635068416595459} -11/06/2021 23:11:34 - INFO - __main__ - Step 14091: {'lr': 0.000491812448826852, 'samples': 2705472, 'steps': 14090, 'loss/train': 1.8842805624008179} -11/06/2021 23:11:35 - INFO - __main__ - Step 14092: {'lr': 0.0004918111017806424, 'samples': 2705664, 'steps': 14091, 'loss/train': 1.5843989849090576} -11/06/2021 23:11:35 - INFO - __main__ - Step 14093: {'lr': 0.0004918097546254764, 'samples': 2705856, 'steps': 14092, 'loss/train': 1.812479019165039} -11/06/2021 23:11:36 - INFO - __main__ - Step 14094: {'lr': 0.0004918084073613547, 'samples': 2706048, 'steps': 14093, 'loss/train': 1.6815907955169678} -11/06/2021 23:11:36 - INFO - __main__ - Step 14095: {'lr': 0.0004918070599882778, 'samples': 2706240, 'steps': 14094, 'loss/train': 1.7472896575927734} -11/06/2021 23:11:37 - INFO - __main__ - Step 14096: {'lr': 0.0004918057125062465, 'samples': 2706432, 'steps': 14095, 'loss/train': 1.8674776554107666} -11/06/2021 23:11:37 - INFO - __main__ - Step 14097: {'lr': 0.0004918043649152612, 'samples': 2706624, 'steps': 14096, 'loss/train': 1.9627310037612915} -11/06/2021 23:11:37 - INFO - __main__ - Step 14098: {'lr': 0.0004918030172153225, 'samples': 2706816, 'steps': 14097, 'loss/train': 1.6795316934585571} -11/06/2021 23:11:38 - INFO - __main__ - Step 14099: {'lr': 0.0004918016694064313, 'samples': 2707008, 'steps': 14098, 'loss/train': 1.9474259614944458} -11/06/2021 23:11:39 - INFO - __main__ - Step 14100: {'lr': 0.0004918003214885877, 'samples': 2707200, 'steps': 14099, 'loss/train': 1.1974012851715088} -11/06/2021 23:11:39 - INFO - __main__ - Step 14101: {'lr': 0.0004917989734617928, 'samples': 2707392, 'steps': 14100, 'loss/train': 1.9953140020370483} -11/06/2021 23:11:39 - INFO - __main__ - Step 14102: {'lr': 0.0004917976253260471, 'samples': 2707584, 'steps': 14101, 'loss/train': 1.6123121976852417} -11/06/2021 23:11:40 - INFO - __main__ - Step 14103: {'lr': 0.000491796277081351, 'samples': 2707776, 'steps': 14102, 'loss/train': 1.817934274673462} -11/06/2021 23:11:40 - INFO - __main__ - Step 14104: {'lr': 0.0004917949287277052, 'samples': 2707968, 'steps': 14103, 'loss/train': 2.0339081287384033} -11/06/2021 23:11:41 - INFO - __main__ - Step 14105: {'lr': 0.0004917935802651104, 'samples': 2708160, 'steps': 14104, 'loss/train': 1.8835687637329102} -11/06/2021 23:11:42 - INFO - __main__ - Step 14106: {'lr': 0.0004917922316935671, 'samples': 2708352, 'steps': 14105, 'loss/train': 1.9598747491836548} -11/06/2021 23:11:42 - INFO - __main__ - Step 14107: {'lr': 0.000491790883013076, 'samples': 2708544, 'steps': 14106, 'loss/train': 1.3012551069259644} -11/06/2021 23:11:42 - INFO - __main__ - Step 14108: {'lr': 0.0004917895342236377, 'samples': 2708736, 'steps': 14107, 'loss/train': 1.5593042373657227} -11/06/2021 23:11:43 - INFO - __main__ - Step 14109: {'lr': 0.0004917881853252527, 'samples': 2708928, 'steps': 14108, 'loss/train': 1.7348185777664185} -11/06/2021 23:11:44 - INFO - __main__ - Step 14110: {'lr': 0.0004917868363179216, 'samples': 2709120, 'steps': 14109, 'loss/train': 2.0034899711608887} -11/06/2021 23:11:44 - INFO - __main__ - Step 14111: {'lr': 0.0004917854872016451, 'samples': 2709312, 'steps': 14110, 'loss/train': 1.7014143466949463} -11/06/2021 23:11:44 - INFO - __main__ - Step 14112: {'lr': 0.000491784137976424, 'samples': 2709504, 'steps': 14111, 'loss/train': 0.5290675163269043} -11/06/2021 23:11:45 - INFO - __main__ - Step 14113: {'lr': 0.0004917827886422586, 'samples': 2709696, 'steps': 14112, 'loss/train': 1.854404330253601} -11/06/2021 23:11:45 - INFO - __main__ - Step 14114: {'lr': 0.0004917814391991494, 'samples': 2709888, 'steps': 14113, 'loss/train': 1.8280285596847534} -11/06/2021 23:11:46 - INFO - __main__ - Step 14115: {'lr': 0.0004917800896470974, 'samples': 2710080, 'steps': 14114, 'loss/train': 1.9659100770950317} -11/06/2021 23:11:46 - INFO - __main__ - Step 14116: {'lr': 0.000491778739986103, 'samples': 2710272, 'steps': 14115, 'loss/train': 2.029839515686035} -11/06/2021 23:11:47 - INFO - __main__ - Step 14117: {'lr': 0.0004917773902161669, 'samples': 2710464, 'steps': 14116, 'loss/train': 1.8698660135269165} -11/06/2021 23:11:47 - INFO - __main__ - Step 14118: {'lr': 0.0004917760403372895, 'samples': 2710656, 'steps': 14117, 'loss/train': 1.1892834901809692} -11/06/2021 23:11:47 - INFO - __main__ - Step 14119: {'lr': 0.0004917746903494717, 'samples': 2710848, 'steps': 14118, 'loss/train': 0.9476760029792786} -11/06/2021 23:11:48 - INFO - __main__ - Step 14120: {'lr': 0.0004917733402527138, 'samples': 2711040, 'steps': 14119, 'loss/train': 1.6532700061798096} -11/06/2021 23:11:49 - INFO - __main__ - Step 14121: {'lr': 0.0004917719900470167, 'samples': 2711232, 'steps': 14120, 'loss/train': 1.880062222480774} -11/06/2021 23:11:49 - INFO - __main__ - Step 14122: {'lr': 0.0004917706397323808, 'samples': 2711424, 'steps': 14121, 'loss/train': 2.203761100769043} -11/06/2021 23:11:49 - INFO - __main__ - Step 14123: {'lr': 0.0004917692893088067, 'samples': 2711616, 'steps': 14122, 'loss/train': 1.9275217056274414} -11/06/2021 23:11:50 - INFO - __main__ - Step 14124: {'lr': 0.0004917679387762952, 'samples': 2711808, 'steps': 14123, 'loss/train': 1.9265042543411255} -11/06/2021 23:11:51 - INFO - __main__ - Step 14125: {'lr': 0.0004917665881348467, 'samples': 2712000, 'steps': 14124, 'loss/train': 1.2948485612869263} -11/06/2021 23:11:51 - INFO - __main__ - Step 14126: {'lr': 0.000491765237384462, 'samples': 2712192, 'steps': 14125, 'loss/train': 1.6665414571762085} -11/06/2021 23:11:52 - INFO - __main__ - Step 14127: {'lr': 0.0004917638865251416, 'samples': 2712384, 'steps': 14126, 'loss/train': 0.629708468914032} -11/06/2021 23:11:52 - INFO - __main__ - Step 14128: {'lr': 0.0004917625355568861, 'samples': 2712576, 'steps': 14127, 'loss/train': 1.6347920894622803} -11/06/2021 23:11:53 - INFO - __main__ - Step 14129: {'lr': 0.0004917611844796962, 'samples': 2712768, 'steps': 14128, 'loss/train': 1.388734221458435} -11/06/2021 23:11:54 - INFO - __main__ - Step 14130: {'lr': 0.0004917598332935724, 'samples': 2712960, 'steps': 14129, 'loss/train': 1.3727388381958008} -11/06/2021 23:11:54 - INFO - __main__ - Step 14131: {'lr': 0.0004917584819985153, 'samples': 2713152, 'steps': 14130, 'loss/train': 1.5905683040618896} -11/06/2021 23:11:54 - INFO - __main__ - Step 14132: {'lr': 0.0004917571305945256, 'samples': 2713344, 'steps': 14131, 'loss/train': 1.9821319580078125} -11/06/2021 23:11:55 - INFO - __main__ - Step 14133: {'lr': 0.0004917557790816039, 'samples': 2713536, 'steps': 14132, 'loss/train': 1.3257533311843872} -11/06/2021 23:11:55 - INFO - __main__ - Step 14134: {'lr': 0.0004917544274597507, 'samples': 2713728, 'steps': 14133, 'loss/train': 1.8089780807495117} -11/06/2021 23:11:56 - INFO - __main__ - Step 14135: {'lr': 0.0004917530757289668, 'samples': 2713920, 'steps': 14134, 'loss/train': 1.6792985200881958} -11/06/2021 23:11:56 - INFO - __main__ - Step 14136: {'lr': 0.0004917517238892526, 'samples': 2714112, 'steps': 14135, 'loss/train': 1.4552292823791504} -11/06/2021 23:11:57 - INFO - __main__ - Step 14137: {'lr': 0.0004917503719406087, 'samples': 2714304, 'steps': 14136, 'loss/train': 1.8645858764648438} -11/06/2021 23:11:57 - INFO - __main__ - Step 14138: {'lr': 0.000491749019883036, 'samples': 2714496, 'steps': 14137, 'loss/train': 1.6772507429122925} -11/06/2021 23:11:58 - INFO - __main__ - Step 14139: {'lr': 0.0004917476677165349, 'samples': 2714688, 'steps': 14138, 'loss/train': 1.839224100112915} -11/06/2021 23:11:58 - INFO - __main__ - Step 14140: {'lr': 0.0004917463154411059, 'samples': 2714880, 'steps': 14139, 'loss/train': 1.2386482954025269} -11/06/2021 23:11:59 - INFO - __main__ - Step 14141: {'lr': 0.0004917449630567499, 'samples': 2715072, 'steps': 14140, 'loss/train': 1.9079393148422241} -11/06/2021 23:11:59 - INFO - __main__ - Step 14142: {'lr': 0.0004917436105634673, 'samples': 2715264, 'steps': 14141, 'loss/train': 1.7619988918304443} -11/06/2021 23:12:00 - INFO - __main__ - Step 14143: {'lr': 0.0004917422579612587, 'samples': 2715456, 'steps': 14142, 'loss/train': 1.625560998916626} -11/06/2021 23:12:00 - INFO - __main__ - Step 14144: {'lr': 0.0004917409052501248, 'samples': 2715648, 'steps': 14143, 'loss/train': 1.4624155759811401} -11/06/2021 23:12:00 - INFO - __main__ - Step 14145: {'lr': 0.0004917395524300661, 'samples': 2715840, 'steps': 14144, 'loss/train': 1.0638208389282227} -11/06/2021 23:12:02 - INFO - __main__ - Step 14146: {'lr': 0.0004917381995010834, 'samples': 2716032, 'steps': 14145, 'loss/train': 1.523756980895996} -11/06/2021 23:12:02 - INFO - __main__ - Step 14147: {'lr': 0.0004917368464631772, 'samples': 2716224, 'steps': 14146, 'loss/train': 1.4266034364700317} -11/06/2021 23:12:02 - INFO - __main__ - Step 14148: {'lr': 0.0004917354933163481, 'samples': 2716416, 'steps': 14147, 'loss/train': 2.06866455078125} -11/06/2021 23:12:03 - INFO - __main__ - Step 14149: {'lr': 0.0004917341400605967, 'samples': 2716608, 'steps': 14148, 'loss/train': 1.4128144979476929} -11/06/2021 23:12:03 - INFO - __main__ - Step 14150: {'lr': 0.0004917327866959236, 'samples': 2716800, 'steps': 14149, 'loss/train': 1.0061789751052856} -11/06/2021 23:12:04 - INFO - __main__ - Step 14151: {'lr': 0.0004917314332223295, 'samples': 2716992, 'steps': 14150, 'loss/train': 1.8678841590881348} -11/06/2021 23:12:04 - INFO - __main__ - Step 14152: {'lr': 0.0004917300796398148, 'samples': 2717184, 'steps': 14151, 'loss/train': 1.5144931077957153} -11/06/2021 23:12:05 - INFO - __main__ - Step 14153: {'lr': 0.0004917287259483805, 'samples': 2717376, 'steps': 14152, 'loss/train': 1.836294412612915} -11/06/2021 23:12:05 - INFO - __main__ - Step 14154: {'lr': 0.0004917273721480268, 'samples': 2717568, 'steps': 14153, 'loss/train': 1.3567187786102295} -11/06/2021 23:12:05 - INFO - __main__ - Step 14155: {'lr': 0.0004917260182387545, 'samples': 2717760, 'steps': 14154, 'loss/train': 1.4603012800216675} -11/06/2021 23:12:07 - INFO - __main__ - Step 14156: {'lr': 0.0004917246642205642, 'samples': 2717952, 'steps': 14155, 'loss/train': 1.4038804769515991} -11/06/2021 23:12:07 - INFO - __main__ - Step 14157: {'lr': 0.0004917233100934565, 'samples': 2718144, 'steps': 14156, 'loss/train': 1.8869411945343018} -11/06/2021 23:12:07 - INFO - __main__ - Step 14158: {'lr': 0.0004917219558574319, 'samples': 2718336, 'steps': 14157, 'loss/train': 1.7700613737106323} -11/06/2021 23:12:08 - INFO - __main__ - Step 14159: {'lr': 0.0004917206015124913, 'samples': 2718528, 'steps': 14158, 'loss/train': 0.9594613313674927} -11/06/2021 23:12:08 - INFO - __main__ - Step 14160: {'lr': 0.000491719247058635, 'samples': 2718720, 'steps': 14159, 'loss/train': 1.2669697999954224} -11/06/2021 23:12:08 - INFO - __main__ - Step 14161: {'lr': 0.0004917178924958638, 'samples': 2718912, 'steps': 14160, 'loss/train': 2.0762956142425537} -11/06/2021 23:12:09 - INFO - __main__ - Step 14162: {'lr': 0.0004917165378241782, 'samples': 2719104, 'steps': 14161, 'loss/train': 1.8425633907318115} -11/06/2021 23:12:10 - INFO - __main__ - Step 14163: {'lr': 0.0004917151830435789, 'samples': 2719296, 'steps': 14162, 'loss/train': 1.3636668920516968} -11/06/2021 23:12:10 - INFO - __main__ - Step 14164: {'lr': 0.0004917138281540664, 'samples': 2719488, 'steps': 14163, 'loss/train': 2.4625284671783447} -11/06/2021 23:12:10 - INFO - __main__ - Step 14165: {'lr': 0.0004917124731556415, 'samples': 2719680, 'steps': 14164, 'loss/train': 2.0274415016174316} -11/06/2021 23:12:11 - INFO - __main__ - Step 14166: {'lr': 0.0004917111180483046, 'samples': 2719872, 'steps': 14165, 'loss/train': 1.421899676322937} -11/06/2021 23:12:12 - INFO - __main__ - Step 14167: {'lr': 0.0004917097628320564, 'samples': 2720064, 'steps': 14166, 'loss/train': 1.8181909322738647} -11/06/2021 23:12:12 - INFO - __main__ - Step 14168: {'lr': 0.0004917084075068975, 'samples': 2720256, 'steps': 14167, 'loss/train': 1.8530933856964111} -11/06/2021 23:12:12 - INFO - __main__ - Step 14169: {'lr': 0.0004917070520728286, 'samples': 2720448, 'steps': 14168, 'loss/train': 1.7252720594406128} -11/06/2021 23:12:13 - INFO - __main__ - Step 14170: {'lr': 0.0004917056965298501, 'samples': 2720640, 'steps': 14169, 'loss/train': 1.3021842241287231} -11/06/2021 23:12:13 - INFO - __main__ - Step 14171: {'lr': 0.0004917043408779629, 'samples': 2720832, 'steps': 14170, 'loss/train': 1.746435523033142} -11/06/2021 23:12:14 - INFO - __main__ - Step 14172: {'lr': 0.0004917029851171674, 'samples': 2721024, 'steps': 14171, 'loss/train': 0.15152797102928162} -11/06/2021 23:12:15 - INFO - __main__ - Step 14173: {'lr': 0.0004917016292474642, 'samples': 2721216, 'steps': 14172, 'loss/train': 2.0078635215759277} -11/06/2021 23:12:15 - INFO - __main__ - Step 14174: {'lr': 0.000491700273268854, 'samples': 2721408, 'steps': 14173, 'loss/train': 1.525383472442627} -11/06/2021 23:12:15 - INFO - __main__ - Step 14175: {'lr': 0.0004916989171813374, 'samples': 2721600, 'steps': 14174, 'loss/train': 1.6893455982208252} -11/06/2021 23:12:16 - INFO - __main__ - Step 14176: {'lr': 0.000491697560984915, 'samples': 2721792, 'steps': 14175, 'loss/train': 1.4403749704360962} -11/06/2021 23:12:17 - INFO - __main__ - Step 14177: {'lr': 0.0004916962046795874, 'samples': 2721984, 'steps': 14176, 'loss/train': 2.55890154838562} -11/06/2021 23:12:17 - INFO - __main__ - Step 14178: {'lr': 0.0004916948482653553, 'samples': 2722176, 'steps': 14177, 'loss/train': 1.7743308544158936} -11/06/2021 23:12:17 - INFO - __main__ - Step 14179: {'lr': 0.0004916934917422191, 'samples': 2722368, 'steps': 14178, 'loss/train': 1.5195140838623047} -11/06/2021 23:12:18 - INFO - __main__ - Step 14180: {'lr': 0.0004916921351101796, 'samples': 2722560, 'steps': 14179, 'loss/train': 1.529984951019287} -11/06/2021 23:12:18 - INFO - __main__ - Step 14181: {'lr': 0.0004916907783692374, 'samples': 2722752, 'steps': 14180, 'loss/train': 1.9970260858535767} -11/06/2021 23:12:18 - INFO - __main__ - Step 14182: {'lr': 0.000491689421519393, 'samples': 2722944, 'steps': 14181, 'loss/train': 1.5570197105407715} -11/06/2021 23:12:19 - INFO - __main__ - Step 14183: {'lr': 0.0004916880645606471, 'samples': 2723136, 'steps': 14182, 'loss/train': 1.396638035774231} -11/06/2021 23:12:20 - INFO - __main__ - Step 14184: {'lr': 0.0004916867074930002, 'samples': 2723328, 'steps': 14183, 'loss/train': 1.960241436958313} -11/06/2021 23:12:20 - INFO - __main__ - Step 14185: {'lr': 0.0004916853503164531, 'samples': 2723520, 'steps': 14184, 'loss/train': 1.312820553779602} -11/06/2021 23:12:20 - INFO - __main__ - Step 14186: {'lr': 0.0004916839930310063, 'samples': 2723712, 'steps': 14185, 'loss/train': 1.5989493131637573} -11/06/2021 23:12:21 - INFO - __main__ - Step 14187: {'lr': 0.0004916826356366605, 'samples': 2723904, 'steps': 14186, 'loss/train': 2.3531341552734375} -11/06/2021 23:12:22 - INFO - __main__ - Step 14188: {'lr': 0.0004916812781334161, 'samples': 2724096, 'steps': 14187, 'loss/train': 1.5331050157546997} -11/06/2021 23:12:22 - INFO - __main__ - Step 14189: {'lr': 0.0004916799205212739, 'samples': 2724288, 'steps': 14188, 'loss/train': 1.6796480417251587} -11/06/2021 23:12:23 - INFO - __main__ - Step 14190: {'lr': 0.0004916785628002345, 'samples': 2724480, 'steps': 14189, 'loss/train': 1.338007926940918} -11/06/2021 23:12:23 - INFO - __main__ - Step 14191: {'lr': 0.0004916772049702984, 'samples': 2724672, 'steps': 14190, 'loss/train': 2.13338565826416} -11/06/2021 23:12:23 - INFO - __main__ - Step 14192: {'lr': 0.0004916758470314662, 'samples': 2724864, 'steps': 14191, 'loss/train': 1.8545008897781372} -11/06/2021 23:12:24 - INFO - __main__ - Step 14193: {'lr': 0.0004916744889837388, 'samples': 2725056, 'steps': 14192, 'loss/train': 1.7253385782241821} -11/06/2021 23:12:25 - INFO - __main__ - Step 14194: {'lr': 0.0004916731308271165, 'samples': 2725248, 'steps': 14193, 'loss/train': 1.8852863311767578} -11/06/2021 23:12:25 - INFO - __main__ - Step 14195: {'lr': 0.0004916717725616, 'samples': 2725440, 'steps': 14194, 'loss/train': 1.7347588539123535} -11/06/2021 23:12:25 - INFO - __main__ - Step 14196: {'lr': 0.0004916704141871899, 'samples': 2725632, 'steps': 14195, 'loss/train': 1.6380163431167603} -11/06/2021 23:12:26 - INFO - __main__ - Step 14197: {'lr': 0.000491669055703887, 'samples': 2725824, 'steps': 14196, 'loss/train': 1.5754060745239258} -11/06/2021 23:12:27 - INFO - __main__ - Step 14198: {'lr': 0.0004916676971116916, 'samples': 2726016, 'steps': 14197, 'loss/train': 1.435011863708496} -11/06/2021 23:12:27 - INFO - __main__ - Step 14199: {'lr': 0.0004916663384106045, 'samples': 2726208, 'steps': 14198, 'loss/train': 1.975164771080017} -11/06/2021 23:12:28 - INFO - __main__ - Step 14200: {'lr': 0.0004916649796006263, 'samples': 2726400, 'steps': 14199, 'loss/train': 1.1312105655670166} -11/06/2021 23:12:28 - INFO - __main__ - Step 14201: {'lr': 0.0004916636206817575, 'samples': 2726592, 'steps': 14200, 'loss/train': 1.805939793586731} -11/06/2021 23:12:28 - INFO - __main__ - Step 14202: {'lr': 0.0004916622616539988, 'samples': 2726784, 'steps': 14201, 'loss/train': 1.1680221557617188} -11/06/2021 23:12:29 - INFO - __main__ - Step 14203: {'lr': 0.000491660902517351, 'samples': 2726976, 'steps': 14202, 'loss/train': 1.5965232849121094} -11/06/2021 23:12:30 - INFO - __main__ - Step 14204: {'lr': 0.0004916595432718143, 'samples': 2727168, 'steps': 14203, 'loss/train': 1.660688877105713} -11/06/2021 23:12:30 - INFO - __main__ - Step 14205: {'lr': 0.0004916581839173897, 'samples': 2727360, 'steps': 14204, 'loss/train': 2.3039207458496094} -11/06/2021 23:12:31 - INFO - __main__ - Step 14206: {'lr': 0.0004916568244540776, 'samples': 2727552, 'steps': 14205, 'loss/train': 1.4516968727111816} -11/06/2021 23:12:31 - INFO - __main__ - Step 14207: {'lr': 0.0004916554648818787, 'samples': 2727744, 'steps': 14206, 'loss/train': 1.7223396301269531} -11/06/2021 23:12:31 - INFO - __main__ - Step 14208: {'lr': 0.0004916541052007936, 'samples': 2727936, 'steps': 14207, 'loss/train': 1.0482618808746338} -11/06/2021 23:12:32 - INFO - __main__ - Step 14209: {'lr': 0.0004916527454108227, 'samples': 2728128, 'steps': 14208, 'loss/train': 1.7698308229446411} -11/06/2021 23:12:33 - INFO - __main__ - Step 14210: {'lr': 0.0004916513855119669, 'samples': 2728320, 'steps': 14209, 'loss/train': 2.295707941055298} -11/06/2021 23:12:33 - INFO - __main__ - Step 14211: {'lr': 0.0004916500255042268, 'samples': 2728512, 'steps': 14210, 'loss/train': 1.637235164642334} -11/06/2021 23:12:33 - INFO - __main__ - Step 14212: {'lr': 0.0004916486653876029, 'samples': 2728704, 'steps': 14211, 'loss/train': 1.552703619003296} -11/06/2021 23:12:34 - INFO - __main__ - Step 14213: {'lr': 0.0004916473051620958, 'samples': 2728896, 'steps': 14212, 'loss/train': 2.0507657527923584} -11/06/2021 23:12:35 - INFO - __main__ - Step 14214: {'lr': 0.0004916459448277062, 'samples': 2729088, 'steps': 14213, 'loss/train': 2.118166446685791} -11/06/2021 23:12:35 - INFO - __main__ - Step 14215: {'lr': 0.0004916445843844346, 'samples': 2729280, 'steps': 14214, 'loss/train': 1.8859989643096924} -11/06/2021 23:12:36 - INFO - __main__ - Step 14216: {'lr': 0.0004916432238322818, 'samples': 2729472, 'steps': 14215, 'loss/train': 1.5724775791168213} -11/06/2021 23:12:36 - INFO - __main__ - Step 14217: {'lr': 0.0004916418631712481, 'samples': 2729664, 'steps': 14216, 'loss/train': 1.3125375509262085} -11/06/2021 23:12:36 - INFO - __main__ - Step 14218: {'lr': 0.0004916405024013344, 'samples': 2729856, 'steps': 14217, 'loss/train': 1.8595951795578003} -11/06/2021 23:12:37 - INFO - __main__ - Step 14219: {'lr': 0.0004916391415225413, 'samples': 2730048, 'steps': 14218, 'loss/train': 1.1561071872711182} -11/06/2021 23:12:38 - INFO - __main__ - Step 14220: {'lr': 0.0004916377805348692, 'samples': 2730240, 'steps': 14219, 'loss/train': 1.8915315866470337} -11/06/2021 23:12:38 - INFO - __main__ - Step 14221: {'lr': 0.000491636419438319, 'samples': 2730432, 'steps': 14220, 'loss/train': 1.322358250617981} -11/06/2021 23:12:38 - INFO - __main__ - Step 14222: {'lr': 0.000491635058232891, 'samples': 2730624, 'steps': 14221, 'loss/train': 1.5473992824554443} -11/06/2021 23:12:39 - INFO - __main__ - Step 14223: {'lr': 0.0004916336969185861, 'samples': 2730816, 'steps': 14222, 'loss/train': 0.6478114724159241} -11/06/2021 23:12:40 - INFO - __main__ - Step 14224: {'lr': 0.0004916323354954047, 'samples': 2731008, 'steps': 14223, 'loss/train': 1.2803329229354858} -11/06/2021 23:12:40 - INFO - __main__ - Step 14225: {'lr': 0.0004916309739633475, 'samples': 2731200, 'steps': 14224, 'loss/train': 1.5547466278076172} -11/06/2021 23:12:40 - INFO - __main__ - Step 14226: {'lr': 0.0004916296123224151, 'samples': 2731392, 'steps': 14225, 'loss/train': 2.0657129287719727} -11/06/2021 23:12:41 - INFO - __main__ - Step 14227: {'lr': 0.0004916282505726082, 'samples': 2731584, 'steps': 14226, 'loss/train': 1.7537693977355957} -11/06/2021 23:12:41 - INFO - __main__ - Step 14228: {'lr': 0.0004916268887139272, 'samples': 2731776, 'steps': 14227, 'loss/train': 1.8315138816833496} -11/06/2021 23:12:42 - INFO - __main__ - Step 14229: {'lr': 0.000491625526746373, 'samples': 2731968, 'steps': 14228, 'loss/train': 2.130446434020996} -11/06/2021 23:12:43 - INFO - __main__ - Step 14230: {'lr': 0.000491624164669946, 'samples': 2732160, 'steps': 14229, 'loss/train': 2.0926835536956787} -11/06/2021 23:12:43 - INFO - __main__ - Step 14231: {'lr': 0.0004916228024846469, 'samples': 2732352, 'steps': 14230, 'loss/train': 1.9206883907318115} -11/06/2021 23:12:43 - INFO - __main__ - Step 14232: {'lr': 0.0004916214401904763, 'samples': 2732544, 'steps': 14231, 'loss/train': 1.461196780204773} -11/06/2021 23:12:44 - INFO - __main__ - Step 14233: {'lr': 0.0004916200777874348, 'samples': 2732736, 'steps': 14232, 'loss/train': 1.8770463466644287} -11/06/2021 23:12:45 - INFO - __main__ - Step 14234: {'lr': 0.000491618715275523, 'samples': 2732928, 'steps': 14233, 'loss/train': 2.0279908180236816} -11/06/2021 23:12:46 - INFO - __main__ - Step 14235: {'lr': 0.0004916173526547415, 'samples': 2733120, 'steps': 14234, 'loss/train': 1.2167682647705078} -11/06/2021 23:12:46 - INFO - __main__ - Step 14236: {'lr': 0.000491615989925091, 'samples': 2733312, 'steps': 14235, 'loss/train': 1.5853732824325562} -11/06/2021 23:12:46 - INFO - __main__ - Step 14237: {'lr': 0.0004916146270865721, 'samples': 2733504, 'steps': 14236, 'loss/train': 2.5321567058563232} -11/06/2021 23:12:47 - INFO - __main__ - Step 14238: {'lr': 0.0004916132641391854, 'samples': 2733696, 'steps': 14237, 'loss/train': 1.8508648872375488} -11/06/2021 23:12:47 - INFO - __main__ - Step 14239: {'lr': 0.0004916119010829314, 'samples': 2733888, 'steps': 14238, 'loss/train': 1.860944390296936} -11/06/2021 23:12:47 - INFO - __main__ - Step 14240: {'lr': 0.0004916105379178108, 'samples': 2734080, 'steps': 14239, 'loss/train': 1.910184621810913} -11/06/2021 23:12:48 - INFO - __main__ - Step 14241: {'lr': 0.0004916091746438243, 'samples': 2734272, 'steps': 14240, 'loss/train': 1.9223930835723877} -11/06/2021 23:12:49 - INFO - __main__ - Step 14242: {'lr': 0.0004916078112609724, 'samples': 2734464, 'steps': 14241, 'loss/train': 1.7084510326385498} -11/06/2021 23:12:49 - INFO - __main__ - Step 14243: {'lr': 0.0004916064477692557, 'samples': 2734656, 'steps': 14242, 'loss/train': 0.43883585929870605} -11/06/2021 23:12:49 - INFO - __main__ - Step 14244: {'lr': 0.0004916050841686748, 'samples': 2734848, 'steps': 14243, 'loss/train': 1.6944113969802856} -11/06/2021 23:12:50 - INFO - __main__ - Step 14245: {'lr': 0.0004916037204592306, 'samples': 2735040, 'steps': 14244, 'loss/train': 1.1687214374542236} -11/06/2021 23:12:51 - INFO - __main__ - Step 14246: {'lr': 0.0004916023566409233, 'samples': 2735232, 'steps': 14245, 'loss/train': 2.218296766281128} -11/06/2021 23:12:51 - INFO - __main__ - Step 14247: {'lr': 0.0004916009927137538, 'samples': 2735424, 'steps': 14246, 'loss/train': 1.7040735483169556} -11/06/2021 23:12:52 - INFO - __main__ - Step 14248: {'lr': 0.0004915996286777226, 'samples': 2735616, 'steps': 14247, 'loss/train': 1.2565326690673828} -11/06/2021 23:12:52 - INFO - __main__ - Step 14249: {'lr': 0.0004915982645328304, 'samples': 2735808, 'steps': 14248, 'loss/train': 1.6930842399597168} -11/06/2021 23:12:52 - INFO - __main__ - Step 14250: {'lr': 0.0004915969002790777, 'samples': 2736000, 'steps': 14249, 'loss/train': 1.771859049797058} -11/06/2021 23:12:53 - INFO - __main__ - Step 14251: {'lr': 0.0004915955359164651, 'samples': 2736192, 'steps': 14250, 'loss/train': 1.4663689136505127} -11/06/2021 23:12:54 - INFO - __main__ - Step 14252: {'lr': 0.0004915941714449933, 'samples': 2736384, 'steps': 14251, 'loss/train': 1.6903026103973389} -11/06/2021 23:12:54 - INFO - __main__ - Step 14253: {'lr': 0.000491592806864663, 'samples': 2736576, 'steps': 14252, 'loss/train': 1.7190121412277222} -11/06/2021 23:12:54 - INFO - __main__ - Step 14254: {'lr': 0.0004915914421754746, 'samples': 2736768, 'steps': 14253, 'loss/train': 0.6711317300796509} -11/06/2021 23:12:55 - INFO - __main__ - Step 14255: {'lr': 0.0004915900773774289, 'samples': 2736960, 'steps': 14254, 'loss/train': 1.9526695013046265} -11/06/2021 23:12:55 - INFO - __main__ - Step 14256: {'lr': 0.0004915887124705263, 'samples': 2737152, 'steps': 14255, 'loss/train': 2.055246353149414} -11/06/2021 23:12:56 - INFO - __main__ - Step 14257: {'lr': 0.0004915873474547677, 'samples': 2737344, 'steps': 14256, 'loss/train': 1.7780791521072388} -11/06/2021 23:12:57 - INFO - __main__ - Step 14258: {'lr': 0.0004915859823301535, 'samples': 2737536, 'steps': 14257, 'loss/train': 1.91822350025177} -11/06/2021 23:12:57 - INFO - __main__ - Step 14259: {'lr': 0.0004915846170966845, 'samples': 2737728, 'steps': 14258, 'loss/train': 1.2504817247390747} -11/06/2021 23:12:57 - INFO - __main__ - Step 14260: {'lr': 0.000491583251754361, 'samples': 2737920, 'steps': 14259, 'loss/train': 2.1529762744903564} -11/06/2021 23:12:58 - INFO - __main__ - Step 14261: {'lr': 0.0004915818863031839, 'samples': 2738112, 'steps': 14260, 'loss/train': 2.2141220569610596} -11/06/2021 23:12:58 - INFO - __main__ - Step 14262: {'lr': 0.0004915805207431537, 'samples': 2738304, 'steps': 14261, 'loss/train': 1.4041943550109863} -11/06/2021 23:12:59 - INFO - __main__ - Step 14263: {'lr': 0.0004915791550742712, 'samples': 2738496, 'steps': 14262, 'loss/train': 2.012119770050049} -11/06/2021 23:12:59 - INFO - __main__ - Step 14264: {'lr': 0.0004915777892965368, 'samples': 2738688, 'steps': 14263, 'loss/train': 1.8272478580474854} -11/06/2021 23:13:00 - INFO - __main__ - Step 14265: {'lr': 0.0004915764234099511, 'samples': 2738880, 'steps': 14264, 'loss/train': 1.6100664138793945} -11/06/2021 23:13:00 - INFO - __main__ - Step 14266: {'lr': 0.0004915750574145148, 'samples': 2739072, 'steps': 14265, 'loss/train': 1.9792180061340332} -11/06/2021 23:13:00 - INFO - __main__ - Step 14267: {'lr': 0.0004915736913102285, 'samples': 2739264, 'steps': 14266, 'loss/train': 1.8761942386627197} -11/06/2021 23:13:02 - INFO - __main__ - Step 14268: {'lr': 0.0004915723250970928, 'samples': 2739456, 'steps': 14267, 'loss/train': 2.067959785461426} -11/06/2021 23:13:02 - INFO - __main__ - Step 14269: {'lr': 0.0004915709587751084, 'samples': 2739648, 'steps': 14268, 'loss/train': 2.4542698860168457} -11/06/2021 23:13:02 - INFO - __main__ - Step 14270: {'lr': 0.0004915695923442759, 'samples': 2739840, 'steps': 14269, 'loss/train': 1.489783763885498} -11/06/2021 23:13:03 - INFO - __main__ - Step 14271: {'lr': 0.0004915682258045958, 'samples': 2740032, 'steps': 14270, 'loss/train': 1.8175733089447021} -11/06/2021 23:13:03 - INFO - __main__ - Step 14272: {'lr': 0.0004915668591560688, 'samples': 2740224, 'steps': 14271, 'loss/train': 1.3902310132980347} -11/06/2021 23:13:04 - INFO - __main__ - Step 14273: {'lr': 0.0004915654923986955, 'samples': 2740416, 'steps': 14272, 'loss/train': 1.5795223712921143} -11/06/2021 23:13:04 - INFO - __main__ - Step 14274: {'lr': 0.0004915641255324764, 'samples': 2740608, 'steps': 14273, 'loss/train': 1.8649059534072876} -11/06/2021 23:13:05 - INFO - __main__ - Step 14275: {'lr': 0.0004915627585574124, 'samples': 2740800, 'steps': 14274, 'loss/train': 1.643608570098877} -11/06/2021 23:13:05 - INFO - __main__ - Step 14276: {'lr': 0.0004915613914735038, 'samples': 2740992, 'steps': 14275, 'loss/train': 2.0051262378692627} -11/06/2021 23:13:05 - INFO - __main__ - Step 14277: {'lr': 0.0004915600242807516, 'samples': 2741184, 'steps': 14276, 'loss/train': 1.455479383468628} -11/06/2021 23:13:06 - INFO - __main__ - Step 14278: {'lr': 0.000491558656979156, 'samples': 2741376, 'steps': 14277, 'loss/train': 1.6889221668243408} -11/06/2021 23:13:07 - INFO - __main__ - Step 14279: {'lr': 0.0004915572895687179, 'samples': 2741568, 'steps': 14278, 'loss/train': 1.9221125841140747} -11/06/2021 23:13:07 - INFO - __main__ - Step 14280: {'lr': 0.0004915559220494376, 'samples': 2741760, 'steps': 14279, 'loss/train': 1.842481017112732} -11/06/2021 23:13:07 - INFO - __main__ - Step 14281: {'lr': 0.0004915545544213161, 'samples': 2741952, 'steps': 14280, 'loss/train': 1.5338388681411743} -11/06/2021 23:13:08 - INFO - __main__ - Step 14282: {'lr': 0.0004915531866843539, 'samples': 2742144, 'steps': 14281, 'loss/train': 1.903611660003662} -11/06/2021 23:13:09 - INFO - __main__ - Step 14283: {'lr': 0.0004915518188385514, 'samples': 2742336, 'steps': 14282, 'loss/train': 1.557709813117981} -11/06/2021 23:13:09 - INFO - __main__ - Step 14284: {'lr': 0.0004915504508839095, 'samples': 2742528, 'steps': 14283, 'loss/train': 1.7310574054718018} -11/06/2021 23:13:09 - INFO - __main__ - Step 14285: {'lr': 0.0004915490828204287, 'samples': 2742720, 'steps': 14284, 'loss/train': 1.8797122240066528} -11/06/2021 23:13:10 - INFO - __main__ - Step 14286: {'lr': 0.0004915477146481095, 'samples': 2742912, 'steps': 14285, 'loss/train': 1.9240556955337524} -11/06/2021 23:13:10 - INFO - __main__ - Step 14287: {'lr': 0.0004915463463669527, 'samples': 2743104, 'steps': 14286, 'loss/train': 2.307543992996216} -11/06/2021 23:13:11 - INFO - __main__ - Step 14288: {'lr': 0.0004915449779769589, 'samples': 2743296, 'steps': 14287, 'loss/train': 2.076409339904785} -11/06/2021 23:13:12 - INFO - __main__ - Step 14289: {'lr': 0.0004915436094781285, 'samples': 2743488, 'steps': 14288, 'loss/train': 1.6683952808380127} -11/06/2021 23:13:12 - INFO - __main__ - Step 14290: {'lr': 0.0004915422408704624, 'samples': 2743680, 'steps': 14289, 'loss/train': 1.3777574300765991} -11/06/2021 23:13:12 - INFO - __main__ - Step 14291: {'lr': 0.0004915408721539612, 'samples': 2743872, 'steps': 14290, 'loss/train': 1.556388020515442} -11/06/2021 23:13:13 - INFO - __main__ - Step 14292: {'lr': 0.0004915395033286251, 'samples': 2744064, 'steps': 14291, 'loss/train': 1.8184715509414673} -11/06/2021 23:13:13 - INFO - __main__ - Step 14293: {'lr': 0.0004915381343944552, 'samples': 2744256, 'steps': 14292, 'loss/train': 1.5744520425796509} -11/06/2021 23:13:14 - INFO - __main__ - Step 14294: {'lr': 0.0004915367653514521, 'samples': 2744448, 'steps': 14293, 'loss/train': 1.5268954038619995} -11/06/2021 23:13:14 - INFO - __main__ - Step 14295: {'lr': 0.0004915353961996161, 'samples': 2744640, 'steps': 14294, 'loss/train': 1.4393970966339111} -11/06/2021 23:13:15 - INFO - __main__ - Step 14296: {'lr': 0.000491534026938948, 'samples': 2744832, 'steps': 14295, 'loss/train': 1.8665683269500732} -11/06/2021 23:13:15 - INFO - __main__ - Step 14297: {'lr': 0.0004915326575694484, 'samples': 2745024, 'steps': 14296, 'loss/train': 2.0807924270629883} -11/06/2021 23:13:15 - INFO - __main__ - Step 14298: {'lr': 0.0004915312880911178, 'samples': 2745216, 'steps': 14297, 'loss/train': 1.800079345703125} -11/06/2021 23:13:16 - INFO - __main__ - Step 14299: {'lr': 0.000491529918503957, 'samples': 2745408, 'steps': 14298, 'loss/train': 1.6191036701202393} -11/06/2021 23:13:17 - INFO - __main__ - Step 14300: {'lr': 0.0004915285488079666, 'samples': 2745600, 'steps': 14299, 'loss/train': 1.6357394456863403} -11/06/2021 23:13:17 - INFO - __main__ - Step 14301: {'lr': 0.0004915271790031471, 'samples': 2745792, 'steps': 14300, 'loss/train': 1.8493192195892334} -11/06/2021 23:13:17 - INFO - __main__ - Step 14302: {'lr': 0.0004915258090894993, 'samples': 2745984, 'steps': 14301, 'loss/train': 1.3855708837509155} -11/06/2021 23:13:18 - INFO - __main__ - Step 14303: {'lr': 0.0004915244390670236, 'samples': 2746176, 'steps': 14302, 'loss/train': 1.6835711002349854} -11/06/2021 23:13:19 - INFO - __main__ - Step 14304: {'lr': 0.0004915230689357206, 'samples': 2746368, 'steps': 14303, 'loss/train': 1.9127839803695679} -11/06/2021 23:13:19 - INFO - __main__ - Step 14305: {'lr': 0.0004915216986955913, 'samples': 2746560, 'steps': 14304, 'loss/train': 1.7443958520889282} -11/06/2021 23:13:19 - INFO - __main__ - Step 14306: {'lr': 0.0004915203283466359, 'samples': 2746752, 'steps': 14305, 'loss/train': 1.8569912910461426} -11/06/2021 23:13:20 - INFO - __main__ - Step 14307: {'lr': 0.0004915189578888552, 'samples': 2746944, 'steps': 14306, 'loss/train': 2.002859354019165} -11/06/2021 23:13:20 - INFO - __main__ - Step 14308: {'lr': 0.0004915175873222497, 'samples': 2747136, 'steps': 14307, 'loss/train': 1.7802067995071411} -11/06/2021 23:13:21 - INFO - __main__ - Step 14309: {'lr': 0.0004915162166468201, 'samples': 2747328, 'steps': 14308, 'loss/train': 1.61421799659729} -11/06/2021 23:13:22 - INFO - __main__ - Step 14310: {'lr': 0.0004915148458625671, 'samples': 2747520, 'steps': 14309, 'loss/train': 1.5801818370819092} -11/06/2021 23:13:22 - INFO - __main__ - Step 14311: {'lr': 0.0004915134749694912, 'samples': 2747712, 'steps': 14310, 'loss/train': 1.24630606174469} -11/06/2021 23:13:22 - INFO - __main__ - Step 14312: {'lr': 0.000491512103967593, 'samples': 2747904, 'steps': 14311, 'loss/train': 1.8175888061523438} -11/06/2021 23:13:23 - INFO - __main__ - Step 14313: {'lr': 0.0004915107328568733, 'samples': 2748096, 'steps': 14312, 'loss/train': 1.7059366703033447} -11/06/2021 23:13:23 - INFO - __main__ - Step 14314: {'lr': 0.0004915093616373326, 'samples': 2748288, 'steps': 14313, 'loss/train': 1.2261815071105957} -11/06/2021 23:13:24 - INFO - __main__ - Step 14315: {'lr': 0.0004915079903089714, 'samples': 2748480, 'steps': 14314, 'loss/train': 1.8357681035995483} -11/06/2021 23:13:24 - INFO - __main__ - Step 14316: {'lr': 0.0004915066188717905, 'samples': 2748672, 'steps': 14315, 'loss/train': 1.671004056930542} -11/06/2021 23:13:25 - INFO - __main__ - Step 14317: {'lr': 0.0004915052473257904, 'samples': 2748864, 'steps': 14316, 'loss/train': 1.6903188228607178} -11/06/2021 23:13:25 - INFO - __main__ - Step 14318: {'lr': 0.0004915038756709717, 'samples': 2749056, 'steps': 14317, 'loss/train': 1.4683510065078735} -11/06/2021 23:13:25 - INFO - __main__ - Step 14319: {'lr': 0.0004915025039073352, 'samples': 2749248, 'steps': 14318, 'loss/train': 1.8368884325027466} -11/06/2021 23:13:26 - INFO - __main__ - Step 14320: {'lr': 0.0004915011320348814, 'samples': 2749440, 'steps': 14319, 'loss/train': 1.3511337041854858} -11/06/2021 23:13:27 - INFO - __main__ - Step 14321: {'lr': 0.0004914997600536108, 'samples': 2749632, 'steps': 14320, 'loss/train': 1.4233803749084473} -11/06/2021 23:13:27 - INFO - __main__ - Step 14322: {'lr': 0.0004914983879635242, 'samples': 2749824, 'steps': 14321, 'loss/train': 1.6688144207000732} -11/06/2021 23:13:28 - INFO - __main__ - Step 14323: {'lr': 0.0004914970157646222, 'samples': 2750016, 'steps': 14322, 'loss/train': 1.5857484340667725} -11/06/2021 23:13:28 - INFO - __main__ - Step 14324: {'lr': 0.0004914956434569054, 'samples': 2750208, 'steps': 14323, 'loss/train': 1.8138678073883057} -11/06/2021 23:13:29 - INFO - __main__ - Step 14325: {'lr': 0.0004914942710403743, 'samples': 2750400, 'steps': 14324, 'loss/train': 2.092402935028076} -11/06/2021 23:13:29 - INFO - __main__ - Step 14326: {'lr': 0.0004914928985150296, 'samples': 2750592, 'steps': 14325, 'loss/train': 1.820569396018982} -11/06/2021 23:13:30 - INFO - __main__ - Step 14327: {'lr': 0.0004914915258808719, 'samples': 2750784, 'steps': 14326, 'loss/train': 1.4420838356018066} -11/06/2021 23:13:30 - INFO - __main__ - Step 14328: {'lr': 0.0004914901531379019, 'samples': 2750976, 'steps': 14327, 'loss/train': 1.843706727027893} -11/06/2021 23:13:30 - INFO - __main__ - Step 14329: {'lr': 0.0004914887802861201, 'samples': 2751168, 'steps': 14328, 'loss/train': 1.7319104671478271} -11/06/2021 23:13:32 - INFO - __main__ - Step 14330: {'lr': 0.0004914874073255273, 'samples': 2751360, 'steps': 14329, 'loss/train': 1.3918893337249756} -11/06/2021 23:13:32 - INFO - __main__ - Step 14331: {'lr': 0.0004914860342561239, 'samples': 2751552, 'steps': 14330, 'loss/train': 1.587130069732666} -11/06/2021 23:13:32 - INFO - __main__ - Step 14332: {'lr': 0.0004914846610779107, 'samples': 2751744, 'steps': 14331, 'loss/train': 1.7063366174697876} -11/06/2021 23:13:33 - INFO - __main__ - Step 14333: {'lr': 0.0004914832877908881, 'samples': 2751936, 'steps': 14332, 'loss/train': 1.7004281282424927} -11/06/2021 23:13:33 - INFO - __main__ - Step 14334: {'lr': 0.0004914819143950571, 'samples': 2752128, 'steps': 14333, 'loss/train': 1.0245263576507568} -11/06/2021 23:13:33 - INFO - __main__ - Step 14335: {'lr': 0.0004914805408904179, 'samples': 2752320, 'steps': 14334, 'loss/train': 1.9465148448944092} -11/06/2021 23:13:34 - INFO - __main__ - Step 14336: {'lr': 0.0004914791672769713, 'samples': 2752512, 'steps': 14335, 'loss/train': 1.6169592142105103} -11/06/2021 23:13:35 - INFO - __main__ - Step 14337: {'lr': 0.000491477793554718, 'samples': 2752704, 'steps': 14336, 'loss/train': 1.842124342918396} -11/06/2021 23:13:35 - INFO - __main__ - Step 14338: {'lr': 0.0004914764197236584, 'samples': 2752896, 'steps': 14337, 'loss/train': 2.156404495239258} -11/06/2021 23:13:35 - INFO - __main__ - Step 14339: {'lr': 0.0004914750457837933, 'samples': 2753088, 'steps': 14338, 'loss/train': 2.6054229736328125} -11/06/2021 23:13:36 - INFO - __main__ - Step 14340: {'lr': 0.0004914736717351233, 'samples': 2753280, 'steps': 14339, 'loss/train': 0.8791477084159851} -11/06/2021 23:13:37 - INFO - __main__ - Step 14341: {'lr': 0.000491472297577649, 'samples': 2753472, 'steps': 14340, 'loss/train': 2.0689876079559326} -11/06/2021 23:13:37 - INFO - __main__ - Step 14342: {'lr': 0.000491470923311371, 'samples': 2753664, 'steps': 14341, 'loss/train': 2.8645334243774414} -11/06/2021 23:13:38 - INFO - __main__ - Step 14343: {'lr': 0.0004914695489362899, 'samples': 2753856, 'steps': 14342, 'loss/train': 1.755697250366211} -11/06/2021 23:13:38 - INFO - __main__ - Step 14344: {'lr': 0.0004914681744524064, 'samples': 2754048, 'steps': 14343, 'loss/train': 1.9771595001220703} -11/06/2021 23:13:38 - INFO - __main__ - Step 14345: {'lr': 0.0004914667998597211, 'samples': 2754240, 'steps': 14344, 'loss/train': 1.9034637212753296} -11/06/2021 23:13:39 - INFO - __main__ - Step 14346: {'lr': 0.0004914654251582344, 'samples': 2754432, 'steps': 14345, 'loss/train': 2.0097978115081787} -11/06/2021 23:13:40 - INFO - __main__ - Step 14347: {'lr': 0.0004914640503479473, 'samples': 2754624, 'steps': 14346, 'loss/train': 1.8135510683059692} -11/06/2021 23:13:40 - INFO - __main__ - Step 14348: {'lr': 0.0004914626754288601, 'samples': 2754816, 'steps': 14347, 'loss/train': 2.062073230743408} -11/06/2021 23:13:40 - INFO - __main__ - Step 14349: {'lr': 0.0004914613004009736, 'samples': 2755008, 'steps': 14348, 'loss/train': 1.3072386980056763} -11/06/2021 23:13:41 - INFO - __main__ - Step 14350: {'lr': 0.0004914599252642884, 'samples': 2755200, 'steps': 14349, 'loss/train': 1.7098357677459717} -11/06/2021 23:13:41 - INFO - __main__ - Step 14351: {'lr': 0.000491458550018805, 'samples': 2755392, 'steps': 14350, 'loss/train': 1.7779287099838257} -11/06/2021 23:13:42 - INFO - __main__ - Step 14352: {'lr': 0.0004914571746645242, 'samples': 2755584, 'steps': 14351, 'loss/train': 2.2135913372039795} -11/06/2021 23:13:43 - INFO - __main__ - Step 14353: {'lr': 0.0004914557992014465, 'samples': 2755776, 'steps': 14352, 'loss/train': 1.0863014459609985} -11/06/2021 23:13:43 - INFO - __main__ - Step 14354: {'lr': 0.0004914544236295725, 'samples': 2755968, 'steps': 14353, 'loss/train': 1.349368691444397} -11/06/2021 23:13:43 - INFO - __main__ - Step 14355: {'lr': 0.0004914530479489029, 'samples': 2756160, 'steps': 14354, 'loss/train': 1.2938106060028076} -11/06/2021 23:13:44 - INFO - __main__ - Step 14356: {'lr': 0.0004914516721594382, 'samples': 2756352, 'steps': 14355, 'loss/train': 1.8118442296981812} -11/06/2021 23:13:45 - INFO - __main__ - Step 14357: {'lr': 0.0004914502962611792, 'samples': 2756544, 'steps': 14356, 'loss/train': 1.9531524181365967} -11/06/2021 23:13:45 - INFO - __main__ - Step 14358: {'lr': 0.0004914489202541264, 'samples': 2756736, 'steps': 14357, 'loss/train': 1.827507734298706} -11/06/2021 23:13:45 - INFO - __main__ - Step 14359: {'lr': 0.0004914475441382804, 'samples': 2756928, 'steps': 14358, 'loss/train': 1.6210410594940186} -11/06/2021 23:13:46 - INFO - __main__ - Step 14360: {'lr': 0.0004914461679136419, 'samples': 2757120, 'steps': 14359, 'loss/train': 1.5644958019256592} -11/06/2021 23:13:46 - INFO - __main__ - Step 14361: {'lr': 0.0004914447915802115, 'samples': 2757312, 'steps': 14360, 'loss/train': 1.3498966693878174} -11/06/2021 23:13:47 - INFO - __main__ - Step 14362: {'lr': 0.0004914434151379898, 'samples': 2757504, 'steps': 14361, 'loss/train': 1.2043393850326538} -11/06/2021 23:13:47 - INFO - __main__ - Step 14363: {'lr': 0.0004914420385869773, 'samples': 2757696, 'steps': 14362, 'loss/train': 1.314516544342041} -11/06/2021 23:13:48 - INFO - __main__ - Step 14364: {'lr': 0.0004914406619271749, 'samples': 2757888, 'steps': 14363, 'loss/train': 1.803429126739502} -11/06/2021 23:13:48 - INFO - __main__ - Step 14365: {'lr': 0.0004914392851585829, 'samples': 2758080, 'steps': 14364, 'loss/train': 1.7351176738739014} -11/06/2021 23:13:48 - INFO - __main__ - Step 14366: {'lr': 0.0004914379082812023, 'samples': 2758272, 'steps': 14365, 'loss/train': 1.1345579624176025} -11/06/2021 23:13:49 - INFO - __main__ - Step 14367: {'lr': 0.0004914365312950333, 'samples': 2758464, 'steps': 14366, 'loss/train': 2.234651803970337} -11/06/2021 23:13:50 - INFO - __main__ - Step 14368: {'lr': 0.0004914351542000768, 'samples': 2758656, 'steps': 14367, 'loss/train': 1.3707553148269653} -11/06/2021 23:13:50 - INFO - __main__ - Step 14369: {'lr': 0.0004914337769963334, 'samples': 2758848, 'steps': 14368, 'loss/train': 1.8129569292068481} -11/06/2021 23:13:51 - INFO - __main__ - Step 14370: {'lr': 0.0004914323996838036, 'samples': 2759040, 'steps': 14369, 'loss/train': 1.368338942527771} -11/06/2021 23:13:51 - INFO - __main__ - Step 14371: {'lr': 0.0004914310222624881, 'samples': 2759232, 'steps': 14370, 'loss/train': 1.6486504077911377} -11/06/2021 23:13:51 - INFO - __main__ - Step 14372: {'lr': 0.0004914296447323875, 'samples': 2759424, 'steps': 14371, 'loss/train': 1.776429295539856} -11/06/2021 23:13:52 - INFO - __main__ - Step 14373: {'lr': 0.0004914282670935025, 'samples': 2759616, 'steps': 14372, 'loss/train': 1.8240113258361816} -11/06/2021 23:13:53 - INFO - __main__ - Step 14374: {'lr': 0.0004914268893458336, 'samples': 2759808, 'steps': 14373, 'loss/train': 1.7623484134674072} -11/06/2021 23:13:53 - INFO - __main__ - Step 14375: {'lr': 0.0004914255114893814, 'samples': 2760000, 'steps': 14374, 'loss/train': 1.851312518119812} -11/06/2021 23:13:53 - INFO - __main__ - Step 14376: {'lr': 0.0004914241335241467, 'samples': 2760192, 'steps': 14375, 'loss/train': 1.748906135559082} -11/06/2021 23:13:54 - INFO - __main__ - Step 14377: {'lr': 0.0004914227554501299, 'samples': 2760384, 'steps': 14376, 'loss/train': 0.8111178278923035} -11/06/2021 23:13:55 - INFO - __main__ - Step 14378: {'lr': 0.0004914213772673319, 'samples': 2760576, 'steps': 14377, 'loss/train': 0.3423219919204712} -11/06/2021 23:13:56 - INFO - __main__ - Step 14379: {'lr': 0.0004914199989757529, 'samples': 2760768, 'steps': 14378, 'loss/train': 1.715069055557251} -11/06/2021 23:13:56 - INFO - __main__ - Step 14380: {'lr': 0.000491418620575394, 'samples': 2760960, 'steps': 14379, 'loss/train': 1.3890851736068726} -11/06/2021 23:13:57 - INFO - __main__ - Step 14381: {'lr': 0.0004914172420662556, 'samples': 2761152, 'steps': 14380, 'loss/train': 1.8425896167755127} -11/06/2021 23:13:57 - INFO - __main__ - Step 14382: {'lr': 0.0004914158634483381, 'samples': 2761344, 'steps': 14381, 'loss/train': 1.8168810606002808} -11/06/2021 23:13:57 - INFO - __main__ - Step 14383: {'lr': 0.0004914144847216425, 'samples': 2761536, 'steps': 14382, 'loss/train': 1.2000967264175415} -11/06/2021 23:13:58 - INFO - __main__ - Step 14384: {'lr': 0.0004914131058861693, 'samples': 2761728, 'steps': 14383, 'loss/train': 1.7531344890594482} -11/06/2021 23:13:59 - INFO - __main__ - Step 14385: {'lr': 0.000491411726941919, 'samples': 2761920, 'steps': 14384, 'loss/train': 1.7564046382904053} -11/06/2021 23:13:59 - INFO - __main__ - Step 14386: {'lr': 0.0004914103478888922, 'samples': 2762112, 'steps': 14385, 'loss/train': 1.1627519130706787} -11/06/2021 23:13:59 - INFO - __main__ - Step 14387: {'lr': 0.0004914089687270898, 'samples': 2762304, 'steps': 14386, 'loss/train': 1.7761569023132324} -11/06/2021 23:14:00 - INFO - __main__ - Step 14388: {'lr': 0.0004914075894565122, 'samples': 2762496, 'steps': 14387, 'loss/train': 1.060185194015503} -11/06/2021 23:14:00 - INFO - __main__ - Step 14389: {'lr': 0.00049140621007716, 'samples': 2762688, 'steps': 14388, 'loss/train': 1.5696700811386108} -11/06/2021 23:14:01 - INFO - __main__ - Step 14390: {'lr': 0.0004914048305890339, 'samples': 2762880, 'steps': 14389, 'loss/train': 1.3252995014190674} -11/06/2021 23:14:01 - INFO - __main__ - Step 14391: {'lr': 0.0004914034509921345, 'samples': 2763072, 'steps': 14390, 'loss/train': 2.1088061332702637} -11/06/2021 23:14:02 - INFO - __main__ - Step 14392: {'lr': 0.0004914020712864626, 'samples': 2763264, 'steps': 14391, 'loss/train': 1.9577943086624146} -11/06/2021 23:14:02 - INFO - __main__ - Step 14393: {'lr': 0.0004914006914720184, 'samples': 2763456, 'steps': 14392, 'loss/train': 1.1342967748641968} -11/06/2021 23:14:03 - INFO - __main__ - Step 14394: {'lr': 0.0004913993115488029, 'samples': 2763648, 'steps': 14393, 'loss/train': 1.1955634355545044} -11/06/2021 23:14:03 - INFO - __main__ - Step 14395: {'lr': 0.0004913979315168167, 'samples': 2763840, 'steps': 14394, 'loss/train': 1.5130412578582764} -11/06/2021 23:14:04 - INFO - __main__ - Step 14396: {'lr': 0.0004913965513760601, 'samples': 2764032, 'steps': 14395, 'loss/train': 1.6799837350845337} -11/06/2021 23:14:04 - INFO - __main__ - Step 14397: {'lr': 0.0004913951711265341, 'samples': 2764224, 'steps': 14396, 'loss/train': 1.8832666873931885} -11/06/2021 23:14:05 - INFO - __main__ - Step 14398: {'lr': 0.0004913937907682391, 'samples': 2764416, 'steps': 14397, 'loss/train': 1.6365022659301758} -11/06/2021 23:14:05 - INFO - __main__ - Step 14399: {'lr': 0.0004913924103011757, 'samples': 2764608, 'steps': 14398, 'loss/train': 1.8931413888931274} -11/06/2021 23:14:05 - INFO - __main__ - Step 14400: {'lr': 0.0004913910297253448, 'samples': 2764800, 'steps': 14399, 'loss/train': 1.8184783458709717} -11/06/2021 23:14:06 - INFO - __main__ - Step 14401: {'lr': 0.0004913896490407467, 'samples': 2764992, 'steps': 14400, 'loss/train': 1.6293751001358032} -11/06/2021 23:14:07 - INFO - __main__ - Step 14402: {'lr': 0.0004913882682473821, 'samples': 2765184, 'steps': 14401, 'loss/train': 1.6088601350784302} -11/06/2021 23:14:07 - INFO - __main__ - Step 14403: {'lr': 0.0004913868873452519, 'samples': 2765376, 'steps': 14402, 'loss/train': 1.4631474018096924} -11/06/2021 23:14:07 - INFO - __main__ - Step 14404: {'lr': 0.0004913855063343563, 'samples': 2765568, 'steps': 14403, 'loss/train': 1.457092523574829} -11/06/2021 23:14:08 - INFO - __main__ - Step 14405: {'lr': 0.0004913841252146961, 'samples': 2765760, 'steps': 14404, 'loss/train': 1.6985125541687012} -11/06/2021 23:14:09 - INFO - __main__ - Step 14406: {'lr': 0.000491382743986272, 'samples': 2765952, 'steps': 14405, 'loss/train': 2.084760904312134} -11/06/2021 23:14:09 - INFO - __main__ - Step 14407: {'lr': 0.0004913813626490845, 'samples': 2766144, 'steps': 14406, 'loss/train': 1.3225696086883545} -11/06/2021 23:14:09 - INFO - __main__ - Step 14408: {'lr': 0.0004913799812031343, 'samples': 2766336, 'steps': 14407, 'loss/train': 1.6497886180877686} -11/06/2021 23:14:10 - INFO - __main__ - Step 14409: {'lr': 0.0004913785996484221, 'samples': 2766528, 'steps': 14408, 'loss/train': 1.065016746520996} -11/06/2021 23:14:10 - INFO - __main__ - Step 14410: {'lr': 0.0004913772179849483, 'samples': 2766720, 'steps': 14409, 'loss/train': 1.7048285007476807} -11/06/2021 23:14:11 - INFO - __main__ - Step 14411: {'lr': 0.0004913758362127137, 'samples': 2766912, 'steps': 14410, 'loss/train': 1.4540810585021973} -11/06/2021 23:14:11 - INFO - __main__ - Step 14412: {'lr': 0.0004913744543317189, 'samples': 2767104, 'steps': 14411, 'loss/train': 1.4666005373001099} -11/06/2021 23:14:12 - INFO - __main__ - Step 14413: {'lr': 0.0004913730723419645, 'samples': 2767296, 'steps': 14412, 'loss/train': 1.2720320224761963} -11/06/2021 23:14:12 - INFO - __main__ - Step 14414: {'lr': 0.000491371690243451, 'samples': 2767488, 'steps': 14413, 'loss/train': 1.3805193901062012} -11/06/2021 23:14:12 - INFO - __main__ - Step 14415: {'lr': 0.0004913703080361793, 'samples': 2767680, 'steps': 14414, 'loss/train': 2.1130664348602295} -11/06/2021 23:14:14 - INFO - __main__ - Step 14416: {'lr': 0.0004913689257201499, 'samples': 2767872, 'steps': 14415, 'loss/train': 1.317294955253601} -11/06/2021 23:14:14 - INFO - __main__ - Step 14417: {'lr': 0.0004913675432953633, 'samples': 2768064, 'steps': 14416, 'loss/train': 1.1042780876159668} -11/06/2021 23:14:14 - INFO - __main__ - Step 14418: {'lr': 0.0004913661607618202, 'samples': 2768256, 'steps': 14417, 'loss/train': 2.0876216888427734} -11/06/2021 23:14:15 - INFO - __main__ - Step 14419: {'lr': 0.0004913647781195212, 'samples': 2768448, 'steps': 14418, 'loss/train': 1.5809930562973022} -11/06/2021 23:14:15 - INFO - __main__ - Step 14420: {'lr': 0.000491363395368467, 'samples': 2768640, 'steps': 14419, 'loss/train': 0.730297863483429} -11/06/2021 23:14:15 - INFO - __main__ - Step 14421: {'lr': 0.0004913620125086581, 'samples': 2768832, 'steps': 14420, 'loss/train': 5.8645501136779785} -11/06/2021 23:14:16 - INFO - __main__ - Step 14422: {'lr': 0.0004913606295400953, 'samples': 2769024, 'steps': 14421, 'loss/train': 2.153425455093384} -11/06/2021 23:14:17 - INFO - __main__ - Step 14423: {'lr': 0.000491359246462779, 'samples': 2769216, 'steps': 14422, 'loss/train': 1.7173231840133667} -11/06/2021 23:14:17 - INFO - __main__ - Step 14424: {'lr': 0.0004913578632767101, 'samples': 2769408, 'steps': 14423, 'loss/train': 1.7363717555999756} -11/06/2021 23:14:18 - INFO - __main__ - Step 14425: {'lr': 0.0004913564799818891, 'samples': 2769600, 'steps': 14424, 'loss/train': 1.796966314315796} -11/06/2021 23:14:18 - INFO - __main__ - Step 14426: {'lr': 0.0004913550965783165, 'samples': 2769792, 'steps': 14425, 'loss/train': 1.8378410339355469} -11/06/2021 23:14:19 - INFO - __main__ - Step 14427: {'lr': 0.000491353713065993, 'samples': 2769984, 'steps': 14426, 'loss/train': 1.9022510051727295} -11/06/2021 23:14:19 - INFO - __main__ - Step 14428: {'lr': 0.0004913523294449193, 'samples': 2770176, 'steps': 14427, 'loss/train': 1.5578607320785522} -11/06/2021 23:14:20 - INFO - __main__ - Step 14429: {'lr': 0.0004913509457150959, 'samples': 2770368, 'steps': 14428, 'loss/train': 1.9274928569793701} -11/06/2021 23:14:20 - INFO - __main__ - Step 14430: {'lr': 0.0004913495618765235, 'samples': 2770560, 'steps': 14429, 'loss/train': 1.6800792217254639} -11/06/2021 23:14:20 - INFO - __main__ - Step 14431: {'lr': 0.0004913481779292027, 'samples': 2770752, 'steps': 14430, 'loss/train': 1.7277616262435913} -11/06/2021 23:14:21 - INFO - __main__ - Step 14432: {'lr': 0.0004913467938731341, 'samples': 2770944, 'steps': 14431, 'loss/train': 1.655822992324829} -11/06/2021 23:14:22 - INFO - __main__ - Step 14433: {'lr': 0.0004913454097083185, 'samples': 2771136, 'steps': 14432, 'loss/train': 1.733009696006775} -11/06/2021 23:14:22 - INFO - __main__ - Step 14434: {'lr': 0.0004913440254347563, 'samples': 2771328, 'steps': 14433, 'loss/train': 2.231706380844116} -11/06/2021 23:14:23 - INFO - __main__ - Step 14435: {'lr': 0.0004913426410524482, 'samples': 2771520, 'steps': 14434, 'loss/train': 0.5304341316223145} -11/06/2021 23:14:23 - INFO - __main__ - Step 14436: {'lr': 0.0004913412565613948, 'samples': 2771712, 'steps': 14435, 'loss/train': 1.5568188428878784} -11/06/2021 23:14:23 - INFO - __main__ - Step 14437: {'lr': 0.0004913398719615968, 'samples': 2771904, 'steps': 14436, 'loss/train': 1.682983160018921} -11/06/2021 23:14:24 - INFO - __main__ - Step 14438: {'lr': 0.0004913384872530548, 'samples': 2772096, 'steps': 14437, 'loss/train': 1.6241941452026367} -11/06/2021 23:14:25 - INFO - __main__ - Step 14439: {'lr': 0.0004913371024357694, 'samples': 2772288, 'steps': 14438, 'loss/train': 1.7349668741226196} -11/06/2021 23:14:25 - INFO - __main__ - Step 14440: {'lr': 0.0004913357175097412, 'samples': 2772480, 'steps': 14439, 'loss/train': 2.172203302383423} -11/06/2021 23:14:25 - INFO - __main__ - Step 14441: {'lr': 0.0004913343324749708, 'samples': 2772672, 'steps': 14440, 'loss/train': 0.5017638206481934} -11/06/2021 23:14:26 - INFO - __main__ - Step 14442: {'lr': 0.000491332947331459, 'samples': 2772864, 'steps': 14441, 'loss/train': 1.8418453931808472} -11/06/2021 23:14:27 - INFO - __main__ - Step 14443: {'lr': 0.0004913315620792061, 'samples': 2773056, 'steps': 14442, 'loss/train': 1.784220576286316} -11/06/2021 23:14:27 - INFO - __main__ - Step 14444: {'lr': 0.0004913301767182131, 'samples': 2773248, 'steps': 14443, 'loss/train': 1.6641216278076172} -11/06/2021 23:14:27 - INFO - __main__ - Step 14445: {'lr': 0.0004913287912484804, 'samples': 2773440, 'steps': 14444, 'loss/train': 1.1389085054397583} -11/06/2021 23:14:28 - INFO - __main__ - Step 14446: {'lr': 0.0004913274056700087, 'samples': 2773632, 'steps': 14445, 'loss/train': 1.5397385358810425} -11/06/2021 23:14:28 - INFO - __main__ - Step 14447: {'lr': 0.0004913260199827986, 'samples': 2773824, 'steps': 14446, 'loss/train': 2.1198136806488037} -11/06/2021 23:14:29 - INFO - __main__ - Step 14448: {'lr': 0.0004913246341868506, 'samples': 2774016, 'steps': 14447, 'loss/train': 1.6462889909744263} -11/06/2021 23:14:30 - INFO - __main__ - Step 14449: {'lr': 0.0004913232482821656, 'samples': 2774208, 'steps': 14448, 'loss/train': 1.6559960842132568} -11/06/2021 23:14:30 - INFO - __main__ - Step 14450: {'lr': 0.0004913218622687439, 'samples': 2774400, 'steps': 14449, 'loss/train': 1.4591246843338013} -11/06/2021 23:14:30 - INFO - __main__ - Step 14451: {'lr': 0.0004913204761465864, 'samples': 2774592, 'steps': 14450, 'loss/train': 1.9061264991760254} -11/06/2021 23:14:31 - INFO - __main__ - Step 14452: {'lr': 0.0004913190899156936, 'samples': 2774784, 'steps': 14451, 'loss/train': 1.592616081237793} -11/06/2021 23:14:31 - INFO - __main__ - Step 14453: {'lr': 0.0004913177035760661, 'samples': 2774976, 'steps': 14452, 'loss/train': 1.2767666578292847} -11/06/2021 23:14:32 - INFO - __main__ - Step 14454: {'lr': 0.0004913163171277046, 'samples': 2775168, 'steps': 14453, 'loss/train': 1.2585607767105103} -11/06/2021 23:14:32 - INFO - __main__ - Step 14455: {'lr': 0.0004913149305706097, 'samples': 2775360, 'steps': 14454, 'loss/train': 1.6764591932296753} -11/06/2021 23:14:33 - INFO - __main__ - Step 14456: {'lr': 0.0004913135439047821, 'samples': 2775552, 'steps': 14455, 'loss/train': 1.7716397047042847} -11/06/2021 23:14:33 - INFO - __main__ - Step 14457: {'lr': 0.0004913121571302222, 'samples': 2775744, 'steps': 14456, 'loss/train': 1.690000057220459} -11/06/2021 23:14:33 - INFO - __main__ - Step 14458: {'lr': 0.0004913107702469308, 'samples': 2775936, 'steps': 14457, 'loss/train': 1.5991852283477783} -11/06/2021 23:14:34 - INFO - __main__ - Step 14459: {'lr': 0.0004913093832549085, 'samples': 2776128, 'steps': 14458, 'loss/train': 1.8135044574737549} -11/06/2021 23:14:35 - INFO - __main__ - Step 14460: {'lr': 0.000491307996154156, 'samples': 2776320, 'steps': 14459, 'loss/train': 1.87995445728302} -11/06/2021 23:14:35 - INFO - __main__ - Step 14461: {'lr': 0.0004913066089446737, 'samples': 2776512, 'steps': 14460, 'loss/train': 1.2176554203033447} -11/06/2021 23:14:35 - INFO - __main__ - Step 14462: {'lr': 0.0004913052216264624, 'samples': 2776704, 'steps': 14461, 'loss/train': 1.4758261442184448} -11/06/2021 23:14:36 - INFO - __main__ - Step 14463: {'lr': 0.0004913038341995227, 'samples': 2776896, 'steps': 14462, 'loss/train': 1.7246683835983276} -11/06/2021 23:14:37 - INFO - __main__ - Step 14464: {'lr': 0.0004913024466638553, 'samples': 2777088, 'steps': 14463, 'loss/train': 1.7339403629302979} -11/06/2021 23:14:37 - INFO - __main__ - Step 14465: {'lr': 0.0004913010590194607, 'samples': 2777280, 'steps': 14464, 'loss/train': 1.6634852886199951} -11/06/2021 23:14:37 - INFO - __main__ - Step 14466: {'lr': 0.0004912996712663396, 'samples': 2777472, 'steps': 14465, 'loss/train': 1.24350106716156} -11/06/2021 23:14:38 - INFO - __main__ - Step 14467: {'lr': 0.0004912982834044924, 'samples': 2777664, 'steps': 14466, 'loss/train': 1.8824312686920166} -11/06/2021 23:14:38 - INFO - __main__ - Step 14468: {'lr': 0.0004912968954339202, 'samples': 2777856, 'steps': 14467, 'loss/train': 1.555679202079773} -11/06/2021 23:14:39 - INFO - __main__ - Step 14469: {'lr': 0.0004912955073546231, 'samples': 2778048, 'steps': 14468, 'loss/train': 1.743302345275879} -11/06/2021 23:14:40 - INFO - __main__ - Step 14470: {'lr': 0.0004912941191666021, 'samples': 2778240, 'steps': 14469, 'loss/train': 1.9434269666671753} -11/06/2021 23:14:40 - INFO - __main__ - Step 14471: {'lr': 0.0004912927308698576, 'samples': 2778432, 'steps': 14470, 'loss/train': 1.7462414503097534} -11/06/2021 23:14:40 - INFO - __main__ - Step 14472: {'lr': 0.0004912913424643904, 'samples': 2778624, 'steps': 14471, 'loss/train': 1.8691980838775635} -11/06/2021 23:14:41 - INFO - __main__ - Step 14473: {'lr': 0.0004912899539502011, 'samples': 2778816, 'steps': 14472, 'loss/train': 1.504024624824524} -11/06/2021 23:14:42 - INFO - __main__ - Step 14474: {'lr': 0.0004912885653272902, 'samples': 2779008, 'steps': 14473, 'loss/train': 0.9449915289878845} -11/06/2021 23:14:42 - INFO - __main__ - Step 14475: {'lr': 0.0004912871765956583, 'samples': 2779200, 'steps': 14474, 'loss/train': 1.7823172807693481} -11/06/2021 23:14:43 - INFO - __main__ - Step 14476: {'lr': 0.0004912857877553062, 'samples': 2779392, 'steps': 14475, 'loss/train': 1.6257444620132446} -11/06/2021 23:14:43 - INFO - __main__ - Step 14477: {'lr': 0.0004912843988062345, 'samples': 2779584, 'steps': 14476, 'loss/train': 1.8921669721603394} -11/06/2021 23:14:43 - INFO - __main__ - Step 14478: {'lr': 0.0004912830097484437, 'samples': 2779776, 'steps': 14477, 'loss/train': 1.9633761644363403} -11/06/2021 23:14:44 - INFO - __main__ - Step 14479: {'lr': 0.0004912816205819346, 'samples': 2779968, 'steps': 14478, 'loss/train': 1.5476384162902832} -11/06/2021 23:14:45 - INFO - __main__ - Step 14480: {'lr': 0.0004912802313067076, 'samples': 2780160, 'steps': 14479, 'loss/train': 1.160788893699646} -11/06/2021 23:14:45 - INFO - __main__ - Step 14481: {'lr': 0.0004912788419227635, 'samples': 2780352, 'steps': 14480, 'loss/train': 1.3065866231918335} -11/06/2021 23:14:45 - INFO - __main__ - Step 14482: {'lr': 0.000491277452430103, 'samples': 2780544, 'steps': 14481, 'loss/train': 1.6148895025253296} -11/06/2021 23:14:46 - INFO - __main__ - Step 14483: {'lr': 0.0004912760628287264, 'samples': 2780736, 'steps': 14482, 'loss/train': 0.9406113028526306} -11/06/2021 23:14:46 - INFO - __main__ - Step 14484: {'lr': 0.0004912746731186346, 'samples': 2780928, 'steps': 14483, 'loss/train': 1.4715304374694824} -11/06/2021 23:14:48 - INFO - __main__ - Step 14485: {'lr': 0.0004912732832998281, 'samples': 2781120, 'steps': 14484, 'loss/train': 1.742849349975586} -11/06/2021 23:14:48 - INFO - __main__ - Step 14486: {'lr': 0.0004912718933723077, 'samples': 2781312, 'steps': 14485, 'loss/train': 1.7313225269317627} -11/06/2021 23:14:48 - INFO - __main__ - Step 14487: {'lr': 0.0004912705033360738, 'samples': 2781504, 'steps': 14486, 'loss/train': 1.3565199375152588} -11/06/2021 23:14:49 - INFO - __main__ - Step 14488: {'lr': 0.0004912691131911272, 'samples': 2781696, 'steps': 14487, 'loss/train': 1.073344111442566} -11/06/2021 23:14:49 - INFO - __main__ - Step 14489: {'lr': 0.0004912677229374684, 'samples': 2781888, 'steps': 14488, 'loss/train': 1.5861188173294067} -11/06/2021 23:14:50 - INFO - __main__ - Step 14490: {'lr': 0.0004912663325750982, 'samples': 2782080, 'steps': 14489, 'loss/train': 1.8165336847305298} -11/06/2021 23:14:50 - INFO - __main__ - Step 14491: {'lr': 0.000491264942104017, 'samples': 2782272, 'steps': 14490, 'loss/train': 0.944426953792572} -11/06/2021 23:14:51 - INFO - __main__ - Step 14492: {'lr': 0.0004912635515242257, 'samples': 2782464, 'steps': 14491, 'loss/train': 0.730577826499939} -11/06/2021 23:14:51 - INFO - __main__ - Step 14493: {'lr': 0.0004912621608357246, 'samples': 2782656, 'steps': 14492, 'loss/train': 2.3794353008270264} -11/06/2021 23:14:52 - INFO - __main__ - Step 14494: {'lr': 0.0004912607700385146, 'samples': 2782848, 'steps': 14493, 'loss/train': 1.526907205581665} -11/06/2021 23:14:52 - INFO - __main__ - Step 14495: {'lr': 0.0004912593791325962, 'samples': 2783040, 'steps': 14494, 'loss/train': 0.6017135977745056} -11/06/2021 23:14:52 - INFO - __main__ - Step 14496: {'lr': 0.00049125798811797, 'samples': 2783232, 'steps': 14495, 'loss/train': 1.5702513456344604} -11/06/2021 23:14:53 - INFO - __main__ - Step 14497: {'lr': 0.0004912565969946367, 'samples': 2783424, 'steps': 14496, 'loss/train': 1.7380554676055908} -11/06/2021 23:14:54 - INFO - __main__ - Step 14498: {'lr': 0.0004912552057625969, 'samples': 2783616, 'steps': 14497, 'loss/train': 1.791672706604004} -11/06/2021 23:14:54 - INFO - __main__ - Step 14499: {'lr': 0.0004912538144218512, 'samples': 2783808, 'steps': 14498, 'loss/train': 1.8101961612701416} -11/06/2021 23:14:54 - INFO - __main__ - Step 14500: {'lr': 0.0004912524229724002, 'samples': 2784000, 'steps': 14499, 'loss/train': 1.174378752708435} -11/06/2021 23:14:55 - INFO - __main__ - Step 14501: {'lr': 0.0004912510314142447, 'samples': 2784192, 'steps': 14500, 'loss/train': 1.9984477758407593} -11/06/2021 23:14:56 - INFO - __main__ - Step 14502: {'lr': 0.0004912496397473852, 'samples': 2784384, 'steps': 14501, 'loss/train': 2.0241353511810303} -11/06/2021 23:14:56 - INFO - __main__ - Step 14503: {'lr': 0.0004912482479718223, 'samples': 2784576, 'steps': 14502, 'loss/train': 1.441446304321289} -11/06/2021 23:14:56 - INFO - __main__ - Step 14504: {'lr': 0.0004912468560875566, 'samples': 2784768, 'steps': 14503, 'loss/train': 1.7977668046951294} -11/06/2021 23:14:57 - INFO - __main__ - Step 14505: {'lr': 0.0004912454640945889, 'samples': 2784960, 'steps': 14504, 'loss/train': 1.8055917024612427} -11/06/2021 23:14:57 - INFO - __main__ - Step 14506: {'lr': 0.0004912440719929196, 'samples': 2785152, 'steps': 14505, 'loss/train': 1.3446134328842163} -11/06/2021 23:14:58 - INFO - __main__ - Step 14507: {'lr': 0.0004912426797825495, 'samples': 2785344, 'steps': 14506, 'loss/train': 1.7469252347946167} -11/06/2021 23:14:59 - INFO - __main__ - Step 14508: {'lr': 0.0004912412874634792, 'samples': 2785536, 'steps': 14507, 'loss/train': 1.3988752365112305} -11/06/2021 23:14:59 - INFO - __main__ - Step 14509: {'lr': 0.0004912398950357094, 'samples': 2785728, 'steps': 14508, 'loss/train': 2.2110788822174072} -11/06/2021 23:14:59 - INFO - __main__ - Step 14510: {'lr': 0.0004912385024992404, 'samples': 2785920, 'steps': 14509, 'loss/train': 1.4885571002960205} -11/06/2021 23:15:00 - INFO - __main__ - Step 14511: {'lr': 0.0004912371098540733, 'samples': 2786112, 'steps': 14510, 'loss/train': 2.1764931678771973} -11/06/2021 23:15:01 - INFO - __main__ - Step 14512: {'lr': 0.0004912357171002082, 'samples': 2786304, 'steps': 14511, 'loss/train': 1.1966614723205566} -11/06/2021 23:15:01 - INFO - __main__ - Step 14513: {'lr': 0.0004912343242376462, 'samples': 2786496, 'steps': 14512, 'loss/train': 1.392907738685608} -11/06/2021 23:15:01 - INFO - __main__ - Step 14514: {'lr': 0.0004912329312663877, 'samples': 2786688, 'steps': 14513, 'loss/train': 1.479630947113037} -11/06/2021 23:15:02 - INFO - __main__ - Step 14515: {'lr': 0.0004912315381864333, 'samples': 2786880, 'steps': 14514, 'loss/train': 1.7795805931091309} -11/06/2021 23:15:02 - INFO - __main__ - Step 14516: {'lr': 0.0004912301449977837, 'samples': 2787072, 'steps': 14515, 'loss/train': 1.7214689254760742} -11/06/2021 23:15:02 - INFO - __main__ - Step 14517: {'lr': 0.0004912287517004397, 'samples': 2787264, 'steps': 14516, 'loss/train': 1.5596206188201904} -11/06/2021 23:15:03 - INFO - __main__ - Step 14518: {'lr': 0.0004912273582944015, 'samples': 2787456, 'steps': 14517, 'loss/train': 1.3602560758590698} -11/06/2021 23:15:04 - INFO - __main__ - Step 14519: {'lr': 0.0004912259647796701, 'samples': 2787648, 'steps': 14518, 'loss/train': 1.7231316566467285} -11/06/2021 23:15:04 - INFO - __main__ - Step 14520: {'lr': 0.000491224571156246, 'samples': 2787840, 'steps': 14519, 'loss/train': 1.2232226133346558} -11/06/2021 23:15:05 - INFO - __main__ - Step 14521: {'lr': 0.0004912231774241298, 'samples': 2788032, 'steps': 14520, 'loss/train': 1.797451138496399} -11/06/2021 23:15:05 - INFO - __main__ - Step 14522: {'lr': 0.0004912217835833222, 'samples': 2788224, 'steps': 14521, 'loss/train': 0.9428983926773071} -11/06/2021 23:15:06 - INFO - __main__ - Step 14523: {'lr': 0.0004912203896338238, 'samples': 2788416, 'steps': 14522, 'loss/train': 1.4348275661468506} -11/06/2021 23:15:06 - INFO - __main__ - Step 14524: {'lr': 0.0004912189955756351, 'samples': 2788608, 'steps': 14523, 'loss/train': 1.5228583812713623} -11/06/2021 23:15:07 - INFO - __main__ - Step 14525: {'lr': 0.000491217601408757, 'samples': 2788800, 'steps': 14524, 'loss/train': 1.8126468658447266} -11/06/2021 23:15:07 - INFO - __main__ - Step 14526: {'lr': 0.0004912162071331898, 'samples': 2788992, 'steps': 14525, 'loss/train': 1.6764172315597534} -11/06/2021 23:15:07 - INFO - __main__ - Step 14527: {'lr': 0.0004912148127489345, 'samples': 2789184, 'steps': 14526, 'loss/train': 1.4271752834320068} -11/06/2021 23:15:08 - INFO - __main__ - Step 14528: {'lr': 0.0004912134182559913, 'samples': 2789376, 'steps': 14527, 'loss/train': 1.7659759521484375} -11/06/2021 23:15:09 - INFO - __main__ - Step 14529: {'lr': 0.0004912120236543611, 'samples': 2789568, 'steps': 14528, 'loss/train': 1.7609317302703857} -11/06/2021 23:15:09 - INFO - __main__ - Step 14530: {'lr': 0.0004912106289440446, 'samples': 2789760, 'steps': 14529, 'loss/train': 1.904273271560669} -11/06/2021 23:15:09 - INFO - __main__ - Step 14531: {'lr': 0.0004912092341250422, 'samples': 2789952, 'steps': 14530, 'loss/train': 1.7561595439910889} -11/06/2021 23:15:10 - INFO - __main__ - Step 14532: {'lr': 0.0004912078391973547, 'samples': 2790144, 'steps': 14531, 'loss/train': 1.3714295625686646} -11/06/2021 23:15:11 - INFO - __main__ - Step 14533: {'lr': 0.0004912064441609827, 'samples': 2790336, 'steps': 14532, 'loss/train': 1.4325453042984009} -11/06/2021 23:15:11 - INFO - __main__ - Step 14534: {'lr': 0.0004912050490159268, 'samples': 2790528, 'steps': 14533, 'loss/train': 1.7847373485565186} -11/06/2021 23:15:11 - INFO - __main__ - Step 14535: {'lr': 0.0004912036537621877, 'samples': 2790720, 'steps': 14534, 'loss/train': 2.0088417530059814} -11/06/2021 23:15:12 - INFO - __main__ - Step 14536: {'lr': 0.0004912022583997658, 'samples': 2790912, 'steps': 14535, 'loss/train': 1.3345286846160889} -11/06/2021 23:15:12 - INFO - __main__ - Step 14537: {'lr': 0.0004912008629286619, 'samples': 2791104, 'steps': 14536, 'loss/train': 1.6118730306625366} -11/06/2021 23:15:12 - INFO - __main__ - Step 14538: {'lr': 0.0004911994673488766, 'samples': 2791296, 'steps': 14537, 'loss/train': 1.377058982849121} -11/06/2021 23:15:14 - INFO - __main__ - Step 14539: {'lr': 0.0004911980716604107, 'samples': 2791488, 'steps': 14538, 'loss/train': 1.6407101154327393} -11/06/2021 23:15:14 - INFO - __main__ - Step 14540: {'lr': 0.0004911966758632645, 'samples': 2791680, 'steps': 14539, 'loss/train': 1.8519309759140015} -11/06/2021 23:15:14 - INFO - __main__ - Step 14541: {'lr': 0.000491195279957439, 'samples': 2791872, 'steps': 14540, 'loss/train': 1.6462745666503906} -11/06/2021 23:15:15 - INFO - __main__ - Step 14542: {'lr': 0.0004911938839429344, 'samples': 2792064, 'steps': 14541, 'loss/train': 1.8177210092544556} -11/06/2021 23:15:15 - INFO - __main__ - Step 14543: {'lr': 0.0004911924878197517, 'samples': 2792256, 'steps': 14542, 'loss/train': 2.063103437423706} -11/06/2021 23:15:16 - INFO - __main__ - Step 14544: {'lr': 0.0004911910915878913, 'samples': 2792448, 'steps': 14543, 'loss/train': 2.019076347351074} -11/06/2021 23:15:16 - INFO - __main__ - Step 14545: {'lr': 0.000491189695247354, 'samples': 2792640, 'steps': 14544, 'loss/train': 1.723437786102295} -11/06/2021 23:15:17 - INFO - __main__ - Step 14546: {'lr': 0.0004911882987981404, 'samples': 2792832, 'steps': 14545, 'loss/train': 1.8162659406661987} -11/06/2021 23:15:17 - INFO - __main__ - Step 14547: {'lr': 0.0004911869022402508, 'samples': 2793024, 'steps': 14546, 'loss/train': 1.8774888515472412} -11/06/2021 23:15:17 - INFO - __main__ - Step 14548: {'lr': 0.0004911855055736863, 'samples': 2793216, 'steps': 14547, 'loss/train': 1.6280256509780884} -11/06/2021 23:15:18 - INFO - __main__ - Step 14549: {'lr': 0.0004911841087984473, 'samples': 2793408, 'steps': 14548, 'loss/train': 1.9488242864608765} -11/06/2021 23:15:19 - INFO - __main__ - Step 14550: {'lr': 0.0004911827119145345, 'samples': 2793600, 'steps': 14549, 'loss/train': 2.1403818130493164} -11/06/2021 23:15:19 - INFO - __main__ - Step 14551: {'lr': 0.0004911813149219485, 'samples': 2793792, 'steps': 14550, 'loss/train': 1.7999236583709717} -11/06/2021 23:15:19 - INFO - __main__ - Step 14552: {'lr': 0.0004911799178206899, 'samples': 2793984, 'steps': 14551, 'loss/train': 1.94169020652771} -11/06/2021 23:15:20 - INFO - __main__ - Step 14553: {'lr': 0.0004911785206107592, 'samples': 2794176, 'steps': 14552, 'loss/train': 1.5757359266281128} -11/06/2021 23:15:21 - INFO - __main__ - Step 14554: {'lr': 0.0004911771232921575, 'samples': 2794368, 'steps': 14553, 'loss/train': 1.7550246715545654} -11/06/2021 23:15:21 - INFO - __main__ - Step 14555: {'lr': 0.0004911757258648849, 'samples': 2794560, 'steps': 14554, 'loss/train': 1.0412113666534424} -11/06/2021 23:15:22 - INFO - __main__ - Step 14556: {'lr': 0.0004911743283289423, 'samples': 2794752, 'steps': 14555, 'loss/train': 1.524915337562561} -11/06/2021 23:15:22 - INFO - __main__ - Step 14557: {'lr': 0.0004911729306843302, 'samples': 2794944, 'steps': 14556, 'loss/train': 1.9681403636932373} -11/06/2021 23:15:23 - INFO - __main__ - Step 14558: {'lr': 0.0004911715329310493, 'samples': 2795136, 'steps': 14557, 'loss/train': 1.4831455945968628} -11/06/2021 23:15:23 - INFO - __main__ - Step 14559: {'lr': 0.0004911701350691002, 'samples': 2795328, 'steps': 14558, 'loss/train': 0.9031453132629395} -11/06/2021 23:15:24 - INFO - __main__ - Step 14560: {'lr': 0.0004911687370984836, 'samples': 2795520, 'steps': 14559, 'loss/train': 1.7917287349700928} -11/06/2021 23:15:24 - INFO - __main__ - Step 14561: {'lr': 0.0004911673390192002, 'samples': 2795712, 'steps': 14560, 'loss/train': 1.3398245573043823} -11/06/2021 23:15:25 - INFO - __main__ - Step 14562: {'lr': 0.0004911659408312505, 'samples': 2795904, 'steps': 14561, 'loss/train': 1.7333766222000122} -11/06/2021 23:15:25 - INFO - __main__ - Step 14563: {'lr': 0.000491164542534635, 'samples': 2796096, 'steps': 14562, 'loss/train': 1.9331468343734741} -11/06/2021 23:15:25 - INFO - __main__ - Step 14564: {'lr': 0.0004911631441293546, 'samples': 2796288, 'steps': 14563, 'loss/train': 1.3357164859771729} -11/06/2021 23:15:26 - INFO - __main__ - Step 14565: {'lr': 0.0004911617456154097, 'samples': 2796480, 'steps': 14564, 'loss/train': 1.6416891813278198} -11/06/2021 23:15:27 - INFO - __main__ - Step 14566: {'lr': 0.0004911603469928012, 'samples': 2796672, 'steps': 14565, 'loss/train': 2.241854667663574} -11/06/2021 23:15:27 - INFO - __main__ - Step 14567: {'lr': 0.0004911589482615294, 'samples': 2796864, 'steps': 14566, 'loss/train': 0.8703035116195679} -11/06/2021 23:15:27 - INFO - __main__ - Step 14568: {'lr': 0.0004911575494215952, 'samples': 2797056, 'steps': 14567, 'loss/train': 1.3895127773284912} -11/06/2021 23:15:28 - INFO - __main__ - Step 14569: {'lr': 0.0004911561504729992, 'samples': 2797248, 'steps': 14568, 'loss/train': 3.218695878982544} -11/06/2021 23:15:28 - INFO - __main__ - Step 14570: {'lr': 0.0004911547514157417, 'samples': 2797440, 'steps': 14569, 'loss/train': 1.9162862300872803} -11/06/2021 23:15:29 - INFO - __main__ - Step 14571: {'lr': 0.0004911533522498239, 'samples': 2797632, 'steps': 14570, 'loss/train': 1.7870599031448364} -11/06/2021 23:15:29 - INFO - __main__ - Step 14572: {'lr': 0.0004911519529752459, 'samples': 2797824, 'steps': 14571, 'loss/train': 2.2179548740386963} -11/06/2021 23:15:30 - INFO - __main__ - Step 14573: {'lr': 0.0004911505535920086, 'samples': 2798016, 'steps': 14572, 'loss/train': 1.6157692670822144} -11/06/2021 23:15:30 - INFO - __main__ - Step 14574: {'lr': 0.0004911491541001126, 'samples': 2798208, 'steps': 14573, 'loss/train': 1.6204320192337036} -11/06/2021 23:15:30 - INFO - __main__ - Step 14575: {'lr': 0.0004911477544995585, 'samples': 2798400, 'steps': 14574, 'loss/train': 1.705611228942871} -11/06/2021 23:15:31 - INFO - __main__ - Step 14576: {'lr': 0.000491146354790347, 'samples': 2798592, 'steps': 14575, 'loss/train': 1.5545910596847534} -11/06/2021 23:15:32 - INFO - __main__ - Step 14577: {'lr': 0.0004911449549724786, 'samples': 2798784, 'steps': 14576, 'loss/train': 1.5566593408584595} -11/06/2021 23:15:32 - INFO - __main__ - Step 14578: {'lr': 0.0004911435550459541, 'samples': 2798976, 'steps': 14577, 'loss/train': 2.1471126079559326} -11/06/2021 23:15:32 - INFO - __main__ - Step 14579: {'lr': 0.0004911421550107739, 'samples': 2799168, 'steps': 14578, 'loss/train': 1.5826555490493774} -11/06/2021 23:15:33 - INFO - __main__ - Step 14580: {'lr': 0.0004911407548669389, 'samples': 2799360, 'steps': 14579, 'loss/train': 1.8544542789459229} -11/06/2021 23:15:34 - INFO - __main__ - Step 14581: {'lr': 0.0004911393546144495, 'samples': 2799552, 'steps': 14580, 'loss/train': 1.4082012176513672} -11/06/2021 23:15:34 - INFO - __main__ - Step 14582: {'lr': 0.0004911379542533065, 'samples': 2799744, 'steps': 14581, 'loss/train': 1.3058255910873413} -11/06/2021 23:15:35 - INFO - __main__ - Step 14583: {'lr': 0.0004911365537835105, 'samples': 2799936, 'steps': 14582, 'loss/train': 0.7232246398925781} -11/06/2021 23:15:35 - INFO - __main__ - Step 14584: {'lr': 0.000491135153205062, 'samples': 2800128, 'steps': 14583, 'loss/train': 1.6225132942199707} -11/06/2021 23:15:35 - INFO - __main__ - Step 14585: {'lr': 0.0004911337525179616, 'samples': 2800320, 'steps': 14584, 'loss/train': 1.6813801527023315} -11/06/2021 23:15:36 - INFO - __main__ - Step 14586: {'lr': 0.0004911323517222103, 'samples': 2800512, 'steps': 14585, 'loss/train': 1.8164918422698975} -11/06/2021 23:15:37 - INFO - __main__ - Step 14587: {'lr': 0.0004911309508178084, 'samples': 2800704, 'steps': 14586, 'loss/train': 1.225614309310913} -11/06/2021 23:15:37 - INFO - __main__ - Step 14588: {'lr': 0.0004911295498047565, 'samples': 2800896, 'steps': 14587, 'loss/train': 2.0302164554595947} -11/06/2021 23:15:37 - INFO - __main__ - Step 14589: {'lr': 0.0004911281486830554, 'samples': 2801088, 'steps': 14588, 'loss/train': 1.7795565128326416} -11/06/2021 23:15:38 - INFO - __main__ - Step 14590: {'lr': 0.0004911267474527058, 'samples': 2801280, 'steps': 14589, 'loss/train': 1.4832676649093628} -11/06/2021 23:15:39 - INFO - __main__ - Step 14591: {'lr': 0.000491125346113708, 'samples': 2801472, 'steps': 14590, 'loss/train': 1.647063136100769} -11/06/2021 23:15:39 - INFO - __main__ - Step 14592: {'lr': 0.000491123944666063, 'samples': 2801664, 'steps': 14591, 'loss/train': 1.9390480518341064} -11/06/2021 23:15:39 - INFO - __main__ - Step 14593: {'lr': 0.0004911225431097712, 'samples': 2801856, 'steps': 14592, 'loss/train': 1.7286971807479858} -11/06/2021 23:15:40 - INFO - __main__ - Step 14594: {'lr': 0.0004911211414448333, 'samples': 2802048, 'steps': 14593, 'loss/train': 1.6285250186920166} -11/06/2021 23:15:40 - INFO - __main__ - Step 14595: {'lr': 0.0004911197396712501, 'samples': 2802240, 'steps': 14594, 'loss/train': 1.946718692779541} -11/06/2021 23:15:41 - INFO - __main__ - Step 14596: {'lr': 0.0004911183377890218, 'samples': 2802432, 'steps': 14595, 'loss/train': 1.3001048564910889} -11/06/2021 23:15:42 - INFO - __main__ - Step 14597: {'lr': 0.0004911169357981496, 'samples': 2802624, 'steps': 14596, 'loss/train': 1.6624016761779785} -11/06/2021 23:15:42 - INFO - __main__ - Step 14598: {'lr': 0.0004911155336986335, 'samples': 2802816, 'steps': 14597, 'loss/train': 2.089146614074707} -11/06/2021 23:15:42 - INFO - __main__ - Step 14599: {'lr': 0.0004911141314904747, 'samples': 2803008, 'steps': 14598, 'loss/train': 1.3329648971557617} -11/06/2021 23:15:43 - INFO - __main__ - Step 14600: {'lr': 0.0004911127291736735, 'samples': 2803200, 'steps': 14599, 'loss/train': 1.4260157346725464} -11/06/2021 23:15:43 - INFO - __main__ - Step 14601: {'lr': 0.0004911113267482307, 'samples': 2803392, 'steps': 14600, 'loss/train': 1.7082431316375732} -11/06/2021 23:15:44 - INFO - __main__ - Step 14602: {'lr': 0.0004911099242141467, 'samples': 2803584, 'steps': 14601, 'loss/train': 1.4876233339309692} -11/06/2021 23:15:44 - INFO - __main__ - Step 14603: {'lr': 0.0004911085215714224, 'samples': 2803776, 'steps': 14602, 'loss/train': 1.9533902406692505} -11/06/2021 23:15:45 - INFO - __main__ - Step 14604: {'lr': 0.0004911071188200584, 'samples': 2803968, 'steps': 14603, 'loss/train': 2.090561866760254} -11/06/2021 23:15:45 - INFO - __main__ - Step 14605: {'lr': 0.0004911057159600551, 'samples': 2804160, 'steps': 14604, 'loss/train': 1.5187530517578125} -11/06/2021 23:15:45 - INFO - __main__ - Step 14606: {'lr': 0.0004911043129914133, 'samples': 2804352, 'steps': 14605, 'loss/train': 0.9737354516983032} -11/06/2021 23:15:46 - INFO - __main__ - Step 14607: {'lr': 0.0004911029099141336, 'samples': 2804544, 'steps': 14606, 'loss/train': 1.8305327892303467} -11/06/2021 23:15:47 - INFO - __main__ - Step 14608: {'lr': 0.0004911015067282168, 'samples': 2804736, 'steps': 14607, 'loss/train': 1.8033746480941772} -11/06/2021 23:15:47 - INFO - __main__ - Step 14609: {'lr': 0.0004911001034336633, 'samples': 2804928, 'steps': 14608, 'loss/train': 1.6968247890472412} -11/06/2021 23:15:47 - INFO - __main__ - Step 14610: {'lr': 0.0004910987000304737, 'samples': 2805120, 'steps': 14609, 'loss/train': 1.5940757989883423} -11/06/2021 23:15:48 - INFO - __main__ - Step 14611: {'lr': 0.0004910972965186488, 'samples': 2805312, 'steps': 14610, 'loss/train': 1.7843865156173706} -11/06/2021 23:15:48 - INFO - __main__ - Step 14612: {'lr': 0.0004910958928981893, 'samples': 2805504, 'steps': 14611, 'loss/train': 1.8916642665863037} -11/06/2021 23:15:49 - INFO - __main__ - Step 14613: {'lr': 0.0004910944891690956, 'samples': 2805696, 'steps': 14612, 'loss/train': 1.5665946006774902} -11/06/2021 23:15:49 - INFO - __main__ - Step 14614: {'lr': 0.0004910930853313686, 'samples': 2805888, 'steps': 14613, 'loss/train': 1.1098638772964478} -11/06/2021 23:15:50 - INFO - __main__ - Step 14615: {'lr': 0.0004910916813850086, 'samples': 2806080, 'steps': 14614, 'loss/train': 1.3663274049758911} -11/06/2021 23:15:50 - INFO - __main__ - Step 14616: {'lr': 0.0004910902773300164, 'samples': 2806272, 'steps': 14615, 'loss/train': 1.2368197441101074} -11/06/2021 23:15:51 - INFO - __main__ - Step 14617: {'lr': 0.0004910888731663928, 'samples': 2806464, 'steps': 14616, 'loss/train': 1.519328236579895} -11/06/2021 23:15:52 - INFO - __main__ - Step 14618: {'lr': 0.0004910874688941381, 'samples': 2806656, 'steps': 14617, 'loss/train': 1.4356929063796997} -11/06/2021 23:15:52 - INFO - __main__ - Step 14619: {'lr': 0.0004910860645132532, 'samples': 2806848, 'steps': 14618, 'loss/train': 1.3084660768508911} -11/06/2021 23:15:52 - INFO - __main__ - Step 14620: {'lr': 0.0004910846600237386, 'samples': 2807040, 'steps': 14619, 'loss/train': 1.374779224395752} -11/06/2021 23:15:53 - INFO - __main__ - Step 14621: {'lr': 0.0004910832554255951, 'samples': 2807232, 'steps': 14620, 'loss/train': 1.7540532350540161} -11/06/2021 23:15:53 - INFO - __main__ - Step 14622: {'lr': 0.0004910818507188231, 'samples': 2807424, 'steps': 14621, 'loss/train': 1.5536149740219116} -11/06/2021 23:15:54 - INFO - __main__ - Step 14623: {'lr': 0.0004910804459034233, 'samples': 2807616, 'steps': 14622, 'loss/train': 1.8700112104415894} -11/06/2021 23:15:55 - INFO - __main__ - Step 14624: {'lr': 0.0004910790409793965, 'samples': 2807808, 'steps': 14623, 'loss/train': 1.8716275691986084} -11/06/2021 23:15:55 - INFO - __main__ - Step 14625: {'lr': 0.000491077635946743, 'samples': 2808000, 'steps': 14624, 'loss/train': 1.835631012916565} -11/06/2021 23:15:55 - INFO - __main__ - Step 14626: {'lr': 0.0004910762308054638, 'samples': 2808192, 'steps': 14625, 'loss/train': 1.5419883728027344} -11/06/2021 23:15:56 - INFO - __main__ - Step 14627: {'lr': 0.0004910748255555593, 'samples': 2808384, 'steps': 14626, 'loss/train': 0.7711548805236816} -11/06/2021 23:15:56 - INFO - __main__ - Step 14628: {'lr': 0.0004910734201970302, 'samples': 2808576, 'steps': 14627, 'loss/train': 1.3061710596084595} -11/06/2021 23:15:57 - INFO - __main__ - Step 14629: {'lr': 0.0004910720147298772, 'samples': 2808768, 'steps': 14628, 'loss/train': 1.5132771730422974} -11/06/2021 23:15:58 - INFO - __main__ - Step 14630: {'lr': 0.0004910706091541009, 'samples': 2808960, 'steps': 14629, 'loss/train': 1.1088963747024536} -11/06/2021 23:15:58 - INFO - __main__ - Step 14631: {'lr': 0.0004910692034697018, 'samples': 2809152, 'steps': 14630, 'loss/train': 1.5924564599990845} -11/06/2021 23:15:58 - INFO - __main__ - Step 14632: {'lr': 0.0004910677976766807, 'samples': 2809344, 'steps': 14631, 'loss/train': 1.2352012395858765} -11/06/2021 23:15:59 - INFO - __main__ - Step 14633: {'lr': 0.0004910663917750382, 'samples': 2809536, 'steps': 14632, 'loss/train': 1.8392850160598755} -11/06/2021 23:15:59 - INFO - __main__ - Step 14634: {'lr': 0.0004910649857647748, 'samples': 2809728, 'steps': 14633, 'loss/train': 1.6638622283935547} -11/06/2021 23:16:00 - INFO - __main__ - Step 14635: {'lr': 0.0004910635796458913, 'samples': 2809920, 'steps': 14634, 'loss/train': 2.037661075592041} -11/06/2021 23:16:00 - INFO - __main__ - Step 14636: {'lr': 0.0004910621734183882, 'samples': 2810112, 'steps': 14635, 'loss/train': 0.8195475935935974} -11/06/2021 23:16:01 - INFO - __main__ - Step 14637: {'lr': 0.0004910607670822663, 'samples': 2810304, 'steps': 14636, 'loss/train': 1.5160691738128662} -11/06/2021 23:16:01 - INFO - __main__ - Step 14638: {'lr': 0.0004910593606375261, 'samples': 2810496, 'steps': 14637, 'loss/train': 2.147937297821045} -11/06/2021 23:16:02 - INFO - __main__ - Step 14639: {'lr': 0.0004910579540841683, 'samples': 2810688, 'steps': 14638, 'loss/train': 0.8111184239387512} -11/06/2021 23:16:03 - INFO - __main__ - Step 14640: {'lr': 0.0004910565474221934, 'samples': 2810880, 'steps': 14639, 'loss/train': 1.6241923570632935} -11/06/2021 23:16:03 - INFO - __main__ - Step 14641: {'lr': 0.0004910551406516022, 'samples': 2811072, 'steps': 14640, 'loss/train': 2.166555404663086} -11/06/2021 23:16:03 - INFO - __main__ - Step 14642: {'lr': 0.0004910537337723954, 'samples': 2811264, 'steps': 14641, 'loss/train': 1.8136534690856934} -11/06/2021 23:16:04 - INFO - __main__ - Step 14643: {'lr': 0.0004910523267845733, 'samples': 2811456, 'steps': 14642, 'loss/train': 1.5173137187957764} -11/06/2021 23:16:04 - INFO - __main__ - Step 14644: {'lr': 0.0004910509196881369, 'samples': 2811648, 'steps': 14643, 'loss/train': 1.1134371757507324} -11/06/2021 23:16:05 - INFO - __main__ - Step 14645: {'lr': 0.0004910495124830866, 'samples': 2811840, 'steps': 14644, 'loss/train': 1.4934502840042114} -11/06/2021 23:16:05 - INFO - __main__ - Step 14646: {'lr': 0.0004910481051694231, 'samples': 2812032, 'steps': 14645, 'loss/train': 1.9416497945785522} -11/06/2021 23:16:06 - INFO - __main__ - Step 14647: {'lr': 0.0004910466977471471, 'samples': 2812224, 'steps': 14646, 'loss/train': 1.6827425956726074} -11/06/2021 23:16:06 - INFO - __main__ - Step 14648: {'lr': 0.0004910452902162592, 'samples': 2812416, 'steps': 14647, 'loss/train': 1.602482795715332} -11/06/2021 23:16:06 - INFO - __main__ - Step 14649: {'lr': 0.0004910438825767599, 'samples': 2812608, 'steps': 14648, 'loss/train': 1.5670403242111206} -11/06/2021 23:16:08 - INFO - __main__ - Step 14650: {'lr': 0.00049104247482865, 'samples': 2812800, 'steps': 14649, 'loss/train': 1.4646493196487427} -11/06/2021 23:16:08 - INFO - __main__ - Step 14651: {'lr': 0.0004910410669719301, 'samples': 2812992, 'steps': 14650, 'loss/train': 1.5942716598510742} -11/06/2021 23:16:08 - INFO - __main__ - Step 14652: {'lr': 0.0004910396590066008, 'samples': 2813184, 'steps': 14651, 'loss/train': 1.6040905714035034} -11/06/2021 23:16:09 - INFO - __main__ - Step 14653: {'lr': 0.0004910382509326627, 'samples': 2813376, 'steps': 14652, 'loss/train': 2.0839693546295166} -11/06/2021 23:16:09 - INFO - __main__ - Step 14654: {'lr': 0.0004910368427501166, 'samples': 2813568, 'steps': 14653, 'loss/train': 1.966593861579895} -11/06/2021 23:16:10 - INFO - __main__ - Step 14655: {'lr': 0.000491035434458963, 'samples': 2813760, 'steps': 14654, 'loss/train': 2.07354998588562} -11/06/2021 23:16:10 - INFO - __main__ - Step 14656: {'lr': 0.0004910340260592024, 'samples': 2813952, 'steps': 14655, 'loss/train': 1.6633130311965942} -11/06/2021 23:16:11 - INFO - __main__ - Step 14657: {'lr': 0.0004910326175508357, 'samples': 2814144, 'steps': 14656, 'loss/train': 2.252934694290161} -11/06/2021 23:16:11 - INFO - __main__ - Step 14658: {'lr': 0.0004910312089338634, 'samples': 2814336, 'steps': 14657, 'loss/train': 1.369263768196106} -11/06/2021 23:16:11 - INFO - __main__ - Step 14659: {'lr': 0.0004910298002082863, 'samples': 2814528, 'steps': 14658, 'loss/train': 1.274910807609558} -11/06/2021 23:16:12 - INFO - __main__ - Step 14660: {'lr': 0.0004910283913741047, 'samples': 2814720, 'steps': 14659, 'loss/train': 1.555715560913086} -11/06/2021 23:16:13 - INFO - __main__ - Step 14661: {'lr': 0.0004910269824313194, 'samples': 2814912, 'steps': 14660, 'loss/train': 1.4081352949142456} -11/06/2021 23:16:13 - INFO - __main__ - Step 14662: {'lr': 0.0004910255733799312, 'samples': 2815104, 'steps': 14661, 'loss/train': 1.7849104404449463} -11/06/2021 23:16:13 - INFO - __main__ - Step 14663: {'lr': 0.0004910241642199406, 'samples': 2815296, 'steps': 14662, 'loss/train': 1.4840021133422852} -11/06/2021 23:16:14 - INFO - __main__ - Step 14664: {'lr': 0.0004910227549513481, 'samples': 2815488, 'steps': 14663, 'loss/train': 1.7678169012069702} -11/06/2021 23:16:14 - INFO - __main__ - Step 14665: {'lr': 0.0004910213455741546, 'samples': 2815680, 'steps': 14664, 'loss/train': 1.6775918006896973} -11/06/2021 23:16:15 - INFO - __main__ - Step 14666: {'lr': 0.0004910199360883605, 'samples': 2815872, 'steps': 14665, 'loss/train': 1.950029969215393} -11/06/2021 23:16:16 - INFO - __main__ - Step 14667: {'lr': 0.0004910185264939667, 'samples': 2816064, 'steps': 14666, 'loss/train': 1.7304264307022095} -11/06/2021 23:16:16 - INFO - __main__ - Step 14668: {'lr': 0.0004910171167909734, 'samples': 2816256, 'steps': 14667, 'loss/train': 1.4172935485839844} -11/06/2021 23:16:16 - INFO - __main__ - Step 14669: {'lr': 0.0004910157069793816, 'samples': 2816448, 'steps': 14668, 'loss/train': 1.8779479265213013} -11/06/2021 23:16:17 - INFO - __main__ - Step 14670: {'lr': 0.000491014297059192, 'samples': 2816640, 'steps': 14669, 'loss/train': 1.943215012550354} -11/06/2021 23:16:18 - INFO - __main__ - Step 14671: {'lr': 0.000491012887030405, 'samples': 2816832, 'steps': 14670, 'loss/train': 1.6946277618408203} -11/06/2021 23:16:18 - INFO - __main__ - Step 14672: {'lr': 0.0004910114768930212, 'samples': 2817024, 'steps': 14671, 'loss/train': 1.4919730424880981} -11/06/2021 23:16:18 - INFO - __main__ - Step 14673: {'lr': 0.0004910100666470415, 'samples': 2817216, 'steps': 14672, 'loss/train': 1.942678689956665} -11/06/2021 23:16:19 - INFO - __main__ - Step 14674: {'lr': 0.0004910086562924663, 'samples': 2817408, 'steps': 14673, 'loss/train': 1.5062963962554932} -11/06/2021 23:16:19 - INFO - __main__ - Step 14675: {'lr': 0.0004910072458292963, 'samples': 2817600, 'steps': 14674, 'loss/train': 1.1559689044952393} -11/06/2021 23:16:20 - INFO - __main__ - Step 14676: {'lr': 0.0004910058352575322, 'samples': 2817792, 'steps': 14675, 'loss/train': 1.5200366973876953} -11/06/2021 23:16:20 - INFO - __main__ - Step 14677: {'lr': 0.0004910044245771745, 'samples': 2817984, 'steps': 14676, 'loss/train': 1.2778904438018799} -11/06/2021 23:16:21 - INFO - __main__ - Step 14678: {'lr': 0.0004910030137882241, 'samples': 2818176, 'steps': 14677, 'loss/train': 2.667948007583618} -11/06/2021 23:16:21 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 2.185955047607422} -11/06/2021 23:16:22 - INFO - __main__ - Step 14680: {'lr': 0.000491000191884547, 'samples': 2818560, 'steps': 14679, 'loss/train': 1.723203420639038} -11/06/2021 23:16:23 - INFO - __main__ - Step 14681: {'lr': 0.0004909987807698217, 'samples': 2818752, 'steps': 14680, 'loss/train': 1.139530062675476} -11/06/2021 23:16:23 - INFO - __main__ - Step 14682: {'lr': 0.000490997369546506, 'samples': 2818944, 'steps': 14681, 'loss/train': 1.7487425804138184} -11/06/2021 23:16:23 - INFO - __main__ - Step 14683: {'lr': 0.0004909959582146007, 'samples': 2819136, 'steps': 14682, 'loss/train': 1.6787686347961426} -11/06/2021 23:16:24 - INFO - __main__ - Step 14684: {'lr': 0.0004909945467741063, 'samples': 2819328, 'steps': 14683, 'loss/train': 1.1271356344223022} -11/06/2021 23:16:24 - INFO - __main__ - Step 14685: {'lr': 0.0004909931352250235, 'samples': 2819520, 'steps': 14684, 'loss/train': 3.540257453918457} -11/06/2021 23:16:24 - INFO - __main__ - Step 14686: {'lr': 0.0004909917235673529, 'samples': 2819712, 'steps': 14685, 'loss/train': 1.8830620050430298} -11/06/2021 23:16:25 - INFO - __main__ - Step 14687: {'lr': 0.0004909903118010951, 'samples': 2819904, 'steps': 14686, 'loss/train': 1.717665433883667} -11/06/2021 23:16:26 - INFO - __main__ - Step 14688: {'lr': 0.0004909888999262509, 'samples': 2820096, 'steps': 14687, 'loss/train': 0.35629066824913025} -11/06/2021 23:16:26 - INFO - __main__ - Step 14689: {'lr': 0.0004909874879428207, 'samples': 2820288, 'steps': 14688, 'loss/train': 1.5923266410827637} -11/06/2021 23:16:26 - INFO - __main__ - Step 14690: {'lr': 0.0004909860758508052, 'samples': 2820480, 'steps': 14689, 'loss/train': 1.798073172569275} -11/06/2021 23:16:27 - INFO - __main__ - Step 14691: {'lr': 0.0004909846636502053, 'samples': 2820672, 'steps': 14690, 'loss/train': 1.2456002235412598} -11/06/2021 23:16:28 - INFO - __main__ - Step 14692: {'lr': 0.0004909832513410213, 'samples': 2820864, 'steps': 14691, 'loss/train': 1.8775510787963867} -11/06/2021 23:16:28 - INFO - __main__ - Step 14693: {'lr': 0.000490981838923254, 'samples': 2821056, 'steps': 14692, 'loss/train': 2.1554715633392334} -11/06/2021 23:16:29 - INFO - __main__ - Step 14694: {'lr': 0.000490980426396904, 'samples': 2821248, 'steps': 14693, 'loss/train': 1.8785821199417114} -11/06/2021 23:16:29 - INFO - __main__ - Step 14695: {'lr': 0.0004909790137619719, 'samples': 2821440, 'steps': 14694, 'loss/train': 1.473230242729187} -11/06/2021 23:16:29 - INFO - __main__ - Step 14696: {'lr': 0.0004909776010184585, 'samples': 2821632, 'steps': 14695, 'loss/train': 1.770862340927124} -11/06/2021 23:16:30 - INFO - __main__ - Step 14697: {'lr': 0.0004909761881663642, 'samples': 2821824, 'steps': 14696, 'loss/train': 1.7851510047912598} -11/06/2021 23:16:31 - INFO - __main__ - Step 14698: {'lr': 0.0004909747752056897, 'samples': 2822016, 'steps': 14697, 'loss/train': 1.8535454273223877} -11/06/2021 23:16:31 - INFO - __main__ - Step 14699: {'lr': 0.0004909733621364358, 'samples': 2822208, 'steps': 14698, 'loss/train': 1.4395469427108765} -11/06/2021 23:16:31 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.9752013683319092} -11/06/2021 23:16:32 - INFO - __main__ - Step 14701: {'lr': 0.0004909705356721919, 'samples': 2822592, 'steps': 14700, 'loss/train': 1.4780222177505493} -11/06/2021 23:16:32 - INFO - __main__ - Step 14702: {'lr': 0.0004909691222772032, 'samples': 2822784, 'steps': 14701, 'loss/train': 1.6931217908859253} -11/06/2021 23:16:33 - INFO - __main__ - Step 14703: {'lr': 0.0004909677087736375, 'samples': 2822976, 'steps': 14702, 'loss/train': 1.33567214012146} -11/06/2021 23:16:33 - INFO - __main__ - Step 14704: {'lr': 0.0004909662951614955, 'samples': 2823168, 'steps': 14703, 'loss/train': 1.3383984565734863} -11/06/2021 23:16:34 - INFO - __main__ - Step 14705: {'lr': 0.0004909648814407779, 'samples': 2823360, 'steps': 14704, 'loss/train': 1.8960798978805542} -11/06/2021 23:16:34 - INFO - __main__ - Step 14706: {'lr': 0.0004909634676114851, 'samples': 2823552, 'steps': 14705, 'loss/train': 1.757364273071289} -11/06/2021 23:16:34 - INFO - __main__ - Step 14707: {'lr': 0.000490962053673618, 'samples': 2823744, 'steps': 14706, 'loss/train': 1.1211416721343994} -11/06/2021 23:16:36 - INFO - __main__ - Step 14708: {'lr': 0.0004909606396271771, 'samples': 2823936, 'steps': 14707, 'loss/train': 1.9302036762237549} -11/06/2021 23:16:36 - INFO - __main__ - Step 14709: {'lr': 0.000490959225472163, 'samples': 2824128, 'steps': 14708, 'loss/train': 1.3645907640457153} -11/06/2021 23:16:36 - INFO - __main__ - Step 14710: {'lr': 0.0004909578112085764, 'samples': 2824320, 'steps': 14709, 'loss/train': 1.793792724609375} -11/06/2021 23:16:37 - INFO - __main__ - Step 14711: {'lr': 0.0004909563968364179, 'samples': 2824512, 'steps': 14710, 'loss/train': 1.516960859298706} -11/06/2021 23:16:37 - INFO - __main__ - Step 14712: {'lr': 0.0004909549823556883, 'samples': 2824704, 'steps': 14711, 'loss/train': 1.5521596670150757} -11/06/2021 23:16:37 - INFO - __main__ - Step 14713: {'lr': 0.000490953567766388, 'samples': 2824896, 'steps': 14712, 'loss/train': 1.9512124061584473} -11/06/2021 23:16:38 - INFO - __main__ - Step 14714: {'lr': 0.0004909521530685177, 'samples': 2825088, 'steps': 14713, 'loss/train': 2.1272761821746826} -11/06/2021 23:16:39 - INFO - __main__ - Step 14715: {'lr': 0.0004909507382620782, 'samples': 2825280, 'steps': 14714, 'loss/train': 1.705784559249878} -11/06/2021 23:16:39 - INFO - __main__ - Step 14716: {'lr': 0.0004909493233470699, 'samples': 2825472, 'steps': 14715, 'loss/train': 1.458823323249817} -11/06/2021 23:16:40 - INFO - __main__ - Step 14717: {'lr': 0.0004909479083234936, 'samples': 2825664, 'steps': 14716, 'loss/train': 1.4705344438552856} -11/06/2021 23:16:40 - INFO - __main__ - Step 14718: {'lr': 0.0004909464931913499, 'samples': 2825856, 'steps': 14717, 'loss/train': 2.149104118347168} -11/06/2021 23:16:41 - INFO - __main__ - Step 14719: {'lr': 0.0004909450779506393, 'samples': 2826048, 'steps': 14718, 'loss/train': 1.4514827728271484} -11/06/2021 23:16:41 - INFO - __main__ - Step 14720: {'lr': 0.0004909436626013628, 'samples': 2826240, 'steps': 14719, 'loss/train': 1.459384799003601} -11/06/2021 23:16:42 - INFO - __main__ - Step 14721: {'lr': 0.0004909422471435207, 'samples': 2826432, 'steps': 14720, 'loss/train': 1.9327574968338013} -11/06/2021 23:16:42 - INFO - __main__ - Step 14722: {'lr': 0.0004909408315771136, 'samples': 2826624, 'steps': 14721, 'loss/train': 1.8887290954589844} -11/06/2021 23:16:42 - INFO - __main__ - Step 14723: {'lr': 0.0004909394159021425, 'samples': 2826816, 'steps': 14722, 'loss/train': 1.6616466045379639} -11/06/2021 23:16:43 - INFO - __main__ - Step 14724: {'lr': 0.0004909380001186077, 'samples': 2827008, 'steps': 14723, 'loss/train': 1.528913974761963} -11/06/2021 23:16:44 - INFO - __main__ - Step 14725: {'lr': 0.00049093658422651, 'samples': 2827200, 'steps': 14724, 'loss/train': 1.4247432947158813} -11/06/2021 23:16:44 - INFO - __main__ - Step 14726: {'lr': 0.00049093516822585, 'samples': 2827392, 'steps': 14725, 'loss/train': 2.329897165298462} -11/06/2021 23:16:44 - INFO - __main__ - Step 14727: {'lr': 0.0004909337521166282, 'samples': 2827584, 'steps': 14726, 'loss/train': 1.4586058855056763} -11/06/2021 23:16:45 - INFO - __main__ - Step 14728: {'lr': 0.0004909323358988455, 'samples': 2827776, 'steps': 14727, 'loss/train': 1.297971487045288} -11/06/2021 23:16:45 - INFO - __main__ - Step 14729: {'lr': 0.0004909309195725024, 'samples': 2827968, 'steps': 14728, 'loss/train': 1.9658069610595703} -11/06/2021 23:16:46 - INFO - __main__ - Step 14730: {'lr': 0.0004909295031375996, 'samples': 2828160, 'steps': 14729, 'loss/train': 1.5267490148544312} -11/06/2021 23:16:47 - INFO - __main__ - Step 14731: {'lr': 0.0004909280865941375, 'samples': 2828352, 'steps': 14730, 'loss/train': 1.8899013996124268} -11/06/2021 23:16:47 - INFO - __main__ - Step 14732: {'lr': 0.0004909266699421171, 'samples': 2828544, 'steps': 14731, 'loss/train': 1.7061964273452759} -11/06/2021 23:16:47 - INFO - __main__ - Step 14733: {'lr': 0.0004909252531815388, 'samples': 2828736, 'steps': 14732, 'loss/train': 1.6438379287719727} -11/06/2021 23:16:48 - INFO - __main__ - Step 14734: {'lr': 0.0004909238363124033, 'samples': 2828928, 'steps': 14733, 'loss/train': 1.719048023223877} -11/06/2021 23:16:49 - INFO - __main__ - Step 14735: {'lr': 0.0004909224193347112, 'samples': 2829120, 'steps': 14734, 'loss/train': 1.9832409620285034} -11/06/2021 23:16:49 - INFO - __main__ - Step 14736: {'lr': 0.0004909210022484633, 'samples': 2829312, 'steps': 14735, 'loss/train': 2.6759371757507324} -11/06/2021 23:16:49 - INFO - __main__ - Step 14737: {'lr': 0.00049091958505366, 'samples': 2829504, 'steps': 14736, 'loss/train': 1.7943952083587646} -11/06/2021 23:16:50 - INFO - __main__ - Step 14738: {'lr': 0.000490918167750302, 'samples': 2829696, 'steps': 14737, 'loss/train': 1.9066545963287354} -11/06/2021 23:16:50 - INFO - __main__ - Step 14739: {'lr': 0.00049091675033839, 'samples': 2829888, 'steps': 14738, 'loss/train': 1.0074669122695923} -11/06/2021 23:16:51 - INFO - __main__ - Step 14740: {'lr': 0.0004909153328179248, 'samples': 2830080, 'steps': 14739, 'loss/train': 1.9582070112228394} -11/06/2021 23:16:51 - INFO - __main__ - Step 14741: {'lr': 0.0004909139151889067, 'samples': 2830272, 'steps': 14740, 'loss/train': 2.478091239929199} -11/06/2021 23:16:52 - INFO - __main__ - Step 14742: {'lr': 0.0004909124974513366, 'samples': 2830464, 'steps': 14741, 'loss/train': 1.6102755069732666} -11/06/2021 23:16:52 - INFO - __main__ - Step 14743: {'lr': 0.000490911079605215, 'samples': 2830656, 'steps': 14742, 'loss/train': 1.9308674335479736} -11/06/2021 23:16:53 - INFO - __main__ - Step 14744: {'lr': 0.0004909096616505426, 'samples': 2830848, 'steps': 14743, 'loss/train': 1.605130672454834} -11/06/2021 23:16:53 - INFO - __main__ - Step 14745: {'lr': 0.00049090824358732, 'samples': 2831040, 'steps': 14744, 'loss/train': 1.5920521020889282} -11/06/2021 23:16:54 - INFO - __main__ - Step 14746: {'lr': 0.0004909068254155479, 'samples': 2831232, 'steps': 14745, 'loss/train': 1.7607147693634033} -11/06/2021 23:16:55 - INFO - __main__ - Step 14747: {'lr': 0.0004909054071352269, 'samples': 2831424, 'steps': 14746, 'loss/train': 1.231070876121521} -11/06/2021 23:16:55 - INFO - __main__ - Step 14748: {'lr': 0.0004909039887463576, 'samples': 2831616, 'steps': 14747, 'loss/train': 1.5784339904785156} -11/06/2021 23:16:55 - INFO - __main__ - Step 14749: {'lr': 0.0004909025702489407, 'samples': 2831808, 'steps': 14748, 'loss/train': 0.686924934387207} -11/06/2021 23:16:56 - INFO - __main__ - Step 14750: {'lr': 0.0004909011516429768, 'samples': 2832000, 'steps': 14749, 'loss/train': 1.3042925596237183} -11/06/2021 23:16:57 - INFO - __main__ - Step 14751: {'lr': 0.0004908997329284667, 'samples': 2832192, 'steps': 14750, 'loss/train': 1.7104178667068481} -11/06/2021 23:16:57 - INFO - __main__ - Step 14752: {'lr': 0.0004908983141054107, 'samples': 2832384, 'steps': 14751, 'loss/train': 1.4332627058029175} -11/06/2021 23:16:57 - INFO - __main__ - Step 14753: {'lr': 0.0004908968951738098, 'samples': 2832576, 'steps': 14752, 'loss/train': 2.133230209350586} -11/06/2021 23:16:58 - INFO - __main__ - Step 14754: {'lr': 0.0004908954761336643, 'samples': 2832768, 'steps': 14753, 'loss/train': 1.732865333557129} -11/06/2021 23:16:58 - INFO - __main__ - Step 14755: {'lr': 0.0004908940569849751, 'samples': 2832960, 'steps': 14754, 'loss/train': 1.9178493022918701} -11/06/2021 23:16:59 - INFO - __main__ - Step 14756: {'lr': 0.0004908926377277428, 'samples': 2833152, 'steps': 14755, 'loss/train': 1.5390150547027588} -11/06/2021 23:16:59 - INFO - __main__ - Step 14757: {'lr': 0.000490891218361968, 'samples': 2833344, 'steps': 14756, 'loss/train': 1.8167674541473389} -11/06/2021 23:17:00 - INFO - __main__ - Step 14758: {'lr': 0.0004908897988876512, 'samples': 2833536, 'steps': 14757, 'loss/train': 1.5798640251159668} -11/06/2021 23:17:00 - INFO - __main__ - Step 14759: {'lr': 0.0004908883793047934, 'samples': 2833728, 'steps': 14758, 'loss/train': 1.2919437885284424} -11/06/2021 23:17:01 - INFO - __main__ - Step 14760: {'lr': 0.0004908869596133948, 'samples': 2833920, 'steps': 14759, 'loss/train': 2.303706407546997} -11/06/2021 23:17:01 - INFO - __main__ - Step 14761: {'lr': 0.0004908855398134563, 'samples': 2834112, 'steps': 14760, 'loss/train': 1.3456342220306396} -11/06/2021 23:17:02 - INFO - __main__ - Step 14762: {'lr': 0.0004908841199049785, 'samples': 2834304, 'steps': 14761, 'loss/train': 1.4965943098068237} -11/06/2021 23:17:02 - INFO - __main__ - Step 14763: {'lr': 0.0004908826998879621, 'samples': 2834496, 'steps': 14762, 'loss/train': 1.7584352493286133} -11/06/2021 23:17:03 - INFO - __main__ - Step 14764: {'lr': 0.0004908812797624077, 'samples': 2834688, 'steps': 14763, 'loss/train': 1.936519980430603} -11/06/2021 23:17:03 - INFO - __main__ - Step 14765: {'lr': 0.0004908798595283159, 'samples': 2834880, 'steps': 14764, 'loss/train': 2.077310562133789} -11/06/2021 23:17:03 - INFO - __main__ - Step 14766: {'lr': 0.0004908784391856872, 'samples': 2835072, 'steps': 14765, 'loss/train': 1.6648650169372559} -11/06/2021 23:17:05 - INFO - __main__ - Step 14767: {'lr': 0.0004908770187345225, 'samples': 2835264, 'steps': 14766, 'loss/train': 1.7535183429718018} -11/06/2021 23:17:05 - INFO - __main__ - Step 14768: {'lr': 0.0004908755981748223, 'samples': 2835456, 'steps': 14767, 'loss/train': 1.9513096809387207} -11/06/2021 23:17:05 - INFO - __main__ - Step 14769: {'lr': 0.0004908741775065873, 'samples': 2835648, 'steps': 14768, 'loss/train': 2.233029365539551} -11/06/2021 23:17:06 - INFO - __main__ - Step 14770: {'lr': 0.0004908727567298181, 'samples': 2835840, 'steps': 14769, 'loss/train': 1.4736902713775635} -11/06/2021 23:17:06 - INFO - __main__ - Step 14771: {'lr': 0.0004908713358445154, 'samples': 2836032, 'steps': 14770, 'loss/train': 5.864256381988525} -11/06/2021 23:17:06 - INFO - __main__ - Step 14772: {'lr': 0.0004908699148506797, 'samples': 2836224, 'steps': 14771, 'loss/train': 1.9193412065505981} -11/06/2021 23:17:07 - INFO - __main__ - Step 14773: {'lr': 0.0004908684937483119, 'samples': 2836416, 'steps': 14772, 'loss/train': 1.799191951751709} -11/06/2021 23:17:08 - INFO - __main__ - Step 14774: {'lr': 0.0004908670725374122, 'samples': 2836608, 'steps': 14773, 'loss/train': 1.3834148645401} -11/06/2021 23:17:08 - INFO - __main__ - Step 14775: {'lr': 0.0004908656512179817, 'samples': 2836800, 'steps': 14774, 'loss/train': 1.5654276609420776} -11/06/2021 23:17:08 - INFO - __main__ - Step 14776: {'lr': 0.0004908642297900209, 'samples': 2836992, 'steps': 14775, 'loss/train': 1.6006273031234741} -11/06/2021 23:17:09 - INFO - __main__ - Step 14777: {'lr': 0.0004908628082535303, 'samples': 2837184, 'steps': 14776, 'loss/train': 1.8874455690383911} -11/06/2021 23:17:10 - INFO - __main__ - Step 14778: {'lr': 0.0004908613866085106, 'samples': 2837376, 'steps': 14777, 'loss/train': 1.3304411172866821} -11/06/2021 23:17:10 - INFO - __main__ - Step 14779: {'lr': 0.0004908599648549626, 'samples': 2837568, 'steps': 14778, 'loss/train': 1.500115990638733} -11/06/2021 23:17:11 - INFO - __main__ - Step 14780: {'lr': 0.0004908585429928867, 'samples': 2837760, 'steps': 14779, 'loss/train': 1.748668909072876} -11/06/2021 23:17:11 - INFO - __main__ - Step 14781: {'lr': 0.0004908571210222837, 'samples': 2837952, 'steps': 14780, 'loss/train': 1.470587968826294} -11/06/2021 23:17:11 - INFO - __main__ - Step 14782: {'lr': 0.0004908556989431543, 'samples': 2838144, 'steps': 14781, 'loss/train': 0.8396479487419128} -11/06/2021 23:17:12 - INFO - __main__ - Step 14783: {'lr': 0.0004908542767554988, 'samples': 2838336, 'steps': 14782, 'loss/train': 1.8558242321014404} -11/06/2021 23:17:13 - INFO - __main__ - Step 14784: {'lr': 0.0004908528544593184, 'samples': 2838528, 'steps': 14783, 'loss/train': 1.9126049280166626} -11/06/2021 23:17:13 - INFO - __main__ - Step 14785: {'lr': 0.0004908514320546132, 'samples': 2838720, 'steps': 14784, 'loss/train': 1.7966852188110352} -11/06/2021 23:17:13 - INFO - __main__ - Step 14786: {'lr': 0.000490850009541384, 'samples': 2838912, 'steps': 14785, 'loss/train': 1.829959750175476} -11/06/2021 23:17:14 - INFO - __main__ - Step 14787: {'lr': 0.0004908485869196317, 'samples': 2839104, 'steps': 14786, 'loss/train': 1.6409757137298584} -11/06/2021 23:17:15 - INFO - __main__ - Step 14788: {'lr': 0.0004908471641893566, 'samples': 2839296, 'steps': 14787, 'loss/train': 1.4668761491775513} -11/06/2021 23:17:15 - INFO - __main__ - Step 14789: {'lr': 0.0004908457413505596, 'samples': 2839488, 'steps': 14788, 'loss/train': 1.7249447107315063} -11/06/2021 23:17:16 - INFO - __main__ - Step 14790: {'lr': 0.0004908443184032411, 'samples': 2839680, 'steps': 14789, 'loss/train': 1.671472430229187} -11/06/2021 23:17:16 - INFO - __main__ - Step 14791: {'lr': 0.0004908428953474019, 'samples': 2839872, 'steps': 14790, 'loss/train': 1.2302889823913574} -11/06/2021 23:17:16 - INFO - __main__ - Step 14792: {'lr': 0.0004908414721830427, 'samples': 2840064, 'steps': 14791, 'loss/train': 1.5707032680511475} -11/06/2021 23:17:17 - INFO - __main__ - Step 14793: {'lr': 0.000490840048910164, 'samples': 2840256, 'steps': 14792, 'loss/train': 1.8218657970428467} -11/06/2021 23:17:18 - INFO - __main__ - Step 14794: {'lr': 0.0004908386255287664, 'samples': 2840448, 'steps': 14793, 'loss/train': 2.0798017978668213} -11/06/2021 23:17:18 - INFO - __main__ - Step 14795: {'lr': 0.0004908372020388508, 'samples': 2840640, 'steps': 14794, 'loss/train': 1.7213116884231567} -11/06/2021 23:17:18 - INFO - __main__ - Step 14796: {'lr': 0.0004908357784404175, 'samples': 2840832, 'steps': 14795, 'loss/train': 1.5220595598220825} -11/06/2021 23:17:19 - INFO - __main__ - Step 14797: {'lr': 0.0004908343547334674, 'samples': 2841024, 'steps': 14796, 'loss/train': 1.586082100868225} -11/06/2021 23:17:19 - INFO - __main__ - Step 14798: {'lr': 0.0004908329309180011, 'samples': 2841216, 'steps': 14797, 'loss/train': 2.087536573410034} -11/06/2021 23:17:20 - INFO - __main__ - Step 14799: {'lr': 0.0004908315069940191, 'samples': 2841408, 'steps': 14798, 'loss/train': 1.841811180114746} -11/06/2021 23:17:20 - INFO - __main__ - Step 14800: {'lr': 0.0004908300829615222, 'samples': 2841600, 'steps': 14799, 'loss/train': 1.4489543437957764} -11/06/2021 23:17:21 - INFO - __main__ - Step 14801: {'lr': 0.000490828658820511, 'samples': 2841792, 'steps': 14800, 'loss/train': 1.7258611917495728} -11/06/2021 23:17:21 - INFO - __main__ - Step 14802: {'lr': 0.0004908272345709861, 'samples': 2841984, 'steps': 14801, 'loss/train': 1.824029564857483} -11/06/2021 23:17:21 - INFO - __main__ - Step 14803: {'lr': 0.0004908258102129481, 'samples': 2842176, 'steps': 14802, 'loss/train': 1.134230375289917} -11/06/2021 23:17:23 - INFO - __main__ - Step 14804: {'lr': 0.0004908243857463978, 'samples': 2842368, 'steps': 14803, 'loss/train': 1.6424596309661865} -11/06/2021 23:17:23 - INFO - __main__ - Step 14805: {'lr': 0.0004908229611713357, 'samples': 2842560, 'steps': 14804, 'loss/train': 1.7975839376449585} -11/06/2021 23:17:23 - INFO - __main__ - Step 14806: {'lr': 0.0004908215364877625, 'samples': 2842752, 'steps': 14805, 'loss/train': 1.8489753007888794} -11/06/2021 23:17:24 - INFO - __main__ - Step 14807: {'lr': 0.0004908201116956788, 'samples': 2842944, 'steps': 14806, 'loss/train': 4.51678466796875} -11/06/2021 23:17:24 - INFO - __main__ - Step 14808: {'lr': 0.0004908186867950854, 'samples': 2843136, 'steps': 14807, 'loss/train': 1.53168785572052} -11/06/2021 23:17:24 - INFO - __main__ - Step 14809: {'lr': 0.0004908172617859826, 'samples': 2843328, 'steps': 14808, 'loss/train': 1.772919774055481} -11/06/2021 23:17:25 - INFO - __main__ - Step 14810: {'lr': 0.0004908158366683714, 'samples': 2843520, 'steps': 14809, 'loss/train': 2.220637798309326} -11/06/2021 23:17:26 - INFO - __main__ - Step 14811: {'lr': 0.0004908144114422523, 'samples': 2843712, 'steps': 14810, 'loss/train': 0.5302165150642395} -11/06/2021 23:17:26 - INFO - __main__ - Step 14812: {'lr': 0.000490812986107626, 'samples': 2843904, 'steps': 14811, 'loss/train': 1.51813542842865} -11/06/2021 23:17:26 - INFO - __main__ - Step 14813: {'lr': 0.000490811560664493, 'samples': 2844096, 'steps': 14812, 'loss/train': 1.3996822834014893} -11/06/2021 23:17:27 - INFO - __main__ - Step 14814: {'lr': 0.000490810135112854, 'samples': 2844288, 'steps': 14813, 'loss/train': 1.816659688949585} -11/06/2021 23:17:28 - INFO - __main__ - Step 14815: {'lr': 0.0004908087094527097, 'samples': 2844480, 'steps': 14814, 'loss/train': 1.3649659156799316} -11/06/2021 23:17:28 - INFO - __main__ - Step 14816: {'lr': 0.0004908072836840607, 'samples': 2844672, 'steps': 14815, 'loss/train': 1.6869769096374512} -11/06/2021 23:17:29 - INFO - __main__ - Step 14817: {'lr': 0.0004908058578069077, 'samples': 2844864, 'steps': 14816, 'loss/train': 1.6598951816558838} -11/06/2021 23:17:29 - INFO - __main__ - Step 14818: {'lr': 0.0004908044318212512, 'samples': 2845056, 'steps': 14817, 'loss/train': 1.5969890356063843} -11/06/2021 23:17:29 - INFO - __main__ - Step 14819: {'lr': 0.000490803005727092, 'samples': 2845248, 'steps': 14818, 'loss/train': 1.8578797578811646} -11/06/2021 23:17:30 - INFO - __main__ - Step 14820: {'lr': 0.0004908015795244307, 'samples': 2845440, 'steps': 14819, 'loss/train': 1.8108375072479248} -11/06/2021 23:17:31 - INFO - __main__ - Step 14821: {'lr': 0.0004908001532132679, 'samples': 2845632, 'steps': 14820, 'loss/train': 1.6355654001235962} -11/06/2021 23:17:31 - INFO - __main__ - Step 14822: {'lr': 0.0004907987267936042, 'samples': 2845824, 'steps': 14821, 'loss/train': 1.8750498294830322} -11/06/2021 23:17:31 - INFO - __main__ - Step 14823: {'lr': 0.0004907973002654404, 'samples': 2846016, 'steps': 14822, 'loss/train': 1.708099603652954} -11/06/2021 23:17:32 - INFO - __main__ - Step 14824: {'lr': 0.0004907958736287771, 'samples': 2846208, 'steps': 14823, 'loss/train': 1.5635958909988403} -11/06/2021 23:17:33 - INFO - __main__ - Step 14825: {'lr': 0.0004907944468836148, 'samples': 2846400, 'steps': 14824, 'loss/train': 3.393544912338257} -11/06/2021 23:17:33 - INFO - __main__ - Step 14826: {'lr': 0.0004907930200299543, 'samples': 2846592, 'steps': 14825, 'loss/train': 1.548439383506775} -11/06/2021 23:17:33 - INFO - __main__ - Step 14827: {'lr': 0.0004907915930677961, 'samples': 2846784, 'steps': 14826, 'loss/train': 1.3716732263565063} -11/06/2021 23:17:34 - INFO - __main__ - Step 14828: {'lr': 0.000490790165997141, 'samples': 2846976, 'steps': 14827, 'loss/train': 1.7341458797454834} -11/06/2021 23:17:34 - INFO - __main__ - Step 14829: {'lr': 0.0004907887388179896, 'samples': 2847168, 'steps': 14828, 'loss/train': 1.6612669229507446} -11/06/2021 23:17:35 - INFO - __main__ - Step 14830: {'lr': 0.0004907873115303424, 'samples': 2847360, 'steps': 14829, 'loss/train': 1.5637840032577515} -11/06/2021 23:17:36 - INFO - __main__ - Step 14831: {'lr': 0.0004907858841342002, 'samples': 2847552, 'steps': 14830, 'loss/train': 1.3963515758514404} -11/06/2021 23:17:36 - INFO - __main__ - Step 14832: {'lr': 0.0004907844566295637, 'samples': 2847744, 'steps': 14831, 'loss/train': 1.5587491989135742} -11/06/2021 23:17:36 - INFO - __main__ - Step 14833: {'lr': 0.0004907830290164332, 'samples': 2847936, 'steps': 14832, 'loss/train': 1.662847638130188} -11/06/2021 23:17:37 - INFO - __main__ - Step 14834: {'lr': 0.0004907816012948098, 'samples': 2848128, 'steps': 14833, 'loss/train': 2.050675630569458} -11/06/2021 23:17:37 - INFO - __main__ - Step 14835: {'lr': 0.0004907801734646938, 'samples': 2848320, 'steps': 14834, 'loss/train': 1.9373985528945923} -11/06/2021 23:17:38 - INFO - __main__ - Step 14836: {'lr': 0.000490778745526086, 'samples': 2848512, 'steps': 14835, 'loss/train': 1.7804934978485107} -11/06/2021 23:17:38 - INFO - __main__ - Step 14837: {'lr': 0.000490777317478987, 'samples': 2848704, 'steps': 14836, 'loss/train': 1.345388412475586} -11/06/2021 23:17:39 - INFO - __main__ - Step 14838: {'lr': 0.0004907758893233975, 'samples': 2848896, 'steps': 14837, 'loss/train': 1.093638300895691} -11/06/2021 23:17:39 - INFO - __main__ - Step 14839: {'lr': 0.0004907744610593181, 'samples': 2849088, 'steps': 14838, 'loss/train': 1.936640739440918} -11/06/2021 23:17:39 - INFO - __main__ - Step 14840: {'lr': 0.0004907730326867495, 'samples': 2849280, 'steps': 14839, 'loss/train': 1.6983401775360107} -11/06/2021 23:17:40 - INFO - __main__ - Step 14841: {'lr': 0.0004907716042056921, 'samples': 2849472, 'steps': 14840, 'loss/train': 2.199077844619751} -11/06/2021 23:17:41 - INFO - __main__ - Step 14842: {'lr': 0.0004907701756161469, 'samples': 2849664, 'steps': 14841, 'loss/train': 2.0116066932678223} -11/06/2021 23:17:41 - INFO - __main__ - Step 14843: {'lr': 0.0004907687469181143, 'samples': 2849856, 'steps': 14842, 'loss/train': 1.461774230003357} -11/06/2021 23:17:41 - INFO - __main__ - Step 14844: {'lr': 0.000490767318111595, 'samples': 2850048, 'steps': 14843, 'loss/train': 1.6642917394638062} -11/06/2021 23:17:42 - INFO - __main__ - Step 14845: {'lr': 0.0004907658891965897, 'samples': 2850240, 'steps': 14844, 'loss/train': 1.9356948137283325} -11/06/2021 23:17:43 - INFO - __main__ - Step 14846: {'lr': 0.000490764460173099, 'samples': 2850432, 'steps': 14845, 'loss/train': 1.7684423923492432} -11/06/2021 23:17:43 - INFO - __main__ - Step 14847: {'lr': 0.0004907630310411236, 'samples': 2850624, 'steps': 14846, 'loss/train': 1.5917563438415527} -11/06/2021 23:17:43 - INFO - __main__ - Step 14848: {'lr': 0.000490761601800664, 'samples': 2850816, 'steps': 14847, 'loss/train': 1.7513176202774048} -11/06/2021 23:17:44 - INFO - __main__ - Step 14849: {'lr': 0.000490760172451721, 'samples': 2851008, 'steps': 14848, 'loss/train': 1.5119004249572754} -11/06/2021 23:17:44 - INFO - __main__ - Step 14850: {'lr': 0.0004907587429942952, 'samples': 2851200, 'steps': 14849, 'loss/train': 2.091411590576172} -11/06/2021 23:17:45 - INFO - __main__ - Step 14851: {'lr': 0.0004907573134283872, 'samples': 2851392, 'steps': 14850, 'loss/train': 1.808640718460083} -11/06/2021 23:17:45 - INFO - __main__ - Step 14852: {'lr': 0.0004907558837539976, 'samples': 2851584, 'steps': 14851, 'loss/train': 1.7864621877670288} -11/06/2021 23:17:46 - INFO - __main__ - Step 14853: {'lr': 0.0004907544539711272, 'samples': 2851776, 'steps': 14852, 'loss/train': 1.476940631866455} -11/06/2021 23:17:46 - INFO - __main__ - Step 14854: {'lr': 0.0004907530240797765, 'samples': 2851968, 'steps': 14853, 'loss/train': 1.674166202545166} -11/06/2021 23:17:47 - INFO - __main__ - Step 14855: {'lr': 0.0004907515940799463, 'samples': 2852160, 'steps': 14854, 'loss/train': 1.497134804725647} -11/06/2021 23:17:48 - INFO - __main__ - Step 14856: {'lr': 0.000490750163971637, 'samples': 2852352, 'steps': 14855, 'loss/train': 1.8654690980911255} -11/06/2021 23:17:48 - INFO - __main__ - Step 14857: {'lr': 0.0004907487337548495, 'samples': 2852544, 'steps': 14856, 'loss/train': 1.693071722984314} -11/06/2021 23:17:49 - INFO - __main__ - Step 14858: {'lr': 0.0004907473034295843, 'samples': 2852736, 'steps': 14857, 'loss/train': 1.270855188369751} -11/06/2021 23:17:49 - INFO - __main__ - Step 14859: {'lr': 0.0004907458729958422, 'samples': 2852928, 'steps': 14858, 'loss/train': 1.4801957607269287} -11/06/2021 23:17:49 - INFO - __main__ - Step 14860: {'lr': 0.0004907444424536235, 'samples': 2853120, 'steps': 14859, 'loss/train': 1.5060356855392456} -11/06/2021 23:17:50 - INFO - __main__ - Step 14861: {'lr': 0.0004907430118029293, 'samples': 2853312, 'steps': 14860, 'loss/train': 1.8055636882781982} -11/06/2021 23:17:51 - INFO - __main__ - Step 14862: {'lr': 0.0004907415810437598, 'samples': 2853504, 'steps': 14861, 'loss/train': 1.6325714588165283} -11/06/2021 23:17:51 - INFO - __main__ - Step 14863: {'lr': 0.0004907401501761159, 'samples': 2853696, 'steps': 14862, 'loss/train': 1.5240354537963867} -11/06/2021 23:17:51 - INFO - __main__ - Step 14864: {'lr': 0.0004907387191999984, 'samples': 2853888, 'steps': 14863, 'loss/train': 1.4284332990646362} -11/06/2021 23:17:52 - INFO - __main__ - Step 14865: {'lr': 0.0004907372881154075, 'samples': 2854080, 'steps': 14864, 'loss/train': 1.6523523330688477} -11/06/2021 23:17:53 - INFO - __main__ - Step 14866: {'lr': 0.0004907358569223442, 'samples': 2854272, 'steps': 14865, 'loss/train': 1.5434261560440063} -11/06/2021 23:17:53 - INFO - __main__ - Step 14867: {'lr': 0.000490734425620809, 'samples': 2854464, 'steps': 14866, 'loss/train': 1.671189785003662} -11/06/2021 23:17:53 - INFO - __main__ - Step 14868: {'lr': 0.0004907329942108027, 'samples': 2854656, 'steps': 14867, 'loss/train': 1.6853291988372803} -11/06/2021 23:17:54 - INFO - __main__ - Step 14869: {'lr': 0.0004907315626923258, 'samples': 2854848, 'steps': 14868, 'loss/train': 1.1505197286605835} -11/06/2021 23:17:54 - INFO - __main__ - Step 14870: {'lr': 0.0004907301310653789, 'samples': 2855040, 'steps': 14869, 'loss/train': 1.6277196407318115} -11/06/2021 23:17:55 - INFO - __main__ - Step 14871: {'lr': 0.0004907286993299627, 'samples': 2855232, 'steps': 14870, 'loss/train': 2.135899305343628} -11/06/2021 23:17:56 - INFO - __main__ - Step 14872: {'lr': 0.0004907272674860779, 'samples': 2855424, 'steps': 14871, 'loss/train': 2.0826239585876465} -11/06/2021 23:17:56 - INFO - __main__ - Step 14873: {'lr': 0.0004907258355337251, 'samples': 2855616, 'steps': 14872, 'loss/train': 1.8687199354171753} -11/06/2021 23:17:56 - INFO - __main__ - Step 14874: {'lr': 0.0004907244034729049, 'samples': 2855808, 'steps': 14873, 'loss/train': 1.6615655422210693} -11/06/2021 23:17:57 - INFO - __main__ - Step 14875: {'lr': 0.0004907229713036181, 'samples': 2856000, 'steps': 14874, 'loss/train': 1.7533270120620728} -11/06/2021 23:17:57 - INFO - __main__ - Step 14876: {'lr': 0.0004907215390258652, 'samples': 2856192, 'steps': 14875, 'loss/train': 1.654037356376648} -11/06/2021 23:17:58 - INFO - __main__ - Step 14877: {'lr': 0.0004907201066396469, 'samples': 2856384, 'steps': 14876, 'loss/train': 1.8480337858200073} -11/06/2021 23:17:58 - INFO - __main__ - Step 14878: {'lr': 0.0004907186741449638, 'samples': 2856576, 'steps': 14877, 'loss/train': 1.6371917724609375} -11/06/2021 23:17:59 - INFO - __main__ - Step 14879: {'lr': 0.0004907172415418166, 'samples': 2856768, 'steps': 14878, 'loss/train': 1.5165156126022339} -11/06/2021 23:17:59 - INFO - __main__ - Step 14880: {'lr': 0.0004907158088302059, 'samples': 2856960, 'steps': 14879, 'loss/train': 1.6989234685897827} -11/06/2021 23:17:59 - INFO - __main__ - Step 14881: {'lr': 0.0004907143760101325, 'samples': 2857152, 'steps': 14880, 'loss/train': 1.368466854095459} -11/06/2021 23:18:01 - INFO - __main__ - Step 14882: {'lr': 0.0004907129430815968, 'samples': 2857344, 'steps': 14881, 'loss/train': 1.8604637384414673} -11/06/2021 23:18:01 - INFO - __main__ - Step 14883: {'lr': 0.0004907115100445996, 'samples': 2857536, 'steps': 14882, 'loss/train': 1.6678239107131958} -11/06/2021 23:18:01 - INFO - __main__ - Step 14884: {'lr': 0.0004907100768991415, 'samples': 2857728, 'steps': 14883, 'loss/train': 2.169818878173828} -11/06/2021 23:18:02 - INFO - __main__ - Step 14885: {'lr': 0.0004907086436452231, 'samples': 2857920, 'steps': 14884, 'loss/train': 1.5355026721954346} -11/06/2021 23:18:02 - INFO - __main__ - Step 14886: {'lr': 0.0004907072102828451, 'samples': 2858112, 'steps': 14885, 'loss/train': 1.5460067987442017} -11/06/2021 23:18:03 - INFO - __main__ - Step 14887: {'lr': 0.0004907057768120082, 'samples': 2858304, 'steps': 14886, 'loss/train': 1.5537009239196777} -11/06/2021 23:18:03 - INFO - __main__ - Step 14888: {'lr': 0.000490704343232713, 'samples': 2858496, 'steps': 14887, 'loss/train': 1.7863291501998901} -11/06/2021 23:18:04 - INFO - __main__ - Step 14889: {'lr': 0.0004907029095449602, 'samples': 2858688, 'steps': 14888, 'loss/train': 1.847086787223816} -11/06/2021 23:18:04 - INFO - __main__ - Step 14890: {'lr': 0.0004907014757487503, 'samples': 2858880, 'steps': 14889, 'loss/train': 1.9282914400100708} -11/06/2021 23:18:04 - INFO - __main__ - Step 14891: {'lr': 0.0004907000418440839, 'samples': 2859072, 'steps': 14890, 'loss/train': 1.711198091506958} -11/06/2021 23:18:05 - INFO - __main__ - Step 14892: {'lr': 0.000490698607830962, 'samples': 2859264, 'steps': 14891, 'loss/train': 1.5940576791763306} -11/06/2021 23:18:06 - INFO - __main__ - Step 14893: {'lr': 0.0004906971737093849, 'samples': 2859456, 'steps': 14892, 'loss/train': 1.9280325174331665} -11/06/2021 23:18:06 - INFO - __main__ - Step 14894: {'lr': 0.0004906957394793534, 'samples': 2859648, 'steps': 14893, 'loss/train': 1.427196979522705} -11/06/2021 23:18:06 - INFO - __main__ - Step 14895: {'lr': 0.0004906943051408682, 'samples': 2859840, 'steps': 14894, 'loss/train': 1.3355380296707153} -11/06/2021 23:18:07 - INFO - __main__ - Step 14896: {'lr': 0.0004906928706939296, 'samples': 2860032, 'steps': 14895, 'loss/train': 1.7179498672485352} -11/06/2021 23:18:08 - INFO - __main__ - Step 14897: {'lr': 0.0004906914361385387, 'samples': 2860224, 'steps': 14896, 'loss/train': 1.7625758647918701} -11/06/2021 23:18:08 - INFO - __main__ - Step 14898: {'lr': 0.0004906900014746959, 'samples': 2860416, 'steps': 14897, 'loss/train': 1.622707724571228} -11/06/2021 23:18:09 - INFO - __main__ - Step 14899: {'lr': 0.000490688566702402, 'samples': 2860608, 'steps': 14898, 'loss/train': 1.7065162658691406} -11/06/2021 23:18:09 - INFO - __main__ - Step 14900: {'lr': 0.0004906871318216575, 'samples': 2860800, 'steps': 14899, 'loss/train': 1.6930841207504272} -11/06/2021 23:18:09 - INFO - __main__ - Step 14901: {'lr': 0.000490685696832463, 'samples': 2860992, 'steps': 14900, 'loss/train': 1.9356876611709595} -11/06/2021 23:18:10 - INFO - __main__ - Step 14902: {'lr': 0.0004906842617348193, 'samples': 2861184, 'steps': 14901, 'loss/train': 1.8025461435317993} -11/06/2021 23:18:11 - INFO - __main__ - Step 14903: {'lr': 0.000490682826528727, 'samples': 2861376, 'steps': 14902, 'loss/train': 1.7793097496032715} -11/06/2021 23:18:11 - INFO - __main__ - Step 14904: {'lr': 0.0004906813912141868, 'samples': 2861568, 'steps': 14903, 'loss/train': 2.1294806003570557} -11/06/2021 23:18:11 - INFO - __main__ - Step 14905: {'lr': 0.0004906799557911992, 'samples': 2861760, 'steps': 14904, 'loss/train': 1.366396427154541} -11/06/2021 23:18:12 - INFO - __main__ - Step 14906: {'lr': 0.0004906785202597649, 'samples': 2861952, 'steps': 14905, 'loss/train': 1.2872095108032227} -11/06/2021 23:18:13 - INFO - __main__ - Step 14907: {'lr': 0.0004906770846198846, 'samples': 2862144, 'steps': 14906, 'loss/train': 1.8077151775360107} -11/06/2021 23:18:13 - INFO - __main__ - Step 14908: {'lr': 0.0004906756488715589, 'samples': 2862336, 'steps': 14907, 'loss/train': 1.617505669593811} -11/06/2021 23:18:14 - INFO - __main__ - Step 14909: {'lr': 0.0004906742130147884, 'samples': 2862528, 'steps': 14908, 'loss/train': 1.6927767992019653} -11/06/2021 23:18:14 - INFO - __main__ - Step 14910: {'lr': 0.0004906727770495739, 'samples': 2862720, 'steps': 14909, 'loss/train': 1.645467758178711} -11/06/2021 23:18:14 - INFO - __main__ - Step 14911: {'lr': 0.000490671340975916, 'samples': 2862912, 'steps': 14910, 'loss/train': 1.7554125785827637} -11/06/2021 23:18:15 - INFO - __main__ - Step 14912: {'lr': 0.0004906699047938153, 'samples': 2863104, 'steps': 14911, 'loss/train': 1.9322426319122314} -11/06/2021 23:18:16 - INFO - __main__ - Step 14913: {'lr': 0.0004906684685032724, 'samples': 2863296, 'steps': 14912, 'loss/train': 0.9366849064826965} -11/06/2021 23:18:16 - INFO - __main__ - Step 14914: {'lr': 0.0004906670321042881, 'samples': 2863488, 'steps': 14913, 'loss/train': 1.394436240196228} -11/06/2021 23:18:16 - INFO - __main__ - Step 14915: {'lr': 0.0004906655955968628, 'samples': 2863680, 'steps': 14914, 'loss/train': 1.2023478746414185} -11/06/2021 23:18:17 - INFO - __main__ - Step 14916: {'lr': 0.0004906641589809973, 'samples': 2863872, 'steps': 14915, 'loss/train': 2.0545525550842285} -11/06/2021 23:18:17 - INFO - __main__ - Step 14917: {'lr': 0.0004906627222566924, 'samples': 2864064, 'steps': 14916, 'loss/train': 1.4498852491378784} -11/06/2021 23:18:18 - INFO - __main__ - Step 14918: {'lr': 0.0004906612854239485, 'samples': 2864256, 'steps': 14917, 'loss/train': 1.5706671476364136} -11/06/2021 23:18:19 - INFO - __main__ - Step 14919: {'lr': 0.0004906598484827663, 'samples': 2864448, 'steps': 14918, 'loss/train': 1.427777647972107} -11/06/2021 23:18:19 - INFO - __main__ - Step 14920: {'lr': 0.0004906584114331465, 'samples': 2864640, 'steps': 14919, 'loss/train': 1.9566161632537842} -11/06/2021 23:18:19 - INFO - __main__ - Step 14921: {'lr': 0.0004906569742750899, 'samples': 2864832, 'steps': 14920, 'loss/train': 1.7183939218521118} -11/06/2021 23:18:20 - INFO - __main__ - Step 14922: {'lr': 0.0004906555370085968, 'samples': 2865024, 'steps': 14921, 'loss/train': 1.8103671073913574} -11/06/2021 23:18:21 - INFO - __main__ - Step 14923: {'lr': 0.000490654099633668, 'samples': 2865216, 'steps': 14922, 'loss/train': 1.5817921161651611} -11/06/2021 23:18:21 - INFO - __main__ - Step 14924: {'lr': 0.0004906526621503043, 'samples': 2865408, 'steps': 14923, 'loss/train': 1.145911455154419} -11/06/2021 23:18:21 - INFO - __main__ - Step 14925: {'lr': 0.0004906512245585062, 'samples': 2865600, 'steps': 14924, 'loss/train': 2.2841901779174805} -11/06/2021 23:18:22 - INFO - __main__ - Step 14926: {'lr': 0.0004906497868582743, 'samples': 2865792, 'steps': 14925, 'loss/train': 1.4507989883422852} -11/06/2021 23:18:22 - INFO - __main__ - Step 14927: {'lr': 0.0004906483490496093, 'samples': 2865984, 'steps': 14926, 'loss/train': 1.791601538658142} -11/06/2021 23:18:23 - INFO - __main__ - Step 14928: {'lr': 0.000490646911132512, 'samples': 2866176, 'steps': 14927, 'loss/train': 1.7833375930786133} -11/06/2021 23:18:23 - INFO - __main__ - Step 14929: {'lr': 0.0004906454731069828, 'samples': 2866368, 'steps': 14928, 'loss/train': 1.2282170057296753} -11/06/2021 23:18:24 - INFO - __main__ - Step 14930: {'lr': 0.0004906440349730226, 'samples': 2866560, 'steps': 14929, 'loss/train': 1.1155771017074585} -11/06/2021 23:18:24 - INFO - __main__ - Step 14931: {'lr': 0.0004906425967306317, 'samples': 2866752, 'steps': 14930, 'loss/train': 1.8701684474945068} -11/06/2021 23:18:24 - INFO - __main__ - Step 14932: {'lr': 0.0004906411583798112, 'samples': 2866944, 'steps': 14931, 'loss/train': 1.1279278993606567} -11/06/2021 23:18:26 - INFO - __main__ - Step 14933: {'lr': 0.0004906397199205614, 'samples': 2867136, 'steps': 14932, 'loss/train': 1.0893620252609253} -11/06/2021 23:18:26 - INFO - __main__ - Step 14934: {'lr': 0.000490638281352883, 'samples': 2867328, 'steps': 14933, 'loss/train': 1.8908346891403198} -11/06/2021 23:18:26 - INFO - __main__ - Step 14935: {'lr': 0.0004906368426767767, 'samples': 2867520, 'steps': 14934, 'loss/train': 0.6824740767478943} -11/06/2021 23:18:27 - INFO - __main__ - Step 14936: {'lr': 0.0004906354038922432, 'samples': 2867712, 'steps': 14935, 'loss/train': 1.8815536499023438} -11/06/2021 23:18:27 - INFO - __main__ - Step 14937: {'lr': 0.000490633964999283, 'samples': 2867904, 'steps': 14936, 'loss/train': 1.1689196825027466} -11/06/2021 23:18:28 - INFO - __main__ - Step 14938: {'lr': 0.000490632525997897, 'samples': 2868096, 'steps': 14937, 'loss/train': 1.6703389883041382} -11/06/2021 23:18:28 - INFO - __main__ - Step 14939: {'lr': 0.0004906310868880856, 'samples': 2868288, 'steps': 14938, 'loss/train': 1.6411389112472534} -11/06/2021 23:18:29 - INFO - __main__ - Step 14940: {'lr': 0.0004906296476698496, 'samples': 2868480, 'steps': 14939, 'loss/train': 1.2749041318893433} -11/06/2021 23:18:29 - INFO - __main__ - Step 14941: {'lr': 0.0004906282083431897, 'samples': 2868672, 'steps': 14940, 'loss/train': 1.5104907751083374} -11/06/2021 23:18:29 - INFO - __main__ - Step 14942: {'lr': 0.0004906267689081063, 'samples': 2868864, 'steps': 14941, 'loss/train': 1.9198617935180664} -11/06/2021 23:18:30 - INFO - __main__ - Step 14943: {'lr': 0.0004906253293646002, 'samples': 2869056, 'steps': 14942, 'loss/train': 1.7235310077667236} -11/06/2021 23:18:31 - INFO - __main__ - Step 14944: {'lr': 0.0004906238897126721, 'samples': 2869248, 'steps': 14943, 'loss/train': 1.3015567064285278} -11/06/2021 23:18:31 - INFO - __main__ - Step 14945: {'lr': 0.0004906224499523225, 'samples': 2869440, 'steps': 14944, 'loss/train': 1.208406686782837} -11/06/2021 23:18:31 - INFO - __main__ - Step 14946: {'lr': 0.0004906210100835522, 'samples': 2869632, 'steps': 14945, 'loss/train': 1.7185678482055664} -11/06/2021 23:18:32 - INFO - __main__ - Step 14947: {'lr': 0.0004906195701063617, 'samples': 2869824, 'steps': 14946, 'loss/train': 1.6271605491638184} -11/06/2021 23:18:33 - INFO - __main__ - Step 14948: {'lr': 0.0004906181300207518, 'samples': 2870016, 'steps': 14947, 'loss/train': 1.1316771507263184} -11/06/2021 23:18:33 - INFO - __main__ - Step 14949: {'lr': 0.0004906166898267231, 'samples': 2870208, 'steps': 14948, 'loss/train': 1.8571279048919678} -11/06/2021 23:18:34 - INFO - __main__ - Step 14950: {'lr': 0.0004906152495242763, 'samples': 2870400, 'steps': 14949, 'loss/train': 1.3722232580184937} -11/06/2021 23:18:34 - INFO - __main__ - Step 14951: {'lr': 0.0004906138091134118, 'samples': 2870592, 'steps': 14950, 'loss/train': 1.7835454940795898} -11/06/2021 23:18:34 - INFO - __main__ - Step 14952: {'lr': 0.0004906123685941306, 'samples': 2870784, 'steps': 14951, 'loss/train': 1.6602545976638794} -11/06/2021 23:18:35 - INFO - __main__ - Step 14953: {'lr': 0.000490610927966433, 'samples': 2870976, 'steps': 14952, 'loss/train': 1.557942509651184} -11/06/2021 23:18:36 - INFO - __main__ - Step 14954: {'lr': 0.00049060948723032, 'samples': 2871168, 'steps': 14953, 'loss/train': 1.7364459037780762} -11/06/2021 23:18:36 - INFO - __main__ - Step 14955: {'lr': 0.000490608046385792, 'samples': 2871360, 'steps': 14954, 'loss/train': 2.2763864994049072} -11/06/2021 23:18:36 - INFO - __main__ - Step 14956: {'lr': 0.0004906066054328498, 'samples': 2871552, 'steps': 14955, 'loss/train': 1.585302472114563} -11/06/2021 23:18:37 - INFO - __main__ - Step 14957: {'lr': 0.0004906051643714939, 'samples': 2871744, 'steps': 14956, 'loss/train': 1.91652250289917} -11/06/2021 23:18:38 - INFO - __main__ - Step 14958: {'lr': 0.000490603723201725, 'samples': 2871936, 'steps': 14957, 'loss/train': 3.7174441814422607} -11/06/2021 23:18:38 - INFO - __main__ - Step 14959: {'lr': 0.0004906022819235438, 'samples': 2872128, 'steps': 14958, 'loss/train': 1.5262293815612793} -11/06/2021 23:18:38 - INFO - __main__ - Step 14960: {'lr': 0.000490600840536951, 'samples': 2872320, 'steps': 14959, 'loss/train': 1.9472852945327759} -11/06/2021 23:18:39 - INFO - __main__ - Step 14961: {'lr': 0.0004905993990419471, 'samples': 2872512, 'steps': 14960, 'loss/train': 1.6929538249969482} -11/06/2021 23:18:39 - INFO - __main__ - Step 14962: {'lr': 0.0004905979574385328, 'samples': 2872704, 'steps': 14961, 'loss/train': 1.4080133438110352} -11/06/2021 23:18:39 - INFO - __main__ - Step 14963: {'lr': 0.0004905965157267088, 'samples': 2872896, 'steps': 14962, 'loss/train': 1.8805720806121826} -11/06/2021 23:18:41 - INFO - __main__ - Step 14964: {'lr': 0.0004905950739064758, 'samples': 2873088, 'steps': 14963, 'loss/train': 1.8650027513504028} -11/06/2021 23:18:41 - INFO - __main__ - Step 14965: {'lr': 0.0004905936319778343, 'samples': 2873280, 'steps': 14964, 'loss/train': 1.3455829620361328} -11/06/2021 23:18:41 - INFO - __main__ - Step 14966: {'lr': 0.000490592189940785, 'samples': 2873472, 'steps': 14965, 'loss/train': 1.7468905448913574} -11/06/2021 23:18:42 - INFO - __main__ - Step 14967: {'lr': 0.0004905907477953286, 'samples': 2873664, 'steps': 14966, 'loss/train': 1.8428308963775635} -11/06/2021 23:18:42 - INFO - __main__ - Step 14968: {'lr': 0.0004905893055414658, 'samples': 2873856, 'steps': 14967, 'loss/train': 1.5465810298919678} -11/06/2021 23:18:43 - INFO - __main__ - Step 14969: {'lr': 0.0004905878631791971, 'samples': 2874048, 'steps': 14968, 'loss/train': 1.9906973838806152} -11/06/2021 23:18:43 - INFO - __main__ - Step 14970: {'lr': 0.0004905864207085232, 'samples': 2874240, 'steps': 14969, 'loss/train': 1.7254399061203003} -11/06/2021 23:18:44 - INFO - __main__ - Step 14971: {'lr': 0.0004905849781294448, 'samples': 2874432, 'steps': 14970, 'loss/train': 1.8917148113250732} -11/06/2021 23:18:44 - INFO - __main__ - Step 14972: {'lr': 0.0004905835354419625, 'samples': 2874624, 'steps': 14971, 'loss/train': 1.7392559051513672} -11/06/2021 23:18:44 - INFO - __main__ - Step 14973: {'lr': 0.0004905820926460769, 'samples': 2874816, 'steps': 14972, 'loss/train': 1.6358309984207153} -11/06/2021 23:18:45 - INFO - __main__ - Step 14974: {'lr': 0.0004905806497417888, 'samples': 2875008, 'steps': 14973, 'loss/train': 1.6739000082015991} -11/06/2021 23:18:46 - INFO - __main__ - Step 14975: {'lr': 0.0004905792067290988, 'samples': 2875200, 'steps': 14974, 'loss/train': 1.421985387802124} -11/06/2021 23:18:46 - INFO - __main__ - Step 14976: {'lr': 0.0004905777636080075, 'samples': 2875392, 'steps': 14975, 'loss/train': 1.8452321290969849} -11/06/2021 23:18:47 - INFO - __main__ - Step 14977: {'lr': 0.0004905763203785157, 'samples': 2875584, 'steps': 14976, 'loss/train': 1.7335155010223389} -11/06/2021 23:18:47 - INFO - __main__ - Step 14978: {'lr': 0.0004905748770406237, 'samples': 2875776, 'steps': 14977, 'loss/train': 1.7326487302780151} -11/06/2021 23:18:47 - INFO - __main__ - Step 14979: {'lr': 0.0004905734335943325, 'samples': 2875968, 'steps': 14978, 'loss/train': 1.5935941934585571} -11/06/2021 23:18:48 - INFO - __main__ - Step 14980: {'lr': 0.0004905719900396426, 'samples': 2876160, 'steps': 14979, 'loss/train': 1.410271406173706} -11/06/2021 23:18:49 - INFO - __main__ - Step 14981: {'lr': 0.0004905705463765546, 'samples': 2876352, 'steps': 14980, 'loss/train': 1.5823677778244019} -11/06/2021 23:18:49 - INFO - __main__ - Step 14982: {'lr': 0.0004905691026050692, 'samples': 2876544, 'steps': 14981, 'loss/train': 1.2565804719924927} -11/06/2021 23:18:49 - INFO - __main__ - Step 14983: {'lr': 0.0004905676587251873, 'samples': 2876736, 'steps': 14982, 'loss/train': 1.1940447092056274} -11/06/2021 23:18:50 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 2.0281472206115723} -11/06/2021 23:18:50 - INFO - __main__ - Step 14985: {'lr': 0.0004905647706402356, 'samples': 2877120, 'steps': 14984, 'loss/train': 1.4245983362197876} -11/06/2021 23:18:51 - INFO - __main__ - Step 14986: {'lr': 0.0004905633264351673, 'samples': 2877312, 'steps': 14985, 'loss/train': 1.687376856803894} -11/06/2021 23:18:51 - INFO - __main__ - Step 14987: {'lr': 0.0004905618821217048, 'samples': 2877504, 'steps': 14986, 'loss/train': 1.4128832817077637} -11/06/2021 23:18:52 - INFO - __main__ - Step 14988: {'lr': 0.0004905604376998489, 'samples': 2877696, 'steps': 14987, 'loss/train': 1.4120585918426514} -11/06/2021 23:18:52 - INFO - __main__ - Step 14989: {'lr': 0.0004905589931696002, 'samples': 2877888, 'steps': 14988, 'loss/train': 1.6565570831298828} -11/06/2021 23:18:53 - INFO - __main__ - Step 14990: {'lr': 0.0004905575485309593, 'samples': 2878080, 'steps': 14989, 'loss/train': 1.8112573623657227} -11/06/2021 23:18:54 - INFO - __main__ - Step 14991: {'lr': 0.0004905561037839269, 'samples': 2878272, 'steps': 14990, 'loss/train': 1.1115037202835083} -11/06/2021 23:18:54 - INFO - __main__ - Step 14992: {'lr': 0.0004905546589285036, 'samples': 2878464, 'steps': 14991, 'loss/train': 1.6998533010482788} -11/06/2021 23:18:54 - INFO - __main__ - Step 14993: {'lr': 0.0004905532139646901, 'samples': 2878656, 'steps': 14992, 'loss/train': 0.203787699341774} -11/06/2021 23:18:55 - INFO - __main__ - Step 14994: {'lr': 0.000490551768892487, 'samples': 2878848, 'steps': 14993, 'loss/train': 2.0352189540863037} -11/06/2021 23:18:55 - INFO - __main__ - Step 14995: {'lr': 0.000490550323711895, 'samples': 2879040, 'steps': 14994, 'loss/train': 1.996849536895752} -11/06/2021 23:18:56 - INFO - __main__ - Step 14996: {'lr': 0.0004905488784229147, 'samples': 2879232, 'steps': 14995, 'loss/train': 1.7386120557785034} -11/06/2021 23:18:57 - INFO - __main__ - Step 14997: {'lr': 0.000490547433025547, 'samples': 2879424, 'steps': 14996, 'loss/train': 1.7791500091552734} -11/06/2021 23:18:57 - INFO - __main__ - Step 14998: {'lr': 0.0004905459875197921, 'samples': 2879616, 'steps': 14997, 'loss/train': 1.2726280689239502} -11/06/2021 23:18:57 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 1.6460684537887573} -11/06/2021 23:18:58 - INFO - __main__ - Step 15000: {'lr': 0.0004905430961831242, 'samples': 2880000, 'steps': 14999, 'loss/train': 0.5816349983215332} -11/06/2021 23:18:58 - INFO - __main__ - Evaluating and saving model checkpoint -11/06/2021 23:22:11 - INFO - __main__ - Step 15000: {'loss/eval': 1.610079050064087, 'perplexity': 5.003206729888916} -11/06/2021 23:22:42 - WARNING - huggingface_hub.repository - remote: ---------------------------------------------------------- -remote: Your push was accepted, but with warnings: -remote: - warning : empty or missing yaml metadata in card (lvwerra/codeparrot-small) -remote: help: please find help at https://huggingface.co/docs/hub/model-repos -remote: ---------------------------------------------------------- -remote: Please find the documentation at: -remote: https://huggingface.co/docs/hub/model-repos(B -remote: ---------------------------------------------------------- -To https://huggingface.co/lvwerra/codeparrot-small - * [new branch] proud-haze-135 -> proud-haze-135 - -11/06/2021 23:22:43 - INFO - __main__ - Step 15001: {'lr': 0.0004905416503522123, 'samples': 2880192, 'steps': 15000, 'loss/train': 1.465524435043335} -11/06/2021 23:22:44 - INFO - __main__ - Step 15002: {'lr': 0.0004905402044129162, 'samples': 2880384, 'steps': 15001, 'loss/train': 2.2312591075897217} -11/06/2021 23:22:44 - INFO - __main__ - Step 15003: {'lr': 0.0004905387583652363, 'samples': 2880576, 'steps': 15002, 'loss/train': 1.7260355949401855} -11/06/2021 23:22:44 - INFO - __main__ - Step 15004: {'lr': 0.0004905373122091734, 'samples': 2880768, 'steps': 15003, 'loss/train': 0.4969237148761749} -11/06/2021 23:22:45 - INFO - __main__ - Step 15005: {'lr': 0.0004905358659447281, 'samples': 2880960, 'steps': 15004, 'loss/train': 1.7188736200332642} -11/06/2021 23:22:45 - INFO - __main__ - Step 15006: {'lr': 0.000490534419571901, 'samples': 2881152, 'steps': 15005, 'loss/train': 1.781702995300293} -11/06/2021 23:22:46 - INFO - __main__ - Step 15007: {'lr': 0.0004905329730906929, 'samples': 2881344, 'steps': 15006, 'loss/train': 1.1889454126358032} -11/06/2021 23:22:46 - INFO - __main__ - Step 15008: {'lr': 0.0004905315265011043, 'samples': 2881536, 'steps': 15007, 'loss/train': 1.3070452213287354} -11/06/2021 23:22:47 - INFO - __main__ - Step 15009: {'lr': 0.0004905300798031359, 'samples': 2881728, 'steps': 15008, 'loss/train': 2.0110666751861572} -11/06/2021 23:22:47 - INFO - __main__ - Step 15010: {'lr': 0.0004905286329967883, 'samples': 2881920, 'steps': 15009, 'loss/train': 1.7228916883468628} -11/06/2021 23:22:48 - INFO - __main__ - Step 15011: {'lr': 0.0004905271860820622, 'samples': 2882112, 'steps': 15010, 'loss/train': 1.8122127056121826} -11/06/2021 23:22:49 - INFO - __main__ - Step 15012: {'lr': 0.0004905257390589585, 'samples': 2882304, 'steps': 15011, 'loss/train': 1.7922598123550415} -11/06/2021 23:22:49 - INFO - __main__ - Step 15013: {'lr': 0.0004905242919274774, 'samples': 2882496, 'steps': 15012, 'loss/train': 1.3931684494018555} -11/06/2021 23:22:49 - INFO - __main__ - Step 15014: {'lr': 0.0004905228446876197, 'samples': 2882688, 'steps': 15013, 'loss/train': 1.860660195350647} -11/06/2021 23:22:50 - INFO - __main__ - Step 15015: {'lr': 0.0004905213973393863, 'samples': 2882880, 'steps': 15014, 'loss/train': 2.3514349460601807} -11/06/2021 23:22:50 - INFO - __main__ - Step 15016: {'lr': 0.0004905199498827776, 'samples': 2883072, 'steps': 15015, 'loss/train': 1.8527649641036987} -11/06/2021 23:22:51 - INFO - __main__ - Step 15017: {'lr': 0.0004905185023177942, 'samples': 2883264, 'steps': 15016, 'loss/train': 1.7189619541168213} -11/06/2021 23:22:51 - INFO - __main__ - Step 15018: {'lr': 0.0004905170546444371, 'samples': 2883456, 'steps': 15017, 'loss/train': 1.7839937210083008} -11/06/2021 23:22:52 - INFO - __main__ - Step 15019: {'lr': 0.0004905156068627065, 'samples': 2883648, 'steps': 15018, 'loss/train': 1.8625094890594482} -11/06/2021 23:22:52 - INFO - __main__ - Step 15020: {'lr': 0.0004905141589726035, 'samples': 2883840, 'steps': 15019, 'loss/train': 1.4955047369003296} -11/06/2021 23:22:52 - INFO - __main__ - Step 15021: {'lr': 0.0004905127109741284, 'samples': 2884032, 'steps': 15020, 'loss/train': 1.9690922498703003} -11/06/2021 23:22:54 - INFO - __main__ - Step 15022: {'lr': 0.000490511262867282, 'samples': 2884224, 'steps': 15021, 'loss/train': 1.777396559715271} -11/06/2021 23:22:54 - INFO - __main__ - Step 15023: {'lr': 0.000490509814652065, 'samples': 2884416, 'steps': 15022, 'loss/train': 2.3741092681884766} -11/06/2021 23:22:54 - INFO - __main__ - Step 15024: {'lr': 0.0004905083663284779, 'samples': 2884608, 'steps': 15023, 'loss/train': 1.2763044834136963} -11/06/2021 23:22:55 - INFO - __main__ - Step 15025: {'lr': 0.0004905069178965214, 'samples': 2884800, 'steps': 15024, 'loss/train': 1.7052578926086426} -11/06/2021 23:22:55 - INFO - __main__ - Step 15026: {'lr': 0.0004905054693561963, 'samples': 2884992, 'steps': 15025, 'loss/train': 1.5424304008483887} -11/06/2021 23:22:55 - INFO - __main__ - Step 15027: {'lr': 0.0004905040207075032, 'samples': 2885184, 'steps': 15026, 'loss/train': 1.7792967557907104} -11/06/2021 23:22:56 - INFO - __main__ - Step 15028: {'lr': 0.0004905025719504426, 'samples': 2885376, 'steps': 15027, 'loss/train': 2.0818092823028564} -11/06/2021 23:22:57 - INFO - __main__ - Step 15029: {'lr': 0.0004905011230850152, 'samples': 2885568, 'steps': 15028, 'loss/train': 1.9193378686904907} -11/06/2021 23:22:57 - INFO - __main__ - Step 15030: {'lr': 0.0004904996741112218, 'samples': 2885760, 'steps': 15029, 'loss/train': 1.4404072761535645} -11/06/2021 23:22:57 - INFO - __main__ - Step 15031: {'lr': 0.0004904982250290629, 'samples': 2885952, 'steps': 15030, 'loss/train': 1.7105932235717773} -11/06/2021 23:22:58 - INFO - __main__ - Step 15032: {'lr': 0.0004904967758385393, 'samples': 2886144, 'steps': 15031, 'loss/train': 1.7881110906600952} -11/06/2021 23:22:59 - INFO - __main__ - Step 15033: {'lr': 0.0004904953265396515, 'samples': 2886336, 'steps': 15032, 'loss/train': 1.9477510452270508} -11/06/2021 23:23:00 - INFO - __main__ - Step 15034: {'lr': 0.0004904938771324002, 'samples': 2886528, 'steps': 15033, 'loss/train': 0.2995307445526123} -11/06/2021 23:23:00 - INFO - __main__ - Step 15035: {'lr': 0.0004904924276167861, 'samples': 2886720, 'steps': 15034, 'loss/train': 1.766963243484497} -11/06/2021 23:23:00 - INFO - __main__ - Step 15036: {'lr': 0.0004904909779928099, 'samples': 2886912, 'steps': 15035, 'loss/train': 1.1945898532867432} -11/06/2021 23:23:01 - INFO - __main__ - Step 15037: {'lr': 0.000490489528260472, 'samples': 2887104, 'steps': 15036, 'loss/train': 1.4538508653640747} -11/06/2021 23:23:01 - INFO - __main__ - Step 15038: {'lr': 0.0004904880784197734, 'samples': 2887296, 'steps': 15037, 'loss/train': 1.6707526445388794} -11/06/2021 23:23:02 - INFO - __main__ - Step 15039: {'lr': 0.0004904866284707144, 'samples': 2887488, 'steps': 15038, 'loss/train': 1.706793189048767} -11/06/2021 23:23:02 - INFO - __main__ - Step 15040: {'lr': 0.000490485178413296, 'samples': 2887680, 'steps': 15039, 'loss/train': 1.7125017642974854} -11/06/2021 23:23:03 - INFO - __main__ - Step 15041: {'lr': 0.0004904837282475186, 'samples': 2887872, 'steps': 15040, 'loss/train': 1.610682487487793} -11/06/2021 23:23:03 - INFO - __main__ - Step 15042: {'lr': 0.000490482277973383, 'samples': 2888064, 'steps': 15041, 'loss/train': 2.108546495437622} -11/06/2021 23:23:03 - INFO - __main__ - Step 15043: {'lr': 0.0004904808275908898, 'samples': 2888256, 'steps': 15042, 'loss/train': 1.7590423822402954} -11/06/2021 23:23:05 - INFO - __main__ - Step 15044: {'lr': 0.0004904793771000396, 'samples': 2888448, 'steps': 15043, 'loss/train': 1.7148654460906982} -11/06/2021 23:23:05 - INFO - __main__ - Step 15045: {'lr': 0.0004904779265008331, 'samples': 2888640, 'steps': 15044, 'loss/train': 1.8898462057113647} -11/06/2021 23:23:05 - INFO - __main__ - Step 15046: {'lr': 0.000490476475793271, 'samples': 2888832, 'steps': 15045, 'loss/train': 0.4562050402164459} -11/06/2021 23:23:06 - INFO - __main__ - Step 15047: {'lr': 0.0004904750249773538, 'samples': 2889024, 'steps': 15046, 'loss/train': 1.8167861700057983} -11/06/2021 23:23:06 - INFO - __main__ - Step 15048: {'lr': 0.0004904735740530825, 'samples': 2889216, 'steps': 15047, 'loss/train': 1.7291828393936157} -11/06/2021 23:23:07 - INFO - __main__ - Step 15049: {'lr': 0.0004904721230204573, 'samples': 2889408, 'steps': 15048, 'loss/train': 1.8959709405899048} -11/06/2021 23:23:07 - INFO - __main__ - Step 15050: {'lr': 0.0004904706718794791, 'samples': 2889600, 'steps': 15049, 'loss/train': 1.5438092947006226} -11/06/2021 23:23:08 - INFO - __main__ - Step 15051: {'lr': 0.0004904692206301487, 'samples': 2889792, 'steps': 15050, 'loss/train': 1.4828404188156128} -11/06/2021 23:23:08 - INFO - __main__ - Step 15052: {'lr': 0.0004904677692724664, 'samples': 2889984, 'steps': 15051, 'loss/train': 1.3407013416290283} -11/06/2021 23:23:08 - INFO - __main__ - Step 15053: {'lr': 0.000490466317806433, 'samples': 2890176, 'steps': 15052, 'loss/train': 1.669877290725708} -11/06/2021 23:23:09 - INFO - __main__ - Step 15054: {'lr': 0.0004904648662320493, 'samples': 2890368, 'steps': 15053, 'loss/train': 1.7544317245483398} -11/06/2021 23:23:10 - INFO - __main__ - Step 15055: {'lr': 0.0004904634145493159, 'samples': 2890560, 'steps': 15054, 'loss/train': 1.4797533750534058} -11/06/2021 23:23:10 - INFO - __main__ - Step 15056: {'lr': 0.0004904619627582332, 'samples': 2890752, 'steps': 15055, 'loss/train': 1.6231729984283447} -11/06/2021 23:23:11 - INFO - __main__ - Step 15057: {'lr': 0.0004904605108588023, 'samples': 2890944, 'steps': 15056, 'loss/train': 1.5444527864456177} -11/06/2021 23:23:11 - INFO - __main__ - Step 15058: {'lr': 0.0004904590588510234, 'samples': 2891136, 'steps': 15057, 'loss/train': 2.30820631980896} -11/06/2021 23:23:11 - INFO - __main__ - Step 15059: {'lr': 0.0004904576067348975, 'samples': 2891328, 'steps': 15058, 'loss/train': 2.174032688140869} -11/06/2021 23:23:12 - INFO - __main__ - Step 15060: {'lr': 0.000490456154510425, 'samples': 2891520, 'steps': 15059, 'loss/train': 1.4963994026184082} -11/06/2021 23:23:13 - INFO - __main__ - Step 15061: {'lr': 0.0004904547021776067, 'samples': 2891712, 'steps': 15060, 'loss/train': 1.3455215692520142} -11/06/2021 23:23:13 - INFO - __main__ - Step 15062: {'lr': 0.0004904532497364432, 'samples': 2891904, 'steps': 15061, 'loss/train': 1.4568783044815063} -11/06/2021 23:23:13 - INFO - __main__ - Step 15063: {'lr': 0.0004904517971869352, 'samples': 2892096, 'steps': 15062, 'loss/train': 1.2581560611724854} -11/06/2021 23:23:14 - INFO - __main__ - Step 15064: {'lr': 0.0004904503445290833, 'samples': 2892288, 'steps': 15063, 'loss/train': 1.4970574378967285} -11/06/2021 23:23:15 - INFO - __main__ - Step 15065: {'lr': 0.0004904488917628882, 'samples': 2892480, 'steps': 15064, 'loss/train': 1.9729082584381104} -11/06/2021 23:23:15 - INFO - __main__ - Step 15066: {'lr': 0.0004904474388883507, 'samples': 2892672, 'steps': 15065, 'loss/train': 1.9454787969589233} -11/06/2021 23:23:15 - INFO - __main__ - Step 15067: {'lr': 0.000490445985905471, 'samples': 2892864, 'steps': 15066, 'loss/train': 1.946716547012329} -11/06/2021 23:23:16 - INFO - __main__ - Step 15068: {'lr': 0.0004904445328142503, 'samples': 2893056, 'steps': 15067, 'loss/train': 1.4555275440216064} -11/06/2021 23:23:16 - INFO - __main__ - Step 15069: {'lr': 0.0004904430796146889, 'samples': 2893248, 'steps': 15068, 'loss/train': 1.6384254693984985} -11/06/2021 23:23:17 - INFO - __main__ - Step 15070: {'lr': 0.0004904416263067876, 'samples': 2893440, 'steps': 15069, 'loss/train': 1.866790533065796} -11/06/2021 23:23:18 - INFO - __main__ - Step 15071: {'lr': 0.0004904401728905469, 'samples': 2893632, 'steps': 15070, 'loss/train': 1.6796128749847412} -11/06/2021 23:23:18 - INFO - __main__ - Step 15072: {'lr': 0.0004904387193659677, 'samples': 2893824, 'steps': 15071, 'loss/train': 1.5711565017700195} -11/06/2021 23:23:18 - INFO - __main__ - Step 15073: {'lr': 0.0004904372657330504, 'samples': 2894016, 'steps': 15072, 'loss/train': 1.440606713294983} -11/06/2021 23:23:19 - INFO - __main__ - Step 15074: {'lr': 0.0004904358119917959, 'samples': 2894208, 'steps': 15073, 'loss/train': 2.0183684825897217} -11/06/2021 23:23:20 - INFO - __main__ - Step 15075: {'lr': 0.0004904343581422047, 'samples': 2894400, 'steps': 15074, 'loss/train': 1.6127521991729736} -11/06/2021 23:23:20 - INFO - __main__ - Step 15076: {'lr': 0.0004904329041842774, 'samples': 2894592, 'steps': 15075, 'loss/train': 1.8341926336288452} -11/06/2021 23:23:20 - INFO - __main__ - Step 15077: {'lr': 0.0004904314501180148, 'samples': 2894784, 'steps': 15076, 'loss/train': 1.8274245262145996} -11/06/2021 23:23:21 - INFO - __main__ - Step 15078: {'lr': 0.0004904299959434175, 'samples': 2894976, 'steps': 15077, 'loss/train': 1.727868676185608} -11/06/2021 23:23:21 - INFO - __main__ - Step 15079: {'lr': 0.0004904285416604862, 'samples': 2895168, 'steps': 15078, 'loss/train': 1.6105992794036865} -11/06/2021 23:23:21 - INFO - __main__ - Step 15080: {'lr': 0.0004904270872692215, 'samples': 2895360, 'steps': 15079, 'loss/train': 1.6114802360534668} -11/06/2021 23:23:23 - INFO - __main__ - Step 15081: {'lr': 0.0004904256327696241, 'samples': 2895552, 'steps': 15080, 'loss/train': 0.8484119772911072} -11/06/2021 23:23:23 - INFO - __main__ - Step 15082: {'lr': 0.0004904241781616945, 'samples': 2895744, 'steps': 15081, 'loss/train': 1.8067805767059326} -11/06/2021 23:23:24 - INFO - __main__ - Step 15083: {'lr': 0.0004904227234454335, 'samples': 2895936, 'steps': 15082, 'loss/train': 1.6496418714523315} -11/06/2021 23:23:24 - INFO - __main__ - Step 15084: {'lr': 0.0004904212686208418, 'samples': 2896128, 'steps': 15083, 'loss/train': 1.4202336072921753} -11/06/2021 23:23:24 - INFO - __main__ - Step 15085: {'lr': 0.00049041981368792, 'samples': 2896320, 'steps': 15084, 'loss/train': 1.955782175064087} -11/06/2021 23:23:25 - INFO - __main__ - Step 15086: {'lr': 0.0004904183586466686, 'samples': 2896512, 'steps': 15085, 'loss/train': 0.5780248641967773} -11/06/2021 23:23:26 - INFO - __main__ - Step 15087: {'lr': 0.0004904169034970885, 'samples': 2896704, 'steps': 15086, 'loss/train': 1.998367190361023} -11/06/2021 23:23:26 - INFO - __main__ - Step 15088: {'lr': 0.0004904154482391803, 'samples': 2896896, 'steps': 15087, 'loss/train': 2.0256190299987793} -11/06/2021 23:23:26 - INFO - __main__ - Step 15089: {'lr': 0.0004904139928729445, 'samples': 2897088, 'steps': 15088, 'loss/train': 1.4871602058410645} -11/06/2021 23:23:27 - INFO - __main__ - Step 15090: {'lr': 0.0004904125373983819, 'samples': 2897280, 'steps': 15089, 'loss/train': 1.7294107675552368} -11/06/2021 23:23:28 - INFO - __main__ - Step 15091: {'lr': 0.0004904110818154931, 'samples': 2897472, 'steps': 15090, 'loss/train': 1.508729100227356} -11/06/2021 23:23:28 - INFO - __main__ - Step 15092: {'lr': 0.0004904096261242789, 'samples': 2897664, 'steps': 15091, 'loss/train': 1.496836543083191} -11/06/2021 23:23:28 - INFO - __main__ - Step 15093: {'lr': 0.0004904081703247397, 'samples': 2897856, 'steps': 15092, 'loss/train': 1.4800703525543213} -11/06/2021 23:23:29 - INFO - __main__ - Step 15094: {'lr': 0.0004904067144168763, 'samples': 2898048, 'steps': 15093, 'loss/train': 1.7554247379302979} -11/06/2021 23:23:29 - INFO - __main__ - Step 15095: {'lr': 0.0004904052584006895, 'samples': 2898240, 'steps': 15094, 'loss/train': 1.2802367210388184} -11/06/2021 23:23:30 - INFO - __main__ - Step 15096: {'lr': 0.0004904038022761797, 'samples': 2898432, 'steps': 15095, 'loss/train': 2.180551767349243} -11/06/2021 23:23:31 - INFO - __main__ - Step 15097: {'lr': 0.0004904023460433475, 'samples': 2898624, 'steps': 15096, 'loss/train': 1.744247555732727} -11/06/2021 23:23:31 - INFO - __main__ - Step 15098: {'lr': 0.0004904008897021939, 'samples': 2898816, 'steps': 15097, 'loss/train': 1.8757344484329224} -11/06/2021 23:23:31 - INFO - __main__ - Step 15099: {'lr': 0.0004903994332527193, 'samples': 2899008, 'steps': 15098, 'loss/train': 1.5103914737701416} -11/06/2021 23:23:32 - INFO - __main__ - Step 15100: {'lr': 0.0004903979766949244, 'samples': 2899200, 'steps': 15099, 'loss/train': 1.7478224039077759} -11/06/2021 23:23:32 - INFO - __main__ - Step 15101: {'lr': 0.00049039652002881, 'samples': 2899392, 'steps': 15100, 'loss/train': 1.6020162105560303} -11/06/2021 23:23:33 - INFO - __main__ - Step 15102: {'lr': 0.0004903950632543766, 'samples': 2899584, 'steps': 15101, 'loss/train': 1.921471357345581} -11/06/2021 23:23:33 - INFO - __main__ - Step 15103: {'lr': 0.0004903936063716248, 'samples': 2899776, 'steps': 15102, 'loss/train': 1.7595106363296509} -11/06/2021 23:23:34 - INFO - __main__ - Step 15104: {'lr': 0.0004903921493805554, 'samples': 2899968, 'steps': 15103, 'loss/train': 1.4765055179595947} -11/06/2021 23:23:34 - INFO - __main__ - Step 15105: {'lr': 0.000490390692281169, 'samples': 2900160, 'steps': 15104, 'loss/train': 1.2814937829971313} -11/06/2021 23:23:34 - INFO - __main__ - Step 15106: {'lr': 0.0004903892350734663, 'samples': 2900352, 'steps': 15105, 'loss/train': 1.4163860082626343} -11/06/2021 23:23:36 - INFO - __main__ - Step 15107: {'lr': 0.0004903877777574479, 'samples': 2900544, 'steps': 15106, 'loss/train': 1.5000590085983276} -11/06/2021 23:23:36 - INFO - __main__ - Step 15108: {'lr': 0.0004903863203331145, 'samples': 2900736, 'steps': 15107, 'loss/train': 1.54270339012146} -11/06/2021 23:23:36 - INFO - __main__ - Step 15109: {'lr': 0.0004903848628004667, 'samples': 2900928, 'steps': 15108, 'loss/train': 1.929103136062622} -11/06/2021 23:23:37 - INFO - __main__ - Step 15110: {'lr': 0.0004903834051595052, 'samples': 2901120, 'steps': 15109, 'loss/train': 1.6631858348846436} -11/06/2021 23:23:37 - INFO - __main__ - Step 15111: {'lr': 0.0004903819474102306, 'samples': 2901312, 'steps': 15110, 'loss/train': 1.7396637201309204} -11/06/2021 23:23:38 - INFO - __main__ - Step 15112: {'lr': 0.0004903804895526437, 'samples': 2901504, 'steps': 15111, 'loss/train': 1.462821125984192} -11/06/2021 23:23:38 - INFO - __main__ - Step 15113: {'lr': 0.0004903790315867449, 'samples': 2901696, 'steps': 15112, 'loss/train': 1.5667641162872314} -11/06/2021 23:23:39 - INFO - __main__ - Step 15114: {'lr': 0.0004903775735125352, 'samples': 2901888, 'steps': 15113, 'loss/train': 1.7718415260314941} -11/06/2021 23:23:39 - INFO - __main__ - Step 15115: {'lr': 0.0004903761153300149, 'samples': 2902080, 'steps': 15114, 'loss/train': 1.5683375597000122} -11/06/2021 23:23:39 - INFO - __main__ - Step 15116: {'lr': 0.000490374657039185, 'samples': 2902272, 'steps': 15115, 'loss/train': 1.12655770778656} -11/06/2021 23:23:40 - INFO - __main__ - Step 15117: {'lr': 0.0004903731986400459, 'samples': 2902464, 'steps': 15116, 'loss/train': 1.7532262802124023} -11/06/2021 23:23:41 - INFO - __main__ - Step 15118: {'lr': 0.0004903717401325983, 'samples': 2902656, 'steps': 15117, 'loss/train': 1.716330885887146} -11/06/2021 23:23:41 - INFO - __main__ - Step 15119: {'lr': 0.000490370281516843, 'samples': 2902848, 'steps': 15118, 'loss/train': 1.9191677570343018} -11/06/2021 23:23:42 - INFO - __main__ - Step 15120: {'lr': 0.0004903688227927806, 'samples': 2903040, 'steps': 15119, 'loss/train': 2.0227084159851074} -11/06/2021 23:23:42 - INFO - __main__ - Step 15121: {'lr': 0.0004903673639604116, 'samples': 2903232, 'steps': 15120, 'loss/train': 1.3265833854675293} -11/06/2021 23:23:43 - INFO - __main__ - Step 15122: {'lr': 0.0004903659050197369, 'samples': 2903424, 'steps': 15121, 'loss/train': 1.751603364944458} -11/06/2021 23:23:43 - INFO - __main__ - Step 15123: {'lr': 0.0004903644459707569, 'samples': 2903616, 'steps': 15122, 'loss/train': 1.6488754749298096} -11/06/2021 23:23:44 - INFO - __main__ - Step 15124: {'lr': 0.0004903629868134725, 'samples': 2903808, 'steps': 15123, 'loss/train': 1.1973127126693726} -11/06/2021 23:23:44 - INFO - __main__ - Step 15125: {'lr': 0.0004903615275478841, 'samples': 2904000, 'steps': 15124, 'loss/train': 1.4743258953094482} -11/06/2021 23:23:44 - INFO - __main__ - Step 15126: {'lr': 0.0004903600681739926, 'samples': 2904192, 'steps': 15125, 'loss/train': 1.5869134664535522} -11/06/2021 23:23:45 - INFO - __main__ - Step 15127: {'lr': 0.0004903586086917986, 'samples': 2904384, 'steps': 15126, 'loss/train': 1.4058135747909546} -11/06/2021 23:23:46 - INFO - __main__ - Step 15128: {'lr': 0.0004903571491013027, 'samples': 2904576, 'steps': 15127, 'loss/train': 0.8983421325683594} -11/06/2021 23:23:46 - INFO - __main__ - Step 15129: {'lr': 0.0004903556894025055, 'samples': 2904768, 'steps': 15128, 'loss/train': 1.5951757431030273} -11/06/2021 23:23:46 - INFO - __main__ - Step 15130: {'lr': 0.0004903542295954077, 'samples': 2904960, 'steps': 15129, 'loss/train': 1.553074836730957} -11/06/2021 23:23:47 - INFO - __main__ - Step 15131: {'lr': 0.0004903527696800102, 'samples': 2905152, 'steps': 15130, 'loss/train': 1.154365062713623} -11/06/2021 23:23:47 - INFO - __main__ - Step 15132: {'lr': 0.0004903513096563133, 'samples': 2905344, 'steps': 15131, 'loss/train': 1.9353693723678589} -11/06/2021 23:23:48 - INFO - __main__ - Step 15133: {'lr': 0.0004903498495243178, 'samples': 2905536, 'steps': 15132, 'loss/train': 2.002183675765991} -11/06/2021 23:23:49 - INFO - __main__ - Step 15134: {'lr': 0.0004903483892840244, 'samples': 2905728, 'steps': 15133, 'loss/train': 1.6886216402053833} -11/06/2021 23:23:49 - INFO - __main__ - Step 15135: {'lr': 0.0004903469289354338, 'samples': 2905920, 'steps': 15134, 'loss/train': 1.5800846815109253} -11/06/2021 23:23:49 - INFO - __main__ - Step 15136: {'lr': 0.0004903454684785465, 'samples': 2906112, 'steps': 15135, 'loss/train': 1.4386088848114014} -11/06/2021 23:23:50 - INFO - __main__ - Step 15137: {'lr': 0.0004903440079133633, 'samples': 2906304, 'steps': 15136, 'loss/train': 1.7239024639129639} -11/06/2021 23:23:51 - INFO - __main__ - Step 15138: {'lr': 0.0004903425472398846, 'samples': 2906496, 'steps': 15137, 'loss/train': 1.53848135471344} -11/06/2021 23:23:51 - INFO - __main__ - Step 15139: {'lr': 0.0004903410864581115, 'samples': 2906688, 'steps': 15138, 'loss/train': 2.4064629077911377} -11/06/2021 23:23:52 - INFO - __main__ - Step 15140: {'lr': 0.0004903396255680443, 'samples': 2906880, 'steps': 15139, 'loss/train': 1.433778166770935} -11/06/2021 23:23:52 - INFO - __main__ - Step 15141: {'lr': 0.0004903381645696838, 'samples': 2907072, 'steps': 15140, 'loss/train': 1.3583641052246094} -11/06/2021 23:23:52 - INFO - __main__ - Step 15142: {'lr': 0.0004903367034630307, 'samples': 2907264, 'steps': 15141, 'loss/train': 2.072575092315674} -11/06/2021 23:23:53 - INFO - __main__ - Step 15143: {'lr': 0.0004903352422480855, 'samples': 2907456, 'steps': 15142, 'loss/train': 1.4871820211410522} -11/06/2021 23:23:54 - INFO - __main__ - Step 15144: {'lr': 0.000490333780924849, 'samples': 2907648, 'steps': 15143, 'loss/train': 2.0281856060028076} -11/06/2021 23:23:54 - INFO - __main__ - Step 15145: {'lr': 0.0004903323194933218, 'samples': 2907840, 'steps': 15144, 'loss/train': 1.3873077630996704} -11/06/2021 23:23:54 - INFO - __main__ - Step 15146: {'lr': 0.0004903308579535045, 'samples': 2908032, 'steps': 15145, 'loss/train': 1.6294296979904175} -11/06/2021 23:23:55 - INFO - __main__ - Step 15147: {'lr': 0.0004903293963053979, 'samples': 2908224, 'steps': 15146, 'loss/train': 1.5592012405395508} -11/06/2021 23:23:56 - INFO - __main__ - Step 15148: {'lr': 0.0004903279345490026, 'samples': 2908416, 'steps': 15147, 'loss/train': 1.804236650466919} -11/06/2021 23:23:56 - INFO - __main__ - Step 15149: {'lr': 0.0004903264726843191, 'samples': 2908608, 'steps': 15148, 'loss/train': 1.6943762302398682} -11/06/2021 23:23:57 - INFO - __main__ - Step 15150: {'lr': 0.0004903250107113483, 'samples': 2908800, 'steps': 15149, 'loss/train': 1.375742793083191} -11/06/2021 23:23:57 - INFO - __main__ - Step 15151: {'lr': 0.0004903235486300908, 'samples': 2908992, 'steps': 15150, 'loss/train': 1.674008846282959} -11/06/2021 23:23:57 - INFO - __main__ - Step 15152: {'lr': 0.0004903220864405471, 'samples': 2909184, 'steps': 15151, 'loss/train': 1.1988589763641357} -11/06/2021 23:23:58 - INFO - __main__ - Step 15153: {'lr': 0.000490320624142718, 'samples': 2909376, 'steps': 15152, 'loss/train': 1.791925072669983} -11/06/2021 23:23:59 - INFO - __main__ - Step 15154: {'lr': 0.0004903191617366043, 'samples': 2909568, 'steps': 15153, 'loss/train': 1.7116177082061768} -11/06/2021 23:23:59 - INFO - __main__ - Step 15155: {'lr': 0.0004903176992222063, 'samples': 2909760, 'steps': 15154, 'loss/train': 1.5216213464736938} -11/06/2021 23:23:59 - INFO - __main__ - Step 15156: {'lr': 0.000490316236599525, 'samples': 2909952, 'steps': 15155, 'loss/train': 1.7094593048095703} -11/06/2021 23:24:00 - INFO - __main__ - Step 15157: {'lr': 0.0004903147738685609, 'samples': 2910144, 'steps': 15156, 'loss/train': 1.712797999382019} -11/06/2021 23:24:00 - INFO - __main__ - Step 15158: {'lr': 0.0004903133110293145, 'samples': 2910336, 'steps': 15157, 'loss/train': 0.5006943941116333} -11/06/2021 23:24:01 - INFO - __main__ - Step 15159: {'lr': 0.0004903118480817868, 'samples': 2910528, 'steps': 15158, 'loss/train': 1.5716854333877563} -11/06/2021 23:24:01 - INFO - __main__ - Step 15160: {'lr': 0.0004903103850259781, 'samples': 2910720, 'steps': 15159, 'loss/train': 1.470730185508728} -11/06/2021 23:24:02 - INFO - __main__ - Step 15161: {'lr': 0.0004903089218618895, 'samples': 2910912, 'steps': 15160, 'loss/train': 1.3954046964645386} -11/06/2021 23:24:02 - INFO - __main__ - Step 15162: {'lr': 0.0004903074585895212, 'samples': 2911104, 'steps': 15161, 'loss/train': 1.755196213722229} -11/06/2021 23:24:02 - INFO - __main__ - Step 15163: {'lr': 0.0004903059952088742, 'samples': 2911296, 'steps': 15162, 'loss/train': 1.6570621728897095} -11/06/2021 23:24:03 - INFO - __main__ - Step 15164: {'lr': 0.0004903045317199489, 'samples': 2911488, 'steps': 15163, 'loss/train': 1.5844322443008423} -11/06/2021 23:24:04 - INFO - __main__ - Step 15165: {'lr': 0.0004903030681227463, 'samples': 2911680, 'steps': 15164, 'loss/train': 1.630523681640625} -11/06/2021 23:24:04 - INFO - __main__ - Step 15166: {'lr': 0.0004903016044172666, 'samples': 2911872, 'steps': 15165, 'loss/train': 1.6046708822250366} -11/06/2021 23:24:04 - INFO - __main__ - Step 15167: {'lr': 0.0004903001406035109, 'samples': 2912064, 'steps': 15166, 'loss/train': 1.7047207355499268} -11/06/2021 23:24:05 - INFO - __main__ - Step 15168: {'lr': 0.0004902986766814795, 'samples': 2912256, 'steps': 15167, 'loss/train': 1.479922890663147} -11/06/2021 23:24:06 - INFO - __main__ - Step 15169: {'lr': 0.0004902972126511734, 'samples': 2912448, 'steps': 15168, 'loss/train': 1.8230383396148682} -11/06/2021 23:24:06 - INFO - __main__ - Step 15170: {'lr': 0.0004902957485125929, 'samples': 2912640, 'steps': 15169, 'loss/train': 1.3802613019943237} -11/06/2021 23:24:07 - INFO - __main__ - Step 15171: {'lr': 0.0004902942842657389, 'samples': 2912832, 'steps': 15170, 'loss/train': 1.3913418054580688} -11/06/2021 23:24:07 - INFO - __main__ - Step 15172: {'lr': 0.0004902928199106121, 'samples': 2913024, 'steps': 15171, 'loss/train': 1.4685401916503906} -11/06/2021 23:24:07 - INFO - __main__ - Step 15173: {'lr': 0.000490291355447213, 'samples': 2913216, 'steps': 15172, 'loss/train': 1.9173450469970703} -11/06/2021 23:24:08 - INFO - __main__ - Step 15174: {'lr': 0.0004902898908755424, 'samples': 2913408, 'steps': 15173, 'loss/train': 3.7974798679351807} -11/06/2021 23:24:09 - INFO - __main__ - Step 15175: {'lr': 0.0004902884261956007, 'samples': 2913600, 'steps': 15174, 'loss/train': 1.4008654356002808} -11/06/2021 23:24:09 - INFO - __main__ - Step 15176: {'lr': 0.0004902869614073889, 'samples': 2913792, 'steps': 15175, 'loss/train': 1.5890427827835083} -11/06/2021 23:24:09 - INFO - __main__ - Step 15177: {'lr': 0.0004902854965109074, 'samples': 2913984, 'steps': 15176, 'loss/train': 1.566736102104187} -11/06/2021 23:24:10 - INFO - __main__ - Step 15178: {'lr': 0.0004902840315061571, 'samples': 2914176, 'steps': 15177, 'loss/train': 1.907994270324707} -11/06/2021 23:24:10 - INFO - __main__ - Step 15179: {'lr': 0.0004902825663931384, 'samples': 2914368, 'steps': 15178, 'loss/train': 1.6074315309524536} -11/06/2021 23:24:11 - INFO - __main__ - Step 15180: {'lr': 0.0004902811011718521, 'samples': 2914560, 'steps': 15179, 'loss/train': 1.366045355796814} -11/06/2021 23:24:12 - INFO - __main__ - Step 15181: {'lr': 0.0004902796358422989, 'samples': 2914752, 'steps': 15180, 'loss/train': 1.674401044845581} -11/06/2021 23:24:12 - INFO - __main__ - Step 15182: {'lr': 0.0004902781704044793, 'samples': 2914944, 'steps': 15181, 'loss/train': 1.410227656364441} -11/06/2021 23:24:12 - INFO - __main__ - Step 15183: {'lr': 0.0004902767048583942, 'samples': 2915136, 'steps': 15182, 'loss/train': 1.924155354499817} -11/06/2021 23:24:13 - INFO - __main__ - Step 15184: {'lr': 0.000490275239204044, 'samples': 2915328, 'steps': 15183, 'loss/train': 1.9920772314071655} -11/06/2021 23:24:14 - INFO - __main__ - Step 15185: {'lr': 0.0004902737734414296, 'samples': 2915520, 'steps': 15184, 'loss/train': 1.6780331134796143} -11/06/2021 23:24:14 - INFO - __main__ - Step 15186: {'lr': 0.0004902723075705514, 'samples': 2915712, 'steps': 15185, 'loss/train': 1.4955074787139893} -11/06/2021 23:24:14 - INFO - __main__ - Step 15187: {'lr': 0.0004902708415914103, 'samples': 2915904, 'steps': 15186, 'loss/train': 1.7642159461975098} -11/06/2021 23:24:15 - INFO - __main__ - Step 15188: {'lr': 0.0004902693755040069, 'samples': 2916096, 'steps': 15187, 'loss/train': 1.1258271932601929} -11/06/2021 23:24:15 - INFO - __main__ - Step 15189: {'lr': 0.0004902679093083418, 'samples': 2916288, 'steps': 15188, 'loss/train': 1.6583342552185059} -11/06/2021 23:24:16 - INFO - __main__ - Step 15190: {'lr': 0.0004902664430044156, 'samples': 2916480, 'steps': 15189, 'loss/train': 1.885223388671875} -11/06/2021 23:24:16 - INFO - __main__ - Step 15191: {'lr': 0.0004902649765922292, 'samples': 2916672, 'steps': 15190, 'loss/train': 1.5591681003570557} -11/06/2021 23:24:17 - INFO - __main__ - Step 15192: {'lr': 0.0004902635100717831, 'samples': 2916864, 'steps': 15191, 'loss/train': 1.050796627998352} -11/06/2021 23:24:17 - INFO - __main__ - Step 15193: {'lr': 0.0004902620434430778, 'samples': 2917056, 'steps': 15192, 'loss/train': 0.23766328394412994} -11/06/2021 23:24:17 - INFO - __main__ - Step 15194: {'lr': 0.0004902605767061142, 'samples': 2917248, 'steps': 15193, 'loss/train': 1.7011011838912964} -11/06/2021 23:24:19 - INFO - __main__ - Step 15195: {'lr': 0.000490259109860893, 'samples': 2917440, 'steps': 15194, 'loss/train': 1.8796442747116089} -11/06/2021 23:24:20 - INFO - __main__ - Step 15196: {'lr': 0.0004902576429074146, 'samples': 2917632, 'steps': 15195, 'loss/train': 1.5257242918014526} -11/06/2021 23:24:20 - INFO - __main__ - Step 15197: {'lr': 0.0004902561758456799, 'samples': 2917824, 'steps': 15196, 'loss/train': 1.9276056289672852} -11/06/2021 23:24:20 - INFO - __main__ - Step 15198: {'lr': 0.0004902547086756895, 'samples': 2918016, 'steps': 15197, 'loss/train': 1.3162223100662231} -11/06/2021 23:24:21 - INFO - __main__ - Step 15199: {'lr': 0.000490253241397444, 'samples': 2918208, 'steps': 15198, 'loss/train': 1.277166724205017} -11/06/2021 23:24:21 - INFO - __main__ - Step 15200: {'lr': 0.0004902517740109441, 'samples': 2918400, 'steps': 15199, 'loss/train': 1.857283592224121} -11/06/2021 23:24:22 - INFO - __main__ - Step 15201: {'lr': 0.0004902503065161905, 'samples': 2918592, 'steps': 15200, 'loss/train': 2.3311972618103027} -11/06/2021 23:24:23 - INFO - __main__ - Step 15202: {'lr': 0.0004902488389131837, 'samples': 2918784, 'steps': 15201, 'loss/train': 1.7067315578460693} -11/06/2021 23:24:23 - INFO - __main__ - Step 15203: {'lr': 0.0004902473712019246, 'samples': 2918976, 'steps': 15202, 'loss/train': 1.788569450378418} -11/06/2021 23:24:23 - INFO - __main__ - Step 15204: {'lr': 0.0004902459033824137, 'samples': 2919168, 'steps': 15203, 'loss/train': 1.7561739683151245} -11/06/2021 23:24:24 - INFO - __main__ - Step 15205: {'lr': 0.0004902444354546516, 'samples': 2919360, 'steps': 15204, 'loss/train': 1.9418166875839233} -11/06/2021 23:24:24 - INFO - __main__ - Step 15206: {'lr': 0.0004902429674186392, 'samples': 2919552, 'steps': 15205, 'loss/train': 1.4655617475509644} -11/06/2021 23:24:25 - INFO - __main__ - Step 15207: {'lr': 0.000490241499274377, 'samples': 2919744, 'steps': 15206, 'loss/train': 1.264890193939209} -11/06/2021 23:24:26 - INFO - __main__ - Step 15208: {'lr': 0.0004902400310218657, 'samples': 2919936, 'steps': 15207, 'loss/train': 1.5054603815078735} -11/06/2021 23:24:26 - INFO - __main__ - Step 15209: {'lr': 0.0004902385626611059, 'samples': 2920128, 'steps': 15208, 'loss/train': 1.2494571208953857} -11/06/2021 23:24:26 - INFO - __main__ - Step 15210: {'lr': 0.0004902370941920984, 'samples': 2920320, 'steps': 15209, 'loss/train': 1.8583664894104004} -11/06/2021 23:24:27 - INFO - __main__ - Step 15211: {'lr': 0.0004902356256148437, 'samples': 2920512, 'steps': 15210, 'loss/train': 1.6945366859436035} -11/06/2021 23:24:27 - INFO - __main__ - Step 15212: {'lr': 0.0004902341569293425, 'samples': 2920704, 'steps': 15211, 'loss/train': 1.7645387649536133} -11/06/2021 23:24:28 - INFO - __main__ - Step 15213: {'lr': 0.0004902326881355955, 'samples': 2920896, 'steps': 15212, 'loss/train': 1.8450555801391602} -11/06/2021 23:24:28 - INFO - __main__ - Step 15214: {'lr': 0.0004902312192336034, 'samples': 2921088, 'steps': 15213, 'loss/train': 2.3038129806518555} -11/06/2021 23:24:29 - INFO - __main__ - Step 15215: {'lr': 0.000490229750223367, 'samples': 2921280, 'steps': 15214, 'loss/train': 0.8343202471733093} -11/06/2021 23:24:29 - INFO - __main__ - Step 15216: {'lr': 0.0004902282811048864, 'samples': 2921472, 'steps': 15215, 'loss/train': 1.9115432500839233} -11/06/2021 23:24:29 - INFO - __main__ - Step 15217: {'lr': 0.000490226811878163, 'samples': 2921664, 'steps': 15216, 'loss/train': 1.8696986436843872} -11/06/2021 23:24:30 - INFO - __main__ - Step 15218: {'lr': 0.0004902253425431969, 'samples': 2921856, 'steps': 15217, 'loss/train': 1.5307645797729492} -11/06/2021 23:24:31 - INFO - __main__ - Step 15219: {'lr': 0.000490223873099989, 'samples': 2922048, 'steps': 15218, 'loss/train': 1.9581738710403442} -11/06/2021 23:24:31 - INFO - __main__ - Step 15220: {'lr': 0.00049022240354854, 'samples': 2922240, 'steps': 15219, 'loss/train': 3.2477519512176514} -11/06/2021 23:24:32 - INFO - __main__ - Step 15221: {'lr': 0.0004902209338888503, 'samples': 2922432, 'steps': 15220, 'loss/train': 2.0752274990081787} -11/06/2021 23:24:32 - INFO - __main__ - Step 15222: {'lr': 0.000490219464120921, 'samples': 2922624, 'steps': 15221, 'loss/train': 1.8632875680923462} -11/06/2021 23:24:33 - INFO - __main__ - Step 15223: {'lr': 0.0004902179942447524, 'samples': 2922816, 'steps': 15222, 'loss/train': 1.554335117340088} -11/06/2021 23:24:33 - INFO - __main__ - Step 15224: {'lr': 0.0004902165242603452, 'samples': 2923008, 'steps': 15223, 'loss/train': 1.9520310163497925} -11/06/2021 23:24:34 - INFO - __main__ - Step 15225: {'lr': 0.0004902150541677003, 'samples': 2923200, 'steps': 15224, 'loss/train': 2.0851187705993652} -11/06/2021 23:24:34 - INFO - __main__ - Step 15226: {'lr': 0.0004902135839668181, 'samples': 2923392, 'steps': 15225, 'loss/train': 2.010134220123291} -11/06/2021 23:24:34 - INFO - __main__ - Step 15227: {'lr': 0.0004902121136576994, 'samples': 2923584, 'steps': 15226, 'loss/train': 1.7734330892562866} -11/06/2021 23:24:35 - INFO - __main__ - Step 15228: {'lr': 0.0004902106432403448, 'samples': 2923776, 'steps': 15227, 'loss/train': 1.354243516921997} -11/06/2021 23:24:36 - INFO - __main__ - Step 15229: {'lr': 0.0004902091727147551, 'samples': 2923968, 'steps': 15228, 'loss/train': 1.7039768695831299} -11/06/2021 23:24:36 - INFO - __main__ - Step 15230: {'lr': 0.0004902077020809307, 'samples': 2924160, 'steps': 15229, 'loss/train': 1.8697679042816162} -11/06/2021 23:24:36 - INFO - __main__ - Step 15231: {'lr': 0.0004902062313388725, 'samples': 2924352, 'steps': 15230, 'loss/train': 1.9331737756729126} -11/06/2021 23:24:37 - INFO - __main__ - Step 15232: {'lr': 0.0004902047604885811, 'samples': 2924544, 'steps': 15231, 'loss/train': 1.9354302883148193} -11/06/2021 23:24:37 - INFO - __main__ - Step 15233: {'lr': 0.0004902032895300571, 'samples': 2924736, 'steps': 15232, 'loss/train': 1.3947269916534424} -11/06/2021 23:24:38 - INFO - __main__ - Step 15234: {'lr': 0.0004902018184633012, 'samples': 2924928, 'steps': 15233, 'loss/train': 1.6846981048583984} -11/06/2021 23:24:39 - INFO - __main__ - Step 15235: {'lr': 0.0004902003472883141, 'samples': 2925120, 'steps': 15234, 'loss/train': 1.5643565654754639} -11/06/2021 23:24:39 - INFO - __main__ - Step 15236: {'lr': 0.0004901988760050964, 'samples': 2925312, 'steps': 15235, 'loss/train': 1.710155963897705} -11/06/2021 23:24:39 - INFO - __main__ - Step 15237: {'lr': 0.0004901974046136488, 'samples': 2925504, 'steps': 15236, 'loss/train': 1.4140377044677734} -11/06/2021 23:24:40 - INFO - __main__ - Step 15238: {'lr': 0.000490195933113972, 'samples': 2925696, 'steps': 15237, 'loss/train': 1.148417353630066} -11/06/2021 23:24:41 - INFO - __main__ - Step 15239: {'lr': 0.0004901944615060665, 'samples': 2925888, 'steps': 15238, 'loss/train': 1.7428512573242188} -11/06/2021 23:24:41 - INFO - __main__ - Step 15240: {'lr': 0.0004901929897899331, 'samples': 2926080, 'steps': 15239, 'loss/train': 1.6310620307922363} -11/06/2021 23:24:41 - INFO - __main__ - Step 15241: {'lr': 0.0004901915179655726, 'samples': 2926272, 'steps': 15240, 'loss/train': 1.1041312217712402} -11/06/2021 23:24:42 - INFO - __main__ - Step 15242: {'lr': 0.0004901900460329853, 'samples': 2926464, 'steps': 15241, 'loss/train': 1.5519336462020874} -11/06/2021 23:24:42 - INFO - __main__ - Step 15243: {'lr': 0.0004901885739921723, 'samples': 2926656, 'steps': 15242, 'loss/train': 2.025369644165039} -11/06/2021 23:24:43 - INFO - __main__ - Step 15244: {'lr': 0.0004901871018431339, 'samples': 2926848, 'steps': 15243, 'loss/train': 1.429811716079712} -11/06/2021 23:24:43 - INFO - __main__ - Step 15245: {'lr': 0.0004901856295858708, 'samples': 2927040, 'steps': 15244, 'loss/train': 1.7202751636505127} -11/06/2021 23:24:44 - INFO - __main__ - Step 15246: {'lr': 0.0004901841572203839, 'samples': 2927232, 'steps': 15245, 'loss/train': 1.7216240167617798} -11/06/2021 23:24:44 - INFO - __main__ - Step 15247: {'lr': 0.0004901826847466738, 'samples': 2927424, 'steps': 15246, 'loss/train': 1.255531668663025} -11/06/2021 23:24:44 - INFO - __main__ - Step 15248: {'lr': 0.000490181212164741, 'samples': 2927616, 'steps': 15247, 'loss/train': 2.0545222759246826} -11/06/2021 23:24:46 - INFO - __main__ - Step 15249: {'lr': 0.0004901797394745861, 'samples': 2927808, 'steps': 15248, 'loss/train': 1.667556643486023} -11/06/2021 23:24:46 - INFO - __main__ - Step 15250: {'lr': 0.0004901782666762102, 'samples': 2928000, 'steps': 15249, 'loss/train': 1.852941870689392} -11/06/2021 23:24:46 - INFO - __main__ - Step 15251: {'lr': 0.0004901767937696135, 'samples': 2928192, 'steps': 15250, 'loss/train': 2.0363755226135254} -11/06/2021 23:24:47 - INFO - __main__ - Step 15252: {'lr': 0.0004901753207547969, 'samples': 2928384, 'steps': 15251, 'loss/train': 1.3573280572891235} -11/06/2021 23:24:47 - INFO - __main__ - Step 15253: {'lr': 0.000490173847631761, 'samples': 2928576, 'steps': 15252, 'loss/train': 1.8147984743118286} -11/06/2021 23:24:47 - INFO - __main__ - Step 15254: {'lr': 0.0004901723744005065, 'samples': 2928768, 'steps': 15253, 'loss/train': 1.7918343544006348} -11/06/2021 23:24:48 - INFO - __main__ - Step 15255: {'lr': 0.0004901709010610339, 'samples': 2928960, 'steps': 15254, 'loss/train': 1.5869040489196777} -11/06/2021 23:24:49 - INFO - __main__ - Step 15256: {'lr': 0.0004901694276133441, 'samples': 2929152, 'steps': 15255, 'loss/train': 1.790469765663147} -11/06/2021 23:24:49 - INFO - __main__ - Step 15257: {'lr': 0.0004901679540574377, 'samples': 2929344, 'steps': 15256, 'loss/train': 1.7606391906738281} -11/06/2021 23:24:49 - INFO - __main__ - Step 15258: {'lr': 0.0004901664803933153, 'samples': 2929536, 'steps': 15257, 'loss/train': 1.265826940536499} -11/06/2021 23:24:50 - INFO - __main__ - Step 15259: {'lr': 0.0004901650066209775, 'samples': 2929728, 'steps': 15258, 'loss/train': 1.744316577911377} -11/06/2021 23:24:51 - INFO - __main__ - Step 15260: {'lr': 0.0004901635327404252, 'samples': 2929920, 'steps': 15259, 'loss/train': 1.8547157049179077} -11/06/2021 23:24:51 - INFO - __main__ - Step 15261: {'lr': 0.0004901620587516587, 'samples': 2930112, 'steps': 15260, 'loss/train': 1.576607346534729} -11/06/2021 23:24:52 - INFO - __main__ - Step 15262: {'lr': 0.0004901605846546791, 'samples': 2930304, 'steps': 15261, 'loss/train': 1.0735132694244385} -11/06/2021 23:24:52 - INFO - __main__ - Step 15263: {'lr': 0.0004901591104494868, 'samples': 2930496, 'steps': 15262, 'loss/train': 2.1972012519836426} -11/06/2021 23:24:52 - INFO - __main__ - Step 15264: {'lr': 0.0004901576361360825, 'samples': 2930688, 'steps': 15263, 'loss/train': 1.0414632558822632} -11/06/2021 23:24:54 - INFO - __main__ - Step 15265: {'lr': 0.0004901561617144667, 'samples': 2930880, 'steps': 15264, 'loss/train': 1.8631575107574463} -11/06/2021 23:24:54 - INFO - __main__ - Step 15266: {'lr': 0.0004901546871846405, 'samples': 2931072, 'steps': 15265, 'loss/train': 0.9033583402633667} -11/06/2021 23:24:54 - INFO - __main__ - Step 15267: {'lr': 0.0004901532125466041, 'samples': 2931264, 'steps': 15266, 'loss/train': 1.4277762174606323} -11/06/2021 23:24:55 - INFO - __main__ - Step 15268: {'lr': 0.0004901517378003584, 'samples': 2931456, 'steps': 15267, 'loss/train': 0.7227610349655151} -11/06/2021 23:24:55 - INFO - __main__ - Step 15269: {'lr': 0.0004901502629459042, 'samples': 2931648, 'steps': 15268, 'loss/train': 0.25619640946388245} -11/06/2021 23:24:56 - INFO - __main__ - Step 15270: {'lr': 0.000490148787983242, 'samples': 2931840, 'steps': 15269, 'loss/train': 1.9297094345092773} -11/06/2021 23:24:56 - INFO - __main__ - Step 15271: {'lr': 0.0004901473129123723, 'samples': 2932032, 'steps': 15270, 'loss/train': 1.359814167022705} -11/06/2021 23:24:57 - INFO - __main__ - Step 15272: {'lr': 0.0004901458377332959, 'samples': 2932224, 'steps': 15271, 'loss/train': 1.641144037246704} -11/06/2021 23:24:57 - INFO - __main__ - Step 15273: {'lr': 0.0004901443624460136, 'samples': 2932416, 'steps': 15272, 'loss/train': 1.692050576210022} -11/06/2021 23:24:57 - INFO - __main__ - Step 15274: {'lr': 0.000490142887050526, 'samples': 2932608, 'steps': 15273, 'loss/train': 0.9697434902191162} -11/06/2021 23:24:59 - INFO - __main__ - Step 15275: {'lr': 0.0004901414115468335, 'samples': 2932800, 'steps': 15274, 'loss/train': 1.5721526145935059} -11/06/2021 23:24:59 - INFO - __main__ - Step 15276: {'lr': 0.0004901399359349372, 'samples': 2932992, 'steps': 15275, 'loss/train': 1.9338434934616089} -11/06/2021 23:24:59 - INFO - __main__ - Step 15277: {'lr': 0.0004901384602148376, 'samples': 2933184, 'steps': 15276, 'loss/train': 1.4072198867797852} -11/06/2021 23:25:00 - INFO - __main__ - Step 15278: {'lr': 0.0004901369843865351, 'samples': 2933376, 'steps': 15277, 'loss/train': 1.9054416418075562} -11/06/2021 23:25:00 - INFO - __main__ - Step 15279: {'lr': 0.0004901355084500307, 'samples': 2933568, 'steps': 15278, 'loss/train': 1.816591501235962} -11/06/2021 23:25:00 - INFO - __main__ - Step 15280: {'lr': 0.000490134032405325, 'samples': 2933760, 'steps': 15279, 'loss/train': 1.780461311340332} -11/06/2021 23:25:01 - INFO - __main__ - Step 15281: {'lr': 0.0004901325562524185, 'samples': 2933952, 'steps': 15280, 'loss/train': 0.4465474784374237} -11/06/2021 23:25:02 - INFO - __main__ - Step 15282: {'lr': 0.0004901310799913121, 'samples': 2934144, 'steps': 15281, 'loss/train': 1.4008394479751587} -11/06/2021 23:25:02 - INFO - __main__ - Step 15283: {'lr': 0.0004901296036220062, 'samples': 2934336, 'steps': 15282, 'loss/train': 1.2545615434646606} -11/06/2021 23:25:03 - INFO - __main__ - Step 15284: {'lr': 0.0004901281271445016, 'samples': 2934528, 'steps': 15283, 'loss/train': 1.5060338973999023} -11/06/2021 23:25:03 - INFO - __main__ - Step 15285: {'lr': 0.000490126650558799, 'samples': 2934720, 'steps': 15284, 'loss/train': 1.5489078760147095} -11/06/2021 23:25:03 - INFO - __main__ - Step 15286: {'lr': 0.000490125173864899, 'samples': 2934912, 'steps': 15285, 'loss/train': 1.5084561109542847} -11/06/2021 23:25:05 - INFO - __main__ - Step 15287: {'lr': 0.0004901236970628024, 'samples': 2935104, 'steps': 15286, 'loss/train': 1.5067825317382812} -11/06/2021 23:25:05 - INFO - __main__ - Step 15288: {'lr': 0.0004901222201525099, 'samples': 2935296, 'steps': 15287, 'loss/train': 1.3645248413085938} -11/06/2021 23:25:05 - INFO - __main__ - Step 15289: {'lr': 0.0004901207431340218, 'samples': 2935488, 'steps': 15288, 'loss/train': 1.7662934064865112} -11/06/2021 23:25:06 - INFO - __main__ - Step 15290: {'lr': 0.000490119266007339, 'samples': 2935680, 'steps': 15289, 'loss/train': 1.3966121673583984} -11/06/2021 23:25:06 - INFO - __main__ - Step 15291: {'lr': 0.0004901177887724623, 'samples': 2935872, 'steps': 15290, 'loss/train': 1.620540976524353} -11/06/2021 23:25:08 - INFO - __main__ - Step 15292: {'lr': 0.0004901163114293921, 'samples': 2936064, 'steps': 15291, 'loss/train': 1.8138169050216675} -11/06/2021 23:25:08 - INFO - __main__ - Step 15293: {'lr': 0.0004901148339781293, 'samples': 2936256, 'steps': 15292, 'loss/train': 1.7931532859802246} -11/06/2021 23:25:09 - INFO - __main__ - Step 15294: {'lr': 0.0004901133564186744, 'samples': 2936448, 'steps': 15293, 'loss/train': 1.5500938892364502} -11/06/2021 23:25:09 - INFO - __main__ - Step 15295: {'lr': 0.0004901118787510281, 'samples': 2936640, 'steps': 15294, 'loss/train': 3.1649906635284424} -11/06/2021 23:25:10 - INFO - __main__ - Step 15296: {'lr': 0.0004901104009751912, 'samples': 2936832, 'steps': 15295, 'loss/train': 0.5988634824752808} -11/06/2021 23:25:10 - INFO - __main__ - Step 15297: {'lr': 0.0004901089230911642, 'samples': 2937024, 'steps': 15296, 'loss/train': 0.5126264095306396} -11/06/2021 23:25:11 - INFO - __main__ - Step 15298: {'lr': 0.0004901074450989479, 'samples': 2937216, 'steps': 15297, 'loss/train': 1.6376423835754395} -11/06/2021 23:25:11 - INFO - __main__ - Step 15299: {'lr': 0.0004901059669985427, 'samples': 2937408, 'steps': 15298, 'loss/train': 2.4724743366241455} -11/06/2021 23:25:12 - INFO - __main__ - Step 15300: {'lr': 0.0004901044887899496, 'samples': 2937600, 'steps': 15299, 'loss/train': 1.8324450254440308} -11/06/2021 23:25:12 - INFO - __main__ - Step 15301: {'lr': 0.0004901030104731691, 'samples': 2937792, 'steps': 15300, 'loss/train': 2.0078108310699463} -11/06/2021 23:25:12 - INFO - __main__ - Step 15302: {'lr': 0.0004901015320482019, 'samples': 2937984, 'steps': 15301, 'loss/train': 1.5919190645217896} -11/06/2021 23:25:13 - INFO - __main__ - Step 15303: {'lr': 0.0004901000535150486, 'samples': 2938176, 'steps': 15302, 'loss/train': 1.7838540077209473} -11/06/2021 23:25:14 - INFO - __main__ - Step 15304: {'lr': 0.0004900985748737101, 'samples': 2938368, 'steps': 15303, 'loss/train': 1.9150638580322266} -11/06/2021 23:25:14 - INFO - __main__ - Step 15305: {'lr': 0.0004900970961241866, 'samples': 2938560, 'steps': 15304, 'loss/train': 1.3544918298721313} -11/06/2021 23:25:14 - INFO - __main__ - Step 15306: {'lr': 0.0004900956172664792, 'samples': 2938752, 'steps': 15305, 'loss/train': 1.8071099519729614} -11/06/2021 23:25:15 - INFO - __main__ - Step 15307: {'lr': 0.0004900941383005884, 'samples': 2938944, 'steps': 15306, 'loss/train': 2.145068883895874} -11/06/2021 23:25:16 - INFO - __main__ - Step 15308: {'lr': 0.0004900926592265149, 'samples': 2939136, 'steps': 15307, 'loss/train': 1.8237600326538086} -11/06/2021 23:25:16 - INFO - __main__ - Step 15309: {'lr': 0.0004900911800442593, 'samples': 2939328, 'steps': 15308, 'loss/train': 1.6788253784179688} -11/06/2021 23:25:16 - INFO - __main__ - Step 15310: {'lr': 0.0004900897007538225, 'samples': 2939520, 'steps': 15309, 'loss/train': 1.255226731300354} -11/06/2021 23:25:17 - INFO - __main__ - Step 15311: {'lr': 0.0004900882213552049, 'samples': 2939712, 'steps': 15310, 'loss/train': 2.2887020111083984} -11/06/2021 23:25:17 - INFO - __main__ - Step 15312: {'lr': 0.0004900867418484072, 'samples': 2939904, 'steps': 15311, 'loss/train': 1.4309970140457153} -11/06/2021 23:25:18 - INFO - __main__ - Step 15313: {'lr': 0.0004900852622334301, 'samples': 2940096, 'steps': 15312, 'loss/train': 1.7414692640304565} -11/06/2021 23:25:18 - INFO - __main__ - Step 15314: {'lr': 0.0004900837825102743, 'samples': 2940288, 'steps': 15313, 'loss/train': 2.0665924549102783} -11/06/2021 23:25:19 - INFO - __main__ - Step 15315: {'lr': 0.0004900823026789405, 'samples': 2940480, 'steps': 15314, 'loss/train': 1.498655080795288} -11/06/2021 23:25:19 - INFO - __main__ - Step 15316: {'lr': 0.0004900808227394293, 'samples': 2940672, 'steps': 15315, 'loss/train': 1.51724112033844} -11/06/2021 23:25:20 - INFO - __main__ - Step 15317: {'lr': 0.0004900793426917412, 'samples': 2940864, 'steps': 15316, 'loss/train': 1.9836689233779907} -11/06/2021 23:25:21 - INFO - __main__ - Step 15318: {'lr': 0.0004900778625358774, 'samples': 2941056, 'steps': 15317, 'loss/train': 1.8022664785385132} -11/06/2021 23:25:21 - INFO - __main__ - Step 15319: {'lr': 0.000490076382271838, 'samples': 2941248, 'steps': 15318, 'loss/train': 1.9844396114349365} -11/06/2021 23:25:21 - INFO - __main__ - Step 15320: {'lr': 0.0004900749018996238, 'samples': 2941440, 'steps': 15319, 'loss/train': 1.9721046686172485} -11/06/2021 23:25:22 - INFO - __main__ - Step 15321: {'lr': 0.0004900734214192358, 'samples': 2941632, 'steps': 15320, 'loss/train': 1.9147781133651733} -11/06/2021 23:25:22 - INFO - __main__ - Step 15322: {'lr': 0.0004900719408306743, 'samples': 2941824, 'steps': 15321, 'loss/train': 1.805896520614624} -11/06/2021 23:25:22 - INFO - __main__ - Step 15323: {'lr': 0.0004900704601339401, 'samples': 2942016, 'steps': 15322, 'loss/train': 1.896042823791504} -11/06/2021 23:25:24 - INFO - __main__ - Step 15324: {'lr': 0.0004900689793290339, 'samples': 2942208, 'steps': 15323, 'loss/train': 1.7801188230514526} -11/06/2021 23:25:24 - INFO - __main__ - Step 15325: {'lr': 0.0004900674984159562, 'samples': 2942400, 'steps': 15324, 'loss/train': 1.7624114751815796} -11/06/2021 23:25:25 - INFO - __main__ - Step 15326: {'lr': 0.0004900660173947079, 'samples': 2942592, 'steps': 15325, 'loss/train': 2.018181324005127} -11/06/2021 23:25:25 - INFO - __main__ - Step 15327: {'lr': 0.0004900645362652895, 'samples': 2942784, 'steps': 15326, 'loss/train': 1.8817495107650757} -11/06/2021 23:25:25 - INFO - __main__ - Step 15328: {'lr': 0.0004900630550277018, 'samples': 2942976, 'steps': 15327, 'loss/train': 2.0773236751556396} -11/06/2021 23:25:26 - INFO - __main__ - Step 15329: {'lr': 0.0004900615736819452, 'samples': 2943168, 'steps': 15328, 'loss/train': 1.9412237405776978} -11/06/2021 23:25:27 - INFO - __main__ - Step 15330: {'lr': 0.0004900600922280207, 'samples': 2943360, 'steps': 15329, 'loss/train': 1.6500606536865234} -11/06/2021 23:25:27 - INFO - __main__ - Step 15331: {'lr': 0.0004900586106659289, 'samples': 2943552, 'steps': 15330, 'loss/train': 2.294801712036133} -11/06/2021 23:25:27 - INFO - __main__ - Step 15332: {'lr': 0.0004900571289956703, 'samples': 2943744, 'steps': 15331, 'loss/train': 0.9480341076850891} -11/06/2021 23:25:28 - INFO - __main__ - Step 15333: {'lr': 0.0004900556472172457, 'samples': 2943936, 'steps': 15332, 'loss/train': 2.6426515579223633} -11/06/2021 23:25:28 - INFO - __main__ - Step 15334: {'lr': 0.0004900541653306557, 'samples': 2944128, 'steps': 15333, 'loss/train': 2.0877530574798584} -11/06/2021 23:25:29 - INFO - __main__ - Step 15335: {'lr': 0.0004900526833359009, 'samples': 2944320, 'steps': 15334, 'loss/train': 1.6220190525054932} -11/06/2021 23:25:30 - INFO - __main__ - Step 15336: {'lr': 0.0004900512012329822, 'samples': 2944512, 'steps': 15335, 'loss/train': 1.7684022188186646} -11/06/2021 23:25:30 - INFO - __main__ - Step 15337: {'lr': 0.0004900497190219002, 'samples': 2944704, 'steps': 15336, 'loss/train': 1.8836572170257568} -11/06/2021 23:25:31 - INFO - __main__ - Step 15338: {'lr': 0.0004900482367026554, 'samples': 2944896, 'steps': 15337, 'loss/train': 0.36830881237983704} -11/06/2021 23:25:31 - INFO - __main__ - Step 15339: {'lr': 0.0004900467542752485, 'samples': 2945088, 'steps': 15338, 'loss/train': 1.869981288909912} -11/06/2021 23:25:31 - INFO - __main__ - Step 15340: {'lr': 0.0004900452717396803, 'samples': 2945280, 'steps': 15339, 'loss/train': 1.5828317403793335} -11/06/2021 23:25:32 - INFO - __main__ - Step 15341: {'lr': 0.0004900437890959515, 'samples': 2945472, 'steps': 15340, 'loss/train': 1.6785833835601807} -11/06/2021 23:25:33 - INFO - __main__ - Step 15342: {'lr': 0.0004900423063440625, 'samples': 2945664, 'steps': 15341, 'loss/train': 1.9623292684555054} -11/06/2021 23:25:33 - INFO - __main__ - Step 15343: {'lr': 0.0004900408234840142, 'samples': 2945856, 'steps': 15342, 'loss/train': 1.8435673713684082} -11/06/2021 23:25:33 - INFO - __main__ - Step 15344: {'lr': 0.0004900393405158073, 'samples': 2946048, 'steps': 15343, 'loss/train': 2.0135602951049805} -11/06/2021 23:25:34 - INFO - __main__ - Step 15345: {'lr': 0.0004900378574394423, 'samples': 2946240, 'steps': 15344, 'loss/train': 1.5645862817764282} -11/06/2021 23:25:34 - INFO - __main__ - Step 15346: {'lr': 0.00049003637425492, 'samples': 2946432, 'steps': 15345, 'loss/train': 6.070239543914795} -11/06/2021 23:25:35 - INFO - __main__ - Step 15347: {'lr': 0.0004900348909622409, 'samples': 2946624, 'steps': 15346, 'loss/train': 2.0285749435424805} -11/06/2021 23:25:35 - INFO - __main__ - Step 15348: {'lr': 0.0004900334075614059, 'samples': 2946816, 'steps': 15347, 'loss/train': 1.966596245765686} -11/06/2021 23:25:36 - INFO - __main__ - Step 15349: {'lr': 0.0004900319240524155, 'samples': 2947008, 'steps': 15348, 'loss/train': 1.8650213479995728} -11/06/2021 23:25:36 - INFO - __main__ - Step 15350: {'lr': 0.0004900304404352704, 'samples': 2947200, 'steps': 15349, 'loss/train': 2.0036559104919434} -11/06/2021 23:25:36 - INFO - __main__ - Step 15351: {'lr': 0.0004900289567099713, 'samples': 2947392, 'steps': 15350, 'loss/train': 1.567614197731018} -11/06/2021 23:25:38 - INFO - __main__ - Step 15352: {'lr': 0.000490027472876519, 'samples': 2947584, 'steps': 15351, 'loss/train': 1.430046558380127} -11/06/2021 23:25:38 - INFO - __main__ - Step 15353: {'lr': 0.0004900259889349138, 'samples': 2947776, 'steps': 15352, 'loss/train': 2.044808864593506} -11/06/2021 23:25:38 - INFO - __main__ - Step 15354: {'lr': 0.0004900245048851567, 'samples': 2947968, 'steps': 15353, 'loss/train': 0.9513130784034729} -11/06/2021 23:25:39 - INFO - __main__ - Step 15355: {'lr': 0.0004900230207272483, 'samples': 2948160, 'steps': 15354, 'loss/train': 1.701623558998108} -11/06/2021 23:25:39 - INFO - __main__ - Step 15356: {'lr': 0.000490021536461189, 'samples': 2948352, 'steps': 15355, 'loss/train': 1.8428715467453003} -11/06/2021 23:25:40 - INFO - __main__ - Step 15357: {'lr': 0.00049002005208698, 'samples': 2948544, 'steps': 15356, 'loss/train': 1.4935647249221802} -11/06/2021 23:25:40 - INFO - __main__ - Step 15358: {'lr': 0.0004900185676046214, 'samples': 2948736, 'steps': 15357, 'loss/train': 1.9879461526870728} -11/06/2021 23:25:41 - INFO - __main__ - Step 15359: {'lr': 0.0004900170830141144, 'samples': 2948928, 'steps': 15358, 'loss/train': 1.5759130716323853} -11/06/2021 23:25:41 - INFO - __main__ - Step 15360: {'lr': 0.0004900155983154592, 'samples': 2949120, 'steps': 15359, 'loss/train': 1.0437538623809814} -11/06/2021 23:25:41 - INFO - __main__ - Step 15361: {'lr': 0.0004900141135086569, 'samples': 2949312, 'steps': 15360, 'loss/train': 1.6635363101959229} -11/06/2021 23:25:43 - INFO - __main__ - Step 15362: {'lr': 0.0004900126285937077, 'samples': 2949504, 'steps': 15361, 'loss/train': 1.9337184429168701} -11/06/2021 23:25:43 - INFO - __main__ - Step 15363: {'lr': 0.0004900111435706127, 'samples': 2949696, 'steps': 15362, 'loss/train': 1.4485169649124146} -11/06/2021 23:25:43 - INFO - __main__ - Step 15364: {'lr': 0.0004900096584393723, 'samples': 2949888, 'steps': 15363, 'loss/train': 1.5810778141021729} -11/06/2021 23:25:44 - INFO - __main__ - Step 15365: {'lr': 0.0004900081731999872, 'samples': 2950080, 'steps': 15364, 'loss/train': 1.6182117462158203} -11/06/2021 23:25:44 - INFO - __main__ - Step 15366: {'lr': 0.0004900066878524582, 'samples': 2950272, 'steps': 15365, 'loss/train': 1.547028660774231} -11/06/2021 23:25:45 - INFO - __main__ - Step 15367: {'lr': 0.0004900052023967859, 'samples': 2950464, 'steps': 15366, 'loss/train': 1.7055131196975708} -11/06/2021 23:25:45 - INFO - __main__ - Step 15368: {'lr': 0.0004900037168329709, 'samples': 2950656, 'steps': 15367, 'loss/train': 1.550373911857605} -11/06/2021 23:25:46 - INFO - __main__ - Step 15369: {'lr': 0.000490002231161014, 'samples': 2950848, 'steps': 15368, 'loss/train': 1.7046164274215698} -11/06/2021 23:25:46 - INFO - __main__ - Step 15370: {'lr': 0.0004900007453809157, 'samples': 2951040, 'steps': 15369, 'loss/train': 1.5732970237731934} -11/06/2021 23:25:46 - INFO - __main__ - Step 15371: {'lr': 0.0004899992594926769, 'samples': 2951232, 'steps': 15370, 'loss/train': 1.3955873250961304} -11/06/2021 23:25:47 - INFO - __main__ - Step 15372: {'lr': 0.000489997773496298, 'samples': 2951424, 'steps': 15371, 'loss/train': 1.5523087978363037} -11/06/2021 23:25:48 - INFO - __main__ - Step 15373: {'lr': 0.0004899962873917798, 'samples': 2951616, 'steps': 15372, 'loss/train': 1.710436463356018} -11/06/2021 23:25:48 - INFO - __main__ - Step 15374: {'lr': 0.000489994801179123, 'samples': 2951808, 'steps': 15373, 'loss/train': 1.610868215560913} -11/06/2021 23:25:49 - INFO - __main__ - Step 15375: {'lr': 0.0004899933148583284, 'samples': 2952000, 'steps': 15374, 'loss/train': 1.4452327489852905} -11/06/2021 23:25:49 - INFO - __main__ - Step 15376: {'lr': 0.0004899918284293964, 'samples': 2952192, 'steps': 15375, 'loss/train': 1.6878875494003296} -11/06/2021 23:25:50 - INFO - __main__ - Step 15377: {'lr': 0.0004899903418923278, 'samples': 2952384, 'steps': 15376, 'loss/train': 1.6669107675552368} -11/06/2021 23:25:50 - INFO - __main__ - Step 15378: {'lr': 0.0004899888552471232, 'samples': 2952576, 'steps': 15377, 'loss/train': 1.7093682289123535} -11/06/2021 23:25:51 - INFO - __main__ - Step 15379: {'lr': 0.0004899873684937833, 'samples': 2952768, 'steps': 15378, 'loss/train': 1.2271426916122437} -11/06/2021 23:25:51 - INFO - __main__ - Step 15380: {'lr': 0.0004899858816323089, 'samples': 2952960, 'steps': 15379, 'loss/train': 1.6182414293289185} -11/06/2021 23:25:51 - INFO - __main__ - Step 15381: {'lr': 0.0004899843946627006, 'samples': 2953152, 'steps': 15380, 'loss/train': 1.7214139699935913} -11/06/2021 23:25:52 - INFO - __main__ - Step 15382: {'lr': 0.0004899829075849589, 'samples': 2953344, 'steps': 15381, 'loss/train': 2.161836624145508} -11/06/2021 23:25:53 - INFO - __main__ - Step 15383: {'lr': 0.0004899814203990847, 'samples': 2953536, 'steps': 15382, 'loss/train': 1.879669189453125} -11/06/2021 23:25:53 - INFO - __main__ - Step 15384: {'lr': 0.0004899799331050785, 'samples': 2953728, 'steps': 15383, 'loss/train': 1.885219693183899} -11/06/2021 23:25:53 - INFO - __main__ - Step 15385: {'lr': 0.0004899784457029411, 'samples': 2953920, 'steps': 15384, 'loss/train': 1.2572287321090698} -11/06/2021 23:25:54 - INFO - __main__ - Step 15386: {'lr': 0.000489976958192673, 'samples': 2954112, 'steps': 15385, 'loss/train': 1.6987992525100708} -11/06/2021 23:25:54 - INFO - __main__ - Step 15387: {'lr': 0.0004899754705742752, 'samples': 2954304, 'steps': 15386, 'loss/train': 2.0075464248657227} -11/06/2021 23:25:55 - INFO - __main__ - Step 15388: {'lr': 0.0004899739828477481, 'samples': 2954496, 'steps': 15387, 'loss/train': 1.6312947273254395} -11/06/2021 23:25:56 - INFO - __main__ - Step 15389: {'lr': 0.0004899724950130923, 'samples': 2954688, 'steps': 15388, 'loss/train': 1.7411924600601196} -11/06/2021 23:25:56 - INFO - __main__ - Step 15390: {'lr': 0.0004899710070703087, 'samples': 2954880, 'steps': 15389, 'loss/train': 5.825747489929199} -11/06/2021 23:25:56 - INFO - __main__ - Step 15391: {'lr': 0.0004899695190193978, 'samples': 2955072, 'steps': 15390, 'loss/train': 1.3837753534317017} -11/06/2021 23:25:57 - INFO - __main__ - Step 15392: {'lr': 0.0004899680308603604, 'samples': 2955264, 'steps': 15391, 'loss/train': 1.489019751548767} -11/06/2021 23:25:57 - INFO - __main__ - Step 15393: {'lr': 0.000489966542593197, 'samples': 2955456, 'steps': 15392, 'loss/train': 1.6282072067260742} -11/06/2021 23:25:58 - INFO - __main__ - Step 15394: {'lr': 0.0004899650542179085, 'samples': 2955648, 'steps': 15393, 'loss/train': 1.1773505210876465} -11/06/2021 23:25:58 - INFO - __main__ - Step 15395: {'lr': 0.0004899635657344954, 'samples': 2955840, 'steps': 15394, 'loss/train': 1.7524396181106567} -11/06/2021 23:25:59 - INFO - __main__ - Step 15396: {'lr': 0.0004899620771429585, 'samples': 2956032, 'steps': 15395, 'loss/train': 1.4660807847976685} -11/06/2021 23:25:59 - INFO - __main__ - Step 15397: {'lr': 0.0004899605884432983, 'samples': 2956224, 'steps': 15396, 'loss/train': 1.6448665857315063} -11/06/2021 23:25:59 - INFO - __main__ - Step 15398: {'lr': 0.0004899590996355155, 'samples': 2956416, 'steps': 15397, 'loss/train': 1.1277403831481934} -11/06/2021 23:26:00 - INFO - __main__ - Step 15399: {'lr': 0.000489957610719611, 'samples': 2956608, 'steps': 15398, 'loss/train': 1.7842482328414917} -11/06/2021 23:26:01 - INFO - __main__ - Step 15400: {'lr': 0.0004899561216955852, 'samples': 2956800, 'steps': 15399, 'loss/train': 1.7123888731002808} -11/06/2021 23:26:01 - INFO - __main__ - Step 15401: {'lr': 0.0004899546325634388, 'samples': 2956992, 'steps': 15400, 'loss/train': 1.379862666130066} -11/06/2021 23:26:01 - INFO - __main__ - Step 15402: {'lr': 0.0004899531433231728, 'samples': 2957184, 'steps': 15401, 'loss/train': 1.210938572883606} -11/06/2021 23:26:02 - INFO - __main__ - Step 15403: {'lr': 0.0004899516539747874, 'samples': 2957376, 'steps': 15402, 'loss/train': 1.3789384365081787} -11/06/2021 23:26:02 - INFO - __main__ - Step 15404: {'lr': 0.0004899501645182835, 'samples': 2957568, 'steps': 15403, 'loss/train': 1.301833987236023} -11/06/2021 23:26:03 - INFO - __main__ - Step 15405: {'lr': 0.0004899486749536618, 'samples': 2957760, 'steps': 15404, 'loss/train': 2.503183603286743} -11/06/2021 23:26:04 - INFO - __main__ - Step 15406: {'lr': 0.000489947185280923, 'samples': 2957952, 'steps': 15405, 'loss/train': 1.348501443862915} -11/06/2021 23:26:04 - INFO - __main__ - Step 15407: {'lr': 0.0004899456955000676, 'samples': 2958144, 'steps': 15406, 'loss/train': 1.6351882219314575} -11/06/2021 23:26:04 - INFO - __main__ - Step 15408: {'lr': 0.0004899442056110964, 'samples': 2958336, 'steps': 15407, 'loss/train': 1.4293309450149536} -11/06/2021 23:26:05 - INFO - __main__ - Step 15409: {'lr': 0.00048994271561401, 'samples': 2958528, 'steps': 15408, 'loss/train': 1.3212099075317383} -11/06/2021 23:26:06 - INFO - __main__ - Step 15410: {'lr': 0.0004899412255088091, 'samples': 2958720, 'steps': 15409, 'loss/train': 1.6057772636413574} -11/06/2021 23:26:06 - INFO - __main__ - Step 15411: {'lr': 0.0004899397352954945, 'samples': 2958912, 'steps': 15410, 'loss/train': 1.645572304725647} -11/06/2021 23:26:06 - INFO - __main__ - Step 15412: {'lr': 0.0004899382449740667, 'samples': 2959104, 'steps': 15411, 'loss/train': 1.9118947982788086} -11/06/2021 23:26:07 - INFO - __main__ - Step 15413: {'lr': 0.0004899367545445264, 'samples': 2959296, 'steps': 15412, 'loss/train': 1.989318609237671} -11/06/2021 23:26:07 - INFO - __main__ - Step 15414: {'lr': 0.0004899352640068743, 'samples': 2959488, 'steps': 15413, 'loss/train': 1.6085702180862427} -11/06/2021 23:26:08 - INFO - __main__ - Step 15415: {'lr': 0.0004899337733611113, 'samples': 2959680, 'steps': 15414, 'loss/train': 1.6412628889083862} -11/06/2021 23:26:09 - INFO - __main__ - Step 15416: {'lr': 0.0004899322826072375, 'samples': 2959872, 'steps': 15415, 'loss/train': 1.6715970039367676} -11/06/2021 23:26:09 - INFO - __main__ - Step 15417: {'lr': 0.0004899307917452542, 'samples': 2960064, 'steps': 15416, 'loss/train': 0.1822996884584427} -11/06/2021 23:26:09 - INFO - __main__ - Step 15418: {'lr': 0.0004899293007751616, 'samples': 2960256, 'steps': 15417, 'loss/train': 1.2673732042312622} -11/06/2021 23:26:10 - INFO - __main__ - Step 15419: {'lr': 0.0004899278096969605, 'samples': 2960448, 'steps': 15418, 'loss/train': 2.0934507846832275} -11/06/2021 23:26:11 - INFO - __main__ - Step 15420: {'lr': 0.0004899263185106518, 'samples': 2960640, 'steps': 15419, 'loss/train': 1.9533450603485107} -11/06/2021 23:26:11 - INFO - __main__ - Step 15421: {'lr': 0.000489924827216236, 'samples': 2960832, 'steps': 15420, 'loss/train': 1.7429298162460327} -11/06/2021 23:26:11 - INFO - __main__ - Step 15422: {'lr': 0.0004899233358137137, 'samples': 2961024, 'steps': 15421, 'loss/train': 1.7253789901733398} -11/06/2021 23:26:12 - INFO - __main__ - Step 15423: {'lr': 0.0004899218443030857, 'samples': 2961216, 'steps': 15422, 'loss/train': 0.9601808786392212} -11/06/2021 23:26:12 - INFO - __main__ - Step 15424: {'lr': 0.0004899203526843526, 'samples': 2961408, 'steps': 15423, 'loss/train': 1.4191993474960327} -11/06/2021 23:26:13 - INFO - __main__ - Step 15425: {'lr': 0.000489918860957515, 'samples': 2961600, 'steps': 15424, 'loss/train': 1.5568323135375977} -11/06/2021 23:26:14 - INFO - __main__ - Step 15426: {'lr': 0.0004899173691225737, 'samples': 2961792, 'steps': 15425, 'loss/train': 1.8269211053848267} -11/06/2021 23:26:14 - INFO - __main__ - Step 15427: {'lr': 0.0004899158771795295, 'samples': 2961984, 'steps': 15426, 'loss/train': 1.576122522354126} -11/06/2021 23:26:14 - INFO - __main__ - Step 15428: {'lr': 0.0004899143851283827, 'samples': 2962176, 'steps': 15427, 'loss/train': 1.3698642253875732} -11/06/2021 23:26:15 - INFO - __main__ - Step 15429: {'lr': 0.0004899128929691343, 'samples': 2962368, 'steps': 15428, 'loss/train': 1.8090990781784058} -11/06/2021 23:26:15 - INFO - __main__ - Step 15430: {'lr': 0.0004899114007017849, 'samples': 2962560, 'steps': 15429, 'loss/train': 1.9394744634628296} -11/06/2021 23:26:16 - INFO - __main__ - Step 15431: {'lr': 0.000489909908326335, 'samples': 2962752, 'steps': 15430, 'loss/train': 1.6963614225387573} -11/06/2021 23:26:17 - INFO - __main__ - Step 15432: {'lr': 0.0004899084158427855, 'samples': 2962944, 'steps': 15431, 'loss/train': 1.5980172157287598} -11/06/2021 23:26:17 - INFO - __main__ - Step 15433: {'lr': 0.0004899069232511368, 'samples': 2963136, 'steps': 15432, 'loss/train': 2.0468621253967285} -11/06/2021 23:26:17 - INFO - __main__ - Step 15434: {'lr': 0.0004899054305513899, 'samples': 2963328, 'steps': 15433, 'loss/train': 2.0248918533325195} -11/06/2021 23:26:18 - INFO - __main__ - Step 15435: {'lr': 0.0004899039377435452, 'samples': 2963520, 'steps': 15434, 'loss/train': 2.0467848777770996} -11/06/2021 23:26:19 - INFO - __main__ - Step 15436: {'lr': 0.0004899024448276036, 'samples': 2963712, 'steps': 15435, 'loss/train': 1.7609314918518066} -11/06/2021 23:26:19 - INFO - __main__ - Step 15437: {'lr': 0.0004899009518035657, 'samples': 2963904, 'steps': 15436, 'loss/train': 1.8569064140319824} -11/06/2021 23:26:19 - INFO - __main__ - Step 15438: {'lr': 0.000489899458671432, 'samples': 2964096, 'steps': 15437, 'loss/train': 1.7970716953277588} -11/06/2021 23:26:20 - INFO - __main__ - Step 15439: {'lr': 0.0004898979654312034, 'samples': 2964288, 'steps': 15438, 'loss/train': 1.7832825183868408} -11/06/2021 23:26:20 - INFO - __main__ - Step 15440: {'lr': 0.0004898964720828804, 'samples': 2964480, 'steps': 15439, 'loss/train': 1.3016754388809204} -11/06/2021 23:26:21 - INFO - __main__ - Step 15441: {'lr': 0.0004898949786264638, 'samples': 2964672, 'steps': 15440, 'loss/train': 1.9825522899627686} -11/06/2021 23:26:22 - INFO - __main__ - Step 15442: {'lr': 0.0004898934850619542, 'samples': 2964864, 'steps': 15441, 'loss/train': 1.5393202304840088} -11/06/2021 23:26:22 - INFO - __main__ - Step 15443: {'lr': 0.0004898919913893522, 'samples': 2965056, 'steps': 15442, 'loss/train': 1.3558751344680786} -11/06/2021 23:26:22 - INFO - __main__ - Step 15444: {'lr': 0.0004898904976086588, 'samples': 2965248, 'steps': 15443, 'loss/train': 1.950610876083374} -11/06/2021 23:26:23 - INFO - __main__ - Step 15445: {'lr': 0.0004898890037198743, 'samples': 2965440, 'steps': 15444, 'loss/train': 1.397348403930664} -11/06/2021 23:26:24 - INFO - __main__ - Step 15446: {'lr': 0.0004898875097229995, 'samples': 2965632, 'steps': 15445, 'loss/train': 2.1958858966827393} -11/06/2021 23:26:24 - INFO - __main__ - Step 15447: {'lr': 0.0004898860156180351, 'samples': 2965824, 'steps': 15446, 'loss/train': 1.3978043794631958} -11/06/2021 23:26:24 - INFO - __main__ - Step 15448: {'lr': 0.0004898845214049818, 'samples': 2966016, 'steps': 15447, 'loss/train': 0.5018529295921326} -11/06/2021 23:26:25 - INFO - __main__ - Step 15449: {'lr': 0.0004898830270838403, 'samples': 2966208, 'steps': 15448, 'loss/train': 1.4868112802505493} -11/06/2021 23:26:25 - INFO - __main__ - Step 15450: {'lr': 0.0004898815326546111, 'samples': 2966400, 'steps': 15449, 'loss/train': 1.6243109703063965} -11/06/2021 23:26:26 - INFO - __main__ - Step 15451: {'lr': 0.0004898800381172951, 'samples': 2966592, 'steps': 15450, 'loss/train': 1.2126389741897583} -11/06/2021 23:26:26 - INFO - __main__ - Step 15452: {'lr': 0.0004898785434718927, 'samples': 2966784, 'steps': 15451, 'loss/train': 1.6377086639404297} -11/06/2021 23:26:27 - INFO - __main__ - Step 15453: {'lr': 0.0004898770487184047, 'samples': 2966976, 'steps': 15452, 'loss/train': 2.266317844390869} -11/06/2021 23:26:27 - INFO - __main__ - Step 15454: {'lr': 0.000489875553856832, 'samples': 2967168, 'steps': 15453, 'loss/train': 2.4078965187072754} -11/06/2021 23:26:27 - INFO - __main__ - Step 15455: {'lr': 0.000489874058887175, 'samples': 2967360, 'steps': 15454, 'loss/train': 2.1697914600372314} -11/06/2021 23:26:29 - INFO - __main__ - Step 15456: {'lr': 0.0004898725638094345, 'samples': 2967552, 'steps': 15455, 'loss/train': 1.5495775938034058} -11/06/2021 23:26:29 - INFO - __main__ - Step 15457: {'lr': 0.0004898710686236109, 'samples': 2967744, 'steps': 15456, 'loss/train': 1.7793976068496704} -11/06/2021 23:26:29 - INFO - __main__ - Step 15458: {'lr': 0.0004898695733297054, 'samples': 2967936, 'steps': 15457, 'loss/train': 1.8634929656982422} -11/06/2021 23:26:30 - INFO - __main__ - Step 15459: {'lr': 0.0004898680779277182, 'samples': 2968128, 'steps': 15458, 'loss/train': 1.4359500408172607} -11/06/2021 23:26:30 - INFO - __main__ - Step 15460: {'lr': 0.0004898665824176502, 'samples': 2968320, 'steps': 15459, 'loss/train': 1.47426176071167} -11/06/2021 23:26:31 - INFO - __main__ - Step 15461: {'lr': 0.000489865086799502, 'samples': 2968512, 'steps': 15460, 'loss/train': 1.6190659999847412} -11/06/2021 23:26:31 - INFO - __main__ - Step 15462: {'lr': 0.0004898635910732743, 'samples': 2968704, 'steps': 15461, 'loss/train': 1.3541996479034424} -11/06/2021 23:26:32 - INFO - __main__ - Step 15463: {'lr': 0.0004898620952389677, 'samples': 2968896, 'steps': 15462, 'loss/train': 0.9938245415687561} -11/06/2021 23:26:32 - INFO - __main__ - Step 15464: {'lr': 0.000489860599296583, 'samples': 2969088, 'steps': 15463, 'loss/train': 1.6961749792099} -11/06/2021 23:26:32 - INFO - __main__ - Step 15465: {'lr': 0.0004898591032461208, 'samples': 2969280, 'steps': 15464, 'loss/train': 1.7099051475524902} -11/06/2021 23:26:33 - INFO - __main__ - Step 15466: {'lr': 0.0004898576070875818, 'samples': 2969472, 'steps': 15465, 'loss/train': 2.1200191974639893} -11/06/2021 23:26:34 - INFO - __main__ - Step 15467: {'lr': 0.0004898561108209667, 'samples': 2969664, 'steps': 15466, 'loss/train': 1.7490513324737549} -11/06/2021 23:26:34 - INFO - __main__ - Step 15468: {'lr': 0.0004898546144462762, 'samples': 2969856, 'steps': 15467, 'loss/train': 1.9029560089111328} -11/06/2021 23:26:34 - INFO - __main__ - Step 15469: {'lr': 0.0004898531179635108, 'samples': 2970048, 'steps': 15468, 'loss/train': 1.0643110275268555} -11/06/2021 23:26:35 - INFO - __main__ - Step 15470: {'lr': 0.0004898516213726712, 'samples': 2970240, 'steps': 15469, 'loss/train': 2.0877974033355713} -11/06/2021 23:26:35 - INFO - __main__ - Step 15471: {'lr': 0.0004898501246737583, 'samples': 2970432, 'steps': 15470, 'loss/train': 1.450588345527649} -11/06/2021 23:26:36 - INFO - __main__ - Step 15472: {'lr': 0.0004898486278667725, 'samples': 2970624, 'steps': 15471, 'loss/train': 1.8085523843765259} -11/06/2021 23:26:36 - INFO - __main__ - Step 15473: {'lr': 0.0004898471309517148, 'samples': 2970816, 'steps': 15472, 'loss/train': 1.8764305114746094} -11/06/2021 23:26:37 - INFO - __main__ - Step 15474: {'lr': 0.0004898456339285857, 'samples': 2971008, 'steps': 15473, 'loss/train': 1.699832558631897} -11/06/2021 23:26:37 - INFO - __main__ - Step 15475: {'lr': 0.0004898441367973856, 'samples': 2971200, 'steps': 15474, 'loss/train': 1.7935590744018555} -11/06/2021 23:26:38 - INFO - __main__ - Step 15476: {'lr': 0.0004898426395581156, 'samples': 2971392, 'steps': 15475, 'loss/train': 2.0866262912750244} -11/06/2021 23:26:39 - INFO - __main__ - Step 15477: {'lr': 0.0004898411422107762, 'samples': 2971584, 'steps': 15476, 'loss/train': 1.2381302118301392} -11/06/2021 23:26:39 - INFO - __main__ - Step 15478: {'lr': 0.0004898396447553681, 'samples': 2971776, 'steps': 15477, 'loss/train': 2.092162847518921} -11/06/2021 23:26:39 - INFO - __main__ - Step 15479: {'lr': 0.000489838147191892, 'samples': 2971968, 'steps': 15478, 'loss/train': 1.3541998863220215} -11/06/2021 23:26:40 - INFO - __main__ - Step 15480: {'lr': 0.0004898366495203483, 'samples': 2972160, 'steps': 15479, 'loss/train': 1.967870831489563} -11/06/2021 23:26:40 - INFO - __main__ - Step 15481: {'lr': 0.0004898351517407381, 'samples': 2972352, 'steps': 15480, 'loss/train': 1.0641893148422241} -11/06/2021 23:26:41 - INFO - __main__ - Step 15482: {'lr': 0.0004898336538530619, 'samples': 2972544, 'steps': 15481, 'loss/train': 1.6130701303482056} -11/06/2021 23:26:41 - INFO - __main__ - Step 15483: {'lr': 0.0004898321558573203, 'samples': 2972736, 'steps': 15482, 'loss/train': 1.8925131559371948} -11/06/2021 23:26:42 - INFO - __main__ - Step 15484: {'lr': 0.000489830657753514, 'samples': 2972928, 'steps': 15483, 'loss/train': 1.3299318552017212} -11/06/2021 23:26:42 - INFO - __main__ - Step 15485: {'lr': 0.0004898291595416438, 'samples': 2973120, 'steps': 15484, 'loss/train': 1.7662090063095093} -11/06/2021 23:26:42 - INFO - __main__ - Step 15486: {'lr': 0.0004898276612217102, 'samples': 2973312, 'steps': 15485, 'loss/train': 1.9618338346481323} -11/06/2021 23:26:43 - INFO - __main__ - Step 15487: {'lr': 0.0004898261627937139, 'samples': 2973504, 'steps': 15486, 'loss/train': 1.4506701231002808} -11/06/2021 23:26:44 - INFO - __main__ - Step 15488: {'lr': 0.0004898246642576559, 'samples': 2973696, 'steps': 15487, 'loss/train': 1.4949243068695068} -11/06/2021 23:26:44 - INFO - __main__ - Step 15489: {'lr': 0.0004898231656135362, 'samples': 2973888, 'steps': 15488, 'loss/train': 1.7489192485809326} -11/06/2021 23:26:44 - INFO - __main__ - Step 15490: {'lr': 0.0004898216668613562, 'samples': 2974080, 'steps': 15489, 'loss/train': 1.7685637474060059} -11/06/2021 23:26:45 - INFO - __main__ - Step 15491: {'lr': 0.0004898201680011161, 'samples': 2974272, 'steps': 15490, 'loss/train': 1.6107263565063477} -11/06/2021 23:26:45 - INFO - __main__ - Step 15492: {'lr': 0.0004898186690328168, 'samples': 2974464, 'steps': 15491, 'loss/train': 1.5681654214859009} -11/06/2021 23:26:46 - INFO - __main__ - Step 15493: {'lr': 0.000489817169956459, 'samples': 2974656, 'steps': 15492, 'loss/train': 1.5541188716888428} -11/06/2021 23:26:46 - INFO - __main__ - Step 15494: {'lr': 0.0004898156707720432, 'samples': 2974848, 'steps': 15493, 'loss/train': 1.5298535823822021} -11/06/2021 23:26:47 - INFO - __main__ - Step 15495: {'lr': 0.0004898141714795701, 'samples': 2975040, 'steps': 15494, 'loss/train': 1.4067524671554565} -11/06/2021 23:26:47 - INFO - __main__ - Step 15496: {'lr': 0.0004898126720790405, 'samples': 2975232, 'steps': 15495, 'loss/train': 1.936280369758606} -11/06/2021 23:26:47 - INFO - __main__ - Step 15497: {'lr': 0.0004898111725704549, 'samples': 2975424, 'steps': 15496, 'loss/train': 1.3486140966415405} -11/06/2021 23:26:49 - INFO - __main__ - Step 15498: {'lr': 0.0004898096729538142, 'samples': 2975616, 'steps': 15497, 'loss/train': 0.8642235398292542} -11/06/2021 23:26:49 - INFO - __main__ - Step 15499: {'lr': 0.000489808173229119, 'samples': 2975808, 'steps': 15498, 'loss/train': 1.4171953201293945} -11/06/2021 23:26:49 - INFO - __main__ - Step 15500: {'lr': 0.0004898066733963699, 'samples': 2976000, 'steps': 15499, 'loss/train': 1.831260085105896} -11/06/2021 23:26:50 - INFO - __main__ - Step 15501: {'lr': 0.0004898051734555676, 'samples': 2976192, 'steps': 15500, 'loss/train': 1.9325761795043945} -11/06/2021 23:26:50 - INFO - __main__ - Step 15502: {'lr': 0.0004898036734067127, 'samples': 2976384, 'steps': 15501, 'loss/train': 1.47348153591156} -11/06/2021 23:26:51 - INFO - __main__ - Step 15503: {'lr': 0.000489802173249806, 'samples': 2976576, 'steps': 15502, 'loss/train': 1.6190365552902222} -11/06/2021 23:26:51 - INFO - __main__ - Step 15504: {'lr': 0.0004898006729848482, 'samples': 2976768, 'steps': 15503, 'loss/train': 2.0817368030548096} -11/06/2021 23:26:52 - INFO - __main__ - Step 15505: {'lr': 0.0004897991726118399, 'samples': 2976960, 'steps': 15504, 'loss/train': 1.478041172027588} -11/06/2021 23:26:52 - INFO - __main__ - Step 15506: {'lr': 0.0004897976721307818, 'samples': 2977152, 'steps': 15505, 'loss/train': 1.7012150287628174} -11/06/2021 23:26:52 - INFO - __main__ - Step 15507: {'lr': 0.0004897961715416746, 'samples': 2977344, 'steps': 15506, 'loss/train': 1.763744592666626} -11/06/2021 23:26:54 - INFO - __main__ - Step 15508: {'lr': 0.0004897946708445189, 'samples': 2977536, 'steps': 15507, 'loss/train': 1.7468358278274536} -11/06/2021 23:26:54 - INFO - __main__ - Step 15509: {'lr': 0.0004897931700393154, 'samples': 2977728, 'steps': 15508, 'loss/train': 1.7361414432525635} -11/06/2021 23:26:54 - INFO - __main__ - Step 15510: {'lr': 0.0004897916691260648, 'samples': 2977920, 'steps': 15509, 'loss/train': 1.7605504989624023} -11/06/2021 23:26:55 - INFO - __main__ - Step 15511: {'lr': 0.0004897901681047679, 'samples': 2978112, 'steps': 15510, 'loss/train': 1.6326351165771484} -11/06/2021 23:26:55 - INFO - __main__ - Step 15512: {'lr': 0.0004897886669754251, 'samples': 2978304, 'steps': 15511, 'loss/train': 0.6337660551071167} -11/06/2021 23:26:56 - INFO - __main__ - Step 15513: {'lr': 0.0004897871657380373, 'samples': 2978496, 'steps': 15512, 'loss/train': 1.2955080270767212} -11/06/2021 23:26:56 - INFO - __main__ - Step 15514: {'lr': 0.0004897856643926051, 'samples': 2978688, 'steps': 15513, 'loss/train': 1.6480381488800049} -11/06/2021 23:26:57 - INFO - __main__ - Step 15515: {'lr': 0.0004897841629391291, 'samples': 2978880, 'steps': 15514, 'loss/train': 1.8163772821426392} -11/06/2021 23:26:57 - INFO - __main__ - Step 15516: {'lr': 0.0004897826613776101, 'samples': 2979072, 'steps': 15515, 'loss/train': 0.7295439839363098} -11/06/2021 23:26:57 - INFO - __main__ - Step 15517: {'lr': 0.0004897811597080488, 'samples': 2979264, 'steps': 15516, 'loss/train': 1.664631962776184} -11/06/2021 23:26:58 - INFO - __main__ - Step 15518: {'lr': 0.0004897796579304458, 'samples': 2979456, 'steps': 15517, 'loss/train': 2.0190608501434326} -11/06/2021 23:26:59 - INFO - __main__ - Step 15519: {'lr': 0.0004897781560448017, 'samples': 2979648, 'steps': 15518, 'loss/train': 2.086932897567749} -11/06/2021 23:26:59 - INFO - __main__ - Step 15520: {'lr': 0.0004897766540511173, 'samples': 2979840, 'steps': 15519, 'loss/train': 1.5068973302841187} -11/06/2021 23:26:59 - INFO - __main__ - Step 15521: {'lr': 0.0004897751519493933, 'samples': 2980032, 'steps': 15520, 'loss/train': 1.2962274551391602} -11/06/2021 23:27:00 - INFO - __main__ - Step 15522: {'lr': 0.0004897736497396303, 'samples': 2980224, 'steps': 15521, 'loss/train': 1.6107763051986694} -11/06/2021 23:27:00 - INFO - __main__ - Step 15523: {'lr': 0.000489772147421829, 'samples': 2980416, 'steps': 15522, 'loss/train': 1.9014201164245605} -11/06/2021 23:27:01 - INFO - __main__ - Step 15524: {'lr': 0.0004897706449959899, 'samples': 2980608, 'steps': 15523, 'loss/train': 0.9415351748466492} -11/06/2021 23:27:02 - INFO - __main__ - Step 15525: {'lr': 0.000489769142462114, 'samples': 2980800, 'steps': 15524, 'loss/train': 1.7568836212158203} -11/06/2021 23:27:02 - INFO - __main__ - Step 15526: {'lr': 0.0004897676398202018, 'samples': 2980992, 'steps': 15525, 'loss/train': 1.8288424015045166} -11/06/2021 23:27:02 - INFO - __main__ - Step 15527: {'lr': 0.000489766137070254, 'samples': 2981184, 'steps': 15526, 'loss/train': 1.7062444686889648} -11/06/2021 23:27:03 - INFO - __main__ - Step 15528: {'lr': 0.0004897646342122713, 'samples': 2981376, 'steps': 15527, 'loss/train': 1.133548378944397} -11/06/2021 23:27:04 - INFO - __main__ - Step 15529: {'lr': 0.0004897631312462544, 'samples': 2981568, 'steps': 15528, 'loss/train': 1.6974700689315796} -11/06/2021 23:27:04 - INFO - __main__ - Step 15530: {'lr': 0.0004897616281722038, 'samples': 2981760, 'steps': 15529, 'loss/train': 1.8842085599899292} -11/06/2021 23:27:04 - INFO - __main__ - Step 15531: {'lr': 0.0004897601249901204, 'samples': 2981952, 'steps': 15530, 'loss/train': 1.8136495351791382} -11/06/2021 23:27:05 - INFO - __main__ - Step 15532: {'lr': 0.0004897586217000047, 'samples': 2982144, 'steps': 15531, 'loss/train': 1.5027600526809692} -11/06/2021 23:27:05 - INFO - __main__ - Step 15533: {'lr': 0.0004897571183018576, 'samples': 2982336, 'steps': 15532, 'loss/train': 1.7708982229232788} -11/06/2021 23:27:06 - INFO - __main__ - Step 15534: {'lr': 0.0004897556147956796, 'samples': 2982528, 'steps': 15533, 'loss/train': 1.2645087242126465} -11/06/2021 23:27:06 - INFO - __main__ - Step 15535: {'lr': 0.0004897541111814714, 'samples': 2982720, 'steps': 15534, 'loss/train': 1.635704755783081} -11/06/2021 23:27:07 - INFO - __main__ - Step 15536: {'lr': 0.0004897526074592337, 'samples': 2982912, 'steps': 15535, 'loss/train': 1.6044889688491821} -11/06/2021 23:27:07 - INFO - __main__ - Step 15537: {'lr': 0.0004897511036289671, 'samples': 2983104, 'steps': 15536, 'loss/train': 1.1408244371414185} -11/06/2021 23:27:07 - INFO - __main__ - Step 15538: {'lr': 0.0004897495996906725, 'samples': 2983296, 'steps': 15537, 'loss/train': 1.5581918954849243} -11/06/2021 23:27:08 - INFO - __main__ - Step 15539: {'lr': 0.0004897480956443503, 'samples': 2983488, 'steps': 15538, 'loss/train': 1.4675657749176025} -11/06/2021 23:27:09 - INFO - __main__ - Step 15540: {'lr': 0.0004897465914900013, 'samples': 2983680, 'steps': 15539, 'loss/train': 1.6012563705444336} -11/06/2021 23:27:09 - INFO - __main__ - Step 15541: {'lr': 0.0004897450872276263, 'samples': 2983872, 'steps': 15540, 'loss/train': 1.357732892036438} -11/06/2021 23:27:10 - INFO - __main__ - Step 15542: {'lr': 0.0004897435828572258, 'samples': 2984064, 'steps': 15541, 'loss/train': 1.6430869102478027} -11/06/2021 23:27:10 - INFO - __main__ - Step 15543: {'lr': 0.0004897420783788006, 'samples': 2984256, 'steps': 15542, 'loss/train': 1.0916229486465454} -11/06/2021 23:27:10 - INFO - __main__ - Step 15544: {'lr': 0.0004897405737923511, 'samples': 2984448, 'steps': 15543, 'loss/train': 1.7726327180862427} -11/06/2021 23:27:11 - INFO - __main__ - Step 15545: {'lr': 0.0004897390690978785, 'samples': 2984640, 'steps': 15544, 'loss/train': 1.823258876800537} -11/06/2021 23:27:12 - INFO - __main__ - Step 15546: {'lr': 0.000489737564295383, 'samples': 2984832, 'steps': 15545, 'loss/train': 1.5735461711883545} -11/06/2021 23:27:12 - INFO - __main__ - Step 15547: {'lr': 0.0004897360593848655, 'samples': 2985024, 'steps': 15546, 'loss/train': 1.367332935333252} -11/06/2021 23:27:12 - INFO - __main__ - Step 15548: {'lr': 0.0004897345543663266, 'samples': 2985216, 'steps': 15547, 'loss/train': 0.22535571455955505} -11/06/2021 23:27:13 - INFO - __main__ - Step 15549: {'lr': 0.000489733049239767, 'samples': 2985408, 'steps': 15548, 'loss/train': 1.6396257877349854} -11/06/2021 23:27:14 - INFO - __main__ - Step 15550: {'lr': 0.0004897315440051874, 'samples': 2985600, 'steps': 15549, 'loss/train': 1.6046090126037598} -11/06/2021 23:27:14 - INFO - __main__ - Step 15551: {'lr': 0.0004897300386625885, 'samples': 2985792, 'steps': 15550, 'loss/train': 1.0172430276870728} -11/06/2021 23:27:15 - INFO - __main__ - Step 15552: {'lr': 0.0004897285332119709, 'samples': 2985984, 'steps': 15551, 'loss/train': 0.5910050272941589} -11/06/2021 23:27:15 - INFO - __main__ - Step 15553: {'lr': 0.0004897270276533355, 'samples': 2986176, 'steps': 15552, 'loss/train': 1.4002232551574707} -11/06/2021 23:27:16 - INFO - __main__ - Step 15554: {'lr': 0.0004897255219866825, 'samples': 2986368, 'steps': 15553, 'loss/train': 1.4650905132293701} -11/06/2021 23:27:16 - INFO - __main__ - Step 15555: {'lr': 0.000489724016212013, 'samples': 2986560, 'steps': 15554, 'loss/train': 0.7079336643218994} -11/06/2021 23:27:17 - INFO - __main__ - Step 15556: {'lr': 0.0004897225103293277, 'samples': 2986752, 'steps': 15555, 'loss/train': 1.5303819179534912} -11/06/2021 23:27:17 - INFO - __main__ - Step 15557: {'lr': 0.0004897210043386269, 'samples': 2986944, 'steps': 15556, 'loss/train': 1.7852060794830322} -11/06/2021 23:27:18 - INFO - __main__ - Step 15558: {'lr': 0.0004897194982399117, 'samples': 2987136, 'steps': 15557, 'loss/train': 1.5519731044769287} -11/06/2021 23:27:18 - INFO - __main__ - Step 15559: {'lr': 0.0004897179920331826, 'samples': 2987328, 'steps': 15558, 'loss/train': 1.4157203435897827} -11/06/2021 23:27:18 - INFO - __main__ - Step 15560: {'lr': 0.0004897164857184401, 'samples': 2987520, 'steps': 15559, 'loss/train': 1.7595874071121216} -11/06/2021 23:27:19 - INFO - __main__ - Step 15561: {'lr': 0.0004897149792956852, 'samples': 2987712, 'steps': 15560, 'loss/train': 1.732194185256958} -11/06/2021 23:27:20 - INFO - __main__ - Step 15562: {'lr': 0.0004897134727649184, 'samples': 2987904, 'steps': 15561, 'loss/train': 1.4084118604660034} -11/06/2021 23:27:20 - INFO - __main__ - Step 15563: {'lr': 0.0004897119661261403, 'samples': 2988096, 'steps': 15562, 'loss/train': 1.490355134010315} -11/06/2021 23:27:20 - INFO - __main__ - Step 15564: {'lr': 0.0004897104593793518, 'samples': 2988288, 'steps': 15563, 'loss/train': 1.779022455215454} -11/06/2021 23:27:21 - INFO - __main__ - Step 15565: {'lr': 0.0004897089525245535, 'samples': 2988480, 'steps': 15564, 'loss/train': 1.8259437084197998} -11/06/2021 23:27:22 - INFO - __main__ - Step 15566: {'lr': 0.000489707445561746, 'samples': 2988672, 'steps': 15565, 'loss/train': 1.727378010749817} -11/06/2021 23:27:22 - INFO - __main__ - Step 15567: {'lr': 0.0004897059384909299, 'samples': 2988864, 'steps': 15566, 'loss/train': 1.8309595584869385} -11/06/2021 23:27:23 - INFO - __main__ - Step 15568: {'lr': 0.0004897044313121061, 'samples': 2989056, 'steps': 15567, 'loss/train': 5.84039306640625} -11/06/2021 23:27:23 - INFO - __main__ - Step 15569: {'lr': 0.0004897029240252753, 'samples': 2989248, 'steps': 15568, 'loss/train': 1.787092685699463} -11/06/2021 23:27:23 - INFO - __main__ - Step 15570: {'lr': 0.000489701416630438, 'samples': 2989440, 'steps': 15569, 'loss/train': 1.3923110961914062} -11/06/2021 23:27:24 - INFO - __main__ - Step 15571: {'lr': 0.0004896999091275948, 'samples': 2989632, 'steps': 15570, 'loss/train': 0.7924749255180359} -11/06/2021 23:27:25 - INFO - __main__ - Step 15572: {'lr': 0.0004896984015167466, 'samples': 2989824, 'steps': 15571, 'loss/train': 1.4174809455871582} -11/06/2021 23:27:25 - INFO - __main__ - Step 15573: {'lr': 0.0004896968937978941, 'samples': 2990016, 'steps': 15572, 'loss/train': 1.8383560180664062} -11/06/2021 23:27:25 - INFO - __main__ - Step 15574: {'lr': 0.0004896953859710379, 'samples': 2990208, 'steps': 15573, 'loss/train': 1.6366064548492432} -11/06/2021 23:27:26 - INFO - __main__ - Step 15575: {'lr': 0.0004896938780361784, 'samples': 2990400, 'steps': 15574, 'loss/train': 1.5936790704727173} -11/06/2021 23:27:26 - INFO - __main__ - Step 15576: {'lr': 0.0004896923699933167, 'samples': 2990592, 'steps': 15575, 'loss/train': 1.7249995470046997} -11/06/2021 23:27:27 - INFO - __main__ - Step 15577: {'lr': 0.0004896908618424533, 'samples': 2990784, 'steps': 15576, 'loss/train': 2.0188241004943848} -11/06/2021 23:27:28 - INFO - __main__ - Step 15578: {'lr': 0.0004896893535835889, 'samples': 2990976, 'steps': 15577, 'loss/train': 1.7882033586502075} -11/06/2021 23:27:28 - INFO - __main__ - Step 15579: {'lr': 0.0004896878452167241, 'samples': 2991168, 'steps': 15578, 'loss/train': 1.9642932415008545} -11/06/2021 23:27:28 - INFO - __main__ - Step 15580: {'lr': 0.0004896863367418598, 'samples': 2991360, 'steps': 15579, 'loss/train': 1.1707956790924072} -11/06/2021 23:27:29 - INFO - __main__ - Step 15581: {'lr': 0.0004896848281589966, 'samples': 2991552, 'steps': 15580, 'loss/train': 1.590392827987671} -11/06/2021 23:27:29 - INFO - __main__ - Step 15582: {'lr': 0.0004896833194681349, 'samples': 2991744, 'steps': 15581, 'loss/train': 2.1214358806610107} -11/06/2021 23:27:30 - INFO - __main__ - Step 15583: {'lr': 0.0004896818106692757, 'samples': 2991936, 'steps': 15582, 'loss/train': 1.77946937084198} -11/06/2021 23:27:30 - INFO - __main__ - Step 15584: {'lr': 0.0004896803017624196, 'samples': 2992128, 'steps': 15583, 'loss/train': 1.9012962579727173} -11/06/2021 23:27:31 - INFO - __main__ - Step 15585: {'lr': 0.0004896787927475671, 'samples': 2992320, 'steps': 15584, 'loss/train': 1.8630757331848145} -11/06/2021 23:27:31 - INFO - __main__ - Step 15586: {'lr': 0.0004896772836247192, 'samples': 2992512, 'steps': 15585, 'loss/train': 1.8197124004364014} -11/06/2021 23:27:31 - INFO - __main__ - Step 15587: {'lr': 0.0004896757743938764, 'samples': 2992704, 'steps': 15586, 'loss/train': 1.4077614545822144} -11/06/2021 23:27:33 - INFO - __main__ - Step 15588: {'lr': 0.0004896742650550393, 'samples': 2992896, 'steps': 15587, 'loss/train': 1.6958098411560059} -11/06/2021 23:27:33 - INFO - __main__ - Step 15589: {'lr': 0.0004896727556082086, 'samples': 2993088, 'steps': 15588, 'loss/train': 1.470612645149231} -11/06/2021 23:27:34 - INFO - __main__ - Step 15590: {'lr': 0.0004896712460533854, 'samples': 2993280, 'steps': 15589, 'loss/train': 0.6105215549468994} -11/06/2021 23:27:34 - INFO - __main__ - Step 15591: {'lr': 0.0004896697363905697, 'samples': 2993472, 'steps': 15590, 'loss/train': 1.653200387954712} -11/06/2021 23:27:34 - INFO - __main__ - Step 15592: {'lr': 0.0004896682266197626, 'samples': 2993664, 'steps': 15591, 'loss/train': 1.4414596557617188} -11/06/2021 23:27:35 - INFO - __main__ - Step 15593: {'lr': 0.0004896667167409648, 'samples': 2993856, 'steps': 15592, 'loss/train': 1.5426613092422485} -11/06/2021 23:27:36 - INFO - __main__ - Step 15594: {'lr': 0.0004896652067541767, 'samples': 2994048, 'steps': 15593, 'loss/train': 1.6049456596374512} -11/06/2021 23:27:36 - INFO - __main__ - Step 15595: {'lr': 0.0004896636966593993, 'samples': 2994240, 'steps': 15594, 'loss/train': 1.4910203218460083} -11/06/2021 23:27:36 - INFO - __main__ - Step 15596: {'lr': 0.0004896621864566331, 'samples': 2994432, 'steps': 15595, 'loss/train': 1.6735210418701172} -11/06/2021 23:27:37 - INFO - __main__ - Step 15597: {'lr': 0.0004896606761458788, 'samples': 2994624, 'steps': 15596, 'loss/train': 1.6641515493392944} -11/06/2021 23:27:38 - INFO - __main__ - Step 15598: {'lr': 0.0004896591657271371, 'samples': 2994816, 'steps': 15597, 'loss/train': 1.6537212133407593} -11/06/2021 23:27:38 - INFO - __main__ - Step 15599: {'lr': 0.0004896576552004087, 'samples': 2995008, 'steps': 15598, 'loss/train': 2.4560248851776123} -11/06/2021 23:27:38 - INFO - __main__ - Step 15600: {'lr': 0.0004896561445656943, 'samples': 2995200, 'steps': 15599, 'loss/train': 1.4348224401474} -11/06/2021 23:27:39 - INFO - __main__ - Step 15601: {'lr': 0.0004896546338229945, 'samples': 2995392, 'steps': 15600, 'loss/train': 1.6731430292129517} -11/06/2021 23:27:39 - INFO - __main__ - Step 15602: {'lr': 0.00048965312297231, 'samples': 2995584, 'steps': 15601, 'loss/train': 1.7863247394561768} -11/06/2021 23:27:39 - INFO - __main__ - Step 15603: {'lr': 0.0004896516120136415, 'samples': 2995776, 'steps': 15602, 'loss/train': 1.5890967845916748} -11/06/2021 23:27:40 - INFO - __main__ - Step 15604: {'lr': 0.0004896501009469896, 'samples': 2995968, 'steps': 15603, 'loss/train': 1.6799132823944092} -11/06/2021 23:27:41 - INFO - __main__ - Step 15605: {'lr': 0.0004896485897723552, 'samples': 2996160, 'steps': 15604, 'loss/train': 1.8443701267242432} -11/06/2021 23:27:41 - INFO - __main__ - Step 15606: {'lr': 0.0004896470784897388, 'samples': 2996352, 'steps': 15605, 'loss/train': 1.6562256813049316} -11/06/2021 23:27:42 - INFO - __main__ - Step 15607: {'lr': 0.0004896455670991411, 'samples': 2996544, 'steps': 15606, 'loss/train': 1.9659929275512695} -11/06/2021 23:27:42 - INFO - __main__ - Step 15608: {'lr': 0.0004896440556005628, 'samples': 2996736, 'steps': 15607, 'loss/train': 1.765615463256836} -11/06/2021 23:27:43 - INFO - __main__ - Step 15609: {'lr': 0.0004896425439940047, 'samples': 2996928, 'steps': 15608, 'loss/train': 1.5836148262023926} -11/06/2021 23:27:43 - INFO - __main__ - Step 15610: {'lr': 0.0004896410322794673, 'samples': 2997120, 'steps': 15609, 'loss/train': 1.9341999292373657} -11/06/2021 23:27:44 - INFO - __main__ - Step 15611: {'lr': 0.0004896395204569512, 'samples': 2997312, 'steps': 15610, 'loss/train': 2.4479007720947266} -11/06/2021 23:27:44 - INFO - __main__ - Step 15612: {'lr': 0.0004896380085264573, 'samples': 2997504, 'steps': 15611, 'loss/train': 1.4598520994186401} -11/06/2021 23:27:45 - INFO - __main__ - Step 15613: {'lr': 0.0004896364964879864, 'samples': 2997696, 'steps': 15612, 'loss/train': 1.7066932916641235} -11/06/2021 23:27:46 - INFO - __main__ - Step 15614: {'lr': 0.0004896349843415389, 'samples': 2997888, 'steps': 15613, 'loss/train': 1.8551546335220337} -11/06/2021 23:27:46 - INFO - __main__ - Step 15615: {'lr': 0.0004896334720871156, 'samples': 2998080, 'steps': 15614, 'loss/train': 1.7236617803573608} -11/06/2021 23:27:46 - INFO - __main__ - Step 15616: {'lr': 0.0004896319597247169, 'samples': 2998272, 'steps': 15615, 'loss/train': 1.543269157409668} -11/06/2021 23:27:47 - INFO - __main__ - Step 15617: {'lr': 0.0004896304472543439, 'samples': 2998464, 'steps': 15616, 'loss/train': 1.2389189004898071} -11/06/2021 23:27:47 - INFO - __main__ - Step 15618: {'lr': 0.0004896289346759973, 'samples': 2998656, 'steps': 15617, 'loss/train': 1.4939310550689697} -11/06/2021 23:27:47 - INFO - __main__ - Step 15619: {'lr': 0.0004896274219896773, 'samples': 2998848, 'steps': 15618, 'loss/train': 1.4448155164718628} -11/06/2021 23:27:49 - INFO - __main__ - Step 15620: {'lr': 0.000489625909195385, 'samples': 2999040, 'steps': 15619, 'loss/train': 1.5308935642242432} -11/06/2021 23:27:49 - INFO - __main__ - Step 15621: {'lr': 0.0004896243962931211, 'samples': 2999232, 'steps': 15620, 'loss/train': 1.9983116388320923} -11/06/2021 23:27:49 - INFO - __main__ - Step 15622: {'lr': 0.0004896228832828861, 'samples': 2999424, 'steps': 15621, 'loss/train': 1.443530559539795} -11/06/2021 23:27:50 - INFO - __main__ - Step 15623: {'lr': 0.0004896213701646806, 'samples': 2999616, 'steps': 15622, 'loss/train': 1.5524290800094604} -11/06/2021 23:27:50 - INFO - __main__ - Step 15624: {'lr': 0.0004896198569385055, 'samples': 2999808, 'steps': 15623, 'loss/train': 1.7541719675064087} -11/06/2021 23:27:51 - INFO - __main__ - Step 15625: {'lr': 0.0004896183436043613, 'samples': 3000000, 'steps': 15624, 'loss/train': 1.905300498008728} -11/06/2021 23:27:51 - INFO - __main__ - Step 15626: {'lr': 0.0004896168301622488, 'samples': 3000192, 'steps': 15625, 'loss/train': 1.9676408767700195} -11/06/2021 23:27:52 - INFO - __main__ - Step 15627: {'lr': 0.0004896153166121688, 'samples': 3000384, 'steps': 15626, 'loss/train': 1.2466262578964233} -11/06/2021 23:27:52 - INFO - __main__ - Step 15628: {'lr': 0.0004896138029541217, 'samples': 3000576, 'steps': 15627, 'loss/train': 1.6408860683441162} -11/06/2021 23:27:52 - INFO - __main__ - Step 15629: {'lr': 0.0004896122891881083, 'samples': 3000768, 'steps': 15628, 'loss/train': 1.4601120948791504} -11/06/2021 23:27:53 - INFO - __main__ - Step 15630: {'lr': 0.0004896107753141293, 'samples': 3000960, 'steps': 15629, 'loss/train': 1.7563142776489258} -11/06/2021 23:27:54 - INFO - __main__ - Step 15631: {'lr': 0.0004896092613321854, 'samples': 3001152, 'steps': 15630, 'loss/train': 2.3639023303985596} -11/06/2021 23:27:54 - INFO - __main__ - Step 15632: {'lr': 0.0004896077472422773, 'samples': 3001344, 'steps': 15631, 'loss/train': 1.8587177991867065} -11/06/2021 23:27:54 - INFO - __main__ - Step 15633: {'lr': 0.0004896062330444057, 'samples': 3001536, 'steps': 15632, 'loss/train': 1.8706539869308472} -11/06/2021 23:27:55 - INFO - __main__ - Step 15634: {'lr': 0.0004896047187385711, 'samples': 3001728, 'steps': 15633, 'loss/train': 1.3826926946640015} -11/06/2021 23:27:56 - INFO - __main__ - Step 15635: {'lr': 0.0004896032043247744, 'samples': 3001920, 'steps': 15634, 'loss/train': 1.9541095495224} -11/06/2021 23:27:56 - INFO - __main__ - Step 15636: {'lr': 0.0004896016898030161, 'samples': 3002112, 'steps': 15635, 'loss/train': 1.0642521381378174} -11/06/2021 23:27:57 - INFO - __main__ - Step 15637: {'lr': 0.0004896001751732971, 'samples': 3002304, 'steps': 15636, 'loss/train': 0.9917707443237305} -11/06/2021 23:27:57 - INFO - __main__ - Step 15638: {'lr': 0.0004895986604356178, 'samples': 3002496, 'steps': 15637, 'loss/train': 1.6697584390640259} -11/06/2021 23:27:57 - INFO - __main__ - Step 15639: {'lr': 0.0004895971455899792, 'samples': 3002688, 'steps': 15638, 'loss/train': 1.6163402795791626} -11/06/2021 23:27:58 - INFO - __main__ - Step 15640: {'lr': 0.0004895956306363818, 'samples': 3002880, 'steps': 15639, 'loss/train': 0.30415403842926025} -11/06/2021 23:27:59 - INFO - __main__ - Step 15641: {'lr': 0.0004895941155748263, 'samples': 3003072, 'steps': 15640, 'loss/train': 1.7623761892318726} -11/06/2021 23:27:59 - INFO - __main__ - Step 15642: {'lr': 0.0004895926004053133, 'samples': 3003264, 'steps': 15641, 'loss/train': 1.5293596982955933} -11/06/2021 23:27:59 - INFO - __main__ - Step 15643: {'lr': 0.0004895910851278436, 'samples': 3003456, 'steps': 15642, 'loss/train': 1.518384575843811} -11/06/2021 23:28:00 - INFO - __main__ - Step 15644: {'lr': 0.0004895895697424179, 'samples': 3003648, 'steps': 15643, 'loss/train': 1.6720932722091675} -11/06/2021 23:28:00 - INFO - __main__ - Step 15645: {'lr': 0.0004895880542490369, 'samples': 3003840, 'steps': 15644, 'loss/train': 1.7592436075210571} -11/06/2021 23:28:01 - INFO - __main__ - Step 15646: {'lr': 0.0004895865386477011, 'samples': 3004032, 'steps': 15645, 'loss/train': 0.32387545704841614} -11/06/2021 23:28:02 - INFO - __main__ - Step 15647: {'lr': 0.0004895850229384113, 'samples': 3004224, 'steps': 15646, 'loss/train': 1.4493197202682495} -11/06/2021 23:28:02 - INFO - __main__ - Step 15648: {'lr': 0.0004895835071211682, 'samples': 3004416, 'steps': 15647, 'loss/train': 1.6152663230895996} -11/06/2021 23:28:02 - INFO - __main__ - Step 15649: {'lr': 0.0004895819911959725, 'samples': 3004608, 'steps': 15648, 'loss/train': 0.838192343711853} -11/06/2021 23:28:03 - INFO - __main__ - Step 15650: {'lr': 0.0004895804751628249, 'samples': 3004800, 'steps': 15649, 'loss/train': 1.9193270206451416} -11/06/2021 23:28:04 - INFO - __main__ - Step 15651: {'lr': 0.0004895789590217259, 'samples': 3004992, 'steps': 15650, 'loss/train': 1.8412024974822998} -11/06/2021 23:28:04 - INFO - __main__ - Step 15652: {'lr': 0.0004895774427726764, 'samples': 3005184, 'steps': 15651, 'loss/train': 1.4921084642410278} -11/06/2021 23:28:04 - INFO - __main__ - Step 15653: {'lr': 0.000489575926415677, 'samples': 3005376, 'steps': 15652, 'loss/train': 0.7553501725196838} -11/06/2021 23:28:05 - INFO - __main__ - Step 15654: {'lr': 0.0004895744099507284, 'samples': 3005568, 'steps': 15653, 'loss/train': 1.9209213256835938} -11/06/2021 23:28:05 - INFO - __main__ - Step 15655: {'lr': 0.0004895728933778313, 'samples': 3005760, 'steps': 15654, 'loss/train': 1.9080966711044312} -11/06/2021 23:28:06 - INFO - __main__ - Step 15656: {'lr': 0.0004895713766969863, 'samples': 3005952, 'steps': 15655, 'loss/train': 1.7056766748428345} -11/06/2021 23:28:06 - INFO - __main__ - Step 15657: {'lr': 0.0004895698599081942, 'samples': 3006144, 'steps': 15656, 'loss/train': 0.8188896775245667} -11/06/2021 23:28:07 - INFO - __main__ - Step 15658: {'lr': 0.0004895683430114555, 'samples': 3006336, 'steps': 15657, 'loss/train': 1.6825709342956543} -11/06/2021 23:28:07 - INFO - __main__ - Step 15659: {'lr': 0.0004895668260067711, 'samples': 3006528, 'steps': 15658, 'loss/train': 1.427496314048767} -11/06/2021 23:28:07 - INFO - __main__ - Step 15660: {'lr': 0.0004895653088941416, 'samples': 3006720, 'steps': 15659, 'loss/train': 1.5132235288619995} -11/06/2021 23:28:09 - INFO - __main__ - Step 15661: {'lr': 0.0004895637916735675, 'samples': 3006912, 'steps': 15660, 'loss/train': 2.0918915271759033} -11/06/2021 23:28:09 - INFO - __main__ - Step 15662: {'lr': 0.0004895622743450497, 'samples': 3007104, 'steps': 15661, 'loss/train': 1.9682589769363403} -11/06/2021 23:28:09 - INFO - __main__ - Step 15663: {'lr': 0.000489560756908589, 'samples': 3007296, 'steps': 15662, 'loss/train': 1.5035189390182495} -11/06/2021 23:28:10 - INFO - __main__ - Step 15664: {'lr': 0.0004895592393641858, 'samples': 3007488, 'steps': 15663, 'loss/train': 2.122490406036377} -11/06/2021 23:28:10 - INFO - __main__ - Step 15665: {'lr': 0.0004895577217118408, 'samples': 3007680, 'steps': 15664, 'loss/train': 1.6128400564193726} -11/06/2021 23:28:10 - INFO - __main__ - Step 15666: {'lr': 0.000489556203951555, 'samples': 3007872, 'steps': 15665, 'loss/train': 1.7595479488372803} -11/06/2021 23:28:11 - INFO - __main__ - Step 15667: {'lr': 0.0004895546860833287, 'samples': 3008064, 'steps': 15666, 'loss/train': 1.5410199165344238} -11/06/2021 23:28:12 - INFO - __main__ - Step 15668: {'lr': 0.000489553168107163, 'samples': 3008256, 'steps': 15667, 'loss/train': 1.6218812465667725} -11/06/2021 23:28:12 - INFO - __main__ - Step 15669: {'lr': 0.0004895516500230581, 'samples': 3008448, 'steps': 15668, 'loss/train': 1.6784151792526245} -11/06/2021 23:28:12 - INFO - __main__ - Step 15670: {'lr': 0.000489550131831015, 'samples': 3008640, 'steps': 15669, 'loss/train': 1.0655637979507446} -11/06/2021 23:28:13 - INFO - __main__ - Step 15671: {'lr': 0.0004895486135310343, 'samples': 3008832, 'steps': 15670, 'loss/train': 1.7083613872528076} -11/06/2021 23:28:14 - INFO - __main__ - Step 15672: {'lr': 0.0004895470951231166, 'samples': 3009024, 'steps': 15671, 'loss/train': 1.3929165601730347} -11/06/2021 23:28:14 - INFO - __main__ - Step 15673: {'lr': 0.0004895455766072629, 'samples': 3009216, 'steps': 15672, 'loss/train': 1.3593981266021729} -11/06/2021 23:28:15 - INFO - __main__ - Step 15674: {'lr': 0.0004895440579834736, 'samples': 3009408, 'steps': 15673, 'loss/train': 2.2362141609191895} -11/06/2021 23:28:15 - INFO - __main__ - Step 15675: {'lr': 0.0004895425392517493, 'samples': 3009600, 'steps': 15674, 'loss/train': 1.799658179283142} -11/06/2021 23:28:15 - INFO - __main__ - Step 15676: {'lr': 0.0004895410204120909, 'samples': 3009792, 'steps': 15675, 'loss/train': 0.6833590865135193} -11/06/2021 23:28:16 - INFO - __main__ - Step 15677: {'lr': 0.000489539501464499, 'samples': 3009984, 'steps': 15676, 'loss/train': 1.8790018558502197} -11/06/2021 23:28:17 - INFO - __main__ - Step 15678: {'lr': 0.0004895379824089743, 'samples': 3010176, 'steps': 15677, 'loss/train': 1.4177005290985107} -11/06/2021 23:28:17 - INFO - __main__ - Step 15679: {'lr': 0.0004895364632455175, 'samples': 3010368, 'steps': 15678, 'loss/train': 1.675038456916809} -11/06/2021 23:28:18 - INFO - __main__ - Step 15680: {'lr': 0.0004895349439741292, 'samples': 3010560, 'steps': 15679, 'loss/train': 1.6020910739898682} -11/06/2021 23:28:18 - INFO - __main__ - Step 15681: {'lr': 0.0004895334245948103, 'samples': 3010752, 'steps': 15680, 'loss/train': 1.6132880449295044} -11/06/2021 23:28:18 - INFO - __main__ - Step 15682: {'lr': 0.0004895319051075612, 'samples': 3010944, 'steps': 15681, 'loss/train': 1.2223986387252808} -11/06/2021 23:28:19 - INFO - __main__ - Step 15683: {'lr': 0.0004895303855123828, 'samples': 3011136, 'steps': 15682, 'loss/train': 1.8160881996154785} -11/06/2021 23:28:20 - INFO - __main__ - Step 15684: {'lr': 0.0004895288658092757, 'samples': 3011328, 'steps': 15683, 'loss/train': 1.8735129833221436} -11/06/2021 23:28:20 - INFO - __main__ - Step 15685: {'lr': 0.0004895273459982406, 'samples': 3011520, 'steps': 15684, 'loss/train': 2.2502872943878174} -11/06/2021 23:28:20 - INFO - __main__ - Step 15686: {'lr': 0.0004895258260792781, 'samples': 3011712, 'steps': 15685, 'loss/train': 1.674849271774292} -11/06/2021 23:28:21 - INFO - __main__ - Step 15687: {'lr': 0.0004895243060523889, 'samples': 3011904, 'steps': 15686, 'loss/train': 1.7530903816223145} -11/06/2021 23:28:22 - INFO - __main__ - Step 15688: {'lr': 0.0004895227859175739, 'samples': 3012096, 'steps': 15687, 'loss/train': 1.8542940616607666} -11/06/2021 23:28:22 - INFO - __main__ - Step 15689: {'lr': 0.0004895212656748336, 'samples': 3012288, 'steps': 15688, 'loss/train': 1.7547863721847534} -11/06/2021 23:28:23 - INFO - __main__ - Step 15690: {'lr': 0.0004895197453241687, 'samples': 3012480, 'steps': 15689, 'loss/train': 1.8645319938659668} -11/06/2021 23:28:23 - INFO - __main__ - Step 15691: {'lr': 0.0004895182248655798, 'samples': 3012672, 'steps': 15690, 'loss/train': 1.0751885175704956} -11/06/2021 23:28:23 - INFO - __main__ - Step 15692: {'lr': 0.0004895167042990678, 'samples': 3012864, 'steps': 15691, 'loss/train': 1.3243579864501953} -11/06/2021 23:28:24 - INFO - __main__ - Step 15693: {'lr': 0.0004895151836246332, 'samples': 3013056, 'steps': 15692, 'loss/train': 0.8072070479393005} -11/06/2021 23:28:25 - INFO - __main__ - Step 15694: {'lr': 0.0004895136628422767, 'samples': 3013248, 'steps': 15693, 'loss/train': 1.9552663564682007} -11/06/2021 23:28:25 - INFO - __main__ - Step 15695: {'lr': 0.0004895121419519992, 'samples': 3013440, 'steps': 15694, 'loss/train': 1.4452375173568726} -11/06/2021 23:28:25 - INFO - __main__ - Step 15696: {'lr': 0.0004895106209538011, 'samples': 3013632, 'steps': 15695, 'loss/train': 1.48054039478302} -11/06/2021 23:28:26 - INFO - __main__ - Step 15697: {'lr': 0.0004895090998476833, 'samples': 3013824, 'steps': 15696, 'loss/train': 1.7760313749313354} -11/06/2021 23:28:27 - INFO - __main__ - Step 15698: {'lr': 0.0004895075786336463, 'samples': 3014016, 'steps': 15697, 'loss/train': 3.4259486198425293} -11/06/2021 23:28:27 - INFO - __main__ - Step 15699: {'lr': 0.000489506057311691, 'samples': 3014208, 'steps': 15698, 'loss/train': 1.669292688369751} -11/06/2021 23:28:28 - INFO - __main__ - Step 15700: {'lr': 0.0004895045358818179, 'samples': 3014400, 'steps': 15699, 'loss/train': 1.6699222326278687} -11/06/2021 23:28:28 - INFO - __main__ - Step 15701: {'lr': 0.0004895030143440278, 'samples': 3014592, 'steps': 15700, 'loss/train': 1.9887073040008545} -11/06/2021 23:28:28 - INFO - __main__ - Step 15702: {'lr': 0.0004895014926983212, 'samples': 3014784, 'steps': 15701, 'loss/train': 2.682663679122925} -11/06/2021 23:28:30 - INFO - __main__ - Step 15703: {'lr': 0.0004894999709446991, 'samples': 3014976, 'steps': 15702, 'loss/train': 1.6473217010498047} -11/06/2021 23:28:31 - INFO - __main__ - Step 15704: {'lr': 0.0004894984490831619, 'samples': 3015168, 'steps': 15703, 'loss/train': 1.7859365940093994} -11/06/2021 23:28:31 - INFO - __main__ - Step 15705: {'lr': 0.0004894969271137104, 'samples': 3015360, 'steps': 15704, 'loss/train': 1.9558829069137573} -11/06/2021 23:28:31 - INFO - __main__ - Step 15706: {'lr': 0.0004894954050363452, 'samples': 3015552, 'steps': 15705, 'loss/train': 0.8179440498352051} -11/06/2021 23:28:32 - INFO - __main__ - Step 15707: {'lr': 0.0004894938828510672, 'samples': 3015744, 'steps': 15706, 'loss/train': 1.4025057554244995} -11/06/2021 23:28:32 - INFO - __main__ - Step 15708: {'lr': 0.000489492360557877, 'samples': 3015936, 'steps': 15707, 'loss/train': 1.384521722793579} -11/06/2021 23:28:32 - INFO - __main__ - Step 15709: {'lr': 0.0004894908381567751, 'samples': 3016128, 'steps': 15708, 'loss/train': 1.8304907083511353} -11/06/2021 23:28:33 - INFO - __main__ - Step 15710: {'lr': 0.0004894893156477623, 'samples': 3016320, 'steps': 15709, 'loss/train': 1.7960162162780762} -11/06/2021 23:28:34 - INFO - __main__ - Step 15711: {'lr': 0.0004894877930308395, 'samples': 3016512, 'steps': 15710, 'loss/train': 0.9428093433380127} -11/06/2021 23:28:34 - INFO - __main__ - Step 15712: {'lr': 0.0004894862703060071, 'samples': 3016704, 'steps': 15711, 'loss/train': 1.633742094039917} -11/06/2021 23:28:35 - INFO - __main__ - Step 15713: {'lr': 0.0004894847474732658, 'samples': 3016896, 'steps': 15712, 'loss/train': 1.6129860877990723} -11/06/2021 23:28:35 - INFO - __main__ - Step 15714: {'lr': 0.0004894832245326165, 'samples': 3017088, 'steps': 15713, 'loss/train': 1.7154533863067627} -11/06/2021 23:28:36 - INFO - __main__ - Step 15715: {'lr': 0.0004894817014840597, 'samples': 3017280, 'steps': 15714, 'loss/train': 0.8715106844902039} -11/06/2021 23:28:36 - INFO - __main__ - Step 15716: {'lr': 0.0004894801783275961, 'samples': 3017472, 'steps': 15715, 'loss/train': 1.5612425804138184} -11/06/2021 23:28:37 - INFO - __main__ - Step 15717: {'lr': 0.0004894786550632264, 'samples': 3017664, 'steps': 15716, 'loss/train': 1.774351954460144} -11/06/2021 23:28:37 - INFO - __main__ - Step 15718: {'lr': 0.0004894771316909514, 'samples': 3017856, 'steps': 15717, 'loss/train': 1.6608457565307617} -11/06/2021 23:28:38 - INFO - __main__ - Step 15719: {'lr': 0.0004894756082107717, 'samples': 3018048, 'steps': 15718, 'loss/train': 1.3828167915344238} -11/06/2021 23:28:38 - INFO - __main__ - Step 15720: {'lr': 0.0004894740846226879, 'samples': 3018240, 'steps': 15719, 'loss/train': 1.9708067178726196} -11/06/2021 23:28:39 - INFO - __main__ - Step 15721: {'lr': 0.0004894725609267009, 'samples': 3018432, 'steps': 15720, 'loss/train': 1.6421191692352295} -11/06/2021 23:28:39 - INFO - __main__ - Step 15722: {'lr': 0.0004894710371228111, 'samples': 3018624, 'steps': 15721, 'loss/train': 1.9015141725540161} -11/06/2021 23:28:40 - INFO - __main__ - Step 15723: {'lr': 0.0004894695132110196, 'samples': 3018816, 'steps': 15722, 'loss/train': 1.9826589822769165} -11/06/2021 23:28:40 - INFO - __main__ - Step 15724: {'lr': 0.0004894679891913266, 'samples': 3019008, 'steps': 15723, 'loss/train': 1.9029018878936768} -11/06/2021 23:28:40 - INFO - __main__ - Step 15725: {'lr': 0.000489466465063733, 'samples': 3019200, 'steps': 15724, 'loss/train': 1.4145636558532715} -11/06/2021 23:28:41 - INFO - __main__ - Step 15726: {'lr': 0.0004894649408282396, 'samples': 3019392, 'steps': 15725, 'loss/train': 1.6551494598388672} -11/06/2021 23:28:42 - INFO - __main__ - Step 15727: {'lr': 0.000489463416484847, 'samples': 3019584, 'steps': 15726, 'loss/train': 1.8325507640838623} -11/06/2021 23:28:42 - INFO - __main__ - Step 15728: {'lr': 0.0004894618920335558, 'samples': 3019776, 'steps': 15727, 'loss/train': 1.8709338903427124} -11/06/2021 23:28:43 - INFO - __main__ - Step 15729: {'lr': 0.0004894603674743668, 'samples': 3019968, 'steps': 15728, 'loss/train': 1.7608121633529663} -11/06/2021 23:28:43 - INFO - __main__ - Step 15730: {'lr': 0.0004894588428072808, 'samples': 3020160, 'steps': 15729, 'loss/train': 1.6138921976089478} -11/06/2021 23:28:43 - INFO - __main__ - Step 15731: {'lr': 0.0004894573180322982, 'samples': 3020352, 'steps': 15730, 'loss/train': 1.558252215385437} -11/06/2021 23:28:44 - INFO - __main__ - Step 15732: {'lr': 0.0004894557931494199, 'samples': 3020544, 'steps': 15731, 'loss/train': 1.370026707649231} -11/06/2021 23:28:45 - INFO - __main__ - Step 15733: {'lr': 0.0004894542681586465, 'samples': 3020736, 'steps': 15732, 'loss/train': 1.6896443367004395} -11/06/2021 23:28:45 - INFO - __main__ - Step 15734: {'lr': 0.0004894527430599786, 'samples': 3020928, 'steps': 15733, 'loss/train': 1.5409351587295532} -11/06/2021 23:28:45 - INFO - __main__ - Step 15735: {'lr': 0.0004894512178534171, 'samples': 3021120, 'steps': 15734, 'loss/train': 1.5735464096069336} -11/06/2021 23:28:46 - INFO - __main__ - Step 15736: {'lr': 0.0004894496925389625, 'samples': 3021312, 'steps': 15735, 'loss/train': 2.1567623615264893} -11/06/2021 23:28:47 - INFO - __main__ - Step 15737: {'lr': 0.0004894481671166155, 'samples': 3021504, 'steps': 15736, 'loss/train': 1.9780317544937134} -11/06/2021 23:28:47 - INFO - __main__ - Step 15738: {'lr': 0.0004894466415863771, 'samples': 3021696, 'steps': 15737, 'loss/train': 1.610995888710022} -11/06/2021 23:28:48 - INFO - __main__ - Step 15739: {'lr': 0.0004894451159482476, 'samples': 3021888, 'steps': 15738, 'loss/train': 1.5764869451522827} -11/06/2021 23:28:48 - INFO - __main__ - Step 15740: {'lr': 0.0004894435902022277, 'samples': 3022080, 'steps': 15739, 'loss/train': 1.3114335536956787} -11/06/2021 23:28:48 - INFO - __main__ - Step 15741: {'lr': 0.0004894420643483184, 'samples': 3022272, 'steps': 15740, 'loss/train': 1.8506090641021729} -11/06/2021 23:28:50 - INFO - __main__ - Step 15742: {'lr': 0.0004894405383865201, 'samples': 3022464, 'steps': 15741, 'loss/train': 1.5209318399429321} -11/06/2021 23:28:50 - INFO - __main__ - Step 15743: {'lr': 0.0004894390123168337, 'samples': 3022656, 'steps': 15742, 'loss/train': 1.4575647115707397} -11/06/2021 23:28:50 - INFO - __main__ - Step 15744: {'lr': 0.0004894374861392596, 'samples': 3022848, 'steps': 15743, 'loss/train': 2.133335828781128} -11/06/2021 23:28:51 - INFO - __main__ - Step 15745: {'lr': 0.0004894359598537987, 'samples': 3023040, 'steps': 15744, 'loss/train': 1.7577073574066162} -11/06/2021 23:28:52 - INFO - __main__ - Step 15746: {'lr': 0.0004894344334604517, 'samples': 3023232, 'steps': 15745, 'loss/train': 0.9471118450164795} -11/06/2021 23:28:52 - INFO - __main__ - Step 15747: {'lr': 0.0004894329069592192, 'samples': 3023424, 'steps': 15746, 'loss/train': 1.9907408952713013} -11/06/2021 23:28:53 - INFO - __main__ - Step 15748: {'lr': 0.000489431380350102, 'samples': 3023616, 'steps': 15747, 'loss/train': 2.8583734035491943} -11/06/2021 23:28:53 - INFO - __main__ - Step 15749: {'lr': 0.0004894298536331007, 'samples': 3023808, 'steps': 15748, 'loss/train': 0.6665930151939392} -11/06/2021 23:28:53 - INFO - __main__ - Step 15750: {'lr': 0.000489428326808216, 'samples': 3024000, 'steps': 15749, 'loss/train': 1.0621652603149414} -11/06/2021 23:28:54 - INFO - __main__ - Step 15751: {'lr': 0.0004894267998754486, 'samples': 3024192, 'steps': 15750, 'loss/train': 1.5037894248962402} -11/06/2021 23:28:55 - INFO - __main__ - Step 15752: {'lr': 0.0004894252728347992, 'samples': 3024384, 'steps': 15751, 'loss/train': 1.6653718948364258} -11/06/2021 23:28:55 - INFO - __main__ - Step 15753: {'lr': 0.0004894237456862684, 'samples': 3024576, 'steps': 15752, 'loss/train': 1.7493863105773926} -11/06/2021 23:28:55 - INFO - __main__ - Step 15754: {'lr': 0.000489422218429857, 'samples': 3024768, 'steps': 15753, 'loss/train': 1.5917749404907227} -11/06/2021 23:28:56 - INFO - __main__ - Step 15755: {'lr': 0.0004894206910655656, 'samples': 3024960, 'steps': 15754, 'loss/train': 1.5232791900634766} -11/06/2021 23:28:56 - INFO - __main__ - Step 15756: {'lr': 0.0004894191635933949, 'samples': 3025152, 'steps': 15755, 'loss/train': 2.1717846393585205} -11/06/2021 23:28:57 - INFO - __main__ - Step 15757: {'lr': 0.0004894176360133456, 'samples': 3025344, 'steps': 15756, 'loss/train': 1.9181817770004272} -11/06/2021 23:28:58 - INFO - __main__ - Step 15758: {'lr': 0.0004894161083254186, 'samples': 3025536, 'steps': 15757, 'loss/train': 2.2715911865234375} -11/06/2021 23:28:58 - INFO - __main__ - Step 15759: {'lr': 0.0004894145805296143, 'samples': 3025728, 'steps': 15758, 'loss/train': 1.8335258960723877} -11/06/2021 23:28:58 - INFO - __main__ - Step 15760: {'lr': 0.0004894130526259334, 'samples': 3025920, 'steps': 15759, 'loss/train': 1.284491777420044} -11/06/2021 23:28:59 - INFO - __main__ - Step 15761: {'lr': 0.0004894115246143768, 'samples': 3026112, 'steps': 15760, 'loss/train': 1.778687834739685} -11/06/2021 23:29:00 - INFO - __main__ - Step 15762: {'lr': 0.0004894099964949449, 'samples': 3026304, 'steps': 15761, 'loss/train': 1.093184471130371} -11/06/2021 23:29:00 - INFO - __main__ - Step 15763: {'lr': 0.0004894084682676387, 'samples': 3026496, 'steps': 15762, 'loss/train': 1.5207335948944092} -11/06/2021 23:29:01 - INFO - __main__ - Step 15764: {'lr': 0.0004894069399324586, 'samples': 3026688, 'steps': 15763, 'loss/train': 1.5955839157104492} -11/06/2021 23:29:01 - INFO - __main__ - Step 15765: {'lr': 0.0004894054114894055, 'samples': 3026880, 'steps': 15764, 'loss/train': 1.9538586139678955} -11/06/2021 23:29:01 - INFO - __main__ - Step 15766: {'lr': 0.00048940388293848, 'samples': 3027072, 'steps': 15765, 'loss/train': 1.9052053689956665} -11/06/2021 23:29:02 - INFO - __main__ - Step 15767: {'lr': 0.000489402354279683, 'samples': 3027264, 'steps': 15766, 'loss/train': 1.6094344854354858} -11/06/2021 23:29:03 - INFO - __main__ - Step 15768: {'lr': 0.0004894008255130147, 'samples': 3027456, 'steps': 15767, 'loss/train': 1.5516875982284546} -11/06/2021 23:29:03 - INFO - __main__ - Step 15769: {'lr': 0.0004893992966384762, 'samples': 3027648, 'steps': 15768, 'loss/train': 2.32871675491333} -11/06/2021 23:29:03 - INFO - __main__ - Step 15770: {'lr': 0.0004893977676560682, 'samples': 3027840, 'steps': 15769, 'loss/train': 1.62233567237854} -11/06/2021 23:29:04 - INFO - __main__ - Step 15771: {'lr': 0.000489396238565791, 'samples': 3028032, 'steps': 15770, 'loss/train': 1.8400375843048096} -11/06/2021 23:29:05 - INFO - __main__ - Step 15772: {'lr': 0.0004893947093676458, 'samples': 3028224, 'steps': 15771, 'loss/train': 1.4160466194152832} -11/06/2021 23:29:05 - INFO - __main__ - Step 15773: {'lr': 0.0004893931800616329, 'samples': 3028416, 'steps': 15772, 'loss/train': 1.8800396919250488} -11/06/2021 23:29:06 - INFO - __main__ - Step 15774: {'lr': 0.0004893916506477532, 'samples': 3028608, 'steps': 15773, 'loss/train': 1.4598236083984375} -11/06/2021 23:29:06 - INFO - __main__ - Step 15775: {'lr': 0.0004893901211260073, 'samples': 3028800, 'steps': 15774, 'loss/train': 1.329248309135437} -11/06/2021 23:29:06 - INFO - __main__ - Step 15776: {'lr': 0.0004893885914963958, 'samples': 3028992, 'steps': 15775, 'loss/train': 1.977927565574646} -11/06/2021 23:29:07 - INFO - __main__ - Step 15777: {'lr': 0.0004893870617589196, 'samples': 3029184, 'steps': 15776, 'loss/train': 2.081711530685425} -11/06/2021 23:29:08 - INFO - __main__ - Step 15778: {'lr': 0.0004893855319135791, 'samples': 3029376, 'steps': 15777, 'loss/train': 1.1884722709655762} -11/06/2021 23:29:08 - INFO - __main__ - Step 15779: {'lr': 0.0004893840019603754, 'samples': 3029568, 'steps': 15778, 'loss/train': 1.492553949356079} -11/06/2021 23:29:08 - INFO - __main__ - Step 15780: {'lr': 0.0004893824718993088, 'samples': 3029760, 'steps': 15779, 'loss/train': 1.4190195798873901} -11/06/2021 23:29:09 - INFO - __main__ - Step 15781: {'lr': 0.0004893809417303803, 'samples': 3029952, 'steps': 15780, 'loss/train': 1.5243641138076782} -11/06/2021 23:29:09 - INFO - __main__ - Step 15782: {'lr': 0.0004893794114535905, 'samples': 3030144, 'steps': 15781, 'loss/train': 1.7579809427261353} -11/06/2021 23:29:10 - INFO - __main__ - Step 15783: {'lr': 0.0004893778810689399, 'samples': 3030336, 'steps': 15782, 'loss/train': 5.995852470397949} -11/06/2021 23:29:11 - INFO - __main__ - Step 15784: {'lr': 0.0004893763505764292, 'samples': 3030528, 'steps': 15783, 'loss/train': 1.6866079568862915} -11/06/2021 23:29:11 - INFO - __main__ - Step 15785: {'lr': 0.0004893748199760594, 'samples': 3030720, 'steps': 15784, 'loss/train': 2.882068157196045} -11/06/2021 23:29:11 - INFO - __main__ - Step 15786: {'lr': 0.0004893732892678309, 'samples': 3030912, 'steps': 15785, 'loss/train': 1.8355077505111694} -11/06/2021 23:29:12 - INFO - __main__ - Step 15787: {'lr': 0.0004893717584517445, 'samples': 3031104, 'steps': 15786, 'loss/train': 1.4316880702972412} -11/06/2021 23:29:12 - INFO - __main__ - Step 15788: {'lr': 0.000489370227527801, 'samples': 3031296, 'steps': 15787, 'loss/train': 1.8777408599853516} -11/06/2021 23:29:13 - INFO - __main__ - Step 15789: {'lr': 0.0004893686964960009, 'samples': 3031488, 'steps': 15788, 'loss/train': 1.4991892576217651} -11/06/2021 23:29:13 - INFO - __main__ - Step 15790: {'lr': 0.0004893671653563448, 'samples': 3031680, 'steps': 15789, 'loss/train': 1.8356255292892456} -11/06/2021 23:29:14 - INFO - __main__ - Step 15791: {'lr': 0.0004893656341088338, 'samples': 3031872, 'steps': 15790, 'loss/train': 1.778326392173767} -11/06/2021 23:29:14 - INFO - __main__ - Step 15792: {'lr': 0.0004893641027534682, 'samples': 3032064, 'steps': 15791, 'loss/train': 1.4932310581207275} -11/06/2021 23:29:15 - INFO - __main__ - Step 15793: {'lr': 0.0004893625712902489, 'samples': 3032256, 'steps': 15792, 'loss/train': 1.2762092351913452} -11/06/2021 23:29:16 - INFO - __main__ - Step 15794: {'lr': 0.0004893610397191764, 'samples': 3032448, 'steps': 15793, 'loss/train': 1.7906181812286377} -11/06/2021 23:29:16 - INFO - __main__ - Step 15795: {'lr': 0.0004893595080402517, 'samples': 3032640, 'steps': 15794, 'loss/train': 1.450931191444397} -11/06/2021 23:29:16 - INFO - __main__ - Step 15796: {'lr': 0.0004893579762534751, 'samples': 3032832, 'steps': 15795, 'loss/train': 1.3250974416732788} -11/06/2021 23:29:17 - INFO - __main__ - Step 15797: {'lr': 0.0004893564443588476, 'samples': 3033024, 'steps': 15796, 'loss/train': 2.3122026920318604} -11/06/2021 23:29:17 - INFO - __main__ - Step 15798: {'lr': 0.0004893549123563697, 'samples': 3033216, 'steps': 15797, 'loss/train': 1.8526376485824585} -11/06/2021 23:29:18 - INFO - __main__ - Step 15799: {'lr': 0.0004893533802460422, 'samples': 3033408, 'steps': 15798, 'loss/train': 1.828189492225647} -11/06/2021 23:29:18 - INFO - __main__ - Step 15800: {'lr': 0.0004893518480278658, 'samples': 3033600, 'steps': 15799, 'loss/train': 1.659311294555664} -11/06/2021 23:29:19 - INFO - __main__ - Step 15801: {'lr': 0.0004893503157018412, 'samples': 3033792, 'steps': 15800, 'loss/train': 2.1041367053985596} -11/06/2021 23:29:19 - INFO - __main__ - Step 15802: {'lr': 0.000489348783267969, 'samples': 3033984, 'steps': 15801, 'loss/train': 1.7049843072891235} -11/06/2021 23:29:19 - INFO - __main__ - Step 15803: {'lr': 0.0004893472507262499, 'samples': 3034176, 'steps': 15802, 'loss/train': 1.8830581903457642} -11/06/2021 23:29:20 - INFO - __main__ - Step 15804: {'lr': 0.0004893457180766846, 'samples': 3034368, 'steps': 15803, 'loss/train': 1.8706032037734985} -11/06/2021 23:29:21 - INFO - __main__ - Step 15805: {'lr': 0.0004893441853192739, 'samples': 3034560, 'steps': 15804, 'loss/train': 1.941593885421753} -11/06/2021 23:29:21 - INFO - __main__ - Step 15806: {'lr': 0.0004893426524540183, 'samples': 3034752, 'steps': 15805, 'loss/train': 1.842943549156189} -11/06/2021 23:29:21 - INFO - __main__ - Step 15807: {'lr': 0.0004893411194809186, 'samples': 3034944, 'steps': 15806, 'loss/train': 1.782511830329895} -11/06/2021 23:29:22 - INFO - __main__ - Step 15808: {'lr': 0.0004893395863999755, 'samples': 3035136, 'steps': 15807, 'loss/train': 2.1695151329040527} -11/06/2021 23:29:22 - INFO - __main__ - Step 15809: {'lr': 0.0004893380532111898, 'samples': 3035328, 'steps': 15808, 'loss/train': 1.792184591293335} -11/06/2021 23:29:23 - INFO - __main__ - Step 15810: {'lr': 0.0004893365199145619, 'samples': 3035520, 'steps': 15809, 'loss/train': 1.3812013864517212} -11/06/2021 23:29:24 - INFO - __main__ - Step 15811: {'lr': 0.0004893349865100927, 'samples': 3035712, 'steps': 15810, 'loss/train': 1.7286027669906616} -11/06/2021 23:29:24 - INFO - __main__ - Step 15812: {'lr': 0.0004893334529977828, 'samples': 3035904, 'steps': 15811, 'loss/train': 1.761993646621704} -11/06/2021 23:29:24 - INFO - __main__ - Step 15813: {'lr': 0.0004893319193776331, 'samples': 3036096, 'steps': 15812, 'loss/train': 1.3216885328292847} -11/06/2021 23:29:25 - INFO - __main__ - Step 15814: {'lr': 0.000489330385649644, 'samples': 3036288, 'steps': 15813, 'loss/train': 1.5407154560089111} -11/06/2021 23:29:26 - INFO - __main__ - Step 15815: {'lr': 0.0004893288518138163, 'samples': 3036480, 'steps': 15814, 'loss/train': 1.7777429819107056} -11/06/2021 23:29:26 - INFO - __main__ - Step 15816: {'lr': 0.0004893273178701508, 'samples': 3036672, 'steps': 15815, 'loss/train': 1.6873787641525269} -11/06/2021 23:29:27 - INFO - __main__ - Step 15817: {'lr': 0.0004893257838186481, 'samples': 3036864, 'steps': 15816, 'loss/train': 2.015655755996704} -11/06/2021 23:29:27 - INFO - __main__ - Step 15818: {'lr': 0.0004893242496593089, 'samples': 3037056, 'steps': 15817, 'loss/train': 1.5864753723144531} -11/06/2021 23:29:27 - INFO - __main__ - Step 15819: {'lr': 0.0004893227153921338, 'samples': 3037248, 'steps': 15818, 'loss/train': 1.5181615352630615} -11/06/2021 23:29:28 - INFO - __main__ - Step 15820: {'lr': 0.0004893211810171237, 'samples': 3037440, 'steps': 15819, 'loss/train': 1.953935980796814} -11/06/2021 23:29:29 - INFO - __main__ - Step 15821: {'lr': 0.0004893196465342791, 'samples': 3037632, 'steps': 15820, 'loss/train': 1.703386664390564} -11/06/2021 23:29:29 - INFO - __main__ - Step 15822: {'lr': 0.0004893181119436007, 'samples': 3037824, 'steps': 15821, 'loss/train': 1.765951156616211} -11/06/2021 23:29:30 - INFO - __main__ - Step 15823: {'lr': 0.0004893165772450893, 'samples': 3038016, 'steps': 15822, 'loss/train': 1.1574418544769287} -11/06/2021 23:29:30 - INFO - __main__ - Step 15824: {'lr': 0.0004893150424387456, 'samples': 3038208, 'steps': 15823, 'loss/train': 2.260741949081421} -11/06/2021 23:29:30 - INFO - __main__ - Step 15825: {'lr': 0.0004893135075245702, 'samples': 3038400, 'steps': 15824, 'loss/train': 1.0996348857879639} -11/06/2021 23:29:31 - INFO - __main__ - Step 15826: {'lr': 0.0004893119725025639, 'samples': 3038592, 'steps': 15825, 'loss/train': 2.232999324798584} -11/06/2021 23:29:32 - INFO - __main__ - Step 15827: {'lr': 0.0004893104373727272, 'samples': 3038784, 'steps': 15826, 'loss/train': 1.5678027868270874} -11/06/2021 23:29:32 - INFO - __main__ - Step 15828: {'lr': 0.0004893089021350609, 'samples': 3038976, 'steps': 15827, 'loss/train': 1.6784107685089111} -11/06/2021 23:29:32 - INFO - __main__ - Step 15829: {'lr': 0.0004893073667895658, 'samples': 3039168, 'steps': 15828, 'loss/train': 1.2464898824691772} -11/06/2021 23:29:33 - INFO - __main__ - Step 15830: {'lr': 0.0004893058313362424, 'samples': 3039360, 'steps': 15829, 'loss/train': 1.7435942888259888} -11/06/2021 23:29:34 - INFO - __main__ - Step 15831: {'lr': 0.0004893042957750916, 'samples': 3039552, 'steps': 15830, 'loss/train': 1.2910295724868774} -11/06/2021 23:29:34 - INFO - __main__ - Step 15832: {'lr': 0.0004893027601061138, 'samples': 3039744, 'steps': 15831, 'loss/train': 1.3004798889160156} -11/06/2021 23:29:35 - INFO - __main__ - Step 15833: {'lr': 0.00048930122432931, 'samples': 3039936, 'steps': 15832, 'loss/train': 1.926435112953186} -11/06/2021 23:29:35 - INFO - __main__ - Step 15834: {'lr': 0.0004892996884446807, 'samples': 3040128, 'steps': 15833, 'loss/train': 1.350760817527771} -11/06/2021 23:29:35 - INFO - __main__ - Step 15835: {'lr': 0.0004892981524522267, 'samples': 3040320, 'steps': 15834, 'loss/train': 1.922597050666809} -11/06/2021 23:29:36 - INFO - __main__ - Step 15836: {'lr': 0.0004892966163519487, 'samples': 3040512, 'steps': 15835, 'loss/train': 1.553952932357788} -11/06/2021 23:29:37 - INFO - __main__ - Step 15837: {'lr': 0.0004892950801438472, 'samples': 3040704, 'steps': 15836, 'loss/train': 1.5477640628814697} -11/06/2021 23:29:37 - INFO - __main__ - Step 15838: {'lr': 0.0004892935438279231, 'samples': 3040896, 'steps': 15837, 'loss/train': 1.4451688528060913} -11/06/2021 23:29:37 - INFO - __main__ - Step 15839: {'lr': 0.0004892920074041771, 'samples': 3041088, 'steps': 15838, 'loss/train': 1.5197027921676636} -11/06/2021 23:29:38 - INFO - __main__ - Step 15840: {'lr': 0.0004892904708726096, 'samples': 3041280, 'steps': 15839, 'loss/train': 1.6010912656784058} -11/06/2021 23:29:38 - INFO - __main__ - Step 15841: {'lr': 0.0004892889342332218, 'samples': 3041472, 'steps': 15840, 'loss/train': 1.8907824754714966} -11/06/2021 23:29:39 - INFO - __main__ - Step 15842: {'lr': 0.000489287397486014, 'samples': 3041664, 'steps': 15841, 'loss/train': 1.3404470682144165} -11/06/2021 23:29:39 - INFO - __main__ - Step 15843: {'lr': 0.0004892858606309868, 'samples': 3041856, 'steps': 15842, 'loss/train': 1.9197810888290405} -11/06/2021 23:29:40 - INFO - __main__ - Step 15844: {'lr': 0.0004892843236681412, 'samples': 3042048, 'steps': 15843, 'loss/train': 1.7280125617980957} -11/06/2021 23:29:40 - INFO - __main__ - Step 15845: {'lr': 0.0004892827865974779, 'samples': 3042240, 'steps': 15844, 'loss/train': 1.8534923791885376} -11/06/2021 23:29:40 - INFO - __main__ - Step 15846: {'lr': 0.0004892812494189973, 'samples': 3042432, 'steps': 15845, 'loss/train': 1.8682761192321777} -11/06/2021 23:29:41 - INFO - __main__ - Step 15847: {'lr': 0.0004892797121327003, 'samples': 3042624, 'steps': 15846, 'loss/train': 1.5605151653289795} -11/06/2021 23:29:42 - INFO - __main__ - Step 15848: {'lr': 0.0004892781747385876, 'samples': 3042816, 'steps': 15847, 'loss/train': 1.5748695135116577} -11/06/2021 23:29:42 - INFO - __main__ - Step 15849: {'lr': 0.0004892766372366598, 'samples': 3043008, 'steps': 15848, 'loss/train': 1.6908271312713623} -11/06/2021 23:29:43 - INFO - __main__ - Step 15850: {'lr': 0.0004892750996269177, 'samples': 3043200, 'steps': 15849, 'loss/train': 1.7898610830307007} -11/06/2021 23:29:43 - INFO - __main__ - Step 15851: {'lr': 0.0004892735619093618, 'samples': 3043392, 'steps': 15850, 'loss/train': 1.9036415815353394} -11/06/2021 23:29:44 - INFO - __main__ - Step 15852: {'lr': 0.0004892720240839931, 'samples': 3043584, 'steps': 15851, 'loss/train': 1.692862629890442} -11/06/2021 23:29:44 - INFO - __main__ - Step 15853: {'lr': 0.0004892704861508121, 'samples': 3043776, 'steps': 15852, 'loss/train': 1.807676076889038} -11/06/2021 23:29:45 - INFO - __main__ - Step 15854: {'lr': 0.0004892689481098193, 'samples': 3043968, 'steps': 15853, 'loss/train': 1.5801000595092773} -11/06/2021 23:29:45 - INFO - __main__ - Step 15855: {'lr': 0.0004892674099610158, 'samples': 3044160, 'steps': 15854, 'loss/train': 1.7234050035476685} -11/06/2021 23:29:45 - INFO - __main__ - Step 15856: {'lr': 0.000489265871704402, 'samples': 3044352, 'steps': 15855, 'loss/train': 1.906105399131775} -11/06/2021 23:29:46 - INFO - __main__ - Step 15857: {'lr': 0.0004892643333399788, 'samples': 3044544, 'steps': 15856, 'loss/train': 1.3132715225219727} -11/06/2021 23:29:47 - INFO - __main__ - Step 15858: {'lr': 0.0004892627948677467, 'samples': 3044736, 'steps': 15857, 'loss/train': 1.1623653173446655} -11/06/2021 23:29:47 - INFO - __main__ - Step 15859: {'lr': 0.0004892612562877066, 'samples': 3044928, 'steps': 15858, 'loss/train': 1.407994270324707} -11/06/2021 23:29:48 - INFO - __main__ - Step 15860: {'lr': 0.0004892597175998589, 'samples': 3045120, 'steps': 15859, 'loss/train': 1.7048394680023193} -11/06/2021 23:29:48 - INFO - __main__ - Step 15861: {'lr': 0.0004892581788042045, 'samples': 3045312, 'steps': 15860, 'loss/train': 1.7856895923614502} -11/06/2021 23:29:49 - INFO - __main__ - Step 15862: {'lr': 0.0004892566399007441, 'samples': 3045504, 'steps': 15861, 'loss/train': 1.6186326742172241} -11/06/2021 23:29:49 - INFO - __main__ - Step 15863: {'lr': 0.0004892551008894784, 'samples': 3045696, 'steps': 15862, 'loss/train': 1.5280269384384155} -11/06/2021 23:29:50 - INFO - __main__ - Step 15864: {'lr': 0.0004892535617704079, 'samples': 3045888, 'steps': 15863, 'loss/train': 1.7535699605941772} -11/06/2021 23:29:50 - INFO - __main__ - Step 15865: {'lr': 0.0004892520225435336, 'samples': 3046080, 'steps': 15864, 'loss/train': 1.7523764371871948} -11/06/2021 23:29:50 - INFO - __main__ - Step 15866: {'lr': 0.000489250483208856, 'samples': 3046272, 'steps': 15865, 'loss/train': 1.8032313585281372} -11/06/2021 23:29:51 - INFO - __main__ - Step 15867: {'lr': 0.0004892489437663758, 'samples': 3046464, 'steps': 15866, 'loss/train': 1.9503204822540283} -11/06/2021 23:29:52 - INFO - __main__ - Step 15868: {'lr': 0.0004892474042160936, 'samples': 3046656, 'steps': 15867, 'loss/train': 1.6175391674041748} -11/06/2021 23:29:52 - INFO - __main__ - Step 15869: {'lr': 0.0004892458645580103, 'samples': 3046848, 'steps': 15868, 'loss/train': 1.700390338897705} -11/06/2021 23:29:53 - INFO - __main__ - Step 15870: {'lr': 0.0004892443247921265, 'samples': 3047040, 'steps': 15869, 'loss/train': 1.867167353630066} -11/06/2021 23:29:53 - INFO - __main__ - Step 15871: {'lr': 0.0004892427849184428, 'samples': 3047232, 'steps': 15870, 'loss/train': 2.022533416748047} -11/06/2021 23:29:53 - INFO - __main__ - Step 15872: {'lr': 0.0004892412449369602, 'samples': 3047424, 'steps': 15871, 'loss/train': 2.038414478302002} -11/06/2021 23:29:54 - INFO - __main__ - Step 15873: {'lr': 0.0004892397048476791, 'samples': 3047616, 'steps': 15872, 'loss/train': 2.008455276489258} -11/06/2021 23:29:55 - INFO - __main__ - Step 15874: {'lr': 0.0004892381646506002, 'samples': 3047808, 'steps': 15873, 'loss/train': 2.3255984783172607} -11/06/2021 23:29:55 - INFO - __main__ - Step 15875: {'lr': 0.0004892366243457244, 'samples': 3048000, 'steps': 15874, 'loss/train': 1.7657088041305542} -11/06/2021 23:29:55 - INFO - __main__ - Step 15876: {'lr': 0.0004892350839330522, 'samples': 3048192, 'steps': 15875, 'loss/train': 1.2648745775222778} -11/06/2021 23:29:56 - INFO - __main__ - Step 15877: {'lr': 0.0004892335434125844, 'samples': 3048384, 'steps': 15876, 'loss/train': 1.686819314956665} -11/06/2021 23:29:57 - INFO - __main__ - Step 15878: {'lr': 0.0004892320027843216, 'samples': 3048576, 'steps': 15877, 'loss/train': 1.774713158607483} -11/06/2021 23:29:57 - INFO - __main__ - Step 15879: {'lr': 0.0004892304620482646, 'samples': 3048768, 'steps': 15878, 'loss/train': 1.8812906742095947} -11/06/2021 23:29:57 - INFO - __main__ - Step 15880: {'lr': 0.000489228921204414, 'samples': 3048960, 'steps': 15879, 'loss/train': 1.9336180686950684} -11/06/2021 23:29:58 - INFO - __main__ - Step 15881: {'lr': 0.0004892273802527706, 'samples': 3049152, 'steps': 15880, 'loss/train': 1.9039198160171509} -11/06/2021 23:29:58 - INFO - __main__ - Step 15882: {'lr': 0.000489225839193335, 'samples': 3049344, 'steps': 15881, 'loss/train': 2.681311845779419} -11/06/2021 23:29:59 - INFO - __main__ - Step 15883: {'lr': 0.0004892242980261079, 'samples': 3049536, 'steps': 15882, 'loss/train': 1.3233872652053833} -11/06/2021 23:30:00 - INFO - __main__ - Step 15884: {'lr': 0.0004892227567510901, 'samples': 3049728, 'steps': 15883, 'loss/train': 1.6366331577301025} -11/06/2021 23:30:00 - INFO - __main__ - Step 15885: {'lr': 0.0004892212153682822, 'samples': 3049920, 'steps': 15884, 'loss/train': 2.0259757041931152} -11/06/2021 23:30:00 - INFO - __main__ - Step 15886: {'lr': 0.0004892196738776848, 'samples': 3050112, 'steps': 15885, 'loss/train': 1.6380057334899902} -11/06/2021 23:30:01 - INFO - __main__ - Step 15887: {'lr': 0.0004892181322792989, 'samples': 3050304, 'steps': 15886, 'loss/train': 1.6762605905532837} -11/06/2021 23:30:01 - INFO - __main__ - Step 15888: {'lr': 0.0004892165905731248, 'samples': 3050496, 'steps': 15887, 'loss/train': 1.6492608785629272} -11/06/2021 23:30:02 - INFO - __main__ - Step 15889: {'lr': 0.0004892150487591635, 'samples': 3050688, 'steps': 15888, 'loss/train': 1.8389976024627686} -11/06/2021 23:30:02 - INFO - __main__ - Step 15890: {'lr': 0.0004892135068374156, 'samples': 3050880, 'steps': 15889, 'loss/train': 1.6473220586776733} -11/06/2021 23:30:03 - INFO - __main__ - Step 15891: {'lr': 0.0004892119648078817, 'samples': 3051072, 'steps': 15890, 'loss/train': 1.6009021997451782} -11/06/2021 23:30:03 - INFO - __main__ - Step 15892: {'lr': 0.0004892104226705627, 'samples': 3051264, 'steps': 15891, 'loss/train': 1.201027512550354} -11/06/2021 23:30:04 - INFO - __main__ - Step 15893: {'lr': 0.0004892088804254591, 'samples': 3051456, 'steps': 15892, 'loss/train': 1.556810736656189} -11/06/2021 23:30:05 - INFO - __main__ - Step 15894: {'lr': 0.0004892073380725716, 'samples': 3051648, 'steps': 15893, 'loss/train': 1.3976141214370728} -11/06/2021 23:30:05 - INFO - __main__ - Step 15895: {'lr': 0.0004892057956119012, 'samples': 3051840, 'steps': 15894, 'loss/train': 1.6373045444488525} -11/06/2021 23:30:05 - INFO - __main__ - Step 15896: {'lr': 0.0004892042530434482, 'samples': 3052032, 'steps': 15895, 'loss/train': 1.500960350036621} -11/06/2021 23:30:06 - INFO - __main__ - Step 15897: {'lr': 0.0004892027103672134, 'samples': 3052224, 'steps': 15896, 'loss/train': 2.280747175216675} -11/06/2021 23:30:06 - INFO - __main__ - Step 15898: {'lr': 0.0004892011675831976, 'samples': 3052416, 'steps': 15897, 'loss/train': 1.7541916370391846} -11/06/2021 23:30:07 - INFO - __main__ - Step 15899: {'lr': 0.0004891996246914014, 'samples': 3052608, 'steps': 15898, 'loss/train': 1.63882315158844} -11/06/2021 23:30:07 - INFO - __main__ - Step 15900: {'lr': 0.0004891980816918257, 'samples': 3052800, 'steps': 15899, 'loss/train': 1.629404902458191} -11/06/2021 23:30:08 - INFO - __main__ - Step 15901: {'lr': 0.0004891965385844709, 'samples': 3052992, 'steps': 15900, 'loss/train': 1.5046894550323486} -11/06/2021 23:30:08 - INFO - __main__ - Step 15902: {'lr': 0.0004891949953693378, 'samples': 3053184, 'steps': 15901, 'loss/train': 1.5247341394424438} -11/06/2021 23:30:08 - INFO - __main__ - Step 15903: {'lr': 0.0004891934520464273, 'samples': 3053376, 'steps': 15902, 'loss/train': 1.785117268562317} -11/06/2021 23:30:09 - INFO - __main__ - Step 15904: {'lr': 0.0004891919086157398, 'samples': 3053568, 'steps': 15903, 'loss/train': 1.4606293439865112} -11/06/2021 23:30:10 - INFO - __main__ - Step 15905: {'lr': 0.000489190365077276, 'samples': 3053760, 'steps': 15904, 'loss/train': 1.7940731048583984} -11/06/2021 23:30:10 - INFO - __main__ - Step 15906: {'lr': 0.0004891888214310369, 'samples': 3053952, 'steps': 15905, 'loss/train': 1.8179190158843994} -11/06/2021 23:30:11 - INFO - __main__ - Step 15907: {'lr': 0.000489187277677023, 'samples': 3054144, 'steps': 15906, 'loss/train': 1.6493617296218872} -11/06/2021 23:30:11 - INFO - __main__ - Step 15908: {'lr': 0.000489185733815235, 'samples': 3054336, 'steps': 15907, 'loss/train': 1.645919919013977} -11/06/2021 23:30:11 - INFO - __main__ - Step 15909: {'lr': 0.0004891841898456735, 'samples': 3054528, 'steps': 15908, 'loss/train': 1.8453730344772339} -11/06/2021 23:30:12 - INFO - __main__ - Step 15910: {'lr': 0.0004891826457683394, 'samples': 3054720, 'steps': 15909, 'loss/train': 1.7440708875656128} -11/06/2021 23:30:13 - INFO - __main__ - Step 15911: {'lr': 0.0004891811015832332, 'samples': 3054912, 'steps': 15910, 'loss/train': 1.6581617593765259} -11/06/2021 23:30:13 - INFO - __main__ - Step 15912: {'lr': 0.0004891795572903557, 'samples': 3055104, 'steps': 15911, 'loss/train': 1.5487264394760132} -11/06/2021 23:30:14 - INFO - __main__ - Step 15913: {'lr': 0.0004891780128897077, 'samples': 3055296, 'steps': 15912, 'loss/train': 1.7143360376358032} -11/06/2021 23:30:14 - INFO - __main__ - Step 15914: {'lr': 0.0004891764683812896, 'samples': 3055488, 'steps': 15913, 'loss/train': 1.7877535820007324} -11/06/2021 23:30:15 - INFO - __main__ - Step 15915: {'lr': 0.0004891749237651024, 'samples': 3055680, 'steps': 15914, 'loss/train': 2.2019176483154297} -11/06/2021 23:30:16 - INFO - __main__ - Step 15916: {'lr': 0.0004891733790411466, 'samples': 3055872, 'steps': 15915, 'loss/train': 1.6177648305892944} -11/06/2021 23:30:16 - INFO - __main__ - Step 15917: {'lr': 0.000489171834209423, 'samples': 3056064, 'steps': 15916, 'loss/train': 2.0790741443634033} -11/06/2021 23:30:16 - INFO - __main__ - Step 15918: {'lr': 0.0004891702892699323, 'samples': 3056256, 'steps': 15917, 'loss/train': 1.2524698972702026} -11/06/2021 23:30:17 - INFO - __main__ - Step 15919: {'lr': 0.0004891687442226751, 'samples': 3056448, 'steps': 15918, 'loss/train': 2.0985350608825684} -11/06/2021 23:30:17 - INFO - __main__ - Step 15920: {'lr': 0.0004891671990676522, 'samples': 3056640, 'steps': 15919, 'loss/train': 1.7934945821762085} -11/06/2021 23:30:18 - INFO - __main__ - Step 15921: {'lr': 0.0004891656538048642, 'samples': 3056832, 'steps': 15920, 'loss/train': 0.5140384435653687} -11/06/2021 23:30:18 - INFO - __main__ - Step 15922: {'lr': 0.0004891641084343118, 'samples': 3057024, 'steps': 15921, 'loss/train': 1.4971164464950562} -11/06/2021 23:30:19 - INFO - __main__ - Step 15923: {'lr': 0.0004891625629559959, 'samples': 3057216, 'steps': 15922, 'loss/train': 2.0432043075561523} -11/06/2021 23:30:19 - INFO - __main__ - Step 15924: {'lr': 0.0004891610173699169, 'samples': 3057408, 'steps': 15923, 'loss/train': 1.4933257102966309} -11/06/2021 23:30:20 - INFO - __main__ - Step 15925: {'lr': 0.0004891594716760757, 'samples': 3057600, 'steps': 15924, 'loss/train': 2.0862317085266113} -11/06/2021 23:30:20 - INFO - __main__ - Step 15926: {'lr': 0.0004891579258744728, 'samples': 3057792, 'steps': 15925, 'loss/train': 1.788038969039917} -11/06/2021 23:30:21 - INFO - __main__ - Step 15927: {'lr': 0.0004891563799651092, 'samples': 3057984, 'steps': 15926, 'loss/train': 1.711025357246399} -11/06/2021 23:30:21 - INFO - __main__ - Step 15928: {'lr': 0.0004891548339479854, 'samples': 3058176, 'steps': 15927, 'loss/train': 1.7549539804458618} -11/06/2021 23:30:22 - INFO - __main__ - Step 15929: {'lr': 0.0004891532878231021, 'samples': 3058368, 'steps': 15928, 'loss/train': 1.9058785438537598} -11/06/2021 23:30:22 - INFO - __main__ - Step 15930: {'lr': 0.00048915174159046, 'samples': 3058560, 'steps': 15929, 'loss/train': 1.3126921653747559} -11/06/2021 23:30:23 - INFO - __main__ - Step 15931: {'lr': 0.0004891501952500599, 'samples': 3058752, 'steps': 15930, 'loss/train': 1.5705853700637817} -11/06/2021 23:30:23 - INFO - __main__ - Step 15932: {'lr': 0.0004891486488019023, 'samples': 3058944, 'steps': 15931, 'loss/train': 1.8984884023666382} -11/06/2021 23:30:24 - INFO - __main__ - Step 15933: {'lr': 0.000489147102245988, 'samples': 3059136, 'steps': 15932, 'loss/train': 1.7881126403808594} -11/06/2021 23:30:24 - INFO - __main__ - Step 15934: {'lr': 0.0004891455555823179, 'samples': 3059328, 'steps': 15933, 'loss/train': 0.8325879573822021} -11/06/2021 23:30:24 - INFO - __main__ - Step 15935: {'lr': 0.0004891440088108923, 'samples': 3059520, 'steps': 15934, 'loss/train': 1.4407297372817993} -11/06/2021 23:30:26 - INFO - __main__ - Step 15936: {'lr': 0.0004891424619317121, 'samples': 3059712, 'steps': 15935, 'loss/train': 1.791204810142517} -11/06/2021 23:30:26 - INFO - __main__ - Step 15937: {'lr': 0.000489140914944778, 'samples': 3059904, 'steps': 15936, 'loss/train': 1.459701657295227} -11/06/2021 23:30:26 - INFO - __main__ - Step 15938: {'lr': 0.0004891393678500909, 'samples': 3060096, 'steps': 15937, 'loss/train': 1.4462066888809204} -11/06/2021 23:30:27 - INFO - __main__ - Step 15939: {'lr': 0.0004891378206476511, 'samples': 3060288, 'steps': 15938, 'loss/train': 1.4875487089157104} -11/06/2021 23:30:27 - INFO - __main__ - Step 15940: {'lr': 0.0004891362733374595, 'samples': 3060480, 'steps': 15939, 'loss/train': 1.7356269359588623} -11/06/2021 23:30:28 - INFO - __main__ - Step 15941: {'lr': 0.0004891347259195168, 'samples': 3060672, 'steps': 15940, 'loss/train': 1.6053783893585205} -11/06/2021 23:30:28 - INFO - __main__ - Step 15942: {'lr': 0.0004891331783938238, 'samples': 3060864, 'steps': 15941, 'loss/train': 1.529934287071228} -11/06/2021 23:30:29 - INFO - __main__ - Step 15943: {'lr': 0.000489131630760381, 'samples': 3061056, 'steps': 15942, 'loss/train': 1.0856684446334839} -11/06/2021 23:30:29 - INFO - __main__ - Step 15944: {'lr': 0.000489130083019189, 'samples': 3061248, 'steps': 15943, 'loss/train': 1.3536427021026611} -11/06/2021 23:30:29 - INFO - __main__ - Step 15945: {'lr': 0.000489128535170249, 'samples': 3061440, 'steps': 15944, 'loss/train': 1.3053251504898071} -11/06/2021 23:30:30 - INFO - __main__ - Step 15946: {'lr': 0.0004891269872135611, 'samples': 3061632, 'steps': 15945, 'loss/train': 2.2223825454711914} -11/06/2021 23:30:31 - INFO - __main__ - Step 15947: {'lr': 0.0004891254391491264, 'samples': 3061824, 'steps': 15946, 'loss/train': 1.6169859170913696} -11/06/2021 23:30:31 - INFO - __main__ - Step 15948: {'lr': 0.0004891238909769454, 'samples': 3062016, 'steps': 15947, 'loss/train': 1.6971629858016968} -11/06/2021 23:30:32 - INFO - __main__ - Step 15949: {'lr': 0.0004891223426970189, 'samples': 3062208, 'steps': 15948, 'loss/train': 1.6054120063781738} -11/06/2021 23:30:32 - INFO - __main__ - Step 15950: {'lr': 0.0004891207943093476, 'samples': 3062400, 'steps': 15949, 'loss/train': 2.358388662338257} -11/06/2021 23:30:32 - INFO - __main__ - Step 15951: {'lr': 0.000489119245813932, 'samples': 3062592, 'steps': 15950, 'loss/train': 2.2552406787872314} -11/06/2021 23:30:34 - INFO - __main__ - Step 15952: {'lr': 0.0004891176972107731, 'samples': 3062784, 'steps': 15951, 'loss/train': 1.8012076616287231} -11/06/2021 23:30:34 - INFO - __main__ - Step 15953: {'lr': 0.0004891161484998715, 'samples': 3062976, 'steps': 15952, 'loss/train': 1.947579264640808} -11/06/2021 23:30:34 - INFO - __main__ - Step 15954: {'lr': 0.0004891145996812279, 'samples': 3063168, 'steps': 15953, 'loss/train': 1.6745511293411255} -11/06/2021 23:30:35 - INFO - __main__ - Step 15955: {'lr': 0.0004891130507548427, 'samples': 3063360, 'steps': 15954, 'loss/train': 2.0542542934417725} -11/06/2021 23:30:35 - INFO - __main__ - Step 15956: {'lr': 0.000489111501720717, 'samples': 3063552, 'steps': 15955, 'loss/train': 1.9397313594818115} -11/06/2021 23:30:36 - INFO - __main__ - Step 15957: {'lr': 0.0004891099525788514, 'samples': 3063744, 'steps': 15956, 'loss/train': 1.229641079902649} -11/06/2021 23:30:36 - INFO - __main__ - Step 15958: {'lr': 0.0004891084033292464, 'samples': 3063936, 'steps': 15957, 'loss/train': 1.033172369003296} -11/06/2021 23:30:37 - INFO - __main__ - Step 15959: {'lr': 0.0004891068539719031, 'samples': 3064128, 'steps': 15958, 'loss/train': 1.7503483295440674} -11/06/2021 23:30:37 - INFO - __main__ - Step 15960: {'lr': 0.0004891053045068217, 'samples': 3064320, 'steps': 15959, 'loss/train': 2.0735301971435547} -11/06/2021 23:30:38 - INFO - __main__ - Step 15961: {'lr': 0.0004891037549340032, 'samples': 3064512, 'steps': 15960, 'loss/train': 1.7163405418395996} -11/06/2021 23:30:38 - INFO - __main__ - Step 15962: {'lr': 0.0004891022052534482, 'samples': 3064704, 'steps': 15961, 'loss/train': 1.817496418952942} -11/06/2021 23:30:39 - INFO - __main__ - Step 15963: {'lr': 0.0004891006554651574, 'samples': 3064896, 'steps': 15962, 'loss/train': 1.744676113128662} -11/06/2021 23:30:39 - INFO - __main__ - Step 15964: {'lr': 0.0004890991055691318, 'samples': 3065088, 'steps': 15963, 'loss/train': 1.987470030784607} -11/06/2021 23:30:40 - INFO - __main__ - Step 15965: {'lr': 0.0004890975555653716, 'samples': 3065280, 'steps': 15964, 'loss/train': 1.5478122234344482} -11/06/2021 23:30:40 - INFO - __main__ - Step 15966: {'lr': 0.0004890960054538778, 'samples': 3065472, 'steps': 15965, 'loss/train': 1.4275331497192383} -11/06/2021 23:30:40 - INFO - __main__ - Step 15967: {'lr': 0.000489094455234651, 'samples': 3065664, 'steps': 15966, 'loss/train': 1.8712700605392456} -11/06/2021 23:30:41 - INFO - __main__ - Step 15968: {'lr': 0.0004890929049076919, 'samples': 3065856, 'steps': 15967, 'loss/train': 1.5248794555664062} -11/06/2021 23:30:42 - INFO - __main__ - Step 15969: {'lr': 0.0004890913544730013, 'samples': 3066048, 'steps': 15968, 'loss/train': 1.28171706199646} -11/06/2021 23:30:42 - INFO - __main__ - Step 15970: {'lr': 0.0004890898039305798, 'samples': 3066240, 'steps': 15969, 'loss/train': 1.9266890287399292} -11/06/2021 23:30:43 - INFO - __main__ - Step 15971: {'lr': 0.000489088253280428, 'samples': 3066432, 'steps': 15970, 'loss/train': 1.6399247646331787} -11/06/2021 23:30:43 - INFO - __main__ - Step 15972: {'lr': 0.0004890867025225469, 'samples': 3066624, 'steps': 15971, 'loss/train': 1.434366226196289} -11/06/2021 23:30:43 - INFO - __main__ - Step 15973: {'lr': 0.000489085151656937, 'samples': 3066816, 'steps': 15972, 'loss/train': 1.9939874410629272} -11/06/2021 23:30:44 - INFO - __main__ - Step 15974: {'lr': 0.000489083600683599, 'samples': 3067008, 'steps': 15973, 'loss/train': 1.6070252656936646} -11/06/2021 23:30:45 - INFO - __main__ - Step 15975: {'lr': 0.0004890820496025335, 'samples': 3067200, 'steps': 15974, 'loss/train': 2.040097236633301} -11/06/2021 23:30:45 - INFO - __main__ - Step 15976: {'lr': 0.0004890804984137415, 'samples': 3067392, 'steps': 15975, 'loss/train': 1.497314691543579} -11/06/2021 23:30:45 - INFO - __main__ - Step 15977: {'lr': 0.0004890789471172233, 'samples': 3067584, 'steps': 15976, 'loss/train': 1.9788398742675781} -11/06/2021 23:30:46 - INFO - __main__ - Step 15978: {'lr': 0.00048907739571298, 'samples': 3067776, 'steps': 15977, 'loss/train': 2.1698567867279053} -11/06/2021 23:30:47 - INFO - __main__ - Step 15979: {'lr': 0.000489075844201012, 'samples': 3067968, 'steps': 15978, 'loss/train': 1.803942084312439} -11/06/2021 23:30:47 - INFO - __main__ - Step 15980: {'lr': 0.0004890742925813202, 'samples': 3068160, 'steps': 15979, 'loss/train': 1.9059771299362183} -11/06/2021 23:30:47 - INFO - __main__ - Step 15981: {'lr': 0.0004890727408539051, 'samples': 3068352, 'steps': 15980, 'loss/train': 1.6169204711914062} -11/06/2021 23:30:48 - INFO - __main__ - Step 15982: {'lr': 0.0004890711890187676, 'samples': 3068544, 'steps': 15981, 'loss/train': 1.6662590503692627} -11/06/2021 23:30:48 - INFO - __main__ - Step 15983: {'lr': 0.0004890696370759085, 'samples': 3068736, 'steps': 15982, 'loss/train': 1.6316263675689697} -11/06/2021 23:30:49 - INFO - __main__ - Step 15984: {'lr': 0.0004890680850253281, 'samples': 3068928, 'steps': 15983, 'loss/train': 1.7431037425994873} -11/06/2021 23:30:50 - INFO - __main__ - Step 15985: {'lr': 0.0004890665328670273, 'samples': 3069120, 'steps': 15984, 'loss/train': 1.7892478704452515} -11/06/2021 23:30:50 - INFO - __main__ - Step 15986: {'lr': 0.0004890649806010067, 'samples': 3069312, 'steps': 15985, 'loss/train': 1.5585905313491821} -11/06/2021 23:30:50 - INFO - __main__ - Step 15987: {'lr': 0.0004890634282272673, 'samples': 3069504, 'steps': 15986, 'loss/train': 1.4312716722488403} -11/06/2021 23:30:51 - INFO - __main__ - Step 15988: {'lr': 0.0004890618757458096, 'samples': 3069696, 'steps': 15987, 'loss/train': 1.3658758401870728} -11/06/2021 23:30:52 - INFO - __main__ - Step 15989: {'lr': 0.0004890603231566343, 'samples': 3069888, 'steps': 15988, 'loss/train': 1.3280619382858276} -11/06/2021 23:30:52 - INFO - __main__ - Step 15990: {'lr': 0.000489058770459742, 'samples': 3070080, 'steps': 15989, 'loss/train': 0.21883493661880493} -11/06/2021 23:30:52 - INFO - __main__ - Step 15991: {'lr': 0.0004890572176551337, 'samples': 3070272, 'steps': 15990, 'loss/train': 1.0338857173919678} -11/06/2021 23:30:53 - INFO - __main__ - Step 15992: {'lr': 0.0004890556647428097, 'samples': 3070464, 'steps': 15991, 'loss/train': 1.804748296737671} -11/06/2021 23:30:53 - INFO - __main__ - Step 15993: {'lr': 0.0004890541117227711, 'samples': 3070656, 'steps': 15992, 'loss/train': 1.1383863687515259} -11/06/2021 23:30:54 - INFO - __main__ - Step 15994: {'lr': 0.0004890525585950181, 'samples': 3070848, 'steps': 15993, 'loss/train': 2.0593109130859375} -11/06/2021 23:30:54 - INFO - __main__ - Step 15995: {'lr': 0.000489051005359552, 'samples': 3071040, 'steps': 15994, 'loss/train': 1.7306606769561768} -11/06/2021 23:30:55 - INFO - __main__ - Step 15996: {'lr': 0.0004890494520163731, 'samples': 3071232, 'steps': 15995, 'loss/train': 1.410784363746643} -11/06/2021 23:30:55 - INFO - __main__ - Step 15997: {'lr': 0.0004890478985654823, 'samples': 3071424, 'steps': 15996, 'loss/train': 1.6601943969726562} -11/06/2021 23:30:56 - INFO - __main__ - Step 15998: {'lr': 0.0004890463450068801, 'samples': 3071616, 'steps': 15997, 'loss/train': 1.836921215057373} -11/06/2021 23:30:57 - INFO - __main__ - Step 15999: {'lr': 0.0004890447913405673, 'samples': 3071808, 'steps': 15998, 'loss/train': 1.627102255821228} -11/06/2021 23:30:57 - INFO - __main__ - Step 16000: {'lr': 0.0004890432375665447, 'samples': 3072000, 'steps': 15999, 'loss/train': 1.4169437885284424} -11/06/2021 23:30:57 - INFO - __main__ - Step 16001: {'lr': 0.0004890416836848127, 'samples': 3072192, 'steps': 16000, 'loss/train': 1.6639877557754517} -11/06/2021 23:30:58 - INFO - __main__ - Step 16002: {'lr': 0.0004890401296953723, 'samples': 3072384, 'steps': 16001, 'loss/train': 1.9044790267944336} -11/06/2021 23:30:58 - INFO - __main__ - Step 16003: {'lr': 0.0004890385755982243, 'samples': 3072576, 'steps': 16002, 'loss/train': 1.7246227264404297} -11/06/2021 23:30:58 - INFO - __main__ - Step 16004: {'lr': 0.0004890370213933691, 'samples': 3072768, 'steps': 16003, 'loss/train': 1.6332004070281982} -11/06/2021 23:30:59 - INFO - __main__ - Step 16005: {'lr': 0.0004890354670808074, 'samples': 3072960, 'steps': 16004, 'loss/train': 2.4110894203186035} -11/06/2021 23:31:00 - INFO - __main__ - Step 16006: {'lr': 0.0004890339126605401, 'samples': 3073152, 'steps': 16005, 'loss/train': 1.834177851676941} -11/06/2021 23:31:00 - INFO - __main__ - Step 16007: {'lr': 0.0004890323581325677, 'samples': 3073344, 'steps': 16006, 'loss/train': 1.876891016960144} -11/06/2021 23:31:00 - INFO - __main__ - Step 16008: {'lr': 0.0004890308034968911, 'samples': 3073536, 'steps': 16007, 'loss/train': 1.4352622032165527} -11/06/2021 23:31:01 - INFO - __main__ - Step 16009: {'lr': 0.0004890292487535108, 'samples': 3073728, 'steps': 16008, 'loss/train': 2.2022879123687744} -11/06/2021 23:31:02 - INFO - __main__ - Step 16010: {'lr': 0.0004890276939024278, 'samples': 3073920, 'steps': 16009, 'loss/train': 0.9346103072166443} -11/06/2021 23:31:02 - INFO - __main__ - Step 16011: {'lr': 0.0004890261389436424, 'samples': 3074112, 'steps': 16010, 'loss/train': 1.6814231872558594} -11/06/2021 23:31:03 - INFO - __main__ - Step 16012: {'lr': 0.0004890245838771557, 'samples': 3074304, 'steps': 16011, 'loss/train': 1.8951748609542847} -11/06/2021 23:31:03 - INFO - __main__ - Step 16013: {'lr': 0.0004890230287029681, 'samples': 3074496, 'steps': 16012, 'loss/train': 1.8367836475372314} -11/06/2021 23:31:03 - INFO - __main__ - Step 16014: {'lr': 0.0004890214734210805, 'samples': 3074688, 'steps': 16013, 'loss/train': 1.9447275400161743} -11/06/2021 23:31:04 - INFO - __main__ - Step 16015: {'lr': 0.0004890199180314935, 'samples': 3074880, 'steps': 16014, 'loss/train': 1.739290714263916} -11/06/2021 23:31:05 - INFO - __main__ - Step 16016: {'lr': 0.0004890183625342078, 'samples': 3075072, 'steps': 16015, 'loss/train': 1.9823334217071533} -11/06/2021 23:31:05 - INFO - __main__ - Step 16017: {'lr': 0.0004890168069292241, 'samples': 3075264, 'steps': 16016, 'loss/train': 1.898835301399231} -11/06/2021 23:31:05 - INFO - __main__ - Step 16018: {'lr': 0.000489015251216543, 'samples': 3075456, 'steps': 16017, 'loss/train': 1.9296048879623413} -11/06/2021 23:31:06 - INFO - __main__ - Step 16019: {'lr': 0.0004890136953961654, 'samples': 3075648, 'steps': 16018, 'loss/train': 1.3645771741867065} -11/06/2021 23:31:07 - INFO - __main__ - Step 16020: {'lr': 0.000489012139468092, 'samples': 3075840, 'steps': 16019, 'loss/train': 1.6032259464263916} -11/06/2021 23:31:07 - INFO - __main__ - Step 16021: {'lr': 0.0004890105834323233, 'samples': 3076032, 'steps': 16020, 'loss/train': 1.5474944114685059} -11/06/2021 23:31:07 - INFO - __main__ - Step 16022: {'lr': 0.0004890090272888602, 'samples': 3076224, 'steps': 16021, 'loss/train': 1.8480674028396606} -11/06/2021 23:31:08 - INFO - __main__ - Step 16023: {'lr': 0.0004890074710377033, 'samples': 3076416, 'steps': 16022, 'loss/train': 1.5558422803878784} -11/06/2021 23:31:08 - INFO - __main__ - Step 16024: {'lr': 0.0004890059146788532, 'samples': 3076608, 'steps': 16023, 'loss/train': 1.956721305847168} -11/06/2021 23:31:09 - INFO - __main__ - Step 16025: {'lr': 0.000489004358212311, 'samples': 3076800, 'steps': 16024, 'loss/train': 1.4700076580047607} -11/06/2021 23:31:10 - INFO - __main__ - Step 16026: {'lr': 0.0004890028016380769, 'samples': 3076992, 'steps': 16025, 'loss/train': 1.5509119033813477} -11/06/2021 23:31:10 - INFO - __main__ - Step 16027: {'lr': 0.0004890012449561518, 'samples': 3077184, 'steps': 16026, 'loss/train': 1.683590292930603} -11/06/2021 23:31:10 - INFO - __main__ - Step 16028: {'lr': 0.0004889996881665366, 'samples': 3077376, 'steps': 16027, 'loss/train': 1.3393259048461914} -11/06/2021 23:31:11 - INFO - __main__ - Step 16029: {'lr': 0.0004889981312692317, 'samples': 3077568, 'steps': 16028, 'loss/train': 1.7740288972854614} -11/06/2021 23:31:11 - INFO - __main__ - Step 16030: {'lr': 0.000488996574264238, 'samples': 3077760, 'steps': 16029, 'loss/train': 1.773305892944336} -11/06/2021 23:31:12 - INFO - __main__ - Step 16031: {'lr': 0.000488995017151556, 'samples': 3077952, 'steps': 16030, 'loss/train': 0.440768837928772} -11/06/2021 23:31:12 - INFO - __main__ - Step 16032: {'lr': 0.0004889934599311867, 'samples': 3078144, 'steps': 16031, 'loss/train': 2.0566556453704834} -11/06/2021 23:31:13 - INFO - __main__ - Step 16033: {'lr': 0.0004889919026031306, 'samples': 3078336, 'steps': 16032, 'loss/train': 1.4847581386566162} -11/06/2021 23:31:13 - INFO - __main__ - Step 16034: {'lr': 0.0004889903451673884, 'samples': 3078528, 'steps': 16033, 'loss/train': 1.6132980585098267} -11/06/2021 23:31:14 - INFO - __main__ - Step 16035: {'lr': 0.0004889887876239608, 'samples': 3078720, 'steps': 16034, 'loss/train': 1.4533771276474} -11/06/2021 23:31:15 - INFO - __main__ - Step 16036: {'lr': 0.0004889872299728486, 'samples': 3078912, 'steps': 16035, 'loss/train': 1.3205077648162842} -11/06/2021 23:31:15 - INFO - __main__ - Step 16037: {'lr': 0.0004889856722140525, 'samples': 3079104, 'steps': 16036, 'loss/train': 1.8552273511886597} -11/06/2021 23:31:15 - INFO - __main__ - Step 16038: {'lr': 0.000488984114347573, 'samples': 3079296, 'steps': 16037, 'loss/train': 1.5201712846755981} -11/06/2021 23:31:16 - INFO - __main__ - Step 16039: {'lr': 0.000488982556373411, 'samples': 3079488, 'steps': 16038, 'loss/train': 1.3169190883636475} -11/06/2021 23:31:16 - INFO - __main__ - Step 16040: {'lr': 0.0004889809982915672, 'samples': 3079680, 'steps': 16039, 'loss/train': 1.6098225116729736} -11/06/2021 23:31:17 - INFO - __main__ - Step 16041: {'lr': 0.0004889794401020422, 'samples': 3079872, 'steps': 16040, 'loss/train': 1.4014536142349243} -11/06/2021 23:31:17 - INFO - __main__ - Step 16042: {'lr': 0.0004889778818048368, 'samples': 3080064, 'steps': 16041, 'loss/train': 1.5248942375183105} -11/06/2021 23:31:18 - INFO - __main__ - Step 16043: {'lr': 0.0004889763233999516, 'samples': 3080256, 'steps': 16042, 'loss/train': 1.8693872690200806} -11/06/2021 23:31:18 - INFO - __main__ - Step 16044: {'lr': 0.0004889747648873874, 'samples': 3080448, 'steps': 16043, 'loss/train': 1.9268662929534912} -11/06/2021 23:31:18 - INFO - __main__ - Step 16045: {'lr': 0.0004889732062671448, 'samples': 3080640, 'steps': 16044, 'loss/train': 1.6837748289108276} -11/06/2021 23:31:19 - INFO - __main__ - Step 16046: {'lr': 0.0004889716475392247, 'samples': 3080832, 'steps': 16045, 'loss/train': 1.4768024682998657} -11/06/2021 23:31:20 - INFO - __main__ - Step 16047: {'lr': 0.0004889700887036275, 'samples': 3081024, 'steps': 16046, 'loss/train': 2.1141278743743896} -11/06/2021 23:31:20 - INFO - __main__ - Step 16048: {'lr': 0.0004889685297603541, 'samples': 3081216, 'steps': 16047, 'loss/train': 1.835368275642395} -11/06/2021 23:31:20 - INFO - __main__ - Step 16049: {'lr': 0.0004889669707094052, 'samples': 3081408, 'steps': 16048, 'loss/train': 1.6546882390975952} -11/06/2021 23:31:21 - INFO - __main__ - Step 16050: {'lr': 0.0004889654115507815, 'samples': 3081600, 'steps': 16049, 'loss/train': 1.2408573627471924} -11/06/2021 23:31:22 - INFO - __main__ - Step 16051: {'lr': 0.0004889638522844836, 'samples': 3081792, 'steps': 16050, 'loss/train': 1.5190356969833374} -11/06/2021 23:31:22 - INFO - __main__ - Step 16052: {'lr': 0.0004889622929105123, 'samples': 3081984, 'steps': 16051, 'loss/train': 2.227968215942383} -11/06/2021 23:31:23 - INFO - __main__ - Step 16053: {'lr': 0.0004889607334288683, 'samples': 3082176, 'steps': 16052, 'loss/train': 1.310071349143982} -11/06/2021 23:31:23 - INFO - __main__ - Step 16054: {'lr': 0.0004889591738395522, 'samples': 3082368, 'steps': 16053, 'loss/train': 1.535683512687683} -11/06/2021 23:31:24 - INFO - __main__ - Step 16055: {'lr': 0.0004889576141425649, 'samples': 3082560, 'steps': 16054, 'loss/train': 1.4733257293701172} -11/06/2021 23:31:24 - INFO - __main__ - Step 16056: {'lr': 0.0004889560543379069, 'samples': 3082752, 'steps': 16055, 'loss/train': 0.716278612613678} -11/06/2021 23:31:25 - INFO - __main__ - Step 16057: {'lr': 0.000488954494425579, 'samples': 3082944, 'steps': 16056, 'loss/train': 1.6750446557998657} -11/06/2021 23:31:25 - INFO - __main__ - Step 16058: {'lr': 0.000488952934405582, 'samples': 3083136, 'steps': 16057, 'loss/train': 2.0339643955230713} -11/06/2021 23:31:26 - INFO - __main__ - Step 16059: {'lr': 0.0004889513742779164, 'samples': 3083328, 'steps': 16058, 'loss/train': 1.7793983221054077} -11/06/2021 23:31:26 - INFO - __main__ - Step 16060: {'lr': 0.0004889498140425829, 'samples': 3083520, 'steps': 16059, 'loss/train': 1.7236640453338623} -11/06/2021 23:31:26 - INFO - __main__ - Step 16061: {'lr': 0.0004889482536995825, 'samples': 3083712, 'steps': 16060, 'loss/train': 1.4017524719238281} -11/06/2021 23:31:28 - INFO - __main__ - Step 16062: {'lr': 0.0004889466932489157, 'samples': 3083904, 'steps': 16061, 'loss/train': 1.0112061500549316} -11/06/2021 23:31:28 - INFO - __main__ - Step 16063: {'lr': 0.0004889451326905831, 'samples': 3084096, 'steps': 16062, 'loss/train': 1.7582470178604126} -11/06/2021 23:31:28 - INFO - __main__ - Step 16064: {'lr': 0.0004889435720245855, 'samples': 3084288, 'steps': 16063, 'loss/train': 1.3274977207183838} -11/06/2021 23:31:29 - INFO - __main__ - Step 16065: {'lr': 0.0004889420112509237, 'samples': 3084480, 'steps': 16064, 'loss/train': 0.20192763209342957} -11/06/2021 23:31:29 - INFO - __main__ - Step 16066: {'lr': 0.0004889404503695983, 'samples': 3084672, 'steps': 16065, 'loss/train': 1.569493293762207} -11/06/2021 23:31:29 - INFO - __main__ - Step 16067: {'lr': 0.0004889388893806099, 'samples': 3084864, 'steps': 16066, 'loss/train': 1.8277945518493652} -11/06/2021 23:31:31 - INFO - __main__ - Step 16068: {'lr': 0.0004889373282839594, 'samples': 3085056, 'steps': 16067, 'loss/train': 1.9361584186553955} -11/06/2021 23:31:31 - INFO - __main__ - Step 16069: {'lr': 0.0004889357670796474, 'samples': 3085248, 'steps': 16068, 'loss/train': 1.7485822439193726} -11/06/2021 23:31:31 - INFO - __main__ - Step 16070: {'lr': 0.0004889342057676748, 'samples': 3085440, 'steps': 16069, 'loss/train': 1.6493250131607056} -11/06/2021 23:31:32 - INFO - __main__ - Step 16071: {'lr': 0.000488932644348042, 'samples': 3085632, 'steps': 16070, 'loss/train': 1.7905906438827515} -11/06/2021 23:31:32 - INFO - __main__ - Step 16072: {'lr': 0.0004889310828207498, 'samples': 3085824, 'steps': 16071, 'loss/train': 1.781125783920288} -11/06/2021 23:31:33 - INFO - __main__ - Step 16073: {'lr': 0.000488929521185799, 'samples': 3086016, 'steps': 16072, 'loss/train': 1.8665831089019775} -11/06/2021 23:31:33 - INFO - __main__ - Step 16074: {'lr': 0.0004889279594431903, 'samples': 3086208, 'steps': 16073, 'loss/train': 1.7310936450958252} -11/06/2021 23:31:34 - INFO - __main__ - Step 16075: {'lr': 0.0004889263975929242, 'samples': 3086400, 'steps': 16074, 'loss/train': 1.4840593338012695} -11/06/2021 23:31:34 - INFO - __main__ - Step 16076: {'lr': 0.0004889248356350016, 'samples': 3086592, 'steps': 16075, 'loss/train': 1.7702844142913818} -11/06/2021 23:31:34 - INFO - __main__ - Step 16077: {'lr': 0.0004889232735694232, 'samples': 3086784, 'steps': 16076, 'loss/train': 1.6397343873977661} -11/06/2021 23:31:35 - INFO - __main__ - Step 16078: {'lr': 0.0004889217113961896, 'samples': 3086976, 'steps': 16077, 'loss/train': 1.6018173694610596} -11/06/2021 23:31:36 - INFO - __main__ - Step 16079: {'lr': 0.0004889201491153016, 'samples': 3087168, 'steps': 16078, 'loss/train': 1.2941079139709473} -11/06/2021 23:31:36 - INFO - __main__ - Step 16080: {'lr': 0.0004889185867267599, 'samples': 3087360, 'steps': 16079, 'loss/train': 1.3023624420166016} -11/06/2021 23:31:36 - INFO - __main__ - Step 16081: {'lr': 0.0004889170242305652, 'samples': 3087552, 'steps': 16080, 'loss/train': 0.6730976104736328} -11/06/2021 23:31:37 - INFO - __main__ - Step 16082: {'lr': 0.0004889154616267181, 'samples': 3087744, 'steps': 16081, 'loss/train': 1.7039793729782104} -11/06/2021 23:31:38 - INFO - __main__ - Step 16083: {'lr': 0.0004889138989152194, 'samples': 3087936, 'steps': 16082, 'loss/train': 1.3806297779083252} -11/06/2021 23:31:38 - INFO - __main__ - Step 16084: {'lr': 0.0004889123360960698, 'samples': 3088128, 'steps': 16083, 'loss/train': 1.7928431034088135} -11/06/2021 23:31:39 - INFO - __main__ - Step 16085: {'lr': 0.0004889107731692699, 'samples': 3088320, 'steps': 16084, 'loss/train': 2.2805731296539307} -11/06/2021 23:31:39 - INFO - __main__ - Step 16086: {'lr': 0.0004889092101348206, 'samples': 3088512, 'steps': 16085, 'loss/train': 1.1894793510437012} -11/06/2021 23:31:39 - INFO - __main__ - Step 16087: {'lr': 0.0004889076469927225, 'samples': 3088704, 'steps': 16086, 'loss/train': 1.330406904220581} -11/06/2021 23:31:40 - INFO - __main__ - Step 16088: {'lr': 0.0004889060837429762, 'samples': 3088896, 'steps': 16087, 'loss/train': 1.6548304557800293} -11/06/2021 23:31:41 - INFO - __main__ - Step 16089: {'lr': 0.0004889045203855826, 'samples': 3089088, 'steps': 16088, 'loss/train': 1.9373817443847656} -11/06/2021 23:31:41 - INFO - __main__ - Step 16090: {'lr': 0.0004889029569205423, 'samples': 3089280, 'steps': 16089, 'loss/train': 1.7468717098236084} -11/06/2021 23:31:41 - INFO - __main__ - Step 16091: {'lr': 0.0004889013933478559, 'samples': 3089472, 'steps': 16090, 'loss/train': 1.9759714603424072} -11/06/2021 23:31:42 - INFO - __main__ - Step 16092: {'lr': 0.0004888998296675243, 'samples': 3089664, 'steps': 16091, 'loss/train': 1.7408642768859863} -11/06/2021 23:31:42 - INFO - __main__ - Step 16093: {'lr': 0.0004888982658795482, 'samples': 3089856, 'steps': 16092, 'loss/train': 1.9443445205688477} -11/06/2021 23:31:43 - INFO - __main__ - Step 16094: {'lr': 0.0004888967019839282, 'samples': 3090048, 'steps': 16093, 'loss/train': 1.6487983465194702} -11/06/2021 23:31:43 - INFO - __main__ - Step 16095: {'lr': 0.000488895137980665, 'samples': 3090240, 'steps': 16094, 'loss/train': 1.88912034034729} -11/06/2021 23:31:44 - INFO - __main__ - Step 16096: {'lr': 0.0004888935738697593, 'samples': 3090432, 'steps': 16095, 'loss/train': 1.3398206233978271} -11/06/2021 23:31:44 - INFO - __main__ - Step 16097: {'lr': 0.0004888920096512118, 'samples': 3090624, 'steps': 16096, 'loss/train': 1.280200481414795} -11/06/2021 23:31:45 - INFO - __main__ - Step 16098: {'lr': 0.0004888904453250233, 'samples': 3090816, 'steps': 16097, 'loss/train': 1.5382581949234009} -11/06/2021 23:31:46 - INFO - __main__ - Step 16099: {'lr': 0.0004888888808911946, 'samples': 3091008, 'steps': 16098, 'loss/train': 2.1261627674102783} -11/06/2021 23:31:46 - INFO - __main__ - Step 16100: {'lr': 0.0004888873163497261, 'samples': 3091200, 'steps': 16099, 'loss/train': 2.079089641571045} -11/06/2021 23:31:46 - INFO - __main__ - Step 16101: {'lr': 0.0004888857517006186, 'samples': 3091392, 'steps': 16100, 'loss/train': 2.2009711265563965} -11/06/2021 23:31:47 - INFO - __main__ - Step 16102: {'lr': 0.000488884186943873, 'samples': 3091584, 'steps': 16101, 'loss/train': 0.620243489742279} -11/06/2021 23:31:48 - INFO - __main__ - Step 16103: {'lr': 0.0004888826220794899, 'samples': 3091776, 'steps': 16102, 'loss/train': 1.991464376449585} -11/06/2021 23:31:48 - INFO - __main__ - Step 16104: {'lr': 0.0004888810571074698, 'samples': 3091968, 'steps': 16103, 'loss/train': 1.6059728860855103} -11/06/2021 23:31:48 - INFO - __main__ - Step 16105: {'lr': 0.0004888794920278137, 'samples': 3092160, 'steps': 16104, 'loss/train': 1.831572413444519} -11/06/2021 23:31:49 - INFO - __main__ - Step 16106: {'lr': 0.0004888779268405223, 'samples': 3092352, 'steps': 16105, 'loss/train': 1.3617275953292847} -11/06/2021 23:31:49 - INFO - __main__ - Step 16107: {'lr': 0.0004888763615455959, 'samples': 3092544, 'steps': 16106, 'loss/train': 1.7099063396453857} -11/06/2021 23:31:49 - INFO - __main__ - Step 16108: {'lr': 0.0004888747961430358, 'samples': 3092736, 'steps': 16107, 'loss/train': 1.6582728624343872} -11/06/2021 23:31:51 - INFO - __main__ - Step 16109: {'lr': 0.0004888732306328422, 'samples': 3092928, 'steps': 16108, 'loss/train': 1.6152935028076172} -11/06/2021 23:31:52 - INFO - __main__ - Step 16110: {'lr': 0.000488871665015016, 'samples': 3093120, 'steps': 16109, 'loss/train': 1.057140588760376} -11/06/2021 23:31:52 - INFO - __main__ - Step 16111: {'lr': 0.0004888700992895581, 'samples': 3093312, 'steps': 16110, 'loss/train': 1.769897699356079} -11/06/2021 23:31:52 - INFO - __main__ - Step 16112: {'lr': 0.0004888685334564688, 'samples': 3093504, 'steps': 16111, 'loss/train': 1.4606374502182007} -11/06/2021 23:31:53 - INFO - __main__ - Step 16113: {'lr': 0.0004888669675157492, 'samples': 3093696, 'steps': 16112, 'loss/train': 1.8256492614746094} -11/06/2021 23:31:53 - INFO - __main__ - Step 16114: {'lr': 0.0004888654014673998, 'samples': 3093888, 'steps': 16113, 'loss/train': 1.8334771394729614} -11/06/2021 23:31:53 - INFO - __main__ - Step 16115: {'lr': 0.0004888638353114212, 'samples': 3094080, 'steps': 16114, 'loss/train': 1.4679832458496094} -11/06/2021 23:31:54 - INFO - __main__ - Step 16116: {'lr': 0.0004888622690478144, 'samples': 3094272, 'steps': 16115, 'loss/train': 1.6196460723876953} -11/06/2021 23:31:55 - INFO - __main__ - Step 16117: {'lr': 0.0004888607026765799, 'samples': 3094464, 'steps': 16116, 'loss/train': 1.916323184967041} -11/06/2021 23:31:55 - INFO - __main__ - Step 16118: {'lr': 0.0004888591361977184, 'samples': 3094656, 'steps': 16117, 'loss/train': 1.9670770168304443} -11/06/2021 23:31:55 - INFO - __main__ - Step 16119: {'lr': 0.0004888575696112308, 'samples': 3094848, 'steps': 16118, 'loss/train': 1.839583158493042} -11/06/2021 23:31:56 - INFO - __main__ - Step 16120: {'lr': 0.0004888560029171175, 'samples': 3095040, 'steps': 16119, 'loss/train': 1.7502155303955078} -11/06/2021 23:31:57 - INFO - __main__ - Step 16121: {'lr': 0.0004888544361153794, 'samples': 3095232, 'steps': 16120, 'loss/train': 1.7904021739959717} -11/06/2021 23:31:57 - INFO - __main__ - Step 16122: {'lr': 0.0004888528692060173, 'samples': 3095424, 'steps': 16121, 'loss/train': 2.108914852142334} -11/06/2021 23:31:58 - INFO - __main__ - Step 16123: {'lr': 0.0004888513021890316, 'samples': 3095616, 'steps': 16122, 'loss/train': 1.400886058807373} -11/06/2021 23:31:58 - INFO - __main__ - Step 16124: {'lr': 0.0004888497350644234, 'samples': 3095808, 'steps': 16123, 'loss/train': 1.7776603698730469} -11/06/2021 23:31:58 - INFO - __main__ - Step 16125: {'lr': 0.000488848167832193, 'samples': 3096000, 'steps': 16124, 'loss/train': 1.5604819059371948} -11/06/2021 23:31:59 - INFO - __main__ - Step 16126: {'lr': 0.0004888466004923413, 'samples': 3096192, 'steps': 16125, 'loss/train': 1.3210574388504028} -11/06/2021 23:32:00 - INFO - __main__ - Step 16127: {'lr': 0.0004888450330448692, 'samples': 3096384, 'steps': 16126, 'loss/train': 1.4687092304229736} -11/06/2021 23:32:00 - INFO - __main__ - Step 16128: {'lr': 0.000488843465489777, 'samples': 3096576, 'steps': 16127, 'loss/train': 1.5735976696014404} -11/06/2021 23:32:00 - INFO - __main__ - Step 16129: {'lr': 0.0004888418978270658, 'samples': 3096768, 'steps': 16128, 'loss/train': 1.747856855392456} -11/06/2021 23:32:01 - INFO - __main__ - Step 16130: {'lr': 0.000488840330056736, 'samples': 3096960, 'steps': 16129, 'loss/train': 2.0261762142181396} -11/06/2021 23:32:02 - INFO - __main__ - Step 16131: {'lr': 0.0004888387621787885, 'samples': 3097152, 'steps': 16130, 'loss/train': 2.1754300594329834} -11/06/2021 23:32:02 - INFO - __main__ - Step 16132: {'lr': 0.0004888371941932239, 'samples': 3097344, 'steps': 16131, 'loss/train': 1.5788387060165405} -11/06/2021 23:32:03 - INFO - __main__ - Step 16133: {'lr': 0.000488835626100043, 'samples': 3097536, 'steps': 16132, 'loss/train': 1.9797744750976562} -11/06/2021 23:32:03 - INFO - __main__ - Step 16134: {'lr': 0.0004888340578992464, 'samples': 3097728, 'steps': 16133, 'loss/train': 1.6595001220703125} -11/06/2021 23:32:03 - INFO - __main__ - Step 16135: {'lr': 0.0004888324895908349, 'samples': 3097920, 'steps': 16134, 'loss/train': 1.8906220197677612} -11/06/2021 23:32:04 - INFO - __main__ - Step 16136: {'lr': 0.0004888309211748091, 'samples': 3098112, 'steps': 16135, 'loss/train': 1.909759759902954} -11/06/2021 23:32:05 - INFO - __main__ - Step 16137: {'lr': 0.0004888293526511697, 'samples': 3098304, 'steps': 16136, 'loss/train': 1.5360649824142456} -11/06/2021 23:32:05 - INFO - __main__ - Step 16138: {'lr': 0.0004888277840199177, 'samples': 3098496, 'steps': 16137, 'loss/train': 1.0076518058776855} -11/06/2021 23:32:05 - INFO - __main__ - Step 16139: {'lr': 0.0004888262152810534, 'samples': 3098688, 'steps': 16138, 'loss/train': 1.4442768096923828} -11/06/2021 23:32:06 - INFO - __main__ - Step 16140: {'lr': 0.0004888246464345779, 'samples': 3098880, 'steps': 16139, 'loss/train': 1.477372646331787} -11/06/2021 23:32:06 - INFO - __main__ - Step 16141: {'lr': 0.0004888230774804915, 'samples': 3099072, 'steps': 16140, 'loss/train': 1.4299622774124146} -11/06/2021 23:32:07 - INFO - __main__ - Step 16142: {'lr': 0.0004888215084187952, 'samples': 3099264, 'steps': 16141, 'loss/train': 1.1523048877716064} -11/06/2021 23:32:07 - INFO - __main__ - Step 16143: {'lr': 0.0004888199392494896, 'samples': 3099456, 'steps': 16142, 'loss/train': 2.0774753093719482} -11/06/2021 23:32:08 - INFO - __main__ - Step 16144: {'lr': 0.0004888183699725755, 'samples': 3099648, 'steps': 16143, 'loss/train': 1.240419864654541} -11/06/2021 23:32:08 - INFO - __main__ - Step 16145: {'lr': 0.0004888168005880533, 'samples': 3099840, 'steps': 16144, 'loss/train': 1.6220906972885132} -11/06/2021 23:32:09 - INFO - __main__ - Step 16146: {'lr': 0.0004888152310959242, 'samples': 3100032, 'steps': 16145, 'loss/train': 1.7612665891647339} -11/06/2021 23:32:10 - INFO - __main__ - Step 16147: {'lr': 0.0004888136614961885, 'samples': 3100224, 'steps': 16146, 'loss/train': 1.4522687196731567} -11/06/2021 23:32:10 - INFO - __main__ - Step 16148: {'lr': 0.000488812091788847, 'samples': 3100416, 'steps': 16147, 'loss/train': 1.4766018390655518} -11/06/2021 23:32:10 - INFO - __main__ - Step 16149: {'lr': 0.0004888105219739005, 'samples': 3100608, 'steps': 16148, 'loss/train': 1.5540204048156738} -11/06/2021 23:32:11 - INFO - __main__ - Step 16150: {'lr': 0.0004888089520513497, 'samples': 3100800, 'steps': 16149, 'loss/train': 1.726388931274414} -11/06/2021 23:32:11 - INFO - __main__ - Step 16151: {'lr': 0.0004888073820211952, 'samples': 3100992, 'steps': 16150, 'loss/train': 1.5844863653182983} -11/06/2021 23:32:12 - INFO - __main__ - Step 16152: {'lr': 0.0004888058118834379, 'samples': 3101184, 'steps': 16151, 'loss/train': 1.4964817762374878} -11/06/2021 23:32:13 - INFO - __main__ - Step 16153: {'lr': 0.0004888042416380784, 'samples': 3101376, 'steps': 16152, 'loss/train': 2.1015524864196777} -11/06/2021 23:32:13 - INFO - __main__ - Step 16154: {'lr': 0.0004888026712851172, 'samples': 3101568, 'steps': 16153, 'loss/train': 1.3865811824798584} -11/06/2021 23:32:13 - INFO - __main__ - Step 16155: {'lr': 0.0004888011008245554, 'samples': 3101760, 'steps': 16154, 'loss/train': 1.5103989839553833} -11/06/2021 23:32:14 - INFO - __main__ - Step 16156: {'lr': 0.0004887995302563934, 'samples': 3101952, 'steps': 16155, 'loss/train': 1.9059851169586182} -11/06/2021 23:32:14 - INFO - __main__ - Step 16157: {'lr': 0.000488797959580632, 'samples': 3102144, 'steps': 16156, 'loss/train': 2.0351128578186035} -11/06/2021 23:32:15 - INFO - __main__ - Step 16158: {'lr': 0.000488796388797272, 'samples': 3102336, 'steps': 16157, 'loss/train': 0.9961912631988525} -11/06/2021 23:32:15 - INFO - __main__ - Step 16159: {'lr': 0.0004887948179063139, 'samples': 3102528, 'steps': 16158, 'loss/train': 1.8558497428894043} -11/06/2021 23:32:16 - INFO - __main__ - Step 16160: {'lr': 0.0004887932469077587, 'samples': 3102720, 'steps': 16159, 'loss/train': 1.6343353986740112} -11/06/2021 23:32:16 - INFO - __main__ - Step 16161: {'lr': 0.0004887916758016069, 'samples': 3102912, 'steps': 16160, 'loss/train': 1.7102398872375488} -11/06/2021 23:32:16 - INFO - __main__ - Step 16162: {'lr': 0.0004887901045878592, 'samples': 3103104, 'steps': 16161, 'loss/train': 1.9250577688217163} -11/06/2021 23:32:18 - INFO - __main__ - Step 16163: {'lr': 0.0004887885332665165, 'samples': 3103296, 'steps': 16162, 'loss/train': 0.9902682900428772} -11/06/2021 23:32:18 - INFO - __main__ - Step 16164: {'lr': 0.0004887869618375793, 'samples': 3103488, 'steps': 16163, 'loss/train': 2.02260160446167} -11/06/2021 23:32:18 - INFO - __main__ - Step 16165: {'lr': 0.0004887853903010483, 'samples': 3103680, 'steps': 16164, 'loss/train': 1.4178218841552734} -11/06/2021 23:32:19 - INFO - __main__ - Step 16166: {'lr': 0.0004887838186569244, 'samples': 3103872, 'steps': 16165, 'loss/train': 1.004329800605774} -11/06/2021 23:32:19 - INFO - __main__ - Step 16167: {'lr': 0.0004887822469052081, 'samples': 3104064, 'steps': 16166, 'loss/train': 1.5798732042312622} -11/06/2021 23:32:20 - INFO - __main__ - Step 16168: {'lr': 0.0004887806750459002, 'samples': 3104256, 'steps': 16167, 'loss/train': 0.9959037899971008} -11/06/2021 23:32:20 - INFO - __main__ - Step 16169: {'lr': 0.0004887791030790016, 'samples': 3104448, 'steps': 16168, 'loss/train': 1.3781802654266357} -11/06/2021 23:32:21 - INFO - __main__ - Step 16170: {'lr': 0.0004887775310045126, 'samples': 3104640, 'steps': 16169, 'loss/train': 1.5973459482192993} -11/06/2021 23:32:21 - INFO - __main__ - Step 16171: {'lr': 0.0004887759588224342, 'samples': 3104832, 'steps': 16170, 'loss/train': 1.6264896392822266} -11/06/2021 23:32:21 - INFO - __main__ - Step 16172: {'lr': 0.000488774386532767, 'samples': 3105024, 'steps': 16171, 'loss/train': 1.583954930305481} -11/06/2021 23:32:23 - INFO - __main__ - Step 16173: {'lr': 0.0004887728141355118, 'samples': 3105216, 'steps': 16172, 'loss/train': 1.6285706758499146} -11/06/2021 23:32:23 - INFO - __main__ - Step 16174: {'lr': 0.0004887712416306693, 'samples': 3105408, 'steps': 16173, 'loss/train': 1.1248019933700562} -11/06/2021 23:32:23 - INFO - __main__ - Step 16175: {'lr': 0.00048876966901824, 'samples': 3105600, 'steps': 16174, 'loss/train': 1.661145567893982} -11/06/2021 23:32:24 - INFO - __main__ - Step 16176: {'lr': 0.0004887680962982249, 'samples': 3105792, 'steps': 16175, 'loss/train': 1.8155841827392578} -11/06/2021 23:32:24 - INFO - __main__ - Step 16177: {'lr': 0.0004887665234706247, 'samples': 3105984, 'steps': 16176, 'loss/train': 1.6168017387390137} -11/06/2021 23:32:25 - INFO - __main__ - Step 16178: {'lr': 0.0004887649505354398, 'samples': 3106176, 'steps': 16177, 'loss/train': 1.7428489923477173} -11/06/2021 23:32:25 - INFO - __main__ - Step 16179: {'lr': 0.000488763377492671, 'samples': 3106368, 'steps': 16178, 'loss/train': 1.9398001432418823} -11/06/2021 23:32:26 - INFO - __main__ - Step 16180: {'lr': 0.0004887618043423194, 'samples': 3106560, 'steps': 16179, 'loss/train': 1.2829269170761108} -11/06/2021 23:32:26 - INFO - __main__ - Step 16181: {'lr': 0.0004887602310843852, 'samples': 3106752, 'steps': 16180, 'loss/train': 2.0834195613861084} -11/06/2021 23:32:26 - INFO - __main__ - Step 16182: {'lr': 0.0004887586577188694, 'samples': 3106944, 'steps': 16181, 'loss/train': 1.844342827796936} -11/06/2021 23:32:27 - INFO - __main__ - Step 16183: {'lr': 0.0004887570842457726, 'samples': 3107136, 'steps': 16182, 'loss/train': 1.410559058189392} -11/06/2021 23:32:28 - INFO - __main__ - Step 16184: {'lr': 0.0004887555106650956, 'samples': 3107328, 'steps': 16183, 'loss/train': 1.3475863933563232} -11/06/2021 23:32:28 - INFO - __main__ - Step 16185: {'lr': 0.000488753936976839, 'samples': 3107520, 'steps': 16184, 'loss/train': 5.809494495391846} -11/06/2021 23:32:29 - INFO - __main__ - Step 16186: {'lr': 0.0004887523631810036, 'samples': 3107712, 'steps': 16185, 'loss/train': 1.431221604347229} -11/06/2021 23:32:29 - INFO - __main__ - Step 16187: {'lr': 0.00048875078927759, 'samples': 3107904, 'steps': 16186, 'loss/train': 1.6781052350997925} -11/06/2021 23:32:29 - INFO - __main__ - Step 16188: {'lr': 0.000488749215266599, 'samples': 3108096, 'steps': 16187, 'loss/train': 2.205307960510254} -11/06/2021 23:32:30 - INFO - __main__ - Step 16189: {'lr': 0.0004887476411480314, 'samples': 3108288, 'steps': 16188, 'loss/train': 1.7173161506652832} -11/06/2021 23:32:31 - INFO - __main__ - Step 16190: {'lr': 0.0004887460669218877, 'samples': 3108480, 'steps': 16189, 'loss/train': 1.8591818809509277} -11/06/2021 23:32:31 - INFO - __main__ - Step 16191: {'lr': 0.0004887444925881688, 'samples': 3108672, 'steps': 16190, 'loss/train': 1.212321162223816} -11/06/2021 23:32:31 - INFO - __main__ - Step 16192: {'lr': 0.0004887429181468752, 'samples': 3108864, 'steps': 16191, 'loss/train': 1.6692414283752441} -11/06/2021 23:32:32 - INFO - __main__ - Step 16193: {'lr': 0.0004887413435980077, 'samples': 3109056, 'steps': 16192, 'loss/train': 1.82635498046875} -11/06/2021 23:32:32 - INFO - __main__ - Step 16194: {'lr': 0.0004887397689415672, 'samples': 3109248, 'steps': 16193, 'loss/train': 2.222364902496338} -11/06/2021 23:32:33 - INFO - __main__ - Step 16195: {'lr': 0.0004887381941775541, 'samples': 3109440, 'steps': 16194, 'loss/train': 1.727850079536438} -11/06/2021 23:32:34 - INFO - __main__ - Step 16196: {'lr': 0.0004887366193059693, 'samples': 3109632, 'steps': 16195, 'loss/train': 1.849395751953125} -11/06/2021 23:32:34 - INFO - __main__ - Step 16197: {'lr': 0.0004887350443268134, 'samples': 3109824, 'steps': 16196, 'loss/train': 1.7201744318008423} -11/06/2021 23:32:34 - INFO - __main__ - Step 16198: {'lr': 0.0004887334692400872, 'samples': 3110016, 'steps': 16197, 'loss/train': 1.6349120140075684} -11/06/2021 23:32:35 - INFO - __main__ - Step 16199: {'lr': 0.0004887318940457915, 'samples': 3110208, 'steps': 16198, 'loss/train': 2.126889944076538} -11/06/2021 23:32:36 - INFO - __main__ - Step 16200: {'lr': 0.0004887303187439267, 'samples': 3110400, 'steps': 16199, 'loss/train': 1.782393455505371} -11/06/2021 23:32:36 - INFO - __main__ - Step 16201: {'lr': 0.0004887287433344939, 'samples': 3110592, 'steps': 16200, 'loss/train': 1.2824130058288574} -11/06/2021 23:32:36 - INFO - __main__ - Step 16202: {'lr': 0.0004887271678174935, 'samples': 3110784, 'steps': 16201, 'loss/train': 1.416832447052002} -11/06/2021 23:32:37 - INFO - __main__ - Step 16203: {'lr': 0.0004887255921929264, 'samples': 3110976, 'steps': 16202, 'loss/train': 1.795426368713379} -11/06/2021 23:32:37 - INFO - __main__ - Step 16204: {'lr': 0.0004887240164607931, 'samples': 3111168, 'steps': 16203, 'loss/train': 2.0454015731811523} -11/06/2021 23:32:38 - INFO - __main__ - Step 16205: {'lr': 0.0004887224406210945, 'samples': 3111360, 'steps': 16204, 'loss/train': 1.9707239866256714} -11/06/2021 23:32:38 - INFO - __main__ - Step 16206: {'lr': 0.0004887208646738312, 'samples': 3111552, 'steps': 16205, 'loss/train': 1.7705655097961426} -11/06/2021 23:32:39 - INFO - __main__ - Step 16207: {'lr': 0.000488719288619004, 'samples': 3111744, 'steps': 16206, 'loss/train': 1.1489686965942383} -11/06/2021 23:32:39 - INFO - __main__ - Step 16208: {'lr': 0.0004887177124566136, 'samples': 3111936, 'steps': 16207, 'loss/train': 1.93928861618042} -11/06/2021 23:32:40 - INFO - __main__ - Step 16209: {'lr': 0.0004887161361866607, 'samples': 3112128, 'steps': 16208, 'loss/train': 1.5540908575057983} -11/06/2021 23:32:40 - INFO - __main__ - Step 16210: {'lr': 0.000488714559809146, 'samples': 3112320, 'steps': 16209, 'loss/train': 1.17920982837677} -11/06/2021 23:32:41 - INFO - __main__ - Step 16211: {'lr': 0.0004887129833240703, 'samples': 3112512, 'steps': 16210, 'loss/train': 1.7366347312927246} -11/06/2021 23:32:41 - INFO - __main__ - Step 16212: {'lr': 0.000488711406731434, 'samples': 3112704, 'steps': 16211, 'loss/train': 2.5286495685577393} -11/06/2021 23:32:42 - INFO - __main__ - Step 16213: {'lr': 0.0004887098300312381, 'samples': 3112896, 'steps': 16212, 'loss/train': 1.7790120840072632} -11/06/2021 23:32:42 - INFO - __main__ - Step 16214: {'lr': 0.0004887082532234832, 'samples': 3113088, 'steps': 16213, 'loss/train': 1.5670133829116821} -11/06/2021 23:32:42 - INFO - __main__ - Step 16215: {'lr': 0.0004887066763081702, 'samples': 3113280, 'steps': 16214, 'loss/train': 1.74317467212677} -11/06/2021 23:32:43 - INFO - __main__ - Step 16216: {'lr': 0.0004887050992852995, 'samples': 3113472, 'steps': 16215, 'loss/train': 1.506385087966919} -11/06/2021 23:32:44 - INFO - __main__ - Step 16217: {'lr': 0.000488703522154872, 'samples': 3113664, 'steps': 16216, 'loss/train': 2.2613461017608643} -11/06/2021 23:32:44 - INFO - __main__ - Step 16218: {'lr': 0.0004887019449168884, 'samples': 3113856, 'steps': 16217, 'loss/train': 1.4380708932876587} -11/06/2021 23:32:44 - INFO - __main__ - Step 16219: {'lr': 0.0004887003675713493, 'samples': 3114048, 'steps': 16218, 'loss/train': 1.0357764959335327} -11/06/2021 23:32:45 - INFO - __main__ - Step 16220: {'lr': 0.0004886987901182556, 'samples': 3114240, 'steps': 16219, 'loss/train': 1.8827407360076904} -11/06/2021 23:32:46 - INFO - __main__ - Step 16221: {'lr': 0.0004886972125576079, 'samples': 3114432, 'steps': 16220, 'loss/train': 1.24242103099823} -11/06/2021 23:32:46 - INFO - __main__ - Step 16222: {'lr': 0.0004886956348894069, 'samples': 3114624, 'steps': 16221, 'loss/train': 1.3726708889007568} -11/06/2021 23:32:47 - INFO - __main__ - Step 16223: {'lr': 0.0004886940571136533, 'samples': 3114816, 'steps': 16222, 'loss/train': 1.7079288959503174} -11/06/2021 23:32:47 - INFO - __main__ - Step 16224: {'lr': 0.0004886924792303479, 'samples': 3115008, 'steps': 16223, 'loss/train': 1.7370092868804932} -11/06/2021 23:32:47 - INFO - __main__ - Step 16225: {'lr': 0.0004886909012394913, 'samples': 3115200, 'steps': 16224, 'loss/train': 1.8899927139282227} -11/06/2021 23:32:48 - INFO - __main__ - Step 16226: {'lr': 0.0004886893231410844, 'samples': 3115392, 'steps': 16225, 'loss/train': 2.2528281211853027} -11/06/2021 23:32:49 - INFO - __main__ - Step 16227: {'lr': 0.0004886877449351276, 'samples': 3115584, 'steps': 16226, 'loss/train': 1.8323493003845215} -11/06/2021 23:32:49 - INFO - __main__ - Step 16228: {'lr': 0.0004886861666216219, 'samples': 3115776, 'steps': 16227, 'loss/train': 1.1392507553100586} -11/06/2021 23:32:49 - INFO - __main__ - Step 16229: {'lr': 0.0004886845882005679, 'samples': 3115968, 'steps': 16228, 'loss/train': 1.4808542728424072} -11/06/2021 23:32:50 - INFO - __main__ - Step 16230: {'lr': 0.0004886830096719662, 'samples': 3116160, 'steps': 16229, 'loss/train': 2.0018463134765625} -11/06/2021 23:32:51 - INFO - __main__ - Step 16231: {'lr': 0.0004886814310358176, 'samples': 3116352, 'steps': 16230, 'loss/train': 1.9077577590942383} -11/06/2021 23:32:51 - INFO - __main__ - Step 16232: {'lr': 0.000488679852292123, 'samples': 3116544, 'steps': 16231, 'loss/train': 1.6845556497573853} -11/06/2021 23:32:52 - INFO - __main__ - Step 16233: {'lr': 0.0004886782734408828, 'samples': 3116736, 'steps': 16232, 'loss/train': 1.8097872734069824} -11/06/2021 23:32:52 - INFO - __main__ - Step 16234: {'lr': 0.0004886766944820979, 'samples': 3116928, 'steps': 16233, 'loss/train': 1.961445927619934} -11/06/2021 23:32:52 - INFO - __main__ - Step 16235: {'lr': 0.0004886751154157689, 'samples': 3117120, 'steps': 16234, 'loss/train': 1.6174712181091309} -11/06/2021 23:32:53 - INFO - __main__ - Step 16236: {'lr': 0.0004886735362418967, 'samples': 3117312, 'steps': 16235, 'loss/train': 1.9013572931289673} -11/06/2021 23:32:54 - INFO - __main__ - Step 16237: {'lr': 0.0004886719569604818, 'samples': 3117504, 'steps': 16236, 'loss/train': 1.3297522068023682} -11/06/2021 23:32:54 - INFO - __main__ - Step 16238: {'lr': 0.000488670377571525, 'samples': 3117696, 'steps': 16237, 'loss/train': 1.2586119174957275} -11/06/2021 23:32:54 - INFO - __main__ - Step 16239: {'lr': 0.0004886687980750271, 'samples': 3117888, 'steps': 16238, 'loss/train': 1.6158231496810913} -11/06/2021 23:32:55 - INFO - __main__ - Step 16240: {'lr': 0.0004886672184709886, 'samples': 3118080, 'steps': 16239, 'loss/train': 1.4461692571640015} -11/06/2021 23:32:55 - INFO - __main__ - Step 16241: {'lr': 0.0004886656387594104, 'samples': 3118272, 'steps': 16240, 'loss/train': 1.8390427827835083} -11/06/2021 23:32:56 - INFO - __main__ - Step 16242: {'lr': 0.0004886640589402932, 'samples': 3118464, 'steps': 16241, 'loss/train': 1.874056339263916} -11/06/2021 23:32:56 - INFO - __main__ - Step 16243: {'lr': 0.0004886624790136375, 'samples': 3118656, 'steps': 16242, 'loss/train': 1.866011619567871} -11/06/2021 23:32:57 - INFO - __main__ - Step 16244: {'lr': 0.0004886608989794443, 'samples': 3118848, 'steps': 16243, 'loss/train': 1.8699171543121338} -11/06/2021 23:32:57 - INFO - __main__ - Step 16245: {'lr': 0.0004886593188377142, 'samples': 3119040, 'steps': 16244, 'loss/train': 1.6724590063095093} -11/06/2021 23:32:57 - INFO - __main__ - Step 16246: {'lr': 0.0004886577385884478, 'samples': 3119232, 'steps': 16245, 'loss/train': 1.6517481803894043} -11/06/2021 23:32:59 - INFO - __main__ - Step 16247: {'lr': 0.0004886561582316458, 'samples': 3119424, 'steps': 16246, 'loss/train': 2.0058236122131348} -11/06/2021 23:32:59 - INFO - __main__ - Step 16248: {'lr': 0.0004886545777673093, 'samples': 3119616, 'steps': 16247, 'loss/train': 1.7186330556869507} -11/06/2021 23:32:59 - INFO - __main__ - Step 16249: {'lr': 0.0004886529971954385, 'samples': 3119808, 'steps': 16248, 'loss/train': 1.8039087057113647} -11/06/2021 23:33:00 - INFO - __main__ - Step 16250: {'lr': 0.0004886514165160345, 'samples': 3120000, 'steps': 16249, 'loss/train': 1.7493343353271484} -11/06/2021 23:33:00 - INFO - __main__ - Step 16251: {'lr': 0.0004886498357290979, 'samples': 3120192, 'steps': 16250, 'loss/train': 2.166086196899414} -11/06/2021 23:33:01 - INFO - __main__ - Step 16252: {'lr': 0.0004886482548346291, 'samples': 3120384, 'steps': 16251, 'loss/train': 2.0029032230377197} -11/06/2021 23:33:01 - INFO - __main__ - Step 16253: {'lr': 0.0004886466738326293, 'samples': 3120576, 'steps': 16252, 'loss/train': 1.9279859066009521} -11/06/2021 23:33:02 - INFO - __main__ - Step 16254: {'lr': 0.000488645092723099, 'samples': 3120768, 'steps': 16253, 'loss/train': 1.5185385942459106} -11/06/2021 23:33:02 - INFO - __main__ - Step 16255: {'lr': 0.0004886435115060388, 'samples': 3120960, 'steps': 16254, 'loss/train': 1.7781718969345093} -11/06/2021 23:33:02 - INFO - __main__ - Step 16256: {'lr': 0.0004886419301814495, 'samples': 3121152, 'steps': 16255, 'loss/train': 1.7876300811767578} -11/06/2021 23:33:03 - INFO - __main__ - Step 16257: {'lr': 0.0004886403487493319, 'samples': 3121344, 'steps': 16256, 'loss/train': 1.7171152830123901} -11/06/2021 23:33:04 - INFO - __main__ - Step 16258: {'lr': 0.0004886387672096866, 'samples': 3121536, 'steps': 16257, 'loss/train': 1.8690319061279297} -11/06/2021 23:33:04 - INFO - __main__ - Step 16259: {'lr': 0.0004886371855625143, 'samples': 3121728, 'steps': 16258, 'loss/train': 1.2483769655227661} -11/06/2021 23:33:04 - INFO - __main__ - Step 16260: {'lr': 0.0004886356038078159, 'samples': 3121920, 'steps': 16259, 'loss/train': 2.029406785964966} -11/06/2021 23:33:05 - INFO - __main__ - Step 16261: {'lr': 0.0004886340219455919, 'samples': 3122112, 'steps': 16260, 'loss/train': 1.9332122802734375} -11/06/2021 23:33:06 - INFO - __main__ - Step 16262: {'lr': 0.0004886324399758431, 'samples': 3122304, 'steps': 16261, 'loss/train': 1.5385150909423828} -11/06/2021 23:33:07 - INFO - __main__ - Step 16263: {'lr': 0.0004886308578985702, 'samples': 3122496, 'steps': 16262, 'loss/train': 1.4591851234436035} -11/06/2021 23:33:07 - INFO - __main__ - Step 16264: {'lr': 0.0004886292757137739, 'samples': 3122688, 'steps': 16263, 'loss/train': 1.4665359258651733} -11/06/2021 23:33:07 - INFO - __main__ - Step 16265: {'lr': 0.0004886276934214551, 'samples': 3122880, 'steps': 16264, 'loss/train': 1.3488205671310425} -11/06/2021 23:33:08 - INFO - __main__ - Step 16266: {'lr': 0.0004886261110216141, 'samples': 3123072, 'steps': 16265, 'loss/train': 1.357380986213684} -11/06/2021 23:33:08 - INFO - __main__ - Step 16267: {'lr': 0.000488624528514252, 'samples': 3123264, 'steps': 16266, 'loss/train': 1.822448968887329} -11/06/2021 23:33:08 - INFO - __main__ - Step 16268: {'lr': 0.0004886229458993693, 'samples': 3123456, 'steps': 16267, 'loss/train': 1.8266669511795044} -11/06/2021 23:33:09 - INFO - __main__ - Step 16269: {'lr': 0.0004886213631769669, 'samples': 3123648, 'steps': 16268, 'loss/train': 1.6113994121551514} -11/06/2021 23:33:10 - INFO - __main__ - Step 16270: {'lr': 0.0004886197803470453, 'samples': 3123840, 'steps': 16269, 'loss/train': 2.0622076988220215} -11/06/2021 23:33:10 - INFO - __main__ - Step 16271: {'lr': 0.0004886181974096052, 'samples': 3124032, 'steps': 16270, 'loss/train': 1.6397887468338013} -11/06/2021 23:33:10 - INFO - __main__ - Step 16272: {'lr': 0.0004886166143646476, 'samples': 3124224, 'steps': 16271, 'loss/train': 1.217058777809143} -11/06/2021 23:33:11 - INFO - __main__ - Step 16273: {'lr': 0.000488615031212173, 'samples': 3124416, 'steps': 16272, 'loss/train': 1.726121187210083} -11/06/2021 23:33:12 - INFO - __main__ - Step 16274: {'lr': 0.0004886134479521821, 'samples': 3124608, 'steps': 16273, 'loss/train': 1.4393755197525024} -11/06/2021 23:33:12 - INFO - __main__ - Step 16275: {'lr': 0.0004886118645846757, 'samples': 3124800, 'steps': 16274, 'loss/train': 2.080183506011963} -11/06/2021 23:33:13 - INFO - __main__ - Step 16276: {'lr': 0.0004886102811096544, 'samples': 3124992, 'steps': 16275, 'loss/train': 1.4109009504318237} -11/06/2021 23:33:13 - INFO - __main__ - Step 16277: {'lr': 0.0004886086975271191, 'samples': 3125184, 'steps': 16276, 'loss/train': 0.7202199101448059} -11/06/2021 23:33:13 - INFO - __main__ - Step 16278: {'lr': 0.0004886071138370704, 'samples': 3125376, 'steps': 16277, 'loss/train': 1.714578628540039} -11/06/2021 23:33:14 - INFO - __main__ - Step 16279: {'lr': 0.000488605530039509, 'samples': 3125568, 'steps': 16278, 'loss/train': 2.0787177085876465} -11/06/2021 23:33:15 - INFO - __main__ - Step 16280: {'lr': 0.0004886039461344356, 'samples': 3125760, 'steps': 16279, 'loss/train': 1.3188015222549438} -11/06/2021 23:33:15 - INFO - __main__ - Step 16281: {'lr': 0.0004886023621218509, 'samples': 3125952, 'steps': 16280, 'loss/train': 0.2149624228477478} -11/06/2021 23:33:15 - INFO - __main__ - Step 16282: {'lr': 0.0004886007780017557, 'samples': 3126144, 'steps': 16281, 'loss/train': 1.910459280014038} -11/06/2021 23:33:16 - INFO - __main__ - Step 16283: {'lr': 0.0004885991937741506, 'samples': 3126336, 'steps': 16282, 'loss/train': 1.2737128734588623} -11/06/2021 23:33:17 - INFO - __main__ - Step 16284: {'lr': 0.0004885976094390366, 'samples': 3126528, 'steps': 16283, 'loss/train': 1.7941306829452515} -11/06/2021 23:33:17 - INFO - __main__ - Step 16285: {'lr': 0.000488596024996414, 'samples': 3126720, 'steps': 16284, 'loss/train': 1.8777819871902466} -11/06/2021 23:33:18 - INFO - __main__ - Step 16286: {'lr': 0.0004885944404462838, 'samples': 3126912, 'steps': 16285, 'loss/train': 1.9789512157440186} -11/06/2021 23:33:18 - INFO - __main__ - Step 16287: {'lr': 0.0004885928557886466, 'samples': 3127104, 'steps': 16286, 'loss/train': 1.347070574760437} -11/06/2021 23:33:18 - INFO - __main__ - Step 16288: {'lr': 0.0004885912710235031, 'samples': 3127296, 'steps': 16287, 'loss/train': 1.7394129037857056} -11/06/2021 23:33:19 - INFO - __main__ - Step 16289: {'lr': 0.0004885896861508541, 'samples': 3127488, 'steps': 16288, 'loss/train': 1.1697927713394165} -11/06/2021 23:33:20 - INFO - __main__ - Step 16290: {'lr': 0.0004885881011707003, 'samples': 3127680, 'steps': 16289, 'loss/train': 1.684749960899353} -11/06/2021 23:33:20 - INFO - __main__ - Step 16291: {'lr': 0.0004885865160830422, 'samples': 3127872, 'steps': 16290, 'loss/train': 1.4211009740829468} -11/06/2021 23:33:20 - INFO - __main__ - Step 16292: {'lr': 0.0004885849308878809, 'samples': 3128064, 'steps': 16291, 'loss/train': 1.1847530603408813} -11/06/2021 23:33:21 - INFO - __main__ - Step 16293: {'lr': 0.0004885833455852169, 'samples': 3128256, 'steps': 16292, 'loss/train': 3.3935234546661377} -11/06/2021 23:33:21 - INFO - __main__ - Step 16294: {'lr': 0.0004885817601750509, 'samples': 3128448, 'steps': 16293, 'loss/train': 1.7725669145584106} -11/06/2021 23:33:22 - INFO - __main__ - Step 16295: {'lr': 0.0004885801746573836, 'samples': 3128640, 'steps': 16294, 'loss/train': 1.7294930219650269} -11/06/2021 23:33:22 - INFO - __main__ - Step 16296: {'lr': 0.0004885785890322158, 'samples': 3128832, 'steps': 16295, 'loss/train': 1.4970622062683105} -11/06/2021 23:33:23 - INFO - __main__ - Step 16297: {'lr': 0.0004885770032995482, 'samples': 3129024, 'steps': 16296, 'loss/train': 2.0539581775665283} -11/06/2021 23:33:23 - INFO - __main__ - Step 16298: {'lr': 0.0004885754174593814, 'samples': 3129216, 'steps': 16297, 'loss/train': 1.6017131805419922} -11/06/2021 23:33:24 - INFO - __main__ - Step 16299: {'lr': 0.0004885738315117162, 'samples': 3129408, 'steps': 16298, 'loss/train': 1.718274474143982} -11/06/2021 23:33:25 - INFO - __main__ - Step 16300: {'lr': 0.0004885722454565534, 'samples': 3129600, 'steps': 16299, 'loss/train': 1.6284193992614746} -11/06/2021 23:33:25 - INFO - __main__ - Step 16301: {'lr': 0.0004885706592938936, 'samples': 3129792, 'steps': 16300, 'loss/train': 1.8225423097610474} -11/06/2021 23:33:26 - INFO - __main__ - Step 16302: {'lr': 0.0004885690730237375, 'samples': 3129984, 'steps': 16301, 'loss/train': 5.086080551147461} -11/06/2021 23:33:26 - INFO - __main__ - Step 16303: {'lr': 0.0004885674866460858, 'samples': 3130176, 'steps': 16302, 'loss/train': 1.6252819299697876} -11/06/2021 23:33:26 - INFO - __main__ - Step 16304: {'lr': 0.0004885659001609393, 'samples': 3130368, 'steps': 16303, 'loss/train': 1.6549954414367676} -11/06/2021 23:33:27 - INFO - __main__ - Step 16305: {'lr': 0.0004885643135682987, 'samples': 3130560, 'steps': 16304, 'loss/train': 1.7220511436462402} -11/06/2021 23:33:28 - INFO - __main__ - Step 16306: {'lr': 0.0004885627268681648, 'samples': 3130752, 'steps': 16305, 'loss/train': 1.3783352375030518} -11/06/2021 23:33:28 - INFO - __main__ - Step 16307: {'lr': 0.0004885611400605381, 'samples': 3130944, 'steps': 16306, 'loss/train': 1.6854547262191772} -11/06/2021 23:33:28 - INFO - __main__ - Step 16308: {'lr': 0.0004885595531454195, 'samples': 3131136, 'steps': 16307, 'loss/train': 1.55535888671875} -11/06/2021 23:33:29 - INFO - __main__ - Step 16309: {'lr': 0.0004885579661228097, 'samples': 3131328, 'steps': 16308, 'loss/train': 1.7425678968429565} -11/06/2021 23:33:29 - INFO - __main__ - Step 16310: {'lr': 0.0004885563789927092, 'samples': 3131520, 'steps': 16309, 'loss/train': 1.6261141300201416} -11/06/2021 23:33:30 - INFO - __main__ - Step 16311: {'lr': 0.0004885547917551189, 'samples': 3131712, 'steps': 16310, 'loss/train': 1.6285531520843506} -11/06/2021 23:33:30 - INFO - __main__ - Step 16312: {'lr': 0.0004885532044100396, 'samples': 3131904, 'steps': 16311, 'loss/train': 2.0965306758880615} -11/06/2021 23:33:31 - INFO - __main__ - Step 16313: {'lr': 0.0004885516169574719, 'samples': 3132096, 'steps': 16312, 'loss/train': 1.7948811054229736} -11/06/2021 23:33:31 - INFO - __main__ - Step 16314: {'lr': 0.0004885500293974165, 'samples': 3132288, 'steps': 16313, 'loss/train': 1.4973307847976685} -11/06/2021 23:33:32 - INFO - __main__ - Step 16315: {'lr': 0.0004885484417298741, 'samples': 3132480, 'steps': 16314, 'loss/train': 1.1816359758377075} -11/06/2021 23:33:32 - INFO - __main__ - Step 16316: {'lr': 0.0004885468539548455, 'samples': 3132672, 'steps': 16315, 'loss/train': 1.3534947633743286} -11/06/2021 23:33:33 - INFO - __main__ - Step 16317: {'lr': 0.0004885452660723313, 'samples': 3132864, 'steps': 16316, 'loss/train': 1.4789822101593018} -11/06/2021 23:33:33 - INFO - __main__ - Step 16318: {'lr': 0.0004885436780823324, 'samples': 3133056, 'steps': 16317, 'loss/train': 1.8241922855377197} -11/06/2021 23:33:34 - INFO - __main__ - Step 16319: {'lr': 0.0004885420899848492, 'samples': 3133248, 'steps': 16318, 'loss/train': 1.9675356149673462} -11/06/2021 23:33:34 - INFO - __main__ - Step 16320: {'lr': 0.0004885405017798828, 'samples': 3133440, 'steps': 16319, 'loss/train': 2.023437023162842} -11/06/2021 23:33:34 - INFO - __main__ - Step 16321: {'lr': 0.0004885389134674337, 'samples': 3133632, 'steps': 16320, 'loss/train': 1.4244306087493896} -11/06/2021 23:33:35 - INFO - __main__ - Step 16322: {'lr': 0.0004885373250475026, 'samples': 3133824, 'steps': 16321, 'loss/train': 1.2528997659683228} -11/06/2021 23:33:36 - INFO - __main__ - Step 16323: {'lr': 0.0004885357365200903, 'samples': 3134016, 'steps': 16322, 'loss/train': 1.5098944902420044} -11/06/2021 23:33:36 - INFO - __main__ - Step 16324: {'lr': 0.0004885341478851975, 'samples': 3134208, 'steps': 16323, 'loss/train': 1.332453966140747} -11/06/2021 23:33:37 - INFO - __main__ - Step 16325: {'lr': 0.0004885325591428248, 'samples': 3134400, 'steps': 16324, 'loss/train': 0.9680758118629456} -11/06/2021 23:33:37 - INFO - __main__ - Step 16326: {'lr': 0.0004885309702929731, 'samples': 3134592, 'steps': 16325, 'loss/train': 2.230714797973633} -11/06/2021 23:33:38 - INFO - __main__ - Step 16327: {'lr': 0.000488529381335643, 'samples': 3134784, 'steps': 16326, 'loss/train': 1.5488425493240356} -11/06/2021 23:33:38 - INFO - __main__ - Step 16328: {'lr': 0.0004885277922708352, 'samples': 3134976, 'steps': 16327, 'loss/train': 1.5818017721176147} -11/06/2021 23:33:39 - INFO - __main__ - Step 16329: {'lr': 0.0004885262030985504, 'samples': 3135168, 'steps': 16328, 'loss/train': 1.6726022958755493} -11/06/2021 23:33:39 - INFO - __main__ - Step 16330: {'lr': 0.0004885246138187896, 'samples': 3135360, 'steps': 16329, 'loss/train': 1.5830050706863403} -11/06/2021 23:33:39 - INFO - __main__ - Step 16331: {'lr': 0.0004885230244315531, 'samples': 3135552, 'steps': 16330, 'loss/train': 1.6243305206298828} -11/06/2021 23:33:40 - INFO - __main__ - Step 16332: {'lr': 0.0004885214349368419, 'samples': 3135744, 'steps': 16331, 'loss/train': 1.477682113647461} -11/06/2021 23:33:41 - INFO - __main__ - Step 16333: {'lr': 0.0004885198453346565, 'samples': 3135936, 'steps': 16332, 'loss/train': 1.5040385723114014} -11/06/2021 23:33:41 - INFO - __main__ - Step 16334: {'lr': 0.0004885182556249978, 'samples': 3136128, 'steps': 16333, 'loss/train': 1.872546672821045} -11/06/2021 23:33:41 - INFO - __main__ - Step 16335: {'lr': 0.0004885166658078666, 'samples': 3136320, 'steps': 16334, 'loss/train': 1.3030028343200684} -11/06/2021 23:33:42 - INFO - __main__ - Step 16336: {'lr': 0.0004885150758832632, 'samples': 3136512, 'steps': 16335, 'loss/train': 1.7622499465942383} -11/06/2021 23:33:43 - INFO - __main__ - Step 16337: {'lr': 0.0004885134858511888, 'samples': 3136704, 'steps': 16336, 'loss/train': 1.5407360792160034} -11/06/2021 23:33:43 - INFO - __main__ - Step 16338: {'lr': 0.0004885118957116438, 'samples': 3136896, 'steps': 16337, 'loss/train': 1.1537578105926514} -11/06/2021 23:33:44 - INFO - __main__ - Step 16339: {'lr': 0.000488510305464629, 'samples': 3137088, 'steps': 16338, 'loss/train': 1.9556260108947754} -11/06/2021 23:33:44 - INFO - __main__ - Step 16340: {'lr': 0.0004885087151101453, 'samples': 3137280, 'steps': 16339, 'loss/train': 1.7774170637130737} -11/06/2021 23:33:44 - INFO - __main__ - Step 16341: {'lr': 0.0004885071246481931, 'samples': 3137472, 'steps': 16340, 'loss/train': 1.5609866380691528} -11/06/2021 23:33:45 - INFO - __main__ - Step 16342: {'lr': 0.0004885055340787733, 'samples': 3137664, 'steps': 16341, 'loss/train': 2.0309407711029053} -11/06/2021 23:33:46 - INFO - __main__ - Step 16343: {'lr': 0.0004885039434018866, 'samples': 3137856, 'steps': 16342, 'loss/train': 1.1930187940597534} -11/06/2021 23:33:46 - INFO - __main__ - Step 16344: {'lr': 0.0004885023526175337, 'samples': 3138048, 'steps': 16343, 'loss/train': 1.741970181465149} -11/06/2021 23:33:46 - INFO - __main__ - Step 16345: {'lr': 0.0004885007617257154, 'samples': 3138240, 'steps': 16344, 'loss/train': 1.7933660745620728} -11/06/2021 23:33:47 - INFO - __main__ - Step 16346: {'lr': 0.0004884991707264322, 'samples': 3138432, 'steps': 16345, 'loss/train': 0.6066716909408569} -11/06/2021 23:33:47 - INFO - __main__ - Step 16347: {'lr': 0.000488497579619685, 'samples': 3138624, 'steps': 16346, 'loss/train': 1.3735432624816895} -11/06/2021 23:33:48 - INFO - __main__ - Step 16348: {'lr': 0.0004884959884054745, 'samples': 3138816, 'steps': 16347, 'loss/train': 1.762027621269226} -11/06/2021 23:33:48 - INFO - __main__ - Step 16349: {'lr': 0.0004884943970838014, 'samples': 3139008, 'steps': 16348, 'loss/train': 1.6400388479232788} -11/06/2021 23:33:49 - INFO - __main__ - Step 16350: {'lr': 0.0004884928056546663, 'samples': 3139200, 'steps': 16349, 'loss/train': 1.1514432430267334} -11/06/2021 23:33:49 - INFO - __main__ - Step 16351: {'lr': 0.0004884912141180701, 'samples': 3139392, 'steps': 16350, 'loss/train': 1.8475518226623535} -11/06/2021 23:33:49 - INFO - __main__ - Step 16352: {'lr': 0.0004884896224740136, 'samples': 3139584, 'steps': 16351, 'loss/train': 2.076098918914795} -11/06/2021 23:33:51 - INFO - __main__ - Step 16353: {'lr': 0.0004884880307224972, 'samples': 3139776, 'steps': 16352, 'loss/train': 1.0980122089385986} -11/06/2021 23:33:52 - INFO - __main__ - Step 16354: {'lr': 0.0004884864388635217, 'samples': 3139968, 'steps': 16353, 'loss/train': 2.0552711486816406} -11/06/2021 23:33:52 - INFO - __main__ - Step 16355: {'lr': 0.0004884848468970879, 'samples': 3140160, 'steps': 16354, 'loss/train': 1.639860987663269} -11/06/2021 23:33:52 - INFO - __main__ - Step 16356: {'lr': 0.0004884832548231966, 'samples': 3140352, 'steps': 16355, 'loss/train': 1.732427716255188} -11/06/2021 23:33:53 - INFO - __main__ - Step 16357: {'lr': 0.0004884816626418484, 'samples': 3140544, 'steps': 16356, 'loss/train': 1.1739200353622437} -11/06/2021 23:33:53 - INFO - __main__ - Step 16358: {'lr': 0.000488480070353044, 'samples': 3140736, 'steps': 16357, 'loss/train': 1.8249778747558594} -11/06/2021 23:33:53 - INFO - __main__ - Step 16359: {'lr': 0.0004884784779567843, 'samples': 3140928, 'steps': 16358, 'loss/train': 1.5144319534301758} -11/06/2021 23:33:55 - INFO - __main__ - Step 16360: {'lr': 0.0004884768854530696, 'samples': 3141120, 'steps': 16359, 'loss/train': 1.685762882232666} -11/06/2021 23:33:55 - INFO - __main__ - Step 16361: {'lr': 0.0004884752928419012, 'samples': 3141312, 'steps': 16360, 'loss/train': 1.7363823652267456} -11/06/2021 23:33:55 - INFO - __main__ - Step 16362: {'lr': 0.0004884737001232793, 'samples': 3141504, 'steps': 16361, 'loss/train': 1.8232380151748657} -11/06/2021 23:33:56 - INFO - __main__ - Step 16363: {'lr': 0.000488472107297205, 'samples': 3141696, 'steps': 16362, 'loss/train': 1.5497318506240845} -11/06/2021 23:33:56 - INFO - __main__ - Step 16364: {'lr': 0.0004884705143636788, 'samples': 3141888, 'steps': 16363, 'loss/train': 0.7053847312927246} -11/06/2021 23:33:57 - INFO - __main__ - Step 16365: {'lr': 0.0004884689213227013, 'samples': 3142080, 'steps': 16364, 'loss/train': 1.7800610065460205} -11/06/2021 23:33:57 - INFO - __main__ - Step 16366: {'lr': 0.0004884673281742736, 'samples': 3142272, 'steps': 16365, 'loss/train': 1.5720760822296143} -11/06/2021 23:33:58 - INFO - __main__ - Step 16367: {'lr': 0.0004884657349183961, 'samples': 3142464, 'steps': 16366, 'loss/train': 1.697306513786316} -11/06/2021 23:33:58 - INFO - __main__ - Step 16368: {'lr': 0.0004884641415550696, 'samples': 3142656, 'steps': 16367, 'loss/train': 1.6368969678878784} -11/06/2021 23:33:58 - INFO - __main__ - Step 16369: {'lr': 0.0004884625480842949, 'samples': 3142848, 'steps': 16368, 'loss/train': 1.6560715436935425} -11/06/2021 23:34:00 - INFO - __main__ - Step 16370: {'lr': 0.0004884609545060726, 'samples': 3143040, 'steps': 16369, 'loss/train': 1.2425155639648438} -11/06/2021 23:34:00 - INFO - __main__ - Step 16371: {'lr': 0.0004884593608204035, 'samples': 3143232, 'steps': 16370, 'loss/train': 1.0383766889572144} -11/06/2021 23:34:00 - INFO - __main__ - Step 16372: {'lr': 0.0004884577670272882, 'samples': 3143424, 'steps': 16371, 'loss/train': 1.6095656156539917} -11/06/2021 23:34:01 - INFO - __main__ - Step 16373: {'lr': 0.0004884561731267278, 'samples': 3143616, 'steps': 16372, 'loss/train': 2.9992105960845947} -11/06/2021 23:34:01 - INFO - __main__ - Step 16374: {'lr': 0.0004884545791187224, 'samples': 3143808, 'steps': 16373, 'loss/train': 1.24136483669281} -11/06/2021 23:34:02 - INFO - __main__ - Step 16375: {'lr': 0.0004884529850032732, 'samples': 3144000, 'steps': 16374, 'loss/train': 0.2827925384044647} -11/06/2021 23:34:03 - INFO - __main__ - Step 16376: {'lr': 0.0004884513907803808, 'samples': 3144192, 'steps': 16375, 'loss/train': 2.1391053199768066} -11/06/2021 23:34:03 - INFO - __main__ - Step 16377: {'lr': 0.0004884497964500457, 'samples': 3144384, 'steps': 16376, 'loss/train': 1.8426679372787476} -11/06/2021 23:34:03 - INFO - __main__ - Step 16378: {'lr': 0.000488448202012269, 'samples': 3144576, 'steps': 16377, 'loss/train': 1.9780805110931396} -11/06/2021 23:34:04 - INFO - __main__ - Step 16379: {'lr': 0.0004884466074670512, 'samples': 3144768, 'steps': 16378, 'loss/train': 1.9465229511260986} -11/06/2021 23:34:05 - INFO - __main__ - Step 16380: {'lr': 0.0004884450128143929, 'samples': 3144960, 'steps': 16379, 'loss/train': 1.7582536935806274} -11/06/2021 23:34:05 - INFO - __main__ - Step 16381: {'lr': 0.000488443418054295, 'samples': 3145152, 'steps': 16380, 'loss/train': 1.4283581972122192} -11/06/2021 23:34:06 - INFO - __main__ - Step 16382: {'lr': 0.0004884418231867583, 'samples': 3145344, 'steps': 16381, 'loss/train': 1.8179876804351807} -11/06/2021 23:34:06 - INFO - __main__ - Step 16383: {'lr': 0.0004884402282117833, 'samples': 3145536, 'steps': 16382, 'loss/train': 0.8137797117233276} -11/06/2021 23:34:06 - INFO - __main__ - Step 16384: {'lr': 0.0004884386331293708, 'samples': 3145728, 'steps': 16383, 'loss/train': 2.007157564163208} -11/06/2021 23:34:07 - INFO - __main__ - Step 16385: {'lr': 0.0004884370379395215, 'samples': 3145920, 'steps': 16384, 'loss/train': 1.2791186571121216} -11/06/2021 23:34:08 - INFO - __main__ - Step 16386: {'lr': 0.0004884354426422363, 'samples': 3146112, 'steps': 16385, 'loss/train': 2.190890073776245} -11/06/2021 23:34:08 - INFO - __main__ - Step 16387: {'lr': 0.0004884338472375156, 'samples': 3146304, 'steps': 16386, 'loss/train': 1.5550997257232666} -11/06/2021 23:34:08 - INFO - __main__ - Step 16388: {'lr': 0.0004884322517253604, 'samples': 3146496, 'steps': 16387, 'loss/train': 1.888465404510498} -11/06/2021 23:34:09 - INFO - __main__ - Step 16389: {'lr': 0.0004884306561057713, 'samples': 3146688, 'steps': 16388, 'loss/train': 1.8606306314468384} -11/06/2021 23:34:09 - INFO - __main__ - Step 16390: {'lr': 0.000488429060378749, 'samples': 3146880, 'steps': 16389, 'loss/train': 1.8474323749542236} -11/06/2021 23:34:09 - INFO - __main__ - Step 16391: {'lr': 0.0004884274645442942, 'samples': 3147072, 'steps': 16390, 'loss/train': 1.6243537664413452} -11/06/2021 23:34:10 - INFO - __main__ - Step 16392: {'lr': 0.0004884258686024077, 'samples': 3147264, 'steps': 16391, 'loss/train': 2.085355758666992} -11/06/2021 23:34:11 - INFO - __main__ - Step 16393: {'lr': 0.0004884242725530902, 'samples': 3147456, 'steps': 16392, 'loss/train': 1.4458762407302856} -11/06/2021 23:34:11 - INFO - __main__ - Step 16394: {'lr': 0.0004884226763963423, 'samples': 3147648, 'steps': 16393, 'loss/train': 1.4372462034225464} -11/06/2021 23:34:12 - INFO - __main__ - Step 16395: {'lr': 0.000488421080132165, 'samples': 3147840, 'steps': 16394, 'loss/train': 1.3019970655441284} -11/06/2021 23:34:12 - INFO - __main__ - Step 16396: {'lr': 0.0004884194837605587, 'samples': 3148032, 'steps': 16395, 'loss/train': 1.6716073751449585} -11/06/2021 23:34:13 - INFO - __main__ - Step 16397: {'lr': 0.0004884178872815243, 'samples': 3148224, 'steps': 16396, 'loss/train': 1.440213680267334} -11/06/2021 23:34:13 - INFO - __main__ - Step 16398: {'lr': 0.0004884162906950624, 'samples': 3148416, 'steps': 16397, 'loss/train': 1.1032469272613525} -11/06/2021 23:34:14 - INFO - __main__ - Step 16399: {'lr': 0.000488414694001174, 'samples': 3148608, 'steps': 16398, 'loss/train': 1.7716431617736816} -11/06/2021 23:34:14 - INFO - __main__ - Step 16400: {'lr': 0.0004884130971998595, 'samples': 3148800, 'steps': 16399, 'loss/train': 1.464718222618103} -11/06/2021 23:34:14 - INFO - __main__ - Step 16401: {'lr': 0.0004884115002911197, 'samples': 3148992, 'steps': 16400, 'loss/train': 2.2289278507232666} -11/06/2021 23:34:15 - INFO - __main__ - Step 16402: {'lr': 0.0004884099032749554, 'samples': 3149184, 'steps': 16401, 'loss/train': 1.3836721181869507} -11/06/2021 23:34:16 - INFO - __main__ - Step 16403: {'lr': 0.0004884083061513672, 'samples': 3149376, 'steps': 16402, 'loss/train': 1.9239706993103027} -11/06/2021 23:34:16 - INFO - __main__ - Step 16404: {'lr': 0.0004884067089203559, 'samples': 3149568, 'steps': 16403, 'loss/train': 1.8463945388793945} -11/06/2021 23:34:16 - INFO - __main__ - Step 16405: {'lr': 0.0004884051115819224, 'samples': 3149760, 'steps': 16404, 'loss/train': 2.2028331756591797} -11/06/2021 23:34:17 - INFO - __main__ - Step 16406: {'lr': 0.000488403514136067, 'samples': 3149952, 'steps': 16405, 'loss/train': 1.876776099205017} -11/06/2021 23:34:18 - INFO - __main__ - Step 16407: {'lr': 0.0004884019165827909, 'samples': 3150144, 'steps': 16406, 'loss/train': 2.1374125480651855} -11/06/2021 23:34:18 - INFO - __main__ - Step 16408: {'lr': 0.0004884003189220945, 'samples': 3150336, 'steps': 16407, 'loss/train': 1.7482624053955078} -11/06/2021 23:34:19 - INFO - __main__ - Step 16409: {'lr': 0.0004883987211539785, 'samples': 3150528, 'steps': 16408, 'loss/train': 1.7053028345108032} -11/06/2021 23:34:19 - INFO - __main__ - Step 16410: {'lr': 0.0004883971232784438, 'samples': 3150720, 'steps': 16409, 'loss/train': 1.538672685623169} -11/06/2021 23:34:19 - INFO - __main__ - Step 16411: {'lr': 0.0004883955252954909, 'samples': 3150912, 'steps': 16410, 'loss/train': 1.7705274820327759} -11/06/2021 23:34:20 - INFO - __main__ - Step 16412: {'lr': 0.0004883939272051208, 'samples': 3151104, 'steps': 16411, 'loss/train': 0.9273844957351685} -11/06/2021 23:34:21 - INFO - __main__ - Step 16413: {'lr': 0.000488392329007334, 'samples': 3151296, 'steps': 16412, 'loss/train': 2.2184743881225586} -11/06/2021 23:34:21 - INFO - __main__ - Step 16414: {'lr': 0.0004883907307021314, 'samples': 3151488, 'steps': 16413, 'loss/train': 1.27170729637146} -11/06/2021 23:34:21 - INFO - __main__ - Step 16415: {'lr': 0.0004883891322895134, 'samples': 3151680, 'steps': 16414, 'loss/train': 1.9354814291000366} -11/06/2021 23:34:22 - INFO - __main__ - Step 16416: {'lr': 0.000488387533769481, 'samples': 3151872, 'steps': 16415, 'loss/train': 1.3187230825424194} -11/06/2021 23:34:22 - INFO - __main__ - Step 16417: {'lr': 0.000488385935142035, 'samples': 3152064, 'steps': 16416, 'loss/train': 1.2268887758255005} -11/06/2021 23:34:23 - INFO - __main__ - Step 16418: {'lr': 0.0004883843364071759, 'samples': 3152256, 'steps': 16417, 'loss/train': 1.435240387916565} -11/06/2021 23:34:23 - INFO - __main__ - Step 16419: {'lr': 0.0004883827375649045, 'samples': 3152448, 'steps': 16418, 'loss/train': 1.6669983863830566} -11/06/2021 23:34:24 - INFO - __main__ - Step 16420: {'lr': 0.0004883811386152216, 'samples': 3152640, 'steps': 16419, 'loss/train': 1.5936235189437866} -11/06/2021 23:34:24 - INFO - __main__ - Step 16421: {'lr': 0.0004883795395581277, 'samples': 3152832, 'steps': 16420, 'loss/train': 1.746578574180603} -11/06/2021 23:34:24 - INFO - __main__ - Step 16422: {'lr': 0.0004883779403936237, 'samples': 3153024, 'steps': 16421, 'loss/train': 2.0167765617370605} -11/06/2021 23:34:26 - INFO - __main__ - Step 16423: {'lr': 0.0004883763411217103, 'samples': 3153216, 'steps': 16422, 'loss/train': 1.6873087882995605} -11/06/2021 23:34:26 - INFO - __main__ - Step 16424: {'lr': 0.0004883747417423882, 'samples': 3153408, 'steps': 16423, 'loss/train': 1.9148794412612915} -11/06/2021 23:34:27 - INFO - __main__ - Step 16425: {'lr': 0.000488373142255658, 'samples': 3153600, 'steps': 16424, 'loss/train': 1.9186967611312866} -11/06/2021 23:34:27 - INFO - __main__ - Step 16426: {'lr': 0.0004883715426615207, 'samples': 3153792, 'steps': 16425, 'loss/train': 1.168741226196289} -11/06/2021 23:34:27 - INFO - __main__ - Step 16427: {'lr': 0.0004883699429599768, 'samples': 3153984, 'steps': 16426, 'loss/train': 1.5318204164505005} -11/06/2021 23:34:28 - INFO - __main__ - Step 16428: {'lr': 0.0004883683431510272, 'samples': 3154176, 'steps': 16427, 'loss/train': 0.9183443784713745} -11/06/2021 23:34:29 - INFO - __main__ - Step 16429: {'lr': 0.0004883667432346723, 'samples': 3154368, 'steps': 16428, 'loss/train': 1.2394202947616577} -11/06/2021 23:34:29 - INFO - __main__ - Step 16430: {'lr': 0.0004883651432109132, 'samples': 3154560, 'steps': 16429, 'loss/train': 1.7920042276382446} -11/06/2021 23:34:29 - INFO - __main__ - Step 16431: {'lr': 0.0004883635430797502, 'samples': 3154752, 'steps': 16430, 'loss/train': 1.7659144401550293} -11/06/2021 23:34:30 - INFO - __main__ - Step 16432: {'lr': 0.0004883619428411846, 'samples': 3154944, 'steps': 16431, 'loss/train': 2.057718276977539} -11/06/2021 23:34:30 - INFO - __main__ - Step 16433: {'lr': 0.0004883603424952165, 'samples': 3155136, 'steps': 16432, 'loss/train': 1.8419935703277588} -11/06/2021 23:34:31 - INFO - __main__ - Step 16434: {'lr': 0.0004883587420418471, 'samples': 3155328, 'steps': 16433, 'loss/train': 1.7195664644241333} -11/06/2021 23:34:32 - INFO - __main__ - Step 16435: {'lr': 0.0004883571414810769, 'samples': 3155520, 'steps': 16434, 'loss/train': 1.438564658164978} -11/06/2021 23:34:32 - INFO - __main__ - Step 16436: {'lr': 0.0004883555408129066, 'samples': 3155712, 'steps': 16435, 'loss/train': 1.904558777809143} -11/06/2021 23:34:32 - INFO - __main__ - Step 16437: {'lr': 0.0004883539400373369, 'samples': 3155904, 'steps': 16436, 'loss/train': 1.708992600440979} -11/06/2021 23:34:33 - INFO - __main__ - Step 16438: {'lr': 0.0004883523391543687, 'samples': 3156096, 'steps': 16437, 'loss/train': 2.0826616287231445} -11/06/2021 23:34:34 - INFO - __main__ - Step 16439: {'lr': 0.0004883507381640026, 'samples': 3156288, 'steps': 16438, 'loss/train': 1.71291184425354} -11/06/2021 23:34:34 - INFO - __main__ - Step 16440: {'lr': 0.0004883491370662393, 'samples': 3156480, 'steps': 16439, 'loss/train': 2.3351950645446777} -11/06/2021 23:34:34 - INFO - __main__ - Step 16441: {'lr': 0.0004883475358610794, 'samples': 3156672, 'steps': 16440, 'loss/train': 1.700568437576294} -11/06/2021 23:34:35 - INFO - __main__ - Step 16442: {'lr': 0.000488345934548524, 'samples': 3156864, 'steps': 16441, 'loss/train': 1.2319788932800293} -11/06/2021 23:34:35 - INFO - __main__ - Step 16443: {'lr': 0.0004883443331285736, 'samples': 3157056, 'steps': 16442, 'loss/train': 1.9203612804412842} -11/06/2021 23:34:36 - INFO - __main__ - Step 16444: {'lr': 0.0004883427316012289, 'samples': 3157248, 'steps': 16443, 'loss/train': 1.382559061050415} -11/06/2021 23:34:36 - INFO - __main__ - Step 16445: {'lr': 0.0004883411299664906, 'samples': 3157440, 'steps': 16444, 'loss/train': 1.7996220588684082} -11/06/2021 23:34:37 - INFO - __main__ - Step 16446: {'lr': 0.0004883395282243595, 'samples': 3157632, 'steps': 16445, 'loss/train': 1.54921293258667} -11/06/2021 23:34:37 - INFO - __main__ - Step 16447: {'lr': 0.0004883379263748363, 'samples': 3157824, 'steps': 16446, 'loss/train': 1.4112991094589233} -11/06/2021 23:34:37 - INFO - __main__ - Step 16448: {'lr': 0.0004883363244179217, 'samples': 3158016, 'steps': 16447, 'loss/train': 2.3577237129211426} -11/06/2021 23:34:38 - INFO - __main__ - Step 16449: {'lr': 0.0004883347223536164, 'samples': 3158208, 'steps': 16448, 'loss/train': 1.258867859840393} -11/06/2021 23:34:39 - INFO - __main__ - Step 16450: {'lr': 0.0004883331201819211, 'samples': 3158400, 'steps': 16449, 'loss/train': 2.188420057296753} -11/06/2021 23:34:39 - INFO - __main__ - Step 16451: {'lr': 0.0004883315179028366, 'samples': 3158592, 'steps': 16450, 'loss/train': 1.7778352499008179} -11/06/2021 23:34:39 - INFO - __main__ - Step 16452: {'lr': 0.0004883299155163636, 'samples': 3158784, 'steps': 16451, 'loss/train': 1.679057002067566} -11/06/2021 23:34:40 - INFO - __main__ - Step 16453: {'lr': 0.0004883283130225029, 'samples': 3158976, 'steps': 16452, 'loss/train': 1.8446472883224487} -11/06/2021 23:34:40 - INFO - __main__ - Step 16454: {'lr': 0.0004883267104212551, 'samples': 3159168, 'steps': 16453, 'loss/train': 0.8045353889465332} -11/06/2021 23:34:42 - INFO - __main__ - Step 16455: {'lr': 0.0004883251077126209, 'samples': 3159360, 'steps': 16454, 'loss/train': 1.5657854080200195} -11/06/2021 23:34:42 - INFO - __main__ - Step 16456: {'lr': 0.0004883235048966011, 'samples': 3159552, 'steps': 16455, 'loss/train': 0.303096204996109} -11/06/2021 23:34:43 - INFO - __main__ - Step 16457: {'lr': 0.0004883219019731964, 'samples': 3159744, 'steps': 16456, 'loss/train': 1.406226634979248} -11/06/2021 23:34:43 - INFO - __main__ - Step 16458: {'lr': 0.0004883202989424076, 'samples': 3159936, 'steps': 16457, 'loss/train': 5.184366226196289} -11/06/2021 23:34:43 - INFO - __main__ - Step 16459: {'lr': 0.0004883186958042354, 'samples': 3160128, 'steps': 16458, 'loss/train': 8.043232917785645} -11/06/2021 23:34:44 - INFO - __main__ - Step 16460: {'lr': 0.0004883170925586804, 'samples': 3160320, 'steps': 16459, 'loss/train': 8.05807876586914} -11/06/2021 23:34:44 - INFO - __main__ - Step 16461: {'lr': 0.0004883154892057433, 'samples': 3160512, 'steps': 16460, 'loss/train': 1.4330828189849854} -11/06/2021 23:34:45 - INFO - __main__ - Step 16462: {'lr': 0.000488313885745425, 'samples': 3160704, 'steps': 16461, 'loss/train': 1.8377580642700195} -11/06/2021 23:34:46 - INFO - __main__ - Step 16463: {'lr': 0.0004883122821777261, 'samples': 3160896, 'steps': 16462, 'loss/train': 1.6536674499511719} -11/06/2021 23:34:46 - INFO - __main__ - Step 16464: {'lr': 0.0004883106785026475, 'samples': 3161088, 'steps': 16463, 'loss/train': 1.4309262037277222} -11/06/2021 23:34:46 - INFO - __main__ - Step 16465: {'lr': 0.0004883090747201897, 'samples': 3161280, 'steps': 16464, 'loss/train': 1.9212692975997925} -11/06/2021 23:34:47 - INFO - __main__ - Step 16466: {'lr': 0.0004883074708303534, 'samples': 3161472, 'steps': 16465, 'loss/train': 8.428525924682617} -11/06/2021 23:34:47 - INFO - __main__ - Step 16467: {'lr': 0.0004883058668331396, 'samples': 3161664, 'steps': 16466, 'loss/train': 1.6166472434997559} -11/06/2021 23:34:48 - INFO - __main__ - Step 16468: {'lr': 0.0004883042627285488, 'samples': 3161856, 'steps': 16467, 'loss/train': 1.0819371938705444} -11/06/2021 23:34:48 - INFO - __main__ - Step 16469: {'lr': 0.0004883026585165817, 'samples': 3162048, 'steps': 16468, 'loss/train': 2.0714237689971924} -11/06/2021 23:34:49 - INFO - __main__ - Step 16470: {'lr': 0.0004883010541972392, 'samples': 3162240, 'steps': 16469, 'loss/train': 1.4929072856903076} -11/06/2021 23:34:49 - INFO - __main__ - Step 16471: {'lr': 0.0004882994497705219, 'samples': 3162432, 'steps': 16470, 'loss/train': 2.0204741954803467} -11/06/2021 23:34:49 - INFO - __main__ - Step 16472: {'lr': 0.0004882978452364305, 'samples': 3162624, 'steps': 16471, 'loss/train': 2.0556139945983887} -11/06/2021 23:34:51 - INFO - __main__ - Step 16473: {'lr': 0.0004882962405949658, 'samples': 3162816, 'steps': 16472, 'loss/train': 1.3556331396102905} -11/06/2021 23:34:51 - INFO - __main__ - Step 16474: {'lr': 0.0004882946358461285, 'samples': 3163008, 'steps': 16473, 'loss/train': 2.0677337646484375} -11/06/2021 23:34:51 - INFO - __main__ - Step 16475: {'lr': 0.0004882930309899192, 'samples': 3163200, 'steps': 16474, 'loss/train': 2.228142738342285} -11/06/2021 23:34:52 - INFO - __main__ - Step 16476: {'lr': 0.000488291426026339, 'samples': 3163392, 'steps': 16475, 'loss/train': 1.9927802085876465} -11/06/2021 23:34:52 - INFO - __main__ - Step 16477: {'lr': 0.0004882898209553881, 'samples': 3163584, 'steps': 16476, 'loss/train': 2.140395164489746} -11/06/2021 23:34:52 - INFO - __main__ - Step 16478: {'lr': 0.0004882882157770676, 'samples': 3163776, 'steps': 16477, 'loss/train': 1.4509589672088623} -11/06/2021 23:34:53 - INFO - __main__ - Step 16479: {'lr': 0.000488286610491378, 'samples': 3163968, 'steps': 16478, 'loss/train': 1.8325351476669312} -11/06/2021 23:34:54 - INFO - __main__ - Step 16480: {'lr': 0.0004882850050983203, 'samples': 3164160, 'steps': 16479, 'loss/train': 1.5992738008499146} -11/06/2021 23:34:54 - INFO - __main__ - Step 16481: {'lr': 0.0004882833995978949, 'samples': 3164352, 'steps': 16480, 'loss/train': 1.4408437013626099} -11/06/2021 23:34:54 - INFO - __main__ - Step 16482: {'lr': 0.0004882817939901027, 'samples': 3164544, 'steps': 16481, 'loss/train': 1.7016760110855103} -11/06/2021 23:34:55 - INFO - __main__ - Step 16483: {'lr': 0.0004882801882749445, 'samples': 3164736, 'steps': 16482, 'loss/train': 1.6935230493545532} -11/06/2021 23:34:56 - INFO - __main__ - Step 16484: {'lr': 0.0004882785824524209, 'samples': 3164928, 'steps': 16483, 'loss/train': 1.9659548997879028} -11/06/2021 23:34:56 - INFO - __main__ - Step 16485: {'lr': 0.0004882769765225326, 'samples': 3165120, 'steps': 16484, 'loss/train': 1.4633811712265015} -11/06/2021 23:34:57 - INFO - __main__ - Step 16486: {'lr': 0.00048827537048528035, 'samples': 3165312, 'steps': 16485, 'loss/train': 1.8877742290496826} -11/06/2021 23:34:57 - INFO - __main__ - Step 16487: {'lr': 0.00048827376434066493, 'samples': 3165504, 'steps': 16486, 'loss/train': 1.910869836807251} -11/06/2021 23:34:57 - INFO - __main__ - Step 16488: {'lr': 0.0004882721580886871, 'samples': 3165696, 'steps': 16487, 'loss/train': 1.7500070333480835} -11/06/2021 23:34:58 - INFO - __main__ - Step 16489: {'lr': 0.00048827055172934744, 'samples': 3165888, 'steps': 16488, 'loss/train': 1.7136714458465576} -11/06/2021 23:34:59 - INFO - __main__ - Step 16490: {'lr': 0.0004882689452626468, 'samples': 3166080, 'steps': 16489, 'loss/train': 1.9867051839828491} -11/06/2021 23:34:59 - INFO - __main__ - Step 16491: {'lr': 0.00048826733868858577, 'samples': 3166272, 'steps': 16490, 'loss/train': 0.20762591063976288} -11/06/2021 23:34:59 - INFO - __main__ - Step 16492: {'lr': 0.00048826573200716516, 'samples': 3166464, 'steps': 16491, 'loss/train': 1.4593125581741333} -11/06/2021 23:35:00 - INFO - __main__ - Step 16493: {'lr': 0.0004882641252183857, 'samples': 3166656, 'steps': 16492, 'loss/train': 1.8210448026657104} -11/06/2021 23:35:00 - INFO - __main__ - Step 16494: {'lr': 0.0004882625183222481, 'samples': 3166848, 'steps': 16493, 'loss/train': 1.7978031635284424} -11/06/2021 23:35:01 - INFO - __main__ - Step 16495: {'lr': 0.00048826091131875317, 'samples': 3167040, 'steps': 16494, 'loss/train': 1.5826845169067383} -11/06/2021 23:35:02 - INFO - __main__ - Step 16496: {'lr': 0.00048825930420790144, 'samples': 3167232, 'steps': 16495, 'loss/train': 1.638830304145813} -11/06/2021 23:35:02 - INFO - __main__ - Step 16497: {'lr': 0.0004882576969896938, 'samples': 3167424, 'steps': 16496, 'loss/train': 1.9118237495422363} -11/06/2021 23:35:02 - INFO - __main__ - Step 16498: {'lr': 0.00048825608966413095, 'samples': 3167616, 'steps': 16497, 'loss/train': 1.3743228912353516} -11/06/2021 23:35:03 - INFO - __main__ - Step 16499: {'lr': 0.0004882544822312135, 'samples': 3167808, 'steps': 16498, 'loss/train': 1.554957628250122} -11/06/2021 23:35:04 - INFO - __main__ - Step 16500: {'lr': 0.00048825287469094224, 'samples': 3168000, 'steps': 16499, 'loss/train': 2.003634452819824} -11/06/2021 23:35:04 - INFO - __main__ - Step 16501: {'lr': 0.000488251267043318, 'samples': 3168192, 'steps': 16500, 'loss/train': 1.7607531547546387} -11/06/2021 23:35:04 - INFO - __main__ - Step 16502: {'lr': 0.00048824965928834143, 'samples': 3168384, 'steps': 16501, 'loss/train': 1.72561776638031} -11/06/2021 23:35:05 - INFO - __main__ - Step 16503: {'lr': 0.0004882480514260131, 'samples': 3168576, 'steps': 16502, 'loss/train': 1.7174887657165527} -11/06/2021 23:35:05 - INFO - __main__ - Step 16504: {'lr': 0.000488246443456334, 'samples': 3168768, 'steps': 16503, 'loss/train': 1.427158236503601} -11/06/2021 23:35:06 - INFO - __main__ - Step 16505: {'lr': 0.0004882448353793048, 'samples': 3168960, 'steps': 16504, 'loss/train': 1.661441445350647} -11/06/2021 23:35:07 - INFO - __main__ - Step 16506: {'lr': 0.000488243227194926, 'samples': 3169152, 'steps': 16505, 'loss/train': 1.6269912719726562} -11/06/2021 23:35:07 - INFO - __main__ - Step 16507: {'lr': 0.00048824161890319854, 'samples': 3169344, 'steps': 16506, 'loss/train': 1.6323604583740234} -11/06/2021 23:35:07 - INFO - __main__ - Step 16508: {'lr': 0.00048824001050412304, 'samples': 3169536, 'steps': 16507, 'loss/train': 1.1805651187896729} -11/06/2021 23:35:08 - INFO - __main__ - Step 16509: {'lr': 0.0004882384019977003, 'samples': 3169728, 'steps': 16508, 'loss/train': 1.7466378211975098} -11/06/2021 23:35:09 - INFO - __main__ - Step 16510: {'lr': 0.000488236793383931, 'samples': 3169920, 'steps': 16509, 'loss/train': 1.939573049545288} -11/06/2021 23:35:09 - INFO - __main__ - Step 16511: {'lr': 0.00048823518466281586, 'samples': 3170112, 'steps': 16510, 'loss/train': 1.5818568468093872} -11/06/2021 23:35:09 - INFO - __main__ - Step 16512: {'lr': 0.0004882335758343557, 'samples': 3170304, 'steps': 16511, 'loss/train': 1.3444141149520874} -11/06/2021 23:35:10 - INFO - __main__ - Step 16513: {'lr': 0.0004882319668985511, 'samples': 3170496, 'steps': 16512, 'loss/train': 1.5488812923431396} -11/06/2021 23:35:10 - INFO - __main__ - Step 16514: {'lr': 0.00048823035785540284, 'samples': 3170688, 'steps': 16513, 'loss/train': 1.5068031549453735} -11/06/2021 23:35:10 - INFO - __main__ - Step 16515: {'lr': 0.0004882287487049117, 'samples': 3170880, 'steps': 16514, 'loss/train': 2.055966854095459} -11/06/2021 23:35:11 - INFO - __main__ - Step 16516: {'lr': 0.00048822713944707833, 'samples': 3171072, 'steps': 16515, 'loss/train': 1.9989991188049316} -11/06/2021 23:35:12 - INFO - __main__ - Step 16517: {'lr': 0.0004882255300819035, 'samples': 3171264, 'steps': 16516, 'loss/train': 1.4609509706497192} -11/06/2021 23:35:12 - INFO - __main__ - Step 16518: {'lr': 0.0004882239206093879, 'samples': 3171456, 'steps': 16517, 'loss/train': 1.803931713104248} -11/06/2021 23:35:12 - INFO - __main__ - Step 16519: {'lr': 0.0004882223110295323, 'samples': 3171648, 'steps': 16518, 'loss/train': 1.8688184022903442} -11/06/2021 23:35:13 - INFO - __main__ - Step 16520: {'lr': 0.00048822070134233743, 'samples': 3171840, 'steps': 16519, 'loss/train': 2.412503719329834} -11/06/2021 23:35:14 - INFO - __main__ - Step 16521: {'lr': 0.000488219091547804, 'samples': 3172032, 'steps': 16520, 'loss/train': 1.5332022905349731} -11/06/2021 23:35:14 - INFO - __main__ - Step 16522: {'lr': 0.0004882174816459326, 'samples': 3172224, 'steps': 16521, 'loss/train': 1.0638723373413086} -11/06/2021 23:35:15 - INFO - __main__ - Step 16523: {'lr': 0.0004882158716367242, 'samples': 3172416, 'steps': 16522, 'loss/train': 1.8770873546600342} -11/06/2021 23:35:15 - INFO - __main__ - Step 16524: {'lr': 0.0004882142615201793, 'samples': 3172608, 'steps': 16523, 'loss/train': 1.3749724626541138} -11/06/2021 23:35:15 - INFO - __main__ - Step 16525: {'lr': 0.00048821265129629887, 'samples': 3172800, 'steps': 16524, 'loss/train': 1.3542416095733643} -11/06/2021 23:35:16 - INFO - __main__ - Step 16526: {'lr': 0.0004882110409650834, 'samples': 3172992, 'steps': 16525, 'loss/train': 1.317636489868164} -11/06/2021 23:35:17 - INFO - __main__ - Step 16527: {'lr': 0.0004882094305265338, 'samples': 3173184, 'steps': 16526, 'loss/train': 1.8596268892288208} -11/06/2021 23:35:17 - INFO - __main__ - Step 16528: {'lr': 0.00048820781998065054, 'samples': 3173376, 'steps': 16527, 'loss/train': 1.1366714239120483} -11/06/2021 23:35:17 - INFO - __main__ - Step 16529: {'lr': 0.00048820620932743465, 'samples': 3173568, 'steps': 16528, 'loss/train': 1.765393853187561} -11/06/2021 23:35:18 - INFO - __main__ - Step 16530: {'lr': 0.0004882045985668867, 'samples': 3173760, 'steps': 16529, 'loss/train': 1.457262635231018} -11/06/2021 23:35:19 - INFO - __main__ - Step 16531: {'lr': 0.0004882029876990074, 'samples': 3173952, 'steps': 16530, 'loss/train': 1.3767226934432983} -11/06/2021 23:35:19 - INFO - __main__ - Step 16532: {'lr': 0.0004882013767237975, 'samples': 3174144, 'steps': 16531, 'loss/train': 1.6697412729263306} -11/06/2021 23:35:20 - INFO - __main__ - Step 16533: {'lr': 0.0004881997656412578, 'samples': 3174336, 'steps': 16532, 'loss/train': 1.7419915199279785} -11/06/2021 23:35:20 - INFO - __main__ - Step 16534: {'lr': 0.0004881981544513889, 'samples': 3174528, 'steps': 16533, 'loss/train': 1.6078473329544067} -11/06/2021 23:35:20 - INFO - __main__ - Step 16535: {'lr': 0.0004881965431541916, 'samples': 3174720, 'steps': 16534, 'loss/train': 1.4096086025238037} -11/06/2021 23:35:21 - INFO - __main__ - Step 16536: {'lr': 0.0004881949317496667, 'samples': 3174912, 'steps': 16535, 'loss/train': 1.502119541168213} -11/06/2021 23:35:22 - INFO - __main__ - Step 16537: {'lr': 0.0004881933202378147, 'samples': 3175104, 'steps': 16536, 'loss/train': 1.3648459911346436} -11/06/2021 23:35:22 - INFO - __main__ - Step 16538: {'lr': 0.0004881917086186365, 'samples': 3175296, 'steps': 16537, 'loss/train': 2.249582290649414} -11/06/2021 23:35:22 - INFO - __main__ - Step 16539: {'lr': 0.0004881900968921328, 'samples': 3175488, 'steps': 16538, 'loss/train': 1.8910950422286987} -11/06/2021 23:35:23 - INFO - __main__ - Step 16540: {'lr': 0.00048818848505830436, 'samples': 3175680, 'steps': 16539, 'loss/train': 0.856475293636322} -11/06/2021 23:35:24 - INFO - __main__ - Step 16541: {'lr': 0.0004881868731171518, 'samples': 3175872, 'steps': 16540, 'loss/train': 1.7443568706512451} -11/06/2021 23:35:24 - INFO - __main__ - Step 16542: {'lr': 0.000488185261068676, 'samples': 3176064, 'steps': 16541, 'loss/train': 1.7981657981872559} -11/06/2021 23:35:25 - INFO - __main__ - Step 16543: {'lr': 0.0004881836489128776, 'samples': 3176256, 'steps': 16542, 'loss/train': 1.6968001127243042} -11/06/2021 23:35:25 - INFO - __main__ - Step 16544: {'lr': 0.00048818203664975727, 'samples': 3176448, 'steps': 16543, 'loss/train': 1.6674453020095825} -11/06/2021 23:35:25 - INFO - __main__ - Step 16545: {'lr': 0.00048818042427931573, 'samples': 3176640, 'steps': 16544, 'loss/train': 1.6024539470672607} -11/06/2021 23:35:26 - INFO - __main__ - Step 16546: {'lr': 0.00048817881180155385, 'samples': 3176832, 'steps': 16545, 'loss/train': 1.7665468454360962} -11/06/2021 23:35:27 - INFO - __main__ - Step 16547: {'lr': 0.0004881771992164722, 'samples': 3177024, 'steps': 16546, 'loss/train': 1.7142109870910645} -11/06/2021 23:35:27 - INFO - __main__ - Step 16548: {'lr': 0.0004881755865240717, 'samples': 3177216, 'steps': 16547, 'loss/train': 1.6377567052841187} -11/06/2021 23:35:27 - INFO - __main__ - Step 16549: {'lr': 0.0004881739737243528, 'samples': 3177408, 'steps': 16548, 'loss/train': 1.363764762878418} -11/06/2021 23:35:28 - INFO - __main__ - Step 16550: {'lr': 0.00048817236081731655, 'samples': 3177600, 'steps': 16549, 'loss/train': 1.6557155847549438} -11/06/2021 23:35:28 - INFO - __main__ - Step 16551: {'lr': 0.0004881707478029634, 'samples': 3177792, 'steps': 16550, 'loss/train': 1.6136027574539185} -11/06/2021 23:35:29 - INFO - __main__ - Step 16552: {'lr': 0.0004881691346812942, 'samples': 3177984, 'steps': 16551, 'loss/train': 1.5945550203323364} -11/06/2021 23:35:30 - INFO - __main__ - Step 16553: {'lr': 0.0004881675214523097, 'samples': 3178176, 'steps': 16552, 'loss/train': 1.704119086265564} -11/06/2021 23:35:30 - INFO - __main__ - Step 16554: {'lr': 0.00048816590811601054, 'samples': 3178368, 'steps': 16553, 'loss/train': 1.5714160203933716} -11/06/2021 23:35:30 - INFO - __main__ - Step 16555: {'lr': 0.0004881642946723975, 'samples': 3178560, 'steps': 16554, 'loss/train': 1.7432516813278198} -11/06/2021 23:35:31 - INFO - __main__ - Step 16556: {'lr': 0.00048816268112147134, 'samples': 3178752, 'steps': 16555, 'loss/train': 0.19290374219417572} -11/06/2021 23:35:32 - INFO - __main__ - Step 16557: {'lr': 0.00048816106746323273, 'samples': 3178944, 'steps': 16556, 'loss/train': 1.346990942955017} -11/06/2021 23:35:32 - INFO - __main__ - Step 16558: {'lr': 0.00048815945369768245, 'samples': 3179136, 'steps': 16557, 'loss/train': 1.5871580839157104} -11/06/2021 23:35:32 - INFO - __main__ - Step 16559: {'lr': 0.00048815783982482115, 'samples': 3179328, 'steps': 16558, 'loss/train': 1.4788908958435059} -11/06/2021 23:35:33 - INFO - __main__ - Step 16560: {'lr': 0.0004881562258446496, 'samples': 3179520, 'steps': 16559, 'loss/train': 1.6638139486312866} -11/06/2021 23:35:33 - INFO - __main__ - Step 16561: {'lr': 0.00048815461175716855, 'samples': 3179712, 'steps': 16560, 'loss/train': 1.913263201713562} -11/06/2021 23:35:35 - INFO - __main__ - Step 16562: {'lr': 0.00048815299756237873, 'samples': 3179904, 'steps': 16561, 'loss/train': 1.9439252614974976} -11/06/2021 23:35:35 - INFO - __main__ - Step 16563: {'lr': 0.0004881513832602808, 'samples': 3180096, 'steps': 16562, 'loss/train': 1.476514458656311} -11/06/2021 23:35:35 - INFO - __main__ - Step 16564: {'lr': 0.0004881497688508756, 'samples': 3180288, 'steps': 16563, 'loss/train': 1.613339900970459} -11/06/2021 23:35:36 - INFO - __main__ - Step 16565: {'lr': 0.0004881481543341637, 'samples': 3180480, 'steps': 16564, 'loss/train': 1.7296475172042847} -11/06/2021 23:35:36 - INFO - __main__ - Step 16566: {'lr': 0.000488146539710146, 'samples': 3180672, 'steps': 16565, 'loss/train': 1.3595619201660156} -11/06/2021 23:35:36 - INFO - __main__ - Step 16567: {'lr': 0.00048814492497882306, 'samples': 3180864, 'steps': 16566, 'loss/train': 1.9055120944976807} -11/06/2021 23:35:38 - INFO - __main__ - Step 16568: {'lr': 0.00048814331014019577, 'samples': 3181056, 'steps': 16567, 'loss/train': 1.4055638313293457} -11/06/2021 23:35:38 - INFO - __main__ - Step 16569: {'lr': 0.0004881416951942647, 'samples': 3181248, 'steps': 16568, 'loss/train': 1.8955738544464111} -11/06/2021 23:35:38 - INFO - __main__ - Step 16570: {'lr': 0.0004881400801410307, 'samples': 3181440, 'steps': 16569, 'loss/train': 1.4749326705932617} -11/06/2021 23:35:39 - INFO - __main__ - Step 16571: {'lr': 0.0004881384649804945, 'samples': 3181632, 'steps': 16570, 'loss/train': 1.6895521879196167} -11/06/2021 23:35:39 - INFO - __main__ - Step 16572: {'lr': 0.0004881368497126567, 'samples': 3181824, 'steps': 16571, 'loss/train': 1.8323323726654053} -11/06/2021 23:35:40 - INFO - __main__ - Step 16573: {'lr': 0.00048813523433751814, 'samples': 3182016, 'steps': 16572, 'loss/train': 1.8884717226028442} -11/06/2021 23:35:40 - INFO - __main__ - Step 16574: {'lr': 0.00048813361885507956, 'samples': 3182208, 'steps': 16573, 'loss/train': 1.50578773021698} -11/06/2021 23:35:41 - INFO - __main__ - Step 16575: {'lr': 0.00048813200326534156, 'samples': 3182400, 'steps': 16574, 'loss/train': 1.8170469999313354} -11/06/2021 23:35:41 - INFO - __main__ - Step 16576: {'lr': 0.00048813038756830506, 'samples': 3182592, 'steps': 16575, 'loss/train': 1.7620586156845093} -11/06/2021 23:35:41 - INFO - __main__ - Step 16577: {'lr': 0.00048812877176397066, 'samples': 3182784, 'steps': 16576, 'loss/train': 1.3254033327102661} -11/06/2021 23:35:42 - INFO - __main__ - Step 16578: {'lr': 0.00048812715585233905, 'samples': 3182976, 'steps': 16577, 'loss/train': 1.8124728202819824} -11/06/2021 23:35:43 - INFO - __main__ - Step 16579: {'lr': 0.000488125539833411, 'samples': 3183168, 'steps': 16578, 'loss/train': 1.7202956676483154} -11/06/2021 23:35:44 - INFO - __main__ - Step 16580: {'lr': 0.0004881239237071873, 'samples': 3183360, 'steps': 16579, 'loss/train': 1.9533145427703857} -11/06/2021 23:35:44 - INFO - __main__ - Step 16581: {'lr': 0.0004881223074736687, 'samples': 3183552, 'steps': 16580, 'loss/train': 1.7170475721359253} -11/06/2021 23:35:44 - INFO - __main__ - Step 16582: {'lr': 0.00048812069113285573, 'samples': 3183744, 'steps': 16581, 'loss/train': 1.8036795854568481} -11/06/2021 23:35:45 - INFO - __main__ - Step 16583: {'lr': 0.00048811907468474934, 'samples': 3183936, 'steps': 16582, 'loss/train': 1.9189525842666626} -11/06/2021 23:35:46 - INFO - __main__ - Step 16584: {'lr': 0.00048811745812935015, 'samples': 3184128, 'steps': 16583, 'loss/train': 1.163478970527649} -11/06/2021 23:35:46 - INFO - __main__ - Step 16585: {'lr': 0.00048811584146665895, 'samples': 3184320, 'steps': 16584, 'loss/train': 2.10164213180542} -11/06/2021 23:35:47 - INFO - __main__ - Step 16586: {'lr': 0.0004881142246966763, 'samples': 3184512, 'steps': 16585, 'loss/train': 2.115177631378174} -11/06/2021 23:35:47 - INFO - __main__ - Step 16587: {'lr': 0.00048811260781940317, 'samples': 3184704, 'steps': 16586, 'loss/train': 1.7502573728561401} -11/06/2021 23:35:47 - INFO - __main__ - Step 16588: {'lr': 0.00048811099083484016, 'samples': 3184896, 'steps': 16587, 'loss/train': 2.0302722454071045} -11/06/2021 23:35:48 - INFO - __main__ - Step 16589: {'lr': 0.000488109373742988, 'samples': 3185088, 'steps': 16588, 'loss/train': 1.9502590894699097} -11/06/2021 23:35:49 - INFO - __main__ - Step 16590: {'lr': 0.0004881077565438474, 'samples': 3185280, 'steps': 16589, 'loss/train': 2.074025869369507} -11/06/2021 23:35:49 - INFO - __main__ - Step 16591: {'lr': 0.0004881061392374192, 'samples': 3185472, 'steps': 16590, 'loss/train': 1.1119537353515625} -11/06/2021 23:35:49 - INFO - __main__ - Step 16592: {'lr': 0.000488104521823704, 'samples': 3185664, 'steps': 16591, 'loss/train': 2.0072836875915527} -11/06/2021 23:35:50 - INFO - __main__ - Step 16593: {'lr': 0.00048810290430270257, 'samples': 3185856, 'steps': 16592, 'loss/train': 1.3514482975006104} -11/06/2021 23:35:50 - INFO - __main__ - Step 16594: {'lr': 0.0004881012866744156, 'samples': 3186048, 'steps': 16593, 'loss/train': 1.91445791721344} -11/06/2021 23:35:51 - INFO - __main__ - Step 16595: {'lr': 0.00048809966893884396, 'samples': 3186240, 'steps': 16594, 'loss/train': 1.6212115287780762} -11/06/2021 23:35:52 - INFO - __main__ - Step 16596: {'lr': 0.00048809805109598813, 'samples': 3186432, 'steps': 16595, 'loss/train': 1.7508177757263184} -11/06/2021 23:35:52 - INFO - __main__ - Step 16597: {'lr': 0.0004880964331458492, 'samples': 3186624, 'steps': 16596, 'loss/train': 1.6479634046554565} -11/06/2021 23:35:52 - INFO - __main__ - Step 16598: {'lr': 0.0004880948150884276, 'samples': 3186816, 'steps': 16597, 'loss/train': 1.4154289960861206} -11/06/2021 23:35:53 - INFO - __main__ - Step 16599: {'lr': 0.00048809319692372406, 'samples': 3187008, 'steps': 16598, 'loss/train': 1.8749748468399048} -11/06/2021 23:35:53 - INFO - __main__ - Step 16600: {'lr': 0.0004880915786517395, 'samples': 3187200, 'steps': 16599, 'loss/train': 1.1239466667175293} -11/06/2021 23:35:54 - INFO - __main__ - Step 16601: {'lr': 0.00048808996027247453, 'samples': 3187392, 'steps': 16600, 'loss/train': 1.6338905096054077} -11/06/2021 23:35:55 - INFO - __main__ - Step 16602: {'lr': 0.0004880883417859299, 'samples': 3187584, 'steps': 16601, 'loss/train': 1.2137621641159058} -11/06/2021 23:35:55 - INFO - __main__ - Step 16603: {'lr': 0.0004880867231921063, 'samples': 3187776, 'steps': 16602, 'loss/train': 1.6289089918136597} -11/06/2021 23:35:55 - INFO - __main__ - Step 16604: {'lr': 0.0004880851044910045, 'samples': 3187968, 'steps': 16603, 'loss/train': 1.77559494972229} -11/06/2021 23:35:56 - INFO - __main__ - Step 16605: {'lr': 0.0004880834856826253, 'samples': 3188160, 'steps': 16604, 'loss/train': 1.5778307914733887} -11/06/2021 23:35:56 - INFO - __main__ - Step 16606: {'lr': 0.0004880818667669693, 'samples': 3188352, 'steps': 16605, 'loss/train': 1.3657011985778809} -11/06/2021 23:35:57 - INFO - __main__ - Step 16607: {'lr': 0.00048808024774403726, 'samples': 3188544, 'steps': 16606, 'loss/train': 1.502026915550232} -11/06/2021 23:35:57 - INFO - __main__ - Step 16608: {'lr': 0.00048807862861382996, 'samples': 3188736, 'steps': 16607, 'loss/train': 1.240162968635559} -11/06/2021 23:35:58 - INFO - __main__ - Step 16609: {'lr': 0.0004880770093763481, 'samples': 3188928, 'steps': 16608, 'loss/train': 1.8014652729034424} -11/06/2021 23:35:58 - INFO - __main__ - Step 16610: {'lr': 0.0004880753900315924, 'samples': 3189120, 'steps': 16609, 'loss/train': 1.908936619758606} -11/06/2021 23:35:59 - INFO - __main__ - Step 16611: {'lr': 0.00048807377057956365, 'samples': 3189312, 'steps': 16610, 'loss/train': 1.7892169952392578} -11/06/2021 23:35:59 - INFO - __main__ - Step 16612: {'lr': 0.00048807215102026247, 'samples': 3189504, 'steps': 16611, 'loss/train': 1.5934950113296509} -11/06/2021 23:36:00 - INFO - __main__ - Step 16613: {'lr': 0.00048807053135368973, 'samples': 3189696, 'steps': 16612, 'loss/train': 2.044344902038574} -11/06/2021 23:36:00 - INFO - __main__ - Step 16614: {'lr': 0.00048806891157984604, 'samples': 3189888, 'steps': 16613, 'loss/train': 2.3011348247528076} -11/06/2021 23:36:01 - INFO - __main__ - Step 16615: {'lr': 0.0004880672916987322, 'samples': 3190080, 'steps': 16614, 'loss/train': 1.4086577892303467} -11/06/2021 23:36:01 - INFO - __main__ - Step 16616: {'lr': 0.0004880656717103489, 'samples': 3190272, 'steps': 16615, 'loss/train': 1.8714768886566162} -11/06/2021 23:36:02 - INFO - __main__ - Step 16617: {'lr': 0.0004880640516146968, 'samples': 3190464, 'steps': 16616, 'loss/train': 1.5197786092758179} -11/06/2021 23:36:02 - INFO - __main__ - Step 16618: {'lr': 0.0004880624314117768, 'samples': 3190656, 'steps': 16617, 'loss/train': 1.993930459022522} -11/06/2021 23:36:03 - INFO - __main__ - Step 16619: {'lr': 0.0004880608111015895, 'samples': 3190848, 'steps': 16618, 'loss/train': 1.221077799797058} -11/06/2021 23:36:03 - INFO - __main__ - Step 16620: {'lr': 0.00048805919068413574, 'samples': 3191040, 'steps': 16619, 'loss/train': 3.036583185195923} -11/06/2021 23:36:03 - INFO - __main__ - Step 16621: {'lr': 0.0004880575701594161, 'samples': 3191232, 'steps': 16620, 'loss/train': 6.032649040222168} -11/06/2021 23:36:04 - INFO - __main__ - Step 16622: {'lr': 0.0004880559495274315, 'samples': 3191424, 'steps': 16621, 'loss/train': 1.834834337234497} -11/06/2021 23:36:05 - INFO - __main__ - Step 16623: {'lr': 0.00048805432878818247, 'samples': 3191616, 'steps': 16622, 'loss/train': 1.6473767757415771} -11/06/2021 23:36:05 - INFO - __main__ - Step 16624: {'lr': 0.0004880527079416698, 'samples': 3191808, 'steps': 16623, 'loss/train': 2.2454183101654053} -11/06/2021 23:36:05 - INFO - __main__ - Step 16625: {'lr': 0.00048805108698789435, 'samples': 3192000, 'steps': 16624, 'loss/train': 1.9317262172698975} -11/06/2021 23:36:06 - INFO - __main__ - Step 16626: {'lr': 0.00048804946592685667, 'samples': 3192192, 'steps': 16625, 'loss/train': 1.8206801414489746} -11/06/2021 23:36:06 - INFO - __main__ - Step 16627: {'lr': 0.0004880478447585576, 'samples': 3192384, 'steps': 16626, 'loss/train': 1.9301916360855103} -11/06/2021 23:36:07 - INFO - __main__ - Step 16628: {'lr': 0.00048804622348299785, 'samples': 3192576, 'steps': 16627, 'loss/train': 1.4593732357025146} -11/06/2021 23:36:08 - INFO - __main__ - Step 16629: {'lr': 0.0004880446021001782, 'samples': 3192768, 'steps': 16628, 'loss/train': 1.5824449062347412} -11/06/2021 23:36:08 - INFO - __main__ - Step 16630: {'lr': 0.00048804298061009925, 'samples': 3192960, 'steps': 16629, 'loss/train': 1.4731026887893677} -11/06/2021 23:36:08 - INFO - __main__ - Step 16631: {'lr': 0.0004880413590127619, 'samples': 3193152, 'steps': 16630, 'loss/train': 2.0067667961120605} -11/06/2021 23:36:09 - INFO - __main__ - Step 16632: {'lr': 0.0004880397373081666, 'samples': 3193344, 'steps': 16631, 'loss/train': 1.5343999862670898} -11/06/2021 23:36:10 - INFO - __main__ - Step 16633: {'lr': 0.0004880381154963145, 'samples': 3193536, 'steps': 16632, 'loss/train': 1.626529574394226} -11/06/2021 23:36:10 - INFO - __main__ - Step 16634: {'lr': 0.0004880364935772059, 'samples': 3193728, 'steps': 16633, 'loss/train': 1.5364887714385986} -11/06/2021 23:36:10 - INFO - __main__ - Step 16635: {'lr': 0.00048803487155084184, 'samples': 3193920, 'steps': 16634, 'loss/train': 1.7955859899520874} -11/06/2021 23:36:11 - INFO - __main__ - Step 16636: {'lr': 0.00048803324941722295, 'samples': 3194112, 'steps': 16635, 'loss/train': 2.057948350906372} -11/06/2021 23:36:11 - INFO - __main__ - Step 16637: {'lr': 0.0004880316271763499, 'samples': 3194304, 'steps': 16636, 'loss/train': 1.8370440006256104} -11/06/2021 23:36:11 - INFO - __main__ - Step 16638: {'lr': 0.0004880300048282235, 'samples': 3194496, 'steps': 16637, 'loss/train': 1.8288404941558838} -11/06/2021 23:36:13 - INFO - __main__ - Step 16639: {'lr': 0.00048802838237284443, 'samples': 3194688, 'steps': 16638, 'loss/train': 2.116184949874878} -11/06/2021 23:36:13 - INFO - __main__ - Step 16640: {'lr': 0.0004880267598102135, 'samples': 3194880, 'steps': 16639, 'loss/train': 1.812418818473816} -11/06/2021 23:36:13 - INFO - __main__ - Step 16641: {'lr': 0.0004880251371403313, 'samples': 3195072, 'steps': 16640, 'loss/train': 1.6309278011322021} -11/06/2021 23:36:14 - INFO - __main__ - Step 16642: {'lr': 0.0004880235143631987, 'samples': 3195264, 'steps': 16641, 'loss/train': 1.4941754341125488} -11/06/2021 23:36:14 - INFO - __main__ - Step 16643: {'lr': 0.0004880218914788164, 'samples': 3195456, 'steps': 16642, 'loss/train': 1.2120184898376465} -11/06/2021 23:36:15 - INFO - __main__ - Step 16644: {'lr': 0.00048802026848718505, 'samples': 3195648, 'steps': 16643, 'loss/train': 2.3507211208343506} -11/06/2021 23:36:15 - INFO - __main__ - Step 16645: {'lr': 0.0004880186453883054, 'samples': 3195840, 'steps': 16644, 'loss/train': 1.6673327684402466} -11/06/2021 23:36:16 - INFO - __main__ - Step 16646: {'lr': 0.00048801702218217834, 'samples': 3196032, 'steps': 16645, 'loss/train': 0.5201470255851746} -11/06/2021 23:36:16 - INFO - __main__ - Step 16647: {'lr': 0.0004880153988688044, 'samples': 3196224, 'steps': 16646, 'loss/train': 1.4588996171951294} -11/06/2021 23:36:16 - INFO - __main__ - Step 16648: {'lr': 0.0004880137754481845, 'samples': 3196416, 'steps': 16647, 'loss/train': 1.8681379556655884} -11/06/2021 23:36:18 - INFO - __main__ - Step 16649: {'lr': 0.0004880121519203191, 'samples': 3196608, 'steps': 16648, 'loss/train': 1.4541462659835815} -11/06/2021 23:36:18 - INFO - __main__ - Step 16650: {'lr': 0.0004880105282852092, 'samples': 3196800, 'steps': 16649, 'loss/train': 1.4326448440551758} -11/06/2021 23:36:18 - INFO - __main__ - Step 16651: {'lr': 0.0004880089045428554, 'samples': 3196992, 'steps': 16650, 'loss/train': 1.7155417203903198} -11/06/2021 23:36:19 - INFO - __main__ - Step 16652: {'lr': 0.0004880072806932585, 'samples': 3197184, 'steps': 16651, 'loss/train': 1.279304027557373} -11/06/2021 23:36:19 - INFO - __main__ - Step 16653: {'lr': 0.00048800565673641917, 'samples': 3197376, 'steps': 16652, 'loss/train': 1.7802386283874512} -11/06/2021 23:36:20 - INFO - __main__ - Step 16654: {'lr': 0.0004880040326723382, 'samples': 3197568, 'steps': 16653, 'loss/train': 1.3103575706481934} -11/06/2021 23:36:20 - INFO - __main__ - Step 16655: {'lr': 0.0004880024085010162, 'samples': 3197760, 'steps': 16654, 'loss/train': 1.8908525705337524} -11/06/2021 23:36:21 - INFO - __main__ - Step 16656: {'lr': 0.00048800078422245406, 'samples': 3197952, 'steps': 16655, 'loss/train': 1.29991614818573} -11/06/2021 23:36:21 - INFO - __main__ - Step 16657: {'lr': 0.0004879991598366524, 'samples': 3198144, 'steps': 16656, 'loss/train': 1.5738615989685059} -11/06/2021 23:36:21 - INFO - __main__ - Step 16658: {'lr': 0.000487997535343612, 'samples': 3198336, 'steps': 16657, 'loss/train': 1.7001148462295532} -11/06/2021 23:36:22 - INFO - __main__ - Step 16659: {'lr': 0.0004879959107433336, 'samples': 3198528, 'steps': 16658, 'loss/train': 2.02748966217041} -11/06/2021 23:36:23 - INFO - __main__ - Step 16660: {'lr': 0.00048799428603581786, 'samples': 3198720, 'steps': 16659, 'loss/train': 1.5537936687469482} -11/06/2021 23:36:23 - INFO - __main__ - Step 16661: {'lr': 0.0004879926612210656, 'samples': 3198912, 'steps': 16660, 'loss/train': 1.3373011350631714} -11/06/2021 23:36:23 - INFO - __main__ - Step 16662: {'lr': 0.0004879910362990775, 'samples': 3199104, 'steps': 16661, 'loss/train': 1.371505856513977} -11/06/2021 23:36:24 - INFO - __main__ - Step 16663: {'lr': 0.0004879894112698544, 'samples': 3199296, 'steps': 16662, 'loss/train': 1.5822465419769287} -11/06/2021 23:36:24 - INFO - __main__ - Step 16664: {'lr': 0.0004879877861333969, 'samples': 3199488, 'steps': 16663, 'loss/train': 1.791337013244629} -11/06/2021 23:36:25 - INFO - __main__ - Step 16665: {'lr': 0.00048798616088970573, 'samples': 3199680, 'steps': 16664, 'loss/train': 1.502487063407898} -11/06/2021 23:36:26 - INFO - __main__ - Step 16666: {'lr': 0.0004879845355387817, 'samples': 3199872, 'steps': 16665, 'loss/train': 1.4889453649520874} -11/06/2021 23:36:26 - INFO - __main__ - Step 16667: {'lr': 0.00048798291008062553, 'samples': 3200064, 'steps': 16666, 'loss/train': 1.684088110923767} -11/06/2021 23:36:26 - INFO - __main__ - Step 16668: {'lr': 0.0004879812845152379, 'samples': 3200256, 'steps': 16667, 'loss/train': 1.8223564624786377} -11/06/2021 23:36:27 - INFO - __main__ - Step 16669: {'lr': 0.0004879796588426195, 'samples': 3200448, 'steps': 16668, 'loss/train': 1.8264342546463013} -11/06/2021 23:36:28 - INFO - __main__ - Step 16670: {'lr': 0.0004879780330627713, 'samples': 3200640, 'steps': 16669, 'loss/train': 1.4178427457809448} -11/06/2021 23:36:28 - INFO - __main__ - Step 16671: {'lr': 0.0004879764071756938, 'samples': 3200832, 'steps': 16670, 'loss/train': 1.6339678764343262} -11/06/2021 23:36:28 - INFO - __main__ - Step 16672: {'lr': 0.00048797478118138777, 'samples': 3201024, 'steps': 16671, 'loss/train': 1.8383632898330688} -11/06/2021 23:36:29 - INFO - __main__ - Step 16673: {'lr': 0.000487973155079854, 'samples': 3201216, 'steps': 16672, 'loss/train': 1.7812671661376953} -11/06/2021 23:36:29 - INFO - __main__ - Step 16674: {'lr': 0.0004879715288710932, 'samples': 3201408, 'steps': 16673, 'loss/train': 0.6627610325813293} -11/06/2021 23:36:30 - INFO - __main__ - Step 16675: {'lr': 0.0004879699025551061, 'samples': 3201600, 'steps': 16674, 'loss/train': 0.5288013815879822} -11/06/2021 23:36:31 - INFO - __main__ - Step 16676: {'lr': 0.0004879682761318934, 'samples': 3201792, 'steps': 16675, 'loss/train': 1.3023256063461304} -11/06/2021 23:36:31 - INFO - __main__ - Step 16677: {'lr': 0.00048796664960145596, 'samples': 3201984, 'steps': 16676, 'loss/train': 1.4314196109771729} -11/06/2021 23:36:31 - INFO - __main__ - Step 16678: {'lr': 0.00048796502296379437, 'samples': 3202176, 'steps': 16677, 'loss/train': 1.5249167680740356} -11/06/2021 23:36:32 - INFO - __main__ - Step 16679: {'lr': 0.0004879633962189094, 'samples': 3202368, 'steps': 16678, 'loss/train': 1.4833424091339111} -11/06/2021 23:36:33 - INFO - __main__ - Step 16680: {'lr': 0.0004879617693668018, 'samples': 3202560, 'steps': 16679, 'loss/train': 2.0442960262298584} -11/06/2021 23:36:33 - INFO - __main__ - Step 16681: {'lr': 0.00048796014240747227, 'samples': 3202752, 'steps': 16680, 'loss/train': 2.0574045181274414} -11/06/2021 23:36:33 - INFO - __main__ - Step 16682: {'lr': 0.0004879585153409216, 'samples': 3202944, 'steps': 16681, 'loss/train': 2.0046627521514893} -11/06/2021 23:36:34 - INFO - __main__ - Step 16683: {'lr': 0.0004879568881671505, 'samples': 3203136, 'steps': 16682, 'loss/train': 1.7298773527145386} -11/06/2021 23:36:34 - INFO - __main__ - Step 16684: {'lr': 0.0004879552608861597, 'samples': 3203328, 'steps': 16683, 'loss/train': 2.0869789123535156} -11/06/2021 23:36:35 - INFO - __main__ - Step 16685: {'lr': 0.00048795363349794996, 'samples': 3203520, 'steps': 16684, 'loss/train': 1.313889741897583} -11/06/2021 23:36:36 - INFO - __main__ - Step 16686: {'lr': 0.00048795200600252193, 'samples': 3203712, 'steps': 16685, 'loss/train': 1.5983039140701294} -11/06/2021 23:36:36 - INFO - __main__ - Step 16687: {'lr': 0.00048795037839987644, 'samples': 3203904, 'steps': 16686, 'loss/train': 1.7276376485824585} -11/06/2021 23:36:36 - INFO - __main__ - Step 16688: {'lr': 0.0004879487506900141, 'samples': 3204096, 'steps': 16687, 'loss/train': 1.1915156841278076} -11/06/2021 23:36:37 - INFO - __main__ - Step 16689: {'lr': 0.0004879471228729358, 'samples': 3204288, 'steps': 16688, 'loss/train': 1.5921833515167236} -11/06/2021 23:36:37 - INFO - __main__ - Step 16690: {'lr': 0.0004879454949486422, 'samples': 3204480, 'steps': 16689, 'loss/train': 1.0146256685256958} -11/06/2021 23:36:38 - INFO - __main__ - Step 16691: {'lr': 0.000487943866917134, 'samples': 3204672, 'steps': 16690, 'loss/train': 1.430779218673706} -11/06/2021 23:36:38 - INFO - __main__ - Step 16692: {'lr': 0.00048794223877841197, 'samples': 3204864, 'steps': 16691, 'loss/train': 1.9642324447631836} -11/06/2021 23:36:39 - INFO - __main__ - Step 16693: {'lr': 0.00048794061053247686, 'samples': 3205056, 'steps': 16692, 'loss/train': 1.744354009628296} -11/06/2021 23:36:39 - INFO - __main__ - Step 16694: {'lr': 0.0004879389821793294, 'samples': 3205248, 'steps': 16693, 'loss/train': 1.6574643850326538} -11/06/2021 23:36:39 - INFO - __main__ - Step 16695: {'lr': 0.00048793735371897027, 'samples': 3205440, 'steps': 16694, 'loss/train': 1.3107839822769165} -11/06/2021 23:36:41 - INFO - __main__ - Step 16696: {'lr': 0.00048793572515140024, 'samples': 3205632, 'steps': 16695, 'loss/train': 1.8585938215255737} -11/06/2021 23:36:41 - INFO - __main__ - Step 16697: {'lr': 0.00048793409647662, 'samples': 3205824, 'steps': 16696, 'loss/train': 1.749839186668396} -11/06/2021 23:36:41 - INFO - __main__ - Step 16698: {'lr': 0.0004879324676946304, 'samples': 3206016, 'steps': 16697, 'loss/train': 6.0391693115234375} -11/06/2021 23:36:42 - INFO - __main__ - Step 16699: {'lr': 0.0004879308388054321, 'samples': 3206208, 'steps': 16698, 'loss/train': 1.5355502367019653} -11/06/2021 23:36:42 - INFO - __main__ - Step 16700: {'lr': 0.0004879292098090258, 'samples': 3206400, 'steps': 16699, 'loss/train': 1.8935089111328125} -11/06/2021 23:36:42 - INFO - __main__ - Step 16701: {'lr': 0.00048792758070541234, 'samples': 3206592, 'steps': 16700, 'loss/train': 1.749446153640747} -11/06/2021 23:36:43 - INFO - __main__ - Step 16702: {'lr': 0.00048792595149459226, 'samples': 3206784, 'steps': 16701, 'loss/train': 5.876288890838623} -11/06/2021 23:36:44 - INFO - __main__ - Step 16703: {'lr': 0.0004879243221765665, 'samples': 3206976, 'steps': 16702, 'loss/train': 5.527763366699219} -11/06/2021 23:36:44 - INFO - __main__ - Step 16704: {'lr': 0.00048792269275133574, 'samples': 3207168, 'steps': 16703, 'loss/train': 1.829983115196228} -11/06/2021 23:36:45 - INFO - __main__ - Step 16705: {'lr': 0.0004879210632189006, 'samples': 3207360, 'steps': 16704, 'loss/train': 1.1864635944366455} -11/06/2021 23:36:45 - INFO - __main__ - Step 16706: {'lr': 0.0004879194335792619, 'samples': 3207552, 'steps': 16705, 'loss/train': 1.3388835191726685} -11/06/2021 23:36:45 - INFO - __main__ - Step 16707: {'lr': 0.0004879178038324205, 'samples': 3207744, 'steps': 16706, 'loss/train': 1.0322556495666504} -11/06/2021 23:36:46 - INFO - __main__ - Step 16708: {'lr': 0.0004879161739783769, 'samples': 3207936, 'steps': 16707, 'loss/train': 1.4637303352355957} -11/06/2021 23:36:47 - INFO - __main__ - Step 16709: {'lr': 0.00048791454401713195, 'samples': 3208128, 'steps': 16708, 'loss/train': 2.0983338356018066} -11/06/2021 23:36:47 - INFO - __main__ - Step 16710: {'lr': 0.00048791291394868644, 'samples': 3208320, 'steps': 16709, 'loss/train': 2.0529398918151855} -11/06/2021 23:36:47 - INFO - __main__ - Step 16711: {'lr': 0.000487911283773041, 'samples': 3208512, 'steps': 16710, 'loss/train': 1.6955748796463013} -11/06/2021 23:36:48 - INFO - __main__ - Step 16712: {'lr': 0.0004879096534901964, 'samples': 3208704, 'steps': 16711, 'loss/train': 1.505379319190979} -11/06/2021 23:36:49 - INFO - __main__ - Step 16713: {'lr': 0.00048790802310015336, 'samples': 3208896, 'steps': 16712, 'loss/train': 1.625261664390564} -11/06/2021 23:36:49 - INFO - __main__ - Step 16714: {'lr': 0.0004879063926029127, 'samples': 3209088, 'steps': 16713, 'loss/train': 1.708368182182312} -11/06/2021 23:36:50 - INFO - __main__ - Step 16715: {'lr': 0.00048790476199847506, 'samples': 3209280, 'steps': 16714, 'loss/train': 1.6214886903762817} -11/06/2021 23:36:50 - INFO - __main__ - Step 16716: {'lr': 0.0004879031312868412, 'samples': 3209472, 'steps': 16715, 'loss/train': 1.734784722328186} -11/06/2021 23:36:50 - INFO - __main__ - Step 16717: {'lr': 0.00048790150046801187, 'samples': 3209664, 'steps': 16716, 'loss/train': 1.8624287843704224} -11/06/2021 23:36:51 - INFO - __main__ - Step 16718: {'lr': 0.0004878998695419877, 'samples': 3209856, 'steps': 16717, 'loss/train': 1.689518690109253} -11/06/2021 23:36:52 - INFO - __main__ - Step 16719: {'lr': 0.0004878982385087697, 'samples': 3210048, 'steps': 16718, 'loss/train': 2.1184022426605225} -11/06/2021 23:36:52 - INFO - __main__ - Step 16720: {'lr': 0.0004878966073683583, 'samples': 3210240, 'steps': 16719, 'loss/train': 1.6878275871276855} -11/06/2021 23:36:52 - INFO - __main__ - Step 16721: {'lr': 0.0004878949761207544, 'samples': 3210432, 'steps': 16720, 'loss/train': 1.9824398756027222} -11/06/2021 23:36:53 - INFO - __main__ - Step 16722: {'lr': 0.0004878933447659587, 'samples': 3210624, 'steps': 16721, 'loss/train': 2.208752155303955} -11/06/2021 23:36:53 - INFO - __main__ - Step 16723: {'lr': 0.0004878917133039719, 'samples': 3210816, 'steps': 16722, 'loss/train': 1.5395011901855469} -11/06/2021 23:36:54 - INFO - __main__ - Step 16724: {'lr': 0.00048789008173479476, 'samples': 3211008, 'steps': 16723, 'loss/train': 1.7593508958816528} -11/06/2021 23:36:54 - INFO - __main__ - Step 16725: {'lr': 0.0004878884500584281, 'samples': 3211200, 'steps': 16724, 'loss/train': 1.9849613904953003} -11/06/2021 23:36:55 - INFO - __main__ - Step 16726: {'lr': 0.0004878868182748725, 'samples': 3211392, 'steps': 16725, 'loss/train': 1.6343092918395996} -11/06/2021 23:36:55 - INFO - __main__ - Step 16727: {'lr': 0.0004878851863841287, 'samples': 3211584, 'steps': 16726, 'loss/train': 1.4157750606536865} -11/06/2021 23:36:55 - INFO - __main__ - Step 16728: {'lr': 0.00048788355438619764, 'samples': 3211776, 'steps': 16727, 'loss/train': 1.9465490579605103} -11/06/2021 23:36:57 - INFO - __main__ - Step 16729: {'lr': 0.00048788192228107986, 'samples': 3211968, 'steps': 16728, 'loss/train': 1.3417645692825317} -11/06/2021 23:36:57 - INFO - __main__ - Step 16730: {'lr': 0.00048788029006877623, 'samples': 3212160, 'steps': 16729, 'loss/train': 1.5599322319030762} -11/06/2021 23:36:57 - INFO - __main__ - Step 16731: {'lr': 0.0004878786577492873, 'samples': 3212352, 'steps': 16730, 'loss/train': 2.0975825786590576} -11/06/2021 23:36:58 - INFO - __main__ - Step 16732: {'lr': 0.00048787702532261396, 'samples': 3212544, 'steps': 16731, 'loss/train': 1.131968379020691} -11/06/2021 23:36:58 - INFO - __main__ - Step 16733: {'lr': 0.0004878753927887569, 'samples': 3212736, 'steps': 16732, 'loss/train': 1.7023571729660034} -11/06/2021 23:36:59 - INFO - __main__ - Step 16734: {'lr': 0.0004878737601477169, 'samples': 3212928, 'steps': 16733, 'loss/train': 1.4870761632919312} -11/06/2021 23:36:59 - INFO - __main__ - Step 16735: {'lr': 0.0004878721273994946, 'samples': 3213120, 'steps': 16734, 'loss/train': 1.8174546957015991} -11/06/2021 23:37:00 - INFO - __main__ - Step 16736: {'lr': 0.00048787049454409085, 'samples': 3213312, 'steps': 16735, 'loss/train': 1.6233512163162231} -11/06/2021 23:37:00 - INFO - __main__ - Step 16737: {'lr': 0.0004878688615815063, 'samples': 3213504, 'steps': 16736, 'loss/train': 1.541832447052002} -11/06/2021 23:37:00 - INFO - __main__ - Step 16738: {'lr': 0.0004878672285117417, 'samples': 3213696, 'steps': 16737, 'loss/train': 1.9334702491760254} -11/06/2021 23:37:01 - INFO - __main__ - Step 16739: {'lr': 0.0004878655953347978, 'samples': 3213888, 'steps': 16738, 'loss/train': 0.17051845788955688} -11/06/2021 23:37:02 - INFO - __main__ - Step 16740: {'lr': 0.0004878639620506753, 'samples': 3214080, 'steps': 16739, 'loss/train': 1.7930675745010376} -11/06/2021 23:37:02 - INFO - __main__ - Step 16741: {'lr': 0.00048786232865937504, 'samples': 3214272, 'steps': 16740, 'loss/train': 1.6320091485977173} -11/06/2021 23:37:02 - INFO - __main__ - Step 16742: {'lr': 0.0004878606951608976, 'samples': 3214464, 'steps': 16741, 'loss/train': 2.05916428565979} -11/06/2021 23:37:03 - INFO - __main__ - Step 16743: {'lr': 0.00048785906155524386, 'samples': 3214656, 'steps': 16742, 'loss/train': 1.2321640253067017} -11/06/2021 23:37:05 - INFO - __main__ - Step 16744: {'lr': 0.0004878574278424145, 'samples': 3214848, 'steps': 16743, 'loss/train': 1.7712355852127075} -11/06/2021 23:37:05 - INFO - __main__ - Step 16745: {'lr': 0.0004878557940224102, 'samples': 3215040, 'steps': 16744, 'loss/train': 1.3392685651779175} -11/06/2021 23:37:05 - INFO - __main__ - Step 16746: {'lr': 0.0004878541600952318, 'samples': 3215232, 'steps': 16745, 'loss/train': 1.2699354887008667} -11/06/2021 23:37:06 - INFO - __main__ - Step 16747: {'lr': 0.00048785252606087996, 'samples': 3215424, 'steps': 16746, 'loss/train': 1.778057336807251} -11/06/2021 23:37:06 - INFO - __main__ - Step 16748: {'lr': 0.0004878508919193555, 'samples': 3215616, 'steps': 16747, 'loss/train': 1.7373347282409668} -11/06/2021 23:37:06 - INFO - __main__ - Step 16749: {'lr': 0.000487849257670659, 'samples': 3215808, 'steps': 16748, 'loss/train': 1.591823935508728} -11/06/2021 23:37:07 - INFO - __main__ - Step 16750: {'lr': 0.0004878476233147914, 'samples': 3216000, 'steps': 16749, 'loss/train': 1.612733006477356} -11/06/2021 23:37:08 - INFO - __main__ - Step 16751: {'lr': 0.00048784598885175324, 'samples': 3216192, 'steps': 16750, 'loss/train': 1.5317606925964355} -11/06/2021 23:37:08 - INFO - __main__ - Step 16752: {'lr': 0.00048784435428154537, 'samples': 3216384, 'steps': 16751, 'loss/train': 1.491845965385437} -11/06/2021 23:37:08 - INFO - __main__ - Step 16753: {'lr': 0.0004878427196041686, 'samples': 3216576, 'steps': 16752, 'loss/train': 1.9473744630813599} -11/06/2021 23:37:09 - INFO - __main__ - Step 16754: {'lr': 0.00048784108481962347, 'samples': 3216768, 'steps': 16753, 'loss/train': 1.4702725410461426} -11/06/2021 23:37:09 - INFO - __main__ - Step 16755: {'lr': 0.00048783944992791085, 'samples': 3216960, 'steps': 16754, 'loss/train': 1.2084376811981201} -11/06/2021 23:37:10 - INFO - __main__ - Step 16756: {'lr': 0.00048783781492903145, 'samples': 3217152, 'steps': 16755, 'loss/train': 1.8387744426727295} -11/06/2021 23:37:11 - INFO - __main__ - Step 16757: {'lr': 0.00048783617982298594, 'samples': 3217344, 'steps': 16756, 'loss/train': 1.6829814910888672} -11/06/2021 23:37:11 - INFO - __main__ - Step 16758: {'lr': 0.00048783454460977517, 'samples': 3217536, 'steps': 16757, 'loss/train': 1.8421169519424438} -11/06/2021 23:37:11 - INFO - __main__ - Step 16759: {'lr': 0.00048783290928939985, 'samples': 3217728, 'steps': 16758, 'loss/train': 1.8196167945861816} -11/06/2021 23:37:12 - INFO - __main__ - Step 16760: {'lr': 0.00048783127386186064, 'samples': 3217920, 'steps': 16759, 'loss/train': 2.0818989276885986} -11/06/2021 23:37:12 - INFO - __main__ - Step 16761: {'lr': 0.00048782963832715834, 'samples': 3218112, 'steps': 16760, 'loss/train': 1.8237532377243042} -11/06/2021 23:37:13 - INFO - __main__ - Step 16762: {'lr': 0.0004878280026852937, 'samples': 3218304, 'steps': 16761, 'loss/train': 1.4099204540252686} -11/06/2021 23:37:14 - INFO - __main__ - Step 16763: {'lr': 0.00048782636693626736, 'samples': 3218496, 'steps': 16762, 'loss/train': 1.4822304248809814} -11/06/2021 23:37:14 - INFO - __main__ - Step 16764: {'lr': 0.0004878247310800802, 'samples': 3218688, 'steps': 16763, 'loss/train': 2.277588367462158} -11/06/2021 23:37:14 - INFO - __main__ - Step 16765: {'lr': 0.0004878230951167328, 'samples': 3218880, 'steps': 16764, 'loss/train': 1.6301047801971436} -11/06/2021 23:37:15 - INFO - __main__ - Step 16766: {'lr': 0.0004878214590462261, 'samples': 3219072, 'steps': 16765, 'loss/train': 1.8547323942184448} -11/06/2021 23:37:15 - INFO - __main__ - Step 16767: {'lr': 0.0004878198228685607, 'samples': 3219264, 'steps': 16766, 'loss/train': 0.8852767944335938} -11/06/2021 23:37:16 - INFO - __main__ - Step 16768: {'lr': 0.00048781818658373734, 'samples': 3219456, 'steps': 16767, 'loss/train': 1.3451430797576904} -11/06/2021 23:37:16 - INFO - __main__ - Step 16769: {'lr': 0.00048781655019175676, 'samples': 3219648, 'steps': 16768, 'loss/train': 2.1409761905670166} -11/06/2021 23:37:17 - INFO - __main__ - Step 16770: {'lr': 0.00048781491369261965, 'samples': 3219840, 'steps': 16769, 'loss/train': 1.503929615020752} -11/06/2021 23:37:17 - INFO - __main__ - Step 16771: {'lr': 0.00048781327708632695, 'samples': 3220032, 'steps': 16770, 'loss/train': 1.9142979383468628} -11/06/2021 23:37:17 - INFO - __main__ - Step 16772: {'lr': 0.0004878116403728792, 'samples': 3220224, 'steps': 16771, 'loss/train': 1.3144738674163818} -11/06/2021 23:37:19 - INFO - __main__ - Step 16773: {'lr': 0.0004878100035522771, 'samples': 3220416, 'steps': 16772, 'loss/train': 1.3985767364501953} -11/06/2021 23:37:19 - INFO - __main__ - Step 16774: {'lr': 0.00048780836662452154, 'samples': 3220608, 'steps': 16773, 'loss/train': 1.2412461042404175} -11/06/2021 23:37:19 - INFO - __main__ - Step 16775: {'lr': 0.00048780672958961325, 'samples': 3220800, 'steps': 16774, 'loss/train': 1.7060500383377075} -11/06/2021 23:37:20 - INFO - __main__ - Step 16776: {'lr': 0.0004878050924475529, 'samples': 3220992, 'steps': 16775, 'loss/train': 1.980871558189392} -11/06/2021 23:37:20 - INFO - __main__ - Step 16777: {'lr': 0.00048780345519834124, 'samples': 3221184, 'steps': 16776, 'loss/train': 1.8724604845046997} -11/06/2021 23:37:21 - INFO - __main__ - Step 16778: {'lr': 0.000487801817841979, 'samples': 3221376, 'steps': 16777, 'loss/train': 0.38344258069992065} -11/06/2021 23:37:21 - INFO - __main__ - Step 16779: {'lr': 0.0004878001803784669, 'samples': 3221568, 'steps': 16778, 'loss/train': 1.6661590337753296} -11/06/2021 23:37:22 - INFO - __main__ - Step 16780: {'lr': 0.00048779854280780576, 'samples': 3221760, 'steps': 16779, 'loss/train': 2.1896467208862305} -11/06/2021 23:37:22 - INFO - __main__ - Step 16781: {'lr': 0.00048779690512999627, 'samples': 3221952, 'steps': 16780, 'loss/train': 1.5965747833251953} -11/06/2021 23:37:22 - INFO - __main__ - Step 16782: {'lr': 0.0004877952673450391, 'samples': 3222144, 'steps': 16781, 'loss/train': 1.6310534477233887} -11/06/2021 23:37:23 - INFO - __main__ - Step 16783: {'lr': 0.0004877936294529351, 'samples': 3222336, 'steps': 16782, 'loss/train': 2.207812786102295} -11/06/2021 23:37:24 - INFO - __main__ - Step 16784: {'lr': 0.00048779199145368494, 'samples': 3222528, 'steps': 16783, 'loss/train': 1.5550755262374878} -11/06/2021 23:37:24 - INFO - __main__ - Step 16785: {'lr': 0.0004877903533472894, 'samples': 3222720, 'steps': 16784, 'loss/train': 1.640083909034729} -11/06/2021 23:37:24 - INFO - __main__ - Step 16786: {'lr': 0.0004877887151337492, 'samples': 3222912, 'steps': 16785, 'loss/train': 1.9522141218185425} -11/06/2021 23:37:25 - INFO - __main__ - Step 16787: {'lr': 0.0004877870768130651, 'samples': 3223104, 'steps': 16786, 'loss/train': 1.743882417678833} -11/06/2021 23:37:26 - INFO - __main__ - Step 16788: {'lr': 0.0004877854383852377, 'samples': 3223296, 'steps': 16787, 'loss/train': 1.766150712966919} -11/06/2021 23:37:26 - INFO - __main__ - Step 16789: {'lr': 0.000487783799850268, 'samples': 3223488, 'steps': 16788, 'loss/train': 2.058748960494995} -11/06/2021 23:37:27 - INFO - __main__ - Step 16790: {'lr': 0.00048778216120815644, 'samples': 3223680, 'steps': 16789, 'loss/train': 1.553648829460144} -11/06/2021 23:37:27 - INFO - __main__ - Step 16791: {'lr': 0.00048778052245890404, 'samples': 3223872, 'steps': 16790, 'loss/train': 1.9870336055755615} -11/06/2021 23:37:27 - INFO - __main__ - Step 16792: {'lr': 0.0004877788836025113, 'samples': 3224064, 'steps': 16791, 'loss/train': 1.8651750087738037} -11/06/2021 23:37:28 - INFO - __main__ - Step 16793: {'lr': 0.0004877772446389791, 'samples': 3224256, 'steps': 16792, 'loss/train': 2.0042312145233154} -11/06/2021 23:37:29 - INFO - __main__ - Step 16794: {'lr': 0.0004877756055683082, 'samples': 3224448, 'steps': 16793, 'loss/train': 1.699658989906311} -11/06/2021 23:37:29 - INFO - __main__ - Step 16795: {'lr': 0.0004877739663904992, 'samples': 3224640, 'steps': 16794, 'loss/train': 1.4867655038833618} -11/06/2021 23:37:29 - INFO - __main__ - Step 16796: {'lr': 0.00048777232710555296, 'samples': 3224832, 'steps': 16795, 'loss/train': 0.9855947494506836} -11/06/2021 23:37:30 - INFO - __main__ - Step 16797: {'lr': 0.0004877706877134702, 'samples': 3225024, 'steps': 16796, 'loss/train': 1.5652852058410645} -11/06/2021 23:37:30 - INFO - __main__ - Step 16798: {'lr': 0.0004877690482142516, 'samples': 3225216, 'steps': 16797, 'loss/train': 1.4271130561828613} -11/06/2021 23:37:31 - INFO - __main__ - Step 16799: {'lr': 0.0004877674086078979, 'samples': 3225408, 'steps': 16798, 'loss/train': 1.6108903884887695} -11/06/2021 23:37:32 - INFO - __main__ - Step 16800: {'lr': 0.0004877657688944099, 'samples': 3225600, 'steps': 16799, 'loss/train': 1.6870945692062378} -11/06/2021 23:37:32 - INFO - __main__ - Step 16801: {'lr': 0.0004877641290737884, 'samples': 3225792, 'steps': 16800, 'loss/train': 1.2492268085479736} -11/06/2021 23:37:32 - INFO - __main__ - Step 16802: {'lr': 0.000487762489146034, 'samples': 3225984, 'steps': 16801, 'loss/train': 1.245894193649292} -11/06/2021 23:37:33 - INFO - __main__ - Step 16803: {'lr': 0.0004877608491111475, 'samples': 3226176, 'steps': 16802, 'loss/train': 1.588663101196289} -11/06/2021 23:37:34 - INFO - __main__ - Step 16804: {'lr': 0.0004877592089691296, 'samples': 3226368, 'steps': 16803, 'loss/train': 1.9212385416030884} -11/06/2021 23:37:34 - INFO - __main__ - Step 16805: {'lr': 0.00048775756871998106, 'samples': 3226560, 'steps': 16804, 'loss/train': 1.954315185546875} -11/06/2021 23:37:34 - INFO - __main__ - Step 16806: {'lr': 0.0004877559283637026, 'samples': 3226752, 'steps': 16805, 'loss/train': 1.4202922582626343} -11/06/2021 23:37:35 - INFO - __main__ - Step 16807: {'lr': 0.0004877542879002951, 'samples': 3226944, 'steps': 16806, 'loss/train': 1.4899168014526367} -11/06/2021 23:37:35 - INFO - __main__ - Step 16808: {'lr': 0.0004877526473297591, 'samples': 3227136, 'steps': 16807, 'loss/train': 1.6989758014678955} -11/06/2021 23:37:36 - INFO - __main__ - Step 16809: {'lr': 0.0004877510066520954, 'samples': 3227328, 'steps': 16808, 'loss/train': 1.953574299812317} -11/06/2021 23:37:37 - INFO - __main__ - Step 16810: {'lr': 0.0004877493658673048, 'samples': 3227520, 'steps': 16809, 'loss/train': 1.6780657768249512} -11/06/2021 23:37:37 - INFO - __main__ - Step 16811: {'lr': 0.00048774772497538806, 'samples': 3227712, 'steps': 16810, 'loss/train': 2.09407114982605} -11/06/2021 23:37:37 - INFO - __main__ - Step 16812: {'lr': 0.0004877460839763458, 'samples': 3227904, 'steps': 16811, 'loss/train': 1.4879274368286133} -11/06/2021 23:37:38 - INFO - __main__ - Step 16813: {'lr': 0.0004877444428701788, 'samples': 3228096, 'steps': 16812, 'loss/train': 1.0444165468215942} -11/06/2021 23:37:38 - INFO - __main__ - Step 16814: {'lr': 0.0004877428016568879, 'samples': 3228288, 'steps': 16813, 'loss/train': 1.6901205778121948} -11/06/2021 23:37:38 - INFO - __main__ - Step 16815: {'lr': 0.00048774116033647373, 'samples': 3228480, 'steps': 16814, 'loss/train': 1.6762943267822266} -11/06/2021 23:37:40 - INFO - __main__ - Step 16816: {'lr': 0.0004877395189089371, 'samples': 3228672, 'steps': 16815, 'loss/train': 2.3396244049072266} -11/06/2021 23:37:40 - INFO - __main__ - Step 16817: {'lr': 0.00048773787737427867, 'samples': 3228864, 'steps': 16816, 'loss/train': 1.7871525287628174} -11/06/2021 23:37:40 - INFO - __main__ - Step 16818: {'lr': 0.0004877362357324992, 'samples': 3229056, 'steps': 16817, 'loss/train': 1.87598717212677} -11/06/2021 23:37:41 - INFO - __main__ - Step 16819: {'lr': 0.0004877345939835995, 'samples': 3229248, 'steps': 16818, 'loss/train': 1.668867826461792} -11/06/2021 23:37:41 - INFO - __main__ - Step 16820: {'lr': 0.0004877329521275802, 'samples': 3229440, 'steps': 16819, 'loss/train': 1.777286171913147} -11/06/2021 23:37:41 - INFO - __main__ - Step 16821: {'lr': 0.0004877313101644422, 'samples': 3229632, 'steps': 16820, 'loss/train': 2.054732084274292} -11/06/2021 23:37:43 - INFO - __main__ - Step 16822: {'lr': 0.000487729668094186, 'samples': 3229824, 'steps': 16821, 'loss/train': 1.3124911785125732} -11/06/2021 23:37:43 - INFO - __main__ - Step 16823: {'lr': 0.0004877280259168125, 'samples': 3230016, 'steps': 16822, 'loss/train': 1.8719760179519653} -11/06/2021 23:37:43 - INFO - __main__ - Step 16824: {'lr': 0.0004877263836323226, 'samples': 3230208, 'steps': 16823, 'loss/train': 1.8889883756637573} -11/06/2021 23:37:44 - INFO - __main__ - Step 16825: {'lr': 0.00048772474124071663, 'samples': 3230400, 'steps': 16824, 'loss/train': 1.6828360557556152} -11/06/2021 23:37:44 - INFO - __main__ - Step 16826: {'lr': 0.0004877230987419957, 'samples': 3230592, 'steps': 16825, 'loss/train': 1.12043035030365} -11/06/2021 23:37:45 - INFO - __main__ - Step 16827: {'lr': 0.00048772145613616035, 'samples': 3230784, 'steps': 16826, 'loss/train': 1.7970967292785645} -11/06/2021 23:37:45 - INFO - __main__ - Step 16828: {'lr': 0.00048771981342321145, 'samples': 3230976, 'steps': 16827, 'loss/train': 1.1399004459381104} -11/06/2021 23:37:46 - INFO - __main__ - Step 16829: {'lr': 0.0004877181706031496, 'samples': 3231168, 'steps': 16828, 'loss/train': 1.6806825399398804} -11/06/2021 23:37:46 - INFO - __main__ - Step 16830: {'lr': 0.00048771652767597563, 'samples': 3231360, 'steps': 16829, 'loss/train': 1.6623328924179077} -11/06/2021 23:37:47 - INFO - __main__ - Step 16831: {'lr': 0.0004877148846416903, 'samples': 3231552, 'steps': 16830, 'loss/train': 1.4326417446136475} -11/06/2021 23:37:48 - INFO - __main__ - Step 16832: {'lr': 0.0004877132415002943, 'samples': 3231744, 'steps': 16831, 'loss/train': 1.1790060997009277} -11/06/2021 23:37:48 - INFO - __main__ - Step 16833: {'lr': 0.00048771159825178827, 'samples': 3231936, 'steps': 16832, 'loss/train': 2.1430394649505615} -11/06/2021 23:37:48 - INFO - __main__ - Step 16834: {'lr': 0.0004877099548961732, 'samples': 3232128, 'steps': 16833, 'loss/train': 1.4152675867080688} -11/06/2021 23:37:49 - INFO - __main__ - Step 16835: {'lr': 0.0004877083114334496, 'samples': 3232320, 'steps': 16834, 'loss/train': 1.6590317487716675} -11/06/2021 23:37:49 - INFO - __main__ - Step 16836: {'lr': 0.0004877066678636184, 'samples': 3232512, 'steps': 16835, 'loss/train': 1.7234406471252441} -11/06/2021 23:37:50 - INFO - __main__ - Step 16837: {'lr': 0.00048770502418668017, 'samples': 3232704, 'steps': 16836, 'loss/train': 1.8991540670394897} -11/06/2021 23:37:50 - INFO - __main__ - Step 16838: {'lr': 0.00048770338040263574, 'samples': 3232896, 'steps': 16837, 'loss/train': 2.06113338470459} -11/06/2021 23:37:51 - INFO - __main__ - Step 16839: {'lr': 0.00048770173651148586, 'samples': 3233088, 'steps': 16838, 'loss/train': 1.2442201375961304} -11/06/2021 23:37:51 - INFO - __main__ - Step 16840: {'lr': 0.0004877000925132312, 'samples': 3233280, 'steps': 16839, 'loss/train': 2.102421760559082} -11/06/2021 23:37:51 - INFO - __main__ - Step 16841: {'lr': 0.0004876984484078726, 'samples': 3233472, 'steps': 16840, 'loss/train': 1.9662206172943115} -11/06/2021 23:37:52 - INFO - __main__ - Step 16842: {'lr': 0.0004876968041954107, 'samples': 3233664, 'steps': 16841, 'loss/train': 2.2481026649475098} -11/06/2021 23:37:53 - INFO - __main__ - Step 16843: {'lr': 0.00048769515987584624, 'samples': 3233856, 'steps': 16842, 'loss/train': 1.3896993398666382} -11/06/2021 23:37:53 - INFO - __main__ - Step 16844: {'lr': 0.0004876935154491801, 'samples': 3234048, 'steps': 16843, 'loss/train': 1.4437320232391357} -11/06/2021 23:37:54 - INFO - __main__ - Step 16845: {'lr': 0.00048769187091541287, 'samples': 3234240, 'steps': 16844, 'loss/train': 1.5791386365890503} -11/06/2021 23:37:54 - INFO - __main__ - Step 16846: {'lr': 0.0004876902262745454, 'samples': 3234432, 'steps': 16845, 'loss/train': 2.008009672164917} -11/06/2021 23:37:54 - INFO - __main__ - Step 16847: {'lr': 0.00048768858152657837, 'samples': 3234624, 'steps': 16846, 'loss/train': 1.5482451915740967} -11/06/2021 23:37:55 - INFO - __main__ - Step 16848: {'lr': 0.0004876869366715125, 'samples': 3234816, 'steps': 16847, 'loss/train': 1.9071651697158813} -11/06/2021 23:37:56 - INFO - __main__ - Step 16849: {'lr': 0.0004876852917093486, 'samples': 3235008, 'steps': 16848, 'loss/train': 1.9252054691314697} -11/06/2021 23:37:56 - INFO - __main__ - Step 16850: {'lr': 0.0004876836466400874, 'samples': 3235200, 'steps': 16849, 'loss/train': 1.199202537536621} -11/06/2021 23:37:56 - INFO - __main__ - Step 16851: {'lr': 0.00048768200146372955, 'samples': 3235392, 'steps': 16850, 'loss/train': 1.9420405626296997} -11/06/2021 23:37:57 - INFO - __main__ - Step 16852: {'lr': 0.00048768035618027597, 'samples': 3235584, 'steps': 16851, 'loss/train': 1.7523447275161743} -11/06/2021 23:37:58 - INFO - __main__ - Step 16853: {'lr': 0.00048767871078972717, 'samples': 3235776, 'steps': 16852, 'loss/train': 1.6883947849273682} -11/06/2021 23:37:58 - INFO - __main__ - Step 16854: {'lr': 0.000487677065292084, 'samples': 3235968, 'steps': 16853, 'loss/train': 1.7545671463012695} -11/06/2021 23:37:58 - INFO - __main__ - Step 16855: {'lr': 0.0004876754196873473, 'samples': 3236160, 'steps': 16854, 'loss/train': 1.6839386224746704} -11/06/2021 23:37:59 - INFO - __main__ - Step 16856: {'lr': 0.00048767377397551773, 'samples': 3236352, 'steps': 16855, 'loss/train': 2.0163164138793945} -11/06/2021 23:37:59 - INFO - __main__ - Step 16857: {'lr': 0.00048767212815659593, 'samples': 3236544, 'steps': 16856, 'loss/train': 1.7172329425811768} -11/06/2021 23:38:00 - INFO - __main__ - Step 16858: {'lr': 0.0004876704822305828, 'samples': 3236736, 'steps': 16857, 'loss/train': 1.4067416191101074} -11/06/2021 23:38:00 - INFO - __main__ - Step 16859: {'lr': 0.00048766883619747906, 'samples': 3236928, 'steps': 16858, 'loss/train': 1.5666910409927368} -11/06/2021 23:38:01 - INFO - __main__ - Step 16860: {'lr': 0.00048766719005728534, 'samples': 3237120, 'steps': 16859, 'loss/train': 1.6902843713760376} -11/06/2021 23:38:01 - INFO - __main__ - Step 16861: {'lr': 0.0004876655438100024, 'samples': 3237312, 'steps': 16860, 'loss/train': 1.7778635025024414} -11/06/2021 23:38:01 - INFO - __main__ - Step 16862: {'lr': 0.00048766389745563113, 'samples': 3237504, 'steps': 16861, 'loss/train': 1.489890217781067} -11/06/2021 23:38:02 - INFO - __main__ - Step 16863: {'lr': 0.00048766225099417215, 'samples': 3237696, 'steps': 16862, 'loss/train': 1.5627225637435913} -11/06/2021 23:38:03 - INFO - __main__ - Step 16864: {'lr': 0.0004876606044256262, 'samples': 3237888, 'steps': 16863, 'loss/train': 1.9307020902633667} -11/06/2021 23:38:03 - INFO - __main__ - Step 16865: {'lr': 0.0004876589577499941, 'samples': 3238080, 'steps': 16864, 'loss/train': 2.422271251678467} -11/06/2021 23:38:04 - INFO - __main__ - Step 16866: {'lr': 0.0004876573109672765, 'samples': 3238272, 'steps': 16865, 'loss/train': 1.67001473903656} -11/06/2021 23:38:04 - INFO - __main__ - Step 16867: {'lr': 0.0004876556640774742, 'samples': 3238464, 'steps': 16866, 'loss/train': 1.8609672784805298} -11/06/2021 23:38:05 - INFO - __main__ - Step 16868: {'lr': 0.0004876540170805879, 'samples': 3238656, 'steps': 16867, 'loss/train': 1.879353642463684} -11/06/2021 23:38:05 - INFO - __main__ - Step 16869: {'lr': 0.00048765236997661845, 'samples': 3238848, 'steps': 16868, 'loss/train': 1.293416142463684} -11/06/2021 23:38:06 - INFO - __main__ - Step 16870: {'lr': 0.0004876507227655664, 'samples': 3239040, 'steps': 16869, 'loss/train': 1.5355979204177856} -11/06/2021 23:38:06 - INFO - __main__ - Step 16871: {'lr': 0.00048764907544743264, 'samples': 3239232, 'steps': 16870, 'loss/train': 2.0187036991119385} -11/06/2021 23:38:06 - INFO - __main__ - Step 16872: {'lr': 0.0004876474280222179, 'samples': 3239424, 'steps': 16871, 'loss/train': 2.1045546531677246} -11/06/2021 23:38:07 - INFO - __main__ - Step 16873: {'lr': 0.00048764578048992284, 'samples': 3239616, 'steps': 16872, 'loss/train': 1.7573167085647583} -11/06/2021 23:38:08 - INFO - __main__ - Step 16874: {'lr': 0.0004876441328505483, 'samples': 3239808, 'steps': 16873, 'loss/train': 1.5508947372436523} -11/06/2021 23:38:08 - INFO - __main__ - Step 16875: {'lr': 0.000487642485104095, 'samples': 3240000, 'steps': 16874, 'loss/train': 1.8752604722976685} -11/06/2021 23:38:08 - INFO - __main__ - Step 16876: {'lr': 0.00048764083725056365, 'samples': 3240192, 'steps': 16875, 'loss/train': 1.2444089651107788} -11/06/2021 23:38:09 - INFO - __main__ - Step 16877: {'lr': 0.00048763918928995496, 'samples': 3240384, 'steps': 16876, 'loss/train': 0.795091450214386} -11/06/2021 23:38:10 - INFO - __main__ - Step 16878: {'lr': 0.00048763754122226977, 'samples': 3240576, 'steps': 16877, 'loss/train': 1.2658640146255493} -11/06/2021 23:38:10 - INFO - __main__ - Step 16879: {'lr': 0.00048763589304750876, 'samples': 3240768, 'steps': 16878, 'loss/train': 1.3780895471572876} -11/06/2021 23:38:11 - INFO - __main__ - Step 16880: {'lr': 0.0004876342447656727, 'samples': 3240960, 'steps': 16879, 'loss/train': 1.6554217338562012} -11/06/2021 23:38:11 - INFO - __main__ - Step 16881: {'lr': 0.00048763259637676226, 'samples': 3241152, 'steps': 16880, 'loss/train': 1.099325180053711} -11/06/2021 23:38:11 - INFO - __main__ - Step 16882: {'lr': 0.00048763094788077834, 'samples': 3241344, 'steps': 16881, 'loss/train': 1.8760645389556885} -11/06/2021 23:38:12 - INFO - __main__ - Step 16883: {'lr': 0.0004876292992777215, 'samples': 3241536, 'steps': 16882, 'loss/train': 1.7464240789413452} -11/06/2021 23:38:13 - INFO - __main__ - Step 16884: {'lr': 0.00048762765056759255, 'samples': 3241728, 'steps': 16883, 'loss/train': 1.7331184148788452} -11/06/2021 23:38:13 - INFO - __main__ - Step 16885: {'lr': 0.00048762600175039227, 'samples': 3241920, 'steps': 16884, 'loss/train': 1.990671157836914} -11/06/2021 23:38:13 - INFO - __main__ - Step 16886: {'lr': 0.0004876243528261214, 'samples': 3242112, 'steps': 16885, 'loss/train': 1.2171714305877686} -11/06/2021 23:38:14 - INFO - __main__ - Step 16887: {'lr': 0.0004876227037947807, 'samples': 3242304, 'steps': 16886, 'loss/train': 1.3176175355911255} -11/06/2021 23:38:14 - INFO - __main__ - Step 16888: {'lr': 0.0004876210546563707, 'samples': 3242496, 'steps': 16887, 'loss/train': 1.400641679763794} -11/06/2021 23:38:15 - INFO - __main__ - Step 16889: {'lr': 0.0004876194054108926, 'samples': 3242688, 'steps': 16888, 'loss/train': 1.618189811706543} -11/06/2021 23:38:15 - INFO - __main__ - Step 16890: {'lr': 0.0004876177560583466, 'samples': 3242880, 'steps': 16889, 'loss/train': 1.4612959623336792} -11/06/2021 23:38:16 - INFO - __main__ - Step 16891: {'lr': 0.00048761610659873387, 'samples': 3243072, 'steps': 16890, 'loss/train': 1.4026546478271484} -11/06/2021 23:38:16 - INFO - __main__ - Step 16892: {'lr': 0.0004876144570320549, 'samples': 3243264, 'steps': 16891, 'loss/train': 1.5020729303359985} -11/06/2021 23:38:16 - INFO - __main__ - Step 16893: {'lr': 0.0004876128073583106, 'samples': 3243456, 'steps': 16892, 'loss/train': 1.9043554067611694} -11/06/2021 23:38:18 - INFO - __main__ - Step 16894: {'lr': 0.00048761115757750155, 'samples': 3243648, 'steps': 16893, 'loss/train': 1.3672549724578857} -11/06/2021 23:38:18 - INFO - __main__ - Step 16895: {'lr': 0.00048760950768962863, 'samples': 3243840, 'steps': 16894, 'loss/train': 1.6721173524856567} -11/06/2021 23:38:18 - INFO - __main__ - Step 16896: {'lr': 0.00048760785769469254, 'samples': 3244032, 'steps': 16895, 'loss/train': 1.9637107849121094} -11/06/2021 23:38:19 - INFO - __main__ - Step 16897: {'lr': 0.00048760620759269403, 'samples': 3244224, 'steps': 16896, 'loss/train': 0.48643603920936584} -11/06/2021 23:38:19 - INFO - __main__ - Step 16898: {'lr': 0.00048760455738363376, 'samples': 3244416, 'steps': 16897, 'loss/train': 2.0343399047851562} -11/06/2021 23:38:19 - INFO - __main__ - Step 16899: {'lr': 0.0004876029070675126, 'samples': 3244608, 'steps': 16898, 'loss/train': 1.2345243692398071} -11/06/2021 23:38:20 - INFO - __main__ - Step 16900: {'lr': 0.0004876012566443312, 'samples': 3244800, 'steps': 16899, 'loss/train': 2.1287524700164795} -11/06/2021 23:38:21 - INFO - __main__ - Step 16901: {'lr': 0.00048759960611409036, 'samples': 3244992, 'steps': 16900, 'loss/train': 3.2728943824768066} -11/06/2021 23:38:21 - INFO - __main__ - Step 16902: {'lr': 0.00048759795547679083, 'samples': 3245184, 'steps': 16901, 'loss/train': 1.828813910484314} -11/06/2021 23:38:21 - INFO - __main__ - Step 16903: {'lr': 0.00048759630473243327, 'samples': 3245376, 'steps': 16902, 'loss/train': 1.6020948886871338} -11/06/2021 23:38:22 - INFO - __main__ - Step 16904: {'lr': 0.00048759465388101855, 'samples': 3245568, 'steps': 16903, 'loss/train': 1.3073654174804688} -11/06/2021 23:38:23 - INFO - __main__ - Step 16905: {'lr': 0.0004875930029225473, 'samples': 3245760, 'steps': 16904, 'loss/train': 1.9156172275543213} -11/06/2021 23:38:23 - INFO - __main__ - Step 16906: {'lr': 0.0004875913518570203, 'samples': 3245952, 'steps': 16905, 'loss/train': 1.7705250978469849} -11/06/2021 23:38:24 - INFO - __main__ - Step 16907: {'lr': 0.0004875897006844383, 'samples': 3246144, 'steps': 16906, 'loss/train': 1.3052102327346802} -11/06/2021 23:38:24 - INFO - __main__ - Step 16908: {'lr': 0.00048758804940480203, 'samples': 3246336, 'steps': 16907, 'loss/train': 1.4894630908966064} -11/06/2021 23:38:24 - INFO - __main__ - Step 16909: {'lr': 0.0004875863980181123, 'samples': 3246528, 'steps': 16908, 'loss/train': 1.704583764076233} -11/06/2021 23:38:25 - INFO - __main__ - Step 16910: {'lr': 0.0004875847465243698, 'samples': 3246720, 'steps': 16909, 'loss/train': 1.5926655530929565} -11/06/2021 23:38:26 - INFO - __main__ - Step 16911: {'lr': 0.00048758309492357533, 'samples': 3246912, 'steps': 16910, 'loss/train': 1.5082074403762817} -11/06/2021 23:38:26 - INFO - __main__ - Step 16912: {'lr': 0.0004875814432157295, 'samples': 3247104, 'steps': 16911, 'loss/train': 0.24572615325450897} -11/06/2021 23:38:26 - INFO - __main__ - Step 16913: {'lr': 0.0004875797914008332, 'samples': 3247296, 'steps': 16912, 'loss/train': 1.7498927116394043} -11/06/2021 23:38:27 - INFO - __main__ - Step 16914: {'lr': 0.00048757813947888706, 'samples': 3247488, 'steps': 16913, 'loss/train': 1.81270432472229} -11/06/2021 23:38:28 - INFO - __main__ - Step 16915: {'lr': 0.0004875764874498919, 'samples': 3247680, 'steps': 16914, 'loss/train': 1.2739442586898804} -11/06/2021 23:38:28 - INFO - __main__ - Step 16916: {'lr': 0.00048757483531384837, 'samples': 3247872, 'steps': 16915, 'loss/train': 1.8057383298873901} -11/06/2021 23:38:28 - INFO - __main__ - Step 16917: {'lr': 0.0004875731830707574, 'samples': 3248064, 'steps': 16916, 'loss/train': 1.790678858757019} -11/06/2021 23:38:29 - INFO - __main__ - Step 16918: {'lr': 0.00048757153072061954, 'samples': 3248256, 'steps': 16917, 'loss/train': 1.7016808986663818} -11/06/2021 23:38:29 - INFO - __main__ - Step 16919: {'lr': 0.0004875698782634357, 'samples': 3248448, 'steps': 16918, 'loss/train': 1.927436113357544} -11/06/2021 23:38:30 - INFO - __main__ - Step 16920: {'lr': 0.00048756822569920647, 'samples': 3248640, 'steps': 16919, 'loss/train': 1.947782278060913} -11/06/2021 23:38:31 - INFO - __main__ - Step 16921: {'lr': 0.0004875665730279326, 'samples': 3248832, 'steps': 16920, 'loss/train': 1.8256161212921143} -11/06/2021 23:38:31 - INFO - __main__ - Step 16922: {'lr': 0.000487564920249615, 'samples': 3249024, 'steps': 16921, 'loss/train': 1.3792588710784912} -11/06/2021 23:38:31 - INFO - __main__ - Step 16923: {'lr': 0.00048756326736425427, 'samples': 3249216, 'steps': 16922, 'loss/train': 1.6660298109054565} -11/06/2021 23:38:32 - INFO - __main__ - Step 16924: {'lr': 0.00048756161437185126, 'samples': 3249408, 'steps': 16923, 'loss/train': 1.9878901243209839} -11/06/2021 23:38:33 - INFO - __main__ - Step 16925: {'lr': 0.0004875599612724066, 'samples': 3249600, 'steps': 16924, 'loss/train': 1.48038649559021} -11/06/2021 23:38:33 - INFO - __main__ - Step 16926: {'lr': 0.00048755830806592105, 'samples': 3249792, 'steps': 16925, 'loss/train': 1.4531468152999878} -11/06/2021 23:38:33 - INFO - __main__ - Step 16927: {'lr': 0.00048755665475239547, 'samples': 3249984, 'steps': 16926, 'loss/train': 1.3796802759170532} -11/06/2021 23:38:34 - INFO - __main__ - Step 16928: {'lr': 0.0004875550013318305, 'samples': 3250176, 'steps': 16927, 'loss/train': 1.5753812789916992} -11/06/2021 23:38:34 - INFO - __main__ - Step 16929: {'lr': 0.0004875533478042269, 'samples': 3250368, 'steps': 16928, 'loss/train': 1.530529260635376} -11/06/2021 23:38:34 - INFO - __main__ - Step 16930: {'lr': 0.00048755169416958544, 'samples': 3250560, 'steps': 16929, 'loss/train': 0.7025906443595886} -11/06/2021 23:38:35 - INFO - __main__ - Step 16931: {'lr': 0.00048755004042790685, 'samples': 3250752, 'steps': 16930, 'loss/train': 1.3983508348464966} -11/06/2021 23:38:36 - INFO - __main__ - Step 16932: {'lr': 0.00048754838657919186, 'samples': 3250944, 'steps': 16931, 'loss/train': 1.5572248697280884} -11/06/2021 23:38:36 - INFO - __main__ - Step 16933: {'lr': 0.00048754673262344124, 'samples': 3251136, 'steps': 16932, 'loss/train': 1.7678862810134888} -11/06/2021 23:38:36 - INFO - __main__ - Step 16934: {'lr': 0.00048754507856065574, 'samples': 3251328, 'steps': 16933, 'loss/train': 1.5842539072036743} -11/06/2021 23:38:37 - INFO - __main__ - Step 16935: {'lr': 0.0004875434243908361, 'samples': 3251520, 'steps': 16934, 'loss/train': 1.8356921672821045} -11/06/2021 23:38:38 - INFO - __main__ - Step 16936: {'lr': 0.00048754177011398303, 'samples': 3251712, 'steps': 16935, 'loss/train': 1.8403395414352417} -11/06/2021 23:38:38 - INFO - __main__ - Step 16937: {'lr': 0.0004875401157300973, 'samples': 3251904, 'steps': 16936, 'loss/train': 1.9707876443862915} -11/06/2021 23:38:38 - INFO - __main__ - Step 16938: {'lr': 0.00048753846123917964, 'samples': 3252096, 'steps': 16937, 'loss/train': 1.436141014099121} -11/06/2021 23:38:39 - INFO - __main__ - Step 16939: {'lr': 0.0004875368066412309, 'samples': 3252288, 'steps': 16938, 'loss/train': 1.4638780355453491} -11/06/2021 23:38:39 - INFO - __main__ - Step 16940: {'lr': 0.00048753515193625165, 'samples': 3252480, 'steps': 16939, 'loss/train': 1.765663981437683} -11/06/2021 23:38:40 - INFO - __main__ - Step 16941: {'lr': 0.00048753349712424277, 'samples': 3252672, 'steps': 16940, 'loss/train': 1.8791602849960327} -11/06/2021 23:38:40 - INFO - __main__ - Step 16942: {'lr': 0.00048753184220520497, 'samples': 3252864, 'steps': 16941, 'loss/train': 1.836533784866333} -11/06/2021 23:38:41 - INFO - __main__ - Step 16943: {'lr': 0.000487530187179139, 'samples': 3253056, 'steps': 16942, 'loss/train': 1.2585967779159546} -11/06/2021 23:38:41 - INFO - __main__ - Step 16944: {'lr': 0.00048752853204604555, 'samples': 3253248, 'steps': 16943, 'loss/train': 1.238154649734497} -11/06/2021 23:38:42 - INFO - __main__ - Step 16945: {'lr': 0.00048752687680592545, 'samples': 3253440, 'steps': 16944, 'loss/train': 1.5847913026809692} -11/06/2021 23:38:43 - INFO - __main__ - Step 16946: {'lr': 0.00048752522145877937, 'samples': 3253632, 'steps': 16945, 'loss/train': 1.8298143148422241} -11/06/2021 23:38:43 - INFO - __main__ - Step 16947: {'lr': 0.0004875235660046081, 'samples': 3253824, 'steps': 16946, 'loss/train': 1.9328862428665161} -11/06/2021 23:38:43 - INFO - __main__ - Step 16948: {'lr': 0.0004875219104434124, 'samples': 3254016, 'steps': 16947, 'loss/train': 1.6540714502334595} -11/06/2021 23:38:44 - INFO - __main__ - Step 16949: {'lr': 0.0004875202547751929, 'samples': 3254208, 'steps': 16948, 'loss/train': 1.6022636890411377} -11/06/2021 23:38:44 - INFO - __main__ - Step 16950: {'lr': 0.00048751859899995054, 'samples': 3254400, 'steps': 16949, 'loss/train': 1.9451600313186646} -11/06/2021 23:38:44 - INFO - __main__ - Step 16951: {'lr': 0.0004875169431176859, 'samples': 3254592, 'steps': 16950, 'loss/train': 1.8131561279296875} -11/06/2021 23:38:45 - INFO - __main__ - Step 16952: {'lr': 0.0004875152871283999, 'samples': 3254784, 'steps': 16951, 'loss/train': 0.9848697185516357} -11/06/2021 23:38:46 - INFO - __main__ - Step 16953: {'lr': 0.0004875136310320931, 'samples': 3254976, 'steps': 16952, 'loss/train': 1.7647054195404053} -11/06/2021 23:38:46 - INFO - __main__ - Step 16954: {'lr': 0.0004875119748287663, 'samples': 3255168, 'steps': 16953, 'loss/train': 1.5684469938278198} -11/06/2021 23:38:46 - INFO - __main__ - Step 16955: {'lr': 0.0004875103185184203, 'samples': 3255360, 'steps': 16954, 'loss/train': 1.8279472589492798} -11/06/2021 23:38:47 - INFO - __main__ - Step 16956: {'lr': 0.00048750866210105583, 'samples': 3255552, 'steps': 16955, 'loss/train': 1.563040018081665} -11/06/2021 23:38:48 - INFO - __main__ - Step 16957: {'lr': 0.0004875070055766736, 'samples': 3255744, 'steps': 16956, 'loss/train': 1.38356614112854} -11/06/2021 23:38:48 - INFO - __main__ - Step 16958: {'lr': 0.0004875053489452743, 'samples': 3255936, 'steps': 16957, 'loss/train': 1.8866616487503052} -11/06/2021 23:38:48 - INFO - __main__ - Step 16959: {'lr': 0.00048750369220685886, 'samples': 3256128, 'steps': 16958, 'loss/train': 2.1793675422668457} -11/06/2021 23:38:49 - INFO - __main__ - Step 16960: {'lr': 0.0004875020353614279, 'samples': 3256320, 'steps': 16959, 'loss/train': 1.5973029136657715} -11/06/2021 23:38:49 - INFO - __main__ - Step 16961: {'lr': 0.0004875003784089822, 'samples': 3256512, 'steps': 16960, 'loss/train': 0.8916923403739929} -11/06/2021 23:38:50 - INFO - __main__ - Step 16962: {'lr': 0.00048749872134952243, 'samples': 3256704, 'steps': 16961, 'loss/train': 1.789965033531189} -11/06/2021 23:38:51 - INFO - __main__ - Step 16963: {'lr': 0.0004874970641830495, 'samples': 3256896, 'steps': 16962, 'loss/train': 1.8704382181167603} -11/06/2021 23:38:51 - INFO - __main__ - Step 16964: {'lr': 0.000487495406909564, 'samples': 3257088, 'steps': 16963, 'loss/train': 1.7221460342407227} -11/06/2021 23:38:51 - INFO - __main__ - Step 16965: {'lr': 0.00048749374952906677, 'samples': 3257280, 'steps': 16964, 'loss/train': 1.4671553373336792} -11/06/2021 23:38:52 - INFO - __main__ - Step 16966: {'lr': 0.0004874920920415584, 'samples': 3257472, 'steps': 16965, 'loss/train': 1.615160346031189} -11/06/2021 23:38:52 - INFO - __main__ - Step 16967: {'lr': 0.0004874904344470399, 'samples': 3257664, 'steps': 16966, 'loss/train': 2.103879690170288} -11/06/2021 23:38:53 - INFO - __main__ - Step 16968: {'lr': 0.00048748877674551183, 'samples': 3257856, 'steps': 16967, 'loss/train': 1.7058079242706299} -11/06/2021 23:38:53 - INFO - __main__ - Step 16969: {'lr': 0.00048748711893697495, 'samples': 3258048, 'steps': 16968, 'loss/train': 1.2930617332458496} -11/06/2021 23:38:54 - INFO - __main__ - Step 16970: {'lr': 0.0004874854610214301, 'samples': 3258240, 'steps': 16969, 'loss/train': 1.7520792484283447} -11/06/2021 23:38:54 - INFO - __main__ - Step 16971: {'lr': 0.00048748380299887793, 'samples': 3258432, 'steps': 16970, 'loss/train': 1.4183677434921265} -11/06/2021 23:38:54 - INFO - __main__ - Step 16972: {'lr': 0.0004874821448693192, 'samples': 3258624, 'steps': 16971, 'loss/train': 1.4067054986953735} -11/06/2021 23:38:56 - INFO - __main__ - Step 16973: {'lr': 0.00048748048663275475, 'samples': 3258816, 'steps': 16972, 'loss/train': 1.6782017946243286} -11/06/2021 23:38:56 - INFO - __main__ - Step 16974: {'lr': 0.00048747882828918524, 'samples': 3259008, 'steps': 16973, 'loss/train': 1.7959372997283936} -11/06/2021 23:38:56 - INFO - __main__ - Step 16975: {'lr': 0.0004874771698386113, 'samples': 3259200, 'steps': 16974, 'loss/train': 1.3942209482192993} -11/06/2021 23:38:57 - INFO - __main__ - Step 16976: {'lr': 0.00048747551128103397, 'samples': 3259392, 'steps': 16975, 'loss/train': 1.8319814205169678} -11/06/2021 23:38:57 - INFO - __main__ - Step 16977: {'lr': 0.00048747385261645377, 'samples': 3259584, 'steps': 16976, 'loss/train': 1.7434256076812744} -11/06/2021 23:38:58 - INFO - __main__ - Step 16978: {'lr': 0.0004874721938448715, 'samples': 3259776, 'steps': 16977, 'loss/train': 1.804638147354126} -11/06/2021 23:38:58 - INFO - __main__ - Step 16979: {'lr': 0.000487470534966288, 'samples': 3259968, 'steps': 16978, 'loss/train': 1.7611198425292969} -11/06/2021 23:38:59 - INFO - __main__ - Step 16980: {'lr': 0.0004874688759807039, 'samples': 3260160, 'steps': 16979, 'loss/train': 1.878199577331543} -11/06/2021 23:38:59 - INFO - __main__ - Step 16981: {'lr': 0.00048746721688812004, 'samples': 3260352, 'steps': 16980, 'loss/train': 1.5293978452682495} -11/06/2021 23:38:59 - INFO - __main__ - Step 16982: {'lr': 0.00048746555768853703, 'samples': 3260544, 'steps': 16981, 'loss/train': 0.42321673035621643} -11/06/2021 23:39:00 - INFO - __main__ - Step 16983: {'lr': 0.00048746389838195573, 'samples': 3260736, 'steps': 16982, 'loss/train': 2.233102560043335} -11/06/2021 23:39:01 - INFO - __main__ - Step 16984: {'lr': 0.0004874622389683768, 'samples': 3260928, 'steps': 16983, 'loss/train': 1.3476516008377075} -11/06/2021 23:39:01 - INFO - __main__ - Step 16985: {'lr': 0.0004874605794478012, 'samples': 3261120, 'steps': 16984, 'loss/train': 2.141995668411255} -11/06/2021 23:39:01 - INFO - __main__ - Step 16986: {'lr': 0.0004874589198202294, 'samples': 3261312, 'steps': 16985, 'loss/train': 1.3058313131332397} -11/06/2021 23:39:02 - INFO - __main__ - Step 16987: {'lr': 0.0004874572600856624, 'samples': 3261504, 'steps': 16986, 'loss/train': 2.046851873397827} -11/06/2021 23:39:03 - INFO - __main__ - Step 16988: {'lr': 0.0004874556002441007, 'samples': 3261696, 'steps': 16987, 'loss/train': 1.474866271018982} -11/06/2021 23:39:03 - INFO - __main__ - Step 16989: {'lr': 0.0004874539402955452, 'samples': 3261888, 'steps': 16988, 'loss/train': 1.660361647605896} -11/06/2021 23:39:04 - INFO - __main__ - Step 16990: {'lr': 0.00048745228023999666, 'samples': 3262080, 'steps': 16989, 'loss/train': 1.2000677585601807} -11/06/2021 23:39:04 - INFO - __main__ - Step 16991: {'lr': 0.0004874506200774557, 'samples': 3262272, 'steps': 16990, 'loss/train': 0.9482690095901489} -11/06/2021 23:39:04 - INFO - __main__ - Step 16992: {'lr': 0.00048744895980792327, 'samples': 3262464, 'steps': 16991, 'loss/train': 1.494470477104187} -11/06/2021 23:39:05 - INFO - __main__ - Step 16993: {'lr': 0.00048744729943139993, 'samples': 3262656, 'steps': 16992, 'loss/train': 2.6627840995788574} -11/06/2021 23:39:06 - INFO - __main__ - Step 16994: {'lr': 0.0004874456389478865, 'samples': 3262848, 'steps': 16993, 'loss/train': 1.9466887712478638} -11/06/2021 23:39:06 - INFO - __main__ - Step 16995: {'lr': 0.00048744397835738377, 'samples': 3263040, 'steps': 16994, 'loss/train': 1.755508542060852} -11/06/2021 23:39:06 - INFO - __main__ - Step 16996: {'lr': 0.00048744231765989246, 'samples': 3263232, 'steps': 16995, 'loss/train': 1.8926562070846558} -11/06/2021 23:39:07 - INFO - __main__ - Step 16997: {'lr': 0.0004874406568554132, 'samples': 3263424, 'steps': 16996, 'loss/train': 2.095759868621826} -11/06/2021 23:39:07 - INFO - __main__ - Step 16998: {'lr': 0.0004874389959439469, 'samples': 3263616, 'steps': 16997, 'loss/train': 1.821245789527893} -11/06/2021 23:39:08 - INFO - __main__ - Step 16999: {'lr': 0.0004874373349254943, 'samples': 3263808, 'steps': 16998, 'loss/train': 1.4103591442108154} -11/06/2021 23:39:09 - INFO - __main__ - Step 17000: {'lr': 0.00048743567380005604, 'samples': 3264000, 'steps': 16999, 'loss/train': 1.9653171300888062} -11/06/2021 23:39:09 - INFO - __main__ - Step 17001: {'lr': 0.000487434012567633, 'samples': 3264192, 'steps': 17000, 'loss/train': 1.2199618816375732} -11/06/2021 23:39:09 - INFO - __main__ - Step 17002: {'lr': 0.0004874323512282258, 'samples': 3264384, 'steps': 17001, 'loss/train': 1.7762051820755005} -11/06/2021 23:39:10 - INFO - __main__ - Step 17003: {'lr': 0.00048743068978183523, 'samples': 3264576, 'steps': 17002, 'loss/train': 1.578262448310852} -11/06/2021 23:39:11 - INFO - __main__ - Step 17004: {'lr': 0.00048742902822846215, 'samples': 3264768, 'steps': 17003, 'loss/train': 1.8485451936721802} -11/06/2021 23:39:11 - INFO - __main__ - Step 17005: {'lr': 0.0004874273665681071, 'samples': 3264960, 'steps': 17004, 'loss/train': 1.8046890497207642} -11/06/2021 23:39:12 - INFO - __main__ - Step 17006: {'lr': 0.00048742570480077096, 'samples': 3265152, 'steps': 17005, 'loss/train': 0.393635630607605} -11/06/2021 23:39:12 - INFO - __main__ - Step 17007: {'lr': 0.0004874240429264545, 'samples': 3265344, 'steps': 17006, 'loss/train': 2.030019760131836} -11/06/2021 23:39:12 - INFO - __main__ - Step 17008: {'lr': 0.00048742238094515844, 'samples': 3265536, 'steps': 17007, 'loss/train': 1.7320748567581177} -11/06/2021 23:39:13 - INFO - __main__ - Step 17009: {'lr': 0.00048742071885688354, 'samples': 3265728, 'steps': 17008, 'loss/train': 1.4661654233932495} -11/06/2021 23:39:14 - INFO - __main__ - Step 17010: {'lr': 0.00048741905666163047, 'samples': 3265920, 'steps': 17009, 'loss/train': 1.0361342430114746} -11/06/2021 23:39:14 - INFO - __main__ - Step 17011: {'lr': 0.00048741739435940003, 'samples': 3266112, 'steps': 17010, 'loss/train': 0.8936920166015625} -11/06/2021 23:39:14 - INFO - __main__ - Step 17012: {'lr': 0.000487415731950193, 'samples': 3266304, 'steps': 17011, 'loss/train': 1.6268352270126343} -11/06/2021 23:39:15 - INFO - __main__ - Step 17013: {'lr': 0.0004874140694340101, 'samples': 3266496, 'steps': 17012, 'loss/train': 1.5285117626190186} -11/06/2021 23:39:16 - INFO - __main__ - Step 17014: {'lr': 0.0004874124068108521, 'samples': 3266688, 'steps': 17013, 'loss/train': 1.6101415157318115} -11/06/2021 23:39:16 - INFO - __main__ - Step 17015: {'lr': 0.00048741074408071975, 'samples': 3266880, 'steps': 17014, 'loss/train': 1.7432715892791748} -11/06/2021 23:39:17 - INFO - __main__ - Step 17016: {'lr': 0.00048740908124361373, 'samples': 3267072, 'steps': 17015, 'loss/train': 1.9835989475250244} -11/06/2021 23:39:17 - INFO - __main__ - Step 17017: {'lr': 0.0004874074182995349, 'samples': 3267264, 'steps': 17016, 'loss/train': 1.999614953994751} -11/06/2021 23:39:17 - INFO - __main__ - Step 17018: {'lr': 0.0004874057552484839, 'samples': 3267456, 'steps': 17017, 'loss/train': 1.9977906942367554} -11/06/2021 23:39:18 - INFO - __main__ - Step 17019: {'lr': 0.00048740409209046154, 'samples': 3267648, 'steps': 17018, 'loss/train': 1.9863004684448242} -11/06/2021 23:39:19 - INFO - __main__ - Step 17020: {'lr': 0.0004874024288254686, 'samples': 3267840, 'steps': 17019, 'loss/train': 1.82778799533844} -11/06/2021 23:39:19 - INFO - __main__ - Step 17021: {'lr': 0.00048740076545350573, 'samples': 3268032, 'steps': 17020, 'loss/train': 3.3035099506378174} -11/06/2021 23:39:19 - INFO - __main__ - Step 17022: {'lr': 0.00048739910197457376, 'samples': 3268224, 'steps': 17021, 'loss/train': 1.5491119623184204} -11/06/2021 23:39:20 - INFO - __main__ - Step 17023: {'lr': 0.00048739743838867344, 'samples': 3268416, 'steps': 17022, 'loss/train': 1.543113112449646} -11/06/2021 23:39:20 - INFO - __main__ - Step 17024: {'lr': 0.00048739577469580545, 'samples': 3268608, 'steps': 17023, 'loss/train': 1.7079392671585083} -11/06/2021 23:39:21 - INFO - __main__ - Step 17025: {'lr': 0.0004873941108959706, 'samples': 3268800, 'steps': 17024, 'loss/train': 1.5123034715652466} -11/06/2021 23:39:21 - INFO - __main__ - Step 17026: {'lr': 0.0004873924469891697, 'samples': 3268992, 'steps': 17025, 'loss/train': 2.073899507522583} -11/06/2021 23:39:22 - INFO - __main__ - Step 17027: {'lr': 0.00048739078297540335, 'samples': 3269184, 'steps': 17026, 'loss/train': 1.565974235534668} -11/06/2021 23:39:22 - INFO - __main__ - Step 17028: {'lr': 0.00048738911885467243, 'samples': 3269376, 'steps': 17027, 'loss/train': 1.5371849536895752} -11/06/2021 23:39:22 - INFO - __main__ - Step 17029: {'lr': 0.00048738745462697754, 'samples': 3269568, 'steps': 17028, 'loss/train': 1.8682217597961426} -11/06/2021 23:39:24 - INFO - __main__ - Step 17030: {'lr': 0.0004873857902923196, 'samples': 3269760, 'steps': 17029, 'loss/train': 1.9690535068511963} -11/06/2021 23:39:24 - INFO - __main__ - Step 17031: {'lr': 0.00048738412585069927, 'samples': 3269952, 'steps': 17030, 'loss/train': 0.5062768459320068} -11/06/2021 23:39:24 - INFO - __main__ - Step 17032: {'lr': 0.00048738246130211734, 'samples': 3270144, 'steps': 17031, 'loss/train': 1.5573618412017822} -11/06/2021 23:39:25 - INFO - __main__ - Step 17033: {'lr': 0.00048738079664657454, 'samples': 3270336, 'steps': 17032, 'loss/train': 1.1958006620407104} -11/06/2021 23:39:25 - INFO - __main__ - Step 17034: {'lr': 0.00048737913188407156, 'samples': 3270528, 'steps': 17033, 'loss/train': 1.5426795482635498} -11/06/2021 23:39:26 - INFO - __main__ - Step 17035: {'lr': 0.00048737746701460927, 'samples': 3270720, 'steps': 17034, 'loss/train': 1.8075716495513916} -11/06/2021 23:39:26 - INFO - __main__ - Step 17036: {'lr': 0.0004873758020381883, 'samples': 3270912, 'steps': 17035, 'loss/train': 1.7565505504608154} -11/06/2021 23:39:27 - INFO - __main__ - Step 17037: {'lr': 0.00048737413695480947, 'samples': 3271104, 'steps': 17036, 'loss/train': 2.1112308502197266} -11/06/2021 23:39:27 - INFO - __main__ - Step 17038: {'lr': 0.00048737247176447354, 'samples': 3271296, 'steps': 17037, 'loss/train': 1.8859508037567139} -11/06/2021 23:39:27 - INFO - __main__ - Step 17039: {'lr': 0.0004873708064671812, 'samples': 3271488, 'steps': 17038, 'loss/train': 1.6623574495315552} -11/06/2021 23:39:28 - INFO - __main__ - Step 17040: {'lr': 0.0004873691410629333, 'samples': 3271680, 'steps': 17039, 'loss/train': 1.8081897497177124} -11/06/2021 23:39:29 - INFO - __main__ - Step 17041: {'lr': 0.0004873674755517304, 'samples': 3271872, 'steps': 17040, 'loss/train': 1.7349417209625244} -11/06/2021 23:39:29 - INFO - __main__ - Step 17042: {'lr': 0.00048736580993357357, 'samples': 3272064, 'steps': 17041, 'loss/train': 1.7138926982879639} -11/06/2021 23:39:29 - INFO - __main__ - Step 17043: {'lr': 0.0004873641442084632, 'samples': 3272256, 'steps': 17042, 'loss/train': 1.552172303199768} -11/06/2021 23:39:30 - INFO - __main__ - Step 17044: {'lr': 0.00048736247837640037, 'samples': 3272448, 'steps': 17043, 'loss/train': 1.3372807502746582} -11/06/2021 23:39:30 - INFO - __main__ - Step 17045: {'lr': 0.0004873608124373855, 'samples': 3272640, 'steps': 17044, 'loss/train': 1.974311113357544} -11/06/2021 23:39:31 - INFO - __main__ - Step 17046: {'lr': 0.00048735914639141964, 'samples': 3272832, 'steps': 17045, 'loss/train': 1.299238920211792} -11/06/2021 23:39:32 - INFO - __main__ - Step 17047: {'lr': 0.00048735748023850337, 'samples': 3273024, 'steps': 17046, 'loss/train': 1.769322156906128} -11/06/2021 23:39:32 - INFO - __main__ - Step 17048: {'lr': 0.00048735581397863745, 'samples': 3273216, 'steps': 17047, 'loss/train': 1.0597976446151733} -11/06/2021 23:39:32 - INFO - __main__ - Step 17049: {'lr': 0.0004873541476118227, 'samples': 3273408, 'steps': 17048, 'loss/train': 5.835102081298828} -11/06/2021 23:39:33 - INFO - __main__ - Step 17050: {'lr': 0.00048735248113805976, 'samples': 3273600, 'steps': 17049, 'loss/train': 1.1489970684051514} -11/06/2021 23:39:34 - INFO - __main__ - Step 17051: {'lr': 0.0004873508145573495, 'samples': 3273792, 'steps': 17050, 'loss/train': 1.3549208641052246} -11/06/2021 23:39:34 - INFO - __main__ - Step 17052: {'lr': 0.00048734914786969266, 'samples': 3273984, 'steps': 17051, 'loss/train': 1.75826895236969} -11/06/2021 23:39:34 - INFO - __main__ - Step 17053: {'lr': 0.00048734748107509, 'samples': 3274176, 'steps': 17052, 'loss/train': 1.9871326684951782} -11/06/2021 23:39:35 - INFO - __main__ - Step 17054: {'lr': 0.0004873458141735421, 'samples': 3274368, 'steps': 17053, 'loss/train': 1.1350014209747314} -11/06/2021 23:39:35 - INFO - __main__ - Step 17055: {'lr': 0.0004873441471650499, 'samples': 3274560, 'steps': 17054, 'loss/train': 1.7989593744277954} -11/06/2021 23:39:35 - INFO - __main__ - Step 17056: {'lr': 0.00048734248004961414, 'samples': 3274752, 'steps': 17055, 'loss/train': 1.6534098386764526} -11/06/2021 23:39:37 - INFO - __main__ - Step 17057: {'lr': 0.00048734081282723543, 'samples': 3274944, 'steps': 17056, 'loss/train': 1.4881923198699951} -11/06/2021 23:39:37 - INFO - __main__ - Step 17058: {'lr': 0.00048733914549791465, 'samples': 3275136, 'steps': 17057, 'loss/train': 1.5087233781814575} -11/06/2021 23:39:37 - INFO - __main__ - Step 17059: {'lr': 0.0004873374780616525, 'samples': 3275328, 'steps': 17058, 'loss/train': 1.679807186126709} -11/06/2021 23:39:38 - INFO - __main__ - Step 17060: {'lr': 0.00048733581051844976, 'samples': 3275520, 'steps': 17059, 'loss/train': 0.27972447872161865} -11/06/2021 23:39:38 - INFO - __main__ - Step 17061: {'lr': 0.00048733414286830716, 'samples': 3275712, 'steps': 17060, 'loss/train': 1.3394430875778198} -11/06/2021 23:39:39 - INFO - __main__ - Step 17062: {'lr': 0.00048733247511122547, 'samples': 3275904, 'steps': 17061, 'loss/train': 1.8187850713729858} -11/06/2021 23:39:40 - INFO - __main__ - Step 17063: {'lr': 0.00048733080724720545, 'samples': 3276096, 'steps': 17062, 'loss/train': 1.4330551624298096} -11/06/2021 23:39:40 - INFO - __main__ - Step 17064: {'lr': 0.00048732913927624776, 'samples': 3276288, 'steps': 17063, 'loss/train': 1.9322031736373901} -11/06/2021 23:39:40 - INFO - __main__ - Step 17065: {'lr': 0.0004873274711983533, 'samples': 3276480, 'steps': 17064, 'loss/train': 1.0093766450881958} -11/06/2021 23:39:41 - INFO - __main__ - Step 17066: {'lr': 0.0004873258030135227, 'samples': 3276672, 'steps': 17065, 'loss/train': 1.3425406217575073} -11/06/2021 23:39:42 - INFO - __main__ - Step 17067: {'lr': 0.0004873241347217567, 'samples': 3276864, 'steps': 17066, 'loss/train': 2.148686647415161} -11/06/2021 23:39:42 - INFO - __main__ - Step 17068: {'lr': 0.0004873224663230562, 'samples': 3277056, 'steps': 17067, 'loss/train': 1.3120168447494507} -11/06/2021 23:39:42 - INFO - __main__ - Step 17069: {'lr': 0.0004873207978174219, 'samples': 3277248, 'steps': 17068, 'loss/train': 1.5943224430084229} -11/06/2021 23:39:43 - INFO - __main__ - Step 17070: {'lr': 0.00048731912920485444, 'samples': 3277440, 'steps': 17069, 'loss/train': 0.7484023571014404} -11/06/2021 23:39:43 - INFO - __main__ - Step 17071: {'lr': 0.0004873174604853546, 'samples': 3277632, 'steps': 17070, 'loss/train': 1.536741018295288} -11/06/2021 23:39:44 - INFO - __main__ - Step 17072: {'lr': 0.00048731579165892325, 'samples': 3277824, 'steps': 17071, 'loss/train': 1.413906455039978} -11/06/2021 23:39:45 - INFO - __main__ - Step 17073: {'lr': 0.000487314122725561, 'samples': 3278016, 'steps': 17072, 'loss/train': 1.606602668762207} -11/06/2021 23:39:45 - INFO - __main__ - Step 17074: {'lr': 0.00048731245368526877, 'samples': 3278208, 'steps': 17073, 'loss/train': 1.9211560487747192} -11/06/2021 23:39:45 - INFO - __main__ - Step 17075: {'lr': 0.0004873107845380471, 'samples': 3278400, 'steps': 17074, 'loss/train': 1.820310115814209} -11/06/2021 23:39:46 - INFO - __main__ - Step 17076: {'lr': 0.00048730911528389686, 'samples': 3278592, 'steps': 17075, 'loss/train': 1.947972059249878} -11/06/2021 23:39:47 - INFO - __main__ - Step 17077: {'lr': 0.0004873074459228188, 'samples': 3278784, 'steps': 17076, 'loss/train': 1.7204302549362183} -11/06/2021 23:39:47 - INFO - __main__ - Step 17078: {'lr': 0.0004873057764548138, 'samples': 3278976, 'steps': 17077, 'loss/train': 1.879388689994812} -11/06/2021 23:39:48 - INFO - __main__ - Step 17079: {'lr': 0.00048730410687988237, 'samples': 3279168, 'steps': 17078, 'loss/train': 1.2664668560028076} -11/06/2021 23:39:48 - INFO - __main__ - Step 17080: {'lr': 0.00048730243719802535, 'samples': 3279360, 'steps': 17079, 'loss/train': 1.9700970649719238} -11/06/2021 23:39:48 - INFO - __main__ - Step 17081: {'lr': 0.00048730076740924355, 'samples': 3279552, 'steps': 17080, 'loss/train': 1.0473175048828125} -11/06/2021 23:39:49 - INFO - __main__ - Step 17082: {'lr': 0.0004872990975135377, 'samples': 3279744, 'steps': 17081, 'loss/train': 1.3515214920043945} -11/06/2021 23:39:49 - INFO - __main__ - Step 17083: {'lr': 0.0004872974275109085, 'samples': 3279936, 'steps': 17082, 'loss/train': 1.463983178138733} -11/06/2021 23:39:50 - INFO - __main__ - Step 17084: {'lr': 0.00048729575740135675, 'samples': 3280128, 'steps': 17083, 'loss/train': 1.5484230518341064} -11/06/2021 23:39:51 - INFO - __main__ - Step 17085: {'lr': 0.0004872940871848832, 'samples': 3280320, 'steps': 17084, 'loss/train': 2.2791638374328613} -11/06/2021 23:39:51 - INFO - __main__ - Step 17086: {'lr': 0.00048729241686148864, 'samples': 3280512, 'steps': 17085, 'loss/train': 1.8296653032302856} -11/06/2021 23:39:51 - INFO - __main__ - Step 17087: {'lr': 0.0004872907464311737, 'samples': 3280704, 'steps': 17086, 'loss/train': 1.4752380847930908} -11/06/2021 23:39:52 - INFO - __main__ - Step 17088: {'lr': 0.0004872890758939392, 'samples': 3280896, 'steps': 17087, 'loss/train': 1.206477165222168} -11/06/2021 23:39:53 - INFO - __main__ - Step 17089: {'lr': 0.00048728740524978597, 'samples': 3281088, 'steps': 17088, 'loss/train': 1.7436742782592773} -11/06/2021 23:39:53 - INFO - __main__ - Step 17090: {'lr': 0.00048728573449871473, 'samples': 3281280, 'steps': 17089, 'loss/train': 1.3805345296859741} -11/06/2021 23:39:53 - INFO - __main__ - Step 17091: {'lr': 0.0004872840636407261, 'samples': 3281472, 'steps': 17090, 'loss/train': 1.2210899591445923} -11/06/2021 23:39:54 - INFO - __main__ - Step 17092: {'lr': 0.00048728239267582096, 'samples': 3281664, 'steps': 17091, 'loss/train': 1.1213079690933228} -11/06/2021 23:39:54 - INFO - __main__ - Step 17093: {'lr': 0.00048728072160400006, 'samples': 3281856, 'steps': 17092, 'loss/train': 1.8094351291656494} -11/06/2021 23:39:55 - INFO - __main__ - Step 17094: {'lr': 0.0004872790504252641, 'samples': 3282048, 'steps': 17093, 'loss/train': 2.475142240524292} -11/06/2021 23:39:55 - INFO - __main__ - Step 17095: {'lr': 0.0004872773791396139, 'samples': 3282240, 'steps': 17094, 'loss/train': 1.4693809747695923} -11/06/2021 23:39:56 - INFO - __main__ - Step 17096: {'lr': 0.0004872757077470502, 'samples': 3282432, 'steps': 17095, 'loss/train': 2.0089285373687744} -11/06/2021 23:39:56 - INFO - __main__ - Step 17097: {'lr': 0.0004872740362475737, 'samples': 3282624, 'steps': 17096, 'loss/train': 1.8510346412658691} -11/06/2021 23:39:57 - INFO - __main__ - Step 17098: {'lr': 0.0004872723646411851, 'samples': 3282816, 'steps': 17097, 'loss/train': 1.2082724571228027} -11/06/2021 23:39:58 - INFO - __main__ - Step 17099: {'lr': 0.0004872706929278853, 'samples': 3283008, 'steps': 17098, 'loss/train': 1.7203577756881714} -11/06/2021 23:39:58 - INFO - __main__ - Step 17100: {'lr': 0.000487269021107675, 'samples': 3283200, 'steps': 17099, 'loss/train': 1.7792285680770874} -11/06/2021 23:39:59 - INFO - __main__ - Step 17101: {'lr': 0.0004872673491805549, 'samples': 3283392, 'steps': 17100, 'loss/train': 1.7158050537109375} -11/06/2021 23:39:59 - INFO - __main__ - Step 17102: {'lr': 0.0004872656771465259, 'samples': 3283584, 'steps': 17101, 'loss/train': 1.6568636894226074} -11/06/2021 23:39:59 - INFO - __main__ - Step 17103: {'lr': 0.00048726400500558856, 'samples': 3283776, 'steps': 17102, 'loss/train': 1.9495559930801392} -11/06/2021 23:40:00 - INFO - __main__ - Step 17104: {'lr': 0.0004872623327577437, 'samples': 3283968, 'steps': 17103, 'loss/train': 1.5772558450698853} -11/06/2021 23:40:01 - INFO - __main__ - Step 17105: {'lr': 0.0004872606604029921, 'samples': 3284160, 'steps': 17104, 'loss/train': 0.8391998410224915} -11/06/2021 23:40:01 - INFO - __main__ - Step 17106: {'lr': 0.00048725898794133455, 'samples': 3284352, 'steps': 17105, 'loss/train': 1.9225443601608276} -11/06/2021 23:40:01 - INFO - __main__ - Step 17107: {'lr': 0.00048725731537277173, 'samples': 3284544, 'steps': 17106, 'loss/train': 1.894831657409668} -11/06/2021 23:40:02 - INFO - __main__ - Step 17108: {'lr': 0.0004872556426973044, 'samples': 3284736, 'steps': 17107, 'loss/train': 1.5045108795166016} -11/06/2021 23:40:02 - INFO - __main__ - Step 17109: {'lr': 0.0004872539699149334, 'samples': 3284928, 'steps': 17108, 'loss/train': 1.9141845703125} -11/06/2021 23:40:03 - INFO - __main__ - Step 17110: {'lr': 0.0004872522970256594, 'samples': 3285120, 'steps': 17109, 'loss/train': 1.4091365337371826} -11/06/2021 23:40:03 - INFO - __main__ - Step 17111: {'lr': 0.00048725062402948314, 'samples': 3285312, 'steps': 17110, 'loss/train': 1.5130109786987305} -11/06/2021 23:40:04 - INFO - __main__ - Step 17112: {'lr': 0.00048724895092640546, 'samples': 3285504, 'steps': 17111, 'loss/train': 1.1645400524139404} -11/06/2021 23:40:04 - INFO - __main__ - Step 17113: {'lr': 0.00048724727771642706, 'samples': 3285696, 'steps': 17112, 'loss/train': 1.6924716234207153} -11/06/2021 23:40:05 - INFO - __main__ - Step 17114: {'lr': 0.00048724560439954867, 'samples': 3285888, 'steps': 17113, 'loss/train': 1.7980364561080933} -11/06/2021 23:40:06 - INFO - __main__ - Step 17115: {'lr': 0.00048724393097577113, 'samples': 3286080, 'steps': 17114, 'loss/train': 1.552628517150879} -11/06/2021 23:40:06 - INFO - __main__ - Step 17116: {'lr': 0.0004872422574450951, 'samples': 3286272, 'steps': 17115, 'loss/train': 1.8925765752792358} -11/06/2021 23:40:06 - INFO - __main__ - Step 17117: {'lr': 0.0004872405838075213, 'samples': 3286464, 'steps': 17116, 'loss/train': 1.6938984394073486} -11/06/2021 23:40:07 - INFO - __main__ - Step 17118: {'lr': 0.00048723891006305066, 'samples': 3286656, 'steps': 17117, 'loss/train': 1.3686352968215942} -11/06/2021 23:40:07 - INFO - __main__ - Step 17119: {'lr': 0.0004872372362116838, 'samples': 3286848, 'steps': 17118, 'loss/train': 1.6649097204208374} -11/06/2021 23:40:08 - INFO - __main__ - Step 17120: {'lr': 0.0004872355622534215, 'samples': 3287040, 'steps': 17119, 'loss/train': 0.5623729825019836} -11/06/2021 23:40:09 - INFO - __main__ - Step 17121: {'lr': 0.0004872338881882644, 'samples': 3287232, 'steps': 17120, 'loss/train': 1.4882264137268066} -11/06/2021 23:40:09 - INFO - __main__ - Step 17122: {'lr': 0.00048723221401621354, 'samples': 3287424, 'steps': 17121, 'loss/train': 2.0259337425231934} -11/06/2021 23:40:09 - INFO - __main__ - Step 17123: {'lr': 0.0004872305397372694, 'samples': 3287616, 'steps': 17122, 'loss/train': 1.6014872789382935} -11/06/2021 23:40:10 - INFO - __main__ - Step 17124: {'lr': 0.0004872288653514329, 'samples': 3287808, 'steps': 17123, 'loss/train': 1.8238401412963867} -11/06/2021 23:40:10 - INFO - __main__ - Step 17125: {'lr': 0.0004872271908587047, 'samples': 3288000, 'steps': 17124, 'loss/train': 1.2414836883544922} -11/06/2021 23:40:11 - INFO - __main__ - Step 17126: {'lr': 0.0004872255162590856, 'samples': 3288192, 'steps': 17125, 'loss/train': 1.3290209770202637} -11/06/2021 23:40:11 - INFO - __main__ - Step 17127: {'lr': 0.0004872238415525764, 'samples': 3288384, 'steps': 17126, 'loss/train': 1.592273235321045} -11/06/2021 23:40:12 - INFO - __main__ - Step 17128: {'lr': 0.0004872221667391777, 'samples': 3288576, 'steps': 17127, 'loss/train': 1.5573184490203857} -11/06/2021 23:40:12 - INFO - __main__ - Step 17129: {'lr': 0.00048722049181889037, 'samples': 3288768, 'steps': 17128, 'loss/train': 1.9449520111083984} -11/06/2021 23:40:12 - INFO - __main__ - Step 17130: {'lr': 0.0004872188167917152, 'samples': 3288960, 'steps': 17129, 'loss/train': 2.0175869464874268} -11/06/2021 23:40:13 - INFO - __main__ - Step 17131: {'lr': 0.00048721714165765286, 'samples': 3289152, 'steps': 17130, 'loss/train': 0.9070045948028564} -11/06/2021 23:40:14 - INFO - __main__ - Step 17132: {'lr': 0.00048721546641670413, 'samples': 3289344, 'steps': 17131, 'loss/train': 1.587490200996399} -11/06/2021 23:40:14 - INFO - __main__ - Step 17133: {'lr': 0.00048721379106886976, 'samples': 3289536, 'steps': 17132, 'loss/train': 1.65146005153656} -11/06/2021 23:40:14 - INFO - __main__ - Step 17134: {'lr': 0.0004872121156141506, 'samples': 3289728, 'steps': 17133, 'loss/train': 1.6445494890213013} -11/06/2021 23:40:15 - INFO - __main__ - Step 17135: {'lr': 0.0004872104400525472, 'samples': 3289920, 'steps': 17134, 'loss/train': 1.1517709493637085} -11/06/2021 23:40:16 - INFO - __main__ - Step 17136: {'lr': 0.0004872087643840605, 'samples': 3290112, 'steps': 17135, 'loss/train': 1.2968612909317017} -11/06/2021 23:40:16 - INFO - __main__ - Step 17137: {'lr': 0.00048720708860869116, 'samples': 3290304, 'steps': 17136, 'loss/train': 1.8563275337219238} -11/06/2021 23:40:17 - INFO - __main__ - Step 17138: {'lr': 0.00048720541272644004, 'samples': 3290496, 'steps': 17137, 'loss/train': 1.7054293155670166} -11/06/2021 23:40:17 - INFO - __main__ - Step 17139: {'lr': 0.00048720373673730773, 'samples': 3290688, 'steps': 17138, 'loss/train': 1.8172038793563843} -11/06/2021 23:40:17 - INFO - __main__ - Step 17140: {'lr': 0.00048720206064129516, 'samples': 3290880, 'steps': 17139, 'loss/train': 1.6057360172271729} -11/06/2021 23:40:18 - INFO - __main__ - Step 17141: {'lr': 0.0004872003844384029, 'samples': 3291072, 'steps': 17140, 'loss/train': 1.466621994972229} -11/06/2021 23:40:19 - INFO - __main__ - Step 17142: {'lr': 0.0004871987081286319, 'samples': 3291264, 'steps': 17141, 'loss/train': 1.6234965324401855} -11/06/2021 23:40:19 - INFO - __main__ - Step 17143: {'lr': 0.0004871970317119828, 'samples': 3291456, 'steps': 17142, 'loss/train': 0.9775916337966919} -11/06/2021 23:40:20 - INFO - __main__ - Step 17144: {'lr': 0.00048719535518845634, 'samples': 3291648, 'steps': 17143, 'loss/train': 0.35061636567115784} -11/06/2021 23:40:20 - INFO - __main__ - Step 17145: {'lr': 0.0004871936785580533, 'samples': 3291840, 'steps': 17144, 'loss/train': 1.0786106586456299} -11/06/2021 23:40:21 - INFO - __main__ - Step 17146: {'lr': 0.0004871920018207745, 'samples': 3292032, 'steps': 17145, 'loss/train': 1.6169389486312866} -11/06/2021 23:40:22 - INFO - __main__ - Step 17147: {'lr': 0.0004871903249766206, 'samples': 3292224, 'steps': 17146, 'loss/train': 1.4403924942016602} -11/06/2021 23:40:23 - INFO - __main__ - Step 17148: {'lr': 0.0004871886480255925, 'samples': 3292416, 'steps': 17147, 'loss/train': 2.0448710918426514} -11/06/2021 23:40:23 - INFO - __main__ - Step 17149: {'lr': 0.0004871869709676907, 'samples': 3292608, 'steps': 17148, 'loss/train': 1.7501180171966553} -11/06/2021 23:40:23 - INFO - __main__ - Step 17150: {'lr': 0.0004871852938029162, 'samples': 3292800, 'steps': 17149, 'loss/train': 1.0432761907577515} -11/06/2021 23:40:24 - INFO - __main__ - Step 17151: {'lr': 0.00048718361653126975, 'samples': 3292992, 'steps': 17150, 'loss/train': 1.692865252494812} -11/06/2021 23:40:24 - INFO - __main__ - Step 17152: {'lr': 0.0004871819391527519, 'samples': 3293184, 'steps': 17151, 'loss/train': 1.8303561210632324} -11/06/2021 23:40:24 - INFO - __main__ - Step 17153: {'lr': 0.0004871802616673636, 'samples': 3293376, 'steps': 17152, 'loss/train': 1.8023126125335693} -11/06/2021 23:40:25 - INFO - __main__ - Step 17154: {'lr': 0.00048717858407510545, 'samples': 3293568, 'steps': 17153, 'loss/train': 1.8174192905426025} -11/06/2021 23:40:26 - INFO - __main__ - Step 17155: {'lr': 0.0004871769063759783, 'samples': 3293760, 'steps': 17154, 'loss/train': 0.8695468306541443} -11/06/2021 23:40:26 - INFO - __main__ - Step 17156: {'lr': 0.000487175228569983, 'samples': 3293952, 'steps': 17155, 'loss/train': 1.9590970277786255} -11/06/2021 23:40:26 - INFO - __main__ - Step 17157: {'lr': 0.0004871735506571201, 'samples': 3294144, 'steps': 17156, 'loss/train': 1.572733759880066} -11/06/2021 23:40:27 - INFO - __main__ - Step 17158: {'lr': 0.00048717187263739046, 'samples': 3294336, 'steps': 17157, 'loss/train': 2.0862021446228027} -11/06/2021 23:40:28 - INFO - __main__ - Step 17159: {'lr': 0.00048717019451079493, 'samples': 3294528, 'steps': 17158, 'loss/train': 1.4682984352111816} -11/06/2021 23:40:28 - INFO - __main__ - Step 17160: {'lr': 0.00048716851627733404, 'samples': 3294720, 'steps': 17159, 'loss/train': 1.938184142112732} -11/06/2021 23:40:28 - INFO - __main__ - Step 17161: {'lr': 0.00048716683793700876, 'samples': 3294912, 'steps': 17160, 'loss/train': 1.7588785886764526} -11/06/2021 23:40:29 - INFO - __main__ - Step 17162: {'lr': 0.00048716515948981975, 'samples': 3295104, 'steps': 17161, 'loss/train': 1.657987117767334} -11/06/2021 23:40:29 - INFO - __main__ - Step 17163: {'lr': 0.0004871634809357678, 'samples': 3295296, 'steps': 17162, 'loss/train': 2.02968430519104} -11/06/2021 23:40:29 - INFO - __main__ - Step 17164: {'lr': 0.00048716180227485365, 'samples': 3295488, 'steps': 17163, 'loss/train': 1.6158461570739746} -11/06/2021 23:40:31 - INFO - __main__ - Step 17165: {'lr': 0.000487160123507078, 'samples': 3295680, 'steps': 17164, 'loss/train': 1.3516970872879028} -11/06/2021 23:40:31 - INFO - __main__ - Step 17166: {'lr': 0.00048715844463244166, 'samples': 3295872, 'steps': 17165, 'loss/train': 1.0224634408950806} -11/06/2021 23:40:32 - INFO - __main__ - Step 17167: {'lr': 0.0004871567656509454, 'samples': 3296064, 'steps': 17166, 'loss/train': 1.6286890506744385} -11/06/2021 23:40:32 - INFO - __main__ - Step 17168: {'lr': 0.00048715508656259, 'samples': 3296256, 'steps': 17167, 'loss/train': 1.054592490196228} -11/06/2021 23:40:32 - INFO - __main__ - Step 17169: {'lr': 0.00048715340736737615, 'samples': 3296448, 'steps': 17168, 'loss/train': 1.4753445386886597} -11/06/2021 23:40:33 - INFO - __main__ - Step 17170: {'lr': 0.0004871517280653046, 'samples': 3296640, 'steps': 17169, 'loss/train': 0.6704396605491638} -11/06/2021 23:40:34 - INFO - __main__ - Step 17171: {'lr': 0.0004871500486563761, 'samples': 3296832, 'steps': 17170, 'loss/train': 1.4900462627410889} -11/06/2021 23:40:34 - INFO - __main__ - Step 17172: {'lr': 0.0004871483691405916, 'samples': 3297024, 'steps': 17171, 'loss/train': 1.7745710611343384} -11/06/2021 23:40:34 - INFO - __main__ - Step 17173: {'lr': 0.0004871466895179516, 'samples': 3297216, 'steps': 17172, 'loss/train': 1.7504075765609741} -11/06/2021 23:40:35 - INFO - __main__ - Step 17174: {'lr': 0.000487145009788457, 'samples': 3297408, 'steps': 17173, 'loss/train': 1.5627763271331787} -11/06/2021 23:40:36 - INFO - __main__ - Step 17175: {'lr': 0.0004871433299521085, 'samples': 3297600, 'steps': 17174, 'loss/train': 1.7707425355911255} -11/06/2021 23:40:36 - INFO - __main__ - Step 17176: {'lr': 0.00048714165000890685, 'samples': 3297792, 'steps': 17175, 'loss/train': 1.890425682067871} -11/06/2021 23:40:36 - INFO - __main__ - Step 17177: {'lr': 0.00048713996995885286, 'samples': 3297984, 'steps': 17176, 'loss/train': 1.6484146118164062} -11/06/2021 23:40:37 - INFO - __main__ - Step 17178: {'lr': 0.0004871382898019472, 'samples': 3298176, 'steps': 17177, 'loss/train': 1.687612771987915} -11/06/2021 23:40:37 - INFO - __main__ - Step 17179: {'lr': 0.0004871366095381908, 'samples': 3298368, 'steps': 17178, 'loss/train': 1.811246633529663} -11/06/2021 23:40:37 - INFO - __main__ - Step 17180: {'lr': 0.00048713492916758425, 'samples': 3298560, 'steps': 17179, 'loss/train': 1.000144124031067} -11/06/2021 23:40:39 - INFO - __main__ - Step 17181: {'lr': 0.00048713324869012833, 'samples': 3298752, 'steps': 17180, 'loss/train': 1.4316315650939941} -11/06/2021 23:40:39 - INFO - __main__ - Step 17182: {'lr': 0.0004871315681058238, 'samples': 3298944, 'steps': 17181, 'loss/train': 1.5694489479064941} -11/06/2021 23:40:39 - INFO - __main__ - Step 17183: {'lr': 0.0004871298874146716, 'samples': 3299136, 'steps': 17182, 'loss/train': 1.7600518465042114} -11/06/2021 23:40:40 - INFO - __main__ - Step 17184: {'lr': 0.00048712820661667215, 'samples': 3299328, 'steps': 17183, 'loss/train': 1.9780511856079102} -11/06/2021 23:40:40 - INFO - __main__ - Step 17185: {'lr': 0.0004871265257118265, 'samples': 3299520, 'steps': 17184, 'loss/train': 1.7205005884170532} -11/06/2021 23:40:41 - INFO - __main__ - Step 17186: {'lr': 0.0004871248447001352, 'samples': 3299712, 'steps': 17185, 'loss/train': 1.8531748056411743} -11/06/2021 23:40:41 - INFO - __main__ - Step 17187: {'lr': 0.0004871231635815992, 'samples': 3299904, 'steps': 17186, 'loss/train': 1.939202904701233} -11/06/2021 23:40:42 - INFO - __main__ - Step 17188: {'lr': 0.0004871214823562191, 'samples': 3300096, 'steps': 17187, 'loss/train': 1.5620630979537964} -11/06/2021 23:40:42 - INFO - __main__ - Step 17189: {'lr': 0.0004871198010239958, 'samples': 3300288, 'steps': 17188, 'loss/train': 1.8698750734329224} -11/06/2021 23:40:42 - INFO - __main__ - Step 17190: {'lr': 0.0004871181195849299, 'samples': 3300480, 'steps': 17189, 'loss/train': 1.9810320138931274} -11/06/2021 23:40:43 - INFO - __main__ - Step 17191: {'lr': 0.00048711643803902227, 'samples': 3300672, 'steps': 17190, 'loss/train': 1.5719085931777954} -11/06/2021 23:40:44 - INFO - __main__ - Step 17192: {'lr': 0.00048711475638627363, 'samples': 3300864, 'steps': 17191, 'loss/train': 2.2363479137420654} -11/06/2021 23:40:44 - INFO - __main__ - Step 17193: {'lr': 0.0004871130746266847, 'samples': 3301056, 'steps': 17192, 'loss/train': 1.8176665306091309} -11/06/2021 23:40:45 - INFO - __main__ - Step 17194: {'lr': 0.00048711139276025626, 'samples': 3301248, 'steps': 17193, 'loss/train': 1.7995778322219849} -11/06/2021 23:40:45 - INFO - __main__ - Step 17195: {'lr': 0.00048710971078698916, 'samples': 3301440, 'steps': 17194, 'loss/train': 1.1480748653411865} -11/06/2021 23:40:46 - INFO - __main__ - Step 17196: {'lr': 0.0004871080287068841, 'samples': 3301632, 'steps': 17195, 'loss/train': 2.0318057537078857} -11/06/2021 23:40:46 - INFO - __main__ - Step 17197: {'lr': 0.00048710634651994176, 'samples': 3301824, 'steps': 17196, 'loss/train': 1.7191940546035767} -11/06/2021 23:40:47 - INFO - __main__ - Step 17198: {'lr': 0.0004871046642261629, 'samples': 3302016, 'steps': 17197, 'loss/train': 1.612969994544983} -11/06/2021 23:40:47 - INFO - __main__ - Step 17199: {'lr': 0.0004871029818255485, 'samples': 3302208, 'steps': 17198, 'loss/train': 2.0721495151519775} -11/06/2021 23:40:47 - INFO - __main__ - Step 17200: {'lr': 0.0004871012993180991, 'samples': 3302400, 'steps': 17199, 'loss/train': 1.4163411855697632} -11/06/2021 23:40:48 - INFO - __main__ - Step 17201: {'lr': 0.0004870996167038154, 'samples': 3302592, 'steps': 17200, 'loss/train': 1.7400089502334595} -11/06/2021 23:40:49 - INFO - __main__ - Step 17202: {'lr': 0.0004870979339826984, 'samples': 3302784, 'steps': 17201, 'loss/train': 2.5178351402282715} -11/06/2021 23:40:49 - INFO - __main__ - Step 17203: {'lr': 0.00048709625115474865, 'samples': 3302976, 'steps': 17202, 'loss/train': 1.433853030204773} -11/06/2021 23:40:49 - INFO - __main__ - Step 17204: {'lr': 0.00048709456821996705, 'samples': 3303168, 'steps': 17203, 'loss/train': 2.0640363693237305} -11/06/2021 23:40:50 - INFO - __main__ - Step 17205: {'lr': 0.0004870928851783543, 'samples': 3303360, 'steps': 17204, 'loss/train': 1.7238097190856934} -11/06/2021 23:40:50 - INFO - __main__ - Step 17206: {'lr': 0.00048709120202991107, 'samples': 3303552, 'steps': 17205, 'loss/train': 1.600435733795166} -11/06/2021 23:40:51 - INFO - __main__ - Step 17207: {'lr': 0.0004870895187746383, 'samples': 3303744, 'steps': 17206, 'loss/train': 0.9599513411521912} -11/06/2021 23:40:51 - INFO - __main__ - Step 17208: {'lr': 0.00048708783541253655, 'samples': 3303936, 'steps': 17207, 'loss/train': 1.8640570640563965} -11/06/2021 23:40:52 - INFO - __main__ - Step 17209: {'lr': 0.00048708615194360675, 'samples': 3304128, 'steps': 17208, 'loss/train': 1.4890220165252686} -11/06/2021 23:40:52 - INFO - __main__ - Step 17210: {'lr': 0.0004870844683678496, 'samples': 3304320, 'steps': 17209, 'loss/train': 1.492447018623352} -11/06/2021 23:40:52 - INFO - __main__ - Step 17211: {'lr': 0.0004870827846852658, 'samples': 3304512, 'steps': 17210, 'loss/train': 1.8645015954971313} -11/06/2021 23:40:53 - INFO - __main__ - Step 17212: {'lr': 0.00048708110089585617, 'samples': 3304704, 'steps': 17211, 'loss/train': 1.7372667789459229} -11/06/2021 23:40:54 - INFO - __main__ - Step 17213: {'lr': 0.00048707941699962143, 'samples': 3304896, 'steps': 17212, 'loss/train': 2.233567953109741} -11/06/2021 23:40:54 - INFO - __main__ - Step 17214: {'lr': 0.0004870777329965624, 'samples': 3305088, 'steps': 17213, 'loss/train': 1.0954010486602783} -11/06/2021 23:40:54 - INFO - __main__ - Step 17215: {'lr': 0.00048707604888667983, 'samples': 3305280, 'steps': 17214, 'loss/train': 0.9866694211959839} -11/06/2021 23:40:55 - INFO - __main__ - Step 17216: {'lr': 0.0004870743646699744, 'samples': 3305472, 'steps': 17215, 'loss/train': 2.072942018508911} -11/06/2021 23:40:56 - INFO - __main__ - Step 17217: {'lr': 0.0004870726803464469, 'samples': 3305664, 'steps': 17216, 'loss/train': 1.3955477476119995} -11/06/2021 23:40:56 - INFO - __main__ - Step 17218: {'lr': 0.00048707099591609816, 'samples': 3305856, 'steps': 17217, 'loss/train': 1.746077060699463} -11/06/2021 23:40:57 - INFO - __main__ - Step 17219: {'lr': 0.0004870693113789289, 'samples': 3306048, 'steps': 17218, 'loss/train': 1.7401597499847412} -11/06/2021 23:40:57 - INFO - __main__ - Step 17220: {'lr': 0.00048706762673493987, 'samples': 3306240, 'steps': 17219, 'loss/train': 1.4887704849243164} -11/06/2021 23:40:57 - INFO - __main__ - Step 17221: {'lr': 0.00048706594198413177, 'samples': 3306432, 'steps': 17220, 'loss/train': 1.8607337474822998} -11/06/2021 23:40:58 - INFO - __main__ - Step 17222: {'lr': 0.0004870642571265054, 'samples': 3306624, 'steps': 17221, 'loss/train': 1.514723539352417} -11/06/2021 23:40:59 - INFO - __main__ - Step 17223: {'lr': 0.0004870625721620616, 'samples': 3306816, 'steps': 17222, 'loss/train': 1.485309362411499} -11/06/2021 23:40:59 - INFO - __main__ - Step 17224: {'lr': 0.00048706088709080103, 'samples': 3307008, 'steps': 17223, 'loss/train': 1.781569004058838} -11/06/2021 23:40:59 - INFO - __main__ - Step 17225: {'lr': 0.00048705920191272447, 'samples': 3307200, 'steps': 17224, 'loss/train': 1.8365702629089355} -11/06/2021 23:41:00 - INFO - __main__ - Step 17226: {'lr': 0.0004870575166278327, 'samples': 3307392, 'steps': 17225, 'loss/train': 1.4333207607269287} -11/06/2021 23:41:00 - INFO - __main__ - Step 17227: {'lr': 0.0004870558312361265, 'samples': 3307584, 'steps': 17226, 'loss/train': 1.2213234901428223} -11/06/2021 23:41:01 - INFO - __main__ - Step 17228: {'lr': 0.0004870541457376066, 'samples': 3307776, 'steps': 17227, 'loss/train': 1.2647724151611328} -11/06/2021 23:41:01 - INFO - __main__ - Step 17229: {'lr': 0.0004870524601322737, 'samples': 3307968, 'steps': 17228, 'loss/train': 1.4165525436401367} -11/06/2021 23:41:02 - INFO - __main__ - Step 17230: {'lr': 0.00048705077442012866, 'samples': 3308160, 'steps': 17229, 'loss/train': 1.423817753791809} -11/06/2021 23:41:02 - INFO - __main__ - Step 17231: {'lr': 0.0004870490886011723, 'samples': 3308352, 'steps': 17230, 'loss/train': 1.821036696434021} -11/06/2021 23:41:02 - INFO - __main__ - Step 17232: {'lr': 0.0004870474026754051, 'samples': 3308544, 'steps': 17231, 'loss/train': 1.5790460109710693} -11/06/2021 23:41:04 - INFO - __main__ - Step 17233: {'lr': 0.00048704571664282806, 'samples': 3308736, 'steps': 17232, 'loss/train': 2.0383269786834717} -11/06/2021 23:41:04 - INFO - __main__ - Step 17234: {'lr': 0.0004870440305034419, 'samples': 3308928, 'steps': 17233, 'loss/train': 1.1566420793533325} -11/06/2021 23:41:04 - INFO - __main__ - Step 17235: {'lr': 0.00048704234425724736, 'samples': 3309120, 'steps': 17234, 'loss/train': 1.1532448530197144} -11/06/2021 23:41:05 - INFO - __main__ - Step 17236: {'lr': 0.0004870406579042452, 'samples': 3309312, 'steps': 17235, 'loss/train': 1.7704163789749146} -11/06/2021 23:41:05 - INFO - __main__ - Step 17237: {'lr': 0.00048703897144443615, 'samples': 3309504, 'steps': 17236, 'loss/train': 1.2826061248779297} -11/06/2021 23:41:05 - INFO - __main__ - Step 17238: {'lr': 0.000487037284877821, 'samples': 3309696, 'steps': 17237, 'loss/train': 1.5143266916275024} -11/06/2021 23:41:06 - INFO - __main__ - Step 17239: {'lr': 0.00048703559820440054, 'samples': 3309888, 'steps': 17238, 'loss/train': 1.221914291381836} -11/06/2021 23:41:07 - INFO - __main__ - Step 17240: {'lr': 0.0004870339114241755, 'samples': 3310080, 'steps': 17239, 'loss/train': 1.3863588571548462} -11/06/2021 23:41:07 - INFO - __main__ - Step 17241: {'lr': 0.00048703222453714656, 'samples': 3310272, 'steps': 17240, 'loss/train': 1.3659840822219849} -11/06/2021 23:41:07 - INFO - __main__ - Step 17242: {'lr': 0.0004870305375433146, 'samples': 3310464, 'steps': 17241, 'loss/train': 1.8747817277908325} -11/06/2021 23:41:08 - INFO - __main__ - Step 17243: {'lr': 0.0004870288504426804, 'samples': 3310656, 'steps': 17242, 'loss/train': 1.3708194494247437} -11/06/2021 23:41:09 - INFO - __main__ - Step 17244: {'lr': 0.0004870271632352446, 'samples': 3310848, 'steps': 17243, 'loss/train': 1.7464226484298706} -11/06/2021 23:41:09 - INFO - __main__ - Step 17245: {'lr': 0.000487025475921008, 'samples': 3311040, 'steps': 17244, 'loss/train': 1.4908338785171509} -11/06/2021 23:41:10 - INFO - __main__ - Step 17246: {'lr': 0.00048702378849997143, 'samples': 3311232, 'steps': 17245, 'loss/train': 1.377392292022705} -11/06/2021 23:41:10 - INFO - __main__ - Step 17247: {'lr': 0.0004870221009721356, 'samples': 3311424, 'steps': 17246, 'loss/train': 2.0922882556915283} -11/06/2021 23:41:10 - INFO - __main__ - Step 17248: {'lr': 0.00048702041333750117, 'samples': 3311616, 'steps': 17247, 'loss/train': 1.4370702505111694} -11/06/2021 23:41:11 - INFO - __main__ - Step 17249: {'lr': 0.0004870187255960691, 'samples': 3311808, 'steps': 17248, 'loss/train': 2.13187313079834} -11/06/2021 23:41:12 - INFO - __main__ - Step 17250: {'lr': 0.00048701703774784, 'samples': 3312000, 'steps': 17249, 'loss/train': 0.7868022918701172} -11/06/2021 23:41:12 - INFO - __main__ - Step 17251: {'lr': 0.0004870153497928147, 'samples': 3312192, 'steps': 17250, 'loss/train': 1.8932836055755615} -11/06/2021 23:41:13 - INFO - __main__ - Step 17252: {'lr': 0.00048701366173099396, 'samples': 3312384, 'steps': 17251, 'loss/train': 2.3235738277435303} -11/06/2021 23:41:13 - INFO - __main__ - Step 17253: {'lr': 0.0004870119735623785, 'samples': 3312576, 'steps': 17252, 'loss/train': 1.8664605617523193} -11/06/2021 23:41:13 - INFO - __main__ - Step 17254: {'lr': 0.00048701028528696914, 'samples': 3312768, 'steps': 17253, 'loss/train': 1.6442269086837769} -11/06/2021 23:41:14 - INFO - __main__ - Step 17255: {'lr': 0.0004870085969047665, 'samples': 3312960, 'steps': 17254, 'loss/train': 1.5786818265914917} -11/06/2021 23:41:15 - INFO - __main__ - Step 17256: {'lr': 0.00048700690841577154, 'samples': 3313152, 'steps': 17255, 'loss/train': 1.9361462593078613} -11/06/2021 23:41:15 - INFO - __main__ - Step 17257: {'lr': 0.0004870052198199849, 'samples': 3313344, 'steps': 17256, 'loss/train': 1.8143517971038818} -11/06/2021 23:41:15 - INFO - __main__ - Step 17258: {'lr': 0.00048700353111740734, 'samples': 3313536, 'steps': 17257, 'loss/train': 1.4683324098587036} -11/06/2021 23:41:16 - INFO - __main__ - Step 17259: {'lr': 0.0004870018423080397, 'samples': 3313728, 'steps': 17258, 'loss/train': 2.0775022506713867} -11/06/2021 23:41:17 - INFO - __main__ - Step 17260: {'lr': 0.00048700015339188266, 'samples': 3313920, 'steps': 17259, 'loss/train': 1.94370698928833} -11/06/2021 23:41:17 - INFO - __main__ - Step 17261: {'lr': 0.0004869984643689369, 'samples': 3314112, 'steps': 17260, 'loss/train': 2.0206258296966553} -11/06/2021 23:41:18 - INFO - __main__ - Step 17262: {'lr': 0.00048699677523920346, 'samples': 3314304, 'steps': 17261, 'loss/train': 1.3398237228393555} -11/06/2021 23:41:18 - INFO - __main__ - Step 17263: {'lr': 0.00048699508600268284, 'samples': 3314496, 'steps': 17262, 'loss/train': 1.1747856140136719} -11/06/2021 23:41:18 - INFO - __main__ - Step 17264: {'lr': 0.00048699339665937594, 'samples': 3314688, 'steps': 17263, 'loss/train': 1.7770746946334839} -11/06/2021 23:41:19 - INFO - __main__ - Step 17265: {'lr': 0.0004869917072092834, 'samples': 3314880, 'steps': 17264, 'loss/train': 1.789361596107483} -11/06/2021 23:41:20 - INFO - __main__ - Step 17266: {'lr': 0.00048699001765240615, 'samples': 3315072, 'steps': 17265, 'loss/train': 1.4973350763320923} -11/06/2021 23:41:20 - INFO - __main__ - Step 17267: {'lr': 0.00048698832798874477, 'samples': 3315264, 'steps': 17266, 'loss/train': 1.6333647966384888} -11/06/2021 23:41:20 - INFO - __main__ - Step 17268: {'lr': 0.0004869866382183001, 'samples': 3315456, 'steps': 17267, 'loss/train': 1.2706983089447021} -11/06/2021 23:41:21 - INFO - __main__ - Step 17269: {'lr': 0.00048698494834107297, 'samples': 3315648, 'steps': 17268, 'loss/train': 1.8148884773254395} -11/06/2021 23:41:21 - INFO - __main__ - Step 17270: {'lr': 0.000486983258357064, 'samples': 3315840, 'steps': 17269, 'loss/train': 2.033538341522217} -11/06/2021 23:41:22 - INFO - __main__ - Step 17271: {'lr': 0.00048698156826627414, 'samples': 3316032, 'steps': 17270, 'loss/train': 1.4283595085144043} -11/06/2021 23:41:23 - INFO - __main__ - Step 17272: {'lr': 0.00048697987806870397, 'samples': 3316224, 'steps': 17271, 'loss/train': 1.6567562818527222} -11/06/2021 23:41:23 - INFO - __main__ - Step 17273: {'lr': 0.0004869781877643543, 'samples': 3316416, 'steps': 17272, 'loss/train': 2.0340371131896973} -11/06/2021 23:41:24 - INFO - __main__ - Step 17274: {'lr': 0.000486976497353226, 'samples': 3316608, 'steps': 17273, 'loss/train': 1.683788537979126} -11/06/2021 23:41:24 - INFO - __main__ - Step 17275: {'lr': 0.0004869748068353197, 'samples': 3316800, 'steps': 17274, 'loss/train': 1.2586175203323364} -11/06/2021 23:41:25 - INFO - __main__ - Step 17276: {'lr': 0.00048697311621063625, 'samples': 3316992, 'steps': 17275, 'loss/train': 0.27130571007728577} -11/06/2021 23:41:25 - INFO - __main__ - Step 17277: {'lr': 0.0004869714254791763, 'samples': 3317184, 'steps': 17276, 'loss/train': 1.1046879291534424} -11/06/2021 23:41:26 - INFO - __main__ - Step 17278: {'lr': 0.00048696973464094076, 'samples': 3317376, 'steps': 17277, 'loss/train': 1.5609723329544067} -11/06/2021 23:41:26 - INFO - __main__ - Step 17279: {'lr': 0.00048696804369593023, 'samples': 3317568, 'steps': 17278, 'loss/train': 1.604174017906189} -11/06/2021 23:41:26 - INFO - __main__ - Step 17280: {'lr': 0.0004869663526441456, 'samples': 3317760, 'steps': 17279, 'loss/train': 1.6268011331558228} -11/06/2021 23:41:28 - INFO - __main__ - Step 17281: {'lr': 0.0004869646614855876, 'samples': 3317952, 'steps': 17280, 'loss/train': 2.258241653442383} -11/06/2021 23:41:28 - INFO - __main__ - Step 17282: {'lr': 0.0004869629702202569, 'samples': 3318144, 'steps': 17281, 'loss/train': 1.8233325481414795} -11/06/2021 23:41:28 - INFO - __main__ - Step 17283: {'lr': 0.0004869612788481544, 'samples': 3318336, 'steps': 17282, 'loss/train': 1.6801536083221436} -11/06/2021 23:41:29 - INFO - __main__ - Step 17284: {'lr': 0.00048695958736928084, 'samples': 3318528, 'steps': 17283, 'loss/train': 1.0620797872543335} -11/06/2021 23:41:29 - INFO - __main__ - Step 17285: {'lr': 0.00048695789578363693, 'samples': 3318720, 'steps': 17284, 'loss/train': 2.001478910446167} -11/06/2021 23:41:29 - INFO - __main__ - Step 17286: {'lr': 0.00048695620409122345, 'samples': 3318912, 'steps': 17285, 'loss/train': 1.4987901449203491} -11/06/2021 23:41:30 - INFO - __main__ - Step 17287: {'lr': 0.00048695451229204115, 'samples': 3319104, 'steps': 17286, 'loss/train': 1.8941746950149536} -11/06/2021 23:41:31 - INFO - __main__ - Step 17288: {'lr': 0.0004869528203860908, 'samples': 3319296, 'steps': 17287, 'loss/train': 1.8230624198913574} -11/06/2021 23:41:31 - INFO - __main__ - Step 17289: {'lr': 0.0004869511283733732, 'samples': 3319488, 'steps': 17288, 'loss/train': 2.0317223072052} -11/06/2021 23:41:32 - INFO - __main__ - Step 17290: {'lr': 0.000486949436253889, 'samples': 3319680, 'steps': 17289, 'loss/train': 1.3601343631744385} -11/06/2021 23:41:32 - INFO - __main__ - Step 17291: {'lr': 0.0004869477440276391, 'samples': 3319872, 'steps': 17290, 'loss/train': 1.6629352569580078} -11/06/2021 23:41:33 - INFO - __main__ - Step 17292: {'lr': 0.00048694605169462415, 'samples': 3320064, 'steps': 17291, 'loss/train': 1.6145473718643188} -11/06/2021 23:41:33 - INFO - __main__ - Step 17293: {'lr': 0.00048694435925484506, 'samples': 3320256, 'steps': 17292, 'loss/train': 1.7590662240982056} -11/06/2021 23:41:34 - INFO - __main__ - Step 17294: {'lr': 0.0004869426667083024, 'samples': 3320448, 'steps': 17293, 'loss/train': 1.9693127870559692} -11/06/2021 23:41:34 - INFO - __main__ - Step 17295: {'lr': 0.00048694097405499703, 'samples': 3320640, 'steps': 17294, 'loss/train': 1.6262609958648682} -11/06/2021 23:41:34 - INFO - __main__ - Step 17296: {'lr': 0.0004869392812949298, 'samples': 3320832, 'steps': 17295, 'loss/train': 1.807649850845337} -11/06/2021 23:41:35 - INFO - __main__ - Step 17297: {'lr': 0.00048693758842810133, 'samples': 3321024, 'steps': 17296, 'loss/train': 1.6670494079589844} -11/06/2021 23:41:36 - INFO - __main__ - Step 17298: {'lr': 0.00048693589545451243, 'samples': 3321216, 'steps': 17297, 'loss/train': 1.5862675905227661} -11/06/2021 23:41:36 - INFO - __main__ - Step 17299: {'lr': 0.00048693420237416393, 'samples': 3321408, 'steps': 17298, 'loss/train': 1.3745173215866089} -11/06/2021 23:41:36 - INFO - __main__ - Step 17300: {'lr': 0.00048693250918705643, 'samples': 3321600, 'steps': 17299, 'loss/train': 1.0434212684631348} -11/06/2021 23:41:37 - INFO - __main__ - Step 17301: {'lr': 0.0004869308158931909, 'samples': 3321792, 'steps': 17300, 'loss/train': 1.2677903175354004} -11/06/2021 23:41:37 - INFO - __main__ - Step 17302: {'lr': 0.00048692912249256794, 'samples': 3321984, 'steps': 17301, 'loss/train': 1.7817742824554443} -11/06/2021 23:41:38 - INFO - __main__ - Step 17303: {'lr': 0.00048692742898518836, 'samples': 3322176, 'steps': 17302, 'loss/train': 0.8955352306365967} -11/06/2021 23:41:38 - INFO - __main__ - Step 17304: {'lr': 0.000486925735371053, 'samples': 3322368, 'steps': 17303, 'loss/train': 1.3537814617156982} -11/06/2021 23:41:39 - INFO - __main__ - Step 17305: {'lr': 0.00048692404165016256, 'samples': 3322560, 'steps': 17304, 'loss/train': 1.636925458908081} -11/06/2021 23:41:39 - INFO - __main__ - Step 17306: {'lr': 0.0004869223478225178, 'samples': 3322752, 'steps': 17305, 'loss/train': 1.4810558557510376} -11/06/2021 23:41:39 - INFO - __main__ - Step 17307: {'lr': 0.00048692065388811944, 'samples': 3322944, 'steps': 17306, 'loss/train': 2.2091891765594482} -11/06/2021 23:41:40 - INFO - __main__ - Step 17308: {'lr': 0.0004869189598469683, 'samples': 3323136, 'steps': 17307, 'loss/train': 1.5620085000991821} -11/06/2021 23:41:41 - INFO - __main__ - Step 17309: {'lr': 0.00048691726569906514, 'samples': 3323328, 'steps': 17308, 'loss/train': 1.429172158241272} -11/06/2021 23:41:41 - INFO - __main__ - Step 17310: {'lr': 0.0004869155714444107, 'samples': 3323520, 'steps': 17309, 'loss/train': 1.6215598583221436} -11/06/2021 23:41:42 - INFO - __main__ - Step 17311: {'lr': 0.00048691387708300584, 'samples': 3323712, 'steps': 17310, 'loss/train': 2.614412307739258} -11/06/2021 23:41:42 - INFO - __main__ - Step 17312: {'lr': 0.00048691218261485113, 'samples': 3323904, 'steps': 17311, 'loss/train': 1.9944758415222168} -11/06/2021 23:41:43 - INFO - __main__ - Step 17313: {'lr': 0.00048691048803994755, 'samples': 3324096, 'steps': 17312, 'loss/train': 1.879599928855896} -11/06/2021 23:41:43 - INFO - __main__ - Step 17314: {'lr': 0.00048690879335829565, 'samples': 3324288, 'steps': 17313, 'loss/train': 1.1751701831817627} -11/06/2021 23:41:44 - INFO - __main__ - Step 17315: {'lr': 0.00048690709856989635, 'samples': 3324480, 'steps': 17314, 'loss/train': 2.111276388168335} -11/06/2021 23:41:44 - INFO - __main__ - Step 17316: {'lr': 0.00048690540367475046, 'samples': 3324672, 'steps': 17315, 'loss/train': 1.5609761476516724} -11/06/2021 23:41:45 - INFO - __main__ - Step 17317: {'lr': 0.00048690370867285847, 'samples': 3324864, 'steps': 17316, 'loss/train': 1.1299504041671753} -11/06/2021 23:41:45 - INFO - __main__ - Step 17318: {'lr': 0.00048690201356422146, 'samples': 3325056, 'steps': 17317, 'loss/train': 2.0143861770629883} -11/06/2021 23:41:46 - INFO - __main__ - Step 17319: {'lr': 0.00048690031834884004, 'samples': 3325248, 'steps': 17318, 'loss/train': 1.9749722480773926} -11/06/2021 23:41:46 - INFO - __main__ - Step 17320: {'lr': 0.00048689862302671495, 'samples': 3325440, 'steps': 17319, 'loss/train': 1.8871047496795654} -11/06/2021 23:41:47 - INFO - __main__ - Step 17321: {'lr': 0.000486896927597847, 'samples': 3325632, 'steps': 17320, 'loss/train': 1.9571623802185059} -11/06/2021 23:41:47 - INFO - __main__ - Step 17322: {'lr': 0.00048689523206223693, 'samples': 3325824, 'steps': 17321, 'loss/train': 1.0182833671569824} -11/06/2021 23:41:47 - INFO - __main__ - Step 17323: {'lr': 0.00048689353641988563, 'samples': 3326016, 'steps': 17322, 'loss/train': 1.170893907546997} -11/06/2021 23:41:48 - INFO - __main__ - Step 17324: {'lr': 0.0004868918406707937, 'samples': 3326208, 'steps': 17323, 'loss/train': 1.7133080959320068} -11/06/2021 23:41:48 - INFO - __main__ - Step 17325: {'lr': 0.00048689014481496197, 'samples': 3326400, 'steps': 17324, 'loss/train': 1.9357455968856812} -11/06/2021 23:41:49 - INFO - __main__ - Step 17326: {'lr': 0.0004868884488523911, 'samples': 3326592, 'steps': 17325, 'loss/train': 1.7280464172363281} -11/06/2021 23:41:49 - INFO - __main__ - Step 17327: {'lr': 0.0004868867527830821, 'samples': 3326784, 'steps': 17326, 'loss/train': 2.280465602874756} -11/06/2021 23:41:50 - INFO - __main__ - Step 17328: {'lr': 0.0004868850566070355, 'samples': 3326976, 'steps': 17327, 'loss/train': 1.5123412609100342} -11/06/2021 23:41:51 - INFO - __main__ - Step 17329: {'lr': 0.00048688336032425217, 'samples': 3327168, 'steps': 17328, 'loss/train': 2.5029807090759277} -11/06/2021 23:41:51 - INFO - __main__ - Step 17330: {'lr': 0.0004868816639347328, 'samples': 3327360, 'steps': 17329, 'loss/train': 1.3121029138565063} -11/06/2021 23:41:52 - INFO - __main__ - Step 17331: {'lr': 0.0004868799674384783, 'samples': 3327552, 'steps': 17330, 'loss/train': 1.6100544929504395} -11/06/2021 23:41:52 - INFO - __main__ - Step 17332: {'lr': 0.0004868782708354893, 'samples': 3327744, 'steps': 17331, 'loss/train': 1.734197735786438} -11/06/2021 23:41:52 - INFO - __main__ - Step 17333: {'lr': 0.0004868765741257666, 'samples': 3327936, 'steps': 17332, 'loss/train': 0.5606326460838318} -11/06/2021 23:41:53 - INFO - __main__ - Step 17334: {'lr': 0.00048687487730931096, 'samples': 3328128, 'steps': 17333, 'loss/train': 1.4768435955047607} -11/06/2021 23:41:54 - INFO - __main__ - Step 17335: {'lr': 0.00048687318038612317, 'samples': 3328320, 'steps': 17334, 'loss/train': 1.0746694803237915} -11/06/2021 23:41:54 - INFO - __main__ - Step 17336: {'lr': 0.000486871483356204, 'samples': 3328512, 'steps': 17335, 'loss/train': 1.6409631967544556} -11/06/2021 23:41:55 - INFO - __main__ - Step 17337: {'lr': 0.00048686978621955416, 'samples': 3328704, 'steps': 17336, 'loss/train': 1.2255845069885254} -11/06/2021 23:41:55 - INFO - __main__ - Step 17338: {'lr': 0.00048686808897617447, 'samples': 3328896, 'steps': 17337, 'loss/train': 1.829113483428955} -11/06/2021 23:41:55 - INFO - __main__ - Step 17339: {'lr': 0.00048686639162606564, 'samples': 3329088, 'steps': 17338, 'loss/train': 1.5854146480560303} -11/06/2021 23:41:56 - INFO - __main__ - Step 17340: {'lr': 0.0004868646941692285, 'samples': 3329280, 'steps': 17339, 'loss/train': 1.6102768182754517} -11/06/2021 23:41:57 - INFO - __main__ - Step 17341: {'lr': 0.0004868629966056638, 'samples': 3329472, 'steps': 17340, 'loss/train': 1.1662577390670776} -11/06/2021 23:41:57 - INFO - __main__ - Step 17342: {'lr': 0.0004868612989353722, 'samples': 3329664, 'steps': 17341, 'loss/train': 1.8177578449249268} -11/06/2021 23:41:57 - INFO - __main__ - Step 17343: {'lr': 0.0004868596011583547, 'samples': 3329856, 'steps': 17342, 'loss/train': 2.0990030765533447} -11/06/2021 23:41:58 - INFO - __main__ - Step 17344: {'lr': 0.00048685790327461184, 'samples': 3330048, 'steps': 17343, 'loss/train': 1.853256106376648} -11/06/2021 23:41:59 - INFO - __main__ - Step 17345: {'lr': 0.0004868562052841444, 'samples': 3330240, 'steps': 17344, 'loss/train': 1.188179612159729} -11/06/2021 23:41:59 - INFO - __main__ - Step 17346: {'lr': 0.00048685450718695335, 'samples': 3330432, 'steps': 17345, 'loss/train': 1.7476564645767212} -11/06/2021 23:42:00 - INFO - __main__ - Step 17347: {'lr': 0.00048685280898303916, 'samples': 3330624, 'steps': 17346, 'loss/train': 1.694496512413025} -11/06/2021 23:42:00 - INFO - __main__ - Step 17348: {'lr': 0.00048685111067240283, 'samples': 3330816, 'steps': 17347, 'loss/train': 1.716973900794983} -11/06/2021 23:42:00 - INFO - __main__ - Step 17349: {'lr': 0.00048684941225504507, 'samples': 3331008, 'steps': 17348, 'loss/train': 2.0338494777679443} -11/06/2021 23:42:01 - INFO - __main__ - Step 17350: {'lr': 0.0004868477137309666, 'samples': 3331200, 'steps': 17349, 'loss/train': 0.9896562695503235} -11/06/2021 23:42:02 - INFO - __main__ - Step 17351: {'lr': 0.00048684601510016817, 'samples': 3331392, 'steps': 17350, 'loss/train': 1.7950968742370605} -11/06/2021 23:42:02 - INFO - __main__ - Step 17352: {'lr': 0.00048684431636265065, 'samples': 3331584, 'steps': 17351, 'loss/train': 1.272135615348816} -11/06/2021 23:42:02 - INFO - __main__ - Step 17353: {'lr': 0.00048684261751841463, 'samples': 3331776, 'steps': 17352, 'loss/train': 1.1567683219909668} -11/06/2021 23:42:03 - INFO - __main__ - Step 17354: {'lr': 0.000486840918567461, 'samples': 3331968, 'steps': 17353, 'loss/train': 1.702507734298706} -11/06/2021 23:42:03 - INFO - __main__ - Step 17355: {'lr': 0.0004868392195097906, 'samples': 3332160, 'steps': 17354, 'loss/train': 1.6192466020584106} -11/06/2021 23:42:04 - INFO - __main__ - Step 17356: {'lr': 0.0004868375203454041, 'samples': 3332352, 'steps': 17355, 'loss/train': 1.33048415184021} -11/06/2021 23:42:05 - INFO - __main__ - Step 17357: {'lr': 0.00048683582107430227, 'samples': 3332544, 'steps': 17356, 'loss/train': 1.4887734651565552} -11/06/2021 23:42:05 - INFO - __main__ - Step 17358: {'lr': 0.0004868341216964858, 'samples': 3332736, 'steps': 17357, 'loss/train': 1.8216099739074707} -11/06/2021 23:42:05 - INFO - __main__ - Step 17359: {'lr': 0.00048683242221195553, 'samples': 3332928, 'steps': 17358, 'loss/train': 1.927954912185669} -11/06/2021 23:42:06 - INFO - __main__ - Step 17360: {'lr': 0.00048683072262071224, 'samples': 3333120, 'steps': 17359, 'loss/train': 1.390279769897461} -11/06/2021 23:42:07 - INFO - __main__ - Step 17361: {'lr': 0.00048682902292275667, 'samples': 3333312, 'steps': 17360, 'loss/train': 1.5254342555999756} -11/06/2021 23:42:07 - INFO - __main__ - Step 17362: {'lr': 0.00048682732311808964, 'samples': 3333504, 'steps': 17361, 'loss/train': 1.4730674028396606} -11/06/2021 23:42:07 - INFO - __main__ - Step 17363: {'lr': 0.00048682562320671185, 'samples': 3333696, 'steps': 17362, 'loss/train': 2.2368764877319336} -11/06/2021 23:42:08 - INFO - __main__ - Step 17364: {'lr': 0.00048682392318862407, 'samples': 3333888, 'steps': 17363, 'loss/train': 1.7727394104003906} -11/06/2021 23:42:08 - INFO - __main__ - Step 17365: {'lr': 0.00048682222306382705, 'samples': 3334080, 'steps': 17364, 'loss/train': 1.5252821445465088} -11/06/2021 23:42:09 - INFO - __main__ - Step 17366: {'lr': 0.0004868205228323217, 'samples': 3334272, 'steps': 17365, 'loss/train': 2.325129508972168} -11/06/2021 23:42:09 - INFO - __main__ - Step 17367: {'lr': 0.0004868188224941086, 'samples': 3334464, 'steps': 17366, 'loss/train': 1.7640018463134766} -11/06/2021 23:42:10 - INFO - __main__ - Step 17368: {'lr': 0.0004868171220491886, 'samples': 3334656, 'steps': 17367, 'loss/train': 1.7070350646972656} -11/06/2021 23:42:10 - INFO - __main__ - Step 17369: {'lr': 0.00048681542149756253, 'samples': 3334848, 'steps': 17368, 'loss/train': 1.49398672580719} -11/06/2021 23:42:10 - INFO - __main__ - Step 17370: {'lr': 0.00048681372083923103, 'samples': 3335040, 'steps': 17369, 'loss/train': 1.4385478496551514} -11/06/2021 23:42:11 - INFO - __main__ - Step 17371: {'lr': 0.0004868120200741949, 'samples': 3335232, 'steps': 17370, 'loss/train': 1.6209843158721924} -11/06/2021 23:42:12 - INFO - __main__ - Step 17372: {'lr': 0.0004868103192024549, 'samples': 3335424, 'steps': 17371, 'loss/train': 1.3664069175720215} -11/06/2021 23:42:12 - INFO - __main__ - Step 17373: {'lr': 0.0004868086182240119, 'samples': 3335616, 'steps': 17372, 'loss/train': 1.0094228982925415} -11/06/2021 23:42:12 - INFO - __main__ - Step 17374: {'lr': 0.00048680691713886653, 'samples': 3335808, 'steps': 17373, 'loss/train': 1.8448344469070435} -11/06/2021 23:42:13 - INFO - __main__ - Step 17375: {'lr': 0.00048680521594701964, 'samples': 3336000, 'steps': 17374, 'loss/train': 1.669421672821045} -11/06/2021 23:42:13 - INFO - __main__ - Step 17376: {'lr': 0.00048680351464847207, 'samples': 3336192, 'steps': 17375, 'loss/train': 1.7565194368362427} -11/06/2021 23:42:14 - INFO - __main__ - Step 17377: {'lr': 0.00048680181324322437, 'samples': 3336384, 'steps': 17376, 'loss/train': 1.2871259450912476} -11/06/2021 23:42:15 - INFO - __main__ - Step 17378: {'lr': 0.00048680011173127746, 'samples': 3336576, 'steps': 17377, 'loss/train': 5.979392051696777} -11/06/2021 23:42:15 - INFO - __main__ - Step 17379: {'lr': 0.00048679841011263204, 'samples': 3336768, 'steps': 17378, 'loss/train': 1.605148434638977} -11/06/2021 23:42:15 - INFO - __main__ - Step 17380: {'lr': 0.00048679670838728894, 'samples': 3336960, 'steps': 17379, 'loss/train': 1.5023822784423828} -11/06/2021 23:42:16 - INFO - __main__ - Step 17381: {'lr': 0.0004867950065552489, 'samples': 3337152, 'steps': 17380, 'loss/train': 1.3871039152145386} -11/06/2021 23:42:17 - INFO - __main__ - Step 17382: {'lr': 0.00048679330461651275, 'samples': 3337344, 'steps': 17381, 'loss/train': 1.6298061609268188} -11/06/2021 23:42:17 - INFO - __main__ - Step 17383: {'lr': 0.00048679160257108107, 'samples': 3337536, 'steps': 17382, 'loss/train': 0.9420875906944275} -11/06/2021 23:42:17 - INFO - __main__ - Step 17384: {'lr': 0.00048678990041895484, 'samples': 3337728, 'steps': 17383, 'loss/train': 1.7141159772872925} -11/06/2021 23:42:18 - INFO - __main__ - Step 17385: {'lr': 0.00048678819816013467, 'samples': 3337920, 'steps': 17384, 'loss/train': 1.5371354818344116} -11/06/2021 23:42:18 - INFO - __main__ - Step 17386: {'lr': 0.0004867864957946214, 'samples': 3338112, 'steps': 17385, 'loss/train': 1.0904605388641357} -11/06/2021 23:42:19 - INFO - __main__ - Step 17387: {'lr': 0.0004867847933224158, 'samples': 3338304, 'steps': 17386, 'loss/train': 1.6519601345062256} -11/06/2021 23:42:20 - INFO - __main__ - Step 17388: {'lr': 0.0004867830907435187, 'samples': 3338496, 'steps': 17387, 'loss/train': 5.8294854164123535} -11/06/2021 23:42:20 - INFO - __main__ - Step 17389: {'lr': 0.0004867813880579307, 'samples': 3338688, 'steps': 17388, 'loss/train': 1.8847965002059937} -11/06/2021 23:42:20 - INFO - __main__ - Step 17390: {'lr': 0.0004867796852656527, 'samples': 3338880, 'steps': 17389, 'loss/train': 1.6456767320632935} -11/06/2021 23:42:21 - INFO - __main__ - Step 17391: {'lr': 0.00048677798236668537, 'samples': 3339072, 'steps': 17390, 'loss/train': 1.7139424085617065} -11/06/2021 23:42:21 - INFO - __main__ - Step 17392: {'lr': 0.00048677627936102966, 'samples': 3339264, 'steps': 17391, 'loss/train': 1.8065518140792847} -11/06/2021 23:42:22 - INFO - __main__ - Step 17393: {'lr': 0.0004867745762486861, 'samples': 3339456, 'steps': 17392, 'loss/train': 2.5346922874450684} -11/06/2021 23:42:22 - INFO - __main__ - Step 17394: {'lr': 0.0004867728730296556, 'samples': 3339648, 'steps': 17393, 'loss/train': 1.5756046772003174} -11/06/2021 23:42:23 - INFO - __main__ - Step 17395: {'lr': 0.0004867711697039389, 'samples': 3339840, 'steps': 17394, 'loss/train': 1.0653622150421143} -11/06/2021 23:42:23 - INFO - __main__ - Step 17396: {'lr': 0.00048676946627153675, 'samples': 3340032, 'steps': 17395, 'loss/train': 1.5175786018371582} -11/06/2021 23:42:24 - INFO - __main__ - Step 17397: {'lr': 0.00048676776273244994, 'samples': 3340224, 'steps': 17396, 'loss/train': 1.1968095302581787} -11/06/2021 23:42:24 - INFO - __main__ - Step 17398: {'lr': 0.00048676605908667926, 'samples': 3340416, 'steps': 17397, 'loss/train': 1.3067097663879395} -11/06/2021 23:42:25 - INFO - __main__ - Step 17399: {'lr': 0.00048676435533422536, 'samples': 3340608, 'steps': 17398, 'loss/train': 2.1273090839385986} -11/06/2021 23:42:25 - INFO - __main__ - Step 17400: {'lr': 0.00048676265147508917, 'samples': 3340800, 'steps': 17399, 'loss/train': 1.887537956237793} -11/06/2021 23:42:26 - INFO - __main__ - Step 17401: {'lr': 0.00048676094750927144, 'samples': 3340992, 'steps': 17400, 'loss/train': 1.2887080907821655} -11/06/2021 23:42:26 - INFO - __main__ - Step 17402: {'lr': 0.0004867592434367728, 'samples': 3341184, 'steps': 17401, 'loss/train': 1.5143498182296753} -11/06/2021 23:42:26 - INFO - __main__ - Step 17403: {'lr': 0.0004867575392575941, 'samples': 3341376, 'steps': 17402, 'loss/train': 1.996867299079895} -11/06/2021 23:42:27 - INFO - __main__ - Step 17404: {'lr': 0.0004867558349717361, 'samples': 3341568, 'steps': 17403, 'loss/train': 1.7546355724334717} -11/06/2021 23:42:28 - INFO - __main__ - Step 17405: {'lr': 0.0004867541305791996, 'samples': 3341760, 'steps': 17404, 'loss/train': 1.6053557395935059} -11/06/2021 23:42:28 - INFO - __main__ - Step 17406: {'lr': 0.00048675242607998533, 'samples': 3341952, 'steps': 17405, 'loss/train': 1.5730146169662476} -11/06/2021 23:42:28 - INFO - __main__ - Step 17407: {'lr': 0.00048675072147409405, 'samples': 3342144, 'steps': 17406, 'loss/train': 1.472575068473816} -11/06/2021 23:42:29 - INFO - __main__ - Step 17408: {'lr': 0.0004867490167615266, 'samples': 3342336, 'steps': 17407, 'loss/train': 1.358944296836853} -11/06/2021 23:42:30 - INFO - __main__ - Step 17409: {'lr': 0.0004867473119422837, 'samples': 3342528, 'steps': 17408, 'loss/train': 1.0930287837982178} -11/06/2021 23:42:30 - INFO - __main__ - Step 17410: {'lr': 0.00048674560701636606, 'samples': 3342720, 'steps': 17409, 'loss/train': 1.447057843208313} -11/06/2021 23:42:30 - INFO - __main__ - Step 17411: {'lr': 0.0004867439019837745, 'samples': 3342912, 'steps': 17410, 'loss/train': 1.6748888492584229} -11/06/2021 23:42:31 - INFO - __main__ - Step 17412: {'lr': 0.00048674219684450985, 'samples': 3343104, 'steps': 17411, 'loss/train': 1.5127593278884888} -11/06/2021 23:42:31 - INFO - __main__ - Step 17413: {'lr': 0.00048674049159857277, 'samples': 3343296, 'steps': 17412, 'loss/train': 1.2442376613616943} -11/06/2021 23:42:32 - INFO - __main__ - Step 17414: {'lr': 0.0004867387862459641, 'samples': 3343488, 'steps': 17413, 'loss/train': 1.1401019096374512} -11/06/2021 23:42:33 - INFO - __main__ - Step 17415: {'lr': 0.0004867370807866845, 'samples': 3343680, 'steps': 17414, 'loss/train': 1.5754122734069824} -11/06/2021 23:42:33 - INFO - __main__ - Step 17416: {'lr': 0.000486735375220735, 'samples': 3343872, 'steps': 17415, 'loss/train': 1.994115948677063} -11/06/2021 23:42:33 - INFO - __main__ - Step 17417: {'lr': 0.00048673366954811605, 'samples': 3344064, 'steps': 17416, 'loss/train': 1.5085574388504028} -11/06/2021 23:42:34 - INFO - __main__ - Step 17418: {'lr': 0.0004867319637688286, 'samples': 3344256, 'steps': 17417, 'loss/train': 1.8701719045639038} -11/06/2021 23:42:34 - INFO - __main__ - Step 17419: {'lr': 0.0004867302578828734, 'samples': 3344448, 'steps': 17418, 'loss/train': 1.6169779300689697} -11/06/2021 23:42:35 - INFO - __main__ - Step 17420: {'lr': 0.0004867285518902512, 'samples': 3344640, 'steps': 17419, 'loss/train': 0.6736646294593811} -11/06/2021 23:42:35 - INFO - __main__ - Step 17421: {'lr': 0.0004867268457909627, 'samples': 3344832, 'steps': 17420, 'loss/train': 1.7313899993896484} -11/06/2021 23:42:36 - INFO - __main__ - Step 17422: {'lr': 0.0004867251395850088, 'samples': 3345024, 'steps': 17421, 'loss/train': 1.910513162612915} -11/06/2021 23:42:36 - INFO - __main__ - Step 17423: {'lr': 0.00048672343327239024, 'samples': 3345216, 'steps': 17422, 'loss/train': 1.4655964374542236} -11/06/2021 23:42:36 - INFO - __main__ - Step 17424: {'lr': 0.00048672172685310767, 'samples': 3345408, 'steps': 17423, 'loss/train': 1.7403993606567383} -11/06/2021 23:42:38 - INFO - __main__ - Step 17425: {'lr': 0.000486720020327162, 'samples': 3345600, 'steps': 17424, 'loss/train': 1.7060999870300293} -11/06/2021 23:42:38 - INFO - __main__ - Step 17426: {'lr': 0.00048671831369455386, 'samples': 3345792, 'steps': 17425, 'loss/train': 1.8607850074768066} -11/06/2021 23:42:38 - INFO - __main__ - Step 17427: {'lr': 0.0004867166069552842, 'samples': 3345984, 'steps': 17426, 'loss/train': 2.2483069896698} -11/06/2021 23:42:39 - INFO - __main__ - Step 17428: {'lr': 0.00048671490010935366, 'samples': 3346176, 'steps': 17427, 'loss/train': 1.5636916160583496} -11/06/2021 23:42:39 - INFO - __main__ - Step 17429: {'lr': 0.00048671319315676305, 'samples': 3346368, 'steps': 17428, 'loss/train': 1.3616186380386353} -11/06/2021 23:42:39 - INFO - __main__ - Step 17430: {'lr': 0.00048671148609751307, 'samples': 3346560, 'steps': 17429, 'loss/train': 2.639005422592163} -11/06/2021 23:42:41 - INFO - __main__ - Step 17431: {'lr': 0.0004867097789316046, 'samples': 3346752, 'steps': 17430, 'loss/train': 1.3610199689865112} -11/06/2021 23:42:41 - INFO - __main__ - Step 17432: {'lr': 0.0004867080716590384, 'samples': 3346944, 'steps': 17431, 'loss/train': 1.6907752752304077} -11/06/2021 23:42:41 - INFO - __main__ - Step 17433: {'lr': 0.0004867063642798151, 'samples': 3347136, 'steps': 17432, 'loss/train': 0.8346073627471924} -11/06/2021 23:42:42 - INFO - __main__ - Step 17434: {'lr': 0.0004867046567939356, 'samples': 3347328, 'steps': 17433, 'loss/train': 0.30705493688583374} -11/06/2021 23:42:42 - INFO - __main__ - Step 17435: {'lr': 0.00048670294920140063, 'samples': 3347520, 'steps': 17434, 'loss/train': 1.677636981010437} -11/06/2021 23:42:42 - INFO - __main__ - Step 17436: {'lr': 0.00048670124150221094, 'samples': 3347712, 'steps': 17435, 'loss/train': 1.5929261445999146} -11/06/2021 23:42:43 - INFO - __main__ - Step 17437: {'lr': 0.00048669953369636737, 'samples': 3347904, 'steps': 17436, 'loss/train': 1.458001971244812} -11/06/2021 23:42:44 - INFO - __main__ - Step 17438: {'lr': 0.00048669782578387067, 'samples': 3348096, 'steps': 17437, 'loss/train': 1.7061351537704468} -11/06/2021 23:42:44 - INFO - __main__ - Step 17439: {'lr': 0.00048669611776472153, 'samples': 3348288, 'steps': 17438, 'loss/train': 1.6646876335144043} -11/06/2021 23:42:44 - INFO - __main__ - Step 17440: {'lr': 0.00048669440963892074, 'samples': 3348480, 'steps': 17439, 'loss/train': 1.8037528991699219} -11/06/2021 23:42:45 - INFO - __main__ - Step 17441: {'lr': 0.00048669270140646914, 'samples': 3348672, 'steps': 17440, 'loss/train': 1.4020469188690186} -11/06/2021 23:42:46 - INFO - __main__ - Step 17442: {'lr': 0.0004866909930673675, 'samples': 3348864, 'steps': 17441, 'loss/train': 1.5615054368972778} -11/06/2021 23:42:46 - INFO - __main__ - Step 17443: {'lr': 0.00048668928462161653, 'samples': 3349056, 'steps': 17442, 'loss/train': 1.6594544649124146} -11/06/2021 23:42:46 - INFO - __main__ - Step 17444: {'lr': 0.000486687576069217, 'samples': 3349248, 'steps': 17443, 'loss/train': 1.418339729309082} -11/06/2021 23:42:47 - INFO - __main__ - Step 17445: {'lr': 0.00048668586741016967, 'samples': 3349440, 'steps': 17444, 'loss/train': 1.9371867179870605} -11/06/2021 23:42:47 - INFO - __main__ - Step 17446: {'lr': 0.0004866841586444754, 'samples': 3349632, 'steps': 17445, 'loss/train': 1.3474305868148804} -11/06/2021 23:42:49 - INFO - __main__ - Step 17447: {'lr': 0.0004866824497721349, 'samples': 3349824, 'steps': 17446, 'loss/train': 0.8789267539978027} -11/06/2021 23:42:49 - INFO - __main__ - Step 17448: {'lr': 0.0004866807407931489, 'samples': 3350016, 'steps': 17447, 'loss/train': 1.4513202905654907} -11/06/2021 23:42:49 - INFO - __main__ - Step 17449: {'lr': 0.0004866790317075182, 'samples': 3350208, 'steps': 17448, 'loss/train': 1.5578341484069824} -11/06/2021 23:42:50 - INFO - __main__ - Step 17450: {'lr': 0.00048667732251524365, 'samples': 3350400, 'steps': 17449, 'loss/train': 1.9759602546691895} -11/06/2021 23:42:50 - INFO - __main__ - Step 17451: {'lr': 0.0004866756132163259, 'samples': 3350592, 'steps': 17450, 'loss/train': 1.5698901414871216} -11/06/2021 23:42:50 - INFO - __main__ - Step 17452: {'lr': 0.0004866739038107658, 'samples': 3350784, 'steps': 17451, 'loss/train': 1.6254311800003052} -11/06/2021 23:42:51 - INFO - __main__ - Step 17453: {'lr': 0.000486672194298564, 'samples': 3350976, 'steps': 17452, 'loss/train': 1.6596328020095825} -11/06/2021 23:42:52 - INFO - __main__ - Step 17454: {'lr': 0.00048667048467972146, 'samples': 3351168, 'steps': 17453, 'loss/train': 1.0186972618103027} -11/06/2021 23:42:52 - INFO - __main__ - Step 17455: {'lr': 0.00048666877495423885, 'samples': 3351360, 'steps': 17454, 'loss/train': 1.5029501914978027} -11/06/2021 23:42:52 - INFO - __main__ - Step 17456: {'lr': 0.0004866670651221169, 'samples': 3351552, 'steps': 17455, 'loss/train': 1.6649607419967651} -11/06/2021 23:42:53 - INFO - __main__ - Step 17457: {'lr': 0.0004866653551833564, 'samples': 3351744, 'steps': 17456, 'loss/train': 1.0854140520095825} -11/06/2021 23:42:53 - INFO - __main__ - Step 17458: {'lr': 0.00048666364513795816, 'samples': 3351936, 'steps': 17457, 'loss/train': 1.361505389213562} -11/06/2021 23:42:54 - INFO - __main__ - Step 17459: {'lr': 0.00048666193498592304, 'samples': 3352128, 'steps': 17458, 'loss/train': 1.6825581789016724} -11/06/2021 23:42:55 - INFO - __main__ - Step 17460: {'lr': 0.0004866602247272516, 'samples': 3352320, 'steps': 17459, 'loss/train': 1.7726678848266602} -11/06/2021 23:42:55 - INFO - __main__ - Step 17461: {'lr': 0.0004866585143619447, 'samples': 3352512, 'steps': 17460, 'loss/train': 1.8011826276779175} -11/06/2021 23:42:55 - INFO - __main__ - Step 17462: {'lr': 0.00048665680389000315, 'samples': 3352704, 'steps': 17461, 'loss/train': 1.5437105894088745} -11/06/2021 23:42:56 - INFO - __main__ - Step 17463: {'lr': 0.0004866550933114277, 'samples': 3352896, 'steps': 17462, 'loss/train': 1.5845763683319092} -11/06/2021 23:42:57 - INFO - __main__ - Step 17464: {'lr': 0.00048665338262621915, 'samples': 3353088, 'steps': 17463, 'loss/train': 1.909666895866394} -11/06/2021 23:42:57 - INFO - __main__ - Step 17465: {'lr': 0.00048665167183437817, 'samples': 3353280, 'steps': 17464, 'loss/train': 1.7902839183807373} -11/06/2021 23:42:57 - INFO - __main__ - Step 17466: {'lr': 0.00048664996093590563, 'samples': 3353472, 'steps': 17465, 'loss/train': 1.6980420351028442} -11/06/2021 23:42:58 - INFO - __main__ - Step 17467: {'lr': 0.0004866482499308023, 'samples': 3353664, 'steps': 17466, 'loss/train': 1.636150598526001} -11/06/2021 23:42:58 - INFO - __main__ - Step 17468: {'lr': 0.0004866465388190689, 'samples': 3353856, 'steps': 17467, 'loss/train': 1.7070634365081787} -11/06/2021 23:42:59 - INFO - __main__ - Step 17469: {'lr': 0.0004866448276007062, 'samples': 3354048, 'steps': 17468, 'loss/train': 1.6868599653244019} -11/06/2021 23:42:59 - INFO - __main__ - Step 17470: {'lr': 0.000486643116275715, 'samples': 3354240, 'steps': 17469, 'loss/train': 1.1477397680282593} -11/06/2021 23:43:00 - INFO - __main__ - Step 17471: {'lr': 0.00048664140484409613, 'samples': 3354432, 'steps': 17470, 'loss/train': 2.090226173400879} -11/06/2021 23:43:00 - INFO - __main__ - Step 17472: {'lr': 0.0004866396933058502, 'samples': 3354624, 'steps': 17471, 'loss/train': 1.5251487493515015} -11/06/2021 23:43:00 - INFO - __main__ - Step 17473: {'lr': 0.00048663798166097814, 'samples': 3354816, 'steps': 17472, 'loss/train': 1.5208324193954468} -11/06/2021 23:43:01 - INFO - __main__ - Step 17474: {'lr': 0.0004866362699094806, 'samples': 3355008, 'steps': 17473, 'loss/train': 1.9953933954238892} -11/06/2021 23:43:02 - INFO - __main__ - Step 17475: {'lr': 0.0004866345580513585, 'samples': 3355200, 'steps': 17474, 'loss/train': 1.5545861721038818} -11/06/2021 23:43:02 - INFO - __main__ - Step 17476: {'lr': 0.0004866328460866124, 'samples': 3355392, 'steps': 17475, 'loss/train': 1.7343254089355469} -11/06/2021 23:43:03 - INFO - __main__ - Step 17477: {'lr': 0.0004866311340152433, 'samples': 3355584, 'steps': 17476, 'loss/train': 1.4653677940368652} -11/06/2021 23:43:03 - INFO - __main__ - Step 17478: {'lr': 0.0004866294218372518, 'samples': 3355776, 'steps': 17477, 'loss/train': 0.9723559617996216} -11/06/2021 23:43:03 - INFO - __main__ - Step 17479: {'lr': 0.0004866277095526387, 'samples': 3355968, 'steps': 17478, 'loss/train': 2.013335943222046} -11/06/2021 23:43:04 - INFO - __main__ - Step 17480: {'lr': 0.00048662599716140485, 'samples': 3356160, 'steps': 17479, 'loss/train': 0.8285233974456787} -11/06/2021 23:43:05 - INFO - __main__ - Step 17481: {'lr': 0.00048662428466355104, 'samples': 3356352, 'steps': 17480, 'loss/train': 1.3983826637268066} -11/06/2021 23:43:05 - INFO - __main__ - Step 17482: {'lr': 0.0004866225720590779, 'samples': 3356544, 'steps': 17481, 'loss/train': 1.461501955986023} -11/06/2021 23:43:05 - INFO - __main__ - Step 17483: {'lr': 0.00048662085934798627, 'samples': 3356736, 'steps': 17482, 'loss/train': 2.3746488094329834} -11/06/2021 23:43:06 - INFO - __main__ - Step 17484: {'lr': 0.00048661914653027694, 'samples': 3356928, 'steps': 17483, 'loss/train': 1.401358962059021} -11/06/2021 23:43:07 - INFO - __main__ - Step 17485: {'lr': 0.0004866174336059507, 'samples': 3357120, 'steps': 17484, 'loss/train': 1.5222047567367554} -11/06/2021 23:43:07 - INFO - __main__ - Step 17486: {'lr': 0.00048661572057500833, 'samples': 3357312, 'steps': 17485, 'loss/train': 1.8743535280227661} -11/06/2021 23:43:07 - INFO - __main__ - Step 17487: {'lr': 0.00048661400743745057, 'samples': 3357504, 'steps': 17486, 'loss/train': 1.2900893688201904} -11/06/2021 23:43:08 - INFO - __main__ - Step 17488: {'lr': 0.00048661229419327806, 'samples': 3357696, 'steps': 17487, 'loss/train': 2.1348865032196045} -11/06/2021 23:43:08 - INFO - __main__ - Step 17489: {'lr': 0.0004866105808424918, 'samples': 3357888, 'steps': 17488, 'loss/train': 1.581131100654602} -11/06/2021 23:43:09 - INFO - __main__ - Step 17490: {'lr': 0.0004866088673850925, 'samples': 3358080, 'steps': 17489, 'loss/train': 1.3917348384857178} -11/06/2021 23:43:09 - INFO - __main__ - Step 17491: {'lr': 0.0004866071538210808, 'samples': 3358272, 'steps': 17490, 'loss/train': 1.749387502670288} -11/06/2021 23:43:10 - INFO - __main__ - Step 17492: {'lr': 0.0004866054401504576, 'samples': 3358464, 'steps': 17491, 'loss/train': 1.3572897911071777} -11/06/2021 23:43:10 - INFO - __main__ - Step 17493: {'lr': 0.0004866037263732237, 'samples': 3358656, 'steps': 17492, 'loss/train': 1.8439452648162842} -11/06/2021 23:43:10 - INFO - __main__ - Step 17494: {'lr': 0.00048660201248937974, 'samples': 3358848, 'steps': 17493, 'loss/train': 1.8274236917495728} -11/06/2021 23:43:12 - INFO - __main__ - Step 17495: {'lr': 0.0004866002984989266, 'samples': 3359040, 'steps': 17494, 'loss/train': 1.4386416673660278} -11/06/2021 23:43:12 - INFO - __main__ - Step 17496: {'lr': 0.000486598584401865, 'samples': 3359232, 'steps': 17495, 'loss/train': 1.7358335256576538} -11/06/2021 23:43:12 - INFO - __main__ - Step 17497: {'lr': 0.0004865968701981958, 'samples': 3359424, 'steps': 17496, 'loss/train': 1.8483222723007202} -11/06/2021 23:43:13 - INFO - __main__ - Step 17498: {'lr': 0.0004865951558879196, 'samples': 3359616, 'steps': 17497, 'loss/train': 1.65242600440979} -11/06/2021 23:43:13 - INFO - __main__ - Step 17499: {'lr': 0.00048659344147103725, 'samples': 3359808, 'steps': 17498, 'loss/train': 1.2766807079315186} -11/06/2021 23:43:14 - INFO - __main__ - Step 17500: {'lr': 0.0004865917269475496, 'samples': 3360000, 'steps': 17499, 'loss/train': 1.5660682916641235} -11/06/2021 23:43:14 - INFO - __main__ - Step 17501: {'lr': 0.00048659001231745734, 'samples': 3360192, 'steps': 17500, 'loss/train': 1.4074636697769165} -11/06/2021 23:43:15 - INFO - __main__ - Step 17502: {'lr': 0.0004865882975807614, 'samples': 3360384, 'steps': 17501, 'loss/train': 1.3170610666275024} -11/06/2021 23:43:15 - INFO - __main__ - Step 17503: {'lr': 0.00048658658273746224, 'samples': 3360576, 'steps': 17502, 'loss/train': 1.7989710569381714} -11/06/2021 23:43:15 - INFO - __main__ - Step 17504: {'lr': 0.00048658486778756097, 'samples': 3360768, 'steps': 17503, 'loss/train': 1.5153037309646606} -11/06/2021 23:43:16 - INFO - __main__ - Step 17505: {'lr': 0.0004865831527310581, 'samples': 3360960, 'steps': 17504, 'loss/train': 1.4141513109207153} -11/06/2021 23:43:17 - INFO - __main__ - Step 17506: {'lr': 0.00048658143756795456, 'samples': 3361152, 'steps': 17505, 'loss/train': 1.6811589002609253} -11/06/2021 23:43:17 - INFO - __main__ - Step 17507: {'lr': 0.0004865797222982511, 'samples': 3361344, 'steps': 17506, 'loss/train': 1.6422348022460938} -11/06/2021 23:43:17 - INFO - __main__ - Step 17508: {'lr': 0.0004865780069219484, 'samples': 3361536, 'steps': 17507, 'loss/train': 1.3525933027267456} -11/06/2021 23:43:18 - INFO - __main__ - Step 17509: {'lr': 0.00048657629143904733, 'samples': 3361728, 'steps': 17508, 'loss/train': 1.62557053565979} -11/06/2021 23:43:19 - INFO - __main__ - Step 17510: {'lr': 0.0004865745758495487, 'samples': 3361920, 'steps': 17509, 'loss/train': 1.487194299697876} -11/06/2021 23:43:19 - INFO - __main__ - Step 17511: {'lr': 0.00048657286015345313, 'samples': 3362112, 'steps': 17510, 'loss/train': 1.7892093658447266} -11/06/2021 23:43:19 - INFO - __main__ - Step 17512: {'lr': 0.00048657114435076153, 'samples': 3362304, 'steps': 17511, 'loss/train': 1.6680396795272827} -11/06/2021 23:43:20 - INFO - __main__ - Step 17513: {'lr': 0.00048656942844147464, 'samples': 3362496, 'steps': 17512, 'loss/train': 3.819169282913208} -11/06/2021 23:43:20 - INFO - __main__ - Step 17514: {'lr': 0.00048656771242559316, 'samples': 3362688, 'steps': 17513, 'loss/train': 1.190946340560913} -11/06/2021 23:43:20 - INFO - __main__ - Step 17515: {'lr': 0.0004865659963031179, 'samples': 3362880, 'steps': 17514, 'loss/train': 1.7531355619430542} -11/06/2021 23:43:22 - INFO - __main__ - Step 17516: {'lr': 0.0004865642800740497, 'samples': 3363072, 'steps': 17515, 'loss/train': 1.5190026760101318} -11/06/2021 23:43:22 - INFO - __main__ - Step 17517: {'lr': 0.0004865625637383893, 'samples': 3363264, 'steps': 17516, 'loss/train': 1.2556828260421753} -11/06/2021 23:43:22 - INFO - __main__ - Step 17518: {'lr': 0.00048656084729613747, 'samples': 3363456, 'steps': 17517, 'loss/train': 1.2229467630386353} -11/06/2021 23:43:23 - INFO - __main__ - Step 17519: {'lr': 0.0004865591307472949, 'samples': 3363648, 'steps': 17518, 'loss/train': 1.7990758419036865} -11/06/2021 23:43:23 - INFO - __main__ - Step 17520: {'lr': 0.0004865574140918625, 'samples': 3363840, 'steps': 17519, 'loss/train': 1.7815418243408203} -11/06/2021 23:43:24 - INFO - __main__ - Step 17521: {'lr': 0.00048655569732984096, 'samples': 3364032, 'steps': 17520, 'loss/train': 1.8178268671035767} -11/06/2021 23:43:24 - INFO - __main__ - Step 17522: {'lr': 0.000486553980461231, 'samples': 3364224, 'steps': 17521, 'loss/train': 1.6401214599609375} -11/06/2021 23:43:25 - INFO - __main__ - Step 17523: {'lr': 0.0004865522634860335, 'samples': 3364416, 'steps': 17522, 'loss/train': 1.9060850143432617} -11/06/2021 23:43:25 - INFO - __main__ - Step 17524: {'lr': 0.00048655054640424936, 'samples': 3364608, 'steps': 17523, 'loss/train': 1.5981122255325317} -11/06/2021 23:43:25 - INFO - __main__ - Step 17525: {'lr': 0.00048654882921587907, 'samples': 3364800, 'steps': 17524, 'loss/train': 1.5546878576278687} -11/06/2021 23:43:27 - INFO - __main__ - Step 17526: {'lr': 0.00048654711192092347, 'samples': 3364992, 'steps': 17525, 'loss/train': 1.4803307056427002} -11/06/2021 23:43:27 - INFO - __main__ - Step 17527: {'lr': 0.0004865453945193835, 'samples': 3365184, 'steps': 17526, 'loss/train': 1.9428281784057617} -11/06/2021 23:43:28 - INFO - __main__ - Step 17528: {'lr': 0.00048654367701125975, 'samples': 3365376, 'steps': 17527, 'loss/train': 1.6251273155212402} -11/06/2021 23:43:28 - INFO - __main__ - Step 17529: {'lr': 0.0004865419593965531, 'samples': 3365568, 'steps': 17528, 'loss/train': 1.402294397354126} -11/06/2021 23:43:28 - INFO - __main__ - Step 17530: {'lr': 0.0004865402416752642, 'samples': 3365760, 'steps': 17529, 'loss/train': 1.7213939428329468} -11/06/2021 23:43:29 - INFO - __main__ - Step 17531: {'lr': 0.0004865385238473941, 'samples': 3365952, 'steps': 17530, 'loss/train': 1.3953073024749756} -11/06/2021 23:43:30 - INFO - __main__ - Step 17532: {'lr': 0.00048653680591294324, 'samples': 3366144, 'steps': 17531, 'loss/train': 1.9114352464675903} -11/06/2021 23:43:30 - INFO - __main__ - Step 17533: {'lr': 0.00048653508787191256, 'samples': 3366336, 'steps': 17532, 'loss/train': 1.8594201803207397} -11/06/2021 23:43:30 - INFO - __main__ - Step 17534: {'lr': 0.00048653336972430297, 'samples': 3366528, 'steps': 17533, 'loss/train': 1.5995358228683472} -11/06/2021 23:43:31 - INFO - __main__ - Step 17535: {'lr': 0.0004865316514701149, 'samples': 3366720, 'steps': 17534, 'loss/train': 1.5479685068130493} -11/06/2021 23:43:32 - INFO - __main__ - Step 17536: {'lr': 0.0004865299331093495, 'samples': 3366912, 'steps': 17535, 'loss/train': 1.3341885805130005} -11/06/2021 23:43:32 - INFO - __main__ - Step 17537: {'lr': 0.0004865282146420072, 'samples': 3367104, 'steps': 17536, 'loss/train': 0.8059349060058594} -11/06/2021 23:43:32 - INFO - __main__ - Step 17538: {'lr': 0.000486526496068089, 'samples': 3367296, 'steps': 17537, 'loss/train': 1.6529076099395752} -11/06/2021 23:43:33 - INFO - __main__ - Step 17539: {'lr': 0.0004865247773875956, 'samples': 3367488, 'steps': 17538, 'loss/train': 1.8571265935897827} -11/06/2021 23:43:33 - INFO - __main__ - Step 17540: {'lr': 0.0004865230586005278, 'samples': 3367680, 'steps': 17539, 'loss/train': 1.6223375797271729} -11/06/2021 23:43:33 - INFO - __main__ - Step 17541: {'lr': 0.00048652133970688633, 'samples': 3367872, 'steps': 17540, 'loss/train': 0.8137564063072205} -11/06/2021 23:43:35 - INFO - __main__ - Step 17542: {'lr': 0.00048651962070667197, 'samples': 3368064, 'steps': 17541, 'loss/train': 1.4748502969741821} -11/06/2021 23:43:35 - INFO - __main__ - Step 17543: {'lr': 0.00048651790159988563, 'samples': 3368256, 'steps': 17542, 'loss/train': 1.915865421295166} -11/06/2021 23:43:35 - INFO - __main__ - Step 17544: {'lr': 0.0004865161823865279, 'samples': 3368448, 'steps': 17543, 'loss/train': 1.7708138227462769} -11/06/2021 23:43:36 - INFO - __main__ - Step 17545: {'lr': 0.0004865144630665996, 'samples': 3368640, 'steps': 17544, 'loss/train': 1.7487539052963257} -11/06/2021 23:43:36 - INFO - __main__ - Step 17546: {'lr': 0.0004865127436401016, 'samples': 3368832, 'steps': 17545, 'loss/train': 0.35892412066459656} -11/06/2021 23:43:37 - INFO - __main__ - Step 17547: {'lr': 0.00048651102410703464, 'samples': 3369024, 'steps': 17546, 'loss/train': 1.7375950813293457} -11/06/2021 23:43:37 - INFO - __main__ - Step 17548: {'lr': 0.00048650930446739936, 'samples': 3369216, 'steps': 17547, 'loss/train': 1.6162850856781006} -11/06/2021 23:43:38 - INFO - __main__ - Step 17549: {'lr': 0.00048650758472119666, 'samples': 3369408, 'steps': 17548, 'loss/train': 1.576440453529358} -11/06/2021 23:43:38 - INFO - __main__ - Step 17550: {'lr': 0.0004865058648684273, 'samples': 3369600, 'steps': 17549, 'loss/train': 1.9157060384750366} -11/06/2021 23:43:38 - INFO - __main__ - Step 17551: {'lr': 0.00048650414490909207, 'samples': 3369792, 'steps': 17550, 'loss/train': 1.5747535228729248} -11/06/2021 23:43:40 - INFO - __main__ - Step 17552: {'lr': 0.00048650242484319175, 'samples': 3369984, 'steps': 17551, 'loss/train': 1.121293544769287} -11/06/2021 23:43:40 - INFO - __main__ - Step 17553: {'lr': 0.000486500704670727, 'samples': 3370176, 'steps': 17552, 'loss/train': 1.5847798585891724} -11/06/2021 23:43:40 - INFO - __main__ - Step 17554: {'lr': 0.0004864989843916987, 'samples': 3370368, 'steps': 17553, 'loss/train': 1.2869236469268799} -11/06/2021 23:43:41 - INFO - __main__ - Step 17555: {'lr': 0.0004864972640061077, 'samples': 3370560, 'steps': 17554, 'loss/train': 2.118384838104248} -11/06/2021 23:43:41 - INFO - __main__ - Step 17556: {'lr': 0.00048649554351395453, 'samples': 3370752, 'steps': 17555, 'loss/train': 1.5035825967788696} -11/06/2021 23:43:42 - INFO - __main__ - Step 17557: {'lr': 0.00048649382291524024, 'samples': 3370944, 'steps': 17556, 'loss/train': 1.856012225151062} -11/06/2021 23:43:42 - INFO - __main__ - Step 17558: {'lr': 0.0004864921022099654, 'samples': 3371136, 'steps': 17557, 'loss/train': 1.5416059494018555} -11/06/2021 23:43:43 - INFO - __main__ - Step 17559: {'lr': 0.00048649038139813097, 'samples': 3371328, 'steps': 17558, 'loss/train': 2.0964815616607666} -11/06/2021 23:43:43 - INFO - __main__ - Step 17560: {'lr': 0.00048648866047973756, 'samples': 3371520, 'steps': 17559, 'loss/train': 1.6892518997192383} -11/06/2021 23:43:43 - INFO - __main__ - Step 17561: {'lr': 0.000486486939454786, 'samples': 3371712, 'steps': 17560, 'loss/train': 1.6873033046722412} -11/06/2021 23:43:44 - INFO - __main__ - Step 17562: {'lr': 0.0004864852183232771, 'samples': 3371904, 'steps': 17561, 'loss/train': 1.7886723279953003} -11/06/2021 23:43:45 - INFO - __main__ - Step 17563: {'lr': 0.0004864834970852116, 'samples': 3372096, 'steps': 17562, 'loss/train': 1.7234721183776855} -11/06/2021 23:43:45 - INFO - __main__ - Step 17564: {'lr': 0.0004864817757405903, 'samples': 3372288, 'steps': 17563, 'loss/train': 1.9006706476211548} -11/06/2021 23:43:45 - INFO - __main__ - Step 17565: {'lr': 0.0004864800542894139, 'samples': 3372480, 'steps': 17564, 'loss/train': 1.8513051271438599} -11/06/2021 23:43:46 - INFO - __main__ - Step 17566: {'lr': 0.0004864783327316833, 'samples': 3372672, 'steps': 17565, 'loss/train': 1.8104248046875} -11/06/2021 23:43:46 - INFO - __main__ - Step 17567: {'lr': 0.0004864766110673992, 'samples': 3372864, 'steps': 17566, 'loss/train': 1.8728556632995605} -11/06/2021 23:43:47 - INFO - __main__ - Step 17568: {'lr': 0.00048647488929656237, 'samples': 3373056, 'steps': 17567, 'loss/train': 2.102489709854126} -11/06/2021 23:43:47 - INFO - __main__ - Step 17569: {'lr': 0.00048647316741917365, 'samples': 3373248, 'steps': 17568, 'loss/train': 1.702294945716858} -11/06/2021 23:43:48 - INFO - __main__ - Step 17570: {'lr': 0.0004864714454352337, 'samples': 3373440, 'steps': 17569, 'loss/train': 1.3519634008407593} -11/06/2021 23:43:48 - INFO - __main__ - Step 17571: {'lr': 0.00048646972334474343, 'samples': 3373632, 'steps': 17570, 'loss/train': 1.59146249294281} -11/06/2021 23:43:49 - INFO - __main__ - Step 17572: {'lr': 0.0004864680011477035, 'samples': 3373824, 'steps': 17571, 'loss/train': 2.0730271339416504} -11/06/2021 23:43:50 - INFO - __main__ - Step 17573: {'lr': 0.00048646627884411475, 'samples': 3374016, 'steps': 17572, 'loss/train': 1.1947308778762817} -11/06/2021 23:43:50 - INFO - __main__ - Step 17574: {'lr': 0.00048646455643397803, 'samples': 3374208, 'steps': 17573, 'loss/train': 1.3798284530639648} -11/06/2021 23:43:50 - INFO - __main__ - Step 17575: {'lr': 0.0004864628339172939, 'samples': 3374400, 'steps': 17574, 'loss/train': 1.0694053173065186} -11/06/2021 23:43:51 - INFO - __main__ - Step 17576: {'lr': 0.00048646111129406336, 'samples': 3374592, 'steps': 17575, 'loss/train': 1.4696110486984253} -11/06/2021 23:43:51 - INFO - __main__ - Step 17577: {'lr': 0.00048645938856428704, 'samples': 3374784, 'steps': 17576, 'loss/train': 1.9787176847457886} -11/06/2021 23:43:52 - INFO - __main__ - Step 17578: {'lr': 0.0004864576657279658, 'samples': 3374976, 'steps': 17577, 'loss/train': 1.9284498691558838} -11/06/2021 23:43:52 - INFO - __main__ - Step 17579: {'lr': 0.0004864559427851003, 'samples': 3375168, 'steps': 17578, 'loss/train': 1.340123176574707} -11/06/2021 23:43:53 - INFO - __main__ - Step 17580: {'lr': 0.0004864542197356915, 'samples': 3375360, 'steps': 17579, 'loss/train': 1.7503732442855835} -11/06/2021 23:43:53 - INFO - __main__ - Step 17581: {'lr': 0.00048645249657974007, 'samples': 3375552, 'steps': 17580, 'loss/train': 1.566757082939148} -11/06/2021 23:43:53 - INFO - __main__ - Step 17582: {'lr': 0.00048645077331724675, 'samples': 3375744, 'steps': 17581, 'loss/train': 1.6894330978393555} -11/06/2021 23:43:54 - INFO - __main__ - Step 17583: {'lr': 0.00048644904994821236, 'samples': 3375936, 'steps': 17582, 'loss/train': 1.7292306423187256} -11/06/2021 23:43:55 - INFO - __main__ - Step 17584: {'lr': 0.0004864473264726377, 'samples': 3376128, 'steps': 17583, 'loss/train': 1.413895606994629} -11/06/2021 23:43:55 - INFO - __main__ - Step 17585: {'lr': 0.00048644560289052354, 'samples': 3376320, 'steps': 17584, 'loss/train': 0.6992756128311157} -11/06/2021 23:43:55 - INFO - __main__ - Step 17586: {'lr': 0.0004864438792018706, 'samples': 3376512, 'steps': 17585, 'loss/train': 1.55809485912323} -11/06/2021 23:43:56 - INFO - __main__ - Step 17587: {'lr': 0.0004864421554066797, 'samples': 3376704, 'steps': 17586, 'loss/train': 1.9367111921310425} -11/06/2021 23:43:56 - INFO - __main__ - Step 17588: {'lr': 0.00048644043150495165, 'samples': 3376896, 'steps': 17587, 'loss/train': 1.8680219650268555} -11/06/2021 23:43:57 - INFO - __main__ - Step 17589: {'lr': 0.00048643870749668717, 'samples': 3377088, 'steps': 17588, 'loss/train': 1.4389081001281738} -11/06/2021 23:43:58 - INFO - __main__ - Step 17590: {'lr': 0.000486436983381887, 'samples': 3377280, 'steps': 17589, 'loss/train': 1.7606362104415894} -11/06/2021 23:43:58 - INFO - __main__ - Step 17591: {'lr': 0.0004864352591605521, 'samples': 3377472, 'steps': 17590, 'loss/train': 1.7748441696166992} -11/06/2021 23:43:58 - INFO - __main__ - Step 17592: {'lr': 0.00048643353483268306, 'samples': 3377664, 'steps': 17591, 'loss/train': 1.770916223526001} -11/06/2021 23:43:59 - INFO - __main__ - Step 17593: {'lr': 0.00048643181039828066, 'samples': 3377856, 'steps': 17592, 'loss/train': 1.82923424243927} -11/06/2021 23:44:00 - INFO - __main__ - Step 17594: {'lr': 0.00048643008585734575, 'samples': 3378048, 'steps': 17593, 'loss/train': 1.802532434463501} -11/06/2021 23:44:00 - INFO - __main__ - Step 17595: {'lr': 0.00048642836120987913, 'samples': 3378240, 'steps': 17594, 'loss/train': 2.2226874828338623} -11/06/2021 23:44:00 - INFO - __main__ - Step 17596: {'lr': 0.0004864266364558816, 'samples': 3378432, 'steps': 17595, 'loss/train': 1.8610355854034424} -11/06/2021 23:44:01 - INFO - __main__ - Step 17597: {'lr': 0.00048642491159535373, 'samples': 3378624, 'steps': 17596, 'loss/train': 1.6837226152420044} -11/06/2021 23:44:01 - INFO - __main__ - Step 17598: {'lr': 0.0004864231866282965, 'samples': 3378816, 'steps': 17597, 'loss/train': 2.052727460861206} -11/06/2021 23:44:02 - INFO - __main__ - Step 17599: {'lr': 0.0004864214615547107, 'samples': 3379008, 'steps': 17598, 'loss/train': 0.28922533988952637} -11/06/2021 23:44:02 - INFO - __main__ - Step 17600: {'lr': 0.000486419736374597, 'samples': 3379200, 'steps': 17599, 'loss/train': 1.3674170970916748} -11/06/2021 23:44:03 - INFO - __main__ - Step 17601: {'lr': 0.0004864180110879562, 'samples': 3379392, 'steps': 17600, 'loss/train': 1.1933001279830933} -11/06/2021 23:44:03 - INFO - __main__ - Step 17602: {'lr': 0.00048641628569478916, 'samples': 3379584, 'steps': 17601, 'loss/train': 1.8393548727035522} -11/06/2021 23:44:03 - INFO - __main__ - Step 17603: {'lr': 0.00048641456019509643, 'samples': 3379776, 'steps': 17602, 'loss/train': 1.6176362037658691} -11/06/2021 23:44:04 - INFO - __main__ - Step 17604: {'lr': 0.0004864128345888791, 'samples': 3379968, 'steps': 17603, 'loss/train': 1.574226975440979} -11/06/2021 23:44:05 - INFO - __main__ - Step 17605: {'lr': 0.0004864111088761377, 'samples': 3380160, 'steps': 17604, 'loss/train': 1.8493263721466064} -11/06/2021 23:44:05 - INFO - __main__ - Step 17606: {'lr': 0.00048640938305687315, 'samples': 3380352, 'steps': 17605, 'loss/train': 1.4664735794067383} -11/06/2021 23:44:06 - INFO - __main__ - Step 17607: {'lr': 0.00048640765713108615, 'samples': 3380544, 'steps': 17606, 'loss/train': 0.9904863238334656} -11/06/2021 23:44:06 - INFO - __main__ - Step 17608: {'lr': 0.00048640593109877754, 'samples': 3380736, 'steps': 17607, 'loss/train': 1.7418029308319092} -11/06/2021 23:44:07 - INFO - __main__ - Step 17609: {'lr': 0.00048640420495994806, 'samples': 3380928, 'steps': 17608, 'loss/train': 1.5066266059875488} -11/06/2021 23:44:07 - INFO - __main__ - Step 17610: {'lr': 0.0004864024787145985, 'samples': 3381120, 'steps': 17609, 'loss/train': 1.6443487405776978} -11/06/2021 23:44:08 - INFO - __main__ - Step 17611: {'lr': 0.00048640075236272963, 'samples': 3381312, 'steps': 17610, 'loss/train': 1.636483073234558} -11/06/2021 23:44:08 - INFO - __main__ - Step 17612: {'lr': 0.00048639902590434214, 'samples': 3381504, 'steps': 17611, 'loss/train': 2.005004405975342} -11/06/2021 23:44:08 - INFO - __main__ - Step 17613: {'lr': 0.000486397299339437, 'samples': 3381696, 'steps': 17612, 'loss/train': 1.4395687580108643} -11/06/2021 23:44:09 - INFO - __main__ - Step 17614: {'lr': 0.0004863955726680149, 'samples': 3381888, 'steps': 17613, 'loss/train': 1.2516988515853882} -11/06/2021 23:44:10 - INFO - __main__ - Step 17615: {'lr': 0.0004863938458900765, 'samples': 3382080, 'steps': 17614, 'loss/train': 1.3464889526367188} -11/06/2021 23:44:10 - INFO - __main__ - Step 17616: {'lr': 0.0004863921190056227, 'samples': 3382272, 'steps': 17615, 'loss/train': 1.286136507987976} -11/06/2021 23:44:10 - INFO - __main__ - Step 17617: {'lr': 0.0004863903920146544, 'samples': 3382464, 'steps': 17616, 'loss/train': 2.09637188911438} -11/06/2021 23:44:11 - INFO - __main__ - Step 17618: {'lr': 0.00048638866491717214, 'samples': 3382656, 'steps': 17617, 'loss/train': 1.8491672277450562} -11/06/2021 23:44:12 - INFO - __main__ - Step 17619: {'lr': 0.00048638693771317675, 'samples': 3382848, 'steps': 17618, 'loss/train': 1.8306879997253418} -11/06/2021 23:44:12 - INFO - __main__ - Step 17620: {'lr': 0.0004863852104026691, 'samples': 3383040, 'steps': 17619, 'loss/train': 2.254307746887207} -11/06/2021 23:44:12 - INFO - __main__ - Step 17621: {'lr': 0.00048638348298564996, 'samples': 3383232, 'steps': 17620, 'loss/train': 1.5837358236312866} -11/06/2021 23:44:13 - INFO - __main__ - Step 17622: {'lr': 0.00048638175546212, 'samples': 3383424, 'steps': 17621, 'loss/train': 1.2425532341003418} -11/06/2021 23:44:13 - INFO - __main__ - Step 17623: {'lr': 0.00048638002783208013, 'samples': 3383616, 'steps': 17622, 'loss/train': 1.2094799280166626} -11/06/2021 23:44:13 - INFO - __main__ - Step 17624: {'lr': 0.000486378300095531, 'samples': 3383808, 'steps': 17623, 'loss/train': 1.8858073949813843} -11/06/2021 23:44:15 - INFO - __main__ - Step 17625: {'lr': 0.0004863765722524735, 'samples': 3384000, 'steps': 17624, 'loss/train': 1.8143595457077026} -11/06/2021 23:44:15 - INFO - __main__ - Step 17626: {'lr': 0.0004863748443029083, 'samples': 3384192, 'steps': 17625, 'loss/train': 1.8148971796035767} -11/06/2021 23:44:15 - INFO - __main__ - Step 17627: {'lr': 0.00048637311624683634, 'samples': 3384384, 'steps': 17626, 'loss/train': 1.8352149724960327} -11/06/2021 23:44:16 - INFO - __main__ - Step 17628: {'lr': 0.0004863713880842583, 'samples': 3384576, 'steps': 17627, 'loss/train': 1.9543405771255493} -11/06/2021 23:44:16 - INFO - __main__ - Step 17629: {'lr': 0.0004863696598151749, 'samples': 3384768, 'steps': 17628, 'loss/train': 1.5006835460662842} -11/06/2021 23:44:17 - INFO - __main__ - Step 17630: {'lr': 0.00048636793143958695, 'samples': 3384960, 'steps': 17629, 'loss/train': 1.918142318725586} -11/06/2021 23:44:17 - INFO - __main__ - Step 17631: {'lr': 0.00048636620295749533, 'samples': 3385152, 'steps': 17630, 'loss/train': 1.7116636037826538} -11/06/2021 23:44:18 - INFO - __main__ - Step 17632: {'lr': 0.00048636447436890075, 'samples': 3385344, 'steps': 17631, 'loss/train': 2.3437066078186035} -11/06/2021 23:44:18 - INFO - __main__ - Step 17633: {'lr': 0.0004863627456738039, 'samples': 3385536, 'steps': 17632, 'loss/train': 1.3445450067520142} -11/06/2021 23:44:18 - INFO - __main__ - Step 17634: {'lr': 0.00048636101687220566, 'samples': 3385728, 'steps': 17633, 'loss/train': 1.811186671257019} -11/06/2021 23:44:20 - INFO - __main__ - Step 17635: {'lr': 0.0004863592879641069, 'samples': 3385920, 'steps': 17634, 'loss/train': 1.7794731855392456} -11/06/2021 23:44:20 - INFO - __main__ - Step 17636: {'lr': 0.0004863575589495082, 'samples': 3386112, 'steps': 17635, 'loss/train': 0.17728441953659058} -11/06/2021 23:44:20 - INFO - __main__ - Step 17637: {'lr': 0.00048635582982841047, 'samples': 3386304, 'steps': 17636, 'loss/train': 1.6846859455108643} -11/06/2021 23:44:21 - INFO - __main__ - Step 17638: {'lr': 0.0004863541006008144, 'samples': 3386496, 'steps': 17637, 'loss/train': 1.8092470169067383} -11/06/2021 23:44:21 - INFO - __main__ - Step 17639: {'lr': 0.0004863523712667209, 'samples': 3386688, 'steps': 17638, 'loss/train': 5.441341400146484} -11/06/2021 23:44:22 - INFO - __main__ - Step 17640: {'lr': 0.00048635064182613063, 'samples': 3386880, 'steps': 17639, 'loss/train': 1.7276121377944946} -11/06/2021 23:44:22 - INFO - __main__ - Step 17641: {'lr': 0.00048634891227904435, 'samples': 3387072, 'steps': 17640, 'loss/train': 1.31169855594635} -11/06/2021 23:44:23 - INFO - __main__ - Step 17642: {'lr': 0.00048634718262546297, 'samples': 3387264, 'steps': 17641, 'loss/train': 1.7238352298736572} -11/06/2021 23:44:23 - INFO - __main__ - Step 17643: {'lr': 0.0004863454528653872, 'samples': 3387456, 'steps': 17642, 'loss/train': 1.691017985343933} -11/06/2021 23:44:23 - INFO - __main__ - Step 17644: {'lr': 0.0004863437229988178, 'samples': 3387648, 'steps': 17643, 'loss/train': 1.94411301612854} -11/06/2021 23:44:24 - INFO - __main__ - Step 17645: {'lr': 0.00048634199302575554, 'samples': 3387840, 'steps': 17644, 'loss/train': 2.1407902240753174} -11/06/2021 23:44:25 - INFO - __main__ - Step 17646: {'lr': 0.00048634026294620125, 'samples': 3388032, 'steps': 17645, 'loss/train': 1.1031410694122314} -11/06/2021 23:44:25 - INFO - __main__ - Step 17647: {'lr': 0.00048633853276015566, 'samples': 3388224, 'steps': 17646, 'loss/train': 1.7941488027572632} -11/06/2021 23:44:25 - INFO - __main__ - Step 17648: {'lr': 0.00048633680246761956, 'samples': 3388416, 'steps': 17647, 'loss/train': 1.232820987701416} -11/06/2021 23:44:26 - INFO - __main__ - Step 17649: {'lr': 0.00048633507206859383, 'samples': 3388608, 'steps': 17648, 'loss/train': 1.629302740097046} -11/06/2021 23:44:26 - INFO - __main__ - Step 17650: {'lr': 0.00048633334156307907, 'samples': 3388800, 'steps': 17649, 'loss/train': 1.1769516468048096} -11/06/2021 23:44:27 - INFO - __main__ - Step 17651: {'lr': 0.0004863316109510762, 'samples': 3388992, 'steps': 17650, 'loss/train': 1.9917153120040894} -11/06/2021 23:44:28 - INFO - __main__ - Step 17652: {'lr': 0.00048632988023258596, 'samples': 3389184, 'steps': 17651, 'loss/train': 1.4906460046768188} -11/06/2021 23:44:28 - INFO - __main__ - Step 17653: {'lr': 0.00048632814940760907, 'samples': 3389376, 'steps': 17652, 'loss/train': 1.6637530326843262} -11/06/2021 23:44:28 - INFO - __main__ - Step 17654: {'lr': 0.00048632641847614645, 'samples': 3389568, 'steps': 17653, 'loss/train': 1.3956372737884521} -11/06/2021 23:44:29 - INFO - __main__ - Step 17655: {'lr': 0.0004863246874381987, 'samples': 3389760, 'steps': 17654, 'loss/train': 1.1515908241271973} -11/06/2021 23:44:30 - INFO - __main__ - Step 17656: {'lr': 0.00048632295629376675, 'samples': 3389952, 'steps': 17655, 'loss/train': 1.2790088653564453} -11/06/2021 23:44:30 - INFO - __main__ - Step 17657: {'lr': 0.00048632122504285133, 'samples': 3390144, 'steps': 17656, 'loss/train': 1.4435092210769653} -11/06/2021 23:44:31 - INFO - __main__ - Step 17658: {'lr': 0.0004863194936854531, 'samples': 3390336, 'steps': 17657, 'loss/train': 1.6653163433074951} -11/06/2021 23:44:31 - INFO - __main__ - Step 17659: {'lr': 0.0004863177622215731, 'samples': 3390528, 'steps': 17658, 'loss/train': 1.276356816291809} -11/06/2021 23:44:31 - INFO - __main__ - Step 17660: {'lr': 0.00048631603065121186, 'samples': 3390720, 'steps': 17659, 'loss/train': 0.5060484409332275} -11/06/2021 23:44:32 - INFO - __main__ - Step 17661: {'lr': 0.00048631429897437033, 'samples': 3390912, 'steps': 17660, 'loss/train': 1.867882251739502} -11/06/2021 23:44:33 - INFO - __main__ - Step 17662: {'lr': 0.0004863125671910492, 'samples': 3391104, 'steps': 17661, 'loss/train': 1.676186203956604} -11/06/2021 23:44:33 - INFO - __main__ - Step 17663: {'lr': 0.00048631083530124934, 'samples': 3391296, 'steps': 17662, 'loss/train': 1.7655481100082397} -11/06/2021 23:44:33 - INFO - __main__ - Step 17664: {'lr': 0.00048630910330497133, 'samples': 3391488, 'steps': 17663, 'loss/train': 2.426825523376465} -11/06/2021 23:44:34 - INFO - __main__ - Step 17665: {'lr': 0.0004863073712022162, 'samples': 3391680, 'steps': 17664, 'loss/train': 1.5191713571548462} -11/06/2021 23:44:34 - INFO - __main__ - Step 17666: {'lr': 0.00048630563899298453, 'samples': 3391872, 'steps': 17665, 'loss/train': 1.772326946258545} -11/06/2021 23:44:35 - INFO - __main__ - Step 17667: {'lr': 0.00048630390667727725, 'samples': 3392064, 'steps': 17666, 'loss/train': 2.8871684074401855} -11/06/2021 23:44:35 - INFO - __main__ - Step 17668: {'lr': 0.00048630217425509503, 'samples': 3392256, 'steps': 17667, 'loss/train': 1.6198441982269287} -11/06/2021 23:44:36 - INFO - __main__ - Step 17669: {'lr': 0.00048630044172643874, 'samples': 3392448, 'steps': 17668, 'loss/train': 1.4763474464416504} -11/06/2021 23:44:36 - INFO - __main__ - Step 17670: {'lr': 0.0004862987090913091, 'samples': 3392640, 'steps': 17669, 'loss/train': 1.4978746175765991} -11/06/2021 23:44:37 - INFO - __main__ - Step 17671: {'lr': 0.0004862969763497069, 'samples': 3392832, 'steps': 17670, 'loss/train': 1.3769848346710205} -11/06/2021 23:44:38 - INFO - __main__ - Step 17672: {'lr': 0.0004862952435016329, 'samples': 3393024, 'steps': 17671, 'loss/train': 1.7096163034439087} -11/06/2021 23:44:38 - INFO - __main__ - Step 17673: {'lr': 0.00048629351054708795, 'samples': 3393216, 'steps': 17672, 'loss/train': 0.3188741207122803} -11/06/2021 23:44:38 - INFO - __main__ - Step 17674: {'lr': 0.0004862917774860728, 'samples': 3393408, 'steps': 17673, 'loss/train': 1.1482633352279663} -11/06/2021 23:44:39 - INFO - __main__ - Step 17675: {'lr': 0.0004862900443185882, 'samples': 3393600, 'steps': 17674, 'loss/train': 1.705519199371338} -11/06/2021 23:44:39 - INFO - __main__ - Step 17676: {'lr': 0.00048628831104463496, 'samples': 3393792, 'steps': 17675, 'loss/train': 1.3742202520370483} -11/06/2021 23:44:40 - INFO - __main__ - Step 17677: {'lr': 0.0004862865776642138, 'samples': 3393984, 'steps': 17676, 'loss/train': 1.4632993936538696} -11/06/2021 23:44:40 - INFO - __main__ - Step 17678: {'lr': 0.00048628484417732567, 'samples': 3394176, 'steps': 17677, 'loss/train': 1.8968327045440674} -11/06/2021 23:44:41 - INFO - __main__ - Step 17679: {'lr': 0.00048628311058397113, 'samples': 3394368, 'steps': 17678, 'loss/train': 1.8257449865341187} -11/06/2021 23:44:41 - INFO - __main__ - Step 17680: {'lr': 0.0004862813768841511, 'samples': 3394560, 'steps': 17679, 'loss/train': 1.2477961778640747} -11/06/2021 23:44:41 - INFO - __main__ - Step 17681: {'lr': 0.0004862796430778663, 'samples': 3394752, 'steps': 17680, 'loss/train': 1.7231652736663818} -11/06/2021 23:44:42 - INFO - __main__ - Step 17682: {'lr': 0.0004862779091651176, 'samples': 3394944, 'steps': 17681, 'loss/train': 1.2031580209732056} -11/06/2021 23:44:44 - INFO - __main__ - Step 17683: {'lr': 0.0004862761751459057, 'samples': 3395136, 'steps': 17682, 'loss/train': 1.4472994804382324} -11/06/2021 23:44:44 - INFO - __main__ - Step 17684: {'lr': 0.0004862744410202314, 'samples': 3395328, 'steps': 17683, 'loss/train': 1.509667158126831} -11/06/2021 23:44:44 - INFO - __main__ - Step 17685: {'lr': 0.00048627270678809544, 'samples': 3395520, 'steps': 17684, 'loss/train': 1.8475730419158936} -11/06/2021 23:44:45 - INFO - __main__ - Step 17686: {'lr': 0.0004862709724494987, 'samples': 3395712, 'steps': 17685, 'loss/train': 0.83989018201828} -11/06/2021 23:44:45 - INFO - __main__ - Step 17687: {'lr': 0.0004862692380044419, 'samples': 3395904, 'steps': 17686, 'loss/train': 0.8706456422805786} -11/06/2021 23:44:45 - INFO - __main__ - Step 17688: {'lr': 0.0004862675034529258, 'samples': 3396096, 'steps': 17687, 'loss/train': 2.1186492443084717} -11/06/2021 23:44:46 - INFO - __main__ - Step 17689: {'lr': 0.0004862657687949512, 'samples': 3396288, 'steps': 17688, 'loss/train': 1.95449960231781} -11/06/2021 23:44:47 - INFO - __main__ - Step 17690: {'lr': 0.00048626403403051894, 'samples': 3396480, 'steps': 17689, 'loss/train': 1.7684614658355713} -11/06/2021 23:44:47 - INFO - __main__ - Step 17691: {'lr': 0.00048626229915962974, 'samples': 3396672, 'steps': 17690, 'loss/train': 1.9429171085357666} -11/06/2021 23:44:47 - INFO - __main__ - Step 17692: {'lr': 0.00048626056418228436, 'samples': 3396864, 'steps': 17691, 'loss/train': 1.7060483694076538} -11/06/2021 23:44:48 - INFO - __main__ - Step 17693: {'lr': 0.0004862588290984836, 'samples': 3397056, 'steps': 17692, 'loss/train': 1.6680606603622437} -11/06/2021 23:44:48 - INFO - __main__ - Step 17694: {'lr': 0.0004862570939082283, 'samples': 3397248, 'steps': 17693, 'loss/train': 1.6972788572311401} -11/06/2021 23:44:49 - INFO - __main__ - Step 17695: {'lr': 0.0004862553586115192, 'samples': 3397440, 'steps': 17694, 'loss/train': 1.4430689811706543} -11/06/2021 23:44:49 - INFO - __main__ - Step 17696: {'lr': 0.00048625362320835707, 'samples': 3397632, 'steps': 17695, 'loss/train': 1.8841452598571777} -11/06/2021 23:44:50 - INFO - __main__ - Step 17697: {'lr': 0.00048625188769874274, 'samples': 3397824, 'steps': 17696, 'loss/train': 1.7126444578170776} -11/06/2021 23:44:50 - INFO - __main__ - Step 17698: {'lr': 0.0004862501520826769, 'samples': 3398016, 'steps': 17697, 'loss/train': 1.623423457145691} -11/06/2021 23:44:50 - INFO - __main__ - Step 17699: {'lr': 0.0004862484163601604, 'samples': 3398208, 'steps': 17698, 'loss/train': 1.2866634130477905} -11/06/2021 23:44:51 - INFO - __main__ - Step 17700: {'lr': 0.000486246680531194, 'samples': 3398400, 'steps': 17699, 'loss/train': 1.8399791717529297} -11/06/2021 23:44:52 - INFO - __main__ - Step 17701: {'lr': 0.0004862449445957785, 'samples': 3398592, 'steps': 17700, 'loss/train': 2.2770066261291504} -11/06/2021 23:44:52 - INFO - __main__ - Step 17702: {'lr': 0.00048624320855391467, 'samples': 3398784, 'steps': 17701, 'loss/train': 1.8665575981140137} -11/06/2021 23:44:53 - INFO - __main__ - Step 17703: {'lr': 0.00048624147240560335, 'samples': 3398976, 'steps': 17702, 'loss/train': 1.7524605989456177} -11/06/2021 23:44:53 - INFO - __main__ - Step 17704: {'lr': 0.00048623973615084516, 'samples': 3399168, 'steps': 17703, 'loss/train': 1.6480399370193481} -11/06/2021 23:44:53 - INFO - __main__ - Step 17705: {'lr': 0.0004862379997896411, 'samples': 3399360, 'steps': 17704, 'loss/train': 1.4674162864685059} -11/06/2021 23:44:55 - INFO - __main__ - Step 17706: {'lr': 0.0004862362633219918, 'samples': 3399552, 'steps': 17705, 'loss/train': 1.4373513460159302} -11/06/2021 23:44:55 - INFO - __main__ - Step 17707: {'lr': 0.000486234526747898, 'samples': 3399744, 'steps': 17706, 'loss/train': 1.3480507135391235} -11/06/2021 23:44:55 - INFO - __main__ - Step 17708: {'lr': 0.0004862327900673607, 'samples': 3399936, 'steps': 17707, 'loss/train': 1.7012041807174683} -11/06/2021 23:44:56 - INFO - __main__ - Step 17709: {'lr': 0.00048623105328038054, 'samples': 3400128, 'steps': 17708, 'loss/train': 1.5123977661132812} -11/06/2021 23:44:56 - INFO - __main__ - Step 17710: {'lr': 0.0004862293163869582, 'samples': 3400320, 'steps': 17709, 'loss/train': 1.932036280632019} -11/06/2021 23:44:56 - INFO - __main__ - Step 17711: {'lr': 0.00048622757938709466, 'samples': 3400512, 'steps': 17710, 'loss/train': 1.562470555305481} -11/06/2021 23:44:57 - INFO - __main__ - Step 17712: {'lr': 0.0004862258422807906, 'samples': 3400704, 'steps': 17711, 'loss/train': 2.740880012512207} -11/06/2021 23:44:58 - INFO - __main__ - Step 17713: {'lr': 0.0004862241050680468, 'samples': 3400896, 'steps': 17712, 'loss/train': 1.3904601335525513} -11/06/2021 23:44:58 - INFO - __main__ - Step 17714: {'lr': 0.00048622236774886415, 'samples': 3401088, 'steps': 17713, 'loss/train': 1.7398821115493774} -11/06/2021 23:44:59 - INFO - __main__ - Step 17715: {'lr': 0.00048622063032324324, 'samples': 3401280, 'steps': 17714, 'loss/train': 1.4588117599487305} -11/06/2021 23:44:59 - INFO - __main__ - Step 17716: {'lr': 0.000486218892791185, 'samples': 3401472, 'steps': 17715, 'loss/train': 1.9582970142364502} -11/06/2021 23:45:00 - INFO - __main__ - Step 17717: {'lr': 0.00048621715515269017, 'samples': 3401664, 'steps': 17716, 'loss/train': 1.8855799436569214} -11/06/2021 23:45:00 - INFO - __main__ - Step 17718: {'lr': 0.0004862154174077595, 'samples': 3401856, 'steps': 17717, 'loss/train': 1.602186918258667} -11/06/2021 23:45:01 - INFO - __main__ - Step 17719: {'lr': 0.00048621367955639395, 'samples': 3402048, 'steps': 17718, 'loss/train': 1.7233091592788696} -11/06/2021 23:45:01 - INFO - __main__ - Step 17720: {'lr': 0.00048621194159859403, 'samples': 3402240, 'steps': 17719, 'loss/train': 1.776808738708496} -11/06/2021 23:45:01 - INFO - __main__ - Step 17721: {'lr': 0.0004862102035343607, 'samples': 3402432, 'steps': 17720, 'loss/train': 1.7947196960449219} -11/06/2021 23:45:02 - INFO - __main__ - Step 17722: {'lr': 0.0004862084653636947, 'samples': 3402624, 'steps': 17721, 'loss/train': 1.6159709692001343} -11/06/2021 23:45:03 - INFO - __main__ - Step 17723: {'lr': 0.00048620672708659675, 'samples': 3402816, 'steps': 17722, 'loss/train': 1.3404769897460938} -11/06/2021 23:45:03 - INFO - __main__ - Step 17724: {'lr': 0.0004862049887030677, 'samples': 3403008, 'steps': 17723, 'loss/train': 1.8909834623336792} -11/06/2021 23:45:04 - INFO - __main__ - Step 17725: {'lr': 0.0004862032502131084, 'samples': 3403200, 'steps': 17724, 'loss/train': 1.3636215925216675} -11/06/2021 23:45:04 - INFO - __main__ - Step 17726: {'lr': 0.00048620151161671955, 'samples': 3403392, 'steps': 17725, 'loss/train': 1.3039368391036987} -11/06/2021 23:45:04 - INFO - __main__ - Step 17727: {'lr': 0.00048619977291390186, 'samples': 3403584, 'steps': 17726, 'loss/train': 1.5515477657318115} -11/06/2021 23:45:05 - INFO - __main__ - Step 17728: {'lr': 0.00048619803410465624, 'samples': 3403776, 'steps': 17727, 'loss/train': 1.6064467430114746} -11/06/2021 23:45:06 - INFO - __main__ - Step 17729: {'lr': 0.00048619629518898344, 'samples': 3403968, 'steps': 17728, 'loss/train': 1.9508514404296875} -11/06/2021 23:45:06 - INFO - __main__ - Step 17730: {'lr': 0.00048619455616688426, 'samples': 3404160, 'steps': 17729, 'loss/train': 1.5443555116653442} -11/06/2021 23:45:06 - INFO - __main__ - Step 17731: {'lr': 0.0004861928170383594, 'samples': 3404352, 'steps': 17730, 'loss/train': 2.0993919372558594} -11/06/2021 23:45:07 - INFO - __main__ - Step 17732: {'lr': 0.0004861910778034098, 'samples': 3404544, 'steps': 17731, 'loss/train': 1.164543628692627} -11/06/2021 23:45:08 - INFO - __main__ - Step 17733: {'lr': 0.00048618933846203606, 'samples': 3404736, 'steps': 17732, 'loss/train': 1.5191380977630615} -11/06/2021 23:45:08 - INFO - __main__ - Step 17734: {'lr': 0.00048618759901423905, 'samples': 3404928, 'steps': 17733, 'loss/train': 1.3447216749191284} -11/06/2021 23:45:08 - INFO - __main__ - Step 17735: {'lr': 0.0004861858594600196, 'samples': 3405120, 'steps': 17734, 'loss/train': 1.69388747215271} -11/06/2021 23:45:09 - INFO - __main__ - Step 17736: {'lr': 0.0004861841197993784, 'samples': 3405312, 'steps': 17735, 'loss/train': 1.55830979347229} -11/06/2021 23:45:09 - INFO - __main__ - Step 17737: {'lr': 0.0004861823800323163, 'samples': 3405504, 'steps': 17736, 'loss/train': 1.009899377822876} -11/06/2021 23:45:10 - INFO - __main__ - Step 17738: {'lr': 0.00048618064015883405, 'samples': 3405696, 'steps': 17737, 'loss/train': 1.4308483600616455} -11/06/2021 23:45:10 - INFO - __main__ - Step 17739: {'lr': 0.0004861789001789325, 'samples': 3405888, 'steps': 17738, 'loss/train': 1.650288462638855} -11/06/2021 23:45:11 - INFO - __main__ - Step 17740: {'lr': 0.00048617716009261236, 'samples': 3406080, 'steps': 17739, 'loss/train': 1.3938745260238647} -11/06/2021 23:45:11 - INFO - __main__ - Step 17741: {'lr': 0.00048617541989987435, 'samples': 3406272, 'steps': 17740, 'loss/train': 2.2797935009002686} -11/06/2021 23:45:11 - INFO - __main__ - Step 17742: {'lr': 0.00048617367960071946, 'samples': 3406464, 'steps': 17741, 'loss/train': 1.6652027368545532} -11/06/2021 23:45:12 - INFO - __main__ - Step 17743: {'lr': 0.0004861719391951483, 'samples': 3406656, 'steps': 17742, 'loss/train': 2.367107629776001} -11/06/2021 23:45:13 - INFO - __main__ - Step 17744: {'lr': 0.0004861701986831617, 'samples': 3406848, 'steps': 17743, 'loss/train': 1.67668616771698} -11/06/2021 23:45:13 - INFO - __main__ - Step 17745: {'lr': 0.0004861684580647605, 'samples': 3407040, 'steps': 17744, 'loss/train': 1.9319639205932617} -11/06/2021 23:45:13 - INFO - __main__ - Step 17746: {'lr': 0.0004861667173399453, 'samples': 3407232, 'steps': 17745, 'loss/train': 1.9441924095153809} -11/06/2021 23:45:14 - INFO - __main__ - Step 17747: {'lr': 0.0004861649765087172, 'samples': 3407424, 'steps': 17746, 'loss/train': 1.659930944442749} -11/06/2021 23:45:15 - INFO - __main__ - Step 17748: {'lr': 0.0004861632355710767, 'samples': 3407616, 'steps': 17747, 'loss/train': 1.866965889930725} -11/06/2021 23:45:15 - INFO - __main__ - Step 17749: {'lr': 0.00048616149452702473, 'samples': 3407808, 'steps': 17748, 'loss/train': 1.0669561624526978} -11/06/2021 23:45:16 - INFO - __main__ - Step 17750: {'lr': 0.00048615975337656204, 'samples': 3408000, 'steps': 17749, 'loss/train': 1.2315871715545654} -11/06/2021 23:45:16 - INFO - __main__ - Step 17751: {'lr': 0.00048615801211968936, 'samples': 3408192, 'steps': 17750, 'loss/train': 1.1719317436218262} -11/06/2021 23:45:16 - INFO - __main__ - Step 17752: {'lr': 0.00048615627075640754, 'samples': 3408384, 'steps': 17751, 'loss/train': 1.6517837047576904} -11/06/2021 23:45:17 - INFO - __main__ - Step 17753: {'lr': 0.00048615452928671746, 'samples': 3408576, 'steps': 17752, 'loss/train': 1.3489247560501099} -11/06/2021 23:45:18 - INFO - __main__ - Step 17754: {'lr': 0.00048615278771061966, 'samples': 3408768, 'steps': 17753, 'loss/train': 1.8767962455749512} -11/06/2021 23:45:18 - INFO - __main__ - Step 17755: {'lr': 0.0004861510460281151, 'samples': 3408960, 'steps': 17754, 'loss/train': 1.8693060874938965} -11/06/2021 23:45:18 - INFO - __main__ - Step 17756: {'lr': 0.0004861493042392045, 'samples': 3409152, 'steps': 17755, 'loss/train': 1.853451132774353} -11/06/2021 23:45:19 - INFO - __main__ - Step 17757: {'lr': 0.00048614756234388866, 'samples': 3409344, 'steps': 17756, 'loss/train': 2.1281392574310303} -11/06/2021 23:45:19 - INFO - __main__ - Step 17758: {'lr': 0.00048614582034216844, 'samples': 3409536, 'steps': 17757, 'loss/train': 1.9277595281600952} -11/06/2021 23:45:20 - INFO - __main__ - Step 17759: {'lr': 0.0004861440782340445, 'samples': 3409728, 'steps': 17758, 'loss/train': 1.6594657897949219} -11/06/2021 23:45:20 - INFO - __main__ - Step 17760: {'lr': 0.0004861423360195177, 'samples': 3409920, 'steps': 17759, 'loss/train': 1.752420425415039} -11/06/2021 23:45:21 - INFO - __main__ - Step 17761: {'lr': 0.0004861405936985888, 'samples': 3410112, 'steps': 17760, 'loss/train': 1.9742324352264404} -11/06/2021 23:45:21 - INFO - __main__ - Step 17762: {'lr': 0.0004861388512712586, 'samples': 3410304, 'steps': 17761, 'loss/train': 1.6699413061141968} -11/06/2021 23:45:21 - INFO - __main__ - Step 17763: {'lr': 0.0004861371087375279, 'samples': 3410496, 'steps': 17762, 'loss/train': 1.9181797504425049} -11/06/2021 23:45:22 - INFO - __main__ - Step 17764: {'lr': 0.0004861353660973974, 'samples': 3410688, 'steps': 17763, 'loss/train': 2.064819812774658} -11/06/2021 23:45:23 - INFO - __main__ - Step 17765: {'lr': 0.00048613362335086797, 'samples': 3410880, 'steps': 17764, 'loss/train': 1.6789594888687134} -11/06/2021 23:45:23 - INFO - __main__ - Step 17766: {'lr': 0.00048613188049794045, 'samples': 3411072, 'steps': 17765, 'loss/train': 1.2881523370742798} -11/06/2021 23:45:23 - INFO - __main__ - Step 17767: {'lr': 0.00048613013753861546, 'samples': 3411264, 'steps': 17766, 'loss/train': 1.05593740940094} -11/06/2021 23:45:24 - INFO - __main__ - Step 17768: {'lr': 0.0004861283944728939, 'samples': 3411456, 'steps': 17767, 'loss/train': 1.651064395904541} -11/06/2021 23:45:25 - INFO - __main__ - Step 17769: {'lr': 0.0004861266513007765, 'samples': 3411648, 'steps': 17768, 'loss/train': 1.3704620599746704} -11/06/2021 23:45:25 - INFO - __main__ - Step 17770: {'lr': 0.00048612490802226415, 'samples': 3411840, 'steps': 17769, 'loss/train': 1.651924729347229} -11/06/2021 23:45:26 - INFO - __main__ - Step 17771: {'lr': 0.0004861231646373575, 'samples': 3412032, 'steps': 17770, 'loss/train': 1.6909313201904297} -11/06/2021 23:45:26 - INFO - __main__ - Step 17772: {'lr': 0.0004861214211460574, 'samples': 3412224, 'steps': 17771, 'loss/train': 1.8236727714538574} -11/06/2021 23:45:26 - INFO - __main__ - Step 17773: {'lr': 0.00048611967754836466, 'samples': 3412416, 'steps': 17772, 'loss/train': 1.6562209129333496} -11/06/2021 23:45:27 - INFO - __main__ - Step 17774: {'lr': 0.00048611793384428006, 'samples': 3412608, 'steps': 17773, 'loss/train': 1.7618428468704224} -11/06/2021 23:45:28 - INFO - __main__ - Step 17775: {'lr': 0.00048611619003380426, 'samples': 3412800, 'steps': 17774, 'loss/train': 1.5506091117858887} -11/06/2021 23:45:28 - INFO - __main__ - Step 17776: {'lr': 0.0004861144461169382, 'samples': 3412992, 'steps': 17775, 'loss/train': 1.73026442527771} -11/06/2021 23:45:28 - INFO - __main__ - Step 17777: {'lr': 0.00048611270209368264, 'samples': 3413184, 'steps': 17776, 'loss/train': 1.560634732246399} -11/06/2021 23:45:29 - INFO - __main__ - Step 17778: {'lr': 0.0004861109579640384, 'samples': 3413376, 'steps': 17777, 'loss/train': 1.7123799324035645} -11/06/2021 23:45:30 - INFO - __main__ - Step 17779: {'lr': 0.0004861092137280061, 'samples': 3413568, 'steps': 17778, 'loss/train': 2.3202054500579834} -11/06/2021 23:45:30 - INFO - __main__ - Step 17780: {'lr': 0.00048610746938558666, 'samples': 3413760, 'steps': 17779, 'loss/train': 1.6584490537643433} -11/06/2021 23:45:30 - INFO - __main__ - Step 17781: {'lr': 0.0004861057249367808, 'samples': 3413952, 'steps': 17780, 'loss/train': 1.4049021005630493} -11/06/2021 23:45:31 - INFO - __main__ - Step 17782: {'lr': 0.00048610398038158943, 'samples': 3414144, 'steps': 17781, 'loss/train': 1.194156527519226} -11/06/2021 23:45:31 - INFO - __main__ - Step 17783: {'lr': 0.00048610223572001315, 'samples': 3414336, 'steps': 17782, 'loss/train': 1.766744613647461} -11/06/2021 23:45:32 - INFO - __main__ - Step 17784: {'lr': 0.0004861004909520529, 'samples': 3414528, 'steps': 17783, 'loss/train': 1.6957181692123413} -11/06/2021 23:45:32 - INFO - __main__ - Step 17785: {'lr': 0.00048609874607770945, 'samples': 3414720, 'steps': 17784, 'loss/train': 1.5701578855514526} -11/06/2021 23:45:33 - INFO - __main__ - Step 17786: {'lr': 0.0004860970010969835, 'samples': 3414912, 'steps': 17785, 'loss/train': 1.456776738166809} -11/06/2021 23:45:33 - INFO - __main__ - Step 17787: {'lr': 0.0004860952560098759, 'samples': 3415104, 'steps': 17786, 'loss/train': 2.101297378540039} -11/06/2021 23:45:34 - INFO - __main__ - Step 17788: {'lr': 0.0004860935108163874, 'samples': 3415296, 'steps': 17787, 'loss/train': 1.8379590511322021} -11/06/2021 23:45:34 - INFO - __main__ - Step 17789: {'lr': 0.0004860917655165188, 'samples': 3415488, 'steps': 17788, 'loss/train': 1.5483107566833496} -11/06/2021 23:45:35 - INFO - __main__ - Step 17790: {'lr': 0.00048609002011027093, 'samples': 3415680, 'steps': 17789, 'loss/train': 1.2295900583267212} -11/06/2021 23:45:36 - INFO - __main__ - Step 17791: {'lr': 0.0004860882745976445, 'samples': 3415872, 'steps': 17790, 'loss/train': 1.2207252979278564} -11/06/2021 23:45:36 - INFO - __main__ - Step 17792: {'lr': 0.00048608652897864034, 'samples': 3416064, 'steps': 17791, 'loss/train': 1.811275601387024} -11/06/2021 23:45:36 - INFO - __main__ - Step 17793: {'lr': 0.0004860847832532593, 'samples': 3416256, 'steps': 17792, 'loss/train': 1.5424718856811523} -11/06/2021 23:45:37 - INFO - __main__ - Step 17794: {'lr': 0.00048608303742150204, 'samples': 3416448, 'steps': 17793, 'loss/train': 1.4225600957870483} -11/06/2021 23:45:37 - INFO - __main__ - Step 17795: {'lr': 0.0004860812914833694, 'samples': 3416640, 'steps': 17794, 'loss/train': 1.653011441230774} -11/06/2021 23:45:38 - INFO - __main__ - Step 17796: {'lr': 0.00048607954543886225, 'samples': 3416832, 'steps': 17795, 'loss/train': 1.1417803764343262} -11/06/2021 23:45:38 - INFO - __main__ - Step 17797: {'lr': 0.00048607779928798125, 'samples': 3417024, 'steps': 17796, 'loss/train': 1.5692245960235596} -11/06/2021 23:45:39 - INFO - __main__ - Step 17798: {'lr': 0.0004860760530307272, 'samples': 3417216, 'steps': 17797, 'loss/train': 2.135267734527588} -11/06/2021 23:45:39 - INFO - __main__ - Step 17799: {'lr': 0.00048607430666710097, 'samples': 3417408, 'steps': 17798, 'loss/train': 1.1966557502746582} -11/06/2021 23:45:40 - INFO - __main__ - Step 17800: {'lr': 0.00048607256019710327, 'samples': 3417600, 'steps': 17799, 'loss/train': 1.4628567695617676} -11/06/2021 23:45:41 - INFO - __main__ - Step 17801: {'lr': 0.0004860708136207349, 'samples': 3417792, 'steps': 17800, 'loss/train': 1.8049674034118652} -11/06/2021 23:45:42 - INFO - __main__ - Step 17802: {'lr': 0.0004860690669379967, 'samples': 3417984, 'steps': 17801, 'loss/train': 1.4776289463043213} -11/06/2021 23:45:42 - INFO - __main__ - Step 17803: {'lr': 0.00048606732014888946, 'samples': 3418176, 'steps': 17802, 'loss/train': 1.5583086013793945} -11/06/2021 23:45:42 - INFO - __main__ - Step 17804: {'lr': 0.0004860655732534138, 'samples': 3418368, 'steps': 17803, 'loss/train': 1.8255856037139893} -11/06/2021 23:45:43 - INFO - __main__ - Step 17805: {'lr': 0.00048606382625157075, 'samples': 3418560, 'steps': 17804, 'loss/train': 2.160865306854248} -11/06/2021 23:45:43 - INFO - __main__ - Step 17806: {'lr': 0.00048606207914336097, 'samples': 3418752, 'steps': 17805, 'loss/train': 1.7955251932144165} -11/06/2021 23:45:43 - INFO - __main__ - Step 17807: {'lr': 0.0004860603319287853, 'samples': 3418944, 'steps': 17806, 'loss/train': 1.7676409482955933} -11/06/2021 23:45:44 - INFO - __main__ - Step 17808: {'lr': 0.0004860585846078444, 'samples': 3419136, 'steps': 17807, 'loss/train': 1.7928861379623413} -11/06/2021 23:45:45 - INFO - __main__ - Step 17809: {'lr': 0.00048605683718053915, 'samples': 3419328, 'steps': 17808, 'loss/train': 1.0694918632507324} -11/06/2021 23:45:45 - INFO - __main__ - Step 17810: {'lr': 0.0004860550896468704, 'samples': 3419520, 'steps': 17809, 'loss/train': 1.7536789178848267} -11/06/2021 23:45:45 - INFO - __main__ - Step 17811: {'lr': 0.00048605334200683883, 'samples': 3419712, 'steps': 17810, 'loss/train': 1.910631537437439} -11/06/2021 23:45:46 - INFO - __main__ - Step 17812: {'lr': 0.0004860515942604452, 'samples': 3419904, 'steps': 17811, 'loss/train': 1.5907909870147705} -11/06/2021 23:45:47 - INFO - __main__ - Step 17813: {'lr': 0.00048604984640769047, 'samples': 3420096, 'steps': 17812, 'loss/train': 1.6828159093856812} -11/06/2021 23:45:47 - INFO - __main__ - Step 17814: {'lr': 0.00048604809844857524, 'samples': 3420288, 'steps': 17813, 'loss/train': 1.5735582113265991} -11/06/2021 23:45:48 - INFO - __main__ - Step 17815: {'lr': 0.0004860463503831004, 'samples': 3420480, 'steps': 17814, 'loss/train': 1.7284306287765503} -11/06/2021 23:45:48 - INFO - __main__ - Step 17816: {'lr': 0.0004860446022112668, 'samples': 3420672, 'steps': 17815, 'loss/train': 1.8749446868896484} -11/06/2021 23:45:48 - INFO - __main__ - Step 17817: {'lr': 0.00048604285393307503, 'samples': 3420864, 'steps': 17816, 'loss/train': 1.7494878768920898} -11/06/2021 23:45:50 - INFO - __main__ - Step 17818: {'lr': 0.000486041105548526, 'samples': 3421056, 'steps': 17817, 'loss/train': 1.6738638877868652} -11/06/2021 23:45:50 - INFO - __main__ - Step 17819: {'lr': 0.00048603935705762057, 'samples': 3421248, 'steps': 17818, 'loss/train': 1.633705496788025} -11/06/2021 23:45:50 - INFO - __main__ - Step 17820: {'lr': 0.0004860376084603594, 'samples': 3421440, 'steps': 17819, 'loss/train': 1.3418101072311401} -11/06/2021 23:45:51 - INFO - __main__ - Step 17821: {'lr': 0.00048603585975674334, 'samples': 3421632, 'steps': 17820, 'loss/train': 0.8659923076629639} -11/06/2021 23:45:51 - INFO - __main__ - Step 17822: {'lr': 0.0004860341109467732, 'samples': 3421824, 'steps': 17821, 'loss/train': 1.9501591920852661} -11/06/2021 23:45:52 - INFO - __main__ - Step 17823: {'lr': 0.00048603236203044963, 'samples': 3422016, 'steps': 17822, 'loss/train': 1.3790924549102783} -11/06/2021 23:45:52 - INFO - __main__ - Step 17824: {'lr': 0.00048603061300777365, 'samples': 3422208, 'steps': 17823, 'loss/train': 1.8731638193130493} -11/06/2021 23:45:53 - INFO - __main__ - Step 17825: {'lr': 0.0004860288638787458, 'samples': 3422400, 'steps': 17824, 'loss/train': 1.725066900253296} -11/06/2021 23:45:53 - INFO - __main__ - Step 17826: {'lr': 0.000486027114643367, 'samples': 3422592, 'steps': 17825, 'loss/train': 1.745100498199463} -11/06/2021 23:45:53 - INFO - __main__ - Step 17827: {'lr': 0.0004860253653016381, 'samples': 3422784, 'steps': 17826, 'loss/train': 1.3238799571990967} -11/06/2021 23:45:54 - INFO - __main__ - Step 17828: {'lr': 0.00048602361585355975, 'samples': 3422976, 'steps': 17827, 'loss/train': 1.8760740756988525} -11/06/2021 23:45:55 - INFO - __main__ - Step 17829: {'lr': 0.0004860218662991328, 'samples': 3423168, 'steps': 17828, 'loss/train': 1.3989863395690918} -11/06/2021 23:45:55 - INFO - __main__ - Step 17830: {'lr': 0.0004860201166383581, 'samples': 3423360, 'steps': 17829, 'loss/train': 1.4480235576629639} -11/06/2021 23:45:56 - INFO - __main__ - Step 17831: {'lr': 0.00048601836687123636, 'samples': 3423552, 'steps': 17830, 'loss/train': 1.3605883121490479} -11/06/2021 23:45:56 - INFO - __main__ - Step 17832: {'lr': 0.00048601661699776834, 'samples': 3423744, 'steps': 17831, 'loss/train': 1.4478638172149658} -11/06/2021 23:45:56 - INFO - __main__ - Step 17833: {'lr': 0.0004860148670179549, 'samples': 3423936, 'steps': 17832, 'loss/train': 1.6285169124603271} -11/06/2021 23:45:57 - INFO - __main__ - Step 17834: {'lr': 0.0004860131169317968, 'samples': 3424128, 'steps': 17833, 'loss/train': 1.9183335304260254} -11/06/2021 23:45:58 - INFO - __main__ - Step 17835: {'lr': 0.0004860113667392948, 'samples': 3424320, 'steps': 17834, 'loss/train': 1.6294353008270264} -11/06/2021 23:45:58 - INFO - __main__ - Step 17836: {'lr': 0.00048600961644044977, 'samples': 3424512, 'steps': 17835, 'loss/train': 1.7146687507629395} -11/06/2021 23:45:58 - INFO - __main__ - Step 17837: {'lr': 0.0004860078660352625, 'samples': 3424704, 'steps': 17836, 'loss/train': 1.918862223625183} -11/06/2021 23:45:59 - INFO - __main__ - Step 17838: {'lr': 0.0004860061155237336, 'samples': 3424896, 'steps': 17837, 'loss/train': 1.628971815109253} -11/06/2021 23:46:00 - INFO - __main__ - Step 17839: {'lr': 0.0004860043649058641, 'samples': 3425088, 'steps': 17838, 'loss/train': 1.5848469734191895} -11/06/2021 23:46:00 - INFO - __main__ - Step 17840: {'lr': 0.00048600261418165456, 'samples': 3425280, 'steps': 17839, 'loss/train': 2.30672025680542} -11/06/2021 23:46:00 - INFO - __main__ - Step 17841: {'lr': 0.00048600086335110593, 'samples': 3425472, 'steps': 17840, 'loss/train': 1.490289568901062} -11/06/2021 23:46:01 - INFO - __main__ - Step 17842: {'lr': 0.000485999112414219, 'samples': 3425664, 'steps': 17841, 'loss/train': 1.1723436117172241} -11/06/2021 23:46:01 - INFO - __main__ - Step 17843: {'lr': 0.0004859973613709945, 'samples': 3425856, 'steps': 17842, 'loss/train': 1.2183293104171753} -11/06/2021 23:46:02 - INFO - __main__ - Step 17844: {'lr': 0.0004859956102214332, 'samples': 3426048, 'steps': 17843, 'loss/train': 1.6532636880874634} -11/06/2021 23:46:02 - INFO - __main__ - Step 17845: {'lr': 0.00048599385896553595, 'samples': 3426240, 'steps': 17844, 'loss/train': 1.6545504331588745} -11/06/2021 23:46:03 - INFO - __main__ - Step 17846: {'lr': 0.0004859921076033034, 'samples': 3426432, 'steps': 17845, 'loss/train': 1.8391602039337158} -11/06/2021 23:46:03 - INFO - __main__ - Step 17847: {'lr': 0.00048599035613473656, 'samples': 3426624, 'steps': 17846, 'loss/train': 1.792570948600769} -11/06/2021 23:46:04 - INFO - __main__ - Step 17848: {'lr': 0.0004859886045598361, 'samples': 3426816, 'steps': 17847, 'loss/train': 1.6841845512390137} -11/06/2021 23:46:05 - INFO - __main__ - Step 17849: {'lr': 0.0004859868528786028, 'samples': 3427008, 'steps': 17848, 'loss/train': 1.8438422679901123} -11/06/2021 23:46:06 - INFO - __main__ - Step 17850: {'lr': 0.0004859851010910374, 'samples': 3427200, 'steps': 17849, 'loss/train': 1.7643811702728271} -11/06/2021 23:46:06 - INFO - __main__ - Step 17851: {'lr': 0.0004859833491971409, 'samples': 3427392, 'steps': 17850, 'loss/train': 1.7371845245361328} -11/06/2021 23:46:06 - INFO - __main__ - Step 17852: {'lr': 0.0004859815971969138, 'samples': 3427584, 'steps': 17851, 'loss/train': 1.7148878574371338} -11/06/2021 23:46:07 - INFO - __main__ - Step 17853: {'lr': 0.0004859798450903571, 'samples': 3427776, 'steps': 17852, 'loss/train': 1.6091628074645996} -11/06/2021 23:46:07 - INFO - __main__ - Step 17854: {'lr': 0.00048597809287747153, 'samples': 3427968, 'steps': 17853, 'loss/train': 1.4261943101882935} -11/06/2021 23:46:07 - INFO - __main__ - Step 17855: {'lr': 0.0004859763405582579, 'samples': 3428160, 'steps': 17854, 'loss/train': 1.8740367889404297} -11/06/2021 23:46:09 - INFO - __main__ - Step 17856: {'lr': 0.00048597458813271686, 'samples': 3428352, 'steps': 17855, 'loss/train': 1.8373491764068604} -11/06/2021 23:46:09 - INFO - __main__ - Step 17857: {'lr': 0.0004859728356008494, 'samples': 3428544, 'steps': 17856, 'loss/train': 1.820371389389038} -11/06/2021 23:46:09 - INFO - __main__ - Step 17858: {'lr': 0.00048597108296265625, 'samples': 3428736, 'steps': 17857, 'loss/train': 1.5134706497192383} -11/06/2021 23:46:10 - INFO - __main__ - Step 17859: {'lr': 0.00048596933021813815, 'samples': 3428928, 'steps': 17858, 'loss/train': 1.1924867630004883} -11/06/2021 23:46:10 - INFO - __main__ - Step 17860: {'lr': 0.0004859675773672959, 'samples': 3429120, 'steps': 17859, 'loss/train': 2.6600170135498047} -11/06/2021 23:46:10 - INFO - __main__ - Step 17861: {'lr': 0.00048596582441013026, 'samples': 3429312, 'steps': 17860, 'loss/train': 1.945163607597351} -11/06/2021 23:46:12 - INFO - __main__ - Step 17862: {'lr': 0.0004859640713466421, 'samples': 3429504, 'steps': 17861, 'loss/train': 1.5751862525939941} -11/06/2021 23:46:12 - INFO - __main__ - Step 17863: {'lr': 0.0004859623181768321, 'samples': 3429696, 'steps': 17862, 'loss/train': 1.3978326320648193} -11/06/2021 23:46:12 - INFO - __main__ - Step 17864: {'lr': 0.0004859605649007012, 'samples': 3429888, 'steps': 17863, 'loss/train': 0.8799737095832825} -11/06/2021 23:46:13 - INFO - __main__ - Step 17865: {'lr': 0.00048595881151825015, 'samples': 3430080, 'steps': 17864, 'loss/train': 1.6823805570602417} -11/06/2021 23:46:13 - INFO - __main__ - Step 17866: {'lr': 0.00048595705802947963, 'samples': 3430272, 'steps': 17865, 'loss/train': 1.4125962257385254} -11/06/2021 23:46:14 - INFO - __main__ - Step 17867: {'lr': 0.0004859553044343905, 'samples': 3430464, 'steps': 17866, 'loss/train': 0.9429519176483154} -11/06/2021 23:46:14 - INFO - __main__ - Step 17868: {'lr': 0.0004859535507329836, 'samples': 3430656, 'steps': 17867, 'loss/train': 1.0948766469955444} -11/06/2021 23:46:15 - INFO - __main__ - Step 17869: {'lr': 0.0004859517969252596, 'samples': 3430848, 'steps': 17868, 'loss/train': 1.6480631828308105} -11/06/2021 23:46:15 - INFO - __main__ - Step 17870: {'lr': 0.0004859500430112194, 'samples': 3431040, 'steps': 17869, 'loss/train': 1.7616888284683228} -11/06/2021 23:46:15 - INFO - __main__ - Step 17871: {'lr': 0.0004859482889908637, 'samples': 3431232, 'steps': 17870, 'loss/train': 1.6862744092941284} -11/06/2021 23:46:17 - INFO - __main__ - Step 17872: {'lr': 0.0004859465348641934, 'samples': 3431424, 'steps': 17871, 'loss/train': 1.6967068910598755} -11/06/2021 23:46:17 - INFO - __main__ - Step 17873: {'lr': 0.0004859447806312093, 'samples': 3431616, 'steps': 17872, 'loss/train': 1.1371982097625732} -11/06/2021 23:46:17 - INFO - __main__ - Step 17874: {'lr': 0.000485943026291912, 'samples': 3431808, 'steps': 17873, 'loss/train': 1.5849249362945557} -11/06/2021 23:46:18 - INFO - __main__ - Step 17875: {'lr': 0.0004859412718463025, 'samples': 3432000, 'steps': 17874, 'loss/train': 1.2743723392486572} -11/06/2021 23:46:18 - INFO - __main__ - Step 17876: {'lr': 0.00048593951729438144, 'samples': 3432192, 'steps': 17875, 'loss/train': 1.4073165655136108} -11/06/2021 23:46:19 - INFO - __main__ - Step 17877: {'lr': 0.0004859377626361497, 'samples': 3432384, 'steps': 17876, 'loss/train': 0.862178385257721} -11/06/2021 23:46:20 - INFO - __main__ - Step 17878: {'lr': 0.00048593600787160806, 'samples': 3432576, 'steps': 17877, 'loss/train': 1.8523950576782227} -11/06/2021 23:46:20 - INFO - __main__ - Step 17879: {'lr': 0.0004859342530007572, 'samples': 3432768, 'steps': 17878, 'loss/train': 2.0718274116516113} -11/06/2021 23:46:20 - INFO - __main__ - Step 17880: {'lr': 0.0004859324980235982, 'samples': 3432960, 'steps': 17879, 'loss/train': 1.829959750175476} -11/06/2021 23:46:21 - INFO - __main__ - Step 17881: {'lr': 0.0004859307429401315, 'samples': 3433152, 'steps': 17880, 'loss/train': 2.3833680152893066} -11/06/2021 23:46:22 - INFO - __main__ - Step 17882: {'lr': 0.0004859289877503581, 'samples': 3433344, 'steps': 17881, 'loss/train': 2.83292293548584} -11/06/2021 23:46:22 - INFO - __main__ - Step 17883: {'lr': 0.00048592723245427874, 'samples': 3433536, 'steps': 17882, 'loss/train': 1.8581055402755737} -11/06/2021 23:46:22 - INFO - __main__ - Step 17884: {'lr': 0.00048592547705189414, 'samples': 3433728, 'steps': 17883, 'loss/train': 1.7676963806152344} -11/06/2021 23:46:23 - INFO - __main__ - Step 17885: {'lr': 0.00048592372154320526, 'samples': 3433920, 'steps': 17884, 'loss/train': 1.4454072713851929} -11/06/2021 23:46:23 - INFO - __main__ - Step 17886: {'lr': 0.0004859219659282127, 'samples': 3434112, 'steps': 17885, 'loss/train': 1.591639518737793} -11/06/2021 23:46:23 - INFO - __main__ - Step 17887: {'lr': 0.00048592021020691745, 'samples': 3434304, 'steps': 17886, 'loss/train': 1.7790858745574951} -11/06/2021 23:46:25 - INFO - __main__ - Step 17888: {'lr': 0.00048591845437932014, 'samples': 3434496, 'steps': 17887, 'loss/train': 1.646702766418457} -11/06/2021 23:46:25 - INFO - __main__ - Step 17889: {'lr': 0.0004859166984454216, 'samples': 3434688, 'steps': 17888, 'loss/train': 1.685816764831543} -11/06/2021 23:46:25 - INFO - __main__ - Step 17890: {'lr': 0.0004859149424052226, 'samples': 3434880, 'steps': 17889, 'loss/train': 1.917184829711914} -11/06/2021 23:46:26 - INFO - __main__ - Step 17891: {'lr': 0.00048591318625872403, 'samples': 3435072, 'steps': 17890, 'loss/train': 1.9429192543029785} -11/06/2021 23:46:26 - INFO - __main__ - Step 17892: {'lr': 0.00048591143000592665, 'samples': 3435264, 'steps': 17891, 'loss/train': 1.4648727178573608} -11/06/2021 23:46:27 - INFO - __main__ - Step 17893: {'lr': 0.00048590967364683116, 'samples': 3435456, 'steps': 17892, 'loss/train': 1.7647534608840942} -11/06/2021 23:46:27 - INFO - __main__ - Step 17894: {'lr': 0.0004859079171814384, 'samples': 3435648, 'steps': 17893, 'loss/train': 2.2489683628082275} -11/06/2021 23:46:28 - INFO - __main__ - Step 17895: {'lr': 0.00048590616060974917, 'samples': 3435840, 'steps': 17894, 'loss/train': 2.1065878868103027} -11/06/2021 23:46:28 - INFO - __main__ - Step 17896: {'lr': 0.00048590440393176434, 'samples': 3436032, 'steps': 17895, 'loss/train': 2.224180221557617} -11/06/2021 23:46:28 - INFO - __main__ - Step 17897: {'lr': 0.00048590264714748455, 'samples': 3436224, 'steps': 17896, 'loss/train': 1.2746485471725464} -11/06/2021 23:46:29 - INFO - __main__ - Step 17898: {'lr': 0.0004859008902569107, 'samples': 3436416, 'steps': 17897, 'loss/train': 1.3870652914047241} -11/06/2021 23:46:30 - INFO - __main__ - Step 17899: {'lr': 0.00048589913326004355, 'samples': 3436608, 'steps': 17898, 'loss/train': 1.7949775457382202} -11/06/2021 23:46:30 - INFO - __main__ - Step 17900: {'lr': 0.0004858973761568839, 'samples': 3436800, 'steps': 17899, 'loss/train': 1.4077565670013428} -11/06/2021 23:46:30 - INFO - __main__ - Step 17901: {'lr': 0.0004858956189474325, 'samples': 3436992, 'steps': 17900, 'loss/train': 1.6623355150222778} -11/06/2021 23:46:31 - INFO - __main__ - Step 17902: {'lr': 0.0004858938616316902, 'samples': 3437184, 'steps': 17901, 'loss/train': 1.7787035703659058} -11/06/2021 23:46:31 - INFO - __main__ - Step 17903: {'lr': 0.00048589210420965775, 'samples': 3437376, 'steps': 17902, 'loss/train': 1.1888090372085571} -11/06/2021 23:46:32 - INFO - __main__ - Step 17904: {'lr': 0.0004858903466813359, 'samples': 3437568, 'steps': 17903, 'loss/train': 2.1995456218719482} -11/06/2021 23:46:33 - INFO - __main__ - Step 17905: {'lr': 0.0004858885890467256, 'samples': 3437760, 'steps': 17904, 'loss/train': 1.9049638509750366} -11/06/2021 23:46:33 - INFO - __main__ - Step 17906: {'lr': 0.00048588683130582755, 'samples': 3437952, 'steps': 17905, 'loss/train': 2.155893087387085} -11/06/2021 23:46:33 - INFO - __main__ - Step 17907: {'lr': 0.00048588507345864246, 'samples': 3438144, 'steps': 17906, 'loss/train': 1.5869488716125488} -11/06/2021 23:46:34 - INFO - __main__ - Step 17908: {'lr': 0.00048588331550517125, 'samples': 3438336, 'steps': 17907, 'loss/train': 2.066535472869873} -11/06/2021 23:46:35 - INFO - __main__ - Step 17909: {'lr': 0.0004858815574454146, 'samples': 3438528, 'steps': 17908, 'loss/train': 1.5409685373306274} -11/06/2021 23:46:35 - INFO - __main__ - Step 17910: {'lr': 0.0004858797992793734, 'samples': 3438720, 'steps': 17909, 'loss/train': 3.083186626434326} -11/06/2021 23:46:35 - INFO - __main__ - Step 17911: {'lr': 0.0004858780410070484, 'samples': 3438912, 'steps': 17910, 'loss/train': 1.5256142616271973} -11/06/2021 23:46:36 - INFO - __main__ - Step 17912: {'lr': 0.0004858762826284404, 'samples': 3439104, 'steps': 17911, 'loss/train': 1.5381463766098022} -11/06/2021 23:46:36 - INFO - __main__ - Step 17913: {'lr': 0.00048587452414355014, 'samples': 3439296, 'steps': 17912, 'loss/train': 1.493998408317566} -11/06/2021 23:46:38 - INFO - __main__ - Step 17914: {'lr': 0.00048587276555237853, 'samples': 3439488, 'steps': 17913, 'loss/train': 1.5796653032302856} -11/06/2021 23:46:38 - INFO - __main__ - Step 17915: {'lr': 0.00048587100685492626, 'samples': 3439680, 'steps': 17914, 'loss/train': 1.4091830253601074} -11/06/2021 23:46:39 - INFO - __main__ - Step 17916: {'lr': 0.00048586924805119416, 'samples': 3439872, 'steps': 17915, 'loss/train': 1.8840548992156982} -11/06/2021 23:46:39 - INFO - __main__ - Step 17917: {'lr': 0.00048586748914118303, 'samples': 3440064, 'steps': 17916, 'loss/train': 1.3594805002212524} -11/06/2021 23:46:39 - INFO - __main__ - Step 17918: {'lr': 0.0004858657301248936, 'samples': 3440256, 'steps': 17917, 'loss/train': 1.8550138473510742} -11/06/2021 23:46:40 - INFO - __main__ - Step 17919: {'lr': 0.00048586397100232673, 'samples': 3440448, 'steps': 17918, 'loss/train': 1.944078803062439} -11/06/2021 23:46:40 - INFO - __main__ - Step 17920: {'lr': 0.00048586221177348323, 'samples': 3440640, 'steps': 17919, 'loss/train': 1.8348121643066406} -11/06/2021 23:46:40 - INFO - __main__ - Step 17921: {'lr': 0.00048586045243836386, 'samples': 3440832, 'steps': 17920, 'loss/train': 1.7867494821548462} -11/06/2021 23:46:41 - INFO - __main__ - Step 17922: {'lr': 0.0004858586929969693, 'samples': 3441024, 'steps': 17921, 'loss/train': 1.8128037452697754} -11/06/2021 23:46:42 - INFO - __main__ - Step 17923: {'lr': 0.0004858569334493006, 'samples': 3441216, 'steps': 17922, 'loss/train': 0.7357732653617859} -11/06/2021 23:46:42 - INFO - __main__ - Step 17924: {'lr': 0.0004858551737953583, 'samples': 3441408, 'steps': 17923, 'loss/train': 1.7629271745681763} -11/06/2021 23:46:42 - INFO - __main__ - Step 17925: {'lr': 0.00048585341403514337, 'samples': 3441600, 'steps': 17924, 'loss/train': 1.7613294124603271} -11/06/2021 23:46:43 - INFO - __main__ - Step 17926: {'lr': 0.0004858516541686565, 'samples': 3441792, 'steps': 17925, 'loss/train': 2.0726709365844727} -11/06/2021 23:46:45 - INFO - __main__ - Step 17927: {'lr': 0.0004858498941958985, 'samples': 3441984, 'steps': 17926, 'loss/train': 1.4030810594558716} -11/06/2021 23:46:45 - INFO - __main__ - Step 17928: {'lr': 0.00048584813411687016, 'samples': 3442176, 'steps': 17927, 'loss/train': 1.4754228591918945} -11/06/2021 23:46:45 - INFO - __main__ - Step 17929: {'lr': 0.00048584637393157235, 'samples': 3442368, 'steps': 17928, 'loss/train': 1.5624349117279053} -11/06/2021 23:46:46 - INFO - __main__ - Step 17930: {'lr': 0.00048584461364000576, 'samples': 3442560, 'steps': 17929, 'loss/train': 1.3149511814117432} -11/06/2021 23:46:46 - INFO - __main__ - Step 17931: {'lr': 0.00048584285324217125, 'samples': 3442752, 'steps': 17930, 'loss/train': 1.7911587953567505} -11/06/2021 23:46:46 - INFO - __main__ - Step 17932: {'lr': 0.00048584109273806954, 'samples': 3442944, 'steps': 17931, 'loss/train': 1.8528138399124146} -11/06/2021 23:46:47 - INFO - __main__ - Step 17933: {'lr': 0.00048583933212770154, 'samples': 3443136, 'steps': 17932, 'loss/train': 1.8300704956054688} -11/06/2021 23:46:48 - INFO - __main__ - Step 17934: {'lr': 0.00048583757141106796, 'samples': 3443328, 'steps': 17933, 'loss/train': 1.5763187408447266} -11/06/2021 23:46:48 - INFO - __main__ - Step 17935: {'lr': 0.00048583581058816956, 'samples': 3443520, 'steps': 17934, 'loss/train': 1.7421388626098633} -11/06/2021 23:46:48 - INFO - __main__ - Step 17936: {'lr': 0.00048583404965900725, 'samples': 3443712, 'steps': 17935, 'loss/train': 1.6953171491622925} -11/06/2021 23:46:49 - INFO - __main__ - Step 17937: {'lr': 0.0004858322886235817, 'samples': 3443904, 'steps': 17936, 'loss/train': 1.5555347204208374} -11/06/2021 23:46:49 - INFO - __main__ - Step 17938: {'lr': 0.0004858305274818938, 'samples': 3444096, 'steps': 17937, 'loss/train': 1.8018510341644287} -11/06/2021 23:46:50 - INFO - __main__ - Step 17939: {'lr': 0.0004858287662339443, 'samples': 3444288, 'steps': 17938, 'loss/train': 1.823989748954773} -11/06/2021 23:46:51 - INFO - __main__ - Step 17940: {'lr': 0.00048582700487973397, 'samples': 3444480, 'steps': 17939, 'loss/train': 5.880978584289551} -11/06/2021 23:46:51 - INFO - __main__ - Step 17941: {'lr': 0.00048582524341926365, 'samples': 3444672, 'steps': 17940, 'loss/train': 1.577499270439148} -11/06/2021 23:46:51 - INFO - __main__ - Step 17942: {'lr': 0.0004858234818525341, 'samples': 3444864, 'steps': 17941, 'loss/train': 1.5800806283950806} -11/06/2021 23:46:52 - INFO - __main__ - Step 17943: {'lr': 0.0004858217201795462, 'samples': 3445056, 'steps': 17942, 'loss/train': 1.5680005550384521} -11/06/2021 23:46:52 - INFO - __main__ - Step 17944: {'lr': 0.0004858199584003006, 'samples': 3445248, 'steps': 17943, 'loss/train': 1.8235677480697632} -11/06/2021 23:46:53 - INFO - __main__ - Step 17945: {'lr': 0.00048581819651479814, 'samples': 3445440, 'steps': 17944, 'loss/train': 1.6470332145690918} -11/06/2021 23:46:53 - INFO - __main__ - Step 17946: {'lr': 0.0004858164345230397, 'samples': 3445632, 'steps': 17945, 'loss/train': 1.935632348060608} -11/06/2021 23:46:54 - INFO - __main__ - Step 17947: {'lr': 0.000485814672425026, 'samples': 3445824, 'steps': 17946, 'loss/train': 1.5922514200210571} -11/06/2021 23:46:54 - INFO - __main__ - Step 17948: {'lr': 0.0004858129102207578, 'samples': 3446016, 'steps': 17947, 'loss/train': 1.7044637203216553} -11/06/2021 23:46:54 - INFO - __main__ - Step 17949: {'lr': 0.0004858111479102359, 'samples': 3446208, 'steps': 17948, 'loss/train': 1.8843209743499756} -11/06/2021 23:46:55 - INFO - __main__ - Step 17950: {'lr': 0.00048580938549346134, 'samples': 3446400, 'steps': 17949, 'loss/train': 1.5622127056121826} -11/06/2021 23:46:56 - INFO - __main__ - Step 17951: {'lr': 0.00048580762297043456, 'samples': 3446592, 'steps': 17950, 'loss/train': 1.3768843412399292} -11/06/2021 23:46:56 - INFO - __main__ - Step 17952: {'lr': 0.00048580586034115646, 'samples': 3446784, 'steps': 17951, 'loss/train': 1.6338905096054077} -11/06/2021 23:46:57 - INFO - __main__ - Step 17953: {'lr': 0.000485804097605628, 'samples': 3446976, 'steps': 17952, 'loss/train': 1.5911237001419067} -11/06/2021 23:46:57 - INFO - __main__ - Step 17954: {'lr': 0.00048580233476384975, 'samples': 3447168, 'steps': 17953, 'loss/train': 1.5193482637405396} -11/06/2021 23:46:58 - INFO - __main__ - Step 17955: {'lr': 0.0004858005718158227, 'samples': 3447360, 'steps': 17954, 'loss/train': 1.441080093383789} -11/06/2021 23:46:58 - INFO - __main__ - Step 17956: {'lr': 0.0004857988087615475, 'samples': 3447552, 'steps': 17955, 'loss/train': 1.336949110031128} -11/06/2021 23:46:59 - INFO - __main__ - Step 17957: {'lr': 0.000485797045601025, 'samples': 3447744, 'steps': 17956, 'loss/train': 1.5038697719573975} -11/06/2021 23:46:59 - INFO - __main__ - Step 17958: {'lr': 0.000485795282334256, 'samples': 3447936, 'steps': 17957, 'loss/train': 1.2776819467544556} -11/06/2021 23:46:59 - INFO - __main__ - Step 17959: {'lr': 0.00048579351896124127, 'samples': 3448128, 'steps': 17958, 'loss/train': 1.4108787775039673} -11/06/2021 23:47:00 - INFO - __main__ - Step 17960: {'lr': 0.0004857917554819816, 'samples': 3448320, 'steps': 17959, 'loss/train': 1.811353087425232} -11/06/2021 23:47:01 - INFO - __main__ - Step 17961: {'lr': 0.00048578999189647786, 'samples': 3448512, 'steps': 17960, 'loss/train': 0.4753451347351074} -11/06/2021 23:47:01 - INFO - __main__ - Step 17962: {'lr': 0.00048578822820473074, 'samples': 3448704, 'steps': 17961, 'loss/train': 1.7303311824798584} -11/06/2021 23:47:01 - INFO - __main__ - Step 17963: {'lr': 0.00048578646440674113, 'samples': 3448896, 'steps': 17962, 'loss/train': 1.7330888509750366} -11/06/2021 23:47:02 - INFO - __main__ - Step 17964: {'lr': 0.0004857847005025097, 'samples': 3449088, 'steps': 17963, 'loss/train': 1.6312006711959839} -11/06/2021 23:47:03 - INFO - __main__ - Step 17965: {'lr': 0.0004857829364920374, 'samples': 3449280, 'steps': 17964, 'loss/train': 1.7061258554458618} -11/06/2021 23:47:04 - INFO - __main__ - Step 17966: {'lr': 0.0004857811723753249, 'samples': 3449472, 'steps': 17965, 'loss/train': 2.2474277019500732} -11/06/2021 23:47:04 - INFO - __main__ - Step 17967: {'lr': 0.00048577940815237305, 'samples': 3449664, 'steps': 17966, 'loss/train': 1.5776370763778687} -11/06/2021 23:47:04 - INFO - __main__ - Step 17968: {'lr': 0.00048577764382318265, 'samples': 3449856, 'steps': 17967, 'loss/train': 1.24309504032135} -11/06/2021 23:47:05 - INFO - __main__ - Step 17969: {'lr': 0.0004857758793877545, 'samples': 3450048, 'steps': 17968, 'loss/train': 1.6525585651397705} -11/06/2021 23:47:05 - INFO - __main__ - Step 17970: {'lr': 0.00048577411484608936, 'samples': 3450240, 'steps': 17969, 'loss/train': 1.6471604108810425} -11/06/2021 23:47:06 - INFO - __main__ - Step 17971: {'lr': 0.000485772350198188, 'samples': 3450432, 'steps': 17970, 'loss/train': 1.7846794128417969} -11/06/2021 23:47:06 - INFO - __main__ - Step 17972: {'lr': 0.00048577058544405126, 'samples': 3450624, 'steps': 17971, 'loss/train': 1.542449951171875} -11/06/2021 23:47:07 - INFO - __main__ - Step 17973: {'lr': 0.00048576882058368, 'samples': 3450816, 'steps': 17972, 'loss/train': 1.9146580696105957} -11/06/2021 23:47:07 - INFO - __main__ - Step 17974: {'lr': 0.0004857670556170749, 'samples': 3451008, 'steps': 17973, 'loss/train': 1.7699105739593506} -11/06/2021 23:47:07 - INFO - __main__ - Step 17975: {'lr': 0.0004857652905442368, 'samples': 3451200, 'steps': 17974, 'loss/train': 1.6144200563430786} -11/06/2021 23:47:08 - INFO - __main__ - Step 17976: {'lr': 0.0004857635253651665, 'samples': 3451392, 'steps': 17975, 'loss/train': 1.4524669647216797} -11/06/2021 23:47:09 - INFO - __main__ - Step 17977: {'lr': 0.00048576176007986485, 'samples': 3451584, 'steps': 17976, 'loss/train': 1.5237561464309692} -11/06/2021 23:47:09 - INFO - __main__ - Step 17978: {'lr': 0.00048575999468833256, 'samples': 3451776, 'steps': 17977, 'loss/train': 1.4829519987106323} -11/06/2021 23:47:10 - INFO - __main__ - Step 17979: {'lr': 0.0004857582291905704, 'samples': 3451968, 'steps': 17978, 'loss/train': 1.7393509149551392} -11/06/2021 23:47:10 - INFO - __main__ - Step 17980: {'lr': 0.00048575646358657934, 'samples': 3452160, 'steps': 17979, 'loss/train': 1.6369855403900146} -11/06/2021 23:47:11 - INFO - __main__ - Step 17981: {'lr': 0.00048575469787635997, 'samples': 3452352, 'steps': 17980, 'loss/train': 1.7648541927337646} -11/06/2021 23:47:11 - INFO - __main__ - Step 17982: {'lr': 0.00048575293205991313, 'samples': 3452544, 'steps': 17981, 'loss/train': 1.6027305126190186} -11/06/2021 23:47:11 - INFO - __main__ - Step 17983: {'lr': 0.0004857511661372397, 'samples': 3452736, 'steps': 17982, 'loss/train': 1.7817578315734863} -11/06/2021 23:47:12 - INFO - __main__ - Step 17984: {'lr': 0.00048574940010834045, 'samples': 3452928, 'steps': 17983, 'loss/train': 1.475091814994812} -11/06/2021 23:47:12 - INFO - __main__ - Step 17985: {'lr': 0.0004857476339732161, 'samples': 3453120, 'steps': 17984, 'loss/train': 1.626041293144226} -11/06/2021 23:47:13 - INFO - __main__ - Step 17986: {'lr': 0.0004857458677318676, 'samples': 3453312, 'steps': 17985, 'loss/train': 2.0042805671691895} -11/06/2021 23:47:14 - INFO - __main__ - Step 17987: {'lr': 0.0004857441013842956, 'samples': 3453504, 'steps': 17986, 'loss/train': 1.843093991279602} -11/06/2021 23:47:14 - INFO - __main__ - Step 17988: {'lr': 0.0004857423349305009, 'samples': 3453696, 'steps': 17987, 'loss/train': 1.5723204612731934} -11/06/2021 23:47:14 - INFO - __main__ - Step 17989: {'lr': 0.00048574056837048443, 'samples': 3453888, 'steps': 17988, 'loss/train': 2.2022082805633545} -11/06/2021 23:47:15 - INFO - __main__ - Step 17990: {'lr': 0.0004857388017042468, 'samples': 3454080, 'steps': 17989, 'loss/train': 1.4242730140686035} -11/06/2021 23:47:15 - INFO - __main__ - Step 17991: {'lr': 0.000485737034931789, 'samples': 3454272, 'steps': 17990, 'loss/train': 1.8824354410171509} -11/06/2021 23:47:16 - INFO - __main__ - Step 17992: {'lr': 0.00048573526805311166, 'samples': 3454464, 'steps': 17991, 'loss/train': 1.777707576751709} -11/06/2021 23:47:17 - INFO - __main__ - Step 17993: {'lr': 0.0004857335010682157, 'samples': 3454656, 'steps': 17992, 'loss/train': 1.7429853677749634} -11/06/2021 23:47:17 - INFO - __main__ - Step 17994: {'lr': 0.0004857317339771018, 'samples': 3454848, 'steps': 17993, 'loss/train': 1.6594009399414062} -11/06/2021 23:47:17 - INFO - __main__ - Step 17995: {'lr': 0.0004857299667797709, 'samples': 3455040, 'steps': 17994, 'loss/train': 1.633614420890808} -11/06/2021 23:47:18 - INFO - __main__ - Step 17996: {'lr': 0.0004857281994762236, 'samples': 3455232, 'steps': 17995, 'loss/train': 1.6758201122283936} -11/06/2021 23:47:19 - INFO - __main__ - Step 17997: {'lr': 0.00048572643206646097, 'samples': 3455424, 'steps': 17996, 'loss/train': 2.020440101623535} -11/06/2021 23:47:19 - INFO - __main__ - Step 17998: {'lr': 0.0004857246645504835, 'samples': 3455616, 'steps': 17997, 'loss/train': 1.609384536743164} -11/06/2021 23:47:19 - INFO - __main__ - Step 17999: {'lr': 0.00048572289692829217, 'samples': 3455808, 'steps': 17998, 'loss/train': 0.954354465007782} -11/06/2021 23:47:20 - INFO - __main__ - Step 18000: {'lr': 0.00048572112919988776, 'samples': 3456000, 'steps': 17999, 'loss/train': 1.7683265209197998} -11/06/2021 23:47:20 - INFO - __main__ - Step 18001: {'lr': 0.00048571936136527106, 'samples': 3456192, 'steps': 18000, 'loss/train': 1.2579536437988281} -11/06/2021 23:47:21 - INFO - __main__ - Step 18002: {'lr': 0.0004857175934244428, 'samples': 3456384, 'steps': 18001, 'loss/train': 1.649789571762085} -11/06/2021 23:47:21 - INFO - __main__ - Step 18003: {'lr': 0.0004857158253774039, 'samples': 3456576, 'steps': 18002, 'loss/train': 1.7836414575576782} -11/06/2021 23:47:22 - INFO - __main__ - Step 18004: {'lr': 0.0004857140572241551, 'samples': 3456768, 'steps': 18003, 'loss/train': 1.7444621324539185} -11/06/2021 23:47:22 - INFO - __main__ - Step 18005: {'lr': 0.00048571228896469713, 'samples': 3456960, 'steps': 18004, 'loss/train': 2.0532634258270264} -11/06/2021 23:47:23 - INFO - __main__ - Step 18006: {'lr': 0.0004857105205990308, 'samples': 3457152, 'steps': 18005, 'loss/train': 1.4198518991470337} -11/06/2021 23:47:24 - INFO - __main__ - Step 18007: {'lr': 0.00048570875212715706, 'samples': 3457344, 'steps': 18006, 'loss/train': 1.4929587841033936} -11/06/2021 23:47:24 - INFO - __main__ - Step 18008: {'lr': 0.0004857069835490765, 'samples': 3457536, 'steps': 18007, 'loss/train': 1.977075457572937} -11/06/2021 23:47:24 - INFO - __main__ - Step 18009: {'lr': 0.00048570521486479004, 'samples': 3457728, 'steps': 18008, 'loss/train': 1.3553253412246704} -11/06/2021 23:47:25 - INFO - __main__ - Step 18010: {'lr': 0.0004857034460742984, 'samples': 3457920, 'steps': 18009, 'loss/train': 2.5607073307037354} -11/06/2021 23:47:25 - INFO - __main__ - Step 18011: {'lr': 0.0004857016771776025, 'samples': 3458112, 'steps': 18010, 'loss/train': 1.862199068069458} -11/06/2021 23:47:27 - INFO - __main__ - Step 18012: {'lr': 0.000485699908174703, 'samples': 3458304, 'steps': 18011, 'loss/train': 1.1634882688522339} -11/06/2021 23:47:27 - INFO - __main__ - Step 18013: {'lr': 0.0004856981390656008, 'samples': 3458496, 'steps': 18012, 'loss/train': 2.178666114807129} -11/06/2021 23:47:27 - INFO - __main__ - Step 18014: {'lr': 0.00048569636985029664, 'samples': 3458688, 'steps': 18013, 'loss/train': 1.3716199398040771} -11/06/2021 23:47:28 - INFO - __main__ - Step 18015: {'lr': 0.00048569460052879136, 'samples': 3458880, 'steps': 18014, 'loss/train': 1.917330265045166} -11/06/2021 23:47:28 - INFO - __main__ - Step 18016: {'lr': 0.0004856928311010857, 'samples': 3459072, 'steps': 18015, 'loss/train': 1.8656532764434814} -11/06/2021 23:47:28 - INFO - __main__ - Step 18017: {'lr': 0.00048569106156718045, 'samples': 3459264, 'steps': 18016, 'loss/train': 1.8904410600662231} -11/06/2021 23:47:29 - INFO - __main__ - Step 18018: {'lr': 0.00048568929192707657, 'samples': 3459456, 'steps': 18017, 'loss/train': 1.839964509010315} -11/06/2021 23:47:30 - INFO - __main__ - Step 18019: {'lr': 0.0004856875221807746, 'samples': 3459648, 'steps': 18018, 'loss/train': 1.3662374019622803} -11/06/2021 23:47:30 - INFO - __main__ - Step 18020: {'lr': 0.0004856857523282755, 'samples': 3459840, 'steps': 18019, 'loss/train': 1.7677093744277954} -11/06/2021 23:47:30 - INFO - __main__ - Step 18021: {'lr': 0.0004856839823695801, 'samples': 3460032, 'steps': 18020, 'loss/train': 0.6586083173751831} -11/06/2021 23:47:31 - INFO - __main__ - Step 18022: {'lr': 0.00048568221230468905, 'samples': 3460224, 'steps': 18021, 'loss/train': 1.783107042312622} -11/06/2021 23:47:31 - INFO - __main__ - Step 18023: {'lr': 0.0004856804421336033, 'samples': 3460416, 'steps': 18022, 'loss/train': 1.4246373176574707} -11/06/2021 23:47:32 - INFO - __main__ - Step 18024: {'lr': 0.0004856786718563235, 'samples': 3460608, 'steps': 18023, 'loss/train': 1.6949611902236938} -11/06/2021 23:47:32 - INFO - __main__ - Step 18025: {'lr': 0.0004856769014728506, 'samples': 3460800, 'steps': 18024, 'loss/train': 1.8121979236602783} -11/06/2021 23:47:33 - INFO - __main__ - Step 18026: {'lr': 0.0004856751309831853, 'samples': 3460992, 'steps': 18025, 'loss/train': 1.5363273620605469} -11/06/2021 23:47:33 - INFO - __main__ - Step 18027: {'lr': 0.00048567336038732843, 'samples': 3461184, 'steps': 18026, 'loss/train': 1.299382209777832} -11/06/2021 23:47:33 - INFO - __main__ - Step 18028: {'lr': 0.0004856715896852808, 'samples': 3461376, 'steps': 18027, 'loss/train': 1.1882447004318237} -11/06/2021 23:47:35 - INFO - __main__ - Step 18029: {'lr': 0.0004856698188770432, 'samples': 3461568, 'steps': 18028, 'loss/train': 1.8871138095855713} -11/06/2021 23:47:35 - INFO - __main__ - Step 18030: {'lr': 0.0004856680479626163, 'samples': 3461760, 'steps': 18029, 'loss/train': 1.3500367403030396} -11/06/2021 23:47:35 - INFO - __main__ - Step 18031: {'lr': 0.0004856662769420012, 'samples': 3461952, 'steps': 18030, 'loss/train': 1.501436471939087} -11/06/2021 23:47:36 - INFO - __main__ - Step 18032: {'lr': 0.0004856645058151984, 'samples': 3462144, 'steps': 18031, 'loss/train': 1.7649421691894531} -11/06/2021 23:47:36 - INFO - __main__ - Step 18033: {'lr': 0.0004856627345822088, 'samples': 3462336, 'steps': 18032, 'loss/train': 1.8708281517028809} -11/06/2021 23:47:37 - INFO - __main__ - Step 18034: {'lr': 0.0004856609632430332, 'samples': 3462528, 'steps': 18033, 'loss/train': 1.811106562614441} -11/06/2021 23:47:37 - INFO - __main__ - Step 18035: {'lr': 0.00048565919179767246, 'samples': 3462720, 'steps': 18034, 'loss/train': 2.175701856613159} -11/06/2021 23:47:38 - INFO - __main__ - Step 18036: {'lr': 0.0004856574202461273, 'samples': 3462912, 'steps': 18035, 'loss/train': 1.7209889888763428} -11/06/2021 23:47:38 - INFO - __main__ - Step 18037: {'lr': 0.0004856556485883985, 'samples': 3463104, 'steps': 18036, 'loss/train': 1.8823835849761963} -11/06/2021 23:47:38 - INFO - __main__ - Step 18038: {'lr': 0.000485653876824487, 'samples': 3463296, 'steps': 18037, 'loss/train': 1.6220828294754028} -11/06/2021 23:47:39 - INFO - __main__ - Step 18039: {'lr': 0.00048565210495439337, 'samples': 3463488, 'steps': 18038, 'loss/train': 1.2623989582061768} -11/06/2021 23:47:40 - INFO - __main__ - Step 18040: {'lr': 0.00048565033297811867, 'samples': 3463680, 'steps': 18039, 'loss/train': 1.4432919025421143} -11/06/2021 23:47:40 - INFO - __main__ - Step 18041: {'lr': 0.0004856485608956635, 'samples': 3463872, 'steps': 18040, 'loss/train': 1.4835745096206665} -11/06/2021 23:47:40 - INFO - __main__ - Step 18042: {'lr': 0.00048564678870702873, 'samples': 3464064, 'steps': 18041, 'loss/train': 1.4812495708465576} -11/06/2021 23:47:41 - INFO - __main__ - Step 18043: {'lr': 0.00048564501641221516, 'samples': 3464256, 'steps': 18042, 'loss/train': 1.9328662157058716} -11/06/2021 23:47:41 - INFO - __main__ - Step 18044: {'lr': 0.00048564324401122357, 'samples': 3464448, 'steps': 18043, 'loss/train': 1.3001339435577393} -11/06/2021 23:47:42 - INFO - __main__ - Step 18045: {'lr': 0.0004856414715040548, 'samples': 3464640, 'steps': 18044, 'loss/train': 1.5383938550949097} -11/06/2021 23:47:43 - INFO - __main__ - Step 18046: {'lr': 0.0004856396988907096, 'samples': 3464832, 'steps': 18045, 'loss/train': 0.6114344596862793} -11/06/2021 23:47:43 - INFO - __main__ - Step 18047: {'lr': 0.00048563792617118876, 'samples': 3465024, 'steps': 18046, 'loss/train': 1.156066656112671} -11/06/2021 23:47:43 - INFO - __main__ - Step 18048: {'lr': 0.00048563615334549316, 'samples': 3465216, 'steps': 18047, 'loss/train': 1.3910892009735107} -11/06/2021 23:47:44 - INFO - __main__ - Step 18049: {'lr': 0.0004856343804136235, 'samples': 3465408, 'steps': 18048, 'loss/train': 1.6260871887207031} -11/06/2021 23:47:45 - INFO - __main__ - Step 18050: {'lr': 0.0004856326073755806, 'samples': 3465600, 'steps': 18049, 'loss/train': 1.7786577939987183} -11/06/2021 23:47:45 - INFO - __main__ - Step 18051: {'lr': 0.0004856308342313653, 'samples': 3465792, 'steps': 18050, 'loss/train': 1.674890398979187} -11/06/2021 23:47:46 - INFO - __main__ - Step 18052: {'lr': 0.00048562906098097847, 'samples': 3465984, 'steps': 18051, 'loss/train': 1.9408053159713745} -11/06/2021 23:47:46 - INFO - __main__ - Step 18053: {'lr': 0.0004856272876244208, 'samples': 3466176, 'steps': 18052, 'loss/train': 1.9470312595367432} -11/06/2021 23:47:46 - INFO - __main__ - Step 18054: {'lr': 0.000485625514161693, 'samples': 3466368, 'steps': 18053, 'loss/train': 1.8458075523376465} -11/06/2021 23:47:47 - INFO - __main__ - Step 18055: {'lr': 0.00048562374059279604, 'samples': 3466560, 'steps': 18054, 'loss/train': 1.438137173652649} -11/06/2021 23:47:48 - INFO - __main__ - Step 18056: {'lr': 0.00048562196691773066, 'samples': 3466752, 'steps': 18055, 'loss/train': 1.7463195323944092} -11/06/2021 23:47:48 - INFO - __main__ - Step 18057: {'lr': 0.00048562019313649766, 'samples': 3466944, 'steps': 18056, 'loss/train': 1.234910249710083} -11/06/2021 23:47:49 - INFO - __main__ - Step 18058: {'lr': 0.0004856184192490979, 'samples': 3467136, 'steps': 18057, 'loss/train': 1.2480186223983765} -11/06/2021 23:47:49 - INFO - __main__ - Step 18059: {'lr': 0.000485616645255532, 'samples': 3467328, 'steps': 18058, 'loss/train': 1.3768389225006104} -11/06/2021 23:47:50 - INFO - __main__ - Step 18060: {'lr': 0.0004856148711558009, 'samples': 3467520, 'steps': 18059, 'loss/train': 1.8986867666244507} -11/06/2021 23:47:50 - INFO - __main__ - Step 18061: {'lr': 0.00048561309694990543, 'samples': 3467712, 'steps': 18060, 'loss/train': 1.514434576034546} -11/06/2021 23:47:51 - INFO - __main__ - Step 18062: {'lr': 0.00048561132263784634, 'samples': 3467904, 'steps': 18061, 'loss/train': 1.9755878448486328} -11/06/2021 23:47:51 - INFO - __main__ - Step 18063: {'lr': 0.00048560954821962434, 'samples': 3468096, 'steps': 18062, 'loss/train': 1.7900665998458862} -11/06/2021 23:47:51 - INFO - __main__ - Step 18064: {'lr': 0.0004856077736952404, 'samples': 3468288, 'steps': 18063, 'loss/train': 2.1173062324523926} -11/06/2021 23:47:52 - INFO - __main__ - Step 18065: {'lr': 0.00048560599906469513, 'samples': 3468480, 'steps': 18064, 'loss/train': 1.6794781684875488} -11/06/2021 23:47:53 - INFO - __main__ - Step 18066: {'lr': 0.00048560422432798956, 'samples': 3468672, 'steps': 18065, 'loss/train': 1.2855576276779175} -11/06/2021 23:47:53 - INFO - __main__ - Step 18067: {'lr': 0.0004856024494851243, 'samples': 3468864, 'steps': 18066, 'loss/train': 0.3096511662006378} -11/06/2021 23:47:54 - INFO - __main__ - Step 18068: {'lr': 0.00048560067453610025, 'samples': 3469056, 'steps': 18067, 'loss/train': 1.4566000699996948} -11/06/2021 23:47:54 - INFO - __main__ - Step 18069: {'lr': 0.00048559889948091814, 'samples': 3469248, 'steps': 18068, 'loss/train': 1.557026743888855} -11/06/2021 23:47:54 - INFO - __main__ - Step 18070: {'lr': 0.0004855971243195788, 'samples': 3469440, 'steps': 18069, 'loss/train': 2.022430181503296} -11/06/2021 23:47:55 - INFO - __main__ - Step 18071: {'lr': 0.00048559534905208304, 'samples': 3469632, 'steps': 18070, 'loss/train': 1.8570542335510254} -11/06/2021 23:47:56 - INFO - __main__ - Step 18072: {'lr': 0.0004855935736784316, 'samples': 3469824, 'steps': 18071, 'loss/train': 1.6132595539093018} -11/06/2021 23:47:56 - INFO - __main__ - Step 18073: {'lr': 0.00048559179819862537, 'samples': 3470016, 'steps': 18072, 'loss/train': 2.393339157104492} -11/06/2021 23:47:57 - INFO - __main__ - Step 18074: {'lr': 0.0004855900226126651, 'samples': 3470208, 'steps': 18073, 'loss/train': 1.808935523033142} -11/06/2021 23:47:57 - INFO - __main__ - Step 18075: {'lr': 0.00048558824692055156, 'samples': 3470400, 'steps': 18074, 'loss/train': 1.6323792934417725} -11/06/2021 23:47:58 - INFO - __main__ - Step 18076: {'lr': 0.0004855864711222857, 'samples': 3470592, 'steps': 18075, 'loss/train': 1.7564913034439087} -11/06/2021 23:47:58 - INFO - __main__ - Step 18077: {'lr': 0.0004855846952178682, 'samples': 3470784, 'steps': 18076, 'loss/train': 1.3942724466323853} -11/06/2021 23:47:59 - INFO - __main__ - Step 18078: {'lr': 0.0004855829192072998, 'samples': 3470976, 'steps': 18077, 'loss/train': 1.9024382829666138} -11/06/2021 23:47:59 - INFO - __main__ - Step 18079: {'lr': 0.00048558114309058144, 'samples': 3471168, 'steps': 18078, 'loss/train': 1.360500693321228} -11/06/2021 23:47:59 - INFO - __main__ - Step 18080: {'lr': 0.00048557936686771376, 'samples': 3471360, 'steps': 18079, 'loss/train': 1.4804255962371826} -11/06/2021 23:48:00 - INFO - __main__ - Step 18081: {'lr': 0.0004855775905386977, 'samples': 3471552, 'steps': 18080, 'loss/train': 1.54103422164917} -11/06/2021 23:48:01 - INFO - __main__ - Step 18082: {'lr': 0.000485575814103534, 'samples': 3471744, 'steps': 18081, 'loss/train': 1.574988842010498} -11/06/2021 23:48:01 - INFO - __main__ - Step 18083: {'lr': 0.0004855740375622235, 'samples': 3471936, 'steps': 18082, 'loss/train': 1.7808576822280884} -11/06/2021 23:48:01 - INFO - __main__ - Step 18084: {'lr': 0.00048557226091476704, 'samples': 3472128, 'steps': 18083, 'loss/train': 1.7548338174819946} -11/06/2021 23:48:02 - INFO - __main__ - Step 18085: {'lr': 0.0004855704841611652, 'samples': 3472320, 'steps': 18084, 'loss/train': 1.2830348014831543} -11/06/2021 23:48:04 - INFO - __main__ - Step 18086: {'lr': 0.00048556870730141906, 'samples': 3472512, 'steps': 18085, 'loss/train': 1.6364481449127197} -11/06/2021 23:48:04 - INFO - __main__ - Step 18087: {'lr': 0.00048556693033552926, 'samples': 3472704, 'steps': 18086, 'loss/train': 1.6514034271240234} -11/06/2021 23:48:05 - INFO - __main__ - Step 18088: {'lr': 0.0004855651532634966, 'samples': 3472896, 'steps': 18087, 'loss/train': 1.5415527820587158} -11/06/2021 23:48:05 - INFO - __main__ - Step 18089: {'lr': 0.00048556337608532196, 'samples': 3473088, 'steps': 18088, 'loss/train': 1.6693471670150757} -11/06/2021 23:48:05 - INFO - __main__ - Step 18090: {'lr': 0.00048556159880100604, 'samples': 3473280, 'steps': 18089, 'loss/train': 1.8687024116516113} -11/06/2021 23:48:06 - INFO - __main__ - Step 18091: {'lr': 0.00048555982141054976, 'samples': 3473472, 'steps': 18090, 'loss/train': 1.8448222875595093} -11/06/2021 23:48:06 - INFO - __main__ - Step 18092: {'lr': 0.0004855580439139539, 'samples': 3473664, 'steps': 18091, 'loss/train': 1.816220998764038} -11/06/2021 23:48:06 - INFO - __main__ - Step 18093: {'lr': 0.00048555626631121906, 'samples': 3473856, 'steps': 18092, 'loss/train': 1.991423487663269} -11/06/2021 23:48:07 - INFO - __main__ - Step 18094: {'lr': 0.0004855544886023463, 'samples': 3474048, 'steps': 18093, 'loss/train': 1.56856107711792} -11/06/2021 23:48:08 - INFO - __main__ - Step 18095: {'lr': 0.00048555271078733637, 'samples': 3474240, 'steps': 18094, 'loss/train': 1.76602303981781} -11/06/2021 23:48:08 - INFO - __main__ - Step 18096: {'lr': 0.00048555093286618996, 'samples': 3474432, 'steps': 18095, 'loss/train': 1.4684127569198608} -11/06/2021 23:48:08 - INFO - __main__ - Step 18097: {'lr': 0.0004855491548389079, 'samples': 3474624, 'steps': 18096, 'loss/train': 1.608511209487915} -11/06/2021 23:48:09 - INFO - __main__ - Step 18098: {'lr': 0.0004855473767054911, 'samples': 3474816, 'steps': 18097, 'loss/train': 1.434108018875122} -11/06/2021 23:48:10 - INFO - __main__ - Step 18099: {'lr': 0.00048554559846594026, 'samples': 3475008, 'steps': 18098, 'loss/train': 1.5190415382385254} -11/06/2021 23:48:10 - INFO - __main__ - Step 18100: {'lr': 0.0004855438201202562, 'samples': 3475200, 'steps': 18099, 'loss/train': 1.5204631090164185} -11/06/2021 23:48:11 - INFO - __main__ - Step 18101: {'lr': 0.0004855420416684398, 'samples': 3475392, 'steps': 18100, 'loss/train': 1.687787652015686} -11/06/2021 23:48:11 - INFO - __main__ - Step 18102: {'lr': 0.0004855402631104917, 'samples': 3475584, 'steps': 18101, 'loss/train': 1.7101457118988037} -11/06/2021 23:48:11 - INFO - __main__ - Step 18103: {'lr': 0.0004855384844464128, 'samples': 3475776, 'steps': 18102, 'loss/train': 0.6320077776908875} -11/06/2021 23:48:12 - INFO - __main__ - Step 18104: {'lr': 0.00048553670567620395, 'samples': 3475968, 'steps': 18103, 'loss/train': 5.830017566680908} -11/06/2021 23:48:13 - INFO - __main__ - Step 18105: {'lr': 0.0004855349267998659, 'samples': 3476160, 'steps': 18104, 'loss/train': 1.7267546653747559} -11/06/2021 23:48:13 - INFO - __main__ - Step 18106: {'lr': 0.0004855331478173994, 'samples': 3476352, 'steps': 18105, 'loss/train': 1.6141504049301147} -11/06/2021 23:48:13 - INFO - __main__ - Step 18107: {'lr': 0.0004855313687288053, 'samples': 3476544, 'steps': 18106, 'loss/train': 1.6809107065200806} -11/06/2021 23:48:14 - INFO - __main__ - Step 18108: {'lr': 0.00048552958953408437, 'samples': 3476736, 'steps': 18107, 'loss/train': 1.5354968309402466} -11/06/2021 23:48:14 - INFO - __main__ - Step 18109: {'lr': 0.0004855278102332375, 'samples': 3476928, 'steps': 18108, 'loss/train': 1.51222562789917} -11/06/2021 23:48:15 - INFO - __main__ - Step 18110: {'lr': 0.0004855260308262654, 'samples': 3477120, 'steps': 18109, 'loss/train': 1.4141589403152466} -11/06/2021 23:48:15 - INFO - __main__ - Step 18111: {'lr': 0.00048552425131316893, 'samples': 3477312, 'steps': 18110, 'loss/train': 1.4904797077178955} -11/06/2021 23:48:16 - INFO - __main__ - Step 18112: {'lr': 0.0004855224716939488, 'samples': 3477504, 'steps': 18111, 'loss/train': 1.6454395055770874} -11/06/2021 23:48:16 - INFO - __main__ - Step 18113: {'lr': 0.0004855206919686059, 'samples': 3477696, 'steps': 18112, 'loss/train': 1.3504629135131836} -11/06/2021 23:48:16 - INFO - __main__ - Step 18114: {'lr': 0.0004855189121371411, 'samples': 3477888, 'steps': 18113, 'loss/train': 2.2587153911590576} -11/06/2021 23:48:17 - INFO - __main__ - Step 18115: {'lr': 0.00048551713219955505, 'samples': 3478080, 'steps': 18114, 'loss/train': 1.7638386487960815} -11/06/2021 23:48:18 - INFO - __main__ - Step 18116: {'lr': 0.00048551535215584865, 'samples': 3478272, 'steps': 18115, 'loss/train': 2.0963571071624756} -11/06/2021 23:48:18 - INFO - __main__ - Step 18117: {'lr': 0.00048551357200602265, 'samples': 3478464, 'steps': 18116, 'loss/train': 2.086501359939575} -11/06/2021 23:48:18 - INFO - __main__ - Step 18118: {'lr': 0.0004855117917500778, 'samples': 3478656, 'steps': 18117, 'loss/train': 1.9306416511535645} -11/06/2021 23:48:19 - INFO - __main__ - Step 18119: {'lr': 0.000485510011388015, 'samples': 3478848, 'steps': 18118, 'loss/train': 1.378063440322876} -11/06/2021 23:48:20 - INFO - __main__ - Step 18120: {'lr': 0.00048550823091983507, 'samples': 3479040, 'steps': 18119, 'loss/train': 1.7439087629318237} -11/06/2021 23:48:20 - INFO - __main__ - Step 18121: {'lr': 0.00048550645034553877, 'samples': 3479232, 'steps': 18120, 'loss/train': 1.3175225257873535} -11/06/2021 23:48:21 - INFO - __main__ - Step 18122: {'lr': 0.00048550466966512684, 'samples': 3479424, 'steps': 18121, 'loss/train': 1.7445465326309204} -11/06/2021 23:48:21 - INFO - __main__ - Step 18123: {'lr': 0.0004855028888786002, 'samples': 3479616, 'steps': 18122, 'loss/train': 1.4202873706817627} -11/06/2021 23:48:21 - INFO - __main__ - Step 18124: {'lr': 0.00048550110798595953, 'samples': 3479808, 'steps': 18123, 'loss/train': 1.469502568244934} -11/06/2021 23:48:23 - INFO - __main__ - Step 18125: {'lr': 0.0004854993269872057, 'samples': 3480000, 'steps': 18124, 'loss/train': 1.5502510070800781} -11/06/2021 23:48:23 - INFO - __main__ - Step 18126: {'lr': 0.0004854975458823396, 'samples': 3480192, 'steps': 18125, 'loss/train': 1.8614351749420166} -11/06/2021 23:48:23 - INFO - __main__ - Step 18127: {'lr': 0.0004854957646713618, 'samples': 3480384, 'steps': 18126, 'loss/train': 1.5096491575241089} -11/06/2021 23:48:24 - INFO - __main__ - Step 18128: {'lr': 0.00048549398335427337, 'samples': 3480576, 'steps': 18127, 'loss/train': 1.1223576068878174} -11/06/2021 23:48:24 - INFO - __main__ - Step 18129: {'lr': 0.0004854922019310749, 'samples': 3480768, 'steps': 18128, 'loss/train': 1.9551997184753418} -11/06/2021 23:48:25 - INFO - __main__ - Step 18130: {'lr': 0.0004854904204017673, 'samples': 3480960, 'steps': 18129, 'loss/train': 1.7446837425231934} -11/06/2021 23:48:25 - INFO - __main__ - Step 18131: {'lr': 0.0004854886387663514, 'samples': 3481152, 'steps': 18130, 'loss/train': 1.8030678033828735} -11/06/2021 23:48:26 - INFO - __main__ - Step 18132: {'lr': 0.0004854868570248279, 'samples': 3481344, 'steps': 18131, 'loss/train': 1.1974247694015503} -11/06/2021 23:48:26 - INFO - __main__ - Step 18133: {'lr': 0.00048548507517719766, 'samples': 3481536, 'steps': 18132, 'loss/train': 1.9085829257965088} -11/06/2021 23:48:26 - INFO - __main__ - Step 18134: {'lr': 0.0004854832932234615, 'samples': 3481728, 'steps': 18133, 'loss/train': 2.1923718452453613} -11/06/2021 23:48:27 - INFO - __main__ - Step 18135: {'lr': 0.0004854815111636202, 'samples': 3481920, 'steps': 18134, 'loss/train': 1.6197718381881714} -11/06/2021 23:48:28 - INFO - __main__ - Step 18136: {'lr': 0.00048547972899767454, 'samples': 3482112, 'steps': 18135, 'loss/train': 1.999104380607605} -11/06/2021 23:48:28 - INFO - __main__ - Step 18137: {'lr': 0.0004854779467256254, 'samples': 3482304, 'steps': 18136, 'loss/train': 1.6554611921310425} -11/06/2021 23:48:28 - INFO - __main__ - Step 18138: {'lr': 0.00048547616434747344, 'samples': 3482496, 'steps': 18137, 'loss/train': 1.7606922388076782} -11/06/2021 23:48:29 - INFO - __main__ - Step 18139: {'lr': 0.0004854743818632196, 'samples': 3482688, 'steps': 18138, 'loss/train': 0.9624412655830383} -11/06/2021 23:48:30 - INFO - __main__ - Step 18140: {'lr': 0.0004854725992728647, 'samples': 3482880, 'steps': 18139, 'loss/train': 1.5731804370880127} -11/06/2021 23:48:30 - INFO - __main__ - Step 18141: {'lr': 0.00048547081657640935, 'samples': 3483072, 'steps': 18140, 'loss/train': 1.5403448343276978} -11/06/2021 23:48:30 - INFO - __main__ - Step 18142: {'lr': 0.00048546903377385457, 'samples': 3483264, 'steps': 18141, 'loss/train': 1.5687254667282104} -11/06/2021 23:48:31 - INFO - __main__ - Step 18143: {'lr': 0.00048546725086520107, 'samples': 3483456, 'steps': 18142, 'loss/train': 1.6424126625061035} -11/06/2021 23:48:31 - INFO - __main__ - Step 18144: {'lr': 0.00048546546785044965, 'samples': 3483648, 'steps': 18143, 'loss/train': 1.4351774454116821} -11/06/2021 23:48:32 - INFO - __main__ - Step 18145: {'lr': 0.00048546368472960114, 'samples': 3483840, 'steps': 18144, 'loss/train': 1.7238658666610718} -11/06/2021 23:48:33 - INFO - __main__ - Step 18146: {'lr': 0.00048546190150265634, 'samples': 3484032, 'steps': 18145, 'loss/train': 1.5560191869735718} -11/06/2021 23:48:33 - INFO - __main__ - Step 18147: {'lr': 0.00048546011816961597, 'samples': 3484224, 'steps': 18146, 'loss/train': 1.6255768537521362} -11/06/2021 23:48:33 - INFO - __main__ - Step 18148: {'lr': 0.00048545833473048094, 'samples': 3484416, 'steps': 18147, 'loss/train': 1.2934846878051758} -11/06/2021 23:48:34 - INFO - __main__ - Step 18149: {'lr': 0.00048545655118525206, 'samples': 3484608, 'steps': 18148, 'loss/train': 1.6034213304519653} -11/06/2021 23:48:34 - INFO - __main__ - Step 18150: {'lr': 0.00048545476753393004, 'samples': 3484800, 'steps': 18149, 'loss/train': 1.2205133438110352} -11/06/2021 23:48:35 - INFO - __main__ - Step 18151: {'lr': 0.0004854529837765158, 'samples': 3484992, 'steps': 18150, 'loss/train': 1.9434911012649536} -11/06/2021 23:48:35 - INFO - __main__ - Step 18152: {'lr': 0.00048545119991301, 'samples': 3485184, 'steps': 18151, 'loss/train': 1.9763034582138062} -11/06/2021 23:48:36 - INFO - __main__ - Step 18153: {'lr': 0.0004854494159434135, 'samples': 3485376, 'steps': 18152, 'loss/train': 1.8863459825515747} -11/06/2021 23:48:36 - INFO - __main__ - Step 18154: {'lr': 0.0004854476318677272, 'samples': 3485568, 'steps': 18153, 'loss/train': 1.7033888101577759} -11/06/2021 23:48:36 - INFO - __main__ - Step 18155: {'lr': 0.00048544584768595185, 'samples': 3485760, 'steps': 18154, 'loss/train': 1.6517353057861328} -11/06/2021 23:48:37 - INFO - __main__ - Step 18156: {'lr': 0.00048544406339808823, 'samples': 3485952, 'steps': 18155, 'loss/train': 1.6695486307144165} -11/06/2021 23:48:38 - INFO - __main__ - Step 18157: {'lr': 0.00048544227900413706, 'samples': 3486144, 'steps': 18156, 'loss/train': 1.761330008506775} -11/06/2021 23:48:38 - INFO - __main__ - Step 18158: {'lr': 0.0004854404945040993, 'samples': 3486336, 'steps': 18157, 'loss/train': 1.339409589767456} -11/06/2021 23:48:38 - INFO - __main__ - Step 18159: {'lr': 0.0004854387098979757, 'samples': 3486528, 'steps': 18158, 'loss/train': 1.1606993675231934} -11/06/2021 23:48:39 - INFO - __main__ - Step 18160: {'lr': 0.000485436925185767, 'samples': 3486720, 'steps': 18159, 'loss/train': 2.2796413898468018} -11/06/2021 23:48:40 - INFO - __main__ - Step 18161: {'lr': 0.00048543514036747404, 'samples': 3486912, 'steps': 18160, 'loss/train': 1.5005325078964233} -11/06/2021 23:48:40 - INFO - __main__ - Step 18162: {'lr': 0.00048543335544309776, 'samples': 3487104, 'steps': 18161, 'loss/train': 1.5606443881988525} -11/06/2021 23:48:41 - INFO - __main__ - Step 18163: {'lr': 0.00048543157041263876, 'samples': 3487296, 'steps': 18162, 'loss/train': 1.3241081237792969} -11/06/2021 23:48:41 - INFO - __main__ - Step 18164: {'lr': 0.0004854297852760979, 'samples': 3487488, 'steps': 18163, 'loss/train': 1.3601914644241333} -11/06/2021 23:48:41 - INFO - __main__ - Step 18165: {'lr': 0.000485428000033476, 'samples': 3487680, 'steps': 18164, 'loss/train': 1.6403565406799316} -11/06/2021 23:48:42 - INFO - __main__ - Step 18166: {'lr': 0.00048542621468477393, 'samples': 3487872, 'steps': 18165, 'loss/train': 1.740988850593567} -11/06/2021 23:48:43 - INFO - __main__ - Step 18167: {'lr': 0.0004854244292299924, 'samples': 3488064, 'steps': 18166, 'loss/train': 1.6933728456497192} -11/06/2021 23:48:43 - INFO - __main__ - Step 18168: {'lr': 0.0004854226436691323, 'samples': 3488256, 'steps': 18167, 'loss/train': 2.1075711250305176} -11/06/2021 23:48:43 - INFO - __main__ - Step 18169: {'lr': 0.0004854208580021944, 'samples': 3488448, 'steps': 18168, 'loss/train': 1.6747791767120361} -11/06/2021 23:48:44 - INFO - __main__ - Step 18170: {'lr': 0.00048541907222917946, 'samples': 3488640, 'steps': 18169, 'loss/train': 1.5540307760238647} -11/06/2021 23:48:45 - INFO - __main__ - Step 18171: {'lr': 0.0004854172863500883, 'samples': 3488832, 'steps': 18170, 'loss/train': 1.7926479578018188} -11/06/2021 23:48:45 - INFO - __main__ - Step 18172: {'lr': 0.00048541550036492175, 'samples': 3489024, 'steps': 18171, 'loss/train': 1.5982003211975098} -11/06/2021 23:48:45 - INFO - __main__ - Step 18173: {'lr': 0.00048541371427368064, 'samples': 3489216, 'steps': 18172, 'loss/train': 1.605031967163086} -11/06/2021 23:48:46 - INFO - __main__ - Step 18174: {'lr': 0.0004854119280763657, 'samples': 3489408, 'steps': 18173, 'loss/train': 2.03631329536438} -11/06/2021 23:48:46 - INFO - __main__ - Step 18175: {'lr': 0.00048541014177297783, 'samples': 3489600, 'steps': 18174, 'loss/train': 1.3513402938842773} -11/06/2021 23:48:46 - INFO - __main__ - Step 18176: {'lr': 0.0004854083553635178, 'samples': 3489792, 'steps': 18175, 'loss/train': 2.2017154693603516} -11/06/2021 23:48:48 - INFO - __main__ - Step 18177: {'lr': 0.00048540656884798626, 'samples': 3489984, 'steps': 18176, 'loss/train': 1.6572513580322266} -11/06/2021 23:48:48 - INFO - __main__ - Step 18178: {'lr': 0.0004854047822263843, 'samples': 3490176, 'steps': 18177, 'loss/train': 1.844321608543396} -11/06/2021 23:48:48 - INFO - __main__ - Step 18179: {'lr': 0.00048540299549871256, 'samples': 3490368, 'steps': 18178, 'loss/train': 1.7020295858383179} -11/06/2021 23:48:49 - INFO - __main__ - Step 18180: {'lr': 0.0004854012086649718, 'samples': 3490560, 'steps': 18179, 'loss/train': 0.9979807734489441} -11/06/2021 23:48:49 - INFO - __main__ - Step 18181: {'lr': 0.00048539942172516295, 'samples': 3490752, 'steps': 18180, 'loss/train': 1.2583417892456055} -11/06/2021 23:48:50 - INFO - __main__ - Step 18182: {'lr': 0.00048539763467928665, 'samples': 3490944, 'steps': 18181, 'loss/train': 1.8729602098464966} -11/06/2021 23:48:50 - INFO - __main__ - Step 18183: {'lr': 0.0004853958475273439, 'samples': 3491136, 'steps': 18182, 'loss/train': 1.4147400856018066} -11/06/2021 23:48:51 - INFO - __main__ - Step 18184: {'lr': 0.0004853940602693354, 'samples': 3491328, 'steps': 18183, 'loss/train': 1.536829948425293} -11/06/2021 23:48:51 - INFO - __main__ - Step 18185: {'lr': 0.00048539227290526194, 'samples': 3491520, 'steps': 18184, 'loss/train': 1.2431416511535645} -11/06/2021 23:48:51 - INFO - __main__ - Step 18186: {'lr': 0.00048539048543512443, 'samples': 3491712, 'steps': 18185, 'loss/train': 1.6529532670974731} -11/06/2021 23:48:52 - INFO - __main__ - Step 18187: {'lr': 0.0004853886978589235, 'samples': 3491904, 'steps': 18186, 'loss/train': 1.608051061630249} -11/06/2021 23:48:53 - INFO - __main__ - Step 18188: {'lr': 0.0004853869101766601, 'samples': 3492096, 'steps': 18187, 'loss/train': 1.734632134437561} -11/06/2021 23:48:53 - INFO - __main__ - Step 18189: {'lr': 0.000485385122388335, 'samples': 3492288, 'steps': 18188, 'loss/train': 1.8401646614074707} -11/06/2021 23:48:53 - INFO - __main__ - Step 18190: {'lr': 0.000485383334493949, 'samples': 3492480, 'steps': 18189, 'loss/train': 1.6987266540527344} -11/06/2021 23:48:54 - INFO - __main__ - Step 18191: {'lr': 0.00048538154649350286, 'samples': 3492672, 'steps': 18190, 'loss/train': 1.5722284317016602} -11/06/2021 23:48:55 - INFO - __main__ - Step 18192: {'lr': 0.00048537975838699744, 'samples': 3492864, 'steps': 18191, 'loss/train': 1.4871503114700317} -11/06/2021 23:48:55 - INFO - __main__ - Step 18193: {'lr': 0.0004853779701744335, 'samples': 3493056, 'steps': 18192, 'loss/train': 1.6807981729507446} -11/06/2021 23:48:56 - INFO - __main__ - Step 18194: {'lr': 0.000485376181855812, 'samples': 3493248, 'steps': 18193, 'loss/train': 1.6861616373062134} -11/06/2021 23:48:56 - INFO - __main__ - Step 18195: {'lr': 0.00048537439343113354, 'samples': 3493440, 'steps': 18194, 'loss/train': 1.648136854171753} -11/06/2021 23:48:56 - INFO - __main__ - Step 18196: {'lr': 0.000485372604900399, 'samples': 3493632, 'steps': 18195, 'loss/train': 2.172215223312378} -11/06/2021 23:48:57 - INFO - __main__ - Step 18197: {'lr': 0.0004853708162636092, 'samples': 3493824, 'steps': 18196, 'loss/train': 1.964274525642395} -11/06/2021 23:48:58 - INFO - __main__ - Step 18198: {'lr': 0.00048536902752076494, 'samples': 3494016, 'steps': 18197, 'loss/train': 1.6822305917739868} -11/06/2021 23:48:58 - INFO - __main__ - Step 18199: {'lr': 0.00048536723867186705, 'samples': 3494208, 'steps': 18198, 'loss/train': 1.7284069061279297} -11/06/2021 23:48:58 - INFO - __main__ - Step 18200: {'lr': 0.0004853654497169163, 'samples': 3494400, 'steps': 18199, 'loss/train': 1.4523322582244873} -11/06/2021 23:48:59 - INFO - __main__ - Step 18201: {'lr': 0.00048536366065591354, 'samples': 3494592, 'steps': 18200, 'loss/train': 1.2845325469970703} -11/06/2021 23:49:00 - INFO - __main__ - Step 18202: {'lr': 0.00048536187148885956, 'samples': 3494784, 'steps': 18201, 'loss/train': 1.542911171913147} -11/06/2021 23:49:00 - INFO - __main__ - Step 18203: {'lr': 0.0004853600822157551, 'samples': 3494976, 'steps': 18202, 'loss/train': 1.685224175453186} -11/06/2021 23:49:00 - INFO - __main__ - Step 18204: {'lr': 0.000485358292836601, 'samples': 3495168, 'steps': 18203, 'loss/train': 2.2215311527252197} -11/06/2021 23:49:01 - INFO - __main__ - Step 18205: {'lr': 0.0004853565033513982, 'samples': 3495360, 'steps': 18204, 'loss/train': 1.5674799680709839} -11/06/2021 23:49:01 - INFO - __main__ - Step 18206: {'lr': 0.0004853547137601473, 'samples': 3495552, 'steps': 18205, 'loss/train': 1.1350946426391602} -11/06/2021 23:49:01 - INFO - __main__ - Step 18207: {'lr': 0.0004853529240628493, 'samples': 3495744, 'steps': 18206, 'loss/train': 1.7013306617736816} -11/06/2021 23:49:02 - INFO - __main__ - Step 18208: {'lr': 0.00048535113425950474, 'samples': 3495936, 'steps': 18207, 'loss/train': 1.4981727600097656} -11/06/2021 23:49:03 - INFO - __main__ - Step 18209: {'lr': 0.0004853493443501147, 'samples': 3496128, 'steps': 18208, 'loss/train': 1.4328523874282837} -11/06/2021 23:49:03 - INFO - __main__ - Step 18210: {'lr': 0.0004853475543346798, 'samples': 3496320, 'steps': 18209, 'loss/train': 1.8389379978179932} -11/06/2021 23:49:04 - INFO - __main__ - Step 18211: {'lr': 0.000485345764213201, 'samples': 3496512, 'steps': 18210, 'loss/train': 1.694120168685913} -11/06/2021 23:49:04 - INFO - __main__ - Step 18212: {'lr': 0.00048534397398567895, 'samples': 3496704, 'steps': 18211, 'loss/train': 1.3739075660705566} -11/06/2021 23:49:05 - INFO - __main__ - Step 18213: {'lr': 0.00048534218365211456, 'samples': 3496896, 'steps': 18212, 'loss/train': 1.0421340465545654} -11/06/2021 23:49:05 - INFO - __main__ - Step 18214: {'lr': 0.0004853403932125087, 'samples': 3497088, 'steps': 18213, 'loss/train': 1.7056995630264282} -11/06/2021 23:49:06 - INFO - __main__ - Step 18215: {'lr': 0.00048533860266686203, 'samples': 3497280, 'steps': 18214, 'loss/train': 1.6891775131225586} -11/06/2021 23:49:06 - INFO - __main__ - Step 18216: {'lr': 0.0004853368120151754, 'samples': 3497472, 'steps': 18215, 'loss/train': 2.0772011280059814} -11/06/2021 23:49:06 - INFO - __main__ - Step 18217: {'lr': 0.00048533502125744967, 'samples': 3497664, 'steps': 18216, 'loss/train': 1.8108474016189575} -11/06/2021 23:49:07 - INFO - __main__ - Step 18218: {'lr': 0.0004853332303936856, 'samples': 3497856, 'steps': 18217, 'loss/train': 1.2649246454238892} -11/06/2021 23:49:08 - INFO - __main__ - Step 18219: {'lr': 0.000485331439423884, 'samples': 3498048, 'steps': 18218, 'loss/train': 1.977997899055481} -11/06/2021 23:49:08 - INFO - __main__ - Step 18220: {'lr': 0.00048532964834804566, 'samples': 3498240, 'steps': 18219, 'loss/train': 1.0719574689865112} -11/06/2021 23:49:08 - INFO - __main__ - Step 18221: {'lr': 0.00048532785716617145, 'samples': 3498432, 'steps': 18220, 'loss/train': 1.237172245979309} -11/06/2021 23:49:09 - INFO - __main__ - Step 18222: {'lr': 0.0004853260658782621, 'samples': 3498624, 'steps': 18221, 'loss/train': 2.3552660942077637} -11/06/2021 23:49:10 - INFO - __main__ - Step 18223: {'lr': 0.0004853242744843185, 'samples': 3498816, 'steps': 18222, 'loss/train': 1.9997755289077759} -11/06/2021 23:49:10 - INFO - __main__ - Step 18224: {'lr': 0.0004853224829843414, 'samples': 3499008, 'steps': 18223, 'loss/train': 1.524446964263916} -11/06/2021 23:49:10 - INFO - __main__ - Step 18225: {'lr': 0.00048532069137833156, 'samples': 3499200, 'steps': 18224, 'loss/train': 1.5553361177444458} -11/06/2021 23:49:11 - INFO - __main__ - Step 18226: {'lr': 0.00048531889966628997, 'samples': 3499392, 'steps': 18225, 'loss/train': 1.2492296695709229} -11/06/2021 23:49:11 - INFO - __main__ - Step 18227: {'lr': 0.00048531710784821726, 'samples': 3499584, 'steps': 18226, 'loss/train': 1.625084638595581} -11/06/2021 23:49:12 - INFO - __main__ - Step 18228: {'lr': 0.0004853153159241143, 'samples': 3499776, 'steps': 18227, 'loss/train': 2.811218500137329} -11/06/2021 23:49:12 - INFO - __main__ - Step 18229: {'lr': 0.0004853135238939818, 'samples': 3499968, 'steps': 18228, 'loss/train': 1.670412540435791} -11/06/2021 23:49:13 - INFO - __main__ - Step 18230: {'lr': 0.0004853117317578207, 'samples': 3500160, 'steps': 18229, 'loss/train': 1.9822686910629272} -11/06/2021 23:49:13 - INFO - __main__ - Step 18231: {'lr': 0.00048530993951563186, 'samples': 3500352, 'steps': 18230, 'loss/train': 1.3493831157684326} -11/06/2021 23:49:14 - INFO - __main__ - Step 18232: {'lr': 0.0004853081471674159, 'samples': 3500544, 'steps': 18231, 'loss/train': 1.558580994606018} -11/06/2021 23:49:14 - INFO - __main__ - Step 18233: {'lr': 0.00048530635471317373, 'samples': 3500736, 'steps': 18232, 'loss/train': 1.388440489768982} -11/06/2021 23:49:15 - INFO - __main__ - Step 18234: {'lr': 0.0004853045621529062, 'samples': 3500928, 'steps': 18233, 'loss/train': 1.910845160484314} -11/06/2021 23:49:15 - INFO - __main__ - Step 18235: {'lr': 0.000485302769486614, 'samples': 3501120, 'steps': 18234, 'loss/train': 0.8962222337722778} -11/06/2021 23:49:16 - INFO - __main__ - Step 18236: {'lr': 0.000485300976714298, 'samples': 3501312, 'steps': 18235, 'loss/train': 1.7857457399368286} -11/06/2021 23:49:16 - INFO - __main__ - Step 18237: {'lr': 0.00048529918383595906, 'samples': 3501504, 'steps': 18236, 'loss/train': 1.4741995334625244} -11/06/2021 23:49:16 - INFO - __main__ - Step 18238: {'lr': 0.0004852973908515979, 'samples': 3501696, 'steps': 18237, 'loss/train': 1.837266206741333} -11/06/2021 23:49:17 - INFO - __main__ - Step 18239: {'lr': 0.0004852955977612154, 'samples': 3501888, 'steps': 18238, 'loss/train': 1.7000993490219116} -11/06/2021 23:49:18 - INFO - __main__ - Step 18240: {'lr': 0.0004852938045648123, 'samples': 3502080, 'steps': 18239, 'loss/train': 1.7775219678878784} -11/06/2021 23:49:18 - INFO - __main__ - Step 18241: {'lr': 0.0004852920112623895, 'samples': 3502272, 'steps': 18240, 'loss/train': 1.721117615699768} -11/06/2021 23:49:18 - INFO - __main__ - Step 18242: {'lr': 0.00048529021785394765, 'samples': 3502464, 'steps': 18241, 'loss/train': 1.123333215713501} -11/06/2021 23:49:19 - INFO - __main__ - Step 18243: {'lr': 0.00048528842433948776, 'samples': 3502656, 'steps': 18242, 'loss/train': 2.0293686389923096} -11/06/2021 23:49:20 - INFO - __main__ - Step 18244: {'lr': 0.00048528663071901047, 'samples': 3502848, 'steps': 18243, 'loss/train': 1.9051157236099243} -11/06/2021 23:49:20 - INFO - __main__ - Step 18245: {'lr': 0.0004852848369925167, 'samples': 3503040, 'steps': 18244, 'loss/train': 1.5317625999450684} -11/06/2021 23:49:21 - INFO - __main__ - Step 18246: {'lr': 0.00048528304316000723, 'samples': 3503232, 'steps': 18245, 'loss/train': 1.8175814151763916} -11/06/2021 23:49:21 - INFO - __main__ - Step 18247: {'lr': 0.0004852812492214828, 'samples': 3503424, 'steps': 18246, 'loss/train': 1.8638849258422852} -11/06/2021 23:49:21 - INFO - __main__ - Step 18248: {'lr': 0.0004852794551769443, 'samples': 3503616, 'steps': 18247, 'loss/train': 1.8089745044708252} -11/06/2021 23:49:22 - INFO - __main__ - Step 18249: {'lr': 0.0004852776610263925, 'samples': 3503808, 'steps': 18248, 'loss/train': 1.6794166564941406} -11/06/2021 23:49:23 - INFO - __main__ - Step 18250: {'lr': 0.0004852758667698282, 'samples': 3504000, 'steps': 18249, 'loss/train': 1.3067717552185059} -11/06/2021 23:49:23 - INFO - __main__ - Step 18251: {'lr': 0.00048527407240725223, 'samples': 3504192, 'steps': 18250, 'loss/train': 2.015906810760498} -11/06/2021 23:49:23 - INFO - __main__ - Step 18252: {'lr': 0.0004852722779386654, 'samples': 3504384, 'steps': 18251, 'loss/train': 0.8979371786117554} -11/06/2021 23:49:24 - INFO - __main__ - Step 18253: {'lr': 0.00048527048336406855, 'samples': 3504576, 'steps': 18252, 'loss/train': 1.830647587776184} -11/06/2021 23:49:24 - INFO - __main__ - Step 18254: {'lr': 0.00048526868868346243, 'samples': 3504768, 'steps': 18253, 'loss/train': 1.9769741296768188} -11/06/2021 23:49:25 - INFO - __main__ - Step 18255: {'lr': 0.0004852668938968478, 'samples': 3504960, 'steps': 18254, 'loss/train': 1.7995449304580688} -11/06/2021 23:49:25 - INFO - __main__ - Step 18256: {'lr': 0.0004852650990042256, 'samples': 3505152, 'steps': 18255, 'loss/train': 1.704633116722107} -11/06/2021 23:49:26 - INFO - __main__ - Step 18257: {'lr': 0.0004852633040055966, 'samples': 3505344, 'steps': 18256, 'loss/train': 0.9128971695899963} -11/06/2021 23:49:26 - INFO - __main__ - Step 18258: {'lr': 0.00048526150890096153, 'samples': 3505536, 'steps': 18257, 'loss/train': 1.5316613912582397} -11/06/2021 23:49:26 - INFO - __main__ - Step 18259: {'lr': 0.0004852597136903213, 'samples': 3505728, 'steps': 18258, 'loss/train': 1.312677264213562} -11/06/2021 23:49:28 - INFO - __main__ - Step 18260: {'lr': 0.0004852579183736766, 'samples': 3505920, 'steps': 18259, 'loss/train': 1.4250472784042358} -11/06/2021 23:49:28 - INFO - __main__ - Step 18261: {'lr': 0.00048525612295102836, 'samples': 3506112, 'steps': 18260, 'loss/train': 1.6988489627838135} -11/06/2021 23:49:28 - INFO - __main__ - Step 18262: {'lr': 0.00048525432742237736, 'samples': 3506304, 'steps': 18261, 'loss/train': 1.2453324794769287} -11/06/2021 23:49:29 - INFO - __main__ - Step 18263: {'lr': 0.00048525253178772435, 'samples': 3506496, 'steps': 18262, 'loss/train': 0.8945806622505188} -11/06/2021 23:49:29 - INFO - __main__ - Step 18264: {'lr': 0.0004852507360470702, 'samples': 3506688, 'steps': 18263, 'loss/train': 1.7507184743881226} -11/06/2021 23:49:30 - INFO - __main__ - Step 18265: {'lr': 0.0004852489402004157, 'samples': 3506880, 'steps': 18264, 'loss/train': 1.6482011079788208} -11/06/2021 23:49:30 - INFO - __main__ - Step 18266: {'lr': 0.0004852471442477617, 'samples': 3507072, 'steps': 18265, 'loss/train': 1.300549864768982} -11/06/2021 23:49:31 - INFO - __main__ - Step 18267: {'lr': 0.0004852453481891089, 'samples': 3507264, 'steps': 18266, 'loss/train': 1.42025887966156} -11/06/2021 23:49:31 - INFO - __main__ - Step 18268: {'lr': 0.00048524355202445827, 'samples': 3507456, 'steps': 18267, 'loss/train': 1.4363129138946533} -11/06/2021 23:49:31 - INFO - __main__ - Step 18269: {'lr': 0.0004852417557538104, 'samples': 3507648, 'steps': 18268, 'loss/train': 1.8137376308441162} -11/06/2021 23:49:32 - INFO - __main__ - Step 18270: {'lr': 0.00048523995937716625, 'samples': 3507840, 'steps': 18269, 'loss/train': 1.8509377241134644} -11/06/2021 23:49:33 - INFO - __main__ - Step 18271: {'lr': 0.0004852381628945267, 'samples': 3508032, 'steps': 18270, 'loss/train': 1.3168461322784424} -11/06/2021 23:49:33 - INFO - __main__ - Step 18272: {'lr': 0.0004852363663058924, 'samples': 3508224, 'steps': 18271, 'loss/train': 1.526947259902954} -11/06/2021 23:49:33 - INFO - __main__ - Step 18273: {'lr': 0.0004852345696112642, 'samples': 3508416, 'steps': 18272, 'loss/train': 1.773221492767334} -11/06/2021 23:49:34 - INFO - __main__ - Step 18274: {'lr': 0.00048523277281064295, 'samples': 3508608, 'steps': 18273, 'loss/train': 1.244134545326233} -11/06/2021 23:49:35 - INFO - __main__ - Step 18275: {'lr': 0.0004852309759040294, 'samples': 3508800, 'steps': 18274, 'loss/train': 1.7051624059677124} -11/06/2021 23:49:35 - INFO - __main__ - Step 18276: {'lr': 0.00048522917889142446, 'samples': 3508992, 'steps': 18275, 'loss/train': 1.3719818592071533} -11/06/2021 23:49:36 - INFO - __main__ - Step 18277: {'lr': 0.00048522738177282887, 'samples': 3509184, 'steps': 18276, 'loss/train': 1.7115142345428467} -11/06/2021 23:49:36 - INFO - __main__ - Step 18278: {'lr': 0.0004852255845482435, 'samples': 3509376, 'steps': 18277, 'loss/train': 1.9277666807174683} -11/06/2021 23:49:36 - INFO - __main__ - Step 18279: {'lr': 0.0004852237872176691, 'samples': 3509568, 'steps': 18278, 'loss/train': 1.5939767360687256} -11/06/2021 23:49:37 - INFO - __main__ - Step 18280: {'lr': 0.00048522198978110645, 'samples': 3509760, 'steps': 18279, 'loss/train': 1.7465685606002808} -11/06/2021 23:49:38 - INFO - __main__ - Step 18281: {'lr': 0.0004852201922385564, 'samples': 3509952, 'steps': 18280, 'loss/train': 1.4472709894180298} -11/06/2021 23:49:38 - INFO - __main__ - Step 18282: {'lr': 0.00048521839459001977, 'samples': 3510144, 'steps': 18281, 'loss/train': 4.651975154876709} -11/06/2021 23:49:38 - INFO - __main__ - Step 18283: {'lr': 0.0004852165968354973, 'samples': 3510336, 'steps': 18282, 'loss/train': 1.702797532081604} -11/06/2021 23:49:39 - INFO - __main__ - Step 18284: {'lr': 0.00048521479897499, 'samples': 3510528, 'steps': 18283, 'loss/train': 0.8926244378089905} -11/06/2021 23:49:39 - INFO - __main__ - Step 18285: {'lr': 0.0004852130010084984, 'samples': 3510720, 'steps': 18284, 'loss/train': 1.6344717741012573} -11/06/2021 23:49:40 - INFO - __main__ - Step 18286: {'lr': 0.0004852112029360235, 'samples': 3510912, 'steps': 18285, 'loss/train': 1.0488026142120361} -11/06/2021 23:49:41 - INFO - __main__ - Step 18287: {'lr': 0.0004852094047575661, 'samples': 3511104, 'steps': 18286, 'loss/train': 0.9467637538909912} -11/06/2021 23:49:41 - INFO - __main__ - Step 18288: {'lr': 0.00048520760647312696, 'samples': 3511296, 'steps': 18287, 'loss/train': 1.3265576362609863} -11/06/2021 23:49:41 - INFO - __main__ - Step 18289: {'lr': 0.00048520580808270687, 'samples': 3511488, 'steps': 18288, 'loss/train': 1.6178340911865234} -11/06/2021 23:49:42 - INFO - __main__ - Step 18290: {'lr': 0.0004852040095863067, 'samples': 3511680, 'steps': 18289, 'loss/train': 1.1068137884140015} -11/06/2021 23:49:43 - INFO - __main__ - Step 18291: {'lr': 0.0004852022109839273, 'samples': 3511872, 'steps': 18290, 'loss/train': 1.9344698190689087} -11/06/2021 23:49:43 - INFO - __main__ - Step 18292: {'lr': 0.0004852004122755693, 'samples': 3512064, 'steps': 18291, 'loss/train': 1.2475080490112305} -11/06/2021 23:49:43 - INFO - __main__ - Step 18293: {'lr': 0.00048519861346123363, 'samples': 3512256, 'steps': 18292, 'loss/train': 1.8506364822387695} -11/06/2021 23:49:44 - INFO - __main__ - Step 18294: {'lr': 0.0004851968145409211, 'samples': 3512448, 'steps': 18293, 'loss/train': 1.8689836263656616} -11/06/2021 23:49:44 - INFO - __main__ - Step 18295: {'lr': 0.00048519501551463255, 'samples': 3512640, 'steps': 18294, 'loss/train': 1.9257316589355469} -11/06/2021 23:49:45 - INFO - __main__ - Step 18296: {'lr': 0.0004851932163823688, 'samples': 3512832, 'steps': 18295, 'loss/train': 1.4464284181594849} -11/06/2021 23:49:45 - INFO - __main__ - Step 18297: {'lr': 0.0004851914171441305, 'samples': 3513024, 'steps': 18296, 'loss/train': 1.7276997566223145} -11/06/2021 23:49:46 - INFO - __main__ - Step 18298: {'lr': 0.00048518961779991866, 'samples': 3513216, 'steps': 18297, 'loss/train': 2.2795534133911133} -11/06/2021 23:49:46 - INFO - __main__ - Step 18299: {'lr': 0.00048518781834973405, 'samples': 3513408, 'steps': 18298, 'loss/train': 1.8023676872253418} -11/06/2021 23:49:46 - INFO - __main__ - Step 18300: {'lr': 0.0004851860187935773, 'samples': 3513600, 'steps': 18299, 'loss/train': 1.8043395280838013} -11/06/2021 23:49:47 - INFO - __main__ - Step 18301: {'lr': 0.0004851842191314494, 'samples': 3513792, 'steps': 18300, 'loss/train': 1.7995017766952515} -11/06/2021 23:49:48 - INFO - __main__ - Step 18302: {'lr': 0.0004851824193633512, 'samples': 3513984, 'steps': 18301, 'loss/train': 1.2116223573684692} -11/06/2021 23:49:48 - INFO - __main__ - Step 18303: {'lr': 0.00048518061948928337, 'samples': 3514176, 'steps': 18302, 'loss/train': 1.6613613367080688} -11/06/2021 23:49:48 - INFO - __main__ - Step 18304: {'lr': 0.0004851788195092468, 'samples': 3514368, 'steps': 18303, 'loss/train': 1.6209909915924072} -11/06/2021 23:49:49 - INFO - __main__ - Step 18305: {'lr': 0.00048517701942324225, 'samples': 3514560, 'steps': 18304, 'loss/train': 1.4889389276504517} -11/06/2021 23:49:50 - INFO - __main__ - Step 18306: {'lr': 0.00048517521923127063, 'samples': 3514752, 'steps': 18305, 'loss/train': 1.5987910032272339} -11/06/2021 23:49:50 - INFO - __main__ - Step 18307: {'lr': 0.00048517341893333267, 'samples': 3514944, 'steps': 18306, 'loss/train': 1.4218535423278809} -11/06/2021 23:49:51 - INFO - __main__ - Step 18308: {'lr': 0.0004851716185294291, 'samples': 3515136, 'steps': 18307, 'loss/train': 1.3307141065597534} -11/06/2021 23:49:51 - INFO - __main__ - Step 18309: {'lr': 0.00048516981801956097, 'samples': 3515328, 'steps': 18308, 'loss/train': 1.0911080837249756} -11/06/2021 23:49:51 - INFO - __main__ - Step 18310: {'lr': 0.00048516801740372886, 'samples': 3515520, 'steps': 18309, 'loss/train': 1.5803437232971191} -11/06/2021 23:49:52 - INFO - __main__ - Step 18311: {'lr': 0.0004851662166819337, 'samples': 3515712, 'steps': 18310, 'loss/train': 1.7632087469100952} -11/06/2021 23:49:53 - INFO - __main__ - Step 18312: {'lr': 0.00048516441585417624, 'samples': 3515904, 'steps': 18311, 'loss/train': 1.3670587539672852} -11/06/2021 23:49:53 - INFO - __main__ - Step 18313: {'lr': 0.0004851626149204573, 'samples': 3516096, 'steps': 18312, 'loss/train': 1.3371531963348389} -11/06/2021 23:49:53 - INFO - __main__ - Step 18314: {'lr': 0.0004851608138807778, 'samples': 3516288, 'steps': 18313, 'loss/train': 1.4870017766952515} -11/06/2021 23:49:54 - INFO - __main__ - Step 18315: {'lr': 0.0004851590127351384, 'samples': 3516480, 'steps': 18314, 'loss/train': 1.754389762878418} -11/06/2021 23:49:54 - INFO - __main__ - Step 18316: {'lr': 0.0004851572114835401, 'samples': 3516672, 'steps': 18315, 'loss/train': 1.351464867591858} -11/06/2021 23:49:55 - INFO - __main__ - Step 18317: {'lr': 0.0004851554101259834, 'samples': 3516864, 'steps': 18316, 'loss/train': 1.2993682622909546} -11/06/2021 23:49:56 - INFO - __main__ - Step 18318: {'lr': 0.00048515360866246943, 'samples': 3517056, 'steps': 18317, 'loss/train': 1.4569814205169678} -11/06/2021 23:49:56 - INFO - __main__ - Step 18319: {'lr': 0.00048515180709299884, 'samples': 3517248, 'steps': 18318, 'loss/train': 1.4474055767059326} -11/06/2021 23:49:56 - INFO - __main__ - Step 18320: {'lr': 0.0004851500054175725, 'samples': 3517440, 'steps': 18319, 'loss/train': 1.655856966972351} -11/06/2021 23:49:57 - INFO - __main__ - Step 18321: {'lr': 0.00048514820363619116, 'samples': 3517632, 'steps': 18320, 'loss/train': 1.7874832153320312} -11/06/2021 23:49:58 - INFO - __main__ - Step 18322: {'lr': 0.0004851464017488556, 'samples': 3517824, 'steps': 18321, 'loss/train': 1.4972641468048096} -11/06/2021 23:49:58 - INFO - __main__ - Step 18323: {'lr': 0.0004851445997555668, 'samples': 3518016, 'steps': 18322, 'loss/train': 1.730514407157898} -11/06/2021 23:49:59 - INFO - __main__ - Step 18324: {'lr': 0.00048514279765632547, 'samples': 3518208, 'steps': 18323, 'loss/train': 1.7246754169464111} -11/06/2021 23:49:59 - INFO - __main__ - Step 18325: {'lr': 0.0004851409954511324, 'samples': 3518400, 'steps': 18324, 'loss/train': 1.5894545316696167} -11/06/2021 23:49:59 - INFO - __main__ - Step 18326: {'lr': 0.0004851391931399884, 'samples': 3518592, 'steps': 18325, 'loss/train': 1.7464122772216797} -11/06/2021 23:50:00 - INFO - __main__ - Step 18327: {'lr': 0.0004851373907228943, 'samples': 3518784, 'steps': 18326, 'loss/train': 0.5367693901062012} -11/06/2021 23:50:01 - INFO - __main__ - Step 18328: {'lr': 0.00048513558819985106, 'samples': 3518976, 'steps': 18327, 'loss/train': 1.6977030038833618} -11/06/2021 23:50:01 - INFO - __main__ - Step 18329: {'lr': 0.0004851337855708592, 'samples': 3519168, 'steps': 18328, 'loss/train': 2.0396475791931152} -11/06/2021 23:50:01 - INFO - __main__ - Step 18330: {'lr': 0.0004851319828359198, 'samples': 3519360, 'steps': 18329, 'loss/train': 1.1017811298370361} -11/06/2021 23:50:02 - INFO - __main__ - Step 18331: {'lr': 0.0004851301799950334, 'samples': 3519552, 'steps': 18330, 'loss/train': 1.9549344778060913} -11/06/2021 23:50:03 - INFO - __main__ - Step 18332: {'lr': 0.00048512837704820107, 'samples': 3519744, 'steps': 18331, 'loss/train': 1.0040029287338257} -11/06/2021 23:50:03 - INFO - __main__ - Step 18333: {'lr': 0.00048512657399542346, 'samples': 3519936, 'steps': 18332, 'loss/train': 1.3319391012191772} -11/06/2021 23:50:04 - INFO - __main__ - Step 18334: {'lr': 0.0004851247708367015, 'samples': 3520128, 'steps': 18333, 'loss/train': 2.4227659702301025} -11/06/2021 23:50:04 - INFO - __main__ - Step 18335: {'lr': 0.000485122967572036, 'samples': 3520320, 'steps': 18334, 'loss/train': 1.6032307147979736} -11/06/2021 23:50:04 - INFO - __main__ - Step 18336: {'lr': 0.0004851211642014276, 'samples': 3520512, 'steps': 18335, 'loss/train': 1.2883901596069336} -11/06/2021 23:50:05 - INFO - __main__ - Step 18337: {'lr': 0.0004851193607248773, 'samples': 3520704, 'steps': 18336, 'loss/train': 1.7592421770095825} -11/06/2021 23:50:06 - INFO - __main__ - Step 18338: {'lr': 0.00048511755714238585, 'samples': 3520896, 'steps': 18337, 'loss/train': 1.8046785593032837} -11/06/2021 23:50:06 - INFO - __main__ - Step 18339: {'lr': 0.0004851157534539541, 'samples': 3521088, 'steps': 18338, 'loss/train': 1.5575534105300903} -11/06/2021 23:50:07 - INFO - __main__ - Step 18340: {'lr': 0.0004851139496595827, 'samples': 3521280, 'steps': 18339, 'loss/train': 2.251190423965454} -11/06/2021 23:50:07 - INFO - __main__ - Step 18341: {'lr': 0.00048511214575927265, 'samples': 3521472, 'steps': 18340, 'loss/train': 2.2171289920806885} -11/06/2021 23:50:07 - INFO - __main__ - Step 18342: {'lr': 0.0004851103417530247, 'samples': 3521664, 'steps': 18341, 'loss/train': 1.7757937908172607} -11/06/2021 23:50:08 - INFO - __main__ - Step 18343: {'lr': 0.0004851085376408396, 'samples': 3521856, 'steps': 18342, 'loss/train': 2.004495143890381} -11/06/2021 23:50:09 - INFO - __main__ - Step 18344: {'lr': 0.0004851067334227183, 'samples': 3522048, 'steps': 18343, 'loss/train': 2.009399175643921} -11/06/2021 23:50:10 - INFO - __main__ - Step 18345: {'lr': 0.0004851049290986615, 'samples': 3522240, 'steps': 18344, 'loss/train': 1.5748186111450195} -11/06/2021 23:50:10 - INFO - __main__ - Step 18346: {'lr': 0.00048510312466867, 'samples': 3522432, 'steps': 18345, 'loss/train': 1.7785025835037231} -11/06/2021 23:50:10 - INFO - __main__ - Step 18347: {'lr': 0.0004851013201327448, 'samples': 3522624, 'steps': 18346, 'loss/train': 1.7600922584533691} -11/06/2021 23:50:11 - INFO - __main__ - Step 18348: {'lr': 0.0004850995154908864, 'samples': 3522816, 'steps': 18347, 'loss/train': 1.7795250415802002} -11/06/2021 23:50:11 - INFO - __main__ - Step 18349: {'lr': 0.0004850977107430959, 'samples': 3523008, 'steps': 18348, 'loss/train': 1.8570597171783447} -11/06/2021 23:50:12 - INFO - __main__ - Step 18350: {'lr': 0.000485095905889374, 'samples': 3523200, 'steps': 18349, 'loss/train': 1.9649345874786377} -11/06/2021 23:50:12 - INFO - __main__ - Step 18351: {'lr': 0.00048509410092972144, 'samples': 3523392, 'steps': 18350, 'loss/train': 1.5948915481567383} -11/06/2021 23:50:13 - INFO - __main__ - Step 18352: {'lr': 0.0004850922958641392, 'samples': 3523584, 'steps': 18351, 'loss/train': 1.2234508991241455} -11/06/2021 23:50:13 - INFO - __main__ - Step 18353: {'lr': 0.0004850904906926279, 'samples': 3523776, 'steps': 18352, 'loss/train': 1.9055534601211548} -11/06/2021 23:50:14 - INFO - __main__ - Step 18354: {'lr': 0.0004850886854151885, 'samples': 3523968, 'steps': 18353, 'loss/train': 1.0320509672164917} -11/06/2021 23:50:14 - INFO - __main__ - Step 18355: {'lr': 0.0004850868800318218, 'samples': 3524160, 'steps': 18354, 'loss/train': 0.8012345433235168} -11/06/2021 23:50:15 - INFO - __main__ - Step 18356: {'lr': 0.00048508507454252846, 'samples': 3524352, 'steps': 18355, 'loss/train': 1.7290698289871216} -11/06/2021 23:50:15 - INFO - __main__ - Step 18357: {'lr': 0.00048508326894730955, 'samples': 3524544, 'steps': 18356, 'loss/train': 1.7813465595245361} -11/06/2021 23:50:16 - INFO - __main__ - Step 18358: {'lr': 0.00048508146324616566, 'samples': 3524736, 'steps': 18357, 'loss/train': 1.5460205078125} -11/06/2021 23:50:16 - INFO - __main__ - Step 18359: {'lr': 0.0004850796574390977, 'samples': 3524928, 'steps': 18358, 'loss/train': 2.392427682876587} -11/06/2021 23:50:16 - INFO - __main__ - Step 18360: {'lr': 0.0004850778515261065, 'samples': 3525120, 'steps': 18359, 'loss/train': 1.592339038848877} -11/06/2021 23:50:17 - INFO - __main__ - Step 18361: {'lr': 0.0004850760455071929, 'samples': 3525312, 'steps': 18360, 'loss/train': 1.4301173686981201} -11/06/2021 23:50:18 - INFO - __main__ - Step 18362: {'lr': 0.0004850742393823576, 'samples': 3525504, 'steps': 18361, 'loss/train': 2.1455750465393066} -11/06/2021 23:50:18 - INFO - __main__ - Step 18363: {'lr': 0.0004850724331516014, 'samples': 3525696, 'steps': 18362, 'loss/train': 1.851510763168335} -11/06/2021 23:50:18 - INFO - __main__ - Step 18364: {'lr': 0.0004850706268149253, 'samples': 3525888, 'steps': 18363, 'loss/train': 1.5681486129760742} -11/06/2021 23:50:19 - INFO - __main__ - Step 18365: {'lr': 0.00048506882037233, 'samples': 3526080, 'steps': 18364, 'loss/train': 1.4631696939468384} -11/06/2021 23:50:20 - INFO - __main__ - Step 18366: {'lr': 0.0004850670138238162, 'samples': 3526272, 'steps': 18365, 'loss/train': 1.7207934856414795} -11/06/2021 23:50:20 - INFO - __main__ - Step 18367: {'lr': 0.00048506520716938496, 'samples': 3526464, 'steps': 18366, 'loss/train': 1.616496205329895} -11/06/2021 23:50:21 - INFO - __main__ - Step 18368: {'lr': 0.00048506340040903697, 'samples': 3526656, 'steps': 18367, 'loss/train': 1.8938003778457642} -11/06/2021 23:50:21 - INFO - __main__ - Step 18369: {'lr': 0.00048506159354277294, 'samples': 3526848, 'steps': 18368, 'loss/train': 1.2933012247085571} -11/06/2021 23:50:21 - INFO - __main__ - Step 18370: {'lr': 0.00048505978657059385, 'samples': 3527040, 'steps': 18369, 'loss/train': 1.8358917236328125} -11/06/2021 23:50:22 - INFO - __main__ - Step 18371: {'lr': 0.0004850579794925004, 'samples': 3527232, 'steps': 18370, 'loss/train': 1.0218453407287598} -11/06/2021 23:50:23 - INFO - __main__ - Step 18372: {'lr': 0.0004850561723084935, 'samples': 3527424, 'steps': 18371, 'loss/train': 1.8021912574768066} -11/06/2021 23:50:23 - INFO - __main__ - Step 18373: {'lr': 0.0004850543650185739, 'samples': 3527616, 'steps': 18372, 'loss/train': 1.755092978477478} -11/06/2021 23:50:23 - INFO - __main__ - Step 18374: {'lr': 0.0004850525576227425, 'samples': 3527808, 'steps': 18373, 'loss/train': 1.9047927856445312} -11/06/2021 23:50:24 - INFO - __main__ - Step 18375: {'lr': 0.000485050750121, 'samples': 3528000, 'steps': 18374, 'loss/train': 1.681142807006836} -11/06/2021 23:50:24 - INFO - __main__ - Step 18376: {'lr': 0.0004850489425133472, 'samples': 3528192, 'steps': 18375, 'loss/train': 2.1112258434295654} -11/06/2021 23:50:25 - INFO - __main__ - Step 18377: {'lr': 0.000485047134799785, 'samples': 3528384, 'steps': 18376, 'loss/train': 1.5793359279632568} -11/06/2021 23:50:25 - INFO - __main__ - Step 18378: {'lr': 0.00048504532698031416, 'samples': 3528576, 'steps': 18377, 'loss/train': 1.8018134832382202} -11/06/2021 23:50:26 - INFO - __main__ - Step 18379: {'lr': 0.0004850435190549356, 'samples': 3528768, 'steps': 18378, 'loss/train': 1.5398601293563843} -11/06/2021 23:50:26 - INFO - __main__ - Step 18380: {'lr': 0.00048504171102365, 'samples': 3528960, 'steps': 18379, 'loss/train': 2.1345901489257812} -11/06/2021 23:50:26 - INFO - __main__ - Step 18381: {'lr': 0.0004850399028864583, 'samples': 3529152, 'steps': 18380, 'loss/train': 1.6549445390701294} -11/06/2021 23:50:27 - INFO - __main__ - Step 18382: {'lr': 0.0004850380946433611, 'samples': 3529344, 'steps': 18381, 'loss/train': 1.5185497999191284} -11/06/2021 23:50:28 - INFO - __main__ - Step 18383: {'lr': 0.00048503628629435947, 'samples': 3529536, 'steps': 18382, 'loss/train': 0.985446572303772} -11/06/2021 23:50:28 - INFO - __main__ - Step 18384: {'lr': 0.0004850344778394541, 'samples': 3529728, 'steps': 18383, 'loss/train': 1.2629421949386597} -11/06/2021 23:50:29 - INFO - __main__ - Step 18385: {'lr': 0.0004850326692786459, 'samples': 3529920, 'steps': 18384, 'loss/train': 1.4181469678878784} -11/06/2021 23:50:29 - INFO - __main__ - Step 18386: {'lr': 0.00048503086061193546, 'samples': 3530112, 'steps': 18385, 'loss/train': 1.1277774572372437} -11/06/2021 23:50:30 - INFO - __main__ - Step 18387: {'lr': 0.0004850290518393238, 'samples': 3530304, 'steps': 18386, 'loss/train': 1.889421820640564} -11/06/2021 23:50:30 - INFO - __main__ - Step 18388: {'lr': 0.0004850272429608117, 'samples': 3530496, 'steps': 18387, 'loss/train': 1.9355649948120117} -11/06/2021 23:50:31 - INFO - __main__ - Step 18389: {'lr': 0.0004850254339764, 'samples': 3530688, 'steps': 18388, 'loss/train': 1.574332356452942} -11/06/2021 23:50:31 - INFO - __main__ - Step 18390: {'lr': 0.00048502362488608933, 'samples': 3530880, 'steps': 18389, 'loss/train': 1.6066454648971558} -11/06/2021 23:50:31 - INFO - __main__ - Step 18391: {'lr': 0.0004850218156898807, 'samples': 3531072, 'steps': 18390, 'loss/train': 1.316588044166565} -11/06/2021 23:50:32 - INFO - __main__ - Step 18392: {'lr': 0.00048502000638777487, 'samples': 3531264, 'steps': 18391, 'loss/train': 1.8195085525512695} -11/06/2021 23:50:33 - INFO - __main__ - Step 18393: {'lr': 0.0004850181969797727, 'samples': 3531456, 'steps': 18392, 'loss/train': 2.008401870727539} -11/06/2021 23:50:33 - INFO - __main__ - Step 18394: {'lr': 0.00048501638746587493, 'samples': 3531648, 'steps': 18393, 'loss/train': 1.5043723583221436} -11/06/2021 23:50:33 - INFO - __main__ - Step 18395: {'lr': 0.0004850145778460824, 'samples': 3531840, 'steps': 18394, 'loss/train': 1.7984856367111206} -11/06/2021 23:50:34 - INFO - __main__ - Step 18396: {'lr': 0.00048501276812039585, 'samples': 3532032, 'steps': 18395, 'loss/train': 1.2785509824752808} -11/06/2021 23:50:34 - INFO - __main__ - Step 18397: {'lr': 0.00048501095828881627, 'samples': 3532224, 'steps': 18396, 'loss/train': 2.095855951309204} -11/06/2021 23:50:35 - INFO - __main__ - Step 18398: {'lr': 0.00048500914835134434, 'samples': 3532416, 'steps': 18397, 'loss/train': 0.8654271364212036} -11/06/2021 23:50:36 - INFO - __main__ - Step 18399: {'lr': 0.00048500733830798094, 'samples': 3532608, 'steps': 18398, 'loss/train': 1.7500832080841064} -11/06/2021 23:50:36 - INFO - __main__ - Step 18400: {'lr': 0.00048500552815872687, 'samples': 3532800, 'steps': 18399, 'loss/train': 1.6068241596221924} -11/06/2021 23:50:36 - INFO - __main__ - Step 18401: {'lr': 0.0004850037179035829, 'samples': 3532992, 'steps': 18400, 'loss/train': 1.3907315731048584} -11/06/2021 23:50:37 - INFO - __main__ - Step 18402: {'lr': 0.00048500190754254994, 'samples': 3533184, 'steps': 18401, 'loss/train': 1.8806012868881226} -11/06/2021 23:50:38 - INFO - __main__ - Step 18403: {'lr': 0.00048500009707562865, 'samples': 3533376, 'steps': 18402, 'loss/train': 1.9587904214859009} -11/06/2021 23:50:38 - INFO - __main__ - Step 18404: {'lr': 0.00048499828650281994, 'samples': 3533568, 'steps': 18403, 'loss/train': 1.476645588874817} -11/06/2021 23:50:38 - INFO - __main__ - Step 18405: {'lr': 0.00048499647582412475, 'samples': 3533760, 'steps': 18404, 'loss/train': 1.2877929210662842} -11/06/2021 23:50:39 - INFO - __main__ - Step 18406: {'lr': 0.0004849946650395437, 'samples': 3533952, 'steps': 18405, 'loss/train': 1.7419734001159668} -11/06/2021 23:50:39 - INFO - __main__ - Step 18407: {'lr': 0.0004849928541490777, 'samples': 3534144, 'steps': 18406, 'loss/train': 1.5446574687957764} -11/06/2021 23:50:40 - INFO - __main__ - Step 18408: {'lr': 0.0004849910431527275, 'samples': 3534336, 'steps': 18407, 'loss/train': 1.6804839372634888} -11/06/2021 23:50:41 - INFO - __main__ - Step 18409: {'lr': 0.000484989232050494, 'samples': 3534528, 'steps': 18408, 'loss/train': 1.753796935081482} -11/06/2021 23:50:41 - INFO - __main__ - Step 18410: {'lr': 0.00048498742084237796, 'samples': 3534720, 'steps': 18409, 'loss/train': 1.7677087783813477} -11/06/2021 23:50:41 - INFO - __main__ - Step 18411: {'lr': 0.00048498560952838025, 'samples': 3534912, 'steps': 18410, 'loss/train': 1.3275538682937622} -11/06/2021 23:50:42 - INFO - __main__ - Step 18412: {'lr': 0.00048498379810850157, 'samples': 3535104, 'steps': 18411, 'loss/train': 1.63711416721344} -11/06/2021 23:50:43 - INFO - __main__ - Step 18413: {'lr': 0.0004849819865827429, 'samples': 3535296, 'steps': 18412, 'loss/train': 1.4949513673782349} -11/06/2021 23:50:43 - INFO - __main__ - Step 18414: {'lr': 0.0004849801749511049, 'samples': 3535488, 'steps': 18413, 'loss/train': 1.6665228605270386} -11/06/2021 23:50:43 - INFO - __main__ - Step 18415: {'lr': 0.00048497836321358855, 'samples': 3535680, 'steps': 18414, 'loss/train': 1.7287325859069824} -11/06/2021 23:50:44 - INFO - __main__ - Step 18416: {'lr': 0.00048497655137019454, 'samples': 3535872, 'steps': 18415, 'loss/train': 1.747482180595398} -11/06/2021 23:50:44 - INFO - __main__ - Step 18417: {'lr': 0.0004849747394209237, 'samples': 3536064, 'steps': 18416, 'loss/train': 1.5815653800964355} -11/06/2021 23:50:45 - INFO - __main__ - Step 18418: {'lr': 0.00048497292736577685, 'samples': 3536256, 'steps': 18417, 'loss/train': 1.05122971534729} -11/06/2021 23:50:45 - INFO - __main__ - Step 18419: {'lr': 0.0004849711152047549, 'samples': 3536448, 'steps': 18418, 'loss/train': 1.965767502784729} -11/06/2021 23:50:46 - INFO - __main__ - Step 18420: {'lr': 0.0004849693029378585, 'samples': 3536640, 'steps': 18419, 'loss/train': 1.3536920547485352} -11/06/2021 23:50:46 - INFO - __main__ - Step 18421: {'lr': 0.0004849674905650886, 'samples': 3536832, 'steps': 18420, 'loss/train': 1.2444932460784912} -11/06/2021 23:50:46 - INFO - __main__ - Step 18422: {'lr': 0.000484965678086446, 'samples': 3537024, 'steps': 18421, 'loss/train': 2.4452176094055176} -11/06/2021 23:50:47 - INFO - __main__ - Step 18423: {'lr': 0.0004849638655019315, 'samples': 3537216, 'steps': 18422, 'loss/train': 1.608303189277649} -11/06/2021 23:50:48 - INFO - __main__ - Step 18424: {'lr': 0.0004849620528115458, 'samples': 3537408, 'steps': 18423, 'loss/train': 1.6960731744766235} -11/06/2021 23:50:48 - INFO - __main__ - Step 18425: {'lr': 0.0004849602400152899, 'samples': 3537600, 'steps': 18424, 'loss/train': 2.0159389972686768} -11/06/2021 23:50:49 - INFO - __main__ - Step 18426: {'lr': 0.0004849584271131646, 'samples': 3537792, 'steps': 18425, 'loss/train': 2.1302671432495117} -11/06/2021 23:50:49 - INFO - __main__ - Step 18427: {'lr': 0.00048495661410517056, 'samples': 3537984, 'steps': 18426, 'loss/train': 1.5923632383346558} -11/06/2021 23:50:49 - INFO - __main__ - Step 18428: {'lr': 0.0004849548009913087, 'samples': 3538176, 'steps': 18427, 'loss/train': 1.6678215265274048} -11/06/2021 23:50:50 - INFO - __main__ - Step 18429: {'lr': 0.00048495298777157994, 'samples': 3538368, 'steps': 18428, 'loss/train': 1.6185996532440186} -11/06/2021 23:50:50 - INFO - __main__ - Step 18430: {'lr': 0.0004849511744459849, 'samples': 3538560, 'steps': 18429, 'loss/train': 1.3633182048797607} -11/06/2021 23:50:51 - INFO - __main__ - Step 18431: {'lr': 0.00048494936101452446, 'samples': 3538752, 'steps': 18430, 'loss/train': 1.138119101524353} -11/06/2021 23:50:51 - INFO - __main__ - Step 18432: {'lr': 0.00048494754747719954, 'samples': 3538944, 'steps': 18431, 'loss/train': 1.6822428703308105} -11/06/2021 23:50:52 - INFO - __main__ - Step 18433: {'lr': 0.00048494573383401084, 'samples': 3539136, 'steps': 18432, 'loss/train': 1.2326446771621704} -11/06/2021 23:50:53 - INFO - __main__ - Step 18434: {'lr': 0.0004849439200849592, 'samples': 3539328, 'steps': 18433, 'loss/train': 1.6924725770950317} -11/06/2021 23:50:53 - INFO - __main__ - Step 18435: {'lr': 0.0004849421062300455, 'samples': 3539520, 'steps': 18434, 'loss/train': 1.6470112800598145} -11/06/2021 23:50:53 - INFO - __main__ - Step 18436: {'lr': 0.0004849402922692705, 'samples': 3539712, 'steps': 18435, 'loss/train': 1.5454944372177124} -11/06/2021 23:50:54 - INFO - __main__ - Step 18437: {'lr': 0.000484938478202635, 'samples': 3539904, 'steps': 18436, 'loss/train': 1.955151915550232} -11/06/2021 23:50:54 - INFO - __main__ - Step 18438: {'lr': 0.0004849366640301399, 'samples': 3540096, 'steps': 18437, 'loss/train': 1.923080563545227} -11/06/2021 23:50:55 - INFO - __main__ - Step 18439: {'lr': 0.00048493484975178593, 'samples': 3540288, 'steps': 18438, 'loss/train': 1.9832425117492676} -11/06/2021 23:50:56 - INFO - __main__ - Step 18440: {'lr': 0.00048493303536757394, 'samples': 3540480, 'steps': 18439, 'loss/train': 1.5207114219665527} -11/06/2021 23:50:56 - INFO - __main__ - Step 18441: {'lr': 0.00048493122087750473, 'samples': 3540672, 'steps': 18440, 'loss/train': 1.084029197692871} -11/06/2021 23:50:56 - INFO - __main__ - Step 18442: {'lr': 0.0004849294062815792, 'samples': 3540864, 'steps': 18441, 'loss/train': 1.1858590841293335} -11/06/2021 23:50:57 - INFO - __main__ - Step 18443: {'lr': 0.000484927591579798, 'samples': 3541056, 'steps': 18442, 'loss/train': 0.3680558204650879} -11/06/2021 23:50:58 - INFO - __main__ - Step 18444: {'lr': 0.0004849257767721622, 'samples': 3541248, 'steps': 18443, 'loss/train': 1.4493937492370605} -11/06/2021 23:50:58 - INFO - __main__ - Step 18445: {'lr': 0.00048492396185867236, 'samples': 3541440, 'steps': 18444, 'loss/train': 1.2673674821853638} -11/06/2021 23:50:59 - INFO - __main__ - Step 18446: {'lr': 0.0004849221468393294, 'samples': 3541632, 'steps': 18445, 'loss/train': 1.6834259033203125} -11/06/2021 23:50:59 - INFO - __main__ - Step 18447: {'lr': 0.00048492033171413425, 'samples': 3541824, 'steps': 18446, 'loss/train': 1.5090739727020264} -11/06/2021 23:50:59 - INFO - __main__ - Step 18448: {'lr': 0.00048491851648308756, 'samples': 3542016, 'steps': 18447, 'loss/train': 1.581689476966858} -11/06/2021 23:51:00 - INFO - __main__ - Step 18449: {'lr': 0.00048491670114619026, 'samples': 3542208, 'steps': 18448, 'loss/train': 1.6174651384353638} -11/06/2021 23:51:01 - INFO - __main__ - Step 18450: {'lr': 0.000484914885703443, 'samples': 3542400, 'steps': 18449, 'loss/train': 0.9411190748214722} -11/06/2021 23:51:01 - INFO - __main__ - Step 18451: {'lr': 0.00048491307015484684, 'samples': 3542592, 'steps': 18450, 'loss/train': 1.7741544246673584} -11/06/2021 23:51:01 - INFO - __main__ - Step 18452: {'lr': 0.0004849112545004024, 'samples': 3542784, 'steps': 18451, 'loss/train': 2.107996940612793} -11/06/2021 23:51:02 - INFO - __main__ - Step 18453: {'lr': 0.00048490943874011054, 'samples': 3542976, 'steps': 18452, 'loss/train': 1.9751431941986084} -11/06/2021 23:51:03 - INFO - __main__ - Step 18454: {'lr': 0.00048490762287397215, 'samples': 3543168, 'steps': 18453, 'loss/train': 1.6343867778778076} -11/06/2021 23:51:03 - INFO - __main__ - Step 18455: {'lr': 0.00048490580690198804, 'samples': 3543360, 'steps': 18454, 'loss/train': 1.3063688278198242} -11/06/2021 23:51:03 - INFO - __main__ - Step 18456: {'lr': 0.000484903990824159, 'samples': 3543552, 'steps': 18455, 'loss/train': 1.9505548477172852} -11/06/2021 23:51:04 - INFO - __main__ - Step 18457: {'lr': 0.0004849021746404859, 'samples': 3543744, 'steps': 18456, 'loss/train': 1.9116475582122803} -11/06/2021 23:51:04 - INFO - __main__ - Step 18458: {'lr': 0.00048490035835096936, 'samples': 3543936, 'steps': 18457, 'loss/train': 1.0650830268859863} -11/06/2021 23:51:05 - INFO - __main__ - Step 18459: {'lr': 0.0004848985419556104, 'samples': 3544128, 'steps': 18458, 'loss/train': 1.4827680587768555} -11/06/2021 23:51:05 - INFO - __main__ - Step 18460: {'lr': 0.0004848967254544099, 'samples': 3544320, 'steps': 18459, 'loss/train': 1.7137441635131836} -11/06/2021 23:51:06 - INFO - __main__ - Step 18461: {'lr': 0.00048489490884736844, 'samples': 3544512, 'steps': 18460, 'loss/train': 1.8879387378692627} -11/06/2021 23:51:06 - INFO - __main__ - Step 18462: {'lr': 0.00048489309213448696, 'samples': 3544704, 'steps': 18461, 'loss/train': 1.5725513696670532} -11/06/2021 23:51:07 - INFO - __main__ - Step 18463: {'lr': 0.00048489127531576627, 'samples': 3544896, 'steps': 18462, 'loss/train': 1.7514148950576782} -11/06/2021 23:51:08 - INFO - __main__ - Step 18464: {'lr': 0.0004848894583912072, 'samples': 3545088, 'steps': 18463, 'loss/train': 1.7304996252059937} -11/06/2021 23:51:08 - INFO - __main__ - Step 18465: {'lr': 0.00048488764136081063, 'samples': 3545280, 'steps': 18464, 'loss/train': 1.7402286529541016} -11/06/2021 23:51:08 - INFO - __main__ - Step 18466: {'lr': 0.00048488582422457726, 'samples': 3545472, 'steps': 18465, 'loss/train': 1.6294695138931274} -11/06/2021 23:51:09 - INFO - __main__ - Step 18467: {'lr': 0.000484884006982508, 'samples': 3545664, 'steps': 18466, 'loss/train': 1.3782211542129517} -11/06/2021 23:51:09 - INFO - __main__ - Step 18468: {'lr': 0.0004848821896346036, 'samples': 3545856, 'steps': 18467, 'loss/train': 1.301269769668579} -11/06/2021 23:51:10 - INFO - __main__ - Step 18469: {'lr': 0.0004848803721808649, 'samples': 3546048, 'steps': 18468, 'loss/train': 1.5572654008865356} -11/06/2021 23:51:10 - INFO - __main__ - Step 18470: {'lr': 0.0004848785546212927, 'samples': 3546240, 'steps': 18469, 'loss/train': 1.7710777521133423} -11/06/2021 23:51:11 - INFO - __main__ - Step 18471: {'lr': 0.00048487673695588794, 'samples': 3546432, 'steps': 18470, 'loss/train': 0.349107563495636} -11/06/2021 23:51:11 - INFO - __main__ - Step 18472: {'lr': 0.00048487491918465135, 'samples': 3546624, 'steps': 18471, 'loss/train': 1.540006399154663} -11/06/2021 23:51:12 - INFO - __main__ - Step 18473: {'lr': 0.00048487310130758366, 'samples': 3546816, 'steps': 18472, 'loss/train': 1.5236613750457764} -11/06/2021 23:51:12 - INFO - __main__ - Step 18474: {'lr': 0.00048487128332468576, 'samples': 3547008, 'steps': 18473, 'loss/train': 2.0391478538513184} -11/06/2021 23:51:13 - INFO - __main__ - Step 18475: {'lr': 0.00048486946523595856, 'samples': 3547200, 'steps': 18474, 'loss/train': 1.7095692157745361} -11/06/2021 23:51:13 - INFO - __main__ - Step 18476: {'lr': 0.00048486764704140276, 'samples': 3547392, 'steps': 18475, 'loss/train': 1.4590822458267212} -11/06/2021 23:51:14 - INFO - __main__ - Step 18477: {'lr': 0.00048486582874101924, 'samples': 3547584, 'steps': 18476, 'loss/train': 1.449753761291504} -11/06/2021 23:51:14 - INFO - __main__ - Step 18478: {'lr': 0.0004848640103348088, 'samples': 3547776, 'steps': 18477, 'loss/train': 1.4348716735839844} -11/06/2021 23:51:14 - INFO - __main__ - Step 18479: {'lr': 0.00048486219182277226, 'samples': 3547968, 'steps': 18478, 'loss/train': 2.534212827682495} -11/06/2021 23:51:15 - INFO - __main__ - Step 18480: {'lr': 0.00048486037320491043, 'samples': 3548160, 'steps': 18479, 'loss/train': 1.7648648023605347} -11/06/2021 23:51:16 - INFO - __main__ - Step 18481: {'lr': 0.0004848585544812242, 'samples': 3548352, 'steps': 18480, 'loss/train': 1.6988426446914673} -11/06/2021 23:51:16 - INFO - __main__ - Step 18482: {'lr': 0.0004848567356517143, 'samples': 3548544, 'steps': 18481, 'loss/train': 1.972807765007019} -11/06/2021 23:51:16 - INFO - __main__ - Step 18483: {'lr': 0.00048485491671638146, 'samples': 3548736, 'steps': 18482, 'loss/train': 2.1826088428497314} -11/06/2021 23:51:17 - INFO - __main__ - Step 18484: {'lr': 0.0004848530976752268, 'samples': 3548928, 'steps': 18483, 'loss/train': 1.9444767236709595} -11/06/2021 23:51:18 - INFO - __main__ - Step 18485: {'lr': 0.0004848512785282508, 'samples': 3549120, 'steps': 18484, 'loss/train': 1.6333898305892944} -11/06/2021 23:51:18 - INFO - __main__ - Step 18486: {'lr': 0.00048484945927545456, 'samples': 3549312, 'steps': 18485, 'loss/train': 0.7610716223716736} -11/06/2021 23:51:18 - INFO - __main__ - Step 18487: {'lr': 0.0004848476399168387, 'samples': 3549504, 'steps': 18486, 'loss/train': 1.0934349298477173} -11/06/2021 23:51:19 - INFO - __main__ - Step 18488: {'lr': 0.0004848458204524042, 'samples': 3549696, 'steps': 18487, 'loss/train': 1.1723536252975464} -11/06/2021 23:51:19 - INFO - __main__ - Step 18489: {'lr': 0.00048484400088215173, 'samples': 3549888, 'steps': 18488, 'loss/train': 1.8059593439102173} -11/06/2021 23:51:20 - INFO - __main__ - Step 18490: {'lr': 0.0004848421812060821, 'samples': 3550080, 'steps': 18489, 'loss/train': 1.5580663681030273} -11/06/2021 23:51:21 - INFO - __main__ - Step 18491: {'lr': 0.0004848403614241964, 'samples': 3550272, 'steps': 18490, 'loss/train': 1.4911553859710693} -11/06/2021 23:51:21 - INFO - __main__ - Step 18492: {'lr': 0.00048483854153649514, 'samples': 3550464, 'steps': 18491, 'loss/train': 1.4916285276412964} -11/06/2021 23:51:21 - INFO - __main__ - Step 18493: {'lr': 0.0004848367215429793, 'samples': 3550656, 'steps': 18492, 'loss/train': 0.5384908318519592} -11/06/2021 23:51:22 - INFO - __main__ - Step 18494: {'lr': 0.0004848349014436496, 'samples': 3550848, 'steps': 18493, 'loss/train': 1.4912225008010864} -11/06/2021 23:51:23 - INFO - __main__ - Step 18495: {'lr': 0.00048483308123850697, 'samples': 3551040, 'steps': 18494, 'loss/train': 1.5729341506958008} -11/06/2021 23:51:23 - INFO - __main__ - Step 18496: {'lr': 0.00048483126092755215, 'samples': 3551232, 'steps': 18495, 'loss/train': 1.8693089485168457} -11/06/2021 23:51:24 - INFO - __main__ - Step 18497: {'lr': 0.000484829440510786, 'samples': 3551424, 'steps': 18496, 'loss/train': 1.8200191259384155} -11/06/2021 23:51:24 - INFO - __main__ - Step 18498: {'lr': 0.0004848276199882093, 'samples': 3551616, 'steps': 18497, 'loss/train': 1.7423537969589233} -11/06/2021 23:51:24 - INFO - __main__ - Step 18499: {'lr': 0.0004848257993598229, 'samples': 3551808, 'steps': 18498, 'loss/train': 0.9620110392570496} -11/06/2021 23:51:25 - INFO - __main__ - Step 18500: {'lr': 0.00048482397862562764, 'samples': 3552000, 'steps': 18499, 'loss/train': 1.7833219766616821} -11/06/2021 23:51:25 - INFO - __main__ - Step 18501: {'lr': 0.00048482215778562434, 'samples': 3552192, 'steps': 18500, 'loss/train': 1.6852136850357056} -11/06/2021 23:51:27 - INFO - __main__ - Step 18502: {'lr': 0.00048482033683981376, 'samples': 3552384, 'steps': 18501, 'loss/train': 1.7665677070617676} -11/06/2021 23:51:27 - INFO - __main__ - Step 18503: {'lr': 0.0004848185157881968, 'samples': 3552576, 'steps': 18502, 'loss/train': 1.2151190042495728} -11/06/2021 23:51:28 - INFO - __main__ - Step 18504: {'lr': 0.0004848166946307742, 'samples': 3552768, 'steps': 18503, 'loss/train': 0.9729933142662048} -11/06/2021 23:51:28 - INFO - __main__ - Step 18505: {'lr': 0.0004848148733675468, 'samples': 3552960, 'steps': 18504, 'loss/train': 0.7332248687744141} -11/06/2021 23:51:28 - INFO - __main__ - Step 18506: {'lr': 0.0004848130519985155, 'samples': 3553152, 'steps': 18505, 'loss/train': 1.4994479417800903} -11/06/2021 23:51:29 - INFO - __main__ - Step 18507: {'lr': 0.000484811230523681, 'samples': 3553344, 'steps': 18506, 'loss/train': 0.5550244450569153} -11/06/2021 23:51:29 - INFO - __main__ - Step 18508: {'lr': 0.00048480940894304425, 'samples': 3553536, 'steps': 18507, 'loss/train': 2.118533134460449} -11/06/2021 23:51:30 - INFO - __main__ - Step 18509: {'lr': 0.000484807587256606, 'samples': 3553728, 'steps': 18508, 'loss/train': 1.753688097000122} -11/06/2021 23:51:30 - INFO - __main__ - Step 18510: {'lr': 0.00048480576546436707, 'samples': 3553920, 'steps': 18509, 'loss/train': 1.6554456949234009} -11/06/2021 23:51:31 - INFO - __main__ - Step 18511: {'lr': 0.0004848039435663282, 'samples': 3554112, 'steps': 18510, 'loss/train': 1.341917634010315} -11/06/2021 23:51:31 - INFO - __main__ - Step 18512: {'lr': 0.0004848021215624904, 'samples': 3554304, 'steps': 18511, 'loss/train': 2.3233754634857178} -11/06/2021 23:51:31 - INFO - __main__ - Step 18513: {'lr': 0.0004848002994528543, 'samples': 3554496, 'steps': 18512, 'loss/train': 1.3712459802627563} -11/06/2021 23:51:32 - INFO - __main__ - Step 18514: {'lr': 0.0004847984772374209, 'samples': 3554688, 'steps': 18513, 'loss/train': 1.0572799444198608} -11/06/2021 23:51:33 - INFO - __main__ - Step 18515: {'lr': 0.0004847966549161909, 'samples': 3554880, 'steps': 18514, 'loss/train': 1.137990117073059} -11/06/2021 23:51:33 - INFO - __main__ - Step 18516: {'lr': 0.0004847948324891651, 'samples': 3555072, 'steps': 18515, 'loss/train': 1.7233134508132935} -11/06/2021 23:51:34 - INFO - __main__ - Step 18517: {'lr': 0.00048479300995634447, 'samples': 3555264, 'steps': 18516, 'loss/train': 1.5515546798706055} -11/06/2021 23:51:34 - INFO - __main__ - Step 18518: {'lr': 0.0004847911873177296, 'samples': 3555456, 'steps': 18517, 'loss/train': 0.4498330056667328} -11/06/2021 23:51:35 - INFO - __main__ - Step 18519: {'lr': 0.0004847893645733216, 'samples': 3555648, 'steps': 18518, 'loss/train': 1.9441230297088623} -11/06/2021 23:51:35 - INFO - __main__ - Step 18520: {'lr': 0.000484787541723121, 'samples': 3555840, 'steps': 18519, 'loss/train': 1.6475194692611694} -11/06/2021 23:51:36 - INFO - __main__ - Step 18521: {'lr': 0.0004847857187671288, 'samples': 3556032, 'steps': 18520, 'loss/train': 1.5261662006378174} -11/06/2021 23:51:36 - INFO - __main__ - Step 18522: {'lr': 0.00048478389570534575, 'samples': 3556224, 'steps': 18521, 'loss/train': 2.240158796310425} -11/06/2021 23:51:36 - INFO - __main__ - Step 18523: {'lr': 0.0004847820725377728, 'samples': 3556416, 'steps': 18522, 'loss/train': 1.3520618677139282} -11/06/2021 23:51:37 - INFO - __main__ - Step 18524: {'lr': 0.0004847802492644106, 'samples': 3556608, 'steps': 18523, 'loss/train': 1.5715515613555908} -11/06/2021 23:51:38 - INFO - __main__ - Step 18525: {'lr': 0.00048477842588526, 'samples': 3556800, 'steps': 18524, 'loss/train': 2.274082899093628} -11/06/2021 23:51:38 - INFO - __main__ - Step 18526: {'lr': 0.000484776602400322, 'samples': 3556992, 'steps': 18525, 'loss/train': 1.5804866552352905} -11/06/2021 23:51:38 - INFO - __main__ - Step 18527: {'lr': 0.00048477477880959715, 'samples': 3557184, 'steps': 18526, 'loss/train': 1.8836625814437866} -11/06/2021 23:51:39 - INFO - __main__ - Step 18528: {'lr': 0.00048477295511308645, 'samples': 3557376, 'steps': 18527, 'loss/train': 2.796858072280884} -11/06/2021 23:51:40 - INFO - __main__ - Step 18529: {'lr': 0.0004847711313107907, 'samples': 3557568, 'steps': 18528, 'loss/train': 1.5906380414962769} -11/06/2021 23:51:40 - INFO - __main__ - Step 18530: {'lr': 0.0004847693074027106, 'samples': 3557760, 'steps': 18529, 'loss/train': 1.6240956783294678} -11/06/2021 23:51:40 - INFO - __main__ - Step 18531: {'lr': 0.0004847674833888472, 'samples': 3557952, 'steps': 18530, 'loss/train': 1.0976725816726685} -11/06/2021 23:51:41 - INFO - __main__ - Step 18532: {'lr': 0.0004847656592692012, 'samples': 3558144, 'steps': 18531, 'loss/train': 1.590442419052124} -11/06/2021 23:51:41 - INFO - __main__ - Step 18533: {'lr': 0.00048476383504377337, 'samples': 3558336, 'steps': 18532, 'loss/train': 2.1366772651672363} -11/06/2021 23:51:41 - INFO - __main__ - Step 18534: {'lr': 0.00048476201071256453, 'samples': 3558528, 'steps': 18533, 'loss/train': 1.71946120262146} -11/06/2021 23:51:43 - INFO - __main__ - Step 18535: {'lr': 0.0004847601862755756, 'samples': 3558720, 'steps': 18534, 'loss/train': 1.520142674446106} -11/06/2021 23:51:43 - INFO - __main__ - Step 18536: {'lr': 0.0004847583617328074, 'samples': 3558912, 'steps': 18535, 'loss/train': 1.7262592315673828} -11/06/2021 23:51:43 - INFO - __main__ - Step 18537: {'lr': 0.00048475653708426067, 'samples': 3559104, 'steps': 18536, 'loss/train': 1.5982173681259155} -11/06/2021 23:51:44 - INFO - __main__ - Step 18538: {'lr': 0.00048475471232993625, 'samples': 3559296, 'steps': 18537, 'loss/train': 1.012058138847351} -11/06/2021 23:51:44 - INFO - __main__ - Step 18539: {'lr': 0.000484752887469835, 'samples': 3559488, 'steps': 18538, 'loss/train': 1.8425029516220093} -11/06/2021 23:51:45 - INFO - __main__ - Step 18540: {'lr': 0.0004847510625039577, 'samples': 3559680, 'steps': 18539, 'loss/train': 1.090240716934204} -11/06/2021 23:51:45 - INFO - __main__ - Step 18541: {'lr': 0.00048474923743230513, 'samples': 3559872, 'steps': 18540, 'loss/train': 1.447522759437561} -11/06/2021 23:51:46 - INFO - __main__ - Step 18542: {'lr': 0.0004847474122548783, 'samples': 3560064, 'steps': 18541, 'loss/train': 1.5654059648513794} -11/06/2021 23:51:46 - INFO - __main__ - Step 18543: {'lr': 0.00048474558697167783, 'samples': 3560256, 'steps': 18542, 'loss/train': 0.9320666790008545} -11/06/2021 23:51:46 - INFO - __main__ - Step 18544: {'lr': 0.0004847437615827046, 'samples': 3560448, 'steps': 18543, 'loss/train': 1.538326621055603} -11/06/2021 23:51:47 - INFO - __main__ - Step 18545: {'lr': 0.0004847419360879596, 'samples': 3560640, 'steps': 18544, 'loss/train': 1.6450234651565552} -11/06/2021 23:51:48 - INFO - __main__ - Step 18546: {'lr': 0.00048474011048744336, 'samples': 3560832, 'steps': 18545, 'loss/train': 0.8614462614059448} -11/06/2021 23:51:48 - INFO - __main__ - Step 18547: {'lr': 0.0004847382847811569, 'samples': 3561024, 'steps': 18546, 'loss/train': 1.2386878728866577} -11/06/2021 23:51:49 - INFO - __main__ - Step 18548: {'lr': 0.00048473645896910094, 'samples': 3561216, 'steps': 18547, 'loss/train': 1.8863868713378906} -11/06/2021 23:51:49 - INFO - __main__ - Step 18549: {'lr': 0.0004847346330512764, 'samples': 3561408, 'steps': 18548, 'loss/train': 1.5607517957687378} -11/06/2021 23:51:50 - INFO - __main__ - Step 18550: {'lr': 0.0004847328070276841, 'samples': 3561600, 'steps': 18549, 'loss/train': 1.6773111820220947} -11/06/2021 23:51:50 - INFO - __main__ - Step 18551: {'lr': 0.00048473098089832475, 'samples': 3561792, 'steps': 18550, 'loss/train': 1.3553521633148193} -11/06/2021 23:51:51 - INFO - __main__ - Step 18552: {'lr': 0.0004847291546631992, 'samples': 3561984, 'steps': 18551, 'loss/train': 1.1575710773468018} -11/06/2021 23:51:51 - INFO - __main__ - Step 18553: {'lr': 0.0004847273283223084, 'samples': 3562176, 'steps': 18552, 'loss/train': 1.689874291419983} -11/06/2021 23:51:51 - INFO - __main__ - Step 18554: {'lr': 0.0004847255018756531, 'samples': 3562368, 'steps': 18553, 'loss/train': 1.8873575925827026} -11/06/2021 23:51:52 - INFO - __main__ - Step 18555: {'lr': 0.0004847236753232341, 'samples': 3562560, 'steps': 18554, 'loss/train': 1.9002426862716675} -11/06/2021 23:51:53 - INFO - __main__ - Step 18556: {'lr': 0.0004847218486650522, 'samples': 3562752, 'steps': 18555, 'loss/train': 1.6513395309448242} -11/06/2021 23:51:53 - INFO - __main__ - Step 18557: {'lr': 0.00048472002190110827, 'samples': 3562944, 'steps': 18556, 'loss/train': 1.091086506843567} -11/06/2021 23:51:53 - INFO - __main__ - Step 18558: {'lr': 0.0004847181950314031, 'samples': 3563136, 'steps': 18557, 'loss/train': 1.3922399282455444} -11/06/2021 23:51:54 - INFO - __main__ - Step 18559: {'lr': 0.00048471636805593756, 'samples': 3563328, 'steps': 18558, 'loss/train': 1.6785709857940674} -11/06/2021 23:51:55 - INFO - __main__ - Step 18560: {'lr': 0.0004847145409747125, 'samples': 3563520, 'steps': 18559, 'loss/train': 1.2590919733047485} -11/06/2021 23:51:55 - INFO - __main__ - Step 18561: {'lr': 0.00048471271378772857, 'samples': 3563712, 'steps': 18560, 'loss/train': 0.998810887336731} -11/06/2021 23:51:56 - INFO - __main__ - Step 18562: {'lr': 0.00048471088649498675, 'samples': 3563904, 'steps': 18561, 'loss/train': 1.4806946516036987} -11/06/2021 23:51:56 - INFO - __main__ - Step 18563: {'lr': 0.0004847090590964879, 'samples': 3564096, 'steps': 18562, 'loss/train': 1.5437051057815552} -11/06/2021 23:51:56 - INFO - __main__ - Step 18564: {'lr': 0.00048470723159223266, 'samples': 3564288, 'steps': 18563, 'loss/train': 1.4612468481063843} -11/06/2021 23:51:57 - INFO - __main__ - Step 18565: {'lr': 0.00048470540398222207, 'samples': 3564480, 'steps': 18564, 'loss/train': 2.0015370845794678} -11/06/2021 23:51:58 - INFO - __main__ - Step 18566: {'lr': 0.00048470357626645676, 'samples': 3564672, 'steps': 18565, 'loss/train': 1.15360689163208} -11/06/2021 23:51:58 - INFO - __main__ - Step 18567: {'lr': 0.0004847017484449377, 'samples': 3564864, 'steps': 18566, 'loss/train': 1.3309861421585083} -11/06/2021 23:51:58 - INFO - __main__ - Step 18568: {'lr': 0.0004846999205176657, 'samples': 3565056, 'steps': 18567, 'loss/train': 1.6591993570327759} -11/06/2021 23:51:59 - INFO - __main__ - Step 18569: {'lr': 0.00048469809248464135, 'samples': 3565248, 'steps': 18568, 'loss/train': 1.9893124103546143} -11/06/2021 23:51:59 - INFO - __main__ - Step 18570: {'lr': 0.0004846962643458658, 'samples': 3565440, 'steps': 18569, 'loss/train': 1.7136503458023071} -11/06/2021 23:52:00 - INFO - __main__ - Step 18571: {'lr': 0.00048469443610133975, 'samples': 3565632, 'steps': 18570, 'loss/train': 1.7042827606201172} -11/06/2021 23:52:00 - INFO - __main__ - Step 18572: {'lr': 0.00048469260775106394, 'samples': 3565824, 'steps': 18571, 'loss/train': 1.9384015798568726} -11/06/2021 23:52:01 - INFO - __main__ - Step 18573: {'lr': 0.0004846907792950393, 'samples': 3566016, 'steps': 18572, 'loss/train': 1.6838961839675903} -11/06/2021 23:52:01 - INFO - __main__ - Step 18574: {'lr': 0.00048468895073326663, 'samples': 3566208, 'steps': 18573, 'loss/train': 1.2497248649597168} -11/06/2021 23:52:01 - INFO - __main__ - Step 18575: {'lr': 0.0004846871220657467, 'samples': 3566400, 'steps': 18574, 'loss/train': 1.6817874908447266} -11/06/2021 23:52:02 - INFO - __main__ - Step 18576: {'lr': 0.0004846852932924804, 'samples': 3566592, 'steps': 18575, 'loss/train': 1.5133883953094482} -11/06/2021 23:52:03 - INFO - __main__ - Step 18577: {'lr': 0.00048468346441346853, 'samples': 3566784, 'steps': 18576, 'loss/train': 2.222951650619507} -11/06/2021 23:52:03 - INFO - __main__ - Step 18578: {'lr': 0.0004846816354287119, 'samples': 3566976, 'steps': 18577, 'loss/train': 1.6888341903686523} -11/06/2021 23:52:03 - INFO - __main__ - Step 18579: {'lr': 0.0004846798063382114, 'samples': 3567168, 'steps': 18578, 'loss/train': 1.3981465101242065} -11/06/2021 23:52:04 - INFO - __main__ - Step 18580: {'lr': 0.0004846779771419677, 'samples': 3567360, 'steps': 18579, 'loss/train': 1.2701265811920166} -11/06/2021 23:52:05 - INFO - __main__ - Step 18581: {'lr': 0.0004846761478399818, 'samples': 3567552, 'steps': 18580, 'loss/train': 2.1845619678497314} -11/06/2021 23:52:06 - INFO - __main__ - Step 18582: {'lr': 0.0004846743184322544, 'samples': 3567744, 'steps': 18581, 'loss/train': 1.6259300708770752} -11/06/2021 23:52:06 - INFO - __main__ - Step 18583: {'lr': 0.00048467248891878644, 'samples': 3567936, 'steps': 18582, 'loss/train': 4.3415937423706055} -11/06/2021 23:52:06 - INFO - __main__ - Step 18584: {'lr': 0.00048467065929957867, 'samples': 3568128, 'steps': 18583, 'loss/train': 4.058262348175049} -11/06/2021 23:52:07 - INFO - __main__ - Step 18585: {'lr': 0.00048466882957463186, 'samples': 3568320, 'steps': 18584, 'loss/train': 1.3394839763641357} -11/06/2021 23:52:07 - INFO - __main__ - Step 18586: {'lr': 0.0004846669997439469, 'samples': 3568512, 'steps': 18585, 'loss/train': 1.6075658798217773} -11/06/2021 23:52:08 - INFO - __main__ - Step 18587: {'lr': 0.0004846651698075246, 'samples': 3568704, 'steps': 18586, 'loss/train': 1.5133603811264038} -11/06/2021 23:52:08 - INFO - __main__ - Step 18588: {'lr': 0.00048466333976536594, 'samples': 3568896, 'steps': 18587, 'loss/train': 1.4529722929000854} -11/06/2021 23:52:09 - INFO - __main__ - Step 18589: {'lr': 0.0004846615096174715, 'samples': 3569088, 'steps': 18588, 'loss/train': 1.5087271928787231} -11/06/2021 23:52:09 - INFO - __main__ - Step 18590: {'lr': 0.00048465967936384217, 'samples': 3569280, 'steps': 18589, 'loss/train': 1.7790948152542114} -11/06/2021 23:52:09 - INFO - __main__ - Step 18591: {'lr': 0.00048465784900447885, 'samples': 3569472, 'steps': 18590, 'loss/train': 1.938625693321228} -11/06/2021 23:52:11 - INFO - __main__ - Step 18592: {'lr': 0.00048465601853938224, 'samples': 3569664, 'steps': 18591, 'loss/train': 1.7642910480499268} -11/06/2021 23:52:11 - INFO - __main__ - Step 18593: {'lr': 0.0004846541879685533, 'samples': 3569856, 'steps': 18592, 'loss/train': 1.766231656074524} -11/06/2021 23:52:11 - INFO - __main__ - Step 18594: {'lr': 0.0004846523572919929, 'samples': 3570048, 'steps': 18593, 'loss/train': 0.5659541487693787} -11/06/2021 23:52:12 - INFO - __main__ - Step 18595: {'lr': 0.00048465052650970166, 'samples': 3570240, 'steps': 18594, 'loss/train': 1.2477904558181763} -11/06/2021 23:52:12 - INFO - __main__ - Step 18596: {'lr': 0.00048464869562168055, 'samples': 3570432, 'steps': 18595, 'loss/train': 2.0898544788360596} -11/06/2021 23:52:12 - INFO - __main__ - Step 18597: {'lr': 0.0004846468646279304, 'samples': 3570624, 'steps': 18596, 'loss/train': 1.4772709608078003} -11/06/2021 23:52:14 - INFO - __main__ - Step 18598: {'lr': 0.0004846450335284519, 'samples': 3570816, 'steps': 18597, 'loss/train': 1.557440161705017} -11/06/2021 23:52:14 - INFO - __main__ - Step 18599: {'lr': 0.00048464320232324604, 'samples': 3571008, 'steps': 18598, 'loss/train': 0.901743471622467} -11/06/2021 23:52:14 - INFO - __main__ - Step 18600: {'lr': 0.00048464137101231355, 'samples': 3571200, 'steps': 18599, 'loss/train': 1.3562065362930298} -11/06/2021 23:52:15 - INFO - __main__ - Step 18601: {'lr': 0.0004846395395956553, 'samples': 3571392, 'steps': 18600, 'loss/train': 1.8090925216674805} -11/06/2021 23:52:15 - INFO - __main__ - Step 18602: {'lr': 0.00048463770807327206, 'samples': 3571584, 'steps': 18601, 'loss/train': 1.758899211883545} -11/06/2021 23:52:16 - INFO - __main__ - Step 18603: {'lr': 0.00048463587644516473, 'samples': 3571776, 'steps': 18602, 'loss/train': 1.4766874313354492} -11/06/2021 23:52:16 - INFO - __main__ - Step 18604: {'lr': 0.00048463404471133404, 'samples': 3571968, 'steps': 18603, 'loss/train': 1.383787989616394} -11/06/2021 23:52:17 - INFO - __main__ - Step 18605: {'lr': 0.00048463221287178094, 'samples': 3572160, 'steps': 18604, 'loss/train': 1.5332286357879639} -11/06/2021 23:52:17 - INFO - __main__ - Step 18606: {'lr': 0.0004846303809265061, 'samples': 3572352, 'steps': 18605, 'loss/train': 3.0497324466705322} -11/06/2021 23:52:18 - INFO - __main__ - Step 18607: {'lr': 0.00048462854887551044, 'samples': 3572544, 'steps': 18606, 'loss/train': 1.8126506805419922} -11/06/2021 23:52:18 - INFO - __main__ - Step 18608: {'lr': 0.0004846267167187949, 'samples': 3572736, 'steps': 18607, 'loss/train': 1.7569042444229126} -11/06/2021 23:52:19 - INFO - __main__ - Step 18609: {'lr': 0.00048462488445636005, 'samples': 3572928, 'steps': 18608, 'loss/train': 1.6716196537017822} -11/06/2021 23:52:19 - INFO - __main__ - Step 18610: {'lr': 0.0004846230520882069, 'samples': 3573120, 'steps': 18609, 'loss/train': 1.321014642715454} -11/06/2021 23:52:20 - INFO - __main__ - Step 18611: {'lr': 0.00048462121961433623, 'samples': 3573312, 'steps': 18610, 'loss/train': 1.7713549137115479} -11/06/2021 23:52:20 - INFO - __main__ - Step 18612: {'lr': 0.00048461938703474886, 'samples': 3573504, 'steps': 18611, 'loss/train': 1.7149677276611328} -11/06/2021 23:52:21 - INFO - __main__ - Step 18613: {'lr': 0.00048461755434944554, 'samples': 3573696, 'steps': 18612, 'loss/train': 2.0057523250579834} -11/06/2021 23:52:21 - INFO - __main__ - Step 18614: {'lr': 0.00048461572155842725, 'samples': 3573888, 'steps': 18613, 'loss/train': 1.244421362876892} -11/06/2021 23:52:22 - INFO - __main__ - Step 18615: {'lr': 0.00048461388866169474, 'samples': 3574080, 'steps': 18614, 'loss/train': 1.7953641414642334} -11/06/2021 23:52:22 - INFO - __main__ - Step 18616: {'lr': 0.00048461205565924884, 'samples': 3574272, 'steps': 18615, 'loss/train': 1.3679205179214478} -11/06/2021 23:52:22 - INFO - __main__ - Step 18617: {'lr': 0.0004846102225510903, 'samples': 3574464, 'steps': 18616, 'loss/train': 1.6835120916366577} -11/06/2021 23:52:23 - INFO - __main__ - Step 18618: {'lr': 0.00048460838933722005, 'samples': 3574656, 'steps': 18617, 'loss/train': 1.978041172027588} -11/06/2021 23:52:24 - INFO - __main__ - Step 18619: {'lr': 0.0004846065560176389, 'samples': 3574848, 'steps': 18618, 'loss/train': 1.8935999870300293} -11/06/2021 23:52:24 - INFO - __main__ - Step 18620: {'lr': 0.00048460472259234764, 'samples': 3575040, 'steps': 18619, 'loss/train': 1.8517574071884155} -11/06/2021 23:52:24 - INFO - __main__ - Step 18621: {'lr': 0.0004846028890613471, 'samples': 3575232, 'steps': 18620, 'loss/train': 1.4925874471664429} -11/06/2021 23:52:25 - INFO - __main__ - Step 18622: {'lr': 0.00048460105542463805, 'samples': 3575424, 'steps': 18621, 'loss/train': 1.666589617729187} -11/06/2021 23:52:26 - INFO - __main__ - Step 18623: {'lr': 0.00048459922168222146, 'samples': 3575616, 'steps': 18622, 'loss/train': 1.772215723991394} -11/06/2021 23:52:26 - INFO - __main__ - Step 18624: {'lr': 0.00048459738783409814, 'samples': 3575808, 'steps': 18623, 'loss/train': 1.7241744995117188} -11/06/2021 23:52:27 - INFO - __main__ - Step 18625: {'lr': 0.0004845955538802688, 'samples': 3576000, 'steps': 18624, 'loss/train': 1.6278271675109863} -11/06/2021 23:52:27 - INFO - __main__ - Step 18626: {'lr': 0.0004845937198207343, 'samples': 3576192, 'steps': 18625, 'loss/train': 1.2264925241470337} -11/06/2021 23:52:27 - INFO - __main__ - Step 18627: {'lr': 0.0004845918856554955, 'samples': 3576384, 'steps': 18626, 'loss/train': 1.4115939140319824} -11/06/2021 23:52:28 - INFO - __main__ - Step 18628: {'lr': 0.00048459005138455326, 'samples': 3576576, 'steps': 18627, 'loss/train': 1.6529324054718018} -11/06/2021 23:52:29 - INFO - __main__ - Step 18629: {'lr': 0.0004845882170079083, 'samples': 3576768, 'steps': 18628, 'loss/train': 1.8150955438613892} -11/06/2021 23:52:29 - INFO - __main__ - Step 18630: {'lr': 0.00048458638252556153, 'samples': 3576960, 'steps': 18629, 'loss/train': 1.786418080329895} -11/06/2021 23:52:29 - INFO - __main__ - Step 18631: {'lr': 0.0004845845479375138, 'samples': 3577152, 'steps': 18630, 'loss/train': 1.7051968574523926} -11/06/2021 23:52:30 - INFO - __main__ - Step 18632: {'lr': 0.00048458271324376586, 'samples': 3577344, 'steps': 18631, 'loss/train': 1.5298038721084595} -11/06/2021 23:52:30 - INFO - __main__ - Step 18633: {'lr': 0.0004845808784443185, 'samples': 3577536, 'steps': 18632, 'loss/train': 1.4666179418563843} -11/06/2021 23:52:31 - INFO - __main__ - Step 18634: {'lr': 0.00048457904353917277, 'samples': 3577728, 'steps': 18633, 'loss/train': 1.4519388675689697} -11/06/2021 23:52:31 - INFO - __main__ - Step 18635: {'lr': 0.0004845772085283292, 'samples': 3577920, 'steps': 18634, 'loss/train': 1.0929064750671387} -11/06/2021 23:52:32 - INFO - __main__ - Step 18636: {'lr': 0.00048457537341178885, 'samples': 3578112, 'steps': 18635, 'loss/train': 1.5843586921691895} -11/06/2021 23:52:32 - INFO - __main__ - Step 18637: {'lr': 0.0004845735381895524, 'samples': 3578304, 'steps': 18636, 'loss/train': 0.8894321322441101} -11/06/2021 23:52:33 - INFO - __main__ - Step 18638: {'lr': 0.0004845717028616208, 'samples': 3578496, 'steps': 18637, 'loss/train': 1.1412678956985474} -11/06/2021 23:52:34 - INFO - __main__ - Step 18639: {'lr': 0.00048456986742799474, 'samples': 3578688, 'steps': 18638, 'loss/train': 1.6525942087173462} -11/06/2021 23:52:34 - INFO - __main__ - Step 18640: {'lr': 0.00048456803188867513, 'samples': 3578880, 'steps': 18639, 'loss/train': 1.3935282230377197} -11/06/2021 23:52:34 - INFO - __main__ - Step 18641: {'lr': 0.00048456619624366284, 'samples': 3579072, 'steps': 18640, 'loss/train': 1.646254301071167} -11/06/2021 23:52:35 - INFO - __main__ - Step 18642: {'lr': 0.0004845643604929586, 'samples': 3579264, 'steps': 18641, 'loss/train': 1.6623493432998657} -11/06/2021 23:52:35 - INFO - __main__ - Step 18643: {'lr': 0.00048456252463656326, 'samples': 3579456, 'steps': 18642, 'loss/train': 2.4156510829925537} -11/06/2021 23:52:36 - INFO - __main__ - Step 18644: {'lr': 0.00048456068867447767, 'samples': 3579648, 'steps': 18643, 'loss/train': 1.8837863206863403} -11/06/2021 23:52:36 - INFO - __main__ - Step 18645: {'lr': 0.0004845588526067027, 'samples': 3579840, 'steps': 18644, 'loss/train': 2.037102460861206} -11/06/2021 23:52:37 - INFO - __main__ - Step 18646: {'lr': 0.00048455701643323914, 'samples': 3580032, 'steps': 18645, 'loss/train': 1.6288491487503052} -11/06/2021 23:52:37 - INFO - __main__ - Step 18647: {'lr': 0.00048455518015408773, 'samples': 3580224, 'steps': 18646, 'loss/train': 1.586424708366394} -11/06/2021 23:52:37 - INFO - __main__ - Step 18648: {'lr': 0.00048455334376924943, 'samples': 3580416, 'steps': 18647, 'loss/train': 1.1939408779144287} -11/06/2021 23:52:39 - INFO - __main__ - Step 18649: {'lr': 0.000484551507278725, 'samples': 3580608, 'steps': 18648, 'loss/train': 1.620247483253479} -11/06/2021 23:52:39 - INFO - __main__ - Step 18650: {'lr': 0.0004845496706825152, 'samples': 3580800, 'steps': 18649, 'loss/train': 0.9347361922264099} -11/06/2021 23:52:40 - INFO - __main__ - Step 18651: {'lr': 0.0004845478339806211, 'samples': 3580992, 'steps': 18650, 'loss/train': 1.3260414600372314} -11/06/2021 23:52:40 - INFO - __main__ - Step 18652: {'lr': 0.00048454599717304327, 'samples': 3581184, 'steps': 18651, 'loss/train': 1.604457139968872} -11/06/2021 23:52:40 - INFO - __main__ - Step 18653: {'lr': 0.0004845441602597826, 'samples': 3581376, 'steps': 18652, 'loss/train': 1.8285481929779053} -11/06/2021 23:52:41 - INFO - __main__ - Step 18654: {'lr': 0.00048454232324084004, 'samples': 3581568, 'steps': 18653, 'loss/train': 1.283732295036316} -11/06/2021 23:52:42 - INFO - __main__ - Step 18655: {'lr': 0.0004845404861162163, 'samples': 3581760, 'steps': 18654, 'loss/train': 0.30630865693092346} -11/06/2021 23:52:42 - INFO - __main__ - Step 18656: {'lr': 0.00048453864888591214, 'samples': 3581952, 'steps': 18655, 'loss/train': 0.8285514712333679} -11/06/2021 23:52:42 - INFO - __main__ - Step 18657: {'lr': 0.0004845368115499286, 'samples': 3582144, 'steps': 18656, 'loss/train': 1.719491720199585} -11/06/2021 23:52:43 - INFO - __main__ - Step 18658: {'lr': 0.0004845349741082663, 'samples': 3582336, 'steps': 18657, 'loss/train': 1.749588131904602} -11/06/2021 23:52:43 - INFO - __main__ - Step 18659: {'lr': 0.00048453313656092624, 'samples': 3582528, 'steps': 18658, 'loss/train': 1.7905672788619995} -11/06/2021 23:52:43 - INFO - __main__ - Step 18660: {'lr': 0.0004845312989079091, 'samples': 3582720, 'steps': 18659, 'loss/train': 1.651228666305542} -11/06/2021 23:52:45 - INFO - __main__ - Step 18661: {'lr': 0.0004845294611492158, 'samples': 3582912, 'steps': 18660, 'loss/train': 1.5173380374908447} -11/06/2021 23:52:45 - INFO - __main__ - Step 18662: {'lr': 0.00048452762328484724, 'samples': 3583104, 'steps': 18661, 'loss/train': 1.6837129592895508} -11/06/2021 23:52:45 - INFO - __main__ - Step 18663: {'lr': 0.000484525785314804, 'samples': 3583296, 'steps': 18662, 'loss/train': 1.4421535730361938} -11/06/2021 23:52:46 - INFO - __main__ - Step 18664: {'lr': 0.0004845239472390872, 'samples': 3583488, 'steps': 18663, 'loss/train': 1.7902997732162476} -11/06/2021 23:52:46 - INFO - __main__ - Step 18665: {'lr': 0.0004845221090576974, 'samples': 3583680, 'steps': 18664, 'loss/train': 2.102501153945923} -11/06/2021 23:52:47 - INFO - __main__ - Step 18666: {'lr': 0.0004845202707706356, 'samples': 3583872, 'steps': 18665, 'loss/train': 2.0066657066345215} -11/06/2021 23:52:47 - INFO - __main__ - Step 18667: {'lr': 0.0004845184323779026, 'samples': 3584064, 'steps': 18666, 'loss/train': 1.397498369216919} -11/06/2021 23:52:48 - INFO - __main__ - Step 18668: {'lr': 0.0004845165938794992, 'samples': 3584256, 'steps': 18667, 'loss/train': 1.3317439556121826} -11/06/2021 23:52:48 - INFO - __main__ - Step 18669: {'lr': 0.0004845147552754263, 'samples': 3584448, 'steps': 18668, 'loss/train': 1.9309141635894775} -11/06/2021 23:52:48 - INFO - __main__ - Step 18670: {'lr': 0.0004845129165656846, 'samples': 3584640, 'steps': 18669, 'loss/train': 1.3592866659164429} -11/06/2021 23:52:49 - INFO - __main__ - Step 18671: {'lr': 0.00048451107775027505, 'samples': 3584832, 'steps': 18670, 'loss/train': 1.5930179357528687} -11/06/2021 23:52:50 - INFO - __main__ - Step 18672: {'lr': 0.0004845092388291984, 'samples': 3585024, 'steps': 18671, 'loss/train': 1.7972415685653687} -11/06/2021 23:52:50 - INFO - __main__ - Step 18673: {'lr': 0.0004845073998024555, 'samples': 3585216, 'steps': 18672, 'loss/train': 2.1059470176696777} -11/06/2021 23:52:50 - INFO - __main__ - Step 18674: {'lr': 0.0004845055606700472, 'samples': 3585408, 'steps': 18673, 'loss/train': 1.6786866188049316} -11/06/2021 23:52:51 - INFO - __main__ - Step 18675: {'lr': 0.0004845037214319743, 'samples': 3585600, 'steps': 18674, 'loss/train': 1.7961063385009766} -11/06/2021 23:52:52 - INFO - __main__ - Step 18676: {'lr': 0.00048450188208823766, 'samples': 3585792, 'steps': 18675, 'loss/train': 1.6116433143615723} -11/06/2021 23:52:52 - INFO - __main__ - Step 18677: {'lr': 0.00048450004263883806, 'samples': 3585984, 'steps': 18676, 'loss/train': 1.9659193754196167} -11/06/2021 23:52:52 - INFO - __main__ - Step 18678: {'lr': 0.00048449820308377634, 'samples': 3586176, 'steps': 18677, 'loss/train': 1.7020381689071655} -11/06/2021 23:52:53 - INFO - __main__ - Step 18679: {'lr': 0.00048449636342305343, 'samples': 3586368, 'steps': 18678, 'loss/train': 1.582143783569336} -11/06/2021 23:52:53 - INFO - __main__ - Step 18680: {'lr': 0.00048449452365667003, 'samples': 3586560, 'steps': 18679, 'loss/train': 1.3421880006790161} -11/06/2021 23:52:54 - INFO - __main__ - Step 18681: {'lr': 0.00048449268378462695, 'samples': 3586752, 'steps': 18680, 'loss/train': 1.1730694770812988} -11/06/2021 23:52:55 - INFO - __main__ - Step 18682: {'lr': 0.00048449084380692523, 'samples': 3586944, 'steps': 18681, 'loss/train': 1.537729024887085} -11/06/2021 23:52:55 - INFO - __main__ - Step 18683: {'lr': 0.0004844890037235654, 'samples': 3587136, 'steps': 18682, 'loss/train': 1.7355479001998901} -11/06/2021 23:52:55 - INFO - __main__ - Step 18684: {'lr': 0.00048448716353454856, 'samples': 3587328, 'steps': 18683, 'loss/train': 1.7572896480560303} -11/06/2021 23:52:56 - INFO - __main__ - Step 18685: {'lr': 0.0004844853232398754, 'samples': 3587520, 'steps': 18684, 'loss/train': 1.7151175737380981} -11/06/2021 23:52:57 - INFO - __main__ - Step 18686: {'lr': 0.00048448348283954674, 'samples': 3587712, 'steps': 18685, 'loss/train': 1.8041529655456543} -11/06/2021 23:52:57 - INFO - __main__ - Step 18687: {'lr': 0.00048448164233356344, 'samples': 3587904, 'steps': 18686, 'loss/train': 1.7413592338562012} -11/06/2021 23:52:57 - INFO - __main__ - Step 18688: {'lr': 0.0004844798017219264, 'samples': 3588096, 'steps': 18687, 'loss/train': 1.6515896320343018} -11/06/2021 23:52:58 - INFO - __main__ - Step 18689: {'lr': 0.00048447796100463625, 'samples': 3588288, 'steps': 18688, 'loss/train': 1.8758485317230225} -11/06/2021 23:52:58 - INFO - __main__ - Step 18690: {'lr': 0.0004844761201816941, 'samples': 3588480, 'steps': 18689, 'loss/train': 1.7205249071121216} -11/06/2021 23:52:59 - INFO - __main__ - Step 18691: {'lr': 0.0004844742792531005, 'samples': 3588672, 'steps': 18690, 'loss/train': 1.1845340728759766} -11/06/2021 23:53:00 - INFO - __main__ - Step 18692: {'lr': 0.00048447243821885644, 'samples': 3588864, 'steps': 18691, 'loss/train': 1.7539175748825073} -11/06/2021 23:53:00 - INFO - __main__ - Step 18693: {'lr': 0.0004844705970789628, 'samples': 3589056, 'steps': 18692, 'loss/train': 1.7191652059555054} -11/06/2021 23:53:00 - INFO - __main__ - Step 18694: {'lr': 0.0004844687558334202, 'samples': 3589248, 'steps': 18693, 'loss/train': 1.35236394405365} -11/06/2021 23:53:01 - INFO - __main__ - Step 18695: {'lr': 0.0004844669144822297, 'samples': 3589440, 'steps': 18694, 'loss/train': 1.8748408555984497} -11/06/2021 23:53:02 - INFO - __main__ - Step 18696: {'lr': 0.000484465073025392, 'samples': 3589632, 'steps': 18695, 'loss/train': 1.7773936986923218} -11/06/2021 23:53:02 - INFO - __main__ - Step 18697: {'lr': 0.00048446323146290795, 'samples': 3589824, 'steps': 18696, 'loss/train': 1.5781259536743164} -11/06/2021 23:53:02 - INFO - __main__ - Step 18698: {'lr': 0.0004844613897947784, 'samples': 3590016, 'steps': 18697, 'loss/train': 1.8103524446487427} -11/06/2021 23:53:03 - INFO - __main__ - Step 18699: {'lr': 0.00048445954802100414, 'samples': 3590208, 'steps': 18698, 'loss/train': 1.5242774486541748} -11/06/2021 23:53:03 - INFO - __main__ - Step 18700: {'lr': 0.000484457706141586, 'samples': 3590400, 'steps': 18699, 'loss/train': 1.4086936712265015} -11/06/2021 23:53:03 - INFO - __main__ - Step 18701: {'lr': 0.0004844558641565249, 'samples': 3590592, 'steps': 18700, 'loss/train': 1.9146695137023926} -11/06/2021 23:53:04 - INFO - __main__ - Step 18702: {'lr': 0.00048445402206582155, 'samples': 3590784, 'steps': 18701, 'loss/train': 1.5071773529052734} -11/06/2021 23:53:05 - INFO - __main__ - Step 18703: {'lr': 0.0004844521798694768, 'samples': 3590976, 'steps': 18702, 'loss/train': 1.537892460823059} -11/06/2021 23:53:05 - INFO - __main__ - Step 18704: {'lr': 0.0004844503375674916, 'samples': 3591168, 'steps': 18703, 'loss/train': 1.0163267850875854} -11/06/2021 23:53:05 - INFO - __main__ - Step 18705: {'lr': 0.0004844484951598667, 'samples': 3591360, 'steps': 18704, 'loss/train': 1.5912625789642334} -11/06/2021 23:53:06 - INFO - __main__ - Step 18706: {'lr': 0.00048444665264660286, 'samples': 3591552, 'steps': 18705, 'loss/train': 1.7461742162704468} -11/06/2021 23:53:07 - INFO - __main__ - Step 18707: {'lr': 0.000484444810027701, 'samples': 3591744, 'steps': 18706, 'loss/train': 1.5173417329788208} -11/06/2021 23:53:07 - INFO - __main__ - Step 18708: {'lr': 0.00048444296730316196, 'samples': 3591936, 'steps': 18707, 'loss/train': 0.8280439972877502} -11/06/2021 23:53:08 - INFO - __main__ - Step 18709: {'lr': 0.0004844411244729865, 'samples': 3592128, 'steps': 18708, 'loss/train': 1.8678555488586426} -11/06/2021 23:53:08 - INFO - __main__ - Step 18710: {'lr': 0.00048443928153717555, 'samples': 3592320, 'steps': 18709, 'loss/train': 2.2123522758483887} -11/06/2021 23:53:08 - INFO - __main__ - Step 18711: {'lr': 0.00048443743849572974, 'samples': 3592512, 'steps': 18710, 'loss/train': 1.4127544164657593} -11/06/2021 23:53:09 - INFO - __main__ - Step 18712: {'lr': 0.00048443559534865017, 'samples': 3592704, 'steps': 18711, 'loss/train': 1.2353262901306152} -11/06/2021 23:53:10 - INFO - __main__ - Step 18713: {'lr': 0.0004844337520959375, 'samples': 3592896, 'steps': 18712, 'loss/train': 1.248792290687561} -11/06/2021 23:53:10 - INFO - __main__ - Step 18714: {'lr': 0.00048443190873759256, 'samples': 3593088, 'steps': 18713, 'loss/train': 0.6155982613563538} -11/06/2021 23:53:10 - INFO - __main__ - Step 18715: {'lr': 0.00048443006527361626, 'samples': 3593280, 'steps': 18714, 'loss/train': 1.6806596517562866} -11/06/2021 23:53:11 - INFO - __main__ - Step 18716: {'lr': 0.0004844282217040094, 'samples': 3593472, 'steps': 18715, 'loss/train': 1.9265437126159668} -11/06/2021 23:53:12 - INFO - __main__ - Step 18717: {'lr': 0.00048442637802877277, 'samples': 3593664, 'steps': 18716, 'loss/train': 1.060073971748352} -11/06/2021 23:53:12 - INFO - __main__ - Step 18718: {'lr': 0.0004844245342479072, 'samples': 3593856, 'steps': 18717, 'loss/train': 1.22144615650177} -11/06/2021 23:53:12 - INFO - __main__ - Step 18719: {'lr': 0.00048442269036141363, 'samples': 3594048, 'steps': 18718, 'loss/train': 2.08038592338562} -11/06/2021 23:53:13 - INFO - __main__ - Step 18720: {'lr': 0.0004844208463692928, 'samples': 3594240, 'steps': 18719, 'loss/train': 1.9108844995498657} -11/06/2021 23:53:13 - INFO - __main__ - Step 18721: {'lr': 0.00048441900227154557, 'samples': 3594432, 'steps': 18720, 'loss/train': 1.4159252643585205} -11/06/2021 23:53:14 - INFO - __main__ - Step 18722: {'lr': 0.00048441715806817265, 'samples': 3594624, 'steps': 18721, 'loss/train': 1.447057843208313} -11/06/2021 23:53:14 - INFO - __main__ - Step 18723: {'lr': 0.0004844153137591751, 'samples': 3594816, 'steps': 18722, 'loss/train': 1.7769197225570679} -11/06/2021 23:53:15 - INFO - __main__ - Step 18724: {'lr': 0.00048441346934455356, 'samples': 3595008, 'steps': 18723, 'loss/train': 0.7423035502433777} -11/06/2021 23:53:15 - INFO - __main__ - Step 18725: {'lr': 0.0004844116248243089, 'samples': 3595200, 'steps': 18724, 'loss/train': 2.38761568069458} -11/06/2021 23:53:15 - INFO - __main__ - Step 18726: {'lr': 0.0004844097801984421, 'samples': 3595392, 'steps': 18725, 'loss/train': 1.1686735153198242} -11/06/2021 23:53:16 - INFO - __main__ - Step 18727: {'lr': 0.0004844079354669537, 'samples': 3595584, 'steps': 18726, 'loss/train': 1.2005784511566162} -11/06/2021 23:53:17 - INFO - __main__ - Step 18728: {'lr': 0.0004844060906298448, 'samples': 3595776, 'steps': 18727, 'loss/train': 1.632523536682129} -11/06/2021 23:53:17 - INFO - __main__ - Step 18729: {'lr': 0.0004844042456871162, 'samples': 3595968, 'steps': 18728, 'loss/train': 1.1527280807495117} -11/06/2021 23:53:17 - INFO - __main__ - Step 18730: {'lr': 0.0004844024006387685, 'samples': 3596160, 'steps': 18729, 'loss/train': 1.233432412147522} -11/06/2021 23:53:18 - INFO - __main__ - Step 18731: {'lr': 0.00048440055548480275, 'samples': 3596352, 'steps': 18730, 'loss/train': 1.747187852859497} -11/06/2021 23:53:18 - INFO - __main__ - Step 18732: {'lr': 0.0004843987102252198, 'samples': 3596544, 'steps': 18731, 'loss/train': 1.3266741037368774} -11/06/2021 23:53:19 - INFO - __main__ - Step 18733: {'lr': 0.0004843968648600204, 'samples': 3596736, 'steps': 18732, 'loss/train': 1.6883686780929565} -11/06/2021 23:53:20 - INFO - __main__ - Step 18734: {'lr': 0.00048439501938920534, 'samples': 3596928, 'steps': 18733, 'loss/train': 1.7252039909362793} -11/06/2021 23:53:20 - INFO - __main__ - Step 18735: {'lr': 0.0004843931738127755, 'samples': 3597120, 'steps': 18734, 'loss/train': 1.1375492811203003} -11/06/2021 23:53:20 - INFO - __main__ - Step 18736: {'lr': 0.0004843913281307317, 'samples': 3597312, 'steps': 18735, 'loss/train': 1.8562067747116089} -11/06/2021 23:53:21 - INFO - __main__ - Step 18737: {'lr': 0.0004843894823430749, 'samples': 3597504, 'steps': 18736, 'loss/train': 1.7384228706359863} -11/06/2021 23:53:22 - INFO - __main__ - Step 18738: {'lr': 0.00048438763644980564, 'samples': 3597696, 'steps': 18737, 'loss/train': 1.3184276819229126} -11/06/2021 23:53:22 - INFO - __main__ - Step 18739: {'lr': 0.0004843857904509251, 'samples': 3597888, 'steps': 18738, 'loss/train': 1.289018154144287} -11/06/2021 23:53:23 - INFO - __main__ - Step 18740: {'lr': 0.00048438394434643386, 'samples': 3598080, 'steps': 18739, 'loss/train': 1.8547766208648682} -11/06/2021 23:53:23 - INFO - __main__ - Step 18741: {'lr': 0.0004843820981363328, 'samples': 3598272, 'steps': 18740, 'loss/train': 1.6665148735046387} -11/06/2021 23:53:23 - INFO - __main__ - Step 18742: {'lr': 0.00048438025182062286, 'samples': 3598464, 'steps': 18741, 'loss/train': 1.8995819091796875} -11/06/2021 23:53:24 - INFO - __main__ - Step 18743: {'lr': 0.00048437840539930466, 'samples': 3598656, 'steps': 18742, 'loss/train': 2.344691514968872} -11/06/2021 23:53:25 - INFO - __main__ - Step 18744: {'lr': 0.0004843765588723793, 'samples': 3598848, 'steps': 18743, 'loss/train': 1.6986535787582397} -11/06/2021 23:53:25 - INFO - __main__ - Step 18745: {'lr': 0.00048437471223984743, 'samples': 3599040, 'steps': 18744, 'loss/train': 1.527302861213684} -11/06/2021 23:53:25 - INFO - __main__ - Step 18746: {'lr': 0.00048437286550170996, 'samples': 3599232, 'steps': 18745, 'loss/train': 1.0772827863693237} -11/06/2021 23:53:26 - INFO - __main__ - Step 18747: {'lr': 0.00048437101865796763, 'samples': 3599424, 'steps': 18746, 'loss/train': 1.4782168865203857} -11/06/2021 23:53:26 - INFO - __main__ - Step 18748: {'lr': 0.0004843691717086214, 'samples': 3599616, 'steps': 18747, 'loss/train': 1.4430029392242432} -11/06/2021 23:53:27 - INFO - __main__ - Step 18749: {'lr': 0.000484367324653672, 'samples': 3599808, 'steps': 18748, 'loss/train': 1.6161614656448364} -11/06/2021 23:53:27 - INFO - __main__ - Step 18750: {'lr': 0.0004843654774931203, 'samples': 3600000, 'steps': 18749, 'loss/train': 1.6915335655212402} -11/06/2021 23:53:28 - INFO - __main__ - Step 18751: {'lr': 0.00048436363022696715, 'samples': 3600192, 'steps': 18750, 'loss/train': 1.6915794610977173} -11/06/2021 23:53:28 - INFO - __main__ - Step 18752: {'lr': 0.0004843617828552134, 'samples': 3600384, 'steps': 18751, 'loss/train': 1.9114357233047485} -11/06/2021 23:53:29 - INFO - __main__ - Step 18753: {'lr': 0.00048435993537785976, 'samples': 3600576, 'steps': 18752, 'loss/train': 0.9509969353675842} -11/06/2021 23:53:30 - INFO - __main__ - Step 18754: {'lr': 0.0004843580877949072, 'samples': 3600768, 'steps': 18753, 'loss/train': 1.7542425394058228} -11/06/2021 23:53:30 - INFO - __main__ - Step 18755: {'lr': 0.0004843562401063565, 'samples': 3600960, 'steps': 18754, 'loss/train': 0.9853984713554382} -11/06/2021 23:53:30 - INFO - __main__ - Step 18756: {'lr': 0.0004843543923122085, 'samples': 3601152, 'steps': 18755, 'loss/train': 1.426131010055542} -11/06/2021 23:53:31 - INFO - __main__ - Step 18757: {'lr': 0.000484352544412464, 'samples': 3601344, 'steps': 18756, 'loss/train': 1.6753501892089844} -11/06/2021 23:53:31 - INFO - __main__ - Step 18758: {'lr': 0.0004843506964071239, 'samples': 3601536, 'steps': 18757, 'loss/train': 1.2865328788757324} -11/06/2021 23:53:32 - INFO - __main__ - Step 18759: {'lr': 0.000484348848296189, 'samples': 3601728, 'steps': 18758, 'loss/train': 1.4032695293426514} -11/06/2021 23:53:32 - INFO - __main__ - Step 18760: {'lr': 0.00048434700007966006, 'samples': 3601920, 'steps': 18759, 'loss/train': 1.8957061767578125} -11/06/2021 23:53:33 - INFO - __main__ - Step 18761: {'lr': 0.000484345151757538, 'samples': 3602112, 'steps': 18760, 'loss/train': 1.5884819030761719} -11/06/2021 23:53:33 - INFO - __main__ - Step 18762: {'lr': 0.0004843433033298237, 'samples': 3602304, 'steps': 18761, 'loss/train': 0.3044757544994354} -11/06/2021 23:53:33 - INFO - __main__ - Step 18763: {'lr': 0.00048434145479651783, 'samples': 3602496, 'steps': 18762, 'loss/train': 2.1938703060150146} -11/06/2021 23:53:34 - INFO - __main__ - Step 18764: {'lr': 0.00048433960615762136, 'samples': 3602688, 'steps': 18763, 'loss/train': 2.144761562347412} -11/06/2021 23:53:35 - INFO - __main__ - Step 18765: {'lr': 0.0004843377574131351, 'samples': 3602880, 'steps': 18764, 'loss/train': 1.4775487184524536} -11/06/2021 23:53:35 - INFO - __main__ - Step 18766: {'lr': 0.0004843359085630598, 'samples': 3603072, 'steps': 18765, 'loss/train': 1.5913273096084595} -11/06/2021 23:53:35 - INFO - __main__ - Step 18767: {'lr': 0.0004843340596073964, 'samples': 3603264, 'steps': 18766, 'loss/train': 1.588987946510315} -11/06/2021 23:53:36 - INFO - __main__ - Step 18768: {'lr': 0.0004843322105461457, 'samples': 3603456, 'steps': 18767, 'loss/train': 1.364917278289795} -11/06/2021 23:53:37 - INFO - __main__ - Step 18769: {'lr': 0.0004843303613793085, 'samples': 3603648, 'steps': 18768, 'loss/train': 1.2008689641952515} -11/06/2021 23:53:37 - INFO - __main__ - Step 18770: {'lr': 0.00048432851210688567, 'samples': 3603840, 'steps': 18769, 'loss/train': 1.6347686052322388} -11/06/2021 23:53:37 - INFO - __main__ - Step 18771: {'lr': 0.00048432666272887805, 'samples': 3604032, 'steps': 18770, 'loss/train': 1.4727251529693604} -11/06/2021 23:53:38 - INFO - __main__ - Step 18772: {'lr': 0.0004843248132452864, 'samples': 3604224, 'steps': 18771, 'loss/train': 0.3945901691913605} -11/06/2021 23:53:38 - INFO - __main__ - Step 18773: {'lr': 0.0004843229636561116, 'samples': 3604416, 'steps': 18772, 'loss/train': 0.9401273131370544} -11/06/2021 23:53:39 - INFO - __main__ - Step 18774: {'lr': 0.00048432111396135447, 'samples': 3604608, 'steps': 18773, 'loss/train': 1.7124041318893433} -11/06/2021 23:53:40 - INFO - __main__ - Step 18775: {'lr': 0.0004843192641610159, 'samples': 3604800, 'steps': 18774, 'loss/train': 1.9197239875793457} -11/06/2021 23:53:40 - INFO - __main__ - Step 18776: {'lr': 0.00048431741425509676, 'samples': 3604992, 'steps': 18775, 'loss/train': 1.211233377456665} -11/06/2021 23:53:40 - INFO - __main__ - Step 18777: {'lr': 0.0004843155642435977, 'samples': 3605184, 'steps': 18776, 'loss/train': 1.7263365983963013} -11/06/2021 23:53:41 - INFO - __main__ - Step 18778: {'lr': 0.0004843137141265197, 'samples': 3605376, 'steps': 18777, 'loss/train': 1.467863917350769} -11/06/2021 23:53:41 - INFO - __main__ - Step 18779: {'lr': 0.00048431186390386356, 'samples': 3605568, 'steps': 18778, 'loss/train': 1.4806694984436035} -11/06/2021 23:53:42 - INFO - __main__ - Step 18780: {'lr': 0.0004843100135756301, 'samples': 3605760, 'steps': 18779, 'loss/train': 1.1883167028427124} -11/06/2021 23:53:42 - INFO - __main__ - Step 18781: {'lr': 0.0004843081631418202, 'samples': 3605952, 'steps': 18780, 'loss/train': 1.6708265542984009} -11/06/2021 23:53:43 - INFO - __main__ - Step 18782: {'lr': 0.00048430631260243465, 'samples': 3606144, 'steps': 18781, 'loss/train': 1.7834099531173706} -11/06/2021 23:53:43 - INFO - __main__ - Step 18783: {'lr': 0.00048430446195747424, 'samples': 3606336, 'steps': 18782, 'loss/train': 1.7206259965896606} -11/06/2021 23:53:43 - INFO - __main__ - Step 18784: {'lr': 0.00048430261120693986, 'samples': 3606528, 'steps': 18783, 'loss/train': 0.8681101202964783} -11/06/2021 23:53:44 - INFO - __main__ - Step 18785: {'lr': 0.0004843007603508324, 'samples': 3606720, 'steps': 18784, 'loss/train': 1.4189516305923462} -11/06/2021 23:53:45 - INFO - __main__ - Step 18786: {'lr': 0.00048429890938915255, 'samples': 3606912, 'steps': 18785, 'loss/train': 1.232398271560669} -11/06/2021 23:53:45 - INFO - __main__ - Step 18787: {'lr': 0.0004842970583219013, 'samples': 3607104, 'steps': 18786, 'loss/train': 1.7327327728271484} -11/06/2021 23:53:45 - INFO - __main__ - Step 18788: {'lr': 0.0004842952071490794, 'samples': 3607296, 'steps': 18787, 'loss/train': 1.8691179752349854} -11/06/2021 23:53:46 - INFO - __main__ - Step 18789: {'lr': 0.0004842933558706877, 'samples': 3607488, 'steps': 18788, 'loss/train': 1.6241750717163086} -11/06/2021 23:53:47 - INFO - __main__ - Step 18790: {'lr': 0.000484291504486727, 'samples': 3607680, 'steps': 18789, 'loss/train': 2.0066754817962646} -11/06/2021 23:53:47 - INFO - __main__ - Step 18791: {'lr': 0.0004842896529971982, 'samples': 3607872, 'steps': 18790, 'loss/train': 1.6360875368118286} -11/06/2021 23:53:48 - INFO - __main__ - Step 18792: {'lr': 0.00048428780140210204, 'samples': 3608064, 'steps': 18791, 'loss/train': 1.7113112211227417} -11/06/2021 23:53:48 - INFO - __main__ - Step 18793: {'lr': 0.0004842859497014394, 'samples': 3608256, 'steps': 18792, 'loss/train': 0.3076252043247223} -11/06/2021 23:53:48 - INFO - __main__ - Step 18794: {'lr': 0.0004842840978952112, 'samples': 3608448, 'steps': 18793, 'loss/train': 0.9483229517936707} -11/06/2021 23:53:49 - INFO - __main__ - Step 18795: {'lr': 0.00048428224598341815, 'samples': 3608640, 'steps': 18794, 'loss/train': 1.8937662839889526} -11/06/2021 23:53:50 - INFO - __main__ - Step 18796: {'lr': 0.0004842803939660612, 'samples': 3608832, 'steps': 18795, 'loss/train': 1.622977614402771} -11/06/2021 23:53:50 - INFO - __main__ - Step 18797: {'lr': 0.00048427854184314103, 'samples': 3609024, 'steps': 18796, 'loss/train': 0.8508211970329285} -11/06/2021 23:53:50 - INFO - __main__ - Step 18798: {'lr': 0.0004842766896146586, 'samples': 3609216, 'steps': 18797, 'loss/train': 1.125472068786621} -11/06/2021 23:53:51 - INFO - __main__ - Step 18799: {'lr': 0.0004842748372806147, 'samples': 3609408, 'steps': 18798, 'loss/train': 1.7149622440338135} -11/06/2021 23:53:51 - INFO - __main__ - Step 18800: {'lr': 0.00048427298484101023, 'samples': 3609600, 'steps': 18799, 'loss/train': 0.749356746673584} -11/06/2021 23:53:52 - INFO - __main__ - Step 18801: {'lr': 0.0004842711322958459, 'samples': 3609792, 'steps': 18800, 'loss/train': 2.0503411293029785} -11/06/2021 23:53:53 - INFO - __main__ - Step 18802: {'lr': 0.0004842692796451226, 'samples': 3609984, 'steps': 18801, 'loss/train': 1.4108389616012573} -11/06/2021 23:53:53 - INFO - __main__ - Step 18803: {'lr': 0.0004842674268888413, 'samples': 3610176, 'steps': 18802, 'loss/train': 1.3129260540008545} -11/06/2021 23:53:53 - INFO - __main__ - Step 18804: {'lr': 0.0004842655740270026, 'samples': 3610368, 'steps': 18803, 'loss/train': 1.4389371871948242} -11/06/2021 23:53:54 - INFO - __main__ - Step 18805: {'lr': 0.0004842637210596075, 'samples': 3610560, 'steps': 18804, 'loss/train': 1.9069589376449585} -11/06/2021 23:53:55 - INFO - __main__ - Step 18806: {'lr': 0.0004842618679866567, 'samples': 3610752, 'steps': 18805, 'loss/train': 1.330498218536377} -11/06/2021 23:53:55 - INFO - __main__ - Step 18807: {'lr': 0.0004842600148081512, 'samples': 3610944, 'steps': 18806, 'loss/train': 1.689779281616211} -11/06/2021 23:53:55 - INFO - __main__ - Step 18808: {'lr': 0.00048425816152409173, 'samples': 3611136, 'steps': 18807, 'loss/train': 1.5551064014434814} -11/06/2021 23:53:56 - INFO - __main__ - Step 18809: {'lr': 0.00048425630813447916, 'samples': 3611328, 'steps': 18808, 'loss/train': 1.4787465333938599} -11/06/2021 23:53:56 - INFO - __main__ - Step 18810: {'lr': 0.0004842544546393143, 'samples': 3611520, 'steps': 18809, 'loss/train': 1.7897770404815674} -11/06/2021 23:53:57 - INFO - __main__ - Step 18811: {'lr': 0.00048425260103859797, 'samples': 3611712, 'steps': 18810, 'loss/train': 1.685746192932129} -11/06/2021 23:53:57 - INFO - __main__ - Step 18812: {'lr': 0.0004842507473323311, 'samples': 3611904, 'steps': 18811, 'loss/train': 1.5817826986312866} -11/06/2021 23:53:58 - INFO - __main__ - Step 18813: {'lr': 0.00048424889352051436, 'samples': 3612096, 'steps': 18812, 'loss/train': 1.8189197778701782} -11/06/2021 23:53:58 - INFO - __main__ - Step 18814: {'lr': 0.00048424703960314876, 'samples': 3612288, 'steps': 18813, 'loss/train': 1.7752747535705566} -11/06/2021 23:53:59 - INFO - __main__ - Step 18815: {'lr': 0.00048424518558023505, 'samples': 3612480, 'steps': 18814, 'loss/train': 1.612984538078308} -11/06/2021 23:54:00 - INFO - __main__ - Step 18816: {'lr': 0.00048424333145177405, 'samples': 3612672, 'steps': 18815, 'loss/train': 1.6740766763687134} -11/06/2021 23:54:00 - INFO - __main__ - Step 18817: {'lr': 0.00048424147721776666, 'samples': 3612864, 'steps': 18816, 'loss/train': 2.1559345722198486} -11/06/2021 23:54:00 - INFO - __main__ - Step 18818: {'lr': 0.00048423962287821366, 'samples': 3613056, 'steps': 18817, 'loss/train': 0.7726074457168579} -11/06/2021 23:54:01 - INFO - __main__ - Step 18819: {'lr': 0.00048423776843311585, 'samples': 3613248, 'steps': 18818, 'loss/train': 1.7637563943862915} -11/06/2021 23:54:01 - INFO - __main__ - Step 18820: {'lr': 0.00048423591388247416, 'samples': 3613440, 'steps': 18819, 'loss/train': 1.7249056100845337} -11/06/2021 23:54:01 - INFO - __main__ - Step 18821: {'lr': 0.0004842340592262894, 'samples': 3613632, 'steps': 18820, 'loss/train': 1.6943449974060059} -11/06/2021 23:54:03 - INFO - __main__ - Step 18822: {'lr': 0.00048423220446456233, 'samples': 3613824, 'steps': 18821, 'loss/train': 1.352774739265442} -11/06/2021 23:54:03 - INFO - __main__ - Step 18823: {'lr': 0.0004842303495972939, 'samples': 3614016, 'steps': 18822, 'loss/train': 2.108214855194092} -11/06/2021 23:54:04 - INFO - __main__ - Step 18824: {'lr': 0.00048422849462448483, 'samples': 3614208, 'steps': 18823, 'loss/train': 1.8044021129608154} -11/06/2021 23:54:04 - INFO - __main__ - Step 18825: {'lr': 0.0004842266395461361, 'samples': 3614400, 'steps': 18824, 'loss/train': 6.426365375518799} -11/06/2021 23:54:04 - INFO - __main__ - Step 18826: {'lr': 0.0004842247843622484, 'samples': 3614592, 'steps': 18825, 'loss/train': 5.2774271965026855} -11/06/2021 23:54:05 - INFO - __main__ - Step 18827: {'lr': 0.0004842229290728226, 'samples': 3614784, 'steps': 18826, 'loss/train': 1.6318795680999756} -11/06/2021 23:54:05 - INFO - __main__ - Step 18828: {'lr': 0.0004842210736778596, 'samples': 3614976, 'steps': 18827, 'loss/train': 1.7528266906738281} -11/06/2021 23:54:06 - INFO - __main__ - Step 18829: {'lr': 0.0004842192181773602, 'samples': 3615168, 'steps': 18828, 'loss/train': 1.5569349527359009} -11/06/2021 23:54:07 - INFO - __main__ - Step 18830: {'lr': 0.0004842173625713252, 'samples': 3615360, 'steps': 18829, 'loss/train': 1.8088799715042114} -11/06/2021 23:54:07 - INFO - __main__ - Step 18831: {'lr': 0.0004842155068597556, 'samples': 3615552, 'steps': 18830, 'loss/train': 1.3919082880020142} -11/06/2021 23:54:07 - INFO - __main__ - Step 18832: {'lr': 0.0004842136510426519, 'samples': 3615744, 'steps': 18831, 'loss/train': 1.83372962474823} -11/06/2021 23:54:08 - INFO - __main__ - Step 18833: {'lr': 0.00048421179512001536, 'samples': 3615936, 'steps': 18832, 'loss/train': 1.6518522500991821} -11/06/2021 23:54:08 - INFO - __main__ - Step 18834: {'lr': 0.0004842099390918464, 'samples': 3616128, 'steps': 18833, 'loss/train': 1.6888887882232666} -11/06/2021 23:54:09 - INFO - __main__ - Step 18835: {'lr': 0.00048420808295814624, 'samples': 3616320, 'steps': 18834, 'loss/train': 1.783157467842102} -11/06/2021 23:54:09 - INFO - __main__ - Step 18836: {'lr': 0.00048420622671891533, 'samples': 3616512, 'steps': 18835, 'loss/train': 1.1677378416061401} -11/06/2021 23:54:10 - INFO - __main__ - Step 18837: {'lr': 0.00048420437037415486, 'samples': 3616704, 'steps': 18836, 'loss/train': 1.6292400360107422} -11/06/2021 23:54:10 - INFO - __main__ - Step 18838: {'lr': 0.00048420251392386547, 'samples': 3616896, 'steps': 18837, 'loss/train': 1.4948904514312744} -11/06/2021 23:54:11 - INFO - __main__ - Step 18839: {'lr': 0.0004842006573680481, 'samples': 3617088, 'steps': 18838, 'loss/train': 2.066965103149414} -11/06/2021 23:54:11 - INFO - __main__ - Step 18840: {'lr': 0.0004841988007067034, 'samples': 3617280, 'steps': 18839, 'loss/train': 1.4668853282928467} -11/06/2021 23:54:12 - INFO - __main__ - Step 18841: {'lr': 0.00048419694393983244, 'samples': 3617472, 'steps': 18840, 'loss/train': 1.542981505393982} -11/06/2021 23:54:12 - INFO - __main__ - Step 18842: {'lr': 0.00048419508706743587, 'samples': 3617664, 'steps': 18841, 'loss/train': 1.729238748550415} -11/06/2021 23:54:12 - INFO - __main__ - Step 18843: {'lr': 0.00048419323008951467, 'samples': 3617856, 'steps': 18842, 'loss/train': 1.618919014930725} -11/06/2021 23:54:13 - INFO - __main__ - Step 18844: {'lr': 0.00048419137300606963, 'samples': 3618048, 'steps': 18843, 'loss/train': 1.8637679815292358} -11/06/2021 23:54:14 - INFO - __main__ - Step 18845: {'lr': 0.00048418951581710154, 'samples': 3618240, 'steps': 18844, 'loss/train': 1.0846983194351196} -11/06/2021 23:54:14 - INFO - __main__ - Step 18846: {'lr': 0.00048418765852261124, 'samples': 3618432, 'steps': 18845, 'loss/train': 1.3119678497314453} -11/06/2021 23:54:14 - INFO - __main__ - Step 18847: {'lr': 0.0004841858011225996, 'samples': 3618624, 'steps': 18846, 'loss/train': 2.0200302600860596} -11/06/2021 23:54:15 - INFO - __main__ - Step 18848: {'lr': 0.0004841839436170675, 'samples': 3618816, 'steps': 18847, 'loss/train': 1.3020848035812378} -11/06/2021 23:54:16 - INFO - __main__ - Step 18849: {'lr': 0.0004841820860060157, 'samples': 3619008, 'steps': 18848, 'loss/train': 1.4073768854141235} -11/06/2021 23:54:16 - INFO - __main__ - Step 18850: {'lr': 0.0004841802282894451, 'samples': 3619200, 'steps': 18849, 'loss/train': 1.74467134475708} -11/06/2021 23:54:16 - INFO - __main__ - Step 18851: {'lr': 0.0004841783704673565, 'samples': 3619392, 'steps': 18850, 'loss/train': 1.4385926723480225} -11/06/2021 23:54:17 - INFO - __main__ - Step 18852: {'lr': 0.00048417651253975067, 'samples': 3619584, 'steps': 18851, 'loss/train': 1.2946964502334595} -11/06/2021 23:54:17 - INFO - __main__ - Step 18853: {'lr': 0.00048417465450662856, 'samples': 3619776, 'steps': 18852, 'loss/train': 1.5022872686386108} -11/06/2021 23:54:18 - INFO - __main__ - Step 18854: {'lr': 0.0004841727963679909, 'samples': 3619968, 'steps': 18853, 'loss/train': 2.3088507652282715} -11/06/2021 23:54:19 - INFO - __main__ - Step 18855: {'lr': 0.0004841709381238387, 'samples': 3620160, 'steps': 18854, 'loss/train': 1.64644455909729} -11/06/2021 23:54:19 - INFO - __main__ - Step 18856: {'lr': 0.0004841690797741726, 'samples': 3620352, 'steps': 18855, 'loss/train': 1.808630347251892} -11/06/2021 23:54:19 - INFO - __main__ - Step 18857: {'lr': 0.0004841672213189936, 'samples': 3620544, 'steps': 18856, 'loss/train': 1.4299774169921875} -11/06/2021 23:54:20 - INFO - __main__ - Step 18858: {'lr': 0.00048416536275830245, 'samples': 3620736, 'steps': 18857, 'loss/train': 1.275566577911377} -11/06/2021 23:54:20 - INFO - __main__ - Step 18859: {'lr': 0.00048416350409209995, 'samples': 3620928, 'steps': 18858, 'loss/train': 1.8275693655014038} -11/06/2021 23:54:21 - INFO - __main__ - Step 18860: {'lr': 0.000484161645320387, 'samples': 3621120, 'steps': 18859, 'loss/train': 0.7486388087272644} -11/06/2021 23:54:22 - INFO - __main__ - Step 18861: {'lr': 0.0004841597864431645, 'samples': 3621312, 'steps': 18860, 'loss/train': 1.5714701414108276} -11/06/2021 23:54:22 - INFO - __main__ - Step 18862: {'lr': 0.00048415792746043314, 'samples': 3621504, 'steps': 18861, 'loss/train': 2.1515393257141113} -11/06/2021 23:54:22 - INFO - __main__ - Step 18863: {'lr': 0.00048415606837219383, 'samples': 3621696, 'steps': 18862, 'loss/train': 0.8803495168685913} -11/06/2021 23:54:23 - INFO - __main__ - Step 18864: {'lr': 0.00048415420917844744, 'samples': 3621888, 'steps': 18863, 'loss/train': 1.059100866317749} -11/06/2021 23:54:23 - INFO - __main__ - Step 18865: {'lr': 0.00048415234987919474, 'samples': 3622080, 'steps': 18864, 'loss/train': 1.3690611124038696} -11/06/2021 23:54:24 - INFO - __main__ - Step 18866: {'lr': 0.0004841504904744367, 'samples': 3622272, 'steps': 18865, 'loss/train': 1.7441192865371704} -11/06/2021 23:54:24 - INFO - __main__ - Step 18867: {'lr': 0.0004841486309641739, 'samples': 3622464, 'steps': 18866, 'loss/train': 1.8263840675354004} -11/06/2021 23:54:25 - INFO - __main__ - Step 18868: {'lr': 0.00048414677134840753, 'samples': 3622656, 'steps': 18867, 'loss/train': 1.3380950689315796} -11/06/2021 23:54:25 - INFO - __main__ - Step 18869: {'lr': 0.00048414491162713814, 'samples': 3622848, 'steps': 18868, 'loss/train': 1.482108473777771} -11/06/2021 23:54:25 - INFO - __main__ - Step 18870: {'lr': 0.00048414305180036665, 'samples': 3623040, 'steps': 18869, 'loss/train': 1.6186736822128296} -11/06/2021 23:54:26 - INFO - __main__ - Step 18871: {'lr': 0.0004841411918680939, 'samples': 3623232, 'steps': 18870, 'loss/train': 1.5286184549331665} -11/06/2021 23:54:27 - INFO - __main__ - Step 18872: {'lr': 0.0004841393318303208, 'samples': 3623424, 'steps': 18871, 'loss/train': 1.8360174894332886} -11/06/2021 23:54:27 - INFO - __main__ - Step 18873: {'lr': 0.0004841374716870481, 'samples': 3623616, 'steps': 18872, 'loss/train': 1.7237398624420166} -11/06/2021 23:54:27 - INFO - __main__ - Step 18874: {'lr': 0.00048413561143827665, 'samples': 3623808, 'steps': 18873, 'loss/train': 1.8056116104125977} -11/06/2021 23:54:28 - INFO - __main__ - Step 18875: {'lr': 0.00048413375108400736, 'samples': 3624000, 'steps': 18874, 'loss/train': 1.8317943811416626} -11/06/2021 23:54:29 - INFO - __main__ - Step 18876: {'lr': 0.000484131890624241, 'samples': 3624192, 'steps': 18875, 'loss/train': 1.52738356590271} -11/06/2021 23:54:29 - INFO - __main__ - Step 18877: {'lr': 0.00048413003005897835, 'samples': 3624384, 'steps': 18876, 'loss/train': 1.5932716131210327} -11/06/2021 23:54:29 - INFO - __main__ - Step 18878: {'lr': 0.0004841281693882204, 'samples': 3624576, 'steps': 18877, 'loss/train': 1.2580933570861816} -11/06/2021 23:54:30 - INFO - __main__ - Step 18879: {'lr': 0.0004841263086119679, 'samples': 3624768, 'steps': 18878, 'loss/train': 1.666326642036438} -11/06/2021 23:54:30 - INFO - __main__ - Step 18880: {'lr': 0.00048412444773022166, 'samples': 3624960, 'steps': 18879, 'loss/train': 1.489951491355896} -11/06/2021 23:54:31 - INFO - __main__ - Step 18881: {'lr': 0.0004841225867429826, 'samples': 3625152, 'steps': 18880, 'loss/train': 1.7064945697784424} -11/06/2021 23:54:32 - INFO - __main__ - Step 18882: {'lr': 0.0004841207256502515, 'samples': 3625344, 'steps': 18881, 'loss/train': 1.4198405742645264} -11/06/2021 23:54:32 - INFO - __main__ - Step 18883: {'lr': 0.0004841188644520292, 'samples': 3625536, 'steps': 18882, 'loss/train': 2.1660537719726562} -11/06/2021 23:54:32 - INFO - __main__ - Step 18884: {'lr': 0.0004841170031483165, 'samples': 3625728, 'steps': 18883, 'loss/train': 1.5875812768936157} -11/06/2021 23:54:33 - INFO - __main__ - Step 18885: {'lr': 0.0004841151417391144, 'samples': 3625920, 'steps': 18884, 'loss/train': 1.3188947439193726} -11/06/2021 23:54:33 - INFO - __main__ - Step 18886: {'lr': 0.00048411328022442357, 'samples': 3626112, 'steps': 18885, 'loss/train': 1.1708683967590332} -11/06/2021 23:54:34 - INFO - __main__ - Step 18887: {'lr': 0.000484111418604245, 'samples': 3626304, 'steps': 18886, 'loss/train': 0.6864486336708069} -11/06/2021 23:54:34 - INFO - __main__ - Step 18888: {'lr': 0.00048410955687857926, 'samples': 3626496, 'steps': 18887, 'loss/train': 1.1706008911132812} -11/06/2021 23:54:35 - INFO - __main__ - Step 18889: {'lr': 0.0004841076950474275, 'samples': 3626688, 'steps': 18888, 'loss/train': 1.363743543624878} -11/06/2021 23:54:35 - INFO - __main__ - Step 18890: {'lr': 0.0004841058331107904, 'samples': 3626880, 'steps': 18889, 'loss/train': 1.5939115285873413} -11/06/2021 23:54:35 - INFO - __main__ - Step 18891: {'lr': 0.00048410397106866883, 'samples': 3627072, 'steps': 18890, 'loss/train': 1.363234281539917} -11/06/2021 23:54:36 - INFO - __main__ - Step 18892: {'lr': 0.0004841021089210636, 'samples': 3627264, 'steps': 18891, 'loss/train': 1.4709104299545288} -11/06/2021 23:54:37 - INFO - __main__ - Step 18893: {'lr': 0.0004841002466679756, 'samples': 3627456, 'steps': 18892, 'loss/train': 1.4250143766403198} -11/06/2021 23:54:37 - INFO - __main__ - Step 18894: {'lr': 0.00048409838430940556, 'samples': 3627648, 'steps': 18893, 'loss/train': 1.4562376737594604} -11/06/2021 23:54:37 - INFO - __main__ - Step 18895: {'lr': 0.00048409652184535447, 'samples': 3627840, 'steps': 18894, 'loss/train': 1.5139254331588745} -11/06/2021 23:54:38 - INFO - __main__ - Step 18896: {'lr': 0.0004840946592758231, 'samples': 3628032, 'steps': 18895, 'loss/train': 1.6306174993515015} -11/06/2021 23:54:39 - INFO - __main__ - Step 18897: {'lr': 0.00048409279660081226, 'samples': 3628224, 'steps': 18896, 'loss/train': 1.2062115669250488} -11/06/2021 23:54:39 - INFO - __main__ - Step 18898: {'lr': 0.0004840909338203229, 'samples': 3628416, 'steps': 18897, 'loss/train': 1.950105905532837} -11/06/2021 23:54:40 - INFO - __main__ - Step 18899: {'lr': 0.0004840890709343557, 'samples': 3628608, 'steps': 18898, 'loss/train': 1.9823861122131348} -11/06/2021 23:54:40 - INFO - __main__ - Step 18900: {'lr': 0.0004840872079429116, 'samples': 3628800, 'steps': 18899, 'loss/train': 1.6326419115066528} -11/06/2021 23:54:40 - INFO - __main__ - Step 18901: {'lr': 0.00048408534484599143, 'samples': 3628992, 'steps': 18900, 'loss/train': 1.2868921756744385} -11/06/2021 23:54:41 - INFO - __main__ - Step 18902: {'lr': 0.00048408348164359594, 'samples': 3629184, 'steps': 18901, 'loss/train': 1.845752477645874} -11/06/2021 23:54:42 - INFO - __main__ - Step 18903: {'lr': 0.00048408161833572613, 'samples': 3629376, 'steps': 18902, 'loss/train': 2.1983730792999268} -11/06/2021 23:54:42 - INFO - __main__ - Step 18904: {'lr': 0.0004840797549223827, 'samples': 3629568, 'steps': 18903, 'loss/train': 1.6073050498962402} -11/06/2021 23:54:42 - INFO - __main__ - Step 18905: {'lr': 0.00048407789140356654, 'samples': 3629760, 'steps': 18904, 'loss/train': 1.3466079235076904} -11/06/2021 23:54:43 - INFO - __main__ - Step 18906: {'lr': 0.00048407602777927856, 'samples': 3629952, 'steps': 18905, 'loss/train': 1.2008774280548096} -11/06/2021 23:54:44 - INFO - __main__ - Step 18907: {'lr': 0.0004840741640495195, 'samples': 3630144, 'steps': 18906, 'loss/train': 2.7398083209991455} -11/06/2021 23:54:44 - INFO - __main__ - Step 18908: {'lr': 0.0004840723002142902, 'samples': 3630336, 'steps': 18907, 'loss/train': 1.9664089679718018} -11/06/2021 23:54:45 - INFO - __main__ - Step 18909: {'lr': 0.0004840704362735916, 'samples': 3630528, 'steps': 18908, 'loss/train': 1.7534114122390747} -11/06/2021 23:54:45 - INFO - __main__ - Step 18910: {'lr': 0.0004840685722274244, 'samples': 3630720, 'steps': 18909, 'loss/train': 1.252254605293274} -11/06/2021 23:54:45 - INFO - __main__ - Step 18911: {'lr': 0.0004840667080757896, 'samples': 3630912, 'steps': 18910, 'loss/train': 1.4434303045272827} -11/06/2021 23:54:46 - INFO - __main__ - Step 18912: {'lr': 0.00048406484381868786, 'samples': 3631104, 'steps': 18911, 'loss/train': 1.8143805265426636} -11/06/2021 23:54:47 - INFO - __main__ - Step 18913: {'lr': 0.0004840629794561202, 'samples': 3631296, 'steps': 18912, 'loss/train': 1.431362509727478} -11/06/2021 23:54:47 - INFO - __main__ - Step 18914: {'lr': 0.0004840611149880873, 'samples': 3631488, 'steps': 18913, 'loss/train': 0.25539538264274597} -11/06/2021 23:54:48 - INFO - __main__ - Step 18915: {'lr': 0.0004840592504145901, 'samples': 3631680, 'steps': 18914, 'loss/train': 1.6547143459320068} -11/06/2021 23:54:48 - INFO - __main__ - Step 18916: {'lr': 0.0004840573857356294, 'samples': 3631872, 'steps': 18915, 'loss/train': 1.5618704557418823} -11/06/2021 23:54:48 - INFO - __main__ - Step 18917: {'lr': 0.0004840555209512061, 'samples': 3632064, 'steps': 18916, 'loss/train': 1.6179587841033936} -11/06/2021 23:54:49 - INFO - __main__ - Step 18918: {'lr': 0.00048405365606132096, 'samples': 3632256, 'steps': 18917, 'loss/train': 1.8452666997909546} -11/06/2021 23:54:50 - INFO - __main__ - Step 18919: {'lr': 0.00048405179106597487, 'samples': 3632448, 'steps': 18918, 'loss/train': 1.6771806478500366} -11/06/2021 23:54:50 - INFO - __main__ - Step 18920: {'lr': 0.0004840499259651686, 'samples': 3632640, 'steps': 18919, 'loss/train': 2.0507524013519287} -11/06/2021 23:54:51 - INFO - __main__ - Step 18921: {'lr': 0.0004840480607589031, 'samples': 3632832, 'steps': 18920, 'loss/train': 2.5290257930755615} -11/06/2021 23:54:51 - INFO - __main__ - Step 18922: {'lr': 0.0004840461954471792, 'samples': 3633024, 'steps': 18921, 'loss/train': 1.8817951679229736} -11/06/2021 23:54:52 - INFO - __main__ - Step 18923: {'lr': 0.00048404433002999757, 'samples': 3633216, 'steps': 18922, 'loss/train': 1.3463006019592285} -11/06/2021 23:54:52 - INFO - __main__ - Step 18924: {'lr': 0.0004840424645073593, 'samples': 3633408, 'steps': 18923, 'loss/train': 1.3242696523666382} -11/06/2021 23:54:53 - INFO - __main__ - Step 18925: {'lr': 0.000484040598879265, 'samples': 3633600, 'steps': 18924, 'loss/train': 1.3132871389389038} -11/06/2021 23:54:53 - INFO - __main__ - Step 18926: {'lr': 0.0004840387331457157, 'samples': 3633792, 'steps': 18925, 'loss/train': 1.4895330667495728} -11/06/2021 23:54:53 - INFO - __main__ - Step 18927: {'lr': 0.00048403686730671215, 'samples': 3633984, 'steps': 18926, 'loss/train': 1.6102023124694824} -11/06/2021 23:54:54 - INFO - __main__ - Step 18928: {'lr': 0.0004840350013622552, 'samples': 3634176, 'steps': 18927, 'loss/train': 1.062371015548706} -11/06/2021 23:54:55 - INFO - __main__ - Step 18929: {'lr': 0.0004840331353123456, 'samples': 3634368, 'steps': 18928, 'loss/train': 1.8671513795852661} -11/06/2021 23:54:55 - INFO - __main__ - Step 18930: {'lr': 0.00048403126915698435, 'samples': 3634560, 'steps': 18929, 'loss/train': 1.2960901260375977} -11/06/2021 23:54:55 - INFO - __main__ - Step 18931: {'lr': 0.00048402940289617223, 'samples': 3634752, 'steps': 18930, 'loss/train': 1.1204884052276611} -11/06/2021 23:54:56 - INFO - __main__ - Step 18932: {'lr': 0.00048402753652991007, 'samples': 3634944, 'steps': 18931, 'loss/train': 1.4577025175094604} -11/06/2021 23:54:57 - INFO - __main__ - Step 18933: {'lr': 0.0004840256700581988, 'samples': 3635136, 'steps': 18932, 'loss/train': 1.4760710000991821} -11/06/2021 23:54:57 - INFO - __main__ - Step 18934: {'lr': 0.000484023803481039, 'samples': 3635328, 'steps': 18933, 'loss/train': 1.0608885288238525} -11/06/2021 23:54:58 - INFO - __main__ - Step 18935: {'lr': 0.00048402193679843175, 'samples': 3635520, 'steps': 18934, 'loss/train': 1.0119448900222778} -11/06/2021 23:54:58 - INFO - __main__ - Step 18936: {'lr': 0.00048402007001037786, 'samples': 3635712, 'steps': 18935, 'loss/train': 1.3457058668136597} -11/06/2021 23:54:58 - INFO - __main__ - Step 18937: {'lr': 0.0004840182031168781, 'samples': 3635904, 'steps': 18936, 'loss/train': 1.7942875623703003} -11/06/2021 23:54:59 - INFO - __main__ - Step 18938: {'lr': 0.0004840163361179334, 'samples': 3636096, 'steps': 18937, 'loss/train': 1.9397997856140137} -11/06/2021 23:55:00 - INFO - __main__ - Step 18939: {'lr': 0.00048401446901354453, 'samples': 3636288, 'steps': 18938, 'loss/train': 1.4605997800827026} -11/06/2021 23:55:00 - INFO - __main__ - Step 18940: {'lr': 0.0004840126018037123, 'samples': 3636480, 'steps': 18939, 'loss/train': 2.040832996368408} -11/06/2021 23:55:00 - INFO - __main__ - Step 18941: {'lr': 0.0004840107344884377, 'samples': 3636672, 'steps': 18940, 'loss/train': 1.2393549680709839} -11/06/2021 23:55:01 - INFO - __main__ - Step 18942: {'lr': 0.0004840088670677214, 'samples': 3636864, 'steps': 18941, 'loss/train': 1.561964988708496} -11/06/2021 23:55:01 - INFO - __main__ - Step 18943: {'lr': 0.0004840069995415643, 'samples': 3637056, 'steps': 18942, 'loss/train': 1.3233683109283447} -11/06/2021 23:55:02 - INFO - __main__ - Step 18944: {'lr': 0.0004840051319099673, 'samples': 3637248, 'steps': 18943, 'loss/train': 1.9745053052902222} -11/06/2021 23:55:02 - INFO - __main__ - Step 18945: {'lr': 0.0004840032641729312, 'samples': 3637440, 'steps': 18944, 'loss/train': 1.7221941947937012} -11/06/2021 23:55:03 - INFO - __main__ - Step 18946: {'lr': 0.0004840013963304568, 'samples': 3637632, 'steps': 18945, 'loss/train': 1.6417832374572754} -11/06/2021 23:55:03 - INFO - __main__ - Step 18947: {'lr': 0.000483999528382545, 'samples': 3637824, 'steps': 18946, 'loss/train': 1.5244332551956177} -11/06/2021 23:55:03 - INFO - __main__ - Step 18948: {'lr': 0.00048399766032919666, 'samples': 3638016, 'steps': 18947, 'loss/train': 1.8366427421569824} -11/06/2021 23:55:05 - INFO - __main__ - Step 18949: {'lr': 0.0004839957921704126, 'samples': 3638208, 'steps': 18948, 'loss/train': 1.1807835102081299} -11/06/2021 23:55:05 - INFO - __main__ - Step 18950: {'lr': 0.0004839939239061936, 'samples': 3638400, 'steps': 18949, 'loss/train': 2.372195243835449} -11/06/2021 23:55:05 - INFO - __main__ - Step 18951: {'lr': 0.00048399205553654046, 'samples': 3638592, 'steps': 18950, 'loss/train': 1.5446722507476807} -11/06/2021 23:55:06 - INFO - __main__ - Step 18952: {'lr': 0.0004839901870614543, 'samples': 3638784, 'steps': 18951, 'loss/train': 1.4252386093139648} -11/06/2021 23:55:06 - INFO - __main__ - Step 18953: {'lr': 0.0004839883184809356, 'samples': 3638976, 'steps': 18952, 'loss/train': 1.5092815160751343} -11/06/2021 23:55:07 - INFO - __main__ - Step 18954: {'lr': 0.00048398644979498543, 'samples': 3639168, 'steps': 18953, 'loss/train': 1.7473726272583008} -11/06/2021 23:55:07 - INFO - __main__ - Step 18955: {'lr': 0.0004839845810036047, 'samples': 3639360, 'steps': 18954, 'loss/train': 1.6918965578079224} -11/06/2021 23:55:08 - INFO - __main__ - Step 18956: {'lr': 0.00048398271210679393, 'samples': 3639552, 'steps': 18955, 'loss/train': 1.3582264184951782} -11/06/2021 23:55:08 - INFO - __main__ - Step 18957: {'lr': 0.0004839808431045543, 'samples': 3639744, 'steps': 18956, 'loss/train': 1.5944629907608032} -11/06/2021 23:55:08 - INFO - __main__ - Step 18958: {'lr': 0.00048397897399688643, 'samples': 3639936, 'steps': 18957, 'loss/train': 1.8873305320739746} -11/06/2021 23:55:09 - INFO - __main__ - Step 18959: {'lr': 0.0004839771047837913, 'samples': 3640128, 'steps': 18958, 'loss/train': 1.7735779285430908} -11/06/2021 23:55:10 - INFO - __main__ - Step 18960: {'lr': 0.00048397523546526966, 'samples': 3640320, 'steps': 18959, 'loss/train': 1.5042515993118286} -11/06/2021 23:55:10 - INFO - __main__ - Step 18961: {'lr': 0.0004839733660413224, 'samples': 3640512, 'steps': 18960, 'loss/train': 1.004091739654541} -11/06/2021 23:55:10 - INFO - __main__ - Step 18962: {'lr': 0.0004839714965119504, 'samples': 3640704, 'steps': 18961, 'loss/train': 1.425974726676941} -11/06/2021 23:55:11 - INFO - __main__ - Step 18963: {'lr': 0.0004839696268771544, 'samples': 3640896, 'steps': 18962, 'loss/train': 0.9318681955337524} -11/06/2021 23:55:12 - INFO - __main__ - Step 18964: {'lr': 0.0004839677571369353, 'samples': 3641088, 'steps': 18963, 'loss/train': 1.7548048496246338} -11/06/2021 23:55:12 - INFO - __main__ - Step 18965: {'lr': 0.000483965887291294, 'samples': 3641280, 'steps': 18964, 'loss/train': 1.1884113550186157} -11/06/2021 23:55:13 - INFO - __main__ - Step 18966: {'lr': 0.0004839640173402312, 'samples': 3641472, 'steps': 18965, 'loss/train': 0.5352546572685242} -11/06/2021 23:55:13 - INFO - __main__ - Step 18967: {'lr': 0.00048396214728374786, 'samples': 3641664, 'steps': 18966, 'loss/train': 1.5210620164871216} -11/06/2021 23:55:13 - INFO - __main__ - Step 18968: {'lr': 0.00048396027712184475, 'samples': 3641856, 'steps': 18967, 'loss/train': 2.4723968505859375} -11/06/2021 23:55:14 - INFO - __main__ - Step 18969: {'lr': 0.0004839584068545228, 'samples': 3642048, 'steps': 18968, 'loss/train': 1.6791962385177612} -11/06/2021 23:55:15 - INFO - __main__ - Step 18970: {'lr': 0.0004839565364817828, 'samples': 3642240, 'steps': 18969, 'loss/train': 1.571922779083252} -11/06/2021 23:55:15 - INFO - __main__ - Step 18971: {'lr': 0.0004839546660036256, 'samples': 3642432, 'steps': 18970, 'loss/train': 1.4152837991714478} -11/06/2021 23:55:15 - INFO - __main__ - Step 18972: {'lr': 0.000483952795420052, 'samples': 3642624, 'steps': 18971, 'loss/train': 1.4770593643188477} -11/06/2021 23:55:16 - INFO - __main__ - Step 18973: {'lr': 0.0004839509247310629, 'samples': 3642816, 'steps': 18972, 'loss/train': 1.4914158582687378} -11/06/2021 23:55:16 - INFO - __main__ - Step 18974: {'lr': 0.00048394905393665913, 'samples': 3643008, 'steps': 18973, 'loss/train': 1.941078543663025} -11/06/2021 23:55:17 - INFO - __main__ - Step 18975: {'lr': 0.00048394718303684147, 'samples': 3643200, 'steps': 18974, 'loss/train': 1.4603451490402222} -11/06/2021 23:55:17 - INFO - __main__ - Step 18976: {'lr': 0.00048394531203161084, 'samples': 3643392, 'steps': 18975, 'loss/train': 1.721853256225586} -11/06/2021 23:55:18 - INFO - __main__ - Step 18977: {'lr': 0.00048394344092096816, 'samples': 3643584, 'steps': 18976, 'loss/train': 1.8595176935195923} -11/06/2021 23:55:18 - INFO - __main__ - Step 18978: {'lr': 0.0004839415697049141, 'samples': 3643776, 'steps': 18977, 'loss/train': 1.1810476779937744} -11/06/2021 23:55:19 - INFO - __main__ - Step 18979: {'lr': 0.00048393969838344956, 'samples': 3643968, 'steps': 18978, 'loss/train': 4.6848673820495605} -11/06/2021 23:55:20 - INFO - __main__ - Step 18980: {'lr': 0.0004839378269565754, 'samples': 3644160, 'steps': 18979, 'loss/train': 1.5944328308105469} -11/06/2021 23:55:20 - INFO - __main__ - Step 18981: {'lr': 0.00048393595542429253, 'samples': 3644352, 'steps': 18980, 'loss/train': 1.6038635969161987} -11/06/2021 23:55:21 - INFO - __main__ - Step 18982: {'lr': 0.0004839340837866016, 'samples': 3644544, 'steps': 18981, 'loss/train': 2.6181952953338623} -11/06/2021 23:55:21 - INFO - __main__ - Step 18983: {'lr': 0.00048393221204350376, 'samples': 3644736, 'steps': 18982, 'loss/train': 1.9288345575332642} -11/06/2021 23:55:21 - INFO - __main__ - Step 18984: {'lr': 0.0004839303401949996, 'samples': 3644928, 'steps': 18983, 'loss/train': 2.2249767780303955} -11/06/2021 23:55:22 - INFO - __main__ - Step 18985: {'lr': 0.00048392846824109, 'samples': 3645120, 'steps': 18984, 'loss/train': 1.4523152112960815} -11/06/2021 23:55:23 - INFO - __main__ - Step 18986: {'lr': 0.00048392659618177585, 'samples': 3645312, 'steps': 18985, 'loss/train': 1.7560415267944336} -11/06/2021 23:55:23 - INFO - __main__ - Step 18987: {'lr': 0.000483924724017058, 'samples': 3645504, 'steps': 18986, 'loss/train': 1.8481801748275757} -11/06/2021 23:55:23 - INFO - __main__ - Step 18988: {'lr': 0.00048392285174693727, 'samples': 3645696, 'steps': 18987, 'loss/train': 0.914047360420227} -11/06/2021 23:55:24 - INFO - __main__ - Step 18989: {'lr': 0.0004839209793714146, 'samples': 3645888, 'steps': 18988, 'loss/train': 1.7691324949264526} -11/06/2021 23:55:24 - INFO - __main__ - Step 18990: {'lr': 0.00048391910689049057, 'samples': 3646080, 'steps': 18989, 'loss/train': 1.0342262983322144} -11/06/2021 23:55:25 - INFO - __main__ - Step 18991: {'lr': 0.00048391723430416634, 'samples': 3646272, 'steps': 18990, 'loss/train': 1.5997928380966187} -11/06/2021 23:55:26 - INFO - __main__ - Step 18992: {'lr': 0.00048391536161244254, 'samples': 3646464, 'steps': 18991, 'loss/train': 1.5818288326263428} -11/06/2021 23:55:26 - INFO - __main__ - Step 18993: {'lr': 0.0004839134888153202, 'samples': 3646656, 'steps': 18992, 'loss/train': 1.9287071228027344} -11/06/2021 23:55:26 - INFO - __main__ - Step 18994: {'lr': 0.00048391161591279994, 'samples': 3646848, 'steps': 18993, 'loss/train': 1.191074252128601} -11/06/2021 23:55:27 - INFO - __main__ - Step 18995: {'lr': 0.0004839097429048827, 'samples': 3647040, 'steps': 18994, 'loss/train': 1.541513442993164} -11/06/2021 23:55:28 - INFO - __main__ - Step 18996: {'lr': 0.00048390786979156944, 'samples': 3647232, 'steps': 18995, 'loss/train': 1.4567269086837769} -11/06/2021 23:55:28 - INFO - __main__ - Step 18997: {'lr': 0.0004839059965728608, 'samples': 3647424, 'steps': 18996, 'loss/train': 1.8564058542251587} -11/06/2021 23:55:28 - INFO - __main__ - Step 18998: {'lr': 0.0004839041232487578, 'samples': 3647616, 'steps': 18997, 'loss/train': 0.6478285193443298} -11/06/2021 23:55:29 - INFO - __main__ - Step 18999: {'lr': 0.0004839022498192612, 'samples': 3647808, 'steps': 18998, 'loss/train': 1.9509828090667725} -11/06/2021 23:55:29 - INFO - __main__ - Step 19000: {'lr': 0.0004839003762843718, 'samples': 3648000, 'steps': 18999, 'loss/train': 1.717009425163269} -11/06/2021 23:55:30 - INFO - __main__ - Step 19001: {'lr': 0.00048389850264409054, 'samples': 3648192, 'steps': 19000, 'loss/train': 2.1301968097686768} -11/06/2021 23:55:30 - INFO - __main__ - Step 19002: {'lr': 0.00048389662889841825, 'samples': 3648384, 'steps': 19001, 'loss/train': 1.4481666088104248} -11/06/2021 23:55:31 - INFO - __main__ - Step 19003: {'lr': 0.0004838947550473557, 'samples': 3648576, 'steps': 19002, 'loss/train': 1.5534554719924927} -11/06/2021 23:55:31 - INFO - __main__ - Step 19004: {'lr': 0.00048389288109090383, 'samples': 3648768, 'steps': 19003, 'loss/train': 1.1992428302764893} -11/06/2021 23:55:31 - INFO - __main__ - Step 19005: {'lr': 0.0004838910070290634, 'samples': 3648960, 'steps': 19004, 'loss/train': 1.6658971309661865} -11/06/2021 23:55:33 - INFO - __main__ - Step 19006: {'lr': 0.00048388913286183535, 'samples': 3649152, 'steps': 19005, 'loss/train': 1.3170843124389648} -11/06/2021 23:55:33 - INFO - __main__ - Step 19007: {'lr': 0.0004838872585892204, 'samples': 3649344, 'steps': 19006, 'loss/train': 1.4023375511169434} -11/06/2021 23:55:33 - INFO - __main__ - Step 19008: {'lr': 0.00048388538421121946, 'samples': 3649536, 'steps': 19007, 'loss/train': 1.516270637512207} -11/06/2021 23:55:34 - INFO - __main__ - Step 19009: {'lr': 0.00048388350972783346, 'samples': 3649728, 'steps': 19008, 'loss/train': 1.362441062927246} -11/06/2021 23:55:34 - INFO - __main__ - Step 19010: {'lr': 0.000483881635139063, 'samples': 3649920, 'steps': 19009, 'loss/train': 1.2651129961013794} -11/06/2021 23:55:35 - INFO - __main__ - Step 19011: {'lr': 0.00048387976044490924, 'samples': 3650112, 'steps': 19010, 'loss/train': 1.373202919960022} -11/06/2021 23:55:35 - INFO - __main__ - Step 19012: {'lr': 0.0004838778856453728, 'samples': 3650304, 'steps': 19011, 'loss/train': 1.5069514513015747} -11/06/2021 23:55:36 - INFO - __main__ - Step 19013: {'lr': 0.00048387601074045464, 'samples': 3650496, 'steps': 19012, 'loss/train': 1.5526649951934814} -11/06/2021 23:55:36 - INFO - __main__ - Step 19014: {'lr': 0.0004838741357301555, 'samples': 3650688, 'steps': 19013, 'loss/train': 1.4588598012924194} -11/06/2021 23:55:36 - INFO - __main__ - Step 19015: {'lr': 0.00048387226061447633, 'samples': 3650880, 'steps': 19014, 'loss/train': 1.072666049003601} -11/06/2021 23:55:37 - INFO - __main__ - Step 19016: {'lr': 0.0004838703853934179, 'samples': 3651072, 'steps': 19015, 'loss/train': 1.7657874822616577} -11/06/2021 23:55:38 - INFO - __main__ - Step 19017: {'lr': 0.0004838685100669811, 'samples': 3651264, 'steps': 19016, 'loss/train': 1.2980928421020508} -11/06/2021 23:55:38 - INFO - __main__ - Step 19018: {'lr': 0.0004838666346351667, 'samples': 3651456, 'steps': 19017, 'loss/train': 1.271425724029541} -11/06/2021 23:55:38 - INFO - __main__ - Step 19019: {'lr': 0.0004838647590979757, 'samples': 3651648, 'steps': 19018, 'loss/train': 1.669057011604309} -11/06/2021 23:55:39 - INFO - __main__ - Step 19020: {'lr': 0.00048386288345540876, 'samples': 3651840, 'steps': 19019, 'loss/train': 1.4595625400543213} -11/06/2021 23:55:39 - INFO - __main__ - Step 19021: {'lr': 0.00048386100770746686, 'samples': 3652032, 'steps': 19020, 'loss/train': 1.5734845399856567} -11/06/2021 23:55:40 - INFO - __main__ - Step 19022: {'lr': 0.00048385913185415076, 'samples': 3652224, 'steps': 19021, 'loss/train': 1.6069128513336182} -11/06/2021 23:55:40 - INFO - __main__ - Step 19023: {'lr': 0.00048385725589546137, 'samples': 3652416, 'steps': 19022, 'loss/train': 1.7868753671646118} -11/06/2021 23:55:41 - INFO - __main__ - Step 19024: {'lr': 0.0004838553798313995, 'samples': 3652608, 'steps': 19023, 'loss/train': 1.7515647411346436} -11/06/2021 23:55:41 - INFO - __main__ - Step 19025: {'lr': 0.000483853503661966, 'samples': 3652800, 'steps': 19024, 'loss/train': 1.6738646030426025} -11/06/2021 23:55:42 - INFO - __main__ - Step 19026: {'lr': 0.00048385162738716174, 'samples': 3652992, 'steps': 19025, 'loss/train': 1.5762358903884888} -11/06/2021 23:55:42 - INFO - __main__ - Step 19027: {'lr': 0.00048384975100698756, 'samples': 3653184, 'steps': 19026, 'loss/train': 1.628257155418396} -11/06/2021 23:55:43 - INFO - __main__ - Step 19028: {'lr': 0.0004838478745214443, 'samples': 3653376, 'steps': 19027, 'loss/train': 1.753998041152954} -11/06/2021 23:55:43 - INFO - __main__ - Step 19029: {'lr': 0.00048384599793053275, 'samples': 3653568, 'steps': 19028, 'loss/train': 1.5790235996246338} -11/06/2021 23:55:44 - INFO - __main__ - Step 19030: {'lr': 0.0004838441212342538, 'samples': 3653760, 'steps': 19029, 'loss/train': 1.3828831911087036} -11/06/2021 23:55:44 - INFO - __main__ - Step 19031: {'lr': 0.0004838422444326084, 'samples': 3653952, 'steps': 19030, 'loss/train': 1.9452617168426514} -11/06/2021 23:55:45 - INFO - __main__ - Step 19032: {'lr': 0.0004838403675255971, 'samples': 3654144, 'steps': 19031, 'loss/train': 1.5351001024246216} -11/06/2021 23:55:45 - INFO - __main__ - Step 19033: {'lr': 0.0004838384905132211, 'samples': 3654336, 'steps': 19032, 'loss/train': 1.7516456842422485} -11/06/2021 23:55:46 - INFO - __main__ - Step 19034: {'lr': 0.000483836613395481, 'samples': 3654528, 'steps': 19033, 'loss/train': 0.5482653379440308} -11/06/2021 23:55:46 - INFO - __main__ - Step 19035: {'lr': 0.0004838347361723778, 'samples': 3654720, 'steps': 19034, 'loss/train': 1.3136703968048096} -11/06/2021 23:55:46 - INFO - __main__ - Step 19036: {'lr': 0.0004838328588439123, 'samples': 3654912, 'steps': 19035, 'loss/train': 1.8250452280044556} -11/06/2021 23:55:47 - INFO - __main__ - Step 19037: {'lr': 0.0004838309814100852, 'samples': 3655104, 'steps': 19036, 'loss/train': 1.3839877843856812} -11/06/2021 23:55:48 - INFO - __main__ - Step 19038: {'lr': 0.0004838291038708975, 'samples': 3655296, 'steps': 19037, 'loss/train': 1.6864336729049683} -11/06/2021 23:55:48 - INFO - __main__ - Step 19039: {'lr': 0.00048382722622635014, 'samples': 3655488, 'steps': 19038, 'loss/train': 1.4272637367248535} -11/06/2021 23:55:48 - INFO - __main__ - Step 19040: {'lr': 0.0004838253484764437, 'samples': 3655680, 'steps': 19039, 'loss/train': 1.7983784675598145} -11/06/2021 23:55:49 - INFO - __main__ - Step 19041: {'lr': 0.0004838234706211792, 'samples': 3655872, 'steps': 19040, 'loss/train': 1.689130187034607} -11/06/2021 23:55:50 - INFO - __main__ - Step 19042: {'lr': 0.00048382159266055746, 'samples': 3656064, 'steps': 19041, 'loss/train': 1.1757745742797852} -11/06/2021 23:55:50 - INFO - __main__ - Step 19043: {'lr': 0.0004838197145945793, 'samples': 3656256, 'steps': 19042, 'loss/train': 1.7386882305145264} -11/06/2021 23:55:51 - INFO - __main__ - Step 19044: {'lr': 0.0004838178364232456, 'samples': 3656448, 'steps': 19043, 'loss/train': 1.588568091392517} -11/06/2021 23:55:51 - INFO - __main__ - Step 19045: {'lr': 0.00048381595814655723, 'samples': 3656640, 'steps': 19044, 'loss/train': 1.907985806465149} -11/06/2021 23:55:51 - INFO - __main__ - Step 19046: {'lr': 0.000483814079764515, 'samples': 3656832, 'steps': 19045, 'loss/train': 1.874314308166504} -11/06/2021 23:55:52 - INFO - __main__ - Step 19047: {'lr': 0.00048381220127711967, 'samples': 3657024, 'steps': 19046, 'loss/train': 1.4793670177459717} -11/06/2021 23:55:53 - INFO - __main__ - Step 19048: {'lr': 0.0004838103226843722, 'samples': 3657216, 'steps': 19047, 'loss/train': 1.9645042419433594} -11/06/2021 23:55:53 - INFO - __main__ - Step 19049: {'lr': 0.00048380844398627343, 'samples': 3657408, 'steps': 19048, 'loss/train': 1.7406543493270874} -11/06/2021 23:55:53 - INFO - __main__ - Step 19050: {'lr': 0.0004838065651828242, 'samples': 3657600, 'steps': 19049, 'loss/train': 1.7106494903564453} -11/06/2021 23:55:54 - INFO - __main__ - Step 19051: {'lr': 0.0004838046862740253, 'samples': 3657792, 'steps': 19050, 'loss/train': 1.5313799381256104} -11/06/2021 23:55:55 - INFO - __main__ - Step 19052: {'lr': 0.0004838028072598777, 'samples': 3657984, 'steps': 19051, 'loss/train': 1.718366265296936} -11/06/2021 23:55:55 - INFO - __main__ - Step 19053: {'lr': 0.00048380092814038204, 'samples': 3658176, 'steps': 19052, 'loss/train': 2.046135425567627} -11/06/2021 23:55:55 - INFO - __main__ - Step 19054: {'lr': 0.0004837990489155394, 'samples': 3658368, 'steps': 19053, 'loss/train': 1.7225055694580078} -11/06/2021 23:55:56 - INFO - __main__ - Step 19055: {'lr': 0.00048379716958535043, 'samples': 3658560, 'steps': 19054, 'loss/train': 1.7493064403533936} -11/06/2021 23:55:56 - INFO - __main__ - Step 19056: {'lr': 0.00048379529014981604, 'samples': 3658752, 'steps': 19055, 'loss/train': 1.859459638595581} -11/06/2021 23:55:57 - INFO - __main__ - Step 19057: {'lr': 0.0004837934106089372, 'samples': 3658944, 'steps': 19056, 'loss/train': 0.9592066407203674} -11/06/2021 23:55:58 - INFO - __main__ - Step 19058: {'lr': 0.0004837915309627146, 'samples': 3659136, 'steps': 19057, 'loss/train': 1.9939336776733398} -11/06/2021 23:55:58 - INFO - __main__ - Step 19059: {'lr': 0.00048378965121114917, 'samples': 3659328, 'steps': 19058, 'loss/train': 1.3354649543762207} -11/06/2021 23:55:58 - INFO - __main__ - Step 19060: {'lr': 0.00048378777135424166, 'samples': 3659520, 'steps': 19059, 'loss/train': 1.3405288457870483} -11/06/2021 23:55:59 - INFO - __main__ - Step 19061: {'lr': 0.0004837858913919931, 'samples': 3659712, 'steps': 19060, 'loss/train': 1.7382433414459229} -11/06/2021 23:56:00 - INFO - __main__ - Step 19062: {'lr': 0.0004837840113244042, 'samples': 3659904, 'steps': 19061, 'loss/train': 1.5361404418945312} -11/06/2021 23:56:00 - INFO - __main__ - Step 19063: {'lr': 0.00048378213115147573, 'samples': 3660096, 'steps': 19062, 'loss/train': 0.8109406232833862} -11/06/2021 23:56:00 - INFO - __main__ - Step 19064: {'lr': 0.00048378025087320877, 'samples': 3660288, 'steps': 19063, 'loss/train': 1.951269507408142} -11/06/2021 23:56:01 - INFO - __main__ - Step 19065: {'lr': 0.0004837783704896039, 'samples': 3660480, 'steps': 19064, 'loss/train': 1.256687879562378} -11/06/2021 23:56:01 - INFO - __main__ - Step 19066: {'lr': 0.0004837764900006623, 'samples': 3660672, 'steps': 19065, 'loss/train': 1.4727357625961304} -11/06/2021 23:56:01 - INFO - __main__ - Step 19067: {'lr': 0.0004837746094063844, 'samples': 3660864, 'steps': 19066, 'loss/train': 1.9289908409118652} -11/06/2021 23:56:02 - INFO - __main__ - Step 19068: {'lr': 0.00048377272870677135, 'samples': 3661056, 'steps': 19067, 'loss/train': 1.5988587141036987} -11/06/2021 23:56:03 - INFO - __main__ - Step 19069: {'lr': 0.000483770847901824, 'samples': 3661248, 'steps': 19068, 'loss/train': 1.1608555316925049} -11/06/2021 23:56:03 - INFO - __main__ - Step 19070: {'lr': 0.000483768966991543, 'samples': 3661440, 'steps': 19069, 'loss/train': 1.5548107624053955} -11/06/2021 23:56:03 - INFO - __main__ - Step 19071: {'lr': 0.0004837670859759294, 'samples': 3661632, 'steps': 19070, 'loss/train': 1.667305827140808} -11/06/2021 23:56:04 - INFO - __main__ - Step 19072: {'lr': 0.0004837652048549839, 'samples': 3661824, 'steps': 19071, 'loss/train': 1.9622819423675537} -11/06/2021 23:56:05 - INFO - __main__ - Step 19073: {'lr': 0.00048376332362870745, 'samples': 3662016, 'steps': 19072, 'loss/train': 1.4648205041885376} -11/06/2021 23:56:05 - INFO - __main__ - Step 19074: {'lr': 0.00048376144229710083, 'samples': 3662208, 'steps': 19073, 'loss/train': 1.6623486280441284} -11/06/2021 23:56:06 - INFO - __main__ - Step 19075: {'lr': 0.00048375956086016495, 'samples': 3662400, 'steps': 19074, 'loss/train': 1.842500925064087} -11/06/2021 23:56:06 - INFO - __main__ - Step 19076: {'lr': 0.0004837576793179005, 'samples': 3662592, 'steps': 19075, 'loss/train': 0.8432311415672302} -11/06/2021 23:56:06 - INFO - __main__ - Step 19077: {'lr': 0.00048375579767030854, 'samples': 3662784, 'steps': 19076, 'loss/train': 1.2110167741775513} -11/06/2021 23:56:07 - INFO - __main__ - Step 19078: {'lr': 0.0004837539159173898, 'samples': 3662976, 'steps': 19077, 'loss/train': 1.565323829650879} -11/06/2021 23:56:08 - INFO - __main__ - Step 19079: {'lr': 0.00048375203405914515, 'samples': 3663168, 'steps': 19078, 'loss/train': 1.4068197011947632} -11/06/2021 23:56:08 - INFO - __main__ - Step 19080: {'lr': 0.00048375015209557547, 'samples': 3663360, 'steps': 19079, 'loss/train': 1.9403846263885498} -11/06/2021 23:56:08 - INFO - __main__ - Step 19081: {'lr': 0.00048374827002668156, 'samples': 3663552, 'steps': 19080, 'loss/train': 1.3041592836380005} -11/06/2021 23:56:09 - INFO - __main__ - Step 19082: {'lr': 0.0004837463878524643, 'samples': 3663744, 'steps': 19081, 'loss/train': 2.0662670135498047} -11/06/2021 23:56:10 - INFO - __main__ - Step 19083: {'lr': 0.0004837445055729245, 'samples': 3663936, 'steps': 19082, 'loss/train': 2.4334311485290527} -11/06/2021 23:56:10 - INFO - __main__ - Step 19084: {'lr': 0.00048374262318806306, 'samples': 3664128, 'steps': 19083, 'loss/train': 1.4202038049697876} -11/06/2021 23:56:10 - INFO - __main__ - Step 19085: {'lr': 0.00048374074069788077, 'samples': 3664320, 'steps': 19084, 'loss/train': 0.9480411410331726} -11/06/2021 23:56:11 - INFO - __main__ - Step 19086: {'lr': 0.0004837388581023785, 'samples': 3664512, 'steps': 19085, 'loss/train': 0.9188286662101746} -11/06/2021 23:56:11 - INFO - __main__ - Step 19087: {'lr': 0.0004837369754015571, 'samples': 3664704, 'steps': 19086, 'loss/train': 1.6863188743591309} -11/06/2021 23:56:12 - INFO - __main__ - Step 19088: {'lr': 0.0004837350925954175, 'samples': 3664896, 'steps': 19087, 'loss/train': 1.5236670970916748} -11/06/2021 23:56:12 - INFO - __main__ - Step 19089: {'lr': 0.00048373320968396043, 'samples': 3665088, 'steps': 19088, 'loss/train': 1.9557360410690308} -11/06/2021 23:56:13 - INFO - __main__ - Step 19090: {'lr': 0.0004837313266671868, 'samples': 3665280, 'steps': 19089, 'loss/train': 1.2220089435577393} -11/06/2021 23:56:13 - INFO - __main__ - Step 19091: {'lr': 0.0004837294435450974, 'samples': 3665472, 'steps': 19090, 'loss/train': 1.4970214366912842} -11/06/2021 23:56:13 - INFO - __main__ - Step 19092: {'lr': 0.00048372756031769316, 'samples': 3665664, 'steps': 19091, 'loss/train': 1.794909119606018} -11/06/2021 23:56:14 - INFO - __main__ - Step 19093: {'lr': 0.00048372567698497487, 'samples': 3665856, 'steps': 19092, 'loss/train': 1.7139893770217896} -11/06/2021 23:56:15 - INFO - __main__ - Step 19094: {'lr': 0.0004837237935469434, 'samples': 3666048, 'steps': 19093, 'loss/train': 1.5381810665130615} -11/06/2021 23:56:15 - INFO - __main__ - Step 19095: {'lr': 0.00048372191000359955, 'samples': 3666240, 'steps': 19094, 'loss/train': 1.4186919927597046} -11/06/2021 23:56:15 - INFO - __main__ - Step 19096: {'lr': 0.00048372002635494425, 'samples': 3666432, 'steps': 19095, 'loss/train': 1.651479721069336} -11/06/2021 23:56:16 - INFO - __main__ - Step 19097: {'lr': 0.00048371814260097834, 'samples': 3666624, 'steps': 19096, 'loss/train': 1.3919228315353394} -11/06/2021 23:56:16 - INFO - __main__ - Step 19098: {'lr': 0.0004837162587417027, 'samples': 3666816, 'steps': 19097, 'loss/train': 2.0199766159057617} -11/06/2021 23:56:17 - INFO - __main__ - Step 19099: {'lr': 0.000483714374777118, 'samples': 3667008, 'steps': 19098, 'loss/train': 1.6757065057754517} -11/06/2021 23:56:18 - INFO - __main__ - Step 19100: {'lr': 0.00048371249070722525, 'samples': 3667200, 'steps': 19099, 'loss/train': 1.7928451299667358} -11/06/2021 23:56:18 - INFO - __main__ - Step 19101: {'lr': 0.0004837106065320253, 'samples': 3667392, 'steps': 19100, 'loss/train': 1.8815168142318726} -11/06/2021 23:56:18 - INFO - __main__ - Step 19102: {'lr': 0.00048370872225151886, 'samples': 3667584, 'steps': 19101, 'loss/train': 1.4708551168441772} -11/06/2021 23:56:19 - INFO - __main__ - Step 19103: {'lr': 0.0004837068378657069, 'samples': 3667776, 'steps': 19102, 'loss/train': 1.1429966688156128} -11/06/2021 23:56:20 - INFO - __main__ - Step 19104: {'lr': 0.0004837049533745903, 'samples': 3667968, 'steps': 19103, 'loss/train': 1.8435603380203247} -11/06/2021 23:56:20 - INFO - __main__ - Step 19105: {'lr': 0.00048370306877816983, 'samples': 3668160, 'steps': 19104, 'loss/train': 1.6147713661193848} -11/06/2021 23:56:20 - INFO - __main__ - Step 19106: {'lr': 0.00048370118407644637, 'samples': 3668352, 'steps': 19105, 'loss/train': 1.210199236869812} -11/06/2021 23:56:21 - INFO - __main__ - Step 19107: {'lr': 0.0004836992992694208, 'samples': 3668544, 'steps': 19106, 'loss/train': 1.3318425416946411} -11/06/2021 23:56:21 - INFO - __main__ - Step 19108: {'lr': 0.00048369741435709383, 'samples': 3668736, 'steps': 19107, 'loss/train': 1.3522213697433472} -11/06/2021 23:56:22 - INFO - __main__ - Step 19109: {'lr': 0.0004836955293394665, 'samples': 3668928, 'steps': 19108, 'loss/train': 1.4460760354995728} -11/06/2021 23:56:22 - INFO - __main__ - Step 19110: {'lr': 0.00048369364421653953, 'samples': 3669120, 'steps': 19109, 'loss/train': 2.3319251537323} -11/06/2021 23:56:23 - INFO - __main__ - Step 19111: {'lr': 0.00048369175898831384, 'samples': 3669312, 'steps': 19110, 'loss/train': 1.8790931701660156} -11/06/2021 23:56:23 - INFO - __main__ - Step 19112: {'lr': 0.0004836898736547902, 'samples': 3669504, 'steps': 19111, 'loss/train': 1.8408292531967163} -11/06/2021 23:56:24 - INFO - __main__ - Step 19113: {'lr': 0.0004836879882159696, 'samples': 3669696, 'steps': 19112, 'loss/train': 1.7793866395950317} -11/06/2021 23:56:24 - INFO - __main__ - Step 19114: {'lr': 0.0004836861026718527, 'samples': 3669888, 'steps': 19113, 'loss/train': 1.2182018756866455} -11/06/2021 23:56:25 - INFO - __main__ - Step 19115: {'lr': 0.00048368421702244045, 'samples': 3670080, 'steps': 19114, 'loss/train': 1.8022509813308716} -11/06/2021 23:56:25 - INFO - __main__ - Step 19116: {'lr': 0.00048368233126773377, 'samples': 3670272, 'steps': 19115, 'loss/train': 1.5703195333480835} -11/06/2021 23:56:26 - INFO - __main__ - Step 19117: {'lr': 0.0004836804454077334, 'samples': 3670464, 'steps': 19116, 'loss/train': 1.6894001960754395} -11/06/2021 23:56:26 - INFO - __main__ - Step 19118: {'lr': 0.0004836785594424402, 'samples': 3670656, 'steps': 19117, 'loss/train': 1.8371540307998657} -11/06/2021 23:56:27 - INFO - __main__ - Step 19119: {'lr': 0.0004836766733718551, 'samples': 3670848, 'steps': 19118, 'loss/train': 1.038614273071289} -11/06/2021 23:56:27 - INFO - __main__ - Step 19120: {'lr': 0.0004836747871959789, 'samples': 3671040, 'steps': 19119, 'loss/train': 1.801282286643982} -11/06/2021 23:56:28 - INFO - __main__ - Step 19121: {'lr': 0.0004836729009148124, 'samples': 3671232, 'steps': 19120, 'loss/train': 1.3906354904174805} -11/06/2021 23:56:28 - INFO - __main__ - Step 19122: {'lr': 0.0004836710145283565, 'samples': 3671424, 'steps': 19121, 'loss/train': 1.6386430263519287} -11/06/2021 23:56:28 - INFO - __main__ - Step 19123: {'lr': 0.0004836691280366121, 'samples': 3671616, 'steps': 19122, 'loss/train': 1.5289560556411743} -11/06/2021 23:56:29 - INFO - __main__ - Step 19124: {'lr': 0.00048366724143958, 'samples': 3671808, 'steps': 19123, 'loss/train': 1.3992829322814941} -11/06/2021 23:56:30 - INFO - __main__ - Step 19125: {'lr': 0.0004836653547372609, 'samples': 3672000, 'steps': 19124, 'loss/train': 1.7073944807052612} -11/06/2021 23:56:30 - INFO - __main__ - Step 19126: {'lr': 0.00048366346792965597, 'samples': 3672192, 'steps': 19125, 'loss/train': 1.8707301616668701} -11/06/2021 23:56:30 - INFO - __main__ - Step 19127: {'lr': 0.0004836615810167658, 'samples': 3672384, 'steps': 19126, 'loss/train': 1.809815764427185} -11/06/2021 23:56:31 - INFO - __main__ - Step 19128: {'lr': 0.00048365969399859134, 'samples': 3672576, 'steps': 19127, 'loss/train': 0.8023385405540466} -11/06/2021 23:56:31 - INFO - __main__ - Step 19129: {'lr': 0.00048365780687513346, 'samples': 3672768, 'steps': 19128, 'loss/train': 0.9183880686759949} -11/06/2021 23:56:32 - INFO - __main__ - Step 19130: {'lr': 0.00048365591964639294, 'samples': 3672960, 'steps': 19129, 'loss/train': 1.3006956577301025} -11/06/2021 23:56:33 - INFO - __main__ - Step 19131: {'lr': 0.0004836540323123707, 'samples': 3673152, 'steps': 19130, 'loss/train': 1.5788049697875977} -11/06/2021 23:56:33 - INFO - __main__ - Step 19132: {'lr': 0.00048365214487306753, 'samples': 3673344, 'steps': 19131, 'loss/train': 2.2502143383026123} -11/06/2021 23:56:33 - INFO - __main__ - Step 19133: {'lr': 0.00048365025732848433, 'samples': 3673536, 'steps': 19132, 'loss/train': 1.1418144702911377} -11/06/2021 23:56:34 - INFO - __main__ - Step 19134: {'lr': 0.0004836483696786219, 'samples': 3673728, 'steps': 19133, 'loss/train': 0.19124336540699005} -11/06/2021 23:56:35 - INFO - __main__ - Step 19135: {'lr': 0.00048364648192348117, 'samples': 3673920, 'steps': 19134, 'loss/train': 1.739778757095337} -11/06/2021 23:56:35 - INFO - __main__ - Step 19136: {'lr': 0.0004836445940630629, 'samples': 3674112, 'steps': 19135, 'loss/train': 1.533406138420105} -11/06/2021 23:56:36 - INFO - __main__ - Step 19137: {'lr': 0.0004836427060973679, 'samples': 3674304, 'steps': 19136, 'loss/train': 1.5858798027038574} -11/06/2021 23:56:36 - INFO - __main__ - Step 19138: {'lr': 0.00048364081802639724, 'samples': 3674496, 'steps': 19137, 'loss/train': 1.5668922662734985} -11/06/2021 23:56:36 - INFO - __main__ - Step 19139: {'lr': 0.00048363892985015157, 'samples': 3674688, 'steps': 19138, 'loss/train': 1.4601547718048096} -11/06/2021 23:56:37 - INFO - __main__ - Step 19140: {'lr': 0.00048363704156863187, 'samples': 3674880, 'steps': 19139, 'loss/train': 1.4852017164230347} -11/06/2021 23:56:38 - INFO - __main__ - Step 19141: {'lr': 0.0004836351531818388, 'samples': 3675072, 'steps': 19140, 'loss/train': 1.2616417407989502} -11/06/2021 23:56:38 - INFO - __main__ - Step 19142: {'lr': 0.00048363326468977343, 'samples': 3675264, 'steps': 19141, 'loss/train': 2.229715585708618} -11/06/2021 23:56:38 - INFO - __main__ - Step 19143: {'lr': 0.00048363137609243654, 'samples': 3675456, 'steps': 19142, 'loss/train': 2.004793643951416} -11/06/2021 23:56:39 - INFO - __main__ - Step 19144: {'lr': 0.0004836294873898289, 'samples': 3675648, 'steps': 19143, 'loss/train': 1.3080763816833496} -11/06/2021 23:56:40 - INFO - __main__ - Step 19145: {'lr': 0.00048362759858195146, 'samples': 3675840, 'steps': 19144, 'loss/train': 1.3160992860794067} -11/06/2021 23:56:41 - INFO - __main__ - Step 19146: {'lr': 0.0004836257096688049, 'samples': 3676032, 'steps': 19145, 'loss/train': 1.665747880935669} -11/06/2021 23:56:41 - INFO - __main__ - Step 19147: {'lr': 0.00048362382065039034, 'samples': 3676224, 'steps': 19146, 'loss/train': 1.2606112957000732} -11/06/2021 23:56:41 - INFO - __main__ - Step 19148: {'lr': 0.00048362193152670847, 'samples': 3676416, 'steps': 19147, 'loss/train': 1.4134140014648438} -11/06/2021 23:56:42 - INFO - __main__ - Step 19149: {'lr': 0.0004836200422977601, 'samples': 3676608, 'steps': 19148, 'loss/train': 2.2859280109405518} -11/06/2021 23:56:42 - INFO - __main__ - Step 19150: {'lr': 0.00048361815296354624, 'samples': 3676800, 'steps': 19149, 'loss/train': 1.893393874168396} -11/06/2021 23:56:43 - INFO - __main__ - Step 19151: {'lr': 0.00048361626352406756, 'samples': 3676992, 'steps': 19150, 'loss/train': 1.5060352087020874} -11/06/2021 23:56:43 - INFO - __main__ - Step 19152: {'lr': 0.00048361437397932504, 'samples': 3677184, 'steps': 19151, 'loss/train': 2.0820343494415283} -11/06/2021 23:56:44 - INFO - __main__ - Step 19153: {'lr': 0.0004836124843293195, 'samples': 3677376, 'steps': 19152, 'loss/train': 1.5182925462722778} -11/06/2021 23:56:44 - INFO - __main__ - Step 19154: {'lr': 0.00048361059457405176, 'samples': 3677568, 'steps': 19153, 'loss/train': 1.160764217376709} -11/06/2021 23:56:45 - INFO - __main__ - Step 19155: {'lr': 0.0004836087047135227, 'samples': 3677760, 'steps': 19154, 'loss/train': 1.0252954959869385} -11/06/2021 23:56:46 - INFO - __main__ - Step 19156: {'lr': 0.0004836068147477331, 'samples': 3677952, 'steps': 19155, 'loss/train': 1.408125638961792} -11/06/2021 23:56:46 - INFO - __main__ - Step 19157: {'lr': 0.0004836049246766839, 'samples': 3678144, 'steps': 19156, 'loss/train': 1.8385653495788574} -11/06/2021 23:56:47 - INFO - __main__ - Step 19158: {'lr': 0.000483603034500376, 'samples': 3678336, 'steps': 19157, 'loss/train': 2.144331216812134} -11/06/2021 23:56:47 - INFO - __main__ - Step 19159: {'lr': 0.0004836011442188101, 'samples': 3678528, 'steps': 19158, 'loss/train': 2.2374393939971924} -11/06/2021 23:56:47 - INFO - __main__ - Step 19160: {'lr': 0.00048359925383198714, 'samples': 3678720, 'steps': 19159, 'loss/train': 1.9010136127471924} -11/06/2021 23:56:48 - INFO - __main__ - Step 19161: {'lr': 0.000483597363339908, 'samples': 3678912, 'steps': 19160, 'loss/train': 2.1621627807617188} -11/06/2021 23:56:49 - INFO - __main__ - Step 19162: {'lr': 0.0004835954727425734, 'samples': 3679104, 'steps': 19161, 'loss/train': 0.9236301779747009} -11/06/2021 23:56:49 - INFO - __main__ - Step 19163: {'lr': 0.0004835935820399844, 'samples': 3679296, 'steps': 19162, 'loss/train': 1.932969331741333} -11/06/2021 23:56:49 - INFO - __main__ - Step 19164: {'lr': 0.0004835916912321417, 'samples': 3679488, 'steps': 19163, 'loss/train': 1.723209261894226} -11/06/2021 23:56:50 - INFO - __main__ - Step 19165: {'lr': 0.0004835898003190462, 'samples': 3679680, 'steps': 19164, 'loss/train': 1.830366611480713} -11/06/2021 23:56:50 - INFO - __main__ - Step 19166: {'lr': 0.00048358790930069876, 'samples': 3679872, 'steps': 19165, 'loss/train': 1.4188361167907715} -11/06/2021 23:56:51 - INFO - __main__ - Step 19167: {'lr': 0.0004835860181771001, 'samples': 3680064, 'steps': 19166, 'loss/train': 1.7501378059387207} -11/06/2021 23:56:51 - INFO - __main__ - Step 19168: {'lr': 0.0004835841269482513, 'samples': 3680256, 'steps': 19167, 'loss/train': 1.277912974357605} -11/06/2021 23:56:52 - INFO - __main__ - Step 19169: {'lr': 0.00048358223561415306, 'samples': 3680448, 'steps': 19168, 'loss/train': 1.2338846921920776} -11/06/2021 23:56:52 - INFO - __main__ - Step 19170: {'lr': 0.0004835803441748062, 'samples': 3680640, 'steps': 19169, 'loss/train': 1.7084600925445557} -11/06/2021 23:56:53 - INFO - __main__ - Step 19171: {'lr': 0.0004835784526302117, 'samples': 3680832, 'steps': 19170, 'loss/train': 1.6762709617614746} -11/06/2021 23:56:54 - INFO - __main__ - Step 19172: {'lr': 0.0004835765609803704, 'samples': 3681024, 'steps': 19171, 'loss/train': 1.5952175855636597} -11/06/2021 23:56:54 - INFO - __main__ - Step 19173: {'lr': 0.00048357466922528306, 'samples': 3681216, 'steps': 19172, 'loss/train': 1.9963054656982422} -11/06/2021 23:56:54 - INFO - __main__ - Step 19174: {'lr': 0.00048357277736495055, 'samples': 3681408, 'steps': 19173, 'loss/train': 1.8751789331436157} -11/06/2021 23:56:55 - INFO - __main__ - Step 19175: {'lr': 0.0004835708853993738, 'samples': 3681600, 'steps': 19174, 'loss/train': 2.0888760089874268} -11/06/2021 23:56:55 - INFO - __main__ - Step 19176: {'lr': 0.0004835689933285536, 'samples': 3681792, 'steps': 19175, 'loss/train': 1.4569809436798096} -11/06/2021 23:56:55 - INFO - __main__ - Step 19177: {'lr': 0.0004835671011524908, 'samples': 3681984, 'steps': 19176, 'loss/train': 1.6103253364562988} -11/06/2021 23:56:56 - INFO - __main__ - Step 19178: {'lr': 0.0004835652088711863, 'samples': 3682176, 'steps': 19177, 'loss/train': 1.5094871520996094} -11/06/2021 23:56:57 - INFO - __main__ - Step 19179: {'lr': 0.0004835633164846409, 'samples': 3682368, 'steps': 19178, 'loss/train': 0.7678648233413696} -11/06/2021 23:56:57 - INFO - __main__ - Step 19180: {'lr': 0.00048356142399285545, 'samples': 3682560, 'steps': 19179, 'loss/train': 2.044360399246216} -11/06/2021 23:56:57 - INFO - __main__ - Step 19181: {'lr': 0.00048355953139583087, 'samples': 3682752, 'steps': 19180, 'loss/train': 1.4923588037490845} -11/06/2021 23:56:58 - INFO - __main__ - Step 19182: {'lr': 0.00048355763869356794, 'samples': 3682944, 'steps': 19181, 'loss/train': 1.9290509223937988} -11/06/2021 23:56:59 - INFO - __main__ - Step 19183: {'lr': 0.0004835557458860675, 'samples': 3683136, 'steps': 19182, 'loss/train': 1.8096939325332642} -11/06/2021 23:56:59 - INFO - __main__ - Step 19184: {'lr': 0.00048355385297333054, 'samples': 3683328, 'steps': 19183, 'loss/train': 1.6977989673614502} -11/06/2021 23:57:00 - INFO - __main__ - Step 19185: {'lr': 0.0004835519599553578, 'samples': 3683520, 'steps': 19184, 'loss/train': 1.9109872579574585} -11/06/2021 23:57:00 - INFO - __main__ - Step 19186: {'lr': 0.0004835500668321501, 'samples': 3683712, 'steps': 19185, 'loss/train': 1.4003887176513672} -11/06/2021 23:57:00 - INFO - __main__ - Step 19187: {'lr': 0.0004835481736037084, 'samples': 3683904, 'steps': 19186, 'loss/train': 1.6025032997131348} -11/06/2021 23:57:01 - INFO - __main__ - Step 19188: {'lr': 0.0004835462802700334, 'samples': 3684096, 'steps': 19187, 'loss/train': 1.638126015663147} -11/06/2021 23:57:02 - INFO - __main__ - Step 19189: {'lr': 0.00048354438683112614, 'samples': 3684288, 'steps': 19188, 'loss/train': 1.3936848640441895} -11/06/2021 23:57:02 - INFO - __main__ - Step 19190: {'lr': 0.00048354249328698743, 'samples': 3684480, 'steps': 19189, 'loss/train': 1.5004618167877197} -11/06/2021 23:57:02 - INFO - __main__ - Step 19191: {'lr': 0.000483540599637618, 'samples': 3684672, 'steps': 19190, 'loss/train': 1.6228737831115723} -11/06/2021 23:57:03 - INFO - __main__ - Step 19192: {'lr': 0.00048353870588301875, 'samples': 3684864, 'steps': 19191, 'loss/train': 1.393079400062561} -11/06/2021 23:57:04 - INFO - __main__ - Step 19193: {'lr': 0.00048353681202319056, 'samples': 3685056, 'steps': 19192, 'loss/train': 1.1348565816879272} -11/06/2021 23:57:04 - INFO - __main__ - Step 19194: {'lr': 0.0004835349180581343, 'samples': 3685248, 'steps': 19193, 'loss/train': 1.383333444595337} -11/06/2021 23:57:05 - INFO - __main__ - Step 19195: {'lr': 0.0004835330239878509, 'samples': 3685440, 'steps': 19194, 'loss/train': 1.5683242082595825} -11/06/2021 23:57:05 - INFO - __main__ - Step 19196: {'lr': 0.00048353112981234104, 'samples': 3685632, 'steps': 19195, 'loss/train': 1.6847158670425415} -11/06/2021 23:57:05 - INFO - __main__ - Step 19197: {'lr': 0.0004835292355316057, 'samples': 3685824, 'steps': 19196, 'loss/train': 1.350108027458191} -11/06/2021 23:57:06 - INFO - __main__ - Step 19198: {'lr': 0.0004835273411456456, 'samples': 3686016, 'steps': 19197, 'loss/train': 1.6436011791229248} -11/06/2021 23:57:07 - INFO - __main__ - Step 19199: {'lr': 0.00048352544665446174, 'samples': 3686208, 'steps': 19198, 'loss/train': 1.8072590827941895} -11/06/2021 23:57:07 - INFO - __main__ - Step 19200: {'lr': 0.000483523552058055, 'samples': 3686400, 'steps': 19199, 'loss/train': 1.4258383512496948} -11/06/2021 23:57:07 - INFO - __main__ - Step 19201: {'lr': 0.00048352165735642607, 'samples': 3686592, 'steps': 19200, 'loss/train': 1.8473409414291382} -11/06/2021 23:57:08 - INFO - __main__ - Step 19202: {'lr': 0.00048351976254957585, 'samples': 3686784, 'steps': 19201, 'loss/train': 1.810278296470642} -11/06/2021 23:57:08 - INFO - __main__ - Step 19203: {'lr': 0.0004835178676375053, 'samples': 3686976, 'steps': 19202, 'loss/train': 1.8077994585037231} -11/06/2021 23:57:09 - INFO - __main__ - Step 19204: {'lr': 0.0004835159726202151, 'samples': 3687168, 'steps': 19203, 'loss/train': 0.6947793364524841} -11/06/2021 23:57:09 - INFO - __main__ - Step 19205: {'lr': 0.0004835140774977063, 'samples': 3687360, 'steps': 19204, 'loss/train': 2.199883222579956} -11/06/2021 23:57:10 - INFO - __main__ - Step 19206: {'lr': 0.0004835121822699796, 'samples': 3687552, 'steps': 19205, 'loss/train': 1.3530951738357544} -11/06/2021 23:57:10 - INFO - __main__ - Step 19207: {'lr': 0.000483510286937036, 'samples': 3687744, 'steps': 19206, 'loss/train': 1.5403071641921997} -11/06/2021 23:57:10 - INFO - __main__ - Step 19208: {'lr': 0.0004835083914988762, 'samples': 3687936, 'steps': 19207, 'loss/train': 1.8505449295043945} -11/06/2021 23:57:11 - INFO - __main__ - Step 19209: {'lr': 0.0004835064959555011, 'samples': 3688128, 'steps': 19208, 'loss/train': 2.985590934753418} -11/06/2021 23:57:12 - INFO - __main__ - Step 19210: {'lr': 0.00048350460030691165, 'samples': 3688320, 'steps': 19209, 'loss/train': 1.5929882526397705} -11/06/2021 23:57:12 - INFO - __main__ - Step 19211: {'lr': 0.00048350270455310864, 'samples': 3688512, 'steps': 19210, 'loss/train': 1.5911760330200195} -11/06/2021 23:57:13 - INFO - __main__ - Step 19212: {'lr': 0.00048350080869409285, 'samples': 3688704, 'steps': 19211, 'loss/train': 1.439744234085083} -11/06/2021 23:57:13 - INFO - __main__ - Step 19213: {'lr': 0.0004834989127298652, 'samples': 3688896, 'steps': 19212, 'loss/train': 2.0591835975646973} -11/06/2021 23:57:14 - INFO - __main__ - Step 19214: {'lr': 0.00048349701666042656, 'samples': 3689088, 'steps': 19213, 'loss/train': 2.5805773735046387} -11/06/2021 23:57:14 - INFO - __main__ - Step 19215: {'lr': 0.00048349512048577784, 'samples': 3689280, 'steps': 19214, 'loss/train': 1.7143360376358032} -11/06/2021 23:57:15 - INFO - __main__ - Step 19216: {'lr': 0.00048349322420591966, 'samples': 3689472, 'steps': 19215, 'loss/train': 1.678261637687683} -11/06/2021 23:57:15 - INFO - __main__ - Step 19217: {'lr': 0.00048349132782085316, 'samples': 3689664, 'steps': 19216, 'loss/train': 2.175565004348755} -11/06/2021 23:57:15 - INFO - __main__ - Step 19218: {'lr': 0.00048348943133057903, 'samples': 3689856, 'steps': 19217, 'loss/train': 1.2457647323608398} -11/06/2021 23:57:17 - INFO - __main__ - Step 19219: {'lr': 0.0004834875347350982, 'samples': 3690048, 'steps': 19218, 'loss/train': 2.0584850311279297} -11/06/2021 23:57:17 - INFO - __main__ - Step 19220: {'lr': 0.00048348563803441146, 'samples': 3690240, 'steps': 19219, 'loss/train': 1.630115270614624} -11/06/2021 23:57:17 - INFO - __main__ - Step 19221: {'lr': 0.0004834837412285197, 'samples': 3690432, 'steps': 19220, 'loss/train': 2.0529630184173584} -11/06/2021 23:57:18 - INFO - __main__ - Step 19222: {'lr': 0.00048348184431742377, 'samples': 3690624, 'steps': 19221, 'loss/train': 1.4660913944244385} -11/06/2021 23:57:18 - INFO - __main__ - Step 19223: {'lr': 0.00048347994730112457, 'samples': 3690816, 'steps': 19222, 'loss/train': 1.7038263082504272} -11/06/2021 23:57:19 - INFO - __main__ - Step 19224: {'lr': 0.00048347805017962274, 'samples': 3691008, 'steps': 19223, 'loss/train': 1.5961427688598633} -11/06/2021 23:57:19 - INFO - __main__ - Step 19225: {'lr': 0.00048347615295291947, 'samples': 3691200, 'steps': 19224, 'loss/train': 1.2532870769500732} -11/06/2021 23:57:20 - INFO - __main__ - Step 19226: {'lr': 0.0004834742556210154, 'samples': 3691392, 'steps': 19225, 'loss/train': 1.9617180824279785} -11/06/2021 23:57:20 - INFO - __main__ - Step 19227: {'lr': 0.00048347235818391144, 'samples': 3691584, 'steps': 19226, 'loss/train': 1.223244071006775} -11/06/2021 23:57:20 - INFO - __main__ - Step 19228: {'lr': 0.0004834704606416084, 'samples': 3691776, 'steps': 19227, 'loss/train': 1.8296163082122803} -11/06/2021 23:57:21 - INFO - __main__ - Step 19229: {'lr': 0.00048346856299410725, 'samples': 3691968, 'steps': 19228, 'loss/train': 1.7569893598556519} -11/06/2021 23:57:22 - INFO - __main__ - Step 19230: {'lr': 0.0004834666652414087, 'samples': 3692160, 'steps': 19229, 'loss/train': 1.1428344249725342} -11/06/2021 23:57:22 - INFO - __main__ - Step 19231: {'lr': 0.0004834647673835137, 'samples': 3692352, 'steps': 19230, 'loss/train': 1.7404580116271973} -11/06/2021 23:57:23 - INFO - __main__ - Step 19232: {'lr': 0.00048346286942042307, 'samples': 3692544, 'steps': 19231, 'loss/train': 1.6448150873184204} -11/06/2021 23:57:23 - INFO - __main__ - Step 19233: {'lr': 0.0004834609713521377, 'samples': 3692736, 'steps': 19232, 'loss/train': 1.1691974401474} -11/06/2021 23:57:24 - INFO - __main__ - Step 19234: {'lr': 0.0004834590731786584, 'samples': 3692928, 'steps': 19233, 'loss/train': 1.48292076587677} -11/06/2021 23:57:24 - INFO - __main__ - Step 19235: {'lr': 0.000483457174899986, 'samples': 3693120, 'steps': 19234, 'loss/train': 1.780066728591919} -11/06/2021 23:57:25 - INFO - __main__ - Step 19236: {'lr': 0.00048345527651612145, 'samples': 3693312, 'steps': 19235, 'loss/train': 1.37631356716156} -11/06/2021 23:57:25 - INFO - __main__ - Step 19237: {'lr': 0.00048345337802706555, 'samples': 3693504, 'steps': 19236, 'loss/train': 1.759711503982544} -11/06/2021 23:57:25 - INFO - __main__ - Step 19238: {'lr': 0.0004834514794328192, 'samples': 3693696, 'steps': 19237, 'loss/train': 1.649255394935608} -11/06/2021 23:57:26 - INFO - __main__ - Step 19239: {'lr': 0.00048344958073338315, 'samples': 3693888, 'steps': 19238, 'loss/train': 0.8222588896751404} -11/06/2021 23:57:27 - INFO - __main__ - Step 19240: {'lr': 0.00048344768192875833, 'samples': 3694080, 'steps': 19239, 'loss/train': 1.4921916723251343} -11/06/2021 23:57:27 - INFO - __main__ - Step 19241: {'lr': 0.00048344578301894557, 'samples': 3694272, 'steps': 19240, 'loss/train': 1.9483696222305298} -11/06/2021 23:57:27 - INFO - __main__ - Step 19242: {'lr': 0.0004834438840039458, 'samples': 3694464, 'steps': 19241, 'loss/train': 1.5134330987930298} -11/06/2021 23:57:28 - INFO - __main__ - Step 19243: {'lr': 0.0004834419848837598, 'samples': 3694656, 'steps': 19242, 'loss/train': 1.6340835094451904} -11/06/2021 23:57:28 - INFO - __main__ - Step 19244: {'lr': 0.00048344008565838844, 'samples': 3694848, 'steps': 19243, 'loss/train': 1.8357398509979248} -11/06/2021 23:57:29 - INFO - __main__ - Step 19245: {'lr': 0.00048343818632783255, 'samples': 3695040, 'steps': 19244, 'loss/train': 1.5533130168914795} -11/06/2021 23:57:30 - INFO - __main__ - Step 19246: {'lr': 0.00048343628689209305, 'samples': 3695232, 'steps': 19245, 'loss/train': 1.3802316188812256} -11/06/2021 23:57:30 - INFO - __main__ - Step 19247: {'lr': 0.00048343438735117076, 'samples': 3695424, 'steps': 19246, 'loss/train': 1.439875841140747} -11/06/2021 23:57:30 - INFO - __main__ - Step 19248: {'lr': 0.00048343248770506655, 'samples': 3695616, 'steps': 19247, 'loss/train': 2.032688856124878} -11/06/2021 23:57:31 - INFO - __main__ - Step 19249: {'lr': 0.0004834305879537812, 'samples': 3695808, 'steps': 19248, 'loss/train': 2.1166164875030518} -11/06/2021 23:57:31 - INFO - __main__ - Step 19250: {'lr': 0.00048342868809731567, 'samples': 3696000, 'steps': 19249, 'loss/train': 5.924430847167969} -11/06/2021 23:57:32 - INFO - __main__ - Step 19251: {'lr': 0.0004834267881356708, 'samples': 3696192, 'steps': 19250, 'loss/train': 1.91569983959198} -11/06/2021 23:57:32 - INFO - __main__ - Step 19252: {'lr': 0.0004834248880688474, 'samples': 3696384, 'steps': 19251, 'loss/train': 1.692755103111267} -11/06/2021 23:57:33 - INFO - __main__ - Step 19253: {'lr': 0.00048342298789684637, 'samples': 3696576, 'steps': 19252, 'loss/train': 0.9209264516830444} -11/06/2021 23:57:33 - INFO - __main__ - Step 19254: {'lr': 0.0004834210876196685, 'samples': 3696768, 'steps': 19253, 'loss/train': 1.80112886428833} -11/06/2021 23:57:33 - INFO - __main__ - Step 19255: {'lr': 0.0004834191872373147, 'samples': 3696960, 'steps': 19254, 'loss/train': 1.6527858972549438} -11/06/2021 23:57:35 - INFO - __main__ - Step 19256: {'lr': 0.0004834172867497858, 'samples': 3697152, 'steps': 19255, 'loss/train': 1.832580804824829} -11/06/2021 23:57:35 - INFO - __main__ - Step 19257: {'lr': 0.0004834153861570827, 'samples': 3697344, 'steps': 19256, 'loss/train': 1.6807947158813477} -11/06/2021 23:57:36 - INFO - __main__ - Step 19258: {'lr': 0.00048341348545920623, 'samples': 3697536, 'steps': 19257, 'loss/train': 1.3076280355453491} -11/06/2021 23:57:36 - INFO - __main__ - Step 19259: {'lr': 0.0004834115846561572, 'samples': 3697728, 'steps': 19258, 'loss/train': 1.2784446477890015} -11/06/2021 23:57:36 - INFO - __main__ - Step 19260: {'lr': 0.0004834096837479366, 'samples': 3697920, 'steps': 19259, 'loss/train': 1.541551113128662} -11/06/2021 23:57:37 - INFO - __main__ - Step 19261: {'lr': 0.00048340778273454514, 'samples': 3698112, 'steps': 19260, 'loss/train': 1.8904051780700684} -11/06/2021 23:57:37 - INFO - __main__ - Step 19262: {'lr': 0.00048340588161598373, 'samples': 3698304, 'steps': 19261, 'loss/train': 1.777864694595337} -11/06/2021 23:57:38 - INFO - __main__ - Step 19263: {'lr': 0.00048340398039225325, 'samples': 3698496, 'steps': 19262, 'loss/train': 1.7768715620040894} -11/06/2021 23:57:38 - INFO - __main__ - Step 19264: {'lr': 0.0004834020790633545, 'samples': 3698688, 'steps': 19263, 'loss/train': 1.5909192562103271} -11/06/2021 23:57:39 - INFO - __main__ - Step 19265: {'lr': 0.00048340017762928843, 'samples': 3698880, 'steps': 19264, 'loss/train': 1.390834093093872} -11/06/2021 23:57:39 - INFO - __main__ - Step 19266: {'lr': 0.00048339827609005583, 'samples': 3699072, 'steps': 19265, 'loss/train': 1.6098217964172363} -11/06/2021 23:57:40 - INFO - __main__ - Step 19267: {'lr': 0.00048339637444565756, 'samples': 3699264, 'steps': 19266, 'loss/train': 1.617615818977356} -11/06/2021 23:57:41 - INFO - __main__ - Step 19268: {'lr': 0.0004833944726960945, 'samples': 3699456, 'steps': 19267, 'loss/train': 2.376567840576172} -11/06/2021 23:57:41 - INFO - __main__ - Step 19269: {'lr': 0.00048339257084136747, 'samples': 3699648, 'steps': 19268, 'loss/train': 1.5636578798294067} -11/06/2021 23:57:41 - INFO - __main__ - Step 19270: {'lr': 0.0004833906688814774, 'samples': 3699840, 'steps': 19269, 'loss/train': 1.7293047904968262} -11/06/2021 23:57:42 - INFO - __main__ - Step 19271: {'lr': 0.00048338876681642504, 'samples': 3700032, 'steps': 19270, 'loss/train': 2.3842742443084717} -11/06/2021 23:57:42 - INFO - __main__ - Step 19272: {'lr': 0.0004833868646462113, 'samples': 3700224, 'steps': 19271, 'loss/train': 0.9048125147819519} -11/06/2021 23:57:43 - INFO - __main__ - Step 19273: {'lr': 0.00048338496237083705, 'samples': 3700416, 'steps': 19272, 'loss/train': 1.2667889595031738} -11/06/2021 23:57:43 - INFO - __main__ - Step 19274: {'lr': 0.00048338305999030313, 'samples': 3700608, 'steps': 19273, 'loss/train': 1.076546311378479} -11/06/2021 23:57:44 - INFO - __main__ - Step 19275: {'lr': 0.00048338115750461044, 'samples': 3700800, 'steps': 19274, 'loss/train': 0.9132834076881409} -11/06/2021 23:57:44 - INFO - __main__ - Step 19276: {'lr': 0.0004833792549137598, 'samples': 3700992, 'steps': 19275, 'loss/train': 0.9541102051734924} -11/06/2021 23:57:44 - INFO - __main__ - Step 19277: {'lr': 0.00048337735221775204, 'samples': 3701184, 'steps': 19276, 'loss/train': 1.4680448770523071} -11/06/2021 23:57:45 - INFO - __main__ - Step 19278: {'lr': 0.000483375449416588, 'samples': 3701376, 'steps': 19277, 'loss/train': 1.483697533607483} -11/06/2021 23:57:46 - INFO - __main__ - Step 19279: {'lr': 0.0004833735465102687, 'samples': 3701568, 'steps': 19278, 'loss/train': 1.5289688110351562} -11/06/2021 23:57:46 - INFO - __main__ - Step 19280: {'lr': 0.0004833716434987948, 'samples': 3701760, 'steps': 19279, 'loss/train': 1.0586185455322266} -11/06/2021 23:57:47 - INFO - __main__ - Step 19281: {'lr': 0.0004833697403821672, 'samples': 3701952, 'steps': 19280, 'loss/train': 1.5551531314849854} -11/06/2021 23:57:47 - INFO - __main__ - Step 19282: {'lr': 0.0004833678371603869, 'samples': 3702144, 'steps': 19281, 'loss/train': 1.4676300287246704} -11/06/2021 23:57:47 - INFO - __main__ - Step 19283: {'lr': 0.0004833659338334546, 'samples': 3702336, 'steps': 19282, 'loss/train': 1.9228662252426147} -11/06/2021 23:57:48 - INFO - __main__ - Step 19284: {'lr': 0.0004833640304013712, 'samples': 3702528, 'steps': 19283, 'loss/train': 1.4458892345428467} -11/06/2021 23:57:49 - INFO - __main__ - Step 19285: {'lr': 0.0004833621268641376, 'samples': 3702720, 'steps': 19284, 'loss/train': 1.6027082204818726} -11/06/2021 23:57:49 - INFO - __main__ - Step 19286: {'lr': 0.0004833602232217546, 'samples': 3702912, 'steps': 19285, 'loss/train': 1.810238242149353} -11/06/2021 23:57:49 - INFO - __main__ - Step 19287: {'lr': 0.0004833583194742231, 'samples': 3703104, 'steps': 19286, 'loss/train': 2.003950595855713} -11/06/2021 23:57:50 - INFO - __main__ - Step 19288: {'lr': 0.00048335641562154396, 'samples': 3703296, 'steps': 19287, 'loss/train': 1.7352495193481445} -11/06/2021 23:57:51 - INFO - __main__ - Step 19289: {'lr': 0.00048335451166371803, 'samples': 3703488, 'steps': 19288, 'loss/train': 1.9271100759506226} -11/06/2021 23:57:51 - INFO - __main__ - Step 19290: {'lr': 0.0004833526076007461, 'samples': 3703680, 'steps': 19289, 'loss/train': 1.5342708826065063} -11/06/2021 23:57:52 - INFO - __main__ - Step 19291: {'lr': 0.0004833507034326291, 'samples': 3703872, 'steps': 19290, 'loss/train': 1.6989701986312866} -11/06/2021 23:57:52 - INFO - __main__ - Step 19292: {'lr': 0.0004833487991593679, 'samples': 3704064, 'steps': 19291, 'loss/train': 1.7094693183898926} -11/06/2021 23:57:52 - INFO - __main__ - Step 19293: {'lr': 0.0004833468947809633, 'samples': 3704256, 'steps': 19292, 'loss/train': 1.513824462890625} -11/06/2021 23:57:53 - INFO - __main__ - Step 19294: {'lr': 0.0004833449902974162, 'samples': 3704448, 'steps': 19293, 'loss/train': 1.898005723953247} -11/06/2021 23:57:54 - INFO - __main__ - Step 19295: {'lr': 0.00048334308570872745, 'samples': 3704640, 'steps': 19294, 'loss/train': 1.7322596311569214} -11/06/2021 23:57:54 - INFO - __main__ - Step 19296: {'lr': 0.00048334118101489793, 'samples': 3704832, 'steps': 19295, 'loss/train': 1.4130336046218872} -11/06/2021 23:57:54 - INFO - __main__ - Step 19297: {'lr': 0.00048333927621592844, 'samples': 3705024, 'steps': 19296, 'loss/train': 1.6878700256347656} -11/06/2021 23:57:55 - INFO - __main__ - Step 19298: {'lr': 0.00048333737131181986, 'samples': 3705216, 'steps': 19297, 'loss/train': 1.5635979175567627} -11/06/2021 23:57:55 - INFO - __main__ - Step 19299: {'lr': 0.00048333546630257315, 'samples': 3705408, 'steps': 19298, 'loss/train': 1.3481976985931396} -11/06/2021 23:57:56 - INFO - __main__ - Step 19300: {'lr': 0.000483333561188189, 'samples': 3705600, 'steps': 19299, 'loss/train': 1.2055301666259766} -11/06/2021 23:57:56 - INFO - __main__ - Step 19301: {'lr': 0.00048333165596866837, 'samples': 3705792, 'steps': 19300, 'loss/train': 1.9592984914779663} -11/06/2021 23:57:57 - INFO - __main__ - Step 19302: {'lr': 0.00048332975064401207, 'samples': 3705984, 'steps': 19301, 'loss/train': 1.6503535509109497} -11/06/2021 23:57:57 - INFO - __main__ - Step 19303: {'lr': 0.000483327845214221, 'samples': 3706176, 'steps': 19302, 'loss/train': 1.752747893333435} -11/06/2021 23:57:57 - INFO - __main__ - Step 19304: {'lr': 0.00048332593967929607, 'samples': 3706368, 'steps': 19303, 'loss/train': 1.8258517980575562} -11/06/2021 23:57:58 - INFO - __main__ - Step 19305: {'lr': 0.000483324034039238, 'samples': 3706560, 'steps': 19304, 'loss/train': 2.0873513221740723} -11/06/2021 23:57:59 - INFO - __main__ - Step 19306: {'lr': 0.00048332212829404775, 'samples': 3706752, 'steps': 19305, 'loss/train': 1.607957363128662} -11/06/2021 23:57:59 - INFO - __main__ - Step 19307: {'lr': 0.0004833202224437261, 'samples': 3706944, 'steps': 19306, 'loss/train': 1.5633206367492676} -11/06/2021 23:57:59 - INFO - __main__ - Step 19308: {'lr': 0.000483318316488274, 'samples': 3707136, 'steps': 19307, 'loss/train': 1.7169498205184937} -11/06/2021 23:58:00 - INFO - __main__ - Step 19309: {'lr': 0.00048331641042769223, 'samples': 3707328, 'steps': 19308, 'loss/train': 2.3175976276397705} -11/06/2021 23:58:01 - INFO - __main__ - Step 19310: {'lr': 0.00048331450426198177, 'samples': 3707520, 'steps': 19309, 'loss/train': 1.9806184768676758} -11/06/2021 23:58:01 - INFO - __main__ - Step 19311: {'lr': 0.0004833125979911434, 'samples': 3707712, 'steps': 19310, 'loss/train': 1.7473728656768799} -11/06/2021 23:58:01 - INFO - __main__ - Step 19312: {'lr': 0.0004833106916151778, 'samples': 3707904, 'steps': 19311, 'loss/train': 1.586052656173706} -11/06/2021 23:58:02 - INFO - __main__ - Step 19313: {'lr': 0.00048330878513408616, 'samples': 3708096, 'steps': 19312, 'loss/train': 1.7465753555297852} -11/06/2021 23:58:02 - INFO - __main__ - Step 19314: {'lr': 0.00048330687854786914, 'samples': 3708288, 'steps': 19313, 'loss/train': 1.9451851844787598} -11/06/2021 23:58:03 - INFO - __main__ - Step 19315: {'lr': 0.00048330497185652765, 'samples': 3708480, 'steps': 19314, 'loss/train': 1.6248364448547363} -11/06/2021 23:58:04 - INFO - __main__ - Step 19316: {'lr': 0.00048330306506006257, 'samples': 3708672, 'steps': 19315, 'loss/train': 1.7191998958587646} -11/06/2021 23:58:04 - INFO - __main__ - Step 19317: {'lr': 0.00048330115815847465, 'samples': 3708864, 'steps': 19316, 'loss/train': 1.3119690418243408} -11/06/2021 23:58:04 - INFO - __main__ - Step 19318: {'lr': 0.0004832992511517649, 'samples': 3709056, 'steps': 19317, 'loss/train': 1.7842353582382202} -11/06/2021 23:58:05 - INFO - __main__ - Step 19319: {'lr': 0.00048329734403993406, 'samples': 3709248, 'steps': 19318, 'loss/train': 1.7536782026290894} -11/06/2021 23:58:06 - INFO - __main__ - Step 19320: {'lr': 0.00048329543682298307, 'samples': 3709440, 'steps': 19319, 'loss/train': 1.9086477756500244} -11/06/2021 23:58:06 - INFO - __main__ - Step 19321: {'lr': 0.0004832935295009127, 'samples': 3709632, 'steps': 19320, 'loss/train': 1.843841791152954} -11/06/2021 23:58:06 - INFO - __main__ - Step 19322: {'lr': 0.0004832916220737239, 'samples': 3709824, 'steps': 19321, 'loss/train': 1.6211942434310913} -11/06/2021 23:58:07 - INFO - __main__ - Step 19323: {'lr': 0.0004832897145414175, 'samples': 3710016, 'steps': 19322, 'loss/train': 1.4943122863769531} -11/06/2021 23:58:07 - INFO - __main__ - Step 19324: {'lr': 0.0004832878069039943, 'samples': 3710208, 'steps': 19323, 'loss/train': 1.5772778987884521} -11/06/2021 23:58:08 - INFO - __main__ - Step 19325: {'lr': 0.0004832858991614553, 'samples': 3710400, 'steps': 19324, 'loss/train': 1.6283198595046997} -11/06/2021 23:58:08 - INFO - __main__ - Step 19326: {'lr': 0.00048328399131380127, 'samples': 3710592, 'steps': 19325, 'loss/train': 1.879858136177063} -11/06/2021 23:58:09 - INFO - __main__ - Step 19327: {'lr': 0.00048328208336103305, 'samples': 3710784, 'steps': 19326, 'loss/train': 1.4845051765441895} -11/06/2021 23:58:09 - INFO - __main__ - Step 19328: {'lr': 0.0004832801753031515, 'samples': 3710976, 'steps': 19327, 'loss/train': 1.7683420181274414} -11/06/2021 23:58:10 - INFO - __main__ - Step 19329: {'lr': 0.00048327826714015756, 'samples': 3711168, 'steps': 19328, 'loss/train': 3.4698245525360107} -11/06/2021 23:58:10 - INFO - __main__ - Step 19330: {'lr': 0.00048327635887205196, 'samples': 3711360, 'steps': 19329, 'loss/train': 1.1537224054336548} -11/06/2021 23:58:11 - INFO - __main__ - Step 19331: {'lr': 0.00048327445049883567, 'samples': 3711552, 'steps': 19330, 'loss/train': 1.5621854066848755} -11/06/2021 23:58:11 - INFO - __main__ - Step 19332: {'lr': 0.0004832725420205095, 'samples': 3711744, 'steps': 19331, 'loss/train': 1.1450562477111816} -11/06/2021 23:58:12 - INFO - __main__ - Step 19333: {'lr': 0.00048327063343707433, 'samples': 3711936, 'steps': 19332, 'loss/train': 1.4444999694824219} -11/06/2021 23:58:12 - INFO - __main__ - Step 19334: {'lr': 0.000483268724748531, 'samples': 3712128, 'steps': 19333, 'loss/train': 1.5540878772735596} -11/06/2021 23:58:12 - INFO - __main__ - Step 19335: {'lr': 0.0004832668159548804, 'samples': 3712320, 'steps': 19334, 'loss/train': 1.3487190008163452} -11/06/2021 23:58:13 - INFO - __main__ - Step 19336: {'lr': 0.00048326490705612337, 'samples': 3712512, 'steps': 19335, 'loss/train': 1.3741018772125244} -11/06/2021 23:58:14 - INFO - __main__ - Step 19337: {'lr': 0.0004832629980522608, 'samples': 3712704, 'steps': 19336, 'loss/train': 1.6172581911087036} -11/06/2021 23:58:14 - INFO - __main__ - Step 19338: {'lr': 0.00048326108894329345, 'samples': 3712896, 'steps': 19337, 'loss/train': 1.6094346046447754} -11/06/2021 23:58:15 - INFO - __main__ - Step 19339: {'lr': 0.00048325917972922227, 'samples': 3713088, 'steps': 19338, 'loss/train': 1.8732949495315552} -11/06/2021 23:58:15 - INFO - __main__ - Step 19340: {'lr': 0.00048325727041004815, 'samples': 3713280, 'steps': 19339, 'loss/train': 2.8026809692382812} -11/06/2021 23:58:16 - INFO - __main__ - Step 19341: {'lr': 0.0004832553609857719, 'samples': 3713472, 'steps': 19340, 'loss/train': 1.4218841791152954} -11/06/2021 23:58:16 - INFO - __main__ - Step 19342: {'lr': 0.0004832534514563943, 'samples': 3713664, 'steps': 19341, 'loss/train': 1.700616717338562} -11/06/2021 23:58:17 - INFO - __main__ - Step 19343: {'lr': 0.0004832515418219164, 'samples': 3713856, 'steps': 19342, 'loss/train': 1.542962908744812} -11/06/2021 23:58:17 - INFO - __main__ - Step 19344: {'lr': 0.0004832496320823389, 'samples': 3714048, 'steps': 19343, 'loss/train': 1.2601964473724365} -11/06/2021 23:58:17 - INFO - __main__ - Step 19345: {'lr': 0.0004832477222376627, 'samples': 3714240, 'steps': 19344, 'loss/train': 1.3057348728179932} -11/06/2021 23:58:18 - INFO - __main__ - Step 19346: {'lr': 0.0004832458122878888, 'samples': 3714432, 'steps': 19345, 'loss/train': 0.8863457441329956} -11/06/2021 23:58:19 - INFO - __main__ - Step 19347: {'lr': 0.0004832439022330178, 'samples': 3714624, 'steps': 19346, 'loss/train': 0.9812582731246948} -11/06/2021 23:58:19 - INFO - __main__ - Step 19348: {'lr': 0.00048324199207305075, 'samples': 3714816, 'steps': 19347, 'loss/train': 1.7008509635925293} -11/06/2021 23:58:19 - INFO - __main__ - Step 19349: {'lr': 0.0004832400818079884, 'samples': 3715008, 'steps': 19348, 'loss/train': 1.88282310962677} -11/06/2021 23:58:20 - INFO - __main__ - Step 19350: {'lr': 0.00048323817143783174, 'samples': 3715200, 'steps': 19349, 'loss/train': 1.5020644664764404} -11/06/2021 23:58:20 - INFO - __main__ - Step 19351: {'lr': 0.0004832362609625815, 'samples': 3715392, 'steps': 19350, 'loss/train': 1.5163544416427612} -11/06/2021 23:58:21 - INFO - __main__ - Step 19352: {'lr': 0.0004832343503822386, 'samples': 3715584, 'steps': 19351, 'loss/train': 1.6568862199783325} -11/06/2021 23:58:21 - INFO - __main__ - Step 19353: {'lr': 0.000483232439696804, 'samples': 3715776, 'steps': 19352, 'loss/train': 1.1262316703796387} -11/06/2021 23:58:22 - INFO - __main__ - Step 19354: {'lr': 0.0004832305289062784, 'samples': 3715968, 'steps': 19353, 'loss/train': 0.9058158993721008} -11/06/2021 23:58:22 - INFO - __main__ - Step 19355: {'lr': 0.00048322861801066265, 'samples': 3716160, 'steps': 19354, 'loss/train': 1.8485344648361206} -11/06/2021 23:58:23 - INFO - __main__ - Step 19356: {'lr': 0.00048322670700995775, 'samples': 3716352, 'steps': 19355, 'loss/train': 2.099125862121582} -11/06/2021 23:58:24 - INFO - __main__ - Step 19357: {'lr': 0.0004832247959041645, 'samples': 3716544, 'steps': 19356, 'loss/train': 1.2258687019348145} -11/06/2021 23:58:24 - INFO - __main__ - Step 19358: {'lr': 0.0004832228846932838, 'samples': 3716736, 'steps': 19357, 'loss/train': 1.7507163286209106} -11/06/2021 23:58:24 - INFO - __main__ - Step 19359: {'lr': 0.0004832209733773164, 'samples': 3716928, 'steps': 19358, 'loss/train': 1.7394636869430542} -11/06/2021 23:58:25 - INFO - __main__ - Step 19360: {'lr': 0.0004832190619562632, 'samples': 3717120, 'steps': 19359, 'loss/train': 1.5605862140655518} -11/06/2021 23:58:25 - INFO - __main__ - Step 19361: {'lr': 0.00048321715043012515, 'samples': 3717312, 'steps': 19360, 'loss/train': 1.5524048805236816} -11/06/2021 23:58:26 - INFO - __main__ - Step 19362: {'lr': 0.00048321523879890307, 'samples': 3717504, 'steps': 19361, 'loss/train': 1.7804820537567139} -11/06/2021 23:58:27 - INFO - __main__ - Step 19363: {'lr': 0.00048321332706259773, 'samples': 3717696, 'steps': 19362, 'loss/train': 1.6952815055847168} -11/06/2021 23:58:27 - INFO - __main__ - Step 19364: {'lr': 0.0004832114152212101, 'samples': 3717888, 'steps': 19363, 'loss/train': 1.2942943572998047} -11/06/2021 23:58:27 - INFO - __main__ - Step 19365: {'lr': 0.000483209503274741, 'samples': 3718080, 'steps': 19364, 'loss/train': 2.1306514739990234} -11/06/2021 23:58:28 - INFO - __main__ - Step 19366: {'lr': 0.0004832075912231913, 'samples': 3718272, 'steps': 19365, 'loss/train': 1.71169114112854} -11/06/2021 23:58:29 - INFO - __main__ - Step 19367: {'lr': 0.0004832056790665619, 'samples': 3718464, 'steps': 19366, 'loss/train': 0.859806478023529} -11/06/2021 23:58:29 - INFO - __main__ - Step 19368: {'lr': 0.0004832037668048536, 'samples': 3718656, 'steps': 19367, 'loss/train': 0.6691350340843201} -11/06/2021 23:58:29 - INFO - __main__ - Step 19369: {'lr': 0.00048320185443806717, 'samples': 3718848, 'steps': 19368, 'loss/train': 1.5839430093765259} -11/06/2021 23:58:30 - INFO - __main__ - Step 19370: {'lr': 0.0004831999419662037, 'samples': 3719040, 'steps': 19369, 'loss/train': 1.3964022397994995} -11/06/2021 23:58:30 - INFO - __main__ - Step 19371: {'lr': 0.0004831980293892639, 'samples': 3719232, 'steps': 19370, 'loss/train': 1.7141057252883911} -11/06/2021 23:58:31 - INFO - __main__ - Step 19372: {'lr': 0.0004831961167072487, 'samples': 3719424, 'steps': 19371, 'loss/train': 1.4822651147842407} -11/06/2021 23:58:31 - INFO - __main__ - Step 19373: {'lr': 0.0004831942039201589, 'samples': 3719616, 'steps': 19372, 'loss/train': 1.7279945611953735} -11/06/2021 23:58:32 - INFO - __main__ - Step 19374: {'lr': 0.0004831922910279954, 'samples': 3719808, 'steps': 19373, 'loss/train': 1.1288522481918335} -11/06/2021 23:58:32 - INFO - __main__ - Step 19375: {'lr': 0.000483190378030759, 'samples': 3720000, 'steps': 19374, 'loss/train': 1.5655479431152344} -11/06/2021 23:58:33 - INFO - __main__ - Step 19376: {'lr': 0.0004831884649284507, 'samples': 3720192, 'steps': 19375, 'loss/train': 1.5669931173324585} -11/06/2021 23:58:33 - INFO - __main__ - Step 19377: {'lr': 0.00048318655172107126, 'samples': 3720384, 'steps': 19376, 'loss/train': 1.8472486734390259} -11/06/2021 23:58:34 - INFO - __main__ - Step 19378: {'lr': 0.0004831846384086215, 'samples': 3720576, 'steps': 19377, 'loss/train': 1.4276505708694458} -11/06/2021 23:58:34 - INFO - __main__ - Step 19379: {'lr': 0.0004831827249911024, 'samples': 3720768, 'steps': 19378, 'loss/train': 2.790935516357422} -11/06/2021 23:58:35 - INFO - __main__ - Step 19380: {'lr': 0.0004831808114685147, 'samples': 3720960, 'steps': 19379, 'loss/train': 2.847355842590332} -11/06/2021 23:58:35 - INFO - __main__ - Step 19381: {'lr': 0.00048317889784085935, 'samples': 3721152, 'steps': 19380, 'loss/train': 1.9903427362442017} -11/06/2021 23:58:35 - INFO - __main__ - Step 19382: {'lr': 0.0004831769841081372, 'samples': 3721344, 'steps': 19381, 'loss/train': 1.8123948574066162} -11/06/2021 23:58:36 - INFO - __main__ - Step 19383: {'lr': 0.00048317507027034913, 'samples': 3721536, 'steps': 19382, 'loss/train': 1.783972978591919} -11/06/2021 23:58:37 - INFO - __main__ - Step 19384: {'lr': 0.0004831731563274959, 'samples': 3721728, 'steps': 19383, 'loss/train': 1.8129934072494507} -11/06/2021 23:58:37 - INFO - __main__ - Step 19385: {'lr': 0.0004831712422795785, 'samples': 3721920, 'steps': 19384, 'loss/train': 1.562839388847351} -11/06/2021 23:58:37 - INFO - __main__ - Step 19386: {'lr': 0.00048316932812659776, 'samples': 3722112, 'steps': 19385, 'loss/train': 1.5851092338562012} -11/06/2021 23:58:38 - INFO - __main__ - Step 19387: {'lr': 0.00048316741386855445, 'samples': 3722304, 'steps': 19386, 'loss/train': 1.541589379310608} -11/06/2021 23:58:39 - INFO - __main__ - Step 19388: {'lr': 0.0004831654995054495, 'samples': 3722496, 'steps': 19387, 'loss/train': 1.533311128616333} -11/06/2021 23:58:40 - INFO - __main__ - Step 19389: {'lr': 0.0004831635850372838, 'samples': 3722688, 'steps': 19388, 'loss/train': 1.626739740371704} -11/06/2021 23:58:40 - INFO - __main__ - Step 19390: {'lr': 0.00048316167046405826, 'samples': 3722880, 'steps': 19389, 'loss/train': 1.7666641473770142} -11/06/2021 23:58:40 - INFO - __main__ - Step 19391: {'lr': 0.0004831597557857735, 'samples': 3723072, 'steps': 19390, 'loss/train': 2.5333597660064697} -11/06/2021 23:58:41 - INFO - __main__ - Step 19392: {'lr': 0.00048315784100243063, 'samples': 3723264, 'steps': 19391, 'loss/train': 2.226302146911621} -11/06/2021 23:58:41 - INFO - __main__ - Step 19393: {'lr': 0.0004831559261140305, 'samples': 3723456, 'steps': 19392, 'loss/train': 1.3086782693862915} -11/06/2021 23:58:42 - INFO - __main__ - Step 19394: {'lr': 0.0004831540111205739, 'samples': 3723648, 'steps': 19393, 'loss/train': 2.0022213459014893} -11/06/2021 23:58:42 - INFO - __main__ - Step 19395: {'lr': 0.00048315209602206165, 'samples': 3723840, 'steps': 19394, 'loss/train': 1.3035863637924194} -11/06/2021 23:58:43 - INFO - __main__ - Step 19396: {'lr': 0.0004831501808184947, 'samples': 3724032, 'steps': 19395, 'loss/train': 1.9788427352905273} -11/06/2021 23:58:43 - INFO - __main__ - Step 19397: {'lr': 0.0004831482655098738, 'samples': 3724224, 'steps': 19396, 'loss/train': 1.7932040691375732} -11/06/2021 23:58:43 - INFO - __main__ - Step 19398: {'lr': 0.00048314635009619997, 'samples': 3724416, 'steps': 19397, 'loss/train': 1.363989233970642} -11/06/2021 23:58:45 - INFO - __main__ - Step 19399: {'lr': 0.0004831444345774739, 'samples': 3724608, 'steps': 19398, 'loss/train': 1.9155510663986206} -11/06/2021 23:58:45 - INFO - __main__ - Step 19400: {'lr': 0.00048314251895369663, 'samples': 3724800, 'steps': 19399, 'loss/train': 1.7524795532226562} -11/06/2021 23:58:45 - INFO - __main__ - Step 19401: {'lr': 0.000483140603224869, 'samples': 3724992, 'steps': 19400, 'loss/train': 1.5705088376998901} -11/06/2021 23:58:46 - INFO - __main__ - Step 19402: {'lr': 0.00048313868739099166, 'samples': 3725184, 'steps': 19401, 'loss/train': 1.9813029766082764} -11/06/2021 23:58:46 - INFO - __main__ - Step 19403: {'lr': 0.0004831367714520657, 'samples': 3725376, 'steps': 19402, 'loss/train': 1.216731071472168} -11/06/2021 23:58:47 - INFO - __main__ - Step 19404: {'lr': 0.0004831348554080919, 'samples': 3725568, 'steps': 19403, 'loss/train': 1.8201124668121338} -11/06/2021 23:58:47 - INFO - __main__ - Step 19405: {'lr': 0.0004831329392590711, 'samples': 3725760, 'steps': 19404, 'loss/train': 1.7847330570220947} -11/06/2021 23:58:48 - INFO - __main__ - Step 19406: {'lr': 0.00048313102300500424, 'samples': 3725952, 'steps': 19405, 'loss/train': 0.5406389236450195} -11/06/2021 23:58:48 - INFO - __main__ - Step 19407: {'lr': 0.00048312910664589215, 'samples': 3726144, 'steps': 19406, 'loss/train': 1.7577673196792603} -11/06/2021 23:58:49 - INFO - __main__ - Step 19408: {'lr': 0.0004831271901817357, 'samples': 3726336, 'steps': 19407, 'loss/train': 1.2659802436828613} -11/06/2021 23:58:50 - INFO - __main__ - Step 19409: {'lr': 0.00048312527361253567, 'samples': 3726528, 'steps': 19408, 'loss/train': 1.87831449508667} -11/06/2021 23:58:50 - INFO - __main__ - Step 19410: {'lr': 0.000483123356938293, 'samples': 3726720, 'steps': 19409, 'loss/train': 1.4174208641052246} -11/06/2021 23:58:50 - INFO - __main__ - Step 19411: {'lr': 0.00048312144015900856, 'samples': 3726912, 'steps': 19410, 'loss/train': 1.6749889850616455} -11/06/2021 23:58:51 - INFO - __main__ - Step 19412: {'lr': 0.00048311952327468325, 'samples': 3727104, 'steps': 19411, 'loss/train': 1.7777684926986694} -11/06/2021 23:58:51 - INFO - __main__ - Step 19413: {'lr': 0.00048311760628531777, 'samples': 3727296, 'steps': 19412, 'loss/train': 1.2066028118133545} -11/06/2021 23:58:52 - INFO - __main__ - Step 19414: {'lr': 0.00048311568919091316, 'samples': 3727488, 'steps': 19413, 'loss/train': 2.1470677852630615} -11/06/2021 23:58:52 - INFO - __main__ - Step 19415: {'lr': 0.00048311377199147023, 'samples': 3727680, 'steps': 19414, 'loss/train': 1.9940916299819946} -11/06/2021 23:58:53 - INFO - __main__ - Step 19416: {'lr': 0.00048311185468698974, 'samples': 3727872, 'steps': 19415, 'loss/train': 2.1364340782165527} -11/06/2021 23:58:53 - INFO - __main__ - Step 19417: {'lr': 0.00048310993727747277, 'samples': 3728064, 'steps': 19416, 'loss/train': 1.5032535791397095} -11/06/2021 23:58:53 - INFO - __main__ - Step 19418: {'lr': 0.00048310801976292, 'samples': 3728256, 'steps': 19417, 'loss/train': 1.4930044412612915} -11/06/2021 23:58:54 - INFO - __main__ - Step 19419: {'lr': 0.0004831061021433323, 'samples': 3728448, 'steps': 19418, 'loss/train': 1.7884739637374878} -11/06/2021 23:58:55 - INFO - __main__ - Step 19420: {'lr': 0.00048310418441871065, 'samples': 3728640, 'steps': 19419, 'loss/train': 1.911501169204712} -11/06/2021 23:58:55 - INFO - __main__ - Step 19421: {'lr': 0.00048310226658905585, 'samples': 3728832, 'steps': 19420, 'loss/train': 2.056422472000122} -11/06/2021 23:58:55 - INFO - __main__ - Step 19422: {'lr': 0.00048310034865436876, 'samples': 3729024, 'steps': 19421, 'loss/train': 1.5690569877624512} -11/06/2021 23:58:56 - INFO - __main__ - Step 19423: {'lr': 0.0004830984306146503, 'samples': 3729216, 'steps': 19422, 'loss/train': 1.1024407148361206} -11/06/2021 23:58:56 - INFO - __main__ - Step 19424: {'lr': 0.0004830965124699012, 'samples': 3729408, 'steps': 19423, 'loss/train': 1.1547913551330566} -11/06/2021 23:58:59 - INFO - __main__ - Step 19425: {'lr': 0.00048309459422012243, 'samples': 3729600, 'steps': 19424, 'loss/train': 1.695124626159668} -11/06/2021 23:58:59 - INFO - __main__ - Step 19426: {'lr': 0.0004830926758653148, 'samples': 3729792, 'steps': 19425, 'loss/train': 1.4162240028381348} -11/06/2021 23:58:59 - INFO - __main__ - Step 19427: {'lr': 0.00048309075740547925, 'samples': 3729984, 'steps': 19426, 'loss/train': 1.3688523769378662} -11/06/2021 23:59:00 - INFO - __main__ - Step 19428: {'lr': 0.0004830888388406166, 'samples': 3730176, 'steps': 19427, 'loss/train': 1.8020360469818115} -11/06/2021 23:59:00 - INFO - __main__ - Step 19429: {'lr': 0.00048308692017072773, 'samples': 3730368, 'steps': 19428, 'loss/train': 1.153029441833496} -11/06/2021 23:59:01 - INFO - __main__ - Step 19430: {'lr': 0.00048308500139581344, 'samples': 3730560, 'steps': 19429, 'loss/train': 1.0884881019592285} -11/06/2021 23:59:01 - INFO - __main__ - Step 19431: {'lr': 0.00048308308251587476, 'samples': 3730752, 'steps': 19430, 'loss/train': 1.7762088775634766} -11/06/2021 23:59:01 - INFO - __main__ - Step 19432: {'lr': 0.00048308116353091234, 'samples': 3730944, 'steps': 19431, 'loss/train': 1.8368065357208252} -11/06/2021 23:59:02 - INFO - __main__ - Step 19433: {'lr': 0.00048307924444092716, 'samples': 3731136, 'steps': 19432, 'loss/train': 1.6261667013168335} -11/06/2021 23:59:02 - INFO - __main__ - Step 19434: {'lr': 0.0004830773252459201, 'samples': 3731328, 'steps': 19433, 'loss/train': 1.6783347129821777} -11/06/2021 23:59:03 - INFO - __main__ - Step 19435: {'lr': 0.00048307540594589194, 'samples': 3731520, 'steps': 19434, 'loss/train': 1.5496079921722412} -11/06/2021 23:59:03 - INFO - __main__ - Step 19436: {'lr': 0.0004830734865408437, 'samples': 3731712, 'steps': 19435, 'loss/train': 1.2190485000610352} -11/06/2021 23:59:04 - INFO - __main__ - Step 19437: {'lr': 0.000483071567030776, 'samples': 3731904, 'steps': 19436, 'loss/train': 1.7005469799041748} -11/06/2021 23:59:05 - INFO - __main__ - Step 19438: {'lr': 0.00048306964741568994, 'samples': 3732096, 'steps': 19437, 'loss/train': 1.5111713409423828} -11/06/2021 23:59:05 - INFO - __main__ - Step 19439: {'lr': 0.00048306772769558624, 'samples': 3732288, 'steps': 19438, 'loss/train': 1.892134189605713} -11/06/2021 23:59:05 - INFO - __main__ - Step 19440: {'lr': 0.0004830658078704659, 'samples': 3732480, 'steps': 19439, 'loss/train': 1.6170473098754883} -11/06/2021 23:59:06 - INFO - __main__ - Step 19441: {'lr': 0.0004830638879403296, 'samples': 3732672, 'steps': 19440, 'loss/train': 1.8451327085494995} -11/06/2021 23:59:06 - INFO - __main__ - Step 19442: {'lr': 0.00048306196790517844, 'samples': 3732864, 'steps': 19441, 'loss/train': 1.871138334274292} -11/06/2021 23:59:07 - INFO - __main__ - Step 19443: {'lr': 0.0004830600477650131, 'samples': 3733056, 'steps': 19442, 'loss/train': 1.3609321117401123} -11/06/2021 23:59:07 - INFO - __main__ - Step 19444: {'lr': 0.0004830581275198344, 'samples': 3733248, 'steps': 19443, 'loss/train': 1.0425359010696411} -11/06/2021 23:59:08 - INFO - __main__ - Step 19445: {'lr': 0.00048305620716964336, 'samples': 3733440, 'steps': 19444, 'loss/train': 2.1450159549713135} -11/06/2021 23:59:08 - INFO - __main__ - Step 19446: {'lr': 0.00048305428671444083, 'samples': 3733632, 'steps': 19445, 'loss/train': 1.0744739770889282} -11/06/2021 23:59:09 - INFO - __main__ - Step 19447: {'lr': 0.00048305236615422763, 'samples': 3733824, 'steps': 19446, 'loss/train': 1.7108923196792603} -11/06/2021 23:59:09 - INFO - __main__ - Step 19448: {'lr': 0.00048305044548900463, 'samples': 3734016, 'steps': 19447, 'loss/train': 1.3483003377914429} -11/06/2021 23:59:10 - INFO - __main__ - Step 19449: {'lr': 0.0004830485247187727, 'samples': 3734208, 'steps': 19448, 'loss/train': 1.7191352844238281} -11/06/2021 23:59:10 - INFO - __main__ - Step 19450: {'lr': 0.0004830466038435327, 'samples': 3734400, 'steps': 19449, 'loss/train': 1.6840806007385254} -11/06/2021 23:59:11 - INFO - __main__ - Step 19451: {'lr': 0.0004830446828632854, 'samples': 3734592, 'steps': 19450, 'loss/train': 1.22652006149292} -11/06/2021 23:59:11 - INFO - __main__ - Step 19452: {'lr': 0.00048304276177803186, 'samples': 3734784, 'steps': 19451, 'loss/train': 1.2331140041351318} -11/06/2021 23:59:12 - INFO - __main__ - Step 19453: {'lr': 0.00048304084058777285, 'samples': 3734976, 'steps': 19452, 'loss/train': 1.9303547143936157} -11/06/2021 23:59:13 - INFO - __main__ - Step 19454: {'lr': 0.00048303891929250923, 'samples': 3735168, 'steps': 19453, 'loss/train': 1.3610291481018066} -11/06/2021 23:59:13 - INFO - __main__ - Step 19455: {'lr': 0.0004830369978922418, 'samples': 3735360, 'steps': 19454, 'loss/train': 1.2890371084213257} -11/06/2021 23:59:13 - INFO - __main__ - Step 19456: {'lr': 0.00048303507638697155, 'samples': 3735552, 'steps': 19455, 'loss/train': 1.549730658531189} -11/06/2021 23:59:14 - INFO - __main__ - Step 19457: {'lr': 0.0004830331547766993, 'samples': 3735744, 'steps': 19456, 'loss/train': 1.8960416316986084} -11/06/2021 23:59:14 - INFO - __main__ - Step 19458: {'lr': 0.0004830312330614259, 'samples': 3735936, 'steps': 19457, 'loss/train': 1.7021613121032715} -11/06/2021 23:59:15 - INFO - __main__ - Step 19459: {'lr': 0.00048302931124115226, 'samples': 3736128, 'steps': 19458, 'loss/train': 1.5494282245635986} -11/06/2021 23:59:15 - INFO - __main__ - Step 19460: {'lr': 0.0004830273893158791, 'samples': 3736320, 'steps': 19459, 'loss/train': 1.4215049743652344} -11/06/2021 23:59:16 - INFO - __main__ - Step 19461: {'lr': 0.0004830254672856075, 'samples': 3736512, 'steps': 19460, 'loss/train': 1.396445393562317} -11/06/2021 23:59:16 - INFO - __main__ - Step 19462: {'lr': 0.00048302354515033813, 'samples': 3736704, 'steps': 19461, 'loss/train': 1.8570998907089233} -11/06/2021 23:59:16 - INFO - __main__ - Step 19463: {'lr': 0.00048302162291007203, 'samples': 3736896, 'steps': 19462, 'loss/train': 1.4819624423980713} -11/06/2021 23:59:17 - INFO - __main__ - Step 19464: {'lr': 0.00048301970056480994, 'samples': 3737088, 'steps': 19463, 'loss/train': 1.6561782360076904} -11/06/2021 23:59:18 - INFO - __main__ - Step 19465: {'lr': 0.00048301777811455274, 'samples': 3737280, 'steps': 19464, 'loss/train': 1.935529351234436} -11/06/2021 23:59:18 - INFO - __main__ - Step 19466: {'lr': 0.0004830158555593014, 'samples': 3737472, 'steps': 19465, 'loss/train': 1.6366750001907349} -11/06/2021 23:59:18 - INFO - __main__ - Step 19467: {'lr': 0.00048301393289905663, 'samples': 3737664, 'steps': 19466, 'loss/train': 1.6262980699539185} -11/06/2021 23:59:19 - INFO - __main__ - Step 19468: {'lr': 0.00048301201013381946, 'samples': 3737856, 'steps': 19467, 'loss/train': 1.4352784156799316} -11/06/2021 23:59:20 - INFO - __main__ - Step 19469: {'lr': 0.00048301008726359064, 'samples': 3738048, 'steps': 19468, 'loss/train': 1.9483211040496826} -11/06/2021 23:59:20 - INFO - __main__ - Step 19470: {'lr': 0.00048300816428837104, 'samples': 3738240, 'steps': 19469, 'loss/train': 1.8832329511642456} -11/06/2021 23:59:20 - INFO - __main__ - Step 19471: {'lr': 0.00048300624120816153, 'samples': 3738432, 'steps': 19470, 'loss/train': 1.5686419010162354} -11/06/2021 23:59:21 - INFO - __main__ - Step 19472: {'lr': 0.0004830043180229631, 'samples': 3738624, 'steps': 19471, 'loss/train': 1.8613708019256592} -11/06/2021 23:59:21 - INFO - __main__ - Step 19473: {'lr': 0.0004830023947327764, 'samples': 3738816, 'steps': 19472, 'loss/train': 1.726355791091919} -11/06/2021 23:59:22 - INFO - __main__ - Step 19474: {'lr': 0.0004830004713376025, 'samples': 3739008, 'steps': 19473, 'loss/train': 1.6512629985809326} -11/06/2021 23:59:23 - INFO - __main__ - Step 19475: {'lr': 0.00048299854783744224, 'samples': 3739200, 'steps': 19474, 'loss/train': 1.8223868608474731} -11/06/2021 23:59:23 - INFO - __main__ - Step 19476: {'lr': 0.0004829966242322963, 'samples': 3739392, 'steps': 19475, 'loss/train': 1.6881176233291626} -11/06/2021 23:59:23 - INFO - __main__ - Step 19477: {'lr': 0.00048299470052216576, 'samples': 3739584, 'steps': 19476, 'loss/train': 1.664871096611023} -11/06/2021 23:59:24 - INFO - __main__ - Step 19478: {'lr': 0.0004829927767070514, 'samples': 3739776, 'steps': 19477, 'loss/train': 1.8570330142974854} -11/06/2021 23:59:25 - INFO - __main__ - Step 19479: {'lr': 0.0004829908527869541, 'samples': 3739968, 'steps': 19478, 'loss/train': 0.8422459363937378} -11/06/2021 23:59:25 - INFO - __main__ - Step 19480: {'lr': 0.0004829889287618746, 'samples': 3740160, 'steps': 19479, 'loss/train': 1.5826501846313477} -11/06/2021 23:59:26 - INFO - __main__ - Step 19481: {'lr': 0.000482987004631814, 'samples': 3740352, 'steps': 19480, 'loss/train': 1.462388515472412} -11/06/2021 23:59:26 - INFO - __main__ - Step 19482: {'lr': 0.000482985080396773, 'samples': 3740544, 'steps': 19481, 'loss/train': 1.5462687015533447} -11/06/2021 23:59:27 - INFO - __main__ - Step 19483: {'lr': 0.00048298315605675257, 'samples': 3740736, 'steps': 19482, 'loss/train': 1.6107537746429443} -11/06/2021 23:59:27 - INFO - __main__ - Step 19484: {'lr': 0.0004829812316117535, 'samples': 3740928, 'steps': 19483, 'loss/train': 1.9696018695831299} -11/06/2021 23:59:28 - INFO - __main__ - Step 19485: {'lr': 0.0004829793070617767, 'samples': 3741120, 'steps': 19484, 'loss/train': 1.904404878616333} -11/06/2021 23:59:28 - INFO - __main__ - Step 19486: {'lr': 0.000482977382406823, 'samples': 3741312, 'steps': 19485, 'loss/train': 1.7050572633743286} -11/06/2021 23:59:29 - INFO - __main__ - Step 19487: {'lr': 0.00048297545764689327, 'samples': 3741504, 'steps': 19486, 'loss/train': 1.5216996669769287} -11/06/2021 23:59:29 - INFO - __main__ - Step 19488: {'lr': 0.00048297353278198843, 'samples': 3741696, 'steps': 19487, 'loss/train': 1.2509301900863647} -11/06/2021 23:59:29 - INFO - __main__ - Step 19489: {'lr': 0.00048297160781210925, 'samples': 3741888, 'steps': 19488, 'loss/train': 1.639148235321045} -11/06/2021 23:59:31 - INFO - __main__ - Step 19490: {'lr': 0.00048296968273725673, 'samples': 3742080, 'steps': 19489, 'loss/train': 1.5672905445098877} -11/06/2021 23:59:31 - INFO - __main__ - Step 19491: {'lr': 0.0004829677575574316, 'samples': 3742272, 'steps': 19490, 'loss/train': 1.7949920892715454} -11/06/2021 23:59:31 - INFO - __main__ - Step 19492: {'lr': 0.0004829658322726348, 'samples': 3742464, 'steps': 19491, 'loss/train': 2.019479751586914} -11/06/2021 23:59:32 - INFO - __main__ - Step 19493: {'lr': 0.00048296390688286724, 'samples': 3742656, 'steps': 19492, 'loss/train': 2.085145950317383} -11/06/2021 23:59:32 - INFO - __main__ - Step 19494: {'lr': 0.00048296198138812974, 'samples': 3742848, 'steps': 19493, 'loss/train': 1.4425673484802246} -11/06/2021 23:59:33 - INFO - __main__ - Step 19495: {'lr': 0.00048296005578842314, 'samples': 3743040, 'steps': 19494, 'loss/train': 1.797430157661438} -11/06/2021 23:59:34 - INFO - __main__ - Step 19496: {'lr': 0.0004829581300837483, 'samples': 3743232, 'steps': 19495, 'loss/train': 1.7276138067245483} -11/06/2021 23:59:34 - INFO - __main__ - Step 19497: {'lr': 0.00048295620427410614, 'samples': 3743424, 'steps': 19496, 'loss/train': 1.0747604370117188} -11/06/2021 23:59:34 - INFO - __main__ - Step 19498: {'lr': 0.00048295427835949757, 'samples': 3743616, 'steps': 19497, 'loss/train': 1.531845211982727} -11/06/2021 23:59:35 - INFO - __main__ - Step 19499: {'lr': 0.0004829523523399233, 'samples': 3743808, 'steps': 19498, 'loss/train': 5.932285785675049} -11/06/2021 23:59:35 - INFO - __main__ - Step 19500: {'lr': 0.0004829504262153844, 'samples': 3744000, 'steps': 19499, 'loss/train': 1.0767468214035034} -11/06/2021 23:59:36 - INFO - __main__ - Step 19501: {'lr': 0.00048294849998588155, 'samples': 3744192, 'steps': 19500, 'loss/train': 2.2038071155548096} -11/06/2021 23:59:36 - INFO - __main__ - Step 19502: {'lr': 0.0004829465736514157, 'samples': 3744384, 'steps': 19501, 'loss/train': 1.7361345291137695} -11/06/2021 23:59:37 - INFO - __main__ - Step 19503: {'lr': 0.0004829446472119878, 'samples': 3744576, 'steps': 19502, 'loss/train': 1.3352776765823364} -11/06/2021 23:59:37 - INFO - __main__ - Step 19504: {'lr': 0.0004829427206675986, 'samples': 3744768, 'steps': 19503, 'loss/train': 1.8171507120132446} -11/06/2021 23:59:37 - INFO - __main__ - Step 19505: {'lr': 0.000482940794018249, 'samples': 3744960, 'steps': 19504, 'loss/train': 1.5799142122268677} -11/06/2021 23:59:39 - INFO - __main__ - Step 19506: {'lr': 0.00048293886726393984, 'samples': 3745152, 'steps': 19505, 'loss/train': 1.4450923204421997} -11/06/2021 23:59:39 - INFO - __main__ - Step 19507: {'lr': 0.00048293694040467205, 'samples': 3745344, 'steps': 19506, 'loss/train': 1.731113076210022} -11/06/2021 23:59:39 - INFO - __main__ - Step 19508: {'lr': 0.00048293501344044644, 'samples': 3745536, 'steps': 19507, 'loss/train': 1.6001505851745605} -11/06/2021 23:59:40 - INFO - __main__ - Step 19509: {'lr': 0.00048293308637126393, 'samples': 3745728, 'steps': 19508, 'loss/train': 0.7838894724845886} -11/06/2021 23:59:40 - INFO - __main__ - Step 19510: {'lr': 0.0004829311591971254, 'samples': 3745920, 'steps': 19509, 'loss/train': 1.8190715312957764} -11/06/2021 23:59:41 - INFO - __main__ - Step 19511: {'lr': 0.0004829292319180316, 'samples': 3746112, 'steps': 19510, 'loss/train': 1.5588487386703491} -11/06/2021 23:59:41 - INFO - __main__ - Step 19512: {'lr': 0.00048292730453398355, 'samples': 3746304, 'steps': 19511, 'loss/train': 1.3858730792999268} -11/06/2021 23:59:42 - INFO - __main__ - Step 19513: {'lr': 0.00048292537704498203, 'samples': 3746496, 'steps': 19512, 'loss/train': 1.3733470439910889} -11/06/2021 23:59:42 - INFO - __main__ - Step 19514: {'lr': 0.00048292344945102795, 'samples': 3746688, 'steps': 19513, 'loss/train': 1.670436143875122} -11/06/2021 23:59:43 - INFO - __main__ - Step 19515: {'lr': 0.0004829215217521221, 'samples': 3746880, 'steps': 19514, 'loss/train': 1.8147488832473755} -11/06/2021 23:59:44 - INFO - __main__ - Step 19516: {'lr': 0.00048291959394826546, 'samples': 3747072, 'steps': 19515, 'loss/train': 1.9264278411865234} -11/06/2021 23:59:44 - INFO - __main__ - Step 19517: {'lr': 0.00048291766603945885, 'samples': 3747264, 'steps': 19516, 'loss/train': 1.1423556804656982} -11/06/2021 23:59:44 - INFO - __main__ - Step 19518: {'lr': 0.0004829157380257031, 'samples': 3747456, 'steps': 19517, 'loss/train': 1.3138654232025146} -11/06/2021 23:59:45 - INFO - __main__ - Step 19519: {'lr': 0.0004829138099069991, 'samples': 3747648, 'steps': 19518, 'loss/train': 1.420883059501648} -11/06/2021 23:59:45 - INFO - __main__ - Step 19520: {'lr': 0.0004829118816833478, 'samples': 3747840, 'steps': 19519, 'loss/train': 2.512575626373291} -11/06/2021 23:59:45 - INFO - __main__ - Step 19521: {'lr': 0.00048290995335474997, 'samples': 3748032, 'steps': 19520, 'loss/train': 1.6682121753692627} -11/06/2021 23:59:47 - INFO - __main__ - Step 19522: {'lr': 0.0004829080249212064, 'samples': 3748224, 'steps': 19521, 'loss/train': 1.5365606546401978} -11/06/2021 23:59:47 - INFO - __main__ - Step 19523: {'lr': 0.00048290609638271823, 'samples': 3748416, 'steps': 19522, 'loss/train': 1.6803691387176514} -11/06/2021 23:59:47 - INFO - __main__ - Step 19524: {'lr': 0.00048290416773928615, 'samples': 3748608, 'steps': 19523, 'loss/train': 1.8752951622009277} -11/06/2021 23:59:48 - INFO - __main__ - Step 19525: {'lr': 0.00048290223899091094, 'samples': 3748800, 'steps': 19524, 'loss/train': 1.8965718746185303} -11/06/2021 23:59:48 - INFO - __main__ - Step 19526: {'lr': 0.0004829003101375937, 'samples': 3748992, 'steps': 19525, 'loss/train': 1.26532781124115} -11/06/2021 23:59:49 - INFO - __main__ - Step 19527: {'lr': 0.00048289838117933505, 'samples': 3749184, 'steps': 19526, 'loss/train': 1.8481258153915405} -11/06/2021 23:59:49 - INFO - __main__ - Step 19528: {'lr': 0.0004828964521161361, 'samples': 3749376, 'steps': 19527, 'loss/train': 1.413066029548645} -11/06/2021 23:59:50 - INFO - __main__ - Step 19529: {'lr': 0.0004828945229479975, 'samples': 3749568, 'steps': 19528, 'loss/train': 1.5402287244796753} -11/06/2021 23:59:50 - INFO - __main__ - Step 19530: {'lr': 0.0004828925936749202, 'samples': 3749760, 'steps': 19529, 'loss/train': 1.5571092367172241} -11/06/2021 23:59:50 - INFO - __main__ - Step 19531: {'lr': 0.0004828906642969052, 'samples': 3749952, 'steps': 19530, 'loss/train': 1.5103822946548462} -11/06/2021 23:59:51 - INFO - __main__ - Step 19532: {'lr': 0.00048288873481395323, 'samples': 3750144, 'steps': 19531, 'loss/train': 1.55597984790802} -11/06/2021 23:59:52 - INFO - __main__ - Step 19533: {'lr': 0.0004828868052260652, 'samples': 3750336, 'steps': 19532, 'loss/train': 1.014290690422058} -11/06/2021 23:59:52 - INFO - __main__ - Step 19534: {'lr': 0.0004828848755332419, 'samples': 3750528, 'steps': 19533, 'loss/train': 1.9036535024642944} -11/06/2021 23:59:52 - INFO - __main__ - Step 19535: {'lr': 0.0004828829457354843, 'samples': 3750720, 'steps': 19534, 'loss/train': 1.6254938840866089} -11/06/2021 23:59:53 - INFO - __main__ - Step 19536: {'lr': 0.0004828810158327933, 'samples': 3750912, 'steps': 19535, 'loss/train': 1.509027361869812} -11/06/2021 23:59:54 - INFO - __main__ - Step 19537: {'lr': 0.00048287908582516964, 'samples': 3751104, 'steps': 19536, 'loss/train': 1.6718204021453857} -11/06/2021 23:59:54 - INFO - __main__ - Step 19538: {'lr': 0.00048287715571261424, 'samples': 3751296, 'steps': 19537, 'loss/train': 1.5779062509536743} -11/06/2021 23:59:54 - INFO - __main__ - Step 19539: {'lr': 0.00048287522549512806, 'samples': 3751488, 'steps': 19538, 'loss/train': 1.7152458429336548} -11/06/2021 23:59:55 - INFO - __main__ - Step 19540: {'lr': 0.0004828732951727119, 'samples': 3751680, 'steps': 19539, 'loss/train': 1.4148067235946655} -11/06/2021 23:59:55 - INFO - __main__ - Step 19541: {'lr': 0.00048287136474536657, 'samples': 3751872, 'steps': 19540, 'loss/train': 2.09765362739563} -11/06/2021 23:59:56 - INFO - __main__ - Step 19542: {'lr': 0.000482869434213093, 'samples': 3752064, 'steps': 19541, 'loss/train': 1.6245235204696655} -11/06/2021 23:59:57 - INFO - __main__ - Step 19543: {'lr': 0.0004828675035758921, 'samples': 3752256, 'steps': 19542, 'loss/train': 1.6489465236663818} -11/06/2021 23:59:57 - INFO - __main__ - Step 19544: {'lr': 0.00048286557283376465, 'samples': 3752448, 'steps': 19543, 'loss/train': 1.6993317604064941} -11/06/2021 23:59:57 - INFO - __main__ - Step 19545: {'lr': 0.0004828636419867116, 'samples': 3752640, 'steps': 19544, 'loss/train': 2.0288567543029785} -11/06/2021 23:59:58 - INFO - __main__ - Step 19546: {'lr': 0.00048286171103473376, 'samples': 3752832, 'steps': 19545, 'loss/train': 1.3089454174041748} -11/07/2021 00:00:00 - INFO - __main__ - Step 19547: {'lr': 0.00048285977997783203, 'samples': 3753024, 'steps': 19546, 'loss/train': 1.9391834735870361} -11/07/2021 00:00:00 - INFO - __main__ - Step 19548: {'lr': 0.0004828578488160073, 'samples': 3753216, 'steps': 19547, 'loss/train': 1.6727211475372314} -11/07/2021 00:00:00 - INFO - __main__ - Step 19549: {'lr': 0.0004828559175492604, 'samples': 3753408, 'steps': 19548, 'loss/train': 1.9620425701141357} -11/07/2021 00:00:01 - INFO - __main__ - Step 19550: {'lr': 0.0004828539861775922, 'samples': 3753600, 'steps': 19549, 'loss/train': 2.087019205093384} -11/07/2021 00:00:01 - INFO - __main__ - Step 19551: {'lr': 0.0004828520547010036, 'samples': 3753792, 'steps': 19550, 'loss/train': 1.887309193611145} -11/07/2021 00:00:01 - INFO - __main__ - Step 19552: {'lr': 0.0004828501231194955, 'samples': 3753984, 'steps': 19551, 'loss/train': 1.9961159229278564} -11/07/2021 00:00:02 - INFO - __main__ - Step 19553: {'lr': 0.0004828481914330687, 'samples': 3754176, 'steps': 19552, 'loss/train': 1.8260117769241333} -11/07/2021 00:00:02 - INFO - __main__ - Step 19554: {'lr': 0.000482846259641724, 'samples': 3754368, 'steps': 19553, 'loss/train': 1.7672523260116577} -11/07/2021 00:00:03 - INFO - __main__ - Step 19555: {'lr': 0.0004828443277454625, 'samples': 3754560, 'steps': 19554, 'loss/train': 1.7993131875991821} -11/07/2021 00:00:04 - INFO - __main__ - Step 19556: {'lr': 0.0004828423957442849, 'samples': 3754752, 'steps': 19555, 'loss/train': 1.248684048652649} -11/07/2021 00:00:04 - INFO - __main__ - Step 19557: {'lr': 0.00048284046363819213, 'samples': 3754944, 'steps': 19556, 'loss/train': 1.7798717021942139} -11/07/2021 00:00:04 - INFO - __main__ - Step 19558: {'lr': 0.000482838531427185, 'samples': 3755136, 'steps': 19557, 'loss/train': 2.2403976917266846} -11/07/2021 00:00:05 - INFO - __main__ - Step 19559: {'lr': 0.00048283659911126445, 'samples': 3755328, 'steps': 19558, 'loss/train': 1.5755736827850342} -11/07/2021 00:00:06 - INFO - __main__ - Step 19560: {'lr': 0.0004828346666904313, 'samples': 3755520, 'steps': 19559, 'loss/train': 1.0093544721603394} -11/07/2021 00:00:06 - INFO - __main__ - Step 19561: {'lr': 0.00048283273416468644, 'samples': 3755712, 'steps': 19560, 'loss/train': 1.3120677471160889} -11/07/2021 00:00:06 - INFO - __main__ - Step 19562: {'lr': 0.0004828308015340307, 'samples': 3755904, 'steps': 19561, 'loss/train': 1.2885136604309082} -11/07/2021 00:00:07 - INFO - __main__ - Step 19563: {'lr': 0.0004828288687984651, 'samples': 3756096, 'steps': 19562, 'loss/train': 1.5286688804626465} -11/07/2021 00:00:07 - INFO - __main__ - Step 19564: {'lr': 0.0004828269359579903, 'samples': 3756288, 'steps': 19563, 'loss/train': 1.8564814329147339} -11/07/2021 00:00:08 - INFO - __main__ - Step 19565: {'lr': 0.00048282500301260735, 'samples': 3756480, 'steps': 19564, 'loss/train': 1.8124595880508423} -11/07/2021 00:00:09 - INFO - __main__ - Step 19566: {'lr': 0.000482823069962317, 'samples': 3756672, 'steps': 19565, 'loss/train': 1.629968285560608} -11/07/2021 00:00:09 - INFO - __main__ - Step 19567: {'lr': 0.0004828211368071202, 'samples': 3756864, 'steps': 19566, 'loss/train': 1.3446823358535767} -11/07/2021 00:00:09 - INFO - __main__ - Step 19568: {'lr': 0.0004828192035470178, 'samples': 3757056, 'steps': 19567, 'loss/train': 1.5391641855239868} -11/07/2021 00:00:10 - INFO - __main__ - Step 19569: {'lr': 0.00048281727018201063, 'samples': 3757248, 'steps': 19568, 'loss/train': 1.3339598178863525} -11/07/2021 00:00:11 - INFO - __main__ - Step 19570: {'lr': 0.00048281533671209955, 'samples': 3757440, 'steps': 19569, 'loss/train': 1.5045450925827026} -11/07/2021 00:00:11 - INFO - __main__ - Step 19571: {'lr': 0.0004828134031372855, 'samples': 3757632, 'steps': 19570, 'loss/train': 1.9711503982543945} -11/07/2021 00:00:11 - INFO - __main__ - Step 19572: {'lr': 0.00048281146945756937, 'samples': 3757824, 'steps': 19571, 'loss/train': 2.07639217376709} -11/07/2021 00:00:12 - INFO - __main__ - Step 19573: {'lr': 0.00048280953567295196, 'samples': 3758016, 'steps': 19572, 'loss/train': 1.6146386861801147} -11/07/2021 00:00:12 - INFO - __main__ - Step 19574: {'lr': 0.0004828076017834342, 'samples': 3758208, 'steps': 19573, 'loss/train': 1.6972767114639282} -11/07/2021 00:00:12 - INFO - __main__ - Step 19575: {'lr': 0.00048280566778901684, 'samples': 3758400, 'steps': 19574, 'loss/train': 1.4834022521972656} -11/07/2021 00:00:13 - INFO - __main__ - Step 19576: {'lr': 0.00048280373368970086, 'samples': 3758592, 'steps': 19575, 'loss/train': 2.030294418334961} -11/07/2021 00:00:14 - INFO - __main__ - Step 19577: {'lr': 0.0004828017994854872, 'samples': 3758784, 'steps': 19576, 'loss/train': 1.447499394416809} -11/07/2021 00:00:14 - INFO - __main__ - Step 19578: {'lr': 0.0004827998651763765, 'samples': 3758976, 'steps': 19577, 'loss/train': 1.5339030027389526} -11/07/2021 00:00:15 - INFO - __main__ - Step 19579: {'lr': 0.0004827979307623699, 'samples': 3759168, 'steps': 19578, 'loss/train': 1.9877415895462036} -11/07/2021 00:00:15 - INFO - __main__ - Step 19580: {'lr': 0.0004827959962434681, 'samples': 3759360, 'steps': 19579, 'loss/train': 1.5659407377243042} -11/07/2021 00:00:16 - INFO - __main__ - Step 19581: {'lr': 0.00048279406161967197, 'samples': 3759552, 'steps': 19580, 'loss/train': 2.1685266494750977} -11/07/2021 00:00:16 - INFO - __main__ - Step 19582: {'lr': 0.0004827921268909825, 'samples': 3759744, 'steps': 19581, 'loss/train': 2.012640953063965} -11/07/2021 00:00:17 - INFO - __main__ - Step 19583: {'lr': 0.0004827901920574005, 'samples': 3759936, 'steps': 19582, 'loss/train': 1.866450548171997} -11/07/2021 00:00:17 - INFO - __main__ - Step 19584: {'lr': 0.0004827882571189268, 'samples': 3760128, 'steps': 19583, 'loss/train': 1.6104263067245483} -11/07/2021 00:00:17 - INFO - __main__ - Step 19585: {'lr': 0.00048278632207556226, 'samples': 3760320, 'steps': 19584, 'loss/train': 1.3908783197402954} -11/07/2021 00:00:19 - INFO - __main__ - Step 19586: {'lr': 0.00048278438692730784, 'samples': 3760512, 'steps': 19585, 'loss/train': 1.4279026985168457} -11/07/2021 00:00:19 - INFO - __main__ - Step 19587: {'lr': 0.00048278245167416434, 'samples': 3760704, 'steps': 19586, 'loss/train': 1.6072896718978882} -11/07/2021 00:00:19 - INFO - __main__ - Step 19588: {'lr': 0.0004827805163161327, 'samples': 3760896, 'steps': 19587, 'loss/train': 1.6472357511520386} -11/07/2021 00:00:20 - INFO - __main__ - Step 19589: {'lr': 0.0004827785808532137, 'samples': 3761088, 'steps': 19588, 'loss/train': 2.886787176132202} -11/07/2021 00:00:20 - INFO - __main__ - Step 19590: {'lr': 0.0004827766452854083, 'samples': 3761280, 'steps': 19589, 'loss/train': 1.579707145690918} -11/07/2021 00:00:20 - INFO - __main__ - Step 19591: {'lr': 0.0004827747096127173, 'samples': 3761472, 'steps': 19590, 'loss/train': 1.1529046297073364} -11/07/2021 00:00:21 - INFO - __main__ - Step 19592: {'lr': 0.00048277277383514165, 'samples': 3761664, 'steps': 19591, 'loss/train': 1.4161953926086426} -11/07/2021 00:00:22 - INFO - __main__ - Step 19593: {'lr': 0.00048277083795268216, 'samples': 3761856, 'steps': 19592, 'loss/train': 2.133817434310913} -11/07/2021 00:00:22 - INFO - __main__ - Step 19594: {'lr': 0.0004827689019653397, 'samples': 3762048, 'steps': 19593, 'loss/train': 1.4859519004821777} -11/07/2021 00:00:22 - INFO - __main__ - Step 19595: {'lr': 0.00048276696587311525, 'samples': 3762240, 'steps': 19594, 'loss/train': 1.380395770072937} -11/07/2021 00:00:23 - INFO - __main__ - Step 19596: {'lr': 0.00048276502967600955, 'samples': 3762432, 'steps': 19595, 'loss/train': 1.3329964876174927} -11/07/2021 00:00:24 - INFO - __main__ - Step 19597: {'lr': 0.00048276309337402345, 'samples': 3762624, 'steps': 19596, 'loss/train': 1.8443204164505005} -11/07/2021 00:00:24 - INFO - __main__ - Step 19598: {'lr': 0.000482761156967158, 'samples': 3762816, 'steps': 19597, 'loss/train': 1.332189917564392} -11/07/2021 00:00:25 - INFO - __main__ - Step 19599: {'lr': 0.0004827592204554139, 'samples': 3763008, 'steps': 19598, 'loss/train': 1.2490015029907227} -11/07/2021 00:00:25 - INFO - __main__ - Step 19600: {'lr': 0.00048275728383879215, 'samples': 3763200, 'steps': 19599, 'loss/train': 1.4692695140838623} -11/07/2021 00:00:25 - INFO - __main__ - Step 19601: {'lr': 0.0004827553471172935, 'samples': 3763392, 'steps': 19600, 'loss/train': 1.5272186994552612} -11/07/2021 00:00:26 - INFO - __main__ - Step 19602: {'lr': 0.00048275341029091885, 'samples': 3763584, 'steps': 19601, 'loss/train': 1.5676167011260986} -11/07/2021 00:00:27 - INFO - __main__ - Step 19603: {'lr': 0.0004827514733596692, 'samples': 3763776, 'steps': 19602, 'loss/train': 1.6951826810836792} -11/07/2021 00:00:27 - INFO - __main__ - Step 19604: {'lr': 0.00048274953632354524, 'samples': 3763968, 'steps': 19603, 'loss/train': 1.893367886543274} -11/07/2021 00:00:27 - INFO - __main__ - Step 19605: {'lr': 0.000482747599182548, 'samples': 3764160, 'steps': 19604, 'loss/train': 1.5247362852096558} -11/07/2021 00:00:28 - INFO - __main__ - Step 19606: {'lr': 0.00048274566193667824, 'samples': 3764352, 'steps': 19605, 'loss/train': 1.5493274927139282} -11/07/2021 00:00:29 - INFO - __main__ - Step 19607: {'lr': 0.0004827437245859369, 'samples': 3764544, 'steps': 19606, 'loss/train': 1.8292338848114014} -11/07/2021 00:00:29 - INFO - __main__ - Step 19608: {'lr': 0.0004827417871303248, 'samples': 3764736, 'steps': 19607, 'loss/train': 1.5020709037780762} -11/07/2021 00:00:29 - INFO - __main__ - Step 19609: {'lr': 0.00048273984956984285, 'samples': 3764928, 'steps': 19608, 'loss/train': 1.4957561492919922} -11/07/2021 00:00:30 - INFO - __main__ - Step 19610: {'lr': 0.0004827379119044919, 'samples': 3765120, 'steps': 19609, 'loss/train': 1.7140650749206543} -11/07/2021 00:00:30 - INFO - __main__ - Step 19611: {'lr': 0.00048273597413427284, 'samples': 3765312, 'steps': 19610, 'loss/train': 1.3099769353866577} -11/07/2021 00:00:30 - INFO - __main__ - Step 19612: {'lr': 0.00048273403625918653, 'samples': 3765504, 'steps': 19611, 'loss/train': 1.9554831981658936} -11/07/2021 00:00:31 - INFO - __main__ - Step 19613: {'lr': 0.0004827320982792339, 'samples': 3765696, 'steps': 19612, 'loss/train': 1.5525972843170166} -11/07/2021 00:00:32 - INFO - __main__ - Step 19614: {'lr': 0.00048273016019441585, 'samples': 3765888, 'steps': 19613, 'loss/train': 1.6005520820617676} -11/07/2021 00:00:32 - INFO - __main__ - Step 19615: {'lr': 0.00048272822200473304, 'samples': 3766080, 'steps': 19614, 'loss/train': 1.727546215057373} -11/07/2021 00:00:32 - INFO - __main__ - Step 19616: {'lr': 0.0004827262837101866, 'samples': 3766272, 'steps': 19615, 'loss/train': 1.532706618309021} -11/07/2021 00:00:33 - INFO - __main__ - Step 19617: {'lr': 0.0004827243453107772, 'samples': 3766464, 'steps': 19616, 'loss/train': 1.8534809350967407} -11/07/2021 00:00:34 - INFO - __main__ - Step 19618: {'lr': 0.0004827224068065058, 'samples': 3766656, 'steps': 19617, 'loss/train': 1.6946210861206055} -11/07/2021 00:00:34 - INFO - __main__ - Step 19619: {'lr': 0.0004827204681973733, 'samples': 3766848, 'steps': 19618, 'loss/train': 1.5758514404296875} -11/07/2021 00:00:35 - INFO - __main__ - Step 19620: {'lr': 0.00048271852948338057, 'samples': 3767040, 'steps': 19619, 'loss/train': 1.195085048675537} -11/07/2021 00:00:35 - INFO - __main__ - Step 19621: {'lr': 0.00048271659066452847, 'samples': 3767232, 'steps': 19620, 'loss/train': 1.3183504343032837} -11/07/2021 00:00:35 - INFO - __main__ - Step 19622: {'lr': 0.0004827146517408178, 'samples': 3767424, 'steps': 19621, 'loss/train': 1.5881609916687012} -11/07/2021 00:00:36 - INFO - __main__ - Step 19623: {'lr': 0.0004827127127122495, 'samples': 3767616, 'steps': 19622, 'loss/train': 1.7038828134536743} -11/07/2021 00:00:37 - INFO - __main__ - Step 19624: {'lr': 0.00048271077357882455, 'samples': 3767808, 'steps': 19623, 'loss/train': 1.7045823335647583} -11/07/2021 00:00:37 - INFO - __main__ - Step 19625: {'lr': 0.00048270883434054364, 'samples': 3768000, 'steps': 19624, 'loss/train': 1.2590144872665405} -11/07/2021 00:00:37 - INFO - __main__ - Step 19626: {'lr': 0.00048270689499740774, 'samples': 3768192, 'steps': 19625, 'loss/train': 1.5791674852371216} -11/07/2021 00:00:38 - INFO - __main__ - Step 19627: {'lr': 0.0004827049555494176, 'samples': 3768384, 'steps': 19626, 'loss/train': 1.9357750415802002} -11/07/2021 00:00:39 - INFO - __main__ - Step 19628: {'lr': 0.00048270301599657436, 'samples': 3768576, 'steps': 19627, 'loss/train': 1.0141645669937134} -11/07/2021 00:00:39 - INFO - __main__ - Step 19629: {'lr': 0.0004827010763388786, 'samples': 3768768, 'steps': 19628, 'loss/train': 1.4488344192504883} -11/07/2021 00:00:39 - INFO - __main__ - Step 19630: {'lr': 0.00048269913657633147, 'samples': 3768960, 'steps': 19629, 'loss/train': 1.4897490739822388} -11/07/2021 00:00:40 - INFO - __main__ - Step 19631: {'lr': 0.00048269719670893357, 'samples': 3769152, 'steps': 19630, 'loss/train': 1.842172384262085} -11/07/2021 00:00:40 - INFO - __main__ - Step 19632: {'lr': 0.00048269525673668595, 'samples': 3769344, 'steps': 19631, 'loss/train': 1.7020254135131836} -11/07/2021 00:00:41 - INFO - __main__ - Step 19633: {'lr': 0.00048269331665958947, 'samples': 3769536, 'steps': 19632, 'loss/train': 1.7664917707443237} -11/07/2021 00:00:42 - INFO - __main__ - Step 19634: {'lr': 0.00048269137647764495, 'samples': 3769728, 'steps': 19633, 'loss/train': 1.8792760372161865} -11/07/2021 00:00:42 - INFO - __main__ - Step 19635: {'lr': 0.00048268943619085325, 'samples': 3769920, 'steps': 19634, 'loss/train': 1.3441412448883057} -11/07/2021 00:00:42 - INFO - __main__ - Step 19636: {'lr': 0.00048268749579921536, 'samples': 3770112, 'steps': 19635, 'loss/train': 1.066512107849121} -11/07/2021 00:00:43 - INFO - __main__ - Step 19637: {'lr': 0.00048268555530273197, 'samples': 3770304, 'steps': 19636, 'loss/train': 2.038100481033325} -11/07/2021 00:00:43 - INFO - __main__ - Step 19638: {'lr': 0.0004826836147014041, 'samples': 3770496, 'steps': 19637, 'loss/train': 1.2827800512313843} -11/07/2021 00:00:44 - INFO - __main__ - Step 19639: {'lr': 0.0004826816739952326, 'samples': 3770688, 'steps': 19638, 'loss/train': 1.3848270177841187} -11/07/2021 00:00:44 - INFO - __main__ - Step 19640: {'lr': 0.0004826797331842183, 'samples': 3770880, 'steps': 19639, 'loss/train': 1.6651759147644043} -11/07/2021 00:00:45 - INFO - __main__ - Step 19641: {'lr': 0.0004826777922683622, 'samples': 3771072, 'steps': 19640, 'loss/train': 1.8310139179229736} -11/07/2021 00:00:45 - INFO - __main__ - Step 19642: {'lr': 0.0004826758512476649, 'samples': 3771264, 'steps': 19641, 'loss/train': 1.6785047054290771} -11/07/2021 00:00:45 - INFO - __main__ - Step 19643: {'lr': 0.0004826739101221276, 'samples': 3771456, 'steps': 19642, 'loss/train': 1.0879031419754028} -11/07/2021 00:00:46 - INFO - __main__ - Step 19644: {'lr': 0.000482671968891751, 'samples': 3771648, 'steps': 19643, 'loss/train': 1.537487268447876} -11/07/2021 00:00:47 - INFO - __main__ - Step 19645: {'lr': 0.000482670027556536, 'samples': 3771840, 'steps': 19644, 'loss/train': 1.6221253871917725} -11/07/2021 00:00:47 - INFO - __main__ - Step 19646: {'lr': 0.0004826680861164834, 'samples': 3772032, 'steps': 19645, 'loss/train': 1.3264529705047607} -11/07/2021 00:00:47 - INFO - __main__ - Step 19647: {'lr': 0.00048266614457159426, 'samples': 3772224, 'steps': 19646, 'loss/train': 1.3037407398223877} -11/07/2021 00:00:48 - INFO - __main__ - Step 19648: {'lr': 0.0004826642029218693, 'samples': 3772416, 'steps': 19647, 'loss/train': 1.428112268447876} -11/07/2021 00:00:49 - INFO - __main__ - Step 19649: {'lr': 0.00048266226116730937, 'samples': 3772608, 'steps': 19648, 'loss/train': 1.5353032350540161} -11/07/2021 00:00:49 - INFO - __main__ - Step 19650: {'lr': 0.00048266031930791555, 'samples': 3772800, 'steps': 19649, 'loss/train': 1.3815804719924927} -11/07/2021 00:00:49 - INFO - __main__ - Step 19651: {'lr': 0.0004826583773436884, 'samples': 3772992, 'steps': 19650, 'loss/train': 1.9578912258148193} -11/07/2021 00:00:50 - INFO - __main__ - Step 19652: {'lr': 0.00048265643527462915, 'samples': 3773184, 'steps': 19651, 'loss/train': 1.3772332668304443} -11/07/2021 00:00:50 - INFO - __main__ - Step 19653: {'lr': 0.00048265449310073847, 'samples': 3773376, 'steps': 19652, 'loss/train': 1.2029601335525513} -11/07/2021 00:00:51 - INFO - __main__ - Step 19654: {'lr': 0.0004826525508220172, 'samples': 3773568, 'steps': 19653, 'loss/train': 1.0753741264343262} -11/07/2021 00:00:52 - INFO - __main__ - Step 19655: {'lr': 0.0004826506084384663, 'samples': 3773760, 'steps': 19654, 'loss/train': 1.2957723140716553} -11/07/2021 00:00:52 - INFO - __main__ - Step 19656: {'lr': 0.00048264866595008665, 'samples': 3773952, 'steps': 19655, 'loss/train': 1.1646695137023926} -11/07/2021 00:00:52 - INFO - __main__ - Step 19657: {'lr': 0.0004826467233568791, 'samples': 3774144, 'steps': 19656, 'loss/train': 1.3596159219741821} -11/07/2021 00:00:53 - INFO - __main__ - Step 19658: {'lr': 0.00048264478065884454, 'samples': 3774336, 'steps': 19657, 'loss/train': 1.6303644180297852} -11/07/2021 00:00:54 - INFO - __main__ - Step 19659: {'lr': 0.0004826428378559838, 'samples': 3774528, 'steps': 19658, 'loss/train': 1.8354287147521973} -11/07/2021 00:00:54 - INFO - __main__ - Step 19660: {'lr': 0.00048264089494829776, 'samples': 3774720, 'steps': 19659, 'loss/train': 1.5434880256652832} -11/07/2021 00:00:54 - INFO - __main__ - Step 19661: {'lr': 0.0004826389519357874, 'samples': 3774912, 'steps': 19660, 'loss/train': 1.5627186298370361} -11/07/2021 00:00:55 - INFO - __main__ - Step 19662: {'lr': 0.00048263700881845346, 'samples': 3775104, 'steps': 19661, 'loss/train': 2.0011045932769775} -11/07/2021 00:00:55 - INFO - __main__ - Step 19663: {'lr': 0.00048263506559629687, 'samples': 3775296, 'steps': 19662, 'loss/train': 1.4480820894241333} -11/07/2021 00:00:56 - INFO - __main__ - Step 19664: {'lr': 0.00048263312226931853, 'samples': 3775488, 'steps': 19663, 'loss/train': 2.256391763687134} -11/07/2021 00:00:56 - INFO - __main__ - Step 19665: {'lr': 0.0004826311788375193, 'samples': 3775680, 'steps': 19664, 'loss/train': 1.180256962776184} -11/07/2021 00:00:57 - INFO - __main__ - Step 19666: {'lr': 0.00048262923530090007, 'samples': 3775872, 'steps': 19665, 'loss/train': 1.7530802488327026} -11/07/2021 00:00:57 - INFO - __main__ - Step 19667: {'lr': 0.0004826272916594616, 'samples': 3776064, 'steps': 19666, 'loss/train': 1.6622743606567383} -11/07/2021 00:00:58 - INFO - __main__ - Step 19668: {'lr': 0.000482625347913205, 'samples': 3776256, 'steps': 19667, 'loss/train': 1.727860450744629} -11/07/2021 00:00:59 - INFO - __main__ - Step 19669: {'lr': 0.0004826234040621309, 'samples': 3776448, 'steps': 19668, 'loss/train': 1.6675604581832886} -11/07/2021 00:00:59 - INFO - __main__ - Step 19670: {'lr': 0.00048262146010624035, 'samples': 3776640, 'steps': 19669, 'loss/train': 1.950370192527771} -11/07/2021 00:00:59 - INFO - __main__ - Step 19671: {'lr': 0.0004826195160455341, 'samples': 3776832, 'steps': 19670, 'loss/train': 1.9079294204711914} -11/07/2021 00:01:00 - INFO - __main__ - Step 19672: {'lr': 0.00048261757188001314, 'samples': 3777024, 'steps': 19671, 'loss/train': 1.0746430158615112} -11/07/2021 00:01:00 - INFO - __main__ - Step 19673: {'lr': 0.00048261562760967824, 'samples': 3777216, 'steps': 19672, 'loss/train': 1.936623215675354} -11/07/2021 00:01:00 - INFO - __main__ - Step 19674: {'lr': 0.0004826136832345304, 'samples': 3777408, 'steps': 19673, 'loss/train': 1.9064000844955444} -11/07/2021 00:01:01 - INFO - __main__ - Step 19675: {'lr': 0.00048261173875457035, 'samples': 3777600, 'steps': 19674, 'loss/train': 2.2525835037231445} -11/07/2021 00:01:02 - INFO - __main__ - Step 19676: {'lr': 0.0004826097941697991, 'samples': 3777792, 'steps': 19675, 'loss/train': 1.700140118598938} -11/07/2021 00:01:02 - INFO - __main__ - Step 19677: {'lr': 0.0004826078494802174, 'samples': 3777984, 'steps': 19676, 'loss/train': 1.8438869714736938} -11/07/2021 00:01:02 - INFO - __main__ - Step 19678: {'lr': 0.00048260590468582624, 'samples': 3778176, 'steps': 19677, 'loss/train': 1.5107479095458984} -11/07/2021 00:01:03 - INFO - __main__ - Step 19679: {'lr': 0.0004826039597866265, 'samples': 3778368, 'steps': 19678, 'loss/train': 1.5821765661239624} -11/07/2021 00:01:04 - INFO - __main__ - Step 19680: {'lr': 0.00048260201478261887, 'samples': 3778560, 'steps': 19679, 'loss/train': 1.5964267253875732} -11/07/2021 00:01:04 - INFO - __main__ - Step 19681: {'lr': 0.0004826000696738045, 'samples': 3778752, 'steps': 19680, 'loss/train': 1.6593513488769531} -11/07/2021 00:01:05 - INFO - __main__ - Step 19682: {'lr': 0.000482598124460184, 'samples': 3778944, 'steps': 19681, 'loss/train': 0.817847490310669} -11/07/2021 00:01:05 - INFO - __main__ - Step 19683: {'lr': 0.00048259617914175846, 'samples': 3779136, 'steps': 19682, 'loss/train': 1.4910651445388794} -11/07/2021 00:01:05 - INFO - __main__ - Step 19684: {'lr': 0.00048259423371852867, 'samples': 3779328, 'steps': 19683, 'loss/train': 1.6026617288589478} -11/07/2021 00:01:06 - INFO - __main__ - Step 19685: {'lr': 0.0004825922881904955, 'samples': 3779520, 'steps': 19684, 'loss/train': 1.4363633394241333} -11/07/2021 00:01:07 - INFO - __main__ - Step 19686: {'lr': 0.00048259034255765984, 'samples': 3779712, 'steps': 19685, 'loss/train': 1.4773492813110352} -11/07/2021 00:01:07 - INFO - __main__ - Step 19687: {'lr': 0.00048258839682002253, 'samples': 3779904, 'steps': 19686, 'loss/train': 0.8131615519523621} -11/07/2021 00:01:07 - INFO - __main__ - Step 19688: {'lr': 0.00048258645097758445, 'samples': 3780096, 'steps': 19687, 'loss/train': 1.3371987342834473} -11/07/2021 00:01:08 - INFO - __main__ - Step 19689: {'lr': 0.0004825845050303466, 'samples': 3780288, 'steps': 19688, 'loss/train': 1.4941506385803223} -11/07/2021 00:01:09 - INFO - __main__ - Step 19690: {'lr': 0.00048258255897830967, 'samples': 3780480, 'steps': 19689, 'loss/train': 1.6974849700927734} -11/07/2021 00:01:09 - INFO - __main__ - Step 19691: {'lr': 0.0004825806128214747, 'samples': 3780672, 'steps': 19690, 'loss/train': 1.7099860906600952} -11/07/2021 00:01:09 - INFO - __main__ - Step 19692: {'lr': 0.00048257866655984237, 'samples': 3780864, 'steps': 19691, 'loss/train': 1.6285266876220703} -11/07/2021 00:01:10 - INFO - __main__ - Step 19693: {'lr': 0.0004825767201934138, 'samples': 3781056, 'steps': 19692, 'loss/train': 1.9358177185058594} -11/07/2021 00:01:10 - INFO - __main__ - Step 19694: {'lr': 0.0004825747737221897, 'samples': 3781248, 'steps': 19693, 'loss/train': 1.5827686786651611} -11/07/2021 00:01:11 - INFO - __main__ - Step 19695: {'lr': 0.000482572827146171, 'samples': 3781440, 'steps': 19694, 'loss/train': 1.8137426376342773} -11/07/2021 00:01:11 - INFO - __main__ - Step 19696: {'lr': 0.00048257088046535864, 'samples': 3781632, 'steps': 19695, 'loss/train': 1.3611456155776978} -11/07/2021 00:01:12 - INFO - __main__ - Step 19697: {'lr': 0.0004825689336797534, 'samples': 3781824, 'steps': 19696, 'loss/train': 1.5496810674667358} -11/07/2021 00:01:12 - INFO - __main__ - Step 19698: {'lr': 0.00048256698678935615, 'samples': 3782016, 'steps': 19697, 'loss/train': 1.8349579572677612} -11/07/2021 00:01:13 - INFO - __main__ - Step 19699: {'lr': 0.00048256503979416776, 'samples': 3782208, 'steps': 19698, 'loss/train': 1.5465449094772339} -11/07/2021 00:01:13 - INFO - __main__ - Step 19700: {'lr': 0.0004825630926941892, 'samples': 3782400, 'steps': 19699, 'loss/train': 1.3311418294906616} -11/07/2021 00:01:14 - INFO - __main__ - Step 19701: {'lr': 0.0004825611454894213, 'samples': 3782592, 'steps': 19700, 'loss/train': 1.6302708387374878} -11/07/2021 00:01:14 - INFO - __main__ - Step 19702: {'lr': 0.000482559198179865, 'samples': 3782784, 'steps': 19701, 'loss/train': 1.5560293197631836} -11/07/2021 00:01:15 - INFO - __main__ - Step 19703: {'lr': 0.00048255725076552103, 'samples': 3782976, 'steps': 19702, 'loss/train': 1.8703819513320923} -11/07/2021 00:01:15 - INFO - __main__ - Step 19704: {'lr': 0.0004825553032463904, 'samples': 3783168, 'steps': 19703, 'loss/train': 1.48812735080719} -11/07/2021 00:01:15 - INFO - __main__ - Step 19705: {'lr': 0.00048255335562247395, 'samples': 3783360, 'steps': 19704, 'loss/train': 1.8443870544433594} -11/07/2021 00:01:16 - INFO - __main__ - Step 19706: {'lr': 0.0004825514078937725, 'samples': 3783552, 'steps': 19705, 'loss/train': 1.9899576902389526} -11/07/2021 00:01:17 - INFO - __main__ - Step 19707: {'lr': 0.000482549460060287, 'samples': 3783744, 'steps': 19706, 'loss/train': 1.6891878843307495} -11/07/2021 00:01:17 - INFO - __main__ - Step 19708: {'lr': 0.0004825475121220183, 'samples': 3783936, 'steps': 19707, 'loss/train': 1.7115875482559204} -11/07/2021 00:01:17 - INFO - __main__ - Step 19709: {'lr': 0.0004825455640789672, 'samples': 3784128, 'steps': 19708, 'loss/train': 2.0251336097717285} -11/07/2021 00:01:18 - INFO - __main__ - Step 19710: {'lr': 0.00048254361593113475, 'samples': 3784320, 'steps': 19709, 'loss/train': 1.9587410688400269} -11/07/2021 00:01:19 - INFO - __main__ - Step 19711: {'lr': 0.0004825416676785217, 'samples': 3784512, 'steps': 19710, 'loss/train': 2.022176742553711} -11/07/2021 00:01:19 - INFO - __main__ - Step 19712: {'lr': 0.000482539719321129, 'samples': 3784704, 'steps': 19711, 'loss/train': 2.0017166137695312} -11/07/2021 00:01:19 - INFO - __main__ - Step 19713: {'lr': 0.00048253777085895745, 'samples': 3784896, 'steps': 19712, 'loss/train': 1.0912806987762451} -11/07/2021 00:01:20 - INFO - __main__ - Step 19714: {'lr': 0.000482535822292008, 'samples': 3785088, 'steps': 19713, 'loss/train': 1.5614527463912964} -11/07/2021 00:01:20 - INFO - __main__ - Step 19715: {'lr': 0.0004825338736202815, 'samples': 3785280, 'steps': 19714, 'loss/train': 1.2009432315826416} -11/07/2021 00:01:21 - INFO - __main__ - Step 19716: {'lr': 0.00048253192484377884, 'samples': 3785472, 'steps': 19715, 'loss/train': 1.6705501079559326} -11/07/2021 00:01:21 - INFO - __main__ - Step 19717: {'lr': 0.0004825299759625008, 'samples': 3785664, 'steps': 19716, 'loss/train': 1.6005103588104248} -11/07/2021 00:01:22 - INFO - __main__ - Step 19718: {'lr': 0.0004825280269764484, 'samples': 3785856, 'steps': 19717, 'loss/train': 1.6898348331451416} -11/07/2021 00:01:22 - INFO - __main__ - Step 19719: {'lr': 0.0004825260778856224, 'samples': 3786048, 'steps': 19718, 'loss/train': 1.2682095766067505} -11/07/2021 00:01:22 - INFO - __main__ - Step 19720: {'lr': 0.0004825241286900238, 'samples': 3786240, 'steps': 19719, 'loss/train': 1.398619294166565} -11/07/2021 00:01:24 - INFO - __main__ - Step 19721: {'lr': 0.0004825221793896535, 'samples': 3786432, 'steps': 19720, 'loss/train': 1.7995117902755737} -11/07/2021 00:01:24 - INFO - __main__ - Step 19722: {'lr': 0.0004825202299845122, 'samples': 3786624, 'steps': 19721, 'loss/train': 1.4003227949142456} -11/07/2021 00:01:24 - INFO - __main__ - Step 19723: {'lr': 0.00048251828047460077, 'samples': 3786816, 'steps': 19722, 'loss/train': 1.677733063697815} -11/07/2021 00:01:25 - INFO - __main__ - Step 19724: {'lr': 0.0004825163308599203, 'samples': 3787008, 'steps': 19723, 'loss/train': 1.8848963975906372} -11/07/2021 00:01:25 - INFO - __main__ - Step 19725: {'lr': 0.0004825143811404716, 'samples': 3787200, 'steps': 19724, 'loss/train': 1.6684176921844482} -11/07/2021 00:01:26 - INFO - __main__ - Step 19726: {'lr': 0.00048251243131625543, 'samples': 3787392, 'steps': 19725, 'loss/train': 1.2181226015090942} -11/07/2021 00:01:27 - INFO - __main__ - Step 19727: {'lr': 0.0004825104813872728, 'samples': 3787584, 'steps': 19726, 'loss/train': 1.703728437423706} -11/07/2021 00:01:27 - INFO - __main__ - Step 19728: {'lr': 0.0004825085313535245, 'samples': 3787776, 'steps': 19727, 'loss/train': 1.7474498748779297} -11/07/2021 00:01:27 - INFO - __main__ - Step 19729: {'lr': 0.00048250658121501145, 'samples': 3787968, 'steps': 19728, 'loss/train': 0.8166286945343018} -11/07/2021 00:01:28 - INFO - __main__ - Step 19730: {'lr': 0.00048250463097173447, 'samples': 3788160, 'steps': 19729, 'loss/train': 1.8923614025115967} -11/07/2021 00:01:29 - INFO - __main__ - Step 19731: {'lr': 0.0004825026806236946, 'samples': 3788352, 'steps': 19730, 'loss/train': 1.692439079284668} -11/07/2021 00:01:29 - INFO - __main__ - Step 19732: {'lr': 0.00048250073017089257, 'samples': 3788544, 'steps': 19731, 'loss/train': 1.34873366355896} -11/07/2021 00:01:30 - INFO - __main__ - Step 19733: {'lr': 0.00048249877961332923, 'samples': 3788736, 'steps': 19732, 'loss/train': 1.4355651140213013} -11/07/2021 00:01:30 - INFO - __main__ - Step 19734: {'lr': 0.0004824968289510056, 'samples': 3788928, 'steps': 19733, 'loss/train': 3.0089304447174072} -11/07/2021 00:01:30 - INFO - __main__ - Step 19735: {'lr': 0.0004824948781839225, 'samples': 3789120, 'steps': 19734, 'loss/train': 1.7068781852722168} -11/07/2021 00:01:31 - INFO - __main__ - Step 19736: {'lr': 0.0004824929273120807, 'samples': 3789312, 'steps': 19735, 'loss/train': 2.0317676067352295} -11/07/2021 00:01:32 - INFO - __main__ - Step 19737: {'lr': 0.0004824909763354813, 'samples': 3789504, 'steps': 19736, 'loss/train': 1.9025362730026245} -11/07/2021 00:01:32 - INFO - __main__ - Step 19738: {'lr': 0.00048248902525412497, 'samples': 3789696, 'steps': 19737, 'loss/train': 1.912577748298645} -11/07/2021 00:01:32 - INFO - __main__ - Step 19739: {'lr': 0.0004824870740680127, 'samples': 3789888, 'steps': 19738, 'loss/train': 2.0602569580078125} -11/07/2021 00:01:33 - INFO - __main__ - Step 19740: {'lr': 0.0004824851227771453, 'samples': 3790080, 'steps': 19739, 'loss/train': 1.4696168899536133} -11/07/2021 00:01:33 - INFO - __main__ - Step 19741: {'lr': 0.00048248317138152374, 'samples': 3790272, 'steps': 19740, 'loss/train': 2.4418163299560547} -11/07/2021 00:01:34 - INFO - __main__ - Step 19742: {'lr': 0.00048248121988114887, 'samples': 3790464, 'steps': 19741, 'loss/train': 1.8438314199447632} -11/07/2021 00:01:34 - INFO - __main__ - Step 19743: {'lr': 0.00048247926827602153, 'samples': 3790656, 'steps': 19742, 'loss/train': 1.5355260372161865} -11/07/2021 00:01:35 - INFO - __main__ - Step 19744: {'lr': 0.0004824773165661426, 'samples': 3790848, 'steps': 19743, 'loss/train': 1.5468591451644897} -11/07/2021 00:01:35 - INFO - __main__ - Step 19745: {'lr': 0.000482475364751513, 'samples': 3791040, 'steps': 19744, 'loss/train': 1.805572271347046} -11/07/2021 00:01:35 - INFO - __main__ - Step 19746: {'lr': 0.0004824734128321335, 'samples': 3791232, 'steps': 19745, 'loss/train': 1.6561604738235474} -11/07/2021 00:01:36 - INFO - __main__ - Step 19747: {'lr': 0.0004824714608080052, 'samples': 3791424, 'steps': 19746, 'loss/train': 1.387292504310608} -11/07/2021 00:01:37 - INFO - __main__ - Step 19748: {'lr': 0.00048246950867912873, 'samples': 3791616, 'steps': 19747, 'loss/train': 1.7688283920288086} -11/07/2021 00:01:37 - INFO - __main__ - Step 19749: {'lr': 0.0004824675564455052, 'samples': 3791808, 'steps': 19748, 'loss/train': 4.455977916717529} -11/07/2021 00:01:38 - INFO - __main__ - Step 19750: {'lr': 0.0004824656041071353, 'samples': 3792000, 'steps': 19749, 'loss/train': 1.741172432899475} -11/07/2021 00:01:38 - INFO - __main__ - Step 19751: {'lr': 0.00048246365166402003, 'samples': 3792192, 'steps': 19750, 'loss/train': 1.72153902053833} -11/07/2021 00:01:39 - INFO - __main__ - Step 19752: {'lr': 0.00048246169911616015, 'samples': 3792384, 'steps': 19751, 'loss/train': 1.7890325784683228} -11/07/2021 00:01:39 - INFO - __main__ - Step 19753: {'lr': 0.00048245974646355673, 'samples': 3792576, 'steps': 19752, 'loss/train': 1.2916069030761719} -11/07/2021 00:01:40 - INFO - __main__ - Step 19754: {'lr': 0.00048245779370621045, 'samples': 3792768, 'steps': 19753, 'loss/train': 1.873506784439087} -11/07/2021 00:01:40 - INFO - __main__ - Step 19755: {'lr': 0.0004824558408441223, 'samples': 3792960, 'steps': 19754, 'loss/train': 1.3477427959442139} -11/07/2021 00:01:40 - INFO - __main__ - Step 19756: {'lr': 0.00048245388787729316, 'samples': 3793152, 'steps': 19755, 'loss/train': 1.5922755002975464} -11/07/2021 00:01:41 - INFO - __main__ - Step 19757: {'lr': 0.00048245193480572383, 'samples': 3793344, 'steps': 19756, 'loss/train': 1.3742207288742065} -11/07/2021 00:01:42 - INFO - __main__ - Step 19758: {'lr': 0.0004824499816294152, 'samples': 3793536, 'steps': 19757, 'loss/train': 1.4603769779205322} -11/07/2021 00:01:42 - INFO - __main__ - Step 19759: {'lr': 0.0004824480283483683, 'samples': 3793728, 'steps': 19758, 'loss/train': 1.604667067527771} -11/07/2021 00:01:42 - INFO - __main__ - Step 19760: {'lr': 0.0004824460749625839, 'samples': 3793920, 'steps': 19759, 'loss/train': 1.4646573066711426} -11/07/2021 00:01:43 - INFO - __main__ - Step 19761: {'lr': 0.00048244412147206283, 'samples': 3794112, 'steps': 19760, 'loss/train': 1.8121919631958008} -11/07/2021 00:01:43 - INFO - __main__ - Step 19762: {'lr': 0.00048244216787680607, 'samples': 3794304, 'steps': 19761, 'loss/train': 1.9884823560714722} -11/07/2021 00:01:44 - INFO - __main__ - Step 19763: {'lr': 0.0004824402141768145, 'samples': 3794496, 'steps': 19762, 'loss/train': 1.7847453355789185} -11/07/2021 00:01:45 - INFO - __main__ - Step 19764: {'lr': 0.0004824382603720888, 'samples': 3794688, 'steps': 19763, 'loss/train': 1.5830997228622437} -11/07/2021 00:01:45 - INFO - __main__ - Step 19765: {'lr': 0.00048243630646263016, 'samples': 3794880, 'steps': 19764, 'loss/train': 0.8904869556427002} -11/07/2021 00:01:46 - INFO - __main__ - Step 19766: {'lr': 0.00048243435244843926, 'samples': 3795072, 'steps': 19765, 'loss/train': 2.7253293991088867} -11/07/2021 00:01:46 - INFO - __main__ - Step 19767: {'lr': 0.000482432398329517, 'samples': 3795264, 'steps': 19766, 'loss/train': 1.6028205156326294} -11/07/2021 00:01:47 - INFO - __main__ - Step 19768: {'lr': 0.00048243044410586433, 'samples': 3795456, 'steps': 19767, 'loss/train': 1.8924862146377563} -11/07/2021 00:01:47 - INFO - __main__ - Step 19769: {'lr': 0.00048242848977748205, 'samples': 3795648, 'steps': 19768, 'loss/train': 1.5213522911071777} -11/07/2021 00:01:48 - INFO - __main__ - Step 19770: {'lr': 0.0004824265353443711, 'samples': 3795840, 'steps': 19769, 'loss/train': 1.878341794013977} -11/07/2021 00:01:48 - INFO - __main__ - Step 19771: {'lr': 0.00048242458080653233, 'samples': 3796032, 'steps': 19770, 'loss/train': 1.079317569732666} -11/07/2021 00:01:48 - INFO - __main__ - Step 19772: {'lr': 0.0004824226261639666, 'samples': 3796224, 'steps': 19771, 'loss/train': 1.2419971227645874} -11/07/2021 00:01:49 - INFO - __main__ - Step 19773: {'lr': 0.00048242067141667487, 'samples': 3796416, 'steps': 19772, 'loss/train': 1.6807929277420044} -11/07/2021 00:01:50 - INFO - __main__ - Step 19774: {'lr': 0.00048241871656465795, 'samples': 3796608, 'steps': 19773, 'loss/train': 1.5872936248779297} -11/07/2021 00:01:50 - INFO - __main__ - Step 19775: {'lr': 0.0004824167616079168, 'samples': 3796800, 'steps': 19774, 'loss/train': 0.9091289639472961} -11/07/2021 00:01:50 - INFO - __main__ - Step 19776: {'lr': 0.0004824148065464522, 'samples': 3796992, 'steps': 19775, 'loss/train': 0.828349232673645} -11/07/2021 00:01:51 - INFO - __main__ - Step 19777: {'lr': 0.00048241285138026505, 'samples': 3797184, 'steps': 19776, 'loss/train': 1.399821400642395} -11/07/2021 00:01:52 - INFO - __main__ - Step 19778: {'lr': 0.00048241089610935627, 'samples': 3797376, 'steps': 19777, 'loss/train': 1.6102732419967651} -11/07/2021 00:01:52 - INFO - __main__ - Step 19779: {'lr': 0.0004824089407337267, 'samples': 3797568, 'steps': 19778, 'loss/train': 1.6403769254684448} -11/07/2021 00:01:52 - INFO - __main__ - Step 19780: {'lr': 0.00048240698525337726, 'samples': 3797760, 'steps': 19779, 'loss/train': 1.7121052742004395} -11/07/2021 00:01:53 - INFO - __main__ - Step 19781: {'lr': 0.0004824050296683089, 'samples': 3797952, 'steps': 19780, 'loss/train': 1.6432030200958252} -11/07/2021 00:01:53 - INFO - __main__ - Step 19782: {'lr': 0.0004824030739785223, 'samples': 3798144, 'steps': 19781, 'loss/train': 1.6968430280685425} -11/07/2021 00:01:53 - INFO - __main__ - Step 19783: {'lr': 0.00048240111818401854, 'samples': 3798336, 'steps': 19782, 'loss/train': 1.702683925628662} -11/07/2021 00:01:55 - INFO - __main__ - Step 19784: {'lr': 0.0004823991622847984, 'samples': 3798528, 'steps': 19783, 'loss/train': 1.420841932296753} -11/07/2021 00:01:55 - INFO - __main__ - Step 19785: {'lr': 0.0004823972062808628, 'samples': 3798720, 'steps': 19784, 'loss/train': 2.2331371307373047} -11/07/2021 00:01:55 - INFO - __main__ - Step 19786: {'lr': 0.0004823952501722126, 'samples': 3798912, 'steps': 19785, 'loss/train': 1.8033604621887207} -11/07/2021 00:01:56 - INFO - __main__ - Step 19787: {'lr': 0.00048239329395884865, 'samples': 3799104, 'steps': 19786, 'loss/train': 1.480093240737915} -11/07/2021 00:01:56 - INFO - __main__ - Step 19788: {'lr': 0.00048239133764077193, 'samples': 3799296, 'steps': 19787, 'loss/train': 1.7165354490280151} -11/07/2021 00:01:57 - INFO - __main__ - Step 19789: {'lr': 0.00048238938121798313, 'samples': 3799488, 'steps': 19788, 'loss/train': 1.7748910188674927} -11/07/2021 00:01:57 - INFO - __main__ - Step 19790: {'lr': 0.00048238742469048344, 'samples': 3799680, 'steps': 19789, 'loss/train': 1.333566427230835} -11/07/2021 00:01:58 - INFO - __main__ - Step 19791: {'lr': 0.00048238546805827345, 'samples': 3799872, 'steps': 19790, 'loss/train': 1.7777206897735596} -11/07/2021 00:01:58 - INFO - __main__ - Step 19792: {'lr': 0.00048238351132135415, 'samples': 3800064, 'steps': 19791, 'loss/train': 1.79335355758667} -11/07/2021 00:01:59 - INFO - __main__ - Step 19793: {'lr': 0.0004823815544797265, 'samples': 3800256, 'steps': 19792, 'loss/train': 1.7088088989257812} -11/07/2021 00:02:00 - INFO - __main__ - Step 19794: {'lr': 0.0004823795975333912, 'samples': 3800448, 'steps': 19793, 'loss/train': 1.7255698442459106} -11/07/2021 00:02:00 - INFO - __main__ - Step 19795: {'lr': 0.0004823776404823493, 'samples': 3800640, 'steps': 19794, 'loss/train': 0.7900757193565369} -11/07/2021 00:02:00 - INFO - __main__ - Step 19796: {'lr': 0.00048237568332660163, 'samples': 3800832, 'steps': 19795, 'loss/train': 1.8653993606567383} -11/07/2021 00:02:01 - INFO - __main__ - Step 19797: {'lr': 0.0004823737260661491, 'samples': 3801024, 'steps': 19796, 'loss/train': 2.3506391048431396} -11/07/2021 00:02:01 - INFO - __main__ - Step 19798: {'lr': 0.00048237176870099256, 'samples': 3801216, 'steps': 19797, 'loss/train': 1.4605416059494019} -11/07/2021 00:02:01 - INFO - __main__ - Step 19799: {'lr': 0.0004823698112311328, 'samples': 3801408, 'steps': 19798, 'loss/train': 1.5340802669525146} -11/07/2021 00:02:02 - INFO - __main__ - Step 19800: {'lr': 0.00048236785365657076, 'samples': 3801600, 'steps': 19799, 'loss/train': 1.685361623764038} -11/07/2021 00:02:03 - INFO - __main__ - Step 19801: {'lr': 0.00048236589597730744, 'samples': 3801792, 'steps': 19800, 'loss/train': 1.3878642320632935} -11/07/2021 00:02:03 - INFO - __main__ - Step 19802: {'lr': 0.00048236393819334363, 'samples': 3801984, 'steps': 19801, 'loss/train': 1.7285722494125366} -11/07/2021 00:02:03 - INFO - __main__ - Step 19803: {'lr': 0.0004823619803046802, 'samples': 3802176, 'steps': 19802, 'loss/train': 1.3159254789352417} -11/07/2021 00:02:04 - INFO - __main__ - Step 19804: {'lr': 0.00048236002231131803, 'samples': 3802368, 'steps': 19803, 'loss/train': 1.5569478273391724} -11/07/2021 00:02:05 - INFO - __main__ - Step 19805: {'lr': 0.00048235806421325803, 'samples': 3802560, 'steps': 19804, 'loss/train': 1.056659460067749} -11/07/2021 00:02:05 - INFO - __main__ - Step 19806: {'lr': 0.0004823561060105011, 'samples': 3802752, 'steps': 19805, 'loss/train': 1.6271388530731201} -11/07/2021 00:02:06 - INFO - __main__ - Step 19807: {'lr': 0.00048235414770304803, 'samples': 3802944, 'steps': 19806, 'loss/train': 1.493626356124878} -11/07/2021 00:02:06 - INFO - __main__ - Step 19808: {'lr': 0.00048235218929089987, 'samples': 3803136, 'steps': 19807, 'loss/train': 0.7152420878410339} -11/07/2021 00:02:06 - INFO - __main__ - Step 19809: {'lr': 0.00048235023077405724, 'samples': 3803328, 'steps': 19808, 'loss/train': 1.6068490743637085} -11/07/2021 00:02:07 - INFO - __main__ - Step 19810: {'lr': 0.0004823482721525213, 'samples': 3803520, 'steps': 19809, 'loss/train': 1.579464316368103} -11/07/2021 00:02:08 - INFO - __main__ - Step 19811: {'lr': 0.0004823463134262928, 'samples': 3803712, 'steps': 19810, 'loss/train': 1.4074981212615967} -11/07/2021 00:02:08 - INFO - __main__ - Step 19812: {'lr': 0.00048234435459537265, 'samples': 3803904, 'steps': 19811, 'loss/train': 1.2117066383361816} -11/07/2021 00:02:08 - INFO - __main__ - Step 19813: {'lr': 0.0004823423956597617, 'samples': 3804096, 'steps': 19812, 'loss/train': 1.3268944025039673} -11/07/2021 00:02:09 - INFO - __main__ - Step 19814: {'lr': 0.0004823404366194608, 'samples': 3804288, 'steps': 19813, 'loss/train': 1.8814929723739624} -11/07/2021 00:02:10 - INFO - __main__ - Step 19815: {'lr': 0.0004823384774744709, 'samples': 3804480, 'steps': 19814, 'loss/train': 1.1520098447799683} -11/07/2021 00:02:10 - INFO - __main__ - Step 19816: {'lr': 0.000482336518224793, 'samples': 3804672, 'steps': 19815, 'loss/train': 1.8974096775054932} -11/07/2021 00:02:11 - INFO - __main__ - Step 19817: {'lr': 0.00048233455887042764, 'samples': 3804864, 'steps': 19816, 'loss/train': 0.9365611672401428} -11/07/2021 00:02:11 - INFO - __main__ - Step 19818: {'lr': 0.0004823325994113761, 'samples': 3805056, 'steps': 19817, 'loss/train': 1.7103739976882935} -11/07/2021 00:02:11 - INFO - __main__ - Step 19819: {'lr': 0.00048233063984763895, 'samples': 3805248, 'steps': 19818, 'loss/train': 1.6624081134796143} -11/07/2021 00:02:12 - INFO - __main__ - Step 19820: {'lr': 0.0004823286801792173, 'samples': 3805440, 'steps': 19819, 'loss/train': 1.8712867498397827} -11/07/2021 00:02:13 - INFO - __main__ - Step 19821: {'lr': 0.0004823267204061118, 'samples': 3805632, 'steps': 19820, 'loss/train': 1.5832374095916748} -11/07/2021 00:02:13 - INFO - __main__ - Step 19822: {'lr': 0.0004823247605283236, 'samples': 3805824, 'steps': 19821, 'loss/train': 1.4720865488052368} -11/07/2021 00:02:13 - INFO - __main__ - Step 19823: {'lr': 0.0004823228005458534, 'samples': 3806016, 'steps': 19822, 'loss/train': 1.4312366247177124} -11/07/2021 00:02:14 - INFO - __main__ - Step 19824: {'lr': 0.00048232084045870204, 'samples': 3806208, 'steps': 19823, 'loss/train': 1.6238641738891602} -11/07/2021 00:02:14 - INFO - __main__ - Step 19825: {'lr': 0.00048231888026687065, 'samples': 3806400, 'steps': 19824, 'loss/train': 1.13937509059906} -11/07/2021 00:02:15 - INFO - __main__ - Step 19826: {'lr': 0.00048231691997035987, 'samples': 3806592, 'steps': 19825, 'loss/train': 1.6825331449508667} -11/07/2021 00:02:15 - INFO - __main__ - Step 19827: {'lr': 0.00048231495956917067, 'samples': 3806784, 'steps': 19826, 'loss/train': 1.4865928888320923} -11/07/2021 00:02:16 - INFO - __main__ - Step 19828: {'lr': 0.00048231299906330397, 'samples': 3806976, 'steps': 19827, 'loss/train': 1.6881486177444458} -11/07/2021 00:02:16 - INFO - __main__ - Step 19829: {'lr': 0.0004823110384527606, 'samples': 3807168, 'steps': 19828, 'loss/train': 1.7928725481033325} -11/07/2021 00:02:16 - INFO - __main__ - Step 19830: {'lr': 0.0004823090777375414, 'samples': 3807360, 'steps': 19829, 'loss/train': 2.1048223972320557} -11/07/2021 00:02:18 - INFO - __main__ - Step 19831: {'lr': 0.0004823071169176474, 'samples': 3807552, 'steps': 19830, 'loss/train': 1.4070188999176025} -11/07/2021 00:02:18 - INFO - __main__ - Step 19832: {'lr': 0.00048230515599307933, 'samples': 3807744, 'steps': 19831, 'loss/train': 1.6805315017700195} -11/07/2021 00:02:18 - INFO - __main__ - Step 19833: {'lr': 0.0004823031949638382, 'samples': 3807936, 'steps': 19832, 'loss/train': 1.3850849866867065} -11/07/2021 00:02:19 - INFO - __main__ - Step 19834: {'lr': 0.0004823012338299248, 'samples': 3808128, 'steps': 19833, 'loss/train': 1.5451176166534424} -11/07/2021 00:02:19 - INFO - __main__ - Step 19835: {'lr': 0.0004822992725913401, 'samples': 3808320, 'steps': 19834, 'loss/train': 1.776845932006836} -11/07/2021 00:02:20 - INFO - __main__ - Step 19836: {'lr': 0.00048229731124808484, 'samples': 3808512, 'steps': 19835, 'loss/train': 1.3738198280334473} -11/07/2021 00:02:20 - INFO - __main__ - Step 19837: {'lr': 0.00048229534980016007, 'samples': 3808704, 'steps': 19836, 'loss/train': 1.5505852699279785} -11/07/2021 00:02:21 - INFO - __main__ - Step 19838: {'lr': 0.0004822933882475666, 'samples': 3808896, 'steps': 19837, 'loss/train': 1.8858225345611572} -11/07/2021 00:02:21 - INFO - __main__ - Step 19839: {'lr': 0.00048229142659030527, 'samples': 3809088, 'steps': 19838, 'loss/train': 1.6088569164276123} -11/07/2021 00:02:21 - INFO - __main__ - Step 19840: {'lr': 0.000482289464828377, 'samples': 3809280, 'steps': 19839, 'loss/train': 2.1285462379455566} -11/07/2021 00:02:22 - INFO - __main__ - Step 19841: {'lr': 0.00048228750296178276, 'samples': 3809472, 'steps': 19840, 'loss/train': 1.7898335456848145} -11/07/2021 00:02:23 - INFO - __main__ - Step 19842: {'lr': 0.0004822855409905233, 'samples': 3809664, 'steps': 19841, 'loss/train': 1.2840629816055298} -11/07/2021 00:02:23 - INFO - __main__ - Step 19843: {'lr': 0.00048228357891459954, 'samples': 3809856, 'steps': 19842, 'loss/train': 1.5152689218521118} -11/07/2021 00:02:24 - INFO - __main__ - Step 19844: {'lr': 0.0004822816167340124, 'samples': 3810048, 'steps': 19843, 'loss/train': 1.5541553497314453} -11/07/2021 00:02:24 - INFO - __main__ - Step 19845: {'lr': 0.00048227965444876277, 'samples': 3810240, 'steps': 19844, 'loss/train': 1.1225873231887817} -11/07/2021 00:02:24 - INFO - __main__ - Step 19846: {'lr': 0.0004822776920588515, 'samples': 3810432, 'steps': 19845, 'loss/train': 1.8110250234603882} -11/07/2021 00:02:25 - INFO - __main__ - Step 19847: {'lr': 0.0004822757295642795, 'samples': 3810624, 'steps': 19846, 'loss/train': 1.0797271728515625} -11/07/2021 00:02:26 - INFO - __main__ - Step 19848: {'lr': 0.00048227376696504765, 'samples': 3810816, 'steps': 19847, 'loss/train': 2.2480528354644775} -11/07/2021 00:02:27 - INFO - __main__ - Step 19849: {'lr': 0.0004822718042611568, 'samples': 3811008, 'steps': 19848, 'loss/train': 1.7323418855667114} -11/07/2021 00:02:27 - INFO - __main__ - Step 19850: {'lr': 0.0004822698414526079, 'samples': 3811200, 'steps': 19849, 'loss/train': 1.9446306228637695} -11/07/2021 00:02:27 - INFO - __main__ - Step 19851: {'lr': 0.0004822678785394017, 'samples': 3811392, 'steps': 19850, 'loss/train': 0.8418163657188416} -11/07/2021 00:02:28 - INFO - __main__ - Step 19852: {'lr': 0.0004822659155215393, 'samples': 3811584, 'steps': 19851, 'loss/train': 1.6243457794189453} -11/07/2021 00:02:28 - INFO - __main__ - Step 19853: {'lr': 0.00048226395239902133, 'samples': 3811776, 'steps': 19852, 'loss/train': 1.8577585220336914} -11/07/2021 00:02:28 - INFO - __main__ - Step 19854: {'lr': 0.00048226198917184886, 'samples': 3811968, 'steps': 19853, 'loss/train': 1.4468683004379272} -11/07/2021 00:02:29 - INFO - __main__ - Step 19855: {'lr': 0.00048226002584002276, 'samples': 3812160, 'steps': 19854, 'loss/train': 1.4608242511749268} -11/07/2021 00:02:30 - INFO - __main__ - Step 19856: {'lr': 0.00048225806240354387, 'samples': 3812352, 'steps': 19855, 'loss/train': 1.6959941387176514} -11/07/2021 00:02:30 - INFO - __main__ - Step 19857: {'lr': 0.0004822560988624131, 'samples': 3812544, 'steps': 19856, 'loss/train': 1.8978437185287476} -11/07/2021 00:02:30 - INFO - __main__ - Step 19858: {'lr': 0.0004822541352166312, 'samples': 3812736, 'steps': 19857, 'loss/train': 1.0776863098144531} -11/07/2021 00:02:31 - INFO - __main__ - Step 19859: {'lr': 0.0004822521714661993, 'samples': 3812928, 'steps': 19858, 'loss/train': 1.6047289371490479} -11/07/2021 00:02:32 - INFO - __main__ - Step 19860: {'lr': 0.0004822502076111181, 'samples': 3813120, 'steps': 19859, 'loss/train': 1.677196741104126} -11/07/2021 00:02:32 - INFO - __main__ - Step 19861: {'lr': 0.0004822482436513885, 'samples': 3813312, 'steps': 19860, 'loss/train': 1.6622592210769653} -11/07/2021 00:02:33 - INFO - __main__ - Step 19862: {'lr': 0.0004822462795870115, 'samples': 3813504, 'steps': 19861, 'loss/train': 1.220088243484497} -11/07/2021 00:02:33 - INFO - __main__ - Step 19863: {'lr': 0.00048224431541798784, 'samples': 3813696, 'steps': 19862, 'loss/train': 1.8354872465133667} -11/07/2021 00:02:33 - INFO - __main__ - Step 19864: {'lr': 0.00048224235114431856, 'samples': 3813888, 'steps': 19863, 'loss/train': 1.6193705797195435} -11/07/2021 00:02:34 - INFO - __main__ - Step 19865: {'lr': 0.0004822403867660044, 'samples': 3814080, 'steps': 19864, 'loss/train': 1.5870299339294434} -11/07/2021 00:02:35 - INFO - __main__ - Step 19866: {'lr': 0.0004822384222830463, 'samples': 3814272, 'steps': 19865, 'loss/train': 0.993768036365509} -11/07/2021 00:02:35 - INFO - __main__ - Step 19867: {'lr': 0.0004822364576954452, 'samples': 3814464, 'steps': 19866, 'loss/train': 2.282621383666992} -11/07/2021 00:02:35 - INFO - __main__ - Step 19868: {'lr': 0.0004822344930032019, 'samples': 3814656, 'steps': 19867, 'loss/train': 1.6406512260437012} -11/07/2021 00:02:36 - INFO - __main__ - Step 19869: {'lr': 0.00048223252820631736, 'samples': 3814848, 'steps': 19868, 'loss/train': 1.61362886428833} -11/07/2021 00:02:37 - INFO - __main__ - Step 19870: {'lr': 0.00048223056330479235, 'samples': 3815040, 'steps': 19869, 'loss/train': 1.9277762174606323} -11/07/2021 00:02:38 - INFO - __main__ - Step 19871: {'lr': 0.00048222859829862784, 'samples': 3815232, 'steps': 19870, 'loss/train': 1.9069395065307617} -11/07/2021 00:02:38 - INFO - __main__ - Step 19872: {'lr': 0.0004822266331878248, 'samples': 3815424, 'steps': 19871, 'loss/train': 1.3378348350524902} -11/07/2021 00:02:38 - INFO - __main__ - Step 19873: {'lr': 0.00048222466797238396, 'samples': 3815616, 'steps': 19872, 'loss/train': 2.248401403427124} -11/07/2021 00:02:39 - INFO - __main__ - Step 19874: {'lr': 0.00048222270265230627, 'samples': 3815808, 'steps': 19873, 'loss/train': 2.2236526012420654} -11/07/2021 00:02:39 - INFO - __main__ - Step 19875: {'lr': 0.0004822207372275926, 'samples': 3816000, 'steps': 19874, 'loss/train': 1.6553248167037964} -11/07/2021 00:02:40 - INFO - __main__ - Step 19876: {'lr': 0.0004822187716982439, 'samples': 3816192, 'steps': 19875, 'loss/train': 1.5618613958358765} -11/07/2021 00:02:40 - INFO - __main__ - Step 19877: {'lr': 0.000482216806064261, 'samples': 3816384, 'steps': 19876, 'loss/train': 1.9362163543701172} -11/07/2021 00:02:41 - INFO - __main__ - Step 19878: {'lr': 0.0004822148403256447, 'samples': 3816576, 'steps': 19877, 'loss/train': 1.5398274660110474} -11/07/2021 00:02:41 - INFO - __main__ - Step 19879: {'lr': 0.00048221287448239604, 'samples': 3816768, 'steps': 19878, 'loss/train': 1.5209888219833374} -11/07/2021 00:02:42 - INFO - __main__ - Step 19880: {'lr': 0.00048221090853451586, 'samples': 3816960, 'steps': 19879, 'loss/train': 2.007349729537964} -11/07/2021 00:02:42 - INFO - __main__ - Step 19881: {'lr': 0.000482208942482005, 'samples': 3817152, 'steps': 19880, 'loss/train': 1.9798191785812378} -11/07/2021 00:02:43 - INFO - __main__ - Step 19882: {'lr': 0.00048220697632486443, 'samples': 3817344, 'steps': 19881, 'loss/train': 1.5395383834838867} -11/07/2021 00:02:43 - INFO - __main__ - Step 19883: {'lr': 0.0004822050100630949, 'samples': 3817536, 'steps': 19882, 'loss/train': 1.7728437185287476} -11/07/2021 00:02:44 - INFO - __main__ - Step 19884: {'lr': 0.0004822030436966974, 'samples': 3817728, 'steps': 19883, 'loss/train': 1.6646522283554077} -11/07/2021 00:02:44 - INFO - __main__ - Step 19885: {'lr': 0.0004822010772256728, 'samples': 3817920, 'steps': 19884, 'loss/train': 1.8511887788772583} -11/07/2021 00:02:44 - INFO - __main__ - Step 19886: {'lr': 0.00048219911065002196, 'samples': 3818112, 'steps': 19885, 'loss/train': 1.541710615158081} -11/07/2021 00:02:45 - INFO - __main__ - Step 19887: {'lr': 0.00048219714396974587, 'samples': 3818304, 'steps': 19886, 'loss/train': 1.7361443042755127} -11/07/2021 00:02:46 - INFO - __main__ - Step 19888: {'lr': 0.0004821951771848452, 'samples': 3818496, 'steps': 19887, 'loss/train': 1.6225528717041016} -11/07/2021 00:02:46 - INFO - __main__ - Step 19889: {'lr': 0.00048219321029532104, 'samples': 3818688, 'steps': 19888, 'loss/train': 1.6663713455200195} -11/07/2021 00:02:46 - INFO - __main__ - Step 19890: {'lr': 0.0004821912433011742, 'samples': 3818880, 'steps': 19889, 'loss/train': 1.6275155544281006} -11/07/2021 00:02:47 - INFO - __main__ - Step 19891: {'lr': 0.00048218927620240557, 'samples': 3819072, 'steps': 19890, 'loss/train': 2.8923377990722656} -11/07/2021 00:02:47 - INFO - __main__ - Step 19892: {'lr': 0.00048218730899901596, 'samples': 3819264, 'steps': 19891, 'loss/train': 1.6975051164627075} -11/07/2021 00:02:48 - INFO - __main__ - Step 19893: {'lr': 0.0004821853416910065, 'samples': 3819456, 'steps': 19892, 'loss/train': 1.6983906030654907} -11/07/2021 00:02:48 - INFO - __main__ - Step 19894: {'lr': 0.0004821833742783778, 'samples': 3819648, 'steps': 19893, 'loss/train': 1.6201729774475098} -11/07/2021 00:02:49 - INFO - __main__ - Step 19895: {'lr': 0.0004821814067611308, 'samples': 3819840, 'steps': 19894, 'loss/train': 1.6576566696166992} -11/07/2021 00:02:49 - INFO - __main__ - Step 19896: {'lr': 0.00048217943913926646, 'samples': 3820032, 'steps': 19895, 'loss/train': 1.4981663227081299} -11/07/2021 00:02:50 - INFO - __main__ - Step 19897: {'lr': 0.00048217747141278574, 'samples': 3820224, 'steps': 19896, 'loss/train': 1.8732210397720337} -11/07/2021 00:02:50 - INFO - __main__ - Step 19898: {'lr': 0.00048217550358168937, 'samples': 3820416, 'steps': 19897, 'loss/train': 1.464651346206665} -11/07/2021 00:02:51 - INFO - __main__ - Step 19899: {'lr': 0.00048217353564597833, 'samples': 3820608, 'steps': 19898, 'loss/train': 1.3284916877746582} -11/07/2021 00:02:51 - INFO - __main__ - Step 19900: {'lr': 0.0004821715676056534, 'samples': 3820800, 'steps': 19899, 'loss/train': 1.760026216506958} -11/07/2021 00:02:52 - INFO - __main__ - Step 19901: {'lr': 0.0004821695994607156, 'samples': 3820992, 'steps': 19900, 'loss/train': 0.7101365923881531} -11/07/2021 00:02:52 - INFO - __main__ - Step 19902: {'lr': 0.0004821676312111658, 'samples': 3821184, 'steps': 19901, 'loss/train': 1.8503962755203247} -11/07/2021 00:02:53 - INFO - __main__ - Step 19903: {'lr': 0.0004821656628570048, 'samples': 3821376, 'steps': 19902, 'loss/train': 2.2400448322296143} -11/07/2021 00:02:53 - INFO - __main__ - Step 19904: {'lr': 0.00048216369439823355, 'samples': 3821568, 'steps': 19903, 'loss/train': 1.7700556516647339} -11/07/2021 00:02:54 - INFO - __main__ - Step 19905: {'lr': 0.0004821617258348529, 'samples': 3821760, 'steps': 19904, 'loss/train': 1.802931785583496} -11/07/2021 00:02:54 - INFO - __main__ - Step 19906: {'lr': 0.0004821597571668638, 'samples': 3821952, 'steps': 19905, 'loss/train': 1.5791219472885132} -11/07/2021 00:02:54 - INFO - __main__ - Step 19907: {'lr': 0.00048215778839426706, 'samples': 3822144, 'steps': 19906, 'loss/train': 1.5165849924087524} -11/07/2021 00:02:55 - INFO - __main__ - Step 19908: {'lr': 0.0004821558195170636, 'samples': 3822336, 'steps': 19907, 'loss/train': 1.3953006267547607} -11/07/2021 00:02:56 - INFO - __main__ - Step 19909: {'lr': 0.00048215385053525434, 'samples': 3822528, 'steps': 19908, 'loss/train': 2.0647053718566895} -11/07/2021 00:02:56 - INFO - __main__ - Step 19910: {'lr': 0.00048215188144884013, 'samples': 3822720, 'steps': 19909, 'loss/train': 1.1711742877960205} -11/07/2021 00:02:57 - INFO - __main__ - Step 19911: {'lr': 0.0004821499122578218, 'samples': 3822912, 'steps': 19910, 'loss/train': 1.7796618938446045} -11/07/2021 00:02:57 - INFO - __main__ - Step 19912: {'lr': 0.00048214794296220045, 'samples': 3823104, 'steps': 19911, 'loss/train': 1.2514482736587524} -11/07/2021 00:02:58 - INFO - __main__ - Step 19913: {'lr': 0.00048214597356197665, 'samples': 3823296, 'steps': 19912, 'loss/train': 1.8508306741714478} -11/07/2021 00:02:58 - INFO - __main__ - Step 19914: {'lr': 0.00048214400405715153, 'samples': 3823488, 'steps': 19913, 'loss/train': 1.087483525276184} -11/07/2021 00:02:59 - INFO - __main__ - Step 19915: {'lr': 0.000482142034447726, 'samples': 3823680, 'steps': 19914, 'loss/train': 2.030345916748047} -11/07/2021 00:02:59 - INFO - __main__ - Step 19916: {'lr': 0.0004821400647337007, 'samples': 3823872, 'steps': 19915, 'loss/train': 1.1114486455917358} -11/07/2021 00:02:59 - INFO - __main__ - Step 19917: {'lr': 0.0004821380949150768, 'samples': 3824064, 'steps': 19916, 'loss/train': 1.6150808334350586} -11/07/2021 00:03:01 - INFO - __main__ - Step 19918: {'lr': 0.0004821361249918549, 'samples': 3824256, 'steps': 19917, 'loss/train': 1.4313181638717651} -11/07/2021 00:03:01 - INFO - __main__ - Step 19919: {'lr': 0.0004821341549640361, 'samples': 3824448, 'steps': 19918, 'loss/train': 1.7815539836883545} -11/07/2021 00:03:01 - INFO - __main__ - Step 19920: {'lr': 0.00048213218483162133, 'samples': 3824640, 'steps': 19919, 'loss/train': 0.6617085337638855} -11/07/2021 00:03:02 - INFO - __main__ - Step 19921: {'lr': 0.0004821302145946113, 'samples': 3824832, 'steps': 19920, 'loss/train': 0.7101051807403564} -11/07/2021 00:03:02 - INFO - __main__ - Step 19922: {'lr': 0.00048212824425300694, 'samples': 3825024, 'steps': 19921, 'loss/train': 1.7854225635528564} -11/07/2021 00:03:02 - INFO - __main__ - Step 19923: {'lr': 0.0004821262738068093, 'samples': 3825216, 'steps': 19922, 'loss/train': 1.6492276191711426} -11/07/2021 00:03:03 - INFO - __main__ - Step 19924: {'lr': 0.00048212430325601905, 'samples': 3825408, 'steps': 19923, 'loss/train': 1.4564239978790283} -11/07/2021 00:03:04 - INFO - __main__ - Step 19925: {'lr': 0.0004821223326006372, 'samples': 3825600, 'steps': 19924, 'loss/train': 1.9753514528274536} -11/07/2021 00:03:04 - INFO - __main__ - Step 19926: {'lr': 0.0004821203618406645, 'samples': 3825792, 'steps': 19925, 'loss/train': 0.9585258364677429} -11/07/2021 00:03:05 - INFO - __main__ - Step 19927: {'lr': 0.0004821183909761021, 'samples': 3825984, 'steps': 19926, 'loss/train': 1.797566294670105} -11/07/2021 00:03:05 - INFO - __main__ - Step 19928: {'lr': 0.00048211642000695065, 'samples': 3826176, 'steps': 19927, 'loss/train': 1.8800297975540161} -11/07/2021 00:03:06 - INFO - __main__ - Step 19929: {'lr': 0.0004821144489332112, 'samples': 3826368, 'steps': 19928, 'loss/train': 2.163250207901001} -11/07/2021 00:03:06 - INFO - __main__ - Step 19930: {'lr': 0.0004821124777548845, 'samples': 3826560, 'steps': 19929, 'loss/train': 1.244161605834961} -11/07/2021 00:03:07 - INFO - __main__ - Step 19931: {'lr': 0.0004821105064719715, 'samples': 3826752, 'steps': 19930, 'loss/train': 1.3511130809783936} -11/07/2021 00:03:07 - INFO - __main__ - Step 19932: {'lr': 0.0004821085350844731, 'samples': 3826944, 'steps': 19931, 'loss/train': 1.8413258790969849} -11/07/2021 00:03:07 - INFO - __main__ - Step 19933: {'lr': 0.0004821065635923902, 'samples': 3827136, 'steps': 19932, 'loss/train': 1.7809979915618896} -11/07/2021 00:03:08 - INFO - __main__ - Step 19934: {'lr': 0.0004821045919957237, 'samples': 3827328, 'steps': 19933, 'loss/train': 1.867737054824829} -11/07/2021 00:03:09 - INFO - __main__ - Step 19935: {'lr': 0.00048210262029447425, 'samples': 3827520, 'steps': 19934, 'loss/train': 2.0068836212158203} -11/07/2021 00:03:09 - INFO - __main__ - Step 19936: {'lr': 0.0004821006484886431, 'samples': 3827712, 'steps': 19935, 'loss/train': 0.7683764100074768} -11/07/2021 00:03:09 - INFO - __main__ - Step 19937: {'lr': 0.000482098676578231, 'samples': 3827904, 'steps': 19936, 'loss/train': 1.7007976770401} -11/07/2021 00:03:10 - INFO - __main__ - Step 19938: {'lr': 0.0004820967045632388, 'samples': 3828096, 'steps': 19937, 'loss/train': 1.0475733280181885} -11/07/2021 00:03:11 - INFO - __main__ - Step 19939: {'lr': 0.00048209473244366737, 'samples': 3828288, 'steps': 19938, 'loss/train': 1.78171706199646} -11/07/2021 00:03:11 - INFO - __main__ - Step 19940: {'lr': 0.00048209276021951765, 'samples': 3828480, 'steps': 19939, 'loss/train': 2.0384621620178223} -11/07/2021 00:03:11 - INFO - __main__ - Step 19941: {'lr': 0.00048209078789079055, 'samples': 3828672, 'steps': 19940, 'loss/train': 1.5990064144134521} -11/07/2021 00:03:12 - INFO - __main__ - Step 19942: {'lr': 0.00048208881545748684, 'samples': 3828864, 'steps': 19941, 'loss/train': 1.893418312072754} -11/07/2021 00:03:12 - INFO - __main__ - Step 19943: {'lr': 0.00048208684291960755, 'samples': 3829056, 'steps': 19942, 'loss/train': 2.1508586406707764} -11/07/2021 00:03:13 - INFO - __main__ - Step 19944: {'lr': 0.0004820848702771535, 'samples': 3829248, 'steps': 19943, 'loss/train': 1.315595269203186} -11/07/2021 00:03:14 - INFO - __main__ - Step 19945: {'lr': 0.0004820828975301256, 'samples': 3829440, 'steps': 19944, 'loss/train': 1.8021361827850342} -11/07/2021 00:03:14 - INFO - __main__ - Step 19946: {'lr': 0.0004820809246785247, 'samples': 3829632, 'steps': 19945, 'loss/train': 1.77168607711792} -11/07/2021 00:03:14 - INFO - __main__ - Step 19947: {'lr': 0.00048207895172235174, 'samples': 3829824, 'steps': 19946, 'loss/train': 0.8945348858833313} -11/07/2021 00:03:15 - INFO - __main__ - Step 19948: {'lr': 0.00048207697866160755, 'samples': 3830016, 'steps': 19947, 'loss/train': 1.6645221710205078} -11/07/2021 00:03:16 - INFO - __main__ - Step 19949: {'lr': 0.0004820750054962931, 'samples': 3830208, 'steps': 19948, 'loss/train': 1.7571378946304321} -11/07/2021 00:03:16 - INFO - __main__ - Step 19950: {'lr': 0.00048207303222640917, 'samples': 3830400, 'steps': 19949, 'loss/train': 1.541943073272705} -11/07/2021 00:03:16 - INFO - __main__ - Step 19951: {'lr': 0.00048207105885195677, 'samples': 3830592, 'steps': 19950, 'loss/train': 1.7315165996551514} -11/07/2021 00:03:17 - INFO - __main__ - Step 19952: {'lr': 0.0004820690853729367, 'samples': 3830784, 'steps': 19951, 'loss/train': 1.8238463401794434} -11/07/2021 00:03:17 - INFO - __main__ - Step 19953: {'lr': 0.00048206711178934994, 'samples': 3830976, 'steps': 19952, 'loss/train': 1.4717843532562256} -11/07/2021 00:03:18 - INFO - __main__ - Step 19954: {'lr': 0.00048206513810119725, 'samples': 3831168, 'steps': 19953, 'loss/train': 1.7660622596740723} -11/07/2021 00:03:18 - INFO - __main__ - Step 19955: {'lr': 0.0004820631643084796, 'samples': 3831360, 'steps': 19954, 'loss/train': 1.2286633253097534} -11/07/2021 00:03:19 - INFO - __main__ - Step 19956: {'lr': 0.00048206119041119787, 'samples': 3831552, 'steps': 19955, 'loss/train': 1.611129879951477} -11/07/2021 00:03:19 - INFO - __main__ - Step 19957: {'lr': 0.000482059216409353, 'samples': 3831744, 'steps': 19956, 'loss/train': 1.5581938028335571} -11/07/2021 00:03:20 - INFO - __main__ - Step 19958: {'lr': 0.0004820572423029458, 'samples': 3831936, 'steps': 19957, 'loss/train': 1.72555410861969} -11/07/2021 00:03:20 - INFO - __main__ - Step 19959: {'lr': 0.00048205526809197717, 'samples': 3832128, 'steps': 19958, 'loss/train': 1.7237474918365479} -11/07/2021 00:03:21 - INFO - __main__ - Step 19960: {'lr': 0.000482053293776448, 'samples': 3832320, 'steps': 19959, 'loss/train': 2.041546106338501} -11/07/2021 00:03:21 - INFO - __main__ - Step 19961: {'lr': 0.0004820513193563593, 'samples': 3832512, 'steps': 19960, 'loss/train': 1.0926424264907837} -11/07/2021 00:03:22 - INFO - __main__ - Step 19962: {'lr': 0.00048204934483171176, 'samples': 3832704, 'steps': 19961, 'loss/train': 1.6191062927246094} -11/07/2021 00:03:22 - INFO - __main__ - Step 19963: {'lr': 0.0004820473702025064, 'samples': 3832896, 'steps': 19962, 'loss/train': 1.6823042631149292} -11/07/2021 00:03:22 - INFO - __main__ - Step 19964: {'lr': 0.000482045395468744, 'samples': 3833088, 'steps': 19963, 'loss/train': 1.7179694175720215} -11/07/2021 00:03:23 - INFO - __main__ - Step 19965: {'lr': 0.0004820434206304256, 'samples': 3833280, 'steps': 19964, 'loss/train': 1.7687020301818848} -11/07/2021 00:03:24 - INFO - __main__ - Step 19966: {'lr': 0.000482041445687552, 'samples': 3833472, 'steps': 19965, 'loss/train': 1.8509191274642944} -11/07/2021 00:03:24 - INFO - __main__ - Step 19967: {'lr': 0.0004820394706401242, 'samples': 3833664, 'steps': 19966, 'loss/train': 1.80912184715271} -11/07/2021 00:03:24 - INFO - __main__ - Step 19968: {'lr': 0.0004820374954881429, 'samples': 3833856, 'steps': 19967, 'loss/train': 1.3538326025009155} -11/07/2021 00:03:25 - INFO - __main__ - Step 19969: {'lr': 0.000482035520231609, 'samples': 3834048, 'steps': 19968, 'loss/train': 1.9789313077926636} -11/07/2021 00:03:26 - INFO - __main__ - Step 19970: {'lr': 0.00048203354487052363, 'samples': 3834240, 'steps': 19969, 'loss/train': 1.5672111511230469} -11/07/2021 00:03:26 - INFO - __main__ - Step 19971: {'lr': 0.00048203156940488745, 'samples': 3834432, 'steps': 19970, 'loss/train': 1.6324018239974976} -11/07/2021 00:03:26 - INFO - __main__ - Step 19972: {'lr': 0.00048202959383470144, 'samples': 3834624, 'steps': 19971, 'loss/train': 1.9827386140823364} -11/07/2021 00:03:27 - INFO - __main__ - Step 19973: {'lr': 0.00048202761815996646, 'samples': 3834816, 'steps': 19972, 'loss/train': 2.020437717437744} -11/07/2021 00:03:27 - INFO - __main__ - Step 19974: {'lr': 0.0004820256423806835, 'samples': 3835008, 'steps': 19973, 'loss/train': 1.4316328763961792} -11/07/2021 00:03:28 - INFO - __main__ - Step 19975: {'lr': 0.00048202366649685325, 'samples': 3835200, 'steps': 19974, 'loss/train': 1.8737499713897705} -11/07/2021 00:03:28 - INFO - __main__ - Step 19976: {'lr': 0.0004820216905084768, 'samples': 3835392, 'steps': 19975, 'loss/train': 1.99074125289917} -11/07/2021 00:03:29 - INFO - __main__ - Step 19977: {'lr': 0.00048201971441555485, 'samples': 3835584, 'steps': 19976, 'loss/train': 1.502482295036316} -11/07/2021 00:03:29 - INFO - __main__ - Step 19978: {'lr': 0.0004820177382180885, 'samples': 3835776, 'steps': 19977, 'loss/train': 1.506314992904663} -11/07/2021 00:03:29 - INFO - __main__ - Step 19979: {'lr': 0.00048201576191607843, 'samples': 3835968, 'steps': 19978, 'loss/train': 1.5382750034332275} -11/07/2021 00:03:31 - INFO - __main__ - Step 19980: {'lr': 0.00048201378550952575, 'samples': 3836160, 'steps': 19979, 'loss/train': 1.3840868473052979} -11/07/2021 00:03:31 - INFO - __main__ - Step 19981: {'lr': 0.0004820118089984312, 'samples': 3836352, 'steps': 19980, 'loss/train': 1.589767336845398} -11/07/2021 00:03:31 - INFO - __main__ - Step 19982: {'lr': 0.0004820098323827957, 'samples': 3836544, 'steps': 19981, 'loss/train': 1.283545732498169} -11/07/2021 00:03:32 - INFO - __main__ - Step 19983: {'lr': 0.0004820078556626202, 'samples': 3836736, 'steps': 19982, 'loss/train': 1.711501955986023} -11/07/2021 00:03:32 - INFO - __main__ - Step 19984: {'lr': 0.0004820058788379055, 'samples': 3836928, 'steps': 19983, 'loss/train': 1.5402511358261108} -11/07/2021 00:03:34 - INFO - __main__ - Step 19985: {'lr': 0.0004820039019086525, 'samples': 3837120, 'steps': 19984, 'loss/train': 1.3763577938079834} -11/07/2021 00:03:34 - INFO - __main__ - Step 19986: {'lr': 0.00048200192487486216, 'samples': 3837312, 'steps': 19985, 'loss/train': 1.419226884841919} -11/07/2021 00:03:34 - INFO - __main__ - Step 19987: {'lr': 0.00048199994773653535, 'samples': 3837504, 'steps': 19986, 'loss/train': 1.899288535118103} -11/07/2021 00:03:35 - INFO - __main__ - Step 19988: {'lr': 0.0004819979704936729, 'samples': 3837696, 'steps': 19987, 'loss/train': 1.6395899057388306} -11/07/2021 00:03:35 - INFO - __main__ - Step 19989: {'lr': 0.00048199599314627576, 'samples': 3837888, 'steps': 19988, 'loss/train': 0.23624520003795624} -11/07/2021 00:03:35 - INFO - __main__ - Step 19990: {'lr': 0.00048199401569434477, 'samples': 3838080, 'steps': 19989, 'loss/train': 1.949768304824829} -11/07/2021 00:03:37 - INFO - __main__ - Step 19991: {'lr': 0.00048199203813788086, 'samples': 3838272, 'steps': 19990, 'loss/train': 1.4753718376159668} -11/07/2021 00:03:37 - INFO - __main__ - Step 19992: {'lr': 0.00048199006047688496, 'samples': 3838464, 'steps': 19991, 'loss/train': 1.7044295072555542} -11/07/2021 00:03:37 - INFO - __main__ - Step 19993: {'lr': 0.0004819880827113579, 'samples': 3838656, 'steps': 19992, 'loss/train': 1.3625941276550293} -11/07/2021 00:03:38 - INFO - __main__ - Step 19994: {'lr': 0.0004819861048413006, 'samples': 3838848, 'steps': 19993, 'loss/train': 2.013521671295166} -11/07/2021 00:03:38 - INFO - __main__ - Step 19995: {'lr': 0.00048198412686671394, 'samples': 3839040, 'steps': 19994, 'loss/train': 1.5377622842788696} -11/07/2021 00:03:39 - INFO - __main__ - Step 19996: {'lr': 0.0004819821487875988, 'samples': 3839232, 'steps': 19995, 'loss/train': 1.0868034362792969} -11/07/2021 00:03:40 - INFO - __main__ - Step 19997: {'lr': 0.0004819801706039561, 'samples': 3839424, 'steps': 19996, 'loss/train': 1.610630989074707} -11/07/2021 00:03:40 - INFO - __main__ - Step 19998: {'lr': 0.0004819781923157867, 'samples': 3839616, 'steps': 19997, 'loss/train': 1.0310406684875488} -11/07/2021 00:03:40 - INFO - __main__ - Step 19999: {'lr': 0.00048197621392309154, 'samples': 3839808, 'steps': 19998, 'loss/train': 1.1806281805038452} -11/07/2021 00:03:41 - INFO - __main__ - Step 20000: {'lr': 0.00048197423542587143, 'samples': 3840000, 'steps': 19999, 'loss/train': 1.3565977811813354} -11/07/2021 00:03:41 - INFO - __main__ - Step 20001: {'lr': 0.0004819722568241274, 'samples': 3840192, 'steps': 20000, 'loss/train': 1.302907109260559} -11/07/2021 00:03:42 - INFO - __main__ - Step 20002: {'lr': 0.0004819702781178601, 'samples': 3840384, 'steps': 20001, 'loss/train': 1.4258530139923096} -11/07/2021 00:03:42 - INFO - __main__ - Step 20003: {'lr': 0.00048196829930707066, 'samples': 3840576, 'steps': 20002, 'loss/train': 1.59110689163208} -11/07/2021 00:03:43 - INFO - __main__ - Step 20004: {'lr': 0.0004819663203917599, 'samples': 3840768, 'steps': 20003, 'loss/train': 1.8877140283584595} -11/07/2021 00:03:43 - INFO - __main__ - Step 20005: {'lr': 0.0004819643413719287, 'samples': 3840960, 'steps': 20004, 'loss/train': 1.347116470336914} -11/07/2021 00:03:44 - INFO - __main__ - Step 20006: {'lr': 0.0004819623622475779, 'samples': 3841152, 'steps': 20005, 'loss/train': 1.6380776166915894} -11/07/2021 00:03:45 - INFO - __main__ - Step 20007: {'lr': 0.00048196038301870847, 'samples': 3841344, 'steps': 20006, 'loss/train': 1.8486162424087524} -11/07/2021 00:03:45 - INFO - __main__ - Step 20008: {'lr': 0.0004819584036853212, 'samples': 3841536, 'steps': 20007, 'loss/train': 1.7656793594360352} -11/07/2021 00:03:45 - INFO - __main__ - Step 20009: {'lr': 0.00048195642424741716, 'samples': 3841728, 'steps': 20008, 'loss/train': 1.735512137413025} -11/07/2021 00:03:46 - INFO - __main__ - Step 20010: {'lr': 0.00048195444470499704, 'samples': 3841920, 'steps': 20009, 'loss/train': 2.8203601837158203} -11/07/2021 00:03:46 - INFO - __main__ - Step 20011: {'lr': 0.0004819524650580619, 'samples': 3842112, 'steps': 20010, 'loss/train': 1.5159910917282104} -11/07/2021 00:03:47 - INFO - __main__ - Step 20012: {'lr': 0.0004819504853066126, 'samples': 3842304, 'steps': 20011, 'loss/train': 1.7866848707199097} -11/07/2021 00:03:47 - INFO - __main__ - Step 20013: {'lr': 0.0004819485054506498, 'samples': 3842496, 'steps': 20012, 'loss/train': 1.8437927961349487} -11/07/2021 00:03:48 - INFO - __main__ - Step 20014: {'lr': 0.00048194652549017484, 'samples': 3842688, 'steps': 20013, 'loss/train': 0.3831263780593872} -11/07/2021 00:03:48 - INFO - __main__ - Step 20015: {'lr': 0.0004819445454251882, 'samples': 3842880, 'steps': 20014, 'loss/train': 1.9873749017715454} -11/07/2021 00:03:48 - INFO - __main__ - Step 20016: {'lr': 0.0004819425652556909, 'samples': 3843072, 'steps': 20015, 'loss/train': 1.6326098442077637} -11/07/2021 00:03:49 - INFO - __main__ - Step 20017: {'lr': 0.0004819405849816839, 'samples': 3843264, 'steps': 20016, 'loss/train': 1.6164615154266357} -11/07/2021 00:03:50 - INFO - __main__ - Step 20018: {'lr': 0.00048193860460316805, 'samples': 3843456, 'steps': 20017, 'loss/train': 1.9409981966018677} -11/07/2021 00:03:50 - INFO - __main__ - Step 20019: {'lr': 0.00048193662412014427, 'samples': 3843648, 'steps': 20018, 'loss/train': 1.6340709924697876} -11/07/2021 00:03:51 - INFO - __main__ - Step 20020: {'lr': 0.0004819346435326134, 'samples': 3843840, 'steps': 20019, 'loss/train': 1.7512751817703247} -11/07/2021 00:03:51 - INFO - __main__ - Step 20021: {'lr': 0.00048193266284057634, 'samples': 3844032, 'steps': 20020, 'loss/train': 1.0968644618988037} -11/07/2021 00:03:51 - INFO - __main__ - Step 20022: {'lr': 0.0004819306820440341, 'samples': 3844224, 'steps': 20021, 'loss/train': 1.8102567195892334} -11/07/2021 00:03:53 - INFO - __main__ - Step 20023: {'lr': 0.0004819287011429874, 'samples': 3844416, 'steps': 20022, 'loss/train': 1.518404483795166} -11/07/2021 00:03:53 - INFO - __main__ - Step 20024: {'lr': 0.0004819267201374372, 'samples': 3844608, 'steps': 20023, 'loss/train': 1.6262191534042358} -11/07/2021 00:03:53 - INFO - __main__ - Step 20025: {'lr': 0.0004819247390273844, 'samples': 3844800, 'steps': 20024, 'loss/train': 1.5133861303329468} -11/07/2021 00:03:54 - INFO - __main__ - Step 20026: {'lr': 0.00048192275781282993, 'samples': 3844992, 'steps': 20025, 'loss/train': 1.825657606124878} -11/07/2021 00:03:54 - INFO - __main__ - Step 20027: {'lr': 0.00048192077649377455, 'samples': 3845184, 'steps': 20026, 'loss/train': 1.623038411140442} -11/07/2021 00:03:55 - INFO - __main__ - Step 20028: {'lr': 0.0004819187950702193, 'samples': 3845376, 'steps': 20027, 'loss/train': 1.3020976781845093} -11/07/2021 00:03:55 - INFO - __main__ - Step 20029: {'lr': 0.00048191681354216504, 'samples': 3845568, 'steps': 20028, 'loss/train': 1.8787384033203125} -11/07/2021 00:03:56 - INFO - __main__ - Step 20030: {'lr': 0.0004819148319096126, 'samples': 3845760, 'steps': 20029, 'loss/train': 1.937517523765564} -11/07/2021 00:03:56 - INFO - __main__ - Step 20031: {'lr': 0.00048191285017256297, 'samples': 3845952, 'steps': 20030, 'loss/train': 1.222166657447815} -11/07/2021 00:03:56 - INFO - __main__ - Step 20032: {'lr': 0.00048191086833101695, 'samples': 3846144, 'steps': 20031, 'loss/train': 1.8381415605545044} -11/07/2021 00:03:57 - INFO - __main__ - Step 20033: {'lr': 0.00048190888638497553, 'samples': 3846336, 'steps': 20032, 'loss/train': 1.8794498443603516} -11/07/2021 00:03:58 - INFO - __main__ - Step 20034: {'lr': 0.00048190690433443946, 'samples': 3846528, 'steps': 20033, 'loss/train': 1.9543792009353638} -11/07/2021 00:03:58 - INFO - __main__ - Step 20035: {'lr': 0.0004819049221794097, 'samples': 3846720, 'steps': 20034, 'loss/train': 1.4590505361557007} -11/07/2021 00:03:59 - INFO - __main__ - Step 20036: {'lr': 0.0004819029399198873, 'samples': 3846912, 'steps': 20035, 'loss/train': 1.4175198078155518} -11/07/2021 00:03:59 - INFO - __main__ - Step 20037: {'lr': 0.0004819009575558729, 'samples': 3847104, 'steps': 20036, 'loss/train': 1.7073240280151367} -11/07/2021 00:03:59 - INFO - __main__ - Step 20038: {'lr': 0.0004818989750873676, 'samples': 3847296, 'steps': 20037, 'loss/train': 1.8141921758651733} -11/07/2021 00:04:00 - INFO - __main__ - Step 20039: {'lr': 0.00048189699251437206, 'samples': 3847488, 'steps': 20038, 'loss/train': 1.413412094116211} -11/07/2021 00:04:01 - INFO - __main__ - Step 20040: {'lr': 0.0004818950098368874, 'samples': 3847680, 'steps': 20039, 'loss/train': 1.2684391736984253} -11/07/2021 00:04:01 - INFO - __main__ - Step 20041: {'lr': 0.00048189302705491446, 'samples': 3847872, 'steps': 20040, 'loss/train': 1.8604671955108643} -11/07/2021 00:04:01 - INFO - __main__ - Step 20042: {'lr': 0.000481891044168454, 'samples': 3848064, 'steps': 20041, 'loss/train': 1.7178666591644287} -11/07/2021 00:04:02 - INFO - __main__ - Step 20043: {'lr': 0.00048188906117750706, 'samples': 3848256, 'steps': 20042, 'loss/train': 1.5165631771087646} -11/07/2021 00:04:03 - INFO - __main__ - Step 20044: {'lr': 0.00048188707808207457, 'samples': 3848448, 'steps': 20043, 'loss/train': 2.249117374420166} -11/07/2021 00:04:03 - INFO - __main__ - Step 20045: {'lr': 0.00048188509488215724, 'samples': 3848640, 'steps': 20044, 'loss/train': 1.760151743888855} -11/07/2021 00:04:03 - INFO - __main__ - Step 20046: {'lr': 0.0004818831115777561, 'samples': 3848832, 'steps': 20045, 'loss/train': 1.6248598098754883} -11/07/2021 00:04:04 - INFO - __main__ - Step 20047: {'lr': 0.00048188112816887203, 'samples': 3849024, 'steps': 20046, 'loss/train': 1.315185785293579} -11/07/2021 00:04:04 - INFO - __main__ - Step 20048: {'lr': 0.0004818791446555059, 'samples': 3849216, 'steps': 20047, 'loss/train': 1.6985441446304321} -11/07/2021 00:04:05 - INFO - __main__ - Step 20049: {'lr': 0.00048187716103765854, 'samples': 3849408, 'steps': 20048, 'loss/train': 1.3543537855148315} -11/07/2021 00:04:06 - INFO - __main__ - Step 20050: {'lr': 0.0004818751773153309, 'samples': 3849600, 'steps': 20049, 'loss/train': 1.623940348625183} -11/07/2021 00:04:06 - INFO - __main__ - Step 20051: {'lr': 0.000481873193488524, 'samples': 3849792, 'steps': 20050, 'loss/train': 1.5104410648345947} -11/07/2021 00:04:06 - INFO - __main__ - Step 20052: {'lr': 0.0004818712095572385, 'samples': 3849984, 'steps': 20051, 'loss/train': 1.4376572370529175} -11/07/2021 00:04:07 - INFO - __main__ - Step 20053: {'lr': 0.0004818692255214755, 'samples': 3850176, 'steps': 20052, 'loss/train': 1.616486668586731} -11/07/2021 00:04:08 - INFO - __main__ - Step 20054: {'lr': 0.00048186724138123577, 'samples': 3850368, 'steps': 20053, 'loss/train': 1.556071162223816} -11/07/2021 00:04:08 - INFO - __main__ - Step 20055: {'lr': 0.00048186525713652024, 'samples': 3850560, 'steps': 20054, 'loss/train': 2.0656604766845703} -11/07/2021 00:04:08 - INFO - __main__ - Step 20056: {'lr': 0.0004818632727873298, 'samples': 3850752, 'steps': 20055, 'loss/train': 1.7116798162460327} -11/07/2021 00:04:09 - INFO - __main__ - Step 20057: {'lr': 0.00048186128833366536, 'samples': 3850944, 'steps': 20056, 'loss/train': 1.7523837089538574} -11/07/2021 00:04:09 - INFO - __main__ - Step 20058: {'lr': 0.0004818593037755278, 'samples': 3851136, 'steps': 20057, 'loss/train': 1.833410620689392} -11/07/2021 00:04:09 - INFO - __main__ - Step 20059: {'lr': 0.000481857319112918, 'samples': 3851328, 'steps': 20058, 'loss/train': 1.7501016855239868} -11/07/2021 00:04:10 - INFO - __main__ - Step 20060: {'lr': 0.0004818553343458368, 'samples': 3851520, 'steps': 20059, 'loss/train': 1.7878509759902954} -11/07/2021 00:04:11 - INFO - __main__ - Step 20061: {'lr': 0.00048185334947428525, 'samples': 3851712, 'steps': 20060, 'loss/train': 3.4654691219329834} -11/07/2021 00:04:11 - INFO - __main__ - Step 20062: {'lr': 0.0004818513644982642, 'samples': 3851904, 'steps': 20061, 'loss/train': 1.6801989078521729} -11/07/2021 00:04:11 - INFO - __main__ - Step 20063: {'lr': 0.0004818493794177744, 'samples': 3852096, 'steps': 20062, 'loss/train': 2.7569499015808105} -11/07/2021 00:04:12 - INFO - __main__ - Step 20064: {'lr': 0.00048184739423281695, 'samples': 3852288, 'steps': 20063, 'loss/train': 1.657804250717163} -11/07/2021 00:04:13 - INFO - __main__ - Step 20065: {'lr': 0.00048184540894339256, 'samples': 3852480, 'steps': 20064, 'loss/train': 1.6313239336013794} -11/07/2021 00:04:13 - INFO - __main__ - Step 20066: {'lr': 0.00048184342354950225, 'samples': 3852672, 'steps': 20065, 'loss/train': 1.8359761238098145} -11/07/2021 00:04:14 - INFO - __main__ - Step 20067: {'lr': 0.00048184143805114684, 'samples': 3852864, 'steps': 20066, 'loss/train': 1.2439062595367432} -11/07/2021 00:04:14 - INFO - __main__ - Step 20068: {'lr': 0.00048183945244832725, 'samples': 3853056, 'steps': 20067, 'loss/train': 2.3377492427825928} -11/07/2021 00:04:14 - INFO - __main__ - Step 20069: {'lr': 0.00048183746674104446, 'samples': 3853248, 'steps': 20068, 'loss/train': 1.7448499202728271} -11/07/2021 00:04:15 - INFO - __main__ - Step 20070: {'lr': 0.00048183548092929916, 'samples': 3853440, 'steps': 20069, 'loss/train': 1.6729365587234497} -11/07/2021 00:04:16 - INFO - __main__ - Step 20071: {'lr': 0.0004818334950130925, 'samples': 3853632, 'steps': 20070, 'loss/train': 1.792672038078308} -11/07/2021 00:04:16 - INFO - __main__ - Step 20072: {'lr': 0.00048183150899242514, 'samples': 3853824, 'steps': 20071, 'loss/train': 2.116844892501831} -11/07/2021 00:04:16 - INFO - __main__ - Step 20073: {'lr': 0.0004818295228672981, 'samples': 3854016, 'steps': 20072, 'loss/train': 2.090991258621216} -11/07/2021 00:04:17 - INFO - __main__ - Step 20074: {'lr': 0.0004818275366377123, 'samples': 3854208, 'steps': 20073, 'loss/train': 1.6128263473510742} -11/07/2021 00:04:18 - INFO - __main__ - Step 20075: {'lr': 0.00048182555030366854, 'samples': 3854400, 'steps': 20074, 'loss/train': 1.7799201011657715} -11/07/2021 00:04:18 - INFO - __main__ - Step 20076: {'lr': 0.0004818235638651678, 'samples': 3854592, 'steps': 20075, 'loss/train': 1.5875736474990845} -11/07/2021 00:04:18 - INFO - __main__ - Step 20077: {'lr': 0.0004818215773222109, 'samples': 3854784, 'steps': 20076, 'loss/train': 0.957347571849823} -11/07/2021 00:04:19 - INFO - __main__ - Step 20078: {'lr': 0.0004818195906747988, 'samples': 3854976, 'steps': 20077, 'loss/train': 1.4278732538223267} -11/07/2021 00:04:19 - INFO - __main__ - Step 20079: {'lr': 0.0004818176039229324, 'samples': 3855168, 'steps': 20078, 'loss/train': 1.445941686630249} -11/07/2021 00:04:20 - INFO - __main__ - Step 20080: {'lr': 0.0004818156170666125, 'samples': 3855360, 'steps': 20079, 'loss/train': 1.3033205270767212} -11/07/2021 00:04:21 - INFO - __main__ - Step 20081: {'lr': 0.0004818136301058401, 'samples': 3855552, 'steps': 20080, 'loss/train': 1.856467604637146} -11/07/2021 00:04:21 - INFO - __main__ - Step 20082: {'lr': 0.0004818116430406161, 'samples': 3855744, 'steps': 20081, 'loss/train': 1.8351445198059082} -11/07/2021 00:04:21 - INFO - __main__ - Step 20083: {'lr': 0.00048180965587094125, 'samples': 3855936, 'steps': 20082, 'loss/train': 1.6008447408676147} -11/07/2021 00:04:22 - INFO - __main__ - Step 20084: {'lr': 0.00048180766859681664, 'samples': 3856128, 'steps': 20083, 'loss/train': 1.4347810745239258} -11/07/2021 00:04:23 - INFO - __main__ - Step 20085: {'lr': 0.000481805681218243, 'samples': 3856320, 'steps': 20084, 'loss/train': 1.5482618808746338} -11/07/2021 00:04:23 - INFO - __main__ - Step 20086: {'lr': 0.0004818036937352214, 'samples': 3856512, 'steps': 20085, 'loss/train': 1.7869243621826172} -11/07/2021 00:04:23 - INFO - __main__ - Step 20087: {'lr': 0.0004818017061477525, 'samples': 3856704, 'steps': 20086, 'loss/train': 1.2508975267410278} -11/07/2021 00:04:24 - INFO - __main__ - Step 20088: {'lr': 0.00048179971845583734, 'samples': 3856896, 'steps': 20087, 'loss/train': 1.7061606645584106} -11/07/2021 00:04:24 - INFO - __main__ - Step 20089: {'lr': 0.00048179773065947683, 'samples': 3857088, 'steps': 20088, 'loss/train': 1.7644474506378174} -11/07/2021 00:04:24 - INFO - __main__ - Step 20090: {'lr': 0.0004817957427586719, 'samples': 3857280, 'steps': 20089, 'loss/train': 1.3199182748794556} -11/07/2021 00:04:25 - INFO - __main__ - Step 20091: {'lr': 0.00048179375475342333, 'samples': 3857472, 'steps': 20090, 'loss/train': 1.5608344078063965} -11/07/2021 00:04:26 - INFO - __main__ - Step 20092: {'lr': 0.00048179176664373214, 'samples': 3857664, 'steps': 20091, 'loss/train': 1.464991569519043} -11/07/2021 00:04:26 - INFO - __main__ - Step 20093: {'lr': 0.0004817897784295991, 'samples': 3857856, 'steps': 20092, 'loss/train': 2.1888020038604736} -11/07/2021 00:04:26 - INFO - __main__ - Step 20094: {'lr': 0.0004817877901110251, 'samples': 3858048, 'steps': 20093, 'loss/train': 2.046032428741455} -11/07/2021 00:04:27 - INFO - __main__ - Step 20095: {'lr': 0.0004817858016880112, 'samples': 3858240, 'steps': 20094, 'loss/train': 2.0262649059295654} -11/07/2021 00:04:28 - INFO - __main__ - Step 20096: {'lr': 0.0004817838131605582, 'samples': 3858432, 'steps': 20095, 'loss/train': 1.6248929500579834} -11/07/2021 00:04:28 - INFO - __main__ - Step 20097: {'lr': 0.00048178182452866694, 'samples': 3858624, 'steps': 20096, 'loss/train': 1.839397668838501} -11/07/2021 00:04:28 - INFO - __main__ - Step 20098: {'lr': 0.0004817798357923384, 'samples': 3858816, 'steps': 20097, 'loss/train': 1.6831201314926147} -11/07/2021 00:04:29 - INFO - __main__ - Step 20099: {'lr': 0.00048177784695157335, 'samples': 3859008, 'steps': 20098, 'loss/train': 1.7522791624069214} -11/07/2021 00:04:29 - INFO - __main__ - Step 20100: {'lr': 0.00048177585800637286, 'samples': 3859200, 'steps': 20099, 'loss/train': 1.5155513286590576} -11/07/2021 00:04:30 - INFO - __main__ - Step 20101: {'lr': 0.00048177386895673774, 'samples': 3859392, 'steps': 20100, 'loss/train': 1.6983426809310913} -11/07/2021 00:04:30 - INFO - __main__ - Step 20102: {'lr': 0.0004817718798026689, 'samples': 3859584, 'steps': 20101, 'loss/train': 1.6446847915649414} -11/07/2021 00:04:31 - INFO - __main__ - Step 20103: {'lr': 0.0004817698905441672, 'samples': 3859776, 'steps': 20102, 'loss/train': 1.7305409908294678} -11/07/2021 00:04:31 - INFO - __main__ - Step 20104: {'lr': 0.0004817679011812336, 'samples': 3859968, 'steps': 20103, 'loss/train': 1.7872097492218018} -11/07/2021 00:04:32 - INFO - __main__ - Step 20105: {'lr': 0.00048176591171386884, 'samples': 3860160, 'steps': 20104, 'loss/train': 1.3828495740890503} -11/07/2021 00:04:33 - INFO - __main__ - Step 20106: {'lr': 0.0004817639221420741, 'samples': 3860352, 'steps': 20105, 'loss/train': 2.1160809993743896} -11/07/2021 00:04:33 - INFO - __main__ - Step 20107: {'lr': 0.00048176193246585, 'samples': 3860544, 'steps': 20106, 'loss/train': 1.92433500289917} -11/07/2021 00:04:33 - INFO - __main__ - Step 20108: {'lr': 0.00048175994268519765, 'samples': 3860736, 'steps': 20107, 'loss/train': 1.871787428855896} -11/07/2021 00:04:34 - INFO - __main__ - Step 20109: {'lr': 0.00048175795280011775, 'samples': 3860928, 'steps': 20108, 'loss/train': 1.485747218132019} -11/07/2021 00:04:34 - INFO - __main__ - Step 20110: {'lr': 0.00048175596281061135, 'samples': 3861120, 'steps': 20109, 'loss/train': 1.0940872430801392} -11/07/2021 00:04:35 - INFO - __main__ - Step 20111: {'lr': 0.00048175397271667925, 'samples': 3861312, 'steps': 20110, 'loss/train': 0.7007030844688416} -11/07/2021 00:04:35 - INFO - __main__ - Step 20112: {'lr': 0.00048175198251832244, 'samples': 3861504, 'steps': 20111, 'loss/train': 1.479366660118103} -11/07/2021 00:04:36 - INFO - __main__ - Step 20113: {'lr': 0.00048174999221554173, 'samples': 3861696, 'steps': 20112, 'loss/train': 1.4841296672821045} -11/07/2021 00:04:36 - INFO - __main__ - Step 20114: {'lr': 0.000481748001808338, 'samples': 3861888, 'steps': 20113, 'loss/train': 1.2486543655395508} -11/07/2021 00:04:36 - INFO - __main__ - Step 20115: {'lr': 0.00048174601129671223, 'samples': 3862080, 'steps': 20114, 'loss/train': 0.9452338218688965} -11/07/2021 00:04:37 - INFO - __main__ - Step 20116: {'lr': 0.00048174402068066534, 'samples': 3862272, 'steps': 20115, 'loss/train': 1.4266661405563354} -11/07/2021 00:04:38 - INFO - __main__ - Step 20117: {'lr': 0.0004817420299601981, 'samples': 3862464, 'steps': 20116, 'loss/train': 2.441077947616577} -11/07/2021 00:04:38 - INFO - __main__ - Step 20118: {'lr': 0.0004817400391353115, 'samples': 3862656, 'steps': 20117, 'loss/train': 1.3544243574142456} -11/07/2021 00:04:39 - INFO - __main__ - Step 20119: {'lr': 0.00048173804820600646, 'samples': 3862848, 'steps': 20118, 'loss/train': 1.8580822944641113} -11/07/2021 00:04:39 - INFO - __main__ - Step 20120: {'lr': 0.0004817360571722838, 'samples': 3863040, 'steps': 20119, 'loss/train': 1.5528236627578735} -11/07/2021 00:04:40 - INFO - __main__ - Step 20121: {'lr': 0.00048173406603414445, 'samples': 3863232, 'steps': 20120, 'loss/train': 1.140297293663025} -11/07/2021 00:04:40 - INFO - __main__ - Step 20122: {'lr': 0.00048173207479158933, 'samples': 3863424, 'steps': 20121, 'loss/train': 0.44841068983078003} -11/07/2021 00:04:41 - INFO - __main__ - Step 20123: {'lr': 0.0004817300834446192, 'samples': 3863616, 'steps': 20122, 'loss/train': 1.983655571937561} -11/07/2021 00:04:41 - INFO - __main__ - Step 20124: {'lr': 0.0004817280919932352, 'samples': 3863808, 'steps': 20123, 'loss/train': 1.480665683746338} -11/07/2021 00:04:42 - INFO - __main__ - Step 20125: {'lr': 0.000481726100437438, 'samples': 3864000, 'steps': 20124, 'loss/train': 1.859569787979126} -11/07/2021 00:04:42 - INFO - __main__ - Step 20126: {'lr': 0.00048172410877722865, 'samples': 3864192, 'steps': 20125, 'loss/train': 1.8540468215942383} -11/07/2021 00:04:43 - INFO - __main__ - Step 20127: {'lr': 0.00048172211701260807, 'samples': 3864384, 'steps': 20126, 'loss/train': 1.706778645515442} -11/07/2021 00:04:43 - INFO - __main__ - Step 20128: {'lr': 0.0004817201251435769, 'samples': 3864576, 'steps': 20127, 'loss/train': 1.863878846168518} -11/07/2021 00:04:44 - INFO - __main__ - Step 20129: {'lr': 0.00048171813317013633, 'samples': 3864768, 'steps': 20128, 'loss/train': 1.8926697969436646} -11/07/2021 00:04:44 - INFO - __main__ - Step 20130: {'lr': 0.00048171614109228714, 'samples': 3864960, 'steps': 20129, 'loss/train': 1.369523048400879} -11/07/2021 00:04:44 - INFO - __main__ - Step 20131: {'lr': 0.0004817141489100302, 'samples': 3865152, 'steps': 20130, 'loss/train': 1.67985999584198} -11/07/2021 00:04:45 - INFO - __main__ - Step 20132: {'lr': 0.0004817121566233665, 'samples': 3865344, 'steps': 20131, 'loss/train': 1.905426025390625} -11/07/2021 00:04:46 - INFO - __main__ - Step 20133: {'lr': 0.0004817101642322968, 'samples': 3865536, 'steps': 20132, 'loss/train': 1.1768156290054321} -11/07/2021 00:04:46 - INFO - __main__ - Step 20134: {'lr': 0.00048170817173682215, 'samples': 3865728, 'steps': 20133, 'loss/train': 1.8267666101455688} -11/07/2021 00:04:47 - INFO - __main__ - Step 20135: {'lr': 0.00048170617913694333, 'samples': 3865920, 'steps': 20134, 'loss/train': 1.8322908878326416} -11/07/2021 00:04:47 - INFO - __main__ - Step 20136: {'lr': 0.00048170418643266125, 'samples': 3866112, 'steps': 20135, 'loss/train': 1.625266671180725} -11/07/2021 00:04:47 - INFO - __main__ - Step 20137: {'lr': 0.00048170219362397685, 'samples': 3866304, 'steps': 20136, 'loss/train': 1.84674870967865} -11/07/2021 00:04:48 - INFO - __main__ - Step 20138: {'lr': 0.00048170020071089105, 'samples': 3866496, 'steps': 20137, 'loss/train': 1.6670939922332764} -11/07/2021 00:04:49 - INFO - __main__ - Step 20139: {'lr': 0.00048169820769340476, 'samples': 3866688, 'steps': 20138, 'loss/train': 1.7214689254760742} -11/07/2021 00:04:49 - INFO - __main__ - Step 20140: {'lr': 0.0004816962145715188, 'samples': 3866880, 'steps': 20139, 'loss/train': 1.1451594829559326} -11/07/2021 00:04:49 - INFO - __main__ - Step 20141: {'lr': 0.00048169422134523404, 'samples': 3867072, 'steps': 20140, 'loss/train': 1.5689804553985596} -11/07/2021 00:04:50 - INFO - __main__ - Step 20142: {'lr': 0.0004816922280145515, 'samples': 3867264, 'steps': 20141, 'loss/train': 1.038034439086914} -11/07/2021 00:04:51 - INFO - __main__ - Step 20143: {'lr': 0.00048169023457947195, 'samples': 3867456, 'steps': 20142, 'loss/train': 2.1106817722320557} -11/07/2021 00:04:51 - INFO - __main__ - Step 20144: {'lr': 0.0004816882410399964, 'samples': 3867648, 'steps': 20143, 'loss/train': 0.2228638380765915} -11/07/2021 00:04:51 - INFO - __main__ - Step 20145: {'lr': 0.00048168624739612577, 'samples': 3867840, 'steps': 20144, 'loss/train': 1.7859293222427368} -11/07/2021 00:04:52 - INFO - __main__ - Step 20146: {'lr': 0.0004816842536478608, 'samples': 3868032, 'steps': 20145, 'loss/train': 2.007317066192627} -11/07/2021 00:04:52 - INFO - __main__ - Step 20147: {'lr': 0.00048168225979520254, 'samples': 3868224, 'steps': 20146, 'loss/train': 1.6304503679275513} -11/07/2021 00:04:53 - INFO - __main__ - Step 20148: {'lr': 0.0004816802658381518, 'samples': 3868416, 'steps': 20147, 'loss/train': 1.0293740034103394} -11/07/2021 00:04:54 - INFO - __main__ - Step 20149: {'lr': 0.00048167827177670946, 'samples': 3868608, 'steps': 20148, 'loss/train': 1.9682854413986206} -11/07/2021 00:04:54 - INFO - __main__ - Step 20150: {'lr': 0.0004816762776108765, 'samples': 3868800, 'steps': 20149, 'loss/train': 1.8390581607818604} -11/07/2021 00:04:54 - INFO - __main__ - Step 20151: {'lr': 0.0004816742833406538, 'samples': 3868992, 'steps': 20150, 'loss/train': 2.0192196369171143} -11/07/2021 00:04:55 - INFO - __main__ - Step 20152: {'lr': 0.0004816722889660423, 'samples': 3869184, 'steps': 20151, 'loss/train': 1.632528305053711} -11/07/2021 00:04:56 - INFO - __main__ - Step 20153: {'lr': 0.00048167029448704273, 'samples': 3869376, 'steps': 20152, 'loss/train': 1.5875515937805176} -11/07/2021 00:04:56 - INFO - __main__ - Step 20154: {'lr': 0.00048166829990365615, 'samples': 3869568, 'steps': 20153, 'loss/train': 2.2908775806427} -11/07/2021 00:04:56 - INFO - __main__ - Step 20155: {'lr': 0.0004816663052158834, 'samples': 3869760, 'steps': 20154, 'loss/train': 2.725844621658325} -11/07/2021 00:04:57 - INFO - __main__ - Step 20156: {'lr': 0.0004816643104237254, 'samples': 3869952, 'steps': 20155, 'loss/train': 1.3609468936920166} -11/07/2021 00:04:57 - INFO - __main__ - Step 20157: {'lr': 0.00048166231552718305, 'samples': 3870144, 'steps': 20156, 'loss/train': 1.328758716583252} -11/07/2021 00:04:57 - INFO - __main__ - Step 20158: {'lr': 0.0004816603205262572, 'samples': 3870336, 'steps': 20157, 'loss/train': 1.8653146028518677} -11/07/2021 00:04:58 - INFO - __main__ - Step 20159: {'lr': 0.0004816583254209488, 'samples': 3870528, 'steps': 20158, 'loss/train': 1.5926765203475952} -11/07/2021 00:04:59 - INFO - __main__ - Step 20160: {'lr': 0.00048165633021125874, 'samples': 3870720, 'steps': 20159, 'loss/train': 1.8898913860321045} -11/07/2021 00:04:59 - INFO - __main__ - Step 20161: {'lr': 0.0004816543348971879, 'samples': 3870912, 'steps': 20160, 'loss/train': 1.354554295539856} -11/07/2021 00:05:00 - INFO - __main__ - Step 20162: {'lr': 0.0004816523394787372, 'samples': 3871104, 'steps': 20161, 'loss/train': 1.504123568534851} -11/07/2021 00:05:00 - INFO - __main__ - Step 20163: {'lr': 0.00048165034395590756, 'samples': 3871296, 'steps': 20162, 'loss/train': 1.4880510568618774} -11/07/2021 00:05:01 - INFO - __main__ - Step 20164: {'lr': 0.0004816483483286998, 'samples': 3871488, 'steps': 20163, 'loss/train': 1.560563087463379} -11/07/2021 00:05:01 - INFO - __main__ - Step 20165: {'lr': 0.0004816463525971149, 'samples': 3871680, 'steps': 20164, 'loss/train': 1.6374289989471436} -11/07/2021 00:05:01 - INFO - __main__ - Step 20166: {'lr': 0.0004816443567611537, 'samples': 3871872, 'steps': 20165, 'loss/train': 1.8701469898223877} -11/07/2021 00:05:02 - INFO - __main__ - Step 20167: {'lr': 0.00048164236082081713, 'samples': 3872064, 'steps': 20166, 'loss/train': 1.5199638605117798} -11/07/2021 00:05:02 - INFO - __main__ - Step 20168: {'lr': 0.00048164036477610616, 'samples': 3872256, 'steps': 20167, 'loss/train': 1.2595298290252686} -11/07/2021 00:05:03 - INFO - __main__ - Step 20169: {'lr': 0.00048163836862702154, 'samples': 3872448, 'steps': 20168, 'loss/train': 0.5841023921966553} -11/07/2021 00:05:04 - INFO - __main__ - Step 20170: {'lr': 0.0004816363723735643, 'samples': 3872640, 'steps': 20169, 'loss/train': 1.7465553283691406} -11/07/2021 00:05:04 - INFO - __main__ - Step 20171: {'lr': 0.00048163437601573525, 'samples': 3872832, 'steps': 20170, 'loss/train': 1.8244073390960693} -11/07/2021 00:05:04 - INFO - __main__ - Step 20172: {'lr': 0.00048163237955353526, 'samples': 3873024, 'steps': 20171, 'loss/train': 1.614901065826416} -11/07/2021 00:05:05 - INFO - __main__ - Step 20173: {'lr': 0.00048163038298696537, 'samples': 3873216, 'steps': 20172, 'loss/train': 1.7259612083435059} -11/07/2021 00:05:06 - INFO - __main__ - Step 20174: {'lr': 0.00048162838631602643, 'samples': 3873408, 'steps': 20173, 'loss/train': 1.643215298652649} -11/07/2021 00:05:06 - INFO - __main__ - Step 20175: {'lr': 0.00048162638954071926, 'samples': 3873600, 'steps': 20174, 'loss/train': 1.6356228590011597} -11/07/2021 00:05:07 - INFO - __main__ - Step 20176: {'lr': 0.0004816243926610448, 'samples': 3873792, 'steps': 20175, 'loss/train': 1.7864456176757812} -11/07/2021 00:05:07 - INFO - __main__ - Step 20177: {'lr': 0.000481622395677004, 'samples': 3873984, 'steps': 20176, 'loss/train': 1.7050282955169678} -11/07/2021 00:05:07 - INFO - __main__ - Step 20178: {'lr': 0.0004816203985885977, 'samples': 3874176, 'steps': 20177, 'loss/train': 1.7557024955749512} -11/07/2021 00:05:08 - INFO - __main__ - Step 20179: {'lr': 0.0004816184013958268, 'samples': 3874368, 'steps': 20178, 'loss/train': 1.1449915170669556} -11/07/2021 00:05:09 - INFO - __main__ - Step 20180: {'lr': 0.0004816164040986923, 'samples': 3874560, 'steps': 20179, 'loss/train': 1.9531196355819702} -11/07/2021 00:05:09 - INFO - __main__ - Step 20181: {'lr': 0.00048161440669719496, 'samples': 3874752, 'steps': 20180, 'loss/train': 1.1801620721817017} -11/07/2021 00:05:09 - INFO - __main__ - Step 20182: {'lr': 0.00048161240919133573, 'samples': 3874944, 'steps': 20181, 'loss/train': 1.5637428760528564} -11/07/2021 00:05:10 - INFO - __main__ - Step 20183: {'lr': 0.00048161041158111564, 'samples': 3875136, 'steps': 20182, 'loss/train': 1.7784135341644287} -11/07/2021 00:05:11 - INFO - __main__ - Step 20184: {'lr': 0.0004816084138665353, 'samples': 3875328, 'steps': 20183, 'loss/train': 1.9407933950424194} -11/07/2021 00:05:11 - INFO - __main__ - Step 20185: {'lr': 0.00048160641604759593, 'samples': 3875520, 'steps': 20184, 'loss/train': 1.4560564756393433} -11/07/2021 00:05:12 - INFO - __main__ - Step 20186: {'lr': 0.0004816044181242982, 'samples': 3875712, 'steps': 20185, 'loss/train': 0.9393236041069031} -11/07/2021 00:05:12 - INFO - __main__ - Step 20187: {'lr': 0.0004816024200966431, 'samples': 3875904, 'steps': 20186, 'loss/train': 1.409131646156311} -11/07/2021 00:05:12 - INFO - __main__ - Step 20188: {'lr': 0.00048160042196463153, 'samples': 3876096, 'steps': 20187, 'loss/train': 1.8766820430755615} -11/07/2021 00:05:13 - INFO - __main__ - Step 20189: {'lr': 0.00048159842372826446, 'samples': 3876288, 'steps': 20188, 'loss/train': 1.3698480129241943} -11/07/2021 00:05:14 - INFO - __main__ - Step 20190: {'lr': 0.0004815964253875426, 'samples': 3876480, 'steps': 20189, 'loss/train': 1.751710295677185} -11/07/2021 00:05:14 - INFO - __main__ - Step 20191: {'lr': 0.000481594426942467, 'samples': 3876672, 'steps': 20190, 'loss/train': 1.5956690311431885} -11/07/2021 00:05:14 - INFO - __main__ - Step 20192: {'lr': 0.0004815924283930385, 'samples': 3876864, 'steps': 20191, 'loss/train': 0.9469591975212097} -11/07/2021 00:05:15 - INFO - __main__ - Step 20193: {'lr': 0.0004815904297392582, 'samples': 3877056, 'steps': 20192, 'loss/train': 1.4563199281692505} -11/07/2021 00:05:15 - INFO - __main__ - Step 20194: {'lr': 0.00048158843098112657, 'samples': 3877248, 'steps': 20193, 'loss/train': 1.7004506587982178} -11/07/2021 00:05:16 - INFO - __main__ - Step 20195: {'lr': 0.00048158643211864495, 'samples': 3877440, 'steps': 20194, 'loss/train': 1.642877221107483} -11/07/2021 00:05:16 - INFO - __main__ - Step 20196: {'lr': 0.000481584433151814, 'samples': 3877632, 'steps': 20195, 'loss/train': 1.9405843019485474} -11/07/2021 00:05:17 - INFO - __main__ - Step 20197: {'lr': 0.00048158243408063465, 'samples': 3877824, 'steps': 20196, 'loss/train': 1.7496905326843262} -11/07/2021 00:05:17 - INFO - __main__ - Step 20198: {'lr': 0.0004815804349051078, 'samples': 3878016, 'steps': 20197, 'loss/train': 0.8492428660392761} -11/07/2021 00:05:17 - INFO - __main__ - Step 20199: {'lr': 0.0004815784356252344, 'samples': 3878208, 'steps': 20198, 'loss/train': 1.2568089962005615} -11/07/2021 00:05:18 - INFO - __main__ - Step 20200: {'lr': 0.0004815764362410154, 'samples': 3878400, 'steps': 20199, 'loss/train': 1.2597923278808594} -11/07/2021 00:05:19 - INFO - __main__ - Step 20201: {'lr': 0.0004815744367524516, 'samples': 3878592, 'steps': 20200, 'loss/train': 1.7262325286865234} -11/07/2021 00:05:19 - INFO - __main__ - Step 20202: {'lr': 0.0004815724371595439, 'samples': 3878784, 'steps': 20201, 'loss/train': 1.7526211738586426} -11/07/2021 00:05:19 - INFO - __main__ - Step 20203: {'lr': 0.00048157043746229324, 'samples': 3878976, 'steps': 20202, 'loss/train': 1.2760602235794067} -11/07/2021 00:05:20 - INFO - __main__ - Step 20204: {'lr': 0.0004815684376607006, 'samples': 3879168, 'steps': 20203, 'loss/train': 1.6638855934143066} -11/07/2021 00:05:21 - INFO - __main__ - Step 20205: {'lr': 0.0004815664377547667, 'samples': 3879360, 'steps': 20204, 'loss/train': 1.7330559492111206} -11/07/2021 00:05:22 - INFO - __main__ - Step 20206: {'lr': 0.00048156443774449254, 'samples': 3879552, 'steps': 20205, 'loss/train': 1.6828453540802002} -11/07/2021 00:05:22 - INFO - __main__ - Step 20207: {'lr': 0.00048156243762987905, 'samples': 3879744, 'steps': 20206, 'loss/train': 1.5695830583572388} -11/07/2021 00:05:22 - INFO - __main__ - Step 20208: {'lr': 0.00048156043741092705, 'samples': 3879936, 'steps': 20207, 'loss/train': 1.6807202100753784} -11/07/2021 00:05:23 - INFO - __main__ - Step 20209: {'lr': 0.00048155843708763755, 'samples': 3880128, 'steps': 20208, 'loss/train': 1.7855095863342285} -11/07/2021 00:05:23 - INFO - __main__ - Step 20210: {'lr': 0.0004815564366600114, 'samples': 3880320, 'steps': 20209, 'loss/train': 1.778202772140503} -11/07/2021 00:05:23 - INFO - __main__ - Step 20211: {'lr': 0.0004815544361280494, 'samples': 3880512, 'steps': 20210, 'loss/train': 1.3515102863311768} -11/07/2021 00:05:25 - INFO - __main__ - Step 20212: {'lr': 0.00048155243549175263, 'samples': 3880704, 'steps': 20211, 'loss/train': 1.462814211845398} -11/07/2021 00:05:25 - INFO - __main__ - Step 20213: {'lr': 0.00048155043475112184, 'samples': 3880896, 'steps': 20212, 'loss/train': 1.8552340269088745} -11/07/2021 00:05:25 - INFO - __main__ - Step 20214: {'lr': 0.0004815484339061581, 'samples': 3881088, 'steps': 20213, 'loss/train': 1.4173270463943481} -11/07/2021 00:05:26 - INFO - __main__ - Step 20215: {'lr': 0.0004815464329568621, 'samples': 3881280, 'steps': 20214, 'loss/train': 1.4815483093261719} -11/07/2021 00:05:26 - INFO - __main__ - Step 20216: {'lr': 0.00048154443190323495, 'samples': 3881472, 'steps': 20215, 'loss/train': 1.7627679109573364} -11/07/2021 00:05:27 - INFO - __main__ - Step 20217: {'lr': 0.0004815424307452774, 'samples': 3881664, 'steps': 20216, 'loss/train': 1.7265102863311768} -11/07/2021 00:05:28 - INFO - __main__ - Step 20218: {'lr': 0.0004815404294829904, 'samples': 3881856, 'steps': 20217, 'loss/train': 1.392214059829712} -11/07/2021 00:05:28 - INFO - __main__ - Step 20219: {'lr': 0.0004815384281163748, 'samples': 3882048, 'steps': 20218, 'loss/train': 1.5504920482635498} -11/07/2021 00:05:28 - INFO - __main__ - Step 20220: {'lr': 0.0004815364266454316, 'samples': 3882240, 'steps': 20219, 'loss/train': 1.3972241878509521} -11/07/2021 00:05:29 - INFO - __main__ - Step 20221: {'lr': 0.00048153442507016173, 'samples': 3882432, 'steps': 20220, 'loss/train': 2.0695390701293945} -11/07/2021 00:05:29 - INFO - __main__ - Step 20222: {'lr': 0.00048153242339056594, 'samples': 3882624, 'steps': 20221, 'loss/train': 0.68231600522995} -11/07/2021 00:05:30 - INFO - __main__ - Step 20223: {'lr': 0.0004815304216066453, 'samples': 3882816, 'steps': 20222, 'loss/train': 1.10834538936615} -11/07/2021 00:05:30 - INFO - __main__ - Step 20224: {'lr': 0.0004815284197184005, 'samples': 3883008, 'steps': 20223, 'loss/train': 0.35353773832321167} -11/07/2021 00:05:31 - INFO - __main__ - Step 20225: {'lr': 0.0004815264177258326, 'samples': 3883200, 'steps': 20224, 'loss/train': 2.266817569732666} -11/07/2021 00:05:31 - INFO - __main__ - Step 20226: {'lr': 0.00048152441562894255, 'samples': 3883392, 'steps': 20225, 'loss/train': 1.4499667882919312} -11/07/2021 00:05:31 - INFO - __main__ - Step 20227: {'lr': 0.0004815224134277311, 'samples': 3883584, 'steps': 20226, 'loss/train': 0.39159658551216125} -11/07/2021 00:05:32 - INFO - __main__ - Step 20228: {'lr': 0.00048152041112219926, 'samples': 3883776, 'steps': 20227, 'loss/train': 1.5912150144577026} -11/07/2021 00:05:33 - INFO - __main__ - Step 20229: {'lr': 0.0004815184087123479, 'samples': 3883968, 'steps': 20228, 'loss/train': 1.2535486221313477} -11/07/2021 00:05:33 - INFO - __main__ - Step 20230: {'lr': 0.0004815164061981778, 'samples': 3884160, 'steps': 20229, 'loss/train': 1.611649990081787} -11/07/2021 00:05:33 - INFO - __main__ - Step 20231: {'lr': 0.0004815144035796901, 'samples': 3884352, 'steps': 20230, 'loss/train': 1.4114503860473633} -11/07/2021 00:05:34 - INFO - __main__ - Step 20232: {'lr': 0.0004815124008568856, 'samples': 3884544, 'steps': 20231, 'loss/train': 1.8829342126846313} -11/07/2021 00:05:35 - INFO - __main__ - Step 20233: {'lr': 0.00048151039802976517, 'samples': 3884736, 'steps': 20232, 'loss/train': 1.1377381086349487} -11/07/2021 00:05:35 - INFO - __main__ - Step 20234: {'lr': 0.00048150839509832966, 'samples': 3884928, 'steps': 20233, 'loss/train': 1.054691195487976} -11/07/2021 00:05:36 - INFO - __main__ - Step 20235: {'lr': 0.0004815063920625801, 'samples': 3885120, 'steps': 20234, 'loss/train': 1.5479214191436768} -11/07/2021 00:05:36 - INFO - __main__ - Step 20236: {'lr': 0.00048150438892251724, 'samples': 3885312, 'steps': 20235, 'loss/train': 1.5953601598739624} -11/07/2021 00:05:36 - INFO - __main__ - Step 20237: {'lr': 0.00048150238567814217, 'samples': 3885504, 'steps': 20236, 'loss/train': 1.5126464366912842} -11/07/2021 00:05:37 - INFO - __main__ - Step 20238: {'lr': 0.0004815003823294557, 'samples': 3885696, 'steps': 20237, 'loss/train': 1.6836274862289429} -11/07/2021 00:05:38 - INFO - __main__ - Step 20239: {'lr': 0.0004814983788764587, 'samples': 3885888, 'steps': 20238, 'loss/train': 1.861586332321167} -11/07/2021 00:05:38 - INFO - __main__ - Step 20240: {'lr': 0.00048149637531915215, 'samples': 3886080, 'steps': 20239, 'loss/train': 1.6984490156173706} -11/07/2021 00:05:38 - INFO - __main__ - Step 20241: {'lr': 0.00048149437165753684, 'samples': 3886272, 'steps': 20240, 'loss/train': 1.4807697534561157} -11/07/2021 00:05:39 - INFO - __main__ - Step 20242: {'lr': 0.00048149236789161374, 'samples': 3886464, 'steps': 20241, 'loss/train': 1.7156288623809814} -11/07/2021 00:05:40 - INFO - __main__ - Step 20243: {'lr': 0.0004814903640213838, 'samples': 3886656, 'steps': 20242, 'loss/train': 1.6998640298843384} -11/07/2021 00:05:40 - INFO - __main__ - Step 20244: {'lr': 0.0004814883600468478, 'samples': 3886848, 'steps': 20243, 'loss/train': 1.2742701768875122} -11/07/2021 00:05:40 - INFO - __main__ - Step 20245: {'lr': 0.0004814863559680068, 'samples': 3887040, 'steps': 20244, 'loss/train': 1.1318578720092773} -11/07/2021 00:05:41 - INFO - __main__ - Step 20246: {'lr': 0.00048148435178486156, 'samples': 3887232, 'steps': 20245, 'loss/train': 0.7671478986740112} -11/07/2021 00:05:41 - INFO - __main__ - Step 20247: {'lr': 0.00048148234749741304, 'samples': 3887424, 'steps': 20246, 'loss/train': 1.5640817880630493} -11/07/2021 00:05:42 - INFO - __main__ - Step 20248: {'lr': 0.0004814803431056622, 'samples': 3887616, 'steps': 20247, 'loss/train': 1.6258333921432495} -11/07/2021 00:05:43 - INFO - __main__ - Step 20249: {'lr': 0.0004814783386096099, 'samples': 3887808, 'steps': 20248, 'loss/train': 1.5049912929534912} -11/07/2021 00:05:43 - INFO - __main__ - Step 20250: {'lr': 0.00048147633400925693, 'samples': 3888000, 'steps': 20249, 'loss/train': 1.4869909286499023} -11/07/2021 00:05:43 - INFO - __main__ - Step 20251: {'lr': 0.00048147432930460433, 'samples': 3888192, 'steps': 20250, 'loss/train': 1.4749869108200073} -11/07/2021 00:05:44 - INFO - __main__ - Step 20252: {'lr': 0.00048147232449565305, 'samples': 3888384, 'steps': 20251, 'loss/train': 1.609937310218811} -11/07/2021 00:05:44 - INFO - __main__ - Step 20253: {'lr': 0.00048147031958240384, 'samples': 3888576, 'steps': 20252, 'loss/train': 1.487269639968872} -11/07/2021 00:05:45 - INFO - __main__ - Step 20254: {'lr': 0.00048146831456485776, 'samples': 3888768, 'steps': 20253, 'loss/train': 1.6627097129821777} -11/07/2021 00:05:45 - INFO - __main__ - Step 20255: {'lr': 0.0004814663094430155, 'samples': 3888960, 'steps': 20254, 'loss/train': 1.5854759216308594} -11/07/2021 00:05:46 - INFO - __main__ - Step 20256: {'lr': 0.00048146430421687817, 'samples': 3889152, 'steps': 20255, 'loss/train': 1.851196527481079} -11/07/2021 00:05:46 - INFO - __main__ - Step 20257: {'lr': 0.00048146229888644656, 'samples': 3889344, 'steps': 20256, 'loss/train': 1.4912571907043457} -11/07/2021 00:05:47 - INFO - __main__ - Step 20258: {'lr': 0.00048146029345172165, 'samples': 3889536, 'steps': 20257, 'loss/train': 1.307698369026184} -11/07/2021 00:05:47 - INFO - __main__ - Step 20259: {'lr': 0.0004814582879127043, 'samples': 3889728, 'steps': 20258, 'loss/train': 1.6989030838012695} -11/07/2021 00:05:48 - INFO - __main__ - Step 20260: {'lr': 0.0004814562822693954, 'samples': 3889920, 'steps': 20259, 'loss/train': 1.2388862371444702} -11/07/2021 00:05:48 - INFO - __main__ - Step 20261: {'lr': 0.00048145427652179583, 'samples': 3890112, 'steps': 20260, 'loss/train': 2.0702147483825684} -11/07/2021 00:05:49 - INFO - __main__ - Step 20262: {'lr': 0.0004814522706699066, 'samples': 3890304, 'steps': 20261, 'loss/train': 1.5232195854187012} -11/07/2021 00:05:49 - INFO - __main__ - Step 20263: {'lr': 0.00048145026471372855, 'samples': 3890496, 'steps': 20262, 'loss/train': 1.651239275932312} -11/07/2021 00:05:50 - INFO - __main__ - Step 20264: {'lr': 0.0004814482586532626, 'samples': 3890688, 'steps': 20263, 'loss/train': 1.808660626411438} -11/07/2021 00:05:50 - INFO - __main__ - Step 20265: {'lr': 0.00048144625248850955, 'samples': 3890880, 'steps': 20264, 'loss/train': 1.8271234035491943} -11/07/2021 00:05:51 - INFO - __main__ - Step 20266: {'lr': 0.0004814442462194704, 'samples': 3891072, 'steps': 20265, 'loss/train': 1.453490972518921} -11/07/2021 00:05:51 - INFO - __main__ - Step 20267: {'lr': 0.0004814422398461461, 'samples': 3891264, 'steps': 20266, 'loss/train': 0.8812512159347534} -11/07/2021 00:05:51 - INFO - __main__ - Step 20268: {'lr': 0.00048144023336853746, 'samples': 3891456, 'steps': 20267, 'loss/train': 1.5316873788833618} -11/07/2021 00:05:52 - INFO - __main__ - Step 20269: {'lr': 0.00048143822678664545, 'samples': 3891648, 'steps': 20268, 'loss/train': 1.776229739189148} -11/07/2021 00:05:53 - INFO - __main__ - Step 20270: {'lr': 0.00048143622010047096, 'samples': 3891840, 'steps': 20269, 'loss/train': 1.6957920789718628} -11/07/2021 00:05:53 - INFO - __main__ - Step 20271: {'lr': 0.0004814342133100149, 'samples': 3892032, 'steps': 20270, 'loss/train': 1.6003910303115845} -11/07/2021 00:05:54 - INFO - __main__ - Step 20272: {'lr': 0.00048143220641527805, 'samples': 3892224, 'steps': 20271, 'loss/train': 0.8694155812263489} -11/07/2021 00:05:54 - INFO - __main__ - Step 20273: {'lr': 0.0004814301994162615, 'samples': 3892416, 'steps': 20272, 'loss/train': 1.7320939302444458} -11/07/2021 00:05:55 - INFO - __main__ - Step 20274: {'lr': 0.000481428192312966, 'samples': 3892608, 'steps': 20273, 'loss/train': 1.8822886943817139} -11/07/2021 00:05:55 - INFO - __main__ - Step 20275: {'lr': 0.0004814261851053926, 'samples': 3892800, 'steps': 20274, 'loss/train': 1.6996090412139893} -11/07/2021 00:05:56 - INFO - __main__ - Step 20276: {'lr': 0.00048142417779354214, 'samples': 3892992, 'steps': 20275, 'loss/train': 1.6192679405212402} -11/07/2021 00:05:56 - INFO - __main__ - Step 20277: {'lr': 0.0004814221703774155, 'samples': 3893184, 'steps': 20276, 'loss/train': 1.9482049942016602} -11/07/2021 00:05:56 - INFO - __main__ - Step 20278: {'lr': 0.00048142016285701356, 'samples': 3893376, 'steps': 20277, 'loss/train': 1.8611611127853394} -11/07/2021 00:05:57 - INFO - __main__ - Step 20279: {'lr': 0.00048141815523233735, 'samples': 3893568, 'steps': 20278, 'loss/train': 1.4806917905807495} -11/07/2021 00:05:58 - INFO - __main__ - Step 20280: {'lr': 0.00048141614750338757, 'samples': 3893760, 'steps': 20279, 'loss/train': 1.6425491571426392} -11/07/2021 00:05:58 - INFO - __main__ - Step 20281: {'lr': 0.00048141413967016535, 'samples': 3893952, 'steps': 20280, 'loss/train': 1.5973680019378662} -11/07/2021 00:05:58 - INFO - __main__ - Step 20282: {'lr': 0.00048141213173267145, 'samples': 3894144, 'steps': 20281, 'loss/train': 2.633230447769165} -11/07/2021 00:05:59 - INFO - __main__ - Step 20283: {'lr': 0.0004814101236909068, 'samples': 3894336, 'steps': 20282, 'loss/train': 1.511309266090393} -11/07/2021 00:05:59 - INFO - __main__ - Step 20284: {'lr': 0.00048140811554487234, 'samples': 3894528, 'steps': 20283, 'loss/train': 0.8016172647476196} -11/07/2021 00:06:00 - INFO - __main__ - Step 20285: {'lr': 0.000481406107294569, 'samples': 3894720, 'steps': 20284, 'loss/train': 1.877029538154602} -11/07/2021 00:06:01 - INFO - __main__ - Step 20286: {'lr': 0.0004814040989399975, 'samples': 3894912, 'steps': 20285, 'loss/train': 0.7532491087913513} -11/07/2021 00:06:01 - INFO - __main__ - Step 20287: {'lr': 0.000481402090481159, 'samples': 3895104, 'steps': 20286, 'loss/train': 1.5717297792434692} -11/07/2021 00:06:01 - INFO - __main__ - Step 20288: {'lr': 0.0004814000819180543, 'samples': 3895296, 'steps': 20287, 'loss/train': 1.7239612340927124} -11/07/2021 00:06:02 - INFO - __main__ - Step 20289: {'lr': 0.00048139807325068423, 'samples': 3895488, 'steps': 20288, 'loss/train': 0.5814390778541565} -11/07/2021 00:06:03 - INFO - __main__ - Step 20290: {'lr': 0.0004813960644790498, 'samples': 3895680, 'steps': 20289, 'loss/train': 1.498609185218811} -11/07/2021 00:06:03 - INFO - __main__ - Step 20291: {'lr': 0.00048139405560315186, 'samples': 3895872, 'steps': 20290, 'loss/train': 1.5184834003448486} -11/07/2021 00:06:03 - INFO - __main__ - Step 20292: {'lr': 0.0004813920466229913, 'samples': 3896064, 'steps': 20291, 'loss/train': 1.1429948806762695} -11/07/2021 00:06:04 - INFO - __main__ - Step 20293: {'lr': 0.0004813900375385691, 'samples': 3896256, 'steps': 20292, 'loss/train': 2.788299083709717} -11/07/2021 00:06:04 - INFO - __main__ - Step 20294: {'lr': 0.0004813880283498861, 'samples': 3896448, 'steps': 20293, 'loss/train': 1.6631759405136108} -11/07/2021 00:06:05 - INFO - __main__ - Step 20295: {'lr': 0.00048138601905694324, 'samples': 3896640, 'steps': 20294, 'loss/train': 1.9560562372207642} -11/07/2021 00:06:06 - INFO - __main__ - Step 20296: {'lr': 0.0004813840096597414, 'samples': 3896832, 'steps': 20295, 'loss/train': 1.8317298889160156} -11/07/2021 00:06:06 - INFO - __main__ - Step 20297: {'lr': 0.00048138200015828146, 'samples': 3897024, 'steps': 20296, 'loss/train': 1.5180134773254395} -11/07/2021 00:06:06 - INFO - __main__ - Step 20298: {'lr': 0.00048137999055256444, 'samples': 3897216, 'steps': 20297, 'loss/train': 1.6339629888534546} -11/07/2021 00:06:07 - INFO - __main__ - Step 20299: {'lr': 0.0004813779808425911, 'samples': 3897408, 'steps': 20298, 'loss/train': 1.5810672044754028} -11/07/2021 00:06:07 - INFO - __main__ - Step 20300: {'lr': 0.0004813759710283624, 'samples': 3897600, 'steps': 20299, 'loss/train': 1.6098214387893677} -11/07/2021 00:06:08 - INFO - __main__ - Step 20301: {'lr': 0.0004813739611098793, 'samples': 3897792, 'steps': 20300, 'loss/train': 1.575744867324829} -11/07/2021 00:06:09 - INFO - __main__ - Step 20302: {'lr': 0.00048137195108714266, 'samples': 3897984, 'steps': 20301, 'loss/train': 0.8211456537246704} -11/07/2021 00:06:09 - INFO - __main__ - Step 20303: {'lr': 0.00048136994096015343, 'samples': 3898176, 'steps': 20302, 'loss/train': 1.674750566482544} -11/07/2021 00:06:09 - INFO - __main__ - Step 20304: {'lr': 0.00048136793072891236, 'samples': 3898368, 'steps': 20303, 'loss/train': 0.8324387669563293} -11/07/2021 00:06:10 - INFO - __main__ - Step 20305: {'lr': 0.00048136592039342053, 'samples': 3898560, 'steps': 20304, 'loss/train': 1.7422436475753784} -11/07/2021 00:06:11 - INFO - __main__ - Step 20306: {'lr': 0.0004813639099536789, 'samples': 3898752, 'steps': 20305, 'loss/train': 1.2161121368408203} -11/07/2021 00:06:11 - INFO - __main__ - Step 20307: {'lr': 0.0004813618994096881, 'samples': 3898944, 'steps': 20306, 'loss/train': 1.429854393005371} -11/07/2021 00:06:11 - INFO - __main__ - Step 20308: {'lr': 0.0004813598887614492, 'samples': 3899136, 'steps': 20307, 'loss/train': 1.7629268169403076} -11/07/2021 00:06:12 - INFO - __main__ - Step 20309: {'lr': 0.0004813578780089632, 'samples': 3899328, 'steps': 20308, 'loss/train': 1.690520167350769} -11/07/2021 00:06:12 - INFO - __main__ - Step 20310: {'lr': 0.00048135586715223087, 'samples': 3899520, 'steps': 20309, 'loss/train': 1.9133003950119019} -11/07/2021 00:06:13 - INFO - __main__ - Step 20311: {'lr': 0.00048135385619125316, 'samples': 3899712, 'steps': 20310, 'loss/train': 1.6012578010559082} -11/07/2021 00:06:13 - INFO - __main__ - Step 20312: {'lr': 0.00048135184512603093, 'samples': 3899904, 'steps': 20311, 'loss/train': 0.8476859927177429} -11/07/2021 00:06:14 - INFO - __main__ - Step 20313: {'lr': 0.00048134983395656516, 'samples': 3900096, 'steps': 20312, 'loss/train': 1.9039126634597778} -11/07/2021 00:06:14 - INFO - __main__ - Step 20314: {'lr': 0.00048134782268285676, 'samples': 3900288, 'steps': 20313, 'loss/train': 1.62480890750885} -11/07/2021 00:06:15 - INFO - __main__ - Step 20315: {'lr': 0.00048134581130490655, 'samples': 3900480, 'steps': 20314, 'loss/train': 1.6092077493667603} -11/07/2021 00:06:15 - INFO - __main__ - Step 20316: {'lr': 0.0004813437998227155, 'samples': 3900672, 'steps': 20315, 'loss/train': 0.9180329442024231} -11/07/2021 00:06:16 - INFO - __main__ - Step 20317: {'lr': 0.00048134178823628455, 'samples': 3900864, 'steps': 20316, 'loss/train': 1.6326484680175781} -11/07/2021 00:06:16 - INFO - __main__ - Step 20318: {'lr': 0.0004813397765456145, 'samples': 3901056, 'steps': 20317, 'loss/train': 1.1808871030807495} -11/07/2021 00:06:17 - INFO - __main__ - Step 20319: {'lr': 0.00048133776475070637, 'samples': 3901248, 'steps': 20318, 'loss/train': 1.7565277814865112} -11/07/2021 00:06:17 - INFO - __main__ - Step 20320: {'lr': 0.00048133575285156093, 'samples': 3901440, 'steps': 20319, 'loss/train': 1.70387864112854} -11/07/2021 00:06:18 - INFO - __main__ - Step 20321: {'lr': 0.00048133374084817927, 'samples': 3901632, 'steps': 20320, 'loss/train': 0.9791955947875977} -11/07/2021 00:06:18 - INFO - __main__ - Step 20322: {'lr': 0.00048133172874056213, 'samples': 3901824, 'steps': 20321, 'loss/train': 1.9139925241470337} -11/07/2021 00:06:19 - INFO - __main__ - Step 20323: {'lr': 0.0004813297165287105, 'samples': 3902016, 'steps': 20322, 'loss/train': 1.494025707244873} -11/07/2021 00:06:19 - INFO - __main__ - Step 20324: {'lr': 0.00048132770421262526, 'samples': 3902208, 'steps': 20323, 'loss/train': 1.3976880311965942} -11/07/2021 00:06:19 - INFO - __main__ - Step 20325: {'lr': 0.00048132569179230736, 'samples': 3902400, 'steps': 20324, 'loss/train': 1.5085182189941406} -11/07/2021 00:06:20 - INFO - __main__ - Step 20326: {'lr': 0.0004813236792677577, 'samples': 3902592, 'steps': 20325, 'loss/train': 1.7275755405426025} -11/07/2021 00:06:21 - INFO - __main__ - Step 20327: {'lr': 0.00048132166663897703, 'samples': 3902784, 'steps': 20326, 'loss/train': 1.1090145111083984} -11/07/2021 00:06:21 - INFO - __main__ - Step 20328: {'lr': 0.0004813196539059665, 'samples': 3902976, 'steps': 20327, 'loss/train': 1.493940830230713} -11/07/2021 00:06:22 - INFO - __main__ - Step 20329: {'lr': 0.0004813176410687269, 'samples': 3903168, 'steps': 20328, 'loss/train': 1.5074502229690552} -11/07/2021 00:06:22 - INFO - __main__ - Step 20330: {'lr': 0.00048131562812725904, 'samples': 3903360, 'steps': 20329, 'loss/train': 1.7746409177780151} -11/07/2021 00:06:22 - INFO - __main__ - Step 20331: {'lr': 0.000481313615081564, 'samples': 3903552, 'steps': 20330, 'loss/train': 5.725223064422607} -11/07/2021 00:06:23 - INFO - __main__ - Step 20332: {'lr': 0.00048131160193164266, 'samples': 3903744, 'steps': 20331, 'loss/train': 1.2115626335144043} -11/07/2021 00:06:24 - INFO - __main__ - Step 20333: {'lr': 0.0004813095886774958, 'samples': 3903936, 'steps': 20332, 'loss/train': 1.7731631994247437} -11/07/2021 00:06:24 - INFO - __main__ - Step 20334: {'lr': 0.00048130757531912447, 'samples': 3904128, 'steps': 20333, 'loss/train': 1.7672775983810425} -11/07/2021 00:06:24 - INFO - __main__ - Step 20335: {'lr': 0.00048130556185652947, 'samples': 3904320, 'steps': 20334, 'loss/train': 1.9235178232192993} -11/07/2021 00:06:25 - INFO - __main__ - Step 20336: {'lr': 0.0004813035482897118, 'samples': 3904512, 'steps': 20335, 'loss/train': 1.494145393371582} -11/07/2021 00:06:25 - INFO - __main__ - Step 20337: {'lr': 0.00048130153461867225, 'samples': 3904704, 'steps': 20336, 'loss/train': 1.8234186172485352} -11/07/2021 00:06:26 - INFO - __main__ - Step 20338: {'lr': 0.0004812995208434119, 'samples': 3904896, 'steps': 20337, 'loss/train': 1.926507592201233} -11/07/2021 00:06:27 - INFO - __main__ - Step 20339: {'lr': 0.00048129750696393144, 'samples': 3905088, 'steps': 20338, 'loss/train': 1.6730066537857056} -11/07/2021 00:06:27 - INFO - __main__ - Step 20340: {'lr': 0.00048129549298023196, 'samples': 3905280, 'steps': 20339, 'loss/train': 1.868593692779541} -11/07/2021 00:06:27 - INFO - __main__ - Step 20341: {'lr': 0.0004812934788923143, 'samples': 3905472, 'steps': 20340, 'loss/train': 1.4159256219863892} -11/07/2021 00:06:28 - INFO - __main__ - Step 20342: {'lr': 0.00048129146470017933, 'samples': 3905664, 'steps': 20341, 'loss/train': 1.5150226354599} -11/07/2021 00:06:29 - INFO - __main__ - Step 20343: {'lr': 0.000481289450403828, 'samples': 3905856, 'steps': 20342, 'loss/train': 1.8831218481063843} -11/07/2021 00:06:29 - INFO - __main__ - Step 20344: {'lr': 0.0004812874360032613, 'samples': 3906048, 'steps': 20343, 'loss/train': 1.6416627168655396} -11/07/2021 00:06:29 - INFO - __main__ - Step 20345: {'lr': 0.0004812854214984799, 'samples': 3906240, 'steps': 20344, 'loss/train': 1.546629548072815} -11/07/2021 00:06:30 - INFO - __main__ - Step 20346: {'lr': 0.000481283406889485, 'samples': 3906432, 'steps': 20345, 'loss/train': 1.5926127433776855} -11/07/2021 00:06:30 - INFO - __main__ - Step 20347: {'lr': 0.00048128139217627725, 'samples': 3906624, 'steps': 20346, 'loss/train': 1.4639637470245361} -11/07/2021 00:06:31 - INFO - __main__ - Step 20348: {'lr': 0.00048127937735885774, 'samples': 3906816, 'steps': 20347, 'loss/train': 1.5859371423721313} -11/07/2021 00:06:32 - INFO - __main__ - Step 20349: {'lr': 0.0004812773624372273, 'samples': 3907008, 'steps': 20348, 'loss/train': 1.5963897705078125} -11/07/2021 00:06:32 - INFO - __main__ - Step 20350: {'lr': 0.0004812753474113869, 'samples': 3907200, 'steps': 20349, 'loss/train': 1.499479055404663} -11/07/2021 00:06:32 - INFO - __main__ - Step 20351: {'lr': 0.0004812733322813373, 'samples': 3907392, 'steps': 20350, 'loss/train': 1.5133908987045288} -11/07/2021 00:06:33 - INFO - __main__ - Step 20352: {'lr': 0.00048127131704707953, 'samples': 3907584, 'steps': 20351, 'loss/train': 1.4553083181381226} -11/07/2021 00:06:34 - INFO - __main__ - Step 20353: {'lr': 0.0004812693017086145, 'samples': 3907776, 'steps': 20352, 'loss/train': 1.3714314699172974} -11/07/2021 00:06:34 - INFO - __main__ - Step 20354: {'lr': 0.00048126728626594315, 'samples': 3907968, 'steps': 20353, 'loss/train': 1.7511000633239746} -11/07/2021 00:06:34 - INFO - __main__ - Step 20355: {'lr': 0.00048126527071906623, 'samples': 3908160, 'steps': 20354, 'loss/train': 1.3997986316680908} -11/07/2021 00:06:35 - INFO - __main__ - Step 20356: {'lr': 0.0004812632550679848, 'samples': 3908352, 'steps': 20355, 'loss/train': 1.9811984300613403} -11/07/2021 00:06:35 - INFO - __main__ - Step 20357: {'lr': 0.00048126123931269973, 'samples': 3908544, 'steps': 20356, 'loss/train': 1.576959252357483} -11/07/2021 00:06:36 - INFO - __main__ - Step 20358: {'lr': 0.0004812592234532118, 'samples': 3908736, 'steps': 20357, 'loss/train': 1.697954535484314} -11/07/2021 00:06:36 - INFO - __main__ - Step 20359: {'lr': 0.00048125720748952216, 'samples': 3908928, 'steps': 20358, 'loss/train': 2.012244939804077} -11/07/2021 00:06:37 - INFO - __main__ - Step 20360: {'lr': 0.00048125519142163157, 'samples': 3909120, 'steps': 20359, 'loss/train': 1.5944174528121948} -11/07/2021 00:06:37 - INFO - __main__ - Step 20361: {'lr': 0.0004812531752495409, 'samples': 3909312, 'steps': 20360, 'loss/train': 1.4070159196853638} -11/07/2021 00:06:37 - INFO - __main__ - Step 20362: {'lr': 0.00048125115897325115, 'samples': 3909504, 'steps': 20361, 'loss/train': 0.829056441783905} -11/07/2021 00:06:39 - INFO - __main__ - Step 20363: {'lr': 0.0004812491425927632, 'samples': 3909696, 'steps': 20362, 'loss/train': 0.8168201446533203} -11/07/2021 00:06:39 - INFO - __main__ - Step 20364: {'lr': 0.000481247126108078, 'samples': 3909888, 'steps': 20363, 'loss/train': 1.7574135065078735} -11/07/2021 00:06:39 - INFO - __main__ - Step 20365: {'lr': 0.00048124510951919633, 'samples': 3910080, 'steps': 20364, 'loss/train': 1.841825008392334} -11/07/2021 00:06:40 - INFO - __main__ - Step 20366: {'lr': 0.0004812430928261192, 'samples': 3910272, 'steps': 20365, 'loss/train': 1.7087429761886597} -11/07/2021 00:06:40 - INFO - __main__ - Step 20367: {'lr': 0.00048124107602884753, 'samples': 3910464, 'steps': 20366, 'loss/train': 1.9521450996398926} -11/07/2021 00:06:40 - INFO - __main__ - Step 20368: {'lr': 0.0004812390591273822, 'samples': 3910656, 'steps': 20367, 'loss/train': 1.9141671657562256} -11/07/2021 00:06:41 - INFO - __main__ - Step 20369: {'lr': 0.00048123704212172416, 'samples': 3910848, 'steps': 20368, 'loss/train': 1.6557412147521973} -11/07/2021 00:06:42 - INFO - __main__ - Step 20370: {'lr': 0.0004812350250118742, 'samples': 3911040, 'steps': 20369, 'loss/train': 2.031385660171509} -11/07/2021 00:06:42 - INFO - __main__ - Step 20371: {'lr': 0.0004812330077978333, 'samples': 3911232, 'steps': 20370, 'loss/train': 1.6474828720092773} -11/07/2021 00:06:42 - INFO - __main__ - Step 20372: {'lr': 0.0004812309904796024, 'samples': 3911424, 'steps': 20371, 'loss/train': 1.5013188123703003} -11/07/2021 00:06:43 - INFO - __main__ - Step 20373: {'lr': 0.0004812289730571824, 'samples': 3911616, 'steps': 20372, 'loss/train': 1.3218475580215454} -11/07/2021 00:06:44 - INFO - __main__ - Step 20374: {'lr': 0.00048122695553057417, 'samples': 3911808, 'steps': 20373, 'loss/train': 1.8798691034317017} -11/07/2021 00:06:44 - INFO - __main__ - Step 20375: {'lr': 0.00048122493789977866, 'samples': 3912000, 'steps': 20374, 'loss/train': 1.5554605722427368} -11/07/2021 00:06:45 - INFO - __main__ - Step 20376: {'lr': 0.00048122292016479674, 'samples': 3912192, 'steps': 20375, 'loss/train': 1.2647597789764404} -11/07/2021 00:06:45 - INFO - __main__ - Step 20377: {'lr': 0.0004812209023256294, 'samples': 3912384, 'steps': 20376, 'loss/train': 5.788717746734619} -11/07/2021 00:06:45 - INFO - __main__ - Step 20378: {'lr': 0.0004812188843822775, 'samples': 3912576, 'steps': 20377, 'loss/train': 1.56723153591156} -11/07/2021 00:06:46 - INFO - __main__ - Step 20379: {'lr': 0.0004812168663347418, 'samples': 3912768, 'steps': 20378, 'loss/train': 1.824082374572754} -11/07/2021 00:06:47 - INFO - __main__ - Step 20380: {'lr': 0.00048121484818302343, 'samples': 3912960, 'steps': 20379, 'loss/train': 1.4097694158554077} -11/07/2021 00:06:47 - INFO - __main__ - Step 20381: {'lr': 0.00048121282992712324, 'samples': 3913152, 'steps': 20380, 'loss/train': 1.7064259052276611} -11/07/2021 00:06:47 - INFO - __main__ - Step 20382: {'lr': 0.00048121081156704207, 'samples': 3913344, 'steps': 20381, 'loss/train': 1.8313816785812378} -11/07/2021 00:06:48 - INFO - __main__ - Step 20383: {'lr': 0.00048120879310278094, 'samples': 3913536, 'steps': 20382, 'loss/train': 0.8189948797225952} -11/07/2021 00:06:48 - INFO - __main__ - Step 20384: {'lr': 0.00048120677453434066, 'samples': 3913728, 'steps': 20383, 'loss/train': 1.7617720365524292} -11/07/2021 00:06:49 - INFO - __main__ - Step 20385: {'lr': 0.00048120475586172217, 'samples': 3913920, 'steps': 20384, 'loss/train': 1.839327335357666} -11/07/2021 00:06:49 - INFO - __main__ - Step 20386: {'lr': 0.00048120273708492637, 'samples': 3914112, 'steps': 20385, 'loss/train': 1.4274979829788208} -11/07/2021 00:06:50 - INFO - __main__ - Step 20387: {'lr': 0.0004812007182039542, 'samples': 3914304, 'steps': 20386, 'loss/train': 1.763704538345337} -11/07/2021 00:06:50 - INFO - __main__ - Step 20388: {'lr': 0.00048119869921880656, 'samples': 3914496, 'steps': 20387, 'loss/train': 1.6406468152999878} -11/07/2021 00:06:50 - INFO - __main__ - Step 20389: {'lr': 0.00048119668012948434, 'samples': 3914688, 'steps': 20388, 'loss/train': 1.7437411546707153} -11/07/2021 00:06:51 - INFO - __main__ - Step 20390: {'lr': 0.0004811946609359885, 'samples': 3914880, 'steps': 20389, 'loss/train': 1.9098658561706543} -11/07/2021 00:06:52 - INFO - __main__ - Step 20391: {'lr': 0.00048119264163831987, 'samples': 3915072, 'steps': 20390, 'loss/train': 1.7999954223632812} -11/07/2021 00:06:52 - INFO - __main__ - Step 20392: {'lr': 0.0004811906222364794, 'samples': 3915264, 'steps': 20391, 'loss/train': 1.9051964282989502} -11/07/2021 00:06:53 - INFO - __main__ - Step 20393: {'lr': 0.00048118860273046804, 'samples': 3915456, 'steps': 20392, 'loss/train': 1.446048378944397} -11/07/2021 00:06:53 - INFO - __main__ - Step 20394: {'lr': 0.00048118658312028663, 'samples': 3915648, 'steps': 20393, 'loss/train': 1.7522889375686646} -11/07/2021 00:06:53 - INFO - __main__ - Step 20395: {'lr': 0.0004811845634059361, 'samples': 3915840, 'steps': 20394, 'loss/train': 1.8213437795639038} -11/07/2021 00:06:54 - INFO - __main__ - Step 20396: {'lr': 0.0004811825435874174, 'samples': 3916032, 'steps': 20395, 'loss/train': 1.985606074333191} -11/07/2021 00:06:55 - INFO - __main__ - Step 20397: {'lr': 0.0004811805236647314, 'samples': 3916224, 'steps': 20396, 'loss/train': 1.8085836172103882} -11/07/2021 00:06:55 - INFO - __main__ - Step 20398: {'lr': 0.0004811785036378791, 'samples': 3916416, 'steps': 20397, 'loss/train': 1.7104543447494507} -11/07/2021 00:06:55 - INFO - __main__ - Step 20399: {'lr': 0.0004811764835068613, 'samples': 3916608, 'steps': 20398, 'loss/train': 1.8539533615112305} -11/07/2021 00:06:56 - INFO - __main__ - Step 20400: {'lr': 0.0004811744632716789, 'samples': 3916800, 'steps': 20399, 'loss/train': 1.566263198852539} -11/07/2021 00:06:57 - INFO - __main__ - Step 20401: {'lr': 0.0004811724429323329, 'samples': 3916992, 'steps': 20400, 'loss/train': 1.7747917175292969} -11/07/2021 00:06:57 - INFO - __main__ - Step 20402: {'lr': 0.0004811704224888241, 'samples': 3917184, 'steps': 20401, 'loss/train': 1.5107859373092651} -11/07/2021 00:06:58 - INFO - __main__ - Step 20403: {'lr': 0.0004811684019411535, 'samples': 3917376, 'steps': 20402, 'loss/train': 1.6205443143844604} -11/07/2021 00:06:58 - INFO - __main__ - Step 20404: {'lr': 0.000481166381289322, 'samples': 3917568, 'steps': 20403, 'loss/train': 1.3343929052352905} -11/07/2021 00:06:58 - INFO - __main__ - Step 20405: {'lr': 0.0004811643605333305, 'samples': 3917760, 'steps': 20404, 'loss/train': 1.218215823173523} -11/07/2021 00:07:00 - INFO - __main__ - Step 20406: {'lr': 0.0004811623396731799, 'samples': 3917952, 'steps': 20405, 'loss/train': 0.7047050595283508} -11/07/2021 00:07:00 - INFO - __main__ - Step 20407: {'lr': 0.0004811603187088711, 'samples': 3918144, 'steps': 20406, 'loss/train': 1.5910859107971191} -11/07/2021 00:07:00 - INFO - __main__ - Step 20408: {'lr': 0.00048115829764040503, 'samples': 3918336, 'steps': 20407, 'loss/train': 1.57695734500885} -11/07/2021 00:07:01 - INFO - __main__ - Step 20409: {'lr': 0.0004811562764677826, 'samples': 3918528, 'steps': 20408, 'loss/train': 2.5446133613586426} -11/07/2021 00:07:01 - INFO - __main__ - Step 20410: {'lr': 0.00048115425519100474, 'samples': 3918720, 'steps': 20409, 'loss/train': 1.1176563501358032} -11/07/2021 00:07:01 - INFO - __main__ - Step 20411: {'lr': 0.0004811522338100723, 'samples': 3918912, 'steps': 20410, 'loss/train': 1.3174539804458618} -11/07/2021 00:07:02 - INFO - __main__ - Step 20412: {'lr': 0.0004811502123249862, 'samples': 3919104, 'steps': 20411, 'loss/train': 1.4090980291366577} -11/07/2021 00:07:03 - INFO - __main__ - Step 20413: {'lr': 0.0004811481907357475, 'samples': 3919296, 'steps': 20412, 'loss/train': 2.012705087661743} -11/07/2021 00:07:03 - INFO - __main__ - Step 20414: {'lr': 0.000481146169042357, 'samples': 3919488, 'steps': 20413, 'loss/train': 1.4001191854476929} -11/07/2021 00:07:03 - INFO - __main__ - Step 20415: {'lr': 0.0004811441472448155, 'samples': 3919680, 'steps': 20414, 'loss/train': 1.7796525955200195} -11/07/2021 00:07:04 - INFO - __main__ - Step 20416: {'lr': 0.000481142125343124, 'samples': 3919872, 'steps': 20415, 'loss/train': 1.5453555583953857} -11/07/2021 00:07:05 - INFO - __main__ - Step 20417: {'lr': 0.0004811401033372835, 'samples': 3920064, 'steps': 20416, 'loss/train': 1.4924184083938599} -11/07/2021 00:07:05 - INFO - __main__ - Step 20418: {'lr': 0.0004811380812272948, 'samples': 3920256, 'steps': 20417, 'loss/train': 1.5377154350280762} -11/07/2021 00:07:06 - INFO - __main__ - Step 20419: {'lr': 0.0004811360590131589, 'samples': 3920448, 'steps': 20418, 'loss/train': 1.6782273054122925} -11/07/2021 00:07:06 - INFO - __main__ - Step 20420: {'lr': 0.00048113403669487655, 'samples': 3920640, 'steps': 20419, 'loss/train': 1.8343051671981812} -11/07/2021 00:07:06 - INFO - __main__ - Step 20421: {'lr': 0.0004811320142724489, 'samples': 3920832, 'steps': 20420, 'loss/train': 1.8262782096862793} -11/07/2021 00:07:07 - INFO - __main__ - Step 20422: {'lr': 0.0004811299917458766, 'samples': 3921024, 'steps': 20421, 'loss/train': 1.108807921409607} -11/07/2021 00:07:08 - INFO - __main__ - Step 20423: {'lr': 0.00048112796911516076, 'samples': 3921216, 'steps': 20422, 'loss/train': 1.0290982723236084} -11/07/2021 00:07:08 - INFO - __main__ - Step 20424: {'lr': 0.00048112594638030225, 'samples': 3921408, 'steps': 20423, 'loss/train': 1.9398106336593628} -11/07/2021 00:07:08 - INFO - __main__ - Step 20425: {'lr': 0.00048112392354130194, 'samples': 3921600, 'steps': 20424, 'loss/train': 1.6747199296951294} -11/07/2021 00:07:09 - INFO - __main__ - Step 20426: {'lr': 0.00048112190059816076, 'samples': 3921792, 'steps': 20425, 'loss/train': 1.918034315109253} -11/07/2021 00:07:10 - INFO - __main__ - Step 20427: {'lr': 0.0004811198775508796, 'samples': 3921984, 'steps': 20426, 'loss/train': 1.8439780473709106} -11/07/2021 00:07:10 - INFO - __main__ - Step 20428: {'lr': 0.0004811178543994593, 'samples': 3922176, 'steps': 20427, 'loss/train': 1.639901876449585} -11/07/2021 00:07:10 - INFO - __main__ - Step 20429: {'lr': 0.000481115831143901, 'samples': 3922368, 'steps': 20428, 'loss/train': 1.5237764120101929} -11/07/2021 00:07:11 - INFO - __main__ - Step 20430: {'lr': 0.00048111380778420544, 'samples': 3922560, 'steps': 20429, 'loss/train': 1.6115946769714355} -11/07/2021 00:07:11 - INFO - __main__ - Step 20431: {'lr': 0.0004811117843203735, 'samples': 3922752, 'steps': 20430, 'loss/train': 1.7255394458770752} -11/07/2021 00:07:12 - INFO - __main__ - Step 20432: {'lr': 0.00048110976075240624, 'samples': 3922944, 'steps': 20431, 'loss/train': 1.728033185005188} -11/07/2021 00:07:13 - INFO - __main__ - Step 20433: {'lr': 0.00048110773708030444, 'samples': 3923136, 'steps': 20432, 'loss/train': 1.7761973142623901} -11/07/2021 00:07:13 - INFO - __main__ - Step 20434: {'lr': 0.00048110571330406903, 'samples': 3923328, 'steps': 20433, 'loss/train': 1.1125842332839966} -11/07/2021 00:07:13 - INFO - __main__ - Step 20435: {'lr': 0.0004811036894237011, 'samples': 3923520, 'steps': 20434, 'loss/train': 1.707023024559021} -11/07/2021 00:07:14 - INFO - __main__ - Step 20436: {'lr': 0.00048110166543920125, 'samples': 3923712, 'steps': 20435, 'loss/train': 1.7297285795211792} -11/07/2021 00:07:14 - INFO - __main__ - Step 20437: {'lr': 0.0004810996413505706, 'samples': 3923904, 'steps': 20436, 'loss/train': 1.4574823379516602} -11/07/2021 00:07:15 - INFO - __main__ - Step 20438: {'lr': 0.0004810976171578101, 'samples': 3924096, 'steps': 20437, 'loss/train': 1.896390676498413} -11/07/2021 00:07:15 - INFO - __main__ - Step 20439: {'lr': 0.00048109559286092047, 'samples': 3924288, 'steps': 20438, 'loss/train': 1.5400142669677734} -11/07/2021 00:07:16 - INFO - __main__ - Step 20440: {'lr': 0.0004810935684599028, 'samples': 3924480, 'steps': 20439, 'loss/train': 2.090247631072998} -11/07/2021 00:07:16 - INFO - __main__ - Step 20441: {'lr': 0.00048109154395475787, 'samples': 3924672, 'steps': 20440, 'loss/train': 1.6449775695800781} -11/07/2021 00:07:16 - INFO - __main__ - Step 20442: {'lr': 0.00048108951934548673, 'samples': 3924864, 'steps': 20441, 'loss/train': 1.5495688915252686} -11/07/2021 00:07:17 - INFO - __main__ - Step 20443: {'lr': 0.0004810874946320901, 'samples': 3925056, 'steps': 20442, 'loss/train': 1.2552711963653564} -11/07/2021 00:07:18 - INFO - __main__ - Step 20444: {'lr': 0.00048108546981456916, 'samples': 3925248, 'steps': 20443, 'loss/train': 1.7868911027908325} -11/07/2021 00:07:18 - INFO - __main__ - Step 20445: {'lr': 0.0004810834448929246, 'samples': 3925440, 'steps': 20444, 'loss/train': 1.2708492279052734} -11/07/2021 00:07:18 - INFO - __main__ - Step 20446: {'lr': 0.0004810814198671574, 'samples': 3925632, 'steps': 20445, 'loss/train': 1.5799506902694702} -11/07/2021 00:07:19 - INFO - __main__ - Step 20447: {'lr': 0.00048107939473726846, 'samples': 3925824, 'steps': 20446, 'loss/train': 1.6609207391738892} -11/07/2021 00:07:20 - INFO - __main__ - Step 20448: {'lr': 0.0004810773695032588, 'samples': 3926016, 'steps': 20447, 'loss/train': 1.4672976732254028} -11/07/2021 00:07:20 - INFO - __main__ - Step 20449: {'lr': 0.00048107534416512915, 'samples': 3926208, 'steps': 20448, 'loss/train': 1.3852245807647705} -11/07/2021 00:07:20 - INFO - __main__ - Step 20450: {'lr': 0.00048107331872288055, 'samples': 3926400, 'steps': 20449, 'loss/train': 1.5605368614196777} -11/07/2021 00:07:21 - INFO - __main__ - Step 20451: {'lr': 0.0004810712931765139, 'samples': 3926592, 'steps': 20450, 'loss/train': 1.519484519958496} -11/07/2021 00:07:21 - INFO - __main__ - Step 20452: {'lr': 0.00048106926752603007, 'samples': 3926784, 'steps': 20451, 'loss/train': 1.3224151134490967} -11/07/2021 00:07:22 - INFO - __main__ - Step 20453: {'lr': 0.00048106724177143, 'samples': 3926976, 'steps': 20452, 'loss/train': 1.81765615940094} -11/07/2021 00:07:23 - INFO - __main__ - Step 20454: {'lr': 0.00048106521591271455, 'samples': 3927168, 'steps': 20453, 'loss/train': 1.5886616706848145} -11/07/2021 00:07:23 - INFO - __main__ - Step 20455: {'lr': 0.00048106318994988476, 'samples': 3927360, 'steps': 20454, 'loss/train': 1.4082697629928589} -11/07/2021 00:07:23 - INFO - __main__ - Step 20456: {'lr': 0.0004810611638829414, 'samples': 3927552, 'steps': 20455, 'loss/train': 1.9213775396347046} -11/07/2021 00:07:24 - INFO - __main__ - Step 20457: {'lr': 0.00048105913771188545, 'samples': 3927744, 'steps': 20456, 'loss/train': 1.3209149837493896} -11/07/2021 00:07:24 - INFO - __main__ - Step 20458: {'lr': 0.00048105711143671783, 'samples': 3927936, 'steps': 20457, 'loss/train': 1.615772008895874} -11/07/2021 00:07:25 - INFO - __main__ - Step 20459: {'lr': 0.0004810550850574394, 'samples': 3928128, 'steps': 20458, 'loss/train': 1.7410712242126465} -11/07/2021 00:07:25 - INFO - __main__ - Step 20460: {'lr': 0.0004810530585740512, 'samples': 3928320, 'steps': 20459, 'loss/train': 1.7318370342254639} -11/07/2021 00:07:26 - INFO - __main__ - Step 20461: {'lr': 0.00048105103198655406, 'samples': 3928512, 'steps': 20460, 'loss/train': 1.6753515005111694} -11/07/2021 00:07:26 - INFO - __main__ - Step 20462: {'lr': 0.0004810490052949488, 'samples': 3928704, 'steps': 20461, 'loss/train': 1.2645617723464966} -11/07/2021 00:07:26 - INFO - __main__ - Step 20463: {'lr': 0.0004810469784992365, 'samples': 3928896, 'steps': 20462, 'loss/train': 1.3526378870010376} -11/07/2021 00:07:27 - INFO - __main__ - Step 20464: {'lr': 0.00048104495159941794, 'samples': 3929088, 'steps': 20463, 'loss/train': 1.643991470336914} -11/07/2021 00:07:28 - INFO - __main__ - Step 20465: {'lr': 0.00048104292459549413, 'samples': 3929280, 'steps': 20464, 'loss/train': 1.367877721786499} -11/07/2021 00:07:28 - INFO - __main__ - Step 20466: {'lr': 0.0004810408974874659, 'samples': 3929472, 'steps': 20465, 'loss/train': 1.9926568269729614} -11/07/2021 00:07:28 - INFO - __main__ - Step 20467: {'lr': 0.0004810388702753342, 'samples': 3929664, 'steps': 20466, 'loss/train': 1.3941420316696167} -11/07/2021 00:07:29 - INFO - __main__ - Step 20468: {'lr': 0.0004810368429591, 'samples': 3929856, 'steps': 20467, 'loss/train': 1.4060722589492798} -11/07/2021 00:07:30 - INFO - __main__ - Step 20469: {'lr': 0.00048103481553876415, 'samples': 3930048, 'steps': 20468, 'loss/train': 1.519386887550354} -11/07/2021 00:07:30 - INFO - __main__ - Step 20470: {'lr': 0.0004810327880143276, 'samples': 3930240, 'steps': 20469, 'loss/train': 1.8691269159317017} -11/07/2021 00:07:31 - INFO - __main__ - Step 20471: {'lr': 0.00048103076038579125, 'samples': 3930432, 'steps': 20470, 'loss/train': 1.5998656749725342} -11/07/2021 00:07:31 - INFO - __main__ - Step 20472: {'lr': 0.00048102873265315596, 'samples': 3930624, 'steps': 20471, 'loss/train': 1.6641353368759155} -11/07/2021 00:07:31 - INFO - __main__ - Step 20473: {'lr': 0.0004810267048164227, 'samples': 3930816, 'steps': 20472, 'loss/train': 1.4810760021209717} -11/07/2021 00:07:32 - INFO - __main__ - Step 20474: {'lr': 0.0004810246768755924, 'samples': 3931008, 'steps': 20473, 'loss/train': 1.4060907363891602} -11/07/2021 00:07:33 - INFO - __main__ - Step 20475: {'lr': 0.0004810226488306659, 'samples': 3931200, 'steps': 20474, 'loss/train': 1.388344407081604} -11/07/2021 00:07:33 - INFO - __main__ - Step 20476: {'lr': 0.00048102062068164413, 'samples': 3931392, 'steps': 20475, 'loss/train': 1.8781498670578003} -11/07/2021 00:07:33 - INFO - __main__ - Step 20477: {'lr': 0.0004810185924285281, 'samples': 3931584, 'steps': 20476, 'loss/train': 1.7342883348464966} -11/07/2021 00:07:34 - INFO - __main__ - Step 20478: {'lr': 0.00048101656407131864, 'samples': 3931776, 'steps': 20477, 'loss/train': 1.5581198930740356} -11/07/2021 00:07:34 - INFO - __main__ - Step 20479: {'lr': 0.00048101453561001667, 'samples': 3931968, 'steps': 20478, 'loss/train': 2.0187954902648926} -11/07/2021 00:07:35 - INFO - __main__ - Step 20480: {'lr': 0.00048101250704462315, 'samples': 3932160, 'steps': 20479, 'loss/train': 1.8168493509292603} -11/07/2021 00:07:36 - INFO - __main__ - Step 20481: {'lr': 0.0004810104783751389, 'samples': 3932352, 'steps': 20480, 'loss/train': 0.9651317000389099} -11/07/2021 00:07:36 - INFO - __main__ - Step 20482: {'lr': 0.00048100844960156496, 'samples': 3932544, 'steps': 20481, 'loss/train': 1.6677086353302002} -11/07/2021 00:07:36 - INFO - __main__ - Step 20483: {'lr': 0.0004810064207239021, 'samples': 3932736, 'steps': 20482, 'loss/train': 1.6259307861328125} -11/07/2021 00:07:37 - INFO - __main__ - Step 20484: {'lr': 0.0004810043917421514, 'samples': 3932928, 'steps': 20483, 'loss/train': 1.52870512008667} -11/07/2021 00:07:38 - INFO - __main__ - Step 20485: {'lr': 0.0004810023626563136, 'samples': 3933120, 'steps': 20484, 'loss/train': 2.194108009338379} -11/07/2021 00:07:38 - INFO - __main__ - Step 20486: {'lr': 0.0004810003334663898, 'samples': 3933312, 'steps': 20485, 'loss/train': 1.8448121547698975} -11/07/2021 00:07:38 - INFO - __main__ - Step 20487: {'lr': 0.0004809983041723807, 'samples': 3933504, 'steps': 20486, 'loss/train': 1.5697786808013916} -11/07/2021 00:07:39 - INFO - __main__ - Step 20488: {'lr': 0.00048099627477428744, 'samples': 3933696, 'steps': 20487, 'loss/train': 1.9467196464538574} -11/07/2021 00:07:39 - INFO - __main__ - Step 20489: {'lr': 0.0004809942452721107, 'samples': 3933888, 'steps': 20488, 'loss/train': 1.9454448223114014} -11/07/2021 00:07:40 - INFO - __main__ - Step 20490: {'lr': 0.0004809922156658516, 'samples': 3934080, 'steps': 20489, 'loss/train': 1.799720048904419} -11/07/2021 00:07:40 - INFO - __main__ - Step 20491: {'lr': 0.00048099018595551096, 'samples': 3934272, 'steps': 20490, 'loss/train': 1.9494208097457886} -11/07/2021 00:07:41 - INFO - __main__ - Step 20492: {'lr': 0.0004809881561410897, 'samples': 3934464, 'steps': 20491, 'loss/train': 1.471197485923767} -11/07/2021 00:07:41 - INFO - __main__ - Step 20493: {'lr': 0.00048098612622258873, 'samples': 3934656, 'steps': 20492, 'loss/train': 1.7744096517562866} -11/07/2021 00:07:42 - INFO - __main__ - Step 20494: {'lr': 0.00048098409620000906, 'samples': 3934848, 'steps': 20493, 'loss/train': 1.5430742502212524} -11/07/2021 00:07:43 - INFO - __main__ - Step 20495: {'lr': 0.00048098206607335135, 'samples': 3935040, 'steps': 20494, 'loss/train': 2.459300994873047} -11/07/2021 00:07:43 - INFO - __main__ - Step 20496: {'lr': 0.00048098003584261684, 'samples': 3935232, 'steps': 20495, 'loss/train': 1.3832452297210693} -11/07/2021 00:07:43 - INFO - __main__ - Step 20497: {'lr': 0.00048097800550780625, 'samples': 3935424, 'steps': 20496, 'loss/train': 1.6852710247039795} -11/07/2021 00:07:44 - INFO - __main__ - Step 20498: {'lr': 0.0004809759750689205, 'samples': 3935616, 'steps': 20497, 'loss/train': 1.6425219774246216} -11/07/2021 00:07:44 - INFO - __main__ - Step 20499: {'lr': 0.00048097394452596053, 'samples': 3935808, 'steps': 20498, 'loss/train': 1.1338953971862793} -11/07/2021 00:07:45 - INFO - __main__ - Step 20500: {'lr': 0.0004809719138789273, 'samples': 3936000, 'steps': 20499, 'loss/train': 1.6991946697235107} -11/07/2021 00:07:45 - INFO - __main__ - Step 20501: {'lr': 0.0004809698831278217, 'samples': 3936192, 'steps': 20500, 'loss/train': 1.4078713655471802} -11/07/2021 00:07:46 - INFO - __main__ - Step 20502: {'lr': 0.0004809678522726446, 'samples': 3936384, 'steps': 20501, 'loss/train': 1.7715500593185425} -11/07/2021 00:07:46 - INFO - __main__ - Step 20503: {'lr': 0.000480965821313397, 'samples': 3936576, 'steps': 20502, 'loss/train': 1.9850037097930908} -11/07/2021 00:07:46 - INFO - __main__ - Step 20504: {'lr': 0.0004809637902500797, 'samples': 3936768, 'steps': 20503, 'loss/train': 1.8379428386688232} -11/07/2021 00:07:47 - INFO - __main__ - Step 20505: {'lr': 0.00048096175908269375, 'samples': 3936960, 'steps': 20504, 'loss/train': 1.2110165357589722} -11/07/2021 00:07:48 - INFO - __main__ - Step 20506: {'lr': 0.00048095972781124, 'samples': 3937152, 'steps': 20505, 'loss/train': 1.5643447637557983} -11/07/2021 00:07:48 - INFO - __main__ - Step 20507: {'lr': 0.00048095769643571927, 'samples': 3937344, 'steps': 20506, 'loss/train': 1.2366441488265991} -11/07/2021 00:07:49 - INFO - __main__ - Step 20508: {'lr': 0.0004809556649561326, 'samples': 3937536, 'steps': 20507, 'loss/train': 1.807586669921875} -11/07/2021 00:07:49 - INFO - __main__ - Step 20509: {'lr': 0.0004809536333724809, 'samples': 3937728, 'steps': 20508, 'loss/train': 1.3580818176269531} -11/07/2021 00:07:49 - INFO - __main__ - Step 20510: {'lr': 0.000480951601684765, 'samples': 3937920, 'steps': 20509, 'loss/train': 1.1185882091522217} -11/07/2021 00:07:50 - INFO - __main__ - Step 20511: {'lr': 0.00048094956989298593, 'samples': 3938112, 'steps': 20510, 'loss/train': 0.8402307629585266} -11/07/2021 00:07:51 - INFO - __main__ - Step 20512: {'lr': 0.0004809475379971445, 'samples': 3938304, 'steps': 20511, 'loss/train': 1.676823377609253} -11/07/2021 00:07:51 - INFO - __main__ - Step 20513: {'lr': 0.00048094550599724176, 'samples': 3938496, 'steps': 20512, 'loss/train': 1.8695015907287598} -11/07/2021 00:07:52 - INFO - __main__ - Step 20514: {'lr': 0.0004809434738932785, 'samples': 3938688, 'steps': 20513, 'loss/train': 2.3277268409729004} -11/07/2021 00:07:52 - INFO - __main__ - Step 20515: {'lr': 0.0004809414416852557, 'samples': 3938880, 'steps': 20514, 'loss/train': 1.4669691324234009} -11/07/2021 00:07:53 - INFO - __main__ - Step 20516: {'lr': 0.00048093940937317414, 'samples': 3939072, 'steps': 20515, 'loss/train': 0.4304567873477936} -11/07/2021 00:07:53 - INFO - __main__ - Step 20517: {'lr': 0.00048093737695703494, 'samples': 3939264, 'steps': 20516, 'loss/train': 1.61251962184906} -11/07/2021 00:07:54 - INFO - __main__ - Step 20518: {'lr': 0.0004809353444368389, 'samples': 3939456, 'steps': 20517, 'loss/train': 1.7847530841827393} -11/07/2021 00:07:54 - INFO - __main__ - Step 20519: {'lr': 0.00048093331181258694, 'samples': 3939648, 'steps': 20518, 'loss/train': 1.8373972177505493} -11/07/2021 00:07:54 - INFO - __main__ - Step 20520: {'lr': 0.00048093127908428, 'samples': 3939840, 'steps': 20519, 'loss/train': 1.905431866645813} -11/07/2021 00:07:55 - INFO - __main__ - Step 20521: {'lr': 0.00048092924625191903, 'samples': 3940032, 'steps': 20520, 'loss/train': 1.9084038734436035} -11/07/2021 00:07:56 - INFO - __main__ - Step 20522: {'lr': 0.0004809272133155048, 'samples': 3940224, 'steps': 20521, 'loss/train': 1.740844964981079} -11/07/2021 00:07:56 - INFO - __main__ - Step 20523: {'lr': 0.00048092518027503844, 'samples': 3940416, 'steps': 20522, 'loss/train': 0.3389599025249481} -11/07/2021 00:07:56 - INFO - __main__ - Step 20524: {'lr': 0.0004809231471305208, 'samples': 3940608, 'steps': 20523, 'loss/train': 1.7005736827850342} -11/07/2021 00:07:57 - INFO - __main__ - Step 20525: {'lr': 0.0004809211138819526, 'samples': 3940800, 'steps': 20524, 'loss/train': 1.737630009651184} -11/07/2021 00:07:57 - INFO - __main__ - Step 20526: {'lr': 0.000480919080529335, 'samples': 3940992, 'steps': 20525, 'loss/train': 1.6942681074142456} -11/07/2021 00:07:58 - INFO - __main__ - Step 20527: {'lr': 0.0004809170470726688, 'samples': 3941184, 'steps': 20526, 'loss/train': 1.7566242218017578} -11/07/2021 00:07:58 - INFO - __main__ - Step 20528: {'lr': 0.00048091501351195495, 'samples': 3941376, 'steps': 20527, 'loss/train': 1.3537952899932861} -11/07/2021 00:07:59 - INFO - __main__ - Step 20529: {'lr': 0.00048091297984719433, 'samples': 3941568, 'steps': 20528, 'loss/train': 1.87349271774292} -11/07/2021 00:07:59 - INFO - __main__ - Step 20530: {'lr': 0.0004809109460783879, 'samples': 3941760, 'steps': 20529, 'loss/train': 1.070335030555725} -11/07/2021 00:07:59 - INFO - __main__ - Step 20531: {'lr': 0.0004809089122055366, 'samples': 3941952, 'steps': 20530, 'loss/train': 1.6043052673339844} -11/07/2021 00:08:00 - INFO - __main__ - Step 20532: {'lr': 0.00048090687822864125, 'samples': 3942144, 'steps': 20531, 'loss/train': 1.5132311582565308} -11/07/2021 00:08:01 - INFO - __main__ - Step 20533: {'lr': 0.00048090484414770284, 'samples': 3942336, 'steps': 20532, 'loss/train': 1.4935758113861084} -11/07/2021 00:08:01 - INFO - __main__ - Step 20534: {'lr': 0.00048090280996272234, 'samples': 3942528, 'steps': 20533, 'loss/train': 0.8592392802238464} -11/07/2021 00:08:01 - INFO - __main__ - Step 20535: {'lr': 0.0004809007756737005, 'samples': 3942720, 'steps': 20534, 'loss/train': 1.2228641510009766} -11/07/2021 00:08:02 - INFO - __main__ - Step 20536: {'lr': 0.0004808987412806384, 'samples': 3942912, 'steps': 20535, 'loss/train': 1.644826889038086} -11/07/2021 00:08:03 - INFO - __main__ - Step 20537: {'lr': 0.0004808967067835369, 'samples': 3943104, 'steps': 20536, 'loss/train': 1.395026683807373} -11/07/2021 00:08:03 - INFO - __main__ - Step 20538: {'lr': 0.00048089467218239687, 'samples': 3943296, 'steps': 20537, 'loss/train': 1.3494728803634644} -11/07/2021 00:08:04 - INFO - __main__ - Step 20539: {'lr': 0.00048089263747721925, 'samples': 3943488, 'steps': 20538, 'loss/train': 1.3986570835113525} -11/07/2021 00:08:04 - INFO - __main__ - Step 20540: {'lr': 0.000480890602668005, 'samples': 3943680, 'steps': 20539, 'loss/train': 1.3758116960525513} -11/07/2021 00:08:04 - INFO - __main__ - Step 20541: {'lr': 0.000480888567754755, 'samples': 3943872, 'steps': 20540, 'loss/train': 2.1255879402160645} -11/07/2021 00:08:05 - INFO - __main__ - Step 20542: {'lr': 0.0004808865327374701, 'samples': 3944064, 'steps': 20541, 'loss/train': 1.351326584815979} -11/07/2021 00:08:06 - INFO - __main__ - Step 20543: {'lr': 0.0004808844976161514, 'samples': 3944256, 'steps': 20542, 'loss/train': 1.5466766357421875} -11/07/2021 00:08:06 - INFO - __main__ - Step 20544: {'lr': 0.0004808824623907997, 'samples': 3944448, 'steps': 20543, 'loss/train': 0.4308020770549774} -11/07/2021 00:08:07 - INFO - __main__ - Step 20545: {'lr': 0.0004808804270614159, 'samples': 3944640, 'steps': 20544, 'loss/train': 1.7366575002670288} -11/07/2021 00:08:07 - INFO - __main__ - Step 20546: {'lr': 0.0004808783916280008, 'samples': 3944832, 'steps': 20545, 'loss/train': 1.2901078462600708} -11/07/2021 00:08:08 - INFO - __main__ - Step 20547: {'lr': 0.0004808763560905557, 'samples': 3945024, 'steps': 20546, 'loss/train': 1.660652995109558} -11/07/2021 00:08:08 - INFO - __main__ - Step 20548: {'lr': 0.0004808743204490811, 'samples': 3945216, 'steps': 20547, 'loss/train': 1.7535828351974487} -11/07/2021 00:08:09 - INFO - __main__ - Step 20549: {'lr': 0.00048087228470357823, 'samples': 3945408, 'steps': 20548, 'loss/train': 1.7939064502716064} -11/07/2021 00:08:09 - INFO - __main__ - Step 20550: {'lr': 0.00048087024885404777, 'samples': 3945600, 'steps': 20549, 'loss/train': 2.644047975540161} -11/07/2021 00:08:09 - INFO - __main__ - Step 20551: {'lr': 0.00048086821290049077, 'samples': 3945792, 'steps': 20550, 'loss/train': 0.19849666953086853} -11/07/2021 00:08:10 - INFO - __main__ - Step 20552: {'lr': 0.00048086617684290814, 'samples': 3945984, 'steps': 20551, 'loss/train': 1.6721930503845215} -11/07/2021 00:08:11 - INFO - __main__ - Step 20553: {'lr': 0.00048086414068130077, 'samples': 3946176, 'steps': 20552, 'loss/train': 1.5216528177261353} -11/07/2021 00:08:11 - INFO - __main__ - Step 20554: {'lr': 0.00048086210441566956, 'samples': 3946368, 'steps': 20553, 'loss/train': 1.0089731216430664} -11/07/2021 00:08:11 - INFO - __main__ - Step 20555: {'lr': 0.00048086006804601544, 'samples': 3946560, 'steps': 20554, 'loss/train': 1.431415319442749} -11/07/2021 00:08:12 - INFO - __main__ - Step 20556: {'lr': 0.00048085803157233933, 'samples': 3946752, 'steps': 20555, 'loss/train': 1.5693162679672241} -11/07/2021 00:08:12 - INFO - __main__ - Step 20557: {'lr': 0.00048085599499464216, 'samples': 3946944, 'steps': 20556, 'loss/train': 1.8088922500610352} -11/07/2021 00:08:13 - INFO - __main__ - Step 20558: {'lr': 0.0004808539583129249, 'samples': 3947136, 'steps': 20557, 'loss/train': 1.1080645322799683} -11/07/2021 00:08:14 - INFO - __main__ - Step 20559: {'lr': 0.0004808519215271884, 'samples': 3947328, 'steps': 20558, 'loss/train': 1.701973795890808} -11/07/2021 00:08:14 - INFO - __main__ - Step 20560: {'lr': 0.0004808498846374335, 'samples': 3947520, 'steps': 20559, 'loss/train': 1.7977246046066284} -11/07/2021 00:08:14 - INFO - __main__ - Step 20561: {'lr': 0.0004808478476436612, 'samples': 3947712, 'steps': 20560, 'loss/train': 0.45990151166915894} -11/07/2021 00:08:15 - INFO - __main__ - Step 20562: {'lr': 0.00048084581054587253, 'samples': 3947904, 'steps': 20561, 'loss/train': 1.6324790716171265} -11/07/2021 00:08:16 - INFO - __main__ - Step 20563: {'lr': 0.0004808437733440682, 'samples': 3948096, 'steps': 20562, 'loss/train': 1.7324868440628052} -11/07/2021 00:08:16 - INFO - __main__ - Step 20564: {'lr': 0.0004808417360382493, 'samples': 3948288, 'steps': 20563, 'loss/train': 1.4390432834625244} -11/07/2021 00:08:17 - INFO - __main__ - Step 20565: {'lr': 0.00048083969862841667, 'samples': 3948480, 'steps': 20564, 'loss/train': 1.9008427858352661} -11/07/2021 00:08:17 - INFO - __main__ - Step 20566: {'lr': 0.00048083766111457115, 'samples': 3948672, 'steps': 20565, 'loss/train': 1.5727438926696777} -11/07/2021 00:08:17 - INFO - __main__ - Step 20567: {'lr': 0.0004808356234967138, 'samples': 3948864, 'steps': 20566, 'loss/train': 1.1518347263336182} -11/07/2021 00:08:18 - INFO - __main__ - Step 20568: {'lr': 0.00048083358577484547, 'samples': 3949056, 'steps': 20567, 'loss/train': 0.17537906765937805} -11/07/2021 00:08:19 - INFO - __main__ - Step 20569: {'lr': 0.0004808315479489671, 'samples': 3949248, 'steps': 20568, 'loss/train': 1.7102299928665161} -11/07/2021 00:08:19 - INFO - __main__ - Step 20570: {'lr': 0.00048082951001907965, 'samples': 3949440, 'steps': 20569, 'loss/train': 1.6897586584091187} -11/07/2021 00:08:20 - INFO - __main__ - Step 20571: {'lr': 0.0004808274719851839, 'samples': 3949632, 'steps': 20570, 'loss/train': 1.6184511184692383} -11/07/2021 00:08:20 - INFO - __main__ - Step 20572: {'lr': 0.0004808254338472809, 'samples': 3949824, 'steps': 20571, 'loss/train': 1.9622421264648438} -11/07/2021 00:08:20 - INFO - __main__ - Step 20573: {'lr': 0.00048082339560537145, 'samples': 3950016, 'steps': 20572, 'loss/train': 1.6746459007263184} -11/07/2021 00:08:21 - INFO - __main__ - Step 20574: {'lr': 0.00048082135725945665, 'samples': 3950208, 'steps': 20573, 'loss/train': 2.0031142234802246} -11/07/2021 00:08:22 - INFO - __main__ - Step 20575: {'lr': 0.0004808193188095372, 'samples': 3950400, 'steps': 20574, 'loss/train': 1.841524362564087} -11/07/2021 00:08:22 - INFO - __main__ - Step 20576: {'lr': 0.0004808172802556142, 'samples': 3950592, 'steps': 20575, 'loss/train': 0.7797104716300964} -11/07/2021 00:08:22 - INFO - __main__ - Step 20577: {'lr': 0.0004808152415976885, 'samples': 3950784, 'steps': 20576, 'loss/train': 1.443601369857788} -11/07/2021 00:08:23 - INFO - __main__ - Step 20578: {'lr': 0.000480813202835761, 'samples': 3950976, 'steps': 20577, 'loss/train': 1.2981877326965332} -11/07/2021 00:08:24 - INFO - __main__ - Step 20579: {'lr': 0.0004808111639698326, 'samples': 3951168, 'steps': 20578, 'loss/train': 1.9003407955169678} -11/07/2021 00:08:24 - INFO - __main__ - Step 20580: {'lr': 0.0004808091249999043, 'samples': 3951360, 'steps': 20579, 'loss/train': 2.1749467849731445} -11/07/2021 00:08:24 - INFO - __main__ - Step 20581: {'lr': 0.0004808070859259769, 'samples': 3951552, 'steps': 20580, 'loss/train': 1.2194863557815552} -11/07/2021 00:08:25 - INFO - __main__ - Step 20582: {'lr': 0.0004808050467480515, 'samples': 3951744, 'steps': 20581, 'loss/train': 1.2447943687438965} -11/07/2021 00:08:25 - INFO - __main__ - Step 20583: {'lr': 0.0004808030074661288, 'samples': 3951936, 'steps': 20582, 'loss/train': 1.7001240253448486} -11/07/2021 00:08:26 - INFO - __main__ - Step 20584: {'lr': 0.0004808009680802099, 'samples': 3952128, 'steps': 20583, 'loss/train': 1.4224902391433716} -11/07/2021 00:08:26 - INFO - __main__ - Step 20585: {'lr': 0.00048079892859029564, 'samples': 3952320, 'steps': 20584, 'loss/train': 1.3647888898849487} -11/07/2021 00:08:27 - INFO - __main__ - Step 20586: {'lr': 0.00048079688899638684, 'samples': 3952512, 'steps': 20585, 'loss/train': 1.5216392278671265} -11/07/2021 00:08:27 - INFO - __main__ - Step 20587: {'lr': 0.0004807948492984846, 'samples': 3952704, 'steps': 20586, 'loss/train': 2.091362476348877} -11/07/2021 00:08:27 - INFO - __main__ - Step 20588: {'lr': 0.0004807928094965898, 'samples': 3952896, 'steps': 20587, 'loss/train': 1.597800612449646} -11/07/2021 00:08:28 - INFO - __main__ - Step 20589: {'lr': 0.0004807907695907032, 'samples': 3953088, 'steps': 20588, 'loss/train': 1.6435033082962036} -11/07/2021 00:08:29 - INFO - __main__ - Step 20590: {'lr': 0.000480788729580826, 'samples': 3953280, 'steps': 20589, 'loss/train': 1.4887282848358154} -11/07/2021 00:08:29 - INFO - __main__ - Step 20591: {'lr': 0.00048078668946695887, 'samples': 3953472, 'steps': 20590, 'loss/train': 1.240483283996582} -11/07/2021 00:08:30 - INFO - __main__ - Step 20592: {'lr': 0.0004807846492491028, 'samples': 3953664, 'steps': 20591, 'loss/train': 1.6103730201721191} -11/07/2021 00:08:30 - INFO - __main__ - Step 20593: {'lr': 0.0004807826089272588, 'samples': 3953856, 'steps': 20592, 'loss/train': 1.8579837083816528} -11/07/2021 00:08:31 - INFO - __main__ - Step 20594: {'lr': 0.0004807805685014277, 'samples': 3954048, 'steps': 20593, 'loss/train': 1.8013089895248413} -11/07/2021 00:08:31 - INFO - __main__ - Step 20595: {'lr': 0.00048077852797161034, 'samples': 3954240, 'steps': 20594, 'loss/train': 1.3747129440307617} -11/07/2021 00:08:32 - INFO - __main__ - Step 20596: {'lr': 0.0004807764873378079, 'samples': 3954432, 'steps': 20595, 'loss/train': 1.2700172662734985} -11/07/2021 00:08:32 - INFO - __main__ - Step 20597: {'lr': 0.000480774446600021, 'samples': 3954624, 'steps': 20596, 'loss/train': 1.3797485828399658} -11/07/2021 00:08:32 - INFO - __main__ - Step 20598: {'lr': 0.00048077240575825075, 'samples': 3954816, 'steps': 20597, 'loss/train': 2.085232973098755} -11/07/2021 00:08:33 - INFO - __main__ - Step 20599: {'lr': 0.000480770364812498, 'samples': 3955008, 'steps': 20598, 'loss/train': 1.6940776109695435} -11/07/2021 00:08:34 - INFO - __main__ - Step 20600: {'lr': 0.0004807683237627637, 'samples': 3955200, 'steps': 20599, 'loss/train': 1.5124833583831787} -11/07/2021 00:08:34 - INFO - __main__ - Step 20601: {'lr': 0.0004807662826090488, 'samples': 3955392, 'steps': 20600, 'loss/train': 1.4219224452972412} -11/07/2021 00:08:34 - INFO - __main__ - Step 20602: {'lr': 0.00048076424135135406, 'samples': 3955584, 'steps': 20601, 'loss/train': 1.5715713500976562} -11/07/2021 00:08:35 - INFO - __main__ - Step 20603: {'lr': 0.00048076219998968055, 'samples': 3955776, 'steps': 20602, 'loss/train': 2.141200304031372} -11/07/2021 00:08:35 - INFO - __main__ - Step 20604: {'lr': 0.0004807601585240292, 'samples': 3955968, 'steps': 20603, 'loss/train': 1.7138773202896118} -11/07/2021 00:08:36 - INFO - __main__ - Step 20605: {'lr': 0.0004807581169544009, 'samples': 3956160, 'steps': 20604, 'loss/train': 1.7838529348373413} -11/07/2021 00:08:37 - INFO - __main__ - Step 20606: {'lr': 0.00048075607528079645, 'samples': 3956352, 'steps': 20605, 'loss/train': 1.4636403322219849} -11/07/2021 00:08:37 - INFO - __main__ - Step 20607: {'lr': 0.0004807540335032169, 'samples': 3956544, 'steps': 20606, 'loss/train': 1.51893949508667} -11/07/2021 00:08:37 - INFO - __main__ - Step 20608: {'lr': 0.0004807519916216633, 'samples': 3956736, 'steps': 20607, 'loss/train': 1.2464053630828857} -11/07/2021 00:08:38 - INFO - __main__ - Step 20609: {'lr': 0.0004807499496361362, 'samples': 3956928, 'steps': 20608, 'loss/train': 1.454918384552002} -11/07/2021 00:08:39 - INFO - __main__ - Step 20610: {'lr': 0.00048074790754663686, 'samples': 3957120, 'steps': 20609, 'loss/train': 1.3798999786376953} -11/07/2021 00:08:39 - INFO - __main__ - Step 20611: {'lr': 0.000480745865353166, 'samples': 3957312, 'steps': 20610, 'loss/train': 1.5794548988342285} -11/07/2021 00:08:39 - INFO - __main__ - Step 20612: {'lr': 0.0004807438230557247, 'samples': 3957504, 'steps': 20611, 'loss/train': 2.0480737686157227} -11/07/2021 00:08:40 - INFO - __main__ - Step 20613: {'lr': 0.00048074178065431373, 'samples': 3957696, 'steps': 20612, 'loss/train': 0.7402926087379456} -11/07/2021 00:08:40 - INFO - __main__ - Step 20614: {'lr': 0.0004807397381489341, 'samples': 3957888, 'steps': 20613, 'loss/train': 1.6169627904891968} -11/07/2021 00:08:41 - INFO - __main__ - Step 20615: {'lr': 0.00048073769553958666, 'samples': 3958080, 'steps': 20614, 'loss/train': 1.4762638807296753} -11/07/2021 00:08:42 - INFO - __main__ - Step 20616: {'lr': 0.00048073565282627246, 'samples': 3958272, 'steps': 20615, 'loss/train': 1.4194600582122803} -11/07/2021 00:08:42 - INFO - __main__ - Step 20617: {'lr': 0.0004807336100089923, 'samples': 3958464, 'steps': 20616, 'loss/train': 1.2621079683303833} -11/07/2021 00:08:42 - INFO - __main__ - Step 20618: {'lr': 0.0004807315670877471, 'samples': 3958656, 'steps': 20617, 'loss/train': 1.8260729312896729} -11/07/2021 00:08:43 - INFO - __main__ - Step 20619: {'lr': 0.00048072952406253783, 'samples': 3958848, 'steps': 20618, 'loss/train': 1.0546283721923828} -11/07/2021 00:08:44 - INFO - __main__ - Step 20620: {'lr': 0.00048072748093336536, 'samples': 3959040, 'steps': 20619, 'loss/train': 1.9476903676986694} -11/07/2021 00:08:44 - INFO - __main__ - Step 20621: {'lr': 0.00048072543770023076, 'samples': 3959232, 'steps': 20620, 'loss/train': 1.710111141204834} -11/07/2021 00:08:44 - INFO - __main__ - Step 20622: {'lr': 0.0004807233943631347, 'samples': 3959424, 'steps': 20621, 'loss/train': 1.7692378759384155} -11/07/2021 00:08:45 - INFO - __main__ - Step 20623: {'lr': 0.0004807213509220784, 'samples': 3959616, 'steps': 20622, 'loss/train': 1.9633917808532715} -11/07/2021 00:08:45 - INFO - __main__ - Step 20624: {'lr': 0.0004807193073770625, 'samples': 3959808, 'steps': 20623, 'loss/train': 1.632491111755371} -11/07/2021 00:08:46 - INFO - __main__ - Step 20625: {'lr': 0.0004807172637280881, 'samples': 3960000, 'steps': 20624, 'loss/train': 1.7137901782989502} -11/07/2021 00:08:46 - INFO - __main__ - Step 20626: {'lr': 0.000480715219975156, 'samples': 3960192, 'steps': 20625, 'loss/train': 1.7485941648483276} -11/07/2021 00:08:47 - INFO - __main__ - Step 20627: {'lr': 0.0004807131761182672, 'samples': 3960384, 'steps': 20626, 'loss/train': 1.6671442985534668} -11/07/2021 00:08:47 - INFO - __main__ - Step 20628: {'lr': 0.00048071113215742263, 'samples': 3960576, 'steps': 20627, 'loss/train': 1.8338042497634888} -11/07/2021 00:08:47 - INFO - __main__ - Step 20629: {'lr': 0.00048070908809262316, 'samples': 3960768, 'steps': 20628, 'loss/train': 1.5052207708358765} -11/07/2021 00:08:48 - INFO - __main__ - Step 20630: {'lr': 0.0004807070439238698, 'samples': 3960960, 'steps': 20629, 'loss/train': 1.7445805072784424} -11/07/2021 00:08:49 - INFO - __main__ - Step 20631: {'lr': 0.0004807049996511633, 'samples': 3961152, 'steps': 20630, 'loss/train': 1.856859564781189} -11/07/2021 00:08:49 - INFO - __main__ - Step 20632: {'lr': 0.00048070295527450474, 'samples': 3961344, 'steps': 20631, 'loss/train': 1.6593570709228516} -11/07/2021 00:08:50 - INFO - __main__ - Step 20633: {'lr': 0.000480700910793895, 'samples': 3961536, 'steps': 20632, 'loss/train': 1.9622411727905273} -11/07/2021 00:08:50 - INFO - __main__ - Step 20634: {'lr': 0.000480698866209335, 'samples': 3961728, 'steps': 20633, 'loss/train': 1.853137731552124} -11/07/2021 00:08:50 - INFO - __main__ - Step 20635: {'lr': 0.0004806968215208256, 'samples': 3961920, 'steps': 20634, 'loss/train': 1.5925242900848389} -11/07/2021 00:08:51 - INFO - __main__ - Step 20636: {'lr': 0.0004806947767283678, 'samples': 3962112, 'steps': 20635, 'loss/train': 1.4025685787200928} -11/07/2021 00:08:52 - INFO - __main__ - Step 20637: {'lr': 0.0004806927318319625, 'samples': 3962304, 'steps': 20636, 'loss/train': 1.8534218072891235} -11/07/2021 00:08:52 - INFO - __main__ - Step 20638: {'lr': 0.0004806906868316106, 'samples': 3962496, 'steps': 20637, 'loss/train': 2.070551633834839} -11/07/2021 00:08:52 - INFO - __main__ - Step 20639: {'lr': 0.000480688641727313, 'samples': 3962688, 'steps': 20638, 'loss/train': 1.5866397619247437} -11/07/2021 00:08:53 - INFO - __main__ - Step 20640: {'lr': 0.00048068659651907076, 'samples': 3962880, 'steps': 20639, 'loss/train': 1.4923686981201172} -11/07/2021 00:08:54 - INFO - __main__ - Step 20641: {'lr': 0.0004806845512068846, 'samples': 3963072, 'steps': 20640, 'loss/train': 1.3124408721923828} -11/07/2021 00:08:55 - INFO - __main__ - Step 20642: {'lr': 0.00048068250579075554, 'samples': 3963264, 'steps': 20641, 'loss/train': 1.4300978183746338} -11/07/2021 00:08:55 - INFO - __main__ - Step 20643: {'lr': 0.00048068046027068456, 'samples': 3963456, 'steps': 20642, 'loss/train': 0.792670726776123} -11/07/2021 00:08:55 - INFO - __main__ - Step 20644: {'lr': 0.0004806784146466726, 'samples': 3963648, 'steps': 20643, 'loss/train': 1.530687928199768} -11/07/2021 00:08:56 - INFO - __main__ - Step 20645: {'lr': 0.00048067636891872036, 'samples': 3963840, 'steps': 20644, 'loss/train': 1.8204725980758667} -11/07/2021 00:08:56 - INFO - __main__ - Step 20646: {'lr': 0.00048067432308682894, 'samples': 3964032, 'steps': 20645, 'loss/train': 1.7493035793304443} -11/07/2021 00:08:58 - INFO - __main__ - Step 20647: {'lr': 0.0004806722771509993, 'samples': 3964224, 'steps': 20646, 'loss/train': 1.4086054563522339} -11/07/2021 00:08:58 - INFO - __main__ - Step 20648: {'lr': 0.0004806702311112322, 'samples': 3964416, 'steps': 20647, 'loss/train': 1.8562865257263184} -11/07/2021 00:08:58 - INFO - __main__ - Step 20649: {'lr': 0.0004806681849675287, 'samples': 3964608, 'steps': 20648, 'loss/train': 0.9947164058685303} -11/07/2021 00:08:59 - INFO - __main__ - Step 20650: {'lr': 0.00048066613871988967, 'samples': 3964800, 'steps': 20649, 'loss/train': 0.8895652890205383} -11/07/2021 00:08:59 - INFO - __main__ - Step 20651: {'lr': 0.00048066409236831607, 'samples': 3964992, 'steps': 20650, 'loss/train': 1.5003318786621094} -11/07/2021 00:08:59 - INFO - __main__ - Step 20652: {'lr': 0.0004806620459128087, 'samples': 3965184, 'steps': 20651, 'loss/train': 2.3419785499572754} -11/07/2021 00:09:00 - INFO - __main__ - Step 20653: {'lr': 0.0004806599993533687, 'samples': 3965376, 'steps': 20652, 'loss/train': 1.5649617910385132} -11/07/2021 00:09:01 - INFO - __main__ - Step 20654: {'lr': 0.00048065795268999677, 'samples': 3965568, 'steps': 20653, 'loss/train': 1.3647540807724} -11/07/2021 00:09:01 - INFO - __main__ - Step 20655: {'lr': 0.00048065590592269393, 'samples': 3965760, 'steps': 20654, 'loss/train': 1.6221338510513306} -11/07/2021 00:09:01 - INFO - __main__ - Step 20656: {'lr': 0.00048065385905146114, 'samples': 3965952, 'steps': 20655, 'loss/train': 1.5131564140319824} -11/07/2021 00:09:02 - INFO - __main__ - Step 20657: {'lr': 0.0004806518120762993, 'samples': 3966144, 'steps': 20656, 'loss/train': 1.148862361907959} -11/07/2021 00:09:02 - INFO - __main__ - Step 20658: {'lr': 0.00048064976499720923, 'samples': 3966336, 'steps': 20657, 'loss/train': 1.2469278573989868} -11/07/2021 00:09:03 - INFO - __main__ - Step 20659: {'lr': 0.000480647717814192, 'samples': 3966528, 'steps': 20658, 'loss/train': 1.5720820426940918} -11/07/2021 00:09:03 - INFO - __main__ - Step 20660: {'lr': 0.0004806456705272484, 'samples': 3966720, 'steps': 20659, 'loss/train': 1.0221384763717651} -11/07/2021 00:09:04 - INFO - __main__ - Step 20661: {'lr': 0.0004806436231363795, 'samples': 3966912, 'steps': 20660, 'loss/train': 1.6063361167907715} -11/07/2021 00:09:04 - INFO - __main__ - Step 20662: {'lr': 0.00048064157564158607, 'samples': 3967104, 'steps': 20661, 'loss/train': 1.519577980041504} -11/07/2021 00:09:04 - INFO - __main__ - Step 20663: {'lr': 0.00048063952804286913, 'samples': 3967296, 'steps': 20662, 'loss/train': 1.8714137077331543} -11/07/2021 00:09:06 - INFO - __main__ - Step 20664: {'lr': 0.0004806374803402296, 'samples': 3967488, 'steps': 20663, 'loss/train': 1.5183724164962769} -11/07/2021 00:09:06 - INFO - __main__ - Step 20665: {'lr': 0.00048063543253366837, 'samples': 3967680, 'steps': 20664, 'loss/train': 0.3621142506599426} -11/07/2021 00:09:06 - INFO - __main__ - Step 20666: {'lr': 0.0004806333846231864, 'samples': 3967872, 'steps': 20665, 'loss/train': 1.2749292850494385} -11/07/2021 00:09:07 - INFO - __main__ - Step 20667: {'lr': 0.00048063133660878455, 'samples': 3968064, 'steps': 20666, 'loss/train': 2.1483118534088135} -11/07/2021 00:09:07 - INFO - __main__ - Step 20668: {'lr': 0.00048062928849046377, 'samples': 3968256, 'steps': 20667, 'loss/train': 1.5145294666290283} -11/07/2021 00:09:08 - INFO - __main__ - Step 20669: {'lr': 0.00048062724026822504, 'samples': 3968448, 'steps': 20668, 'loss/train': 1.9260640144348145} -11/07/2021 00:09:09 - INFO - __main__ - Step 20670: {'lr': 0.00048062519194206916, 'samples': 3968640, 'steps': 20669, 'loss/train': 1.9533888101577759} -11/07/2021 00:09:09 - INFO - __main__ - Step 20671: {'lr': 0.0004806231435119972, 'samples': 3968832, 'steps': 20670, 'loss/train': 1.6754319667816162} -11/07/2021 00:09:09 - INFO - __main__ - Step 20672: {'lr': 0.00048062109497800997, 'samples': 3969024, 'steps': 20671, 'loss/train': 1.9477202892303467} -11/07/2021 00:09:10 - INFO - __main__ - Step 20673: {'lr': 0.00048061904634010845, 'samples': 3969216, 'steps': 20672, 'loss/train': 1.5543469190597534} -11/07/2021 00:09:11 - INFO - __main__ - Step 20674: {'lr': 0.0004806169975982935, 'samples': 3969408, 'steps': 20673, 'loss/train': 1.644513726234436} -11/07/2021 00:09:11 - INFO - __main__ - Step 20675: {'lr': 0.0004806149487525662, 'samples': 3969600, 'steps': 20674, 'loss/train': 2.085134983062744} -11/07/2021 00:09:11 - INFO - __main__ - Step 20676: {'lr': 0.0004806128998029272, 'samples': 3969792, 'steps': 20675, 'loss/train': 1.3123760223388672} -11/07/2021 00:09:12 - INFO - __main__ - Step 20677: {'lr': 0.0004806108507493777, 'samples': 3969984, 'steps': 20676, 'loss/train': 2.046645402908325} -11/07/2021 00:09:12 - INFO - __main__ - Step 20678: {'lr': 0.0004806088015919185, 'samples': 3970176, 'steps': 20677, 'loss/train': 1.390297293663025} -11/07/2021 00:09:13 - INFO - __main__ - Step 20679: {'lr': 0.0004806067523305505, 'samples': 3970368, 'steps': 20678, 'loss/train': 1.6803712844848633} -11/07/2021 00:09:13 - INFO - __main__ - Step 20680: {'lr': 0.0004806047029652747, 'samples': 3970560, 'steps': 20679, 'loss/train': 1.983790636062622} -11/07/2021 00:09:14 - INFO - __main__ - Step 20681: {'lr': 0.00048060265349609193, 'samples': 3970752, 'steps': 20680, 'loss/train': 2.1428070068359375} -11/07/2021 00:09:14 - INFO - __main__ - Step 20682: {'lr': 0.0004806006039230032, 'samples': 3970944, 'steps': 20681, 'loss/train': 1.3993123769760132} -11/07/2021 00:09:14 - INFO - __main__ - Step 20683: {'lr': 0.0004805985542460094, 'samples': 3971136, 'steps': 20682, 'loss/train': 1.8802090883255005} -11/07/2021 00:09:15 - INFO - __main__ - Step 20684: {'lr': 0.00048059650446511136, 'samples': 3971328, 'steps': 20683, 'loss/train': 1.7126437425613403} -11/07/2021 00:09:16 - INFO - __main__ - Step 20685: {'lr': 0.00048059445458031023, 'samples': 3971520, 'steps': 20684, 'loss/train': 1.373525619506836} -11/07/2021 00:09:16 - INFO - __main__ - Step 20686: {'lr': 0.0004805924045916067, 'samples': 3971712, 'steps': 20685, 'loss/train': 1.4744396209716797} -11/07/2021 00:09:17 - INFO - __main__ - Step 20687: {'lr': 0.00048059035449900185, 'samples': 3971904, 'steps': 20686, 'loss/train': 1.5865269899368286} -11/07/2021 00:09:17 - INFO - __main__ - Step 20688: {'lr': 0.0004805883043024965, 'samples': 3972096, 'steps': 20687, 'loss/train': 1.5301727056503296} -11/07/2021 00:09:17 - INFO - __main__ - Step 20689: {'lr': 0.0004805862540020917, 'samples': 3972288, 'steps': 20688, 'loss/train': 1.0273187160491943} -11/07/2021 00:09:18 - INFO - __main__ - Step 20690: {'lr': 0.0004805842035977882, 'samples': 3972480, 'steps': 20689, 'loss/train': 2.583864212036133} -11/07/2021 00:09:19 - INFO - __main__ - Step 20691: {'lr': 0.00048058215308958703, 'samples': 3972672, 'steps': 20690, 'loss/train': 1.1605116128921509} -11/07/2021 00:09:19 - INFO - __main__ - Step 20692: {'lr': 0.00048058010247748904, 'samples': 3972864, 'steps': 20691, 'loss/train': 1.5896633863449097} -11/07/2021 00:09:19 - INFO - __main__ - Step 20693: {'lr': 0.0004805780517614954, 'samples': 3973056, 'steps': 20692, 'loss/train': 1.8313792943954468} -11/07/2021 00:09:20 - INFO - __main__ - Step 20694: {'lr': 0.0004805760009416067, 'samples': 3973248, 'steps': 20693, 'loss/train': 1.637069582939148} -11/07/2021 00:09:21 - INFO - __main__ - Step 20695: {'lr': 0.000480573950017824, 'samples': 3973440, 'steps': 20694, 'loss/train': 1.3542802333831787} -11/07/2021 00:09:21 - INFO - __main__ - Step 20696: {'lr': 0.0004805718989901483, 'samples': 3973632, 'steps': 20695, 'loss/train': 1.9154294729232788} -11/07/2021 00:09:21 - INFO - __main__ - Step 20697: {'lr': 0.00048056984785858046, 'samples': 3973824, 'steps': 20696, 'loss/train': 1.9138669967651367} -11/07/2021 00:09:22 - INFO - __main__ - Step 20698: {'lr': 0.0004805677966231214, 'samples': 3974016, 'steps': 20697, 'loss/train': 1.203387975692749} -11/07/2021 00:09:22 - INFO - __main__ - Step 20699: {'lr': 0.00048056574528377205, 'samples': 3974208, 'steps': 20698, 'loss/train': 1.5315396785736084} -11/07/2021 00:09:23 - INFO - __main__ - Step 20700: {'lr': 0.00048056369384053335, 'samples': 3974400, 'steps': 20699, 'loss/train': 1.4767616987228394} -11/07/2021 00:09:24 - INFO - __main__ - Step 20701: {'lr': 0.00048056164229340613, 'samples': 3974592, 'steps': 20700, 'loss/train': 1.3749315738677979} -11/07/2021 00:09:24 - INFO - __main__ - Step 20702: {'lr': 0.0004805595906423914, 'samples': 3974784, 'steps': 20701, 'loss/train': 1.688059687614441} -11/07/2021 00:09:24 - INFO - __main__ - Step 20703: {'lr': 0.00048055753888749013, 'samples': 3974976, 'steps': 20702, 'loss/train': 1.1523799896240234} -11/07/2021 00:09:25 - INFO - __main__ - Step 20704: {'lr': 0.0004805554870287032, 'samples': 3975168, 'steps': 20703, 'loss/train': 1.2559438943862915} -11/07/2021 00:09:26 - INFO - __main__ - Step 20705: {'lr': 0.0004805534350660315, 'samples': 3975360, 'steps': 20704, 'loss/train': 1.656295657157898} -11/07/2021 00:09:26 - INFO - __main__ - Step 20706: {'lr': 0.000480551382999476, 'samples': 3975552, 'steps': 20705, 'loss/train': 0.858877420425415} -11/07/2021 00:09:26 - INFO - __main__ - Step 20707: {'lr': 0.00048054933082903754, 'samples': 3975744, 'steps': 20706, 'loss/train': 1.4430663585662842} -11/07/2021 00:09:27 - INFO - __main__ - Step 20708: {'lr': 0.00048054727855471717, 'samples': 3975936, 'steps': 20707, 'loss/train': 1.785535216331482} -11/07/2021 00:09:27 - INFO - __main__ - Step 20709: {'lr': 0.00048054522617651575, 'samples': 3976128, 'steps': 20708, 'loss/train': 1.5893622636795044} -11/07/2021 00:09:27 - INFO - __main__ - Step 20710: {'lr': 0.0004805431736944342, 'samples': 3976320, 'steps': 20709, 'loss/train': 2.038050889968872} -11/07/2021 00:09:28 - INFO - __main__ - Step 20711: {'lr': 0.0004805411211084735, 'samples': 3976512, 'steps': 20710, 'loss/train': 1.4637943506240845} -11/07/2021 00:09:29 - INFO - __main__ - Step 20712: {'lr': 0.0004805390684186344, 'samples': 3976704, 'steps': 20711, 'loss/train': 1.8713645935058594} -11/07/2021 00:09:29 - INFO - __main__ - Step 20713: {'lr': 0.00048053701562491804, 'samples': 3976896, 'steps': 20712, 'loss/train': 1.541002869606018} -11/07/2021 00:09:30 - INFO - __main__ - Step 20714: {'lr': 0.0004805349627273253, 'samples': 3977088, 'steps': 20713, 'loss/train': 1.3053054809570312} -11/07/2021 00:09:30 - INFO - __main__ - Step 20715: {'lr': 0.00048053290972585697, 'samples': 3977280, 'steps': 20714, 'loss/train': 1.6590816974639893} -11/07/2021 00:09:31 - INFO - __main__ - Step 20716: {'lr': 0.0004805308566205141, 'samples': 3977472, 'steps': 20715, 'loss/train': 1.4192510843276978} -11/07/2021 00:09:31 - INFO - __main__ - Step 20717: {'lr': 0.00048052880341129764, 'samples': 3977664, 'steps': 20716, 'loss/train': 2.1568589210510254} -11/07/2021 00:09:32 - INFO - __main__ - Step 20718: {'lr': 0.00048052675009820837, 'samples': 3977856, 'steps': 20717, 'loss/train': 1.3425061702728271} -11/07/2021 00:09:32 - INFO - __main__ - Step 20719: {'lr': 0.0004805246966812474, 'samples': 3978048, 'steps': 20718, 'loss/train': 1.3434855937957764} -11/07/2021 00:09:32 - INFO - __main__ - Step 20720: {'lr': 0.0004805226431604155, 'samples': 3978240, 'steps': 20719, 'loss/train': 1.4448708295822144} -11/07/2021 00:09:33 - INFO - __main__ - Step 20721: {'lr': 0.00048052058953571366, 'samples': 3978432, 'steps': 20720, 'loss/train': 1.672785997390747} -11/07/2021 00:09:34 - INFO - __main__ - Step 20722: {'lr': 0.0004805185358071428, 'samples': 3978624, 'steps': 20721, 'loss/train': 1.3219795227050781} -11/07/2021 00:09:34 - INFO - __main__ - Step 20723: {'lr': 0.0004805164819747038, 'samples': 3978816, 'steps': 20722, 'loss/train': 1.7978225946426392} -11/07/2021 00:09:34 - INFO - __main__ - Step 20724: {'lr': 0.0004805144280383977, 'samples': 3979008, 'steps': 20723, 'loss/train': 1.7678934335708618} -11/07/2021 00:09:35 - INFO - __main__ - Step 20725: {'lr': 0.00048051237399822534, 'samples': 3979200, 'steps': 20724, 'loss/train': 1.6825202703475952} -11/07/2021 00:09:36 - INFO - __main__ - Step 20726: {'lr': 0.00048051031985418764, 'samples': 3979392, 'steps': 20725, 'loss/train': 2.1667885780334473} -11/07/2021 00:09:36 - INFO - __main__ - Step 20727: {'lr': 0.0004805082656062856, 'samples': 3979584, 'steps': 20726, 'loss/train': 1.395729422569275} -11/07/2021 00:09:36 - INFO - __main__ - Step 20728: {'lr': 0.00048050621125451996, 'samples': 3979776, 'steps': 20727, 'loss/train': 1.5101127624511719} -11/07/2021 00:09:37 - INFO - __main__ - Step 20729: {'lr': 0.00048050415679889194, 'samples': 3979968, 'steps': 20728, 'loss/train': 1.6429022550582886} -11/07/2021 00:09:37 - INFO - __main__ - Step 20730: {'lr': 0.0004805021022394022, 'samples': 3980160, 'steps': 20729, 'loss/train': 1.715214729309082} -11/07/2021 00:09:38 - INFO - __main__ - Step 20731: {'lr': 0.0004805000475760518, 'samples': 3980352, 'steps': 20730, 'loss/train': 1.8093258142471313} -11/07/2021 00:09:38 - INFO - __main__ - Step 20732: {'lr': 0.0004804979928088417, 'samples': 3980544, 'steps': 20731, 'loss/train': 1.727259874343872} -11/07/2021 00:09:39 - INFO - __main__ - Step 20733: {'lr': 0.0004804959379377727, 'samples': 3980736, 'steps': 20732, 'loss/train': 1.4324378967285156} -11/07/2021 00:09:39 - INFO - __main__ - Step 20734: {'lr': 0.00048049388296284576, 'samples': 3980928, 'steps': 20733, 'loss/train': 1.0420160293579102} -11/07/2021 00:09:40 - INFO - __main__ - Step 20735: {'lr': 0.00048049182788406186, 'samples': 3981120, 'steps': 20734, 'loss/train': 1.1756582260131836} -11/07/2021 00:09:41 - INFO - __main__ - Step 20736: {'lr': 0.0004804897727014219, 'samples': 3981312, 'steps': 20735, 'loss/train': 1.6517256498336792} -11/07/2021 00:09:41 - INFO - __main__ - Step 20737: {'lr': 0.0004804877174149268, 'samples': 3981504, 'steps': 20736, 'loss/train': 1.1860313415527344} -11/07/2021 00:09:41 - INFO - __main__ - Step 20738: {'lr': 0.00048048566202457747, 'samples': 3981696, 'steps': 20737, 'loss/train': 1.743064045906067} -11/07/2021 00:09:42 - INFO - __main__ - Step 20739: {'lr': 0.00048048360653037494, 'samples': 3981888, 'steps': 20738, 'loss/train': 1.2434656620025635} -11/07/2021 00:09:42 - INFO - __main__ - Step 20740: {'lr': 0.00048048155093231994, 'samples': 3982080, 'steps': 20739, 'loss/train': 1.5692754983901978} -11/07/2021 00:09:42 - INFO - __main__ - Step 20741: {'lr': 0.00048047949523041355, 'samples': 3982272, 'steps': 20740, 'loss/train': 1.2839480638504028} -11/07/2021 00:09:44 - INFO - __main__ - Step 20742: {'lr': 0.0004804774394246567, 'samples': 3982464, 'steps': 20741, 'loss/train': 0.8025193214416504} -11/07/2021 00:09:44 - INFO - __main__ - Step 20743: {'lr': 0.0004804753835150503, 'samples': 3982656, 'steps': 20742, 'loss/train': 1.786361813545227} -11/07/2021 00:09:44 - INFO - __main__ - Step 20744: {'lr': 0.0004804733275015951, 'samples': 3982848, 'steps': 20743, 'loss/train': 1.8952442407608032} -11/07/2021 00:09:45 - INFO - __main__ - Step 20745: {'lr': 0.0004804712713842923, 'samples': 3983040, 'steps': 20744, 'loss/train': 1.9803398847579956} -11/07/2021 00:09:46 - INFO - __main__ - Step 20746: {'lr': 0.0004804692151631427, 'samples': 3983232, 'steps': 20745, 'loss/train': 1.8971871137619019} -11/07/2021 00:09:46 - INFO - __main__ - Step 20747: {'lr': 0.00048046715883814716, 'samples': 3983424, 'steps': 20746, 'loss/train': 1.5037178993225098} -11/07/2021 00:09:46 - INFO - __main__ - Step 20748: {'lr': 0.00048046510240930674, 'samples': 3983616, 'steps': 20747, 'loss/train': 1.7305831909179688} -11/07/2021 00:09:47 - INFO - __main__ - Step 20749: {'lr': 0.00048046304587662225, 'samples': 3983808, 'steps': 20748, 'loss/train': 1.7680881023406982} -11/07/2021 00:09:47 - INFO - __main__ - Step 20750: {'lr': 0.00048046098924009467, 'samples': 3984000, 'steps': 20749, 'loss/train': 1.5476644039154053} -11/07/2021 00:09:48 - INFO - __main__ - Step 20751: {'lr': 0.00048045893249972497, 'samples': 3984192, 'steps': 20750, 'loss/train': 1.4620814323425293} -11/07/2021 00:09:48 - INFO - __main__ - Step 20752: {'lr': 0.000480456875655514, 'samples': 3984384, 'steps': 20751, 'loss/train': 1.5789313316345215} -11/07/2021 00:09:49 - INFO - __main__ - Step 20753: {'lr': 0.0004804548187074628, 'samples': 3984576, 'steps': 20752, 'loss/train': 1.754978060722351} -11/07/2021 00:09:49 - INFO - __main__ - Step 20754: {'lr': 0.0004804527616555721, 'samples': 3984768, 'steps': 20753, 'loss/train': 1.7650110721588135} -11/07/2021 00:09:50 - INFO - __main__ - Step 20755: {'lr': 0.00048045070449984295, 'samples': 3984960, 'steps': 20754, 'loss/train': 1.4159955978393555} -11/07/2021 00:09:51 - INFO - __main__ - Step 20756: {'lr': 0.0004804486472402763, 'samples': 3985152, 'steps': 20755, 'loss/train': 1.448042392730713} -11/07/2021 00:09:51 - INFO - __main__ - Step 20757: {'lr': 0.0004804465898768731, 'samples': 3985344, 'steps': 20756, 'loss/train': 1.3452638387680054} -11/07/2021 00:09:51 - INFO - __main__ - Step 20758: {'lr': 0.00048044453240963413, 'samples': 3985536, 'steps': 20757, 'loss/train': 1.4904249906539917} -11/07/2021 00:09:52 - INFO - __main__ - Step 20759: {'lr': 0.00048044247483856043, 'samples': 3985728, 'steps': 20758, 'loss/train': 1.6131950616836548} -11/07/2021 00:09:52 - INFO - __main__ - Step 20760: {'lr': 0.00048044041716365296, 'samples': 3985920, 'steps': 20759, 'loss/train': 1.4273293018341064} -11/07/2021 00:09:52 - INFO - __main__ - Step 20761: {'lr': 0.00048043835938491253, 'samples': 3986112, 'steps': 20760, 'loss/train': 1.341493010520935} -11/07/2021 00:09:54 - INFO - __main__ - Step 20762: {'lr': 0.0004804363015023402, 'samples': 3986304, 'steps': 20761, 'loss/train': 1.4203829765319824} -11/07/2021 00:09:54 - INFO - __main__ - Step 20763: {'lr': 0.00048043424351593676, 'samples': 3986496, 'steps': 20762, 'loss/train': 1.2885338068008423} -11/07/2021 00:09:54 - INFO - __main__ - Step 20764: {'lr': 0.0004804321854257032, 'samples': 3986688, 'steps': 20763, 'loss/train': 1.9818228483200073} -11/07/2021 00:09:55 - INFO - __main__ - Step 20765: {'lr': 0.0004804301272316405, 'samples': 3986880, 'steps': 20764, 'loss/train': 1.5577560663223267} -11/07/2021 00:09:55 - INFO - __main__ - Step 20766: {'lr': 0.0004804280689337496, 'samples': 3987072, 'steps': 20765, 'loss/train': 1.503300428390503} -11/07/2021 00:09:56 - INFO - __main__ - Step 20767: {'lr': 0.00048042601053203125, 'samples': 3987264, 'steps': 20766, 'loss/train': 1.59586763381958} -11/07/2021 00:09:56 - INFO - __main__ - Step 20768: {'lr': 0.00048042395202648646, 'samples': 3987456, 'steps': 20767, 'loss/train': 1.7341300249099731} -11/07/2021 00:09:57 - INFO - __main__ - Step 20769: {'lr': 0.00048042189341711636, 'samples': 3987648, 'steps': 20768, 'loss/train': 1.8474223613739014} -11/07/2021 00:09:57 - INFO - __main__ - Step 20770: {'lr': 0.0004804198347039216, 'samples': 3987840, 'steps': 20769, 'loss/train': 1.3138035535812378} -11/07/2021 00:09:57 - INFO - __main__ - Step 20771: {'lr': 0.0004804177758869032, 'samples': 3988032, 'steps': 20770, 'loss/train': 1.6257972717285156} -11/07/2021 00:09:58 - INFO - __main__ - Step 20772: {'lr': 0.0004804157169660622, 'samples': 3988224, 'steps': 20771, 'loss/train': 1.58247971534729} -11/07/2021 00:09:59 - INFO - __main__ - Step 20773: {'lr': 0.00048041365794139934, 'samples': 3988416, 'steps': 20772, 'loss/train': 2.3430113792419434} -11/07/2021 00:09:59 - INFO - __main__ - Step 20774: {'lr': 0.00048041159881291574, 'samples': 3988608, 'steps': 20773, 'loss/train': 1.5301451683044434} -11/07/2021 00:09:59 - INFO - __main__ - Step 20775: {'lr': 0.0004804095395806122, 'samples': 3988800, 'steps': 20774, 'loss/train': 1.7506057024002075} -11/07/2021 00:10:00 - INFO - __main__ - Step 20776: {'lr': 0.00048040748024448954, 'samples': 3988992, 'steps': 20775, 'loss/train': 1.5352082252502441} -11/07/2021 00:10:01 - INFO - __main__ - Step 20777: {'lr': 0.00048040542080454897, 'samples': 3989184, 'steps': 20776, 'loss/train': 1.5161960124969482} -11/07/2021 00:10:01 - INFO - __main__ - Step 20778: {'lr': 0.0004804033612607912, 'samples': 3989376, 'steps': 20777, 'loss/train': 1.5611916780471802} -11/07/2021 00:10:02 - INFO - __main__ - Step 20779: {'lr': 0.00048040130161321724, 'samples': 3989568, 'steps': 20778, 'loss/train': 1.8434571027755737} -11/07/2021 00:10:02 - INFO - __main__ - Step 20780: {'lr': 0.0004803992418618281, 'samples': 3989760, 'steps': 20779, 'loss/train': 1.56538724899292} -11/07/2021 00:10:02 - INFO - __main__ - Step 20781: {'lr': 0.00048039718200662454, 'samples': 3989952, 'steps': 20780, 'loss/train': 1.558919906616211} -11/07/2021 00:10:03 - INFO - __main__ - Step 20782: {'lr': 0.0004803951220476076, 'samples': 3990144, 'steps': 20781, 'loss/train': 2.473111391067505} -11/07/2021 00:10:04 - INFO - __main__ - Step 20783: {'lr': 0.00048039306198477817, 'samples': 3990336, 'steps': 20782, 'loss/train': 1.4748272895812988} -11/07/2021 00:10:04 - INFO - __main__ - Step 20784: {'lr': 0.0004803910018181371, 'samples': 3990528, 'steps': 20783, 'loss/train': 1.1002256870269775} -11/07/2021 00:10:04 - INFO - __main__ - Step 20785: {'lr': 0.0004803889415476855, 'samples': 3990720, 'steps': 20784, 'loss/train': 1.3398923873901367} -11/07/2021 00:10:05 - INFO - __main__ - Step 20786: {'lr': 0.0004803868811734242, 'samples': 3990912, 'steps': 20785, 'loss/train': 5.52646541595459} -11/07/2021 00:10:05 - INFO - __main__ - Step 20787: {'lr': 0.00048038482069535406, 'samples': 3991104, 'steps': 20786, 'loss/train': 1.664506435394287} -11/07/2021 00:10:06 - INFO - __main__ - Step 20788: {'lr': 0.000480382760113476, 'samples': 3991296, 'steps': 20787, 'loss/train': 1.9385948181152344} -11/07/2021 00:10:07 - INFO - __main__ - Step 20789: {'lr': 0.00048038069942779116, 'samples': 3991488, 'steps': 20788, 'loss/train': 1.4435739517211914} -11/07/2021 00:10:07 - INFO - __main__ - Step 20790: {'lr': 0.00048037863863830034, 'samples': 3991680, 'steps': 20789, 'loss/train': 1.7639094591140747} -11/07/2021 00:10:07 - INFO - __main__ - Step 20791: {'lr': 0.0004803765777450044, 'samples': 3991872, 'steps': 20790, 'loss/train': 2.179063081741333} -11/07/2021 00:10:08 - INFO - __main__ - Step 20792: {'lr': 0.00048037451674790433, 'samples': 3992064, 'steps': 20791, 'loss/train': 1.5259931087493896} -11/07/2021 00:10:09 - INFO - __main__ - Step 20793: {'lr': 0.0004803724556470011, 'samples': 3992256, 'steps': 20792, 'loss/train': 0.41106319427490234} -11/07/2021 00:10:09 - INFO - __main__ - Step 20794: {'lr': 0.0004803703944422956, 'samples': 3992448, 'steps': 20793, 'loss/train': 1.5696848630905151} -11/07/2021 00:10:10 - INFO - __main__ - Step 20795: {'lr': 0.0004803683331337887, 'samples': 3992640, 'steps': 20794, 'loss/train': 1.5306452512741089} -11/07/2021 00:10:10 - INFO - __main__ - Step 20796: {'lr': 0.0004803662717214814, 'samples': 3992832, 'steps': 20795, 'loss/train': 1.5071040391921997} -11/07/2021 00:10:10 - INFO - __main__ - Step 20797: {'lr': 0.00048036421020537464, 'samples': 3993024, 'steps': 20796, 'loss/train': 1.7013245820999146} -11/07/2021 00:10:11 - INFO - __main__ - Step 20798: {'lr': 0.0004803621485854693, 'samples': 3993216, 'steps': 20797, 'loss/train': 0.595490574836731} -11/07/2021 00:10:12 - INFO - __main__ - Step 20799: {'lr': 0.00048036008686176636, 'samples': 3993408, 'steps': 20798, 'loss/train': 1.1961723566055298} -11/07/2021 00:10:12 - INFO - __main__ - Step 20800: {'lr': 0.0004803580250342666, 'samples': 3993600, 'steps': 20799, 'loss/train': 1.7574987411499023} -11/07/2021 00:10:12 - INFO - __main__ - Step 20801: {'lr': 0.00048035596310297125, 'samples': 3993792, 'steps': 20800, 'loss/train': 1.2915315628051758} -11/07/2021 00:10:13 - INFO - __main__ - Step 20802: {'lr': 0.0004803539010678809, 'samples': 3993984, 'steps': 20801, 'loss/train': 1.912282943725586} -11/07/2021 00:10:13 - INFO - __main__ - Step 20803: {'lr': 0.00048035183892899676, 'samples': 3994176, 'steps': 20802, 'loss/train': 1.7721303701400757} -11/07/2021 00:10:14 - INFO - __main__ - Step 20804: {'lr': 0.0004803497766863195, 'samples': 3994368, 'steps': 20803, 'loss/train': 1.472104787826538} -11/07/2021 00:10:14 - INFO - __main__ - Step 20805: {'lr': 0.00048034771433985035, 'samples': 3994560, 'steps': 20804, 'loss/train': 1.4602023363113403} -11/07/2021 00:10:15 - INFO - __main__ - Step 20806: {'lr': 0.00048034565188959, 'samples': 3994752, 'steps': 20805, 'loss/train': 1.452834963798523} -11/07/2021 00:10:15 - INFO - __main__ - Step 20807: {'lr': 0.0004803435893355394, 'samples': 3994944, 'steps': 20806, 'loss/train': 1.882066011428833} -11/07/2021 00:10:15 - INFO - __main__ - Step 20808: {'lr': 0.00048034152667769957, 'samples': 3995136, 'steps': 20807, 'loss/train': 1.5793373584747314} -11/07/2021 00:10:17 - INFO - __main__ - Step 20809: {'lr': 0.0004803394639160714, 'samples': 3995328, 'steps': 20808, 'loss/train': 1.8108179569244385} -11/07/2021 00:10:17 - INFO - __main__ - Step 20810: {'lr': 0.00048033740105065585, 'samples': 3995520, 'steps': 20809, 'loss/train': 2.055591106414795} -11/07/2021 00:10:17 - INFO - __main__ - Step 20811: {'lr': 0.0004803353380814538, 'samples': 3995712, 'steps': 20810, 'loss/train': 1.3634858131408691} -11/07/2021 00:10:18 - INFO - __main__ - Step 20812: {'lr': 0.00048033327500846625, 'samples': 3995904, 'steps': 20811, 'loss/train': 1.299759864807129} -11/07/2021 00:10:18 - INFO - __main__ - Step 20813: {'lr': 0.000480331211831694, 'samples': 3996096, 'steps': 20812, 'loss/train': 1.4120014905929565} -11/07/2021 00:10:19 - INFO - __main__ - Step 20814: {'lr': 0.00048032914855113807, 'samples': 3996288, 'steps': 20813, 'loss/train': 1.361594796180725} -11/07/2021 00:10:19 - INFO - __main__ - Step 20815: {'lr': 0.00048032708516679946, 'samples': 3996480, 'steps': 20814, 'loss/train': 1.8684601783752441} -11/07/2021 00:10:20 - INFO - __main__ - Step 20816: {'lr': 0.00048032502167867896, 'samples': 3996672, 'steps': 20815, 'loss/train': 1.841715693473816} -11/07/2021 00:10:20 - INFO - __main__ - Step 20817: {'lr': 0.0004803229580867775, 'samples': 3996864, 'steps': 20816, 'loss/train': 1.7938896417617798} -11/07/2021 00:10:20 - INFO - __main__ - Step 20818: {'lr': 0.0004803208943910962, 'samples': 3997056, 'steps': 20817, 'loss/train': 1.2337151765823364} -11/07/2021 00:10:21 - INFO - __main__ - Step 20819: {'lr': 0.00048031883059163576, 'samples': 3997248, 'steps': 20818, 'loss/train': 1.5640259981155396} -11/07/2021 00:10:22 - INFO - __main__ - Step 20820: {'lr': 0.00048031676668839723, 'samples': 3997440, 'steps': 20819, 'loss/train': 1.9230550527572632} -11/07/2021 00:10:22 - INFO - __main__ - Step 20821: {'lr': 0.00048031470268138153, 'samples': 3997632, 'steps': 20820, 'loss/train': 1.2242671251296997} -11/07/2021 00:10:22 - INFO - __main__ - Step 20822: {'lr': 0.00048031263857058957, 'samples': 3997824, 'steps': 20821, 'loss/train': 1.852646827697754} -11/07/2021 00:10:23 - INFO - __main__ - Step 20823: {'lr': 0.00048031057435602234, 'samples': 3998016, 'steps': 20822, 'loss/train': 1.4730157852172852} -11/07/2021 00:10:24 - INFO - __main__ - Step 20824: {'lr': 0.0004803085100376807, 'samples': 3998208, 'steps': 20823, 'loss/train': 1.5855153799057007} -11/07/2021 00:10:24 - INFO - __main__ - Step 20825: {'lr': 0.00048030644561556556, 'samples': 3998400, 'steps': 20824, 'loss/train': 1.704028844833374} -11/07/2021 00:10:25 - INFO - __main__ - Step 20826: {'lr': 0.0004803043810896779, 'samples': 3998592, 'steps': 20825, 'loss/train': 1.5183931589126587} -11/07/2021 00:10:25 - INFO - __main__ - Step 20827: {'lr': 0.00048030231646001867, 'samples': 3998784, 'steps': 20826, 'loss/train': 1.6759287118911743} -11/07/2021 00:10:25 - INFO - __main__ - Step 20828: {'lr': 0.0004803002517265887, 'samples': 3998976, 'steps': 20827, 'loss/train': 0.2678111791610718} -11/07/2021 00:10:27 - INFO - __main__ - Step 20829: {'lr': 0.0004802981868893891, 'samples': 3999168, 'steps': 20828, 'loss/train': 1.3716883659362793} -11/07/2021 00:10:27 - INFO - __main__ - Step 20830: {'lr': 0.00048029612194842056, 'samples': 3999360, 'steps': 20829, 'loss/train': 1.400437593460083} -11/07/2021 00:10:27 - INFO - __main__ - Step 20831: {'lr': 0.0004802940569036842, 'samples': 3999552, 'steps': 20830, 'loss/train': 2.0138940811157227} -11/07/2021 00:10:28 - INFO - __main__ - Step 20832: {'lr': 0.0004802919917551809, 'samples': 3999744, 'steps': 20831, 'loss/train': 1.691053867340088} -11/07/2021 00:10:28 - INFO - __main__ - Step 20833: {'lr': 0.00048028992650291156, 'samples': 3999936, 'steps': 20832, 'loss/train': 1.3104307651519775} -11/07/2021 00:10:28 - INFO - __main__ - Step 20834: {'lr': 0.00048028786114687715, 'samples': 4000128, 'steps': 20833, 'loss/train': 1.7613739967346191} -11/07/2021 00:10:29 - INFO - __main__ - Step 20835: {'lr': 0.0004802857956870786, 'samples': 4000320, 'steps': 20834, 'loss/train': 1.5970216989517212} -11/07/2021 00:10:30 - INFO - __main__ - Step 20836: {'lr': 0.00048028373012351684, 'samples': 4000512, 'steps': 20835, 'loss/train': 1.327458143234253} -11/07/2021 00:10:30 - INFO - __main__ - Step 20837: {'lr': 0.00048028166445619275, 'samples': 4000704, 'steps': 20836, 'loss/train': 1.427208423614502} -11/07/2021 00:10:31 - INFO - __main__ - Step 20838: {'lr': 0.0004802795986851073, 'samples': 4000896, 'steps': 20837, 'loss/train': 1.2698725461959839} -11/07/2021 00:10:31 - INFO - __main__ - Step 20839: {'lr': 0.00048027753281026144, 'samples': 4001088, 'steps': 20838, 'loss/train': 1.6905814409255981} -11/07/2021 00:10:32 - INFO - __main__ - Step 20840: {'lr': 0.000480275466831656, 'samples': 4001280, 'steps': 20839, 'loss/train': 1.8319936990737915} -11/07/2021 00:10:32 - INFO - __main__ - Step 20841: {'lr': 0.00048027340074929207, 'samples': 4001472, 'steps': 20840, 'loss/train': 1.751729965209961} -11/07/2021 00:10:33 - INFO - __main__ - Step 20842: {'lr': 0.0004802713345631705, 'samples': 4001664, 'steps': 20841, 'loss/train': 1.7456939220428467} -11/07/2021 00:10:33 - INFO - __main__ - Step 20843: {'lr': 0.0004802692682732922, 'samples': 4001856, 'steps': 20842, 'loss/train': 1.7693142890930176} -11/07/2021 00:10:33 - INFO - __main__ - Step 20844: {'lr': 0.0004802672018796581, 'samples': 4002048, 'steps': 20843, 'loss/train': 1.407902479171753} -11/07/2021 00:10:34 - INFO - __main__ - Step 20845: {'lr': 0.0004802651353822691, 'samples': 4002240, 'steps': 20844, 'loss/train': 1.528710126876831} -11/07/2021 00:10:35 - INFO - __main__ - Step 20846: {'lr': 0.0004802630687811263, 'samples': 4002432, 'steps': 20845, 'loss/train': 1.6070642471313477} -11/07/2021 00:10:35 - INFO - __main__ - Step 20847: {'lr': 0.00048026100207623047, 'samples': 4002624, 'steps': 20846, 'loss/train': 1.699964165687561} -11/07/2021 00:10:35 - INFO - __main__ - Step 20848: {'lr': 0.0004802589352675826, 'samples': 4002816, 'steps': 20847, 'loss/train': 1.9966727495193481} -11/07/2021 00:10:36 - INFO - __main__ - Step 20849: {'lr': 0.0004802568683551836, 'samples': 4003008, 'steps': 20848, 'loss/train': 1.0162174701690674} -11/07/2021 00:10:37 - INFO - __main__ - Step 20850: {'lr': 0.0004802548013390343, 'samples': 4003200, 'steps': 20849, 'loss/train': 1.5560613870620728} -11/07/2021 00:10:37 - INFO - __main__ - Step 20851: {'lr': 0.00048025273421913587, 'samples': 4003392, 'steps': 20850, 'loss/train': 1.6622282266616821} -11/07/2021 00:10:37 - INFO - __main__ - Step 20852: {'lr': 0.0004802506669954891, 'samples': 4003584, 'steps': 20851, 'loss/train': 1.6507529020309448} -11/07/2021 00:10:38 - INFO - __main__ - Step 20853: {'lr': 0.00048024859966809487, 'samples': 4003776, 'steps': 20852, 'loss/train': 1.8268312215805054} -11/07/2021 00:10:38 - INFO - __main__ - Step 20854: {'lr': 0.00048024653223695425, 'samples': 4003968, 'steps': 20853, 'loss/train': 1.3219914436340332} -11/07/2021 00:10:39 - INFO - __main__ - Step 20855: {'lr': 0.00048024446470206806, 'samples': 4004160, 'steps': 20854, 'loss/train': 1.3745572566986084} -11/07/2021 00:10:40 - INFO - __main__ - Step 20856: {'lr': 0.0004802423970634373, 'samples': 4004352, 'steps': 20855, 'loss/train': 1.3092901706695557} -11/07/2021 00:10:40 - INFO - __main__ - Step 20857: {'lr': 0.00048024032932106277, 'samples': 4004544, 'steps': 20856, 'loss/train': 2.9461312294006348} -11/07/2021 00:10:40 - INFO - __main__ - Step 20858: {'lr': 0.00048023826147494556, 'samples': 4004736, 'steps': 20857, 'loss/train': 1.3187404870986938} -11/07/2021 00:10:41 - INFO - __main__ - Step 20859: {'lr': 0.0004802361935250865, 'samples': 4004928, 'steps': 20858, 'loss/train': 1.6424322128295898} -11/07/2021 00:10:42 - INFO - __main__ - Step 20860: {'lr': 0.0004802341254714867, 'samples': 4005120, 'steps': 20859, 'loss/train': 1.394176959991455} -11/07/2021 00:10:42 - INFO - __main__ - Step 20861: {'lr': 0.00048023205731414684, 'samples': 4005312, 'steps': 20860, 'loss/train': 1.5472851991653442} -11/07/2021 00:10:42 - INFO - __main__ - Step 20862: {'lr': 0.00048022998905306795, 'samples': 4005504, 'steps': 20861, 'loss/train': 1.6439249515533447} -11/07/2021 00:10:43 - INFO - __main__ - Step 20863: {'lr': 0.00048022792068825107, 'samples': 4005696, 'steps': 20862, 'loss/train': 1.2037049531936646} -11/07/2021 00:10:43 - INFO - __main__ - Step 20864: {'lr': 0.00048022585221969697, 'samples': 4005888, 'steps': 20863, 'loss/train': 1.481030821800232} -11/07/2021 00:10:43 - INFO - __main__ - Step 20865: {'lr': 0.00048022378364740673, 'samples': 4006080, 'steps': 20864, 'loss/train': 1.4156023263931274} -11/07/2021 00:10:44 - INFO - __main__ - Step 20866: {'lr': 0.0004802217149713811, 'samples': 4006272, 'steps': 20865, 'loss/train': 1.7416797876358032} -11/07/2021 00:10:45 - INFO - __main__ - Step 20867: {'lr': 0.0004802196461916212, 'samples': 4006464, 'steps': 20866, 'loss/train': 1.5621509552001953} -11/07/2021 00:10:45 - INFO - __main__ - Step 20868: {'lr': 0.0004802175773081278, 'samples': 4006656, 'steps': 20867, 'loss/train': 1.5445585250854492} -11/07/2021 00:10:46 - INFO - __main__ - Step 20869: {'lr': 0.000480215508320902, 'samples': 4006848, 'steps': 20868, 'loss/train': 1.958810806274414} -11/07/2021 00:10:46 - INFO - __main__ - Step 20870: {'lr': 0.0004802134392299446, 'samples': 4007040, 'steps': 20869, 'loss/train': 1.8098005056381226} -11/07/2021 00:10:47 - INFO - __main__ - Step 20871: {'lr': 0.0004802113700352566, 'samples': 4007232, 'steps': 20870, 'loss/train': 1.7087562084197998} -11/07/2021 00:10:47 - INFO - __main__ - Step 20872: {'lr': 0.00048020930073683886, 'samples': 4007424, 'steps': 20871, 'loss/train': 1.5298601388931274} -11/07/2021 00:10:48 - INFO - __main__ - Step 20873: {'lr': 0.0004802072313346924, 'samples': 4007616, 'steps': 20872, 'loss/train': 1.7708653211593628} -11/07/2021 00:10:48 - INFO - __main__ - Step 20874: {'lr': 0.00048020516182881813, 'samples': 4007808, 'steps': 20873, 'loss/train': 1.6466927528381348} -11/07/2021 00:10:48 - INFO - __main__ - Step 20875: {'lr': 0.00048020309221921686, 'samples': 4008000, 'steps': 20874, 'loss/train': 1.5985970497131348} -11/07/2021 00:10:49 - INFO - __main__ - Step 20876: {'lr': 0.00048020102250588976, 'samples': 4008192, 'steps': 20875, 'loss/train': 1.2552753686904907} -11/07/2021 00:10:50 - INFO - __main__ - Step 20877: {'lr': 0.00048019895268883764, 'samples': 4008384, 'steps': 20876, 'loss/train': 1.6351234912872314} -11/07/2021 00:10:50 - INFO - __main__ - Step 20878: {'lr': 0.0004801968827680613, 'samples': 4008576, 'steps': 20877, 'loss/train': 1.4687561988830566} -11/07/2021 00:10:50 - INFO - __main__ - Step 20879: {'lr': 0.00048019481274356194, 'samples': 4008768, 'steps': 20878, 'loss/train': 2.0849993228912354} -11/07/2021 00:10:51 - INFO - __main__ - Step 20880: {'lr': 0.0004801927426153402, 'samples': 4008960, 'steps': 20879, 'loss/train': 1.5084853172302246} -11/07/2021 00:10:52 - INFO - __main__ - Step 20881: {'lr': 0.00048019067238339725, 'samples': 4009152, 'steps': 20880, 'loss/train': 1.1716647148132324} -11/07/2021 00:10:52 - INFO - __main__ - Step 20882: {'lr': 0.000480188602047734, 'samples': 4009344, 'steps': 20881, 'loss/train': 1.4270188808441162} -11/07/2021 00:10:52 - INFO - __main__ - Step 20883: {'lr': 0.0004801865316083512, 'samples': 4009536, 'steps': 20882, 'loss/train': 1.583962082862854} -11/07/2021 00:10:53 - INFO - __main__ - Step 20884: {'lr': 0.0004801844610652499, 'samples': 4009728, 'steps': 20883, 'loss/train': 1.8874273300170898} -11/07/2021 00:10:53 - INFO - __main__ - Step 20885: {'lr': 0.0004801823904184311, 'samples': 4009920, 'steps': 20884, 'loss/train': 1.2241159677505493} -11/07/2021 00:10:53 - INFO - __main__ - Step 20886: {'lr': 0.00048018031966789564, 'samples': 4010112, 'steps': 20885, 'loss/train': 1.395066738128662} -11/07/2021 00:10:54 - INFO - __main__ - Step 20887: {'lr': 0.0004801782488136445, 'samples': 4010304, 'steps': 20886, 'loss/train': 1.531816840171814} -11/07/2021 00:10:55 - INFO - __main__ - Step 20888: {'lr': 0.00048017617785567855, 'samples': 4010496, 'steps': 20887, 'loss/train': 1.872235655784607} -11/07/2021 00:10:55 - INFO - __main__ - Step 20889: {'lr': 0.00048017410679399876, 'samples': 4010688, 'steps': 20888, 'loss/train': 1.6539621353149414} -11/07/2021 00:10:56 - INFO - __main__ - Step 20890: {'lr': 0.00048017203562860614, 'samples': 4010880, 'steps': 20889, 'loss/train': 1.7974549531936646} -11/07/2021 00:10:56 - INFO - __main__ - Step 20891: {'lr': 0.0004801699643595015, 'samples': 4011072, 'steps': 20890, 'loss/train': 1.764176845550537} -11/07/2021 00:10:57 - INFO - __main__ - Step 20892: {'lr': 0.00048016789298668583, 'samples': 4011264, 'steps': 20891, 'loss/train': 1.7799986600875854} -11/07/2021 00:10:57 - INFO - __main__ - Step 20893: {'lr': 0.0004801658215101601, 'samples': 4011456, 'steps': 20892, 'loss/train': 1.6527446508407593} -11/07/2021 00:10:58 - INFO - __main__ - Step 20894: {'lr': 0.00048016374992992516, 'samples': 4011648, 'steps': 20893, 'loss/train': 1.2430540323257446} -11/07/2021 00:10:58 - INFO - __main__ - Step 20895: {'lr': 0.000480161678245982, 'samples': 4011840, 'steps': 20894, 'loss/train': 1.2979753017425537} -11/07/2021 00:10:58 - INFO - __main__ - Step 20896: {'lr': 0.0004801596064583315, 'samples': 4012032, 'steps': 20895, 'loss/train': 1.6988540887832642} -11/07/2021 00:11:00 - INFO - __main__ - Step 20897: {'lr': 0.00048015753456697466, 'samples': 4012224, 'steps': 20896, 'loss/train': 1.5440951585769653} -11/07/2021 00:11:00 - INFO - __main__ - Step 20898: {'lr': 0.00048015546257191243, 'samples': 4012416, 'steps': 20897, 'loss/train': 2.084376096725464} -11/07/2021 00:11:00 - INFO - __main__ - Step 20899: {'lr': 0.00048015339047314566, 'samples': 4012608, 'steps': 20898, 'loss/train': 1.7466663122177124} -11/07/2021 00:11:01 - INFO - __main__ - Step 20900: {'lr': 0.00048015131827067534, 'samples': 4012800, 'steps': 20899, 'loss/train': 1.352649450302124} -11/07/2021 00:11:01 - INFO - __main__ - Step 20901: {'lr': 0.0004801492459645024, 'samples': 4012992, 'steps': 20900, 'loss/train': 1.8301000595092773} -11/07/2021 00:11:02 - INFO - __main__ - Step 20902: {'lr': 0.0004801471735546277, 'samples': 4013184, 'steps': 20901, 'loss/train': 1.3566601276397705} -11/07/2021 00:11:02 - INFO - __main__ - Step 20903: {'lr': 0.0004801451010410522, 'samples': 4013376, 'steps': 20902, 'loss/train': 1.7443701028823853} -11/07/2021 00:11:03 - INFO - __main__ - Step 20904: {'lr': 0.000480143028423777, 'samples': 4013568, 'steps': 20903, 'loss/train': 1.2707422971725464} -11/07/2021 00:11:03 - INFO - __main__ - Step 20905: {'lr': 0.0004801409557028028, 'samples': 4013760, 'steps': 20904, 'loss/train': 0.893004834651947} -11/07/2021 00:11:03 - INFO - __main__ - Step 20906: {'lr': 0.0004801388828781307, 'samples': 4013952, 'steps': 20905, 'loss/train': 1.4361201524734497} -11/07/2021 00:11:04 - INFO - __main__ - Step 20907: {'lr': 0.00048013680994976154, 'samples': 4014144, 'steps': 20906, 'loss/train': 1.4615181684494019} -11/07/2021 00:11:05 - INFO - __main__ - Step 20908: {'lr': 0.0004801347369176963, 'samples': 4014336, 'steps': 20907, 'loss/train': 1.5402387380599976} -11/07/2021 00:11:05 - INFO - __main__ - Step 20909: {'lr': 0.00048013266378193586, 'samples': 4014528, 'steps': 20908, 'loss/train': 1.783090591430664} -11/07/2021 00:11:05 - INFO - __main__ - Step 20910: {'lr': 0.00048013059054248134, 'samples': 4014720, 'steps': 20909, 'loss/train': 1.7908695936203003} -11/07/2021 00:11:06 - INFO - __main__ - Step 20911: {'lr': 0.00048012851719933335, 'samples': 4014912, 'steps': 20910, 'loss/train': 1.4883944988250732} -11/07/2021 00:11:06 - INFO - __main__ - Step 20912: {'lr': 0.000480126443752493, 'samples': 4015104, 'steps': 20911, 'loss/train': 1.4716330766677856} -11/07/2021 00:11:07 - INFO - __main__ - Step 20913: {'lr': 0.0004801243702019614, 'samples': 4015296, 'steps': 20912, 'loss/train': 1.7692360877990723} -11/07/2021 00:11:08 - INFO - __main__ - Step 20914: {'lr': 0.00048012229654773915, 'samples': 4015488, 'steps': 20913, 'loss/train': 1.800770878791809} -11/07/2021 00:11:08 - INFO - __main__ - Step 20915: {'lr': 0.0004801202227898274, 'samples': 4015680, 'steps': 20914, 'loss/train': 1.5604429244995117} -11/07/2021 00:11:08 - INFO - __main__ - Step 20916: {'lr': 0.00048011814892822704, 'samples': 4015872, 'steps': 20915, 'loss/train': 1.069279670715332} -11/07/2021 00:11:09 - INFO - __main__ - Step 20917: {'lr': 0.00048011607496293896, 'samples': 4016064, 'steps': 20916, 'loss/train': 1.8001171350479126} -11/07/2021 00:11:10 - INFO - __main__ - Step 20918: {'lr': 0.0004801140008939642, 'samples': 4016256, 'steps': 20917, 'loss/train': 1.5695562362670898} -11/07/2021 00:11:10 - INFO - __main__ - Step 20919: {'lr': 0.00048011192672130356, 'samples': 4016448, 'steps': 20918, 'loss/train': 1.5356251001358032} -11/07/2021 00:11:10 - INFO - __main__ - Step 20920: {'lr': 0.000480109852444958, 'samples': 4016640, 'steps': 20919, 'loss/train': 1.2524460554122925} -11/07/2021 00:11:11 - INFO - __main__ - Step 20921: {'lr': 0.0004801077780649286, 'samples': 4016832, 'steps': 20920, 'loss/train': 1.808414101600647} -11/07/2021 00:11:11 - INFO - __main__ - Step 20922: {'lr': 0.00048010570358121606, 'samples': 4017024, 'steps': 20921, 'loss/train': 1.0232669115066528} -11/07/2021 00:11:12 - INFO - __main__ - Step 20923: {'lr': 0.0004801036289938215, 'samples': 4017216, 'steps': 20922, 'loss/train': 1.1512370109558105} -11/07/2021 00:11:13 - INFO - __main__ - Step 20924: {'lr': 0.0004801015543027458, 'samples': 4017408, 'steps': 20923, 'loss/train': 1.5613585710525513} -11/07/2021 00:11:13 - INFO - __main__ - Step 20925: {'lr': 0.0004800994795079899, 'samples': 4017600, 'steps': 20924, 'loss/train': 1.8445370197296143} -11/07/2021 00:11:13 - INFO - __main__ - Step 20926: {'lr': 0.00048009740460955465, 'samples': 4017792, 'steps': 20925, 'loss/train': 1.7685003280639648} -11/07/2021 00:11:14 - INFO - __main__ - Step 20927: {'lr': 0.00048009532960744116, 'samples': 4017984, 'steps': 20926, 'loss/train': 1.086643099784851} -11/07/2021 00:11:15 - INFO - __main__ - Step 20928: {'lr': 0.0004800932545016502, 'samples': 4018176, 'steps': 20927, 'loss/train': 1.2196599245071411} -11/07/2021 00:11:15 - INFO - __main__ - Step 20929: {'lr': 0.0004800911792921828, 'samples': 4018368, 'steps': 20928, 'loss/train': 1.2705469131469727} -11/07/2021 00:11:15 - INFO - __main__ - Step 20930: {'lr': 0.0004800891039790399, 'samples': 4018560, 'steps': 20929, 'loss/train': 1.3246406316757202} -11/07/2021 00:11:16 - INFO - __main__ - Step 20931: {'lr': 0.00048008702856222233, 'samples': 4018752, 'steps': 20930, 'loss/train': 1.7419018745422363} -11/07/2021 00:11:16 - INFO - __main__ - Step 20932: {'lr': 0.0004800849530417312, 'samples': 4018944, 'steps': 20931, 'loss/train': 1.572576880455017} -11/07/2021 00:11:17 - INFO - __main__ - Step 20933: {'lr': 0.00048008287741756715, 'samples': 4019136, 'steps': 20932, 'loss/train': 1.5679242610931396} -11/07/2021 00:11:17 - INFO - __main__ - Step 20934: {'lr': 0.00048008080168973144, 'samples': 4019328, 'steps': 20933, 'loss/train': 1.1735849380493164} -11/07/2021 00:11:18 - INFO - __main__ - Step 20935: {'lr': 0.00048007872585822486, 'samples': 4019520, 'steps': 20934, 'loss/train': 1.741011619567871} -11/07/2021 00:11:18 - INFO - __main__ - Step 20936: {'lr': 0.00048007664992304834, 'samples': 4019712, 'steps': 20935, 'loss/train': 1.6827812194824219} -11/07/2021 00:11:18 - INFO - __main__ - Step 20937: {'lr': 0.0004800745738842029, 'samples': 4019904, 'steps': 20936, 'loss/train': 1.646528720855713} -11/07/2021 00:11:20 - INFO - __main__ - Step 20938: {'lr': 0.0004800724977416894, 'samples': 4020096, 'steps': 20937, 'loss/train': 2.168165445327759} -11/07/2021 00:11:20 - INFO - __main__ - Step 20939: {'lr': 0.00048007042149550866, 'samples': 4020288, 'steps': 20938, 'loss/train': 1.931329369544983} -11/07/2021 00:11:20 - INFO - __main__ - Step 20940: {'lr': 0.00048006834514566183, 'samples': 4020480, 'steps': 20939, 'loss/train': 1.0786707401275635} -11/07/2021 00:11:21 - INFO - __main__ - Step 20941: {'lr': 0.00048006626869214977, 'samples': 4020672, 'steps': 20940, 'loss/train': 1.6631247997283936} -11/07/2021 00:11:21 - INFO - __main__ - Step 20942: {'lr': 0.00048006419213497334, 'samples': 4020864, 'steps': 20941, 'loss/train': 1.8388252258300781} -11/07/2021 00:11:21 - INFO - __main__ - Step 20943: {'lr': 0.0004800621154741335, 'samples': 4021056, 'steps': 20942, 'loss/train': 3.2117514610290527} -11/07/2021 00:11:22 - INFO - __main__ - Step 20944: {'lr': 0.00048006003870963135, 'samples': 4021248, 'steps': 20943, 'loss/train': 1.8050594329833984} -11/07/2021 00:11:23 - INFO - __main__ - Step 20945: {'lr': 0.0004800579618414676, 'samples': 4021440, 'steps': 20944, 'loss/train': 1.1371890306472778} -11/07/2021 00:11:23 - INFO - __main__ - Step 20946: {'lr': 0.0004800558848696433, 'samples': 4021632, 'steps': 20945, 'loss/train': 1.728974461555481} -11/07/2021 00:11:23 - INFO - __main__ - Step 20947: {'lr': 0.0004800538077941594, 'samples': 4021824, 'steps': 20946, 'loss/train': 1.4030572175979614} -11/07/2021 00:11:24 - INFO - __main__ - Step 20948: {'lr': 0.00048005173061501673, 'samples': 4022016, 'steps': 20947, 'loss/train': 1.3526893854141235} -11/07/2021 00:11:25 - INFO - __main__ - Step 20949: {'lr': 0.0004800496533322164, 'samples': 4022208, 'steps': 20948, 'loss/train': 1.645173192024231} -11/07/2021 00:11:25 - INFO - __main__ - Step 20950: {'lr': 0.00048004757594575923, 'samples': 4022400, 'steps': 20949, 'loss/train': 1.7988004684448242} -11/07/2021 00:11:25 - INFO - __main__ - Step 20951: {'lr': 0.0004800454984556461, 'samples': 4022592, 'steps': 20950, 'loss/train': 1.3141534328460693} -11/07/2021 00:11:26 - INFO - __main__ - Step 20952: {'lr': 0.00048004342086187805, 'samples': 4022784, 'steps': 20951, 'loss/train': 1.546395182609558} -11/07/2021 00:11:26 - INFO - __main__ - Step 20953: {'lr': 0.000480041343164456, 'samples': 4022976, 'steps': 20952, 'loss/train': 1.7359364032745361} -11/07/2021 00:11:27 - INFO - __main__ - Step 20954: {'lr': 0.0004800392653633808, 'samples': 4023168, 'steps': 20953, 'loss/train': 1.3687946796417236} -11/07/2021 00:11:27 - INFO - __main__ - Step 20955: {'lr': 0.0004800371874586535, 'samples': 4023360, 'steps': 20954, 'loss/train': 1.8569425344467163} -11/07/2021 00:11:28 - INFO - __main__ - Step 20956: {'lr': 0.0004800351094502751, 'samples': 4023552, 'steps': 20955, 'loss/train': 1.5773091316223145} -11/07/2021 00:11:28 - INFO - __main__ - Step 20957: {'lr': 0.00048003303133824633, 'samples': 4023744, 'steps': 20956, 'loss/train': 1.7824643850326538} -11/07/2021 00:11:29 - INFO - __main__ - Step 20958: {'lr': 0.0004800309531225683, 'samples': 4023936, 'steps': 20957, 'loss/train': 1.6135205030441284} -11/07/2021 00:11:29 - INFO - __main__ - Step 20959: {'lr': 0.00048002887480324175, 'samples': 4024128, 'steps': 20958, 'loss/train': 1.5606435537338257} -11/07/2021 00:11:30 - INFO - __main__ - Step 20960: {'lr': 0.0004800267963802678, 'samples': 4024320, 'steps': 20959, 'loss/train': 1.4907593727111816} -11/07/2021 00:11:30 - INFO - __main__ - Step 20961: {'lr': 0.0004800247178536473, 'samples': 4024512, 'steps': 20960, 'loss/train': 1.7517757415771484} -11/07/2021 00:11:30 - INFO - __main__ - Step 20962: {'lr': 0.0004800226392233813, 'samples': 4024704, 'steps': 20961, 'loss/train': 1.6995420455932617} -11/07/2021 00:11:31 - INFO - __main__ - Step 20963: {'lr': 0.00048002056048947054, 'samples': 4024896, 'steps': 20962, 'loss/train': 1.690382957458496} -11/07/2021 00:11:32 - INFO - __main__ - Step 20964: {'lr': 0.0004800184816519161, 'samples': 4025088, 'steps': 20963, 'loss/train': 1.702330470085144} -11/07/2021 00:11:32 - INFO - __main__ - Step 20965: {'lr': 0.0004800164027107189, 'samples': 4025280, 'steps': 20964, 'loss/train': 1.4207866191864014} -11/07/2021 00:11:33 - INFO - __main__ - Step 20966: {'lr': 0.0004800143236658798, 'samples': 4025472, 'steps': 20965, 'loss/train': 1.6319961547851562} -11/07/2021 00:11:33 - INFO - __main__ - Step 20967: {'lr': 0.0004800122445173999, 'samples': 4025664, 'steps': 20966, 'loss/train': 1.5580840110778809} -11/07/2021 00:11:33 - INFO - __main__ - Step 20968: {'lr': 0.00048001016526528, 'samples': 4025856, 'steps': 20967, 'loss/train': 1.623712182044983} -11/07/2021 00:11:34 - INFO - __main__ - Step 20969: {'lr': 0.00048000808590952106, 'samples': 4026048, 'steps': 20968, 'loss/train': 1.501164197921753} -11/07/2021 00:11:35 - INFO - __main__ - Step 20970: {'lr': 0.0004800060064501239, 'samples': 4026240, 'steps': 20969, 'loss/train': 1.4817878007888794} -11/07/2021 00:11:35 - INFO - __main__ - Step 20971: {'lr': 0.00048000392688708976, 'samples': 4026432, 'steps': 20970, 'loss/train': 1.5886551141738892} -11/07/2021 00:11:35 - INFO - __main__ - Step 20972: {'lr': 0.00048000184722041934, 'samples': 4026624, 'steps': 20971, 'loss/train': 1.4988945722579956} -11/07/2021 00:11:36 - INFO - __main__ - Step 20973: {'lr': 0.00047999976745011366, 'samples': 4026816, 'steps': 20972, 'loss/train': 1.794215202331543} -11/07/2021 00:11:37 - INFO - __main__ - Step 20974: {'lr': 0.0004799976875761736, 'samples': 4027008, 'steps': 20973, 'loss/train': 1.4776352643966675} -11/07/2021 00:11:37 - INFO - __main__ - Step 20975: {'lr': 0.00047999560759860006, 'samples': 4027200, 'steps': 20974, 'loss/train': 1.5870134830474854} -11/07/2021 00:11:37 - INFO - __main__ - Step 20976: {'lr': 0.00047999352751739414, 'samples': 4027392, 'steps': 20975, 'loss/train': 1.6789779663085938} -11/07/2021 00:11:38 - INFO - __main__ - Step 20977: {'lr': 0.0004799914473325567, 'samples': 4027584, 'steps': 20976, 'loss/train': 1.4126200675964355} -11/07/2021 00:11:38 - INFO - __main__ - Step 20978: {'lr': 0.00047998936704408865, 'samples': 4027776, 'steps': 20977, 'loss/train': 1.6767990589141846} -11/07/2021 00:11:39 - INFO - __main__ - Step 20979: {'lr': 0.00047998728665199085, 'samples': 4027968, 'steps': 20978, 'loss/train': 1.7134089469909668} -11/07/2021 00:11:40 - INFO - __main__ - Step 20980: {'lr': 0.00047998520615626447, 'samples': 4028160, 'steps': 20979, 'loss/train': 1.2816898822784424} -11/07/2021 00:11:40 - INFO - __main__ - Step 20981: {'lr': 0.0004799831255569102, 'samples': 4028352, 'steps': 20980, 'loss/train': 1.301430106163025} -11/07/2021 00:11:40 - INFO - __main__ - Step 20982: {'lr': 0.00047998104485392915, 'samples': 4028544, 'steps': 20981, 'loss/train': 1.5153762102127075} -11/07/2021 00:11:41 - INFO - __main__ - Step 20983: {'lr': 0.0004799789640473221, 'samples': 4028736, 'steps': 20982, 'loss/train': 0.35239240527153015} -11/07/2021 00:11:41 - INFO - __main__ - Step 20984: {'lr': 0.0004799768831370902, 'samples': 4028928, 'steps': 20983, 'loss/train': 1.8679004907608032} -11/07/2021 00:11:42 - INFO - __main__ - Step 20985: {'lr': 0.0004799748021232342, 'samples': 4029120, 'steps': 20984, 'loss/train': 1.7212649583816528} -11/07/2021 00:11:42 - INFO - __main__ - Step 20986: {'lr': 0.00047997272100575505, 'samples': 4029312, 'steps': 20985, 'loss/train': 1.5796945095062256} -11/07/2021 00:11:43 - INFO - __main__ - Step 20987: {'lr': 0.00047997063978465383, 'samples': 4029504, 'steps': 20986, 'loss/train': 1.249659538269043} -11/07/2021 00:11:43 - INFO - __main__ - Step 20988: {'lr': 0.0004799685584599313, 'samples': 4029696, 'steps': 20987, 'loss/train': 1.1187705993652344} -11/07/2021 00:11:43 - INFO - __main__ - Step 20989: {'lr': 0.00047996647703158857, 'samples': 4029888, 'steps': 20988, 'loss/train': 1.584458827972412} -11/07/2021 00:11:45 - INFO - __main__ - Step 20990: {'lr': 0.00047996439549962647, 'samples': 4030080, 'steps': 20989, 'loss/train': 1.601413607597351} -11/07/2021 00:11:45 - INFO - __main__ - Step 20991: {'lr': 0.00047996231386404593, 'samples': 4030272, 'steps': 20990, 'loss/train': 1.417210578918457} -11/07/2021 00:11:45 - INFO - __main__ - Step 20992: {'lr': 0.00047996023212484797, 'samples': 4030464, 'steps': 20991, 'loss/train': 1.6309233903884888} -11/07/2021 00:11:46 - INFO - __main__ - Step 20993: {'lr': 0.00047995815028203346, 'samples': 4030656, 'steps': 20992, 'loss/train': 0.9504069685935974} -11/07/2021 00:11:46 - INFO - __main__ - Step 20994: {'lr': 0.00047995606833560337, 'samples': 4030848, 'steps': 20993, 'loss/train': 1.437409520149231} -11/07/2021 00:11:47 - INFO - __main__ - Step 20995: {'lr': 0.0004799539862855585, 'samples': 4031040, 'steps': 20994, 'loss/train': 1.4952812194824219} -11/07/2021 00:11:47 - INFO - __main__ - Step 20996: {'lr': 0.00047995190413190004, 'samples': 4031232, 'steps': 20995, 'loss/train': 1.3429986238479614} -11/07/2021 00:11:48 - INFO - __main__ - Step 20997: {'lr': 0.00047994982187462876, 'samples': 4031424, 'steps': 20996, 'loss/train': 1.1650660037994385} -11/07/2021 00:11:48 - INFO - __main__ - Step 20998: {'lr': 0.0004799477395137457, 'samples': 4031616, 'steps': 20997, 'loss/train': 1.3438471555709839} -11/07/2021 00:11:49 - INFO - __main__ - Step 20999: {'lr': 0.00047994565704925166, 'samples': 4031808, 'steps': 20998, 'loss/train': 0.818544328212738} -11/07/2021 00:11:50 - INFO - __main__ - Step 21000: {'lr': 0.0004799435744811477, 'samples': 4032000, 'steps': 20999, 'loss/train': 1.3654391765594482} -11/07/2021 00:11:50 - INFO - __main__ - Step 21001: {'lr': 0.0004799414918094347, 'samples': 4032192, 'steps': 21000, 'loss/train': 1.828909993171692} -11/07/2021 00:11:50 - INFO - __main__ - Step 21002: {'lr': 0.0004799394090341136, 'samples': 4032384, 'steps': 21001, 'loss/train': 1.7335715293884277} -11/07/2021 00:11:51 - INFO - __main__ - Step 21003: {'lr': 0.0004799373261551854, 'samples': 4032576, 'steps': 21002, 'loss/train': 1.3147293329238892} -11/07/2021 00:11:51 - INFO - __main__ - Step 21004: {'lr': 0.0004799352431726509, 'samples': 4032768, 'steps': 21003, 'loss/train': 1.6731096506118774} -11/07/2021 00:11:53 - INFO - __main__ - Step 21005: {'lr': 0.0004799331600865112, 'samples': 4032960, 'steps': 21004, 'loss/train': 1.3603119850158691} -11/07/2021 00:11:53 - INFO - __main__ - Step 21006: {'lr': 0.0004799310768967671, 'samples': 4033152, 'steps': 21005, 'loss/train': 1.5929734706878662} -11/07/2021 00:11:53 - INFO - __main__ - Step 21007: {'lr': 0.00047992899360341966, 'samples': 4033344, 'steps': 21006, 'loss/train': 1.6748112440109253} -11/07/2021 00:11:54 - INFO - __main__ - Step 21008: {'lr': 0.0004799269102064698, 'samples': 4033536, 'steps': 21007, 'loss/train': 1.620564579963684} -11/07/2021 00:11:54 - INFO - __main__ - Step 21009: {'lr': 0.0004799248267059183, 'samples': 4033728, 'steps': 21008, 'loss/train': 1.672453761100769} -11/07/2021 00:11:54 - INFO - __main__ - Step 21010: {'lr': 0.0004799227431017663, 'samples': 4033920, 'steps': 21009, 'loss/train': 1.5249580144882202} -11/07/2021 00:11:56 - INFO - __main__ - Step 21011: {'lr': 0.0004799206593940147, 'samples': 4034112, 'steps': 21010, 'loss/train': 4.485203742980957} -11/07/2021 00:11:56 - INFO - __main__ - Step 21012: {'lr': 0.0004799185755826644, 'samples': 4034304, 'steps': 21011, 'loss/train': 1.062135934829712} -11/07/2021 00:11:56 - INFO - __main__ - Step 21013: {'lr': 0.00047991649166771624, 'samples': 4034496, 'steps': 21012, 'loss/train': 1.410986065864563} -11/07/2021 00:11:57 - INFO - __main__ - Step 21014: {'lr': 0.00047991440764917127, 'samples': 4034688, 'steps': 21013, 'loss/train': 1.6308702230453491} -11/07/2021 00:11:57 - INFO - __main__ - Step 21015: {'lr': 0.0004799123235270305, 'samples': 4034880, 'steps': 21014, 'loss/train': 2.6511857509613037} -11/07/2021 00:11:58 - INFO - __main__ - Step 21016: {'lr': 0.0004799102393012947, 'samples': 4035072, 'steps': 21015, 'loss/train': 2.724604845046997} -11/07/2021 00:11:58 - INFO - __main__ - Step 21017: {'lr': 0.0004799081549719649, 'samples': 4035264, 'steps': 21016, 'loss/train': 1.653235673904419} -11/07/2021 00:11:59 - INFO - __main__ - Step 21018: {'lr': 0.0004799060705390421, 'samples': 4035456, 'steps': 21017, 'loss/train': 1.4333916902542114} -11/07/2021 00:11:59 - INFO - __main__ - Step 21019: {'lr': 0.00047990398600252713, 'samples': 4035648, 'steps': 21018, 'loss/train': 1.2776241302490234} -11/07/2021 00:12:00 - INFO - __main__ - Step 21020: {'lr': 0.00047990190136242103, 'samples': 4035840, 'steps': 21019, 'loss/train': 2.232898473739624} -11/07/2021 00:12:00 - INFO - __main__ - Step 21021: {'lr': 0.0004798998166187246, 'samples': 4036032, 'steps': 21020, 'loss/train': 1.4598809480667114} -11/07/2021 00:12:00 - INFO - __main__ - Step 21022: {'lr': 0.0004798977317714389, 'samples': 4036224, 'steps': 21021, 'loss/train': 1.3510398864746094} -11/07/2021 00:12:01 - INFO - __main__ - Step 21023: {'lr': 0.00047989564682056487, 'samples': 4036416, 'steps': 21022, 'loss/train': 2.0689451694488525} -11/07/2021 00:12:02 - INFO - __main__ - Step 21024: {'lr': 0.0004798935617661033, 'samples': 4036608, 'steps': 21023, 'loss/train': 1.3049253225326538} -11/07/2021 00:12:02 - INFO - __main__ - Step 21025: {'lr': 0.0004798914766080553, 'samples': 4036800, 'steps': 21024, 'loss/train': 2.5650393962860107} -11/07/2021 00:12:02 - INFO - __main__ - Step 21026: {'lr': 0.00047988939134642174, 'samples': 4036992, 'steps': 21025, 'loss/train': 1.9371496438980103} -11/07/2021 00:12:03 - INFO - __main__ - Step 21027: {'lr': 0.00047988730598120356, 'samples': 4037184, 'steps': 21026, 'loss/train': 1.7897228002548218} -11/07/2021 00:12:04 - INFO - __main__ - Step 21028: {'lr': 0.00047988522051240173, 'samples': 4037376, 'steps': 21027, 'loss/train': 1.6327519416809082} -11/07/2021 00:12:04 - INFO - __main__ - Step 21029: {'lr': 0.0004798831349400172, 'samples': 4037568, 'steps': 21028, 'loss/train': 4.53317403793335} -11/07/2021 00:12:05 - INFO - __main__ - Step 21030: {'lr': 0.0004798810492640508, 'samples': 4037760, 'steps': 21029, 'loss/train': 1.88721764087677} -11/07/2021 00:12:05 - INFO - __main__ - Step 21031: {'lr': 0.00047987896348450354, 'samples': 4037952, 'steps': 21030, 'loss/train': 1.8528162240982056} -11/07/2021 00:12:05 - INFO - __main__ - Step 21032: {'lr': 0.00047987687760137646, 'samples': 4038144, 'steps': 21031, 'loss/train': 0.6381519436836243} -11/07/2021 00:12:07 - INFO - __main__ - Step 21033: {'lr': 0.00047987479161467033, 'samples': 4038336, 'steps': 21032, 'loss/train': 1.6966015100479126} -11/07/2021 00:12:07 - INFO - __main__ - Step 21034: {'lr': 0.0004798727055243862, 'samples': 4038528, 'steps': 21033, 'loss/train': 1.0211305618286133} -11/07/2021 00:12:07 - INFO - __main__ - Step 21035: {'lr': 0.000479870619330525, 'samples': 4038720, 'steps': 21034, 'loss/train': 1.7424684762954712} -11/07/2021 00:12:08 - INFO - __main__ - Step 21036: {'lr': 0.0004798685330330876, 'samples': 4038912, 'steps': 21035, 'loss/train': 2.236529588699341} -11/07/2021 00:12:08 - INFO - __main__ - Step 21037: {'lr': 0.000479866446632075, 'samples': 4039104, 'steps': 21036, 'loss/train': 1.7629296779632568} -11/07/2021 00:12:09 - INFO - __main__ - Step 21038: {'lr': 0.00047986436012748815, 'samples': 4039296, 'steps': 21037, 'loss/train': 1.6419411897659302} -11/07/2021 00:12:09 - INFO - __main__ - Step 21039: {'lr': 0.00047986227351932785, 'samples': 4039488, 'steps': 21038, 'loss/train': 1.955509901046753} -11/07/2021 00:12:10 - INFO - __main__ - Step 21040: {'lr': 0.00047986018680759525, 'samples': 4039680, 'steps': 21039, 'loss/train': 1.8619760274887085} -11/07/2021 00:12:10 - INFO - __main__ - Step 21041: {'lr': 0.00047985809999229125, 'samples': 4039872, 'steps': 21040, 'loss/train': 1.6903468370437622} -11/07/2021 00:12:10 - INFO - __main__ - Step 21042: {'lr': 0.00047985601307341667, 'samples': 4040064, 'steps': 21041, 'loss/train': 1.6033693552017212} -11/07/2021 00:12:11 - INFO - __main__ - Step 21043: {'lr': 0.0004798539260509725, 'samples': 4040256, 'steps': 21042, 'loss/train': 1.5110589265823364} -11/07/2021 00:12:12 - INFO - __main__ - Step 21044: {'lr': 0.00047985183892495977, 'samples': 4040448, 'steps': 21043, 'loss/train': 1.7737886905670166} -11/07/2021 00:12:12 - INFO - __main__ - Step 21045: {'lr': 0.00047984975169537925, 'samples': 4040640, 'steps': 21044, 'loss/train': 2.1395554542541504} -11/07/2021 00:12:12 - INFO - __main__ - Step 21046: {'lr': 0.00047984766436223205, 'samples': 4040832, 'steps': 21045, 'loss/train': 1.7177172899246216} -11/07/2021 00:12:13 - INFO - __main__ - Step 21047: {'lr': 0.000479845576925519, 'samples': 4041024, 'steps': 21046, 'loss/train': 1.8919692039489746} -11/07/2021 00:12:13 - INFO - __main__ - Step 21048: {'lr': 0.00047984348938524113, 'samples': 4041216, 'steps': 21047, 'loss/train': 1.8316309452056885} -11/07/2021 00:12:14 - INFO - __main__ - Step 21049: {'lr': 0.00047984140174139926, 'samples': 4041408, 'steps': 21048, 'loss/train': 1.637800693511963} -11/07/2021 00:12:14 - INFO - __main__ - Step 21050: {'lr': 0.0004798393139939945, 'samples': 4041600, 'steps': 21049, 'loss/train': 1.1018575429916382} -11/07/2021 00:12:15 - INFO - __main__ - Step 21051: {'lr': 0.0004798372261430276, 'samples': 4041792, 'steps': 21050, 'loss/train': 1.6706420183181763} -11/07/2021 00:12:15 - INFO - __main__ - Step 21052: {'lr': 0.00047983513818849967, 'samples': 4041984, 'steps': 21051, 'loss/train': 1.7306580543518066} -11/07/2021 00:12:15 - INFO - __main__ - Step 21053: {'lr': 0.0004798330501304115, 'samples': 4042176, 'steps': 21052, 'loss/train': 1.6159660816192627} -11/07/2021 00:12:16 - INFO - __main__ - Step 21054: {'lr': 0.00047983096196876413, 'samples': 4042368, 'steps': 21053, 'loss/train': 1.8145487308502197} -11/07/2021 00:12:17 - INFO - __main__ - Step 21055: {'lr': 0.00047982887370355846, 'samples': 4042560, 'steps': 21054, 'loss/train': 0.9376941323280334} -11/07/2021 00:12:17 - INFO - __main__ - Step 21056: {'lr': 0.0004798267853347955, 'samples': 4042752, 'steps': 21055, 'loss/train': 1.15646493434906} -11/07/2021 00:12:17 - INFO - __main__ - Step 21057: {'lr': 0.0004798246968624761, 'samples': 4042944, 'steps': 21056, 'loss/train': 1.7298862934112549} -11/07/2021 00:12:18 - INFO - __main__ - Step 21058: {'lr': 0.00047982260828660124, 'samples': 4043136, 'steps': 21057, 'loss/train': 1.785570502281189} -11/07/2021 00:12:19 - INFO - __main__ - Step 21059: {'lr': 0.0004798205196071719, 'samples': 4043328, 'steps': 21058, 'loss/train': 1.3368200063705444} -11/07/2021 00:12:19 - INFO - __main__ - Step 21060: {'lr': 0.00047981843082418884, 'samples': 4043520, 'steps': 21059, 'loss/train': 1.938208818435669} -11/07/2021 00:12:20 - INFO - __main__ - Step 21061: {'lr': 0.0004798163419376533, 'samples': 4043712, 'steps': 21060, 'loss/train': 1.3998974561691284} -11/07/2021 00:12:20 - INFO - __main__ - Step 21062: {'lr': 0.00047981425294756595, 'samples': 4043904, 'steps': 21061, 'loss/train': 1.4993808269500732} -11/07/2021 00:12:20 - INFO - __main__ - Step 21063: {'lr': 0.00047981216385392796, 'samples': 4044096, 'steps': 21062, 'loss/train': 1.275914192199707} -11/07/2021 00:12:21 - INFO - __main__ - Step 21064: {'lr': 0.0004798100746567401, 'samples': 4044288, 'steps': 21063, 'loss/train': 1.8225252628326416} -11/07/2021 00:12:22 - INFO - __main__ - Step 21065: {'lr': 0.00047980798535600334, 'samples': 4044480, 'steps': 21064, 'loss/train': 2.1295764446258545} -11/07/2021 00:12:22 - INFO - __main__ - Step 21066: {'lr': 0.00047980589595171866, 'samples': 4044672, 'steps': 21065, 'loss/train': 1.8311939239501953} -11/07/2021 00:12:22 - INFO - __main__ - Step 21067: {'lr': 0.000479803806443887, 'samples': 4044864, 'steps': 21066, 'loss/train': 1.5671026706695557} -11/07/2021 00:12:23 - INFO - __main__ - Step 21068: {'lr': 0.0004798017168325093, 'samples': 4045056, 'steps': 21067, 'loss/train': 1.1478503942489624} -11/07/2021 00:12:24 - INFO - __main__ - Step 21069: {'lr': 0.0004797996271175865, 'samples': 4045248, 'steps': 21068, 'loss/train': 1.5180654525756836} -11/07/2021 00:12:24 - INFO - __main__ - Step 21070: {'lr': 0.00047979753729911944, 'samples': 4045440, 'steps': 21069, 'loss/train': 1.7661678791046143} -11/07/2021 00:12:24 - INFO - __main__ - Step 21071: {'lr': 0.00047979544737710925, 'samples': 4045632, 'steps': 21070, 'loss/train': 1.5353820323944092} -11/07/2021 00:12:25 - INFO - __main__ - Step 21072: {'lr': 0.00047979335735155677, 'samples': 4045824, 'steps': 21071, 'loss/train': 1.630466341972351} -11/07/2021 00:12:25 - INFO - __main__ - Step 21073: {'lr': 0.00047979126722246294, 'samples': 4046016, 'steps': 21072, 'loss/train': 1.4065769910812378} -11/07/2021 00:12:26 - INFO - __main__ - Step 21074: {'lr': 0.0004797891769898287, 'samples': 4046208, 'steps': 21073, 'loss/train': 1.6578621864318848} -11/07/2021 00:12:26 - INFO - __main__ - Step 21075: {'lr': 0.00047978708665365503, 'samples': 4046400, 'steps': 21074, 'loss/train': 1.570343017578125} -11/07/2021 00:12:27 - INFO - __main__ - Step 21076: {'lr': 0.0004797849962139428, 'samples': 4046592, 'steps': 21075, 'loss/train': 1.786704421043396} -11/07/2021 00:12:27 - INFO - __main__ - Step 21077: {'lr': 0.00047978290567069306, 'samples': 4046784, 'steps': 21076, 'loss/train': 2.6458792686462402} -11/07/2021 00:12:28 - INFO - __main__ - Step 21078: {'lr': 0.00047978081502390656, 'samples': 4046976, 'steps': 21077, 'loss/train': 0.9769932627677917} -11/07/2021 00:12:29 - INFO - __main__ - Step 21079: {'lr': 0.0004797787242735845, 'samples': 4047168, 'steps': 21078, 'loss/train': 1.5711239576339722} -11/07/2021 00:12:29 - INFO - __main__ - Step 21080: {'lr': 0.00047977663341972765, 'samples': 4047360, 'steps': 21079, 'loss/train': 2.6277008056640625} -11/07/2021 00:12:29 - INFO - __main__ - Step 21081: {'lr': 0.00047977454246233696, 'samples': 4047552, 'steps': 21080, 'loss/train': 1.6991426944732666} -11/07/2021 00:12:30 - INFO - __main__ - Step 21082: {'lr': 0.00047977245140141354, 'samples': 4047744, 'steps': 21081, 'loss/train': 2.114461660385132} -11/07/2021 00:12:30 - INFO - __main__ - Step 21083: {'lr': 0.00047977036023695807, 'samples': 4047936, 'steps': 21082, 'loss/train': 2.2551801204681396} -11/07/2021 00:12:30 - INFO - __main__ - Step 21084: {'lr': 0.00047976826896897165, 'samples': 4048128, 'steps': 21083, 'loss/train': 1.5625381469726562} -11/07/2021 00:12:31 - INFO - __main__ - Step 21085: {'lr': 0.0004797661775974552, 'samples': 4048320, 'steps': 21084, 'loss/train': 1.0512539148330688} -11/07/2021 00:12:32 - INFO - __main__ - Step 21086: {'lr': 0.00047976408612240964, 'samples': 4048512, 'steps': 21085, 'loss/train': 1.6367626190185547} -11/07/2021 00:12:32 - INFO - __main__ - Step 21087: {'lr': 0.00047976199454383595, 'samples': 4048704, 'steps': 21086, 'loss/train': 2.107619285583496} -11/07/2021 00:12:32 - INFO - __main__ - Step 21088: {'lr': 0.00047975990286173504, 'samples': 4048896, 'steps': 21087, 'loss/train': 1.7704498767852783} -11/07/2021 00:12:33 - INFO - __main__ - Step 21089: {'lr': 0.00047975781107610784, 'samples': 4049088, 'steps': 21088, 'loss/train': 1.409651279449463} -11/07/2021 00:12:34 - INFO - __main__ - Step 21090: {'lr': 0.0004797557191869554, 'samples': 4049280, 'steps': 21089, 'loss/train': 1.722057819366455} -11/07/2021 00:12:34 - INFO - __main__ - Step 21091: {'lr': 0.0004797536271942785, 'samples': 4049472, 'steps': 21090, 'loss/train': 0.3714536726474762} -11/07/2021 00:12:35 - INFO - __main__ - Step 21092: {'lr': 0.00047975153509807815, 'samples': 4049664, 'steps': 21091, 'loss/train': 1.37582266330719} -11/07/2021 00:12:35 - INFO - __main__ - Step 21093: {'lr': 0.0004797494428983553, 'samples': 4049856, 'steps': 21092, 'loss/train': 2.382824182510376} -11/07/2021 00:12:35 - INFO - __main__ - Step 21094: {'lr': 0.000479747350595111, 'samples': 4050048, 'steps': 21093, 'loss/train': 1.4000967741012573} -11/07/2021 00:12:36 - INFO - __main__ - Step 21095: {'lr': 0.00047974525818834604, 'samples': 4050240, 'steps': 21094, 'loss/train': 1.4624602794647217} -11/07/2021 00:12:37 - INFO - __main__ - Step 21096: {'lr': 0.0004797431656780613, 'samples': 4050432, 'steps': 21095, 'loss/train': 1.8797059059143066} -11/07/2021 00:12:37 - INFO - __main__ - Step 21097: {'lr': 0.000479741073064258, 'samples': 4050624, 'steps': 21096, 'loss/train': 1.8052655458450317} -11/07/2021 00:12:37 - INFO - __main__ - Step 21098: {'lr': 0.0004797389803469369, 'samples': 4050816, 'steps': 21097, 'loss/train': 1.7806404829025269} -11/07/2021 00:12:38 - INFO - __main__ - Step 21099: {'lr': 0.0004797368875260988, 'samples': 4051008, 'steps': 21098, 'loss/train': 1.817021131515503} -11/07/2021 00:12:39 - INFO - __main__ - Step 21100: {'lr': 0.00047973479460174497, 'samples': 4051200, 'steps': 21099, 'loss/train': 1.438368320465088} -11/07/2021 00:12:39 - INFO - __main__ - Step 21101: {'lr': 0.00047973270157387605, 'samples': 4051392, 'steps': 21100, 'loss/train': 1.0588150024414062} -11/07/2021 00:12:39 - INFO - __main__ - Step 21102: {'lr': 0.0004797306084424932, 'samples': 4051584, 'steps': 21101, 'loss/train': 1.283268690109253} -11/07/2021 00:12:40 - INFO - __main__ - Step 21103: {'lr': 0.0004797285152075973, 'samples': 4051776, 'steps': 21102, 'loss/train': 1.7230778932571411} -11/07/2021 00:12:40 - INFO - __main__ - Step 21104: {'lr': 0.00047972642186918925, 'samples': 4051968, 'steps': 21103, 'loss/train': 1.8024054765701294} -11/07/2021 00:12:41 - INFO - __main__ - Step 21105: {'lr': 0.00047972432842727003, 'samples': 4052160, 'steps': 21104, 'loss/train': 1.590198278427124} -11/07/2021 00:12:41 - INFO - __main__ - Step 21106: {'lr': 0.0004797222348818405, 'samples': 4052352, 'steps': 21105, 'loss/train': 1.9167371988296509} -11/07/2021 00:12:42 - INFO - __main__ - Step 21107: {'lr': 0.00047972014123290183, 'samples': 4052544, 'steps': 21106, 'loss/train': 1.5365687608718872} -11/07/2021 00:12:42 - INFO - __main__ - Step 21108: {'lr': 0.00047971804748045464, 'samples': 4052736, 'steps': 21107, 'loss/train': 1.8305330276489258} -11/07/2021 00:12:43 - INFO - __main__ - Step 21109: {'lr': 0.00047971595362450014, 'samples': 4052928, 'steps': 21108, 'loss/train': 1.5538760423660278} -11/07/2021 00:12:43 - INFO - __main__ - Step 21110: {'lr': 0.00047971385966503923, 'samples': 4053120, 'steps': 21109, 'loss/train': 1.6489356756210327} -11/07/2021 00:12:44 - INFO - __main__ - Step 21111: {'lr': 0.0004797117656020727, 'samples': 4053312, 'steps': 21110, 'loss/train': 1.8342883586883545} -11/07/2021 00:12:44 - INFO - __main__ - Step 21112: {'lr': 0.0004797096714356016, 'samples': 4053504, 'steps': 21111, 'loss/train': 1.6683157682418823} -11/07/2021 00:12:45 - INFO - __main__ - Step 21113: {'lr': 0.0004797075771656269, 'samples': 4053696, 'steps': 21112, 'loss/train': 1.3306695222854614} -11/07/2021 00:12:45 - INFO - __main__ - Step 21114: {'lr': 0.0004797054827921495, 'samples': 4053888, 'steps': 21113, 'loss/train': 0.9768213629722595} -11/07/2021 00:12:45 - INFO - __main__ - Step 21115: {'lr': 0.0004797033883151703, 'samples': 4054080, 'steps': 21114, 'loss/train': 1.3049585819244385} -11/07/2021 00:12:46 - INFO - __main__ - Step 21116: {'lr': 0.0004797012937346904, 'samples': 4054272, 'steps': 21115, 'loss/train': 0.9799783229827881} -11/07/2021 00:12:47 - INFO - __main__ - Step 21117: {'lr': 0.0004796991990507106, 'samples': 4054464, 'steps': 21116, 'loss/train': 1.0931177139282227} -11/07/2021 00:12:47 - INFO - __main__ - Step 21118: {'lr': 0.00047969710426323185, 'samples': 4054656, 'steps': 21117, 'loss/train': 1.5874521732330322} -11/07/2021 00:12:47 - INFO - __main__ - Step 21119: {'lr': 0.0004796950093722552, 'samples': 4054848, 'steps': 21118, 'loss/train': 1.7003940343856812} -11/07/2021 00:12:48 - INFO - __main__ - Step 21120: {'lr': 0.00047969291437778143, 'samples': 4055040, 'steps': 21119, 'loss/train': 1.7281981706619263} -11/07/2021 00:12:49 - INFO - __main__ - Step 21121: {'lr': 0.00047969081927981165, 'samples': 4055232, 'steps': 21120, 'loss/train': 1.3604600429534912} -11/07/2021 00:12:49 - INFO - __main__ - Step 21122: {'lr': 0.0004796887240783467, 'samples': 4055424, 'steps': 21121, 'loss/train': 0.33510664105415344} -11/07/2021 00:12:50 - INFO - __main__ - Step 21123: {'lr': 0.0004796866287733875, 'samples': 4055616, 'steps': 21122, 'loss/train': 1.2340506315231323} -11/07/2021 00:12:50 - INFO - __main__ - Step 21124: {'lr': 0.0004796845333649352, 'samples': 4055808, 'steps': 21123, 'loss/train': 1.552304744720459} -11/07/2021 00:12:51 - INFO - __main__ - Step 21125: {'lr': 0.00047968243785299046, 'samples': 4056000, 'steps': 21124, 'loss/train': 1.78187894821167} -11/07/2021 00:12:51 - INFO - __main__ - Step 21126: {'lr': 0.0004796803422375544, 'samples': 4056192, 'steps': 21125, 'loss/train': 1.5677958726882935} -11/07/2021 00:12:52 - INFO - __main__ - Step 21127: {'lr': 0.0004796782465186279, 'samples': 4056384, 'steps': 21126, 'loss/train': 0.20881569385528564} -11/07/2021 00:12:52 - INFO - __main__ - Step 21128: {'lr': 0.00047967615069621197, 'samples': 4056576, 'steps': 21127, 'loss/train': 1.6353904008865356} -11/07/2021 00:12:53 - INFO - __main__ - Step 21129: {'lr': 0.0004796740547703075, 'samples': 4056768, 'steps': 21128, 'loss/train': 1.5348048210144043} -11/07/2021 00:12:53 - INFO - __main__ - Step 21130: {'lr': 0.00047967195874091547, 'samples': 4056960, 'steps': 21129, 'loss/train': 1.6365200281143188} -11/07/2021 00:12:53 - INFO - __main__ - Step 21131: {'lr': 0.00047966986260803676, 'samples': 4057152, 'steps': 21130, 'loss/train': 1.6884819269180298} -11/07/2021 00:12:54 - INFO - __main__ - Step 21132: {'lr': 0.0004796677663716723, 'samples': 4057344, 'steps': 21131, 'loss/train': 1.2197633981704712} -11/07/2021 00:12:55 - INFO - __main__ - Step 21133: {'lr': 0.00047966567003182315, 'samples': 4057536, 'steps': 21132, 'loss/train': 1.3943464756011963} -11/07/2021 00:12:55 - INFO - __main__ - Step 21134: {'lr': 0.0004796635735884902, 'samples': 4057728, 'steps': 21133, 'loss/train': 1.5279340744018555} -11/07/2021 00:12:56 - INFO - __main__ - Step 21135: {'lr': 0.0004796614770416744, 'samples': 4057920, 'steps': 21134, 'loss/train': 1.308184027671814} -11/07/2021 00:12:56 - INFO - __main__ - Step 21136: {'lr': 0.00047965938039137666, 'samples': 4058112, 'steps': 21135, 'loss/train': 1.3822206258773804} -11/07/2021 00:12:57 - INFO - __main__ - Step 21137: {'lr': 0.000479657283637598, 'samples': 4058304, 'steps': 21136, 'loss/train': 1.382985234260559} -11/07/2021 00:12:57 - INFO - __main__ - Step 21138: {'lr': 0.00047965518678033924, 'samples': 4058496, 'steps': 21137, 'loss/train': 1.4995598793029785} -11/07/2021 00:12:57 - INFO - __main__ - Step 21139: {'lr': 0.00047965308981960143, 'samples': 4058688, 'steps': 21138, 'loss/train': 1.426271915435791} -11/07/2021 00:12:58 - INFO - __main__ - Step 21140: {'lr': 0.0004796509927553854, 'samples': 4058880, 'steps': 21139, 'loss/train': 1.2639167308807373} -11/07/2021 00:12:58 - INFO - __main__ - Step 21141: {'lr': 0.00047964889558769233, 'samples': 4059072, 'steps': 21140, 'loss/train': 1.5699936151504517} -11/07/2021 00:12:59 - INFO - __main__ - Step 21142: {'lr': 0.00047964679831652294, 'samples': 4059264, 'steps': 21141, 'loss/train': 1.2318005561828613} -11/07/2021 00:13:00 - INFO - __main__ - Step 21143: {'lr': 0.00047964470094187815, 'samples': 4059456, 'steps': 21142, 'loss/train': 0.17193424701690674} -11/07/2021 00:13:00 - INFO - __main__ - Step 21144: {'lr': 0.0004796426034637591, 'samples': 4059648, 'steps': 21143, 'loss/train': 1.6715084314346313} -11/07/2021 00:13:00 - INFO - __main__ - Step 21145: {'lr': 0.0004796405058821666, 'samples': 4059840, 'steps': 21144, 'loss/train': 1.1046626567840576} -11/07/2021 00:13:01 - INFO - __main__ - Step 21146: {'lr': 0.0004796384081971017, 'samples': 4060032, 'steps': 21145, 'loss/train': 1.7059005498886108} -11/07/2021 00:13:01 - INFO - __main__ - Step 21147: {'lr': 0.0004796363104085652, 'samples': 4060224, 'steps': 21146, 'loss/train': 1.8541324138641357} -11/07/2021 00:13:02 - INFO - __main__ - Step 21148: {'lr': 0.00047963421251655817, 'samples': 4060416, 'steps': 21147, 'loss/train': 1.7760694026947021} -11/07/2021 00:13:02 - INFO - __main__ - Step 21149: {'lr': 0.00047963211452108144, 'samples': 4060608, 'steps': 21148, 'loss/train': 1.298509955406189} -11/07/2021 00:13:03 - INFO - __main__ - Step 21150: {'lr': 0.0004796300164221361, 'samples': 4060800, 'steps': 21149, 'loss/train': 1.3676725625991821} -11/07/2021 00:13:03 - INFO - __main__ - Step 21151: {'lr': 0.00047962791821972296, 'samples': 4060992, 'steps': 21150, 'loss/train': 1.5314453840255737} -11/07/2021 00:13:03 - INFO - __main__ - Step 21152: {'lr': 0.00047962581991384305, 'samples': 4061184, 'steps': 21151, 'loss/train': 1.3802883625030518} -11/07/2021 00:13:05 - INFO - __main__ - Step 21153: {'lr': 0.0004796237215044973, 'samples': 4061376, 'steps': 21152, 'loss/train': 0.8671078085899353} -11/07/2021 00:13:05 - INFO - __main__ - Step 21154: {'lr': 0.0004796216229916867, 'samples': 4061568, 'steps': 21153, 'loss/train': 2.082179307937622} -11/07/2021 00:13:05 - INFO - __main__ - Step 21155: {'lr': 0.000479619524375412, 'samples': 4061760, 'steps': 21154, 'loss/train': 1.5132710933685303} -11/07/2021 00:13:06 - INFO - __main__ - Step 21156: {'lr': 0.0004796174256556744, 'samples': 4061952, 'steps': 21155, 'loss/train': 1.778990626335144} -11/07/2021 00:13:06 - INFO - __main__ - Step 21157: {'lr': 0.0004796153268324747, 'samples': 4062144, 'steps': 21156, 'loss/train': 2.0939102172851562} -11/07/2021 00:13:07 - INFO - __main__ - Step 21158: {'lr': 0.00047961322790581384, 'samples': 4062336, 'steps': 21157, 'loss/train': 1.0755528211593628} -11/07/2021 00:13:07 - INFO - __main__ - Step 21159: {'lr': 0.00047961112887569285, 'samples': 4062528, 'steps': 21158, 'loss/train': 1.004090666770935} -11/07/2021 00:13:08 - INFO - __main__ - Step 21160: {'lr': 0.0004796090297421126, 'samples': 4062720, 'steps': 21159, 'loss/train': 1.5249578952789307} -11/07/2021 00:13:08 - INFO - __main__ - Step 21161: {'lr': 0.0004796069305050741, 'samples': 4062912, 'steps': 21160, 'loss/train': 1.7508039474487305} -11/07/2021 00:13:08 - INFO - __main__ - Step 21162: {'lr': 0.0004796048311645782, 'samples': 4063104, 'steps': 21161, 'loss/train': 1.584632396697998} -11/07/2021 00:13:09 - INFO - __main__ - Step 21163: {'lr': 0.00047960273172062596, 'samples': 4063296, 'steps': 21162, 'loss/train': 0.974990725517273} -11/07/2021 00:13:10 - INFO - __main__ - Step 21164: {'lr': 0.00047960063217321824, 'samples': 4063488, 'steps': 21163, 'loss/train': 0.8087447285652161} -11/07/2021 00:13:10 - INFO - __main__ - Step 21165: {'lr': 0.0004795985325223561, 'samples': 4063680, 'steps': 21164, 'loss/train': 0.8941444158554077} -11/07/2021 00:13:10 - INFO - __main__ - Step 21166: {'lr': 0.00047959643276804026, 'samples': 4063872, 'steps': 21165, 'loss/train': 2.0346102714538574} -11/07/2021 00:13:11 - INFO - __main__ - Step 21167: {'lr': 0.0004795943329102719, 'samples': 4064064, 'steps': 21166, 'loss/train': 1.8948001861572266} -11/07/2021 00:13:11 - INFO - __main__ - Step 21168: {'lr': 0.00047959223294905185, 'samples': 4064256, 'steps': 21167, 'loss/train': 1.3930824995040894} -11/07/2021 00:13:12 - INFO - __main__ - Step 21169: {'lr': 0.00047959013288438113, 'samples': 4064448, 'steps': 21168, 'loss/train': 2.1027698516845703} -11/07/2021 00:13:13 - INFO - __main__ - Step 21170: {'lr': 0.0004795880327162606, 'samples': 4064640, 'steps': 21169, 'loss/train': 1.8361570835113525} -11/07/2021 00:13:13 - INFO - __main__ - Step 21171: {'lr': 0.0004795859324446912, 'samples': 4064832, 'steps': 21170, 'loss/train': 0.1968582719564438} -11/07/2021 00:13:13 - INFO - __main__ - Step 21172: {'lr': 0.000479583832069674, 'samples': 4065024, 'steps': 21171, 'loss/train': 1.953822374343872} -11/07/2021 00:13:14 - INFO - __main__ - Step 21173: {'lr': 0.00047958173159120984, 'samples': 4065216, 'steps': 21172, 'loss/train': 1.3294357061386108} -11/07/2021 00:13:15 - INFO - __main__ - Step 21174: {'lr': 0.0004795796310092997, 'samples': 4065408, 'steps': 21173, 'loss/train': 1.368573546409607} -11/07/2021 00:13:15 - INFO - __main__ - Step 21175: {'lr': 0.00047957753032394445, 'samples': 4065600, 'steps': 21174, 'loss/train': 1.3646577596664429} -11/07/2021 00:13:15 - INFO - __main__ - Step 21176: {'lr': 0.00047957542953514523, 'samples': 4065792, 'steps': 21175, 'loss/train': 1.5818638801574707} -11/07/2021 00:13:16 - INFO - __main__ - Step 21177: {'lr': 0.00047957332864290283, 'samples': 4065984, 'steps': 21176, 'loss/train': 1.4539034366607666} -11/07/2021 00:13:16 - INFO - __main__ - Step 21178: {'lr': 0.00047957122764721817, 'samples': 4066176, 'steps': 21177, 'loss/train': 1.3946402072906494} -11/07/2021 00:13:17 - INFO - __main__ - Step 21179: {'lr': 0.00047956912654809227, 'samples': 4066368, 'steps': 21178, 'loss/train': 1.720708966255188} -11/07/2021 00:13:18 - INFO - __main__ - Step 21180: {'lr': 0.0004795670253455261, 'samples': 4066560, 'steps': 21179, 'loss/train': 1.664499044418335} -11/07/2021 00:13:18 - INFO - __main__ - Step 21181: {'lr': 0.00047956492403952055, 'samples': 4066752, 'steps': 21180, 'loss/train': 1.7864108085632324} -11/07/2021 00:13:18 - INFO - __main__ - Step 21182: {'lr': 0.00047956282263007663, 'samples': 4066944, 'steps': 21181, 'loss/train': 2.069216728210449} -11/07/2021 00:13:19 - INFO - __main__ - Step 21183: {'lr': 0.00047956072111719517, 'samples': 4067136, 'steps': 21182, 'loss/train': 2.2219934463500977} -11/07/2021 00:13:20 - INFO - __main__ - Step 21184: {'lr': 0.00047955861950087724, 'samples': 4067328, 'steps': 21183, 'loss/train': 1.7120684385299683} -11/07/2021 00:13:20 - INFO - __main__ - Step 21185: {'lr': 0.00047955651778112376, 'samples': 4067520, 'steps': 21184, 'loss/train': 1.7454752922058105} -11/07/2021 00:13:20 - INFO - __main__ - Step 21186: {'lr': 0.00047955441595793556, 'samples': 4067712, 'steps': 21185, 'loss/train': 1.556066632270813} -11/07/2021 00:13:21 - INFO - __main__ - Step 21187: {'lr': 0.0004795523140313138, 'samples': 4067904, 'steps': 21186, 'loss/train': 1.2820478677749634} -11/07/2021 00:13:21 - INFO - __main__ - Step 21188: {'lr': 0.00047955021200125924, 'samples': 4068096, 'steps': 21187, 'loss/train': 1.2648670673370361} -11/07/2021 00:13:22 - INFO - __main__ - Step 21189: {'lr': 0.0004795481098677729, 'samples': 4068288, 'steps': 21188, 'loss/train': 1.7958683967590332} -11/07/2021 00:13:22 - INFO - __main__ - Step 21190: {'lr': 0.00047954600763085577, 'samples': 4068480, 'steps': 21189, 'loss/train': 1.792773723602295} -11/07/2021 00:13:23 - INFO - __main__ - Step 21191: {'lr': 0.0004795439052905087, 'samples': 4068672, 'steps': 21190, 'loss/train': 1.736327052116394} -11/07/2021 00:13:23 - INFO - __main__ - Step 21192: {'lr': 0.0004795418028467327, 'samples': 4068864, 'steps': 21191, 'loss/train': 1.8518633842468262} -11/07/2021 00:13:23 - INFO - __main__ - Step 21193: {'lr': 0.0004795397002995288, 'samples': 4069056, 'steps': 21192, 'loss/train': 1.6165372133255005} -11/07/2021 00:13:24 - INFO - __main__ - Step 21194: {'lr': 0.0004795375976488977, 'samples': 4069248, 'steps': 21193, 'loss/train': 2.0459771156311035} -11/07/2021 00:13:25 - INFO - __main__ - Step 21195: {'lr': 0.00047953549489484056, 'samples': 4069440, 'steps': 21194, 'loss/train': 1.7422749996185303} -11/07/2021 00:13:25 - INFO - __main__ - Step 21196: {'lr': 0.0004795333920373583, 'samples': 4069632, 'steps': 21195, 'loss/train': 1.8609914779663086} -11/07/2021 00:13:25 - INFO - __main__ - Step 21197: {'lr': 0.00047953128907645185, 'samples': 4069824, 'steps': 21196, 'loss/train': 1.623853087425232} -11/07/2021 00:13:26 - INFO - __main__ - Step 21198: {'lr': 0.000479529186012122, 'samples': 4070016, 'steps': 21197, 'loss/train': 1.546166181564331} -11/07/2021 00:13:26 - INFO - __main__ - Step 21199: {'lr': 0.00047952708284437, 'samples': 4070208, 'steps': 21198, 'loss/train': 1.3570958375930786} -11/07/2021 00:13:27 - INFO - __main__ - Step 21200: {'lr': 0.0004795249795731966, 'samples': 4070400, 'steps': 21199, 'loss/train': 1.755671739578247} -11/07/2021 00:13:28 - INFO - __main__ - Step 21201: {'lr': 0.00047952287619860273, 'samples': 4070592, 'steps': 21200, 'loss/train': 1.8419883251190186} -11/07/2021 00:13:28 - INFO - __main__ - Step 21202: {'lr': 0.0004795207727205895, 'samples': 4070784, 'steps': 21201, 'loss/train': 2.0788772106170654} -11/07/2021 00:13:28 - INFO - __main__ - Step 21203: {'lr': 0.00047951866913915767, 'samples': 4070976, 'steps': 21202, 'loss/train': 1.6653965711593628} -11/07/2021 00:13:29 - INFO - __main__ - Step 21204: {'lr': 0.0004795165654543082, 'samples': 4071168, 'steps': 21203, 'loss/train': 2.297816514968872} -11/07/2021 00:13:30 - INFO - __main__ - Step 21205: {'lr': 0.0004795144616660422, 'samples': 4071360, 'steps': 21204, 'loss/train': 1.7352765798568726} -11/07/2021 00:13:30 - INFO - __main__ - Step 21206: {'lr': 0.0004795123577743605, 'samples': 4071552, 'steps': 21205, 'loss/train': 0.8612052798271179} -11/07/2021 00:13:30 - INFO - __main__ - Step 21207: {'lr': 0.0004795102537792641, 'samples': 4071744, 'steps': 21206, 'loss/train': 1.7479983568191528} -11/07/2021 00:13:31 - INFO - __main__ - Step 21208: {'lr': 0.000479508149680754, 'samples': 4071936, 'steps': 21207, 'loss/train': 1.8053940534591675} -11/07/2021 00:13:31 - INFO - __main__ - Step 21209: {'lr': 0.0004795060454788309, 'samples': 4072128, 'steps': 21208, 'loss/train': 1.6106544733047485} -11/07/2021 00:13:32 - INFO - __main__ - Step 21210: {'lr': 0.000479503941173496, 'samples': 4072320, 'steps': 21209, 'loss/train': 2.015735387802124} -11/07/2021 00:13:33 - INFO - __main__ - Step 21211: {'lr': 0.0004795018367647501, 'samples': 4072512, 'steps': 21210, 'loss/train': 1.5669276714324951} -11/07/2021 00:13:33 - INFO - __main__ - Step 21212: {'lr': 0.0004794997322525944, 'samples': 4072704, 'steps': 21211, 'loss/train': 0.42870834469795227} -11/07/2021 00:13:33 - INFO - __main__ - Step 21213: {'lr': 0.0004794976276370295, 'samples': 4072896, 'steps': 21212, 'loss/train': 1.104694128036499} -11/07/2021 00:13:34 - INFO - __main__ - Step 21214: {'lr': 0.00047949552291805654, 'samples': 4073088, 'steps': 21213, 'loss/train': 1.143908977508545} -11/07/2021 00:13:35 - INFO - __main__ - Step 21215: {'lr': 0.0004794934180956764, 'samples': 4073280, 'steps': 21214, 'loss/train': 1.7211107015609741} -11/07/2021 00:13:35 - INFO - __main__ - Step 21216: {'lr': 0.00047949131316989016, 'samples': 4073472, 'steps': 21215, 'loss/train': 1.2839972972869873} -11/07/2021 00:13:35 - INFO - __main__ - Step 21217: {'lr': 0.0004794892081406986, 'samples': 4073664, 'steps': 21216, 'loss/train': 1.9193248748779297} -11/07/2021 00:13:36 - INFO - __main__ - Step 21218: {'lr': 0.00047948710300810276, 'samples': 4073856, 'steps': 21217, 'loss/train': 1.1737147569656372} -11/07/2021 00:13:36 - INFO - __main__ - Step 21219: {'lr': 0.0004794849977721036, 'samples': 4074048, 'steps': 21218, 'loss/train': 1.3072047233581543} -11/07/2021 00:13:37 - INFO - __main__ - Step 21220: {'lr': 0.00047948289243270205, 'samples': 4074240, 'steps': 21219, 'loss/train': 2.3479273319244385} -11/07/2021 00:13:38 - INFO - __main__ - Step 21221: {'lr': 0.000479480786989899, 'samples': 4074432, 'steps': 21220, 'loss/train': 1.474902868270874} -11/07/2021 00:13:38 - INFO - __main__ - Step 21222: {'lr': 0.0004794786814436955, 'samples': 4074624, 'steps': 21221, 'loss/train': 0.7210199236869812} -11/07/2021 00:13:38 - INFO - __main__ - Step 21223: {'lr': 0.0004794765757940924, 'samples': 4074816, 'steps': 21222, 'loss/train': 1.7698161602020264} -11/07/2021 00:13:39 - INFO - __main__ - Step 21224: {'lr': 0.00047947447004109066, 'samples': 4075008, 'steps': 21223, 'loss/train': 1.5735344886779785} -11/07/2021 00:13:40 - INFO - __main__ - Step 21225: {'lr': 0.0004794723641846914, 'samples': 4075200, 'steps': 21224, 'loss/train': 2.287526845932007} -11/07/2021 00:13:40 - INFO - __main__ - Step 21226: {'lr': 0.0004794702582248953, 'samples': 4075392, 'steps': 21225, 'loss/train': 1.3349794149398804} -11/07/2021 00:13:40 - INFO - __main__ - Step 21227: {'lr': 0.0004794681521617035, 'samples': 4075584, 'steps': 21226, 'loss/train': 1.7850278615951538} -11/07/2021 00:13:41 - INFO - __main__ - Step 21228: {'lr': 0.0004794660459951169, 'samples': 4075776, 'steps': 21227, 'loss/train': 1.253070592880249} -11/07/2021 00:13:41 - INFO - __main__ - Step 21229: {'lr': 0.0004794639397251365, 'samples': 4075968, 'steps': 21228, 'loss/train': 1.8737459182739258} -11/07/2021 00:13:42 - INFO - __main__ - Step 21230: {'lr': 0.00047946183335176307, 'samples': 4076160, 'steps': 21229, 'loss/train': 1.4230912923812866} -11/07/2021 00:13:42 - INFO - __main__ - Step 21231: {'lr': 0.00047945972687499775, 'samples': 4076352, 'steps': 21230, 'loss/train': 1.8137074708938599} -11/07/2021 00:13:43 - INFO - __main__ - Step 21232: {'lr': 0.0004794576202948414, 'samples': 4076544, 'steps': 21231, 'loss/train': 1.383471131324768} -11/07/2021 00:13:43 - INFO - __main__ - Step 21233: {'lr': 0.000479455513611295, 'samples': 4076736, 'steps': 21232, 'loss/train': 1.8926209211349487} -11/07/2021 00:13:43 - INFO - __main__ - Step 21234: {'lr': 0.00047945340682435943, 'samples': 4076928, 'steps': 21233, 'loss/train': 1.588423252105713} -11/07/2021 00:13:44 - INFO - __main__ - Step 21235: {'lr': 0.00047945129993403577, 'samples': 4077120, 'steps': 21234, 'loss/train': 1.1220974922180176} -11/07/2021 00:13:45 - INFO - __main__ - Step 21236: {'lr': 0.00047944919294032486, 'samples': 4077312, 'steps': 21235, 'loss/train': 1.501308560371399} -11/07/2021 00:13:45 - INFO - __main__ - Step 21237: {'lr': 0.00047944708584322763, 'samples': 4077504, 'steps': 21236, 'loss/train': 1.2461358308792114} -11/07/2021 00:13:45 - INFO - __main__ - Step 21238: {'lr': 0.00047944497864274517, 'samples': 4077696, 'steps': 21237, 'loss/train': 2.0483508110046387} -11/07/2021 00:13:46 - INFO - __main__ - Step 21239: {'lr': 0.00047944287133887834, 'samples': 4077888, 'steps': 21238, 'loss/train': 1.5501058101654053} -11/07/2021 00:13:47 - INFO - __main__ - Step 21240: {'lr': 0.00047944076393162806, 'samples': 4078080, 'steps': 21239, 'loss/train': 1.4833170175552368} -11/07/2021 00:13:47 - INFO - __main__ - Step 21241: {'lr': 0.00047943865642099525, 'samples': 4078272, 'steps': 21240, 'loss/train': 1.667752981185913} -11/07/2021 00:13:48 - INFO - __main__ - Step 21242: {'lr': 0.00047943654880698106, 'samples': 4078464, 'steps': 21241, 'loss/train': 2.3272855281829834} -11/07/2021 00:13:48 - INFO - __main__ - Step 21243: {'lr': 0.00047943444108958623, 'samples': 4078656, 'steps': 21242, 'loss/train': 3.5779306888580322} -11/07/2021 00:13:48 - INFO - __main__ - Step 21244: {'lr': 0.00047943233326881176, 'samples': 4078848, 'steps': 21243, 'loss/train': 1.0798635482788086} -11/07/2021 00:13:49 - INFO - __main__ - Step 21245: {'lr': 0.00047943022534465866, 'samples': 4079040, 'steps': 21244, 'loss/train': 1.2242178916931152} -11/07/2021 00:13:50 - INFO - __main__ - Step 21246: {'lr': 0.00047942811731712775, 'samples': 4079232, 'steps': 21245, 'loss/train': 1.6346696615219116} -11/07/2021 00:13:50 - INFO - __main__ - Step 21247: {'lr': 0.0004794260091862202, 'samples': 4079424, 'steps': 21246, 'loss/train': 1.1817291975021362} -11/07/2021 00:13:51 - INFO - __main__ - Step 21248: {'lr': 0.0004794239009519368, 'samples': 4079616, 'steps': 21247, 'loss/train': 1.7059050798416138} -11/07/2021 00:13:51 - INFO - __main__ - Step 21249: {'lr': 0.00047942179261427847, 'samples': 4079808, 'steps': 21248, 'loss/train': 1.453378438949585} -11/07/2021 00:13:51 - INFO - __main__ - Step 21250: {'lr': 0.0004794196841732463, 'samples': 4080000, 'steps': 21249, 'loss/train': 2.1280789375305176} -11/07/2021 00:13:52 - INFO - __main__ - Step 21251: {'lr': 0.0004794175756288411, 'samples': 4080192, 'steps': 21250, 'loss/train': 1.54837965965271} -11/07/2021 00:13:53 - INFO - __main__ - Step 21252: {'lr': 0.00047941546698106386, 'samples': 4080384, 'steps': 21251, 'loss/train': 1.0373538732528687} -11/07/2021 00:13:53 - INFO - __main__ - Step 21253: {'lr': 0.0004794133582299156, 'samples': 4080576, 'steps': 21252, 'loss/train': 1.5038514137268066} -11/07/2021 00:13:53 - INFO - __main__ - Step 21254: {'lr': 0.0004794112493753972, 'samples': 4080768, 'steps': 21253, 'loss/train': 1.8955644369125366} -11/07/2021 00:13:54 - INFO - __main__ - Step 21255: {'lr': 0.0004794091404175097, 'samples': 4080960, 'steps': 21254, 'loss/train': 1.3596187829971313} -11/07/2021 00:13:55 - INFO - __main__ - Step 21256: {'lr': 0.00047940703135625386, 'samples': 4081152, 'steps': 21255, 'loss/train': 1.5795459747314453} -11/07/2021 00:13:55 - INFO - __main__ - Step 21257: {'lr': 0.0004794049221916308, 'samples': 4081344, 'steps': 21256, 'loss/train': 1.0606127977371216} -11/07/2021 00:13:55 - INFO - __main__ - Step 21258: {'lr': 0.00047940281292364146, 'samples': 4081536, 'steps': 21257, 'loss/train': 1.7316327095031738} -11/07/2021 00:13:56 - INFO - __main__ - Step 21259: {'lr': 0.0004794007035522867, 'samples': 4081728, 'steps': 21258, 'loss/train': 1.6890673637390137} -11/07/2021 00:13:56 - INFO - __main__ - Step 21260: {'lr': 0.0004793985940775676, 'samples': 4081920, 'steps': 21259, 'loss/train': 1.8833643198013306} -11/07/2021 00:13:57 - INFO - __main__ - Step 21261: {'lr': 0.0004793964844994849, 'samples': 4082112, 'steps': 21260, 'loss/train': 1.4741991758346558} -11/07/2021 00:13:58 - INFO - __main__ - Step 21262: {'lr': 0.00047939437481803984, 'samples': 4082304, 'steps': 21261, 'loss/train': 1.6706597805023193} -11/07/2021 00:13:58 - INFO - __main__ - Step 21263: {'lr': 0.00047939226503323313, 'samples': 4082496, 'steps': 21262, 'loss/train': 2.2536189556121826} -11/07/2021 00:13:59 - INFO - __main__ - Step 21264: {'lr': 0.0004793901551450658, 'samples': 4082688, 'steps': 21263, 'loss/train': 1.888841152191162} -11/07/2021 00:13:59 - INFO - __main__ - Step 21265: {'lr': 0.00047938804515353887, 'samples': 4082880, 'steps': 21264, 'loss/train': 0.34845373034477234} -11/07/2021 00:14:00 - INFO - __main__ - Step 21266: {'lr': 0.00047938593505865315, 'samples': 4083072, 'steps': 21265, 'loss/train': 1.6031692028045654} -11/07/2021 00:14:00 - INFO - __main__ - Step 21267: {'lr': 0.00047938382486040963, 'samples': 4083264, 'steps': 21266, 'loss/train': 0.9460209012031555} -11/07/2021 00:14:01 - INFO - __main__ - Step 21268: {'lr': 0.0004793817145588094, 'samples': 4083456, 'steps': 21267, 'loss/train': 1.3523656129837036} -11/07/2021 00:14:01 - INFO - __main__ - Step 21269: {'lr': 0.0004793796041538533, 'samples': 4083648, 'steps': 21268, 'loss/train': 1.5146702527999878} -11/07/2021 00:14:01 - INFO - __main__ - Step 21270: {'lr': 0.00047937749364554226, 'samples': 4083840, 'steps': 21269, 'loss/train': 0.8026184439659119} -11/07/2021 00:14:02 - INFO - __main__ - Step 21271: {'lr': 0.0004793753830338773, 'samples': 4084032, 'steps': 21270, 'loss/train': 1.6856791973114014} -11/07/2021 00:14:03 - INFO - __main__ - Step 21272: {'lr': 0.00047937327231885925, 'samples': 4084224, 'steps': 21271, 'loss/train': 1.488318920135498} -11/07/2021 00:14:03 - INFO - __main__ - Step 21273: {'lr': 0.0004793711615004892, 'samples': 4084416, 'steps': 21272, 'loss/train': 1.5594409704208374} -11/07/2021 00:14:03 - INFO - __main__ - Step 21274: {'lr': 0.000479369050578768, 'samples': 4084608, 'steps': 21273, 'loss/train': 0.9363613128662109} -11/07/2021 00:14:04 - INFO - __main__ - Step 21275: {'lr': 0.0004793669395536967, 'samples': 4084800, 'steps': 21274, 'loss/train': 1.5633370876312256} -11/07/2021 00:14:04 - INFO - __main__ - Step 21276: {'lr': 0.00047936482842527616, 'samples': 4084992, 'steps': 21275, 'loss/train': 1.7852537631988525} -11/07/2021 00:14:05 - INFO - __main__ - Step 21277: {'lr': 0.00047936271719350743, 'samples': 4085184, 'steps': 21276, 'loss/train': 1.7984212636947632} -11/07/2021 00:14:05 - INFO - __main__ - Step 21278: {'lr': 0.0004793606058583913, 'samples': 4085376, 'steps': 21277, 'loss/train': 1.8766491413116455} -11/07/2021 00:14:06 - INFO - __main__ - Step 21279: {'lr': 0.00047935849441992887, 'samples': 4085568, 'steps': 21278, 'loss/train': 1.998377799987793} -11/07/2021 00:14:06 - INFO - __main__ - Step 21280: {'lr': 0.00047935638287812104, 'samples': 4085760, 'steps': 21279, 'loss/train': 1.6133617162704468} -11/07/2021 00:14:07 - INFO - __main__ - Step 21281: {'lr': 0.00047935427123296884, 'samples': 4085952, 'steps': 21280, 'loss/train': 1.5871071815490723} -11/07/2021 00:14:08 - INFO - __main__ - Step 21282: {'lr': 0.000479352159484473, 'samples': 4086144, 'steps': 21281, 'loss/train': 1.3508565425872803} -11/07/2021 00:14:08 - INFO - __main__ - Step 21283: {'lr': 0.0004793500476326347, 'samples': 4086336, 'steps': 21282, 'loss/train': 1.6303493976593018} -11/07/2021 00:14:08 - INFO - __main__ - Step 21284: {'lr': 0.0004793479356774548, 'samples': 4086528, 'steps': 21283, 'loss/train': 1.6954418420791626} -11/07/2021 00:14:09 - INFO - __main__ - Step 21285: {'lr': 0.00047934582361893423, 'samples': 4086720, 'steps': 21284, 'loss/train': 1.3281868696212769} -11/07/2021 00:14:09 - INFO - __main__ - Step 21286: {'lr': 0.000479343711457074, 'samples': 4086912, 'steps': 21285, 'loss/train': 1.7398327589035034} -11/07/2021 00:14:10 - INFO - __main__ - Step 21287: {'lr': 0.00047934159919187504, 'samples': 4087104, 'steps': 21286, 'loss/train': 1.656062126159668} -11/07/2021 00:14:10 - INFO - __main__ - Step 21288: {'lr': 0.0004793394868233383, 'samples': 4087296, 'steps': 21287, 'loss/train': 1.9397815465927124} -11/07/2021 00:14:11 - INFO - __main__ - Step 21289: {'lr': 0.0004793373743514647, 'samples': 4087488, 'steps': 21288, 'loss/train': 1.4470610618591309} -11/07/2021 00:14:11 - INFO - __main__ - Step 21290: {'lr': 0.0004793352617762552, 'samples': 4087680, 'steps': 21289, 'loss/train': 1.4866148233413696} -11/07/2021 00:14:11 - INFO - __main__ - Step 21291: {'lr': 0.0004793331490977108, 'samples': 4087872, 'steps': 21290, 'loss/train': 1.5853736400604248} -11/07/2021 00:14:12 - INFO - __main__ - Step 21292: {'lr': 0.0004793310363158324, 'samples': 4088064, 'steps': 21291, 'loss/train': 1.5216046571731567} -11/07/2021 00:14:13 - INFO - __main__ - Step 21293: {'lr': 0.00047932892343062103, 'samples': 4088256, 'steps': 21292, 'loss/train': 1.7325321435928345} -11/07/2021 00:14:13 - INFO - __main__ - Step 21294: {'lr': 0.00047932681044207757, 'samples': 4088448, 'steps': 21293, 'loss/train': 1.4280503988265991} -11/07/2021 00:14:13 - INFO - __main__ - Step 21295: {'lr': 0.0004793246973502029, 'samples': 4088640, 'steps': 21294, 'loss/train': 1.394337773323059} -11/07/2021 00:14:14 - INFO - __main__ - Step 21296: {'lr': 0.0004793225841549982, 'samples': 4088832, 'steps': 21295, 'loss/train': 1.7424063682556152} -11/07/2021 00:14:15 - INFO - __main__ - Step 21297: {'lr': 0.00047932047085646416, 'samples': 4089024, 'steps': 21296, 'loss/train': 1.4018278121948242} -11/07/2021 00:14:15 - INFO - __main__ - Step 21298: {'lr': 0.0004793183574546019, 'samples': 4089216, 'steps': 21297, 'loss/train': 1.655775547027588} -11/07/2021 00:14:16 - INFO - __main__ - Step 21299: {'lr': 0.0004793162439494123, 'samples': 4089408, 'steps': 21298, 'loss/train': 1.1595053672790527} -11/07/2021 00:14:16 - INFO - __main__ - Step 21300: {'lr': 0.00047931413034089644, 'samples': 4089600, 'steps': 21299, 'loss/train': 0.8736221194267273} -11/07/2021 00:14:16 - INFO - __main__ - Step 21301: {'lr': 0.00047931201662905503, 'samples': 4089792, 'steps': 21300, 'loss/train': 1.8875302076339722} -11/07/2021 00:14:17 - INFO - __main__ - Step 21302: {'lr': 0.00047930990281388927, 'samples': 4089984, 'steps': 21301, 'loss/train': 1.8271974325180054} -11/07/2021 00:14:18 - INFO - __main__ - Step 21303: {'lr': 0.00047930778889539996, 'samples': 4090176, 'steps': 21302, 'loss/train': 1.5348069667816162} -11/07/2021 00:14:18 - INFO - __main__ - Step 21304: {'lr': 0.00047930567487358813, 'samples': 4090368, 'steps': 21303, 'loss/train': 0.8241930603981018} -11/07/2021 00:14:18 - INFO - __main__ - Step 21305: {'lr': 0.00047930356074845466, 'samples': 4090560, 'steps': 21304, 'loss/train': 1.793365240097046} -11/07/2021 00:14:19 - INFO - __main__ - Step 21306: {'lr': 0.0004793014465200005, 'samples': 4090752, 'steps': 21305, 'loss/train': 1.727817177772522} -11/07/2021 00:14:19 - INFO - __main__ - Step 21307: {'lr': 0.0004792993321882267, 'samples': 4090944, 'steps': 21306, 'loss/train': 1.5948116779327393} -11/07/2021 00:14:20 - INFO - __main__ - Step 21308: {'lr': 0.0004792972177531342, 'samples': 4091136, 'steps': 21307, 'loss/train': 1.57756507396698} -11/07/2021 00:14:20 - INFO - __main__ - Step 21309: {'lr': 0.0004792951032147239, 'samples': 4091328, 'steps': 21308, 'loss/train': 1.8153151273727417} -11/07/2021 00:14:21 - INFO - __main__ - Step 21310: {'lr': 0.00047929298857299677, 'samples': 4091520, 'steps': 21309, 'loss/train': 1.4541163444519043} -11/07/2021 00:14:21 - INFO - __main__ - Step 21311: {'lr': 0.00047929087382795374, 'samples': 4091712, 'steps': 21310, 'loss/train': 1.1384114027023315} -11/07/2021 00:14:21 - INFO - __main__ - Step 21312: {'lr': 0.0004792887589795957, 'samples': 4091904, 'steps': 21311, 'loss/train': 1.6404975652694702} -11/07/2021 00:14:23 - INFO - __main__ - Step 21313: {'lr': 0.00047928664402792376, 'samples': 4092096, 'steps': 21312, 'loss/train': 1.0429054498672485} -11/07/2021 00:14:23 - INFO - __main__ - Step 21314: {'lr': 0.0004792845289729388, 'samples': 4092288, 'steps': 21313, 'loss/train': 1.4683235883712769} -11/07/2021 00:14:23 - INFO - __main__ - Step 21315: {'lr': 0.00047928241381464177, 'samples': 4092480, 'steps': 21314, 'loss/train': 2.05292010307312} -11/07/2021 00:14:24 - INFO - __main__ - Step 21316: {'lr': 0.0004792802985530337, 'samples': 4092672, 'steps': 21315, 'loss/train': 1.7252967357635498} -11/07/2021 00:14:24 - INFO - __main__ - Step 21317: {'lr': 0.0004792781831881153, 'samples': 4092864, 'steps': 21316, 'loss/train': 1.5299564599990845} -11/07/2021 00:14:25 - INFO - __main__ - Step 21318: {'lr': 0.0004792760677198878, 'samples': 4093056, 'steps': 21317, 'loss/train': 0.8147514462471008} -11/07/2021 00:14:25 - INFO - __main__ - Step 21319: {'lr': 0.00047927395214835203, 'samples': 4093248, 'steps': 21318, 'loss/train': 1.686421275138855} -11/07/2021 00:14:26 - INFO - __main__ - Step 21320: {'lr': 0.0004792718364735089, 'samples': 4093440, 'steps': 21319, 'loss/train': 1.8813480138778687} -11/07/2021 00:14:26 - INFO - __main__ - Step 21321: {'lr': 0.00047926972069535945, 'samples': 4093632, 'steps': 21320, 'loss/train': 1.4405698776245117} -11/07/2021 00:14:26 - INFO - __main__ - Step 21322: {'lr': 0.00047926760481390465, 'samples': 4093824, 'steps': 21321, 'loss/train': 1.2762727737426758} -11/07/2021 00:14:28 - INFO - __main__ - Step 21323: {'lr': 0.00047926548882914533, 'samples': 4094016, 'steps': 21322, 'loss/train': 2.274826765060425} -11/07/2021 00:14:28 - INFO - __main__ - Step 21324: {'lr': 0.0004792633727410826, 'samples': 4094208, 'steps': 21323, 'loss/train': 1.5988800525665283} -11/07/2021 00:14:28 - INFO - __main__ - Step 21325: {'lr': 0.0004792612565497172, 'samples': 4094400, 'steps': 21324, 'loss/train': 1.2898582220077515} -11/07/2021 00:14:29 - INFO - __main__ - Step 21326: {'lr': 0.00047925914025505036, 'samples': 4094592, 'steps': 21325, 'loss/train': 1.2253859043121338} -11/07/2021 00:14:29 - INFO - __main__ - Step 21327: {'lr': 0.0004792570238570828, 'samples': 4094784, 'steps': 21326, 'loss/train': 1.2003458738327026} -11/07/2021 00:14:30 - INFO - __main__ - Step 21328: {'lr': 0.00047925490735581557, 'samples': 4094976, 'steps': 21327, 'loss/train': 1.1544514894485474} -11/07/2021 00:14:30 - INFO - __main__ - Step 21329: {'lr': 0.00047925279075124963, 'samples': 4095168, 'steps': 21328, 'loss/train': 1.454081654548645} -11/07/2021 00:14:31 - INFO - __main__ - Step 21330: {'lr': 0.00047925067404338596, 'samples': 4095360, 'steps': 21329, 'loss/train': 1.619686484336853} -11/07/2021 00:14:31 - INFO - __main__ - Step 21331: {'lr': 0.00047924855723222536, 'samples': 4095552, 'steps': 21330, 'loss/train': 1.378673791885376} -11/07/2021 00:14:31 - INFO - __main__ - Step 21332: {'lr': 0.000479246440317769, 'samples': 4095744, 'steps': 21331, 'loss/train': 1.2609995603561401} -11/07/2021 00:14:32 - INFO - __main__ - Step 21333: {'lr': 0.00047924432330001776, 'samples': 4095936, 'steps': 21332, 'loss/train': 1.5046299695968628} -11/07/2021 00:14:33 - INFO - __main__ - Step 21334: {'lr': 0.0004792422061789725, 'samples': 4096128, 'steps': 21333, 'loss/train': 1.7911027669906616} -11/07/2021 00:14:33 - INFO - __main__ - Step 21335: {'lr': 0.0004792400889546342, 'samples': 4096320, 'steps': 21334, 'loss/train': 1.649451494216919} -11/07/2021 00:14:33 - INFO - __main__ - Step 21336: {'lr': 0.00047923797162700393, 'samples': 4096512, 'steps': 21335, 'loss/train': 1.574715495109558} -11/07/2021 00:14:34 - INFO - __main__ - Step 21337: {'lr': 0.0004792358541960826, 'samples': 4096704, 'steps': 21336, 'loss/train': 2.1345772743225098} -11/07/2021 00:14:34 - INFO - __main__ - Step 21338: {'lr': 0.000479233736661871, 'samples': 4096896, 'steps': 21337, 'loss/train': 1.7612472772598267} -11/07/2021 00:14:36 - INFO - __main__ - Step 21339: {'lr': 0.0004792316190243703, 'samples': 4097088, 'steps': 21338, 'loss/train': 1.8308136463165283} -11/07/2021 00:14:36 - INFO - __main__ - Step 21340: {'lr': 0.0004792295012835814, 'samples': 4097280, 'steps': 21339, 'loss/train': 1.3093798160552979} -11/07/2021 00:14:36 - INFO - __main__ - Step 21341: {'lr': 0.0004792273834395052, 'samples': 4097472, 'steps': 21340, 'loss/train': 1.1870094537734985} -11/07/2021 00:14:37 - INFO - __main__ - Step 21342: {'lr': 0.0004792252654921426, 'samples': 4097664, 'steps': 21341, 'loss/train': 0.9535714983940125} -11/07/2021 00:14:37 - INFO - __main__ - Step 21343: {'lr': 0.00047922314744149475, 'samples': 4097856, 'steps': 21342, 'loss/train': 0.45689645409584045} -11/07/2021 00:14:38 - INFO - __main__ - Step 21344: {'lr': 0.0004792210292875624, 'samples': 4098048, 'steps': 21343, 'loss/train': 1.4933922290802002} -11/07/2021 00:14:38 - INFO - __main__ - Step 21345: {'lr': 0.00047921891103034665, 'samples': 4098240, 'steps': 21344, 'loss/train': 1.3660441637039185} -11/07/2021 00:14:39 - INFO - __main__ - Step 21346: {'lr': 0.0004792167926698483, 'samples': 4098432, 'steps': 21345, 'loss/train': 1.77027428150177} -11/07/2021 00:14:39 - INFO - __main__ - Step 21347: {'lr': 0.0004792146742060685, 'samples': 4098624, 'steps': 21346, 'loss/train': 1.3939626216888428} -11/07/2021 00:14:39 - INFO - __main__ - Step 21348: {'lr': 0.00047921255563900813, 'samples': 4098816, 'steps': 21347, 'loss/train': 1.9357357025146484} -11/07/2021 00:14:40 - INFO - __main__ - Step 21349: {'lr': 0.000479210436968668, 'samples': 4099008, 'steps': 21348, 'loss/train': 0.2855474650859833} -11/07/2021 00:14:41 - INFO - __main__ - Step 21350: {'lr': 0.0004792083181950493, 'samples': 4099200, 'steps': 21349, 'loss/train': 1.2464492321014404} -11/07/2021 00:14:41 - INFO - __main__ - Step 21351: {'lr': 0.0004792061993181528, 'samples': 4099392, 'steps': 21350, 'loss/train': 1.0355896949768066} -11/07/2021 00:14:41 - INFO - __main__ - Step 21352: {'lr': 0.00047920408033797954, 'samples': 4099584, 'steps': 21351, 'loss/train': 1.2491384744644165} -11/07/2021 00:14:42 - INFO - __main__ - Step 21353: {'lr': 0.0004792019612545304, 'samples': 4099776, 'steps': 21352, 'loss/train': 1.8609702587127686} -11/07/2021 00:14:43 - INFO - __main__ - Step 21354: {'lr': 0.00047919984206780647, 'samples': 4099968, 'steps': 21353, 'loss/train': 1.1716221570968628} -11/07/2021 00:14:43 - INFO - __main__ - Step 21355: {'lr': 0.0004791977227778086, 'samples': 4100160, 'steps': 21354, 'loss/train': 1.2437918186187744} -11/07/2021 00:14:44 - INFO - __main__ - Step 21356: {'lr': 0.00047919560338453783, 'samples': 4100352, 'steps': 21355, 'loss/train': 1.356000304222107} -11/07/2021 00:14:44 - INFO - __main__ - Step 21357: {'lr': 0.000479193483887995, 'samples': 4100544, 'steps': 21356, 'loss/train': 1.198959469795227} -11/07/2021 00:14:44 - INFO - __main__ - Step 21358: {'lr': 0.0004791913642881811, 'samples': 4100736, 'steps': 21357, 'loss/train': 1.6075674295425415} -11/07/2021 00:14:45 - INFO - __main__ - Step 21359: {'lr': 0.00047918924458509717, 'samples': 4100928, 'steps': 21358, 'loss/train': 1.3278419971466064} -11/07/2021 00:14:46 - INFO - __main__ - Step 21360: {'lr': 0.00047918712477874404, 'samples': 4101120, 'steps': 21359, 'loss/train': 1.41783607006073} -11/07/2021 00:14:46 - INFO - __main__ - Step 21361: {'lr': 0.00047918500486912276, 'samples': 4101312, 'steps': 21360, 'loss/train': 1.095545768737793} -11/07/2021 00:14:46 - INFO - __main__ - Step 21362: {'lr': 0.00047918288485623427, 'samples': 4101504, 'steps': 21361, 'loss/train': 1.4473345279693604} -11/07/2021 00:14:47 - INFO - __main__ - Step 21363: {'lr': 0.0004791807647400795, 'samples': 4101696, 'steps': 21362, 'loss/train': 1.668547511100769} -11/07/2021 00:14:48 - INFO - __main__ - Step 21364: {'lr': 0.0004791786445206594, 'samples': 4101888, 'steps': 21363, 'loss/train': 1.4369771480560303} -11/07/2021 00:14:48 - INFO - __main__ - Step 21365: {'lr': 0.00047917652419797495, 'samples': 4102080, 'steps': 21364, 'loss/train': 1.4824670553207397} -11/07/2021 00:14:48 - INFO - __main__ - Step 21366: {'lr': 0.0004791744037720271, 'samples': 4102272, 'steps': 21365, 'loss/train': 1.810196042060852} -11/07/2021 00:14:49 - INFO - __main__ - Step 21367: {'lr': 0.00047917228324281683, 'samples': 4102464, 'steps': 21366, 'loss/train': 1.1198419332504272} -11/07/2021 00:14:49 - INFO - __main__ - Step 21368: {'lr': 0.00047917016261034496, 'samples': 4102656, 'steps': 21367, 'loss/train': 1.3379572629928589} -11/07/2021 00:14:50 - INFO - __main__ - Step 21369: {'lr': 0.0004791680418746126, 'samples': 4102848, 'steps': 21368, 'loss/train': 1.3369263410568237} -11/07/2021 00:14:51 - INFO - __main__ - Step 21370: {'lr': 0.00047916592103562075, 'samples': 4103040, 'steps': 21369, 'loss/train': 3.3667120933532715} -11/07/2021 00:14:51 - INFO - __main__ - Step 21371: {'lr': 0.00047916380009337014, 'samples': 4103232, 'steps': 21370, 'loss/train': 1.5507954359054565} -11/07/2021 00:14:51 - INFO - __main__ - Step 21372: {'lr': 0.0004791616790478619, 'samples': 4103424, 'steps': 21371, 'loss/train': 0.9956333041191101} -11/07/2021 00:14:52 - INFO - __main__ - Step 21373: {'lr': 0.000479159557899097, 'samples': 4103616, 'steps': 21372, 'loss/train': 1.4630414247512817} -11/07/2021 00:14:52 - INFO - __main__ - Step 21374: {'lr': 0.00047915743664707626, 'samples': 4103808, 'steps': 21373, 'loss/train': 0.219575896859169} -11/07/2021 00:14:53 - INFO - __main__ - Step 21375: {'lr': 0.0004791553152918008, 'samples': 4104000, 'steps': 21374, 'loss/train': 1.7526909112930298} -11/07/2021 00:14:53 - INFO - __main__ - Step 21376: {'lr': 0.0004791531938332714, 'samples': 4104192, 'steps': 21375, 'loss/train': 1.4546867609024048} -11/07/2021 00:14:54 - INFO - __main__ - Step 21377: {'lr': 0.0004791510722714891, 'samples': 4104384, 'steps': 21376, 'loss/train': 1.7402167320251465} -11/07/2021 00:14:54 - INFO - __main__ - Step 21378: {'lr': 0.000479148950606455, 'samples': 4104576, 'steps': 21377, 'loss/train': 1.7246084213256836} -11/07/2021 00:14:54 - INFO - __main__ - Step 21379: {'lr': 0.00047914682883816977, 'samples': 4104768, 'steps': 21378, 'loss/train': 1.3976600170135498} -11/07/2021 00:14:55 - INFO - __main__ - Step 21380: {'lr': 0.00047914470696663457, 'samples': 4104960, 'steps': 21379, 'loss/train': 0.43213319778442383} -11/07/2021 00:14:56 - INFO - __main__ - Step 21381: {'lr': 0.00047914258499185037, 'samples': 4105152, 'steps': 21380, 'loss/train': 1.7519570589065552} -11/07/2021 00:14:56 - INFO - __main__ - Step 21382: {'lr': 0.000479140462913818, 'samples': 4105344, 'steps': 21381, 'loss/train': 1.511462926864624} -11/07/2021 00:14:57 - INFO - __main__ - Step 21383: {'lr': 0.0004791383407325384, 'samples': 4105536, 'steps': 21382, 'loss/train': 1.6584688425064087} -11/07/2021 00:14:57 - INFO - __main__ - Step 21384: {'lr': 0.0004791362184480127, 'samples': 4105728, 'steps': 21383, 'loss/train': 1.2212923765182495} -11/07/2021 00:14:58 - INFO - __main__ - Step 21385: {'lr': 0.0004791340960602417, 'samples': 4105920, 'steps': 21384, 'loss/train': 1.8661881685256958} -11/07/2021 00:14:58 - INFO - __main__ - Step 21386: {'lr': 0.0004791319735692264, 'samples': 4106112, 'steps': 21385, 'loss/train': 1.2798576354980469} -11/07/2021 00:14:59 - INFO - __main__ - Step 21387: {'lr': 0.00047912985097496786, 'samples': 4106304, 'steps': 21386, 'loss/train': 1.0371434688568115} -11/07/2021 00:14:59 - INFO - __main__ - Step 21388: {'lr': 0.00047912772827746685, 'samples': 4106496, 'steps': 21387, 'loss/train': 1.1820610761642456} -11/07/2021 00:14:59 - INFO - __main__ - Step 21389: {'lr': 0.00047912560547672453, 'samples': 4106688, 'steps': 21388, 'loss/train': 1.3891115188598633} -11/07/2021 00:15:00 - INFO - __main__ - Step 21390: {'lr': 0.0004791234825727416, 'samples': 4106880, 'steps': 21389, 'loss/train': 1.801900863647461} -11/07/2021 00:15:01 - INFO - __main__ - Step 21391: {'lr': 0.0004791213595655193, 'samples': 4107072, 'steps': 21390, 'loss/train': 1.3491114377975464} -11/07/2021 00:15:01 - INFO - __main__ - Step 21392: {'lr': 0.0004791192364550584, 'samples': 4107264, 'steps': 21391, 'loss/train': 0.3875841498374939} -11/07/2021 00:15:01 - INFO - __main__ - Step 21393: {'lr': 0.00047911711324135985, 'samples': 4107456, 'steps': 21392, 'loss/train': 0.8895827531814575} -11/07/2021 00:15:02 - INFO - __main__ - Step 21394: {'lr': 0.00047911498992442476, 'samples': 4107648, 'steps': 21393, 'loss/train': 1.6767473220825195} -11/07/2021 00:15:02 - INFO - __main__ - Step 21395: {'lr': 0.0004791128665042539, 'samples': 4107840, 'steps': 21394, 'loss/train': 1.5300005674362183} -11/07/2021 00:15:03 - INFO - __main__ - Step 21396: {'lr': 0.0004791107429808484, 'samples': 4108032, 'steps': 21395, 'loss/train': 1.3103961944580078} -11/07/2021 00:15:03 - INFO - __main__ - Step 21397: {'lr': 0.00047910861935420915, 'samples': 4108224, 'steps': 21396, 'loss/train': 1.617367148399353} -11/07/2021 00:15:04 - INFO - __main__ - Step 21398: {'lr': 0.00047910649562433696, 'samples': 4108416, 'steps': 21397, 'loss/train': 1.543279767036438} -11/07/2021 00:15:04 - INFO - __main__ - Step 21399: {'lr': 0.000479104371791233, 'samples': 4108608, 'steps': 21398, 'loss/train': 1.3778434991836548} -11/07/2021 00:15:04 - INFO - __main__ - Step 21400: {'lr': 0.0004791022478548982, 'samples': 4108800, 'steps': 21399, 'loss/train': 1.259809136390686} -11/07/2021 00:15:06 - INFO - __main__ - Step 21401: {'lr': 0.0004791001238153334, 'samples': 4108992, 'steps': 21400, 'loss/train': 1.7310465574264526} -11/07/2021 00:15:06 - INFO - __main__ - Step 21402: {'lr': 0.00047909799967253957, 'samples': 4109184, 'steps': 21401, 'loss/train': 1.3898957967758179} -11/07/2021 00:15:06 - INFO - __main__ - Step 21403: {'lr': 0.00047909587542651776, 'samples': 4109376, 'steps': 21402, 'loss/train': 2.3288679122924805} -11/07/2021 00:15:07 - INFO - __main__ - Step 21404: {'lr': 0.00047909375107726894, 'samples': 4109568, 'steps': 21403, 'loss/train': 1.4478750228881836} -11/07/2021 00:15:07 - INFO - __main__ - Step 21405: {'lr': 0.000479091626624794, 'samples': 4109760, 'steps': 21404, 'loss/train': 1.4665449857711792} -11/07/2021 00:15:08 - INFO - __main__ - Step 21406: {'lr': 0.00047908950206909385, 'samples': 4109952, 'steps': 21405, 'loss/train': 2.423110008239746} -11/07/2021 00:15:08 - INFO - __main__ - Step 21407: {'lr': 0.0004790873774101695, 'samples': 4110144, 'steps': 21406, 'loss/train': 1.829443097114563} -11/07/2021 00:15:09 - INFO - __main__ - Step 21408: {'lr': 0.00047908525264802194, 'samples': 4110336, 'steps': 21407, 'loss/train': 1.2481427192687988} -11/07/2021 00:15:09 - INFO - __main__ - Step 21409: {'lr': 0.00047908312778265213, 'samples': 4110528, 'steps': 21408, 'loss/train': 1.5026124715805054} -11/07/2021 00:15:09 - INFO - __main__ - Step 21410: {'lr': 0.00047908100281406096, 'samples': 4110720, 'steps': 21409, 'loss/train': 1.617781162261963} -11/07/2021 00:15:10 - INFO - __main__ - Step 21411: {'lr': 0.00047907887774224946, 'samples': 4110912, 'steps': 21410, 'loss/train': 1.7944114208221436} -11/07/2021 00:15:11 - INFO - __main__ - Step 21412: {'lr': 0.0004790767525672185, 'samples': 4111104, 'steps': 21411, 'loss/train': 1.4158649444580078} -11/07/2021 00:15:11 - INFO - __main__ - Step 21413: {'lr': 0.0004790746272889691, 'samples': 4111296, 'steps': 21412, 'loss/train': 1.090224027633667} -11/07/2021 00:15:11 - INFO - __main__ - Step 21414: {'lr': 0.00047907250190750225, 'samples': 4111488, 'steps': 21413, 'loss/train': 1.7329736948013306} -11/07/2021 00:15:12 - INFO - __main__ - Step 21415: {'lr': 0.0004790703764228188, 'samples': 4111680, 'steps': 21414, 'loss/train': 1.5330586433410645} -11/07/2021 00:15:13 - INFO - __main__ - Step 21416: {'lr': 0.0004790682508349198, 'samples': 4111872, 'steps': 21415, 'loss/train': 1.7020710706710815} -11/07/2021 00:15:13 - INFO - __main__ - Step 21417: {'lr': 0.00047906612514380623, 'samples': 4112064, 'steps': 21416, 'loss/train': 2.212350368499756} -11/07/2021 00:15:14 - INFO - __main__ - Step 21418: {'lr': 0.000479063999349479, 'samples': 4112256, 'steps': 21417, 'loss/train': 0.7235398292541504} -11/07/2021 00:15:14 - INFO - __main__ - Step 21419: {'lr': 0.00047906187345193895, 'samples': 4112448, 'steps': 21418, 'loss/train': 1.5190248489379883} -11/07/2021 00:15:14 - INFO - __main__ - Step 21420: {'lr': 0.0004790597474511873, 'samples': 4112640, 'steps': 21419, 'loss/train': 1.4230188131332397} -11/07/2021 00:15:15 - INFO - __main__ - Step 21421: {'lr': 0.0004790576213472248, 'samples': 4112832, 'steps': 21420, 'loss/train': 1.2656906843185425} -11/07/2021 00:15:16 - INFO - __main__ - Step 21422: {'lr': 0.0004790554951400524, 'samples': 4113024, 'steps': 21421, 'loss/train': 1.5593222379684448} -11/07/2021 00:15:16 - INFO - __main__ - Step 21423: {'lr': 0.0004790533688296712, 'samples': 4113216, 'steps': 21422, 'loss/train': 1.5328755378723145} -11/07/2021 00:15:16 - INFO - __main__ - Step 21424: {'lr': 0.0004790512424160821, 'samples': 4113408, 'steps': 21423, 'loss/train': 1.8626660108566284} -11/07/2021 00:15:17 - INFO - __main__ - Step 21425: {'lr': 0.00047904911589928605, 'samples': 4113600, 'steps': 21424, 'loss/train': 1.336646556854248} -11/07/2021 00:15:17 - INFO - __main__ - Step 21426: {'lr': 0.00047904698927928404, 'samples': 4113792, 'steps': 21425, 'loss/train': 1.711372971534729} -11/07/2021 00:15:18 - INFO - __main__ - Step 21427: {'lr': 0.0004790448625560769, 'samples': 4113984, 'steps': 21426, 'loss/train': 1.2243375778198242} -11/07/2021 00:15:18 - INFO - __main__ - Step 21428: {'lr': 0.0004790427357296657, 'samples': 4114176, 'steps': 21427, 'loss/train': 1.5050300359725952} -11/07/2021 00:15:19 - INFO - __main__ - Step 21429: {'lr': 0.0004790406088000514, 'samples': 4114368, 'steps': 21428, 'loss/train': 1.5563852787017822} -11/07/2021 00:15:19 - INFO - __main__ - Step 21430: {'lr': 0.00047903848176723493, 'samples': 4114560, 'steps': 21429, 'loss/train': 1.2160688638687134} -11/07/2021 00:15:19 - INFO - __main__ - Step 21431: {'lr': 0.0004790363546312172, 'samples': 4114752, 'steps': 21430, 'loss/train': 1.644734263420105} -11/07/2021 00:15:20 - INFO - __main__ - Step 21432: {'lr': 0.0004790342273919993, 'samples': 4114944, 'steps': 21431, 'loss/train': 1.6484546661376953} -11/07/2021 00:15:21 - INFO - __main__ - Step 21433: {'lr': 0.00047903210004958207, 'samples': 4115136, 'steps': 21432, 'loss/train': 1.6944466829299927} -11/07/2021 00:15:21 - INFO - __main__ - Step 21434: {'lr': 0.0004790299726039665, 'samples': 4115328, 'steps': 21433, 'loss/train': 1.1725130081176758} -11/07/2021 00:15:22 - INFO - __main__ - Step 21435: {'lr': 0.0004790278450551536, 'samples': 4115520, 'steps': 21434, 'loss/train': 1.5247802734375} -11/07/2021 00:15:22 - INFO - __main__ - Step 21436: {'lr': 0.00047902571740314427, 'samples': 4115712, 'steps': 21435, 'loss/train': 1.878816843032837} -11/07/2021 00:15:23 - INFO - __main__ - Step 21437: {'lr': 0.00047902358964793944, 'samples': 4115904, 'steps': 21436, 'loss/train': 1.6808935403823853} -11/07/2021 00:15:23 - INFO - __main__ - Step 21438: {'lr': 0.0004790214617895402, 'samples': 4116096, 'steps': 21437, 'loss/train': 1.717866063117981} -11/07/2021 00:15:24 - INFO - __main__ - Step 21439: {'lr': 0.0004790193338279474, 'samples': 4116288, 'steps': 21438, 'loss/train': 1.757002353668213} -11/07/2021 00:15:24 - INFO - __main__ - Step 21440: {'lr': 0.000479017205763162, 'samples': 4116480, 'steps': 21439, 'loss/train': 1.3909929990768433} -11/07/2021 00:15:25 - INFO - __main__ - Step 21441: {'lr': 0.000479015077595185, 'samples': 4116672, 'steps': 21440, 'loss/train': 1.5615991353988647} -11/07/2021 00:15:25 - INFO - __main__ - Step 21442: {'lr': 0.0004790129493240173, 'samples': 4116864, 'steps': 21441, 'loss/train': 0.7827515006065369} -11/07/2021 00:15:26 - INFO - __main__ - Step 21443: {'lr': 0.0004790108209496599, 'samples': 4117056, 'steps': 21442, 'loss/train': 1.5710242986679077} -11/07/2021 00:15:26 - INFO - __main__ - Step 21444: {'lr': 0.00047900869247211384, 'samples': 4117248, 'steps': 21443, 'loss/train': 1.5302128791809082} -11/07/2021 00:15:27 - INFO - __main__ - Step 21445: {'lr': 0.0004790065638913799, 'samples': 4117440, 'steps': 21444, 'loss/train': 1.9915907382965088} -11/07/2021 00:15:27 - INFO - __main__ - Step 21446: {'lr': 0.00047900443520745915, 'samples': 4117632, 'steps': 21445, 'loss/train': 1.787115216255188} -11/07/2021 00:15:27 - INFO - __main__ - Step 21447: {'lr': 0.0004790023064203526, 'samples': 4117824, 'steps': 21446, 'loss/train': 1.482800006866455} -11/07/2021 00:15:28 - INFO - __main__ - Step 21448: {'lr': 0.00047900017753006106, 'samples': 4118016, 'steps': 21447, 'loss/train': 1.878015398979187} -11/07/2021 00:15:29 - INFO - __main__ - Step 21449: {'lr': 0.0004789980485365857, 'samples': 4118208, 'steps': 21448, 'loss/train': 1.9219799041748047} -11/07/2021 00:15:29 - INFO - __main__ - Step 21450: {'lr': 0.00047899591943992726, 'samples': 4118400, 'steps': 21449, 'loss/train': 1.6092162132263184} -11/07/2021 00:15:29 - INFO - __main__ - Step 21451: {'lr': 0.0004789937902400868, 'samples': 4118592, 'steps': 21450, 'loss/train': 2.2746288776397705} -11/07/2021 00:15:30 - INFO - __main__ - Step 21452: {'lr': 0.00047899166093706523, 'samples': 4118784, 'steps': 21451, 'loss/train': 1.3884146213531494} -11/07/2021 00:15:31 - INFO - __main__ - Step 21453: {'lr': 0.0004789895315308636, 'samples': 4118976, 'steps': 21452, 'loss/train': 1.2079041004180908} -11/07/2021 00:15:31 - INFO - __main__ - Step 21454: {'lr': 0.00047898740202148284, 'samples': 4119168, 'steps': 21453, 'loss/train': 0.21061697602272034} -11/07/2021 00:15:31 - INFO - __main__ - Step 21455: {'lr': 0.0004789852724089239, 'samples': 4119360, 'steps': 21454, 'loss/train': 1.5838730335235596} -11/07/2021 00:15:32 - INFO - __main__ - Step 21456: {'lr': 0.00047898314269318766, 'samples': 4119552, 'steps': 21455, 'loss/train': 1.8635731935501099} -11/07/2021 00:15:32 - INFO - __main__ - Step 21457: {'lr': 0.00047898101287427523, 'samples': 4119744, 'steps': 21456, 'loss/train': 1.6409664154052734} -11/07/2021 00:15:33 - INFO - __main__ - Step 21458: {'lr': 0.0004789788829521874, 'samples': 4119936, 'steps': 21457, 'loss/train': 1.7607507705688477} -11/07/2021 00:15:34 - INFO - __main__ - Step 21459: {'lr': 0.0004789767529269253, 'samples': 4120128, 'steps': 21458, 'loss/train': 0.8947522640228271} -11/07/2021 00:15:34 - INFO - __main__ - Step 21460: {'lr': 0.0004789746227984897, 'samples': 4120320, 'steps': 21459, 'loss/train': 1.4214286804199219} -11/07/2021 00:15:34 - INFO - __main__ - Step 21461: {'lr': 0.0004789724925668818, 'samples': 4120512, 'steps': 21460, 'loss/train': 1.5798488855361938} -11/07/2021 00:15:35 - INFO - __main__ - Step 21462: {'lr': 0.00047897036223210234, 'samples': 4120704, 'steps': 21461, 'loss/train': 1.2147839069366455} -11/07/2021 00:15:36 - INFO - __main__ - Step 21463: {'lr': 0.00047896823179415237, 'samples': 4120896, 'steps': 21462, 'loss/train': 1.45625638961792} -11/07/2021 00:15:36 - INFO - __main__ - Step 21464: {'lr': 0.0004789661012530329, 'samples': 4121088, 'steps': 21463, 'loss/train': 1.694710612297058} -11/07/2021 00:15:37 - INFO - __main__ - Step 21465: {'lr': 0.00047896397060874485, 'samples': 4121280, 'steps': 21464, 'loss/train': 1.63399076461792} -11/07/2021 00:15:37 - INFO - __main__ - Step 21466: {'lr': 0.0004789618398612891, 'samples': 4121472, 'steps': 21465, 'loss/train': 2.6186089515686035} -11/07/2021 00:15:37 - INFO - __main__ - Step 21467: {'lr': 0.0004789597090106667, 'samples': 4121664, 'steps': 21466, 'loss/train': 1.5475844144821167} -11/07/2021 00:15:38 - INFO - __main__ - Step 21468: {'lr': 0.00047895757805687864, 'samples': 4121856, 'steps': 21467, 'loss/train': 1.74507737159729} -11/07/2021 00:15:39 - INFO - __main__ - Step 21469: {'lr': 0.0004789554469999258, 'samples': 4122048, 'steps': 21468, 'loss/train': 1.5908174514770508} -11/07/2021 00:15:39 - INFO - __main__ - Step 21470: {'lr': 0.0004789533158398091, 'samples': 4122240, 'steps': 21469, 'loss/train': 1.933680772781372} -11/07/2021 00:15:39 - INFO - __main__ - Step 21471: {'lr': 0.00047895118457652965, 'samples': 4122432, 'steps': 21470, 'loss/train': 1.2519850730895996} -11/07/2021 00:15:40 - INFO - __main__ - Step 21472: {'lr': 0.0004789490532100883, 'samples': 4122624, 'steps': 21471, 'loss/train': 3.244593858718872} -11/07/2021 00:15:40 - INFO - __main__ - Step 21473: {'lr': 0.000478946921740486, 'samples': 4122816, 'steps': 21472, 'loss/train': 1.6074554920196533} -11/07/2021 00:15:41 - INFO - __main__ - Step 21474: {'lr': 0.0004789447901677238, 'samples': 4123008, 'steps': 21473, 'loss/train': 0.4565056264400482} -11/07/2021 00:15:41 - INFO - __main__ - Step 21475: {'lr': 0.00047894265849180264, 'samples': 4123200, 'steps': 21474, 'loss/train': 0.8751310110092163} -11/07/2021 00:15:42 - INFO - __main__ - Step 21476: {'lr': 0.00047894052671272337, 'samples': 4123392, 'steps': 21475, 'loss/train': 1.7021253108978271} -11/07/2021 00:15:42 - INFO - __main__ - Step 21477: {'lr': 0.0004789383948304871, 'samples': 4123584, 'steps': 21476, 'loss/train': 1.6824284791946411} -11/07/2021 00:15:42 - INFO - __main__ - Step 21478: {'lr': 0.00047893626284509466, 'samples': 4123776, 'steps': 21477, 'loss/train': 1.7401764392852783} -11/07/2021 00:15:43 - INFO - __main__ - Step 21479: {'lr': 0.0004789341307565471, 'samples': 4123968, 'steps': 21478, 'loss/train': 1.7683900594711304} -11/07/2021 00:15:44 - INFO - __main__ - Step 21480: {'lr': 0.0004789319985648454, 'samples': 4124160, 'steps': 21479, 'loss/train': 1.4364922046661377} -11/07/2021 00:15:44 - INFO - __main__ - Step 21481: {'lr': 0.0004789298662699905, 'samples': 4124352, 'steps': 21480, 'loss/train': 1.1518300771713257} -11/07/2021 00:15:44 - INFO - __main__ - Step 21482: {'lr': 0.0004789277338719832, 'samples': 4124544, 'steps': 21481, 'loss/train': 1.8052656650543213} -11/07/2021 00:15:45 - INFO - __main__ - Step 21483: {'lr': 0.0004789256013708246, 'samples': 4124736, 'steps': 21482, 'loss/train': 1.718207597732544} -11/07/2021 00:15:46 - INFO - __main__ - Step 21484: {'lr': 0.0004789234687665158, 'samples': 4124928, 'steps': 21483, 'loss/train': 1.4353058338165283} -11/07/2021 00:15:46 - INFO - __main__ - Step 21485: {'lr': 0.0004789213360590575, 'samples': 4125120, 'steps': 21484, 'loss/train': 1.7839090824127197} -11/07/2021 00:15:47 - INFO - __main__ - Step 21486: {'lr': 0.00047891920324845085, 'samples': 4125312, 'steps': 21485, 'loss/train': 1.8160103559494019} -11/07/2021 00:15:47 - INFO - __main__ - Step 21487: {'lr': 0.00047891707033469665, 'samples': 4125504, 'steps': 21486, 'loss/train': 1.8308603763580322} -11/07/2021 00:15:47 - INFO - __main__ - Step 21488: {'lr': 0.00047891493731779607, 'samples': 4125696, 'steps': 21487, 'loss/train': 1.8766554594039917} -11/07/2021 00:15:48 - INFO - __main__ - Step 21489: {'lr': 0.00047891280419774985, 'samples': 4125888, 'steps': 21488, 'loss/train': 1.0840020179748535} -11/07/2021 00:15:49 - INFO - __main__ - Step 21490: {'lr': 0.0004789106709745591, 'samples': 4126080, 'steps': 21489, 'loss/train': 1.5869641304016113} -11/07/2021 00:15:49 - INFO - __main__ - Step 21491: {'lr': 0.0004789085376482247, 'samples': 4126272, 'steps': 21490, 'loss/train': 1.71488356590271} -11/07/2021 00:15:49 - INFO - __main__ - Step 21492: {'lr': 0.00047890640421874775, 'samples': 4126464, 'steps': 21491, 'loss/train': 1.5513404607772827} -11/07/2021 00:15:50 - INFO - __main__ - Step 21493: {'lr': 0.000478904270686129, 'samples': 4126656, 'steps': 21492, 'loss/train': 0.9947566390037537} -11/07/2021 00:15:51 - INFO - __main__ - Step 21494: {'lr': 0.00047890213705036955, 'samples': 4126848, 'steps': 21493, 'loss/train': 2.104623794555664} -11/07/2021 00:15:51 - INFO - __main__ - Step 21495: {'lr': 0.00047890000331147033, 'samples': 4127040, 'steps': 21494, 'loss/train': 1.1416540145874023} -11/07/2021 00:15:51 - INFO - __main__ - Step 21496: {'lr': 0.0004788978694694323, 'samples': 4127232, 'steps': 21495, 'loss/train': 1.2822664976119995} -11/07/2021 00:15:52 - INFO - __main__ - Step 21497: {'lr': 0.0004788957355242564, 'samples': 4127424, 'steps': 21496, 'loss/train': 1.5804579257965088} -11/07/2021 00:15:52 - INFO - __main__ - Step 21498: {'lr': 0.00047889360147594363, 'samples': 4127616, 'steps': 21497, 'loss/train': 1.338382363319397} -11/07/2021 00:15:53 - INFO - __main__ - Step 21499: {'lr': 0.00047889146732449497, 'samples': 4127808, 'steps': 21498, 'loss/train': 1.7818214893341064} -11/07/2021 00:15:53 - INFO - __main__ - Step 21500: {'lr': 0.00047888933306991136, 'samples': 4128000, 'steps': 21499, 'loss/train': 2.0857651233673096} -11/07/2021 00:15:54 - INFO - __main__ - Step 21501: {'lr': 0.00047888719871219367, 'samples': 4128192, 'steps': 21500, 'loss/train': 1.147006630897522} -11/07/2021 00:15:54 - INFO - __main__ - Step 21502: {'lr': 0.00047888506425134293, 'samples': 4128384, 'steps': 21501, 'loss/train': 1.8140604496002197} -11/07/2021 00:15:54 - INFO - __main__ - Step 21503: {'lr': 0.0004788829296873601, 'samples': 4128576, 'steps': 21502, 'loss/train': 1.6200863122940063} -11/07/2021 00:15:56 - INFO - __main__ - Step 21504: {'lr': 0.0004788807950202463, 'samples': 4128768, 'steps': 21503, 'loss/train': 1.7840808629989624} -11/07/2021 00:15:56 - INFO - __main__ - Step 21505: {'lr': 0.00047887866025000226, 'samples': 4128960, 'steps': 21504, 'loss/train': 1.6177959442138672} -11/07/2021 00:15:56 - INFO - __main__ - Step 21506: {'lr': 0.000478876525376629, 'samples': 4129152, 'steps': 21505, 'loss/train': 0.20047274231910706} -11/07/2021 00:15:57 - INFO - __main__ - Step 21507: {'lr': 0.00047887439040012755, 'samples': 4129344, 'steps': 21506, 'loss/train': 1.625873327255249} -11/07/2021 00:15:57 - INFO - __main__ - Step 21508: {'lr': 0.0004788722553204988, 'samples': 4129536, 'steps': 21507, 'loss/train': 2.040313720703125} -11/07/2021 00:15:57 - INFO - __main__ - Step 21509: {'lr': 0.0004788701201377438, 'samples': 4129728, 'steps': 21508, 'loss/train': 1.7073478698730469} -11/07/2021 00:15:58 - INFO - __main__ - Step 21510: {'lr': 0.0004788679848518633, 'samples': 4129920, 'steps': 21509, 'loss/train': 2.4196596145629883} -11/07/2021 00:15:59 - INFO - __main__ - Step 21511: {'lr': 0.0004788658494628586, 'samples': 4130112, 'steps': 21510, 'loss/train': 1.1434111595153809} -11/07/2021 00:15:59 - INFO - __main__ - Step 21512: {'lr': 0.0004788637139707304, 'samples': 4130304, 'steps': 21511, 'loss/train': 1.6110708713531494} -11/07/2021 00:15:59 - INFO - __main__ - Step 21513: {'lr': 0.00047886157837547975, 'samples': 4130496, 'steps': 21512, 'loss/train': 1.1308202743530273} -11/07/2021 00:16:00 - INFO - __main__ - Step 21514: {'lr': 0.0004788594426771076, 'samples': 4130688, 'steps': 21513, 'loss/train': 1.610917329788208} -11/07/2021 00:16:01 - INFO - __main__ - Step 21515: {'lr': 0.0004788573068756149, 'samples': 4130880, 'steps': 21514, 'loss/train': 1.7047597169876099} -11/07/2021 00:16:01 - INFO - __main__ - Step 21516: {'lr': 0.0004788551709710027, 'samples': 4131072, 'steps': 21515, 'loss/train': 1.753533124923706} -11/07/2021 00:16:01 - INFO - __main__ - Step 21517: {'lr': 0.0004788530349632718, 'samples': 4131264, 'steps': 21516, 'loss/train': 1.1571195125579834} -11/07/2021 00:16:02 - INFO - __main__ - Step 21518: {'lr': 0.00047885089885242333, 'samples': 4131456, 'steps': 21517, 'loss/train': 1.3207316398620605} -11/07/2021 00:16:02 - INFO - __main__ - Step 21519: {'lr': 0.0004788487626384581, 'samples': 4131648, 'steps': 21518, 'loss/train': 1.6291325092315674} -11/07/2021 00:16:03 - INFO - __main__ - Step 21520: {'lr': 0.0004788466263213772, 'samples': 4131840, 'steps': 21519, 'loss/train': 1.5563868284225464} -11/07/2021 00:16:03 - INFO - __main__ - Step 21521: {'lr': 0.00047884448990118155, 'samples': 4132032, 'steps': 21520, 'loss/train': 1.9897916316986084} -11/07/2021 00:16:04 - INFO - __main__ - Step 21522: {'lr': 0.0004788423533778721, 'samples': 4132224, 'steps': 21521, 'loss/train': 2.186905860900879} -11/07/2021 00:16:04 - INFO - __main__ - Step 21523: {'lr': 0.00047884021675144987, 'samples': 4132416, 'steps': 21522, 'loss/train': 1.3714509010314941} -11/07/2021 00:16:04 - INFO - __main__ - Step 21524: {'lr': 0.0004788380800219156, 'samples': 4132608, 'steps': 21523, 'loss/train': 1.524144172668457} -11/07/2021 00:16:06 - INFO - __main__ - Step 21525: {'lr': 0.0004788359431892706, 'samples': 4132800, 'steps': 21524, 'loss/train': 0.893682062625885} -11/07/2021 00:16:06 - INFO - __main__ - Step 21526: {'lr': 0.00047883380625351557, 'samples': 4132992, 'steps': 21525, 'loss/train': 1.6024296283721924} -11/07/2021 00:16:06 - INFO - __main__ - Step 21527: {'lr': 0.00047883166921465156, 'samples': 4133184, 'steps': 21526, 'loss/train': 1.9296703338623047} -11/07/2021 00:16:07 - INFO - __main__ - Step 21528: {'lr': 0.00047882953207267954, 'samples': 4133376, 'steps': 21527, 'loss/train': 1.8911947011947632} -11/07/2021 00:16:07 - INFO - __main__ - Step 21529: {'lr': 0.00047882739482760044, 'samples': 4133568, 'steps': 21528, 'loss/train': 1.9235213994979858} -11/07/2021 00:16:08 - INFO - __main__ - Step 21530: {'lr': 0.0004788252574794153, 'samples': 4133760, 'steps': 21529, 'loss/train': 1.90152108669281} -11/07/2021 00:16:08 - INFO - __main__ - Step 21531: {'lr': 0.000478823120028125, 'samples': 4133952, 'steps': 21530, 'loss/train': 1.815036654472351} -11/07/2021 00:16:09 - INFO - __main__ - Step 21532: {'lr': 0.0004788209824737305, 'samples': 4134144, 'steps': 21531, 'loss/train': 1.7011241912841797} -11/07/2021 00:16:09 - INFO - __main__ - Step 21533: {'lr': 0.00047881884481623286, 'samples': 4134336, 'steps': 21532, 'loss/train': 1.5776305198669434} -11/07/2021 00:16:10 - INFO - __main__ - Step 21534: {'lr': 0.000478816707055633, 'samples': 4134528, 'steps': 21533, 'loss/train': 1.2953623533248901} -11/07/2021 00:16:11 - INFO - __main__ - Step 21535: {'lr': 0.0004788145691919318, 'samples': 4134720, 'steps': 21534, 'loss/train': 1.5415441989898682} -11/07/2021 00:16:11 - INFO - __main__ - Step 21536: {'lr': 0.0004788124312251303, 'samples': 4134912, 'steps': 21535, 'loss/train': 1.6723524332046509} -11/07/2021 00:16:11 - INFO - __main__ - Step 21537: {'lr': 0.0004788102931552294, 'samples': 4135104, 'steps': 21536, 'loss/train': 2.1559436321258545} -11/07/2021 00:16:12 - INFO - __main__ - Step 21538: {'lr': 0.0004788081549822302, 'samples': 4135296, 'steps': 21537, 'loss/train': 2.0337588787078857} -11/07/2021 00:16:12 - INFO - __main__ - Step 21539: {'lr': 0.0004788060167061335, 'samples': 4135488, 'steps': 21538, 'loss/train': 2.108020782470703} -11/07/2021 00:16:13 - INFO - __main__ - Step 21540: {'lr': 0.0004788038783269404, 'samples': 4135680, 'steps': 21539, 'loss/train': 1.685656189918518} -11/07/2021 00:16:13 - INFO - __main__ - Step 21541: {'lr': 0.00047880173984465174, 'samples': 4135872, 'steps': 21540, 'loss/train': 1.431290626525879} -11/07/2021 00:16:14 - INFO - __main__ - Step 21542: {'lr': 0.0004787996012592686, 'samples': 4136064, 'steps': 21541, 'loss/train': 1.244078278541565} -11/07/2021 00:16:14 - INFO - __main__ - Step 21543: {'lr': 0.0004787974625707919, 'samples': 4136256, 'steps': 21542, 'loss/train': 1.6926815509796143} -11/07/2021 00:16:14 - INFO - __main__ - Step 21544: {'lr': 0.0004787953237792225, 'samples': 4136448, 'steps': 21543, 'loss/train': 1.9875998497009277} -11/07/2021 00:16:15 - INFO - __main__ - Step 21545: {'lr': 0.0004787931848845616, 'samples': 4136640, 'steps': 21544, 'loss/train': 1.8045618534088135} -11/07/2021 00:16:16 - INFO - __main__ - Step 21546: {'lr': 0.00047879104588680987, 'samples': 4136832, 'steps': 21545, 'loss/train': 1.706560492515564} -11/07/2021 00:16:16 - INFO - __main__ - Step 21547: {'lr': 0.00047878890678596854, 'samples': 4137024, 'steps': 21546, 'loss/train': 1.979650616645813} -11/07/2021 00:16:16 - INFO - __main__ - Step 21548: {'lr': 0.00047878676758203844, 'samples': 4137216, 'steps': 21547, 'loss/train': 1.6284128427505493} -11/07/2021 00:16:17 - INFO - __main__ - Step 21549: {'lr': 0.00047878462827502055, 'samples': 4137408, 'steps': 21548, 'loss/train': 1.7756991386413574} -11/07/2021 00:16:17 - INFO - __main__ - Step 21550: {'lr': 0.0004787824888649158, 'samples': 4137600, 'steps': 21549, 'loss/train': 1.996254324913025} -11/07/2021 00:16:18 - INFO - __main__ - Step 21551: {'lr': 0.0004787803493517252, 'samples': 4137792, 'steps': 21550, 'loss/train': 1.7516309022903442} -11/07/2021 00:16:18 - INFO - __main__ - Step 21552: {'lr': 0.0004787782097354497, 'samples': 4137984, 'steps': 21551, 'loss/train': 1.415780782699585} -11/07/2021 00:16:19 - INFO - __main__ - Step 21553: {'lr': 0.00047877607001609035, 'samples': 4138176, 'steps': 21552, 'loss/train': 1.233115553855896} -11/07/2021 00:16:19 - INFO - __main__ - Step 21554: {'lr': 0.00047877393019364796, 'samples': 4138368, 'steps': 21553, 'loss/train': 1.7765933275222778} -11/07/2021 00:16:19 - INFO - __main__ - Step 21555: {'lr': 0.0004787717902681236, 'samples': 4138560, 'steps': 21554, 'loss/train': 1.6584759950637817} -11/07/2021 00:16:21 - INFO - __main__ - Step 21556: {'lr': 0.00047876965023951814, 'samples': 4138752, 'steps': 21555, 'loss/train': 1.7891385555267334} -11/07/2021 00:16:21 - INFO - __main__ - Step 21557: {'lr': 0.00047876751010783266, 'samples': 4138944, 'steps': 21556, 'loss/train': 1.8446043729782104} -11/07/2021 00:16:21 - INFO - __main__ - Step 21558: {'lr': 0.0004787653698730681, 'samples': 4139136, 'steps': 21557, 'loss/train': 1.8145853281021118} -11/07/2021 00:16:22 - INFO - __main__ - Step 21559: {'lr': 0.00047876322953522535, 'samples': 4139328, 'steps': 21558, 'loss/train': 1.5460792779922485} -11/07/2021 00:16:22 - INFO - __main__ - Step 21560: {'lr': 0.00047876108909430536, 'samples': 4139520, 'steps': 21559, 'loss/train': 1.2707014083862305} -11/07/2021 00:16:23 - INFO - __main__ - Step 21561: {'lr': 0.00047875894855030923, 'samples': 4139712, 'steps': 21560, 'loss/train': 1.3773596286773682} -11/07/2021 00:16:23 - INFO - __main__ - Step 21562: {'lr': 0.00047875680790323785, 'samples': 4139904, 'steps': 21561, 'loss/train': 1.5871561765670776} -11/07/2021 00:16:24 - INFO - __main__ - Step 21563: {'lr': 0.0004787546671530921, 'samples': 4140096, 'steps': 21562, 'loss/train': 1.8902066946029663} -11/07/2021 00:16:24 - INFO - __main__ - Step 21564: {'lr': 0.0004787525262998731, 'samples': 4140288, 'steps': 21563, 'loss/train': 1.7794413566589355} -11/07/2021 00:16:24 - INFO - __main__ - Step 21565: {'lr': 0.0004787503853435817, 'samples': 4140480, 'steps': 21564, 'loss/train': 1.6013624668121338} -11/07/2021 00:16:26 - INFO - __main__ - Step 21566: {'lr': 0.00047874824428421897, 'samples': 4140672, 'steps': 21565, 'loss/train': 1.7130855321884155} -11/07/2021 00:16:26 - INFO - __main__ - Step 21567: {'lr': 0.0004787461031217858, 'samples': 4140864, 'steps': 21566, 'loss/train': 1.4191340208053589} -11/07/2021 00:16:26 - INFO - __main__ - Step 21568: {'lr': 0.0004787439618562831, 'samples': 4141056, 'steps': 21567, 'loss/train': 0.9844514727592468} -11/07/2021 00:16:27 - INFO - __main__ - Step 21569: {'lr': 0.000478741820487712, 'samples': 4141248, 'steps': 21568, 'loss/train': 1.362804889678955} -11/07/2021 00:16:27 - INFO - __main__ - Step 21570: {'lr': 0.0004787396790160733, 'samples': 4141440, 'steps': 21569, 'loss/train': 1.464184284210205} -11/07/2021 00:16:28 - INFO - __main__ - Step 21571: {'lr': 0.00047873753744136807, 'samples': 4141632, 'steps': 21570, 'loss/train': 1.4976603984832764} -11/07/2021 00:16:29 - INFO - __main__ - Step 21572: {'lr': 0.0004787353957635971, 'samples': 4141824, 'steps': 21571, 'loss/train': 1.813546895980835} -11/07/2021 00:16:29 - INFO - __main__ - Step 21573: {'lr': 0.0004787332539827617, 'samples': 4142016, 'steps': 21572, 'loss/train': 1.614606261253357} -11/07/2021 00:16:29 - INFO - __main__ - Step 21574: {'lr': 0.00047873111209886245, 'samples': 4142208, 'steps': 21573, 'loss/train': 1.6597931385040283} -11/07/2021 00:16:30 - INFO - __main__ - Step 21575: {'lr': 0.00047872897011190063, 'samples': 4142400, 'steps': 21574, 'loss/train': 0.855787456035614} -11/07/2021 00:16:30 - INFO - __main__ - Step 21576: {'lr': 0.00047872682802187693, 'samples': 4142592, 'steps': 21575, 'loss/train': 1.3936561346054077} -11/07/2021 00:16:31 - INFO - __main__ - Step 21577: {'lr': 0.0004787246858287926, 'samples': 4142784, 'steps': 21576, 'loss/train': 2.4061551094055176} -11/07/2021 00:16:31 - INFO - __main__ - Step 21578: {'lr': 0.0004787225435326483, 'samples': 4142976, 'steps': 21577, 'loss/train': 1.734849452972412} -11/07/2021 00:16:32 - INFO - __main__ - Step 21579: {'lr': 0.0004787204011334453, 'samples': 4143168, 'steps': 21578, 'loss/train': 1.6250495910644531} -11/07/2021 00:16:32 - INFO - __main__ - Step 21580: {'lr': 0.0004787182586311843, 'samples': 4143360, 'steps': 21579, 'loss/train': 1.4872287511825562} -11/07/2021 00:16:32 - INFO - __main__ - Step 21581: {'lr': 0.0004787161160258664, 'samples': 4143552, 'steps': 21580, 'loss/train': 1.6663235425949097} -11/07/2021 00:16:33 - INFO - __main__ - Step 21582: {'lr': 0.00047871397331749254, 'samples': 4143744, 'steps': 21581, 'loss/train': 0.5923960208892822} -11/07/2021 00:16:34 - INFO - __main__ - Step 21583: {'lr': 0.00047871183050606376, 'samples': 4143936, 'steps': 21582, 'loss/train': 1.2236347198486328} -11/07/2021 00:16:34 - INFO - __main__ - Step 21584: {'lr': 0.00047870968759158096, 'samples': 4144128, 'steps': 21583, 'loss/train': 1.7751884460449219} -11/07/2021 00:16:34 - INFO - __main__ - Step 21585: {'lr': 0.000478707544574045, 'samples': 4144320, 'steps': 21584, 'loss/train': 1.1830782890319824} -11/07/2021 00:16:35 - INFO - __main__ - Step 21586: {'lr': 0.000478705401453457, 'samples': 4144512, 'steps': 21585, 'loss/train': 0.7636067867279053} -11/07/2021 00:16:36 - INFO - __main__ - Step 21587: {'lr': 0.000478703258229818, 'samples': 4144704, 'steps': 21586, 'loss/train': 0.18369045853614807} -11/07/2021 00:16:36 - INFO - __main__ - Step 21588: {'lr': 0.0004787011149031287, 'samples': 4144896, 'steps': 21587, 'loss/train': 1.3815462589263916} -11/07/2021 00:16:36 - INFO - __main__ - Step 21589: {'lr': 0.0004786989714733902, 'samples': 4145088, 'steps': 21588, 'loss/train': 0.8793774843215942} -11/07/2021 00:16:37 - INFO - __main__ - Step 21590: {'lr': 0.0004786968279406035, 'samples': 4145280, 'steps': 21589, 'loss/train': 1.5908639430999756} -11/07/2021 00:16:37 - INFO - __main__ - Step 21591: {'lr': 0.0004786946843047696, 'samples': 4145472, 'steps': 21590, 'loss/train': 1.7688531875610352} -11/07/2021 00:16:38 - INFO - __main__ - Step 21592: {'lr': 0.00047869254056588927, 'samples': 4145664, 'steps': 21591, 'loss/train': 1.64926016330719} -11/07/2021 00:16:39 - INFO - __main__ - Step 21593: {'lr': 0.0004786903967239637, 'samples': 4145856, 'steps': 21592, 'loss/train': 1.653084397315979} -11/07/2021 00:16:39 - INFO - __main__ - Step 21594: {'lr': 0.0004786882527789938, 'samples': 4146048, 'steps': 21593, 'loss/train': 2.0507147312164307} -11/07/2021 00:16:39 - INFO - __main__ - Step 21595: {'lr': 0.00047868610873098047, 'samples': 4146240, 'steps': 21594, 'loss/train': 1.6787335872650146} -11/07/2021 00:16:40 - INFO - __main__ - Step 21596: {'lr': 0.0004786839645799247, 'samples': 4146432, 'steps': 21595, 'loss/train': 1.8469722270965576} -11/07/2021 00:16:41 - INFO - __main__ - Step 21597: {'lr': 0.00047868182032582746, 'samples': 4146624, 'steps': 21596, 'loss/train': 1.7321794033050537} -11/07/2021 00:16:41 - INFO - __main__ - Step 21598: {'lr': 0.00047867967596868974, 'samples': 4146816, 'steps': 21597, 'loss/train': 1.0293926000595093} -11/07/2021 00:16:41 - INFO - __main__ - Step 21599: {'lr': 0.00047867753150851244, 'samples': 4147008, 'steps': 21598, 'loss/train': 1.51420259475708} -11/07/2021 00:16:42 - INFO - __main__ - Step 21600: {'lr': 0.0004786753869452966, 'samples': 4147200, 'steps': 21599, 'loss/train': 1.0068912506103516} -11/07/2021 00:16:42 - INFO - __main__ - Step 21601: {'lr': 0.00047867324227904317, 'samples': 4147392, 'steps': 21600, 'loss/train': 1.7972041368484497} -11/07/2021 00:16:43 - INFO - __main__ - Step 21602: {'lr': 0.0004786710975097531, 'samples': 4147584, 'steps': 21601, 'loss/train': 1.9969254732131958} -11/07/2021 00:16:43 - INFO - __main__ - Step 21603: {'lr': 0.0004786689526374274, 'samples': 4147776, 'steps': 21602, 'loss/train': 1.5673604011535645} -11/07/2021 00:16:44 - INFO - __main__ - Step 21604: {'lr': 0.00047866680766206693, 'samples': 4147968, 'steps': 21603, 'loss/train': 1.7802320718765259} -11/07/2021 00:16:44 - INFO - __main__ - Step 21605: {'lr': 0.0004786646625836727, 'samples': 4148160, 'steps': 21604, 'loss/train': 1.153442144393921} -11/07/2021 00:16:44 - INFO - __main__ - Step 21606: {'lr': 0.0004786625174022458, 'samples': 4148352, 'steps': 21605, 'loss/train': 1.1935527324676514} -11/07/2021 00:16:45 - INFO - __main__ - Step 21607: {'lr': 0.00047866037211778705, 'samples': 4148544, 'steps': 21606, 'loss/train': 0.29927515983581543} -11/07/2021 00:16:46 - INFO - __main__ - Step 21608: {'lr': 0.0004786582267302975, 'samples': 4148736, 'steps': 21607, 'loss/train': 0.8351354002952576} -11/07/2021 00:16:47 - INFO - __main__ - Step 21609: {'lr': 0.000478656081239778, 'samples': 4148928, 'steps': 21608, 'loss/train': 1.8804010152816772} -11/07/2021 00:16:47 - INFO - __main__ - Step 21610: {'lr': 0.0004786539356462297, 'samples': 4149120, 'steps': 21609, 'loss/train': 1.4697155952453613} -11/07/2021 00:16:47 - INFO - __main__ - Step 21611: {'lr': 0.0004786517899496534, 'samples': 4149312, 'steps': 21610, 'loss/train': 1.9372228384017944} -11/07/2021 00:16:48 - INFO - __main__ - Step 21612: {'lr': 0.0004786496441500502, 'samples': 4149504, 'steps': 21611, 'loss/train': 1.3799189329147339} -11/07/2021 00:16:49 - INFO - __main__ - Step 21613: {'lr': 0.00047864749824742093, 'samples': 4149696, 'steps': 21612, 'loss/train': 1.8028512001037598} -11/07/2021 00:16:49 - INFO - __main__ - Step 21614: {'lr': 0.00047864535224176666, 'samples': 4149888, 'steps': 21613, 'loss/train': 1.2140483856201172} -11/07/2021 00:16:49 - INFO - __main__ - Step 21615: {'lr': 0.0004786432061330882, 'samples': 4150080, 'steps': 21614, 'loss/train': 1.3646620512008667} -11/07/2021 00:16:50 - INFO - __main__ - Step 21616: {'lr': 0.0004786410599213868, 'samples': 4150272, 'steps': 21615, 'loss/train': 1.2908267974853516} -11/07/2021 00:16:50 - INFO - __main__ - Step 21617: {'lr': 0.00047863891360666323, 'samples': 4150464, 'steps': 21616, 'loss/train': 1.5464023351669312} -11/07/2021 00:16:51 - INFO - __main__ - Step 21618: {'lr': 0.00047863676718891846, 'samples': 4150656, 'steps': 21617, 'loss/train': 1.6251708269119263} -11/07/2021 00:16:51 - INFO - __main__ - Step 21619: {'lr': 0.0004786346206681535, 'samples': 4150848, 'steps': 21618, 'loss/train': 1.4503111839294434} -11/07/2021 00:16:52 - INFO - __main__ - Step 21620: {'lr': 0.0004786324740443693, 'samples': 4151040, 'steps': 21619, 'loss/train': 1.2549147605895996} -11/07/2021 00:16:52 - INFO - __main__ - Step 21621: {'lr': 0.00047863032731756684, 'samples': 4151232, 'steps': 21620, 'loss/train': 1.467907428741455} -11/07/2021 00:16:53 - INFO - __main__ - Step 21622: {'lr': 0.0004786281804877471, 'samples': 4151424, 'steps': 21621, 'loss/train': 1.2028931379318237} -11/07/2021 00:16:54 - INFO - __main__ - Step 21623: {'lr': 0.00047862603355491103, 'samples': 4151616, 'steps': 21622, 'loss/train': 1.0954643487930298} -11/07/2021 00:16:54 - INFO - __main__ - Step 21624: {'lr': 0.0004786238865190595, 'samples': 4151808, 'steps': 21623, 'loss/train': 1.7945252656936646} -11/07/2021 00:16:54 - INFO - __main__ - Step 21625: {'lr': 0.0004786217393801937, 'samples': 4152000, 'steps': 21624, 'loss/train': 1.5487359762191772} -11/07/2021 00:16:55 - INFO - __main__ - Step 21626: {'lr': 0.00047861959213831446, 'samples': 4152192, 'steps': 21625, 'loss/train': 1.6223113536834717} -11/07/2021 00:16:55 - INFO - __main__ - Step 21627: {'lr': 0.0004786174447934227, 'samples': 4152384, 'steps': 21626, 'loss/train': 1.4051604270935059} -11/07/2021 00:16:56 - INFO - __main__ - Step 21628: {'lr': 0.0004786152973455195, 'samples': 4152576, 'steps': 21627, 'loss/train': 1.345228672027588} -11/07/2021 00:16:56 - INFO - __main__ - Step 21629: {'lr': 0.0004786131497946058, 'samples': 4152768, 'steps': 21628, 'loss/train': 0.9680488705635071} -11/07/2021 00:16:57 - INFO - __main__ - Step 21630: {'lr': 0.0004786110021406824, 'samples': 4152960, 'steps': 21629, 'loss/train': 1.176362156867981} -11/07/2021 00:16:57 - INFO - __main__ - Step 21631: {'lr': 0.0004786088543837506, 'samples': 4153152, 'steps': 21630, 'loss/train': 1.5705360174179077} -11/07/2021 00:16:58 - INFO - __main__ - Step 21632: {'lr': 0.00047860670652381105, 'samples': 4153344, 'steps': 21631, 'loss/train': 1.987221598625183} -11/07/2021 00:16:58 - INFO - __main__ - Step 21633: {'lr': 0.00047860455856086487, 'samples': 4153536, 'steps': 21632, 'loss/train': 0.9786133170127869} -11/07/2021 00:16:59 - INFO - __main__ - Step 21634: {'lr': 0.00047860241049491303, 'samples': 4153728, 'steps': 21633, 'loss/train': 1.5743129253387451} -11/07/2021 00:16:59 - INFO - __main__ - Step 21635: {'lr': 0.00047860026232595645, 'samples': 4153920, 'steps': 21634, 'loss/train': 1.7790687084197998} -11/07/2021 00:17:00 - INFO - __main__ - Step 21636: {'lr': 0.0004785981140539961, 'samples': 4154112, 'steps': 21635, 'loss/train': 1.8462978601455688} -11/07/2021 00:17:00 - INFO - __main__ - Step 21637: {'lr': 0.000478595965679033, 'samples': 4154304, 'steps': 21636, 'loss/train': 1.3746877908706665} -11/07/2021 00:17:00 - INFO - __main__ - Step 21638: {'lr': 0.0004785938172010681, 'samples': 4154496, 'steps': 21637, 'loss/train': 1.551901936531067} -11/07/2021 00:17:01 - INFO - __main__ - Step 21639: {'lr': 0.0004785916686201023, 'samples': 4154688, 'steps': 21638, 'loss/train': 2.32190203666687} -11/07/2021 00:17:02 - INFO - __main__ - Step 21640: {'lr': 0.00047858951993613665, 'samples': 4154880, 'steps': 21639, 'loss/train': 1.568753957748413} -11/07/2021 00:17:02 - INFO - __main__ - Step 21641: {'lr': 0.0004785873711491721, 'samples': 4155072, 'steps': 21640, 'loss/train': 2.010477304458618} -11/07/2021 00:17:02 - INFO - __main__ - Step 21642: {'lr': 0.00047858522225920964, 'samples': 4155264, 'steps': 21641, 'loss/train': 0.8399590253829956} -11/07/2021 00:17:03 - INFO - __main__ - Step 21643: {'lr': 0.00047858307326625014, 'samples': 4155456, 'steps': 21642, 'loss/train': 1.774276614189148} -11/07/2021 00:17:04 - INFO - __main__ - Step 21644: {'lr': 0.00047858092417029464, 'samples': 4155648, 'steps': 21643, 'loss/train': 1.7628326416015625} -11/07/2021 00:17:04 - INFO - __main__ - Step 21645: {'lr': 0.00047857877497134416, 'samples': 4155840, 'steps': 21644, 'loss/train': 1.2147215604782104} -11/07/2021 00:17:04 - INFO - __main__ - Step 21646: {'lr': 0.0004785766256693995, 'samples': 4156032, 'steps': 21645, 'loss/train': 1.5541294813156128} -11/07/2021 00:17:05 - INFO - __main__ - Step 21647: {'lr': 0.0004785744762644619, 'samples': 4156224, 'steps': 21646, 'loss/train': 1.1660066843032837} -11/07/2021 00:17:05 - INFO - __main__ - Step 21648: {'lr': 0.00047857232675653207, 'samples': 4156416, 'steps': 21647, 'loss/train': 2.1722161769866943} -11/07/2021 00:17:06 - INFO - __main__ - Step 21649: {'lr': 0.00047857017714561105, 'samples': 4156608, 'steps': 21648, 'loss/train': 1.5793182849884033} -11/07/2021 00:17:07 - INFO - __main__ - Step 21650: {'lr': 0.00047856802743169994, 'samples': 4156800, 'steps': 21649, 'loss/train': 1.588982343673706} -11/07/2021 00:17:07 - INFO - __main__ - Step 21651: {'lr': 0.00047856587761479954, 'samples': 4156992, 'steps': 21650, 'loss/train': 1.7212626934051514} -11/07/2021 00:17:07 - INFO - __main__ - Step 21652: {'lr': 0.00047856372769491083, 'samples': 4157184, 'steps': 21651, 'loss/train': 1.6415342092514038} -11/07/2021 00:17:08 - INFO - __main__ - Step 21653: {'lr': 0.0004785615776720349, 'samples': 4157376, 'steps': 21652, 'loss/train': 1.7163211107254028} -11/07/2021 00:17:09 - INFO - __main__ - Step 21654: {'lr': 0.0004785594275461726, 'samples': 4157568, 'steps': 21653, 'loss/train': 1.6288830041885376} -11/07/2021 00:17:09 - INFO - __main__ - Step 21655: {'lr': 0.00047855727731732503, 'samples': 4157760, 'steps': 21654, 'loss/train': 1.8189113140106201} -11/07/2021 00:17:09 - INFO - __main__ - Step 21656: {'lr': 0.00047855512698549295, 'samples': 4157952, 'steps': 21655, 'loss/train': 1.7791290283203125} -11/07/2021 00:17:10 - INFO - __main__ - Step 21657: {'lr': 0.00047855297655067754, 'samples': 4158144, 'steps': 21656, 'loss/train': 1.4705885648727417} -11/07/2021 00:17:10 - INFO - __main__ - Step 21658: {'lr': 0.0004785508260128797, 'samples': 4158336, 'steps': 21657, 'loss/train': 1.4176886081695557} -11/07/2021 00:17:11 - INFO - __main__ - Step 21659: {'lr': 0.00047854867537210034, 'samples': 4158528, 'steps': 21658, 'loss/train': 1.7595988512039185} -11/07/2021 00:17:12 - INFO - __main__ - Step 21660: {'lr': 0.00047854652462834055, 'samples': 4158720, 'steps': 21659, 'loss/train': 1.7756456136703491} -11/07/2021 00:17:12 - INFO - __main__ - Step 21661: {'lr': 0.0004785443737816012, 'samples': 4158912, 'steps': 21660, 'loss/train': 5.061169147491455} -11/07/2021 00:17:12 - INFO - __main__ - Step 21662: {'lr': 0.0004785422228318832, 'samples': 4159104, 'steps': 21661, 'loss/train': 4.935312747955322} -11/07/2021 00:17:13 - INFO - __main__ - Step 21663: {'lr': 0.0004785400717791877, 'samples': 4159296, 'steps': 21662, 'loss/train': 2.0939254760742188} -11/07/2021 00:17:13 - INFO - __main__ - Step 21664: {'lr': 0.0004785379206235155, 'samples': 4159488, 'steps': 21663, 'loss/train': 1.599906086921692} -11/07/2021 00:17:15 - INFO - __main__ - Step 21665: {'lr': 0.00047853576936486764, 'samples': 4159680, 'steps': 21664, 'loss/train': 1.3704638481140137} -11/07/2021 00:17:15 - INFO - __main__ - Step 21666: {'lr': 0.00047853361800324516, 'samples': 4159872, 'steps': 21665, 'loss/train': 1.3747199773788452} -11/07/2021 00:17:15 - INFO - __main__ - Step 21667: {'lr': 0.0004785314665386489, 'samples': 4160064, 'steps': 21666, 'loss/train': 1.5270380973815918} -11/07/2021 00:17:16 - INFO - __main__ - Step 21668: {'lr': 0.00047852931497107987, 'samples': 4160256, 'steps': 21667, 'loss/train': 0.6752262115478516} -11/07/2021 00:17:16 - INFO - __main__ - Step 21669: {'lr': 0.0004785271633005391, 'samples': 4160448, 'steps': 21668, 'loss/train': 1.6318258047103882} -11/07/2021 00:17:16 - INFO - __main__ - Step 21670: {'lr': 0.0004785250115270275, 'samples': 4160640, 'steps': 21669, 'loss/train': 1.8416980504989624} -11/07/2021 00:17:17 - INFO - __main__ - Step 21671: {'lr': 0.00047852285965054606, 'samples': 4160832, 'steps': 21670, 'loss/train': 1.454700231552124} -11/07/2021 00:17:18 - INFO - __main__ - Step 21672: {'lr': 0.00047852070767109573, 'samples': 4161024, 'steps': 21671, 'loss/train': 1.5401418209075928} -11/07/2021 00:17:18 - INFO - __main__ - Step 21673: {'lr': 0.00047851855558867754, 'samples': 4161216, 'steps': 21672, 'loss/train': 1.6531730890274048} -11/07/2021 00:17:19 - INFO - __main__ - Step 21674: {'lr': 0.0004785164034032924, 'samples': 4161408, 'steps': 21673, 'loss/train': 1.682608962059021} -11/07/2021 00:17:19 - INFO - __main__ - Step 21675: {'lr': 0.0004785142511149412, 'samples': 4161600, 'steps': 21674, 'loss/train': 1.6360929012298584} -11/07/2021 00:17:20 - INFO - __main__ - Step 21676: {'lr': 0.0004785120987236251, 'samples': 4161792, 'steps': 21675, 'loss/train': 1.5555413961410522} -11/07/2021 00:17:20 - INFO - __main__ - Step 21677: {'lr': 0.00047850994622934494, 'samples': 4161984, 'steps': 21676, 'loss/train': 1.3743476867675781} -11/07/2021 00:17:21 - INFO - __main__ - Step 21678: {'lr': 0.0004785077936321018, 'samples': 4162176, 'steps': 21677, 'loss/train': 1.7006787061691284} -11/07/2021 00:17:21 - INFO - __main__ - Step 21679: {'lr': 0.00047850564093189653, 'samples': 4162368, 'steps': 21678, 'loss/train': 1.9067273139953613} -11/07/2021 00:17:21 - INFO - __main__ - Step 21680: {'lr': 0.0004785034881287301, 'samples': 4162560, 'steps': 21679, 'loss/train': 1.681504487991333} -11/07/2021 00:17:22 - INFO - __main__ - Step 21681: {'lr': 0.0004785013352226035, 'samples': 4162752, 'steps': 21680, 'loss/train': 1.96555495262146} -11/07/2021 00:17:23 - INFO - __main__ - Step 21682: {'lr': 0.00047849918221351783, 'samples': 4162944, 'steps': 21681, 'loss/train': 1.4842780828475952} -11/07/2021 00:17:23 - INFO - __main__ - Step 21683: {'lr': 0.0004784970291014739, 'samples': 4163136, 'steps': 21682, 'loss/train': 1.840103268623352} -11/07/2021 00:17:23 - INFO - __main__ - Step 21684: {'lr': 0.0004784948758864727, 'samples': 4163328, 'steps': 21683, 'loss/train': 1.3767606019973755} -11/07/2021 00:17:24 - INFO - __main__ - Step 21685: {'lr': 0.0004784927225685153, 'samples': 4163520, 'steps': 21684, 'loss/train': 1.9550838470458984} -11/07/2021 00:17:24 - INFO - __main__ - Step 21686: {'lr': 0.00047849056914760256, 'samples': 4163712, 'steps': 21685, 'loss/train': 1.6681972742080688} -11/07/2021 00:17:25 - INFO - __main__ - Step 21687: {'lr': 0.00047848841562373557, 'samples': 4163904, 'steps': 21686, 'loss/train': 1.4995859861373901} -11/07/2021 00:17:25 - INFO - __main__ - Step 21688: {'lr': 0.00047848626199691513, 'samples': 4164096, 'steps': 21687, 'loss/train': 1.1082913875579834} -11/07/2021 00:17:26 - INFO - __main__ - Step 21689: {'lr': 0.00047848410826714237, 'samples': 4164288, 'steps': 21688, 'loss/train': 1.973834753036499} -11/07/2021 00:17:26 - INFO - __main__ - Step 21690: {'lr': 0.00047848195443441817, 'samples': 4164480, 'steps': 21689, 'loss/train': 1.8756773471832275} -11/07/2021 00:17:26 - INFO - __main__ - Step 21691: {'lr': 0.0004784798004987435, 'samples': 4164672, 'steps': 21690, 'loss/train': 1.5911768674850464} -11/07/2021 00:17:28 - INFO - __main__ - Step 21692: {'lr': 0.00047847764646011937, 'samples': 4164864, 'steps': 21691, 'loss/train': 2.253713846206665} -11/07/2021 00:17:28 - INFO - __main__ - Step 21693: {'lr': 0.0004784754923185468, 'samples': 4165056, 'steps': 21692, 'loss/train': 1.468682050704956} -11/07/2021 00:17:28 - INFO - __main__ - Step 21694: {'lr': 0.00047847333807402666, 'samples': 4165248, 'steps': 21693, 'loss/train': 1.3054816722869873} -11/07/2021 00:17:29 - INFO - __main__ - Step 21695: {'lr': 0.00047847118372655996, 'samples': 4165440, 'steps': 21694, 'loss/train': 1.7357770204544067} -11/07/2021 00:17:29 - INFO - __main__ - Step 21696: {'lr': 0.00047846902927614767, 'samples': 4165632, 'steps': 21695, 'loss/train': 1.421078085899353} -11/07/2021 00:17:31 - INFO - __main__ - Step 21697: {'lr': 0.0004784668747227907, 'samples': 4165824, 'steps': 21696, 'loss/train': 2.197175979614258} -11/07/2021 00:17:31 - INFO - __main__ - Step 21698: {'lr': 0.00047846472006649016, 'samples': 4166016, 'steps': 21697, 'loss/train': 1.1708250045776367} -11/07/2021 00:17:31 - INFO - __main__ - Step 21699: {'lr': 0.0004784625653072469, 'samples': 4166208, 'steps': 21698, 'loss/train': 1.3094415664672852} -11/07/2021 00:17:32 - INFO - __main__ - Step 21700: {'lr': 0.00047846041044506194, 'samples': 4166400, 'steps': 21699, 'loss/train': 1.742722988128662} -11/07/2021 00:17:32 - INFO - __main__ - Step 21701: {'lr': 0.00047845825547993627, 'samples': 4166592, 'steps': 21700, 'loss/train': 1.8332834243774414} -11/07/2021 00:17:32 - INFO - __main__ - Step 21702: {'lr': 0.0004784561004118708, 'samples': 4166784, 'steps': 21701, 'loss/train': 0.8396803736686707} -11/07/2021 00:17:34 - INFO - __main__ - Step 21703: {'lr': 0.0004784539452408666, 'samples': 4166976, 'steps': 21702, 'loss/train': 1.7695062160491943} -11/07/2021 00:17:34 - INFO - __main__ - Step 21704: {'lr': 0.0004784517899669245, 'samples': 4167168, 'steps': 21703, 'loss/train': 1.3221811056137085} -11/07/2021 00:17:34 - INFO - __main__ - Step 21705: {'lr': 0.00047844963459004565, 'samples': 4167360, 'steps': 21704, 'loss/train': 1.2405515909194946} -11/07/2021 00:17:35 - INFO - __main__ - Step 21706: {'lr': 0.00047844747911023077, 'samples': 4167552, 'steps': 21705, 'loss/train': 1.389700174331665} -11/07/2021 00:17:35 - INFO - __main__ - Step 21707: {'lr': 0.00047844532352748115, 'samples': 4167744, 'steps': 21706, 'loss/train': 1.4688421487808228} -11/07/2021 00:17:35 - INFO - __main__ - Step 21708: {'lr': 0.0004784431678417975, 'samples': 4167936, 'steps': 21707, 'loss/train': 2.301962375640869} -11/07/2021 00:17:36 - INFO - __main__ - Step 21709: {'lr': 0.00047844101205318085, 'samples': 4168128, 'steps': 21708, 'loss/train': 1.7107940912246704} -11/07/2021 00:17:37 - INFO - __main__ - Step 21710: {'lr': 0.0004784388561616323, 'samples': 4168320, 'steps': 21709, 'loss/train': 1.7536522150039673} -11/07/2021 00:17:37 - INFO - __main__ - Step 21711: {'lr': 0.0004784367001671526, 'samples': 4168512, 'steps': 21710, 'loss/train': 1.3904337882995605} -11/07/2021 00:17:37 - INFO - __main__ - Step 21712: {'lr': 0.00047843454406974295, 'samples': 4168704, 'steps': 21711, 'loss/train': 0.41166508197784424} -11/07/2021 00:17:38 - INFO - __main__ - Step 21713: {'lr': 0.00047843238786940423, 'samples': 4168896, 'steps': 21712, 'loss/train': 1.6754117012023926} -11/07/2021 00:17:39 - INFO - __main__ - Step 21714: {'lr': 0.0004784302315661373, 'samples': 4169088, 'steps': 21713, 'loss/train': 1.7005354166030884} -11/07/2021 00:17:39 - INFO - __main__ - Step 21715: {'lr': 0.00047842807515994335, 'samples': 4169280, 'steps': 21714, 'loss/train': 1.8570494651794434} -11/07/2021 00:17:39 - INFO - __main__ - Step 21716: {'lr': 0.00047842591865082315, 'samples': 4169472, 'steps': 21715, 'loss/train': 1.401794672012329} -11/07/2021 00:17:40 - INFO - __main__ - Step 21717: {'lr': 0.0004784237620387778, 'samples': 4169664, 'steps': 21716, 'loss/train': 1.5829322338104248} -11/07/2021 00:17:40 - INFO - __main__ - Step 21718: {'lr': 0.0004784216053238082, 'samples': 4169856, 'steps': 21717, 'loss/train': 1.6291459798812866} -11/07/2021 00:17:41 - INFO - __main__ - Step 21719: {'lr': 0.00047841944850591535, 'samples': 4170048, 'steps': 21718, 'loss/train': 1.6986477375030518} -11/07/2021 00:17:42 - INFO - __main__ - Step 21720: {'lr': 0.0004784172915851003, 'samples': 4170240, 'steps': 21719, 'loss/train': 1.7120718955993652} -11/07/2021 00:17:42 - INFO - __main__ - Step 21721: {'lr': 0.00047841513456136383, 'samples': 4170432, 'steps': 21720, 'loss/train': 1.5299396514892578} -11/07/2021 00:17:42 - INFO - __main__ - Step 21722: {'lr': 0.000478412977434707, 'samples': 4170624, 'steps': 21721, 'loss/train': 1.4899734258651733} -11/07/2021 00:17:43 - INFO - __main__ - Step 21723: {'lr': 0.00047841082020513094, 'samples': 4170816, 'steps': 21722, 'loss/train': 1.4843244552612305} -11/07/2021 00:17:44 - INFO - __main__ - Step 21724: {'lr': 0.0004784086628726364, 'samples': 4171008, 'steps': 21723, 'loss/train': 1.7268753051757812} -11/07/2021 00:17:44 - INFO - __main__ - Step 21725: {'lr': 0.0004784065054372245, 'samples': 4171200, 'steps': 21724, 'loss/train': 1.1709247827529907} -11/07/2021 00:17:44 - INFO - __main__ - Step 21726: {'lr': 0.0004784043478988961, 'samples': 4171392, 'steps': 21725, 'loss/train': 1.5650849342346191} -11/07/2021 00:17:45 - INFO - __main__ - Step 21727: {'lr': 0.00047840219025765225, 'samples': 4171584, 'steps': 21726, 'loss/train': 1.7945908308029175} -11/07/2021 00:17:45 - INFO - __main__ - Step 21728: {'lr': 0.0004784000325134939, 'samples': 4171776, 'steps': 21727, 'loss/train': 1.760206937789917} -11/07/2021 00:17:46 - INFO - __main__ - Step 21729: {'lr': 0.00047839787466642206, 'samples': 4171968, 'steps': 21728, 'loss/train': 1.9748557806015015} -11/07/2021 00:17:46 - INFO - __main__ - Step 21730: {'lr': 0.00047839571671643756, 'samples': 4172160, 'steps': 21729, 'loss/train': 1.7250733375549316} -11/07/2021 00:17:47 - INFO - __main__ - Step 21731: {'lr': 0.0004783935586635415, 'samples': 4172352, 'steps': 21730, 'loss/train': 1.6004855632781982} -11/07/2021 00:17:47 - INFO - __main__ - Step 21732: {'lr': 0.0004783914005077349, 'samples': 4172544, 'steps': 21731, 'loss/train': 1.0612422227859497} -11/07/2021 00:17:48 - INFO - __main__ - Step 21733: {'lr': 0.0004783892422490186, 'samples': 4172736, 'steps': 21732, 'loss/train': 1.5149544477462769} -11/07/2021 00:17:49 - INFO - __main__ - Step 21734: {'lr': 0.00047838708388739365, 'samples': 4172928, 'steps': 21733, 'loss/train': 1.3210654258728027} -11/07/2021 00:17:49 - INFO - __main__ - Step 21735: {'lr': 0.000478384925422861, 'samples': 4173120, 'steps': 21734, 'loss/train': 1.7746955156326294} -11/07/2021 00:17:49 - INFO - __main__ - Step 21736: {'lr': 0.00047838276685542157, 'samples': 4173312, 'steps': 21735, 'loss/train': 1.6839711666107178} -11/07/2021 00:17:50 - INFO - __main__ - Step 21737: {'lr': 0.0004783806081850765, 'samples': 4173504, 'steps': 21736, 'loss/train': 1.643261432647705} -11/07/2021 00:17:50 - INFO - __main__ - Step 21738: {'lr': 0.0004783784494118266, 'samples': 4173696, 'steps': 21737, 'loss/train': 1.1372442245483398} -11/07/2021 00:17:51 - INFO - __main__ - Step 21739: {'lr': 0.00047837629053567286, 'samples': 4173888, 'steps': 21738, 'loss/train': 1.4777683019638062} -11/07/2021 00:17:52 - INFO - __main__ - Step 21740: {'lr': 0.00047837413155661635, 'samples': 4174080, 'steps': 21739, 'loss/train': 1.196178674697876} -11/07/2021 00:17:52 - INFO - __main__ - Step 21741: {'lr': 0.000478371972474658, 'samples': 4174272, 'steps': 21740, 'loss/train': 1.6837353706359863} -11/07/2021 00:17:52 - INFO - __main__ - Step 21742: {'lr': 0.00047836981328979865, 'samples': 4174464, 'steps': 21741, 'loss/train': 1.6639713048934937} -11/07/2021 00:17:53 - INFO - __main__ - Step 21743: {'lr': 0.00047836765400203953, 'samples': 4174656, 'steps': 21742, 'loss/train': 2.0440940856933594} -11/07/2021 00:17:53 - INFO - __main__ - Step 21744: {'lr': 0.00047836549461138133, 'samples': 4174848, 'steps': 21743, 'loss/train': 5.400808334350586} -11/07/2021 00:17:54 - INFO - __main__ - Step 21745: {'lr': 0.00047836333511782524, 'samples': 4175040, 'steps': 21744, 'loss/train': 5.30963659286499} -11/07/2021 00:17:55 - INFO - __main__ - Step 21746: {'lr': 0.00047836117552137213, 'samples': 4175232, 'steps': 21745, 'loss/train': 1.938073992729187} -11/07/2021 00:17:55 - INFO - __main__ - Step 21747: {'lr': 0.00047835901582202303, 'samples': 4175424, 'steps': 21746, 'loss/train': 1.732753872871399} -11/07/2021 00:17:55 - INFO - __main__ - Step 21748: {'lr': 0.00047835685601977886, 'samples': 4175616, 'steps': 21747, 'loss/train': 1.6363345384597778} -11/07/2021 00:17:56 - INFO - __main__ - Step 21749: {'lr': 0.00047835469611464055, 'samples': 4175808, 'steps': 21748, 'loss/train': 1.984601616859436} -11/07/2021 00:17:56 - INFO - __main__ - Step 21750: {'lr': 0.0004783525361066092, 'samples': 4176000, 'steps': 21749, 'loss/train': 1.448114275932312} -11/07/2021 00:17:57 - INFO - __main__ - Step 21751: {'lr': 0.00047835037599568576, 'samples': 4176192, 'steps': 21750, 'loss/train': 1.7460412979125977} -11/07/2021 00:17:57 - INFO - __main__ - Step 21752: {'lr': 0.0004783482157818711, 'samples': 4176384, 'steps': 21751, 'loss/train': 1.7143123149871826} -11/07/2021 00:17:58 - INFO - __main__ - Step 21753: {'lr': 0.0004783460554651663, 'samples': 4176576, 'steps': 21752, 'loss/train': 1.7651176452636719} -11/07/2021 00:17:58 - INFO - __main__ - Step 21754: {'lr': 0.0004783438950455723, 'samples': 4176768, 'steps': 21753, 'loss/train': 2.0488734245300293} -11/07/2021 00:17:59 - INFO - __main__ - Step 21755: {'lr': 0.00047834173452309005, 'samples': 4176960, 'steps': 21754, 'loss/train': 1.682035207748413} -11/07/2021 00:17:59 - INFO - __main__ - Step 21756: {'lr': 0.00047833957389772046, 'samples': 4177152, 'steps': 21755, 'loss/train': 1.6110718250274658} -11/07/2021 00:18:00 - INFO - __main__ - Step 21757: {'lr': 0.0004783374131694647, 'samples': 4177344, 'steps': 21756, 'loss/train': 1.5911036729812622} -11/07/2021 00:18:00 - INFO - __main__ - Step 21758: {'lr': 0.00047833525233832356, 'samples': 4177536, 'steps': 21757, 'loss/train': 1.5307949781417847} -11/07/2021 00:18:00 - INFO - __main__ - Step 21759: {'lr': 0.00047833309140429803, 'samples': 4177728, 'steps': 21758, 'loss/train': 1.8668280839920044} -11/07/2021 00:18:01 - INFO - __main__ - Step 21760: {'lr': 0.0004783309303673892, 'samples': 4177920, 'steps': 21759, 'loss/train': 1.4296553134918213} -11/07/2021 00:18:02 - INFO - __main__ - Step 21761: {'lr': 0.00047832876922759805, 'samples': 4178112, 'steps': 21760, 'loss/train': 1.4576103687286377} -11/07/2021 00:18:02 - INFO - __main__ - Step 21762: {'lr': 0.0004783266079849253, 'samples': 4178304, 'steps': 21761, 'loss/train': 1.7006242275238037} -11/07/2021 00:18:02 - INFO - __main__ - Step 21763: {'lr': 0.00047832444663937227, 'samples': 4178496, 'steps': 21762, 'loss/train': 1.7622902393341064} -11/07/2021 00:18:03 - INFO - __main__ - Step 21764: {'lr': 0.0004783222851909397, 'samples': 4178688, 'steps': 21763, 'loss/train': 1.790881872177124} -11/07/2021 00:18:03 - INFO - __main__ - Step 21765: {'lr': 0.0004783201236396286, 'samples': 4178880, 'steps': 21764, 'loss/train': 1.3149633407592773} -11/07/2021 00:18:04 - INFO - __main__ - Step 21766: {'lr': 0.00047831796198544, 'samples': 4179072, 'steps': 21765, 'loss/train': 1.403822422027588} -11/07/2021 00:18:04 - INFO - __main__ - Step 21767: {'lr': 0.0004783158002283749, 'samples': 4179264, 'steps': 21766, 'loss/train': 1.7273672819137573} -11/07/2021 00:18:05 - INFO - __main__ - Step 21768: {'lr': 0.0004783136383684342, 'samples': 4179456, 'steps': 21767, 'loss/train': 1.5977365970611572} -11/07/2021 00:18:05 - INFO - __main__ - Step 21769: {'lr': 0.0004783114764056188, 'samples': 4179648, 'steps': 21768, 'loss/train': 1.2280904054641724} -11/07/2021 00:18:05 - INFO - __main__ - Step 21770: {'lr': 0.00047830931433992985, 'samples': 4179840, 'steps': 21769, 'loss/train': 0.20790725946426392} -11/07/2021 00:18:07 - INFO - __main__ - Step 21771: {'lr': 0.00047830715217136825, 'samples': 4180032, 'steps': 21770, 'loss/train': 1.8650132417678833} -11/07/2021 00:18:07 - INFO - __main__ - Step 21772: {'lr': 0.000478304989899935, 'samples': 4180224, 'steps': 21771, 'loss/train': 1.264001488685608} -11/07/2021 00:18:07 - INFO - __main__ - Step 21773: {'lr': 0.00047830282752563103, 'samples': 4180416, 'steps': 21772, 'loss/train': 1.614505410194397} -11/07/2021 00:18:08 - INFO - __main__ - Step 21774: {'lr': 0.00047830066504845725, 'samples': 4180608, 'steps': 21773, 'loss/train': 1.6235742568969727} -11/07/2021 00:18:08 - INFO - __main__ - Step 21775: {'lr': 0.0004782985024684148, 'samples': 4180800, 'steps': 21774, 'loss/train': 1.3455910682678223} -11/07/2021 00:18:09 - INFO - __main__ - Step 21776: {'lr': 0.0004782963397855046, 'samples': 4180992, 'steps': 21775, 'loss/train': 1.3944709300994873} -11/07/2021 00:18:09 - INFO - __main__ - Step 21777: {'lr': 0.00047829417699972747, 'samples': 4181184, 'steps': 21776, 'loss/train': 1.57528555393219} -11/07/2021 00:18:10 - INFO - __main__ - Step 21778: {'lr': 0.0004782920141110846, 'samples': 4181376, 'steps': 21777, 'loss/train': 1.8353033065795898} -11/07/2021 00:18:10 - INFO - __main__ - Step 21779: {'lr': 0.0004782898511195768, 'samples': 4181568, 'steps': 21778, 'loss/train': 1.5532902479171753} -11/07/2021 00:18:10 - INFO - __main__ - Step 21780: {'lr': 0.00047828768802520515, 'samples': 4181760, 'steps': 21779, 'loss/train': 1.8849406242370605} -11/07/2021 00:18:11 - INFO - __main__ - Step 21781: {'lr': 0.0004782855248279706, 'samples': 4181952, 'steps': 21780, 'loss/train': 2.070675849914551} -11/07/2021 00:18:12 - INFO - __main__ - Step 21782: {'lr': 0.0004782833615278741, 'samples': 4182144, 'steps': 21781, 'loss/train': 1.6351349353790283} -11/07/2021 00:18:12 - INFO - __main__ - Step 21783: {'lr': 0.00047828119812491664, 'samples': 4182336, 'steps': 21782, 'loss/train': 1.5823655128479004} -11/07/2021 00:18:12 - INFO - __main__ - Step 21784: {'lr': 0.0004782790346190993, 'samples': 4182528, 'steps': 21783, 'loss/train': 1.455492377281189} -11/07/2021 00:18:13 - INFO - __main__ - Step 21785: {'lr': 0.00047827687101042283, 'samples': 4182720, 'steps': 21784, 'loss/train': 1.162865400314331} -11/07/2021 00:18:14 - INFO - __main__ - Step 21786: {'lr': 0.00047827470729888834, 'samples': 4182912, 'steps': 21785, 'loss/train': 1.6407850980758667} -11/07/2021 00:18:14 - INFO - __main__ - Step 21787: {'lr': 0.0004782725434844968, 'samples': 4183104, 'steps': 21786, 'loss/train': 1.9232147932052612} -11/07/2021 00:18:15 - INFO - __main__ - Step 21788: {'lr': 0.00047827037956724915, 'samples': 4183296, 'steps': 21787, 'loss/train': 1.6318410634994507} -11/07/2021 00:18:15 - INFO - __main__ - Step 21789: {'lr': 0.00047826821554714644, 'samples': 4183488, 'steps': 21788, 'loss/train': 1.4995194673538208} -11/07/2021 00:18:15 - INFO - __main__ - Step 21790: {'lr': 0.00047826605142418954, 'samples': 4183680, 'steps': 21789, 'loss/train': 1.456229329109192} -11/07/2021 00:18:17 - INFO - __main__ - Step 21791: {'lr': 0.0004782638871983795, 'samples': 4183872, 'steps': 21790, 'loss/train': 1.5134155750274658} -11/07/2021 00:18:17 - INFO - __main__ - Step 21792: {'lr': 0.0004782617228697173, 'samples': 4184064, 'steps': 21791, 'loss/train': 1.4779579639434814} -11/07/2021 00:18:17 - INFO - __main__ - Step 21793: {'lr': 0.0004782595584382039, 'samples': 4184256, 'steps': 21792, 'loss/train': 2.105910301208496} -11/07/2021 00:18:18 - INFO - __main__ - Step 21794: {'lr': 0.0004782573939038402, 'samples': 4184448, 'steps': 21793, 'loss/train': 1.5484576225280762} -11/07/2021 00:18:18 - INFO - __main__ - Step 21795: {'lr': 0.0004782552292666273, 'samples': 4184640, 'steps': 21794, 'loss/train': 0.4943452775478363} -11/07/2021 00:18:19 - INFO - __main__ - Step 21796: {'lr': 0.0004782530645265661, 'samples': 4184832, 'steps': 21795, 'loss/train': 1.8683432340621948} -11/07/2021 00:18:19 - INFO - __main__ - Step 21797: {'lr': 0.0004782508996836576, 'samples': 4185024, 'steps': 21796, 'loss/train': 1.6919738054275513} -11/07/2021 00:18:20 - INFO - __main__ - Step 21798: {'lr': 0.00047824873473790275, 'samples': 4185216, 'steps': 21797, 'loss/train': 1.65096914768219} -11/07/2021 00:18:20 - INFO - __main__ - Step 21799: {'lr': 0.0004782465696893025, 'samples': 4185408, 'steps': 21798, 'loss/train': 0.8809558749198914} -11/07/2021 00:18:20 - INFO - __main__ - Step 21800: {'lr': 0.0004782444045378579, 'samples': 4185600, 'steps': 21799, 'loss/train': 1.672647476196289} -11/07/2021 00:18:21 - INFO - __main__ - Step 21801: {'lr': 0.00047824223928356993, 'samples': 4185792, 'steps': 21800, 'loss/train': 1.561408281326294} -11/07/2021 00:18:22 - INFO - __main__ - Step 21802: {'lr': 0.0004782400739264395, 'samples': 4185984, 'steps': 21801, 'loss/train': 1.8260188102722168} -11/07/2021 00:18:22 - INFO - __main__ - Step 21803: {'lr': 0.00047823790846646764, 'samples': 4186176, 'steps': 21802, 'loss/train': 1.5481027364730835} -11/07/2021 00:18:23 - INFO - __main__ - Step 21804: {'lr': 0.0004782357429036553, 'samples': 4186368, 'steps': 21803, 'loss/train': 1.6464818716049194} -11/07/2021 00:18:23 - INFO - __main__ - Step 21805: {'lr': 0.00047823357723800344, 'samples': 4186560, 'steps': 21804, 'loss/train': 1.4024767875671387} -11/07/2021 00:18:23 - INFO - __main__ - Step 21806: {'lr': 0.000478231411469513, 'samples': 4186752, 'steps': 21805, 'loss/train': 1.3001028299331665} -11/07/2021 00:18:24 - INFO - __main__ - Step 21807: {'lr': 0.000478229245598185, 'samples': 4186944, 'steps': 21806, 'loss/train': 1.666137933731079} -11/07/2021 00:18:25 - INFO - __main__ - Step 21808: {'lr': 0.00047822707962402055, 'samples': 4187136, 'steps': 21807, 'loss/train': 1.8843587636947632} -11/07/2021 00:18:25 - INFO - __main__ - Step 21809: {'lr': 0.00047822491354702044, 'samples': 4187328, 'steps': 21808, 'loss/train': 1.8649508953094482} -11/07/2021 00:18:25 - INFO - __main__ - Step 21810: {'lr': 0.0004782227473671857, 'samples': 4187520, 'steps': 21809, 'loss/train': 1.851442575454712} -11/07/2021 00:18:26 - INFO - __main__ - Step 21811: {'lr': 0.00047822058108451727, 'samples': 4187712, 'steps': 21810, 'loss/train': 1.5848554372787476} -11/07/2021 00:18:27 - INFO - __main__ - Step 21812: {'lr': 0.0004782184146990162, 'samples': 4187904, 'steps': 21811, 'loss/train': 0.5069980025291443} -11/07/2021 00:18:27 - INFO - __main__ - Step 21813: {'lr': 0.00047821624821068346, 'samples': 4188096, 'steps': 21812, 'loss/train': 1.5223522186279297} -11/07/2021 00:18:28 - INFO - __main__ - Step 21814: {'lr': 0.00047821408161952, 'samples': 4188288, 'steps': 21813, 'loss/train': 1.8222025632858276} -11/07/2021 00:18:28 - INFO - __main__ - Step 21815: {'lr': 0.00047821191492552676, 'samples': 4188480, 'steps': 21814, 'loss/train': 1.5835494995117188} -11/07/2021 00:18:28 - INFO - __main__ - Step 21816: {'lr': 0.00047820974812870477, 'samples': 4188672, 'steps': 21815, 'loss/train': 1.3906757831573486} -11/07/2021 00:18:29 - INFO - __main__ - Step 21817: {'lr': 0.00047820758122905493, 'samples': 4188864, 'steps': 21816, 'loss/train': 0.9313063621520996} -11/07/2021 00:18:29 - INFO - __main__ - Step 21818: {'lr': 0.0004782054142265784, 'samples': 4189056, 'steps': 21817, 'loss/train': 1.363304853439331} -11/07/2021 00:18:30 - INFO - __main__ - Step 21819: {'lr': 0.00047820324712127593, 'samples': 4189248, 'steps': 21818, 'loss/train': 1.2986811399459839} -11/07/2021 00:18:30 - INFO - __main__ - Step 21820: {'lr': 0.0004782010799131487, 'samples': 4189440, 'steps': 21819, 'loss/train': 1.870723843574524} -11/07/2021 00:18:31 - INFO - __main__ - Step 21821: {'lr': 0.0004781989126021975, 'samples': 4189632, 'steps': 21820, 'loss/train': 1.8027942180633545} -11/07/2021 00:18:31 - INFO - __main__ - Step 21822: {'lr': 0.00047819674518842335, 'samples': 4189824, 'steps': 21821, 'loss/train': 2.168245792388916} -11/07/2021 00:18:32 - INFO - __main__ - Step 21823: {'lr': 0.00047819457767182735, 'samples': 4190016, 'steps': 21822, 'loss/train': 1.800366997718811} -11/07/2021 00:18:32 - INFO - __main__ - Step 21824: {'lr': 0.0004781924100524104, 'samples': 4190208, 'steps': 21823, 'loss/train': 1.727982997894287} -11/07/2021 00:18:33 - INFO - __main__ - Step 21825: {'lr': 0.00047819024233017337, 'samples': 4190400, 'steps': 21824, 'loss/train': 1.5247220993041992} -11/07/2021 00:18:33 - INFO - __main__ - Step 21826: {'lr': 0.00047818807450511746, 'samples': 4190592, 'steps': 21825, 'loss/train': 1.1852495670318604} -11/07/2021 00:18:34 - INFO - __main__ - Step 21827: {'lr': 0.00047818590657724345, 'samples': 4190784, 'steps': 21826, 'loss/train': 1.8680647611618042} -11/07/2021 00:18:34 - INFO - __main__ - Step 21828: {'lr': 0.0004781837385465524, 'samples': 4190976, 'steps': 21827, 'loss/train': 1.8202399015426636} -11/07/2021 00:18:35 - INFO - __main__ - Step 21829: {'lr': 0.00047818157041304535, 'samples': 4191168, 'steps': 21828, 'loss/train': 1.9058685302734375} -11/07/2021 00:18:35 - INFO - __main__ - Step 21830: {'lr': 0.00047817940217672315, 'samples': 4191360, 'steps': 21829, 'loss/train': 1.6217126846313477} -11/07/2021 00:18:35 - INFO - __main__ - Step 21831: {'lr': 0.0004781772338375868, 'samples': 4191552, 'steps': 21830, 'loss/train': 1.5916210412979126} -11/07/2021 00:18:36 - INFO - __main__ - Step 21832: {'lr': 0.0004781750653956374, 'samples': 4191744, 'steps': 21831, 'loss/train': 1.7649997472763062} -11/07/2021 00:18:37 - INFO - __main__ - Step 21833: {'lr': 0.00047817289685087575, 'samples': 4191936, 'steps': 21832, 'loss/train': 1.5090216398239136} -11/07/2021 00:18:37 - INFO - __main__ - Step 21834: {'lr': 0.00047817072820330287, 'samples': 4192128, 'steps': 21833, 'loss/train': 0.29298678040504456} -11/07/2021 00:18:37 - INFO - __main__ - Step 21835: {'lr': 0.0004781685594529199, 'samples': 4192320, 'steps': 21834, 'loss/train': 1.3522447347640991} -11/07/2021 00:18:38 - INFO - __main__ - Step 21836: {'lr': 0.00047816639059972767, 'samples': 4192512, 'steps': 21835, 'loss/train': 1.8226150274276733} -11/07/2021 00:18:39 - INFO - __main__ - Step 21837: {'lr': 0.00047816422164372713, 'samples': 4192704, 'steps': 21836, 'loss/train': 1.258782982826233} -11/07/2021 00:18:39 - INFO - __main__ - Step 21838: {'lr': 0.00047816205258491935, 'samples': 4192896, 'steps': 21837, 'loss/train': 1.8745602369308472} -11/07/2021 00:18:40 - INFO - __main__ - Step 21839: {'lr': 0.0004781598834233053, 'samples': 4193088, 'steps': 21838, 'loss/train': 2.18178653717041} -11/07/2021 00:18:40 - INFO - __main__ - Step 21840: {'lr': 0.0004781577141588859, 'samples': 4193280, 'steps': 21839, 'loss/train': 2.1624045372009277} -11/07/2021 00:18:40 - INFO - __main__ - Step 21841: {'lr': 0.0004781555447916621, 'samples': 4193472, 'steps': 21840, 'loss/train': 1.661039113998413} -11/07/2021 00:18:41 - INFO - __main__ - Step 21842: {'lr': 0.000478153375321635, 'samples': 4193664, 'steps': 21841, 'loss/train': 1.5614854097366333} -11/07/2021 00:18:42 - INFO - __main__ - Step 21843: {'lr': 0.0004781512057488055, 'samples': 4193856, 'steps': 21842, 'loss/train': 1.4372495412826538} -11/07/2021 00:18:42 - INFO - __main__ - Step 21844: {'lr': 0.00047814903607317454, 'samples': 4194048, 'steps': 21843, 'loss/train': 1.4852203130722046} -11/07/2021 00:18:42 - INFO - __main__ - Step 21845: {'lr': 0.00047814686629474323, 'samples': 4194240, 'steps': 21844, 'loss/train': 1.8648353815078735} -11/07/2021 00:18:43 - INFO - __main__ - Step 21846: {'lr': 0.00047814469641351237, 'samples': 4194432, 'steps': 21845, 'loss/train': 1.8701627254486084} -11/07/2021 00:18:43 - INFO - __main__ - Step 21847: {'lr': 0.0004781425264294831, 'samples': 4194624, 'steps': 21846, 'loss/train': 0.418106347322464} -11/07/2021 00:18:44 - INFO - __main__ - Step 21848: {'lr': 0.0004781403563426563, 'samples': 4194816, 'steps': 21847, 'loss/train': 0.14467741549015045} -11/07/2021 00:18:44 - INFO - __main__ - Step 21849: {'lr': 0.00047813818615303295, 'samples': 4195008, 'steps': 21848, 'loss/train': 1.6116589307785034} -11/07/2021 00:18:45 - INFO - __main__ - Step 21850: {'lr': 0.00047813601586061414, 'samples': 4195200, 'steps': 21849, 'loss/train': 1.225780725479126} -11/07/2021 00:18:45 - INFO - __main__ - Step 21851: {'lr': 0.0004781338454654007, 'samples': 4195392, 'steps': 21850, 'loss/train': 1.4589381217956543} -11/07/2021 00:18:45 - INFO - __main__ - Step 21852: {'lr': 0.00047813167496739363, 'samples': 4195584, 'steps': 21851, 'loss/train': 1.6310547590255737} -11/07/2021 00:18:47 - INFO - __main__ - Step 21853: {'lr': 0.00047812950436659405, 'samples': 4195776, 'steps': 21852, 'loss/train': 1.6144341230392456} -11/07/2021 00:18:47 - INFO - __main__ - Step 21854: {'lr': 0.0004781273336630028, 'samples': 4195968, 'steps': 21853, 'loss/train': 1.7650673389434814} -11/07/2021 00:18:47 - INFO - __main__ - Step 21855: {'lr': 0.00047812516285662086, 'samples': 4196160, 'steps': 21854, 'loss/train': 1.2556949853897095} -11/07/2021 00:18:48 - INFO - __main__ - Step 21856: {'lr': 0.00047812299194744924, 'samples': 4196352, 'steps': 21855, 'loss/train': 1.4601771831512451} -11/07/2021 00:18:48 - INFO - __main__ - Step 21857: {'lr': 0.0004781208209354889, 'samples': 4196544, 'steps': 21856, 'loss/train': 1.820651888847351} -11/07/2021 00:18:49 - INFO - __main__ - Step 21858: {'lr': 0.00047811864982074087, 'samples': 4196736, 'steps': 21857, 'loss/train': 1.4750192165374756} -11/07/2021 00:18:49 - INFO - __main__ - Step 21859: {'lr': 0.0004781164786032061, 'samples': 4196928, 'steps': 21858, 'loss/train': 0.9147158265113831} -11/07/2021 00:18:50 - INFO - __main__ - Step 21860: {'lr': 0.0004781143072828856, 'samples': 4197120, 'steps': 21859, 'loss/train': 1.3358899354934692} -11/07/2021 00:18:50 - INFO - __main__ - Step 21861: {'lr': 0.00047811213585978023, 'samples': 4197312, 'steps': 21860, 'loss/train': 1.5927478075027466} -11/07/2021 00:18:50 - INFO - __main__ - Step 21862: {'lr': 0.0004781099643338911, 'samples': 4197504, 'steps': 21861, 'loss/train': 1.585418701171875} -11/07/2021 00:18:51 - INFO - __main__ - Step 21863: {'lr': 0.00047810779270521914, 'samples': 4197696, 'steps': 21862, 'loss/train': 1.556623101234436} -11/07/2021 00:18:52 - INFO - __main__ - Step 21864: {'lr': 0.0004781056209737653, 'samples': 4197888, 'steps': 21863, 'loss/train': 1.2449383735656738} -11/07/2021 00:18:52 - INFO - __main__ - Step 21865: {'lr': 0.00047810344913953065, 'samples': 4198080, 'steps': 21864, 'loss/train': 1.4618579149246216} -11/07/2021 00:18:52 - INFO - __main__ - Step 21866: {'lr': 0.0004781012772025161, 'samples': 4198272, 'steps': 21865, 'loss/train': 1.6904577016830444} -11/07/2021 00:18:53 - INFO - __main__ - Step 21867: {'lr': 0.0004780991051627226, 'samples': 4198464, 'steps': 21866, 'loss/train': 1.2188726663589478} -11/07/2021 00:18:53 - INFO - __main__ - Step 21868: {'lr': 0.0004780969330201511, 'samples': 4198656, 'steps': 21867, 'loss/train': 2.0451176166534424} -11/07/2021 00:18:54 - INFO - __main__ - Step 21869: {'lr': 0.0004780947607748027, 'samples': 4198848, 'steps': 21868, 'loss/train': 1.7905349731445312} -11/07/2021 00:18:55 - INFO - __main__ - Step 21870: {'lr': 0.00047809258842667837, 'samples': 4199040, 'steps': 21869, 'loss/train': 1.1601496934890747} -11/07/2021 00:18:55 - INFO - __main__ - Step 21871: {'lr': 0.000478090415975779, 'samples': 4199232, 'steps': 21870, 'loss/train': 1.764669418334961} -11/07/2021 00:18:55 - INFO - __main__ - Step 21872: {'lr': 0.00047808824342210565, 'samples': 4199424, 'steps': 21871, 'loss/train': 2.10385799407959} -11/07/2021 00:18:56 - INFO - __main__ - Step 21873: {'lr': 0.0004780860707656592, 'samples': 4199616, 'steps': 21872, 'loss/train': 1.9181289672851562} -11/07/2021 00:18:57 - INFO - __main__ - Step 21874: {'lr': 0.0004780838980064407, 'samples': 4199808, 'steps': 21873, 'loss/train': 1.509691596031189} -11/07/2021 00:18:57 - INFO - __main__ - Step 21875: {'lr': 0.00047808172514445115, 'samples': 4200000, 'steps': 21874, 'loss/train': 1.487251877784729} -11/07/2021 00:18:57 - INFO - __main__ - Step 21876: {'lr': 0.0004780795521796914, 'samples': 4200192, 'steps': 21875, 'loss/train': 1.7136597633361816} -11/07/2021 00:18:58 - INFO - __main__ - Step 21877: {'lr': 0.0004780773791121626, 'samples': 4200384, 'steps': 21876, 'loss/train': 1.5490812063217163} -11/07/2021 00:18:58 - INFO - __main__ - Step 21878: {'lr': 0.0004780752059418656, 'samples': 4200576, 'steps': 21877, 'loss/train': 1.2752032279968262} -11/07/2021 00:18:59 - INFO - __main__ - Step 21879: {'lr': 0.0004780730326688015, 'samples': 4200768, 'steps': 21878, 'loss/train': 5.443384170532227} -11/07/2021 00:19:00 - INFO - __main__ - Step 21880: {'lr': 0.0004780708592929712, 'samples': 4200960, 'steps': 21879, 'loss/train': 1.6154052019119263} -11/07/2021 00:19:00 - INFO - __main__ - Step 21881: {'lr': 0.0004780686858143756, 'samples': 4201152, 'steps': 21880, 'loss/train': 1.7930195331573486} -11/07/2021 00:19:00 - INFO - __main__ - Step 21882: {'lr': 0.0004780665122330159, 'samples': 4201344, 'steps': 21881, 'loss/train': 1.518471360206604} -11/07/2021 00:19:01 - INFO - __main__ - Step 21883: {'lr': 0.00047806433854889285, 'samples': 4201536, 'steps': 21882, 'loss/train': 0.8893343210220337} -11/07/2021 00:19:01 - INFO - __main__ - Step 21884: {'lr': 0.0004780621647620076, 'samples': 4201728, 'steps': 21883, 'loss/train': 0.4408738613128662} -11/07/2021 00:19:02 - INFO - __main__ - Step 21885: {'lr': 0.00047805999087236097, 'samples': 4201920, 'steps': 21884, 'loss/train': 2.2122480869293213} -11/07/2021 00:19:02 - INFO - __main__ - Step 21886: {'lr': 0.0004780578168799541, 'samples': 4202112, 'steps': 21885, 'loss/train': 0.9583873748779297} -11/07/2021 00:19:03 - INFO - __main__ - Step 21887: {'lr': 0.00047805564278478787, 'samples': 4202304, 'steps': 21886, 'loss/train': 1.2693642377853394} -11/07/2021 00:19:03 - INFO - __main__ - Step 21888: {'lr': 0.00047805346858686325, 'samples': 4202496, 'steps': 21887, 'loss/train': 2.000314474105835} -11/07/2021 00:19:03 - INFO - __main__ - Step 21889: {'lr': 0.0004780512942861813, 'samples': 4202688, 'steps': 21888, 'loss/train': 1.3067866563796997} -11/07/2021 00:19:04 - INFO - __main__ - Step 21890: {'lr': 0.00047804911988274303, 'samples': 4202880, 'steps': 21889, 'loss/train': 1.678052544593811} -11/07/2021 00:19:05 - INFO - __main__ - Step 21891: {'lr': 0.00047804694537654927, 'samples': 4203072, 'steps': 21890, 'loss/train': 1.5158631801605225} -11/07/2021 00:19:05 - INFO - __main__ - Step 21892: {'lr': 0.00047804477076760106, 'samples': 4203264, 'steps': 21891, 'loss/train': 1.5687859058380127} -11/07/2021 00:19:06 - INFO - __main__ - Step 21893: {'lr': 0.0004780425960558994, 'samples': 4203456, 'steps': 21892, 'loss/train': 1.5470932722091675} -11/07/2021 00:19:06 - INFO - __main__ - Step 21894: {'lr': 0.00047804042124144526, 'samples': 4203648, 'steps': 21893, 'loss/train': 1.7719433307647705} -11/07/2021 00:19:07 - INFO - __main__ - Step 21895: {'lr': 0.00047803824632423967, 'samples': 4203840, 'steps': 21894, 'loss/train': 1.6650912761688232} -11/07/2021 00:19:07 - INFO - __main__ - Step 21896: {'lr': 0.0004780360713042835, 'samples': 4204032, 'steps': 21895, 'loss/train': 1.5138376951217651} -11/07/2021 00:19:08 - INFO - __main__ - Step 21897: {'lr': 0.0004780338961815779, 'samples': 4204224, 'steps': 21896, 'loss/train': 2.1411073207855225} -11/07/2021 00:19:08 - INFO - __main__ - Step 21898: {'lr': 0.00047803172095612365, 'samples': 4204416, 'steps': 21897, 'loss/train': 1.6470144987106323} -11/07/2021 00:19:08 - INFO - __main__ - Step 21899: {'lr': 0.00047802954562792185, 'samples': 4204608, 'steps': 21898, 'loss/train': 1.3572453260421753} -11/07/2021 00:19:09 - INFO - __main__ - Step 21900: {'lr': 0.0004780273701969734, 'samples': 4204800, 'steps': 21899, 'loss/train': 1.491538405418396} -11/07/2021 00:19:10 - INFO - __main__ - Step 21901: {'lr': 0.00047802519466327945, 'samples': 4204992, 'steps': 21900, 'loss/train': 2.107398509979248} -11/07/2021 00:19:10 - INFO - __main__ - Step 21902: {'lr': 0.00047802301902684076, 'samples': 4205184, 'steps': 21901, 'loss/train': 1.5457367897033691} -11/07/2021 00:19:10 - INFO - __main__ - Step 21903: {'lr': 0.0004780208432876585, 'samples': 4205376, 'steps': 21902, 'loss/train': 1.2147682905197144} -11/07/2021 00:19:11 - INFO - __main__ - Step 21904: {'lr': 0.00047801866744573353, 'samples': 4205568, 'steps': 21903, 'loss/train': 1.2499436140060425} -11/07/2021 00:19:12 - INFO - __main__ - Step 21905: {'lr': 0.00047801649150106684, 'samples': 4205760, 'steps': 21904, 'loss/train': 1.9765163660049438} -11/07/2021 00:19:12 - INFO - __main__ - Step 21906: {'lr': 0.00047801431545365947, 'samples': 4205952, 'steps': 21905, 'loss/train': 1.6405918598175049} -11/07/2021 00:19:13 - INFO - __main__ - Step 21907: {'lr': 0.0004780121393035124, 'samples': 4206144, 'steps': 21906, 'loss/train': 1.492367148399353} -11/07/2021 00:19:13 - INFO - __main__ - Step 21908: {'lr': 0.0004780099630506265, 'samples': 4206336, 'steps': 21907, 'loss/train': 1.6051231622695923} -11/07/2021 00:19:13 - INFO - __main__ - Step 21909: {'lr': 0.0004780077866950029, 'samples': 4206528, 'steps': 21908, 'loss/train': 5.938828945159912} -11/07/2021 00:19:14 - INFO - __main__ - Step 21910: {'lr': 0.00047800561023664246, 'samples': 4206720, 'steps': 21909, 'loss/train': 1.5359915494918823} -11/07/2021 00:19:15 - INFO - __main__ - Step 21911: {'lr': 0.0004780034336755462, 'samples': 4206912, 'steps': 21910, 'loss/train': 2.409712314605713} -11/07/2021 00:19:15 - INFO - __main__ - Step 21912: {'lr': 0.00047800125701171517, 'samples': 4207104, 'steps': 21911, 'loss/train': 1.6394217014312744} -11/07/2021 00:19:15 - INFO - __main__ - Step 21913: {'lr': 0.00047799908024515026, 'samples': 4207296, 'steps': 21912, 'loss/train': 1.683571457862854} -11/07/2021 00:19:16 - INFO - __main__ - Step 21914: {'lr': 0.0004779969033758525, 'samples': 4207488, 'steps': 21913, 'loss/train': 1.252291202545166} -11/07/2021 00:19:16 - INFO - __main__ - Step 21915: {'lr': 0.00047799472640382287, 'samples': 4207680, 'steps': 21914, 'loss/train': 1.8091762065887451} -11/07/2021 00:19:17 - INFO - __main__ - Step 21916: {'lr': 0.0004779925493290623, 'samples': 4207872, 'steps': 21915, 'loss/train': 1.6336859464645386} -11/07/2021 00:19:17 - INFO - __main__ - Step 21917: {'lr': 0.00047799037215157184, 'samples': 4208064, 'steps': 21916, 'loss/train': 1.4064269065856934} -11/07/2021 00:19:18 - INFO - __main__ - Step 21918: {'lr': 0.0004779881948713524, 'samples': 4208256, 'steps': 21917, 'loss/train': 1.3182247877120972} -11/07/2021 00:19:18 - INFO - __main__ - Step 21919: {'lr': 0.000477986017488405, 'samples': 4208448, 'steps': 21918, 'loss/train': 1.4684267044067383} -11/07/2021 00:19:18 - INFO - __main__ - Step 21920: {'lr': 0.00047798384000273053, 'samples': 4208640, 'steps': 21919, 'loss/train': 0.6165792346000671} -11/07/2021 00:19:20 - INFO - __main__ - Step 21921: {'lr': 0.0004779816624143302, 'samples': 4208832, 'steps': 21920, 'loss/train': 1.593778371810913} -11/07/2021 00:19:20 - INFO - __main__ - Step 21922: {'lr': 0.0004779794847232048, 'samples': 4209024, 'steps': 21921, 'loss/train': 0.12900973856449127} -11/07/2021 00:19:20 - INFO - __main__ - Step 21923: {'lr': 0.0004779773069293554, 'samples': 4209216, 'steps': 21922, 'loss/train': 1.0907976627349854} -11/07/2021 00:19:21 - INFO - __main__ - Step 21924: {'lr': 0.00047797512903278283, 'samples': 4209408, 'steps': 21923, 'loss/train': 1.5280829668045044} -11/07/2021 00:19:21 - INFO - __main__ - Step 21925: {'lr': 0.0004779729510334883, 'samples': 4209600, 'steps': 21924, 'loss/train': 1.7411478757858276} -11/07/2021 00:19:22 - INFO - __main__ - Step 21926: {'lr': 0.0004779707729314726, 'samples': 4209792, 'steps': 21925, 'loss/train': 1.3452696800231934} -11/07/2021 00:19:22 - INFO - __main__ - Step 21927: {'lr': 0.0004779685947267369, 'samples': 4209984, 'steps': 21926, 'loss/train': 1.8387231826782227} -11/07/2021 00:19:23 - INFO - __main__ - Step 21928: {'lr': 0.00047796641641928195, 'samples': 4210176, 'steps': 21927, 'loss/train': 1.7874184846878052} -11/07/2021 00:19:23 - INFO - __main__ - Step 21929: {'lr': 0.00047796423800910894, 'samples': 4210368, 'steps': 21928, 'loss/train': 1.862120270729065} -11/07/2021 00:19:23 - INFO - __main__ - Step 21930: {'lr': 0.00047796205949621873, 'samples': 4210560, 'steps': 21929, 'loss/train': 0.7199652791023254} -11/07/2021 00:19:24 - INFO - __main__ - Step 21931: {'lr': 0.00047795988088061224, 'samples': 4210752, 'steps': 21930, 'loss/train': 1.5282775163650513} -11/07/2021 00:19:25 - INFO - __main__ - Step 21932: {'lr': 0.00047795770216229065, 'samples': 4210944, 'steps': 21931, 'loss/train': 1.4960988759994507} -11/07/2021 00:19:25 - INFO - __main__ - Step 21933: {'lr': 0.0004779555233412548, 'samples': 4211136, 'steps': 21932, 'loss/train': 1.548005223274231} -11/07/2021 00:19:25 - INFO - __main__ - Step 21934: {'lr': 0.0004779533444175058, 'samples': 4211328, 'steps': 21933, 'loss/train': 1.737036108970642} -11/07/2021 00:19:26 - INFO - __main__ - Step 21935: {'lr': 0.00047795116539104445, 'samples': 4211520, 'steps': 21934, 'loss/train': 0.9867969751358032} -11/07/2021 00:19:27 - INFO - __main__ - Step 21936: {'lr': 0.0004779489862618718, 'samples': 4211712, 'steps': 21935, 'loss/train': 1.5135012865066528} -11/07/2021 00:19:27 - INFO - __main__ - Step 21937: {'lr': 0.00047794680702998893, 'samples': 4211904, 'steps': 21936, 'loss/train': 1.431929588317871} -11/07/2021 00:19:28 - INFO - __main__ - Step 21938: {'lr': 0.0004779446276953967, 'samples': 4212096, 'steps': 21937, 'loss/train': 1.4647678136825562} -11/07/2021 00:19:28 - INFO - __main__ - Step 21939: {'lr': 0.00047794244825809614, 'samples': 4212288, 'steps': 21938, 'loss/train': 1.3799632787704468} -11/07/2021 00:19:28 - INFO - __main__ - Step 21940: {'lr': 0.0004779402687180882, 'samples': 4212480, 'steps': 21939, 'loss/train': 1.5208247900009155} -11/07/2021 00:19:29 - INFO - __main__ - Step 21941: {'lr': 0.00047793808907537394, 'samples': 4212672, 'steps': 21940, 'loss/train': 0.8766080141067505} -11/07/2021 00:19:29 - INFO - __main__ - Step 21942: {'lr': 0.0004779359093299543, 'samples': 4212864, 'steps': 21941, 'loss/train': 1.755677342414856} -11/07/2021 00:19:30 - INFO - __main__ - Step 21943: {'lr': 0.00047793372948183024, 'samples': 4213056, 'steps': 21942, 'loss/train': 1.6062308549880981} -11/07/2021 00:19:30 - INFO - __main__ - Step 21944: {'lr': 0.0004779315495310027, 'samples': 4213248, 'steps': 21943, 'loss/train': 1.1306722164154053} -11/07/2021 00:19:31 - INFO - __main__ - Step 21945: {'lr': 0.00047792936947747285, 'samples': 4213440, 'steps': 21944, 'loss/train': 1.6972370147705078} -11/07/2021 00:19:32 - INFO - __main__ - Step 21946: {'lr': 0.00047792718932124147, 'samples': 4213632, 'steps': 21945, 'loss/train': 1.8011847734451294} -11/07/2021 00:19:32 - INFO - __main__ - Step 21947: {'lr': 0.00047792500906230963, 'samples': 4213824, 'steps': 21946, 'loss/train': 1.8816180229187012} -11/07/2021 00:19:32 - INFO - __main__ - Step 21948: {'lr': 0.00047792282870067827, 'samples': 4214016, 'steps': 21947, 'loss/train': 1.5840351581573486} -11/07/2021 00:19:33 - INFO - __main__ - Step 21949: {'lr': 0.0004779206482363484, 'samples': 4214208, 'steps': 21948, 'loss/train': 1.393857479095459} -11/07/2021 00:19:33 - INFO - __main__ - Step 21950: {'lr': 0.000477918467669321, 'samples': 4214400, 'steps': 21949, 'loss/train': 1.2116628885269165} -11/07/2021 00:19:33 - INFO - __main__ - Step 21951: {'lr': 0.0004779162869995971, 'samples': 4214592, 'steps': 21950, 'loss/train': 1.45814049243927} -11/07/2021 00:19:34 - INFO - __main__ - Step 21952: {'lr': 0.00047791410622717757, 'samples': 4214784, 'steps': 21951, 'loss/train': 1.6132930517196655} -11/07/2021 00:19:35 - INFO - __main__ - Step 21953: {'lr': 0.0004779119253520635, 'samples': 4214976, 'steps': 21952, 'loss/train': 0.9097754955291748} -11/07/2021 00:19:35 - INFO - __main__ - Step 21954: {'lr': 0.0004779097443742558, 'samples': 4215168, 'steps': 21953, 'loss/train': 1.3216646909713745} -11/07/2021 00:19:35 - INFO - __main__ - Step 21955: {'lr': 0.0004779075632937556, 'samples': 4215360, 'steps': 21954, 'loss/train': 1.2813609838485718} -11/07/2021 00:19:36 - INFO - __main__ - Step 21956: {'lr': 0.00047790538211056366, 'samples': 4215552, 'steps': 21955, 'loss/train': 1.931445837020874} -11/07/2021 00:19:37 - INFO - __main__ - Step 21957: {'lr': 0.00047790320082468106, 'samples': 4215744, 'steps': 21956, 'loss/train': 1.242431879043579} -11/07/2021 00:19:37 - INFO - __main__ - Step 21958: {'lr': 0.00047790101943610884, 'samples': 4215936, 'steps': 21957, 'loss/train': 1.5784425735473633} -11/07/2021 00:19:37 - INFO - __main__ - Step 21959: {'lr': 0.000477898837944848, 'samples': 4216128, 'steps': 21958, 'loss/train': 1.6640866994857788} -11/07/2021 00:19:38 - INFO - __main__ - Step 21960: {'lr': 0.0004778966563508994, 'samples': 4216320, 'steps': 21959, 'loss/train': 1.7045584917068481} -11/07/2021 00:19:38 - INFO - __main__ - Step 21961: {'lr': 0.00047789447465426406, 'samples': 4216512, 'steps': 21960, 'loss/train': 1.3044613599777222} -11/07/2021 00:19:39 - INFO - __main__ - Step 21962: {'lr': 0.000477892292854943, 'samples': 4216704, 'steps': 21961, 'loss/train': 0.78977370262146} -11/07/2021 00:19:40 - INFO - __main__ - Step 21963: {'lr': 0.00047789011095293723, 'samples': 4216896, 'steps': 21962, 'loss/train': 0.40516743063926697} -11/07/2021 00:19:40 - INFO - __main__ - Step 21964: {'lr': 0.0004778879289482476, 'samples': 4217088, 'steps': 21963, 'loss/train': 1.4810577630996704} -11/07/2021 00:19:40 - INFO - __main__ - Step 21965: {'lr': 0.00047788574684087527, 'samples': 4217280, 'steps': 21964, 'loss/train': 1.5655182600021362} -11/07/2021 00:19:41 - INFO - __main__ - Step 21966: {'lr': 0.0004778835646308211, 'samples': 4217472, 'steps': 21965, 'loss/train': 1.6509648561477661} -11/07/2021 00:19:42 - INFO - __main__ - Step 21967: {'lr': 0.0004778813823180861, 'samples': 4217664, 'steps': 21966, 'loss/train': 1.6567872762680054} -11/07/2021 00:19:42 - INFO - __main__ - Step 21968: {'lr': 0.0004778791999026713, 'samples': 4217856, 'steps': 21967, 'loss/train': 1.728704810142517} -11/07/2021 00:19:42 - INFO - __main__ - Step 21969: {'lr': 0.0004778770173845777, 'samples': 4218048, 'steps': 21968, 'loss/train': 1.5943408012390137} -11/07/2021 00:19:43 - INFO - __main__ - Step 21970: {'lr': 0.00047787483476380613, 'samples': 4218240, 'steps': 21969, 'loss/train': 1.6115553379058838} -11/07/2021 00:19:43 - INFO - __main__ - Step 21971: {'lr': 0.0004778726520403577, 'samples': 4218432, 'steps': 21970, 'loss/train': 2.4777019023895264} -11/07/2021 00:19:44 - INFO - __main__ - Step 21972: {'lr': 0.00047787046921423336, 'samples': 4218624, 'steps': 21971, 'loss/train': 1.0873228311538696} -11/07/2021 00:19:45 - INFO - __main__ - Step 21973: {'lr': 0.00047786828628543416, 'samples': 4218816, 'steps': 21972, 'loss/train': 1.61286199092865} -11/07/2021 00:19:45 - INFO - __main__ - Step 21974: {'lr': 0.00047786610325396096, 'samples': 4219008, 'steps': 21973, 'loss/train': 1.5641791820526123} -11/07/2021 00:19:45 - INFO - __main__ - Step 21975: {'lr': 0.0004778639201198149, 'samples': 4219200, 'steps': 21974, 'loss/train': 1.5207573175430298} -11/07/2021 00:19:46 - INFO - __main__ - Step 21976: {'lr': 0.00047786173688299684, 'samples': 4219392, 'steps': 21975, 'loss/train': 2.1882331371307373} -11/07/2021 00:19:46 - INFO - __main__ - Step 21977: {'lr': 0.00047785955354350776, 'samples': 4219584, 'steps': 21976, 'loss/train': 1.2902092933654785} -11/07/2021 00:19:47 - INFO - __main__ - Step 21978: {'lr': 0.00047785737010134865, 'samples': 4219776, 'steps': 21977, 'loss/train': 1.2863267660140991} -11/07/2021 00:19:47 - INFO - __main__ - Step 21979: {'lr': 0.0004778551865565206, 'samples': 4219968, 'steps': 21978, 'loss/train': 1.791292667388916} -11/07/2021 00:19:48 - INFO - __main__ - Step 21980: {'lr': 0.00047785300290902446, 'samples': 4220160, 'steps': 21979, 'loss/train': 1.2760604619979858} -11/07/2021 00:19:48 - INFO - __main__ - Step 21981: {'lr': 0.0004778508191588613, 'samples': 4220352, 'steps': 21980, 'loss/train': 1.6339510679244995} -11/07/2021 00:19:48 - INFO - __main__ - Step 21982: {'lr': 0.00047784863530603213, 'samples': 4220544, 'steps': 21981, 'loss/train': 1.3932080268859863} -11/07/2021 00:19:49 - INFO - __main__ - Step 21983: {'lr': 0.0004778464513505378, 'samples': 4220736, 'steps': 21982, 'loss/train': 1.6483728885650635} -11/07/2021 00:19:50 - INFO - __main__ - Step 21984: {'lr': 0.0004778442672923794, 'samples': 4220928, 'steps': 21983, 'loss/train': 1.459287166595459} -11/07/2021 00:19:50 - INFO - __main__ - Step 21985: {'lr': 0.0004778420831315579, 'samples': 4221120, 'steps': 21984, 'loss/train': 1.1991043090820312} -11/07/2021 00:19:50 - INFO - __main__ - Step 21986: {'lr': 0.0004778398988680743, 'samples': 4221312, 'steps': 21985, 'loss/train': 1.7007657289505005} -11/07/2021 00:19:51 - INFO - __main__ - Step 21987: {'lr': 0.00047783771450192946, 'samples': 4221504, 'steps': 21986, 'loss/train': 1.4460031986236572} -11/07/2021 00:19:52 - INFO - __main__ - Step 21988: {'lr': 0.00047783553003312456, 'samples': 4221696, 'steps': 21987, 'loss/train': 1.7444876432418823} -11/07/2021 00:19:52 - INFO - __main__ - Step 21989: {'lr': 0.00047783334546166046, 'samples': 4221888, 'steps': 21988, 'loss/train': 1.6182039976119995} -11/07/2021 00:19:52 - INFO - __main__ - Step 21990: {'lr': 0.0004778311607875382, 'samples': 4222080, 'steps': 21989, 'loss/train': 1.2163879871368408} -11/07/2021 00:19:53 - INFO - __main__ - Step 21991: {'lr': 0.0004778289760107587, 'samples': 4222272, 'steps': 21990, 'loss/train': 1.4696317911148071} -11/07/2021 00:19:53 - INFO - __main__ - Step 21992: {'lr': 0.00047782679113132293, 'samples': 4222464, 'steps': 21991, 'loss/train': 1.7996553182601929} -11/07/2021 00:19:54 - INFO - __main__ - Step 21993: {'lr': 0.00047782460614923195, 'samples': 4222656, 'steps': 21992, 'loss/train': 1.3140223026275635} -11/07/2021 00:19:55 - INFO - __main__ - Step 21994: {'lr': 0.00047782242106448675, 'samples': 4222848, 'steps': 21993, 'loss/train': 1.7597932815551758} -11/07/2021 00:19:55 - INFO - __main__ - Step 21995: {'lr': 0.00047782023587708826, 'samples': 4223040, 'steps': 21994, 'loss/train': 1.2252593040466309} -11/07/2021 00:19:55 - INFO - __main__ - Step 21996: {'lr': 0.0004778180505870375, 'samples': 4223232, 'steps': 21995, 'loss/train': 1.802703619003296} -11/07/2021 00:19:56 - INFO - __main__ - Step 21997: {'lr': 0.0004778158651943355, 'samples': 4223424, 'steps': 21996, 'loss/train': 1.5296212434768677} -11/07/2021 00:19:57 - INFO - __main__ - Step 21998: {'lr': 0.0004778136796989831, 'samples': 4223616, 'steps': 21997, 'loss/train': 1.3799338340759277} -11/07/2021 00:19:57 - INFO - __main__ - Step 21999: {'lr': 0.0004778114941009814, 'samples': 4223808, 'steps': 21998, 'loss/train': 1.5359055995941162} -11/07/2021 00:19:58 - INFO - __main__ - Step 22000: {'lr': 0.0004778093084003313, 'samples': 4224000, 'steps': 21999, 'loss/train': 1.4692944288253784} -11/07/2021 00:19:58 - INFO - __main__ - Step 22001: {'lr': 0.00047780712259703394, 'samples': 4224192, 'steps': 22000, 'loss/train': 1.5872262716293335} -11/07/2021 00:19:58 - INFO - __main__ - Step 22002: {'lr': 0.00047780493669109017, 'samples': 4224384, 'steps': 22001, 'loss/train': 1.0057997703552246} -11/07/2021 00:19:59 - INFO - __main__ - Step 22003: {'lr': 0.000477802750682501, 'samples': 4224576, 'steps': 22002, 'loss/train': 1.5224837064743042} -11/07/2021 00:20:00 - INFO - __main__ - Step 22004: {'lr': 0.0004778005645712674, 'samples': 4224768, 'steps': 22003, 'loss/train': 1.6188691854476929} -11/07/2021 00:20:00 - INFO - __main__ - Step 22005: {'lr': 0.00047779837835739043, 'samples': 4224960, 'steps': 22004, 'loss/train': 1.5473153591156006} -11/07/2021 00:20:00 - INFO - __main__ - Step 22006: {'lr': 0.000477796192040871, 'samples': 4225152, 'steps': 22005, 'loss/train': 1.9420137405395508} -11/07/2021 00:20:01 - INFO - __main__ - Step 22007: {'lr': 0.00047779400562171016, 'samples': 4225344, 'steps': 22006, 'loss/train': 1.241431474685669} -11/07/2021 00:20:01 - INFO - __main__ - Step 22008: {'lr': 0.00047779181909990876, 'samples': 4225536, 'steps': 22007, 'loss/train': 1.4020662307739258} -11/07/2021 00:20:02 - INFO - __main__ - Step 22009: {'lr': 0.000477789632475468, 'samples': 4225728, 'steps': 22008, 'loss/train': 1.392614722251892} -11/07/2021 00:20:02 - INFO - __main__ - Step 22010: {'lr': 0.00047778744574838864, 'samples': 4225920, 'steps': 22009, 'loss/train': 1.4451684951782227} -11/07/2021 00:20:03 - INFO - __main__ - Step 22011: {'lr': 0.00047778525891867187, 'samples': 4226112, 'steps': 22010, 'loss/train': 1.806498408317566} -11/07/2021 00:20:03 - INFO - __main__ - Step 22012: {'lr': 0.00047778307198631856, 'samples': 4226304, 'steps': 22011, 'loss/train': 1.545744776725769} -11/07/2021 00:20:03 - INFO - __main__ - Step 22013: {'lr': 0.00047778088495132963, 'samples': 4226496, 'steps': 22012, 'loss/train': 2.2597596645355225} -11/07/2021 00:20:04 - INFO - __main__ - Step 22014: {'lr': 0.0004777786978137062, 'samples': 4226688, 'steps': 22013, 'loss/train': 2.303285598754883} -11/07/2021 00:20:05 - INFO - __main__ - Step 22015: {'lr': 0.00047777651057344915, 'samples': 4226880, 'steps': 22014, 'loss/train': 1.7788605690002441} -11/07/2021 00:20:05 - INFO - __main__ - Step 22016: {'lr': 0.0004777743232305596, 'samples': 4227072, 'steps': 22015, 'loss/train': 1.471137285232544} -11/07/2021 00:20:06 - INFO - __main__ - Step 22017: {'lr': 0.00047777213578503844, 'samples': 4227264, 'steps': 22016, 'loss/train': 1.7673450708389282} -11/07/2021 00:20:06 - INFO - __main__ - Step 22018: {'lr': 0.0004777699482368867, 'samples': 4227456, 'steps': 22017, 'loss/train': 1.6683404445648193} -11/07/2021 00:20:07 - INFO - __main__ - Step 22019: {'lr': 0.00047776776058610525, 'samples': 4227648, 'steps': 22018, 'loss/train': 1.5695788860321045} -11/07/2021 00:20:07 - INFO - __main__ - Step 22020: {'lr': 0.0004777655728326952, 'samples': 4227840, 'steps': 22019, 'loss/train': 1.6337982416152954} -11/07/2021 00:20:08 - INFO - __main__ - Step 22021: {'lr': 0.0004777633849766575, 'samples': 4228032, 'steps': 22020, 'loss/train': 1.395537257194519} -11/07/2021 00:20:08 - INFO - __main__ - Step 22022: {'lr': 0.00047776119701799317, 'samples': 4228224, 'steps': 22021, 'loss/train': 1.1082690954208374} -11/07/2021 00:20:08 - INFO - __main__ - Step 22023: {'lr': 0.0004777590089567031, 'samples': 4228416, 'steps': 22022, 'loss/train': 1.4885226488113403} -11/07/2021 00:20:09 - INFO - __main__ - Step 22024: {'lr': 0.00047775682079278836, 'samples': 4228608, 'steps': 22023, 'loss/train': 2.176821231842041} -11/07/2021 00:20:10 - INFO - __main__ - Step 22025: {'lr': 0.0004777546325262499, 'samples': 4228800, 'steps': 22024, 'loss/train': 1.4476275444030762} -11/07/2021 00:20:10 - INFO - __main__ - Step 22026: {'lr': 0.00047775244415708873, 'samples': 4228992, 'steps': 22025, 'loss/train': 1.2312343120574951} -11/07/2021 00:20:10 - INFO - __main__ - Step 22027: {'lr': 0.0004777502556853058, 'samples': 4229184, 'steps': 22026, 'loss/train': 0.7627279162406921} -11/07/2021 00:20:11 - INFO - __main__ - Step 22028: {'lr': 0.00047774806711090213, 'samples': 4229376, 'steps': 22027, 'loss/train': 1.5808088779449463} -11/07/2021 00:20:12 - INFO - __main__ - Step 22029: {'lr': 0.0004777458784338787, 'samples': 4229568, 'steps': 22028, 'loss/train': 1.5712063312530518} -11/07/2021 00:20:12 - INFO - __main__ - Step 22030: {'lr': 0.00047774368965423653, 'samples': 4229760, 'steps': 22029, 'loss/train': 2.2965681552886963} -11/07/2021 00:20:12 - INFO - __main__ - Step 22031: {'lr': 0.0004777415007719765, 'samples': 4229952, 'steps': 22030, 'loss/train': 1.8073399066925049} -11/07/2021 00:20:13 - INFO - __main__ - Step 22032: {'lr': 0.00047773931178709975, 'samples': 4230144, 'steps': 22031, 'loss/train': 1.4591764211654663} -11/07/2021 00:20:13 - INFO - __main__ - Step 22033: {'lr': 0.00047773712269960714, 'samples': 4230336, 'steps': 22032, 'loss/train': 1.5156131982803345} -11/07/2021 00:20:14 - INFO - __main__ - Step 22034: {'lr': 0.00047773493350949963, 'samples': 4230528, 'steps': 22033, 'loss/train': 2.4903831481933594} -11/07/2021 00:20:15 - INFO - __main__ - Step 22035: {'lr': 0.00047773274421677834, 'samples': 4230720, 'steps': 22034, 'loss/train': 1.9549790620803833} -11/07/2021 00:20:15 - INFO - __main__ - Step 22036: {'lr': 0.0004777305548214442, 'samples': 4230912, 'steps': 22035, 'loss/train': 1.8083499670028687} -11/07/2021 00:20:15 - INFO - __main__ - Step 22037: {'lr': 0.0004777283653234982, 'samples': 4231104, 'steps': 22036, 'loss/train': 1.5485557317733765} -11/07/2021 00:20:16 - INFO - __main__ - Step 22038: {'lr': 0.00047772617572294123, 'samples': 4231296, 'steps': 22037, 'loss/train': 1.876652717590332} -11/07/2021 00:20:16 - INFO - __main__ - Step 22039: {'lr': 0.0004777239860197744, 'samples': 4231488, 'steps': 22038, 'loss/train': 1.5153416395187378} -11/07/2021 00:20:17 - INFO - __main__ - Step 22040: {'lr': 0.0004777217962139987, 'samples': 4231680, 'steps': 22039, 'loss/train': 1.3404922485351562} -11/07/2021 00:20:17 - INFO - __main__ - Step 22041: {'lr': 0.000477719606305615, 'samples': 4231872, 'steps': 22040, 'loss/train': 1.777071475982666} -11/07/2021 00:20:18 - INFO - __main__ - Step 22042: {'lr': 0.0004777174162946244, 'samples': 4232064, 'steps': 22041, 'loss/train': 1.7243245840072632} -11/07/2021 00:20:18 - INFO - __main__ - Step 22043: {'lr': 0.0004777152261810279, 'samples': 4232256, 'steps': 22042, 'loss/train': 1.7015565633773804} -11/07/2021 00:20:18 - INFO - __main__ - Step 22044: {'lr': 0.0004777130359648263, 'samples': 4232448, 'steps': 22043, 'loss/train': 0.8857391476631165} -11/07/2021 00:20:20 - INFO - __main__ - Step 22045: {'lr': 0.0004777108456460208, 'samples': 4232640, 'steps': 22044, 'loss/train': 1.6511143445968628} -11/07/2021 00:20:20 - INFO - __main__ - Step 22046: {'lr': 0.00047770865522461233, 'samples': 4232832, 'steps': 22045, 'loss/train': 2.004149913787842} -11/07/2021 00:20:20 - INFO - __main__ - Step 22047: {'lr': 0.0004777064647006018, 'samples': 4233024, 'steps': 22046, 'loss/train': 1.051743507385254} -11/07/2021 00:20:21 - INFO - __main__ - Step 22048: {'lr': 0.0004777042740739903, 'samples': 4233216, 'steps': 22047, 'loss/train': 0.2091219127178192} -11/07/2021 00:20:21 - INFO - __main__ - Step 22049: {'lr': 0.0004777020833447787, 'samples': 4233408, 'steps': 22048, 'loss/train': 1.2629278898239136} -11/07/2021 00:20:22 - INFO - __main__ - Step 22050: {'lr': 0.0004776998925129681, 'samples': 4233600, 'steps': 22049, 'loss/train': 1.63240647315979} -11/07/2021 00:20:23 - INFO - __main__ - Step 22051: {'lr': 0.0004776977015785595, 'samples': 4233792, 'steps': 22050, 'loss/train': 1.2668564319610596} -11/07/2021 00:20:23 - INFO - __main__ - Step 22052: {'lr': 0.0004776955105415537, 'samples': 4233984, 'steps': 22051, 'loss/train': 0.7824997305870056} -11/07/2021 00:20:23 - INFO - __main__ - Step 22053: {'lr': 0.00047769331940195194, 'samples': 4234176, 'steps': 22052, 'loss/train': 1.4100098609924316} -11/07/2021 00:20:24 - INFO - __main__ - Step 22054: {'lr': 0.00047769112815975503, 'samples': 4234368, 'steps': 22053, 'loss/train': 1.5036020278930664} -11/07/2021 00:20:25 - INFO - __main__ - Step 22055: {'lr': 0.00047768893681496397, 'samples': 4234560, 'steps': 22054, 'loss/train': 1.7130056619644165} -11/07/2021 00:20:25 - INFO - __main__ - Step 22056: {'lr': 0.00047768674536757984, 'samples': 4234752, 'steps': 22055, 'loss/train': 1.361931562423706} -11/07/2021 00:20:25 - INFO - __main__ - Step 22057: {'lr': 0.00047768455381760357, 'samples': 4234944, 'steps': 22056, 'loss/train': 1.6314910650253296} -11/07/2021 00:20:26 - INFO - __main__ - Step 22058: {'lr': 0.00047768236216503613, 'samples': 4235136, 'steps': 22057, 'loss/train': 1.7460706233978271} -11/07/2021 00:20:26 - INFO - __main__ - Step 22059: {'lr': 0.00047768017040987856, 'samples': 4235328, 'steps': 22058, 'loss/train': 1.787089228630066} -11/07/2021 00:20:26 - INFO - __main__ - Step 22060: {'lr': 0.0004776779785521318, 'samples': 4235520, 'steps': 22059, 'loss/train': 0.6601639986038208} -11/07/2021 00:20:27 - INFO - __main__ - Step 22061: {'lr': 0.0004776757865917969, 'samples': 4235712, 'steps': 22060, 'loss/train': 1.0703409910202026} -11/07/2021 00:20:28 - INFO - __main__ - Step 22062: {'lr': 0.0004776735945288747, 'samples': 4235904, 'steps': 22061, 'loss/train': 1.8439667224884033} -11/07/2021 00:20:28 - INFO - __main__ - Step 22063: {'lr': 0.00047767140236336635, 'samples': 4236096, 'steps': 22062, 'loss/train': 1.5141043663024902} -11/07/2021 00:20:28 - INFO - __main__ - Step 22064: {'lr': 0.00047766921009527284, 'samples': 4236288, 'steps': 22063, 'loss/train': 1.7506041526794434} -11/07/2021 00:20:29 - INFO - __main__ - Step 22065: {'lr': 0.00047766701772459505, 'samples': 4236480, 'steps': 22064, 'loss/train': 1.5079345703125} -11/07/2021 00:20:30 - INFO - __main__ - Step 22066: {'lr': 0.00047766482525133405, 'samples': 4236672, 'steps': 22065, 'loss/train': 1.629859209060669} -11/07/2021 00:20:30 - INFO - __main__ - Step 22067: {'lr': 0.00047766263267549073, 'samples': 4236864, 'steps': 22066, 'loss/train': 1.2172280550003052} -11/07/2021 00:20:31 - INFO - __main__ - Step 22068: {'lr': 0.0004776604399970661, 'samples': 4237056, 'steps': 22067, 'loss/train': 1.7213703393936157} -11/07/2021 00:20:31 - INFO - __main__ - Step 22069: {'lr': 0.0004776582472160613, 'samples': 4237248, 'steps': 22068, 'loss/train': 1.041486382484436} -11/07/2021 00:20:32 - INFO - __main__ - Step 22070: {'lr': 0.0004776560543324772, 'samples': 4237440, 'steps': 22069, 'loss/train': 1.5691708326339722} -11/07/2021 00:20:33 - INFO - __main__ - Step 22071: {'lr': 0.0004776538613463147, 'samples': 4237632, 'steps': 22070, 'loss/train': 0.24791944026947021} -11/07/2021 00:20:33 - INFO - __main__ - Step 22072: {'lr': 0.00047765166825757487, 'samples': 4237824, 'steps': 22071, 'loss/train': 1.8586312532424927} -11/07/2021 00:20:33 - INFO - __main__ - Step 22073: {'lr': 0.00047764947506625887, 'samples': 4238016, 'steps': 22072, 'loss/train': 1.8590911626815796} -11/07/2021 00:20:34 - INFO - __main__ - Step 22074: {'lr': 0.00047764728177236736, 'samples': 4238208, 'steps': 22073, 'loss/train': 1.7774806022644043} -11/07/2021 00:20:34 - INFO - __main__ - Step 22075: {'lr': 0.0004776450883759016, 'samples': 4238400, 'steps': 22074, 'loss/train': 1.0848828554153442} -11/07/2021 00:20:35 - INFO - __main__ - Step 22076: {'lr': 0.0004776428948768625, 'samples': 4238592, 'steps': 22075, 'loss/train': 1.9253149032592773} -11/07/2021 00:20:35 - INFO - __main__ - Step 22077: {'lr': 0.00047764070127525096, 'samples': 4238784, 'steps': 22076, 'loss/train': 1.2464487552642822} -11/07/2021 00:20:36 - INFO - __main__ - Step 22078: {'lr': 0.00047763850757106803, 'samples': 4238976, 'steps': 22077, 'loss/train': 1.8914134502410889} -11/07/2021 00:20:36 - INFO - __main__ - Step 22079: {'lr': 0.0004776363137643147, 'samples': 4239168, 'steps': 22078, 'loss/train': 1.6272341012954712} -11/07/2021 00:20:37 - INFO - __main__ - Step 22080: {'lr': 0.000477634119854992, 'samples': 4239360, 'steps': 22079, 'loss/train': 1.0225515365600586} -11/07/2021 00:20:37 - INFO - __main__ - Step 22081: {'lr': 0.00047763192584310087, 'samples': 4239552, 'steps': 22080, 'loss/train': 1.4733610153198242} -11/07/2021 00:20:38 - INFO - __main__ - Step 22082: {'lr': 0.0004776297317286423, 'samples': 4239744, 'steps': 22081, 'loss/train': 1.6918233633041382} -11/07/2021 00:20:38 - INFO - __main__ - Step 22083: {'lr': 0.00047762753751161725, 'samples': 4239936, 'steps': 22082, 'loss/train': 1.4075119495391846} -11/07/2021 00:20:39 - INFO - __main__ - Step 22084: {'lr': 0.0004776253431920268, 'samples': 4240128, 'steps': 22083, 'loss/train': 1.3235876560211182} -11/07/2021 00:20:39 - INFO - __main__ - Step 22085: {'lr': 0.00047762314876987185, 'samples': 4240320, 'steps': 22084, 'loss/train': 1.7621089220046997} -11/07/2021 00:20:39 - INFO - __main__ - Step 22086: {'lr': 0.0004776209542451534, 'samples': 4240512, 'steps': 22085, 'loss/train': 1.2438160181045532} -11/07/2021 00:20:40 - INFO - __main__ - Step 22087: {'lr': 0.0004776187596178725, 'samples': 4240704, 'steps': 22086, 'loss/train': 1.4515008926391602} -11/07/2021 00:20:41 - INFO - __main__ - Step 22088: {'lr': 0.00047761656488803006, 'samples': 4240896, 'steps': 22087, 'loss/train': 1.8013110160827637} -11/07/2021 00:20:41 - INFO - __main__ - Step 22089: {'lr': 0.00047761437005562716, 'samples': 4241088, 'steps': 22088, 'loss/train': 1.7310346364974976} -11/07/2021 00:20:41 - INFO - __main__ - Step 22090: {'lr': 0.00047761217512066475, 'samples': 4241280, 'steps': 22089, 'loss/train': 1.422913908958435} -11/07/2021 00:20:42 - INFO - __main__ - Step 22091: {'lr': 0.0004776099800831437, 'samples': 4241472, 'steps': 22090, 'loss/train': 0.4168950617313385} -11/07/2021 00:20:43 - INFO - __main__ - Step 22092: {'lr': 0.0004776077849430652, 'samples': 4241664, 'steps': 22091, 'loss/train': 1.9819186925888062} -11/07/2021 00:20:43 - INFO - __main__ - Step 22093: {'lr': 0.0004776055897004301, 'samples': 4241856, 'steps': 22092, 'loss/train': 0.8312280178070068} -11/07/2021 00:20:44 - INFO - __main__ - Step 22094: {'lr': 0.0004776033943552395, 'samples': 4242048, 'steps': 22093, 'loss/train': 1.5974825620651245} -11/07/2021 00:20:44 - INFO - __main__ - Step 22095: {'lr': 0.0004776011989074943, 'samples': 4242240, 'steps': 22094, 'loss/train': 1.7879666090011597} -11/07/2021 00:20:44 - INFO - __main__ - Step 22096: {'lr': 0.00047759900335719543, 'samples': 4242432, 'steps': 22095, 'loss/train': 1.5695561170578003} -11/07/2021 00:20:45 - INFO - __main__ - Step 22097: {'lr': 0.00047759680770434405, 'samples': 4242624, 'steps': 22096, 'loss/train': 1.3009862899780273} -11/07/2021 00:20:46 - INFO - __main__ - Step 22098: {'lr': 0.00047759461194894103, 'samples': 4242816, 'steps': 22097, 'loss/train': 1.4749153852462769} -11/07/2021 00:20:46 - INFO - __main__ - Step 22099: {'lr': 0.00047759241609098734, 'samples': 4243008, 'steps': 22098, 'loss/train': 1.5157296657562256} -11/07/2021 00:20:46 - INFO - __main__ - Step 22100: {'lr': 0.00047759022013048417, 'samples': 4243200, 'steps': 22099, 'loss/train': 1.2801927328109741} -11/07/2021 00:20:47 - INFO - __main__ - Step 22101: {'lr': 0.00047758802406743217, 'samples': 4243392, 'steps': 22100, 'loss/train': 1.891735553741455} -11/07/2021 00:20:48 - INFO - __main__ - Step 22102: {'lr': 0.0004775858279018326, 'samples': 4243584, 'steps': 22101, 'loss/train': 1.7186956405639648} -11/07/2021 00:20:48 - INFO - __main__ - Step 22103: {'lr': 0.0004775836316336864, 'samples': 4243776, 'steps': 22102, 'loss/train': 1.5562268495559692} -11/07/2021 00:20:49 - INFO - __main__ - Step 22104: {'lr': 0.00047758143526299446, 'samples': 4243968, 'steps': 22103, 'loss/train': 1.8075950145721436} -11/07/2021 00:20:49 - INFO - __main__ - Step 22105: {'lr': 0.0004775792387897579, 'samples': 4244160, 'steps': 22104, 'loss/train': 0.24321593344211578} -11/07/2021 00:20:49 - INFO - __main__ - Step 22106: {'lr': 0.0004775770422139776, 'samples': 4244352, 'steps': 22105, 'loss/train': 1.5821597576141357} -11/07/2021 00:20:50 - INFO - __main__ - Step 22107: {'lr': 0.00047757484553565465, 'samples': 4244544, 'steps': 22106, 'loss/train': 3.4636902809143066} -11/07/2021 00:20:51 - INFO - __main__ - Step 22108: {'lr': 0.00047757264875478996, 'samples': 4244736, 'steps': 22107, 'loss/train': 1.1725666522979736} -11/07/2021 00:20:51 - INFO - __main__ - Step 22109: {'lr': 0.0004775704518713845, 'samples': 4244928, 'steps': 22108, 'loss/train': 1.034935712814331} -11/07/2021 00:20:52 - INFO - __main__ - Step 22110: {'lr': 0.0004775682548854394, 'samples': 4245120, 'steps': 22109, 'loss/train': 1.4282327890396118} -11/07/2021 00:20:52 - INFO - __main__ - Step 22111: {'lr': 0.0004775660577969555, 'samples': 4245312, 'steps': 22110, 'loss/train': 0.2226470410823822} -11/07/2021 00:20:52 - INFO - __main__ - Step 22112: {'lr': 0.0004775638606059338, 'samples': 4245504, 'steps': 22111, 'loss/train': 1.1546566486358643} -11/07/2021 00:20:53 - INFO - __main__ - Step 22113: {'lr': 0.00047756166331237545, 'samples': 4245696, 'steps': 22112, 'loss/train': 1.7638152837753296} -11/07/2021 00:20:54 - INFO - __main__ - Step 22114: {'lr': 0.00047755946591628126, 'samples': 4245888, 'steps': 22113, 'loss/train': 1.632278561592102} -11/07/2021 00:20:54 - INFO - __main__ - Step 22115: {'lr': 0.00047755726841765224, 'samples': 4246080, 'steps': 22114, 'loss/train': 1.7050201892852783} -11/07/2021 00:20:54 - INFO - __main__ - Step 22116: {'lr': 0.0004775550708164895, 'samples': 4246272, 'steps': 22115, 'loss/train': 1.5752651691436768} -11/07/2021 00:20:55 - INFO - __main__ - Step 22117: {'lr': 0.00047755287311279394, 'samples': 4246464, 'steps': 22116, 'loss/train': 1.260236144065857} -11/07/2021 00:20:56 - INFO - __main__ - Step 22118: {'lr': 0.00047755067530656656, 'samples': 4246656, 'steps': 22117, 'loss/train': 1.4997432231903076} -11/07/2021 00:20:56 - INFO - __main__ - Step 22119: {'lr': 0.00047754847739780835, 'samples': 4246848, 'steps': 22118, 'loss/train': 1.6824851036071777} -11/07/2021 00:20:57 - INFO - __main__ - Step 22120: {'lr': 0.0004775462793865203, 'samples': 4247040, 'steps': 22119, 'loss/train': 1.5758624076843262} -11/07/2021 00:20:57 - INFO - __main__ - Step 22121: {'lr': 0.00047754408127270346, 'samples': 4247232, 'steps': 22120, 'loss/train': 1.820260763168335} -11/07/2021 00:20:57 - INFO - __main__ - Step 22122: {'lr': 0.0004775418830563587, 'samples': 4247424, 'steps': 22121, 'loss/train': 1.8502987623214722} -11/07/2021 00:20:58 - INFO - __main__ - Step 22123: {'lr': 0.0004775396847374871, 'samples': 4247616, 'steps': 22122, 'loss/train': 1.7947843074798584} -11/07/2021 00:20:59 - INFO - __main__ - Step 22124: {'lr': 0.0004775374863160896, 'samples': 4247808, 'steps': 22123, 'loss/train': 1.7967413663864136} -11/07/2021 00:20:59 - INFO - __main__ - Step 22125: {'lr': 0.0004775352877921673, 'samples': 4248000, 'steps': 22124, 'loss/train': 1.6300139427185059} -11/07/2021 00:20:59 - INFO - __main__ - Step 22126: {'lr': 0.000477533089165721, 'samples': 4248192, 'steps': 22125, 'loss/train': 0.9215333461761475} -11/07/2021 00:21:00 - INFO - __main__ - Step 22127: {'lr': 0.0004775308904367519, 'samples': 4248384, 'steps': 22126, 'loss/train': 1.7427397966384888} -11/07/2021 00:21:00 - INFO - __main__ - Step 22128: {'lr': 0.0004775286916052609, 'samples': 4248576, 'steps': 22127, 'loss/train': 1.6542869806289673} -11/07/2021 00:21:01 - INFO - __main__ - Step 22129: {'lr': 0.00047752649267124894, 'samples': 4248768, 'steps': 22128, 'loss/train': 1.5671731233596802} -11/07/2021 00:21:01 - INFO - __main__ - Step 22130: {'lr': 0.0004775242936347171, 'samples': 4248960, 'steps': 22129, 'loss/train': 1.698813796043396} -11/07/2021 00:21:02 - INFO - __main__ - Step 22131: {'lr': 0.0004775220944956662, 'samples': 4249152, 'steps': 22130, 'loss/train': 0.2281908243894577} -11/07/2021 00:21:02 - INFO - __main__ - Step 22132: {'lr': 0.00047751989525409745, 'samples': 4249344, 'steps': 22131, 'loss/train': 1.9468735456466675} -11/07/2021 00:21:02 - INFO - __main__ - Step 22133: {'lr': 0.0004775176959100117, 'samples': 4249536, 'steps': 22132, 'loss/train': 1.6748098134994507} -11/07/2021 00:21:04 - INFO - __main__ - Step 22134: {'lr': 0.00047751549646341007, 'samples': 4249728, 'steps': 22133, 'loss/train': 1.442635178565979} -11/07/2021 00:21:04 - INFO - __main__ - Step 22135: {'lr': 0.0004775132969142934, 'samples': 4249920, 'steps': 22134, 'loss/train': 1.737351417541504} -11/07/2021 00:21:04 - INFO - __main__ - Step 22136: {'lr': 0.00047751109726266273, 'samples': 4250112, 'steps': 22135, 'loss/train': 1.0580017566680908} -11/07/2021 00:21:05 - INFO - __main__ - Step 22137: {'lr': 0.00047750889750851913, 'samples': 4250304, 'steps': 22136, 'loss/train': 0.43822312355041504} -11/07/2021 00:21:05 - INFO - __main__ - Step 22138: {'lr': 0.0004775066976518635, 'samples': 4250496, 'steps': 22137, 'loss/train': 1.7369829416275024} -11/07/2021 00:21:06 - INFO - __main__ - Step 22139: {'lr': 0.00047750449769269686, 'samples': 4250688, 'steps': 22138, 'loss/train': 1.1845433712005615} -11/07/2021 00:21:06 - INFO - __main__ - Step 22140: {'lr': 0.0004775022976310203, 'samples': 4250880, 'steps': 22139, 'loss/train': 1.6305336952209473} -11/07/2021 00:21:07 - INFO - __main__ - Step 22141: {'lr': 0.0004775000974668345, 'samples': 4251072, 'steps': 22140, 'loss/train': 1.4394451379776} -11/07/2021 00:21:07 - INFO - __main__ - Step 22142: {'lr': 0.00047749789720014085, 'samples': 4251264, 'steps': 22141, 'loss/train': 1.3838160037994385} -11/07/2021 00:21:07 - INFO - __main__ - Step 22143: {'lr': 0.00047749569683094015, 'samples': 4251456, 'steps': 22142, 'loss/train': 1.30197012424469} -11/07/2021 00:21:08 - INFO - __main__ - Step 22144: {'lr': 0.00047749349635923334, 'samples': 4251648, 'steps': 22143, 'loss/train': 1.6408462524414062} -11/07/2021 00:21:09 - INFO - __main__ - Step 22145: {'lr': 0.0004774912957850215, 'samples': 4251840, 'steps': 22144, 'loss/train': 0.2188931703567505} -11/07/2021 00:21:09 - INFO - __main__ - Step 22146: {'lr': 0.0004774890951083055, 'samples': 4252032, 'steps': 22145, 'loss/train': 2.0885589122772217} -11/07/2021 00:21:09 - INFO - __main__ - Step 22147: {'lr': 0.00047748689432908654, 'samples': 4252224, 'steps': 22146, 'loss/train': 1.8011268377304077} -11/07/2021 00:21:10 - INFO - __main__ - Step 22148: {'lr': 0.00047748469344736547, 'samples': 4252416, 'steps': 22147, 'loss/train': 2.0035457611083984} -11/07/2021 00:21:10 - INFO - __main__ - Step 22149: {'lr': 0.00047748249246314323, 'samples': 4252608, 'steps': 22148, 'loss/train': 1.6972697973251343} -11/07/2021 00:21:11 - INFO - __main__ - Step 22150: {'lr': 0.000477480291376421, 'samples': 4252800, 'steps': 22149, 'loss/train': 1.4715518951416016} -11/07/2021 00:21:12 - INFO - __main__ - Step 22151: {'lr': 0.0004774780901871996, 'samples': 4252992, 'steps': 22150, 'loss/train': 1.3390496969223022} -11/07/2021 00:21:12 - INFO - __main__ - Step 22152: {'lr': 0.0004774758888954801, 'samples': 4253184, 'steps': 22151, 'loss/train': 1.2156263589859009} -11/07/2021 00:21:12 - INFO - __main__ - Step 22153: {'lr': 0.00047747368750126345, 'samples': 4253376, 'steps': 22152, 'loss/train': 1.6150118112564087} -11/07/2021 00:21:13 - INFO - __main__ - Step 22154: {'lr': 0.0004774714860045507, 'samples': 4253568, 'steps': 22153, 'loss/train': 1.8437851667404175} -11/07/2021 00:21:14 - INFO - __main__ - Step 22155: {'lr': 0.0004774692844053428, 'samples': 4253760, 'steps': 22154, 'loss/train': 1.99979567527771} -11/07/2021 00:21:14 - INFO - __main__ - Step 22156: {'lr': 0.00047746708270364073, 'samples': 4253952, 'steps': 22155, 'loss/train': 1.418305516242981} -11/07/2021 00:21:14 - INFO - __main__ - Step 22157: {'lr': 0.0004774648808994455, 'samples': 4254144, 'steps': 22156, 'loss/train': 1.7593319416046143} -11/07/2021 00:21:15 - INFO - __main__ - Step 22158: {'lr': 0.0004774626789927582, 'samples': 4254336, 'steps': 22157, 'loss/train': 1.7074940204620361} -11/07/2021 00:21:15 - INFO - __main__ - Step 22159: {'lr': 0.0004774604769835796, 'samples': 4254528, 'steps': 22158, 'loss/train': 1.7265609502792358} -11/07/2021 00:21:16 - INFO - __main__ - Step 22160: {'lr': 0.00047745827487191087, 'samples': 4254720, 'steps': 22159, 'loss/train': 1.7802273035049438} -11/07/2021 00:21:17 - INFO - __main__ - Step 22161: {'lr': 0.00047745607265775293, 'samples': 4254912, 'steps': 22160, 'loss/train': 1.9270914793014526} -11/07/2021 00:21:17 - INFO - __main__ - Step 22162: {'lr': 0.0004774538703411069, 'samples': 4255104, 'steps': 22161, 'loss/train': 1.74415922164917} -11/07/2021 00:21:17 - INFO - __main__ - Step 22163: {'lr': 0.00047745166792197353, 'samples': 4255296, 'steps': 22162, 'loss/train': 1.3474476337432861} -11/07/2021 00:21:18 - INFO - __main__ - Step 22164: {'lr': 0.000477449465400354, 'samples': 4255488, 'steps': 22163, 'loss/train': 1.540534496307373} -11/07/2021 00:21:19 - INFO - __main__ - Step 22165: {'lr': 0.00047744726277624926, 'samples': 4255680, 'steps': 22164, 'loss/train': 1.7479281425476074} -11/07/2021 00:21:19 - INFO - __main__ - Step 22166: {'lr': 0.00047744506004966024, 'samples': 4255872, 'steps': 22165, 'loss/train': 1.7287943363189697} -11/07/2021 00:21:19 - INFO - __main__ - Step 22167: {'lr': 0.00047744285722058804, 'samples': 4256064, 'steps': 22166, 'loss/train': 1.6895420551300049} -11/07/2021 00:21:20 - INFO - __main__ - Step 22168: {'lr': 0.0004774406542890336, 'samples': 4256256, 'steps': 22167, 'loss/train': 1.5301826000213623} -11/07/2021 00:21:20 - INFO - __main__ - Step 22169: {'lr': 0.0004774384512549979, 'samples': 4256448, 'steps': 22168, 'loss/train': 1.6606671810150146} -11/07/2021 00:21:20 - INFO - __main__ - Step 22170: {'lr': 0.00047743624811848195, 'samples': 4256640, 'steps': 22169, 'loss/train': 1.5106760263442993} -11/07/2021 00:21:21 - INFO - __main__ - Step 22171: {'lr': 0.00047743404487948673, 'samples': 4256832, 'steps': 22170, 'loss/train': 2.1511363983154297} -11/07/2021 00:21:22 - INFO - __main__ - Step 22172: {'lr': 0.0004774318415380132, 'samples': 4257024, 'steps': 22171, 'loss/train': 1.799678087234497} -11/07/2021 00:21:22 - INFO - __main__ - Step 22173: {'lr': 0.0004774296380940625, 'samples': 4257216, 'steps': 22172, 'loss/train': 1.9480088949203491} -11/07/2021 00:21:23 - INFO - __main__ - Step 22174: {'lr': 0.0004774274345476354, 'samples': 4257408, 'steps': 22173, 'loss/train': 1.6413216590881348} -11/07/2021 00:21:23 - INFO - __main__ - Step 22175: {'lr': 0.00047742523089873304, 'samples': 4257600, 'steps': 22174, 'loss/train': 1.6591426134109497} -11/07/2021 00:21:24 - INFO - __main__ - Step 22176: {'lr': 0.0004774230271473564, 'samples': 4257792, 'steps': 22175, 'loss/train': 1.1572656631469727} -11/07/2021 00:21:24 - INFO - __main__ - Step 22177: {'lr': 0.00047742082329350644, 'samples': 4257984, 'steps': 22176, 'loss/train': 1.5521352291107178} -11/07/2021 00:21:25 - INFO - __main__ - Step 22178: {'lr': 0.0004774186193371841, 'samples': 4258176, 'steps': 22177, 'loss/train': 0.964850664138794} -11/07/2021 00:21:25 - INFO - __main__ - Step 22179: {'lr': 0.00047741641527839054, 'samples': 4258368, 'steps': 22178, 'loss/train': 1.0296980142593384} -11/07/2021 00:21:25 - INFO - __main__ - Step 22180: {'lr': 0.00047741421111712666, 'samples': 4258560, 'steps': 22179, 'loss/train': 1.7389425039291382} -11/07/2021 00:21:26 - INFO - __main__ - Step 22181: {'lr': 0.00047741200685339337, 'samples': 4258752, 'steps': 22180, 'loss/train': 1.7903101444244385} -11/07/2021 00:21:27 - INFO - __main__ - Step 22182: {'lr': 0.0004774098024871918, 'samples': 4258944, 'steps': 22181, 'loss/train': 1.5867414474487305} -11/07/2021 00:21:27 - INFO - __main__ - Step 22183: {'lr': 0.00047740759801852284, 'samples': 4259136, 'steps': 22182, 'loss/train': 1.6548216342926025} -11/07/2021 00:21:27 - INFO - __main__ - Step 22184: {'lr': 0.00047740539344738754, 'samples': 4259328, 'steps': 22183, 'loss/train': 1.6218554973602295} -11/07/2021 00:21:28 - INFO - __main__ - Step 22185: {'lr': 0.00047740318877378685, 'samples': 4259520, 'steps': 22184, 'loss/train': 1.144287347793579} -11/07/2021 00:21:28 - INFO - __main__ - Step 22186: {'lr': 0.00047740098399772185, 'samples': 4259712, 'steps': 22185, 'loss/train': 0.4743185043334961} -11/07/2021 00:21:29 - INFO - __main__ - Step 22187: {'lr': 0.0004773987791191935, 'samples': 4259904, 'steps': 22186, 'loss/train': 1.6326481103897095} -11/07/2021 00:21:29 - INFO - __main__ - Step 22188: {'lr': 0.0004773965741382027, 'samples': 4260096, 'steps': 22187, 'loss/train': 2.2415566444396973} -11/07/2021 00:21:30 - INFO - __main__ - Step 22189: {'lr': 0.00047739436905475054, 'samples': 4260288, 'steps': 22188, 'loss/train': 0.9503546357154846} -11/07/2021 00:21:30 - INFO - __main__ - Step 22190: {'lr': 0.00047739216386883797, 'samples': 4260480, 'steps': 22189, 'loss/train': 1.4760106801986694} -11/07/2021 00:21:31 - INFO - __main__ - Step 22191: {'lr': 0.000477389958580466, 'samples': 4260672, 'steps': 22190, 'loss/train': 1.2762712240219116} -11/07/2021 00:21:32 - INFO - __main__ - Step 22192: {'lr': 0.0004773877531896356, 'samples': 4260864, 'steps': 22191, 'loss/train': 1.569229006767273} -11/07/2021 00:21:32 - INFO - __main__ - Step 22193: {'lr': 0.00047738554769634784, 'samples': 4261056, 'steps': 22192, 'loss/train': 1.164962887763977} -11/07/2021 00:21:32 - INFO - __main__ - Step 22194: {'lr': 0.00047738334210060366, 'samples': 4261248, 'steps': 22193, 'loss/train': 1.5791643857955933} -11/07/2021 00:21:33 - INFO - __main__ - Step 22195: {'lr': 0.000477381136402404, 'samples': 4261440, 'steps': 22194, 'loss/train': 1.462497591972351} -11/07/2021 00:21:33 - INFO - __main__ - Step 22196: {'lr': 0.00047737893060175, 'samples': 4261632, 'steps': 22195, 'loss/train': 1.5324187278747559} -11/07/2021 00:21:34 - INFO - __main__ - Step 22197: {'lr': 0.00047737672469864246, 'samples': 4261824, 'steps': 22196, 'loss/train': 2.1199514865875244} -11/07/2021 00:21:35 - INFO - __main__ - Step 22198: {'lr': 0.0004773745186930825, 'samples': 4262016, 'steps': 22197, 'loss/train': 1.5264184474945068} -11/07/2021 00:21:35 - INFO - __main__ - Step 22199: {'lr': 0.00047737231258507116, 'samples': 4262208, 'steps': 22198, 'loss/train': 1.4578293561935425} -11/07/2021 00:21:35 - INFO - __main__ - Step 22200: {'lr': 0.00047737010637460934, 'samples': 4262400, 'steps': 22199, 'loss/train': 1.3843269348144531} -11/07/2021 00:21:36 - INFO - __main__ - Step 22201: {'lr': 0.00047736790006169794, 'samples': 4262592, 'steps': 22200, 'loss/train': 1.5156464576721191} -11/07/2021 00:21:36 - INFO - __main__ - Step 22202: {'lr': 0.00047736569364633817, 'samples': 4262784, 'steps': 22201, 'loss/train': 2.108410358428955} -11/07/2021 00:21:37 - INFO - __main__ - Step 22203: {'lr': 0.00047736348712853094, 'samples': 4262976, 'steps': 22202, 'loss/train': 1.5299713611602783} -11/07/2021 00:21:37 - INFO - __main__ - Step 22204: {'lr': 0.0004773612805082772, 'samples': 4263168, 'steps': 22203, 'loss/train': 1.304317831993103} -11/07/2021 00:21:38 - INFO - __main__ - Step 22205: {'lr': 0.000477359073785578, 'samples': 4263360, 'steps': 22204, 'loss/train': 1.8367857933044434} -11/07/2021 00:21:38 - INFO - __main__ - Step 22206: {'lr': 0.00047735686696043434, 'samples': 4263552, 'steps': 22205, 'loss/train': 0.7247116565704346} -11/07/2021 00:21:38 - INFO - __main__ - Step 22207: {'lr': 0.0004773546600328471, 'samples': 4263744, 'steps': 22206, 'loss/train': 1.6162457466125488} -11/07/2021 00:21:39 - INFO - __main__ - Step 22208: {'lr': 0.00047735245300281745, 'samples': 4263936, 'steps': 22207, 'loss/train': 1.498029351234436} -11/07/2021 00:21:40 - INFO - __main__ - Step 22209: {'lr': 0.00047735024587034625, 'samples': 4264128, 'steps': 22208, 'loss/train': 2.190403699874878} -11/07/2021 00:21:40 - INFO - __main__ - Step 22210: {'lr': 0.00047734803863543453, 'samples': 4264320, 'steps': 22209, 'loss/train': 1.4946469068527222} -11/07/2021 00:21:40 - INFO - __main__ - Step 22211: {'lr': 0.00047734583129808327, 'samples': 4264512, 'steps': 22210, 'loss/train': 1.5364080667495728} -11/07/2021 00:21:41 - INFO - __main__ - Step 22212: {'lr': 0.00047734362385829356, 'samples': 4264704, 'steps': 22211, 'loss/train': 2.015793561935425} -11/07/2021 00:21:42 - INFO - __main__ - Step 22213: {'lr': 0.0004773414163160662, 'samples': 4264896, 'steps': 22212, 'loss/train': 1.358203649520874} -11/07/2021 00:21:42 - INFO - __main__ - Step 22214: {'lr': 0.00047733920867140244, 'samples': 4265088, 'steps': 22213, 'loss/train': 0.5409196615219116} -11/07/2021 00:21:43 - INFO - __main__ - Step 22215: {'lr': 0.00047733700092430305, 'samples': 4265280, 'steps': 22214, 'loss/train': 1.655433177947998} -11/07/2021 00:21:43 - INFO - __main__ - Step 22216: {'lr': 0.0004773347930747691, 'samples': 4265472, 'steps': 22215, 'loss/train': 1.6212674379348755} -11/07/2021 00:21:43 - INFO - __main__ - Step 22217: {'lr': 0.0004773325851228017, 'samples': 4265664, 'steps': 22216, 'loss/train': 1.560600757598877} -11/07/2021 00:21:44 - INFO - __main__ - Step 22218: {'lr': 0.00047733037706840166, 'samples': 4265856, 'steps': 22217, 'loss/train': 1.4888997077941895} -11/07/2021 00:21:45 - INFO - __main__ - Step 22219: {'lr': 0.0004773281689115701, 'samples': 4266048, 'steps': 22218, 'loss/train': 1.8526577949523926} -11/07/2021 00:21:45 - INFO - __main__ - Step 22220: {'lr': 0.000477325960652308, 'samples': 4266240, 'steps': 22219, 'loss/train': 1.9920580387115479} -11/07/2021 00:21:45 - INFO - __main__ - Step 22221: {'lr': 0.0004773237522906163, 'samples': 4266432, 'steps': 22220, 'loss/train': 1.6304432153701782} -11/07/2021 00:21:46 - INFO - __main__ - Step 22222: {'lr': 0.000477321543826496, 'samples': 4266624, 'steps': 22221, 'loss/train': 1.4741657972335815} -11/07/2021 00:21:46 - INFO - __main__ - Step 22223: {'lr': 0.00047731933525994814, 'samples': 4266816, 'steps': 22222, 'loss/train': 0.9544246196746826} -11/07/2021 00:21:47 - INFO - __main__ - Step 22224: {'lr': 0.0004773171265909737, 'samples': 4267008, 'steps': 22223, 'loss/train': 1.4136073589324951} -11/07/2021 00:21:48 - INFO - __main__ - Step 22225: {'lr': 0.00047731491781957366, 'samples': 4267200, 'steps': 22224, 'loss/train': 1.588415503501892} -11/07/2021 00:21:48 - INFO - __main__ - Step 22226: {'lr': 0.0004773127089457491, 'samples': 4267392, 'steps': 22225, 'loss/train': 1.265699863433838} -11/07/2021 00:21:48 - INFO - __main__ - Step 22227: {'lr': 0.0004773104999695008, 'samples': 4267584, 'steps': 22226, 'loss/train': 1.5060862302780151} -11/07/2021 00:21:49 - INFO - __main__ - Step 22228: {'lr': 0.00047730829089082994, 'samples': 4267776, 'steps': 22227, 'loss/train': 1.5712088346481323} -11/07/2021 00:21:50 - INFO - __main__ - Step 22229: {'lr': 0.00047730608170973754, 'samples': 4267968, 'steps': 22228, 'loss/train': 1.1024203300476074} -11/07/2021 00:21:50 - INFO - __main__ - Step 22230: {'lr': 0.00047730387242622446, 'samples': 4268160, 'steps': 22229, 'loss/train': 1.0003269910812378} -11/07/2021 00:21:51 - INFO - __main__ - Step 22231: {'lr': 0.00047730166304029185, 'samples': 4268352, 'steps': 22230, 'loss/train': 1.664233684539795} -11/07/2021 00:21:51 - INFO - __main__ - Step 22232: {'lr': 0.0004772994535519405, 'samples': 4268544, 'steps': 22231, 'loss/train': 1.1563791036605835} -11/07/2021 00:21:51 - INFO - __main__ - Step 22233: {'lr': 0.0004772972439611716, 'samples': 4268736, 'steps': 22232, 'loss/train': 1.4765862226486206} -11/07/2021 00:21:52 - INFO - __main__ - Step 22234: {'lr': 0.00047729503426798605, 'samples': 4268928, 'steps': 22233, 'loss/train': 1.6917579174041748} -11/07/2021 00:21:53 - INFO - __main__ - Step 22235: {'lr': 0.0004772928244723849, 'samples': 4269120, 'steps': 22234, 'loss/train': 1.5444846153259277} -11/07/2021 00:21:53 - INFO - __main__ - Step 22236: {'lr': 0.00047729061457436905, 'samples': 4269312, 'steps': 22235, 'loss/train': 1.9563812017440796} -11/07/2021 00:21:53 - INFO - __main__ - Step 22237: {'lr': 0.0004772884045739396, 'samples': 4269504, 'steps': 22236, 'loss/train': 1.596703052520752} -11/07/2021 00:21:54 - INFO - __main__ - Step 22238: {'lr': 0.0004772861944710974, 'samples': 4269696, 'steps': 22237, 'loss/train': 0.26425468921661377} -11/07/2021 00:21:55 - INFO - __main__ - Step 22239: {'lr': 0.00047728398426584375, 'samples': 4269888, 'steps': 22238, 'loss/train': 1.3304921388626099} -11/07/2021 00:21:55 - INFO - __main__ - Step 22240: {'lr': 0.0004772817739581793, 'samples': 4270080, 'steps': 22239, 'loss/train': 1.5881335735321045} -11/07/2021 00:21:55 - INFO - __main__ - Step 22241: {'lr': 0.0004772795635481052, 'samples': 4270272, 'steps': 22240, 'loss/train': 1.3964968919754028} -11/07/2021 00:21:56 - INFO - __main__ - Step 22242: {'lr': 0.00047727735303562246, 'samples': 4270464, 'steps': 22241, 'loss/train': 1.6961921453475952} -11/07/2021 00:21:56 - INFO - __main__ - Step 22243: {'lr': 0.000477275142420732, 'samples': 4270656, 'steps': 22242, 'loss/train': 0.41618475317955017} -11/07/2021 00:21:57 - INFO - __main__ - Step 22244: {'lr': 0.000477272931703435, 'samples': 4270848, 'steps': 22243, 'loss/train': 1.7850244045257568} -11/07/2021 00:21:58 - INFO - __main__ - Step 22245: {'lr': 0.0004772707208837322, 'samples': 4271040, 'steps': 22244, 'loss/train': 1.7638630867004395} -11/07/2021 00:21:58 - INFO - __main__ - Step 22246: {'lr': 0.0004772685099616247, 'samples': 4271232, 'steps': 22245, 'loss/train': 1.2982248067855835} -11/07/2021 00:21:58 - INFO - __main__ - Step 22247: {'lr': 0.0004772662989371136, 'samples': 4271424, 'steps': 22246, 'loss/train': 1.7262928485870361} -11/07/2021 00:21:59 - INFO - __main__ - Step 22248: {'lr': 0.0004772640878101998, 'samples': 4271616, 'steps': 22247, 'loss/train': 1.7095729112625122} -11/07/2021 00:22:00 - INFO - __main__ - Step 22249: {'lr': 0.00047726187658088425, 'samples': 4271808, 'steps': 22248, 'loss/train': 1.4458047151565552} -11/07/2021 00:22:00 - INFO - __main__ - Step 22250: {'lr': 0.0004772596652491681, 'samples': 4272000, 'steps': 22249, 'loss/train': 1.6028023958206177} -11/07/2021 00:22:00 - INFO - __main__ - Step 22251: {'lr': 0.0004772574538150522, 'samples': 4272192, 'steps': 22250, 'loss/train': 2.14910888671875} -11/07/2021 00:22:01 - INFO - __main__ - Step 22252: {'lr': 0.0004772552422785376, 'samples': 4272384, 'steps': 22251, 'loss/train': 1.52297043800354} -11/07/2021 00:22:01 - INFO - __main__ - Step 22253: {'lr': 0.00047725303063962535, 'samples': 4272576, 'steps': 22252, 'loss/train': 1.625970721244812} -11/07/2021 00:22:02 - INFO - __main__ - Step 22254: {'lr': 0.00047725081889831626, 'samples': 4272768, 'steps': 22253, 'loss/train': 0.8719094395637512} -11/07/2021 00:22:03 - INFO - __main__ - Step 22255: {'lr': 0.0004772486070546116, 'samples': 4272960, 'steps': 22254, 'loss/train': 1.5029946565628052} -11/07/2021 00:22:03 - INFO - __main__ - Step 22256: {'lr': 0.0004772463951085121, 'samples': 4273152, 'steps': 22255, 'loss/train': 1.6506491899490356} -11/07/2021 00:22:03 - INFO - __main__ - Step 22257: {'lr': 0.00047724418306001895, 'samples': 4273344, 'steps': 22256, 'loss/train': 1.6396294832229614} -11/07/2021 00:22:04 - INFO - __main__ - Step 22258: {'lr': 0.0004772419709091331, 'samples': 4273536, 'steps': 22257, 'loss/train': 1.0318959951400757} -11/07/2021 00:22:04 - INFO - __main__ - Step 22259: {'lr': 0.00047723975865585544, 'samples': 4273728, 'steps': 22258, 'loss/train': 0.9595012068748474} -11/07/2021 00:22:05 - INFO - __main__ - Step 22260: {'lr': 0.00047723754630018715, 'samples': 4273920, 'steps': 22259, 'loss/train': 1.636866569519043} -11/07/2021 00:22:06 - INFO - __main__ - Step 22261: {'lr': 0.000477235333842129, 'samples': 4274112, 'steps': 22260, 'loss/train': 1.8469388484954834} -11/07/2021 00:22:06 - INFO - __main__ - Step 22262: {'lr': 0.00047723312128168226, 'samples': 4274304, 'steps': 22261, 'loss/train': 1.572001576423645} -11/07/2021 00:22:06 - INFO - __main__ - Step 22263: {'lr': 0.00047723090861884773, 'samples': 4274496, 'steps': 22262, 'loss/train': 1.3939660787582397} -11/07/2021 00:22:07 - INFO - __main__ - Step 22264: {'lr': 0.00047722869585362646, 'samples': 4274688, 'steps': 22263, 'loss/train': 1.5644506216049194} -11/07/2021 00:22:08 - INFO - __main__ - Step 22265: {'lr': 0.0004772264829860194, 'samples': 4274880, 'steps': 22264, 'loss/train': 1.638916254043579} -11/07/2021 00:22:08 - INFO - __main__ - Step 22266: {'lr': 0.00047722427001602765, 'samples': 4275072, 'steps': 22265, 'loss/train': 1.7917464971542358} -11/07/2021 00:22:08 - INFO - __main__ - Step 22267: {'lr': 0.0004772220569436521, 'samples': 4275264, 'steps': 22266, 'loss/train': 1.3653619289398193} -11/07/2021 00:22:09 - INFO - __main__ - Step 22268: {'lr': 0.0004772198437688938, 'samples': 4275456, 'steps': 22267, 'loss/train': 1.468030571937561} -11/07/2021 00:22:09 - INFO - __main__ - Step 22269: {'lr': 0.0004772176304917538, 'samples': 4275648, 'steps': 22268, 'loss/train': 1.6017370223999023} -11/07/2021 00:22:10 - INFO - __main__ - Step 22270: {'lr': 0.00047721541711223306, 'samples': 4275840, 'steps': 22269, 'loss/train': 1.4185051918029785} -11/07/2021 00:22:10 - INFO - __main__ - Step 22271: {'lr': 0.00047721320363033247, 'samples': 4276032, 'steps': 22270, 'loss/train': 1.8277918100357056} -11/07/2021 00:22:11 - INFO - __main__ - Step 22272: {'lr': 0.00047721099004605316, 'samples': 4276224, 'steps': 22271, 'loss/train': 1.816880702972412} -11/07/2021 00:22:11 - INFO - __main__ - Step 22273: {'lr': 0.00047720877635939606, 'samples': 4276416, 'steps': 22272, 'loss/train': 1.9079005718231201} -11/07/2021 00:22:12 - INFO - __main__ - Step 22274: {'lr': 0.0004772065625703622, 'samples': 4276608, 'steps': 22273, 'loss/train': 1.729659080505371} -11/07/2021 00:22:12 - INFO - __main__ - Step 22275: {'lr': 0.0004772043486789526, 'samples': 4276800, 'steps': 22274, 'loss/train': 1.4082915782928467} -11/07/2021 00:22:13 - INFO - __main__ - Step 22276: {'lr': 0.0004772021346851682, 'samples': 4276992, 'steps': 22275, 'loss/train': 1.8357642889022827} -11/07/2021 00:22:13 - INFO - __main__ - Step 22277: {'lr': 0.00047719992058901006, 'samples': 4277184, 'steps': 22276, 'loss/train': 1.6172411441802979} -11/07/2021 00:22:13 - INFO - __main__ - Step 22278: {'lr': 0.0004771977063904791, 'samples': 4277376, 'steps': 22277, 'loss/train': 1.0844411849975586} -11/07/2021 00:22:14 - INFO - __main__ - Step 22279: {'lr': 0.00047719549208957636, 'samples': 4277568, 'steps': 22278, 'loss/train': 1.8847882747650146} -11/07/2021 00:22:14 - INFO - __main__ - Step 22280: {'lr': 0.0004771932776863028, 'samples': 4277760, 'steps': 22279, 'loss/train': 1.7806832790374756} -11/07/2021 00:22:15 - INFO - __main__ - Step 22281: {'lr': 0.0004771910631806595, 'samples': 4277952, 'steps': 22280, 'loss/train': 1.5112051963806152} -11/07/2021 00:22:16 - INFO - __main__ - Step 22282: {'lr': 0.00047718884857264745, 'samples': 4278144, 'steps': 22281, 'loss/train': 1.638104796409607} -11/07/2021 00:22:16 - INFO - __main__ - Step 22283: {'lr': 0.0004771866338622676, 'samples': 4278336, 'steps': 22282, 'loss/train': 1.4743871688842773} -11/07/2021 00:22:16 - INFO - __main__ - Step 22284: {'lr': 0.0004771844190495209, 'samples': 4278528, 'steps': 22283, 'loss/train': 1.577344298362732} -11/07/2021 00:22:17 - INFO - __main__ - Step 22285: {'lr': 0.0004771822041344085, 'samples': 4278720, 'steps': 22284, 'loss/train': 1.610754132270813} -11/07/2021 00:22:18 - INFO - __main__ - Step 22286: {'lr': 0.0004771799891169312, 'samples': 4278912, 'steps': 22285, 'loss/train': 1.7802586555480957} -11/07/2021 00:22:18 - INFO - __main__ - Step 22287: {'lr': 0.0004771777739970902, 'samples': 4279104, 'steps': 22286, 'loss/train': 1.3665558099746704} -11/07/2021 00:22:18 - INFO - __main__ - Step 22288: {'lr': 0.0004771755587748863, 'samples': 4279296, 'steps': 22287, 'loss/train': 1.852914571762085} -11/07/2021 00:22:19 - INFO - __main__ - Step 22289: {'lr': 0.00047717334345032065, 'samples': 4279488, 'steps': 22288, 'loss/train': 1.0421020984649658} -11/07/2021 00:22:19 - INFO - __main__ - Step 22290: {'lr': 0.0004771711280233942, 'samples': 4279680, 'steps': 22289, 'loss/train': 1.3669109344482422} -11/07/2021 00:22:20 - INFO - __main__ - Step 22291: {'lr': 0.000477168912494108, 'samples': 4279872, 'steps': 22290, 'loss/train': 1.376916527748108} -11/07/2021 00:22:21 - INFO - __main__ - Step 22292: {'lr': 0.00047716669686246287, 'samples': 4280064, 'steps': 22291, 'loss/train': 0.9953264594078064} -11/07/2021 00:22:21 - INFO - __main__ - Step 22293: {'lr': 0.00047716448112846, 'samples': 4280256, 'steps': 22292, 'loss/train': 1.9123733043670654} -11/07/2021 00:22:21 - INFO - __main__ - Step 22294: {'lr': 0.00047716226529210035, 'samples': 4280448, 'steps': 22293, 'loss/train': 1.8882105350494385} -11/07/2021 00:22:22 - INFO - __main__ - Step 22295: {'lr': 0.00047716004935338484, 'samples': 4280640, 'steps': 22294, 'loss/train': 1.7229362726211548} -11/07/2021 00:22:22 - INFO - __main__ - Step 22296: {'lr': 0.0004771578333123145, 'samples': 4280832, 'steps': 22295, 'loss/train': 0.9274198412895203} -11/07/2021 00:22:23 - INFO - __main__ - Step 22297: {'lr': 0.00047715561716889037, 'samples': 4281024, 'steps': 22296, 'loss/train': 1.4598338603973389} -11/07/2021 00:22:23 - INFO - __main__ - Step 22298: {'lr': 0.0004771534009231134, 'samples': 4281216, 'steps': 22297, 'loss/train': 1.5091946125030518} -11/07/2021 00:22:24 - INFO - __main__ - Step 22299: {'lr': 0.00047715118457498473, 'samples': 4281408, 'steps': 22298, 'loss/train': 1.5219142436981201} -11/07/2021 00:22:24 - INFO - __main__ - Step 22300: {'lr': 0.00047714896812450514, 'samples': 4281600, 'steps': 22299, 'loss/train': 1.509248971939087} -11/07/2021 00:22:25 - INFO - __main__ - Step 22301: {'lr': 0.00047714675157167573, 'samples': 4281792, 'steps': 22300, 'loss/train': 1.7630727291107178} -11/07/2021 00:22:25 - INFO - __main__ - Step 22302: {'lr': 0.00047714453491649753, 'samples': 4281984, 'steps': 22301, 'loss/train': 1.8778845071792603} -11/07/2021 00:22:26 - INFO - __main__ - Step 22303: {'lr': 0.00047714231815897145, 'samples': 4282176, 'steps': 22302, 'loss/train': 1.7316973209381104} -11/07/2021 00:22:26 - INFO - __main__ - Step 22304: {'lr': 0.0004771401012990986, 'samples': 4282368, 'steps': 22303, 'loss/train': 1.1782406568527222} -11/07/2021 00:22:27 - INFO - __main__ - Step 22305: {'lr': 0.0004771378843368799, 'samples': 4282560, 'steps': 22304, 'loss/train': 1.4086192846298218} -11/07/2021 00:22:27 - INFO - __main__ - Step 22306: {'lr': 0.0004771356672723164, 'samples': 4282752, 'steps': 22305, 'loss/train': 1.1016020774841309} -11/07/2021 00:22:28 - INFO - __main__ - Step 22307: {'lr': 0.0004771334501054091, 'samples': 4282944, 'steps': 22306, 'loss/train': 1.1659605503082275} -11/07/2021 00:22:28 - INFO - __main__ - Step 22308: {'lr': 0.0004771312328361589, 'samples': 4283136, 'steps': 22307, 'loss/train': 1.5280841588974} -11/07/2021 00:22:29 - INFO - __main__ - Step 22309: {'lr': 0.0004771290154645669, 'samples': 4283328, 'steps': 22308, 'loss/train': 1.160269021987915} -11/07/2021 00:22:29 - INFO - __main__ - Step 22310: {'lr': 0.0004771267979906341, 'samples': 4283520, 'steps': 22309, 'loss/train': 1.9466007947921753} -11/07/2021 00:22:29 - INFO - __main__ - Step 22311: {'lr': 0.0004771245804143615, 'samples': 4283712, 'steps': 22310, 'loss/train': 1.7830595970153809} -11/07/2021 00:22:30 - INFO - __main__ - Step 22312: {'lr': 0.00047712236273574993, 'samples': 4283904, 'steps': 22311, 'loss/train': 1.239105463027954} -11/07/2021 00:22:31 - INFO - __main__ - Step 22313: {'lr': 0.0004771201449548006, 'samples': 4284096, 'steps': 22312, 'loss/train': 1.8768774271011353} -11/07/2021 00:22:31 - INFO - __main__ - Step 22314: {'lr': 0.0004771179270715145, 'samples': 4284288, 'steps': 22313, 'loss/train': 0.8931715488433838} -11/07/2021 00:22:32 - INFO - __main__ - Step 22315: {'lr': 0.0004771157090858925, 'samples': 4284480, 'steps': 22314, 'loss/train': 1.2766802310943604} -11/07/2021 00:22:32 - INFO - __main__ - Step 22316: {'lr': 0.00047711349099793565, 'samples': 4284672, 'steps': 22315, 'loss/train': 1.6245396137237549} -11/07/2021 00:22:33 - INFO - __main__ - Step 22317: {'lr': 0.00047711127280764497, 'samples': 4284864, 'steps': 22316, 'loss/train': 0.9728535413742065} -11/07/2021 00:22:33 - INFO - __main__ - Step 22318: {'lr': 0.0004771090545150215, 'samples': 4285056, 'steps': 22317, 'loss/train': 2.4875779151916504} -11/07/2021 00:22:34 - INFO - __main__ - Step 22319: {'lr': 0.00047710683612006623, 'samples': 4285248, 'steps': 22318, 'loss/train': 1.8442782163619995} -11/07/2021 00:22:34 - INFO - __main__ - Step 22320: {'lr': 0.00047710461762278, 'samples': 4285440, 'steps': 22319, 'loss/train': 1.5267730951309204} -11/07/2021 00:22:34 - INFO - __main__ - Step 22321: {'lr': 0.00047710239902316404, 'samples': 4285632, 'steps': 22320, 'loss/train': 1.1445330381393433} -11/07/2021 00:22:35 - INFO - __main__ - Step 22322: {'lr': 0.0004771001803212192, 'samples': 4285824, 'steps': 22321, 'loss/train': 1.614621877670288} -11/07/2021 00:22:36 - INFO - __main__ - Step 22323: {'lr': 0.0004770979615169466, 'samples': 4286016, 'steps': 22322, 'loss/train': 1.7761956453323364} -11/07/2021 00:22:36 - INFO - __main__ - Step 22324: {'lr': 0.00047709574261034705, 'samples': 4286208, 'steps': 22323, 'loss/train': 1.923969030380249} -11/07/2021 00:22:36 - INFO - __main__ - Step 22325: {'lr': 0.0004770935236014217, 'samples': 4286400, 'steps': 22324, 'loss/train': 1.6623705625534058} -11/07/2021 00:22:37 - INFO - __main__ - Step 22326: {'lr': 0.00047709130449017154, 'samples': 4286592, 'steps': 22325, 'loss/train': 1.6310282945632935} -11/07/2021 00:22:37 - INFO - __main__ - Step 22327: {'lr': 0.0004770890852765975, 'samples': 4286784, 'steps': 22326, 'loss/train': 1.615903377532959} -11/07/2021 00:22:38 - INFO - __main__ - Step 22328: {'lr': 0.00047708686596070065, 'samples': 4286976, 'steps': 22327, 'loss/train': 1.5300124883651733} -11/07/2021 00:22:38 - INFO - __main__ - Step 22329: {'lr': 0.00047708464654248195, 'samples': 4287168, 'steps': 22328, 'loss/train': 1.8082314729690552} -11/07/2021 00:22:39 - INFO - __main__ - Step 22330: {'lr': 0.0004770824270219424, 'samples': 4287360, 'steps': 22329, 'loss/train': 1.3073426485061646} -11/07/2021 00:22:39 - INFO - __main__ - Step 22331: {'lr': 0.0004770802073990831, 'samples': 4287552, 'steps': 22330, 'loss/train': 1.7682299613952637} -11/07/2021 00:22:40 - INFO - __main__ - Step 22332: {'lr': 0.00047707798767390486, 'samples': 4287744, 'steps': 22331, 'loss/train': 1.6708950996398926} -11/07/2021 00:22:41 - INFO - __main__ - Step 22333: {'lr': 0.00047707576784640883, 'samples': 4287936, 'steps': 22332, 'loss/train': 1.608047604560852} -11/07/2021 00:22:41 - INFO - __main__ - Step 22334: {'lr': 0.00047707354791659594, 'samples': 4288128, 'steps': 22333, 'loss/train': 2.013827085494995} -11/07/2021 00:22:41 - INFO - __main__ - Step 22335: {'lr': 0.0004770713278844672, 'samples': 4288320, 'steps': 22334, 'loss/train': 1.0852205753326416} -11/07/2021 00:22:42 - INFO - __main__ - Step 22336: {'lr': 0.00047706910775002363, 'samples': 4288512, 'steps': 22335, 'loss/train': 1.5838872194290161} -11/07/2021 00:22:42 - INFO - __main__ - Step 22337: {'lr': 0.0004770668875132663, 'samples': 4288704, 'steps': 22336, 'loss/train': 1.68880033493042} -11/07/2021 00:22:43 - INFO - __main__ - Step 22338: {'lr': 0.00047706466717419607, 'samples': 4288896, 'steps': 22337, 'loss/train': 1.2144722938537598} -11/07/2021 00:22:43 - INFO - __main__ - Step 22339: {'lr': 0.000477062446732814, 'samples': 4289088, 'steps': 22338, 'loss/train': 1.7872453927993774} -11/07/2021 00:22:44 - INFO - __main__ - Step 22340: {'lr': 0.0004770602261891211, 'samples': 4289280, 'steps': 22339, 'loss/train': 1.386384129524231} -11/07/2021 00:22:44 - INFO - __main__ - Step 22341: {'lr': 0.00047705800554311836, 'samples': 4289472, 'steps': 22340, 'loss/train': 1.812485694885254} -11/07/2021 00:22:45 - INFO - __main__ - Step 22342: {'lr': 0.0004770557847948068, 'samples': 4289664, 'steps': 22341, 'loss/train': 1.3352690935134888} -11/07/2021 00:22:45 - INFO - __main__ - Step 22343: {'lr': 0.0004770535639441874, 'samples': 4289856, 'steps': 22342, 'loss/train': 1.8325512409210205} -11/07/2021 00:22:46 - INFO - __main__ - Step 22344: {'lr': 0.0004770513429912612, 'samples': 4290048, 'steps': 22343, 'loss/train': 1.429988145828247} -11/07/2021 00:22:46 - INFO - __main__ - Step 22345: {'lr': 0.0004770491219360291, 'samples': 4290240, 'steps': 22344, 'loss/train': 1.3341028690338135} -11/07/2021 00:22:47 - INFO - __main__ - Step 22346: {'lr': 0.00047704690077849223, 'samples': 4290432, 'steps': 22345, 'loss/train': 1.5357767343521118} -11/07/2021 00:22:47 - INFO - __main__ - Step 22347: {'lr': 0.0004770446795186515, 'samples': 4290624, 'steps': 22346, 'loss/train': 1.02168869972229} -11/07/2021 00:22:48 - INFO - __main__ - Step 22348: {'lr': 0.0004770424581565079, 'samples': 4290816, 'steps': 22347, 'loss/train': 2.0495290756225586} -11/07/2021 00:22:48 - INFO - __main__ - Step 22349: {'lr': 0.0004770402366920625, 'samples': 4291008, 'steps': 22348, 'loss/train': 1.4317470788955688} -11/07/2021 00:22:49 - INFO - __main__ - Step 22350: {'lr': 0.00047703801512531636, 'samples': 4291200, 'steps': 22349, 'loss/train': 1.5442404747009277} -11/07/2021 00:22:49 - INFO - __main__ - Step 22351: {'lr': 0.00047703579345627036, 'samples': 4291392, 'steps': 22350, 'loss/train': 1.2991282939910889} -11/07/2021 00:22:49 - INFO - __main__ - Step 22352: {'lr': 0.00047703357168492544, 'samples': 4291584, 'steps': 22351, 'loss/train': 1.0072227716445923} -11/07/2021 00:22:50 - INFO - __main__ - Step 22353: {'lr': 0.0004770313498112828, 'samples': 4291776, 'steps': 22352, 'loss/train': 1.7183367013931274} -11/07/2021 00:22:51 - INFO - __main__ - Step 22354: {'lr': 0.0004770291278353433, 'samples': 4291968, 'steps': 22353, 'loss/train': 1.5203161239624023} -11/07/2021 00:22:51 - INFO - __main__ - Step 22355: {'lr': 0.00047702690575710796, 'samples': 4292160, 'steps': 22354, 'loss/train': 1.6376055479049683} -11/07/2021 00:22:51 - INFO - __main__ - Step 22356: {'lr': 0.0004770246835765778, 'samples': 4292352, 'steps': 22355, 'loss/train': 1.6381512880325317} -11/07/2021 00:22:52 - INFO - __main__ - Step 22357: {'lr': 0.0004770224612937538, 'samples': 4292544, 'steps': 22356, 'loss/train': 1.4302995204925537} -11/07/2021 00:22:52 - INFO - __main__ - Step 22358: {'lr': 0.0004770202389086371, 'samples': 4292736, 'steps': 22357, 'loss/train': 1.8325588703155518} -11/07/2021 00:22:53 - INFO - __main__ - Step 22359: {'lr': 0.0004770180164212284, 'samples': 4292928, 'steps': 22358, 'loss/train': 2.1267189979553223} -11/07/2021 00:22:54 - INFO - __main__ - Step 22360: {'lr': 0.00047701579383152906, 'samples': 4293120, 'steps': 22359, 'loss/train': 1.712369680404663} -11/07/2021 00:22:54 - INFO - __main__ - Step 22361: {'lr': 0.0004770135711395398, 'samples': 4293312, 'steps': 22360, 'loss/train': 1.9101619720458984} -11/07/2021 00:22:54 - INFO - __main__ - Step 22362: {'lr': 0.0004770113483452618, 'samples': 4293504, 'steps': 22361, 'loss/train': 1.594948172569275} -11/07/2021 00:22:55 - INFO - __main__ - Step 22363: {'lr': 0.00047700912544869595, 'samples': 4293696, 'steps': 22362, 'loss/train': 0.9005606174468994} -11/07/2021 00:22:56 - INFO - __main__ - Step 22364: {'lr': 0.0004770069024498433, 'samples': 4293888, 'steps': 22363, 'loss/train': 1.134440541267395} -11/07/2021 00:22:56 - INFO - __main__ - Step 22365: {'lr': 0.00047700467934870484, 'samples': 4294080, 'steps': 22364, 'loss/train': 1.7258731126785278} -11/07/2021 00:22:56 - INFO - __main__ - Step 22366: {'lr': 0.0004770024561452816, 'samples': 4294272, 'steps': 22365, 'loss/train': 1.5210816860198975} -11/07/2021 00:22:57 - INFO - __main__ - Step 22367: {'lr': 0.0004770002328395745, 'samples': 4294464, 'steps': 22366, 'loss/train': 1.8009976148605347} -11/07/2021 00:22:57 - INFO - __main__ - Step 22368: {'lr': 0.00047699800943158454, 'samples': 4294656, 'steps': 22367, 'loss/train': 2.5974385738372803} -11/07/2021 00:22:58 - INFO - __main__ - Step 22369: {'lr': 0.0004769957859213129, 'samples': 4294848, 'steps': 22368, 'loss/train': 1.525080680847168} -11/07/2021 00:22:59 - INFO - __main__ - Step 22370: {'lr': 0.00047699356230876047, 'samples': 4295040, 'steps': 22369, 'loss/train': 1.390128254890442} -11/07/2021 00:22:59 - INFO - __main__ - Step 22371: {'lr': 0.0004769913385939282, 'samples': 4295232, 'steps': 22370, 'loss/train': 1.6059892177581787} -11/07/2021 00:22:59 - INFO - __main__ - Step 22372: {'lr': 0.0004769891147768171, 'samples': 4295424, 'steps': 22371, 'loss/train': 1.6354572772979736} -11/07/2021 00:23:00 - INFO - __main__ - Step 22373: {'lr': 0.00047698689085742823, 'samples': 4295616, 'steps': 22372, 'loss/train': 1.6986100673675537} -11/07/2021 00:23:01 - INFO - __main__ - Step 22374: {'lr': 0.00047698466683576256, 'samples': 4295808, 'steps': 22373, 'loss/train': 1.620169997215271} -11/07/2021 00:23:01 - INFO - __main__ - Step 22375: {'lr': 0.0004769824427118211, 'samples': 4296000, 'steps': 22374, 'loss/train': 1.9812889099121094} -11/07/2021 00:23:01 - INFO - __main__ - Step 22376: {'lr': 0.00047698021848560494, 'samples': 4296192, 'steps': 22375, 'loss/train': 1.9996026754379272} -11/07/2021 00:23:02 - INFO - __main__ - Step 22377: {'lr': 0.0004769779941571149, 'samples': 4296384, 'steps': 22376, 'loss/train': 3.221825361251831} -11/07/2021 00:23:02 - INFO - __main__ - Step 22378: {'lr': 0.00047697576972635213, 'samples': 4296576, 'steps': 22377, 'loss/train': 1.418237328529358} -11/07/2021 00:23:02 - INFO - __main__ - Step 22379: {'lr': 0.0004769735451933176, 'samples': 4296768, 'steps': 22378, 'loss/train': 1.2897299528121948} -11/07/2021 00:23:03 - INFO - __main__ - Step 22380: {'lr': 0.0004769713205580122, 'samples': 4296960, 'steps': 22379, 'loss/train': 1.8298044204711914} -11/07/2021 00:23:04 - INFO - __main__ - Step 22381: {'lr': 0.0004769690958204371, 'samples': 4297152, 'steps': 22380, 'loss/train': 1.7279726266860962} -11/07/2021 00:23:04 - INFO - __main__ - Step 22382: {'lr': 0.0004769668709805932, 'samples': 4297344, 'steps': 22381, 'loss/train': 1.6349552869796753} -11/07/2021 00:23:04 - INFO - __main__ - Step 22383: {'lr': 0.0004769646460384816, 'samples': 4297536, 'steps': 22382, 'loss/train': 1.3800374269485474} -11/07/2021 00:23:05 - INFO - __main__ - Step 22384: {'lr': 0.00047696242099410307, 'samples': 4297728, 'steps': 22383, 'loss/train': 1.1722553968429565} -11/07/2021 00:23:06 - INFO - __main__ - Step 22385: {'lr': 0.00047696019584745887, 'samples': 4297920, 'steps': 22384, 'loss/train': 1.6306506395339966} -11/07/2021 00:23:06 - INFO - __main__ - Step 22386: {'lr': 0.00047695797059854996, 'samples': 4298112, 'steps': 22385, 'loss/train': 1.1783595085144043} -11/07/2021 00:23:06 - INFO - __main__ - Step 22387: {'lr': 0.0004769557452473772, 'samples': 4298304, 'steps': 22386, 'loss/train': 1.5198588371276855} -11/07/2021 00:23:07 - INFO - __main__ - Step 22388: {'lr': 0.00047695351979394173, 'samples': 4298496, 'steps': 22387, 'loss/train': 1.2966810464859009} -11/07/2021 00:23:07 - INFO - __main__ - Step 22389: {'lr': 0.00047695129423824454, 'samples': 4298688, 'steps': 22388, 'loss/train': 1.4684990644454956} -11/07/2021 00:23:08 - INFO - __main__ - Step 22390: {'lr': 0.0004769490685802865, 'samples': 4298880, 'steps': 22389, 'loss/train': 1.5988306999206543} -11/07/2021 00:23:09 - INFO - __main__ - Step 22391: {'lr': 0.00047694684282006885, 'samples': 4299072, 'steps': 22390, 'loss/train': 1.4806081056594849} -11/07/2021 00:23:09 - INFO - __main__ - Step 22392: {'lr': 0.00047694461695759236, 'samples': 4299264, 'steps': 22391, 'loss/train': 1.8315117359161377} -11/07/2021 00:23:09 - INFO - __main__ - Step 22393: {'lr': 0.00047694239099285815, 'samples': 4299456, 'steps': 22392, 'loss/train': 1.7604342699050903} -11/07/2021 00:23:10 - INFO - __main__ - Step 22394: {'lr': 0.00047694016492586715, 'samples': 4299648, 'steps': 22393, 'loss/train': 1.3254797458648682} -11/07/2021 00:23:11 - INFO - __main__ - Step 22395: {'lr': 0.0004769379387566205, 'samples': 4299840, 'steps': 22394, 'loss/train': 1.8817399740219116} -11/07/2021 00:23:11 - INFO - __main__ - Step 22396: {'lr': 0.000476935712485119, 'samples': 4300032, 'steps': 22395, 'loss/train': 1.6139127016067505} -11/07/2021 00:23:12 - INFO - __main__ - Step 22397: {'lr': 0.0004769334861113639, 'samples': 4300224, 'steps': 22396, 'loss/train': 1.4538699388504028} -11/07/2021 00:23:12 - INFO - __main__ - Step 22398: {'lr': 0.000476931259635356, 'samples': 4300416, 'steps': 22397, 'loss/train': 1.6450276374816895} -11/07/2021 00:23:12 - INFO - __main__ - Step 22399: {'lr': 0.00047692903305709646, 'samples': 4300608, 'steps': 22398, 'loss/train': 1.532269835472107} -11/07/2021 00:23:13 - INFO - __main__ - Step 22400: {'lr': 0.0004769268063765861, 'samples': 4300800, 'steps': 22399, 'loss/train': 1.9369391202926636} -11/07/2021 00:23:14 - INFO - __main__ - Step 22401: {'lr': 0.00047692457959382605, 'samples': 4300992, 'steps': 22400, 'loss/train': 1.5004935264587402} -11/07/2021 00:23:14 - INFO - __main__ - Step 22402: {'lr': 0.0004769223527088173, 'samples': 4301184, 'steps': 22401, 'loss/train': 1.646162509918213} -11/07/2021 00:23:14 - INFO - __main__ - Step 22403: {'lr': 0.00047692012572156086, 'samples': 4301376, 'steps': 22402, 'loss/train': 1.83078134059906} -11/07/2021 00:23:15 - INFO - __main__ - Step 22404: {'lr': 0.00047691789863205764, 'samples': 4301568, 'steps': 22403, 'loss/train': 2.1965112686157227} -11/07/2021 00:23:15 - INFO - __main__ - Step 22405: {'lr': 0.0004769156714403088, 'samples': 4301760, 'steps': 22404, 'loss/train': 1.1386685371398926} -11/07/2021 00:23:16 - INFO - __main__ - Step 22406: {'lr': 0.0004769134441463152, 'samples': 4301952, 'steps': 22405, 'loss/train': 1.8415265083312988} -11/07/2021 00:23:16 - INFO - __main__ - Step 22407: {'lr': 0.0004769112167500779, 'samples': 4302144, 'steps': 22406, 'loss/train': 1.3537362813949585} -11/07/2021 00:23:17 - INFO - __main__ - Step 22408: {'lr': 0.00047690898925159796, 'samples': 4302336, 'steps': 22407, 'loss/train': 1.3526972532272339} -11/07/2021 00:23:17 - INFO - __main__ - Step 22409: {'lr': 0.0004769067616508763, 'samples': 4302528, 'steps': 22408, 'loss/train': 2.1145200729370117} -11/07/2021 00:23:17 - INFO - __main__ - Step 22410: {'lr': 0.00047690453394791393, 'samples': 4302720, 'steps': 22409, 'loss/train': 1.4619641304016113} -11/07/2021 00:23:18 - INFO - __main__ - Step 22411: {'lr': 0.0004769023061427119, 'samples': 4302912, 'steps': 22410, 'loss/train': 0.3332456052303314} -11/07/2021 00:23:19 - INFO - __main__ - Step 22412: {'lr': 0.0004769000782352713, 'samples': 4303104, 'steps': 22411, 'loss/train': 1.1623334884643555} -11/07/2021 00:23:19 - INFO - __main__ - Step 22413: {'lr': 0.00047689785022559284, 'samples': 4303296, 'steps': 22412, 'loss/train': 1.511031150817871} -11/07/2021 00:23:19 - INFO - __main__ - Step 22414: {'lr': 0.0004768956221136778, 'samples': 4303488, 'steps': 22413, 'loss/train': 1.2305755615234375} -11/07/2021 00:23:20 - INFO - __main__ - Step 22415: {'lr': 0.00047689339389952713, 'samples': 4303680, 'steps': 22414, 'loss/train': 1.4260704517364502} -11/07/2021 00:23:21 - INFO - __main__ - Step 22416: {'lr': 0.0004768911655831417, 'samples': 4303872, 'steps': 22415, 'loss/train': 2.0966074466705322} -11/07/2021 00:23:21 - INFO - __main__ - Step 22417: {'lr': 0.0004768889371645227, 'samples': 4304064, 'steps': 22416, 'loss/train': 1.5773353576660156} -11/07/2021 00:23:22 - INFO - __main__ - Step 22418: {'lr': 0.000476886708643671, 'samples': 4304256, 'steps': 22417, 'loss/train': 1.4869263172149658} -11/07/2021 00:23:22 - INFO - __main__ - Step 22419: {'lr': 0.0004768844800205877, 'samples': 4304448, 'steps': 22418, 'loss/train': 1.8562376499176025} -11/07/2021 00:23:22 - INFO - __main__ - Step 22420: {'lr': 0.0004768822512952737, 'samples': 4304640, 'steps': 22419, 'loss/train': 1.4217239618301392} -11/07/2021 00:23:23 - INFO - __main__ - Step 22421: {'lr': 0.0004768800224677301, 'samples': 4304832, 'steps': 22420, 'loss/train': 1.4588857889175415} -11/07/2021 00:23:24 - INFO - __main__ - Step 22422: {'lr': 0.0004768777935379578, 'samples': 4305024, 'steps': 22421, 'loss/train': 1.9696581363677979} -11/07/2021 00:23:24 - INFO - __main__ - Step 22423: {'lr': 0.0004768755645059579, 'samples': 4305216, 'steps': 22422, 'loss/train': 1.1590843200683594} -11/07/2021 00:23:24 - INFO - __main__ - Step 22424: {'lr': 0.00047687333537173136, 'samples': 4305408, 'steps': 22423, 'loss/train': 1.8532379865646362} -11/07/2021 00:23:25 - INFO - __main__ - Step 22425: {'lr': 0.00047687110613527924, 'samples': 4305600, 'steps': 22424, 'loss/train': 2.046144485473633} -11/07/2021 00:23:26 - INFO - __main__ - Step 22426: {'lr': 0.00047686887679660253, 'samples': 4305792, 'steps': 22425, 'loss/train': 1.6717745065689087} -11/07/2021 00:23:26 - INFO - __main__ - Step 22427: {'lr': 0.0004768666473557021, 'samples': 4305984, 'steps': 22426, 'loss/train': 1.4736900329589844} -11/07/2021 00:23:26 - INFO - __main__ - Step 22428: {'lr': 0.0004768644178125791, 'samples': 4306176, 'steps': 22427, 'loss/train': 2.280658483505249} -11/07/2021 00:23:27 - INFO - __main__ - Step 22429: {'lr': 0.0004768621881672345, 'samples': 4306368, 'steps': 22428, 'loss/train': 1.1368001699447632} -11/07/2021 00:23:27 - INFO - __main__ - Step 22430: {'lr': 0.00047685995841966936, 'samples': 4306560, 'steps': 22429, 'loss/train': 1.5032750368118286} -11/07/2021 00:23:27 - INFO - __main__ - Step 22431: {'lr': 0.0004768577285698845, 'samples': 4306752, 'steps': 22430, 'loss/train': 1.7891005277633667} -11/07/2021 00:23:28 - INFO - __main__ - Step 22432: {'lr': 0.00047685549861788113, 'samples': 4306944, 'steps': 22431, 'loss/train': 1.7036324739456177} -11/07/2021 00:23:29 - INFO - __main__ - Step 22433: {'lr': 0.0004768532685636602, 'samples': 4307136, 'steps': 22432, 'loss/train': 2.235828161239624} -11/07/2021 00:23:29 - INFO - __main__ - Step 22434: {'lr': 0.0004768510384072226, 'samples': 4307328, 'steps': 22433, 'loss/train': 1.9438023567199707} -11/07/2021 00:23:29 - INFO - __main__ - Step 22435: {'lr': 0.0004768488081485695, 'samples': 4307520, 'steps': 22434, 'loss/train': 0.8506284952163696} -11/07/2021 00:23:30 - INFO - __main__ - Step 22436: {'lr': 0.0004768465777877018, 'samples': 4307712, 'steps': 22435, 'loss/train': 1.2240818738937378} -11/07/2021 00:23:31 - INFO - __main__ - Step 22437: {'lr': 0.0004768443473246205, 'samples': 4307904, 'steps': 22436, 'loss/train': 1.3975337743759155} -11/07/2021 00:23:31 - INFO - __main__ - Step 22438: {'lr': 0.00047684211675932665, 'samples': 4308096, 'steps': 22437, 'loss/train': 2.0789754390716553} -11/07/2021 00:23:32 - INFO - __main__ - Step 22439: {'lr': 0.0004768398860918213, 'samples': 4308288, 'steps': 22438, 'loss/train': 1.650249719619751} -11/07/2021 00:23:32 - INFO - __main__ - Step 22440: {'lr': 0.0004768376553221053, 'samples': 4308480, 'steps': 22439, 'loss/train': 1.447034239768982} -11/07/2021 00:23:32 - INFO - __main__ - Step 22441: {'lr': 0.0004768354244501798, 'samples': 4308672, 'steps': 22440, 'loss/train': 1.8617455959320068} -11/07/2021 00:23:33 - INFO - __main__ - Step 22442: {'lr': 0.0004768331934760458, 'samples': 4308864, 'steps': 22441, 'loss/train': 1.5123012065887451} -11/07/2021 00:23:34 - INFO - __main__ - Step 22443: {'lr': 0.00047683096239970423, 'samples': 4309056, 'steps': 22442, 'loss/train': 1.7382694482803345} -11/07/2021 00:23:34 - INFO - __main__ - Step 22444: {'lr': 0.0004768287312211561, 'samples': 4309248, 'steps': 22443, 'loss/train': 1.417901635169983} -11/07/2021 00:23:34 - INFO - __main__ - Step 22445: {'lr': 0.0004768264999404025, 'samples': 4309440, 'steps': 22444, 'loss/train': 1.5879945755004883} -11/07/2021 00:23:35 - INFO - __main__ - Step 22446: {'lr': 0.00047682426855744434, 'samples': 4309632, 'steps': 22445, 'loss/train': 1.4141817092895508} -11/07/2021 00:23:36 - INFO - __main__ - Step 22447: {'lr': 0.00047682203707228264, 'samples': 4309824, 'steps': 22446, 'loss/train': 1.5829259157180786} -11/07/2021 00:23:36 - INFO - __main__ - Step 22448: {'lr': 0.00047681980548491853, 'samples': 4310016, 'steps': 22447, 'loss/train': 1.159238338470459} -11/07/2021 00:23:36 - INFO - __main__ - Step 22449: {'lr': 0.00047681757379535285, 'samples': 4310208, 'steps': 22448, 'loss/train': 1.684480905532837} -11/07/2021 00:23:37 - INFO - __main__ - Step 22450: {'lr': 0.00047681534200358665, 'samples': 4310400, 'steps': 22449, 'loss/train': 1.75339674949646} -11/07/2021 00:23:37 - INFO - __main__ - Step 22451: {'lr': 0.000476813110109621, 'samples': 4310592, 'steps': 22450, 'loss/train': 1.9512276649475098} -11/07/2021 00:23:38 - INFO - __main__ - Step 22452: {'lr': 0.0004768108781134568, 'samples': 4310784, 'steps': 22451, 'loss/train': 1.0854402780532837} -11/07/2021 00:23:38 - INFO - __main__ - Step 22453: {'lr': 0.0004768086460150952, 'samples': 4310976, 'steps': 22452, 'loss/train': 1.3101853132247925} -11/07/2021 00:23:39 - INFO - __main__ - Step 22454: {'lr': 0.00047680641381453703, 'samples': 4311168, 'steps': 22453, 'loss/train': 1.4491902589797974} -11/07/2021 00:23:39 - INFO - __main__ - Step 22455: {'lr': 0.0004768041815117835, 'samples': 4311360, 'steps': 22454, 'loss/train': 1.6310304403305054} -11/07/2021 00:23:40 - INFO - __main__ - Step 22456: {'lr': 0.00047680194910683545, 'samples': 4311552, 'steps': 22455, 'loss/train': 1.4553643465042114} -11/07/2021 00:23:41 - INFO - __main__ - Step 22457: {'lr': 0.0004767997165996939, 'samples': 4311744, 'steps': 22456, 'loss/train': 1.2861876487731934} -11/07/2021 00:23:41 - INFO - __main__ - Step 22458: {'lr': 0.00047679748399035994, 'samples': 4311936, 'steps': 22457, 'loss/train': 1.3340020179748535} -11/07/2021 00:23:41 - INFO - __main__ - Step 22459: {'lr': 0.00047679525127883456, 'samples': 4312128, 'steps': 22458, 'loss/train': 1.6435513496398926} -11/07/2021 00:23:42 - INFO - __main__ - Step 22460: {'lr': 0.0004767930184651187, 'samples': 4312320, 'steps': 22459, 'loss/train': 1.8718630075454712} -11/07/2021 00:23:42 - INFO - __main__ - Step 22461: {'lr': 0.0004767907855492134, 'samples': 4312512, 'steps': 22460, 'loss/train': 2.1382293701171875} -11/07/2021 00:23:43 - INFO - __main__ - Step 22462: {'lr': 0.0004767885525311197, 'samples': 4312704, 'steps': 22461, 'loss/train': 1.6162583827972412} -11/07/2021 00:23:44 - INFO - __main__ - Step 22463: {'lr': 0.0004767863194108386, 'samples': 4312896, 'steps': 22462, 'loss/train': 1.6668907403945923} -11/07/2021 00:23:44 - INFO - __main__ - Step 22464: {'lr': 0.000476784086188371, 'samples': 4313088, 'steps': 22463, 'loss/train': 0.9273306727409363} -11/07/2021 00:23:44 - INFO - __main__ - Step 22465: {'lr': 0.00047678185286371803, 'samples': 4313280, 'steps': 22464, 'loss/train': 1.323159098625183} -11/07/2021 00:23:45 - INFO - __main__ - Step 22466: {'lr': 0.0004767796194368807, 'samples': 4313472, 'steps': 22465, 'loss/train': 1.5647008419036865} -11/07/2021 00:23:45 - INFO - __main__ - Step 22467: {'lr': 0.00047677738590786, 'samples': 4313664, 'steps': 22466, 'loss/train': 0.24449460208415985} -11/07/2021 00:23:46 - INFO - __main__ - Step 22468: {'lr': 0.0004767751522766568, 'samples': 4313856, 'steps': 22467, 'loss/train': 1.7678805589675903} -11/07/2021 00:23:46 - INFO - __main__ - Step 22469: {'lr': 0.00047677291854327224, 'samples': 4314048, 'steps': 22468, 'loss/train': 1.3814095258712769} -11/07/2021 00:23:47 - INFO - __main__ - Step 22470: {'lr': 0.00047677068470770737, 'samples': 4314240, 'steps': 22469, 'loss/train': 1.6994068622589111} -11/07/2021 00:23:47 - INFO - __main__ - Step 22471: {'lr': 0.00047676845076996305, 'samples': 4314432, 'steps': 22470, 'loss/train': 2.423990488052368} -11/07/2021 00:23:47 - INFO - __main__ - Step 22472: {'lr': 0.0004767662167300404, 'samples': 4314624, 'steps': 22471, 'loss/train': 1.3077157735824585} -11/07/2021 00:23:48 - INFO - __main__ - Step 22473: {'lr': 0.0004767639825879404, 'samples': 4314816, 'steps': 22472, 'loss/train': 1.881967544555664} -11/07/2021 00:23:49 - INFO - __main__ - Step 22474: {'lr': 0.000476761748343664, 'samples': 4315008, 'steps': 22473, 'loss/train': 1.6649399995803833} -11/07/2021 00:23:49 - INFO - __main__ - Step 22475: {'lr': 0.00047675951399721235, 'samples': 4315200, 'steps': 22474, 'loss/train': 1.5792977809906006} -11/07/2021 00:23:49 - INFO - __main__ - Step 22476: {'lr': 0.0004767572795485863, 'samples': 4315392, 'steps': 22475, 'loss/train': 1.1965254545211792} -11/07/2021 00:23:50 - INFO - __main__ - Step 22477: {'lr': 0.00047675504499778695, 'samples': 4315584, 'steps': 22476, 'loss/train': 1.6232327222824097} -11/07/2021 00:23:51 - INFO - __main__ - Step 22478: {'lr': 0.0004767528103448152, 'samples': 4315776, 'steps': 22477, 'loss/train': 1.3932678699493408} -11/07/2021 00:23:51 - INFO - __main__ - Step 22479: {'lr': 0.00047675057558967224, 'samples': 4315968, 'steps': 22478, 'loss/train': 1.8550174236297607} -11/07/2021 00:23:52 - INFO - __main__ - Step 22480: {'lr': 0.0004767483407323589, 'samples': 4316160, 'steps': 22479, 'loss/train': 1.5465221405029297} -11/07/2021 00:23:52 - INFO - __main__ - Step 22481: {'lr': 0.00047674610577287625, 'samples': 4316352, 'steps': 22480, 'loss/train': 1.599327802658081} -11/07/2021 00:23:52 - INFO - __main__ - Step 22482: {'lr': 0.00047674387071122536, 'samples': 4316544, 'steps': 22481, 'loss/train': 1.6746630668640137} -11/07/2021 00:23:53 - INFO - __main__ - Step 22483: {'lr': 0.0004767416355474071, 'samples': 4316736, 'steps': 22482, 'loss/train': 1.7197669744491577} -11/07/2021 00:23:54 - INFO - __main__ - Step 22484: {'lr': 0.00047673940028142265, 'samples': 4316928, 'steps': 22483, 'loss/train': 1.0817619562149048} -11/07/2021 00:23:54 - INFO - __main__ - Step 22485: {'lr': 0.0004767371649132729, 'samples': 4317120, 'steps': 22484, 'loss/train': 1.4430047273635864} -11/07/2021 00:23:54 - INFO - __main__ - Step 22486: {'lr': 0.00047673492944295883, 'samples': 4317312, 'steps': 22485, 'loss/train': 1.4995204210281372} -11/07/2021 00:23:55 - INFO - __main__ - Step 22487: {'lr': 0.0004767326938704816, 'samples': 4317504, 'steps': 22486, 'loss/train': 1.2819911241531372} -11/07/2021 00:23:55 - INFO - __main__ - Step 22488: {'lr': 0.00047673045819584197, 'samples': 4317696, 'steps': 22487, 'loss/train': 1.8140474557876587} -11/07/2021 00:23:56 - INFO - __main__ - Step 22489: {'lr': 0.0004767282224190412, 'samples': 4317888, 'steps': 22488, 'loss/train': 1.7236080169677734} -11/07/2021 00:23:56 - INFO - __main__ - Step 22490: {'lr': 0.00047672598654008015, 'samples': 4318080, 'steps': 22489, 'loss/train': 1.273484468460083} -11/07/2021 00:23:57 - INFO - __main__ - Step 22491: {'lr': 0.0004767237505589599, 'samples': 4318272, 'steps': 22490, 'loss/train': 1.61056649684906} -11/07/2021 00:23:57 - INFO - __main__ - Step 22492: {'lr': 0.0004767215144756814, 'samples': 4318464, 'steps': 22491, 'loss/train': 2.750136137008667} -11/07/2021 00:23:57 - INFO - __main__ - Step 22493: {'lr': 0.0004767192782902457, 'samples': 4318656, 'steps': 22492, 'loss/train': 1.574295163154602} -11/07/2021 00:23:58 - INFO - __main__ - Step 22494: {'lr': 0.0004767170420026538, 'samples': 4318848, 'steps': 22493, 'loss/train': 1.4278780221939087} -11/07/2021 00:23:59 - INFO - __main__ - Step 22495: {'lr': 0.0004767148056129067, 'samples': 4319040, 'steps': 22494, 'loss/train': 1.9771298170089722} -11/07/2021 00:23:59 - INFO - __main__ - Step 22496: {'lr': 0.0004767125691210054, 'samples': 4319232, 'steps': 22495, 'loss/train': 1.6492091417312622} -11/07/2021 00:23:59 - INFO - __main__ - Step 22497: {'lr': 0.00047671033252695083, 'samples': 4319424, 'steps': 22496, 'loss/train': 1.8200469017028809} -11/07/2021 00:24:00 - INFO - __main__ - Step 22498: {'lr': 0.0004767080958307442, 'samples': 4319616, 'steps': 22497, 'loss/train': 2.2042977809906006} -11/07/2021 00:24:00 - INFO - __main__ - Step 22499: {'lr': 0.0004767058590323864, 'samples': 4319808, 'steps': 22498, 'loss/train': 1.707726001739502} -11/07/2021 00:24:01 - INFO - __main__ - Step 22500: {'lr': 0.00047670362213187833, 'samples': 4320000, 'steps': 22499, 'loss/train': 1.839163899421692} -11/07/2021 00:24:02 - INFO - __main__ - Step 22501: {'lr': 0.0004767013851292212, 'samples': 4320192, 'steps': 22500, 'loss/train': 1.605943202972412} -11/07/2021 00:24:02 - INFO - __main__ - Step 22502: {'lr': 0.0004766991480244159, 'samples': 4320384, 'steps': 22501, 'loss/train': 1.4277918338775635} -11/07/2021 00:24:02 - INFO - __main__ - Step 22503: {'lr': 0.0004766969108174635, 'samples': 4320576, 'steps': 22502, 'loss/train': 2.018317699432373} -11/07/2021 00:24:03 - INFO - __main__ - Step 22504: {'lr': 0.0004766946735083649, 'samples': 4320768, 'steps': 22503, 'loss/train': 1.634273648262024} -11/07/2021 00:24:04 - INFO - __main__ - Step 22505: {'lr': 0.0004766924360971212, 'samples': 4320960, 'steps': 22504, 'loss/train': 1.7070815563201904} -11/07/2021 00:24:04 - INFO - __main__ - Step 22506: {'lr': 0.00047669019858373343, 'samples': 4321152, 'steps': 22505, 'loss/train': 0.18323098123073578} -11/07/2021 00:24:04 - INFO - __main__ - Step 22507: {'lr': 0.00047668796096820247, 'samples': 4321344, 'steps': 22506, 'loss/train': 1.6749025583267212} -11/07/2021 00:24:05 - INFO - __main__ - Step 22508: {'lr': 0.00047668572325052953, 'samples': 4321536, 'steps': 22507, 'loss/train': 1.3067169189453125} -11/07/2021 00:24:05 - INFO - __main__ - Step 22509: {'lr': 0.00047668348543071536, 'samples': 4321728, 'steps': 22508, 'loss/train': 2.1704883575439453} -11/07/2021 00:24:06 - INFO - __main__ - Step 22510: {'lr': 0.00047668124750876117, 'samples': 4321920, 'steps': 22509, 'loss/train': 0.7687938213348389} -11/07/2021 00:24:07 - INFO - __main__ - Step 22511: {'lr': 0.0004766790094846679, 'samples': 4322112, 'steps': 22510, 'loss/train': 1.2642887830734253} -11/07/2021 00:24:07 - INFO - __main__ - Step 22512: {'lr': 0.0004766767713584367, 'samples': 4322304, 'steps': 22511, 'loss/train': 1.0644493103027344} -11/07/2021 00:24:07 - INFO - __main__ - Step 22513: {'lr': 0.00047667453313006826, 'samples': 4322496, 'steps': 22512, 'loss/train': 1.282457947731018} -11/07/2021 00:24:08 - INFO - __main__ - Step 22514: {'lr': 0.00047667229479956386, 'samples': 4322688, 'steps': 22513, 'loss/train': 1.6759504079818726} -11/07/2021 00:24:09 - INFO - __main__ - Step 22515: {'lr': 0.0004766700563669244, 'samples': 4322880, 'steps': 22514, 'loss/train': 1.3310102224349976} -11/07/2021 00:24:09 - INFO - __main__ - Step 22516: {'lr': 0.0004766678178321509, 'samples': 4323072, 'steps': 22515, 'loss/train': 1.6661882400512695} -11/07/2021 00:24:09 - INFO - __main__ - Step 22517: {'lr': 0.0004766655791952444, 'samples': 4323264, 'steps': 22516, 'loss/train': 1.630807876586914} -11/07/2021 00:24:10 - INFO - __main__ - Step 22518: {'lr': 0.0004766633404562059, 'samples': 4323456, 'steps': 22517, 'loss/train': 1.046881079673767} -11/07/2021 00:24:10 - INFO - __main__ - Step 22519: {'lr': 0.0004766611016150364, 'samples': 4323648, 'steps': 22518, 'loss/train': 1.5486303567886353} -11/07/2021 00:24:11 - INFO - __main__ - Step 22520: {'lr': 0.00047665886267173686, 'samples': 4323840, 'steps': 22519, 'loss/train': 1.411068320274353} -11/07/2021 00:24:11 - INFO - __main__ - Step 22521: {'lr': 0.00047665662362630836, 'samples': 4324032, 'steps': 22520, 'loss/train': 1.875470519065857} -11/07/2021 00:24:12 - INFO - __main__ - Step 22522: {'lr': 0.00047665438447875186, 'samples': 4324224, 'steps': 22521, 'loss/train': 1.4796826839447021} -11/07/2021 00:24:12 - INFO - __main__ - Step 22523: {'lr': 0.0004766521452290684, 'samples': 4324416, 'steps': 22522, 'loss/train': 1.4865388870239258} -11/07/2021 00:24:12 - INFO - __main__ - Step 22524: {'lr': 0.00047664990587725905, 'samples': 4324608, 'steps': 22523, 'loss/train': 2.097989320755005} -11/07/2021 00:24:13 - INFO - __main__ - Step 22525: {'lr': 0.0004766476664233247, 'samples': 4324800, 'steps': 22524, 'loss/train': 1.7296922206878662} -11/07/2021 00:24:14 - INFO - __main__ - Step 22526: {'lr': 0.0004766454268672664, 'samples': 4324992, 'steps': 22525, 'loss/train': 1.8197253942489624} -11/07/2021 00:24:14 - INFO - __main__ - Step 22527: {'lr': 0.00047664318720908516, 'samples': 4325184, 'steps': 22526, 'loss/train': 1.9192566871643066} -11/07/2021 00:24:15 - INFO - __main__ - Step 22528: {'lr': 0.000476640947448782, 'samples': 4325376, 'steps': 22527, 'loss/train': 1.9041056632995605} -11/07/2021 00:24:15 - INFO - __main__ - Step 22529: {'lr': 0.000476638707586358, 'samples': 4325568, 'steps': 22528, 'loss/train': 1.7667334079742432} -11/07/2021 00:24:15 - INFO - __main__ - Step 22530: {'lr': 0.000476636467621814, 'samples': 4325760, 'steps': 22529, 'loss/train': 1.750614881515503} -11/07/2021 00:24:16 - INFO - __main__ - Step 22531: {'lr': 0.00047663422755515113, 'samples': 4325952, 'steps': 22530, 'loss/train': 1.5936520099639893} -11/07/2021 00:24:17 - INFO - __main__ - Step 22532: {'lr': 0.00047663198738637035, 'samples': 4326144, 'steps': 22531, 'loss/train': 1.118178367614746} -11/07/2021 00:24:17 - INFO - __main__ - Step 22533: {'lr': 0.00047662974711547274, 'samples': 4326336, 'steps': 22532, 'loss/train': 1.724767804145813} -11/07/2021 00:24:17 - INFO - __main__ - Step 22534: {'lr': 0.0004766275067424593, 'samples': 4326528, 'steps': 22533, 'loss/train': 2.0930192470550537} -11/07/2021 00:24:18 - INFO - __main__ - Step 22535: {'lr': 0.0004766252662673309, 'samples': 4326720, 'steps': 22534, 'loss/train': 1.5219659805297852} -11/07/2021 00:24:19 - INFO - __main__ - Step 22536: {'lr': 0.0004766230256900887, 'samples': 4326912, 'steps': 22535, 'loss/train': 2.0084965229034424} -11/07/2021 00:24:19 - INFO - __main__ - Step 22537: {'lr': 0.0004766207850107337, 'samples': 4327104, 'steps': 22536, 'loss/train': 2.0028364658355713} -11/07/2021 00:24:19 - INFO - __main__ - Step 22538: {'lr': 0.00047661854422926674, 'samples': 4327296, 'steps': 22537, 'loss/train': 1.4535870552062988} -11/07/2021 00:24:20 - INFO - __main__ - Step 22539: {'lr': 0.0004766163033456891, 'samples': 4327488, 'steps': 22538, 'loss/train': 1.8392276763916016} -11/07/2021 00:24:20 - INFO - __main__ - Step 22540: {'lr': 0.0004766140623600016, 'samples': 4327680, 'steps': 22539, 'loss/train': 1.4498977661132812} -11/07/2021 00:24:21 - INFO - __main__ - Step 22541: {'lr': 0.0004766118212722053, 'samples': 4327872, 'steps': 22540, 'loss/train': 1.1951019763946533} -11/07/2021 00:24:22 - INFO - __main__ - Step 22542: {'lr': 0.0004766095800823013, 'samples': 4328064, 'steps': 22541, 'loss/train': 1.4123594760894775} -11/07/2021 00:24:22 - INFO - __main__ - Step 22543: {'lr': 0.0004766073387902904, 'samples': 4328256, 'steps': 22542, 'loss/train': 1.3626255989074707} -11/07/2021 00:24:22 - INFO - __main__ - Step 22544: {'lr': 0.00047660509739617376, 'samples': 4328448, 'steps': 22543, 'loss/train': 1.6323630809783936} -11/07/2021 00:24:23 - INFO - __main__ - Step 22545: {'lr': 0.00047660285589995233, 'samples': 4328640, 'steps': 22544, 'loss/train': 1.4572019577026367} -11/07/2021 00:24:24 - INFO - __main__ - Step 22546: {'lr': 0.0004766006143016272, 'samples': 4328832, 'steps': 22545, 'loss/train': 1.5938409566879272} -11/07/2021 00:24:24 - INFO - __main__ - Step 22547: {'lr': 0.0004765983726011993, 'samples': 4329024, 'steps': 22546, 'loss/train': 1.2399224042892456} -11/07/2021 00:24:24 - INFO - __main__ - Step 22548: {'lr': 0.0004765961307986697, 'samples': 4329216, 'steps': 22547, 'loss/train': 1.8739992380142212} -11/07/2021 00:24:25 - INFO - __main__ - Step 22549: {'lr': 0.0004765938888940393, 'samples': 4329408, 'steps': 22548, 'loss/train': 1.5949848890304565} -11/07/2021 00:24:25 - INFO - __main__ - Step 22550: {'lr': 0.00047659164688730935, 'samples': 4329600, 'steps': 22549, 'loss/train': 1.728060007095337} -11/07/2021 00:24:26 - INFO - __main__ - Step 22551: {'lr': 0.00047658940477848056, 'samples': 4329792, 'steps': 22550, 'loss/train': 1.4984592199325562} -11/07/2021 00:24:26 - INFO - __main__ - Step 22552: {'lr': 0.00047658716256755414, 'samples': 4329984, 'steps': 22551, 'loss/train': 1.639998435974121} -11/07/2021 00:24:27 - INFO - __main__ - Step 22553: {'lr': 0.00047658492025453106, 'samples': 4330176, 'steps': 22552, 'loss/train': 1.548398494720459} -11/07/2021 00:24:27 - INFO - __main__ - Step 22554: {'lr': 0.00047658267783941223, 'samples': 4330368, 'steps': 22553, 'loss/train': 1.8560858964920044} -11/07/2021 00:24:27 - INFO - __main__ - Step 22555: {'lr': 0.0004765804353221988, 'samples': 4330560, 'steps': 22554, 'loss/train': 1.5847618579864502} -11/07/2021 00:24:29 - INFO - __main__ - Step 22556: {'lr': 0.0004765781927028917, 'samples': 4330752, 'steps': 22555, 'loss/train': 1.6546162366867065} -11/07/2021 00:24:29 - INFO - __main__ - Step 22557: {'lr': 0.000476575949981492, 'samples': 4330944, 'steps': 22556, 'loss/train': 1.2733675241470337} -11/07/2021 00:24:30 - INFO - __main__ - Step 22558: {'lr': 0.00047657370715800066, 'samples': 4331136, 'steps': 22557, 'loss/train': 1.3643406629562378} -11/07/2021 00:24:30 - INFO - __main__ - Step 22559: {'lr': 0.0004765714642324187, 'samples': 4331328, 'steps': 22558, 'loss/train': 1.1664093732833862} -11/07/2021 00:24:30 - INFO - __main__ - Step 22560: {'lr': 0.0004765692212047471, 'samples': 4331520, 'steps': 22559, 'loss/train': 1.8109169006347656} -11/07/2021 00:24:31 - INFO - __main__ - Step 22561: {'lr': 0.00047656697807498693, 'samples': 4331712, 'steps': 22560, 'loss/train': 0.23743750154972076} -11/07/2021 00:24:32 - INFO - __main__ - Step 22562: {'lr': 0.0004765647348431392, 'samples': 4331904, 'steps': 22561, 'loss/train': 1.1988426446914673} -11/07/2021 00:24:32 - INFO - __main__ - Step 22563: {'lr': 0.00047656249150920485, 'samples': 4332096, 'steps': 22562, 'loss/train': 1.4141286611557007} -11/07/2021 00:24:32 - INFO - __main__ - Step 22564: {'lr': 0.000476560248073185, 'samples': 4332288, 'steps': 22563, 'loss/train': 2.05336856842041} -11/07/2021 00:24:33 - INFO - __main__ - Step 22565: {'lr': 0.0004765580045350805, 'samples': 4332480, 'steps': 22564, 'loss/train': 1.3348045349121094} -11/07/2021 00:24:33 - INFO - __main__ - Step 22566: {'lr': 0.00047655576089489254, 'samples': 4332672, 'steps': 22565, 'loss/train': 1.850450038909912} -11/07/2021 00:24:34 - INFO - __main__ - Step 22567: {'lr': 0.00047655351715262205, 'samples': 4332864, 'steps': 22566, 'loss/train': 2.1595187187194824} -11/07/2021 00:24:34 - INFO - __main__ - Step 22568: {'lr': 0.00047655127330827, 'samples': 4333056, 'steps': 22567, 'loss/train': 1.5340650081634521} -11/07/2021 00:24:35 - INFO - __main__ - Step 22569: {'lr': 0.00047654902936183745, 'samples': 4333248, 'steps': 22568, 'loss/train': 1.7308131456375122} -11/07/2021 00:24:35 - INFO - __main__ - Step 22570: {'lr': 0.00047654678531332544, 'samples': 4333440, 'steps': 22569, 'loss/train': 1.0381836891174316} -11/07/2021 00:24:36 - INFO - __main__ - Step 22571: {'lr': 0.00047654454116273493, 'samples': 4333632, 'steps': 22570, 'loss/train': 1.6245771646499634} -11/07/2021 00:24:37 - INFO - __main__ - Step 22572: {'lr': 0.0004765422969100669, 'samples': 4333824, 'steps': 22571, 'loss/train': 1.6836577653884888} -11/07/2021 00:24:37 - INFO - __main__ - Step 22573: {'lr': 0.00047654005255532247, 'samples': 4334016, 'steps': 22572, 'loss/train': 1.4743589162826538} -11/07/2021 00:24:38 - INFO - __main__ - Step 22574: {'lr': 0.0004765378080985026, 'samples': 4334208, 'steps': 22573, 'loss/train': 1.1934410333633423} -11/07/2021 00:24:38 - INFO - __main__ - Step 22575: {'lr': 0.00047653556353960825, 'samples': 4334400, 'steps': 22574, 'loss/train': 1.6637202501296997} -11/07/2021 00:24:38 - INFO - __main__ - Step 22576: {'lr': 0.0004765333188786404, 'samples': 4334592, 'steps': 22575, 'loss/train': 1.433510661125183} -11/07/2021 00:24:40 - INFO - __main__ - Step 22577: {'lr': 0.00047653107411560025, 'samples': 4334784, 'steps': 22576, 'loss/train': 0.8190040588378906} -11/07/2021 00:24:40 - INFO - __main__ - Step 22578: {'lr': 0.00047652882925048863, 'samples': 4334976, 'steps': 22577, 'loss/train': 1.0744819641113281} -11/07/2021 00:24:40 - INFO - __main__ - Step 22579: {'lr': 0.00047652658428330664, 'samples': 4335168, 'steps': 22578, 'loss/train': 1.8014850616455078} -11/07/2021 00:24:41 - INFO - __main__ - Step 22580: {'lr': 0.00047652433921405526, 'samples': 4335360, 'steps': 22579, 'loss/train': 1.555201530456543} -11/07/2021 00:24:41 - INFO - __main__ - Step 22581: {'lr': 0.0004765220940427355, 'samples': 4335552, 'steps': 22580, 'loss/train': 1.776862621307373} -11/07/2021 00:24:41 - INFO - __main__ - Step 22582: {'lr': 0.0004765198487693484, 'samples': 4335744, 'steps': 22581, 'loss/train': 1.9247335195541382} -11/07/2021 00:24:42 - INFO - __main__ - Step 22583: {'lr': 0.00047651760339389494, 'samples': 4335936, 'steps': 22582, 'loss/train': 1.5864671468734741} -11/07/2021 00:24:43 - INFO - __main__ - Step 22584: {'lr': 0.0004765153579163761, 'samples': 4336128, 'steps': 22583, 'loss/train': 1.8406521081924438} -11/07/2021 00:24:43 - INFO - __main__ - Step 22585: {'lr': 0.000476513112336793, 'samples': 4336320, 'steps': 22584, 'loss/train': 1.4075356721878052} -11/07/2021 00:24:43 - INFO - __main__ - Step 22586: {'lr': 0.00047651086665514655, 'samples': 4336512, 'steps': 22585, 'loss/train': 1.6485368013381958} -11/07/2021 00:24:44 - INFO - __main__ - Step 22587: {'lr': 0.00047650862087143787, 'samples': 4336704, 'steps': 22586, 'loss/train': 1.588104248046875} -11/07/2021 00:24:44 - INFO - __main__ - Step 22588: {'lr': 0.0004765063749856678, 'samples': 4336896, 'steps': 22587, 'loss/train': 1.528891682624817} -11/07/2021 00:24:45 - INFO - __main__ - Step 22589: {'lr': 0.00047650412899783747, 'samples': 4337088, 'steps': 22588, 'loss/train': 1.6844433546066284} -11/07/2021 00:24:45 - INFO - __main__ - Step 22590: {'lr': 0.0004765018829079479, 'samples': 4337280, 'steps': 22589, 'loss/train': 2.1266448497772217} -11/07/2021 00:24:46 - INFO - __main__ - Step 22591: {'lr': 0.0004764996367160001, 'samples': 4337472, 'steps': 22590, 'loss/train': 1.5239567756652832} -11/07/2021 00:24:46 - INFO - __main__ - Step 22592: {'lr': 0.000476497390421995, 'samples': 4337664, 'steps': 22591, 'loss/train': 1.8610912561416626} -11/07/2021 00:24:47 - INFO - __main__ - Step 22593: {'lr': 0.00047649514402593377, 'samples': 4337856, 'steps': 22592, 'loss/train': 1.4386012554168701} -11/07/2021 00:24:48 - INFO - __main__ - Step 22594: {'lr': 0.0004764928975278172, 'samples': 4338048, 'steps': 22593, 'loss/train': 1.2887240648269653} -11/07/2021 00:24:48 - INFO - __main__ - Step 22595: {'lr': 0.0004764906509276465, 'samples': 4338240, 'steps': 22594, 'loss/train': 1.515057921409607} -11/07/2021 00:24:48 - INFO - __main__ - Step 22596: {'lr': 0.0004764884042254226, 'samples': 4338432, 'steps': 22595, 'loss/train': 1.320374846458435} -11/07/2021 00:24:49 - INFO - __main__ - Step 22597: {'lr': 0.0004764861574211465, 'samples': 4338624, 'steps': 22596, 'loss/train': 1.4135661125183105} -11/07/2021 00:24:49 - INFO - __main__ - Step 22598: {'lr': 0.0004764839105148193, 'samples': 4338816, 'steps': 22597, 'loss/train': 1.6835685968399048} -11/07/2021 00:24:49 - INFO - __main__ - Step 22599: {'lr': 0.00047648166350644185, 'samples': 4339008, 'steps': 22598, 'loss/train': 1.2688534259796143} -11/07/2021 00:24:51 - INFO - __main__ - Step 22600: {'lr': 0.00047647941639601535, 'samples': 4339200, 'steps': 22599, 'loss/train': 2.066715955734253} -11/07/2021 00:24:51 - INFO - __main__ - Step 22601: {'lr': 0.00047647716918354066, 'samples': 4339392, 'steps': 22600, 'loss/train': 5.759670734405518} -11/07/2021 00:24:51 - INFO - __main__ - Step 22602: {'lr': 0.00047647492186901884, 'samples': 4339584, 'steps': 22601, 'loss/train': 1.9553258419036865} -11/07/2021 00:24:52 - INFO - __main__ - Step 22603: {'lr': 0.0004764726744524509, 'samples': 4339776, 'steps': 22602, 'loss/train': 1.3782130479812622} -11/07/2021 00:24:52 - INFO - __main__ - Step 22604: {'lr': 0.0004764704269338379, 'samples': 4339968, 'steps': 22603, 'loss/train': 1.4786680936813354} -11/07/2021 00:24:52 - INFO - __main__ - Step 22605: {'lr': 0.00047646817931318086, 'samples': 4340160, 'steps': 22604, 'loss/train': 1.6348986625671387} -11/07/2021 00:24:53 - INFO - __main__ - Step 22606: {'lr': 0.0004764659315904807, 'samples': 4340352, 'steps': 22605, 'loss/train': 1.906373143196106} -11/07/2021 00:24:54 - INFO - __main__ - Step 22607: {'lr': 0.0004764636837657385, 'samples': 4340544, 'steps': 22606, 'loss/train': 1.5434366464614868} -11/07/2021 00:24:54 - INFO - __main__ - Step 22608: {'lr': 0.0004764614358389553, 'samples': 4340736, 'steps': 22607, 'loss/train': 1.7191797494888306} -11/07/2021 00:24:55 - INFO - __main__ - Step 22609: {'lr': 0.00047645918781013196, 'samples': 4340928, 'steps': 22608, 'loss/train': 1.4511476755142212} -11/07/2021 00:24:55 - INFO - __main__ - Step 22610: {'lr': 0.0004764569396792697, 'samples': 4341120, 'steps': 22609, 'loss/train': 1.2064729928970337} -11/07/2021 00:24:56 - INFO - __main__ - Step 22611: {'lr': 0.0004764546914463694, 'samples': 4341312, 'steps': 22610, 'loss/train': 1.7000502347946167} -11/07/2021 00:24:56 - INFO - __main__ - Step 22612: {'lr': 0.0004764524431114321, 'samples': 4341504, 'steps': 22611, 'loss/train': 1.9246582984924316} -11/07/2021 00:24:57 - INFO - __main__ - Step 22613: {'lr': 0.0004764501946744589, 'samples': 4341696, 'steps': 22612, 'loss/train': 1.507423996925354} -11/07/2021 00:24:57 - INFO - __main__ - Step 22614: {'lr': 0.00047644794613545065, 'samples': 4341888, 'steps': 22613, 'loss/train': 1.790145993232727} -11/07/2021 00:24:57 - INFO - __main__ - Step 22615: {'lr': 0.00047644569749440846, 'samples': 4342080, 'steps': 22614, 'loss/train': 1.3438689708709717} -11/07/2021 00:24:58 - INFO - __main__ - Step 22616: {'lr': 0.0004764434487513334, 'samples': 4342272, 'steps': 22615, 'loss/train': 1.449084997177124} -11/07/2021 00:24:59 - INFO - __main__ - Step 22617: {'lr': 0.00047644119990622637, 'samples': 4342464, 'steps': 22616, 'loss/train': 1.7146893739700317} -11/07/2021 00:24:59 - INFO - __main__ - Step 22618: {'lr': 0.0004764389509590884, 'samples': 4342656, 'steps': 22617, 'loss/train': 1.4914770126342773} -11/07/2021 00:24:59 - INFO - __main__ - Step 22619: {'lr': 0.0004764367019099206, 'samples': 4342848, 'steps': 22618, 'loss/train': 1.383577823638916} -11/07/2021 00:25:00 - INFO - __main__ - Step 22620: {'lr': 0.0004764344527587239, 'samples': 4343040, 'steps': 22619, 'loss/train': 1.3901386260986328} -11/07/2021 00:25:01 - INFO - __main__ - Step 22621: {'lr': 0.00047643220350549934, 'samples': 4343232, 'steps': 22620, 'loss/train': 1.5086541175842285} -11/07/2021 00:25:01 - INFO - __main__ - Step 22622: {'lr': 0.0004764299541502478, 'samples': 4343424, 'steps': 22621, 'loss/train': 1.4755960702896118} -11/07/2021 00:25:01 - INFO - __main__ - Step 22623: {'lr': 0.0004764277046929706, 'samples': 4343616, 'steps': 22622, 'loss/train': 1.5495747327804565} -11/07/2021 00:25:02 - INFO - __main__ - Step 22624: {'lr': 0.00047642545513366843, 'samples': 4343808, 'steps': 22623, 'loss/train': 2.366577625274658} -11/07/2021 00:25:02 - INFO - __main__ - Step 22625: {'lr': 0.0004764232054723425, 'samples': 4344000, 'steps': 22624, 'loss/train': 1.5127291679382324} -11/07/2021 00:25:03 - INFO - __main__ - Step 22626: {'lr': 0.0004764209557089938, 'samples': 4344192, 'steps': 22625, 'loss/train': 1.3345847129821777} -11/07/2021 00:25:03 - INFO - __main__ - Step 22627: {'lr': 0.00047641870584362323, 'samples': 4344384, 'steps': 22626, 'loss/train': 1.7284650802612305} -11/07/2021 00:25:04 - INFO - __main__ - Step 22628: {'lr': 0.00047641645587623196, 'samples': 4344576, 'steps': 22627, 'loss/train': 1.660504698753357} -11/07/2021 00:25:04 - INFO - __main__ - Step 22629: {'lr': 0.0004764142058068209, 'samples': 4344768, 'steps': 22628, 'loss/train': 1.7857352495193481} -11/07/2021 00:25:05 - INFO - __main__ - Step 22630: {'lr': 0.00047641195563539107, 'samples': 4344960, 'steps': 22629, 'loss/train': 1.4394036531448364} -11/07/2021 00:25:05 - INFO - __main__ - Step 22631: {'lr': 0.0004764097053619435, 'samples': 4345152, 'steps': 22630, 'loss/train': 1.6884974241256714} -11/07/2021 00:25:06 - INFO - __main__ - Step 22632: {'lr': 0.00047640745498647925, 'samples': 4345344, 'steps': 22631, 'loss/train': 1.6962106227874756} -11/07/2021 00:25:06 - INFO - __main__ - Step 22633: {'lr': 0.00047640520450899926, 'samples': 4345536, 'steps': 22632, 'loss/train': 1.340884804725647} -11/07/2021 00:25:07 - INFO - __main__ - Step 22634: {'lr': 0.0004764029539295046, 'samples': 4345728, 'steps': 22633, 'loss/train': 1.3287487030029297} -11/07/2021 00:25:07 - INFO - __main__ - Step 22635: {'lr': 0.0004764007032479963, 'samples': 4345920, 'steps': 22634, 'loss/train': 1.8320151567459106} -11/07/2021 00:25:07 - INFO - __main__ - Step 22636: {'lr': 0.00047639845246447534, 'samples': 4346112, 'steps': 22635, 'loss/train': 1.7329380512237549} -11/07/2021 00:25:08 - INFO - __main__ - Step 22637: {'lr': 0.00047639620157894264, 'samples': 4346304, 'steps': 22636, 'loss/train': 1.4954795837402344} -11/07/2021 00:25:09 - INFO - __main__ - Step 22638: {'lr': 0.00047639395059139936, 'samples': 4346496, 'steps': 22637, 'loss/train': 1.446747064590454} -11/07/2021 00:25:09 - INFO - __main__ - Step 22639: {'lr': 0.0004763916995018465, 'samples': 4346688, 'steps': 22638, 'loss/train': 1.718592643737793} -11/07/2021 00:25:09 - INFO - __main__ - Step 22640: {'lr': 0.00047638944831028497, 'samples': 4346880, 'steps': 22639, 'loss/train': 1.7990508079528809} -11/07/2021 00:25:10 - INFO - __main__ - Step 22641: {'lr': 0.00047638719701671587, 'samples': 4347072, 'steps': 22640, 'loss/train': 4.697803497314453} -11/07/2021 00:25:11 - INFO - __main__ - Step 22642: {'lr': 0.00047638494562114015, 'samples': 4347264, 'steps': 22641, 'loss/train': 1.645540714263916} -11/07/2021 00:25:11 - INFO - __main__ - Step 22643: {'lr': 0.0004763826941235589, 'samples': 4347456, 'steps': 22642, 'loss/train': 1.7661207914352417} -11/07/2021 00:25:11 - INFO - __main__ - Step 22644: {'lr': 0.00047638044252397313, 'samples': 4347648, 'steps': 22643, 'loss/train': 1.580713152885437} -11/07/2021 00:25:12 - INFO - __main__ - Step 22645: {'lr': 0.0004763781908223838, 'samples': 4347840, 'steps': 22644, 'loss/train': 1.46024489402771} -11/07/2021 00:25:12 - INFO - __main__ - Step 22646: {'lr': 0.00047637593901879194, 'samples': 4348032, 'steps': 22645, 'loss/train': 1.8002101182937622} -11/07/2021 00:25:13 - INFO - __main__ - Step 22647: {'lr': 0.00047637368711319863, 'samples': 4348224, 'steps': 22646, 'loss/train': 2.0005905628204346} -11/07/2021 00:25:14 - INFO - __main__ - Step 22648: {'lr': 0.00047637143510560477, 'samples': 4348416, 'steps': 22647, 'loss/train': 1.71867835521698} -11/07/2021 00:25:14 - INFO - __main__ - Step 22649: {'lr': 0.0004763691829960114, 'samples': 4348608, 'steps': 22648, 'loss/train': 1.8255470991134644} -11/07/2021 00:25:14 - INFO - __main__ - Step 22650: {'lr': 0.00047636693078441963, 'samples': 4348800, 'steps': 22649, 'loss/train': 1.0353654623031616} -11/07/2021 00:25:15 - INFO - __main__ - Step 22651: {'lr': 0.0004763646784708304, 'samples': 4348992, 'steps': 22650, 'loss/train': 1.4039242267608643} -11/07/2021 00:25:15 - INFO - __main__ - Step 22652: {'lr': 0.00047636242605524477, 'samples': 4349184, 'steps': 22651, 'loss/train': 1.3490198850631714} -11/07/2021 00:25:16 - INFO - __main__ - Step 22653: {'lr': 0.0004763601735376637, 'samples': 4349376, 'steps': 22652, 'loss/train': 2.0028791427612305} -11/07/2021 00:25:16 - INFO - __main__ - Step 22654: {'lr': 0.0004763579209180882, 'samples': 4349568, 'steps': 22653, 'loss/train': 1.5570244789123535} -11/07/2021 00:25:17 - INFO - __main__ - Step 22655: {'lr': 0.00047635566819651936, 'samples': 4349760, 'steps': 22654, 'loss/train': 1.7072210311889648} -11/07/2021 00:25:17 - INFO - __main__ - Step 22656: {'lr': 0.00047635341537295814, 'samples': 4349952, 'steps': 22655, 'loss/train': 1.369418740272522} -11/07/2021 00:25:17 - INFO - __main__ - Step 22657: {'lr': 0.0004763511624474055, 'samples': 4350144, 'steps': 22656, 'loss/train': 2.147608518600464} -11/07/2021 00:25:18 - INFO - __main__ - Step 22658: {'lr': 0.00047634890941986263, 'samples': 4350336, 'steps': 22657, 'loss/train': 1.8280770778656006} -11/07/2021 00:25:19 - INFO - __main__ - Step 22659: {'lr': 0.00047634665629033035, 'samples': 4350528, 'steps': 22658, 'loss/train': 1.259914755821228} -11/07/2021 00:25:19 - INFO - __main__ - Step 22660: {'lr': 0.00047634440305880976, 'samples': 4350720, 'steps': 22659, 'loss/train': 1.7895315885543823} -11/07/2021 00:25:19 - INFO - __main__ - Step 22661: {'lr': 0.0004763421497253019, 'samples': 4350912, 'steps': 22660, 'loss/train': 1.1604344844818115} -11/07/2021 00:25:20 - INFO - __main__ - Step 22662: {'lr': 0.0004763398962898078, 'samples': 4351104, 'steps': 22661, 'loss/train': 1.401200771331787} -11/07/2021 00:25:21 - INFO - __main__ - Step 22663: {'lr': 0.0004763376427523284, 'samples': 4351296, 'steps': 22662, 'loss/train': 1.4624043703079224} -11/07/2021 00:25:21 - INFO - __main__ - Step 22664: {'lr': 0.0004763353891128648, 'samples': 4351488, 'steps': 22663, 'loss/train': 0.9483494758605957} -11/07/2021 00:25:22 - INFO - __main__ - Step 22665: {'lr': 0.00047633313537141786, 'samples': 4351680, 'steps': 22664, 'loss/train': 1.6869838237762451} -11/07/2021 00:25:22 - INFO - __main__ - Step 22666: {'lr': 0.00047633088152798875, 'samples': 4351872, 'steps': 22665, 'loss/train': 1.3631956577301025} -11/07/2021 00:25:22 - INFO - __main__ - Step 22667: {'lr': 0.00047632862758257845, 'samples': 4352064, 'steps': 22666, 'loss/train': 1.072783350944519} -11/07/2021 00:25:23 - INFO - __main__ - Step 22668: {'lr': 0.0004763263735351879, 'samples': 4352256, 'steps': 22667, 'loss/train': 1.6640249490737915} -11/07/2021 00:25:24 - INFO - __main__ - Step 22669: {'lr': 0.0004763241193858183, 'samples': 4352448, 'steps': 22668, 'loss/train': 1.0642592906951904} -11/07/2021 00:25:24 - INFO - __main__ - Step 22670: {'lr': 0.00047632186513447045, 'samples': 4352640, 'steps': 22669, 'loss/train': 1.4311997890472412} -11/07/2021 00:25:24 - INFO - __main__ - Step 22671: {'lr': 0.0004763196107811455, 'samples': 4352832, 'steps': 22670, 'loss/train': 1.3761380910873413} -11/07/2021 00:25:25 - INFO - __main__ - Step 22672: {'lr': 0.0004763173563258444, 'samples': 4353024, 'steps': 22671, 'loss/train': 1.5977585315704346} -11/07/2021 00:25:25 - INFO - __main__ - Step 22673: {'lr': 0.0004763151017685682, 'samples': 4353216, 'steps': 22672, 'loss/train': 1.4709689617156982} -11/07/2021 00:25:26 - INFO - __main__ - Step 22674: {'lr': 0.0004763128471093179, 'samples': 4353408, 'steps': 22673, 'loss/train': 1.834922432899475} -11/07/2021 00:25:27 - INFO - __main__ - Step 22675: {'lr': 0.0004763105923480946, 'samples': 4353600, 'steps': 22674, 'loss/train': 1.8651885986328125} -11/07/2021 00:25:27 - INFO - __main__ - Step 22676: {'lr': 0.0004763083374848991, 'samples': 4353792, 'steps': 22675, 'loss/train': 1.3292526006698608} -11/07/2021 00:25:27 - INFO - __main__ - Step 22677: {'lr': 0.00047630608251973265, 'samples': 4353984, 'steps': 22676, 'loss/train': 2.0414798259735107} -11/07/2021 00:25:28 - INFO - __main__ - Step 22678: {'lr': 0.00047630382745259616, 'samples': 4354176, 'steps': 22677, 'loss/train': 1.8651529550552368} -11/07/2021 00:25:29 - INFO - __main__ - Step 22679: {'lr': 0.0004763015722834907, 'samples': 4354368, 'steps': 22678, 'loss/train': 1.882495403289795} -11/07/2021 00:25:29 - INFO - __main__ - Step 22680: {'lr': 0.00047629931701241715, 'samples': 4354560, 'steps': 22679, 'loss/train': 1.380403757095337} -11/07/2021 00:25:29 - INFO - __main__ - Step 22681: {'lr': 0.0004762970616393767, 'samples': 4354752, 'steps': 22680, 'loss/train': 1.7098302841186523} -11/07/2021 00:25:30 - INFO - __main__ - Step 22682: {'lr': 0.0004762948061643702, 'samples': 4354944, 'steps': 22681, 'loss/train': 1.2838383913040161} -11/07/2021 00:25:30 - INFO - __main__ - Step 22683: {'lr': 0.0004762925505873988, 'samples': 4355136, 'steps': 22682, 'loss/train': 1.9014365673065186} -11/07/2021 00:25:31 - INFO - __main__ - Step 22684: {'lr': 0.00047629029490846346, 'samples': 4355328, 'steps': 22683, 'loss/train': 1.598739743232727} -11/07/2021 00:25:31 - INFO - __main__ - Step 22685: {'lr': 0.00047628803912756523, 'samples': 4355520, 'steps': 22684, 'loss/train': 1.638590931892395} -11/07/2021 00:25:32 - INFO - __main__ - Step 22686: {'lr': 0.00047628578324470505, 'samples': 4355712, 'steps': 22685, 'loss/train': 1.5135688781738281} -11/07/2021 00:25:32 - INFO - __main__ - Step 22687: {'lr': 0.00047628352725988406, 'samples': 4355904, 'steps': 22686, 'loss/train': 2.5237491130828857} -11/07/2021 00:25:32 - INFO - __main__ - Step 22688: {'lr': 0.0004762812711731032, 'samples': 4356096, 'steps': 22687, 'loss/train': 1.1969538927078247} -11/07/2021 00:25:34 - INFO - __main__ - Step 22689: {'lr': 0.00047627901498436344, 'samples': 4356288, 'steps': 22688, 'loss/train': 1.1763588190078735} -11/07/2021 00:25:34 - INFO - __main__ - Step 22690: {'lr': 0.0004762767586936658, 'samples': 4356480, 'steps': 22689, 'loss/train': 1.466115117073059} -11/07/2021 00:25:34 - INFO - __main__ - Step 22691: {'lr': 0.00047627450230101144, 'samples': 4356672, 'steps': 22690, 'loss/train': 1.8381071090698242} -11/07/2021 00:25:35 - INFO - __main__ - Step 22692: {'lr': 0.0004762722458064013, 'samples': 4356864, 'steps': 22691, 'loss/train': 2.0725739002227783} -11/07/2021 00:25:35 - INFO - __main__ - Step 22693: {'lr': 0.0004762699892098363, 'samples': 4357056, 'steps': 22692, 'loss/train': 1.396986961364746} -11/07/2021 00:25:36 - INFO - __main__ - Step 22694: {'lr': 0.0004762677325113176, 'samples': 4357248, 'steps': 22693, 'loss/train': 1.1241483688354492} -11/07/2021 00:25:37 - INFO - __main__ - Step 22695: {'lr': 0.0004762654757108461, 'samples': 4357440, 'steps': 22694, 'loss/train': 1.4990808963775635} -11/07/2021 00:25:37 - INFO - __main__ - Step 22696: {'lr': 0.00047626321880842287, 'samples': 4357632, 'steps': 22695, 'loss/train': 1.609912395477295} -11/07/2021 00:25:37 - INFO - __main__ - Step 22697: {'lr': 0.00047626096180404895, 'samples': 4357824, 'steps': 22696, 'loss/train': 0.8824257850646973} -11/07/2021 00:25:38 - INFO - __main__ - Step 22698: {'lr': 0.0004762587046977253, 'samples': 4358016, 'steps': 22697, 'loss/train': 1.386871337890625} -11/07/2021 00:25:38 - INFO - __main__ - Step 22699: {'lr': 0.000476256447489453, 'samples': 4358208, 'steps': 22698, 'loss/train': 1.5603753328323364} -11/07/2021 00:25:39 - INFO - __main__ - Step 22700: {'lr': 0.000476254190179233, 'samples': 4358400, 'steps': 22699, 'loss/train': 1.339954137802124} -11/07/2021 00:25:40 - INFO - __main__ - Step 22701: {'lr': 0.0004762519327670664, 'samples': 4358592, 'steps': 22700, 'loss/train': 1.212175965309143} -11/07/2021 00:25:40 - INFO - __main__ - Step 22702: {'lr': 0.0004762496752529541, 'samples': 4358784, 'steps': 22701, 'loss/train': 1.3022215366363525} -11/07/2021 00:25:40 - INFO - __main__ - Step 22703: {'lr': 0.0004762474176368973, 'samples': 4358976, 'steps': 22702, 'loss/train': 1.2095423936843872} -11/07/2021 00:25:41 - INFO - __main__ - Step 22704: {'lr': 0.00047624515991889684, 'samples': 4359168, 'steps': 22703, 'loss/train': 1.5306414365768433} -11/07/2021 00:25:42 - INFO - __main__ - Step 22705: {'lr': 0.00047624290209895384, 'samples': 4359360, 'steps': 22704, 'loss/train': 1.1710671186447144} -11/07/2021 00:25:42 - INFO - __main__ - Step 22706: {'lr': 0.00047624064417706917, 'samples': 4359552, 'steps': 22705, 'loss/train': 1.3341710567474365} -11/07/2021 00:25:42 - INFO - __main__ - Step 22707: {'lr': 0.00047623838615324407, 'samples': 4359744, 'steps': 22706, 'loss/train': 1.8324825763702393} -11/07/2021 00:25:43 - INFO - __main__ - Step 22708: {'lr': 0.0004762361280274794, 'samples': 4359936, 'steps': 22707, 'loss/train': 1.2356606721878052} -11/07/2021 00:25:43 - INFO - __main__ - Step 22709: {'lr': 0.0004762338697997762, 'samples': 4360128, 'steps': 22708, 'loss/train': 1.3746553659439087} -11/07/2021 00:25:44 - INFO - __main__ - Step 22710: {'lr': 0.00047623161147013557, 'samples': 4360320, 'steps': 22709, 'loss/train': 1.6129733324050903} -11/07/2021 00:25:44 - INFO - __main__ - Step 22711: {'lr': 0.0004762293530385584, 'samples': 4360512, 'steps': 22710, 'loss/train': 1.0353015661239624} -11/07/2021 00:25:45 - INFO - __main__ - Step 22712: {'lr': 0.0004762270945050458, 'samples': 4360704, 'steps': 22711, 'loss/train': 1.751045823097229} -11/07/2021 00:25:45 - INFO - __main__ - Step 22713: {'lr': 0.00047622483586959877, 'samples': 4360896, 'steps': 22712, 'loss/train': 2.044782876968384} -11/07/2021 00:25:45 - INFO - __main__ - Step 22714: {'lr': 0.00047622257713221826, 'samples': 4361088, 'steps': 22713, 'loss/train': 1.5603699684143066} -11/07/2021 00:25:47 - INFO - __main__ - Step 22715: {'lr': 0.00047622031829290545, 'samples': 4361280, 'steps': 22714, 'loss/train': 1.6232585906982422} -11/07/2021 00:25:47 - INFO - __main__ - Step 22716: {'lr': 0.0004762180593516612, 'samples': 4361472, 'steps': 22715, 'loss/train': 1.375087857246399} -11/07/2021 00:25:47 - INFO - __main__ - Step 22717: {'lr': 0.0004762158003084867, 'samples': 4361664, 'steps': 22716, 'loss/train': 1.8091025352478027} -11/07/2021 00:25:48 - INFO - __main__ - Step 22718: {'lr': 0.0004762135411633827, 'samples': 4361856, 'steps': 22717, 'loss/train': 1.6967964172363281} -11/07/2021 00:25:48 - INFO - __main__ - Step 22719: {'lr': 0.0004762112819163504, 'samples': 4362048, 'steps': 22718, 'loss/train': 1.4949711561203003} -11/07/2021 00:25:48 - INFO - __main__ - Step 22720: {'lr': 0.0004762090225673908, 'samples': 4362240, 'steps': 22719, 'loss/train': 1.857780933380127} -11/07/2021 00:25:49 - INFO - __main__ - Step 22721: {'lr': 0.0004762067631165049, 'samples': 4362432, 'steps': 22720, 'loss/train': 1.3588804006576538} -11/07/2021 00:25:50 - INFO - __main__ - Step 22722: {'lr': 0.0004762045035636937, 'samples': 4362624, 'steps': 22721, 'loss/train': 1.1537671089172363} -11/07/2021 00:25:50 - INFO - __main__ - Step 22723: {'lr': 0.0004762022439089583, 'samples': 4362816, 'steps': 22722, 'loss/train': 1.5845859050750732} -11/07/2021 00:25:50 - INFO - __main__ - Step 22724: {'lr': 0.0004761999841522996, 'samples': 4363008, 'steps': 22723, 'loss/train': 1.457655668258667} -11/07/2021 00:25:51 - INFO - __main__ - Step 22725: {'lr': 0.0004761977242937188, 'samples': 4363200, 'steps': 22724, 'loss/train': 1.7326648235321045} -11/07/2021 00:25:52 - INFO - __main__ - Step 22726: {'lr': 0.00047619546433321663, 'samples': 4363392, 'steps': 22725, 'loss/train': 2.0075771808624268} -11/07/2021 00:25:52 - INFO - __main__ - Step 22727: {'lr': 0.00047619320427079437, 'samples': 4363584, 'steps': 22726, 'loss/train': 1.7012308835983276} -11/07/2021 00:25:52 - INFO - __main__ - Step 22728: {'lr': 0.00047619094410645293, 'samples': 4363776, 'steps': 22727, 'loss/train': 1.6955498456954956} -11/07/2021 00:25:53 - INFO - __main__ - Step 22729: {'lr': 0.0004761886838401933, 'samples': 4363968, 'steps': 22728, 'loss/train': 1.3284543752670288} -11/07/2021 00:25:53 - INFO - __main__ - Step 22730: {'lr': 0.0004761864234720166, 'samples': 4364160, 'steps': 22729, 'loss/train': 1.4040530920028687} -11/07/2021 00:25:54 - INFO - __main__ - Step 22731: {'lr': 0.00047618416300192375, 'samples': 4364352, 'steps': 22730, 'loss/train': 1.7706865072250366} -11/07/2021 00:25:55 - INFO - __main__ - Step 22732: {'lr': 0.0004761819024299158, 'samples': 4364544, 'steps': 22731, 'loss/train': 1.3994696140289307} -11/07/2021 00:25:55 - INFO - __main__ - Step 22733: {'lr': 0.0004761796417559938, 'samples': 4364736, 'steps': 22732, 'loss/train': 1.0253995656967163} -11/07/2021 00:25:55 - INFO - __main__ - Step 22734: {'lr': 0.0004761773809801587, 'samples': 4364928, 'steps': 22733, 'loss/train': 1.6148645877838135} -11/07/2021 00:25:56 - INFO - __main__ - Step 22735: {'lr': 0.0004761751201024116, 'samples': 4365120, 'steps': 22734, 'loss/train': 1.7968497276306152} -11/07/2021 00:25:56 - INFO - __main__ - Step 22736: {'lr': 0.0004761728591227535, 'samples': 4365312, 'steps': 22735, 'loss/train': 1.335252285003662} -11/07/2021 00:25:57 - INFO - __main__ - Step 22737: {'lr': 0.00047617059804118536, 'samples': 4365504, 'steps': 22736, 'loss/train': 1.6151665449142456} -11/07/2021 00:25:57 - INFO - __main__ - Step 22738: {'lr': 0.0004761683368577083, 'samples': 4365696, 'steps': 22737, 'loss/train': 1.8413608074188232} -11/07/2021 00:25:58 - INFO - __main__ - Step 22739: {'lr': 0.0004761660755723232, 'samples': 4365888, 'steps': 22738, 'loss/train': 1.8213224411010742} -11/07/2021 00:25:58 - INFO - __main__ - Step 22740: {'lr': 0.0004761638141850312, 'samples': 4366080, 'steps': 22739, 'loss/train': 0.6306785345077515} -11/07/2021 00:25:58 - INFO - __main__ - Step 22741: {'lr': 0.0004761615526958333, 'samples': 4366272, 'steps': 22740, 'loss/train': 2.021019697189331} -11/07/2021 00:26:00 - INFO - __main__ - Step 22742: {'lr': 0.0004761592911047304, 'samples': 4366464, 'steps': 22741, 'loss/train': 1.3894141912460327} -11/07/2021 00:26:00 - INFO - __main__ - Step 22743: {'lr': 0.00047615702941172366, 'samples': 4366656, 'steps': 22742, 'loss/train': 1.7450761795043945} -11/07/2021 00:26:00 - INFO - __main__ - Step 22744: {'lr': 0.0004761547676168141, 'samples': 4366848, 'steps': 22743, 'loss/train': 1.6096402406692505} -11/07/2021 00:26:01 - INFO - __main__ - Step 22745: {'lr': 0.0004761525057200027, 'samples': 4367040, 'steps': 22744, 'loss/train': 1.6301637887954712} -11/07/2021 00:26:01 - INFO - __main__ - Step 22746: {'lr': 0.00047615024372129033, 'samples': 4367232, 'steps': 22745, 'loss/train': 1.208552360534668} -11/07/2021 00:26:01 - INFO - __main__ - Step 22747: {'lr': 0.0004761479816206783, 'samples': 4367424, 'steps': 22746, 'loss/train': 1.8603065013885498} -11/07/2021 00:26:02 - INFO - __main__ - Step 22748: {'lr': 0.00047614571941816743, 'samples': 4367616, 'steps': 22747, 'loss/train': 1.9403351545333862} -11/07/2021 00:26:03 - INFO - __main__ - Step 22749: {'lr': 0.00047614345711375874, 'samples': 4367808, 'steps': 22748, 'loss/train': 1.3546077013015747} -11/07/2021 00:26:03 - INFO - __main__ - Step 22750: {'lr': 0.0004761411947074533, 'samples': 4368000, 'steps': 22749, 'loss/train': 1.303208351135254} -11/07/2021 00:26:03 - INFO - __main__ - Step 22751: {'lr': 0.00047613893219925217, 'samples': 4368192, 'steps': 22750, 'loss/train': 1.6966766119003296} -11/07/2021 00:26:04 - INFO - __main__ - Step 22752: {'lr': 0.00047613666958915636, 'samples': 4368384, 'steps': 22751, 'loss/train': 1.6795576810836792} -11/07/2021 00:26:05 - INFO - __main__ - Step 22753: {'lr': 0.0004761344068771668, 'samples': 4368576, 'steps': 22752, 'loss/train': 1.901644229888916} -11/07/2021 00:26:05 - INFO - __main__ - Step 22754: {'lr': 0.0004761321440632846, 'samples': 4368768, 'steps': 22753, 'loss/train': 1.7572957277297974} -11/07/2021 00:26:05 - INFO - __main__ - Step 22755: {'lr': 0.00047612988114751074, 'samples': 4368960, 'steps': 22754, 'loss/train': 1.728715181350708} -11/07/2021 00:26:06 - INFO - __main__ - Step 22756: {'lr': 0.00047612761812984626, 'samples': 4369152, 'steps': 22755, 'loss/train': 1.803318738937378} -11/07/2021 00:26:06 - INFO - __main__ - Step 22757: {'lr': 0.00047612535501029215, 'samples': 4369344, 'steps': 22756, 'loss/train': 1.694913625717163} -11/07/2021 00:26:07 - INFO - __main__ - Step 22758: {'lr': 0.0004761230917888494, 'samples': 4369536, 'steps': 22757, 'loss/train': 1.8466224670410156} -11/07/2021 00:26:08 - INFO - __main__ - Step 22759: {'lr': 0.00047612082846551913, 'samples': 4369728, 'steps': 22758, 'loss/train': 1.1649069786071777} -11/07/2021 00:26:08 - INFO - __main__ - Step 22760: {'lr': 0.0004761185650403023, 'samples': 4369920, 'steps': 22759, 'loss/train': 1.9606319665908813} -11/07/2021 00:26:08 - INFO - __main__ - Step 22761: {'lr': 0.0004761163015131999, 'samples': 4370112, 'steps': 22760, 'loss/train': 1.2533822059631348} -11/07/2021 00:26:09 - INFO - __main__ - Step 22762: {'lr': 0.00047611403788421305, 'samples': 4370304, 'steps': 22761, 'loss/train': 1.934218168258667} -11/07/2021 00:26:10 - INFO - __main__ - Step 22763: {'lr': 0.0004761117741533426, 'samples': 4370496, 'steps': 22762, 'loss/train': 1.782967209815979} -11/07/2021 00:26:10 - INFO - __main__ - Step 22764: {'lr': 0.0004761095103205897, 'samples': 4370688, 'steps': 22763, 'loss/train': 1.5865823030471802} -11/07/2021 00:26:10 - INFO - __main__ - Step 22765: {'lr': 0.00047610724638595545, 'samples': 4370880, 'steps': 22764, 'loss/train': 1.7549775838851929} -11/07/2021 00:26:11 - INFO - __main__ - Step 22766: {'lr': 0.00047610498234944065, 'samples': 4371072, 'steps': 22765, 'loss/train': 1.639030933380127} -11/07/2021 00:26:11 - INFO - __main__ - Step 22767: {'lr': 0.00047610271821104647, 'samples': 4371264, 'steps': 22766, 'loss/train': 1.582705020904541} -11/07/2021 00:26:12 - INFO - __main__ - Step 22768: {'lr': 0.0004761004539707739, 'samples': 4371456, 'steps': 22767, 'loss/train': 1.0878734588623047} -11/07/2021 00:26:13 - INFO - __main__ - Step 22769: {'lr': 0.00047609818962862394, 'samples': 4371648, 'steps': 22768, 'loss/train': 1.2499237060546875} -11/07/2021 00:26:13 - INFO - __main__ - Step 22770: {'lr': 0.00047609592518459766, 'samples': 4371840, 'steps': 22769, 'loss/train': 1.562828540802002} -11/07/2021 00:26:13 - INFO - __main__ - Step 22771: {'lr': 0.00047609366063869595, 'samples': 4372032, 'steps': 22770, 'loss/train': 1.1859840154647827} -11/07/2021 00:26:14 - INFO - __main__ - Step 22772: {'lr': 0.00047609139599092006, 'samples': 4372224, 'steps': 22771, 'loss/train': 1.7285878658294678} -11/07/2021 00:26:14 - INFO - __main__ - Step 22773: {'lr': 0.0004760891312412708, 'samples': 4372416, 'steps': 22772, 'loss/train': 1.5550551414489746} -11/07/2021 00:26:15 - INFO - __main__ - Step 22774: {'lr': 0.0004760868663897493, 'samples': 4372608, 'steps': 22773, 'loss/train': 1.689923882484436} -11/07/2021 00:26:15 - INFO - __main__ - Step 22775: {'lr': 0.0004760846014363565, 'samples': 4372800, 'steps': 22774, 'loss/train': 1.6872327327728271} -11/07/2021 00:26:16 - INFO - __main__ - Step 22776: {'lr': 0.0004760823363810935, 'samples': 4372992, 'steps': 22775, 'loss/train': 1.6919316053390503} -11/07/2021 00:26:16 - INFO - __main__ - Step 22777: {'lr': 0.0004760800712239612, 'samples': 4373184, 'steps': 22776, 'loss/train': 1.7831788063049316} -11/07/2021 00:26:17 - INFO - __main__ - Step 22778: {'lr': 0.0004760778059649609, 'samples': 4373376, 'steps': 22777, 'loss/train': 1.4779175519943237} -11/07/2021 00:26:17 - INFO - __main__ - Step 22779: {'lr': 0.0004760755406040933, 'samples': 4373568, 'steps': 22778, 'loss/train': 1.4688366651535034} -11/07/2021 00:26:18 - INFO - __main__ - Step 22780: {'lr': 0.00047607327514135955, 'samples': 4373760, 'steps': 22779, 'loss/train': 1.6470462083816528} -11/07/2021 00:26:18 - INFO - __main__ - Step 22781: {'lr': 0.00047607100957676067, 'samples': 4373952, 'steps': 22780, 'loss/train': 1.4926844835281372} -11/07/2021 00:26:18 - INFO - __main__ - Step 22782: {'lr': 0.0004760687439102977, 'samples': 4374144, 'steps': 22781, 'loss/train': 1.4573156833648682} -11/07/2021 00:26:19 - INFO - __main__ - Step 22783: {'lr': 0.0004760664781419717, 'samples': 4374336, 'steps': 22782, 'loss/train': 1.8104127645492554} -11/07/2021 00:26:20 - INFO - __main__ - Step 22784: {'lr': 0.00047606421227178354, 'samples': 4374528, 'steps': 22783, 'loss/train': 1.9405661821365356} -11/07/2021 00:26:20 - INFO - __main__ - Step 22785: {'lr': 0.0004760619462997343, 'samples': 4374720, 'steps': 22784, 'loss/train': 1.883963942527771} -11/07/2021 00:26:20 - INFO - __main__ - Step 22786: {'lr': 0.00047605968022582513, 'samples': 4374912, 'steps': 22785, 'loss/train': 1.4331687688827515} -11/07/2021 00:26:21 - INFO - __main__ - Step 22787: {'lr': 0.000476057414050057, 'samples': 4375104, 'steps': 22786, 'loss/train': 1.257065773010254} -11/07/2021 00:26:21 - INFO - __main__ - Step 22788: {'lr': 0.00047605514777243076, 'samples': 4375296, 'steps': 22787, 'loss/train': 1.6153793334960938} -11/07/2021 00:26:22 - INFO - __main__ - Step 22789: {'lr': 0.0004760528813929476, 'samples': 4375488, 'steps': 22788, 'loss/train': 2.338101387023926} -11/07/2021 00:26:23 - INFO - __main__ - Step 22790: {'lr': 0.0004760506149116085, 'samples': 4375680, 'steps': 22789, 'loss/train': 2.3699982166290283} -11/07/2021 00:26:23 - INFO - __main__ - Step 22791: {'lr': 0.0004760483483284145, 'samples': 4375872, 'steps': 22790, 'loss/train': 1.6395772695541382} -11/07/2021 00:26:23 - INFO - __main__ - Step 22792: {'lr': 0.0004760460816433666, 'samples': 4376064, 'steps': 22791, 'loss/train': 1.8664559125900269} -11/07/2021 00:26:24 - INFO - __main__ - Step 22793: {'lr': 0.0004760438148564659, 'samples': 4376256, 'steps': 22792, 'loss/train': 1.484313726425171} -11/07/2021 00:26:24 - INFO - __main__ - Step 22794: {'lr': 0.00047604154796771327, 'samples': 4376448, 'steps': 22793, 'loss/train': 1.7671095132827759} -11/07/2021 00:26:25 - INFO - __main__ - Step 22795: {'lr': 0.0004760392809771098, 'samples': 4376640, 'steps': 22794, 'loss/train': 1.3843249082565308} -11/07/2021 00:26:25 - INFO - __main__ - Step 22796: {'lr': 0.00047603701388465646, 'samples': 4376832, 'steps': 22795, 'loss/train': 1.696913242340088} -11/07/2021 00:26:26 - INFO - __main__ - Step 22797: {'lr': 0.0004760347466903544, 'samples': 4377024, 'steps': 22796, 'loss/train': 1.2284456491470337} -11/07/2021 00:26:26 - INFO - __main__ - Step 22798: {'lr': 0.0004760324793942046, 'samples': 4377216, 'steps': 22797, 'loss/train': 1.663573145866394} -11/07/2021 00:26:26 - INFO - __main__ - Step 22799: {'lr': 0.000476030211996208, 'samples': 4377408, 'steps': 22798, 'loss/train': 1.5763083696365356} -11/07/2021 00:26:27 - INFO - __main__ - Step 22800: {'lr': 0.0004760279444963657, 'samples': 4377600, 'steps': 22799, 'loss/train': 1.9171547889709473} -11/07/2021 00:26:28 - INFO - __main__ - Step 22801: {'lr': 0.0004760256768946787, 'samples': 4377792, 'steps': 22800, 'loss/train': 1.7655497789382935} -11/07/2021 00:26:28 - INFO - __main__ - Step 22802: {'lr': 0.00047602340919114793, 'samples': 4377984, 'steps': 22801, 'loss/train': 1.8714632987976074} -11/07/2021 00:26:28 - INFO - __main__ - Step 22803: {'lr': 0.00047602114138577464, 'samples': 4378176, 'steps': 22802, 'loss/train': 1.8071902990341187} -11/07/2021 00:26:29 - INFO - __main__ - Step 22804: {'lr': 0.00047601887347855965, 'samples': 4378368, 'steps': 22803, 'loss/train': 1.7482866048812866} -11/07/2021 00:26:30 - INFO - __main__ - Step 22805: {'lr': 0.00047601660546950396, 'samples': 4378560, 'steps': 22804, 'loss/train': 1.632975697517395} -11/07/2021 00:26:30 - INFO - __main__ - Step 22806: {'lr': 0.0004760143373586088, 'samples': 4378752, 'steps': 22805, 'loss/train': 1.297473430633545} -11/07/2021 00:26:30 - INFO - __main__ - Step 22807: {'lr': 0.000476012069145875, 'samples': 4378944, 'steps': 22806, 'loss/train': 1.1406476497650146} -11/07/2021 00:26:31 - INFO - __main__ - Step 22808: {'lr': 0.00047600980083130367, 'samples': 4379136, 'steps': 22807, 'loss/train': 1.5739290714263916} -11/07/2021 00:26:31 - INFO - __main__ - Step 22809: {'lr': 0.0004760075324148959, 'samples': 4379328, 'steps': 22808, 'loss/train': 1.4321844577789307} -11/07/2021 00:26:32 - INFO - __main__ - Step 22810: {'lr': 0.00047600526389665246, 'samples': 4379520, 'steps': 22809, 'loss/train': 2.083242893218994} -11/07/2021 00:26:33 - INFO - __main__ - Step 22811: {'lr': 0.00047600299527657464, 'samples': 4379712, 'steps': 22810, 'loss/train': 1.2935341596603394} -11/07/2021 00:26:33 - INFO - __main__ - Step 22812: {'lr': 0.0004760007265546633, 'samples': 4379904, 'steps': 22811, 'loss/train': 1.2957768440246582} -11/07/2021 00:26:33 - INFO - __main__ - Step 22813: {'lr': 0.00047599845773091957, 'samples': 4380096, 'steps': 22812, 'loss/train': 1.912548303604126} -11/07/2021 00:26:34 - INFO - __main__ - Step 22814: {'lr': 0.0004759961888053444, 'samples': 4380288, 'steps': 22813, 'loss/train': 1.8325461149215698} -11/07/2021 00:26:34 - INFO - __main__ - Step 22815: {'lr': 0.00047599391977793884, 'samples': 4380480, 'steps': 22814, 'loss/train': 2.203472375869751} -11/07/2021 00:26:35 - INFO - __main__ - Step 22816: {'lr': 0.00047599165064870385, 'samples': 4380672, 'steps': 22815, 'loss/train': 1.6262705326080322} -11/07/2021 00:26:36 - INFO - __main__ - Step 22817: {'lr': 0.0004759893814176406, 'samples': 4380864, 'steps': 22816, 'loss/train': 1.609465479850769} -11/07/2021 00:26:36 - INFO - __main__ - Step 22818: {'lr': 0.00047598711208475, 'samples': 4381056, 'steps': 22817, 'loss/train': 1.697596549987793} -11/07/2021 00:26:36 - INFO - __main__ - Step 22819: {'lr': 0.00047598484265003307, 'samples': 4381248, 'steps': 22818, 'loss/train': 1.49398934841156} -11/07/2021 00:26:37 - INFO - __main__ - Step 22820: {'lr': 0.00047598257311349087, 'samples': 4381440, 'steps': 22819, 'loss/train': 1.8012315034866333} -11/07/2021 00:26:38 - INFO - __main__ - Step 22821: {'lr': 0.0004759803034751244, 'samples': 4381632, 'steps': 22820, 'loss/train': 1.7763862609863281} -11/07/2021 00:26:38 - INFO - __main__ - Step 22822: {'lr': 0.0004759780337349347, 'samples': 4381824, 'steps': 22821, 'loss/train': 1.1558592319488525} -11/07/2021 00:26:38 - INFO - __main__ - Step 22823: {'lr': 0.0004759757638929227, 'samples': 4382016, 'steps': 22822, 'loss/train': 1.7096298933029175} -11/07/2021 00:26:39 - INFO - __main__ - Step 22824: {'lr': 0.00047597349394908967, 'samples': 4382208, 'steps': 22823, 'loss/train': 1.0129907131195068} -11/07/2021 00:26:39 - INFO - __main__ - Step 22825: {'lr': 0.0004759712239034364, 'samples': 4382400, 'steps': 22824, 'loss/train': 2.0725107192993164} -11/07/2021 00:26:40 - INFO - __main__ - Step 22826: {'lr': 0.0004759689537559639, 'samples': 4382592, 'steps': 22825, 'loss/train': 0.44292402267456055} -11/07/2021 00:26:41 - INFO - __main__ - Step 22827: {'lr': 0.0004759666835066734, 'samples': 4382784, 'steps': 22826, 'loss/train': 1.713152527809143} -11/07/2021 00:26:41 - INFO - __main__ - Step 22828: {'lr': 0.00047596441315556575, 'samples': 4382976, 'steps': 22827, 'loss/train': 0.9748886227607727} -11/07/2021 00:26:41 - INFO - __main__ - Step 22829: {'lr': 0.00047596214270264204, 'samples': 4383168, 'steps': 22828, 'loss/train': 1.3580565452575684} -11/07/2021 00:26:42 - INFO - __main__ - Step 22830: {'lr': 0.00047595987214790324, 'samples': 4383360, 'steps': 22829, 'loss/train': 1.7348219156265259} -11/07/2021 00:26:43 - INFO - __main__ - Step 22831: {'lr': 0.0004759576014913505, 'samples': 4383552, 'steps': 22830, 'loss/train': 1.497948408126831} -11/07/2021 00:26:43 - INFO - __main__ - Step 22832: {'lr': 0.0004759553307329846, 'samples': 4383744, 'steps': 22831, 'loss/train': 1.397659182548523} -11/07/2021 00:26:43 - INFO - __main__ - Step 22833: {'lr': 0.0004759530598728068, 'samples': 4383936, 'steps': 22832, 'loss/train': 1.3267203569412231} -11/07/2021 00:26:44 - INFO - __main__ - Step 22834: {'lr': 0.000475950788910818, 'samples': 4384128, 'steps': 22833, 'loss/train': 1.3071024417877197} -11/07/2021 00:26:44 - INFO - __main__ - Step 22835: {'lr': 0.0004759485178470193, 'samples': 4384320, 'steps': 22834, 'loss/train': 1.684517502784729} -11/07/2021 00:26:45 - INFO - __main__ - Step 22836: {'lr': 0.0004759462466814117, 'samples': 4384512, 'steps': 22835, 'loss/train': 0.7335377335548401} -11/07/2021 00:26:45 - INFO - __main__ - Step 22837: {'lr': 0.0004759439754139962, 'samples': 4384704, 'steps': 22836, 'loss/train': 1.4387019872665405} -11/07/2021 00:26:46 - INFO - __main__ - Step 22838: {'lr': 0.0004759417040447738, 'samples': 4384896, 'steps': 22837, 'loss/train': 1.5750333070755005} -11/07/2021 00:26:46 - INFO - __main__ - Step 22839: {'lr': 0.00047593943257374563, 'samples': 4385088, 'steps': 22838, 'loss/train': 1.6899166107177734} -11/07/2021 00:26:47 - INFO - __main__ - Step 22840: {'lr': 0.00047593716100091253, 'samples': 4385280, 'steps': 22839, 'loss/train': 1.795365571975708} -11/07/2021 00:26:47 - INFO - __main__ - Step 22841: {'lr': 0.00047593488932627567, 'samples': 4385472, 'steps': 22840, 'loss/train': 1.5965057611465454} -11/07/2021 00:26:48 - INFO - __main__ - Step 22842: {'lr': 0.00047593261754983607, 'samples': 4385664, 'steps': 22841, 'loss/train': 1.7863192558288574} -11/07/2021 00:26:48 - INFO - __main__ - Step 22843: {'lr': 0.00047593034567159465, 'samples': 4385856, 'steps': 22842, 'loss/train': 2.4589531421661377} -11/07/2021 00:26:49 - INFO - __main__ - Step 22844: {'lr': 0.00047592807369155256, 'samples': 4386048, 'steps': 22843, 'loss/train': 1.5386347770690918} -11/07/2021 00:26:49 - INFO - __main__ - Step 22845: {'lr': 0.0004759258016097108, 'samples': 4386240, 'steps': 22844, 'loss/train': 1.98453950881958} -11/07/2021 00:26:49 - INFO - __main__ - Step 22846: {'lr': 0.0004759235294260703, 'samples': 4386432, 'steps': 22845, 'loss/train': 1.771543264389038} -11/07/2021 00:26:50 - INFO - __main__ - Step 22847: {'lr': 0.0004759212571406321, 'samples': 4386624, 'steps': 22846, 'loss/train': 1.4666595458984375} -11/07/2021 00:26:51 - INFO - __main__ - Step 22848: {'lr': 0.00047591898475339735, 'samples': 4386816, 'steps': 22847, 'loss/train': 1.6236677169799805} -11/07/2021 00:26:51 - INFO - __main__ - Step 22849: {'lr': 0.00047591671226436695, 'samples': 4387008, 'steps': 22848, 'loss/train': 1.4926680326461792} -11/07/2021 00:26:51 - INFO - __main__ - Step 22850: {'lr': 0.00047591443967354196, 'samples': 4387200, 'steps': 22849, 'loss/train': 1.6243668794631958} -11/07/2021 00:26:52 - INFO - __main__ - Step 22851: {'lr': 0.00047591216698092344, 'samples': 4387392, 'steps': 22850, 'loss/train': 1.8379485607147217} -11/07/2021 00:26:53 - INFO - __main__ - Step 22852: {'lr': 0.00047590989418651243, 'samples': 4387584, 'steps': 22851, 'loss/train': 1.4109525680541992} -11/07/2021 00:26:53 - INFO - __main__ - Step 22853: {'lr': 0.00047590762129030986, 'samples': 4387776, 'steps': 22852, 'loss/train': 0.5099748969078064} -11/07/2021 00:26:53 - INFO - __main__ - Step 22854: {'lr': 0.00047590534829231675, 'samples': 4387968, 'steps': 22853, 'loss/train': 1.7714526653289795} -11/07/2021 00:26:54 - INFO - __main__ - Step 22855: {'lr': 0.00047590307519253423, 'samples': 4388160, 'steps': 22854, 'loss/train': 1.9432487487792969} -11/07/2021 00:26:54 - INFO - __main__ - Step 22856: {'lr': 0.00047590080199096324, 'samples': 4388352, 'steps': 22855, 'loss/train': 0.7025504112243652} -11/07/2021 00:26:55 - INFO - __main__ - Step 22857: {'lr': 0.00047589852868760486, 'samples': 4388544, 'steps': 22856, 'loss/train': 1.6349374055862427} -11/07/2021 00:26:55 - INFO - __main__ - Step 22858: {'lr': 0.00047589625528246006, 'samples': 4388736, 'steps': 22857, 'loss/train': 1.535549283027649} -11/07/2021 00:26:56 - INFO - __main__ - Step 22859: {'lr': 0.0004758939817755299, 'samples': 4388928, 'steps': 22858, 'loss/train': 1.5929142236709595} -11/07/2021 00:26:56 - INFO - __main__ - Step 22860: {'lr': 0.0004758917081668155, 'samples': 4389120, 'steps': 22859, 'loss/train': 1.5244239568710327} -11/07/2021 00:26:56 - INFO - __main__ - Step 22861: {'lr': 0.00047588943445631767, 'samples': 4389312, 'steps': 22860, 'loss/train': 1.5270912647247314} -11/07/2021 00:26:58 - INFO - __main__ - Step 22862: {'lr': 0.0004758871606440376, 'samples': 4389504, 'steps': 22861, 'loss/train': 1.3322381973266602} -11/07/2021 00:26:58 - INFO - __main__ - Step 22863: {'lr': 0.0004758848867299762, 'samples': 4389696, 'steps': 22862, 'loss/train': 1.7966527938842773} -11/07/2021 00:26:58 - INFO - __main__ - Step 22864: {'lr': 0.0004758826127141346, 'samples': 4389888, 'steps': 22863, 'loss/train': 1.5517232418060303} -11/07/2021 00:26:59 - INFO - __main__ - Step 22865: {'lr': 0.00047588033859651376, 'samples': 4390080, 'steps': 22864, 'loss/train': 1.1566221714019775} -11/07/2021 00:26:59 - INFO - __main__ - Step 22866: {'lr': 0.00047587806437711475, 'samples': 4390272, 'steps': 22865, 'loss/train': 1.6851732730865479} -11/07/2021 00:27:00 - INFO - __main__ - Step 22867: {'lr': 0.0004758757900559385, 'samples': 4390464, 'steps': 22866, 'loss/train': 0.689471960067749} -11/07/2021 00:27:00 - INFO - __main__ - Step 22868: {'lr': 0.0004758735156329862, 'samples': 4390656, 'steps': 22867, 'loss/train': 1.991492748260498} -11/07/2021 00:27:01 - INFO - __main__ - Step 22869: {'lr': 0.00047587124110825874, 'samples': 4390848, 'steps': 22868, 'loss/train': 1.6657304763793945} -11/07/2021 00:27:01 - INFO - __main__ - Step 22870: {'lr': 0.00047586896648175715, 'samples': 4391040, 'steps': 22869, 'loss/train': 1.4751023054122925} -11/07/2021 00:27:01 - INFO - __main__ - Step 22871: {'lr': 0.00047586669175348254, 'samples': 4391232, 'steps': 22870, 'loss/train': 1.5636752843856812} -11/07/2021 00:27:02 - INFO - __main__ - Step 22872: {'lr': 0.0004758644169234359, 'samples': 4391424, 'steps': 22871, 'loss/train': 1.8853099346160889} -11/07/2021 00:27:03 - INFO - __main__ - Step 22873: {'lr': 0.00047586214199161814, 'samples': 4391616, 'steps': 22872, 'loss/train': 1.800837755203247} -11/07/2021 00:27:03 - INFO - __main__ - Step 22874: {'lr': 0.00047585986695803046, 'samples': 4391808, 'steps': 22873, 'loss/train': 1.3251843452453613} -11/07/2021 00:27:04 - INFO - __main__ - Step 22875: {'lr': 0.0004758575918226738, 'samples': 4392000, 'steps': 22874, 'loss/train': 2.003358840942383} -11/07/2021 00:27:04 - INFO - __main__ - Step 22876: {'lr': 0.0004758553165855492, 'samples': 4392192, 'steps': 22875, 'loss/train': 1.644388198852539} -11/07/2021 00:27:04 - INFO - __main__ - Step 22877: {'lr': 0.00047585304124665766, 'samples': 4392384, 'steps': 22876, 'loss/train': 1.8481217622756958} -11/07/2021 00:27:05 - INFO - __main__ - Step 22878: {'lr': 0.0004758507658060003, 'samples': 4392576, 'steps': 22877, 'loss/train': 1.3295446634292603} -11/07/2021 00:27:06 - INFO - __main__ - Step 22879: {'lr': 0.00047584849026357796, 'samples': 4392768, 'steps': 22878, 'loss/train': 1.9172389507293701} -11/07/2021 00:27:06 - INFO - __main__ - Step 22880: {'lr': 0.0004758462146193918, 'samples': 4392960, 'steps': 22879, 'loss/train': 1.363627314567566} -11/07/2021 00:27:06 - INFO - __main__ - Step 22881: {'lr': 0.00047584393887344285, 'samples': 4393152, 'steps': 22880, 'loss/train': 1.7900865077972412} -11/07/2021 00:27:07 - INFO - __main__ - Step 22882: {'lr': 0.00047584166302573204, 'samples': 4393344, 'steps': 22881, 'loss/train': 1.6964235305786133} -11/07/2021 00:27:08 - INFO - __main__ - Step 22883: {'lr': 0.0004758393870762606, 'samples': 4393536, 'steps': 22882, 'loss/train': 1.4693646430969238} -11/07/2021 00:27:08 - INFO - __main__ - Step 22884: {'lr': 0.00047583711102502934, 'samples': 4393728, 'steps': 22883, 'loss/train': 1.5916904211044312} -11/07/2021 00:27:08 - INFO - __main__ - Step 22885: {'lr': 0.0004758348348720393, 'samples': 4393920, 'steps': 22884, 'loss/train': 1.60740327835083} -11/07/2021 00:27:09 - INFO - __main__ - Step 22886: {'lr': 0.00047583255861729167, 'samples': 4394112, 'steps': 22885, 'loss/train': 1.265206217765808} -11/07/2021 00:27:09 - INFO - __main__ - Step 22887: {'lr': 0.00047583028226078734, 'samples': 4394304, 'steps': 22886, 'loss/train': 1.0524832010269165} -11/07/2021 00:27:10 - INFO - __main__ - Step 22888: {'lr': 0.0004758280058025274, 'samples': 4394496, 'steps': 22887, 'loss/train': 0.9584725499153137} -11/07/2021 00:27:10 - INFO - __main__ - Step 22889: {'lr': 0.00047582572924251276, 'samples': 4394688, 'steps': 22888, 'loss/train': 1.4555813074111938} -11/07/2021 00:27:11 - INFO - __main__ - Step 22890: {'lr': 0.00047582345258074453, 'samples': 4394880, 'steps': 22889, 'loss/train': 1.5769598484039307} -11/07/2021 00:27:11 - INFO - __main__ - Step 22891: {'lr': 0.0004758211758172238, 'samples': 4395072, 'steps': 22890, 'loss/train': 1.4620798826217651} -11/07/2021 00:27:11 - INFO - __main__ - Step 22892: {'lr': 0.00047581889895195154, 'samples': 4395264, 'steps': 22891, 'loss/train': 1.7565606832504272} -11/07/2021 00:27:13 - INFO - __main__ - Step 22893: {'lr': 0.00047581662198492873, 'samples': 4395456, 'steps': 22892, 'loss/train': 1.5614871978759766} -11/07/2021 00:27:13 - INFO - __main__ - Step 22894: {'lr': 0.0004758143449161565, 'samples': 4395648, 'steps': 22893, 'loss/train': 0.7110083103179932} -11/07/2021 00:27:13 - INFO - __main__ - Step 22895: {'lr': 0.00047581206774563575, 'samples': 4395840, 'steps': 22894, 'loss/train': 1.7186449766159058} -11/07/2021 00:27:14 - INFO - __main__ - Step 22896: {'lr': 0.0004758097904733676, 'samples': 4396032, 'steps': 22895, 'loss/train': 1.64580500125885} -11/07/2021 00:27:14 - INFO - __main__ - Step 22897: {'lr': 0.000475807513099353, 'samples': 4396224, 'steps': 22896, 'loss/train': 1.555309534072876} -11/07/2021 00:27:14 - INFO - __main__ - Step 22898: {'lr': 0.000475805235623593, 'samples': 4396416, 'steps': 22897, 'loss/train': 1.5211753845214844} -11/07/2021 00:27:15 - INFO - __main__ - Step 22899: {'lr': 0.0004758029580460887, 'samples': 4396608, 'steps': 22898, 'loss/train': 1.6425952911376953} -11/07/2021 00:27:16 - INFO - __main__ - Step 22900: {'lr': 0.0004758006803668411, 'samples': 4396800, 'steps': 22899, 'loss/train': 1.7011586427688599} -11/07/2021 00:27:16 - INFO - __main__ - Step 22901: {'lr': 0.0004757984025858511, 'samples': 4396992, 'steps': 22900, 'loss/train': 1.5620101690292358} -11/07/2021 00:27:16 - INFO - __main__ - Step 22902: {'lr': 0.0004757961247031199, 'samples': 4397184, 'steps': 22901, 'loss/train': 1.7332442998886108} -11/07/2021 00:27:17 - INFO - __main__ - Step 22903: {'lr': 0.00047579384671864845, 'samples': 4397376, 'steps': 22902, 'loss/train': 1.6374011039733887} -11/07/2021 00:27:18 - INFO - __main__ - Step 22904: {'lr': 0.0004757915686324377, 'samples': 4397568, 'steps': 22903, 'loss/train': 1.6759214401245117} -11/07/2021 00:27:18 - INFO - __main__ - Step 22905: {'lr': 0.00047578929044448883, 'samples': 4397760, 'steps': 22904, 'loss/train': 1.2218265533447266} -11/07/2021 00:27:18 - INFO - __main__ - Step 22906: {'lr': 0.0004757870121548028, 'samples': 4397952, 'steps': 22905, 'loss/train': 1.6508798599243164} -11/07/2021 00:27:19 - INFO - __main__ - Step 22907: {'lr': 0.0004757847337633806, 'samples': 4398144, 'steps': 22906, 'loss/train': 1.720141053199768} -11/07/2021 00:27:19 - INFO - __main__ - Step 22908: {'lr': 0.0004757824552702232, 'samples': 4398336, 'steps': 22907, 'loss/train': 0.8543339371681213} -11/07/2021 00:27:20 - INFO - __main__ - Step 22909: {'lr': 0.0004757801766753318, 'samples': 4398528, 'steps': 22908, 'loss/train': 1.0013171434402466} -11/07/2021 00:27:20 - INFO - __main__ - Step 22910: {'lr': 0.00047577789797870743, 'samples': 4398720, 'steps': 22909, 'loss/train': 1.8550013303756714} -11/07/2021 00:27:21 - INFO - __main__ - Step 22911: {'lr': 0.0004757756191803508, 'samples': 4398912, 'steps': 22910, 'loss/train': 0.7047666907310486} -11/07/2021 00:27:21 - INFO - __main__ - Step 22912: {'lr': 0.0004757733402802633, 'samples': 4399104, 'steps': 22911, 'loss/train': 1.7484979629516602} -11/07/2021 00:27:22 - INFO - __main__ - Step 22913: {'lr': 0.0004757710612784458, 'samples': 4399296, 'steps': 22912, 'loss/train': 1.82514488697052} -11/07/2021 00:27:23 - INFO - __main__ - Step 22914: {'lr': 0.0004757687821748994, 'samples': 4399488, 'steps': 22913, 'loss/train': 1.594335675239563} -11/07/2021 00:27:23 - INFO - __main__ - Step 22915: {'lr': 0.00047576650296962496, 'samples': 4399680, 'steps': 22914, 'loss/train': 1.4763436317443848} -11/07/2021 00:27:23 - INFO - __main__ - Step 22916: {'lr': 0.0004757642236626237, 'samples': 4399872, 'steps': 22915, 'loss/train': 1.4962226152420044} -11/07/2021 00:27:24 - INFO - __main__ - Step 22917: {'lr': 0.00047576194425389654, 'samples': 4400064, 'steps': 22916, 'loss/train': 1.6657871007919312} -11/07/2021 00:27:24 - INFO - __main__ - Step 22918: {'lr': 0.00047575966474344445, 'samples': 4400256, 'steps': 22917, 'loss/train': 1.158781886100769} -11/07/2021 00:27:25 - INFO - __main__ - Step 22919: {'lr': 0.00047575738513126867, 'samples': 4400448, 'steps': 22918, 'loss/train': 1.493218183517456} -11/07/2021 00:27:25 - INFO - __main__ - Step 22920: {'lr': 0.00047575510541737, 'samples': 4400640, 'steps': 22919, 'loss/train': 1.7854337692260742} -11/07/2021 00:27:26 - INFO - __main__ - Step 22921: {'lr': 0.0004757528256017496, 'samples': 4400832, 'steps': 22920, 'loss/train': 1.5265958309173584} -11/07/2021 00:27:26 - INFO - __main__ - Step 22922: {'lr': 0.00047575054568440846, 'samples': 4401024, 'steps': 22921, 'loss/train': 1.4380706548690796} -11/07/2021 00:27:26 - INFO - __main__ - Step 22923: {'lr': 0.00047574826566534764, 'samples': 4401216, 'steps': 22922, 'loss/train': 1.1648343801498413} -11/07/2021 00:27:27 - INFO - __main__ - Step 22924: {'lr': 0.0004757459855445681, 'samples': 4401408, 'steps': 22923, 'loss/train': 1.4443479776382446} -11/07/2021 00:27:28 - INFO - __main__ - Step 22925: {'lr': 0.0004757437053220709, 'samples': 4401600, 'steps': 22924, 'loss/train': 1.3270888328552246} -11/07/2021 00:27:28 - INFO - __main__ - Step 22926: {'lr': 0.0004757414249978571, 'samples': 4401792, 'steps': 22925, 'loss/train': 1.6503046751022339} -11/07/2021 00:27:29 - INFO - __main__ - Step 22927: {'lr': 0.0004757391445719277, 'samples': 4401984, 'steps': 22926, 'loss/train': 1.4672082662582397} -11/07/2021 00:27:29 - INFO - __main__ - Step 22928: {'lr': 0.00047573686404428365, 'samples': 4402176, 'steps': 22927, 'loss/train': 1.015838384628296} -11/07/2021 00:27:29 - INFO - __main__ - Step 22929: {'lr': 0.0004757345834149261, 'samples': 4402368, 'steps': 22928, 'loss/train': 1.3925256729125977} -11/07/2021 00:27:30 - INFO - __main__ - Step 22930: {'lr': 0.00047573230268385604, 'samples': 4402560, 'steps': 22929, 'loss/train': 1.4334114789962769} -11/07/2021 00:27:31 - INFO - __main__ - Step 22931: {'lr': 0.0004757300218510745, 'samples': 4402752, 'steps': 22930, 'loss/train': 1.7703146934509277} -11/07/2021 00:27:31 - INFO - __main__ - Step 22932: {'lr': 0.00047572774091658243, 'samples': 4402944, 'steps': 22931, 'loss/train': 1.6377800703048706} -11/07/2021 00:27:31 - INFO - __main__ - Step 22933: {'lr': 0.000475725459880381, 'samples': 4403136, 'steps': 22932, 'loss/train': 1.176165223121643} -11/07/2021 00:27:32 - INFO - __main__ - Step 22934: {'lr': 0.00047572317874247107, 'samples': 4403328, 'steps': 22933, 'loss/train': 1.5558907985687256} -11/07/2021 00:27:33 - INFO - __main__ - Step 22935: {'lr': 0.00047572089750285383, 'samples': 4403520, 'steps': 22934, 'loss/train': 2.0823795795440674} -11/07/2021 00:27:33 - INFO - __main__ - Step 22936: {'lr': 0.00047571861616153025, 'samples': 4403712, 'steps': 22935, 'loss/train': 0.2161761075258255} -11/07/2021 00:27:33 - INFO - __main__ - Step 22937: {'lr': 0.0004757163347185013, 'samples': 4403904, 'steps': 22936, 'loss/train': 1.6220515966415405} -11/07/2021 00:27:34 - INFO - __main__ - Step 22938: {'lr': 0.00047571405317376803, 'samples': 4404096, 'steps': 22937, 'loss/train': 1.4291313886642456} -11/07/2021 00:27:34 - INFO - __main__ - Step 22939: {'lr': 0.0004757117715273316, 'samples': 4404288, 'steps': 22938, 'loss/train': 1.6622034311294556} -11/07/2021 00:27:35 - INFO - __main__ - Step 22940: {'lr': 0.00047570948977919284, 'samples': 4404480, 'steps': 22939, 'loss/train': 1.4840724468231201} -11/07/2021 00:27:35 - INFO - __main__ - Step 22941: {'lr': 0.00047570720792935284, 'samples': 4404672, 'steps': 22940, 'loss/train': 1.6443581581115723} -11/07/2021 00:27:36 - INFO - __main__ - Step 22942: {'lr': 0.00047570492597781274, 'samples': 4404864, 'steps': 22941, 'loss/train': 1.1462692022323608} -11/07/2021 00:27:36 - INFO - __main__ - Step 22943: {'lr': 0.0004757026439245735, 'samples': 4405056, 'steps': 22942, 'loss/train': 1.5172832012176514} -11/07/2021 00:27:37 - INFO - __main__ - Step 22944: {'lr': 0.0004757003617696361, 'samples': 4405248, 'steps': 22943, 'loss/train': 1.5041968822479248} -11/07/2021 00:27:37 - INFO - __main__ - Step 22945: {'lr': 0.0004756980795130015, 'samples': 4405440, 'steps': 22944, 'loss/train': 1.511906623840332} -11/07/2021 00:27:38 - INFO - __main__ - Step 22946: {'lr': 0.00047569579715467093, 'samples': 4405632, 'steps': 22945, 'loss/train': 2.17930269241333} -11/07/2021 00:27:38 - INFO - __main__ - Step 22947: {'lr': 0.00047569351469464526, 'samples': 4405824, 'steps': 22946, 'loss/train': 1.2511581182479858} -11/07/2021 00:27:39 - INFO - __main__ - Step 22948: {'lr': 0.0004756912321329256, 'samples': 4406016, 'steps': 22947, 'loss/train': 1.4924403429031372} -11/07/2021 00:27:39 - INFO - __main__ - Step 22949: {'lr': 0.000475688949469513, 'samples': 4406208, 'steps': 22948, 'loss/train': 1.0683891773223877} -11/07/2021 00:27:41 - INFO - __main__ - Step 22950: {'lr': 0.0004756866667044084, 'samples': 4406400, 'steps': 22949, 'loss/train': 1.3111467361450195} -11/07/2021 00:27:41 - INFO - __main__ - Step 22951: {'lr': 0.0004756843838376128, 'samples': 4406592, 'steps': 22950, 'loss/train': 1.0856906175613403} -11/07/2021 00:27:41 - INFO - __main__ - Step 22952: {'lr': 0.0004756821008691274, 'samples': 4406784, 'steps': 22951, 'loss/train': 1.7769157886505127} -11/07/2021 00:27:42 - INFO - __main__ - Step 22953: {'lr': 0.0004756798177989531, 'samples': 4406976, 'steps': 22952, 'loss/train': 1.7058240175247192} -11/07/2021 00:27:42 - INFO - __main__ - Step 22954: {'lr': 0.00047567753462709095, 'samples': 4407168, 'steps': 22953, 'loss/train': 1.7961945533752441} -11/07/2021 00:27:42 - INFO - __main__ - Step 22955: {'lr': 0.00047567525135354193, 'samples': 4407360, 'steps': 22954, 'loss/train': 1.5496257543563843} -11/07/2021 00:27:43 - INFO - __main__ - Step 22956: {'lr': 0.00047567296797830727, 'samples': 4407552, 'steps': 22955, 'loss/train': 1.9372279644012451} -11/07/2021 00:27:44 - INFO - __main__ - Step 22957: {'lr': 0.00047567068450138773, 'samples': 4407744, 'steps': 22956, 'loss/train': 1.5832316875457764} -11/07/2021 00:27:44 - INFO - __main__ - Step 22958: {'lr': 0.0004756684009227845, 'samples': 4407936, 'steps': 22957, 'loss/train': 1.7091788053512573} -11/07/2021 00:27:44 - INFO - __main__ - Step 22959: {'lr': 0.0004756661172424986, 'samples': 4408128, 'steps': 22958, 'loss/train': 1.709111213684082} -11/07/2021 00:27:45 - INFO - __main__ - Step 22960: {'lr': 0.000475663833460531, 'samples': 4408320, 'steps': 22959, 'loss/train': 1.6512173414230347} -11/07/2021 00:27:45 - INFO - __main__ - Step 22961: {'lr': 0.00047566154957688275, 'samples': 4408512, 'steps': 22960, 'loss/train': 1.5914360284805298} -11/07/2021 00:27:46 - INFO - __main__ - Step 22962: {'lr': 0.0004756592655915549, 'samples': 4408704, 'steps': 22961, 'loss/train': 1.5957335233688354} -11/07/2021 00:27:47 - INFO - __main__ - Step 22963: {'lr': 0.00047565698150454845, 'samples': 4408896, 'steps': 22962, 'loss/train': 1.1223114728927612} -11/07/2021 00:27:47 - INFO - __main__ - Step 22964: {'lr': 0.0004756546973158644, 'samples': 4409088, 'steps': 22963, 'loss/train': 4.726345062255859} -11/07/2021 00:27:47 - INFO - __main__ - Step 22965: {'lr': 0.00047565241302550395, 'samples': 4409280, 'steps': 22964, 'loss/train': 0.8015714883804321} -11/07/2021 00:27:48 - INFO - __main__ - Step 22966: {'lr': 0.0004756501286334679, 'samples': 4409472, 'steps': 22965, 'loss/train': 1.7294597625732422} -11/07/2021 00:27:48 - INFO - __main__ - Step 22967: {'lr': 0.0004756478441397575, 'samples': 4409664, 'steps': 22966, 'loss/train': 1.8136224746704102} -11/07/2021 00:27:49 - INFO - __main__ - Step 22968: {'lr': 0.0004756455595443735, 'samples': 4409856, 'steps': 22967, 'loss/train': 1.3230981826782227} -11/07/2021 00:27:49 - INFO - __main__ - Step 22969: {'lr': 0.00047564327484731725, 'samples': 4410048, 'steps': 22968, 'loss/train': 2.6526639461517334} -11/07/2021 00:27:50 - INFO - __main__ - Step 22970: {'lr': 0.0004756409900485895, 'samples': 4410240, 'steps': 22969, 'loss/train': 1.852148413658142} -11/07/2021 00:27:50 - INFO - __main__ - Step 22971: {'lr': 0.00047563870514819154, 'samples': 4410432, 'steps': 22970, 'loss/train': 0.8799536824226379} -11/07/2021 00:27:50 - INFO - __main__ - Step 22972: {'lr': 0.0004756364201461241, 'samples': 4410624, 'steps': 22971, 'loss/train': 1.9788076877593994} -11/07/2021 00:27:51 - INFO - __main__ - Step 22973: {'lr': 0.00047563413504238847, 'samples': 4410816, 'steps': 22972, 'loss/train': 1.9070225954055786} -11/07/2021 00:27:52 - INFO - __main__ - Step 22974: {'lr': 0.0004756318498369855, 'samples': 4411008, 'steps': 22973, 'loss/train': 1.0210386514663696} -11/07/2021 00:27:52 - INFO - __main__ - Step 22975: {'lr': 0.0004756295645299164, 'samples': 4411200, 'steps': 22974, 'loss/train': 1.6513278484344482} -11/07/2021 00:27:52 - INFO - __main__ - Step 22976: {'lr': 0.00047562727912118206, 'samples': 4411392, 'steps': 22975, 'loss/train': 1.6678000688552856} -11/07/2021 00:27:53 - INFO - __main__ - Step 22977: {'lr': 0.00047562499361078356, 'samples': 4411584, 'steps': 22976, 'loss/train': 1.668380618095398} -11/07/2021 00:27:54 - INFO - __main__ - Step 22978: {'lr': 0.00047562270799872186, 'samples': 4411776, 'steps': 22977, 'loss/train': 2.0028698444366455} -11/07/2021 00:27:54 - INFO - __main__ - Step 22979: {'lr': 0.00047562042228499815, 'samples': 4411968, 'steps': 22978, 'loss/train': 1.7901252508163452} -11/07/2021 00:27:55 - INFO - __main__ - Step 22980: {'lr': 0.00047561813646961325, 'samples': 4412160, 'steps': 22979, 'loss/train': 1.4079407453536987} -11/07/2021 00:27:55 - INFO - __main__ - Step 22981: {'lr': 0.0004756158505525684, 'samples': 4412352, 'steps': 22980, 'loss/train': 1.1839544773101807} -11/07/2021 00:27:55 - INFO - __main__ - Step 22982: {'lr': 0.0004756135645338644, 'samples': 4412544, 'steps': 22981, 'loss/train': 2.2274835109710693} -11/07/2021 00:27:56 - INFO - __main__ - Step 22983: {'lr': 0.00047561127841350256, 'samples': 4412736, 'steps': 22982, 'loss/train': 1.5764931440353394} -11/07/2021 00:27:57 - INFO - __main__ - Step 22984: {'lr': 0.0004756089921914837, 'samples': 4412928, 'steps': 22983, 'loss/train': 1.4414703845977783} -11/07/2021 00:27:57 - INFO - __main__ - Step 22985: {'lr': 0.00047560670586780886, 'samples': 4413120, 'steps': 22984, 'loss/train': 1.398228645324707} -11/07/2021 00:27:57 - INFO - __main__ - Step 22986: {'lr': 0.0004756044194424792, 'samples': 4413312, 'steps': 22985, 'loss/train': 1.8721942901611328} -11/07/2021 00:27:58 - INFO - __main__ - Step 22987: {'lr': 0.0004756021329154956, 'samples': 4413504, 'steps': 22986, 'loss/train': 1.572609305381775} -11/07/2021 00:27:59 - INFO - __main__ - Step 22988: {'lr': 0.0004755998462868592, 'samples': 4413696, 'steps': 22987, 'loss/train': 1.766256332397461} -11/07/2021 00:27:59 - INFO - __main__ - Step 22989: {'lr': 0.00047559755955657097, 'samples': 4413888, 'steps': 22988, 'loss/train': 1.8802845478057861} -11/07/2021 00:27:59 - INFO - __main__ - Step 22990: {'lr': 0.000475595272724632, 'samples': 4414080, 'steps': 22989, 'loss/train': 1.8309953212738037} -11/07/2021 00:28:00 - INFO - __main__ - Step 22991: {'lr': 0.00047559298579104325, 'samples': 4414272, 'steps': 22990, 'loss/train': 1.2643400430679321} -11/07/2021 00:28:00 - INFO - __main__ - Step 22992: {'lr': 0.00047559069875580573, 'samples': 4414464, 'steps': 22991, 'loss/train': 1.68605637550354} -11/07/2021 00:28:01 - INFO - __main__ - Step 22993: {'lr': 0.00047558841161892063, 'samples': 4414656, 'steps': 22992, 'loss/train': 1.7791119813919067} -11/07/2021 00:28:01 - INFO - __main__ - Step 22994: {'lr': 0.00047558612438038887, 'samples': 4414848, 'steps': 22993, 'loss/train': 1.7085627317428589} -11/07/2021 00:28:02 - INFO - __main__ - Step 22995: {'lr': 0.00047558383704021136, 'samples': 4415040, 'steps': 22994, 'loss/train': 0.6871132850646973} -11/07/2021 00:28:02 - INFO - __main__ - Step 22996: {'lr': 0.00047558154959838935, 'samples': 4415232, 'steps': 22995, 'loss/train': 2.3702433109283447} -11/07/2021 00:28:03 - INFO - __main__ - Step 22997: {'lr': 0.0004755792620549237, 'samples': 4415424, 'steps': 22996, 'loss/train': 1.5503305196762085} -11/07/2021 00:28:03 - INFO - __main__ - Step 22998: {'lr': 0.0004755769744098156, 'samples': 4415616, 'steps': 22997, 'loss/train': 1.6456409692764282} -11/07/2021 00:28:03 - INFO - __main__ - Step 22999: {'lr': 0.00047557468666306596, 'samples': 4415808, 'steps': 22998, 'loss/train': 1.2864354848861694} -11/07/2021 00:28:04 - INFO - __main__ - Step 23000: {'lr': 0.00047557239881467584, 'samples': 4416000, 'steps': 22999, 'loss/train': 1.4137681722640991} -11/07/2021 00:28:05 - INFO - __main__ - Step 23001: {'lr': 0.0004755701108646463, 'samples': 4416192, 'steps': 23000, 'loss/train': 1.6158024072647095} -11/07/2021 00:28:05 - INFO - __main__ - Step 23002: {'lr': 0.0004755678228129784, 'samples': 4416384, 'steps': 23001, 'loss/train': 0.7091558575630188} -11/07/2021 00:28:05 - INFO - __main__ - Step 23003: {'lr': 0.000475565534659673, 'samples': 4416576, 'steps': 23002, 'loss/train': 1.7442548274993896} -11/07/2021 00:28:06 - INFO - __main__ - Step 23004: {'lr': 0.00047556324640473134, 'samples': 4416768, 'steps': 23003, 'loss/train': 1.8332017660140991} -11/07/2021 00:28:07 - INFO - __main__ - Step 23005: {'lr': 0.0004755609580481543, 'samples': 4416960, 'steps': 23004, 'loss/train': 1.8451040983200073} -11/07/2021 00:28:07 - INFO - __main__ - Step 23006: {'lr': 0.00047555866958994296, 'samples': 4417152, 'steps': 23005, 'loss/train': 1.5475908517837524} -11/07/2021 00:28:07 - INFO - __main__ - Step 23007: {'lr': 0.00047555638103009845, 'samples': 4417344, 'steps': 23006, 'loss/train': 1.035109519958496} -11/07/2021 00:28:08 - INFO - __main__ - Step 23008: {'lr': 0.0004755540923686217, 'samples': 4417536, 'steps': 23007, 'loss/train': 1.5133399963378906} -11/07/2021 00:28:08 - INFO - __main__ - Step 23009: {'lr': 0.0004755518036055137, 'samples': 4417728, 'steps': 23008, 'loss/train': 1.625259280204773} -11/07/2021 00:28:09 - INFO - __main__ - Step 23010: {'lr': 0.0004755495147407756, 'samples': 4417920, 'steps': 23009, 'loss/train': 1.5169017314910889} -11/07/2021 00:28:09 - INFO - __main__ - Step 23011: {'lr': 0.00047554722577440833, 'samples': 4418112, 'steps': 23010, 'loss/train': 1.5681982040405273} -11/07/2021 00:28:10 - INFO - __main__ - Step 23012: {'lr': 0.00047554493670641296, 'samples': 4418304, 'steps': 23011, 'loss/train': 0.36354389786720276} -11/07/2021 00:28:10 - INFO - __main__ - Step 23013: {'lr': 0.0004755426475367905, 'samples': 4418496, 'steps': 23012, 'loss/train': 1.3803929090499878} -11/07/2021 00:28:11 - INFO - __main__ - Step 23014: {'lr': 0.00047554035826554206, 'samples': 4418688, 'steps': 23013, 'loss/train': 1.3115521669387817} -11/07/2021 00:28:12 - INFO - __main__ - Step 23015: {'lr': 0.0004755380688926686, 'samples': 4418880, 'steps': 23014, 'loss/train': 1.7398924827575684} -11/07/2021 00:28:12 - INFO - __main__ - Step 23016: {'lr': 0.00047553577941817114, 'samples': 4419072, 'steps': 23015, 'loss/train': 1.7361851930618286} -11/07/2021 00:28:12 - INFO - __main__ - Step 23017: {'lr': 0.0004755334898420507, 'samples': 4419264, 'steps': 23016, 'loss/train': 1.8983994722366333} -11/07/2021 00:28:13 - INFO - __main__ - Step 23018: {'lr': 0.00047553120016430837, 'samples': 4419456, 'steps': 23017, 'loss/train': 1.3933513164520264} -11/07/2021 00:28:13 - INFO - __main__ - Step 23019: {'lr': 0.0004755289103849453, 'samples': 4419648, 'steps': 23018, 'loss/train': 1.5074931383132935} -11/07/2021 00:28:14 - INFO - __main__ - Step 23020: {'lr': 0.0004755266205039622, 'samples': 4419840, 'steps': 23019, 'loss/train': 1.4028873443603516} -11/07/2021 00:28:14 - INFO - __main__ - Step 23021: {'lr': 0.00047552433052136034, 'samples': 4420032, 'steps': 23020, 'loss/train': 1.6080424785614014} -11/07/2021 00:28:15 - INFO - __main__ - Step 23022: {'lr': 0.00047552204043714076, 'samples': 4420224, 'steps': 23021, 'loss/train': 1.7918477058410645} -11/07/2021 00:28:15 - INFO - __main__ - Step 23023: {'lr': 0.0004755197502513043, 'samples': 4420416, 'steps': 23022, 'loss/train': 1.549143671989441} -11/07/2021 00:28:15 - INFO - __main__ - Step 23024: {'lr': 0.00047551745996385233, 'samples': 4420608, 'steps': 23023, 'loss/train': 1.5438201427459717} -11/07/2021 00:28:16 - INFO - __main__ - Step 23025: {'lr': 0.00047551516957478545, 'samples': 4420800, 'steps': 23024, 'loss/train': 1.6900150775909424} -11/07/2021 00:28:17 - INFO - __main__ - Step 23026: {'lr': 0.0004755128790841051, 'samples': 4420992, 'steps': 23025, 'loss/train': 1.6069121360778809} -11/07/2021 00:28:17 - INFO - __main__ - Step 23027: {'lr': 0.000475510588491812, 'samples': 4421184, 'steps': 23026, 'loss/train': 2.0397226810455322} -11/07/2021 00:28:18 - INFO - __main__ - Step 23028: {'lr': 0.00047550829779790735, 'samples': 4421376, 'steps': 23027, 'loss/train': 1.342384934425354} -11/07/2021 00:28:18 - INFO - __main__ - Step 23029: {'lr': 0.0004755060070023921, 'samples': 4421568, 'steps': 23028, 'loss/train': 0.19474640488624573} -11/07/2021 00:28:18 - INFO - __main__ - Step 23030: {'lr': 0.0004755037161052674, 'samples': 4421760, 'steps': 23029, 'loss/train': 1.7647830247879028} -11/07/2021 00:28:19 - INFO - __main__ - Step 23031: {'lr': 0.00047550142510653415, 'samples': 4421952, 'steps': 23030, 'loss/train': 2.4951038360595703} -11/07/2021 00:28:20 - INFO - __main__ - Step 23032: {'lr': 0.0004754991340061935, 'samples': 4422144, 'steps': 23031, 'loss/train': 0.8009241223335266} -11/07/2021 00:28:20 - INFO - __main__ - Step 23033: {'lr': 0.0004754968428042463, 'samples': 4422336, 'steps': 23032, 'loss/train': 1.189576268196106} -11/07/2021 00:28:20 - INFO - __main__ - Step 23034: {'lr': 0.0004754945515006938, 'samples': 4422528, 'steps': 23033, 'loss/train': 1.348042368888855} -11/07/2021 00:28:21 - INFO - __main__ - Step 23035: {'lr': 0.0004754922600955369, 'samples': 4422720, 'steps': 23034, 'loss/train': 2.0349338054656982} -11/07/2021 00:28:22 - INFO - __main__ - Step 23036: {'lr': 0.0004754899685887767, 'samples': 4422912, 'steps': 23035, 'loss/train': 1.6004425287246704} -11/07/2021 00:28:22 - INFO - __main__ - Step 23037: {'lr': 0.0004754876769804142, 'samples': 4423104, 'steps': 23036, 'loss/train': 1.6580665111541748} -11/07/2021 00:28:23 - INFO - __main__ - Step 23038: {'lr': 0.00047548538527045035, 'samples': 4423296, 'steps': 23037, 'loss/train': 1.2863857746124268} -11/07/2021 00:28:23 - INFO - __main__ - Step 23039: {'lr': 0.00047548309345888637, 'samples': 4423488, 'steps': 23038, 'loss/train': 0.8549371957778931} -11/07/2021 00:28:23 - INFO - __main__ - Step 23040: {'lr': 0.00047548080154572315, 'samples': 4423680, 'steps': 23039, 'loss/train': 1.5918457508087158} -11/07/2021 00:28:24 - INFO - __main__ - Step 23041: {'lr': 0.00047547850953096174, 'samples': 4423872, 'steps': 23040, 'loss/train': 1.4698606729507446} -11/07/2021 00:28:24 - INFO - __main__ - Step 23042: {'lr': 0.0004754762174146032, 'samples': 4424064, 'steps': 23041, 'loss/train': 1.841143012046814} -11/07/2021 00:28:25 - INFO - __main__ - Step 23043: {'lr': 0.00047547392519664853, 'samples': 4424256, 'steps': 23042, 'loss/train': 1.5102839469909668} -11/07/2021 00:28:26 - INFO - __main__ - Step 23044: {'lr': 0.0004754716328770988, 'samples': 4424448, 'steps': 23043, 'loss/train': 2.0320229530334473} -11/07/2021 00:28:26 - INFO - __main__ - Step 23045: {'lr': 0.00047546934045595516, 'samples': 4424640, 'steps': 23044, 'loss/train': 1.711830973625183} -11/07/2021 00:28:26 - INFO - __main__ - Step 23046: {'lr': 0.00047546704793321835, 'samples': 4424832, 'steps': 23045, 'loss/train': 1.5525362491607666} -11/07/2021 00:28:27 - INFO - __main__ - Step 23047: {'lr': 0.0004754647553088896, 'samples': 4425024, 'steps': 23046, 'loss/train': 1.7210502624511719} -11/07/2021 00:28:28 - INFO - __main__ - Step 23048: {'lr': 0.00047546246258297, 'samples': 4425216, 'steps': 23047, 'loss/train': 2.0603466033935547} -11/07/2021 00:28:28 - INFO - __main__ - Step 23049: {'lr': 0.00047546016975546037, 'samples': 4425408, 'steps': 23048, 'loss/train': 1.2670799493789673} -11/07/2021 00:28:28 - INFO - __main__ - Step 23050: {'lr': 0.00047545787682636194, 'samples': 4425600, 'steps': 23049, 'loss/train': 1.3632519245147705} -11/07/2021 00:28:29 - INFO - __main__ - Step 23051: {'lr': 0.00047545558379567565, 'samples': 4425792, 'steps': 23050, 'loss/train': 1.7283782958984375} -11/07/2021 00:28:29 - INFO - __main__ - Step 23052: {'lr': 0.00047545329066340256, 'samples': 4425984, 'steps': 23051, 'loss/train': 1.7790948152542114} -11/07/2021 00:28:30 - INFO - __main__ - Step 23053: {'lr': 0.00047545099742954367, 'samples': 4426176, 'steps': 23052, 'loss/train': 1.2009434700012207} -11/07/2021 00:28:31 - INFO - __main__ - Step 23054: {'lr': 0.0004754487040941001, 'samples': 4426368, 'steps': 23053, 'loss/train': 1.2071412801742554} -11/07/2021 00:28:31 - INFO - __main__ - Step 23055: {'lr': 0.0004754464106570727, 'samples': 4426560, 'steps': 23054, 'loss/train': 1.412814974784851} -11/07/2021 00:28:31 - INFO - __main__ - Step 23056: {'lr': 0.00047544411711846277, 'samples': 4426752, 'steps': 23055, 'loss/train': 1.5205636024475098} -11/07/2021 00:28:32 - INFO - __main__ - Step 23057: {'lr': 0.00047544182347827114, 'samples': 4426944, 'steps': 23056, 'loss/train': 1.6638517379760742} -11/07/2021 00:28:33 - INFO - __main__ - Step 23058: {'lr': 0.0004754395297364989, 'samples': 4427136, 'steps': 23057, 'loss/train': 1.645391821861267} -11/07/2021 00:28:33 - INFO - __main__ - Step 23059: {'lr': 0.0004754372358931471, 'samples': 4427328, 'steps': 23058, 'loss/train': 1.6849995851516724} -11/07/2021 00:28:33 - INFO - __main__ - Step 23060: {'lr': 0.00047543494194821675, 'samples': 4427520, 'steps': 23059, 'loss/train': 1.4331011772155762} -11/07/2021 00:28:34 - INFO - __main__ - Step 23061: {'lr': 0.00047543264790170887, 'samples': 4427712, 'steps': 23060, 'loss/train': 2.1720664501190186} -11/07/2021 00:28:34 - INFO - __main__ - Step 23062: {'lr': 0.00047543035375362453, 'samples': 4427904, 'steps': 23061, 'loss/train': 1.5246973037719727} -11/07/2021 00:28:34 - INFO - __main__ - Step 23063: {'lr': 0.00047542805950396476, 'samples': 4428096, 'steps': 23062, 'loss/train': 1.4607219696044922} -11/07/2021 00:28:35 - INFO - __main__ - Step 23064: {'lr': 0.00047542576515273064, 'samples': 4428288, 'steps': 23063, 'loss/train': 1.9518522024154663} -11/07/2021 00:28:36 - INFO - __main__ - Step 23065: {'lr': 0.0004754234706999231, 'samples': 4428480, 'steps': 23064, 'loss/train': 1.777788758277893} -11/07/2021 00:28:36 - INFO - __main__ - Step 23066: {'lr': 0.0004754211761455432, 'samples': 4428672, 'steps': 23065, 'loss/train': 1.6558383703231812} -11/07/2021 00:28:36 - INFO - __main__ - Step 23067: {'lr': 0.000475418881489592, 'samples': 4428864, 'steps': 23066, 'loss/train': 1.926710605621338} -11/07/2021 00:28:37 - INFO - __main__ - Step 23068: {'lr': 0.0004754165867320706, 'samples': 4429056, 'steps': 23067, 'loss/train': 1.791853904724121} -11/07/2021 00:28:38 - INFO - __main__ - Step 23069: {'lr': 0.00047541429187297984, 'samples': 4429248, 'steps': 23068, 'loss/train': 1.4585204124450684} -11/07/2021 00:28:38 - INFO - __main__ - Step 23070: {'lr': 0.00047541199691232094, 'samples': 4429440, 'steps': 23069, 'loss/train': 1.8373855352401733} -11/07/2021 00:28:39 - INFO - __main__ - Step 23071: {'lr': 0.0004754097018500949, 'samples': 4429632, 'steps': 23070, 'loss/train': 1.821460247039795} -11/07/2021 00:28:39 - INFO - __main__ - Step 23072: {'lr': 0.0004754074066863027, 'samples': 4429824, 'steps': 23071, 'loss/train': 1.2372655868530273} -11/07/2021 00:28:39 - INFO - __main__ - Step 23073: {'lr': 0.0004754051114209454, 'samples': 4430016, 'steps': 23072, 'loss/train': 1.8181707859039307} -11/07/2021 00:28:40 - INFO - __main__ - Step 23074: {'lr': 0.0004754028160540241, 'samples': 4430208, 'steps': 23073, 'loss/train': 1.5179206132888794} -11/07/2021 00:28:41 - INFO - __main__ - Step 23075: {'lr': 0.0004754005205855397, 'samples': 4430400, 'steps': 23074, 'loss/train': 1.5440561771392822} -11/07/2021 00:28:41 - INFO - __main__ - Step 23076: {'lr': 0.0004753982250154933, 'samples': 4430592, 'steps': 23075, 'loss/train': 1.4330766201019287} -11/07/2021 00:28:41 - INFO - __main__ - Step 23077: {'lr': 0.00047539592934388596, 'samples': 4430784, 'steps': 23076, 'loss/train': 1.4417822360992432} -11/07/2021 00:28:42 - INFO - __main__ - Step 23078: {'lr': 0.0004753936335707187, 'samples': 4430976, 'steps': 23077, 'loss/train': 1.5473705530166626} -11/07/2021 00:28:43 - INFO - __main__ - Step 23079: {'lr': 0.0004753913376959925, 'samples': 4431168, 'steps': 23078, 'loss/train': 1.3038986921310425} -11/07/2021 00:28:43 - INFO - __main__ - Step 23080: {'lr': 0.00047538904171970847, 'samples': 4431360, 'steps': 23079, 'loss/train': 1.5698622465133667} -11/07/2021 00:28:43 - INFO - __main__ - Step 23081: {'lr': 0.0004753867456418677, 'samples': 4431552, 'steps': 23080, 'loss/train': 1.5879743099212646} -11/07/2021 00:28:44 - INFO - __main__ - Step 23082: {'lr': 0.000475384449462471, 'samples': 4431744, 'steps': 23081, 'loss/train': 1.3453717231750488} -11/07/2021 00:28:44 - INFO - __main__ - Step 23083: {'lr': 0.00047538215318151955, 'samples': 4431936, 'steps': 23082, 'loss/train': 1.4228205680847168} -11/07/2021 00:28:45 - INFO - __main__ - Step 23084: {'lr': 0.0004753798567990145, 'samples': 4432128, 'steps': 23083, 'loss/train': 1.6919718980789185} -11/07/2021 00:28:46 - INFO - __main__ - Step 23085: {'lr': 0.00047537756031495673, 'samples': 4432320, 'steps': 23084, 'loss/train': 1.6395727396011353} -11/07/2021 00:28:46 - INFO - __main__ - Step 23086: {'lr': 0.0004753752637293473, 'samples': 4432512, 'steps': 23085, 'loss/train': 1.7249788045883179} -11/07/2021 00:28:46 - INFO - __main__ - Step 23087: {'lr': 0.0004753729670421871, 'samples': 4432704, 'steps': 23086, 'loss/train': 1.9568339586257935} -11/07/2021 00:28:47 - INFO - __main__ - Step 23088: {'lr': 0.0004753706702534775, 'samples': 4432896, 'steps': 23087, 'loss/train': 1.488980770111084} -11/07/2021 00:28:48 - INFO - __main__ - Step 23089: {'lr': 0.0004753683733632193, 'samples': 4433088, 'steps': 23088, 'loss/train': 1.579067349433899} -11/07/2021 00:28:48 - INFO - __main__ - Step 23090: {'lr': 0.0004753660763714136, 'samples': 4433280, 'steps': 23089, 'loss/train': 2.105590581893921} -11/07/2021 00:28:48 - INFO - __main__ - Step 23091: {'lr': 0.00047536377927806143, 'samples': 4433472, 'steps': 23090, 'loss/train': 1.8617920875549316} -11/07/2021 00:28:49 - INFO - __main__ - Step 23092: {'lr': 0.0004753614820831638, 'samples': 4433664, 'steps': 23091, 'loss/train': 1.3575159311294556} -11/07/2021 00:28:49 - INFO - __main__ - Step 23093: {'lr': 0.0004753591847867218, 'samples': 4433856, 'steps': 23092, 'loss/train': 1.422724723815918} -11/07/2021 00:28:50 - INFO - __main__ - Step 23094: {'lr': 0.0004753568873887364, 'samples': 4434048, 'steps': 23093, 'loss/train': 1.7011767625808716} -11/07/2021 00:28:50 - INFO - __main__ - Step 23095: {'lr': 0.00047535458988920865, 'samples': 4434240, 'steps': 23094, 'loss/train': 1.6001523733139038} -11/07/2021 00:28:51 - INFO - __main__ - Step 23096: {'lr': 0.0004753522922881396, 'samples': 4434432, 'steps': 23095, 'loss/train': 1.5050978660583496} -11/07/2021 00:28:51 - INFO - __main__ - Step 23097: {'lr': 0.00047534999458553027, 'samples': 4434624, 'steps': 23096, 'loss/train': 1.705203652381897} -11/07/2021 00:28:51 - INFO - __main__ - Step 23098: {'lr': 0.00047534769678138177, 'samples': 4434816, 'steps': 23097, 'loss/train': 1.208935260772705} -11/07/2021 00:28:52 - INFO - __main__ - Step 23099: {'lr': 0.00047534539887569507, 'samples': 4435008, 'steps': 23098, 'loss/train': 1.8251349925994873} -11/07/2021 00:28:53 - INFO - __main__ - Step 23100: {'lr': 0.00047534310086847116, 'samples': 4435200, 'steps': 23099, 'loss/train': 1.7464089393615723} -11/07/2021 00:28:53 - INFO - __main__ - Step 23101: {'lr': 0.0004753408027597111, 'samples': 4435392, 'steps': 23100, 'loss/train': 1.768896460533142} -11/07/2021 00:28:54 - INFO - __main__ - Step 23102: {'lr': 0.0004753385045494161, 'samples': 4435584, 'steps': 23101, 'loss/train': 1.7746583223342896} -11/07/2021 00:28:54 - INFO - __main__ - Step 23103: {'lr': 0.0004753362062375869, 'samples': 4435776, 'steps': 23102, 'loss/train': 1.792876124382019} -11/07/2021 00:28:54 - INFO - __main__ - Step 23104: {'lr': 0.0004753339078242247, 'samples': 4435968, 'steps': 23103, 'loss/train': 1.5717073678970337} -11/07/2021 00:28:55 - INFO - __main__ - Step 23105: {'lr': 0.00047533160930933054, 'samples': 4436160, 'steps': 23104, 'loss/train': 1.265807032585144} -11/07/2021 00:28:56 - INFO - __main__ - Step 23106: {'lr': 0.00047532931069290546, 'samples': 4436352, 'steps': 23105, 'loss/train': 1.633703351020813} -11/07/2021 00:28:56 - INFO - __main__ - Step 23107: {'lr': 0.00047532701197495043, 'samples': 4436544, 'steps': 23106, 'loss/train': 1.6882529258728027} -11/07/2021 00:28:56 - INFO - __main__ - Step 23108: {'lr': 0.00047532471315546654, 'samples': 4436736, 'steps': 23107, 'loss/train': 1.3140676021575928} -11/07/2021 00:28:57 - INFO - __main__ - Step 23109: {'lr': 0.00047532241423445487, 'samples': 4436928, 'steps': 23108, 'loss/train': 1.6697815656661987} -11/07/2021 00:28:58 - INFO - __main__ - Step 23110: {'lr': 0.00047532011521191634, 'samples': 4437120, 'steps': 23109, 'loss/train': 1.6013033390045166} -11/07/2021 00:28:58 - INFO - __main__ - Step 23111: {'lr': 0.00047531781608785203, 'samples': 4437312, 'steps': 23110, 'loss/train': 1.1691371202468872} -11/07/2021 00:28:58 - INFO - __main__ - Step 23112: {'lr': 0.00047531551686226303, 'samples': 4437504, 'steps': 23111, 'loss/train': 1.359718918800354} -11/07/2021 00:28:59 - INFO - __main__ - Step 23113: {'lr': 0.00047531321753515026, 'samples': 4437696, 'steps': 23112, 'loss/train': 1.4464131593704224} -11/07/2021 00:28:59 - INFO - __main__ - Step 23114: {'lr': 0.0004753109181065149, 'samples': 4437888, 'steps': 23113, 'loss/train': 2.013803482055664} -11/07/2021 00:29:00 - INFO - __main__ - Step 23115: {'lr': 0.00047530861857635786, 'samples': 4438080, 'steps': 23114, 'loss/train': 2.0893020629882812} -11/07/2021 00:29:00 - INFO - __main__ - Step 23116: {'lr': 0.00047530631894468034, 'samples': 4438272, 'steps': 23115, 'loss/train': 1.3252930641174316} -11/07/2021 00:29:01 - INFO - __main__ - Step 23117: {'lr': 0.0004753040192114831, 'samples': 4438464, 'steps': 23116, 'loss/train': 1.6963107585906982} -11/07/2021 00:29:01 - INFO - __main__ - Step 23118: {'lr': 0.00047530171937676754, 'samples': 4438656, 'steps': 23117, 'loss/train': 1.0882844924926758} -11/07/2021 00:29:01 - INFO - __main__ - Step 23119: {'lr': 0.0004752994194405344, 'samples': 4438848, 'steps': 23118, 'loss/train': 1.5661946535110474} -11/07/2021 00:29:02 - INFO - __main__ - Step 23120: {'lr': 0.0004752971194027848, 'samples': 4439040, 'steps': 23119, 'loss/train': 1.7195779085159302} -11/07/2021 00:29:03 - INFO - __main__ - Step 23121: {'lr': 0.0004752948192635198, 'samples': 4439232, 'steps': 23120, 'loss/train': 0.6856600046157837} -11/07/2021 00:29:03 - INFO - __main__ - Step 23122: {'lr': 0.0004752925190227405, 'samples': 4439424, 'steps': 23121, 'loss/train': 0.4748719036579132} -11/07/2021 00:29:04 - INFO - __main__ - Step 23123: {'lr': 0.0004752902186804478, 'samples': 4439616, 'steps': 23122, 'loss/train': 1.5372296571731567} -11/07/2021 00:29:04 - INFO - __main__ - Step 23124: {'lr': 0.0004752879182366429, 'samples': 4439808, 'steps': 23123, 'loss/train': 1.7153961658477783} -11/07/2021 00:29:04 - INFO - __main__ - Step 23125: {'lr': 0.0004752856176913266, 'samples': 4440000, 'steps': 23124, 'loss/train': 1.8751126527786255} -11/07/2021 00:29:06 - INFO - __main__ - Step 23126: {'lr': 0.0004752833170445001, 'samples': 4440192, 'steps': 23125, 'loss/train': 1.5678542852401733} -11/07/2021 00:29:06 - INFO - __main__ - Step 23127: {'lr': 0.0004752810162961645, 'samples': 4440384, 'steps': 23126, 'loss/train': 1.930989146232605} -11/07/2021 00:29:06 - INFO - __main__ - Step 23128: {'lr': 0.0004752787154463207, 'samples': 4440576, 'steps': 23127, 'loss/train': 1.4092589616775513} -11/07/2021 00:29:07 - INFO - __main__ - Step 23129: {'lr': 0.0004752764144949698, 'samples': 4440768, 'steps': 23128, 'loss/train': 1.5948010683059692} -11/07/2021 00:29:07 - INFO - __main__ - Step 23130: {'lr': 0.0004752741134421128, 'samples': 4440960, 'steps': 23129, 'loss/train': 1.9338881969451904} -11/07/2021 00:29:08 - INFO - __main__ - Step 23131: {'lr': 0.00047527181228775077, 'samples': 4441152, 'steps': 23130, 'loss/train': 1.63901948928833} -11/07/2021 00:29:08 - INFO - __main__ - Step 23132: {'lr': 0.0004752695110318848, 'samples': 4441344, 'steps': 23131, 'loss/train': 1.393159031867981} -11/07/2021 00:29:09 - INFO - __main__ - Step 23133: {'lr': 0.00047526720967451573, 'samples': 4441536, 'steps': 23132, 'loss/train': 1.695439100265503} -11/07/2021 00:29:09 - INFO - __main__ - Step 23134: {'lr': 0.0004752649082156448, 'samples': 4441728, 'steps': 23133, 'loss/train': 1.4486114978790283} -11/07/2021 00:29:09 - INFO - __main__ - Step 23135: {'lr': 0.00047526260665527306, 'samples': 4441920, 'steps': 23134, 'loss/train': 1.8586546182632446} -11/07/2021 00:29:11 - INFO - __main__ - Step 23136: {'lr': 0.0004752603049934014, 'samples': 4442112, 'steps': 23135, 'loss/train': 1.6190085411071777} -11/07/2021 00:29:11 - INFO - __main__ - Step 23137: {'lr': 0.0004752580032300309, 'samples': 4442304, 'steps': 23136, 'loss/train': 1.5549322366714478} -11/07/2021 00:29:11 - INFO - __main__ - Step 23138: {'lr': 0.0004752557013651626, 'samples': 4442496, 'steps': 23137, 'loss/train': 1.221572995185852} -11/07/2021 00:29:12 - INFO - __main__ - Step 23139: {'lr': 0.00047525339939879764, 'samples': 4442688, 'steps': 23138, 'loss/train': 1.486706018447876} -11/07/2021 00:29:12 - INFO - __main__ - Step 23140: {'lr': 0.0004752510973309369, 'samples': 4442880, 'steps': 23139, 'loss/train': 1.5068085193634033} -11/07/2021 00:29:13 - INFO - __main__ - Step 23141: {'lr': 0.00047524879516158155, 'samples': 4443072, 'steps': 23140, 'loss/train': 0.5440205931663513} -11/07/2021 00:29:13 - INFO - __main__ - Step 23142: {'lr': 0.00047524649289073254, 'samples': 4443264, 'steps': 23141, 'loss/train': 1.9470374584197998} -11/07/2021 00:29:14 - INFO - __main__ - Step 23143: {'lr': 0.00047524419051839093, 'samples': 4443456, 'steps': 23142, 'loss/train': 1.6084150075912476} -11/07/2021 00:29:14 - INFO - __main__ - Step 23144: {'lr': 0.00047524188804455776, 'samples': 4443648, 'steps': 23143, 'loss/train': 1.1105417013168335} -11/07/2021 00:29:14 - INFO - __main__ - Step 23145: {'lr': 0.0004752395854692341, 'samples': 4443840, 'steps': 23144, 'loss/train': 1.6613856554031372} -11/07/2021 00:29:16 - INFO - __main__ - Step 23146: {'lr': 0.0004752372827924209, 'samples': 4444032, 'steps': 23145, 'loss/train': 1.884938359260559} -11/07/2021 00:29:16 - INFO - __main__ - Step 23147: {'lr': 0.0004752349800141193, 'samples': 4444224, 'steps': 23146, 'loss/train': 1.2518686056137085} -11/07/2021 00:29:16 - INFO - __main__ - Step 23148: {'lr': 0.0004752326771343303, 'samples': 4444416, 'steps': 23147, 'loss/train': 2.7502472400665283} -11/07/2021 00:29:17 - INFO - __main__ - Step 23149: {'lr': 0.00047523037415305494, 'samples': 4444608, 'steps': 23148, 'loss/train': 1.4677647352218628} -11/07/2021 00:29:17 - INFO - __main__ - Step 23150: {'lr': 0.0004752280710702942, 'samples': 4444800, 'steps': 23149, 'loss/train': 1.722581148147583} -11/07/2021 00:29:18 - INFO - __main__ - Step 23151: {'lr': 0.0004752257678860492, 'samples': 4444992, 'steps': 23150, 'loss/train': 1.3895703554153442} -11/07/2021 00:29:18 - INFO - __main__ - Step 23152: {'lr': 0.00047522346460032093, 'samples': 4445184, 'steps': 23151, 'loss/train': 1.1857327222824097} -11/07/2021 00:29:19 - INFO - __main__ - Step 23153: {'lr': 0.0004752211612131104, 'samples': 4445376, 'steps': 23152, 'loss/train': 0.6896765828132629} -11/07/2021 00:29:19 - INFO - __main__ - Step 23154: {'lr': 0.00047521885772441874, 'samples': 4445568, 'steps': 23153, 'loss/train': 1.9018213748931885} -11/07/2021 00:29:19 - INFO - __main__ - Step 23155: {'lr': 0.00047521655413424705, 'samples': 4445760, 'steps': 23154, 'loss/train': 2.1501245498657227} -11/07/2021 00:29:20 - INFO - __main__ - Step 23156: {'lr': 0.0004752142504425961, 'samples': 4445952, 'steps': 23155, 'loss/train': 1.5948129892349243} -11/07/2021 00:29:21 - INFO - __main__ - Step 23157: {'lr': 0.0004752119466494671, 'samples': 4446144, 'steps': 23156, 'loss/train': 1.9892706871032715} -11/07/2021 00:29:21 - INFO - __main__ - Step 23158: {'lr': 0.0004752096427548611, 'samples': 4446336, 'steps': 23157, 'loss/train': 1.5363296270370483} -11/07/2021 00:29:21 - INFO - __main__ - Step 23159: {'lr': 0.00047520733875877906, 'samples': 4446528, 'steps': 23158, 'loss/train': 1.5002020597457886} -11/07/2021 00:29:22 - INFO - __main__ - Step 23160: {'lr': 0.00047520503466122216, 'samples': 4446720, 'steps': 23159, 'loss/train': 1.7415108680725098} -11/07/2021 00:29:22 - INFO - __main__ - Step 23161: {'lr': 0.0004752027304621913, 'samples': 4446912, 'steps': 23160, 'loss/train': 0.3823089003562927} -11/07/2021 00:29:23 - INFO - __main__ - Step 23162: {'lr': 0.0004752004261616876, 'samples': 4447104, 'steps': 23161, 'loss/train': 1.2418301105499268} -11/07/2021 00:29:23 - INFO - __main__ - Step 23163: {'lr': 0.000475198121759712, 'samples': 4447296, 'steps': 23162, 'loss/train': 1.2378976345062256} -11/07/2021 00:29:24 - INFO - __main__ - Step 23164: {'lr': 0.0004751958172562656, 'samples': 4447488, 'steps': 23163, 'loss/train': 1.4196279048919678} -11/07/2021 00:29:24 - INFO - __main__ - Step 23165: {'lr': 0.00047519351265134954, 'samples': 4447680, 'steps': 23164, 'loss/train': 1.934503197669983} -11/07/2021 00:29:24 - INFO - __main__ - Step 23166: {'lr': 0.00047519120794496466, 'samples': 4447872, 'steps': 23165, 'loss/train': 1.7241228818893433} -11/07/2021 00:29:26 - INFO - __main__ - Step 23167: {'lr': 0.00047518890313711217, 'samples': 4448064, 'steps': 23166, 'loss/train': 1.5477992296218872} -11/07/2021 00:29:26 - INFO - __main__ - Step 23168: {'lr': 0.000475186598227793, 'samples': 4448256, 'steps': 23167, 'loss/train': 1.3837860822677612} -11/07/2021 00:29:26 - INFO - __main__ - Step 23169: {'lr': 0.0004751842932170082, 'samples': 4448448, 'steps': 23168, 'loss/train': 1.5913500785827637} -11/07/2021 00:29:27 - INFO - __main__ - Step 23170: {'lr': 0.00047518198810475885, 'samples': 4448640, 'steps': 23169, 'loss/train': 1.5390900373458862} -11/07/2021 00:29:27 - INFO - __main__ - Step 23171: {'lr': 0.00047517968289104596, 'samples': 4448832, 'steps': 23170, 'loss/train': 1.9195278882980347} -11/07/2021 00:29:28 - INFO - __main__ - Step 23172: {'lr': 0.0004751773775758706, 'samples': 4449024, 'steps': 23171, 'loss/train': 1.7877540588378906} -11/07/2021 00:29:28 - INFO - __main__ - Step 23173: {'lr': 0.00047517507215923376, 'samples': 4449216, 'steps': 23172, 'loss/train': 1.3253355026245117} -11/07/2021 00:29:29 - INFO - __main__ - Step 23174: {'lr': 0.00047517276664113653, 'samples': 4449408, 'steps': 23173, 'loss/train': 1.5295782089233398} -11/07/2021 00:29:29 - INFO - __main__ - Step 23175: {'lr': 0.0004751704610215799, 'samples': 4449600, 'steps': 23174, 'loss/train': 0.9073389172554016} -11/07/2021 00:29:29 - INFO - __main__ - Step 23176: {'lr': 0.000475168155300565, 'samples': 4449792, 'steps': 23175, 'loss/train': 1.260116696357727} -11/07/2021 00:29:30 - INFO - __main__ - Step 23177: {'lr': 0.00047516584947809274, 'samples': 4449984, 'steps': 23176, 'loss/train': 1.680338978767395} -11/07/2021 00:29:31 - INFO - __main__ - Step 23178: {'lr': 0.00047516354355416426, 'samples': 4450176, 'steps': 23177, 'loss/train': 1.5092757940292358} -11/07/2021 00:29:31 - INFO - __main__ - Step 23179: {'lr': 0.00047516123752878054, 'samples': 4450368, 'steps': 23178, 'loss/train': 1.9057352542877197} -11/07/2021 00:29:31 - INFO - __main__ - Step 23180: {'lr': 0.00047515893140194265, 'samples': 4450560, 'steps': 23179, 'loss/train': 1.6779406070709229} -11/07/2021 00:29:32 - INFO - __main__ - Step 23181: {'lr': 0.0004751566251736516, 'samples': 4450752, 'steps': 23180, 'loss/train': 1.547135591506958} -11/07/2021 00:29:33 - INFO - __main__ - Step 23182: {'lr': 0.00047515431884390845, 'samples': 4450944, 'steps': 23181, 'loss/train': 1.668994665145874} -11/07/2021 00:29:33 - INFO - __main__ - Step 23183: {'lr': 0.00047515201241271426, 'samples': 4451136, 'steps': 23182, 'loss/train': 2.094433307647705} -11/07/2021 00:29:34 - INFO - __main__ - Step 23184: {'lr': 0.00047514970588007007, 'samples': 4451328, 'steps': 23183, 'loss/train': 1.9435114860534668} -11/07/2021 00:29:34 - INFO - __main__ - Step 23185: {'lr': 0.0004751473992459768, 'samples': 4451520, 'steps': 23184, 'loss/train': 1.3332525491714478} -11/07/2021 00:29:34 - INFO - __main__ - Step 23186: {'lr': 0.0004751450925104357, 'samples': 4451712, 'steps': 23185, 'loss/train': 1.8284626007080078} -11/07/2021 00:29:35 - INFO - __main__ - Step 23187: {'lr': 0.00047514278567344765, 'samples': 4451904, 'steps': 23186, 'loss/train': 1.9439247846603394} -11/07/2021 00:29:36 - INFO - __main__ - Step 23188: {'lr': 0.00047514047873501374, 'samples': 4452096, 'steps': 23187, 'loss/train': 1.6083027124404907} -11/07/2021 00:29:36 - INFO - __main__ - Step 23189: {'lr': 0.000475138171695135, 'samples': 4452288, 'steps': 23188, 'loss/train': 2.0748753547668457} -11/07/2021 00:29:36 - INFO - __main__ - Step 23190: {'lr': 0.00047513586455381245, 'samples': 4452480, 'steps': 23189, 'loss/train': 1.4966256618499756} -11/07/2021 00:29:37 - INFO - __main__ - Step 23191: {'lr': 0.00047513355731104717, 'samples': 4452672, 'steps': 23190, 'loss/train': 1.6222933530807495} -11/07/2021 00:29:37 - INFO - __main__ - Step 23192: {'lr': 0.0004751312499668402, 'samples': 4452864, 'steps': 23191, 'loss/train': 0.9162195324897766} -11/07/2021 00:29:38 - INFO - __main__ - Step 23193: {'lr': 0.00047512894252119256, 'samples': 4453056, 'steps': 23192, 'loss/train': 1.50593101978302} -11/07/2021 00:29:38 - INFO - __main__ - Step 23194: {'lr': 0.0004751266349741053, 'samples': 4453248, 'steps': 23193, 'loss/train': 1.4306085109710693} -11/07/2021 00:29:39 - INFO - __main__ - Step 23195: {'lr': 0.0004751243273255794, 'samples': 4453440, 'steps': 23194, 'loss/train': 1.7216869592666626} -11/07/2021 00:29:39 - INFO - __main__ - Step 23196: {'lr': 0.000475122019575616, 'samples': 4453632, 'steps': 23195, 'loss/train': 1.568893313407898} -11/07/2021 00:29:39 - INFO - __main__ - Step 23197: {'lr': 0.0004751197117242161, 'samples': 4453824, 'steps': 23196, 'loss/train': 1.283979892730713} -11/07/2021 00:29:40 - INFO - __main__ - Step 23198: {'lr': 0.0004751174037713807, 'samples': 4454016, 'steps': 23197, 'loss/train': 1.5490138530731201} -11/07/2021 00:29:41 - INFO - __main__ - Step 23199: {'lr': 0.00047511509571711085, 'samples': 4454208, 'steps': 23198, 'loss/train': 1.2735344171524048} -11/07/2021 00:29:41 - INFO - __main__ - Step 23200: {'lr': 0.00047511278756140766, 'samples': 4454400, 'steps': 23199, 'loss/train': 1.056983232498169} -11/07/2021 00:29:41 - INFO - __main__ - Step 23201: {'lr': 0.00047511047930427216, 'samples': 4454592, 'steps': 23200, 'loss/train': 1.5129168033599854} -11/07/2021 00:29:42 - INFO - __main__ - Step 23202: {'lr': 0.00047510817094570526, 'samples': 4454784, 'steps': 23201, 'loss/train': 1.2528656721115112} -11/07/2021 00:29:43 - INFO - __main__ - Step 23203: {'lr': 0.00047510586248570815, 'samples': 4454976, 'steps': 23202, 'loss/train': 1.2748398780822754} -11/07/2021 00:29:43 - INFO - __main__ - Step 23204: {'lr': 0.00047510355392428176, 'samples': 4455168, 'steps': 23203, 'loss/train': 1.3079149723052979} -11/07/2021 00:29:44 - INFO - __main__ - Step 23205: {'lr': 0.00047510124526142723, 'samples': 4455360, 'steps': 23204, 'loss/train': 1.3610676527023315} -11/07/2021 00:29:44 - INFO - __main__ - Step 23206: {'lr': 0.00047509893649714554, 'samples': 4455552, 'steps': 23205, 'loss/train': 1.3533624410629272} -11/07/2021 00:29:44 - INFO - __main__ - Step 23207: {'lr': 0.00047509662763143775, 'samples': 4455744, 'steps': 23206, 'loss/train': 1.393203854560852} -11/07/2021 00:29:45 - INFO - __main__ - Step 23208: {'lr': 0.00047509431866430487, 'samples': 4455936, 'steps': 23207, 'loss/train': 1.4738633632659912} -11/07/2021 00:29:46 - INFO - __main__ - Step 23209: {'lr': 0.000475092009595748, 'samples': 4456128, 'steps': 23208, 'loss/train': 0.9779757857322693} -11/07/2021 00:29:46 - INFO - __main__ - Step 23210: {'lr': 0.0004750897004257681, 'samples': 4456320, 'steps': 23209, 'loss/train': 0.19317372143268585} -11/07/2021 00:29:46 - INFO - __main__ - Step 23211: {'lr': 0.0004750873911543663, 'samples': 4456512, 'steps': 23210, 'loss/train': 1.6986215114593506} -11/07/2021 00:29:47 - INFO - __main__ - Step 23212: {'lr': 0.00047508508178154354, 'samples': 4456704, 'steps': 23211, 'loss/train': 1.6802526712417603} -11/07/2021 00:29:48 - INFO - __main__ - Step 23213: {'lr': 0.00047508277230730095, 'samples': 4456896, 'steps': 23212, 'loss/train': 1.0024389028549194} -11/07/2021 00:29:48 - INFO - __main__ - Step 23214: {'lr': 0.00047508046273163953, 'samples': 4457088, 'steps': 23213, 'loss/train': 1.4807589054107666} -11/07/2021 00:29:49 - INFO - __main__ - Step 23215: {'lr': 0.0004750781530545603, 'samples': 4457280, 'steps': 23214, 'loss/train': 1.3570733070373535} -11/07/2021 00:29:49 - INFO - __main__ - Step 23216: {'lr': 0.0004750758432760644, 'samples': 4457472, 'steps': 23215, 'loss/train': 1.3327617645263672} -11/07/2021 00:29:49 - INFO - __main__ - Step 23217: {'lr': 0.0004750735333961527, 'samples': 4457664, 'steps': 23216, 'loss/train': 1.9167391061782837} -11/07/2021 00:29:50 - INFO - __main__ - Step 23218: {'lr': 0.00047507122341482644, 'samples': 4457856, 'steps': 23217, 'loss/train': 1.5629518032073975} -11/07/2021 00:29:51 - INFO - __main__ - Step 23219: {'lr': 0.00047506891333208654, 'samples': 4458048, 'steps': 23218, 'loss/train': 1.445533275604248} -11/07/2021 00:29:51 - INFO - __main__ - Step 23220: {'lr': 0.000475066603147934, 'samples': 4458240, 'steps': 23219, 'loss/train': 1.4702428579330444} -11/07/2021 00:29:51 - INFO - __main__ - Step 23221: {'lr': 0.00047506429286236997, 'samples': 4458432, 'steps': 23220, 'loss/train': 0.974677562713623} -11/07/2021 00:29:52 - INFO - __main__ - Step 23222: {'lr': 0.00047506198247539546, 'samples': 4458624, 'steps': 23221, 'loss/train': 2.327030658721924} -11/07/2021 00:29:52 - INFO - __main__ - Step 23223: {'lr': 0.0004750596719870114, 'samples': 4458816, 'steps': 23222, 'loss/train': 1.695296287536621} -11/07/2021 00:29:53 - INFO - __main__ - Step 23224: {'lr': 0.000475057361397219, 'samples': 4459008, 'steps': 23223, 'loss/train': 1.4242885112762451} -11/07/2021 00:29:53 - INFO - __main__ - Step 23225: {'lr': 0.0004750550507060192, 'samples': 4459200, 'steps': 23224, 'loss/train': 1.8439444303512573} -11/07/2021 00:29:54 - INFO - __main__ - Step 23226: {'lr': 0.0004750527399134131, 'samples': 4459392, 'steps': 23225, 'loss/train': 1.62975013256073} -11/07/2021 00:29:54 - INFO - __main__ - Step 23227: {'lr': 0.00047505042901940163, 'samples': 4459584, 'steps': 23226, 'loss/train': 0.7999213933944702} -11/07/2021 00:29:55 - INFO - __main__ - Step 23228: {'lr': 0.00047504811802398603, 'samples': 4459776, 'steps': 23227, 'loss/train': 0.9568268656730652} -11/07/2021 00:29:56 - INFO - __main__ - Step 23229: {'lr': 0.0004750458069271671, 'samples': 4459968, 'steps': 23228, 'loss/train': 1.195821762084961} -11/07/2021 00:29:56 - INFO - __main__ - Step 23230: {'lr': 0.0004750434957289461, 'samples': 4460160, 'steps': 23229, 'loss/train': 1.61564040184021} -11/07/2021 00:29:56 - INFO - __main__ - Step 23231: {'lr': 0.0004750411844293239, 'samples': 4460352, 'steps': 23230, 'loss/train': 1.6031367778778076} -11/07/2021 00:29:57 - INFO - __main__ - Step 23232: {'lr': 0.0004750388730283016, 'samples': 4460544, 'steps': 23231, 'loss/train': 1.7405587434768677} -11/07/2021 00:29:57 - INFO - __main__ - Step 23233: {'lr': 0.0004750365615258804, 'samples': 4460736, 'steps': 23232, 'loss/train': 1.6886457204818726} -11/07/2021 00:29:58 - INFO - __main__ - Step 23234: {'lr': 0.00047503424992206107, 'samples': 4460928, 'steps': 23233, 'loss/train': 1.7403072118759155} -11/07/2021 00:29:59 - INFO - __main__ - Step 23235: {'lr': 0.00047503193821684476, 'samples': 4461120, 'steps': 23234, 'loss/train': 1.0748543739318848} -11/07/2021 00:29:59 - INFO - __main__ - Step 23236: {'lr': 0.0004750296264102326, 'samples': 4461312, 'steps': 23235, 'loss/train': 0.7899654507637024} -11/07/2021 00:29:59 - INFO - __main__ - Step 23237: {'lr': 0.0004750273145022256, 'samples': 4461504, 'steps': 23236, 'loss/train': 1.9232375621795654} -11/07/2021 00:30:00 - INFO - __main__ - Step 23238: {'lr': 0.00047502500249282464, 'samples': 4461696, 'steps': 23237, 'loss/train': 2.210071563720703} -11/07/2021 00:30:00 - INFO - __main__ - Step 23239: {'lr': 0.000475022690382031, 'samples': 4461888, 'steps': 23238, 'loss/train': 1.4127061367034912} -11/07/2021 00:30:01 - INFO - __main__ - Step 23240: {'lr': 0.0004750203781698456, 'samples': 4462080, 'steps': 23239, 'loss/train': 1.924795150756836} -11/07/2021 00:30:02 - INFO - __main__ - Step 23241: {'lr': 0.0004750180658562694, 'samples': 4462272, 'steps': 23240, 'loss/train': 1.7388290166854858} -11/07/2021 00:30:02 - INFO - __main__ - Step 23242: {'lr': 0.00047501575344130356, 'samples': 4462464, 'steps': 23241, 'loss/train': 1.7781851291656494} -11/07/2021 00:30:02 - INFO - __main__ - Step 23243: {'lr': 0.00047501344092494915, 'samples': 4462656, 'steps': 23242, 'loss/train': 1.8841161727905273} -11/07/2021 00:30:03 - INFO - __main__ - Step 23244: {'lr': 0.0004750111283072071, 'samples': 4462848, 'steps': 23243, 'loss/train': 1.3987021446228027} -11/07/2021 00:30:04 - INFO - __main__ - Step 23245: {'lr': 0.00047500881558807854, 'samples': 4463040, 'steps': 23244, 'loss/train': 1.4467869997024536} -11/07/2021 00:30:04 - INFO - __main__ - Step 23246: {'lr': 0.00047500650276756455, 'samples': 4463232, 'steps': 23245, 'loss/train': 1.4589742422103882} -11/07/2021 00:30:04 - INFO - __main__ - Step 23247: {'lr': 0.00047500418984566594, 'samples': 4463424, 'steps': 23246, 'loss/train': 1.8420617580413818} -11/07/2021 00:30:05 - INFO - __main__ - Step 23248: {'lr': 0.000475001876822384, 'samples': 4463616, 'steps': 23247, 'loss/train': 1.821009635925293} -11/07/2021 00:30:05 - INFO - __main__ - Step 23249: {'lr': 0.00047499956369771967, 'samples': 4463808, 'steps': 23248, 'loss/train': 1.7371834516525269} -11/07/2021 00:30:06 - INFO - __main__ - Step 23250: {'lr': 0.00047499725047167406, 'samples': 4464000, 'steps': 23249, 'loss/train': 1.7576009035110474} -11/07/2021 00:30:06 - INFO - __main__ - Step 23251: {'lr': 0.0004749949371442481, 'samples': 4464192, 'steps': 23250, 'loss/train': 1.6941187381744385} -11/07/2021 00:30:07 - INFO - __main__ - Step 23252: {'lr': 0.00047499262371544294, 'samples': 4464384, 'steps': 23251, 'loss/train': 1.533231496810913} -11/07/2021 00:30:07 - INFO - __main__ - Step 23253: {'lr': 0.00047499031018525953, 'samples': 4464576, 'steps': 23252, 'loss/train': 0.6648880839347839} -11/07/2021 00:30:07 - INFO - __main__ - Step 23254: {'lr': 0.00047498799655369895, 'samples': 4464768, 'steps': 23253, 'loss/train': 1.6462962627410889} -11/07/2021 00:30:08 - INFO - __main__ - Step 23255: {'lr': 0.0004749856828207623, 'samples': 4464960, 'steps': 23254, 'loss/train': 2.133352041244507} -11/07/2021 00:30:09 - INFO - __main__ - Step 23256: {'lr': 0.00047498336898645055, 'samples': 4465152, 'steps': 23255, 'loss/train': 1.3252581357955933} -11/07/2021 00:30:09 - INFO - __main__ - Step 23257: {'lr': 0.00047498105505076475, 'samples': 4465344, 'steps': 23256, 'loss/train': 1.2903780937194824} -11/07/2021 00:30:09 - INFO - __main__ - Step 23258: {'lr': 0.000474978741013706, 'samples': 4465536, 'steps': 23257, 'loss/train': 1.5443459749221802} -11/07/2021 00:30:10 - INFO - __main__ - Step 23259: {'lr': 0.0004749764268752753, 'samples': 4465728, 'steps': 23258, 'loss/train': 1.795452356338501} -11/07/2021 00:30:10 - INFO - __main__ - Step 23260: {'lr': 0.0004749741126354736, 'samples': 4465920, 'steps': 23259, 'loss/train': 1.6947624683380127} -11/07/2021 00:30:11 - INFO - __main__ - Step 23261: {'lr': 0.00047497179829430217, 'samples': 4466112, 'steps': 23260, 'loss/train': 1.524401307106018} -11/07/2021 00:30:11 - INFO - __main__ - Step 23262: {'lr': 0.0004749694838517619, 'samples': 4466304, 'steps': 23261, 'loss/train': 1.6715247631072998} -11/07/2021 00:30:12 - INFO - __main__ - Step 23263: {'lr': 0.0004749671693078538, 'samples': 4466496, 'steps': 23262, 'loss/train': 1.1825659275054932} -11/07/2021 00:30:12 - INFO - __main__ - Step 23264: {'lr': 0.00047496485466257896, 'samples': 4466688, 'steps': 23263, 'loss/train': 1.2815076112747192} -11/07/2021 00:30:13 - INFO - __main__ - Step 23265: {'lr': 0.0004749625399159384, 'samples': 4466880, 'steps': 23264, 'loss/train': 0.34565478563308716} -11/07/2021 00:30:14 - INFO - __main__ - Step 23266: {'lr': 0.0004749602250679332, 'samples': 4467072, 'steps': 23265, 'loss/train': 1.8178528547286987} -11/07/2021 00:30:14 - INFO - __main__ - Step 23267: {'lr': 0.00047495791011856447, 'samples': 4467264, 'steps': 23266, 'loss/train': 1.5307931900024414} -11/07/2021 00:30:14 - INFO - __main__ - Step 23268: {'lr': 0.00047495559506783317, 'samples': 4467456, 'steps': 23267, 'loss/train': 1.597183346748352} -11/07/2021 00:30:15 - INFO - __main__ - Step 23269: {'lr': 0.00047495327991574034, 'samples': 4467648, 'steps': 23268, 'loss/train': 1.6375641822814941} -11/07/2021 00:30:15 - INFO - __main__ - Step 23270: {'lr': 0.0004749509646622869, 'samples': 4467840, 'steps': 23269, 'loss/train': 2.025968551635742} -11/07/2021 00:30:16 - INFO - __main__ - Step 23271: {'lr': 0.00047494864930747415, 'samples': 4468032, 'steps': 23270, 'loss/train': 5.877805233001709} -11/07/2021 00:30:17 - INFO - __main__ - Step 23272: {'lr': 0.000474946333851303, 'samples': 4468224, 'steps': 23271, 'loss/train': 0.9324080348014832} -11/07/2021 00:30:17 - INFO - __main__ - Step 23273: {'lr': 0.0004749440182937745, 'samples': 4468416, 'steps': 23272, 'loss/train': 1.8106902837753296} -11/07/2021 00:30:17 - INFO - __main__ - Step 23274: {'lr': 0.0004749417026348897, 'samples': 4468608, 'steps': 23273, 'loss/train': 1.6376235485076904} -11/07/2021 00:30:18 - INFO - __main__ - Step 23275: {'lr': 0.0004749393868746497, 'samples': 4468800, 'steps': 23274, 'loss/train': 1.6495087146759033} -11/07/2021 00:30:18 - INFO - __main__ - Step 23276: {'lr': 0.0004749370710130554, 'samples': 4468992, 'steps': 23275, 'loss/train': 2.2123794555664062} -11/07/2021 00:30:19 - INFO - __main__ - Step 23277: {'lr': 0.00047493475505010793, 'samples': 4469184, 'steps': 23276, 'loss/train': 0.2711905539035797} -11/07/2021 00:30:19 - INFO - __main__ - Step 23278: {'lr': 0.0004749324389858083, 'samples': 4469376, 'steps': 23277, 'loss/train': 1.7561227083206177} -11/07/2021 00:30:20 - INFO - __main__ - Step 23279: {'lr': 0.00047493012282015767, 'samples': 4469568, 'steps': 23278, 'loss/train': 1.7865687608718872} -11/07/2021 00:30:20 - INFO - __main__ - Step 23280: {'lr': 0.00047492780655315693, 'samples': 4469760, 'steps': 23279, 'loss/train': 1.2692395448684692} -11/07/2021 00:30:20 - INFO - __main__ - Step 23281: {'lr': 0.00047492549018480725, 'samples': 4469952, 'steps': 23280, 'loss/train': 1.1253389120101929} -11/07/2021 00:30:21 - INFO - __main__ - Step 23282: {'lr': 0.00047492317371510955, 'samples': 4470144, 'steps': 23281, 'loss/train': 1.7119258642196655} -11/07/2021 00:30:22 - INFO - __main__ - Step 23283: {'lr': 0.00047492085714406497, 'samples': 4470336, 'steps': 23282, 'loss/train': 1.870627760887146} -11/07/2021 00:30:22 - INFO - __main__ - Step 23284: {'lr': 0.00047491854047167453, 'samples': 4470528, 'steps': 23283, 'loss/train': 1.5494314432144165} -11/07/2021 00:30:23 - INFO - __main__ - Step 23285: {'lr': 0.0004749162236979393, 'samples': 4470720, 'steps': 23284, 'loss/train': 1.2017252445220947} -11/07/2021 00:30:23 - INFO - __main__ - Step 23286: {'lr': 0.0004749139068228602, 'samples': 4470912, 'steps': 23285, 'loss/train': 1.548548698425293} -11/07/2021 00:30:24 - INFO - __main__ - Step 23287: {'lr': 0.00047491158984643846, 'samples': 4471104, 'steps': 23286, 'loss/train': 1.3301843404769897} -11/07/2021 00:30:24 - INFO - __main__ - Step 23288: {'lr': 0.0004749092727686749, 'samples': 4471296, 'steps': 23287, 'loss/train': 1.8255505561828613} -11/07/2021 00:30:25 - INFO - __main__ - Step 23289: {'lr': 0.00047490695558957083, 'samples': 4471488, 'steps': 23288, 'loss/train': 1.5257481336593628} -11/07/2021 00:30:25 - INFO - __main__ - Step 23290: {'lr': 0.00047490463830912713, 'samples': 4471680, 'steps': 23289, 'loss/train': 1.5626459121704102} -11/07/2021 00:30:26 - INFO - __main__ - Step 23291: {'lr': 0.0004749023209273448, 'samples': 4471872, 'steps': 23290, 'loss/train': 1.669747233390808} -11/07/2021 00:30:26 - INFO - __main__ - Step 23292: {'lr': 0.000474900003444225, 'samples': 4472064, 'steps': 23291, 'loss/train': 1.540729284286499} -11/07/2021 00:30:27 - INFO - __main__ - Step 23293: {'lr': 0.0004748976858597687, 'samples': 4472256, 'steps': 23292, 'loss/train': 1.4468985795974731} -11/07/2021 00:30:27 - INFO - __main__ - Step 23294: {'lr': 0.00047489536817397706, 'samples': 4472448, 'steps': 23293, 'loss/train': 1.6595637798309326} -11/07/2021 00:30:28 - INFO - __main__ - Step 23295: {'lr': 0.00047489305038685094, 'samples': 4472640, 'steps': 23294, 'loss/train': 1.4057589769363403} -11/07/2021 00:30:28 - INFO - __main__ - Step 23296: {'lr': 0.00047489073249839153, 'samples': 4472832, 'steps': 23295, 'loss/train': 1.657401442527771} -11/07/2021 00:30:29 - INFO - __main__ - Step 23297: {'lr': 0.0004748884145085998, 'samples': 4473024, 'steps': 23296, 'loss/train': 1.5072712898254395} -11/07/2021 00:30:29 - INFO - __main__ - Step 23298: {'lr': 0.0004748860964174768, 'samples': 4473216, 'steps': 23297, 'loss/train': 1.3847980499267578} -11/07/2021 00:30:30 - INFO - __main__ - Step 23299: {'lr': 0.00047488377822502365, 'samples': 4473408, 'steps': 23298, 'loss/train': 1.3205068111419678} -11/07/2021 00:30:30 - INFO - __main__ - Step 23300: {'lr': 0.00047488145993124134, 'samples': 4473600, 'steps': 23299, 'loss/train': 0.8308882713317871} -11/07/2021 00:30:30 - INFO - __main__ - Step 23301: {'lr': 0.0004748791415361309, 'samples': 4473792, 'steps': 23300, 'loss/train': 1.611672043800354} -11/07/2021 00:30:31 - INFO - __main__ - Step 23302: {'lr': 0.00047487682303969336, 'samples': 4473984, 'steps': 23301, 'loss/train': 2.2568047046661377} -11/07/2021 00:30:32 - INFO - __main__ - Step 23303: {'lr': 0.0004748745044419298, 'samples': 4474176, 'steps': 23302, 'loss/train': 1.8289871215820312} -11/07/2021 00:30:32 - INFO - __main__ - Step 23304: {'lr': 0.0004748721857428413, 'samples': 4474368, 'steps': 23303, 'loss/train': 0.8408457040786743} -11/07/2021 00:30:32 - INFO - __main__ - Step 23305: {'lr': 0.00047486986694242887, 'samples': 4474560, 'steps': 23304, 'loss/train': 1.4229025840759277} -11/07/2021 00:30:33 - INFO - __main__ - Step 23306: {'lr': 0.0004748675480406934, 'samples': 4474752, 'steps': 23305, 'loss/train': 1.8904900550842285} -11/07/2021 00:30:33 - INFO - __main__ - Step 23307: {'lr': 0.0004748652290376363, 'samples': 4474944, 'steps': 23306, 'loss/train': 1.0955767631530762} -11/07/2021 00:30:34 - INFO - __main__ - Step 23308: {'lr': 0.00047486290993325824, 'samples': 4475136, 'steps': 23307, 'loss/train': 1.1587820053100586} -11/07/2021 00:30:35 - INFO - __main__ - Step 23309: {'lr': 0.00047486059072756047, 'samples': 4475328, 'steps': 23308, 'loss/train': 1.7340482473373413} -11/07/2021 00:30:35 - INFO - __main__ - Step 23310: {'lr': 0.00047485827142054407, 'samples': 4475520, 'steps': 23309, 'loss/train': 1.6572470664978027} -11/07/2021 00:30:35 - INFO - __main__ - Step 23311: {'lr': 0.0004748559520122099, 'samples': 4475712, 'steps': 23310, 'loss/train': 1.7451789379119873} -11/07/2021 00:30:36 - INFO - __main__ - Step 23312: {'lr': 0.0004748536325025591, 'samples': 4475904, 'steps': 23311, 'loss/train': 0.9648639559745789} -11/07/2021 00:30:37 - INFO - __main__ - Step 23313: {'lr': 0.0004748513128915928, 'samples': 4476096, 'steps': 23312, 'loss/train': 1.480389952659607} -11/07/2021 00:30:37 - INFO - __main__ - Step 23314: {'lr': 0.0004748489931793119, 'samples': 4476288, 'steps': 23313, 'loss/train': 1.9649654626846313} -11/07/2021 00:30:37 - INFO - __main__ - Step 23315: {'lr': 0.00047484667336571753, 'samples': 4476480, 'steps': 23314, 'loss/train': 1.320034384727478} -11/07/2021 00:30:38 - INFO - __main__ - Step 23316: {'lr': 0.0004748443534508107, 'samples': 4476672, 'steps': 23315, 'loss/train': 1.7430577278137207} -11/07/2021 00:30:38 - INFO - __main__ - Step 23317: {'lr': 0.00047484203343459256, 'samples': 4476864, 'steps': 23316, 'loss/train': 1.815623164176941} -11/07/2021 00:30:39 - INFO - __main__ - Step 23318: {'lr': 0.000474839713317064, 'samples': 4477056, 'steps': 23317, 'loss/train': 1.7453724145889282} -11/07/2021 00:30:39 - INFO - __main__ - Step 23319: {'lr': 0.00047483739309822615, 'samples': 4477248, 'steps': 23318, 'loss/train': 1.70332932472229} -11/07/2021 00:30:40 - INFO - __main__ - Step 23320: {'lr': 0.00047483507277808, 'samples': 4477440, 'steps': 23319, 'loss/train': 1.5589721202850342} -11/07/2021 00:30:40 - INFO - __main__ - Step 23321: {'lr': 0.0004748327523566267, 'samples': 4477632, 'steps': 23320, 'loss/train': 1.1599167585372925} -11/07/2021 00:30:40 - INFO - __main__ - Step 23322: {'lr': 0.0004748304318338672, 'samples': 4477824, 'steps': 23321, 'loss/train': 1.7838388681411743} -11/07/2021 00:30:42 - INFO - __main__ - Step 23323: {'lr': 0.00047482811120980254, 'samples': 4478016, 'steps': 23322, 'loss/train': 1.4691747426986694} -11/07/2021 00:30:42 - INFO - __main__ - Step 23324: {'lr': 0.0004748257904844339, 'samples': 4478208, 'steps': 23323, 'loss/train': 1.624101996421814} -11/07/2021 00:30:42 - INFO - __main__ - Step 23325: {'lr': 0.00047482346965776215, 'samples': 4478400, 'steps': 23324, 'loss/train': 1.6079250574111938} -11/07/2021 00:30:43 - INFO - __main__ - Step 23326: {'lr': 0.0004748211487297884, 'samples': 4478592, 'steps': 23325, 'loss/train': 1.8467061519622803} -11/07/2021 00:30:43 - INFO - __main__ - Step 23327: {'lr': 0.00047481882770051377, 'samples': 4478784, 'steps': 23326, 'loss/train': 2.046962261199951} -11/07/2021 00:30:44 - INFO - __main__ - Step 23328: {'lr': 0.00047481650656993924, 'samples': 4478976, 'steps': 23327, 'loss/train': 0.17459586262702942} -11/07/2021 00:30:44 - INFO - __main__ - Step 23329: {'lr': 0.00047481418533806586, 'samples': 4479168, 'steps': 23328, 'loss/train': 1.3363194465637207} -11/07/2021 00:30:45 - INFO - __main__ - Step 23330: {'lr': 0.0004748118640048946, 'samples': 4479360, 'steps': 23329, 'loss/train': 1.5212841033935547} -11/07/2021 00:30:45 - INFO - __main__ - Step 23331: {'lr': 0.00047480954257042666, 'samples': 4479552, 'steps': 23330, 'loss/train': 1.509041428565979} -11/07/2021 00:30:46 - INFO - __main__ - Step 23332: {'lr': 0.000474807221034663, 'samples': 4479744, 'steps': 23331, 'loss/train': 1.1403354406356812} -11/07/2021 00:30:46 - INFO - __main__ - Step 23333: {'lr': 0.0004748048993976046, 'samples': 4479936, 'steps': 23332, 'loss/train': 1.8300435543060303} -11/07/2021 00:30:47 - INFO - __main__ - Step 23334: {'lr': 0.0004748025776592527, 'samples': 4480128, 'steps': 23333, 'loss/train': 1.7769771814346313} -11/07/2021 00:30:47 - INFO - __main__ - Step 23335: {'lr': 0.00047480025581960817, 'samples': 4480320, 'steps': 23334, 'loss/train': 1.5390480756759644} -11/07/2021 00:30:48 - INFO - __main__ - Step 23336: {'lr': 0.0004747979338786721, 'samples': 4480512, 'steps': 23335, 'loss/train': 1.405137062072754} -11/07/2021 00:30:48 - INFO - __main__ - Step 23337: {'lr': 0.00047479561183644557, 'samples': 4480704, 'steps': 23336, 'loss/train': 1.7070698738098145} -11/07/2021 00:30:48 - INFO - __main__ - Step 23338: {'lr': 0.00047479328969292963, 'samples': 4480896, 'steps': 23337, 'loss/train': 1.2690377235412598} -11/07/2021 00:30:49 - INFO - __main__ - Step 23339: {'lr': 0.0004747909674481253, 'samples': 4481088, 'steps': 23338, 'loss/train': 1.9424190521240234} -11/07/2021 00:30:50 - INFO - __main__ - Step 23340: {'lr': 0.00047478864510203355, 'samples': 4481280, 'steps': 23339, 'loss/train': 1.096649169921875} -11/07/2021 00:30:50 - INFO - __main__ - Step 23341: {'lr': 0.0004747863226546556, 'samples': 4481472, 'steps': 23340, 'loss/train': 1.366512417793274} -11/07/2021 00:30:50 - INFO - __main__ - Step 23342: {'lr': 0.0004747840001059923, 'samples': 4481664, 'steps': 23341, 'loss/train': 1.7543566226959229} -11/07/2021 00:30:51 - INFO - __main__ - Step 23343: {'lr': 0.00047478167745604495, 'samples': 4481856, 'steps': 23342, 'loss/train': 1.4305206537246704} -11/07/2021 00:30:52 - INFO - __main__ - Step 23344: {'lr': 0.00047477935470481434, 'samples': 4482048, 'steps': 23343, 'loss/train': 1.8772815465927124} -11/07/2021 00:30:52 - INFO - __main__ - Step 23345: {'lr': 0.00047477703185230157, 'samples': 4482240, 'steps': 23344, 'loss/train': 1.6674097776412964} -11/07/2021 00:30:52 - INFO - __main__ - Step 23346: {'lr': 0.00047477470889850784, 'samples': 4482432, 'steps': 23345, 'loss/train': 1.761983871459961} -11/07/2021 00:30:53 - INFO - __main__ - Step 23347: {'lr': 0.00047477238584343407, 'samples': 4482624, 'steps': 23346, 'loss/train': 1.2408764362335205} -11/07/2021 00:30:53 - INFO - __main__ - Step 23348: {'lr': 0.00047477006268708134, 'samples': 4482816, 'steps': 23347, 'loss/train': 1.8868632316589355} -11/07/2021 00:30:54 - INFO - __main__ - Step 23349: {'lr': 0.00047476773942945063, 'samples': 4483008, 'steps': 23348, 'loss/train': 1.5643318891525269} -11/07/2021 00:30:55 - INFO - __main__ - Step 23350: {'lr': 0.00047476541607054313, 'samples': 4483200, 'steps': 23349, 'loss/train': 0.34093764424324036} -11/07/2021 00:30:55 - INFO - __main__ - Step 23351: {'lr': 0.0004747630926103597, 'samples': 4483392, 'steps': 23350, 'loss/train': 1.2700945138931274} -11/07/2021 00:30:55 - INFO - __main__ - Step 23352: {'lr': 0.0004747607690489015, 'samples': 4483584, 'steps': 23351, 'loss/train': 1.5466938018798828} -11/07/2021 00:30:56 - INFO - __main__ - Step 23353: {'lr': 0.00047475844538616966, 'samples': 4483776, 'steps': 23352, 'loss/train': 1.6921113729476929} -11/07/2021 00:30:57 - INFO - __main__ - Step 23354: {'lr': 0.0004747561216221651, 'samples': 4483968, 'steps': 23353, 'loss/train': 2.1484296321868896} -11/07/2021 00:30:57 - INFO - __main__ - Step 23355: {'lr': 0.0004747537977568889, 'samples': 4484160, 'steps': 23354, 'loss/train': 0.8833921551704407} -11/07/2021 00:30:57 - INFO - __main__ - Step 23356: {'lr': 0.00047475147379034206, 'samples': 4484352, 'steps': 23355, 'loss/train': 1.4659409523010254} -11/07/2021 00:30:58 - INFO - __main__ - Step 23357: {'lr': 0.0004747491497225257, 'samples': 4484544, 'steps': 23356, 'loss/train': 1.5523254871368408} -11/07/2021 00:30:58 - INFO - __main__ - Step 23358: {'lr': 0.00047474682555344083, 'samples': 4484736, 'steps': 23357, 'loss/train': 1.6649246215820312} -11/07/2021 00:30:59 - INFO - __main__ - Step 23359: {'lr': 0.00047474450128308853, 'samples': 4484928, 'steps': 23358, 'loss/train': 1.7693043947219849} -11/07/2021 00:30:59 - INFO - __main__ - Step 23360: {'lr': 0.0004747421769114698, 'samples': 4485120, 'steps': 23359, 'loss/train': 1.51509428024292} -11/07/2021 00:31:00 - INFO - __main__ - Step 23361: {'lr': 0.00047473985243858577, 'samples': 4485312, 'steps': 23360, 'loss/train': 1.0619897842407227} -11/07/2021 00:31:00 - INFO - __main__ - Step 23362: {'lr': 0.00047473752786443736, 'samples': 4485504, 'steps': 23361, 'loss/train': 1.8989733457565308} -11/07/2021 00:31:00 - INFO - __main__ - Step 23363: {'lr': 0.0004747352031890257, 'samples': 4485696, 'steps': 23362, 'loss/train': 1.4395792484283447} -11/07/2021 00:31:02 - INFO - __main__ - Step 23364: {'lr': 0.0004747328784123519, 'samples': 4485888, 'steps': 23363, 'loss/train': 1.523278832435608} -11/07/2021 00:31:02 - INFO - __main__ - Step 23365: {'lr': 0.00047473055353441685, 'samples': 4486080, 'steps': 23364, 'loss/train': 1.8186616897583008} -11/07/2021 00:31:02 - INFO - __main__ - Step 23366: {'lr': 0.0004747282285552217, 'samples': 4486272, 'steps': 23365, 'loss/train': 1.4175355434417725} -11/07/2021 00:31:03 - INFO - __main__ - Step 23367: {'lr': 0.0004747259034747675, 'samples': 4486464, 'steps': 23366, 'loss/train': 1.718819499015808} -11/07/2021 00:31:03 - INFO - __main__ - Step 23368: {'lr': 0.00047472357829305524, 'samples': 4486656, 'steps': 23367, 'loss/train': 1.7335102558135986} -11/07/2021 00:31:04 - INFO - __main__ - Step 23369: {'lr': 0.0004747212530100861, 'samples': 4486848, 'steps': 23368, 'loss/train': 1.7119697332382202} -11/07/2021 00:31:04 - INFO - __main__ - Step 23370: {'lr': 0.0004747189276258609, 'samples': 4487040, 'steps': 23369, 'loss/train': 1.813303828239441} -11/07/2021 00:31:05 - INFO - __main__ - Step 23371: {'lr': 0.0004747166021403809, 'samples': 4487232, 'steps': 23370, 'loss/train': 1.7188760042190552} -11/07/2021 00:31:05 - INFO - __main__ - Step 23372: {'lr': 0.000474714276553647, 'samples': 4487424, 'steps': 23371, 'loss/train': 1.8126929998397827} -11/07/2021 00:31:05 - INFO - __main__ - Step 23373: {'lr': 0.00047471195086566035, 'samples': 4487616, 'steps': 23372, 'loss/train': 1.1047699451446533} -11/07/2021 00:31:06 - INFO - __main__ - Step 23374: {'lr': 0.000474709625076422, 'samples': 4487808, 'steps': 23373, 'loss/train': 2.256373167037964} -11/07/2021 00:31:07 - INFO - __main__ - Step 23375: {'lr': 0.0004747072991859329, 'samples': 4488000, 'steps': 23374, 'loss/train': 1.7977204322814941} -11/07/2021 00:31:07 - INFO - __main__ - Step 23376: {'lr': 0.0004747049731941942, 'samples': 4488192, 'steps': 23375, 'loss/train': 0.995120108127594} -11/07/2021 00:31:07 - INFO - __main__ - Step 23377: {'lr': 0.0004747026471012069, 'samples': 4488384, 'steps': 23376, 'loss/train': 1.240659236907959} -11/07/2021 00:31:08 - INFO - __main__ - Step 23378: {'lr': 0.000474700320906972, 'samples': 4488576, 'steps': 23377, 'loss/train': 1.879565715789795} -11/07/2021 00:31:08 - INFO - __main__ - Step 23379: {'lr': 0.0004746979946114907, 'samples': 4488768, 'steps': 23378, 'loss/train': 1.5867724418640137} -11/07/2021 00:31:09 - INFO - __main__ - Step 23380: {'lr': 0.000474695668214764, 'samples': 4488960, 'steps': 23379, 'loss/train': 1.5567258596420288} -11/07/2021 00:31:09 - INFO - __main__ - Step 23381: {'lr': 0.00047469334171679266, 'samples': 4489152, 'steps': 23380, 'loss/train': 1.4264450073242188} -11/07/2021 00:31:10 - INFO - __main__ - Step 23382: {'lr': 0.00047469101511757815, 'samples': 4489344, 'steps': 23381, 'loss/train': 1.7234845161437988} -11/07/2021 00:31:10 - INFO - __main__ - Step 23383: {'lr': 0.00047468868841712134, 'samples': 4489536, 'steps': 23382, 'loss/train': 1.4425300359725952} -11/07/2021 00:31:10 - INFO - __main__ - Step 23384: {'lr': 0.00047468636161542325, 'samples': 4489728, 'steps': 23383, 'loss/train': 1.4994603395462036} -11/07/2021 00:31:11 - INFO - __main__ - Step 23385: {'lr': 0.0004746840347124849, 'samples': 4489920, 'steps': 23384, 'loss/train': 1.5308146476745605} -11/07/2021 00:31:12 - INFO - __main__ - Step 23386: {'lr': 0.0004746817077083074, 'samples': 4490112, 'steps': 23385, 'loss/train': 1.2547379732131958} -11/07/2021 00:31:12 - INFO - __main__ - Step 23387: {'lr': 0.00047467938060289185, 'samples': 4490304, 'steps': 23386, 'loss/train': 1.469014048576355} -11/07/2021 00:31:13 - INFO - __main__ - Step 23388: {'lr': 0.0004746770533962391, 'samples': 4490496, 'steps': 23387, 'loss/train': 1.6473876237869263} -11/07/2021 00:31:13 - INFO - __main__ - Step 23389: {'lr': 0.0004746747260883505, 'samples': 4490688, 'steps': 23388, 'loss/train': 1.6516025066375732} -11/07/2021 00:31:14 - INFO - __main__ - Step 23390: {'lr': 0.0004746723986792268, 'samples': 4490880, 'steps': 23389, 'loss/train': 1.4926345348358154} -11/07/2021 00:31:14 - INFO - __main__ - Step 23391: {'lr': 0.0004746700711688693, 'samples': 4491072, 'steps': 23390, 'loss/train': 1.5572574138641357} -11/07/2021 00:31:15 - INFO - __main__ - Step 23392: {'lr': 0.0004746677435572789, 'samples': 4491264, 'steps': 23391, 'loss/train': 1.267289161682129} -11/07/2021 00:31:15 - INFO - __main__ - Step 23393: {'lr': 0.00047466541584445667, 'samples': 4491456, 'steps': 23392, 'loss/train': 1.4724624156951904} -11/07/2021 00:31:15 - INFO - __main__ - Step 23394: {'lr': 0.0004746630880304037, 'samples': 4491648, 'steps': 23393, 'loss/train': 1.650766134262085} -11/07/2021 00:31:16 - INFO - __main__ - Step 23395: {'lr': 0.0004746607601151209, 'samples': 4491840, 'steps': 23394, 'loss/train': 1.074090838432312} -11/07/2021 00:31:17 - INFO - __main__ - Step 23396: {'lr': 0.0004746584320986096, 'samples': 4492032, 'steps': 23395, 'loss/train': 1.498843789100647} -11/07/2021 00:31:17 - INFO - __main__ - Step 23397: {'lr': 0.0004746561039808706, 'samples': 4492224, 'steps': 23396, 'loss/train': 1.0642423629760742} -11/07/2021 00:31:17 - INFO - __main__ - Step 23398: {'lr': 0.0004746537757619049, 'samples': 4492416, 'steps': 23397, 'loss/train': 1.7150928974151611} -11/07/2021 00:31:18 - INFO - __main__ - Step 23399: {'lr': 0.00047465144744171387, 'samples': 4492608, 'steps': 23398, 'loss/train': 1.2741963863372803} -11/07/2021 00:31:18 - INFO - __main__ - Step 23400: {'lr': 0.0004746491190202983, 'samples': 4492800, 'steps': 23399, 'loss/train': 1.5653659105300903} -11/07/2021 00:31:19 - INFO - __main__ - Step 23401: {'lr': 0.00047464679049765926, 'samples': 4492992, 'steps': 23400, 'loss/train': 1.7427978515625} -11/07/2021 00:31:20 - INFO - __main__ - Step 23402: {'lr': 0.00047464446187379787, 'samples': 4493184, 'steps': 23401, 'loss/train': 1.8643656969070435} -11/07/2021 00:31:20 - INFO - __main__ - Step 23403: {'lr': 0.00047464213314871514, 'samples': 4493376, 'steps': 23402, 'loss/train': 1.5454072952270508} -11/07/2021 00:31:20 - INFO - __main__ - Step 23404: {'lr': 0.0004746398043224122, 'samples': 4493568, 'steps': 23403, 'loss/train': 1.82225501537323} -11/07/2021 00:31:21 - INFO - __main__ - Step 23405: {'lr': 0.0004746374753948899, 'samples': 4493760, 'steps': 23404, 'loss/train': 1.66446852684021} -11/07/2021 00:31:22 - INFO - __main__ - Step 23406: {'lr': 0.00047463514636614945, 'samples': 4493952, 'steps': 23405, 'loss/train': 0.7836999893188477} -11/07/2021 00:31:22 - INFO - __main__ - Step 23407: {'lr': 0.00047463281723619203, 'samples': 4494144, 'steps': 23406, 'loss/train': 1.2050637006759644} -11/07/2021 00:31:22 - INFO - __main__ - Step 23408: {'lr': 0.00047463048800501837, 'samples': 4494336, 'steps': 23407, 'loss/train': 1.3217005729675293} -11/07/2021 00:31:23 - INFO - __main__ - Step 23409: {'lr': 0.00047462815867262967, 'samples': 4494528, 'steps': 23408, 'loss/train': 1.623984456062317} -11/07/2021 00:31:23 - INFO - __main__ - Step 23410: {'lr': 0.0004746258292390271, 'samples': 4494720, 'steps': 23409, 'loss/train': 1.389218807220459} -11/07/2021 00:31:24 - INFO - __main__ - Step 23411: {'lr': 0.00047462349970421147, 'samples': 4494912, 'steps': 23410, 'loss/train': 1.4058815240859985} -11/07/2021 00:31:25 - INFO - __main__ - Step 23412: {'lr': 0.0004746211700681841, 'samples': 4495104, 'steps': 23411, 'loss/train': 1.352455973625183} -11/07/2021 00:31:25 - INFO - __main__ - Step 23413: {'lr': 0.0004746188403309457, 'samples': 4495296, 'steps': 23412, 'loss/train': 1.3618943691253662} -11/07/2021 00:31:25 - INFO - __main__ - Step 23414: {'lr': 0.00047461651049249764, 'samples': 4495488, 'steps': 23413, 'loss/train': 1.349570393562317} -11/07/2021 00:31:26 - INFO - __main__ - Step 23415: {'lr': 0.0004746141805528409, 'samples': 4495680, 'steps': 23414, 'loss/train': 1.1598076820373535} -11/07/2021 00:31:27 - INFO - __main__ - Step 23416: {'lr': 0.00047461185051197644, 'samples': 4495872, 'steps': 23415, 'loss/train': 0.9544047117233276} -11/07/2021 00:31:27 - INFO - __main__ - Step 23417: {'lr': 0.0004746095203699053, 'samples': 4496064, 'steps': 23416, 'loss/train': 1.0990289449691772} -11/07/2021 00:31:28 - INFO - __main__ - Step 23418: {'lr': 0.00047460719012662857, 'samples': 4496256, 'steps': 23417, 'loss/train': 1.5603042840957642} -11/07/2021 00:31:28 - INFO - __main__ - Step 23419: {'lr': 0.00047460485978214733, 'samples': 4496448, 'steps': 23418, 'loss/train': 1.791231393814087} -11/07/2021 00:31:28 - INFO - __main__ - Step 23420: {'lr': 0.00047460252933646265, 'samples': 4496640, 'steps': 23419, 'loss/train': 1.5584287643432617} -11/07/2021 00:31:29 - INFO - __main__ - Step 23421: {'lr': 0.0004746001987895755, 'samples': 4496832, 'steps': 23420, 'loss/train': 0.7658491134643555} -11/07/2021 00:31:30 - INFO - __main__ - Step 23422: {'lr': 0.00047459786814148697, 'samples': 4497024, 'steps': 23421, 'loss/train': 0.8147704005241394} -11/07/2021 00:31:30 - INFO - __main__ - Step 23423: {'lr': 0.0004745955373921981, 'samples': 4497216, 'steps': 23422, 'loss/train': 1.684801697731018} -11/07/2021 00:31:30 - INFO - __main__ - Step 23424: {'lr': 0.0004745932065417099, 'samples': 4497408, 'steps': 23423, 'loss/train': 0.9494284987449646} -11/07/2021 00:31:31 - INFO - __main__ - Step 23425: {'lr': 0.00047459087559002355, 'samples': 4497600, 'steps': 23424, 'loss/train': 0.885067343711853} -11/07/2021 00:31:31 - INFO - __main__ - Step 23426: {'lr': 0.00047458854453713995, 'samples': 4497792, 'steps': 23425, 'loss/train': 1.3821614980697632} -11/07/2021 00:31:32 - INFO - __main__ - Step 23427: {'lr': 0.0004745862133830603, 'samples': 4497984, 'steps': 23426, 'loss/train': 1.4860104322433472} -11/07/2021 00:31:33 - INFO - __main__ - Step 23428: {'lr': 0.00047458388212778547, 'samples': 4498176, 'steps': 23427, 'loss/train': 1.527248740196228} -11/07/2021 00:31:33 - INFO - __main__ - Step 23429: {'lr': 0.00047458155077131664, 'samples': 4498368, 'steps': 23428, 'loss/train': 1.6233726739883423} -11/07/2021 00:31:33 - INFO - __main__ - Step 23430: {'lr': 0.0004745792193136549, 'samples': 4498560, 'steps': 23429, 'loss/train': 1.2394837141036987} -11/07/2021 00:31:34 - INFO - __main__ - Step 23431: {'lr': 0.00047457688775480114, 'samples': 4498752, 'steps': 23430, 'loss/train': 1.7909239530563354} -11/07/2021 00:31:35 - INFO - __main__ - Step 23432: {'lr': 0.0004745745560947565, 'samples': 4498944, 'steps': 23431, 'loss/train': 1.5196155309677124} -11/07/2021 00:31:35 - INFO - __main__ - Step 23433: {'lr': 0.0004745722243335221, 'samples': 4499136, 'steps': 23432, 'loss/train': 1.977839708328247} -11/07/2021 00:31:35 - INFO - __main__ - Step 23434: {'lr': 0.0004745698924710988, 'samples': 4499328, 'steps': 23433, 'loss/train': 1.6531399488449097} -11/07/2021 00:31:36 - INFO - __main__ - Step 23435: {'lr': 0.00047456756050748793, 'samples': 4499520, 'steps': 23434, 'loss/train': 1.1196846961975098} -11/07/2021 00:31:36 - INFO - __main__ - Step 23436: {'lr': 0.0004745652284426903, 'samples': 4499712, 'steps': 23435, 'loss/train': 1.790719747543335} -11/07/2021 00:31:36 - INFO - __main__ - Step 23437: {'lr': 0.00047456289627670703, 'samples': 4499904, 'steps': 23436, 'loss/train': 1.2567437887191772} -11/07/2021 00:31:37 - INFO - __main__ - Step 23438: {'lr': 0.0004745605640095392, 'samples': 4500096, 'steps': 23437, 'loss/train': 1.2304730415344238} -11/07/2021 00:31:38 - INFO - __main__ - Step 23439: {'lr': 0.00047455823164118787, 'samples': 4500288, 'steps': 23438, 'loss/train': 2.25645112991333} -11/07/2021 00:31:38 - INFO - __main__ - Step 23440: {'lr': 0.00047455589917165406, 'samples': 4500480, 'steps': 23439, 'loss/train': 1.7855865955352783} -11/07/2021 00:31:38 - INFO - __main__ - Step 23441: {'lr': 0.00047455356660093886, 'samples': 4500672, 'steps': 23440, 'loss/train': 1.5271779298782349} -11/07/2021 00:31:39 - INFO - __main__ - Step 23442: {'lr': 0.0004745512339290432, 'samples': 4500864, 'steps': 23441, 'loss/train': 1.948983073234558} -11/07/2021 00:31:40 - INFO - __main__ - Step 23443: {'lr': 0.00047454890115596824, 'samples': 4501056, 'steps': 23442, 'loss/train': 1.409691333770752} -11/07/2021 00:31:40 - INFO - __main__ - Step 23444: {'lr': 0.00047454656828171504, 'samples': 4501248, 'steps': 23443, 'loss/train': 1.1951667070388794} -11/07/2021 00:31:40 - INFO - __main__ - Step 23445: {'lr': 0.0004745442353062846, 'samples': 4501440, 'steps': 23444, 'loss/train': 1.2143166065216064} -11/07/2021 00:31:41 - INFO - __main__ - Step 23446: {'lr': 0.000474541902229678, 'samples': 4501632, 'steps': 23445, 'loss/train': 1.2001657485961914} -11/07/2021 00:31:41 - INFO - __main__ - Step 23447: {'lr': 0.0004745395690518963, 'samples': 4501824, 'steps': 23446, 'loss/train': 1.7846274375915527} -11/07/2021 00:31:42 - INFO - __main__ - Step 23448: {'lr': 0.0004745372357729405, 'samples': 4502016, 'steps': 23447, 'loss/train': 1.5660029649734497} -11/07/2021 00:31:43 - INFO - __main__ - Step 23449: {'lr': 0.0004745349023928117, 'samples': 4502208, 'steps': 23448, 'loss/train': 1.749601125717163} -11/07/2021 00:31:43 - INFO - __main__ - Step 23450: {'lr': 0.000474532568911511, 'samples': 4502400, 'steps': 23449, 'loss/train': 1.29769766330719} -11/07/2021 00:31:43 - INFO - __main__ - Step 23451: {'lr': 0.00047453023532903927, 'samples': 4502592, 'steps': 23450, 'loss/train': 1.027752161026001} -11/07/2021 00:31:44 - INFO - __main__ - Step 23452: {'lr': 0.00047452790164539775, 'samples': 4502784, 'steps': 23451, 'loss/train': 1.5923694372177124} -11/07/2021 00:31:45 - INFO - __main__ - Step 23453: {'lr': 0.00047452556786058744, 'samples': 4502976, 'steps': 23452, 'loss/train': 1.835474967956543} -11/07/2021 00:31:45 - INFO - __main__ - Step 23454: {'lr': 0.0004745232339746094, 'samples': 4503168, 'steps': 23453, 'loss/train': 1.6376953125} -11/07/2021 00:31:45 - INFO - __main__ - Step 23455: {'lr': 0.00047452089998746463, 'samples': 4503360, 'steps': 23454, 'loss/train': 1.2960706949234009} -11/07/2021 00:31:46 - INFO - __main__ - Step 23456: {'lr': 0.0004745185658991541, 'samples': 4503552, 'steps': 23455, 'loss/train': 1.8943711519241333} -11/07/2021 00:31:46 - INFO - __main__ - Step 23457: {'lr': 0.0004745162317096791, 'samples': 4503744, 'steps': 23456, 'loss/train': 1.8373547792434692} -11/07/2021 00:31:47 - INFO - __main__ - Step 23458: {'lr': 0.0004745138974190405, 'samples': 4503936, 'steps': 23457, 'loss/train': 1.8252520561218262} -11/07/2021 00:31:47 - INFO - __main__ - Step 23459: {'lr': 0.0004745115630272394, 'samples': 4504128, 'steps': 23458, 'loss/train': 1.5691437721252441} -11/07/2021 00:31:48 - INFO - __main__ - Step 23460: {'lr': 0.00047450922853427686, 'samples': 4504320, 'steps': 23459, 'loss/train': 1.3738198280334473} -11/07/2021 00:31:48 - INFO - __main__ - Step 23461: {'lr': 0.0004745068939401539, 'samples': 4504512, 'steps': 23460, 'loss/train': 1.3941560983657837} -11/07/2021 00:31:49 - INFO - __main__ - Step 23462: {'lr': 0.0004745045592448717, 'samples': 4504704, 'steps': 23461, 'loss/train': 1.6935898065567017} -11/07/2021 00:31:50 - INFO - __main__ - Step 23463: {'lr': 0.00047450222444843105, 'samples': 4504896, 'steps': 23462, 'loss/train': 1.527276873588562} -11/07/2021 00:31:50 - INFO - __main__ - Step 23464: {'lr': 0.0004744998895508333, 'samples': 4505088, 'steps': 23463, 'loss/train': 1.3515911102294922} -11/07/2021 00:31:50 - INFO - __main__ - Step 23465: {'lr': 0.0004744975545520793, 'samples': 4505280, 'steps': 23464, 'loss/train': 1.4795407056808472} -11/07/2021 00:31:51 - INFO - __main__ - Step 23466: {'lr': 0.00047449521945217016, 'samples': 4505472, 'steps': 23465, 'loss/train': 1.0448362827301025} -11/07/2021 00:31:51 - INFO - __main__ - Step 23467: {'lr': 0.00047449288425110693, 'samples': 4505664, 'steps': 23466, 'loss/train': 1.4558610916137695} -11/07/2021 00:31:52 - INFO - __main__ - Step 23468: {'lr': 0.00047449054894889073, 'samples': 4505856, 'steps': 23467, 'loss/train': 1.4664283990859985} -11/07/2021 00:31:53 - INFO - __main__ - Step 23469: {'lr': 0.00047448821354552253, 'samples': 4506048, 'steps': 23468, 'loss/train': 1.1906158924102783} -11/07/2021 00:31:53 - INFO - __main__ - Step 23470: {'lr': 0.0004744858780410034, 'samples': 4506240, 'steps': 23469, 'loss/train': 0.4644726514816284} -11/07/2021 00:31:53 - INFO - __main__ - Step 23471: {'lr': 0.0004744835424353344, 'samples': 4506432, 'steps': 23470, 'loss/train': 1.616047739982605} -11/07/2021 00:31:54 - INFO - __main__ - Step 23472: {'lr': 0.00047448120672851653, 'samples': 4506624, 'steps': 23471, 'loss/train': 1.0819038152694702} -11/07/2021 00:31:54 - INFO - __main__ - Step 23473: {'lr': 0.0004744788709205509, 'samples': 4506816, 'steps': 23472, 'loss/train': 1.925014853477478} -11/07/2021 00:31:55 - INFO - __main__ - Step 23474: {'lr': 0.0004744765350114386, 'samples': 4507008, 'steps': 23473, 'loss/train': 1.4738006591796875} -11/07/2021 00:31:56 - INFO - __main__ - Step 23475: {'lr': 0.00047447419900118067, 'samples': 4507200, 'steps': 23474, 'loss/train': 1.3570666313171387} -11/07/2021 00:31:56 - INFO - __main__ - Step 23476: {'lr': 0.00047447186288977804, 'samples': 4507392, 'steps': 23475, 'loss/train': 2.686858892440796} -11/07/2021 00:31:56 - INFO - __main__ - Step 23477: {'lr': 0.0004744695266772319, 'samples': 4507584, 'steps': 23476, 'loss/train': 1.099247694015503} -11/07/2021 00:31:57 - INFO - __main__ - Step 23478: {'lr': 0.00047446719036354324, 'samples': 4507776, 'steps': 23477, 'loss/train': 1.62332022190094} -11/07/2021 00:31:58 - INFO - __main__ - Step 23479: {'lr': 0.0004744648539487132, 'samples': 4507968, 'steps': 23478, 'loss/train': 1.5295865535736084} -11/07/2021 00:31:58 - INFO - __main__ - Step 23480: {'lr': 0.00047446251743274263, 'samples': 4508160, 'steps': 23479, 'loss/train': 1.2681844234466553} -11/07/2021 00:31:58 - INFO - __main__ - Step 23481: {'lr': 0.0004744601808156328, 'samples': 4508352, 'steps': 23480, 'loss/train': 1.326259970664978} -11/07/2021 00:31:59 - INFO - __main__ - Step 23482: {'lr': 0.00047445784409738467, 'samples': 4508544, 'steps': 23481, 'loss/train': 1.8529151678085327} -11/07/2021 00:31:59 - INFO - __main__ - Step 23483: {'lr': 0.0004744555072779993, 'samples': 4508736, 'steps': 23482, 'loss/train': 1.6085487604141235} -11/07/2021 00:31:59 - INFO - __main__ - Step 23484: {'lr': 0.0004744531703574777, 'samples': 4508928, 'steps': 23483, 'loss/train': 1.3744274377822876} -11/07/2021 00:32:01 - INFO - __main__ - Step 23485: {'lr': 0.00047445083333582104, 'samples': 4509120, 'steps': 23484, 'loss/train': 1.4718713760375977} -11/07/2021 00:32:01 - INFO - __main__ - Step 23486: {'lr': 0.00047444849621303023, 'samples': 4509312, 'steps': 23485, 'loss/train': 1.6028051376342773} -11/07/2021 00:32:01 - INFO - __main__ - Step 23487: {'lr': 0.00047444615898910644, 'samples': 4509504, 'steps': 23486, 'loss/train': 1.021246314048767} -11/07/2021 00:32:02 - INFO - __main__ - Step 23488: {'lr': 0.00047444382166405067, 'samples': 4509696, 'steps': 23487, 'loss/train': 5.782830238342285} -11/07/2021 00:32:02 - INFO - __main__ - Step 23489: {'lr': 0.0004744414842378639, 'samples': 4509888, 'steps': 23488, 'loss/train': 1.5995277166366577} -11/07/2021 00:32:03 - INFO - __main__ - Step 23490: {'lr': 0.0004744391467105473, 'samples': 4510080, 'steps': 23489, 'loss/train': 0.973374605178833} -11/07/2021 00:32:03 - INFO - __main__ - Step 23491: {'lr': 0.00047443680908210194, 'samples': 4510272, 'steps': 23490, 'loss/train': 2.7277424335479736} -11/07/2021 00:32:04 - INFO - __main__ - Step 23492: {'lr': 0.00047443447135252876, 'samples': 4510464, 'steps': 23491, 'loss/train': 1.391707181930542} -11/07/2021 00:32:04 - INFO - __main__ - Step 23493: {'lr': 0.0004744321335218289, 'samples': 4510656, 'steps': 23492, 'loss/train': 1.6771727800369263} -11/07/2021 00:32:04 - INFO - __main__ - Step 23494: {'lr': 0.0004744297955900034, 'samples': 4510848, 'steps': 23493, 'loss/train': 1.001266360282898} -11/07/2021 00:32:05 - INFO - __main__ - Step 23495: {'lr': 0.00047442745755705326, 'samples': 4511040, 'steps': 23494, 'loss/train': 1.4900996685028076} -11/07/2021 00:32:06 - INFO - __main__ - Step 23496: {'lr': 0.00047442511942297953, 'samples': 4511232, 'steps': 23495, 'loss/train': 1.4952882528305054} -11/07/2021 00:32:06 - INFO - __main__ - Step 23497: {'lr': 0.00047442278118778336, 'samples': 4511424, 'steps': 23496, 'loss/train': 1.5954856872558594} -11/07/2021 00:32:06 - INFO - __main__ - Step 23498: {'lr': 0.0004744204428514658, 'samples': 4511616, 'steps': 23497, 'loss/train': 1.7899006605148315} -11/07/2021 00:32:07 - INFO - __main__ - Step 23499: {'lr': 0.00047441810441402777, 'samples': 4511808, 'steps': 23498, 'loss/train': 0.658106803894043} -11/07/2021 00:32:07 - INFO - __main__ - Step 23500: {'lr': 0.0004744157658754704, 'samples': 4512000, 'steps': 23499, 'loss/train': 1.4799785614013672} -11/07/2021 00:32:08 - INFO - __main__ - Step 23501: {'lr': 0.0004744134272357948, 'samples': 4512192, 'steps': 23500, 'loss/train': 1.6532243490219116} -11/07/2021 00:32:09 - INFO - __main__ - Step 23502: {'lr': 0.0004744110884950019, 'samples': 4512384, 'steps': 23501, 'loss/train': 2.228314161300659} -11/07/2021 00:32:09 - INFO - __main__ - Step 23503: {'lr': 0.00047440874965309286, 'samples': 4512576, 'steps': 23502, 'loss/train': 1.303419589996338} -11/07/2021 00:32:09 - INFO - __main__ - Step 23504: {'lr': 0.00047440641071006874, 'samples': 4512768, 'steps': 23503, 'loss/train': 1.6008127927780151} -11/07/2021 00:32:10 - INFO - __main__ - Step 23505: {'lr': 0.00047440407166593056, 'samples': 4512960, 'steps': 23504, 'loss/train': 1.4751851558685303} -11/07/2021 00:32:11 - INFO - __main__ - Step 23506: {'lr': 0.0004744017325206793, 'samples': 4513152, 'steps': 23505, 'loss/train': 5.9636006355285645} -11/07/2021 00:32:11 - INFO - __main__ - Step 23507: {'lr': 0.00047439939327431613, 'samples': 4513344, 'steps': 23506, 'loss/train': 2.0052008628845215} -11/07/2021 00:32:11 - INFO - __main__ - Step 23508: {'lr': 0.0004743970539268421, 'samples': 4513536, 'steps': 23507, 'loss/train': 1.7036689519882202} -11/07/2021 00:32:12 - INFO - __main__ - Step 23509: {'lr': 0.00047439471447825813, 'samples': 4513728, 'steps': 23508, 'loss/train': 2.1218676567077637} -11/07/2021 00:32:12 - INFO - __main__ - Step 23510: {'lr': 0.00047439237492856543, 'samples': 4513920, 'steps': 23509, 'loss/train': 1.58950674533844} -11/07/2021 00:32:12 - INFO - __main__ - Step 23511: {'lr': 0.0004743900352777649, 'samples': 4514112, 'steps': 23510, 'loss/train': 1.7900227308273315} -11/07/2021 00:32:13 - INFO - __main__ - Step 23512: {'lr': 0.0004743876955258578, 'samples': 4514304, 'steps': 23511, 'loss/train': 1.8968209028244019} -11/07/2021 00:32:14 - INFO - __main__ - Step 23513: {'lr': 0.00047438535567284504, 'samples': 4514496, 'steps': 23512, 'loss/train': 1.653573751449585} -11/07/2021 00:32:14 - INFO - __main__ - Step 23514: {'lr': 0.00047438301571872763, 'samples': 4514688, 'steps': 23513, 'loss/train': 1.7201824188232422} -11/07/2021 00:32:14 - INFO - __main__ - Step 23515: {'lr': 0.00047438067566350675, 'samples': 4514880, 'steps': 23514, 'loss/train': 1.5156289339065552} -11/07/2021 00:32:15 - INFO - __main__ - Step 23516: {'lr': 0.00047437833550718336, 'samples': 4515072, 'steps': 23515, 'loss/train': 1.3097409009933472} -11/07/2021 00:32:16 - INFO - __main__ - Step 23517: {'lr': 0.0004743759952497586, 'samples': 4515264, 'steps': 23516, 'loss/train': 1.3028639554977417} -11/07/2021 00:32:16 - INFO - __main__ - Step 23518: {'lr': 0.0004743736548912334, 'samples': 4515456, 'steps': 23517, 'loss/train': 1.5353991985321045} -11/07/2021 00:32:17 - INFO - __main__ - Step 23519: {'lr': 0.00047437131443160897, 'samples': 4515648, 'steps': 23518, 'loss/train': 1.5825148820877075} -11/07/2021 00:32:17 - INFO - __main__ - Step 23520: {'lr': 0.0004743689738708863, 'samples': 4515840, 'steps': 23519, 'loss/train': 0.6383938193321228} -11/07/2021 00:32:17 - INFO - __main__ - Step 23521: {'lr': 0.0004743666332090664, 'samples': 4516032, 'steps': 23520, 'loss/train': 1.2356423139572144} -11/07/2021 00:32:18 - INFO - __main__ - Step 23522: {'lr': 0.00047436429244615037, 'samples': 4516224, 'steps': 23521, 'loss/train': 1.6078827381134033} -11/07/2021 00:32:19 - INFO - __main__ - Step 23523: {'lr': 0.0004743619515821392, 'samples': 4516416, 'steps': 23522, 'loss/train': 1.2691593170166016} -11/07/2021 00:32:19 - INFO - __main__ - Step 23524: {'lr': 0.00047435961061703403, 'samples': 4516608, 'steps': 23523, 'loss/train': 1.7472574710845947} -11/07/2021 00:32:19 - INFO - __main__ - Step 23525: {'lr': 0.00047435726955083593, 'samples': 4516800, 'steps': 23524, 'loss/train': 1.865501880645752} -11/07/2021 00:32:20 - INFO - __main__ - Step 23526: {'lr': 0.0004743549283835459, 'samples': 4516992, 'steps': 23525, 'loss/train': 1.6130586862564087} -11/07/2021 00:32:21 - INFO - __main__ - Step 23527: {'lr': 0.00047435258711516496, 'samples': 4517184, 'steps': 23526, 'loss/train': 1.3543508052825928} -11/07/2021 00:32:21 - INFO - __main__ - Step 23528: {'lr': 0.0004743502457456942, 'samples': 4517376, 'steps': 23527, 'loss/train': 1.4319701194763184} -11/07/2021 00:32:21 - INFO - __main__ - Step 23529: {'lr': 0.0004743479042751347, 'samples': 4517568, 'steps': 23528, 'loss/train': 2.1460018157958984} -11/07/2021 00:32:22 - INFO - __main__ - Step 23530: {'lr': 0.0004743455627034875, 'samples': 4517760, 'steps': 23529, 'loss/train': 1.602501392364502} -11/07/2021 00:32:22 - INFO - __main__ - Step 23531: {'lr': 0.0004743432210307536, 'samples': 4517952, 'steps': 23530, 'loss/train': 1.7073982954025269} -11/07/2021 00:32:23 - INFO - __main__ - Step 23532: {'lr': 0.00047434087925693415, 'samples': 4518144, 'steps': 23531, 'loss/train': 1.697928547859192} -11/07/2021 00:32:23 - INFO - __main__ - Step 23533: {'lr': 0.00047433853738203013, 'samples': 4518336, 'steps': 23532, 'loss/train': 1.2396883964538574} -11/07/2021 00:32:24 - INFO - __main__ - Step 23534: {'lr': 0.00047433619540604264, 'samples': 4518528, 'steps': 23533, 'loss/train': 2.2235891819000244} -11/07/2021 00:32:24 - INFO - __main__ - Step 23535: {'lr': 0.0004743338533289728, 'samples': 4518720, 'steps': 23534, 'loss/train': 1.1533797979354858} -11/07/2021 00:32:25 - INFO - __main__ - Step 23536: {'lr': 0.0004743315111508215, 'samples': 4518912, 'steps': 23535, 'loss/train': 1.5415807962417603} -11/07/2021 00:32:25 - INFO - __main__ - Step 23537: {'lr': 0.00047432916887158995, 'samples': 4519104, 'steps': 23536, 'loss/train': 1.1145853996276855} -11/07/2021 00:32:26 - INFO - __main__ - Step 23538: {'lr': 0.00047432682649127913, 'samples': 4519296, 'steps': 23537, 'loss/train': 1.335025668144226} -11/07/2021 00:32:26 - INFO - __main__ - Step 23539: {'lr': 0.00047432448400989004, 'samples': 4519488, 'steps': 23538, 'loss/train': 1.3478022813796997} -11/07/2021 00:32:27 - INFO - __main__ - Step 23540: {'lr': 0.0004743221414274238, 'samples': 4519680, 'steps': 23539, 'loss/train': 1.494612693786621} -11/07/2021 00:32:27 - INFO - __main__ - Step 23541: {'lr': 0.00047431979874388154, 'samples': 4519872, 'steps': 23540, 'loss/train': 1.2911465167999268} -11/07/2021 00:32:28 - INFO - __main__ - Step 23542: {'lr': 0.0004743174559592642, 'samples': 4520064, 'steps': 23541, 'loss/train': 1.6779345273971558} -11/07/2021 00:32:28 - INFO - __main__ - Step 23543: {'lr': 0.0004743151130735729, 'samples': 4520256, 'steps': 23542, 'loss/train': 0.7486419677734375} -11/07/2021 00:32:29 - INFO - __main__ - Step 23544: {'lr': 0.0004743127700868086, 'samples': 4520448, 'steps': 23543, 'loss/train': 1.1932936906814575} -11/07/2021 00:32:29 - INFO - __main__ - Step 23545: {'lr': 0.00047431042699897245, 'samples': 4520640, 'steps': 23544, 'loss/train': 1.5103429555892944} -11/07/2021 00:32:29 - INFO - __main__ - Step 23546: {'lr': 0.0004743080838100655, 'samples': 4520832, 'steps': 23545, 'loss/train': 1.6619280576705933} -11/07/2021 00:32:30 - INFO - __main__ - Step 23547: {'lr': 0.0004743057405200888, 'samples': 4521024, 'steps': 23546, 'loss/train': 0.13306494057178497} -11/07/2021 00:32:31 - INFO - __main__ - Step 23548: {'lr': 0.0004743033971290434, 'samples': 4521216, 'steps': 23547, 'loss/train': 1.6675859689712524} -11/07/2021 00:32:31 - INFO - __main__ - Step 23549: {'lr': 0.00047430105363693034, 'samples': 4521408, 'steps': 23548, 'loss/train': 1.4825546741485596} -11/07/2021 00:32:32 - INFO - __main__ - Step 23550: {'lr': 0.0004742987100437507, 'samples': 4521600, 'steps': 23549, 'loss/train': 1.565748691558838} -11/07/2021 00:32:32 - INFO - __main__ - Step 23551: {'lr': 0.00047429636634950545, 'samples': 4521792, 'steps': 23550, 'loss/train': 1.7220901250839233} -11/07/2021 00:32:33 - INFO - __main__ - Step 23552: {'lr': 0.0004742940225541958, 'samples': 4521984, 'steps': 23551, 'loss/train': 1.357005000114441} -11/07/2021 00:32:33 - INFO - __main__ - Step 23553: {'lr': 0.0004742916786578227, 'samples': 4522176, 'steps': 23552, 'loss/train': 1.6558088064193726} -11/07/2021 00:32:34 - INFO - __main__ - Step 23554: {'lr': 0.00047428933466038726, 'samples': 4522368, 'steps': 23553, 'loss/train': 1.8793753385543823} -11/07/2021 00:32:34 - INFO - __main__ - Step 23555: {'lr': 0.00047428699056189047, 'samples': 4522560, 'steps': 23554, 'loss/train': 1.76802396774292} -11/07/2021 00:32:34 - INFO - __main__ - Step 23556: {'lr': 0.0004742846463623334, 'samples': 4522752, 'steps': 23555, 'loss/train': 1.8358832597732544} -11/07/2021 00:32:35 - INFO - __main__ - Step 23557: {'lr': 0.0004742823020617172, 'samples': 4522944, 'steps': 23556, 'loss/train': 1.4426796436309814} -11/07/2021 00:32:36 - INFO - __main__ - Step 23558: {'lr': 0.0004742799576600427, 'samples': 4523136, 'steps': 23557, 'loss/train': 1.814741611480713} -11/07/2021 00:32:36 - INFO - __main__ - Step 23559: {'lr': 0.00047427761315731133, 'samples': 4523328, 'steps': 23558, 'loss/train': 6.1855244636535645} -11/07/2021 00:32:36 - INFO - __main__ - Step 23560: {'lr': 0.0004742752685535238, 'samples': 4523520, 'steps': 23559, 'loss/train': 1.8517687320709229} -11/07/2021 00:32:37 - INFO - __main__ - Step 23561: {'lr': 0.00047427292384868134, 'samples': 4523712, 'steps': 23560, 'loss/train': 1.7739310264587402} -11/07/2021 00:32:37 - INFO - __main__ - Step 23562: {'lr': 0.0004742705790427849, 'samples': 4523904, 'steps': 23561, 'loss/train': 1.4885367155075073} -11/07/2021 00:32:38 - INFO - __main__ - Step 23563: {'lr': 0.00047426823413583563, 'samples': 4524096, 'steps': 23562, 'loss/train': 1.743016242980957} -11/07/2021 00:32:39 - INFO - __main__ - Step 23564: {'lr': 0.0004742658891278346, 'samples': 4524288, 'steps': 23563, 'loss/train': 1.435360074043274} -11/07/2021 00:32:39 - INFO - __main__ - Step 23565: {'lr': 0.0004742635440187828, 'samples': 4524480, 'steps': 23564, 'loss/train': 1.9791362285614014} -11/07/2021 00:32:39 - INFO - __main__ - Step 23566: {'lr': 0.00047426119880868123, 'samples': 4524672, 'steps': 23565, 'loss/train': 1.8396615982055664} -11/07/2021 00:32:40 - INFO - __main__ - Step 23567: {'lr': 0.00047425885349753114, 'samples': 4524864, 'steps': 23566, 'loss/train': 2.3755545616149902} -11/07/2021 00:32:41 - INFO - __main__ - Step 23568: {'lr': 0.0004742565080853334, 'samples': 4525056, 'steps': 23567, 'loss/train': 1.3045393228530884} -11/07/2021 00:32:41 - INFO - __main__ - Step 23569: {'lr': 0.00047425416257208916, 'samples': 4525248, 'steps': 23568, 'loss/train': 1.8492480516433716} -11/07/2021 00:32:41 - INFO - __main__ - Step 23570: {'lr': 0.0004742518169577994, 'samples': 4525440, 'steps': 23569, 'loss/train': 0.9899062514305115} -11/07/2021 00:32:42 - INFO - __main__ - Step 23571: {'lr': 0.0004742494712424653, 'samples': 4525632, 'steps': 23570, 'loss/train': 1.6598799228668213} -11/07/2021 00:32:42 - INFO - __main__ - Step 23572: {'lr': 0.0004742471254260878, 'samples': 4525824, 'steps': 23571, 'loss/train': 1.4144138097763062} -11/07/2021 00:32:43 - INFO - __main__ - Step 23573: {'lr': 0.0004742447795086681, 'samples': 4526016, 'steps': 23572, 'loss/train': 1.53965163230896} -11/07/2021 00:32:43 - INFO - __main__ - Step 23574: {'lr': 0.00047424243349020705, 'samples': 4526208, 'steps': 23573, 'loss/train': 1.7604814767837524} -11/07/2021 00:32:44 - INFO - __main__ - Step 23575: {'lr': 0.0004742400873707059, 'samples': 4526400, 'steps': 23574, 'loss/train': 1.8213621377944946} -11/07/2021 00:32:44 - INFO - __main__ - Step 23576: {'lr': 0.0004742377411501656, 'samples': 4526592, 'steps': 23575, 'loss/train': 1.6603103876113892} -11/07/2021 00:32:44 - INFO - __main__ - Step 23577: {'lr': 0.00047423539482858724, 'samples': 4526784, 'steps': 23576, 'loss/train': 1.6569072008132935} -11/07/2021 00:32:45 - INFO - __main__ - Step 23578: {'lr': 0.0004742330484059718, 'samples': 4526976, 'steps': 23577, 'loss/train': 1.5407042503356934} -11/07/2021 00:32:46 - INFO - __main__ - Step 23579: {'lr': 0.0004742307018823205, 'samples': 4527168, 'steps': 23578, 'loss/train': 1.5448529720306396} -11/07/2021 00:32:46 - INFO - __main__ - Step 23580: {'lr': 0.0004742283552576343, 'samples': 4527360, 'steps': 23579, 'loss/train': 1.6284503936767578} -11/07/2021 00:32:47 - INFO - __main__ - Step 23581: {'lr': 0.0004742260085319142, 'samples': 4527552, 'steps': 23580, 'loss/train': 1.5191917419433594} -11/07/2021 00:32:47 - INFO - __main__ - Step 23582: {'lr': 0.0004742236617051614, 'samples': 4527744, 'steps': 23581, 'loss/train': 1.9894447326660156} -11/07/2021 00:32:48 - INFO - __main__ - Step 23583: {'lr': 0.00047422131477737684, 'samples': 4527936, 'steps': 23582, 'loss/train': 1.6390395164489746} -11/07/2021 00:32:48 - INFO - __main__ - Step 23584: {'lr': 0.00047421896774856156, 'samples': 4528128, 'steps': 23583, 'loss/train': 1.4163792133331299} -11/07/2021 00:32:49 - INFO - __main__ - Step 23585: {'lr': 0.00047421662061871675, 'samples': 4528320, 'steps': 23584, 'loss/train': 1.1335351467132568} -11/07/2021 00:32:49 - INFO - __main__ - Step 23586: {'lr': 0.0004742142733878433, 'samples': 4528512, 'steps': 23585, 'loss/train': 1.5170916318893433} -11/07/2021 00:32:49 - INFO - __main__ - Step 23587: {'lr': 0.0004742119260559424, 'samples': 4528704, 'steps': 23586, 'loss/train': 2.1219773292541504} -11/07/2021 00:32:50 - INFO - __main__ - Step 23588: {'lr': 0.0004742095786230152, 'samples': 4528896, 'steps': 23587, 'loss/train': 1.6570745706558228} -11/07/2021 00:32:51 - INFO - __main__ - Step 23589: {'lr': 0.00047420723108906247, 'samples': 4529088, 'steps': 23588, 'loss/train': 0.7063665986061096} -11/07/2021 00:32:51 - INFO - __main__ - Step 23590: {'lr': 0.0004742048834540855, 'samples': 4529280, 'steps': 23589, 'loss/train': 1.5621718168258667} -11/07/2021 00:32:51 - INFO - __main__ - Step 23591: {'lr': 0.0004742025357180852, 'samples': 4529472, 'steps': 23590, 'loss/train': 1.342724084854126} -11/07/2021 00:32:52 - INFO - __main__ - Step 23592: {'lr': 0.00047420018788106274, 'samples': 4529664, 'steps': 23591, 'loss/train': 1.7082022428512573} -11/07/2021 00:32:53 - INFO - __main__ - Step 23593: {'lr': 0.00047419783994301915, 'samples': 4529856, 'steps': 23592, 'loss/train': 0.6484775543212891} -11/07/2021 00:32:53 - INFO - __main__ - Step 23594: {'lr': 0.0004741954919039554, 'samples': 4530048, 'steps': 23593, 'loss/train': 2.074641466140747} -11/07/2021 00:32:53 - INFO - __main__ - Step 23595: {'lr': 0.0004741931437638727, 'samples': 4530240, 'steps': 23594, 'loss/train': 1.5737087726593018} -11/07/2021 00:32:54 - INFO - __main__ - Step 23596: {'lr': 0.000474190795522772, 'samples': 4530432, 'steps': 23595, 'loss/train': 1.5619804859161377} -11/07/2021 00:32:54 - INFO - __main__ - Step 23597: {'lr': 0.00047418844718065433, 'samples': 4530624, 'steps': 23596, 'loss/train': 1.6500996351242065} -11/07/2021 00:32:54 - INFO - __main__ - Step 23598: {'lr': 0.0004741860987375209, 'samples': 4530816, 'steps': 23597, 'loss/train': 1.5560089349746704} -11/07/2021 00:32:56 - INFO - __main__ - Step 23599: {'lr': 0.00047418375019337263, 'samples': 4531008, 'steps': 23598, 'loss/train': 1.3333616256713867} -11/07/2021 00:32:56 - INFO - __main__ - Step 23600: {'lr': 0.00047418140154821065, 'samples': 4531200, 'steps': 23599, 'loss/train': 1.4364854097366333} -11/07/2021 00:32:56 - INFO - __main__ - Step 23601: {'lr': 0.00047417905280203594, 'samples': 4531392, 'steps': 23600, 'loss/train': 1.3260753154754639} -11/07/2021 00:32:57 - INFO - __main__ - Step 23602: {'lr': 0.00047417670395484963, 'samples': 4531584, 'steps': 23601, 'loss/train': 1.3692469596862793} -11/07/2021 00:32:57 - INFO - __main__ - Step 23603: {'lr': 0.0004741743550066527, 'samples': 4531776, 'steps': 23602, 'loss/train': 1.2754849195480347} -11/07/2021 00:32:58 - INFO - __main__ - Step 23604: {'lr': 0.00047417200595744637, 'samples': 4531968, 'steps': 23603, 'loss/train': 1.112447738647461} -11/07/2021 00:32:58 - INFO - __main__ - Step 23605: {'lr': 0.0004741696568072316, 'samples': 4532160, 'steps': 23604, 'loss/train': 1.3442082405090332} -11/07/2021 00:32:59 - INFO - __main__ - Step 23606: {'lr': 0.00047416730755600936, 'samples': 4532352, 'steps': 23605, 'loss/train': 1.3705646991729736} -11/07/2021 00:32:59 - INFO - __main__ - Step 23607: {'lr': 0.0004741649582037808, 'samples': 4532544, 'steps': 23606, 'loss/train': 1.8504846096038818} -11/07/2021 00:32:59 - INFO - __main__ - Step 23608: {'lr': 0.000474162608750547, 'samples': 4532736, 'steps': 23607, 'loss/train': 2.0150325298309326} -11/07/2021 00:33:00 - INFO - __main__ - Step 23609: {'lr': 0.000474160259196309, 'samples': 4532928, 'steps': 23608, 'loss/train': 1.2820730209350586} -11/07/2021 00:33:01 - INFO - __main__ - Step 23610: {'lr': 0.0004741579095410678, 'samples': 4533120, 'steps': 23609, 'loss/train': 1.6252810955047607} -11/07/2021 00:33:01 - INFO - __main__ - Step 23611: {'lr': 0.0004741555597848245, 'samples': 4533312, 'steps': 23610, 'loss/train': 1.7831580638885498} -11/07/2021 00:33:01 - INFO - __main__ - Step 23612: {'lr': 0.00047415320992758025, 'samples': 4533504, 'steps': 23611, 'loss/train': 1.6855032444000244} -11/07/2021 00:33:02 - INFO - __main__ - Step 23613: {'lr': 0.00047415085996933593, 'samples': 4533696, 'steps': 23612, 'loss/train': 1.319211721420288} -11/07/2021 00:33:03 - INFO - __main__ - Step 23614: {'lr': 0.00047414850991009275, 'samples': 4533888, 'steps': 23613, 'loss/train': 1.65987229347229} -11/07/2021 00:33:03 - INFO - __main__ - Step 23615: {'lr': 0.00047414615974985164, 'samples': 4534080, 'steps': 23614, 'loss/train': 0.9914699792861938} -11/07/2021 00:33:04 - INFO - __main__ - Step 23616: {'lr': 0.0004741438094886138, 'samples': 4534272, 'steps': 23615, 'loss/train': 1.6350009441375732} -11/07/2021 00:33:04 - INFO - __main__ - Step 23617: {'lr': 0.00047414145912638017, 'samples': 4534464, 'steps': 23616, 'loss/train': 2.2170348167419434} -11/07/2021 00:33:04 - INFO - __main__ - Step 23618: {'lr': 0.00047413910866315193, 'samples': 4534656, 'steps': 23617, 'loss/train': 1.1351796388626099} -11/07/2021 00:33:05 - INFO - __main__ - Step 23619: {'lr': 0.00047413675809893, 'samples': 4534848, 'steps': 23618, 'loss/train': 1.7873129844665527} -11/07/2021 00:33:06 - INFO - __main__ - Step 23620: {'lr': 0.0004741344074337155, 'samples': 4535040, 'steps': 23619, 'loss/train': 1.7315502166748047} -11/07/2021 00:33:06 - INFO - __main__ - Step 23621: {'lr': 0.00047413205666750955, 'samples': 4535232, 'steps': 23620, 'loss/train': 1.3562512397766113} -11/07/2021 00:33:06 - INFO - __main__ - Step 23622: {'lr': 0.0004741297058003131, 'samples': 4535424, 'steps': 23621, 'loss/train': 1.4748079776763916} -11/07/2021 00:33:07 - INFO - __main__ - Step 23623: {'lr': 0.00047412735483212725, 'samples': 4535616, 'steps': 23622, 'loss/train': 1.5654685497283936} -11/07/2021 00:33:08 - INFO - __main__ - Step 23624: {'lr': 0.0004741250037629531, 'samples': 4535808, 'steps': 23623, 'loss/train': 1.7665811777114868} -11/07/2021 00:33:08 - INFO - __main__ - Step 23625: {'lr': 0.00047412265259279176, 'samples': 4536000, 'steps': 23624, 'loss/train': 1.4605038166046143} -11/07/2021 00:33:08 - INFO - __main__ - Step 23626: {'lr': 0.0004741203013216441, 'samples': 4536192, 'steps': 23625, 'loss/train': 1.5320707559585571} -11/07/2021 00:33:09 - INFO - __main__ - Step 23627: {'lr': 0.0004741179499495113, 'samples': 4536384, 'steps': 23626, 'loss/train': 1.793100118637085} -11/07/2021 00:33:09 - INFO - __main__ - Step 23628: {'lr': 0.00047411559847639447, 'samples': 4536576, 'steps': 23627, 'loss/train': 2.0532431602478027} -11/07/2021 00:33:10 - INFO - __main__ - Step 23629: {'lr': 0.0004741132469022946, 'samples': 4536768, 'steps': 23628, 'loss/train': 1.0437623262405396} -11/07/2021 00:33:10 - INFO - __main__ - Step 23630: {'lr': 0.00047411089522721275, 'samples': 4536960, 'steps': 23629, 'loss/train': 2.1174731254577637} -11/07/2021 00:33:11 - INFO - __main__ - Step 23631: {'lr': 0.00047410854345114996, 'samples': 4537152, 'steps': 23630, 'loss/train': 0.6693663597106934} -11/07/2021 00:33:11 - INFO - __main__ - Step 23632: {'lr': 0.0004741061915741073, 'samples': 4537344, 'steps': 23631, 'loss/train': 1.8703787326812744} -11/07/2021 00:33:11 - INFO - __main__ - Step 23633: {'lr': 0.0004741038395960859, 'samples': 4537536, 'steps': 23632, 'loss/train': 1.3280048370361328} -11/07/2021 00:33:12 - INFO - __main__ - Step 23634: {'lr': 0.0004741014875170867, 'samples': 4537728, 'steps': 23633, 'loss/train': 1.6490123271942139} -11/07/2021 00:33:13 - INFO - __main__ - Step 23635: {'lr': 0.0004740991353371109, 'samples': 4537920, 'steps': 23634, 'loss/train': 1.6307944059371948} -11/07/2021 00:33:13 - INFO - __main__ - Step 23636: {'lr': 0.0004740967830561595, 'samples': 4538112, 'steps': 23635, 'loss/train': 1.108677864074707} -11/07/2021 00:33:14 - INFO - __main__ - Step 23637: {'lr': 0.0004740944306742335, 'samples': 4538304, 'steps': 23636, 'loss/train': 1.346545934677124} -11/07/2021 00:33:14 - INFO - __main__ - Step 23638: {'lr': 0.00047409207819133406, 'samples': 4538496, 'steps': 23637, 'loss/train': 1.454825520515442} -11/07/2021 00:33:14 - INFO - __main__ - Step 23639: {'lr': 0.0004740897256074621, 'samples': 4538688, 'steps': 23638, 'loss/train': 1.580127239227295} -11/07/2021 00:33:15 - INFO - __main__ - Step 23640: {'lr': 0.00047408737292261883, 'samples': 4538880, 'steps': 23639, 'loss/train': 0.9592517614364624} -11/07/2021 00:33:16 - INFO - __main__ - Step 23641: {'lr': 0.0004740850201368052, 'samples': 4539072, 'steps': 23640, 'loss/train': 1.6052862405776978} -11/07/2021 00:33:16 - INFO - __main__ - Step 23642: {'lr': 0.00047408266725002234, 'samples': 4539264, 'steps': 23641, 'loss/train': 1.3032270669937134} -11/07/2021 00:33:16 - INFO - __main__ - Step 23643: {'lr': 0.00047408031426227136, 'samples': 4539456, 'steps': 23642, 'loss/train': 1.8782343864440918} -11/07/2021 00:33:17 - INFO - __main__ - Step 23644: {'lr': 0.0004740779611735532, 'samples': 4539648, 'steps': 23643, 'loss/train': 1.4260307550430298} -11/07/2021 00:33:18 - INFO - __main__ - Step 23645: {'lr': 0.00047407560798386894, 'samples': 4539840, 'steps': 23644, 'loss/train': 1.8145923614501953} -11/07/2021 00:33:18 - INFO - __main__ - Step 23646: {'lr': 0.00047407325469321973, 'samples': 4540032, 'steps': 23645, 'loss/train': 1.4783227443695068} -11/07/2021 00:33:18 - INFO - __main__ - Step 23647: {'lr': 0.0004740709013016065, 'samples': 4540224, 'steps': 23646, 'loss/train': 1.334385633468628} -11/07/2021 00:33:19 - INFO - __main__ - Step 23648: {'lr': 0.0004740685478090304, 'samples': 4540416, 'steps': 23647, 'loss/train': 1.4337353706359863} -11/07/2021 00:33:19 - INFO - __main__ - Step 23649: {'lr': 0.00047406619421549247, 'samples': 4540608, 'steps': 23648, 'loss/train': 1.5111690759658813} -11/07/2021 00:33:20 - INFO - __main__ - Step 23650: {'lr': 0.0004740638405209938, 'samples': 4540800, 'steps': 23649, 'loss/train': 0.9457454681396484} -11/07/2021 00:33:21 - INFO - __main__ - Step 23651: {'lr': 0.0004740614867255353, 'samples': 4540992, 'steps': 23650, 'loss/train': 1.8303914070129395} -11/07/2021 00:33:21 - INFO - __main__ - Step 23652: {'lr': 0.0004740591328291183, 'samples': 4541184, 'steps': 23651, 'loss/train': 1.987184762954712} -11/07/2021 00:33:21 - INFO - __main__ - Step 23653: {'lr': 0.0004740567788317437, 'samples': 4541376, 'steps': 23652, 'loss/train': 0.5793235301971436} -11/07/2021 00:33:22 - INFO - __main__ - Step 23654: {'lr': 0.00047405442473341246, 'samples': 4541568, 'steps': 23653, 'loss/train': 1.494931936264038} -11/07/2021 00:33:23 - INFO - __main__ - Step 23655: {'lr': 0.0004740520705341259, 'samples': 4541760, 'steps': 23654, 'loss/train': 1.5534117221832275} -11/07/2021 00:33:23 - INFO - __main__ - Step 23656: {'lr': 0.0004740497162338848, 'samples': 4541952, 'steps': 23655, 'loss/train': 1.853484869003296} -11/07/2021 00:33:23 - INFO - __main__ - Step 23657: {'lr': 0.00047404736183269045, 'samples': 4542144, 'steps': 23656, 'loss/train': 1.5425233840942383} -11/07/2021 00:33:24 - INFO - __main__ - Step 23658: {'lr': 0.0004740450073305438, 'samples': 4542336, 'steps': 23657, 'loss/train': 0.7227396368980408} -11/07/2021 00:33:24 - INFO - __main__ - Step 23659: {'lr': 0.00047404265272744586, 'samples': 4542528, 'steps': 23658, 'loss/train': 1.440316081047058} -11/07/2021 00:33:25 - INFO - __main__ - Step 23660: {'lr': 0.0004740402980233978, 'samples': 4542720, 'steps': 23659, 'loss/train': 2.089398145675659} -11/07/2021 00:33:26 - INFO - __main__ - Step 23661: {'lr': 0.00047403794321840064, 'samples': 4542912, 'steps': 23660, 'loss/train': 1.4879977703094482} -11/07/2021 00:33:26 - INFO - __main__ - Step 23662: {'lr': 0.0004740355883124555, 'samples': 4543104, 'steps': 23661, 'loss/train': 1.8466298580169678} -11/07/2021 00:33:26 - INFO - __main__ - Step 23663: {'lr': 0.0004740332333055633, 'samples': 4543296, 'steps': 23662, 'loss/train': 1.6448774337768555} -11/07/2021 00:33:27 - INFO - __main__ - Step 23664: {'lr': 0.00047403087819772517, 'samples': 4543488, 'steps': 23663, 'loss/train': 1.5351874828338623} -11/07/2021 00:33:27 - INFO - __main__ - Step 23665: {'lr': 0.0004740285229889423, 'samples': 4543680, 'steps': 23664, 'loss/train': 1.558956503868103} -11/07/2021 00:33:29 - INFO - __main__ - Step 23666: {'lr': 0.0004740261676792155, 'samples': 4543872, 'steps': 23665, 'loss/train': 0.8988344669342041} -11/07/2021 00:33:29 - INFO - __main__ - Step 23667: {'lr': 0.00047402381226854606, 'samples': 4544064, 'steps': 23666, 'loss/train': 1.6064356565475464} -11/07/2021 00:33:29 - INFO - __main__ - Step 23668: {'lr': 0.0004740214567569349, 'samples': 4544256, 'steps': 23667, 'loss/train': 0.2895216941833496} -11/07/2021 00:33:30 - INFO - __main__ - Step 23669: {'lr': 0.00047401910114438313, 'samples': 4544448, 'steps': 23668, 'loss/train': 1.3126306533813477} -11/07/2021 00:33:30 - INFO - __main__ - Step 23670: {'lr': 0.0004740167454308918, 'samples': 4544640, 'steps': 23669, 'loss/train': 1.4516186714172363} -11/07/2021 00:33:31 - INFO - __main__ - Step 23671: {'lr': 0.00047401438961646206, 'samples': 4544832, 'steps': 23670, 'loss/train': 1.4971883296966553} -11/07/2021 00:33:31 - INFO - __main__ - Step 23672: {'lr': 0.0004740120337010948, 'samples': 4545024, 'steps': 23671, 'loss/train': 1.5388046503067017} -11/07/2021 00:33:32 - INFO - __main__ - Step 23673: {'lr': 0.0004740096776847912, 'samples': 4545216, 'steps': 23672, 'loss/train': 1.6670520305633545} -11/07/2021 00:33:32 - INFO - __main__ - Step 23674: {'lr': 0.0004740073215675523, 'samples': 4545408, 'steps': 23673, 'loss/train': 2.9824087619781494} -11/07/2021 00:33:33 - INFO - __main__ - Step 23675: {'lr': 0.00047400496534937914, 'samples': 4545600, 'steps': 23674, 'loss/train': 1.6415568590164185} -11/07/2021 00:33:33 - INFO - __main__ - Step 23676: {'lr': 0.00047400260903027283, 'samples': 4545792, 'steps': 23675, 'loss/train': 1.2974762916564941} -11/07/2021 00:33:34 - INFO - __main__ - Step 23677: {'lr': 0.0004740002526102344, 'samples': 4545984, 'steps': 23676, 'loss/train': 1.6875091791152954} -11/07/2021 00:33:34 - INFO - __main__ - Step 23678: {'lr': 0.0004739978960892649, 'samples': 4546176, 'steps': 23677, 'loss/train': 1.305275797843933} -11/07/2021 00:33:35 - INFO - __main__ - Step 23679: {'lr': 0.0004739955394673654, 'samples': 4546368, 'steps': 23678, 'loss/train': 1.652904748916626} -11/07/2021 00:33:35 - INFO - __main__ - Step 23680: {'lr': 0.000473993182744537, 'samples': 4546560, 'steps': 23679, 'loss/train': 1.9933096170425415} -11/07/2021 00:33:35 - INFO - __main__ - Step 23681: {'lr': 0.0004739908259207807, 'samples': 4546752, 'steps': 23680, 'loss/train': 1.8885129690170288} -11/07/2021 00:33:36 - INFO - __main__ - Step 23682: {'lr': 0.00047398846899609755, 'samples': 4546944, 'steps': 23681, 'loss/train': 1.5400047302246094} -11/07/2021 00:33:37 - INFO - __main__ - Step 23683: {'lr': 0.0004739861119704887, 'samples': 4547136, 'steps': 23682, 'loss/train': 0.4810228943824768} -11/07/2021 00:33:37 - INFO - __main__ - Step 23684: {'lr': 0.00047398375484395517, 'samples': 4547328, 'steps': 23683, 'loss/train': 0.52688068151474} -11/07/2021 00:33:38 - INFO - __main__ - Step 23685: {'lr': 0.00047398139761649794, 'samples': 4547520, 'steps': 23684, 'loss/train': 1.4102141857147217} -11/07/2021 00:33:38 - INFO - __main__ - Step 23686: {'lr': 0.00047397904028811824, 'samples': 4547712, 'steps': 23685, 'loss/train': 0.9328953623771667} -11/07/2021 00:33:38 - INFO - __main__ - Step 23687: {'lr': 0.000473976682858817, 'samples': 4547904, 'steps': 23686, 'loss/train': 1.6522045135498047} -11/07/2021 00:33:39 - INFO - __main__ - Step 23688: {'lr': 0.00047397432532859533, 'samples': 4548096, 'steps': 23687, 'loss/train': 1.5263078212738037} -11/07/2021 00:33:40 - INFO - __main__ - Step 23689: {'lr': 0.00047397196769745435, 'samples': 4548288, 'steps': 23688, 'loss/train': 2.3755886554718018} -11/07/2021 00:33:40 - INFO - __main__ - Step 23690: {'lr': 0.00047396960996539495, 'samples': 4548480, 'steps': 23689, 'loss/train': 1.8563801050186157} -11/07/2021 00:33:40 - INFO - __main__ - Step 23691: {'lr': 0.00047396725213241835, 'samples': 4548672, 'steps': 23690, 'loss/train': 1.7212902307510376} -11/07/2021 00:33:41 - INFO - __main__ - Step 23692: {'lr': 0.0004739648941985256, 'samples': 4548864, 'steps': 23691, 'loss/train': 1.688942551612854} -11/07/2021 00:33:42 - INFO - __main__ - Step 23693: {'lr': 0.00047396253616371767, 'samples': 4549056, 'steps': 23692, 'loss/train': 1.251467227935791} -11/07/2021 00:33:42 - INFO - __main__ - Step 23694: {'lr': 0.00047396017802799566, 'samples': 4549248, 'steps': 23693, 'loss/train': 1.5889075994491577} -11/07/2021 00:33:42 - INFO - __main__ - Step 23695: {'lr': 0.0004739578197913607, 'samples': 4549440, 'steps': 23694, 'loss/train': 1.5907773971557617} -11/07/2021 00:33:43 - INFO - __main__ - Step 23696: {'lr': 0.00047395546145381377, 'samples': 4549632, 'steps': 23695, 'loss/train': 1.313461184501648} -11/07/2021 00:33:43 - INFO - __main__ - Step 23697: {'lr': 0.000473953103015356, 'samples': 4549824, 'steps': 23696, 'loss/train': 1.1808024644851685} -11/07/2021 00:33:44 - INFO - __main__ - Step 23698: {'lr': 0.0004739507444759884, 'samples': 4550016, 'steps': 23697, 'loss/train': 2.071528196334839} -11/07/2021 00:33:45 - INFO - __main__ - Step 23699: {'lr': 0.0004739483858357121, 'samples': 4550208, 'steps': 23698, 'loss/train': 1.835963249206543} -11/07/2021 00:33:45 - INFO - __main__ - Step 23700: {'lr': 0.00047394602709452806, 'samples': 4550400, 'steps': 23699, 'loss/train': 0.18768851459026337} -11/07/2021 00:33:45 - INFO - __main__ - Step 23701: {'lr': 0.0004739436682524373, 'samples': 4550592, 'steps': 23700, 'loss/train': 1.2520087957382202} -11/07/2021 00:33:46 - INFO - __main__ - Step 23702: {'lr': 0.00047394130930944115, 'samples': 4550784, 'steps': 23701, 'loss/train': 1.1662386655807495} -11/07/2021 00:33:47 - INFO - __main__ - Step 23703: {'lr': 0.0004739389502655404, 'samples': 4550976, 'steps': 23702, 'loss/train': 1.2932790517807007} -11/07/2021 00:33:47 - INFO - __main__ - Step 23704: {'lr': 0.0004739365911207363, 'samples': 4551168, 'steps': 23703, 'loss/train': 0.9172234535217285} -11/07/2021 00:33:48 - INFO - __main__ - Step 23705: {'lr': 0.0004739342318750297, 'samples': 4551360, 'steps': 23704, 'loss/train': 1.4475271701812744} -11/07/2021 00:33:48 - INFO - __main__ - Step 23706: {'lr': 0.00047393187252842183, 'samples': 4551552, 'steps': 23705, 'loss/train': 1.6185001134872437} -11/07/2021 00:33:48 - INFO - __main__ - Step 23707: {'lr': 0.0004739295130809138, 'samples': 4551744, 'steps': 23706, 'loss/train': 1.2477144002914429} -11/07/2021 00:33:49 - INFO - __main__ - Step 23708: {'lr': 0.0004739271535325065, 'samples': 4551936, 'steps': 23707, 'loss/train': 0.19320560991764069} -11/07/2021 00:33:50 - INFO - __main__ - Step 23709: {'lr': 0.00047392479388320106, 'samples': 4552128, 'steps': 23708, 'loss/train': 1.6384211778640747} -11/07/2021 00:33:50 - INFO - __main__ - Step 23710: {'lr': 0.0004739224341329987, 'samples': 4552320, 'steps': 23709, 'loss/train': 1.2958784103393555} -11/07/2021 00:33:50 - INFO - __main__ - Step 23711: {'lr': 0.0004739200742819002, 'samples': 4552512, 'steps': 23710, 'loss/train': 1.7707363367080688} -11/07/2021 00:33:51 - INFO - __main__ - Step 23712: {'lr': 0.0004739177143299068, 'samples': 4552704, 'steps': 23711, 'loss/train': 1.6255106925964355} -11/07/2021 00:33:52 - INFO - __main__ - Step 23713: {'lr': 0.00047391535427701966, 'samples': 4552896, 'steps': 23712, 'loss/train': 1.129692554473877} -11/07/2021 00:33:52 - INFO - __main__ - Step 23714: {'lr': 0.0004739129941232396, 'samples': 4553088, 'steps': 23713, 'loss/train': 1.1649988889694214} -11/07/2021 00:33:52 - INFO - __main__ - Step 23715: {'lr': 0.0004739106338685678, 'samples': 4553280, 'steps': 23714, 'loss/train': 1.1176279783248901} -11/07/2021 00:33:53 - INFO - __main__ - Step 23716: {'lr': 0.00047390827351300537, 'samples': 4553472, 'steps': 23715, 'loss/train': 1.1965147256851196} -11/07/2021 00:33:53 - INFO - __main__ - Step 23717: {'lr': 0.00047390591305655327, 'samples': 4553664, 'steps': 23716, 'loss/train': 1.4697896242141724} -11/07/2021 00:33:54 - INFO - __main__ - Step 23718: {'lr': 0.0004739035524992127, 'samples': 4553856, 'steps': 23717, 'loss/train': 1.6495895385742188} -11/07/2021 00:33:55 - INFO - __main__ - Step 23719: {'lr': 0.00047390119184098455, 'samples': 4554048, 'steps': 23718, 'loss/train': 1.7443530559539795} -11/07/2021 00:33:55 - INFO - __main__ - Step 23720: {'lr': 0.00047389883108187004, 'samples': 4554240, 'steps': 23719, 'loss/train': 1.670081615447998} -11/07/2021 00:33:55 - INFO - __main__ - Step 23721: {'lr': 0.00047389647022187014, 'samples': 4554432, 'steps': 23720, 'loss/train': 1.5686086416244507} -11/07/2021 00:33:56 - INFO - __main__ - Step 23722: {'lr': 0.000473894109260986, 'samples': 4554624, 'steps': 23721, 'loss/train': 1.5855025053024292} -11/07/2021 00:33:57 - INFO - __main__ - Step 23723: {'lr': 0.00047389174819921856, 'samples': 4554816, 'steps': 23722, 'loss/train': 1.3018687963485718} -11/07/2021 00:33:57 - INFO - __main__ - Step 23724: {'lr': 0.000473889387036569, 'samples': 4555008, 'steps': 23723, 'loss/train': 1.0580642223358154} -11/07/2021 00:33:57 - INFO - __main__ - Step 23725: {'lr': 0.0004738870257730383, 'samples': 4555200, 'steps': 23724, 'loss/train': 1.2072584629058838} -11/07/2021 00:33:58 - INFO - __main__ - Step 23726: {'lr': 0.00047388466440862755, 'samples': 4555392, 'steps': 23725, 'loss/train': 1.599613070487976} -11/07/2021 00:33:58 - INFO - __main__ - Step 23727: {'lr': 0.0004738823029433379, 'samples': 4555584, 'steps': 23726, 'loss/train': 1.6899038553237915} -11/07/2021 00:33:59 - INFO - __main__ - Step 23728: {'lr': 0.0004738799413771703, 'samples': 4555776, 'steps': 23727, 'loss/train': 1.2398737668991089} -11/07/2021 00:33:59 - INFO - __main__ - Step 23729: {'lr': 0.0004738775797101258, 'samples': 4555968, 'steps': 23728, 'loss/train': 1.8582526445388794} -11/07/2021 00:34:00 - INFO - __main__ - Step 23730: {'lr': 0.0004738752179422056, 'samples': 4556160, 'steps': 23729, 'loss/train': 1.6827188730239868} -11/07/2021 00:34:00 - INFO - __main__ - Step 23731: {'lr': 0.00047387285607341064, 'samples': 4556352, 'steps': 23730, 'loss/train': 1.5931893587112427} -11/07/2021 00:34:00 - INFO - __main__ - Step 23732: {'lr': 0.00047387049410374207, 'samples': 4556544, 'steps': 23731, 'loss/train': 1.499029517173767} -11/07/2021 00:34:01 - INFO - __main__ - Step 23733: {'lr': 0.00047386813203320084, 'samples': 4556736, 'steps': 23732, 'loss/train': 1.8736869096755981} -11/07/2021 00:34:02 - INFO - __main__ - Step 23734: {'lr': 0.0004738657698617881, 'samples': 4556928, 'steps': 23733, 'loss/train': 1.6546939611434937} -11/07/2021 00:34:02 - INFO - __main__ - Step 23735: {'lr': 0.00047386340758950494, 'samples': 4557120, 'steps': 23734, 'loss/train': 1.7338857650756836} -11/07/2021 00:34:02 - INFO - __main__ - Step 23736: {'lr': 0.0004738610452163523, 'samples': 4557312, 'steps': 23735, 'loss/train': 0.9500973224639893} -11/07/2021 00:34:03 - INFO - __main__ - Step 23737: {'lr': 0.00047385868274233144, 'samples': 4557504, 'steps': 23736, 'loss/train': 1.6614608764648438} -11/07/2021 00:34:03 - INFO - __main__ - Step 23738: {'lr': 0.0004738563201674432, 'samples': 4557696, 'steps': 23737, 'loss/train': 1.8918787240982056} -11/07/2021 00:34:04 - INFO - __main__ - Step 23739: {'lr': 0.00047385395749168885, 'samples': 4557888, 'steps': 23738, 'loss/train': 0.8991847038269043} -11/07/2021 00:34:04 - INFO - __main__ - Step 23740: {'lr': 0.00047385159471506936, 'samples': 4558080, 'steps': 23739, 'loss/train': 1.4461966753005981} -11/07/2021 00:34:05 - INFO - __main__ - Step 23741: {'lr': 0.00047384923183758573, 'samples': 4558272, 'steps': 23740, 'loss/train': 1.3142222166061401} -11/07/2021 00:34:05 - INFO - __main__ - Step 23742: {'lr': 0.0004738468688592391, 'samples': 4558464, 'steps': 23741, 'loss/train': 1.3879821300506592} -11/07/2021 00:34:05 - INFO - __main__ - Step 23743: {'lr': 0.00047384450578003055, 'samples': 4558656, 'steps': 23742, 'loss/train': 1.8437845706939697} -11/07/2021 00:34:07 - INFO - __main__ - Step 23744: {'lr': 0.00047384214259996117, 'samples': 4558848, 'steps': 23743, 'loss/train': 1.3957382440567017} -11/07/2021 00:34:07 - INFO - __main__ - Step 23745: {'lr': 0.0004738397793190319, 'samples': 4559040, 'steps': 23744, 'loss/train': 1.3842023611068726} -11/07/2021 00:34:07 - INFO - __main__ - Step 23746: {'lr': 0.00047383741593724386, 'samples': 4559232, 'steps': 23745, 'loss/train': 1.6281683444976807} -11/07/2021 00:34:08 - INFO - __main__ - Step 23747: {'lr': 0.0004738350524545982, 'samples': 4559424, 'steps': 23746, 'loss/train': 1.2148529291152954} -11/07/2021 00:34:08 - INFO - __main__ - Step 23748: {'lr': 0.0004738326888710959, 'samples': 4559616, 'steps': 23747, 'loss/train': 1.2071878910064697} -11/07/2021 00:34:09 - INFO - __main__ - Step 23749: {'lr': 0.000473830325186738, 'samples': 4559808, 'steps': 23748, 'loss/train': 1.7111480236053467} -11/07/2021 00:34:09 - INFO - __main__ - Step 23750: {'lr': 0.0004738279614015257, 'samples': 4560000, 'steps': 23749, 'loss/train': 1.5095964670181274} -11/07/2021 00:34:10 - INFO - __main__ - Step 23751: {'lr': 0.0004738255975154599, 'samples': 4560192, 'steps': 23750, 'loss/train': 1.6067538261413574} -11/07/2021 00:34:10 - INFO - __main__ - Step 23752: {'lr': 0.0004738232335285417, 'samples': 4560384, 'steps': 23751, 'loss/train': 1.4667108058929443} -11/07/2021 00:34:10 - INFO - __main__ - Step 23753: {'lr': 0.0004738208694407723, 'samples': 4560576, 'steps': 23752, 'loss/train': 1.8321415185928345} -11/07/2021 00:34:11 - INFO - __main__ - Step 23754: {'lr': 0.00047381850525215265, 'samples': 4560768, 'steps': 23753, 'loss/train': 1.9358234405517578} -11/07/2021 00:34:12 - INFO - __main__ - Step 23755: {'lr': 0.0004738161409626838, 'samples': 4560960, 'steps': 23754, 'loss/train': 1.4177026748657227} -11/07/2021 00:34:13 - INFO - __main__ - Step 23756: {'lr': 0.0004738137765723669, 'samples': 4561152, 'steps': 23755, 'loss/train': 1.2879034280776978} -11/07/2021 00:34:13 - INFO - __main__ - Step 23757: {'lr': 0.0004738114120812029, 'samples': 4561344, 'steps': 23756, 'loss/train': 1.8649377822875977} -11/07/2021 00:34:13 - INFO - __main__ - Step 23758: {'lr': 0.000473809047489193, 'samples': 4561536, 'steps': 23757, 'loss/train': 1.4992769956588745} -11/07/2021 00:34:14 - INFO - __main__ - Step 23759: {'lr': 0.00047380668279633814, 'samples': 4561728, 'steps': 23758, 'loss/train': 1.7122327089309692} -11/07/2021 00:34:15 - INFO - __main__ - Step 23760: {'lr': 0.00047380431800263945, 'samples': 4561920, 'steps': 23759, 'loss/train': 1.4459832906723022} -11/07/2021 00:34:15 - INFO - __main__ - Step 23761: {'lr': 0.000473801953108098, 'samples': 4562112, 'steps': 23760, 'loss/train': 2.1364073753356934} -11/07/2021 00:34:15 - INFO - __main__ - Step 23762: {'lr': 0.0004737995881127149, 'samples': 4562304, 'steps': 23761, 'loss/train': 0.9302211403846741} -11/07/2021 00:34:16 - INFO - __main__ - Step 23763: {'lr': 0.0004737972230164911, 'samples': 4562496, 'steps': 23762, 'loss/train': 1.7650277614593506} -11/07/2021 00:34:16 - INFO - __main__ - Step 23764: {'lr': 0.0004737948578194278, 'samples': 4562688, 'steps': 23763, 'loss/train': 1.2138371467590332} -11/07/2021 00:34:17 - INFO - __main__ - Step 23765: {'lr': 0.00047379249252152585, 'samples': 4562880, 'steps': 23764, 'loss/train': 1.6768308877944946} -11/07/2021 00:34:17 - INFO - __main__ - Step 23766: {'lr': 0.00047379012712278656, 'samples': 4563072, 'steps': 23765, 'loss/train': 1.929826259613037} -11/07/2021 00:34:18 - INFO - __main__ - Step 23767: {'lr': 0.0004737877616232108, 'samples': 4563264, 'steps': 23766, 'loss/train': 1.3135716915130615} -11/07/2021 00:34:18 - INFO - __main__ - Step 23768: {'lr': 0.0004737853960227998, 'samples': 4563456, 'steps': 23767, 'loss/train': 1.617723822593689} -11/07/2021 00:34:18 - INFO - __main__ - Step 23769: {'lr': 0.00047378303032155454, 'samples': 4563648, 'steps': 23768, 'loss/train': 1.3294570446014404} -11/07/2021 00:34:20 - INFO - __main__ - Step 23770: {'lr': 0.0004737806645194761, 'samples': 4563840, 'steps': 23769, 'loss/train': 0.6377082467079163} -11/07/2021 00:34:20 - INFO - __main__ - Step 23771: {'lr': 0.00047377829861656556, 'samples': 4564032, 'steps': 23770, 'loss/train': 0.9689741730690002} -11/07/2021 00:34:20 - INFO - __main__ - Step 23772: {'lr': 0.000473775932612824, 'samples': 4564224, 'steps': 23771, 'loss/train': 1.4321142435073853} -11/07/2021 00:34:21 - INFO - __main__ - Step 23773: {'lr': 0.00047377356650825245, 'samples': 4564416, 'steps': 23772, 'loss/train': 1.3861149549484253} -11/07/2021 00:34:21 - INFO - __main__ - Step 23774: {'lr': 0.00047377120030285194, 'samples': 4564608, 'steps': 23773, 'loss/train': 1.1893134117126465} -11/07/2021 00:34:22 - INFO - __main__ - Step 23775: {'lr': 0.0004737688339966235, 'samples': 4564800, 'steps': 23774, 'loss/train': 1.7470072507858276} -11/07/2021 00:34:22 - INFO - __main__ - Step 23776: {'lr': 0.00047376646758956844, 'samples': 4564992, 'steps': 23775, 'loss/train': 1.2687187194824219} -11/07/2021 00:34:23 - INFO - __main__ - Step 23777: {'lr': 0.00047376410108168756, 'samples': 4565184, 'steps': 23776, 'loss/train': 1.6561030149459839} -11/07/2021 00:34:23 - INFO - __main__ - Step 23778: {'lr': 0.0004737617344729821, 'samples': 4565376, 'steps': 23777, 'loss/train': 1.5290687084197998} -11/07/2021 00:34:23 - INFO - __main__ - Step 23779: {'lr': 0.00047375936776345297, 'samples': 4565568, 'steps': 23778, 'loss/train': 1.043493390083313} -11/07/2021 00:34:24 - INFO - __main__ - Step 23780: {'lr': 0.00047375700095310136, 'samples': 4565760, 'steps': 23779, 'loss/train': 1.7410577535629272} -11/07/2021 00:34:25 - INFO - __main__ - Step 23781: {'lr': 0.0004737546340419283, 'samples': 4565952, 'steps': 23780, 'loss/train': 1.6509655714035034} -11/07/2021 00:34:25 - INFO - __main__ - Step 23782: {'lr': 0.0004737522670299349, 'samples': 4566144, 'steps': 23781, 'loss/train': 1.9898253679275513} -11/07/2021 00:34:25 - INFO - __main__ - Step 23783: {'lr': 0.00047374989991712214, 'samples': 4566336, 'steps': 23782, 'loss/train': 1.4818731546401978} -11/07/2021 00:34:26 - INFO - __main__ - Step 23784: {'lr': 0.00047374753270349113, 'samples': 4566528, 'steps': 23783, 'loss/train': 1.6137040853500366} -11/07/2021 00:34:27 - INFO - __main__ - Step 23785: {'lr': 0.00047374516538904287, 'samples': 4566720, 'steps': 23784, 'loss/train': 1.2234424352645874} -11/07/2021 00:34:27 - INFO - __main__ - Step 23786: {'lr': 0.0004737427979737786, 'samples': 4566912, 'steps': 23785, 'loss/train': 1.9149585962295532} -11/07/2021 00:34:28 - INFO - __main__ - Step 23787: {'lr': 0.0004737404304576992, 'samples': 4567104, 'steps': 23786, 'loss/train': 1.2945975065231323} -11/07/2021 00:34:28 - INFO - __main__ - Step 23788: {'lr': 0.0004737380628408059, 'samples': 4567296, 'steps': 23787, 'loss/train': 1.7185180187225342} -11/07/2021 00:34:28 - INFO - __main__ - Step 23789: {'lr': 0.00047373569512309963, 'samples': 4567488, 'steps': 23788, 'loss/train': 1.5824964046478271} -11/07/2021 00:34:30 - INFO - __main__ - Step 23790: {'lr': 0.0004737333273045815, 'samples': 4567680, 'steps': 23789, 'loss/train': 0.2642037570476532} -11/07/2021 00:34:30 - INFO - __main__ - Step 23791: {'lr': 0.00047373095938525256, 'samples': 4567872, 'steps': 23790, 'loss/train': 1.5035150051116943} -11/07/2021 00:34:30 - INFO - __main__ - Step 23792: {'lr': 0.0004737285913651139, 'samples': 4568064, 'steps': 23791, 'loss/train': 1.7068278789520264} -11/07/2021 00:34:31 - INFO - __main__ - Step 23793: {'lr': 0.0004737262232441667, 'samples': 4568256, 'steps': 23792, 'loss/train': 0.1296090930700302} -11/07/2021 00:34:31 - INFO - __main__ - Step 23794: {'lr': 0.00047372385502241176, 'samples': 4568448, 'steps': 23793, 'loss/train': 1.8227049112319946} -11/07/2021 00:34:31 - INFO - __main__ - Step 23795: {'lr': 0.0004737214866998504, 'samples': 4568640, 'steps': 23794, 'loss/train': 1.3710237741470337} -11/07/2021 00:34:32 - INFO - __main__ - Step 23796: {'lr': 0.0004737191182764836, 'samples': 4568832, 'steps': 23795, 'loss/train': 1.4633216857910156} -11/07/2021 00:34:33 - INFO - __main__ - Step 23797: {'lr': 0.0004737167497523124, 'samples': 4569024, 'steps': 23796, 'loss/train': 2.038269281387329} -11/07/2021 00:34:33 - INFO - __main__ - Step 23798: {'lr': 0.0004737143811273379, 'samples': 4569216, 'steps': 23797, 'loss/train': 1.8234018087387085} -11/07/2021 00:34:33 - INFO - __main__ - Step 23799: {'lr': 0.0004737120124015611, 'samples': 4569408, 'steps': 23798, 'loss/train': 1.5387424230575562} -11/07/2021 00:34:34 - INFO - __main__ - Step 23800: {'lr': 0.00047370964357498313, 'samples': 4569600, 'steps': 23799, 'loss/train': 1.482106328010559} -11/07/2021 00:34:35 - INFO - __main__ - Step 23801: {'lr': 0.0004737072746476051, 'samples': 4569792, 'steps': 23800, 'loss/train': 1.0635290145874023} -11/07/2021 00:34:35 - INFO - __main__ - Step 23802: {'lr': 0.00047370490561942795, 'samples': 4569984, 'steps': 23801, 'loss/train': 1.1702690124511719} -11/07/2021 00:34:36 - INFO - __main__ - Step 23803: {'lr': 0.00047370253649045286, 'samples': 4570176, 'steps': 23802, 'loss/train': 1.4020882844924927} -11/07/2021 00:34:36 - INFO - __main__ - Step 23804: {'lr': 0.00047370016726068086, 'samples': 4570368, 'steps': 23803, 'loss/train': 2.384243965148926} -11/07/2021 00:34:36 - INFO - __main__ - Step 23805: {'lr': 0.000473697797930113, 'samples': 4570560, 'steps': 23804, 'loss/train': 1.7264128923416138} -11/07/2021 00:34:37 - INFO - __main__ - Step 23806: {'lr': 0.00047369542849875037, 'samples': 4570752, 'steps': 23805, 'loss/train': 1.715357780456543} -11/07/2021 00:34:38 - INFO - __main__ - Step 23807: {'lr': 0.0004736930589665941, 'samples': 4570944, 'steps': 23806, 'loss/train': 1.3189862966537476} -11/07/2021 00:34:38 - INFO - __main__ - Step 23808: {'lr': 0.0004736906893336451, 'samples': 4571136, 'steps': 23807, 'loss/train': 1.9343082904815674} -11/07/2021 00:34:38 - INFO - __main__ - Step 23809: {'lr': 0.00047368831959990453, 'samples': 4571328, 'steps': 23808, 'loss/train': 1.5713011026382446} -11/07/2021 00:34:39 - INFO - __main__ - Step 23810: {'lr': 0.0004736859497653735, 'samples': 4571520, 'steps': 23809, 'loss/train': 0.9398396611213684} -11/07/2021 00:34:39 - INFO - __main__ - Step 23811: {'lr': 0.0004736835798300531, 'samples': 4571712, 'steps': 23810, 'loss/train': 1.7095924615859985} -11/07/2021 00:34:40 - INFO - __main__ - Step 23812: {'lr': 0.00047368120979394415, 'samples': 4571904, 'steps': 23811, 'loss/train': 2.351248264312744} -11/07/2021 00:34:40 - INFO - __main__ - Step 23813: {'lr': 0.000473678839657048, 'samples': 4572096, 'steps': 23812, 'loss/train': 1.5410054922103882} -11/07/2021 00:34:41 - INFO - __main__ - Step 23814: {'lr': 0.0004736764694193656, 'samples': 4572288, 'steps': 23813, 'loss/train': 0.9509553909301758} -11/07/2021 00:34:41 - INFO - __main__ - Step 23815: {'lr': 0.0004736740990808981, 'samples': 4572480, 'steps': 23814, 'loss/train': 1.646188497543335} -11/07/2021 00:34:42 - INFO - __main__ - Step 23816: {'lr': 0.0004736717286416464, 'samples': 4572672, 'steps': 23815, 'loss/train': 1.1700364351272583} -11/07/2021 00:34:43 - INFO - __main__ - Step 23817: {'lr': 0.0004736693581016117, 'samples': 4572864, 'steps': 23816, 'loss/train': 1.0271397829055786} -11/07/2021 00:34:43 - INFO - __main__ - Step 23818: {'lr': 0.00047366698746079507, 'samples': 4573056, 'steps': 23817, 'loss/train': 1.5787421464920044} -11/07/2021 00:34:43 - INFO - __main__ - Step 23819: {'lr': 0.0004736646167191975, 'samples': 4573248, 'steps': 23818, 'loss/train': 1.5957248210906982} -11/07/2021 00:34:44 - INFO - __main__ - Step 23820: {'lr': 0.00047366224587682017, 'samples': 4573440, 'steps': 23819, 'loss/train': 0.7363741993904114} -11/07/2021 00:34:44 - INFO - __main__ - Step 23821: {'lr': 0.000473659874933664, 'samples': 4573632, 'steps': 23820, 'loss/train': 2.0048911571502686} -11/07/2021 00:34:45 - INFO - __main__ - Step 23822: {'lr': 0.0004736575038897303, 'samples': 4573824, 'steps': 23821, 'loss/train': 1.1328240633010864} -11/07/2021 00:34:45 - INFO - __main__ - Step 23823: {'lr': 0.0004736551327450198, 'samples': 4574016, 'steps': 23822, 'loss/train': 1.430214285850525} -11/07/2021 00:34:46 - INFO - __main__ - Step 23824: {'lr': 0.00047365276149953387, 'samples': 4574208, 'steps': 23823, 'loss/train': 1.3258752822875977} -11/07/2021 00:34:46 - INFO - __main__ - Step 23825: {'lr': 0.0004736503901532734, 'samples': 4574400, 'steps': 23824, 'loss/train': 2.036221504211426} -11/07/2021 00:34:47 - INFO - __main__ - Step 23826: {'lr': 0.00047364801870623954, 'samples': 4574592, 'steps': 23825, 'loss/train': 1.6998757123947144} -11/07/2021 00:34:48 - INFO - __main__ - Step 23827: {'lr': 0.00047364564715843326, 'samples': 4574784, 'steps': 23826, 'loss/train': 1.7433280944824219} -11/07/2021 00:34:48 - INFO - __main__ - Step 23828: {'lr': 0.00047364327550985575, 'samples': 4574976, 'steps': 23827, 'loss/train': 1.8414788246154785} -11/07/2021 00:34:48 - INFO - __main__ - Step 23829: {'lr': 0.00047364090376050805, 'samples': 4575168, 'steps': 23828, 'loss/train': 1.4711476564407349} -11/07/2021 00:34:49 - INFO - __main__ - Step 23830: {'lr': 0.0004736385319103912, 'samples': 4575360, 'steps': 23829, 'loss/train': 0.9364742636680603} -11/07/2021 00:34:49 - INFO - __main__ - Step 23831: {'lr': 0.00047363615995950624, 'samples': 4575552, 'steps': 23830, 'loss/train': 1.699023723602295} -11/07/2021 00:34:50 - INFO - __main__ - Step 23832: {'lr': 0.0004736337879078544, 'samples': 4575744, 'steps': 23831, 'loss/train': 1.367179036140442} -11/07/2021 00:34:50 - INFO - __main__ - Step 23833: {'lr': 0.0004736314157554365, 'samples': 4575936, 'steps': 23832, 'loss/train': 2.1259796619415283} -11/07/2021 00:34:51 - INFO - __main__ - Step 23834: {'lr': 0.00047362904350225376, 'samples': 4576128, 'steps': 23833, 'loss/train': 0.8249647617340088} -11/07/2021 00:34:51 - INFO - __main__ - Step 23835: {'lr': 0.0004736266711483073, 'samples': 4576320, 'steps': 23834, 'loss/train': 1.670304536819458} -11/07/2021 00:34:52 - INFO - __main__ - Step 23836: {'lr': 0.00047362429869359803, 'samples': 4576512, 'steps': 23835, 'loss/train': 1.1619794368743896} -11/07/2021 00:34:53 - INFO - __main__ - Step 23837: {'lr': 0.0004736219261381271, 'samples': 4576704, 'steps': 23836, 'loss/train': 1.7294654846191406} -11/07/2021 00:34:53 - INFO - __main__ - Step 23838: {'lr': 0.0004736195534818956, 'samples': 4576896, 'steps': 23837, 'loss/train': 1.4316507577896118} -11/07/2021 00:34:53 - INFO - __main__ - Step 23839: {'lr': 0.00047361718072490457, 'samples': 4577088, 'steps': 23838, 'loss/train': 1.2505590915679932} -11/07/2021 00:34:54 - INFO - __main__ - Step 23840: {'lr': 0.00047361480786715514, 'samples': 4577280, 'steps': 23839, 'loss/train': 1.3018585443496704} -11/07/2021 00:34:54 - INFO - __main__ - Step 23841: {'lr': 0.00047361243490864826, 'samples': 4577472, 'steps': 23840, 'loss/train': 0.14377540349960327} -11/07/2021 00:34:54 - INFO - __main__ - Step 23842: {'lr': 0.00047361006184938517, 'samples': 4577664, 'steps': 23841, 'loss/train': 4.133652687072754} -11/07/2021 00:34:55 - INFO - __main__ - Step 23843: {'lr': 0.00047360768868936673, 'samples': 4577856, 'steps': 23842, 'loss/train': 1.427064299583435} -11/07/2021 00:34:56 - INFO - __main__ - Step 23844: {'lr': 0.00047360531542859415, 'samples': 4578048, 'steps': 23843, 'loss/train': 1.4833950996398926} -11/07/2021 00:34:56 - INFO - __main__ - Step 23845: {'lr': 0.00047360294206706845, 'samples': 4578240, 'steps': 23844, 'loss/train': 1.6829880475997925} -11/07/2021 00:34:56 - INFO - __main__ - Step 23846: {'lr': 0.0004736005686047907, 'samples': 4578432, 'steps': 23845, 'loss/train': 1.974252462387085} -11/07/2021 00:34:57 - INFO - __main__ - Step 23847: {'lr': 0.000473598195041762, 'samples': 4578624, 'steps': 23846, 'loss/train': 1.9925411939620972} -11/07/2021 00:34:58 - INFO - __main__ - Step 23848: {'lr': 0.0004735958213779835, 'samples': 4578816, 'steps': 23847, 'loss/train': 1.678208351135254} -11/07/2021 00:34:58 - INFO - __main__ - Step 23849: {'lr': 0.0004735934476134561, 'samples': 4579008, 'steps': 23848, 'loss/train': 2.162973165512085} -11/07/2021 00:34:59 - INFO - __main__ - Step 23850: {'lr': 0.0004735910737481809, 'samples': 4579200, 'steps': 23849, 'loss/train': 1.549644112586975} -11/07/2021 00:34:59 - INFO - __main__ - Step 23851: {'lr': 0.0004735886997821591, 'samples': 4579392, 'steps': 23850, 'loss/train': 1.391912579536438} -11/07/2021 00:34:59 - INFO - __main__ - Step 23852: {'lr': 0.00047358632571539163, 'samples': 4579584, 'steps': 23851, 'loss/train': 1.26926851272583} -11/07/2021 00:35:00 - INFO - __main__ - Step 23853: {'lr': 0.0004735839515478796, 'samples': 4579776, 'steps': 23852, 'loss/train': 1.931373119354248} -11/07/2021 00:35:01 - INFO - __main__ - Step 23854: {'lr': 0.0004735815772796241, 'samples': 4579968, 'steps': 23853, 'loss/train': 1.3470486402511597} -11/07/2021 00:35:01 - INFO - __main__ - Step 23855: {'lr': 0.0004735792029106262, 'samples': 4580160, 'steps': 23854, 'loss/train': 1.512963056564331} -11/07/2021 00:35:01 - INFO - __main__ - Step 23856: {'lr': 0.0004735768284408869, 'samples': 4580352, 'steps': 23855, 'loss/train': 1.0526634454727173} -11/07/2021 00:35:02 - INFO - __main__ - Step 23857: {'lr': 0.00047357445387040745, 'samples': 4580544, 'steps': 23856, 'loss/train': 1.524977445602417} -11/07/2021 00:35:03 - INFO - __main__ - Step 23858: {'lr': 0.0004735720791991887, 'samples': 4580736, 'steps': 23857, 'loss/train': 1.551909327507019} -11/07/2021 00:35:03 - INFO - __main__ - Step 23859: {'lr': 0.00047356970442723184, 'samples': 4580928, 'steps': 23858, 'loss/train': 1.7394713163375854} -11/07/2021 00:35:03 - INFO - __main__ - Step 23860: {'lr': 0.00047356732955453794, 'samples': 4581120, 'steps': 23859, 'loss/train': 2.184431791305542} -11/07/2021 00:35:04 - INFO - __main__ - Step 23861: {'lr': 0.00047356495458110806, 'samples': 4581312, 'steps': 23860, 'loss/train': 1.451634168624878} -11/07/2021 00:35:04 - INFO - __main__ - Step 23862: {'lr': 0.00047356257950694326, 'samples': 4581504, 'steps': 23861, 'loss/train': 1.7785993814468384} -11/07/2021 00:35:05 - INFO - __main__ - Step 23863: {'lr': 0.0004735602043320446, 'samples': 4581696, 'steps': 23862, 'loss/train': 1.1716285943984985} -11/07/2021 00:35:06 - INFO - __main__ - Step 23864: {'lr': 0.0004735578290564132, 'samples': 4581888, 'steps': 23863, 'loss/train': 1.9256266355514526} -11/07/2021 00:35:06 - INFO - __main__ - Step 23865: {'lr': 0.00047355545368005003, 'samples': 4582080, 'steps': 23864, 'loss/train': 1.585779070854187} -11/07/2021 00:35:06 - INFO - __main__ - Step 23866: {'lr': 0.00047355307820295625, 'samples': 4582272, 'steps': 23865, 'loss/train': 1.762752890586853} -11/07/2021 00:35:07 - INFO - __main__ - Step 23867: {'lr': 0.00047355070262513287, 'samples': 4582464, 'steps': 23866, 'loss/train': 1.9047404527664185} -11/07/2021 00:35:08 - INFO - __main__ - Step 23868: {'lr': 0.00047354832694658104, 'samples': 4582656, 'steps': 23867, 'loss/train': 2.1007673740386963} -11/07/2021 00:35:08 - INFO - __main__ - Step 23869: {'lr': 0.0004735459511673018, 'samples': 4582848, 'steps': 23868, 'loss/train': 1.7195255756378174} -11/07/2021 00:35:08 - INFO - __main__ - Step 23870: {'lr': 0.0004735435752872962, 'samples': 4583040, 'steps': 23869, 'loss/train': 1.8624155521392822} -11/07/2021 00:35:09 - INFO - __main__ - Step 23871: {'lr': 0.00047354119930656524, 'samples': 4583232, 'steps': 23870, 'loss/train': 1.7606174945831299} -11/07/2021 00:35:09 - INFO - __main__ - Step 23872: {'lr': 0.0004735388232251101, 'samples': 4583424, 'steps': 23871, 'loss/train': 1.514115333557129} -11/07/2021 00:35:10 - INFO - __main__ - Step 23873: {'lr': 0.00047353644704293185, 'samples': 4583616, 'steps': 23872, 'loss/train': 1.6635241508483887} -11/07/2021 00:35:10 - INFO - __main__ - Step 23874: {'lr': 0.0004735340707600315, 'samples': 4583808, 'steps': 23873, 'loss/train': 1.2399150133132935} -11/07/2021 00:35:11 - INFO - __main__ - Step 23875: {'lr': 0.0004735316943764102, 'samples': 4584000, 'steps': 23874, 'loss/train': 1.478752851486206} -11/07/2021 00:35:11 - INFO - __main__ - Step 23876: {'lr': 0.0004735293178920689, 'samples': 4584192, 'steps': 23875, 'loss/train': 1.7473831176757812} -11/07/2021 00:35:11 - INFO - __main__ - Step 23877: {'lr': 0.00047352694130700873, 'samples': 4584384, 'steps': 23876, 'loss/train': 1.5420238971710205} -11/07/2021 00:35:12 - INFO - __main__ - Step 23878: {'lr': 0.00047352456462123086, 'samples': 4584576, 'steps': 23877, 'loss/train': 1.2136842012405396} -11/07/2021 00:35:13 - INFO - __main__ - Step 23879: {'lr': 0.00047352218783473614, 'samples': 4584768, 'steps': 23878, 'loss/train': 1.6738272905349731} -11/07/2021 00:35:13 - INFO - __main__ - Step 23880: {'lr': 0.0004735198109475258, 'samples': 4584960, 'steps': 23879, 'loss/train': 1.5064436197280884} -11/07/2021 00:35:14 - INFO - __main__ - Step 23881: {'lr': 0.000473517433959601, 'samples': 4585152, 'steps': 23880, 'loss/train': 2.9225754737854004} -11/07/2021 00:35:14 - INFO - __main__ - Step 23882: {'lr': 0.00047351505687096257, 'samples': 4585344, 'steps': 23881, 'loss/train': 1.5504294633865356} -11/07/2021 00:35:14 - INFO - __main__ - Step 23883: {'lr': 0.00047351267968161176, 'samples': 4585536, 'steps': 23882, 'loss/train': 1.7049568891525269} -11/07/2021 00:35:15 - INFO - __main__ - Step 23884: {'lr': 0.0004735103023915496, 'samples': 4585728, 'steps': 23883, 'loss/train': 1.40176260471344} -11/07/2021 00:35:16 - INFO - __main__ - Step 23885: {'lr': 0.0004735079250007771, 'samples': 4585920, 'steps': 23884, 'loss/train': 1.1555250883102417} -11/07/2021 00:35:16 - INFO - __main__ - Step 23886: {'lr': 0.00047350554750929543, 'samples': 4586112, 'steps': 23885, 'loss/train': 1.702562689781189} -11/07/2021 00:35:16 - INFO - __main__ - Step 23887: {'lr': 0.0004735031699171055, 'samples': 4586304, 'steps': 23886, 'loss/train': 1.0130150318145752} -11/07/2021 00:35:17 - INFO - __main__ - Step 23888: {'lr': 0.0004735007922242086, 'samples': 4586496, 'steps': 23887, 'loss/train': 2.6597204208374023} -11/07/2021 00:35:18 - INFO - __main__ - Step 23889: {'lr': 0.0004734984144306057, 'samples': 4586688, 'steps': 23888, 'loss/train': 1.794775128364563} -11/07/2021 00:35:18 - INFO - __main__ - Step 23890: {'lr': 0.0004734960365362978, 'samples': 4586880, 'steps': 23889, 'loss/train': 1.3223886489868164} -11/07/2021 00:35:19 - INFO - __main__ - Step 23891: {'lr': 0.0004734936585412861, 'samples': 4587072, 'steps': 23890, 'loss/train': 1.6438193321228027} -11/07/2021 00:35:19 - INFO - __main__ - Step 23892: {'lr': 0.00047349128044557153, 'samples': 4587264, 'steps': 23891, 'loss/train': 1.682618498802185} -11/07/2021 00:35:19 - INFO - __main__ - Step 23893: {'lr': 0.0004734889022491553, 'samples': 4587456, 'steps': 23892, 'loss/train': 1.850300669670105} -11/07/2021 00:35:20 - INFO - __main__ - Step 23894: {'lr': 0.0004734865239520384, 'samples': 4587648, 'steps': 23893, 'loss/train': 1.6257259845733643} -11/07/2021 00:35:21 - INFO - __main__ - Step 23895: {'lr': 0.0004734841455542219, 'samples': 4587840, 'steps': 23894, 'loss/train': 0.8706209659576416} -11/07/2021 00:35:21 - INFO - __main__ - Step 23896: {'lr': 0.0004734817670557069, 'samples': 4588032, 'steps': 23895, 'loss/train': 1.325243353843689} -11/07/2021 00:35:21 - INFO - __main__ - Step 23897: {'lr': 0.00047347938845649447, 'samples': 4588224, 'steps': 23896, 'loss/train': 1.8135654926300049} -11/07/2021 00:35:22 - INFO - __main__ - Step 23898: {'lr': 0.0004734770097565857, 'samples': 4588416, 'steps': 23897, 'loss/train': 1.6204172372817993} -11/07/2021 00:35:23 - INFO - __main__ - Step 23899: {'lr': 0.00047347463095598157, 'samples': 4588608, 'steps': 23898, 'loss/train': 1.4633369445800781} -11/07/2021 00:35:23 - INFO - __main__ - Step 23900: {'lr': 0.00047347225205468323, 'samples': 4588800, 'steps': 23899, 'loss/train': 1.0516488552093506} -11/07/2021 00:35:23 - INFO - __main__ - Step 23901: {'lr': 0.00047346987305269184, 'samples': 4588992, 'steps': 23900, 'loss/train': 1.8633294105529785} -11/07/2021 00:35:24 - INFO - __main__ - Step 23902: {'lr': 0.0004734674939500083, 'samples': 4589184, 'steps': 23901, 'loss/train': 1.2833586931228638} -11/07/2021 00:35:24 - INFO - __main__ - Step 23903: {'lr': 0.0004734651147466338, 'samples': 4589376, 'steps': 23902, 'loss/train': 0.12630239129066467} -11/07/2021 00:35:25 - INFO - __main__ - Step 23904: {'lr': 0.00047346273544256927, 'samples': 4589568, 'steps': 23903, 'loss/train': 1.9274121522903442} -11/07/2021 00:35:26 - INFO - __main__ - Step 23905: {'lr': 0.00047346035603781597, 'samples': 4589760, 'steps': 23904, 'loss/train': 1.7911525964736938} -11/07/2021 00:35:26 - INFO - __main__ - Step 23906: {'lr': 0.00047345797653237486, 'samples': 4589952, 'steps': 23905, 'loss/train': 1.6518858671188354} -11/07/2021 00:35:26 - INFO - __main__ - Step 23907: {'lr': 0.000473455596926247, 'samples': 4590144, 'steps': 23906, 'loss/train': 1.787940502166748} -11/07/2021 00:35:27 - INFO - __main__ - Step 23908: {'lr': 0.0004734532172194335, 'samples': 4590336, 'steps': 23907, 'loss/train': 1.4603474140167236} -11/07/2021 00:35:27 - INFO - __main__ - Step 23909: {'lr': 0.0004734508374119355, 'samples': 4590528, 'steps': 23908, 'loss/train': 1.3073455095291138} -11/07/2021 00:35:28 - INFO - __main__ - Step 23910: {'lr': 0.0004734484575037539, 'samples': 4590720, 'steps': 23909, 'loss/train': 1.4078184366226196} -11/07/2021 00:35:29 - INFO - __main__ - Step 23911: {'lr': 0.00047344607749489, 'samples': 4590912, 'steps': 23910, 'loss/train': 1.5765531063079834} -11/07/2021 00:35:29 - INFO - __main__ - Step 23912: {'lr': 0.00047344369738534466, 'samples': 4591104, 'steps': 23911, 'loss/train': 1.2944846153259277} -11/07/2021 00:35:29 - INFO - __main__ - Step 23913: {'lr': 0.000473441317175119, 'samples': 4591296, 'steps': 23912, 'loss/train': 1.6884845495224} -11/07/2021 00:35:30 - INFO - __main__ - Step 23914: {'lr': 0.0004734389368642142, 'samples': 4591488, 'steps': 23913, 'loss/train': 1.1201519966125488} -11/07/2021 00:35:31 - INFO - __main__ - Step 23915: {'lr': 0.0004734365564526313, 'samples': 4591680, 'steps': 23914, 'loss/train': 1.8650660514831543} -11/07/2021 00:35:31 - INFO - __main__ - Step 23916: {'lr': 0.00047343417594037117, 'samples': 4591872, 'steps': 23915, 'loss/train': 1.3060716390609741} -11/07/2021 00:35:31 - INFO - __main__ - Step 23917: {'lr': 0.00047343179532743516, 'samples': 4592064, 'steps': 23916, 'loss/train': 1.5598535537719727} -11/07/2021 00:35:32 - INFO - __main__ - Step 23918: {'lr': 0.00047342941461382427, 'samples': 4592256, 'steps': 23917, 'loss/train': 1.4983863830566406} -11/07/2021 00:35:32 - INFO - __main__ - Step 23919: {'lr': 0.0004734270337995395, 'samples': 4592448, 'steps': 23918, 'loss/train': 1.1809464693069458} -11/07/2021 00:35:35 - INFO - __main__ - Step 23920: {'lr': 0.0004734246528845819, 'samples': 4592640, 'steps': 23919, 'loss/train': 0.9813411235809326} -11/07/2021 00:35:35 - INFO - __main__ - Step 23921: {'lr': 0.0004734222718689527, 'samples': 4592832, 'steps': 23920, 'loss/train': 2.3573687076568604} -11/07/2021 00:35:35 - INFO - __main__ - Step 23922: {'lr': 0.0004734198907526528, 'samples': 4593024, 'steps': 23921, 'loss/train': 1.912838101387024} -11/07/2021 00:35:36 - INFO - __main__ - Step 23923: {'lr': 0.00047341750953568335, 'samples': 4593216, 'steps': 23922, 'loss/train': 1.816469430923462} -11/07/2021 00:35:36 - INFO - __main__ - Step 23924: {'lr': 0.0004734151282180454, 'samples': 4593408, 'steps': 23923, 'loss/train': 1.8191454410552979} -11/07/2021 00:35:36 - INFO - __main__ - Step 23925: {'lr': 0.0004734127467997401, 'samples': 4593600, 'steps': 23924, 'loss/train': 1.0661303997039795} -11/07/2021 00:35:37 - INFO - __main__ - Step 23926: {'lr': 0.0004734103652807684, 'samples': 4593792, 'steps': 23925, 'loss/train': 1.6279600858688354} -11/07/2021 00:35:38 - INFO - __main__ - Step 23927: {'lr': 0.0004734079836611315, 'samples': 4593984, 'steps': 23926, 'loss/train': 1.4247660636901855} -11/07/2021 00:35:38 - INFO - __main__ - Step 23928: {'lr': 0.0004734056019408304, 'samples': 4594176, 'steps': 23927, 'loss/train': 1.551518201828003} -11/07/2021 00:35:38 - INFO - __main__ - Step 23929: {'lr': 0.00047340322011986614, 'samples': 4594368, 'steps': 23928, 'loss/train': 1.5285148620605469} -11/07/2021 00:35:39 - INFO - __main__ - Step 23930: {'lr': 0.0004734008381982399, 'samples': 4594560, 'steps': 23929, 'loss/train': 1.452463150024414} -11/07/2021 00:35:39 - INFO - __main__ - Step 23931: {'lr': 0.0004733984561759527, 'samples': 4594752, 'steps': 23930, 'loss/train': 1.7026846408843994} -11/07/2021 00:35:39 - INFO - __main__ - Step 23932: {'lr': 0.0004733960740530055, 'samples': 4594944, 'steps': 23931, 'loss/train': 1.6613857746124268} -11/07/2021 00:35:40 - INFO - __main__ - Step 23933: {'lr': 0.0004733936918293995, 'samples': 4595136, 'steps': 23932, 'loss/train': 1.6048064231872559} -11/07/2021 00:35:41 - INFO - __main__ - Step 23934: {'lr': 0.0004733913095051358, 'samples': 4595328, 'steps': 23933, 'loss/train': 1.8170708417892456} -11/07/2021 00:35:41 - INFO - __main__ - Step 23935: {'lr': 0.0004733889270802154, 'samples': 4595520, 'steps': 23934, 'loss/train': 1.6382811069488525} -11/07/2021 00:35:41 - INFO - __main__ - Step 23936: {'lr': 0.00047338654455463935, 'samples': 4595712, 'steps': 23935, 'loss/train': 1.4931180477142334} -11/07/2021 00:35:42 - INFO - __main__ - Step 23937: {'lr': 0.00047338416192840887, 'samples': 4595904, 'steps': 23936, 'loss/train': 1.7660572528839111} -11/07/2021 00:35:43 - INFO - __main__ - Step 23938: {'lr': 0.0004733817792015249, 'samples': 4596096, 'steps': 23937, 'loss/train': 1.0775352716445923} -11/07/2021 00:35:43 - INFO - __main__ - Step 23939: {'lr': 0.00047337939637398855, 'samples': 4596288, 'steps': 23938, 'loss/train': 1.5399011373519897} -11/07/2021 00:35:43 - INFO - __main__ - Step 23940: {'lr': 0.0004733770134458009, 'samples': 4596480, 'steps': 23939, 'loss/train': 1.5492165088653564} -11/07/2021 00:35:44 - INFO - __main__ - Step 23941: {'lr': 0.0004733746304169629, 'samples': 4596672, 'steps': 23940, 'loss/train': 1.623695731163025} -11/07/2021 00:35:44 - INFO - __main__ - Step 23942: {'lr': 0.0004733722472874759, 'samples': 4596864, 'steps': 23941, 'loss/train': 1.8950859308242798} -11/07/2021 00:35:46 - INFO - __main__ - Step 23943: {'lr': 0.0004733698640573407, 'samples': 4597056, 'steps': 23942, 'loss/train': 1.560842752456665} -11/07/2021 00:35:46 - INFO - __main__ - Step 23944: {'lr': 0.0004733674807265585, 'samples': 4597248, 'steps': 23943, 'loss/train': 0.23782792687416077} -11/07/2021 00:35:46 - INFO - __main__ - Step 23945: {'lr': 0.0004733650972951304, 'samples': 4597440, 'steps': 23944, 'loss/train': 1.5143749713897705} -11/07/2021 00:35:47 - INFO - __main__ - Step 23946: {'lr': 0.0004733627137630574, 'samples': 4597632, 'steps': 23945, 'loss/train': 2.1152851581573486} -11/07/2021 00:35:47 - INFO - __main__ - Step 23947: {'lr': 0.00047336033013034063, 'samples': 4597824, 'steps': 23946, 'loss/train': 1.6347516775131226} -11/07/2021 00:35:48 - INFO - __main__ - Step 23948: {'lr': 0.00047335794639698117, 'samples': 4598016, 'steps': 23947, 'loss/train': 1.3954161405563354} -11/07/2021 00:35:48 - INFO - __main__ - Step 23949: {'lr': 0.00047335556256298, 'samples': 4598208, 'steps': 23948, 'loss/train': 1.6793127059936523} -11/07/2021 00:35:49 - INFO - __main__ - Step 23950: {'lr': 0.0004733531786283383, 'samples': 4598400, 'steps': 23949, 'loss/train': 1.897346019744873} -11/07/2021 00:35:49 - INFO - __main__ - Step 23951: {'lr': 0.0004733507945930571, 'samples': 4598592, 'steps': 23950, 'loss/train': 1.4155480861663818} -11/07/2021 00:35:49 - INFO - __main__ - Step 23952: {'lr': 0.0004733484104571375, 'samples': 4598784, 'steps': 23951, 'loss/train': 1.4704738855361938} -11/07/2021 00:35:50 - INFO - __main__ - Step 23953: {'lr': 0.0004733460262205805, 'samples': 4598976, 'steps': 23952, 'loss/train': 1.1455572843551636} -11/07/2021 00:35:51 - INFO - __main__ - Step 23954: {'lr': 0.00047334364188338725, 'samples': 4599168, 'steps': 23953, 'loss/train': 1.7158654928207397} -11/07/2021 00:35:51 - INFO - __main__ - Step 23955: {'lr': 0.0004733412574455588, 'samples': 4599360, 'steps': 23954, 'loss/train': 1.5433906316757202} -11/07/2021 00:35:51 - INFO - __main__ - Step 23956: {'lr': 0.00047333887290709623, 'samples': 4599552, 'steps': 23955, 'loss/train': 1.0119457244873047} -11/07/2021 00:35:52 - INFO - __main__ - Step 23957: {'lr': 0.00047333648826800056, 'samples': 4599744, 'steps': 23956, 'loss/train': 1.6177657842636108} -11/07/2021 00:35:53 - INFO - __main__ - Step 23958: {'lr': 0.000473334103528273, 'samples': 4599936, 'steps': 23957, 'loss/train': 1.7731554508209229} -11/07/2021 00:35:53 - INFO - __main__ - Step 23959: {'lr': 0.00047333171868791453, 'samples': 4600128, 'steps': 23958, 'loss/train': 1.7867491245269775} -11/07/2021 00:35:53 - INFO - __main__ - Step 23960: {'lr': 0.00047332933374692623, 'samples': 4600320, 'steps': 23959, 'loss/train': 1.0234673023223877} -11/07/2021 00:35:54 - INFO - __main__ - Step 23961: {'lr': 0.0004733269487053091, 'samples': 4600512, 'steps': 23960, 'loss/train': 1.6259523630142212} -11/07/2021 00:35:54 - INFO - __main__ - Step 23962: {'lr': 0.0004733245635630644, 'samples': 4600704, 'steps': 23961, 'loss/train': 1.7841717004776} -11/07/2021 00:35:55 - INFO - __main__ - Step 23963: {'lr': 0.000473322178320193, 'samples': 4600896, 'steps': 23962, 'loss/train': 1.3683499097824097} -11/07/2021 00:35:55 - INFO - __main__ - Step 23964: {'lr': 0.0004733197929766961, 'samples': 4601088, 'steps': 23963, 'loss/train': 1.8661178350448608} -11/07/2021 00:35:56 - INFO - __main__ - Step 23965: {'lr': 0.0004733174075325748, 'samples': 4601280, 'steps': 23964, 'loss/train': 0.5968111753463745} -11/07/2021 00:35:56 - INFO - __main__ - Step 23966: {'lr': 0.0004733150219878301, 'samples': 4601472, 'steps': 23965, 'loss/train': 1.1554112434387207} -11/07/2021 00:35:57 - INFO - __main__ - Step 23967: {'lr': 0.00047331263634246314, 'samples': 4601664, 'steps': 23966, 'loss/train': 1.5371090173721313} -11/07/2021 00:35:57 - INFO - __main__ - Step 23968: {'lr': 0.0004733102505964749, 'samples': 4601856, 'steps': 23967, 'loss/train': 1.333052158355713} -11/07/2021 00:35:58 - INFO - __main__ - Step 23969: {'lr': 0.00047330786474986645, 'samples': 4602048, 'steps': 23968, 'loss/train': 1.4831993579864502} -11/07/2021 00:35:58 - INFO - __main__ - Step 23970: {'lr': 0.00047330547880263896, 'samples': 4602240, 'steps': 23969, 'loss/train': 0.468535840511322} -11/07/2021 00:35:59 - INFO - __main__ - Step 23971: {'lr': 0.00047330309275479354, 'samples': 4602432, 'steps': 23970, 'loss/train': 2.043537139892578} -11/07/2021 00:35:59 - INFO - __main__ - Step 23972: {'lr': 0.00047330070660633113, 'samples': 4602624, 'steps': 23971, 'loss/train': 1.6697735786437988} -11/07/2021 00:35:59 - INFO - __main__ - Step 23973: {'lr': 0.00047329832035725286, 'samples': 4602816, 'steps': 23972, 'loss/train': 1.3469334840774536} -11/07/2021 00:36:01 - INFO - __main__ - Step 23974: {'lr': 0.0004732959340075598, 'samples': 4603008, 'steps': 23973, 'loss/train': 1.5206609964370728} -11/07/2021 00:36:01 - INFO - __main__ - Step 23975: {'lr': 0.0004732935475572531, 'samples': 4603200, 'steps': 23974, 'loss/train': 1.446755051612854} -11/07/2021 00:36:01 - INFO - __main__ - Step 23976: {'lr': 0.00047329116100633373, 'samples': 4603392, 'steps': 23975, 'loss/train': 1.2258696556091309} -11/07/2021 00:36:02 - INFO - __main__ - Step 23977: {'lr': 0.0004732887743548028, 'samples': 4603584, 'steps': 23976, 'loss/train': 0.9995880126953125} -11/07/2021 00:36:02 - INFO - __main__ - Step 23978: {'lr': 0.0004732863876026614, 'samples': 4603776, 'steps': 23977, 'loss/train': 1.8663251399993896} -11/07/2021 00:36:03 - INFO - __main__ - Step 23979: {'lr': 0.00047328400074991064, 'samples': 4603968, 'steps': 23978, 'loss/train': 1.5901334285736084} -11/07/2021 00:36:03 - INFO - __main__ - Step 23980: {'lr': 0.00047328161379655155, 'samples': 4604160, 'steps': 23979, 'loss/train': 2.803783416748047} -11/07/2021 00:36:04 - INFO - __main__ - Step 23981: {'lr': 0.00047327922674258516, 'samples': 4604352, 'steps': 23980, 'loss/train': 1.6610171794891357} -11/07/2021 00:36:04 - INFO - __main__ - Step 23982: {'lr': 0.00047327683958801257, 'samples': 4604544, 'steps': 23981, 'loss/train': 1.2914010286331177} -11/07/2021 00:36:04 - INFO - __main__ - Step 23983: {'lr': 0.00047327445233283496, 'samples': 4604736, 'steps': 23982, 'loss/train': 1.675779938697815} -11/07/2021 00:36:05 - INFO - __main__ - Step 23984: {'lr': 0.0004732720649770533, 'samples': 4604928, 'steps': 23983, 'loss/train': 1.0921618938446045} -11/07/2021 00:36:06 - INFO - __main__ - Step 23985: {'lr': 0.00047326967752066876, 'samples': 4605120, 'steps': 23984, 'loss/train': 1.6801031827926636} -11/07/2021 00:36:06 - INFO - __main__ - Step 23986: {'lr': 0.0004732672899636822, 'samples': 4605312, 'steps': 23985, 'loss/train': 1.1205083131790161} -11/07/2021 00:36:06 - INFO - __main__ - Step 23987: {'lr': 0.00047326490230609495, 'samples': 4605504, 'steps': 23986, 'loss/train': 1.521935224533081} -11/07/2021 00:36:07 - INFO - __main__ - Step 23988: {'lr': 0.000473262514547908, 'samples': 4605696, 'steps': 23987, 'loss/train': 1.4000868797302246} -11/07/2021 00:36:07 - INFO - __main__ - Step 23989: {'lr': 0.00047326012668912233, 'samples': 4605888, 'steps': 23988, 'loss/train': 1.2538903951644897} -11/07/2021 00:36:08 - INFO - __main__ - Step 23990: {'lr': 0.0004732577387297391, 'samples': 4606080, 'steps': 23989, 'loss/train': 1.4244943857192993} -11/07/2021 00:36:09 - INFO - __main__ - Step 23991: {'lr': 0.00047325535066975946, 'samples': 4606272, 'steps': 23990, 'loss/train': 1.113530158996582} -11/07/2021 00:36:09 - INFO - __main__ - Step 23992: {'lr': 0.0004732529625091843, 'samples': 4606464, 'steps': 23991, 'loss/train': 0.9550225734710693} -11/07/2021 00:36:09 - INFO - __main__ - Step 23993: {'lr': 0.0004732505742480149, 'samples': 4606656, 'steps': 23992, 'loss/train': 1.4506036043167114} -11/07/2021 00:36:10 - INFO - __main__ - Step 23994: {'lr': 0.00047324818588625214, 'samples': 4606848, 'steps': 23993, 'loss/train': 1.0872936248779297} -11/07/2021 00:36:11 - INFO - __main__ - Step 23995: {'lr': 0.0004732457974238972, 'samples': 4607040, 'steps': 23994, 'loss/train': 1.142677903175354} -11/07/2021 00:36:11 - INFO - __main__ - Step 23996: {'lr': 0.0004732434088609512, 'samples': 4607232, 'steps': 23995, 'loss/train': 1.5826812982559204} -11/07/2021 00:36:11 - INFO - __main__ - Step 23997: {'lr': 0.00047324102019741514, 'samples': 4607424, 'steps': 23996, 'loss/train': 1.9252495765686035} -11/07/2021 00:36:12 - INFO - __main__ - Step 23998: {'lr': 0.00047323863143329016, 'samples': 4607616, 'steps': 23997, 'loss/train': 1.2529178857803345} -11/07/2021 00:36:12 - INFO - __main__ - Step 23999: {'lr': 0.00047323624256857724, 'samples': 4607808, 'steps': 23998, 'loss/train': 1.5744787454605103} -11/07/2021 00:36:13 - INFO - __main__ - Step 24000: {'lr': 0.0004732338536032775, 'samples': 4608000, 'steps': 23999, 'loss/train': 0.7579989433288574} -11/07/2021 00:36:14 - INFO - __main__ - Step 24001: {'lr': 0.0004732314645373921, 'samples': 4608192, 'steps': 24000, 'loss/train': 1.5627518892288208} -11/07/2021 00:36:14 - INFO - __main__ - Step 24002: {'lr': 0.0004732290753709221, 'samples': 4608384, 'steps': 24001, 'loss/train': 1.8776737451553345} -11/07/2021 00:36:14 - INFO - __main__ - Step 24003: {'lr': 0.0004732266861038684, 'samples': 4608576, 'steps': 24002, 'loss/train': 1.3503319025039673} -11/07/2021 00:36:15 - INFO - __main__ - Step 24004: {'lr': 0.0004732242967362322, 'samples': 4608768, 'steps': 24003, 'loss/train': 0.988669753074646} -11/07/2021 00:36:16 - INFO - __main__ - Step 24005: {'lr': 0.00047322190726801464, 'samples': 4608960, 'steps': 24004, 'loss/train': 1.773216962814331} -11/07/2021 00:36:16 - INFO - __main__ - Step 24006: {'lr': 0.0004732195176992167, 'samples': 4609152, 'steps': 24005, 'loss/train': 1.4425705671310425} -11/07/2021 00:36:16 - INFO - __main__ - Step 24007: {'lr': 0.0004732171280298395, 'samples': 4609344, 'steps': 24006, 'loss/train': 1.9128704071044922} -11/07/2021 00:36:17 - INFO - __main__ - Step 24008: {'lr': 0.0004732147382598842, 'samples': 4609536, 'steps': 24007, 'loss/train': 1.3278956413269043} -11/07/2021 00:36:17 - INFO - __main__ - Step 24009: {'lr': 0.00047321234838935164, 'samples': 4609728, 'steps': 24008, 'loss/train': 1.7238233089447021} -11/07/2021 00:36:18 - INFO - __main__ - Step 24010: {'lr': 0.0004732099584182431, 'samples': 4609920, 'steps': 24009, 'loss/train': 1.3841497898101807} -11/07/2021 00:36:18 - INFO - __main__ - Step 24011: {'lr': 0.00047320756834655955, 'samples': 4610112, 'steps': 24010, 'loss/train': 1.14120352268219} -11/07/2021 00:36:19 - INFO - __main__ - Step 24012: {'lr': 0.0004732051781743022, 'samples': 4610304, 'steps': 24011, 'loss/train': 1.303422212600708} -11/07/2021 00:36:19 - INFO - __main__ - Step 24013: {'lr': 0.00047320278790147197, 'samples': 4610496, 'steps': 24012, 'loss/train': 1.3343220949172974} -11/07/2021 00:36:19 - INFO - __main__ - Step 24014: {'lr': 0.00047320039752807, 'samples': 4610688, 'steps': 24013, 'loss/train': 1.3710945844650269} -11/07/2021 00:36:20 - INFO - __main__ - Step 24015: {'lr': 0.0004731980070540974, 'samples': 4610880, 'steps': 24014, 'loss/train': 1.5271550416946411} -11/07/2021 00:36:21 - INFO - __main__ - Step 24016: {'lr': 0.0004731956164795552, 'samples': 4611072, 'steps': 24015, 'loss/train': 1.5088775157928467} -11/07/2021 00:36:21 - INFO - __main__ - Step 24017: {'lr': 0.0004731932258044446, 'samples': 4611264, 'steps': 24016, 'loss/train': 1.6866132020950317} -11/07/2021 00:36:21 - INFO - __main__ - Step 24018: {'lr': 0.00047319083502876647, 'samples': 4611456, 'steps': 24017, 'loss/train': 1.7156354188919067} -11/07/2021 00:36:22 - INFO - __main__ - Step 24019: {'lr': 0.00047318844415252204, 'samples': 4611648, 'steps': 24018, 'loss/train': 1.2008994817733765} -11/07/2021 00:36:23 - INFO - __main__ - Step 24020: {'lr': 0.00047318605317571227, 'samples': 4611840, 'steps': 24019, 'loss/train': 0.9371023774147034} -11/07/2021 00:36:23 - INFO - __main__ - Step 24021: {'lr': 0.0004731836620983384, 'samples': 4612032, 'steps': 24020, 'loss/train': 1.8780555725097656} -11/07/2021 00:36:24 - INFO - __main__ - Step 24022: {'lr': 0.00047318127092040144, 'samples': 4612224, 'steps': 24021, 'loss/train': 1.729790449142456} -11/07/2021 00:36:24 - INFO - __main__ - Step 24023: {'lr': 0.00047317887964190233, 'samples': 4612416, 'steps': 24022, 'loss/train': 1.3617117404937744} -11/07/2021 00:36:24 - INFO - __main__ - Step 24024: {'lr': 0.00047317648826284233, 'samples': 4612608, 'steps': 24023, 'loss/train': 1.4316092729568481} -11/07/2021 00:36:25 - INFO - __main__ - Step 24025: {'lr': 0.0004731740967832224, 'samples': 4612800, 'steps': 24024, 'loss/train': 1.0627192258834839} -11/07/2021 00:36:26 - INFO - __main__ - Step 24026: {'lr': 0.00047317170520304373, 'samples': 4612992, 'steps': 24025, 'loss/train': 1.2190508842468262} -11/07/2021 00:36:26 - INFO - __main__ - Step 24027: {'lr': 0.0004731693135223073, 'samples': 4613184, 'steps': 24026, 'loss/train': 1.520830750465393} -11/07/2021 00:36:26 - INFO - __main__ - Step 24028: {'lr': 0.0004731669217410142, 'samples': 4613376, 'steps': 24027, 'loss/train': 1.6594531536102295} -11/07/2021 00:36:27 - INFO - __main__ - Step 24029: {'lr': 0.0004731645298591656, 'samples': 4613568, 'steps': 24028, 'loss/train': 1.5065810680389404} -11/07/2021 00:36:28 - INFO - __main__ - Step 24030: {'lr': 0.0004731621378767624, 'samples': 4613760, 'steps': 24029, 'loss/train': 1.4267277717590332} -11/07/2021 00:36:28 - INFO - __main__ - Step 24031: {'lr': 0.0004731597457938059, 'samples': 4613952, 'steps': 24030, 'loss/train': 1.7742807865142822} -11/07/2021 00:36:29 - INFO - __main__ - Step 24032: {'lr': 0.000473157353610297, 'samples': 4614144, 'steps': 24031, 'loss/train': 1.6197173595428467} -11/07/2021 00:36:29 - INFO - __main__ - Step 24033: {'lr': 0.0004731549613262368, 'samples': 4614336, 'steps': 24032, 'loss/train': 1.5604989528656006} -11/07/2021 00:36:29 - INFO - __main__ - Step 24034: {'lr': 0.0004731525689416265, 'samples': 4614528, 'steps': 24033, 'loss/train': 2.0325191020965576} -11/07/2021 00:36:30 - INFO - __main__ - Step 24035: {'lr': 0.0004731501764564671, 'samples': 4614720, 'steps': 24034, 'loss/train': 1.6932367086410522} -11/07/2021 00:36:31 - INFO - __main__ - Step 24036: {'lr': 0.00047314778387075963, 'samples': 4614912, 'steps': 24035, 'loss/train': 0.7694287300109863} -11/07/2021 00:36:31 - INFO - __main__ - Step 24037: {'lr': 0.00047314539118450516, 'samples': 4615104, 'steps': 24036, 'loss/train': 1.7597320079803467} -11/07/2021 00:36:31 - INFO - __main__ - Step 24038: {'lr': 0.0004731429983977049, 'samples': 4615296, 'steps': 24037, 'loss/train': 1.971815586090088} -11/07/2021 00:36:32 - INFO - __main__ - Step 24039: {'lr': 0.00047314060551035983, 'samples': 4615488, 'steps': 24038, 'loss/train': 1.4033492803573608} -11/07/2021 00:36:32 - INFO - __main__ - Step 24040: {'lr': 0.00047313821252247104, 'samples': 4615680, 'steps': 24039, 'loss/train': 1.4914271831512451} -11/07/2021 00:36:33 - INFO - __main__ - Step 24041: {'lr': 0.00047313581943403963, 'samples': 4615872, 'steps': 24040, 'loss/train': 1.5378525257110596} -11/07/2021 00:36:33 - INFO - __main__ - Step 24042: {'lr': 0.0004731334262450666, 'samples': 4616064, 'steps': 24041, 'loss/train': 1.4748715162277222} -11/07/2021 00:36:34 - INFO - __main__ - Step 24043: {'lr': 0.00047313103295555317, 'samples': 4616256, 'steps': 24042, 'loss/train': 1.4187289476394653} -11/07/2021 00:36:34 - INFO - __main__ - Step 24044: {'lr': 0.0004731286395655003, 'samples': 4616448, 'steps': 24043, 'loss/train': 1.6412248611450195} -11/07/2021 00:36:34 - INFO - __main__ - Step 24045: {'lr': 0.00047312624607490913, 'samples': 4616640, 'steps': 24044, 'loss/train': 1.356187105178833} -11/07/2021 00:36:35 - INFO - __main__ - Step 24046: {'lr': 0.0004731238524837807, 'samples': 4616832, 'steps': 24045, 'loss/train': 1.3819315433502197} -11/07/2021 00:36:36 - INFO - __main__ - Step 24047: {'lr': 0.00047312145879211607, 'samples': 4617024, 'steps': 24046, 'loss/train': 1.857301115989685} -11/07/2021 00:36:36 - INFO - __main__ - Step 24048: {'lr': 0.0004731190649999164, 'samples': 4617216, 'steps': 24047, 'loss/train': 1.4999340772628784} -11/07/2021 00:36:36 - INFO - __main__ - Step 24049: {'lr': 0.0004731166711071827, 'samples': 4617408, 'steps': 24048, 'loss/train': 1.6041375398635864} -11/07/2021 00:36:37 - INFO - __main__ - Step 24050: {'lr': 0.0004731142771139161, 'samples': 4617600, 'steps': 24049, 'loss/train': 1.6878598928451538} -11/07/2021 00:36:38 - INFO - __main__ - Step 24051: {'lr': 0.00047311188302011766, 'samples': 4617792, 'steps': 24050, 'loss/train': 1.9721226692199707} -11/07/2021 00:36:38 - INFO - __main__ - Step 24052: {'lr': 0.00047310948882578843, 'samples': 4617984, 'steps': 24051, 'loss/train': 1.548930287361145} -11/07/2021 00:36:38 - INFO - __main__ - Step 24053: {'lr': 0.0004731070945309295, 'samples': 4618176, 'steps': 24052, 'loss/train': 1.5730412006378174} -11/07/2021 00:36:39 - INFO - __main__ - Step 24054: {'lr': 0.00047310470013554195, 'samples': 4618368, 'steps': 24053, 'loss/train': 1.6378589868545532} -11/07/2021 00:36:39 - INFO - __main__ - Step 24055: {'lr': 0.0004731023056396269, 'samples': 4618560, 'steps': 24054, 'loss/train': 1.4226047992706299} -11/07/2021 00:36:40 - INFO - __main__ - Step 24056: {'lr': 0.00047309991104318533, 'samples': 4618752, 'steps': 24055, 'loss/train': 1.3241724967956543} -11/07/2021 00:36:41 - INFO - __main__ - Step 24057: {'lr': 0.00047309751634621845, 'samples': 4618944, 'steps': 24056, 'loss/train': 1.4396579265594482} -11/07/2021 00:36:41 - INFO - __main__ - Step 24058: {'lr': 0.0004730951215487272, 'samples': 4619136, 'steps': 24057, 'loss/train': 1.5071772336959839} -11/07/2021 00:36:41 - INFO - __main__ - Step 24059: {'lr': 0.0004730927266507128, 'samples': 4619328, 'steps': 24058, 'loss/train': 1.7581125497817993} -11/07/2021 00:36:42 - INFO - __main__ - Step 24060: {'lr': 0.00047309033165217617, 'samples': 4619520, 'steps': 24059, 'loss/train': 1.6549838781356812} -11/07/2021 00:36:43 - INFO - __main__ - Step 24061: {'lr': 0.00047308793655311855, 'samples': 4619712, 'steps': 24060, 'loss/train': 1.6436907052993774} -11/07/2021 00:36:43 - INFO - __main__ - Step 24062: {'lr': 0.000473085541353541, 'samples': 4619904, 'steps': 24061, 'loss/train': 1.756529688835144} -11/07/2021 00:36:43 - INFO - __main__ - Step 24063: {'lr': 0.00047308314605344447, 'samples': 4620096, 'steps': 24062, 'loss/train': 1.4223600625991821} -11/07/2021 00:36:44 - INFO - __main__ - Step 24064: {'lr': 0.00047308075065283006, 'samples': 4620288, 'steps': 24063, 'loss/train': 1.6613905429840088} -11/07/2021 00:36:44 - INFO - __main__ - Step 24065: {'lr': 0.00047307835515169905, 'samples': 4620480, 'steps': 24064, 'loss/train': 1.8377280235290527} -11/07/2021 00:36:45 - INFO - __main__ - Step 24066: {'lr': 0.00047307595955005226, 'samples': 4620672, 'steps': 24065, 'loss/train': 1.2982749938964844} -11/07/2021 00:36:45 - INFO - __main__ - Step 24067: {'lr': 0.000473073563847891, 'samples': 4620864, 'steps': 24066, 'loss/train': 1.9799203872680664} -11/07/2021 00:36:46 - INFO - __main__ - Step 24068: {'lr': 0.0004730711680452161, 'samples': 4621056, 'steps': 24067, 'loss/train': 1.3927499055862427} -11/07/2021 00:36:46 - INFO - __main__ - Step 24069: {'lr': 0.00047306877214202885, 'samples': 4621248, 'steps': 24068, 'loss/train': 1.6838091611862183} -11/07/2021 00:36:46 - INFO - __main__ - Step 24070: {'lr': 0.00047306637613833024, 'samples': 4621440, 'steps': 24069, 'loss/train': 1.380083441734314} -11/07/2021 00:36:47 - INFO - __main__ - Step 24071: {'lr': 0.00047306398003412137, 'samples': 4621632, 'steps': 24070, 'loss/train': 2.2692599296569824} -11/07/2021 00:36:48 - INFO - __main__ - Step 24072: {'lr': 0.00047306158382940327, 'samples': 4621824, 'steps': 24071, 'loss/train': 1.4450585842132568} -11/07/2021 00:36:48 - INFO - __main__ - Step 24073: {'lr': 0.0004730591875241771, 'samples': 4622016, 'steps': 24072, 'loss/train': 1.9368537664413452} -11/07/2021 00:36:48 - INFO - __main__ - Step 24074: {'lr': 0.0004730567911184439, 'samples': 4622208, 'steps': 24073, 'loss/train': 1.387794852256775} -11/07/2021 00:36:49 - INFO - __main__ - Step 24075: {'lr': 0.00047305439461220477, 'samples': 4622400, 'steps': 24074, 'loss/train': 1.5761562585830688} -11/07/2021 00:36:49 - INFO - __main__ - Step 24076: {'lr': 0.00047305199800546077, 'samples': 4622592, 'steps': 24075, 'loss/train': 1.4723130464553833} -11/07/2021 00:36:50 - INFO - __main__ - Step 24077: {'lr': 0.00047304960129821295, 'samples': 4622784, 'steps': 24076, 'loss/train': 1.2436383962631226} -11/07/2021 00:36:51 - INFO - __main__ - Step 24078: {'lr': 0.00047304720449046247, 'samples': 4622976, 'steps': 24077, 'loss/train': 1.5036218166351318} -11/07/2021 00:36:51 - INFO - __main__ - Step 24079: {'lr': 0.0004730448075822103, 'samples': 4623168, 'steps': 24078, 'loss/train': 1.3758183717727661} -11/07/2021 00:36:52 - INFO - __main__ - Step 24080: {'lr': 0.0004730424105734576, 'samples': 4623360, 'steps': 24079, 'loss/train': 1.9877567291259766} -11/07/2021 00:36:52 - INFO - __main__ - Step 24081: {'lr': 0.00047304001346420543, 'samples': 4623552, 'steps': 24080, 'loss/train': 0.17084410786628723} -11/07/2021 00:36:53 - INFO - __main__ - Step 24082: {'lr': 0.0004730376162544549, 'samples': 4623744, 'steps': 24081, 'loss/train': 1.7236641645431519} -11/07/2021 00:36:53 - INFO - __main__ - Step 24083: {'lr': 0.00047303521894420707, 'samples': 4623936, 'steps': 24082, 'loss/train': 1.7466765642166138} -11/07/2021 00:36:54 - INFO - __main__ - Step 24084: {'lr': 0.00047303282153346297, 'samples': 4624128, 'steps': 24083, 'loss/train': 1.492013931274414} -11/07/2021 00:36:54 - INFO - __main__ - Step 24085: {'lr': 0.00047303042402222373, 'samples': 4624320, 'steps': 24084, 'loss/train': 1.3853580951690674} -11/07/2021 00:36:54 - INFO - __main__ - Step 24086: {'lr': 0.00047302802641049045, 'samples': 4624512, 'steps': 24085, 'loss/train': 1.2335377931594849} -11/07/2021 00:36:56 - INFO - __main__ - Step 24087: {'lr': 0.00047302562869826415, 'samples': 4624704, 'steps': 24086, 'loss/train': 1.3577960729599} -11/07/2021 00:36:56 - INFO - __main__ - Step 24088: {'lr': 0.000473023230885546, 'samples': 4624896, 'steps': 24087, 'loss/train': 1.374523639678955} -11/07/2021 00:36:56 - INFO - __main__ - Step 24089: {'lr': 0.00047302083297233693, 'samples': 4625088, 'steps': 24088, 'loss/train': 0.7093602418899536} -11/07/2021 00:36:57 - INFO - __main__ - Step 24090: {'lr': 0.0004730184349586382, 'samples': 4625280, 'steps': 24089, 'loss/train': 0.1390826255083084} -11/07/2021 00:36:57 - INFO - __main__ - Step 24091: {'lr': 0.0004730160368444507, 'samples': 4625472, 'steps': 24090, 'loss/train': 2.2058796882629395} -11/07/2021 00:36:58 - INFO - __main__ - Step 24092: {'lr': 0.00047301363862977574, 'samples': 4625664, 'steps': 24091, 'loss/train': 1.3440006971359253} -11/07/2021 00:36:58 - INFO - __main__ - Step 24093: {'lr': 0.00047301124031461425, 'samples': 4625856, 'steps': 24092, 'loss/train': 1.485878825187683} -11/07/2021 00:36:59 - INFO - __main__ - Step 24094: {'lr': 0.00047300884189896734, 'samples': 4626048, 'steps': 24093, 'loss/train': 1.568880319595337} -11/07/2021 00:36:59 - INFO - __main__ - Step 24095: {'lr': 0.00047300644338283597, 'samples': 4626240, 'steps': 24094, 'loss/train': 1.0832172632217407} -11/07/2021 00:36:59 - INFO - __main__ - Step 24096: {'lr': 0.00047300404476622145, 'samples': 4626432, 'steps': 24095, 'loss/train': 2.009178638458252} -11/07/2021 00:37:00 - INFO - __main__ - Step 24097: {'lr': 0.0004730016460491247, 'samples': 4626624, 'steps': 24096, 'loss/train': 1.7144906520843506} -11/07/2021 00:37:01 - INFO - __main__ - Step 24098: {'lr': 0.00047299924723154686, 'samples': 4626816, 'steps': 24097, 'loss/train': 1.5741411447525024} -11/07/2021 00:37:01 - INFO - __main__ - Step 24099: {'lr': 0.000472996848313489, 'samples': 4627008, 'steps': 24098, 'loss/train': 1.6352746486663818} -11/07/2021 00:37:01 - INFO - __main__ - Step 24100: {'lr': 0.0004729944492949523, 'samples': 4627200, 'steps': 24099, 'loss/train': 1.3924369812011719} -11/07/2021 00:37:02 - INFO - __main__ - Step 24101: {'lr': 0.0004729920501759376, 'samples': 4627392, 'steps': 24100, 'loss/train': 1.5177526473999023} -11/07/2021 00:37:03 - INFO - __main__ - Step 24102: {'lr': 0.0004729896509564462, 'samples': 4627584, 'steps': 24101, 'loss/train': 1.8052873611450195} -11/07/2021 00:37:03 - INFO - __main__ - Step 24103: {'lr': 0.00047298725163647903, 'samples': 4627776, 'steps': 24102, 'loss/train': 1.3988844156265259} -11/07/2021 00:37:03 - INFO - __main__ - Step 24104: {'lr': 0.00047298485221603735, 'samples': 4627968, 'steps': 24103, 'loss/train': 1.4751757383346558} -11/07/2021 00:37:04 - INFO - __main__ - Step 24105: {'lr': 0.0004729824526951221, 'samples': 4628160, 'steps': 24104, 'loss/train': 1.4389196634292603} -11/07/2021 00:37:04 - INFO - __main__ - Step 24106: {'lr': 0.0004729800530737344, 'samples': 4628352, 'steps': 24105, 'loss/train': 1.3307538032531738} -11/07/2021 00:37:05 - INFO - __main__ - Step 24107: {'lr': 0.0004729776533518753, 'samples': 4628544, 'steps': 24106, 'loss/train': 1.9035096168518066} -11/07/2021 00:37:06 - INFO - __main__ - Step 24108: {'lr': 0.00047297525352954587, 'samples': 4628736, 'steps': 24107, 'loss/train': 1.3840570449829102} -11/07/2021 00:37:06 - INFO - __main__ - Step 24109: {'lr': 0.00047297285360674724, 'samples': 4628928, 'steps': 24108, 'loss/train': 1.2842854261398315} -11/07/2021 00:37:06 - INFO - __main__ - Step 24110: {'lr': 0.0004729704535834806, 'samples': 4629120, 'steps': 24109, 'loss/train': 1.7016844749450684} -11/07/2021 00:37:07 - INFO - __main__ - Step 24111: {'lr': 0.0004729680534597468, 'samples': 4629312, 'steps': 24110, 'loss/train': 1.310340166091919} -11/07/2021 00:37:08 - INFO - __main__ - Step 24112: {'lr': 0.0004729656532355471, 'samples': 4629504, 'steps': 24111, 'loss/train': 1.403632640838623} -11/07/2021 00:37:08 - INFO - __main__ - Step 24113: {'lr': 0.00047296325291088247, 'samples': 4629696, 'steps': 24112, 'loss/train': 1.713728666305542} -11/07/2021 00:37:08 - INFO - __main__ - Step 24114: {'lr': 0.00047296085248575405, 'samples': 4629888, 'steps': 24113, 'loss/train': 2.0353336334228516} -11/07/2021 00:37:09 - INFO - __main__ - Step 24115: {'lr': 0.000472958451960163, 'samples': 4630080, 'steps': 24114, 'loss/train': 1.6103174686431885} -11/07/2021 00:37:09 - INFO - __main__ - Step 24116: {'lr': 0.0004729560513341101, 'samples': 4630272, 'steps': 24115, 'loss/train': 1.0083428621292114} -11/07/2021 00:37:10 - INFO - __main__ - Step 24117: {'lr': 0.0004729536506075969, 'samples': 4630464, 'steps': 24116, 'loss/train': 1.5582096576690674} -11/07/2021 00:37:10 - INFO - __main__ - Step 24118: {'lr': 0.000472951249780624, 'samples': 4630656, 'steps': 24117, 'loss/train': 1.225318193435669} -11/07/2021 00:37:11 - INFO - __main__ - Step 24119: {'lr': 0.0004729488488531928, 'samples': 4630848, 'steps': 24118, 'loss/train': 1.7452466487884521} -11/07/2021 00:37:11 - INFO - __main__ - Step 24120: {'lr': 0.00047294644782530437, 'samples': 4631040, 'steps': 24119, 'loss/train': 1.7983100414276123} -11/07/2021 00:37:11 - INFO - __main__ - Step 24121: {'lr': 0.0004729440466969596, 'samples': 4631232, 'steps': 24120, 'loss/train': 1.7422473430633545} -11/07/2021 00:37:12 - INFO - __main__ - Step 24122: {'lr': 0.00047294164546815977, 'samples': 4631424, 'steps': 24121, 'loss/train': 1.831278920173645} -11/07/2021 00:37:13 - INFO - __main__ - Step 24123: {'lr': 0.0004729392441389058, 'samples': 4631616, 'steps': 24122, 'loss/train': 1.5722295045852661} -11/07/2021 00:37:13 - INFO - __main__ - Step 24124: {'lr': 0.0004729368427091989, 'samples': 4631808, 'steps': 24123, 'loss/train': 1.10862398147583} -11/07/2021 00:37:14 - INFO - __main__ - Step 24125: {'lr': 0.0004729344411790401, 'samples': 4632000, 'steps': 24124, 'loss/train': 1.5833975076675415} -11/07/2021 00:37:14 - INFO - __main__ - Step 24126: {'lr': 0.00047293203954843036, 'samples': 4632192, 'steps': 24125, 'loss/train': 1.5960149765014648} -11/07/2021 00:37:14 - INFO - __main__ - Step 24127: {'lr': 0.000472929637817371, 'samples': 4632384, 'steps': 24126, 'loss/train': 1.4709511995315552} -11/07/2021 00:37:15 - INFO - __main__ - Step 24128: {'lr': 0.00047292723598586295, 'samples': 4632576, 'steps': 24127, 'loss/train': 1.7393834590911865} -11/07/2021 00:37:16 - INFO - __main__ - Step 24129: {'lr': 0.0004729248340539074, 'samples': 4632768, 'steps': 24128, 'loss/train': 1.2329339981079102} -11/07/2021 00:37:16 - INFO - __main__ - Step 24130: {'lr': 0.00047292243202150524, 'samples': 4632960, 'steps': 24129, 'loss/train': 1.3833272457122803} -11/07/2021 00:37:16 - INFO - __main__ - Step 24131: {'lr': 0.00047292002988865773, 'samples': 4633152, 'steps': 24130, 'loss/train': 1.295301914215088} -11/07/2021 00:37:17 - INFO - __main__ - Step 24132: {'lr': 0.0004729176276553659, 'samples': 4633344, 'steps': 24131, 'loss/train': 1.6785240173339844} -11/07/2021 00:37:18 - INFO - __main__ - Step 24133: {'lr': 0.00047291522532163084, 'samples': 4633536, 'steps': 24132, 'loss/train': 0.7390657067298889} -11/07/2021 00:37:18 - INFO - __main__ - Step 24134: {'lr': 0.0004729128228874536, 'samples': 4633728, 'steps': 24133, 'loss/train': 1.5403138399124146} -11/07/2021 00:37:18 - INFO - __main__ - Step 24135: {'lr': 0.0004729104203528353, 'samples': 4633920, 'steps': 24134, 'loss/train': 1.6307657957077026} -11/07/2021 00:37:19 - INFO - __main__ - Step 24136: {'lr': 0.0004729080177177769, 'samples': 4634112, 'steps': 24135, 'loss/train': 1.8441475629806519} -11/07/2021 00:37:19 - INFO - __main__ - Step 24137: {'lr': 0.0004729056149822797, 'samples': 4634304, 'steps': 24136, 'loss/train': 1.516968011856079} -11/07/2021 00:37:20 - INFO - __main__ - Step 24138: {'lr': 0.0004729032121463447, 'samples': 4634496, 'steps': 24137, 'loss/train': 2.146589517593384} -11/07/2021 00:37:20 - INFO - __main__ - Step 24139: {'lr': 0.00047290080920997285, 'samples': 4634688, 'steps': 24138, 'loss/train': 1.5535197257995605} -11/07/2021 00:37:21 - INFO - __main__ - Step 24140: {'lr': 0.0004728984061731654, 'samples': 4634880, 'steps': 24139, 'loss/train': 1.5095983743667603} -11/07/2021 00:37:21 - INFO - __main__ - Step 24141: {'lr': 0.00047289600303592334, 'samples': 4635072, 'steps': 24140, 'loss/train': 1.7222843170166016} -11/07/2021 00:37:22 - INFO - __main__ - Step 24142: {'lr': 0.00047289359979824774, 'samples': 4635264, 'steps': 24141, 'loss/train': 1.3944061994552612} -11/07/2021 00:37:23 - INFO - __main__ - Step 24143: {'lr': 0.0004728911964601398, 'samples': 4635456, 'steps': 24142, 'loss/train': 1.880142092704773} -11/07/2021 00:37:23 - INFO - __main__ - Step 24144: {'lr': 0.00047288879302160046, 'samples': 4635648, 'steps': 24143, 'loss/train': 1.4885319471359253} -11/07/2021 00:37:24 - INFO - __main__ - Step 24145: {'lr': 0.000472886389482631, 'samples': 4635840, 'steps': 24144, 'loss/train': 1.4777766466140747} -11/07/2021 00:37:24 - INFO - __main__ - Step 24146: {'lr': 0.00047288398584323225, 'samples': 4636032, 'steps': 24145, 'loss/train': 1.4003963470458984} -11/07/2021 00:37:24 - INFO - __main__ - Step 24147: {'lr': 0.0004728815821034055, 'samples': 4636224, 'steps': 24146, 'loss/train': 1.7480651140213013} -11/07/2021 00:37:25 - INFO - __main__ - Step 24148: {'lr': 0.00047287917826315163, 'samples': 4636416, 'steps': 24147, 'loss/train': 1.4331068992614746} -11/07/2021 00:37:26 - INFO - __main__ - Step 24149: {'lr': 0.00047287677432247187, 'samples': 4636608, 'steps': 24148, 'loss/train': 0.24684494733810425} -11/07/2021 00:37:26 - INFO - __main__ - Step 24150: {'lr': 0.0004728743702813674, 'samples': 4636800, 'steps': 24149, 'loss/train': 1.3840608596801758} -11/07/2021 00:37:26 - INFO - __main__ - Step 24151: {'lr': 0.00047287196613983906, 'samples': 4636992, 'steps': 24150, 'loss/train': 1.2256970405578613} -11/07/2021 00:37:27 - INFO - __main__ - Step 24152: {'lr': 0.00047286956189788803, 'samples': 4637184, 'steps': 24151, 'loss/train': 1.6570688486099243} -11/07/2021 00:37:27 - INFO - __main__ - Step 24153: {'lr': 0.0004728671575555155, 'samples': 4637376, 'steps': 24152, 'loss/train': 1.3276275396347046} -11/07/2021 00:37:28 - INFO - __main__ - Step 24154: {'lr': 0.00047286475311272244, 'samples': 4637568, 'steps': 24153, 'loss/train': 1.9737012386322021} -11/07/2021 00:37:28 - INFO - __main__ - Step 24155: {'lr': 0.00047286234856950995, 'samples': 4637760, 'steps': 24154, 'loss/train': 1.142815351486206} -11/07/2021 00:37:29 - INFO - __main__ - Step 24156: {'lr': 0.0004728599439258791, 'samples': 4637952, 'steps': 24155, 'loss/train': 1.1040961742401123} -11/07/2021 00:37:29 - INFO - __main__ - Step 24157: {'lr': 0.00047285753918183105, 'samples': 4638144, 'steps': 24156, 'loss/train': 1.6647619009017944} -11/07/2021 00:37:30 - INFO - __main__ - Step 24158: {'lr': 0.0004728551343373668, 'samples': 4638336, 'steps': 24157, 'loss/train': 1.5001345872879028} -11/07/2021 00:37:31 - INFO - __main__ - Step 24159: {'lr': 0.0004728527293924875, 'samples': 4638528, 'steps': 24158, 'loss/train': 1.7175570726394653} -11/07/2021 00:37:31 - INFO - __main__ - Step 24160: {'lr': 0.0004728503243471941, 'samples': 4638720, 'steps': 24159, 'loss/train': 2.3899855613708496} -11/07/2021 00:37:32 - INFO - __main__ - Step 24161: {'lr': 0.00047284791920148786, 'samples': 4638912, 'steps': 24160, 'loss/train': 2.2988929748535156} -11/07/2021 00:37:32 - INFO - __main__ - Step 24162: {'lr': 0.0004728455139553698, 'samples': 4639104, 'steps': 24161, 'loss/train': 1.3547323942184448} -11/07/2021 00:37:32 - INFO - __main__ - Step 24163: {'lr': 0.00047284310860884097, 'samples': 4639296, 'steps': 24162, 'loss/train': 1.4184315204620361} -11/07/2021 00:37:33 - INFO - __main__ - Step 24164: {'lr': 0.0004728407031619025, 'samples': 4639488, 'steps': 24163, 'loss/train': 1.7893747091293335} -11/07/2021 00:37:34 - INFO - __main__ - Step 24165: {'lr': 0.00047283829761455545, 'samples': 4639680, 'steps': 24164, 'loss/train': 1.2855308055877686} -11/07/2021 00:37:34 - INFO - __main__ - Step 24166: {'lr': 0.00047283589196680083, 'samples': 4639872, 'steps': 24165, 'loss/train': 1.3909536600112915} -11/07/2021 00:37:35 - INFO - __main__ - Step 24167: {'lr': 0.00047283348621863987, 'samples': 4640064, 'steps': 24166, 'loss/train': 1.9475990533828735} -11/07/2021 00:37:35 - INFO - __main__ - Step 24168: {'lr': 0.0004728310803700735, 'samples': 4640256, 'steps': 24167, 'loss/train': 1.5293444395065308} -11/07/2021 00:37:35 - INFO - __main__ - Step 24169: {'lr': 0.00047282867442110296, 'samples': 4640448, 'steps': 24168, 'loss/train': 1.4277057647705078} -11/07/2021 00:37:36 - INFO - __main__ - Step 24170: {'lr': 0.0004728262683717292, 'samples': 4640640, 'steps': 24169, 'loss/train': 1.4179643392562866} -11/07/2021 00:37:37 - INFO - __main__ - Step 24171: {'lr': 0.0004728238622219534, 'samples': 4640832, 'steps': 24170, 'loss/train': 1.114132046699524} -11/07/2021 00:37:37 - INFO - __main__ - Step 24172: {'lr': 0.0004728214559717766, 'samples': 4641024, 'steps': 24171, 'loss/train': 0.9853553771972656} -11/07/2021 00:37:37 - INFO - __main__ - Step 24173: {'lr': 0.0004728190496211999, 'samples': 4641216, 'steps': 24172, 'loss/train': 1.9363664388656616} -11/07/2021 00:37:38 - INFO - __main__ - Step 24174: {'lr': 0.0004728166431702243, 'samples': 4641408, 'steps': 24173, 'loss/train': 1.4757331609725952} -11/07/2021 00:37:39 - INFO - __main__ - Step 24175: {'lr': 0.0004728142366188511, 'samples': 4641600, 'steps': 24174, 'loss/train': 1.9317572116851807} -11/07/2021 00:37:39 - INFO - __main__ - Step 24176: {'lr': 0.0004728118299670812, 'samples': 4641792, 'steps': 24175, 'loss/train': 1.3534637689590454} -11/07/2021 00:37:40 - INFO - __main__ - Step 24177: {'lr': 0.0004728094232149156, 'samples': 4641984, 'steps': 24176, 'loss/train': 1.609655499458313} -11/07/2021 00:37:40 - INFO - __main__ - Step 24178: {'lr': 0.0004728070163623557, 'samples': 4642176, 'steps': 24177, 'loss/train': 1.2836956977844238} -11/07/2021 00:37:40 - INFO - __main__ - Step 24179: {'lr': 0.00047280460940940224, 'samples': 4642368, 'steps': 24178, 'loss/train': 2.0768063068389893} -11/07/2021 00:37:41 - INFO - __main__ - Step 24180: {'lr': 0.00047280220235605653, 'samples': 4642560, 'steps': 24179, 'loss/train': 1.5663083791732788} -11/07/2021 00:37:42 - INFO - __main__ - Step 24181: {'lr': 0.00047279979520231956, 'samples': 4642752, 'steps': 24180, 'loss/train': 1.7623138427734375} -11/07/2021 00:37:42 - INFO - __main__ - Step 24182: {'lr': 0.0004727973879481925, 'samples': 4642944, 'steps': 24181, 'loss/train': 1.9315279722213745} -11/07/2021 00:37:42 - INFO - __main__ - Step 24183: {'lr': 0.0004727949805936763, 'samples': 4643136, 'steps': 24182, 'loss/train': 1.6259862184524536} -11/07/2021 00:37:43 - INFO - __main__ - Step 24184: {'lr': 0.00047279257313877216, 'samples': 4643328, 'steps': 24183, 'loss/train': 1.3279659748077393} -11/07/2021 00:37:44 - INFO - __main__ - Step 24185: {'lr': 0.00047279016558348107, 'samples': 4643520, 'steps': 24184, 'loss/train': 1.1774322986602783} -11/07/2021 00:37:45 - INFO - __main__ - Step 24186: {'lr': 0.00047278775792780424, 'samples': 4643712, 'steps': 24185, 'loss/train': 1.7688424587249756} -11/07/2021 00:37:45 - INFO - __main__ - Step 24187: {'lr': 0.00047278535017174266, 'samples': 4643904, 'steps': 24186, 'loss/train': 1.6855511665344238} -11/07/2021 00:37:45 - INFO - __main__ - Step 24188: {'lr': 0.00047278294231529745, 'samples': 4644096, 'steps': 24187, 'loss/train': 1.364418387413025} -11/07/2021 00:37:46 - INFO - __main__ - Step 24189: {'lr': 0.0004727805343584697, 'samples': 4644288, 'steps': 24188, 'loss/train': 1.5109294652938843} -11/07/2021 00:37:47 - INFO - __main__ - Step 24190: {'lr': 0.00047277812630126044, 'samples': 4644480, 'steps': 24189, 'loss/train': 0.2451678216457367} -11/07/2021 00:37:47 - INFO - __main__ - Step 24191: {'lr': 0.0004727757181436708, 'samples': 4644672, 'steps': 24190, 'loss/train': 1.7502609491348267} -11/07/2021 00:37:47 - INFO - __main__ - Step 24192: {'lr': 0.0004727733098857019, 'samples': 4644864, 'steps': 24191, 'loss/train': 1.4970722198486328} -11/07/2021 00:37:48 - INFO - __main__ - Step 24193: {'lr': 0.0004727709015273547, 'samples': 4645056, 'steps': 24192, 'loss/train': 1.2383203506469727} -11/07/2021 00:37:48 - INFO - __main__ - Step 24194: {'lr': 0.00047276849306863045, 'samples': 4645248, 'steps': 24193, 'loss/train': 1.1926645040512085} -11/07/2021 00:37:49 - INFO - __main__ - Step 24195: {'lr': 0.0004727660845095301, 'samples': 4645440, 'steps': 24194, 'loss/train': 0.7111749649047852} -11/07/2021 00:37:49 - INFO - __main__ - Step 24196: {'lr': 0.0004727636758500548, 'samples': 4645632, 'steps': 24195, 'loss/train': 2.057713031768799} -11/07/2021 00:37:50 - INFO - __main__ - Step 24197: {'lr': 0.0004727612670902057, 'samples': 4645824, 'steps': 24196, 'loss/train': 1.836399793624878} -11/07/2021 00:37:50 - INFO - __main__ - Step 24198: {'lr': 0.0004727588582299837, 'samples': 4646016, 'steps': 24197, 'loss/train': 1.88862943649292} -11/07/2021 00:37:50 - INFO - __main__ - Step 24199: {'lr': 0.00047275644926939004, 'samples': 4646208, 'steps': 24198, 'loss/train': 2.0900471210479736} -11/07/2021 00:37:51 - INFO - __main__ - Step 24200: {'lr': 0.0004727540402084258, 'samples': 4646400, 'steps': 24199, 'loss/train': 1.6688822507858276} -11/07/2021 00:37:52 - INFO - __main__ - Step 24201: {'lr': 0.00047275163104709196, 'samples': 4646592, 'steps': 24200, 'loss/train': 1.583453893661499} -11/07/2021 00:37:52 - INFO - __main__ - Step 24202: {'lr': 0.0004727492217853897, 'samples': 4646784, 'steps': 24201, 'loss/train': 1.6207613945007324} -11/07/2021 00:37:53 - INFO - __main__ - Step 24203: {'lr': 0.0004727468124233201, 'samples': 4646976, 'steps': 24202, 'loss/train': 1.7906291484832764} -11/07/2021 00:37:53 - INFO - __main__ - Step 24204: {'lr': 0.0004727444029608842, 'samples': 4647168, 'steps': 24203, 'loss/train': 1.4829760789871216} -11/07/2021 00:37:53 - INFO - __main__ - Step 24205: {'lr': 0.0004727419933980831, 'samples': 4647360, 'steps': 24204, 'loss/train': 1.8701109886169434} -11/07/2021 00:37:54 - INFO - __main__ - Step 24206: {'lr': 0.00047273958373491795, 'samples': 4647552, 'steps': 24205, 'loss/train': 0.45274531841278076} -11/07/2021 00:37:55 - INFO - __main__ - Step 24207: {'lr': 0.0004727371739713897, 'samples': 4647744, 'steps': 24206, 'loss/train': 2.36594820022583} -11/07/2021 00:37:55 - INFO - __main__ - Step 24208: {'lr': 0.0004727347641074996, 'samples': 4647936, 'steps': 24207, 'loss/train': 1.223652958869934} -11/07/2021 00:37:55 - INFO - __main__ - Step 24209: {'lr': 0.0004727323541432486, 'samples': 4648128, 'steps': 24208, 'loss/train': 1.4723137617111206} -11/07/2021 00:37:56 - INFO - __main__ - Step 24210: {'lr': 0.0004727299440786378, 'samples': 4648320, 'steps': 24209, 'loss/train': 1.9725641012191772} -11/07/2021 00:37:57 - INFO - __main__ - Step 24211: {'lr': 0.0004727275339136684, 'samples': 4648512, 'steps': 24210, 'loss/train': 1.6833373308181763} -11/07/2021 00:37:57 - INFO - __main__ - Step 24212: {'lr': 0.0004727251236483414, 'samples': 4648704, 'steps': 24211, 'loss/train': 1.6619133949279785} -11/07/2021 00:37:58 - INFO - __main__ - Step 24213: {'lr': 0.0004727227132826579, 'samples': 4648896, 'steps': 24212, 'loss/train': 1.7764638662338257} -11/07/2021 00:37:58 - INFO - __main__ - Step 24214: {'lr': 0.00047272030281661894, 'samples': 4649088, 'steps': 24213, 'loss/train': 1.306481957435608} -11/07/2021 00:37:58 - INFO - __main__ - Step 24215: {'lr': 0.0004727178922502257, 'samples': 4649280, 'steps': 24214, 'loss/train': 1.9462131261825562} -11/07/2021 00:37:59 - INFO - __main__ - Step 24216: {'lr': 0.00047271548158347917, 'samples': 4649472, 'steps': 24215, 'loss/train': 1.5835012197494507} -11/07/2021 00:38:00 - INFO - __main__ - Step 24217: {'lr': 0.00047271307081638047, 'samples': 4649664, 'steps': 24216, 'loss/train': 0.829211950302124} -11/07/2021 00:38:00 - INFO - __main__ - Step 24218: {'lr': 0.0004727106599489307, 'samples': 4649856, 'steps': 24217, 'loss/train': 1.5512961149215698} -11/07/2021 00:38:00 - INFO - __main__ - Step 24219: {'lr': 0.000472708248981131, 'samples': 4650048, 'steps': 24218, 'loss/train': 1.442055106163025} -11/07/2021 00:38:01 - INFO - __main__ - Step 24220: {'lr': 0.0004727058379129824, 'samples': 4650240, 'steps': 24219, 'loss/train': 1.6307088136672974} -11/07/2021 00:38:02 - INFO - __main__ - Step 24221: {'lr': 0.00047270342674448593, 'samples': 4650432, 'steps': 24220, 'loss/train': 1.9180172681808472} -11/07/2021 00:38:02 - INFO - __main__ - Step 24222: {'lr': 0.0004727010154756427, 'samples': 4650624, 'steps': 24221, 'loss/train': 1.7712818384170532} -11/07/2021 00:38:03 - INFO - __main__ - Step 24223: {'lr': 0.00047269860410645395, 'samples': 4650816, 'steps': 24222, 'loss/train': 1.4384461641311646} -11/07/2021 00:38:03 - INFO - __main__ - Step 24224: {'lr': 0.00047269619263692056, 'samples': 4651008, 'steps': 24223, 'loss/train': 1.6635693311691284} -11/07/2021 00:38:03 - INFO - __main__ - Step 24225: {'lr': 0.0004726937810670437, 'samples': 4651200, 'steps': 24224, 'loss/train': 1.4228426218032837} -11/07/2021 00:38:04 - INFO - __main__ - Step 24226: {'lr': 0.00047269136939682445, 'samples': 4651392, 'steps': 24225, 'loss/train': 1.688468337059021} -11/07/2021 00:38:05 - INFO - __main__ - Step 24227: {'lr': 0.00047268895762626396, 'samples': 4651584, 'steps': 24226, 'loss/train': 1.0655486583709717} -11/07/2021 00:38:05 - INFO - __main__ - Step 24228: {'lr': 0.00047268654575536326, 'samples': 4651776, 'steps': 24227, 'loss/train': 1.910609245300293} -11/07/2021 00:38:05 - INFO - __main__ - Step 24229: {'lr': 0.0004726841337841234, 'samples': 4651968, 'steps': 24228, 'loss/train': 1.3337944746017456} -11/07/2021 00:38:06 - INFO - __main__ - Step 24230: {'lr': 0.00047268172171254554, 'samples': 4652160, 'steps': 24229, 'loss/train': 1.2254079580307007} -11/07/2021 00:38:07 - INFO - __main__ - Step 24231: {'lr': 0.00047267930954063064, 'samples': 4652352, 'steps': 24230, 'loss/train': 1.4541743993759155} -11/07/2021 00:38:07 - INFO - __main__ - Step 24232: {'lr': 0.00047267689726838004, 'samples': 4652544, 'steps': 24231, 'loss/train': 1.456627607345581} -11/07/2021 00:38:07 - INFO - __main__ - Step 24233: {'lr': 0.00047267448489579455, 'samples': 4652736, 'steps': 24232, 'loss/train': 1.5871590375900269} -11/07/2021 00:38:08 - INFO - __main__ - Step 24234: {'lr': 0.00047267207242287536, 'samples': 4652928, 'steps': 24233, 'loss/train': 1.5154452323913574} -11/07/2021 00:38:08 - INFO - __main__ - Step 24235: {'lr': 0.0004726696598496236, 'samples': 4653120, 'steps': 24234, 'loss/train': 1.6475778818130493} -11/07/2021 00:38:09 - INFO - __main__ - Step 24236: {'lr': 0.0004726672471760404, 'samples': 4653312, 'steps': 24235, 'loss/train': 1.373233675956726} -11/07/2021 00:38:09 - INFO - __main__ - Step 24237: {'lr': 0.0004726648344021267, 'samples': 4653504, 'steps': 24236, 'loss/train': 1.330606460571289} -11/07/2021 00:38:10 - INFO - __main__ - Step 24238: {'lr': 0.0004726624215278836, 'samples': 4653696, 'steps': 24237, 'loss/train': 1.8774495124816895} -11/07/2021 00:38:10 - INFO - __main__ - Step 24239: {'lr': 0.0004726600085533124, 'samples': 4653888, 'steps': 24238, 'loss/train': 1.6375892162322998} -11/07/2021 00:38:10 - INFO - __main__ - Step 24240: {'lr': 0.0004726575954784139, 'samples': 4654080, 'steps': 24239, 'loss/train': 1.302065372467041} -11/07/2021 00:38:12 - INFO - __main__ - Step 24241: {'lr': 0.0004726551823031894, 'samples': 4654272, 'steps': 24240, 'loss/train': 1.6037311553955078} -11/07/2021 00:38:12 - INFO - __main__ - Step 24242: {'lr': 0.0004726527690276399, 'samples': 4654464, 'steps': 24241, 'loss/train': 1.7429577112197876} -11/07/2021 00:38:12 - INFO - __main__ - Step 24243: {'lr': 0.0004726503556517665, 'samples': 4654656, 'steps': 24242, 'loss/train': 1.6608726978302002} -11/07/2021 00:38:13 - INFO - __main__ - Step 24244: {'lr': 0.0004726479421755703, 'samples': 4654848, 'steps': 24243, 'loss/train': 1.3861039876937866} -11/07/2021 00:38:13 - INFO - __main__ - Step 24245: {'lr': 0.0004726455285990523, 'samples': 4655040, 'steps': 24244, 'loss/train': 1.6974471807479858} -11/07/2021 00:38:14 - INFO - __main__ - Step 24246: {'lr': 0.00047264311492221375, 'samples': 4655232, 'steps': 24245, 'loss/train': 1.9845205545425415} -11/07/2021 00:38:14 - INFO - __main__ - Step 24247: {'lr': 0.00047264070114505556, 'samples': 4655424, 'steps': 24246, 'loss/train': 1.592573642730713} -11/07/2021 00:38:15 - INFO - __main__ - Step 24248: {'lr': 0.00047263828726757897, 'samples': 4655616, 'steps': 24247, 'loss/train': 1.737914800643921} -11/07/2021 00:38:15 - INFO - __main__ - Step 24249: {'lr': 0.00047263587328978495, 'samples': 4655808, 'steps': 24248, 'loss/train': 0.9708447456359863} -11/07/2021 00:38:15 - INFO - __main__ - Step 24250: {'lr': 0.00047263345921167473, 'samples': 4656000, 'steps': 24249, 'loss/train': 1.1999269723892212} -11/07/2021 00:38:17 - INFO - __main__ - Step 24251: {'lr': 0.00047263104503324926, 'samples': 4656192, 'steps': 24250, 'loss/train': 2.622537851333618} -11/07/2021 00:38:17 - INFO - __main__ - Step 24252: {'lr': 0.00047262863075450966, 'samples': 4656384, 'steps': 24251, 'loss/train': 1.4589124917984009} -11/07/2021 00:38:17 - INFO - __main__ - Step 24253: {'lr': 0.0004726262163754571, 'samples': 4656576, 'steps': 24252, 'loss/train': 1.5837563276290894} -11/07/2021 00:38:18 - INFO - __main__ - Step 24254: {'lr': 0.00047262380189609253, 'samples': 4656768, 'steps': 24253, 'loss/train': 1.8602099418640137} -11/07/2021 00:38:18 - INFO - __main__ - Step 24255: {'lr': 0.0004726213873164171, 'samples': 4656960, 'steps': 24254, 'loss/train': 1.4900504350662231} -11/07/2021 00:38:18 - INFO - __main__ - Step 24256: {'lr': 0.00047261897263643196, 'samples': 4657152, 'steps': 24255, 'loss/train': 2.08562970161438} -11/07/2021 00:38:19 - INFO - __main__ - Step 24257: {'lr': 0.0004726165578561381, 'samples': 4657344, 'steps': 24256, 'loss/train': 1.4003256559371948} -11/07/2021 00:38:20 - INFO - __main__ - Step 24258: {'lr': 0.0004726141429755367, 'samples': 4657536, 'steps': 24257, 'loss/train': 0.9711540937423706} -11/07/2021 00:38:20 - INFO - __main__ - Step 24259: {'lr': 0.0004726117279946288, 'samples': 4657728, 'steps': 24258, 'loss/train': 1.806656837463379} -11/07/2021 00:38:20 - INFO - __main__ - Step 24260: {'lr': 0.0004726093129134155, 'samples': 4657920, 'steps': 24259, 'loss/train': 1.3886107206344604} -11/07/2021 00:38:21 - INFO - __main__ - Step 24261: {'lr': 0.0004726068977318978, 'samples': 4658112, 'steps': 24260, 'loss/train': 1.43341064453125} -11/07/2021 00:38:22 - INFO - __main__ - Step 24262: {'lr': 0.0004726044824500769, 'samples': 4658304, 'steps': 24261, 'loss/train': 1.469969391822815} -11/07/2021 00:38:22 - INFO - __main__ - Step 24263: {'lr': 0.0004726020670679538, 'samples': 4658496, 'steps': 24262, 'loss/train': 1.5351600646972656} -11/07/2021 00:38:22 - INFO - __main__ - Step 24264: {'lr': 0.00047259965158552976, 'samples': 4658688, 'steps': 24263, 'loss/train': 1.5944650173187256} -11/07/2021 00:38:23 - INFO - __main__ - Step 24265: {'lr': 0.00047259723600280573, 'samples': 4658880, 'steps': 24264, 'loss/train': 1.7254376411437988} -11/07/2021 00:38:23 - INFO - __main__ - Step 24266: {'lr': 0.0004725948203197828, 'samples': 4659072, 'steps': 24265, 'loss/train': 1.1550707817077637} -11/07/2021 00:38:24 - INFO - __main__ - Step 24267: {'lr': 0.0004725924045364621, 'samples': 4659264, 'steps': 24266, 'loss/train': 1.764291524887085} -11/07/2021 00:38:24 - INFO - __main__ - Step 24268: {'lr': 0.00047258998865284463, 'samples': 4659456, 'steps': 24267, 'loss/train': 1.3322783708572388} -11/07/2021 00:38:25 - INFO - __main__ - Step 24269: {'lr': 0.0004725875726689316, 'samples': 4659648, 'steps': 24268, 'loss/train': 1.2680037021636963} -11/07/2021 00:38:25 - INFO - __main__ - Step 24270: {'lr': 0.000472585156584724, 'samples': 4659840, 'steps': 24269, 'loss/train': 1.5329806804656982} -11/07/2021 00:38:26 - INFO - __main__ - Step 24271: {'lr': 0.00047258274040022305, 'samples': 4660032, 'steps': 24270, 'loss/train': 1.2585711479187012} -11/07/2021 00:38:28 - INFO - __main__ - Step 24272: {'lr': 0.0004725803241154297, 'samples': 4660224, 'steps': 24271, 'loss/train': 1.7784254550933838} -11/07/2021 00:38:28 - INFO - __main__ - Step 24273: {'lr': 0.0004725779077303451, 'samples': 4660416, 'steps': 24272, 'loss/train': 1.6816685199737549} -11/07/2021 00:38:28 - INFO - __main__ - Step 24274: {'lr': 0.0004725754912449703, 'samples': 4660608, 'steps': 24273, 'loss/train': 1.7606521844863892} -11/07/2021 00:38:29 - INFO - __main__ - Step 24275: {'lr': 0.0004725730746593064, 'samples': 4660800, 'steps': 24274, 'loss/train': 1.7844398021697998} -11/07/2021 00:38:29 - INFO - __main__ - Step 24276: {'lr': 0.0004725706579733546, 'samples': 4660992, 'steps': 24275, 'loss/train': 1.0492531061172485} -11/07/2021 00:38:29 - INFO - __main__ - Step 24277: {'lr': 0.00047256824118711583, 'samples': 4661184, 'steps': 24276, 'loss/train': 1.2214933633804321} -11/07/2021 00:38:30 - INFO - __main__ - Step 24278: {'lr': 0.00047256582430059126, 'samples': 4661376, 'steps': 24277, 'loss/train': 1.601622462272644} -11/07/2021 00:38:31 - INFO - __main__ - Step 24279: {'lr': 0.00047256340731378194, 'samples': 4661568, 'steps': 24278, 'loss/train': 1.6877448558807373} -11/07/2021 00:38:31 - INFO - __main__ - Step 24280: {'lr': 0.00047256099022668896, 'samples': 4661760, 'steps': 24279, 'loss/train': 1.3454322814941406} -11/07/2021 00:38:32 - INFO - __main__ - Step 24281: {'lr': 0.00047255857303931347, 'samples': 4661952, 'steps': 24280, 'loss/train': 1.8590461015701294} -11/07/2021 00:38:32 - INFO - __main__ - Step 24282: {'lr': 0.00047255615575165653, 'samples': 4662144, 'steps': 24281, 'loss/train': 1.8316879272460938} -11/07/2021 00:38:32 - INFO - __main__ - Step 24283: {'lr': 0.0004725537383637193, 'samples': 4662336, 'steps': 24282, 'loss/train': 1.5933130979537964} -11/07/2021 00:38:33 - INFO - __main__ - Step 24284: {'lr': 0.0004725513208755027, 'samples': 4662528, 'steps': 24283, 'loss/train': 1.4665334224700928} -11/07/2021 00:38:34 - INFO - __main__ - Step 24285: {'lr': 0.0004725489032870079, 'samples': 4662720, 'steps': 24284, 'loss/train': 1.6883810758590698} -11/07/2021 00:38:34 - INFO - __main__ - Step 24286: {'lr': 0.000472546485598236, 'samples': 4662912, 'steps': 24285, 'loss/train': 1.6891326904296875} -11/07/2021 00:38:34 - INFO - __main__ - Step 24287: {'lr': 0.0004725440678091881, 'samples': 4663104, 'steps': 24286, 'loss/train': 1.5643234252929688} -11/07/2021 00:38:35 - INFO - __main__ - Step 24288: {'lr': 0.00047254164991986525, 'samples': 4663296, 'steps': 24287, 'loss/train': 1.4116101264953613} -11/07/2021 00:38:36 - INFO - __main__ - Step 24289: {'lr': 0.0004725392319302686, 'samples': 4663488, 'steps': 24288, 'loss/train': 1.825372576713562} -11/07/2021 00:38:36 - INFO - __main__ - Step 24290: {'lr': 0.0004725368138403992, 'samples': 4663680, 'steps': 24289, 'loss/train': 1.5913466215133667} -11/07/2021 00:38:36 - INFO - __main__ - Step 24291: {'lr': 0.00047253439565025815, 'samples': 4663872, 'steps': 24290, 'loss/train': 1.3589271306991577} -11/07/2021 00:38:37 - INFO - __main__ - Step 24292: {'lr': 0.00047253197735984653, 'samples': 4664064, 'steps': 24291, 'loss/train': 1.9609973430633545} -11/07/2021 00:38:37 - INFO - __main__ - Step 24293: {'lr': 0.00047252955896916546, 'samples': 4664256, 'steps': 24292, 'loss/train': 1.183845043182373} -11/07/2021 00:38:38 - INFO - __main__ - Step 24294: {'lr': 0.000472527140478216, 'samples': 4664448, 'steps': 24293, 'loss/train': 2.545880079269409} -11/07/2021 00:38:38 - INFO - __main__ - Step 24295: {'lr': 0.00047252472188699917, 'samples': 4664640, 'steps': 24294, 'loss/train': 1.872978925704956} -11/07/2021 00:38:39 - INFO - __main__ - Step 24296: {'lr': 0.0004725223031955162, 'samples': 4664832, 'steps': 24295, 'loss/train': 1.5187020301818848} -11/07/2021 00:38:39 - INFO - __main__ - Step 24297: {'lr': 0.0004725198844037681, 'samples': 4665024, 'steps': 24296, 'loss/train': 1.612744927406311} -11/07/2021 00:38:39 - INFO - __main__ - Step 24298: {'lr': 0.00047251746551175603, 'samples': 4665216, 'steps': 24297, 'loss/train': 1.7143771648406982} -11/07/2021 00:38:40 - INFO - __main__ - Step 24299: {'lr': 0.000472515046519481, 'samples': 4665408, 'steps': 24298, 'loss/train': 1.7912428379058838} -11/07/2021 00:38:41 - INFO - __main__ - Step 24300: {'lr': 0.000472512627426944, 'samples': 4665600, 'steps': 24299, 'loss/train': 1.251631736755371} -11/07/2021 00:38:41 - INFO - __main__ - Step 24301: {'lr': 0.0004725102082341464, 'samples': 4665792, 'steps': 24300, 'loss/train': 1.328009843826294} -11/07/2021 00:38:42 - INFO - __main__ - Step 24302: {'lr': 0.00047250778894108905, 'samples': 4665984, 'steps': 24301, 'loss/train': 0.9645561575889587} -11/07/2021 00:38:42 - INFO - __main__ - Step 24303: {'lr': 0.0004725053695477731, 'samples': 4666176, 'steps': 24302, 'loss/train': 1.8826731443405151} -11/07/2021 00:38:42 - INFO - __main__ - Step 24304: {'lr': 0.0004725029500541997, 'samples': 4666368, 'steps': 24303, 'loss/train': 1.9238576889038086} -11/07/2021 00:38:43 - INFO - __main__ - Step 24305: {'lr': 0.00047250053046036996, 'samples': 4666560, 'steps': 24304, 'loss/train': 1.5398913621902466} -11/07/2021 00:38:44 - INFO - __main__ - Step 24306: {'lr': 0.00047249811076628483, 'samples': 4666752, 'steps': 24305, 'loss/train': 2.0788919925689697} -11/07/2021 00:38:44 - INFO - __main__ - Step 24307: {'lr': 0.00047249569097194554, 'samples': 4666944, 'steps': 24306, 'loss/train': 1.6412384510040283} -11/07/2021 00:38:44 - INFO - __main__ - Step 24308: {'lr': 0.0004724932710773531, 'samples': 4667136, 'steps': 24307, 'loss/train': 1.1404309272766113} -11/07/2021 00:38:45 - INFO - __main__ - Step 24309: {'lr': 0.00047249085108250867, 'samples': 4667328, 'steps': 24308, 'loss/train': 1.5579737424850464} -11/07/2021 00:38:46 - INFO - __main__ - Step 24310: {'lr': 0.0004724884309874132, 'samples': 4667520, 'steps': 24309, 'loss/train': 1.768725872039795} -11/07/2021 00:38:46 - INFO - __main__ - Step 24311: {'lr': 0.00047248601079206797, 'samples': 4667712, 'steps': 24310, 'loss/train': 1.9995254278182983} -11/07/2021 00:38:47 - INFO - __main__ - Step 24312: {'lr': 0.0004724835904964739, 'samples': 4667904, 'steps': 24311, 'loss/train': 1.5800747871398926} -11/07/2021 00:38:47 - INFO - __main__ - Step 24313: {'lr': 0.0004724811701006322, 'samples': 4668096, 'steps': 24312, 'loss/train': 0.16031067073345184} -11/07/2021 00:38:48 - INFO - __main__ - Step 24314: {'lr': 0.00047247874960454394, 'samples': 4668288, 'steps': 24313, 'loss/train': 1.0861700773239136} -11/07/2021 00:38:48 - INFO - __main__ - Step 24315: {'lr': 0.0004724763290082102, 'samples': 4668480, 'steps': 24314, 'loss/train': 0.15731477737426758} -11/07/2021 00:38:49 - INFO - __main__ - Step 24316: {'lr': 0.000472473908311632, 'samples': 4668672, 'steps': 24315, 'loss/train': 0.9294226169586182} -11/07/2021 00:38:49 - INFO - __main__ - Step 24317: {'lr': 0.0004724714875148105, 'samples': 4668864, 'steps': 24316, 'loss/train': 1.470827579498291} -11/07/2021 00:38:50 - INFO - __main__ - Step 24318: {'lr': 0.0004724690666177468, 'samples': 4669056, 'steps': 24317, 'loss/train': 1.5593488216400146} -11/07/2021 00:38:50 - INFO - __main__ - Step 24319: {'lr': 0.00047246664562044193, 'samples': 4669248, 'steps': 24318, 'loss/train': 1.581626296043396} -11/07/2021 00:38:51 - INFO - __main__ - Step 24320: {'lr': 0.0004724642245228971, 'samples': 4669440, 'steps': 24319, 'loss/train': 1.706702709197998} -11/07/2021 00:38:51 - INFO - __main__ - Step 24321: {'lr': 0.0004724618033251133, 'samples': 4669632, 'steps': 24320, 'loss/train': 1.5025871992111206} -11/07/2021 00:38:52 - INFO - __main__ - Step 24322: {'lr': 0.0004724593820270916, 'samples': 4669824, 'steps': 24321, 'loss/train': 1.7909736633300781} -11/07/2021 00:38:52 - INFO - __main__ - Step 24323: {'lr': 0.00047245696062883316, 'samples': 4670016, 'steps': 24322, 'loss/train': 2.027930736541748} -11/07/2021 00:38:52 - INFO - __main__ - Step 24324: {'lr': 0.0004724545391303391, 'samples': 4670208, 'steps': 24323, 'loss/train': 1.6163299083709717} -11/07/2021 00:38:53 - INFO - __main__ - Step 24325: {'lr': 0.0004724521175316103, 'samples': 4670400, 'steps': 24324, 'loss/train': 1.5050382614135742} -11/07/2021 00:38:54 - INFO - __main__ - Step 24326: {'lr': 0.0004724496958326482, 'samples': 4670592, 'steps': 24325, 'loss/train': 0.8827059268951416} -11/07/2021 00:38:54 - INFO - __main__ - Step 24327: {'lr': 0.00047244727403345356, 'samples': 4670784, 'steps': 24326, 'loss/train': 1.293052315711975} -11/07/2021 00:38:55 - INFO - __main__ - Step 24328: {'lr': 0.00047244485213402765, 'samples': 4670976, 'steps': 24327, 'loss/train': 1.496334195137024} -11/07/2021 00:38:55 - INFO - __main__ - Step 24329: {'lr': 0.0004724424301343716, 'samples': 4671168, 'steps': 24328, 'loss/train': 1.7034502029418945} -11/07/2021 00:38:56 - INFO - __main__ - Step 24330: {'lr': 0.00047244000803448635, 'samples': 4671360, 'steps': 24329, 'loss/train': 1.240768551826477} -11/07/2021 00:38:56 - INFO - __main__ - Step 24331: {'lr': 0.000472437585834373, 'samples': 4671552, 'steps': 24330, 'loss/train': 1.2295843362808228} -11/07/2021 00:38:57 - INFO - __main__ - Step 24332: {'lr': 0.00047243516353403283, 'samples': 4671744, 'steps': 24331, 'loss/train': 1.6633962392807007} -11/07/2021 00:38:57 - INFO - __main__ - Step 24333: {'lr': 0.0004724327411334668, 'samples': 4671936, 'steps': 24332, 'loss/train': 0.921309232711792} -11/07/2021 00:38:57 - INFO - __main__ - Step 24334: {'lr': 0.00047243031863267594, 'samples': 4672128, 'steps': 24333, 'loss/train': 1.7888855934143066} -11/07/2021 00:38:58 - INFO - __main__ - Step 24335: {'lr': 0.0004724278960316615, 'samples': 4672320, 'steps': 24334, 'loss/train': 0.4477072060108185} -11/07/2021 00:38:59 - INFO - __main__ - Step 24336: {'lr': 0.00047242547333042434, 'samples': 4672512, 'steps': 24335, 'loss/train': 1.5591822862625122} -11/07/2021 00:38:59 - INFO - __main__ - Step 24337: {'lr': 0.0004724230505289658, 'samples': 4672704, 'steps': 24336, 'loss/train': 2.1904563903808594} -11/07/2021 00:38:59 - INFO - __main__ - Step 24338: {'lr': 0.0004724206276272868, 'samples': 4672896, 'steps': 24337, 'loss/train': 1.5123300552368164} -11/07/2021 00:39:00 - INFO - __main__ - Step 24339: {'lr': 0.0004724182046253885, 'samples': 4673088, 'steps': 24338, 'loss/train': 1.6610440015792847} -11/07/2021 00:39:01 - INFO - __main__ - Step 24340: {'lr': 0.0004724157815232721, 'samples': 4673280, 'steps': 24339, 'loss/train': 1.870625615119934} -11/07/2021 00:39:01 - INFO - __main__ - Step 24341: {'lr': 0.00047241335832093844, 'samples': 4673472, 'steps': 24340, 'loss/train': 1.2395048141479492} -11/07/2021 00:39:01 - INFO - __main__ - Step 24342: {'lr': 0.00047241093501838887, 'samples': 4673664, 'steps': 24341, 'loss/train': 1.3462673425674438} -11/07/2021 00:39:02 - INFO - __main__ - Step 24343: {'lr': 0.00047240851161562433, 'samples': 4673856, 'steps': 24342, 'loss/train': 1.980881929397583} -11/07/2021 00:39:02 - INFO - __main__ - Step 24344: {'lr': 0.00047240608811264595, 'samples': 4674048, 'steps': 24343, 'loss/train': 1.5272406339645386} -11/07/2021 00:39:03 - INFO - __main__ - Step 24345: {'lr': 0.0004724036645094548, 'samples': 4674240, 'steps': 24344, 'loss/train': 1.0640920400619507} -11/07/2021 00:39:03 - INFO - __main__ - Step 24346: {'lr': 0.00047240124080605197, 'samples': 4674432, 'steps': 24345, 'loss/train': 1.4234856367111206} -11/07/2021 00:39:04 - INFO - __main__ - Step 24347: {'lr': 0.0004723988170024386, 'samples': 4674624, 'steps': 24346, 'loss/train': 1.3413307666778564} -11/07/2021 00:39:04 - INFO - __main__ - Step 24348: {'lr': 0.0004723963930986157, 'samples': 4674816, 'steps': 24347, 'loss/train': 1.1005454063415527} -11/07/2021 00:39:05 - INFO - __main__ - Step 24349: {'lr': 0.0004723939690945845, 'samples': 4675008, 'steps': 24348, 'loss/train': 1.8610029220581055} -11/07/2021 00:39:05 - INFO - __main__ - Step 24350: {'lr': 0.000472391544990346, 'samples': 4675200, 'steps': 24349, 'loss/train': 1.0002992153167725} -11/07/2021 00:39:06 - INFO - __main__ - Step 24351: {'lr': 0.0004723891207859012, 'samples': 4675392, 'steps': 24350, 'loss/train': 1.4413059949874878} -11/07/2021 00:39:06 - INFO - __main__ - Step 24352: {'lr': 0.00047238669648125146, 'samples': 4675584, 'steps': 24351, 'loss/train': 1.5541919469833374} -11/07/2021 00:39:07 - INFO - __main__ - Step 24353: {'lr': 0.00047238427207639755, 'samples': 4675776, 'steps': 24352, 'loss/train': 1.7751007080078125} -11/07/2021 00:39:07 - INFO - __main__ - Step 24354: {'lr': 0.0004723818475713408, 'samples': 4675968, 'steps': 24353, 'loss/train': 1.778316617012024} -11/07/2021 00:39:07 - INFO - __main__ - Step 24355: {'lr': 0.00047237942296608223, 'samples': 4676160, 'steps': 24354, 'loss/train': 1.353247046470642} -11/07/2021 00:39:08 - INFO - __main__ - Step 24356: {'lr': 0.00047237699826062286, 'samples': 4676352, 'steps': 24355, 'loss/train': 1.6153926849365234} -11/07/2021 00:39:09 - INFO - __main__ - Step 24357: {'lr': 0.0004723745734549639, 'samples': 4676544, 'steps': 24356, 'loss/train': 1.786283016204834} -11/07/2021 00:39:09 - INFO - __main__ - Step 24358: {'lr': 0.0004723721485491064, 'samples': 4676736, 'steps': 24357, 'loss/train': 1.4685715436935425} -11/07/2021 00:39:09 - INFO - __main__ - Step 24359: {'lr': 0.0004723697235430514, 'samples': 4676928, 'steps': 24358, 'loss/train': 1.738546371459961} -11/07/2021 00:39:10 - INFO - __main__ - Step 24360: {'lr': 0.0004723672984368, 'samples': 4677120, 'steps': 24359, 'loss/train': 1.305877447128296} -11/07/2021 00:39:11 - INFO - __main__ - Step 24361: {'lr': 0.00047236487323035344, 'samples': 4677312, 'steps': 24360, 'loss/train': 1.785787582397461} -11/07/2021 00:39:11 - INFO - __main__ - Step 24362: {'lr': 0.00047236244792371265, 'samples': 4677504, 'steps': 24361, 'loss/train': 1.4389066696166992} -11/07/2021 00:39:12 - INFO - __main__ - Step 24363: {'lr': 0.0004723600225168787, 'samples': 4677696, 'steps': 24362, 'loss/train': 1.5341063737869263} -11/07/2021 00:39:12 - INFO - __main__ - Step 24364: {'lr': 0.0004723575970098528, 'samples': 4677888, 'steps': 24363, 'loss/train': 1.7367303371429443} -11/07/2021 00:39:12 - INFO - __main__ - Step 24365: {'lr': 0.00047235517140263605, 'samples': 4678080, 'steps': 24364, 'loss/train': 1.672031283378601} -11/07/2021 00:39:13 - INFO - __main__ - Step 24366: {'lr': 0.00047235274569522946, 'samples': 4678272, 'steps': 24365, 'loss/train': 1.890123724937439} -11/07/2021 00:39:14 - INFO - __main__ - Step 24367: {'lr': 0.0004723503198876341, 'samples': 4678464, 'steps': 24366, 'loss/train': 1.6104552745819092} -11/07/2021 00:39:14 - INFO - __main__ - Step 24368: {'lr': 0.0004723478939798512, 'samples': 4678656, 'steps': 24367, 'loss/train': 0.4229798913002014} -11/07/2021 00:39:14 - INFO - __main__ - Step 24369: {'lr': 0.0004723454679718817, 'samples': 4678848, 'steps': 24368, 'loss/train': 2.6394357681274414} -11/07/2021 00:39:15 - INFO - __main__ - Step 24370: {'lr': 0.00047234304186372685, 'samples': 4679040, 'steps': 24369, 'loss/train': 1.6752501726150513} -11/07/2021 00:39:15 - INFO - __main__ - Step 24371: {'lr': 0.00047234061565538753, 'samples': 4679232, 'steps': 24370, 'loss/train': 1.5303529500961304} -11/07/2021 00:39:16 - INFO - __main__ - Step 24372: {'lr': 0.0004723381893468651, 'samples': 4679424, 'steps': 24371, 'loss/train': 1.88096022605896} -11/07/2021 00:39:16 - INFO - __main__ - Step 24373: {'lr': 0.00047233576293816045, 'samples': 4679616, 'steps': 24372, 'loss/train': 1.6431019306182861} -11/07/2021 00:39:17 - INFO - __main__ - Step 24374: {'lr': 0.00047233333642927465, 'samples': 4679808, 'steps': 24373, 'loss/train': 0.9329357743263245} -11/07/2021 00:39:17 - INFO - __main__ - Step 24375: {'lr': 0.000472330909820209, 'samples': 4680000, 'steps': 24374, 'loss/train': 1.458146095275879} -11/07/2021 00:39:18 - INFO - __main__ - Step 24376: {'lr': 0.0004723284831109644, 'samples': 4680192, 'steps': 24375, 'loss/train': 1.1037852764129639} -11/07/2021 00:39:19 - INFO - __main__ - Step 24377: {'lr': 0.0004723260563015421, 'samples': 4680384, 'steps': 24376, 'loss/train': 1.6638442277908325} -11/07/2021 00:39:19 - INFO - __main__ - Step 24378: {'lr': 0.00047232362939194305, 'samples': 4680576, 'steps': 24377, 'loss/train': 0.7501077055931091} -11/07/2021 00:39:19 - INFO - __main__ - Step 24379: {'lr': 0.0004723212023821684, 'samples': 4680768, 'steps': 24378, 'loss/train': 1.5712947845458984} -11/07/2021 00:39:20 - INFO - __main__ - Step 24380: {'lr': 0.0004723187752722193, 'samples': 4680960, 'steps': 24379, 'loss/train': 1.0134202241897583} -11/07/2021 00:39:20 - INFO - __main__ - Step 24381: {'lr': 0.00047231634806209675, 'samples': 4681152, 'steps': 24380, 'loss/train': 1.6158535480499268} -11/07/2021 00:39:21 - INFO - __main__ - Step 24382: {'lr': 0.0004723139207518019, 'samples': 4681344, 'steps': 24381, 'loss/train': 1.6911224126815796} -11/07/2021 00:39:21 - INFO - __main__ - Step 24383: {'lr': 0.00047231149334133577, 'samples': 4681536, 'steps': 24382, 'loss/train': 1.647817850112915} -11/07/2021 00:39:22 - INFO - __main__ - Step 24384: {'lr': 0.00047230906583069953, 'samples': 4681728, 'steps': 24383, 'loss/train': 1.6826653480529785} -11/07/2021 00:39:22 - INFO - __main__ - Step 24385: {'lr': 0.0004723066382198943, 'samples': 4681920, 'steps': 24384, 'loss/train': 1.359289288520813} -11/07/2021 00:39:22 - INFO - __main__ - Step 24386: {'lr': 0.00047230421050892116, 'samples': 4682112, 'steps': 24385, 'loss/train': 1.6030157804489136} -11/07/2021 00:39:23 - INFO - __main__ - Step 24387: {'lr': 0.00047230178269778105, 'samples': 4682304, 'steps': 24386, 'loss/train': 1.5881558656692505} -11/07/2021 00:39:24 - INFO - __main__ - Step 24388: {'lr': 0.00047229935478647524, 'samples': 4682496, 'steps': 24387, 'loss/train': 1.7504736185073853} -11/07/2021 00:39:24 - INFO - __main__ - Step 24389: {'lr': 0.0004722969267750048, 'samples': 4682688, 'steps': 24388, 'loss/train': 1.652161717414856} -11/07/2021 00:39:24 - INFO - __main__ - Step 24390: {'lr': 0.0004722944986633708, 'samples': 4682880, 'steps': 24389, 'loss/train': 5.803641319274902} -11/07/2021 00:39:25 - INFO - __main__ - Step 24391: {'lr': 0.0004722920704515743, 'samples': 4683072, 'steps': 24390, 'loss/train': 1.418088674545288} -11/07/2021 00:39:26 - INFO - __main__ - Step 24392: {'lr': 0.00047228964213961647, 'samples': 4683264, 'steps': 24391, 'loss/train': 1.6268666982650757} -11/07/2021 00:39:26 - INFO - __main__ - Step 24393: {'lr': 0.00047228721372749826, 'samples': 4683456, 'steps': 24392, 'loss/train': 1.702316164970398} -11/07/2021 00:39:27 - INFO - __main__ - Step 24394: {'lr': 0.000472284785215221, 'samples': 4683648, 'steps': 24393, 'loss/train': 1.6218605041503906} -11/07/2021 00:39:27 - INFO - __main__ - Step 24395: {'lr': 0.0004722823566027855, 'samples': 4683840, 'steps': 24394, 'loss/train': 1.5702743530273438} -11/07/2021 00:39:27 - INFO - __main__ - Step 24396: {'lr': 0.00047227992789019316, 'samples': 4684032, 'steps': 24395, 'loss/train': 1.2061114311218262} -11/07/2021 00:39:28 - INFO - __main__ - Step 24397: {'lr': 0.0004722774990774448, 'samples': 4684224, 'steps': 24396, 'loss/train': 1.7952961921691895} -11/07/2021 00:39:29 - INFO - __main__ - Step 24398: {'lr': 0.00047227507016454163, 'samples': 4684416, 'steps': 24397, 'loss/train': 1.4876207113265991} -11/07/2021 00:39:29 - INFO - __main__ - Step 24399: {'lr': 0.00047227264115148475, 'samples': 4684608, 'steps': 24398, 'loss/train': 1.480579137802124} -11/07/2021 00:39:29 - INFO - __main__ - Step 24400: {'lr': 0.00047227021203827523, 'samples': 4684800, 'steps': 24399, 'loss/train': 1.2277770042419434} -11/07/2021 00:39:30 - INFO - __main__ - Step 24401: {'lr': 0.0004722677828249142, 'samples': 4684992, 'steps': 24400, 'loss/train': 1.7811293601989746} -11/07/2021 00:39:31 - INFO - __main__ - Step 24402: {'lr': 0.0004722653535114028, 'samples': 4685184, 'steps': 24401, 'loss/train': 1.2663511037826538} -11/07/2021 00:39:31 - INFO - __main__ - Step 24403: {'lr': 0.00047226292409774205, 'samples': 4685376, 'steps': 24402, 'loss/train': 1.9359652996063232} -11/07/2021 00:39:31 - INFO - __main__ - Step 24404: {'lr': 0.00047226049458393306, 'samples': 4685568, 'steps': 24403, 'loss/train': 1.5348832607269287} -11/07/2021 00:39:32 - INFO - __main__ - Step 24405: {'lr': 0.0004722580649699768, 'samples': 4685760, 'steps': 24404, 'loss/train': 1.8864802122116089} -11/07/2021 00:39:32 - INFO - __main__ - Step 24406: {'lr': 0.00047225563525587463, 'samples': 4685952, 'steps': 24405, 'loss/train': 1.5111305713653564} -11/07/2021 00:39:32 - INFO - __main__ - Step 24407: {'lr': 0.0004722532054416274, 'samples': 4686144, 'steps': 24406, 'loss/train': 1.830599308013916} -11/07/2021 00:39:33 - INFO - __main__ - Step 24408: {'lr': 0.0004722507755272364, 'samples': 4686336, 'steps': 24407, 'loss/train': 2.113673210144043} -11/07/2021 00:39:34 - INFO - __main__ - Step 24409: {'lr': 0.0004722483455127026, 'samples': 4686528, 'steps': 24408, 'loss/train': 2.154162645339966} -11/07/2021 00:39:34 - INFO - __main__ - Step 24410: {'lr': 0.000472245915398027, 'samples': 4686720, 'steps': 24409, 'loss/train': 1.6176613569259644} -11/07/2021 00:39:35 - INFO - __main__ - Step 24411: {'lr': 0.0004722434851832109, 'samples': 4686912, 'steps': 24410, 'loss/train': 1.844570279121399} -11/07/2021 00:39:35 - INFO - __main__ - Step 24412: {'lr': 0.00047224105486825543, 'samples': 4687104, 'steps': 24411, 'loss/train': 1.7264853715896606} -11/07/2021 00:39:36 - INFO - __main__ - Step 24413: {'lr': 0.0004722386244531615, 'samples': 4687296, 'steps': 24412, 'loss/train': 1.0778053998947144} -11/07/2021 00:39:37 - INFO - __main__ - Step 24414: {'lr': 0.0004722361939379302, 'samples': 4687488, 'steps': 24413, 'loss/train': 1.4467507600784302} -11/07/2021 00:39:37 - INFO - __main__ - Step 24415: {'lr': 0.0004722337633225627, 'samples': 4687680, 'steps': 24414, 'loss/train': 0.16399438679218292} -11/07/2021 00:39:37 - INFO - __main__ - Step 24416: {'lr': 0.0004722313326070602, 'samples': 4687872, 'steps': 24415, 'loss/train': 1.982115626335144} -11/07/2021 00:39:38 - INFO - __main__ - Step 24417: {'lr': 0.00047222890179142365, 'samples': 4688064, 'steps': 24416, 'loss/train': 1.489362359046936} -11/07/2021 00:39:39 - INFO - __main__ - Step 24418: {'lr': 0.00047222647087565413, 'samples': 4688256, 'steps': 24417, 'loss/train': 1.4437440633773804} -11/07/2021 00:39:39 - INFO - __main__ - Step 24419: {'lr': 0.0004722240398597528, 'samples': 4688448, 'steps': 24418, 'loss/train': 1.2767196893692017} -11/07/2021 00:39:39 - INFO - __main__ - Step 24420: {'lr': 0.0004722216087437208, 'samples': 4688640, 'steps': 24419, 'loss/train': 1.2910867929458618} -11/07/2021 00:39:40 - INFO - __main__ - Step 24421: {'lr': 0.0004722191775275592, 'samples': 4688832, 'steps': 24420, 'loss/train': 1.8720062971115112} -11/07/2021 00:39:40 - INFO - __main__ - Step 24422: {'lr': 0.00047221674621126896, 'samples': 4689024, 'steps': 24421, 'loss/train': 1.386762022972107} -11/07/2021 00:39:41 - INFO - __main__ - Step 24423: {'lr': 0.0004722143147948513, 'samples': 4689216, 'steps': 24422, 'loss/train': 0.547491192817688} -11/07/2021 00:39:42 - INFO - __main__ - Step 24424: {'lr': 0.0004722118832783074, 'samples': 4689408, 'steps': 24423, 'loss/train': 1.6926751136779785} -11/07/2021 00:39:42 - INFO - __main__ - Step 24425: {'lr': 0.0004722094516616382, 'samples': 4689600, 'steps': 24424, 'loss/train': 1.9092614650726318} -11/07/2021 00:39:42 - INFO - __main__ - Step 24426: {'lr': 0.0004722070199448448, 'samples': 4689792, 'steps': 24425, 'loss/train': 1.6068289279937744} -11/07/2021 00:39:43 - INFO - __main__ - Step 24427: {'lr': 0.00047220458812792846, 'samples': 4689984, 'steps': 24426, 'loss/train': 0.16781136393547058} -11/07/2021 00:39:44 - INFO - __main__ - Step 24428: {'lr': 0.00047220215621089005, 'samples': 4690176, 'steps': 24427, 'loss/train': 0.6731496453285217} -11/07/2021 00:39:44 - INFO - __main__ - Step 24429: {'lr': 0.00047219972419373083, 'samples': 4690368, 'steps': 24428, 'loss/train': 1.3694257736206055} -11/07/2021 00:39:45 - INFO - __main__ - Step 24430: {'lr': 0.00047219729207645183, 'samples': 4690560, 'steps': 24429, 'loss/train': 0.8720505833625793} -11/07/2021 00:39:45 - INFO - __main__ - Step 24431: {'lr': 0.0004721948598590542, 'samples': 4690752, 'steps': 24430, 'loss/train': 1.5635464191436768} -11/07/2021 00:39:46 - INFO - __main__ - Step 24432: {'lr': 0.0004721924275415389, 'samples': 4690944, 'steps': 24431, 'loss/train': 0.15982936322689056} -11/07/2021 00:39:46 - INFO - __main__ - Step 24433: {'lr': 0.0004721899951239072, 'samples': 4691136, 'steps': 24432, 'loss/train': 1.6448273658752441} -11/07/2021 00:39:47 - INFO - __main__ - Step 24434: {'lr': 0.0004721875626061601, 'samples': 4691328, 'steps': 24433, 'loss/train': 1.455288290977478} -11/07/2021 00:39:47 - INFO - __main__ - Step 24435: {'lr': 0.00047218512998829874, 'samples': 4691520, 'steps': 24434, 'loss/train': 0.9792460799217224} -11/07/2021 00:39:48 - INFO - __main__ - Step 24436: {'lr': 0.00047218269727032413, 'samples': 4691712, 'steps': 24435, 'loss/train': 1.4665985107421875} -11/07/2021 00:39:48 - INFO - __main__ - Step 24437: {'lr': 0.00047218026445223745, 'samples': 4691904, 'steps': 24436, 'loss/train': 1.6033726930618286} -11/07/2021 00:39:48 - INFO - __main__ - Step 24438: {'lr': 0.0004721778315340398, 'samples': 4692096, 'steps': 24437, 'loss/train': 1.4006061553955078} -11/07/2021 00:39:49 - INFO - __main__ - Step 24439: {'lr': 0.0004721753985157322, 'samples': 4692288, 'steps': 24438, 'loss/train': 1.8944119215011597} -11/07/2021 00:39:50 - INFO - __main__ - Step 24440: {'lr': 0.0004721729653973158, 'samples': 4692480, 'steps': 24439, 'loss/train': 1.4278517961502075} -11/07/2021 00:39:50 - INFO - __main__ - Step 24441: {'lr': 0.0004721705321787917, 'samples': 4692672, 'steps': 24440, 'loss/train': 1.145422101020813} -11/07/2021 00:39:50 - INFO - __main__ - Step 24442: {'lr': 0.00047216809886016097, 'samples': 4692864, 'steps': 24441, 'loss/train': 1.344766616821289} -11/07/2021 00:39:51 - INFO - __main__ - Step 24443: {'lr': 0.0004721656654414248, 'samples': 4693056, 'steps': 24442, 'loss/train': 2.641737461090088} -11/07/2021 00:39:52 - INFO - __main__ - Step 24444: {'lr': 0.00047216323192258416, 'samples': 4693248, 'steps': 24443, 'loss/train': 1.642939567565918} -11/07/2021 00:39:52 - INFO - __main__ - Step 24445: {'lr': 0.0004721607983036401, 'samples': 4693440, 'steps': 24444, 'loss/train': 1.9018218517303467} -11/07/2021 00:39:53 - INFO - __main__ - Step 24446: {'lr': 0.00047215836458459393, 'samples': 4693632, 'steps': 24445, 'loss/train': 1.1468150615692139} -11/07/2021 00:39:53 - INFO - __main__ - Step 24447: {'lr': 0.00047215593076544663, 'samples': 4693824, 'steps': 24446, 'loss/train': 1.8059026002883911} -11/07/2021 00:39:53 - INFO - __main__ - Step 24448: {'lr': 0.0004721534968461992, 'samples': 4694016, 'steps': 24447, 'loss/train': 1.7327210903167725} -11/07/2021 00:39:54 - INFO - __main__ - Step 24449: {'lr': 0.00047215106282685296, 'samples': 4694208, 'steps': 24448, 'loss/train': 1.154772162437439} -11/07/2021 00:39:55 - INFO - __main__ - Step 24450: {'lr': 0.0004721486287074088, 'samples': 4694400, 'steps': 24449, 'loss/train': 1.3429368734359741} -11/07/2021 00:39:55 - INFO - __main__ - Step 24451: {'lr': 0.0004721461944878679, 'samples': 4694592, 'steps': 24450, 'loss/train': 1.561524510383606} -11/07/2021 00:39:55 - INFO - __main__ - Step 24452: {'lr': 0.00047214376016823143, 'samples': 4694784, 'steps': 24451, 'loss/train': 1.277727484703064} -11/07/2021 00:39:56 - INFO - __main__ - Step 24453: {'lr': 0.0004721413257485003, 'samples': 4694976, 'steps': 24452, 'loss/train': 1.6690208911895752} -11/07/2021 00:39:57 - INFO - __main__ - Step 24454: {'lr': 0.0004721388912286758, 'samples': 4695168, 'steps': 24453, 'loss/train': 1.5438530445098877} -11/07/2021 00:39:57 - INFO - __main__ - Step 24455: {'lr': 0.0004721364566087589, 'samples': 4695360, 'steps': 24454, 'loss/train': 1.6763454675674438} -11/07/2021 00:39:57 - INFO - __main__ - Step 24456: {'lr': 0.00047213402188875077, 'samples': 4695552, 'steps': 24455, 'loss/train': 1.7971174716949463} -11/07/2021 00:39:58 - INFO - __main__ - Step 24457: {'lr': 0.00047213158706865246, 'samples': 4695744, 'steps': 24456, 'loss/train': 1.4079968929290771} -11/07/2021 00:39:58 - INFO - __main__ - Step 24458: {'lr': 0.000472129152148465, 'samples': 4695936, 'steps': 24457, 'loss/train': 1.0568734407424927} -11/07/2021 00:39:59 - INFO - __main__ - Step 24459: {'lr': 0.0004721267171281897, 'samples': 4696128, 'steps': 24458, 'loss/train': 1.2152099609375} -11/07/2021 00:39:59 - INFO - __main__ - Step 24460: {'lr': 0.00047212428200782744, 'samples': 4696320, 'steps': 24459, 'loss/train': 1.297367811203003} -11/07/2021 00:40:00 - INFO - __main__ - Step 24461: {'lr': 0.00047212184678737946, 'samples': 4696512, 'steps': 24460, 'loss/train': 1.7175503969192505} -11/07/2021 00:40:00 - INFO - __main__ - Step 24462: {'lr': 0.00047211941146684677, 'samples': 4696704, 'steps': 24461, 'loss/train': 1.3215069770812988} -11/07/2021 00:40:00 - INFO - __main__ - Step 24463: {'lr': 0.00047211697604623056, 'samples': 4696896, 'steps': 24462, 'loss/train': 1.438876748085022} -11/07/2021 00:40:02 - INFO - __main__ - Step 24464: {'lr': 0.0004721145405255318, 'samples': 4697088, 'steps': 24463, 'loss/train': 1.4503346681594849} -11/07/2021 00:40:02 - INFO - __main__ - Step 24465: {'lr': 0.00047211210490475167, 'samples': 4697280, 'steps': 24464, 'loss/train': 1.847247838973999} -11/07/2021 00:40:02 - INFO - __main__ - Step 24466: {'lr': 0.0004721096691838913, 'samples': 4697472, 'steps': 24465, 'loss/train': 0.15198959410190582} -11/07/2021 00:40:03 - INFO - __main__ - Step 24467: {'lr': 0.00047210723336295167, 'samples': 4697664, 'steps': 24466, 'loss/train': 1.6651211977005005} -11/07/2021 00:40:03 - INFO - __main__ - Step 24468: {'lr': 0.00047210479744193404, 'samples': 4697856, 'steps': 24467, 'loss/train': 1.6929770708084106} -11/07/2021 00:40:04 - INFO - __main__ - Step 24469: {'lr': 0.0004721023614208393, 'samples': 4698048, 'steps': 24468, 'loss/train': 1.1923024654388428} -11/07/2021 00:40:05 - INFO - __main__ - Step 24470: {'lr': 0.0004720999252996687, 'samples': 4698240, 'steps': 24469, 'loss/train': 1.750717282295227} -11/07/2021 00:40:05 - INFO - __main__ - Step 24471: {'lr': 0.00047209748907842337, 'samples': 4698432, 'steps': 24470, 'loss/train': 1.480593204498291} -11/07/2021 00:40:05 - INFO - __main__ - Step 24472: {'lr': 0.0004720950527571043, 'samples': 4698624, 'steps': 24471, 'loss/train': 2.0582070350646973} -11/07/2021 00:40:06 - INFO - __main__ - Step 24473: {'lr': 0.0004720926163357126, 'samples': 4698816, 'steps': 24472, 'loss/train': 1.538037896156311} -11/07/2021 00:40:07 - INFO - __main__ - Step 24474: {'lr': 0.0004720901798142494, 'samples': 4699008, 'steps': 24473, 'loss/train': 1.019331932067871} -11/07/2021 00:40:07 - INFO - __main__ - Step 24475: {'lr': 0.00047208774319271586, 'samples': 4699200, 'steps': 24474, 'loss/train': 1.8132907152175903} -11/07/2021 00:40:07 - INFO - __main__ - Step 24476: {'lr': 0.00047208530647111294, 'samples': 4699392, 'steps': 24475, 'loss/train': 1.8565229177474976} -11/07/2021 00:40:08 - INFO - __main__ - Step 24477: {'lr': 0.0004720828696494418, 'samples': 4699584, 'steps': 24476, 'loss/train': 1.696797251701355} -11/07/2021 00:40:08 - INFO - __main__ - Step 24478: {'lr': 0.00047208043272770354, 'samples': 4699776, 'steps': 24477, 'loss/train': 0.24086450040340424} -11/07/2021 00:40:09 - INFO - __main__ - Step 24479: {'lr': 0.0004720779957058993, 'samples': 4699968, 'steps': 24478, 'loss/train': 1.553345799446106} -11/07/2021 00:40:10 - INFO - __main__ - Step 24480: {'lr': 0.0004720755585840302, 'samples': 4700160, 'steps': 24479, 'loss/train': 1.356393814086914} -11/07/2021 00:40:10 - INFO - __main__ - Step 24481: {'lr': 0.0004720731213620972, 'samples': 4700352, 'steps': 24480, 'loss/train': 1.7137320041656494} -11/07/2021 00:40:10 - INFO - __main__ - Step 24482: {'lr': 0.00047207068404010147, 'samples': 4700544, 'steps': 24481, 'loss/train': 1.1787151098251343} -11/07/2021 00:40:11 - INFO - __main__ - Step 24483: {'lr': 0.00047206824661804415, 'samples': 4700736, 'steps': 24482, 'loss/train': 1.1076496839523315} -11/07/2021 00:40:11 - INFO - __main__ - Step 24484: {'lr': 0.0004720658090959263, 'samples': 4700928, 'steps': 24483, 'loss/train': 1.8427814245224} -11/07/2021 00:40:12 - INFO - __main__ - Step 24485: {'lr': 0.000472063371473749, 'samples': 4701120, 'steps': 24484, 'loss/train': 1.2564271688461304} -11/07/2021 00:40:12 - INFO - __main__ - Step 24486: {'lr': 0.0004720609337515134, 'samples': 4701312, 'steps': 24485, 'loss/train': 0.3722918629646301} -11/07/2021 00:40:13 - INFO - __main__ - Step 24487: {'lr': 0.00047205849592922057, 'samples': 4701504, 'steps': 24486, 'loss/train': 1.6480177640914917} -11/07/2021 00:40:13 - INFO - __main__ - Step 24488: {'lr': 0.00047205605800687154, 'samples': 4701696, 'steps': 24487, 'loss/train': 0.6376531720161438} -11/07/2021 00:40:13 - INFO - __main__ - Step 24489: {'lr': 0.0004720536199844676, 'samples': 4701888, 'steps': 24488, 'loss/train': 1.692022442817688} -11/07/2021 00:40:14 - INFO - __main__ - Step 24490: {'lr': 0.00047205118186200963, 'samples': 4702080, 'steps': 24489, 'loss/train': 1.5425223112106323} -11/07/2021 00:40:15 - INFO - __main__ - Step 24491: {'lr': 0.00047204874363949886, 'samples': 4702272, 'steps': 24490, 'loss/train': 1.1524288654327393} -11/07/2021 00:40:15 - INFO - __main__ - Step 24492: {'lr': 0.00047204630531693634, 'samples': 4702464, 'steps': 24491, 'loss/train': 2.0011699199676514} -11/07/2021 00:40:15 - INFO - __main__ - Step 24493: {'lr': 0.0004720438668943232, 'samples': 4702656, 'steps': 24492, 'loss/train': 1.3901020288467407} -11/07/2021 00:40:16 - INFO - __main__ - Step 24494: {'lr': 0.0004720414283716605, 'samples': 4702848, 'steps': 24493, 'loss/train': 1.6455399990081787} -11/07/2021 00:40:17 - INFO - __main__ - Step 24495: {'lr': 0.00047203898974894934, 'samples': 4703040, 'steps': 24494, 'loss/train': 1.5917654037475586} -11/07/2021 00:40:17 - INFO - __main__ - Step 24496: {'lr': 0.0004720365510261909, 'samples': 4703232, 'steps': 24495, 'loss/train': 1.9656726121902466} -11/07/2021 00:40:18 - INFO - __main__ - Step 24497: {'lr': 0.00047203411220338615, 'samples': 4703424, 'steps': 24496, 'loss/train': 1.6324363946914673} -11/07/2021 00:40:18 - INFO - __main__ - Step 24498: {'lr': 0.00047203167328053634, 'samples': 4703616, 'steps': 24497, 'loss/train': 1.4276381731033325} -11/07/2021 00:40:18 - INFO - __main__ - Step 24499: {'lr': 0.0004720292342576423, 'samples': 4703808, 'steps': 24498, 'loss/train': 1.9737954139709473} -11/07/2021 00:40:19 - INFO - __main__ - Step 24500: {'lr': 0.0004720267951347055, 'samples': 4704000, 'steps': 24499, 'loss/train': 1.656864881515503} -11/07/2021 00:40:20 - INFO - __main__ - Step 24501: {'lr': 0.00047202435591172677, 'samples': 4704192, 'steps': 24500, 'loss/train': 1.9080573320388794} -11/07/2021 00:40:20 - INFO - __main__ - Step 24502: {'lr': 0.00047202191658870737, 'samples': 4704384, 'steps': 24501, 'loss/train': 1.2758409976959229} -11/07/2021 00:40:20 - INFO - __main__ - Step 24503: {'lr': 0.00047201947716564826, 'samples': 4704576, 'steps': 24502, 'loss/train': 1.6238764524459839} -11/07/2021 00:40:21 - INFO - __main__ - Step 24504: {'lr': 0.00047201703764255057, 'samples': 4704768, 'steps': 24503, 'loss/train': 1.4966262578964233} -11/07/2021 00:40:22 - INFO - __main__ - Step 24505: {'lr': 0.0004720145980194155, 'samples': 4704960, 'steps': 24504, 'loss/train': 2.0411877632141113} -11/07/2021 00:40:22 - INFO - __main__ - Step 24506: {'lr': 0.000472012158296244, 'samples': 4705152, 'steps': 24505, 'loss/train': 1.6829310655593872} -11/07/2021 00:40:22 - INFO - __main__ - Step 24507: {'lr': 0.0004720097184730373, 'samples': 4705344, 'steps': 24506, 'loss/train': 2.1145436763763428} -11/07/2021 00:40:23 - INFO - __main__ - Step 24508: {'lr': 0.00047200727854979644, 'samples': 4705536, 'steps': 24507, 'loss/train': 1.7645108699798584} -11/07/2021 00:40:23 - INFO - __main__ - Step 24509: {'lr': 0.00047200483852652257, 'samples': 4705728, 'steps': 24508, 'loss/train': 1.630983591079712} -11/07/2021 00:40:24 - INFO - __main__ - Step 24510: {'lr': 0.0004720023984032167, 'samples': 4705920, 'steps': 24509, 'loss/train': 1.414451003074646} -11/07/2021 00:40:25 - INFO - __main__ - Step 24511: {'lr': 0.00047199995817987997, 'samples': 4706112, 'steps': 24510, 'loss/train': 1.2542831897735596} -11/07/2021 00:40:25 - INFO - __main__ - Step 24512: {'lr': 0.00047199751785651346, 'samples': 4706304, 'steps': 24511, 'loss/train': 1.7242752313613892} -11/07/2021 00:40:25 - INFO - __main__ - Step 24513: {'lr': 0.0004719950774331183, 'samples': 4706496, 'steps': 24512, 'loss/train': 1.3297889232635498} -11/07/2021 00:40:26 - INFO - __main__ - Step 24514: {'lr': 0.00047199263690969563, 'samples': 4706688, 'steps': 24513, 'loss/train': 1.5910593271255493} -11/07/2021 00:40:27 - INFO - __main__ - Step 24515: {'lr': 0.00047199019628624647, 'samples': 4706880, 'steps': 24514, 'loss/train': 1.3865641355514526} -11/07/2021 00:40:27 - INFO - __main__ - Step 24516: {'lr': 0.00047198775556277195, 'samples': 4707072, 'steps': 24515, 'loss/train': 1.639611005783081} -11/07/2021 00:40:27 - INFO - __main__ - Step 24517: {'lr': 0.0004719853147392732, 'samples': 4707264, 'steps': 24516, 'loss/train': 2.0972113609313965} -11/07/2021 00:40:28 - INFO - __main__ - Step 24518: {'lr': 0.0004719828738157512, 'samples': 4707456, 'steps': 24517, 'loss/train': 1.7587006092071533} -11/07/2021 00:40:28 - INFO - __main__ - Step 24519: {'lr': 0.0004719804327922073, 'samples': 4707648, 'steps': 24518, 'loss/train': 0.929109513759613} -11/07/2021 00:40:29 - INFO - __main__ - Step 24520: {'lr': 0.00047197799166864233, 'samples': 4707840, 'steps': 24519, 'loss/train': 1.3555177450180054} -11/07/2021 00:40:29 - INFO - __main__ - Step 24521: {'lr': 0.00047197555044505756, 'samples': 4708032, 'steps': 24520, 'loss/train': 1.371085286140442} -11/07/2021 00:40:30 - INFO - __main__ - Step 24522: {'lr': 0.000471973109121454, 'samples': 4708224, 'steps': 24521, 'loss/train': 1.789271354675293} -11/07/2021 00:40:30 - INFO - __main__ - Step 24523: {'lr': 0.00047197066769783284, 'samples': 4708416, 'steps': 24522, 'loss/train': 2.5680861473083496} -11/07/2021 00:40:30 - INFO - __main__ - Step 24524: {'lr': 0.000471968226174195, 'samples': 4708608, 'steps': 24523, 'loss/train': 1.28214430809021} -11/07/2021 00:40:31 - INFO - __main__ - Step 24525: {'lr': 0.00047196578455054175, 'samples': 4708800, 'steps': 24524, 'loss/train': 1.6914494037628174} -11/07/2021 00:40:32 - INFO - __main__ - Step 24526: {'lr': 0.00047196334282687414, 'samples': 4708992, 'steps': 24525, 'loss/train': 1.08967125415802} -11/07/2021 00:40:32 - INFO - __main__ - Step 24527: {'lr': 0.00047196090100319333, 'samples': 4709184, 'steps': 24526, 'loss/train': 2.022808313369751} -11/07/2021 00:40:32 - INFO - __main__ - Step 24528: {'lr': 0.00047195845907950035, 'samples': 4709376, 'steps': 24527, 'loss/train': 1.8660812377929688} -11/07/2021 00:40:33 - INFO - __main__ - Step 24529: {'lr': 0.0004719560170557963, 'samples': 4709568, 'steps': 24528, 'loss/train': 0.7722143530845642} -11/07/2021 00:40:34 - INFO - __main__ - Step 24530: {'lr': 0.0004719535749320823, 'samples': 4709760, 'steps': 24529, 'loss/train': 1.6197178363800049} -11/07/2021 00:40:34 - INFO - __main__ - Step 24531: {'lr': 0.0004719511327083594, 'samples': 4709952, 'steps': 24530, 'loss/train': 1.1182323694229126} -11/07/2021 00:40:35 - INFO - __main__ - Step 24532: {'lr': 0.0004719486903846288, 'samples': 4710144, 'steps': 24531, 'loss/train': 1.2211271524429321} -11/07/2021 00:40:35 - INFO - __main__ - Step 24533: {'lr': 0.0004719462479608915, 'samples': 4710336, 'steps': 24532, 'loss/train': 1.649878978729248} -11/07/2021 00:40:35 - INFO - __main__ - Step 24534: {'lr': 0.0004719438054371487, 'samples': 4710528, 'steps': 24533, 'loss/train': 1.3666858673095703} -11/07/2021 00:40:36 - INFO - __main__ - Step 24535: {'lr': 0.00047194136281340137, 'samples': 4710720, 'steps': 24534, 'loss/train': 1.4466700553894043} -11/07/2021 00:40:37 - INFO - __main__ - Step 24536: {'lr': 0.00047193892008965077, 'samples': 4710912, 'steps': 24535, 'loss/train': 0.9865069389343262} -11/07/2021 00:40:37 - INFO - __main__ - Step 24537: {'lr': 0.0004719364772658978, 'samples': 4711104, 'steps': 24536, 'loss/train': 1.7701717615127563} -11/07/2021 00:40:38 - INFO - __main__ - Step 24538: {'lr': 0.00047193403434214385, 'samples': 4711296, 'steps': 24537, 'loss/train': 1.671497106552124} -11/07/2021 00:40:38 - INFO - __main__ - Step 24539: {'lr': 0.0004719315913183897, 'samples': 4711488, 'steps': 24538, 'loss/train': 1.300622582435608} -11/07/2021 00:40:38 - INFO - __main__ - Step 24540: {'lr': 0.0004719291481946367, 'samples': 4711680, 'steps': 24539, 'loss/train': 1.2521655559539795} -11/07/2021 00:40:39 - INFO - __main__ - Step 24541: {'lr': 0.00047192670497088577, 'samples': 4711872, 'steps': 24540, 'loss/train': 1.7195566892623901} -11/07/2021 00:40:40 - INFO - __main__ - Step 24542: {'lr': 0.0004719242616471381, 'samples': 4712064, 'steps': 24541, 'loss/train': 1.094425916671753} -11/07/2021 00:40:40 - INFO - __main__ - Step 24543: {'lr': 0.00047192181822339484, 'samples': 4712256, 'steps': 24542, 'loss/train': 1.9918973445892334} -11/07/2021 00:40:40 - INFO - __main__ - Step 24544: {'lr': 0.000471919374699657, 'samples': 4712448, 'steps': 24543, 'loss/train': 1.5135279893875122} -11/07/2021 00:40:41 - INFO - __main__ - Step 24545: {'lr': 0.0004719169310759257, 'samples': 4712640, 'steps': 24544, 'loss/train': 1.1496442556381226} -11/07/2021 00:40:42 - INFO - __main__ - Step 24546: {'lr': 0.0004719144873522021, 'samples': 4712832, 'steps': 24545, 'loss/train': 1.596967339515686} -11/07/2021 00:40:42 - INFO - __main__ - Step 24547: {'lr': 0.0004719120435284872, 'samples': 4713024, 'steps': 24546, 'loss/train': 1.982956886291504} -11/07/2021 00:40:42 - INFO - __main__ - Step 24548: {'lr': 0.0004719095996047822, 'samples': 4713216, 'steps': 24547, 'loss/train': 1.156897783279419} -11/07/2021 00:40:43 - INFO - __main__ - Step 24549: {'lr': 0.0004719071555810881, 'samples': 4713408, 'steps': 24548, 'loss/train': 1.8267337083816528} -11/07/2021 00:40:43 - INFO - __main__ - Step 24550: {'lr': 0.00047190471145740616, 'samples': 4713600, 'steps': 24549, 'loss/train': 1.2680888175964355} -11/07/2021 00:40:43 - INFO - __main__ - Step 24551: {'lr': 0.0004719022672337373, 'samples': 4713792, 'steps': 24550, 'loss/train': 1.3638585805892944} -11/07/2021 00:40:44 - INFO - __main__ - Step 24552: {'lr': 0.0004718998229100827, 'samples': 4713984, 'steps': 24551, 'loss/train': 1.6720409393310547} -11/07/2021 00:40:45 - INFO - __main__ - Step 24553: {'lr': 0.00047189737848644356, 'samples': 4714176, 'steps': 24552, 'loss/train': 1.2578575611114502} -11/07/2021 00:40:45 - INFO - __main__ - Step 24554: {'lr': 0.0004718949339628208, 'samples': 4714368, 'steps': 24553, 'loss/train': 0.9185448288917542} -11/07/2021 00:40:46 - INFO - __main__ - Step 24555: {'lr': 0.0004718924893392156, 'samples': 4714560, 'steps': 24554, 'loss/train': 1.4076365232467651} -11/07/2021 00:40:46 - INFO - __main__ - Step 24556: {'lr': 0.0004718900446156291, 'samples': 4714752, 'steps': 24555, 'loss/train': 1.4986615180969238} -11/07/2021 00:40:47 - INFO - __main__ - Step 24557: {'lr': 0.00047188759979206236, 'samples': 4714944, 'steps': 24556, 'loss/train': 0.7693179845809937} -11/07/2021 00:40:47 - INFO - __main__ - Step 24558: {'lr': 0.00047188515486851646, 'samples': 4715136, 'steps': 24557, 'loss/train': 1.5965371131896973} -11/07/2021 00:40:48 - INFO - __main__ - Step 24559: {'lr': 0.0004718827098449926, 'samples': 4715328, 'steps': 24558, 'loss/train': 1.1753389835357666} -11/07/2021 00:40:48 - INFO - __main__ - Step 24560: {'lr': 0.00047188026472149184, 'samples': 4715520, 'steps': 24559, 'loss/train': 1.8036824464797974} -11/07/2021 00:40:48 - INFO - __main__ - Step 24561: {'lr': 0.0004718778194980151, 'samples': 4715712, 'steps': 24560, 'loss/train': 1.3673409223556519} -11/07/2021 00:40:50 - INFO - __main__ - Step 24562: {'lr': 0.00047187537417456375, 'samples': 4715904, 'steps': 24561, 'loss/train': 1.8237707614898682} -11/07/2021 00:40:50 - INFO - __main__ - Step 24563: {'lr': 0.00047187292875113874, 'samples': 4716096, 'steps': 24562, 'loss/train': 1.5906968116760254} -11/07/2021 00:40:50 - INFO - __main__ - Step 24564: {'lr': 0.0004718704832277413, 'samples': 4716288, 'steps': 24563, 'loss/train': 1.953343152999878} -11/07/2021 00:40:51 - INFO - __main__ - Step 24565: {'lr': 0.0004718680376043724, 'samples': 4716480, 'steps': 24564, 'loss/train': 0.17302846908569336} -11/07/2021 00:40:51 - INFO - __main__ - Step 24566: {'lr': 0.00047186559188103314, 'samples': 4716672, 'steps': 24565, 'loss/train': 1.684582233428955} -11/07/2021 00:40:51 - INFO - __main__ - Step 24567: {'lr': 0.00047186314605772466, 'samples': 4716864, 'steps': 24566, 'loss/train': 1.2550259828567505} -11/07/2021 00:40:52 - INFO - __main__ - Step 24568: {'lr': 0.00047186070013444814, 'samples': 4717056, 'steps': 24567, 'loss/train': 1.7285406589508057} -11/07/2021 00:40:53 - INFO - __main__ - Step 24569: {'lr': 0.00047185825411120454, 'samples': 4717248, 'steps': 24568, 'loss/train': 1.6954476833343506} -11/07/2021 00:40:53 - INFO - __main__ - Step 24570: {'lr': 0.0004718558079879951, 'samples': 4717440, 'steps': 24569, 'loss/train': 1.5529531240463257} -11/07/2021 00:40:53 - INFO - __main__ - Step 24571: {'lr': 0.00047185336176482084, 'samples': 4717632, 'steps': 24570, 'loss/train': 1.6657012701034546} -11/07/2021 00:40:54 - INFO - __main__ - Step 24572: {'lr': 0.00047185091544168286, 'samples': 4717824, 'steps': 24571, 'loss/train': 1.475118637084961} -11/07/2021 00:40:55 - INFO - __main__ - Step 24573: {'lr': 0.00047184846901858225, 'samples': 4718016, 'steps': 24572, 'loss/train': 1.6777819395065308} -11/07/2021 00:40:55 - INFO - __main__ - Step 24574: {'lr': 0.0004718460224955202, 'samples': 4718208, 'steps': 24573, 'loss/train': 1.7281380891799927} -11/07/2021 00:40:55 - INFO - __main__ - Step 24575: {'lr': 0.0004718435758724977, 'samples': 4718400, 'steps': 24574, 'loss/train': 1.850234031677246} -11/07/2021 00:40:56 - INFO - __main__ - Step 24576: {'lr': 0.000471841129149516, 'samples': 4718592, 'steps': 24575, 'loss/train': 1.2701635360717773} -11/07/2021 00:40:56 - INFO - __main__ - Step 24577: {'lr': 0.000471838682326576, 'samples': 4718784, 'steps': 24576, 'loss/train': 1.5703866481781006} -11/07/2021 00:40:57 - INFO - __main__ - Step 24578: {'lr': 0.000471836235403679, 'samples': 4718976, 'steps': 24577, 'loss/train': 2.2552669048309326} -11/07/2021 00:40:58 - INFO - __main__ - Step 24579: {'lr': 0.000471833788380826, 'samples': 4719168, 'steps': 24578, 'loss/train': 1.2086560726165771} -11/07/2021 00:40:58 - INFO - __main__ - Step 24580: {'lr': 0.0004718313412580181, 'samples': 4719360, 'steps': 24579, 'loss/train': 1.2085537910461426} -11/07/2021 00:40:58 - INFO - __main__ - Step 24581: {'lr': 0.0004718288940352564, 'samples': 4719552, 'steps': 24580, 'loss/train': 1.4074021577835083} -11/07/2021 00:40:59 - INFO - __main__ - Step 24582: {'lr': 0.00047182644671254207, 'samples': 4719744, 'steps': 24581, 'loss/train': 1.8190374374389648} -11/07/2021 00:41:00 - INFO - __main__ - Step 24583: {'lr': 0.0004718239992898761, 'samples': 4719936, 'steps': 24582, 'loss/train': 1.3924469947814941} -11/07/2021 00:41:00 - INFO - __main__ - Step 24584: {'lr': 0.00047182155176725974, 'samples': 4720128, 'steps': 24583, 'loss/train': 1.4869482517242432} -11/07/2021 00:41:00 - INFO - __main__ - Step 24585: {'lr': 0.00047181910414469396, 'samples': 4720320, 'steps': 24584, 'loss/train': 1.1537373065948486} -11/07/2021 00:41:01 - INFO - __main__ - Step 24586: {'lr': 0.0004718166564221799, 'samples': 4720512, 'steps': 24585, 'loss/train': 1.821776032447815} -11/07/2021 00:41:01 - INFO - __main__ - Step 24587: {'lr': 0.0004718142085997187, 'samples': 4720704, 'steps': 24586, 'loss/train': 1.1884390115737915} -11/07/2021 00:41:02 - INFO - __main__ - Step 24588: {'lr': 0.0004718117606773115, 'samples': 4720896, 'steps': 24587, 'loss/train': 3.4263834953308105} -11/07/2021 00:41:03 - INFO - __main__ - Step 24589: {'lr': 0.0004718093126549592, 'samples': 4721088, 'steps': 24588, 'loss/train': 1.226837396621704} -11/07/2021 00:41:03 - INFO - __main__ - Step 24590: {'lr': 0.0004718068645326632, 'samples': 4721280, 'steps': 24589, 'loss/train': 0.8642450571060181} -11/07/2021 00:41:03 - INFO - __main__ - Step 24591: {'lr': 0.0004718044163104244, 'samples': 4721472, 'steps': 24590, 'loss/train': 1.049943447113037} -11/07/2021 00:41:04 - INFO - __main__ - Step 24592: {'lr': 0.0004718019679882439, 'samples': 4721664, 'steps': 24591, 'loss/train': 1.2182432413101196} -11/07/2021 00:41:04 - INFO - __main__ - Step 24593: {'lr': 0.0004717995195661229, 'samples': 4721856, 'steps': 24592, 'loss/train': 3.1901888847351074} -11/07/2021 00:41:05 - INFO - __main__ - Step 24594: {'lr': 0.00047179707104406243, 'samples': 4722048, 'steps': 24593, 'loss/train': 1.1043592691421509} -11/07/2021 00:41:05 - INFO - __main__ - Step 24595: {'lr': 0.0004717946224220637, 'samples': 4722240, 'steps': 24594, 'loss/train': 1.4727208614349365} -11/07/2021 00:41:06 - INFO - __main__ - Step 24596: {'lr': 0.0004717921737001276, 'samples': 4722432, 'steps': 24595, 'loss/train': 1.3377717733383179} -11/07/2021 00:41:06 - INFO - __main__ - Step 24597: {'lr': 0.0004717897248782555, 'samples': 4722624, 'steps': 24596, 'loss/train': 1.4173022508621216} -11/07/2021 00:41:06 - INFO - __main__ - Step 24598: {'lr': 0.0004717872759564483, 'samples': 4722816, 'steps': 24597, 'loss/train': 1.6326979398727417} -11/07/2021 00:41:07 - INFO - __main__ - Step 24599: {'lr': 0.00047178482693470723, 'samples': 4723008, 'steps': 24598, 'loss/train': 1.0094153881072998} -11/07/2021 00:41:08 - INFO - __main__ - Step 24600: {'lr': 0.0004717823778130333, 'samples': 4723200, 'steps': 24599, 'loss/train': 1.2238973379135132} -11/07/2021 00:41:08 - INFO - __main__ - Step 24601: {'lr': 0.0004717799285914276, 'samples': 4723392, 'steps': 24600, 'loss/train': 1.5726311206817627} -11/07/2021 00:41:09 - INFO - __main__ - Step 24602: {'lr': 0.00047177747926989134, 'samples': 4723584, 'steps': 24601, 'loss/train': 1.7290757894515991} -11/07/2021 00:41:09 - INFO - __main__ - Step 24603: {'lr': 0.00047177502984842556, 'samples': 4723776, 'steps': 24602, 'loss/train': 1.8465595245361328} -11/07/2021 00:41:10 - INFO - __main__ - Step 24604: {'lr': 0.0004717725803270314, 'samples': 4723968, 'steps': 24603, 'loss/train': 1.3708162307739258} -11/07/2021 00:41:11 - INFO - __main__ - Step 24605: {'lr': 0.00047177013070570997, 'samples': 4724160, 'steps': 24604, 'loss/train': 1.8157235383987427} -11/07/2021 00:41:11 - INFO - __main__ - Step 24606: {'lr': 0.00047176768098446234, 'samples': 4724352, 'steps': 24605, 'loss/train': 1.3547577857971191} -11/07/2021 00:41:11 - INFO - __main__ - Step 24607: {'lr': 0.0004717652311632895, 'samples': 4724544, 'steps': 24606, 'loss/train': 1.55780029296875} -11/07/2021 00:41:12 - INFO - __main__ - Step 24608: {'lr': 0.00047176278124219276, 'samples': 4724736, 'steps': 24607, 'loss/train': 1.9747414588928223} -11/07/2021 00:41:12 - INFO - __main__ - Step 24609: {'lr': 0.0004717603312211731, 'samples': 4724928, 'steps': 24608, 'loss/train': 1.699101209640503} -11/07/2021 00:41:13 - INFO - __main__ - Step 24610: {'lr': 0.0004717578811002317, 'samples': 4725120, 'steps': 24609, 'loss/train': 1.3912477493286133} -11/07/2021 00:41:13 - INFO - __main__ - Step 24611: {'lr': 0.00047175543087936954, 'samples': 4725312, 'steps': 24610, 'loss/train': 1.4214597940444946} -11/07/2021 00:41:14 - INFO - __main__ - Step 24612: {'lr': 0.0004717529805585879, 'samples': 4725504, 'steps': 24611, 'loss/train': 1.5167274475097656} -11/07/2021 00:41:14 - INFO - __main__ - Step 24613: {'lr': 0.0004717505301378877, 'samples': 4725696, 'steps': 24612, 'loss/train': 1.8070693016052246} -11/07/2021 00:41:14 - INFO - __main__ - Step 24614: {'lr': 0.0004717480796172702, 'samples': 4725888, 'steps': 24613, 'loss/train': 1.4449204206466675} -11/07/2021 00:41:16 - INFO - __main__ - Step 24615: {'lr': 0.00047174562899673645, 'samples': 4726080, 'steps': 24614, 'loss/train': 1.1564642190933228} -11/07/2021 00:41:16 - INFO - __main__ - Step 24616: {'lr': 0.0004717431782762875, 'samples': 4726272, 'steps': 24615, 'loss/train': 1.9751918315887451} -11/07/2021 00:41:16 - INFO - __main__ - Step 24617: {'lr': 0.0004717407274559245, 'samples': 4726464, 'steps': 24616, 'loss/train': 1.8290555477142334} -11/07/2021 00:41:17 - INFO - __main__ - Step 24618: {'lr': 0.0004717382765356485, 'samples': 4726656, 'steps': 24617, 'loss/train': 1.8763755559921265} -11/07/2021 00:41:17 - INFO - __main__ - Step 24619: {'lr': 0.0004717358255154607, 'samples': 4726848, 'steps': 24618, 'loss/train': 0.9470406770706177} -11/07/2021 00:41:18 - INFO - __main__ - Step 24620: {'lr': 0.0004717333743953622, 'samples': 4727040, 'steps': 24619, 'loss/train': 0.10981487482786179} -11/07/2021 00:41:18 - INFO - __main__ - Step 24621: {'lr': 0.00047173092317535404, 'samples': 4727232, 'steps': 24620, 'loss/train': 1.7464439868927002} -11/07/2021 00:41:19 - INFO - __main__ - Step 24622: {'lr': 0.0004717284718554373, 'samples': 4727424, 'steps': 24621, 'loss/train': 1.660263180732727} -11/07/2021 00:41:19 - INFO - __main__ - Step 24623: {'lr': 0.00047172602043561317, 'samples': 4727616, 'steps': 24622, 'loss/train': 1.3084211349487305} -11/07/2021 00:41:19 - INFO - __main__ - Step 24624: {'lr': 0.00047172356891588273, 'samples': 4727808, 'steps': 24623, 'loss/train': 2.0479350090026855} -11/07/2021 00:41:21 - INFO - __main__ - Step 24625: {'lr': 0.0004717211172962471, 'samples': 4728000, 'steps': 24624, 'loss/train': 1.5201829671859741} -11/07/2021 00:41:21 - INFO - __main__ - Step 24626: {'lr': 0.0004717186655767073, 'samples': 4728192, 'steps': 24625, 'loss/train': 1.1362905502319336} -11/07/2021 00:41:21 - INFO - __main__ - Step 24627: {'lr': 0.0004717162137572645, 'samples': 4728384, 'steps': 24626, 'loss/train': 1.5421643257141113} -11/07/2021 00:41:22 - INFO - __main__ - Step 24628: {'lr': 0.0004717137618379198, 'samples': 4728576, 'steps': 24627, 'loss/train': 1.5219807624816895} -11/07/2021 00:41:22 - INFO - __main__ - Step 24629: {'lr': 0.0004717113098186743, 'samples': 4728768, 'steps': 24628, 'loss/train': 1.4583017826080322} -11/07/2021 00:41:22 - INFO - __main__ - Step 24630: {'lr': 0.00047170885769952907, 'samples': 4728960, 'steps': 24629, 'loss/train': 1.637890338897705} -11/07/2021 00:41:24 - INFO - __main__ - Step 24631: {'lr': 0.00047170640548048525, 'samples': 4729152, 'steps': 24630, 'loss/train': 1.4171907901763916} -11/07/2021 00:41:24 - INFO - __main__ - Step 24632: {'lr': 0.000471703953161544, 'samples': 4729344, 'steps': 24631, 'loss/train': 1.9250282049179077} -11/07/2021 00:41:24 - INFO - __main__ - Step 24633: {'lr': 0.00047170150074270635, 'samples': 4729536, 'steps': 24632, 'loss/train': 1.8162815570831299} -11/07/2021 00:41:25 - INFO - __main__ - Step 24634: {'lr': 0.0004716990482239735, 'samples': 4729728, 'steps': 24633, 'loss/train': 1.6207184791564941} -11/07/2021 00:41:25 - INFO - __main__ - Step 24635: {'lr': 0.0004716965956053463, 'samples': 4729920, 'steps': 24634, 'loss/train': 1.1402711868286133} -11/07/2021 00:41:26 - INFO - __main__ - Step 24636: {'lr': 0.00047169414288682616, 'samples': 4730112, 'steps': 24635, 'loss/train': 1.40772545337677} -11/07/2021 00:41:26 - INFO - __main__ - Step 24637: {'lr': 0.0004716916900684141, 'samples': 4730304, 'steps': 24636, 'loss/train': 1.7439367771148682} -11/07/2021 00:41:27 - INFO - __main__ - Step 24638: {'lr': 0.00047168923715011103, 'samples': 4730496, 'steps': 24637, 'loss/train': 1.7972429990768433} -11/07/2021 00:41:27 - INFO - __main__ - Step 24639: {'lr': 0.00047168678413191833, 'samples': 4730688, 'steps': 24638, 'loss/train': 1.9872496128082275} -11/07/2021 00:41:27 - INFO - __main__ - Step 24640: {'lr': 0.00047168433101383694, 'samples': 4730880, 'steps': 24639, 'loss/train': 1.5553479194641113} -11/07/2021 00:41:28 - INFO - __main__ - Step 24641: {'lr': 0.000471681877795868, 'samples': 4731072, 'steps': 24640, 'loss/train': 1.7604968547821045} -11/07/2021 00:41:29 - INFO - __main__ - Step 24642: {'lr': 0.0004716794244780127, 'samples': 4731264, 'steps': 24641, 'loss/train': 1.5986493825912476} -11/07/2021 00:41:29 - INFO - __main__ - Step 24643: {'lr': 0.0004716769710602721, 'samples': 4731456, 'steps': 24642, 'loss/train': 1.5960829257965088} -11/07/2021 00:41:29 - INFO - __main__ - Step 24644: {'lr': 0.00047167451754264714, 'samples': 4731648, 'steps': 24643, 'loss/train': 1.3092007637023926} -11/07/2021 00:41:30 - INFO - __main__ - Step 24645: {'lr': 0.0004716720639251392, 'samples': 4731840, 'steps': 24644, 'loss/train': 1.645534873008728} -11/07/2021 00:41:31 - INFO - __main__ - Step 24646: {'lr': 0.0004716696102077491, 'samples': 4732032, 'steps': 24645, 'loss/train': 0.7927688956260681} -11/07/2021 00:41:31 - INFO - __main__ - Step 24647: {'lr': 0.0004716671563904782, 'samples': 4732224, 'steps': 24646, 'loss/train': 1.4662938117980957} -11/07/2021 00:41:32 - INFO - __main__ - Step 24648: {'lr': 0.0004716647024733275, 'samples': 4732416, 'steps': 24647, 'loss/train': 1.9069128036499023} -11/07/2021 00:41:32 - INFO - __main__ - Step 24649: {'lr': 0.00047166224845629804, 'samples': 4732608, 'steps': 24648, 'loss/train': 1.5420812368392944} -11/07/2021 00:41:32 - INFO - __main__ - Step 24650: {'lr': 0.000471659794339391, 'samples': 4732800, 'steps': 24649, 'loss/train': 1.5934165716171265} -11/07/2021 00:41:33 - INFO - __main__ - Step 24651: {'lr': 0.00047165734012260754, 'samples': 4732992, 'steps': 24650, 'loss/train': 1.610710859298706} -11/07/2021 00:41:34 - INFO - __main__ - Step 24652: {'lr': 0.0004716548858059486, 'samples': 4733184, 'steps': 24651, 'loss/train': 1.2758663892745972} -11/07/2021 00:41:34 - INFO - __main__ - Step 24653: {'lr': 0.0004716524313894155, 'samples': 4733376, 'steps': 24652, 'loss/train': 1.113743782043457} -11/07/2021 00:41:34 - INFO - __main__ - Step 24654: {'lr': 0.0004716499768730092, 'samples': 4733568, 'steps': 24653, 'loss/train': 1.840376853942871} -11/07/2021 00:41:35 - INFO - __main__ - Step 24655: {'lr': 0.0004716475222567308, 'samples': 4733760, 'steps': 24654, 'loss/train': 1.646635890007019} -11/07/2021 00:41:36 - INFO - __main__ - Step 24656: {'lr': 0.0004716450675405815, 'samples': 4733952, 'steps': 24655, 'loss/train': 1.5526431798934937} -11/07/2021 00:41:36 - INFO - __main__ - Step 24657: {'lr': 0.0004716426127245623, 'samples': 4734144, 'steps': 24656, 'loss/train': 1.4510862827301025} -11/07/2021 00:41:36 - INFO - __main__ - Step 24658: {'lr': 0.00047164015780867444, 'samples': 4734336, 'steps': 24657, 'loss/train': 1.7362557649612427} -11/07/2021 00:41:37 - INFO - __main__ - Step 24659: {'lr': 0.0004716377027929189, 'samples': 4734528, 'steps': 24658, 'loss/train': 1.2027533054351807} -11/07/2021 00:41:37 - INFO - __main__ - Step 24660: {'lr': 0.00047163524767729684, 'samples': 4734720, 'steps': 24659, 'loss/train': 1.1476722955703735} -11/07/2021 00:41:38 - INFO - __main__ - Step 24661: {'lr': 0.0004716327924618093, 'samples': 4734912, 'steps': 24660, 'loss/train': 1.578438639640808} -11/07/2021 00:41:38 - INFO - __main__ - Step 24662: {'lr': 0.0004716303371464575, 'samples': 4735104, 'steps': 24661, 'loss/train': 2.1853394508361816} -11/07/2021 00:41:39 - INFO - __main__ - Step 24663: {'lr': 0.0004716278817312425, 'samples': 4735296, 'steps': 24662, 'loss/train': 1.361633062362671} -11/07/2021 00:41:39 - INFO - __main__ - Step 24664: {'lr': 0.0004716254262161653, 'samples': 4735488, 'steps': 24663, 'loss/train': 1.9795877933502197} -11/07/2021 00:41:39 - INFO - __main__ - Step 24665: {'lr': 0.00047162297060122726, 'samples': 4735680, 'steps': 24664, 'loss/train': 1.582615613937378} -11/07/2021 00:41:40 - INFO - __main__ - Step 24666: {'lr': 0.0004716205148864292, 'samples': 4735872, 'steps': 24665, 'loss/train': 1.3622562885284424} -11/07/2021 00:41:41 - INFO - __main__ - Step 24667: {'lr': 0.0004716180590717724, 'samples': 4736064, 'steps': 24666, 'loss/train': 0.957697868347168} -11/07/2021 00:41:41 - INFO - __main__ - Step 24668: {'lr': 0.0004716156031572579, 'samples': 4736256, 'steps': 24667, 'loss/train': 1.5222654342651367} -11/07/2021 00:41:41 - INFO - __main__ - Step 24669: {'lr': 0.00047161314714288697, 'samples': 4736448, 'steps': 24668, 'loss/train': 1.4493942260742188} -11/07/2021 00:41:42 - INFO - __main__ - Step 24670: {'lr': 0.00047161069102866037, 'samples': 4736640, 'steps': 24669, 'loss/train': 1.5919777154922485} -11/07/2021 00:41:43 - INFO - __main__ - Step 24671: {'lr': 0.00047160823481457955, 'samples': 4736832, 'steps': 24670, 'loss/train': 1.7107733488082886} -11/07/2021 00:41:43 - INFO - __main__ - Step 24672: {'lr': 0.0004716057785006454, 'samples': 4737024, 'steps': 24671, 'loss/train': 1.3636122941970825} -11/07/2021 00:41:44 - INFO - __main__ - Step 24673: {'lr': 0.00047160332208685915, 'samples': 4737216, 'steps': 24672, 'loss/train': 3.1674327850341797} -11/07/2021 00:41:44 - INFO - __main__ - Step 24674: {'lr': 0.00047160086557322185, 'samples': 4737408, 'steps': 24673, 'loss/train': 1.5195907354354858} -11/07/2021 00:41:44 - INFO - __main__ - Step 24675: {'lr': 0.0004715984089597346, 'samples': 4737600, 'steps': 24674, 'loss/train': 0.8802253007888794} -11/07/2021 00:41:45 - INFO - __main__ - Step 24676: {'lr': 0.00047159595224639854, 'samples': 4737792, 'steps': 24675, 'loss/train': 1.9900333881378174} -11/07/2021 00:41:46 - INFO - __main__ - Step 24677: {'lr': 0.00047159349543321477, 'samples': 4737984, 'steps': 24676, 'loss/train': 1.7431213855743408} -11/07/2021 00:41:46 - INFO - __main__ - Step 24678: {'lr': 0.00047159103852018443, 'samples': 4738176, 'steps': 24677, 'loss/train': 1.8001621961593628} -11/07/2021 00:41:46 - INFO - __main__ - Step 24679: {'lr': 0.00047158858150730856, 'samples': 4738368, 'steps': 24678, 'loss/train': 1.2686253786087036} -11/07/2021 00:41:47 - INFO - __main__ - Step 24680: {'lr': 0.00047158612439458824, 'samples': 4738560, 'steps': 24679, 'loss/train': 1.2404592037200928} -11/07/2021 00:41:48 - INFO - __main__ - Step 24681: {'lr': 0.00047158366718202466, 'samples': 4738752, 'steps': 24680, 'loss/train': 1.5559760332107544} -11/07/2021 00:41:48 - INFO - __main__ - Step 24682: {'lr': 0.00047158120986961897, 'samples': 4738944, 'steps': 24681, 'loss/train': 1.5051125288009644} -11/07/2021 00:41:49 - INFO - __main__ - Step 24683: {'lr': 0.00047157875245737213, 'samples': 4739136, 'steps': 24682, 'loss/train': 1.294028401374817} -11/07/2021 00:41:49 - INFO - __main__ - Step 24684: {'lr': 0.0004715762949452853, 'samples': 4739328, 'steps': 24683, 'loss/train': 0.12313494086265564} -11/07/2021 00:41:49 - INFO - __main__ - Step 24685: {'lr': 0.0004715738373333597, 'samples': 4739520, 'steps': 24684, 'loss/train': 1.85573410987854} -11/07/2021 00:41:50 - INFO - __main__ - Step 24686: {'lr': 0.00047157137962159626, 'samples': 4739712, 'steps': 24685, 'loss/train': 1.5269348621368408} -11/07/2021 00:41:51 - INFO - __main__ - Step 24687: {'lr': 0.00047156892180999624, 'samples': 4739904, 'steps': 24686, 'loss/train': 1.6515963077545166} -11/07/2021 00:41:51 - INFO - __main__ - Step 24688: {'lr': 0.0004715664638985606, 'samples': 4740096, 'steps': 24687, 'loss/train': 1.681512713432312} -11/07/2021 00:41:51 - INFO - __main__ - Step 24689: {'lr': 0.00047156400588729066, 'samples': 4740288, 'steps': 24688, 'loss/train': 1.5862340927124023} -11/07/2021 00:41:52 - INFO - __main__ - Step 24690: {'lr': 0.0004715615477761873, 'samples': 4740480, 'steps': 24689, 'loss/train': 1.5726406574249268} -11/07/2021 00:41:52 - INFO - __main__ - Step 24691: {'lr': 0.00047155908956525173, 'samples': 4740672, 'steps': 24690, 'loss/train': 1.6381641626358032} -11/07/2021 00:41:53 - INFO - __main__ - Step 24692: {'lr': 0.00047155663125448514, 'samples': 4740864, 'steps': 24691, 'loss/train': 1.716679334640503} -11/07/2021 00:41:53 - INFO - __main__ - Step 24693: {'lr': 0.00047155417284388846, 'samples': 4741056, 'steps': 24692, 'loss/train': 1.490833044052124} -11/07/2021 00:41:54 - INFO - __main__ - Step 24694: {'lr': 0.0004715517143334629, 'samples': 4741248, 'steps': 24693, 'loss/train': 0.8225095272064209} -11/07/2021 00:41:54 - INFO - __main__ - Step 24695: {'lr': 0.00047154925572320957, 'samples': 4741440, 'steps': 24694, 'loss/train': 1.3117071390151978} -11/07/2021 00:41:55 - INFO - __main__ - Step 24696: {'lr': 0.00047154679701312953, 'samples': 4741632, 'steps': 24695, 'loss/train': 1.989949107170105} -11/07/2021 00:41:55 - INFO - __main__ - Step 24697: {'lr': 0.00047154433820322395, 'samples': 4741824, 'steps': 24696, 'loss/train': 1.3134007453918457} -11/07/2021 00:41:56 - INFO - __main__ - Step 24698: {'lr': 0.0004715418792934939, 'samples': 4742016, 'steps': 24697, 'loss/train': 0.13016371428966522} -11/07/2021 00:41:56 - INFO - __main__ - Step 24699: {'lr': 0.00047153942028394056, 'samples': 4742208, 'steps': 24698, 'loss/train': 1.5684603452682495} -11/07/2021 00:41:57 - INFO - __main__ - Step 24700: {'lr': 0.0004715369611745649, 'samples': 4742400, 'steps': 24699, 'loss/train': 1.6034104824066162} -11/07/2021 00:41:57 - INFO - __main__ - Step 24701: {'lr': 0.00047153450196536816, 'samples': 4742592, 'steps': 24700, 'loss/train': 1.284940242767334} -11/07/2021 00:41:57 - INFO - __main__ - Step 24702: {'lr': 0.00047153204265635136, 'samples': 4742784, 'steps': 24701, 'loss/train': 1.3234397172927856} -11/07/2021 00:41:59 - INFO - __main__ - Step 24703: {'lr': 0.0004715295832475156, 'samples': 4742976, 'steps': 24702, 'loss/train': 1.516232967376709} -11/07/2021 00:41:59 - INFO - __main__ - Step 24704: {'lr': 0.0004715271237388621, 'samples': 4743168, 'steps': 24703, 'loss/train': 1.805282711982727} -11/07/2021 00:41:59 - INFO - __main__ - Step 24705: {'lr': 0.00047152466413039187, 'samples': 4743360, 'steps': 24704, 'loss/train': 2.048011541366577} -11/07/2021 00:42:00 - INFO - __main__ - Step 24706: {'lr': 0.000471522204422106, 'samples': 4743552, 'steps': 24705, 'loss/train': 1.764803409576416} -11/07/2021 00:42:00 - INFO - __main__ - Step 24707: {'lr': 0.0004715197446140057, 'samples': 4743744, 'steps': 24706, 'loss/train': 0.7026177644729614} -11/07/2021 00:42:01 - INFO - __main__ - Step 24708: {'lr': 0.000471517284706092, 'samples': 4743936, 'steps': 24707, 'loss/train': 1.6084614992141724} -11/07/2021 00:42:01 - INFO - __main__ - Step 24709: {'lr': 0.0004715148246983661, 'samples': 4744128, 'steps': 24708, 'loss/train': 1.4565328359603882} -11/07/2021 00:42:02 - INFO - __main__ - Step 24710: {'lr': 0.000471512364590829, 'samples': 4744320, 'steps': 24709, 'loss/train': 1.3672226667404175} -11/07/2021 00:42:02 - INFO - __main__ - Step 24711: {'lr': 0.0004715099043834818, 'samples': 4744512, 'steps': 24710, 'loss/train': 1.6812454462051392} -11/07/2021 00:42:02 - INFO - __main__ - Step 24712: {'lr': 0.00047150744407632565, 'samples': 4744704, 'steps': 24711, 'loss/train': 1.1659122705459595} -11/07/2021 00:42:03 - INFO - __main__ - Step 24713: {'lr': 0.00047150498366936165, 'samples': 4744896, 'steps': 24712, 'loss/train': 1.7485889196395874} -11/07/2021 00:42:04 - INFO - __main__ - Step 24714: {'lr': 0.000471502523162591, 'samples': 4745088, 'steps': 24713, 'loss/train': 1.2086975574493408} -11/07/2021 00:42:04 - INFO - __main__ - Step 24715: {'lr': 0.00047150006255601475, 'samples': 4745280, 'steps': 24714, 'loss/train': 1.3149487972259521} -11/07/2021 00:42:04 - INFO - __main__ - Step 24716: {'lr': 0.00047149760184963385, 'samples': 4745472, 'steps': 24715, 'loss/train': 1.8487763404846191} -11/07/2021 00:42:05 - INFO - __main__ - Step 24717: {'lr': 0.0004714951410434497, 'samples': 4745664, 'steps': 24716, 'loss/train': 1.807113528251648} -11/07/2021 00:42:06 - INFO - __main__ - Step 24718: {'lr': 0.00047149268013746317, 'samples': 4745856, 'steps': 24717, 'loss/train': 1.892370343208313} -11/07/2021 00:42:06 - INFO - __main__ - Step 24719: {'lr': 0.00047149021913167545, 'samples': 4746048, 'steps': 24718, 'loss/train': 1.6956562995910645} -11/07/2021 00:42:06 - INFO - __main__ - Step 24720: {'lr': 0.0004714877580260877, 'samples': 4746240, 'steps': 24719, 'loss/train': 1.3320220708847046} -11/07/2021 00:42:07 - INFO - __main__ - Step 24721: {'lr': 0.00047148529682070094, 'samples': 4746432, 'steps': 24720, 'loss/train': 0.9560302495956421} -11/07/2021 00:42:07 - INFO - __main__ - Step 24722: {'lr': 0.00047148283551551643, 'samples': 4746624, 'steps': 24721, 'loss/train': 1.4561172723770142} -11/07/2021 00:42:08 - INFO - __main__ - Step 24723: {'lr': 0.000471480374110535, 'samples': 4746816, 'steps': 24722, 'loss/train': 1.6286498308181763} -11/07/2021 00:42:09 - INFO - __main__ - Step 24724: {'lr': 0.00047147791260575804, 'samples': 4747008, 'steps': 24723, 'loss/train': 1.5712597370147705} -11/07/2021 00:42:09 - INFO - __main__ - Step 24725: {'lr': 0.0004714754510011866, 'samples': 4747200, 'steps': 24724, 'loss/train': 1.409942865371704} -11/07/2021 00:42:09 - INFO - __main__ - Step 24726: {'lr': 0.0004714729892968216, 'samples': 4747392, 'steps': 24725, 'loss/train': 1.7029197216033936} -11/07/2021 00:42:10 - INFO - __main__ - Step 24727: {'lr': 0.0004714705274926644, 'samples': 4747584, 'steps': 24726, 'loss/train': 1.8137012720108032} -11/07/2021 00:42:11 - INFO - __main__ - Step 24728: {'lr': 0.00047146806558871594, 'samples': 4747776, 'steps': 24727, 'loss/train': 1.5736908912658691} -11/07/2021 00:42:11 - INFO - __main__ - Step 24729: {'lr': 0.0004714656035849774, 'samples': 4747968, 'steps': 24728, 'loss/train': 1.6693710088729858} -11/07/2021 00:42:11 - INFO - __main__ - Step 24730: {'lr': 0.00047146314148144986, 'samples': 4748160, 'steps': 24729, 'loss/train': 2.116982936859131} -11/07/2021 00:42:12 - INFO - __main__ - Step 24731: {'lr': 0.00047146067927813454, 'samples': 4748352, 'steps': 24730, 'loss/train': 1.2648699283599854} -11/07/2021 00:42:12 - INFO - __main__ - Step 24732: {'lr': 0.00047145821697503235, 'samples': 4748544, 'steps': 24731, 'loss/train': 1.6949464082717896} -11/07/2021 00:42:12 - INFO - __main__ - Step 24733: {'lr': 0.00047145575457214453, 'samples': 4748736, 'steps': 24732, 'loss/train': 1.6670206785202026} -11/07/2021 00:42:13 - INFO - __main__ - Step 24734: {'lr': 0.00047145329206947216, 'samples': 4748928, 'steps': 24733, 'loss/train': 1.1943016052246094} -11/07/2021 00:42:14 - INFO - __main__ - Step 24735: {'lr': 0.0004714508294670164, 'samples': 4749120, 'steps': 24734, 'loss/train': 1.3442723751068115} -11/07/2021 00:42:14 - INFO - __main__ - Step 24736: {'lr': 0.00047144836676477823, 'samples': 4749312, 'steps': 24735, 'loss/train': 1.4667487144470215} -11/07/2021 00:42:14 - INFO - __main__ - Step 24737: {'lr': 0.00047144590396275895, 'samples': 4749504, 'steps': 24736, 'loss/train': 1.4250119924545288} -11/07/2021 00:42:15 - INFO - __main__ - Step 24738: {'lr': 0.0004714434410609595, 'samples': 4749696, 'steps': 24737, 'loss/train': 1.235796332359314} -11/07/2021 00:42:16 - INFO - __main__ - Step 24739: {'lr': 0.00047144097805938104, 'samples': 4749888, 'steps': 24738, 'loss/train': 1.1943650245666504} -11/07/2021 00:42:16 - INFO - __main__ - Step 24740: {'lr': 0.0004714385149580247, 'samples': 4750080, 'steps': 24739, 'loss/train': 1.6702942848205566} -11/07/2021 00:42:17 - INFO - __main__ - Step 24741: {'lr': 0.0004714360517568916, 'samples': 4750272, 'steps': 24740, 'loss/train': 1.8867982625961304} -11/07/2021 00:42:17 - INFO - __main__ - Step 24742: {'lr': 0.00047143358845598283, 'samples': 4750464, 'steps': 24741, 'loss/train': 1.4710402488708496} -11/07/2021 00:42:17 - INFO - __main__ - Step 24743: {'lr': 0.0004714311250552995, 'samples': 4750656, 'steps': 24742, 'loss/train': 1.4312278032302856} -11/07/2021 00:42:18 - INFO - __main__ - Step 24744: {'lr': 0.0004714286615548427, 'samples': 4750848, 'steps': 24743, 'loss/train': 1.7704944610595703} -11/07/2021 00:42:19 - INFO - __main__ - Step 24745: {'lr': 0.00047142619795461363, 'samples': 4751040, 'steps': 24744, 'loss/train': 1.7733451128005981} -11/07/2021 00:42:19 - INFO - __main__ - Step 24746: {'lr': 0.0004714237342546133, 'samples': 4751232, 'steps': 24745, 'loss/train': 1.678723692893982} -11/07/2021 00:42:19 - INFO - __main__ - Step 24747: {'lr': 0.0004714212704548428, 'samples': 4751424, 'steps': 24746, 'loss/train': 1.2840992212295532} -11/07/2021 00:42:20 - INFO - __main__ - Step 24748: {'lr': 0.0004714188065553033, 'samples': 4751616, 'steps': 24747, 'loss/train': 1.23397696018219} -11/07/2021 00:42:21 - INFO - __main__ - Step 24749: {'lr': 0.000471416342555996, 'samples': 4751808, 'steps': 24748, 'loss/train': 1.9683762788772583} -11/07/2021 00:42:21 - INFO - __main__ - Step 24750: {'lr': 0.00047141387845692174, 'samples': 4752000, 'steps': 24749, 'loss/train': 1.8132466077804565} -11/07/2021 00:42:21 - INFO - __main__ - Step 24751: {'lr': 0.0004714114142580819, 'samples': 4752192, 'steps': 24750, 'loss/train': 1.5070856809616089} -11/07/2021 00:42:22 - INFO - __main__ - Step 24752: {'lr': 0.00047140894995947755, 'samples': 4752384, 'steps': 24751, 'loss/train': 1.3774813413619995} -11/07/2021 00:42:22 - INFO - __main__ - Step 24753: {'lr': 0.00047140648556110966, 'samples': 4752576, 'steps': 24752, 'loss/train': 1.7825654745101929} -11/07/2021 00:42:23 - INFO - __main__ - Step 24754: {'lr': 0.00047140402106297946, 'samples': 4752768, 'steps': 24753, 'loss/train': 1.9710283279418945} -11/07/2021 00:42:24 - INFO - __main__ - Step 24755: {'lr': 0.000471401556465088, 'samples': 4752960, 'steps': 24754, 'loss/train': 1.391543984413147} -11/07/2021 00:42:24 - INFO - __main__ - Step 24756: {'lr': 0.00047139909176743643, 'samples': 4753152, 'steps': 24755, 'loss/train': 1.6651687622070312} -11/07/2021 00:42:24 - INFO - __main__ - Step 24757: {'lr': 0.0004713966269700259, 'samples': 4753344, 'steps': 24756, 'loss/train': 1.1757967472076416} -11/07/2021 00:42:25 - INFO - __main__ - Step 24758: {'lr': 0.0004713941620728574, 'samples': 4753536, 'steps': 24757, 'loss/train': 1.1249995231628418} -11/07/2021 00:42:25 - INFO - __main__ - Step 24759: {'lr': 0.0004713916970759321, 'samples': 4753728, 'steps': 24758, 'loss/train': 1.7377405166625977} -11/07/2021 00:42:26 - INFO - __main__ - Step 24760: {'lr': 0.0004713892319792512, 'samples': 4753920, 'steps': 24759, 'loss/train': 2.043972969055176} -11/07/2021 00:42:26 - INFO - __main__ - Step 24761: {'lr': 0.00047138676678281564, 'samples': 4754112, 'steps': 24760, 'loss/train': 1.4563531875610352} -11/07/2021 00:42:27 - INFO - __main__ - Step 24762: {'lr': 0.00047138430148662666, 'samples': 4754304, 'steps': 24761, 'loss/train': 1.994339942932129} -11/07/2021 00:42:27 - INFO - __main__ - Step 24763: {'lr': 0.0004713818360906853, 'samples': 4754496, 'steps': 24762, 'loss/train': 1.8650447130203247} -11/07/2021 00:42:27 - INFO - __main__ - Step 24764: {'lr': 0.0004713793705949927, 'samples': 4754688, 'steps': 24763, 'loss/train': 0.8770702481269836} -11/07/2021 00:42:29 - INFO - __main__ - Step 24765: {'lr': 0.00047137690499955, 'samples': 4754880, 'steps': 24764, 'loss/train': 1.3111677169799805} -11/07/2021 00:42:29 - INFO - __main__ - Step 24766: {'lr': 0.0004713744393043583, 'samples': 4755072, 'steps': 24765, 'loss/train': 1.0300610065460205} -11/07/2021 00:42:30 - INFO - __main__ - Step 24767: {'lr': 0.00047137197350941864, 'samples': 4755264, 'steps': 24766, 'loss/train': 1.0892693996429443} -11/07/2021 00:42:30 - INFO - __main__ - Step 24768: {'lr': 0.0004713695076147322, 'samples': 4755456, 'steps': 24767, 'loss/train': 0.11573341488838196} -11/07/2021 00:42:30 - INFO - __main__ - Step 24769: {'lr': 0.0004713670416203001, 'samples': 4755648, 'steps': 24768, 'loss/train': 1.62954580783844} -11/07/2021 00:42:31 - INFO - __main__ - Step 24770: {'lr': 0.00047136457552612344, 'samples': 4755840, 'steps': 24769, 'loss/train': 0.083526112139225} -11/07/2021 00:42:32 - INFO - __main__ - Step 24771: {'lr': 0.00047136210933220325, 'samples': 4756032, 'steps': 24770, 'loss/train': 1.3785045146942139} -11/07/2021 00:42:32 - INFO - __main__ - Step 24772: {'lr': 0.0004713596430385408, 'samples': 4756224, 'steps': 24771, 'loss/train': 2.175171375274658} -11/07/2021 00:42:32 - INFO - __main__ - Step 24773: {'lr': 0.00047135717664513704, 'samples': 4756416, 'steps': 24772, 'loss/train': 1.426689863204956} -11/07/2021 00:42:33 - INFO - __main__ - Step 24774: {'lr': 0.00047135471015199315, 'samples': 4756608, 'steps': 24773, 'loss/train': 1.5172810554504395} -11/07/2021 00:42:33 - INFO - __main__ - Step 24775: {'lr': 0.00047135224355911035, 'samples': 4756800, 'steps': 24774, 'loss/train': 1.5251126289367676} -11/07/2021 00:42:34 - INFO - __main__ - Step 24776: {'lr': 0.0004713497768664895, 'samples': 4756992, 'steps': 24775, 'loss/train': 1.8335155248641968} -11/07/2021 00:42:34 - INFO - __main__ - Step 24777: {'lr': 0.00047134731007413195, 'samples': 4757184, 'steps': 24776, 'loss/train': 1.5030866861343384} -11/07/2021 00:42:35 - INFO - __main__ - Step 24778: {'lr': 0.0004713448431820387, 'samples': 4757376, 'steps': 24777, 'loss/train': 1.5333009958267212} -11/07/2021 00:42:35 - INFO - __main__ - Step 24779: {'lr': 0.00047134237619021085, 'samples': 4757568, 'steps': 24778, 'loss/train': 1.6005456447601318} -11/07/2021 00:42:36 - INFO - __main__ - Step 24780: {'lr': 0.00047133990909864953, 'samples': 4757760, 'steps': 24779, 'loss/train': 1.6143572330474854} -11/07/2021 00:42:36 - INFO - __main__ - Step 24781: {'lr': 0.0004713374419073559, 'samples': 4757952, 'steps': 24780, 'loss/train': 1.168927550315857} -11/07/2021 00:42:37 - INFO - __main__ - Step 24782: {'lr': 0.000471334974616331, 'samples': 4758144, 'steps': 24781, 'loss/train': 1.3281073570251465} -11/07/2021 00:42:37 - INFO - __main__ - Step 24783: {'lr': 0.0004713325072255761, 'samples': 4758336, 'steps': 24782, 'loss/train': 1.2812906503677368} -11/07/2021 00:42:38 - INFO - __main__ - Step 24784: {'lr': 0.000471330039735092, 'samples': 4758528, 'steps': 24783, 'loss/train': 1.1857270002365112} -11/07/2021 00:42:38 - INFO - __main__ - Step 24785: {'lr': 0.0004713275721448801, 'samples': 4758720, 'steps': 24784, 'loss/train': 1.8095072507858276} -11/07/2021 00:42:39 - INFO - __main__ - Step 24786: {'lr': 0.0004713251044549414, 'samples': 4758912, 'steps': 24785, 'loss/train': 1.5033193826675415} -11/07/2021 00:42:39 - INFO - __main__ - Step 24787: {'lr': 0.000471322636665277, 'samples': 4759104, 'steps': 24786, 'loss/train': 1.3253549337387085} -11/07/2021 00:42:40 - INFO - __main__ - Step 24788: {'lr': 0.0004713201687758881, 'samples': 4759296, 'steps': 24787, 'loss/train': 1.9118258953094482} -11/07/2021 00:42:40 - INFO - __main__ - Step 24789: {'lr': 0.00047131770078677574, 'samples': 4759488, 'steps': 24788, 'loss/train': 1.806757926940918} -11/07/2021 00:42:40 - INFO - __main__ - Step 24790: {'lr': 0.000471315232697941, 'samples': 4759680, 'steps': 24789, 'loss/train': 1.7934147119522095} -11/07/2021 00:42:41 - INFO - __main__ - Step 24791: {'lr': 0.000471312764509385, 'samples': 4759872, 'steps': 24790, 'loss/train': 1.5426182746887207} -11/07/2021 00:42:42 - INFO - __main__ - Step 24792: {'lr': 0.0004713102962211089, 'samples': 4760064, 'steps': 24791, 'loss/train': 1.2751450538635254} -11/07/2021 00:42:42 - INFO - __main__ - Step 24793: {'lr': 0.0004713078278331138, 'samples': 4760256, 'steps': 24792, 'loss/train': 1.8063607215881348} -11/07/2021 00:42:42 - INFO - __main__ - Step 24794: {'lr': 0.00047130535934540086, 'samples': 4760448, 'steps': 24793, 'loss/train': 1.7444671392440796} -11/07/2021 00:42:43 - INFO - __main__ - Step 24795: {'lr': 0.00047130289075797107, 'samples': 4760640, 'steps': 24794, 'loss/train': 1.5532677173614502} -11/07/2021 00:42:44 - INFO - __main__ - Step 24796: {'lr': 0.0004713004220708257, 'samples': 4760832, 'steps': 24795, 'loss/train': 1.6229361295700073} -11/07/2021 00:42:44 - INFO - __main__ - Step 24797: {'lr': 0.0004712979532839656, 'samples': 4761024, 'steps': 24796, 'loss/train': 1.5406346321105957} -11/07/2021 00:42:44 - INFO - __main__ - Step 24798: {'lr': 0.00047129548439739225, 'samples': 4761216, 'steps': 24797, 'loss/train': 1.52739417552948} -11/07/2021 00:42:45 - INFO - __main__ - Step 24799: {'lr': 0.0004712930154111065, 'samples': 4761408, 'steps': 24798, 'loss/train': 1.6242315769195557} -11/07/2021 00:42:45 - INFO - __main__ - Step 24800: {'lr': 0.00047129054632510947, 'samples': 4761600, 'steps': 24799, 'loss/train': 0.9558914303779602} -11/07/2021 00:42:46 - INFO - __main__ - Step 24801: {'lr': 0.00047128807713940244, 'samples': 4761792, 'steps': 24800, 'loss/train': 1.9542592763900757} -11/07/2021 00:42:46 - INFO - __main__ - Step 24802: {'lr': 0.00047128560785398633, 'samples': 4761984, 'steps': 24801, 'loss/train': 2.2053301334381104} -11/07/2021 00:42:47 - INFO - __main__ - Step 24803: {'lr': 0.0004712831384688624, 'samples': 4762176, 'steps': 24802, 'loss/train': 1.2068068981170654} -11/07/2021 00:42:47 - INFO - __main__ - Step 24804: {'lr': 0.00047128066898403166, 'samples': 4762368, 'steps': 24803, 'loss/train': 1.2261611223220825} -11/07/2021 00:42:47 - INFO - __main__ - Step 24805: {'lr': 0.00047127819939949534, 'samples': 4762560, 'steps': 24804, 'loss/train': 1.5846295356750488} -11/07/2021 00:42:49 - INFO - __main__ - Step 24806: {'lr': 0.00047127572971525437, 'samples': 4762752, 'steps': 24805, 'loss/train': 1.7221107482910156} -11/07/2021 00:42:49 - INFO - __main__ - Step 24807: {'lr': 0.00047127325993131006, 'samples': 4762944, 'steps': 24806, 'loss/train': 1.6136387586593628} -11/07/2021 00:42:49 - INFO - __main__ - Step 24808: {'lr': 0.0004712707900476634, 'samples': 4763136, 'steps': 24807, 'loss/train': 1.6903235912322998} -11/07/2021 00:42:50 - INFO - __main__ - Step 24809: {'lr': 0.00047126832006431555, 'samples': 4763328, 'steps': 24808, 'loss/train': 1.5415527820587158} -11/07/2021 00:42:50 - INFO - __main__ - Step 24810: {'lr': 0.00047126584998126756, 'samples': 4763520, 'steps': 24809, 'loss/train': 1.7238624095916748} -11/07/2021 00:42:51 - INFO - __main__ - Step 24811: {'lr': 0.0004712633797985206, 'samples': 4763712, 'steps': 24810, 'loss/train': 2.1266679763793945} -11/07/2021 00:42:51 - INFO - __main__ - Step 24812: {'lr': 0.0004712609095160758, 'samples': 4763904, 'steps': 24811, 'loss/train': 1.6983754634857178} -11/07/2021 00:42:52 - INFO - __main__ - Step 24813: {'lr': 0.0004712584391339343, 'samples': 4764096, 'steps': 24812, 'loss/train': 1.1013861894607544} -11/07/2021 00:42:52 - INFO - __main__ - Step 24814: {'lr': 0.0004712559686520971, 'samples': 4764288, 'steps': 24813, 'loss/train': 0.8070735335350037} -11/07/2021 00:42:52 - INFO - __main__ - Step 24815: {'lr': 0.0004712534980705654, 'samples': 4764480, 'steps': 24814, 'loss/train': 1.4523907899856567} -11/07/2021 00:42:53 - INFO - __main__ - Step 24816: {'lr': 0.0004712510273893402, 'samples': 4764672, 'steps': 24815, 'loss/train': 2.0529558658599854} -11/07/2021 00:42:54 - INFO - __main__ - Step 24817: {'lr': 0.00047124855660842283, 'samples': 4764864, 'steps': 24816, 'loss/train': 1.5841693878173828} -11/07/2021 00:42:54 - INFO - __main__ - Step 24818: {'lr': 0.00047124608572781426, 'samples': 4765056, 'steps': 24817, 'loss/train': 0.8408837914466858} -11/07/2021 00:42:54 - INFO - __main__ - Step 24819: {'lr': 0.0004712436147475155, 'samples': 4765248, 'steps': 24818, 'loss/train': 1.3041859865188599} -11/07/2021 00:42:55 - INFO - __main__ - Step 24820: {'lr': 0.0004712411436675279, 'samples': 4765440, 'steps': 24819, 'loss/train': 2.031338691711426} -11/07/2021 00:42:56 - INFO - __main__ - Step 24821: {'lr': 0.0004712386724878524, 'samples': 4765632, 'steps': 24820, 'loss/train': 1.229081392288208} -11/07/2021 00:42:56 - INFO - __main__ - Step 24822: {'lr': 0.0004712362012084902, 'samples': 4765824, 'steps': 24821, 'loss/train': 1.6977263689041138} -11/07/2021 00:42:57 - INFO - __main__ - Step 24823: {'lr': 0.00047123372982944237, 'samples': 4766016, 'steps': 24822, 'loss/train': 1.9030191898345947} -11/07/2021 00:42:57 - INFO - __main__ - Step 24824: {'lr': 0.00047123125835071004, 'samples': 4766208, 'steps': 24823, 'loss/train': 1.301546573638916} -11/07/2021 00:42:57 - INFO - __main__ - Step 24825: {'lr': 0.00047122878677229426, 'samples': 4766400, 'steps': 24824, 'loss/train': 2.0315120220184326} -11/07/2021 00:42:58 - INFO - __main__ - Step 24826: {'lr': 0.0004712263150941962, 'samples': 4766592, 'steps': 24825, 'loss/train': 1.5814260244369507} -11/07/2021 00:42:59 - INFO - __main__ - Step 24827: {'lr': 0.0004712238433164171, 'samples': 4766784, 'steps': 24826, 'loss/train': 1.3355937004089355} -11/07/2021 00:42:59 - INFO - __main__ - Step 24828: {'lr': 0.00047122137143895785, 'samples': 4766976, 'steps': 24827, 'loss/train': 1.3185474872589111} -11/07/2021 00:42:59 - INFO - __main__ - Step 24829: {'lr': 0.0004712188994618197, 'samples': 4767168, 'steps': 24828, 'loss/train': 1.5112864971160889} -11/07/2021 00:43:00 - INFO - __main__ - Step 24830: {'lr': 0.0004712164273850037, 'samples': 4767360, 'steps': 24829, 'loss/train': 1.3218666315078735} -11/07/2021 00:43:01 - INFO - __main__ - Step 24831: {'lr': 0.00047121395520851103, 'samples': 4767552, 'steps': 24830, 'loss/train': 0.8458890914916992} -11/07/2021 00:43:01 - INFO - __main__ - Step 24832: {'lr': 0.00047121148293234274, 'samples': 4767744, 'steps': 24831, 'loss/train': 1.7730728387832642} -11/07/2021 00:43:02 - INFO - __main__ - Step 24833: {'lr': 0.00047120901055649995, 'samples': 4767936, 'steps': 24832, 'loss/train': 1.6675069332122803} -11/07/2021 00:43:02 - INFO - __main__ - Step 24834: {'lr': 0.0004712065380809838, 'samples': 4768128, 'steps': 24833, 'loss/train': 1.794461965560913} -11/07/2021 00:43:02 - INFO - __main__ - Step 24835: {'lr': 0.0004712040655057954, 'samples': 4768320, 'steps': 24834, 'loss/train': 1.578720211982727} -11/07/2021 00:43:03 - INFO - __main__ - Step 24836: {'lr': 0.0004712015928309359, 'samples': 4768512, 'steps': 24835, 'loss/train': 1.6604273319244385} -11/07/2021 00:43:04 - INFO - __main__ - Step 24837: {'lr': 0.0004711991200564064, 'samples': 4768704, 'steps': 24836, 'loss/train': 1.5459864139556885} -11/07/2021 00:43:04 - INFO - __main__ - Step 24838: {'lr': 0.0004711966471822079, 'samples': 4768896, 'steps': 24837, 'loss/train': 1.748180627822876} -11/07/2021 00:43:04 - INFO - __main__ - Step 24839: {'lr': 0.00047119417420834163, 'samples': 4769088, 'steps': 24838, 'loss/train': 1.8245811462402344} -11/07/2021 00:43:05 - INFO - __main__ - Step 24840: {'lr': 0.00047119170113480867, 'samples': 4769280, 'steps': 24839, 'loss/train': 1.0669902563095093} -11/07/2021 00:43:05 - INFO - __main__ - Step 24841: {'lr': 0.00047118922796161026, 'samples': 4769472, 'steps': 24840, 'loss/train': 0.9569848775863647} -11/07/2021 00:43:06 - INFO - __main__ - Step 24842: {'lr': 0.00047118675468874727, 'samples': 4769664, 'steps': 24841, 'loss/train': 1.7010862827301025} -11/07/2021 00:43:06 - INFO - __main__ - Step 24843: {'lr': 0.00047118428131622095, 'samples': 4769856, 'steps': 24842, 'loss/train': 1.2079625129699707} -11/07/2021 00:43:07 - INFO - __main__ - Step 24844: {'lr': 0.00047118180784403243, 'samples': 4770048, 'steps': 24843, 'loss/train': 1.1464524269104004} -11/07/2021 00:43:07 - INFO - __main__ - Step 24845: {'lr': 0.0004711793342721828, 'samples': 4770240, 'steps': 24844, 'loss/train': 1.9089672565460205} -11/07/2021 00:43:07 - INFO - __main__ - Step 24846: {'lr': 0.00047117686060067315, 'samples': 4770432, 'steps': 24845, 'loss/train': 1.6078968048095703} -11/07/2021 00:43:08 - INFO - __main__ - Step 24847: {'lr': 0.00047117438682950467, 'samples': 4770624, 'steps': 24846, 'loss/train': 1.0903383493423462} -11/07/2021 00:43:09 - INFO - __main__ - Step 24848: {'lr': 0.0004711719129586784, 'samples': 4770816, 'steps': 24847, 'loss/train': 1.6833618879318237} -11/07/2021 00:43:09 - INFO - __main__ - Step 24849: {'lr': 0.0004711694389881955, 'samples': 4771008, 'steps': 24848, 'loss/train': 1.607546329498291} -11/07/2021 00:43:09 - INFO - __main__ - Step 24850: {'lr': 0.000471166964918057, 'samples': 4771200, 'steps': 24849, 'loss/train': 1.469663381576538} -11/07/2021 00:43:10 - INFO - __main__ - Step 24851: {'lr': 0.0004711644907482641, 'samples': 4771392, 'steps': 24850, 'loss/train': 1.3836008310317993} -11/07/2021 00:43:11 - INFO - __main__ - Step 24852: {'lr': 0.00047116201647881794, 'samples': 4771584, 'steps': 24851, 'loss/train': 1.6112840175628662} -11/07/2021 00:43:11 - INFO - __main__ - Step 24853: {'lr': 0.00047115954210971955, 'samples': 4771776, 'steps': 24852, 'loss/train': 1.1933653354644775} -11/07/2021 00:43:12 - INFO - __main__ - Step 24854: {'lr': 0.0004711570676409701, 'samples': 4771968, 'steps': 24853, 'loss/train': 0.9327288866043091} -11/07/2021 00:43:12 - INFO - __main__ - Step 24855: {'lr': 0.0004711545930725707, 'samples': 4772160, 'steps': 24854, 'loss/train': 1.3270524740219116} -11/07/2021 00:43:12 - INFO - __main__ - Step 24856: {'lr': 0.0004711521184045224, 'samples': 4772352, 'steps': 24855, 'loss/train': 1.958956241607666} -11/07/2021 00:43:13 - INFO - __main__ - Step 24857: {'lr': 0.0004711496436368264, 'samples': 4772544, 'steps': 24856, 'loss/train': 1.4110667705535889} -11/07/2021 00:43:14 - INFO - __main__ - Step 24858: {'lr': 0.00047114716876948384, 'samples': 4772736, 'steps': 24857, 'loss/train': 2.1115291118621826} -11/07/2021 00:43:14 - INFO - __main__ - Step 24859: {'lr': 0.0004711446938024957, 'samples': 4772928, 'steps': 24858, 'loss/train': 1.4857505559921265} -11/07/2021 00:43:14 - INFO - __main__ - Step 24860: {'lr': 0.00047114221873586316, 'samples': 4773120, 'steps': 24859, 'loss/train': 1.7145774364471436} -11/07/2021 00:43:15 - INFO - __main__ - Step 24861: {'lr': 0.00047113974356958744, 'samples': 4773312, 'steps': 24860, 'loss/train': 1.6529386043548584} -11/07/2021 00:43:16 - INFO - __main__ - Step 24862: {'lr': 0.0004711372683036695, 'samples': 4773504, 'steps': 24861, 'loss/train': 1.7494276762008667} -11/07/2021 00:43:16 - INFO - __main__ - Step 24863: {'lr': 0.0004711347929381105, 'samples': 4773696, 'steps': 24862, 'loss/train': 1.3992499113082886} -11/07/2021 00:43:16 - INFO - __main__ - Step 24864: {'lr': 0.00047113231747291165, 'samples': 4773888, 'steps': 24863, 'loss/train': 1.5058045387268066} -11/07/2021 00:43:17 - INFO - __main__ - Step 24865: {'lr': 0.0004711298419080739, 'samples': 4774080, 'steps': 24864, 'loss/train': 1.6152267456054688} -11/07/2021 00:43:17 - INFO - __main__ - Step 24866: {'lr': 0.00047112736624359855, 'samples': 4774272, 'steps': 24865, 'loss/train': 1.489564061164856} -11/07/2021 00:43:18 - INFO - __main__ - Step 24867: {'lr': 0.00047112489047948655, 'samples': 4774464, 'steps': 24866, 'loss/train': 1.7998241186141968} -11/07/2021 00:43:18 - INFO - __main__ - Step 24868: {'lr': 0.00047112241461573913, 'samples': 4774656, 'steps': 24867, 'loss/train': 1.6361345052719116} -11/07/2021 00:43:19 - INFO - __main__ - Step 24869: {'lr': 0.0004711199386523573, 'samples': 4774848, 'steps': 24868, 'loss/train': 1.5118496417999268} -11/07/2021 00:43:19 - INFO - __main__ - Step 24870: {'lr': 0.0004711174625893423, 'samples': 4775040, 'steps': 24869, 'loss/train': 1.597435474395752} -11/07/2021 00:43:20 - INFO - __main__ - Step 24871: {'lr': 0.00047111498642669517, 'samples': 4775232, 'steps': 24870, 'loss/train': 2.201490640640259} -11/07/2021 00:43:20 - INFO - __main__ - Step 24872: {'lr': 0.00047111251016441704, 'samples': 4775424, 'steps': 24871, 'loss/train': 1.4889650344848633} -11/07/2021 00:43:21 - INFO - __main__ - Step 24873: {'lr': 0.0004711100338025089, 'samples': 4775616, 'steps': 24872, 'loss/train': 1.5616157054901123} -11/07/2021 00:43:21 - INFO - __main__ - Step 24874: {'lr': 0.00047110755734097216, 'samples': 4775808, 'steps': 24873, 'loss/train': 1.6636919975280762} -11/07/2021 00:43:22 - INFO - __main__ - Step 24875: {'lr': 0.00047110508077980774, 'samples': 4776000, 'steps': 24874, 'loss/train': 1.9187812805175781} -11/07/2021 00:43:22 - INFO - __main__ - Step 24876: {'lr': 0.00047110260411901674, 'samples': 4776192, 'steps': 24875, 'loss/train': 1.4029637575149536} -11/07/2021 00:43:22 - INFO - __main__ - Step 24877: {'lr': 0.0004711001273586003, 'samples': 4776384, 'steps': 24876, 'loss/train': 1.7008123397827148} -11/07/2021 00:43:23 - INFO - __main__ - Step 24878: {'lr': 0.0004710976504985596, 'samples': 4776576, 'steps': 24877, 'loss/train': 1.076745629310608} -11/07/2021 00:43:24 - INFO - __main__ - Step 24879: {'lr': 0.00047109517353889575, 'samples': 4776768, 'steps': 24878, 'loss/train': 1.3435444831848145} -11/07/2021 00:43:24 - INFO - __main__ - Step 24880: {'lr': 0.0004710926964796097, 'samples': 4776960, 'steps': 24879, 'loss/train': 1.8936501741409302} -11/07/2021 00:43:25 - INFO - __main__ - Step 24881: {'lr': 0.00047109021932070284, 'samples': 4777152, 'steps': 24880, 'loss/train': 1.713632345199585} -11/07/2021 00:43:25 - INFO - __main__ - Step 24882: {'lr': 0.00047108774206217605, 'samples': 4777344, 'steps': 24881, 'loss/train': 1.4235851764678955} -11/07/2021 00:43:26 - INFO - __main__ - Step 24883: {'lr': 0.00047108526470403055, 'samples': 4777536, 'steps': 24882, 'loss/train': 1.850601077079773} -11/07/2021 00:43:26 - INFO - __main__ - Step 24884: {'lr': 0.0004710827872462674, 'samples': 4777728, 'steps': 24883, 'loss/train': 1.433193564414978} -11/07/2021 00:43:27 - INFO - __main__ - Step 24885: {'lr': 0.00047108030968888784, 'samples': 4777920, 'steps': 24884, 'loss/train': 1.4146473407745361} -11/07/2021 00:43:27 - INFO - __main__ - Step 24886: {'lr': 0.00047107783203189285, 'samples': 4778112, 'steps': 24885, 'loss/train': 1.2156516313552856} -11/07/2021 00:43:27 - INFO - __main__ - Step 24887: {'lr': 0.0004710753542752836, 'samples': 4778304, 'steps': 24886, 'loss/train': 1.2330988645553589} -11/07/2021 00:43:29 - INFO - __main__ - Step 24888: {'lr': 0.0004710728764190612, 'samples': 4778496, 'steps': 24887, 'loss/train': 1.2248584032058716} -11/07/2021 00:43:29 - INFO - __main__ - Step 24889: {'lr': 0.0004710703984632268, 'samples': 4778688, 'steps': 24888, 'loss/train': 1.356774926185608} -11/07/2021 00:43:29 - INFO - __main__ - Step 24890: {'lr': 0.0004710679204077815, 'samples': 4778880, 'steps': 24889, 'loss/train': 1.610066294670105} -11/07/2021 00:43:30 - INFO - __main__ - Step 24891: {'lr': 0.0004710654422527264, 'samples': 4779072, 'steps': 24890, 'loss/train': 1.2098134756088257} -11/07/2021 00:43:30 - INFO - __main__ - Step 24892: {'lr': 0.0004710629639980626, 'samples': 4779264, 'steps': 24891, 'loss/train': 1.6932626962661743} -11/07/2021 00:43:30 - INFO - __main__ - Step 24893: {'lr': 0.0004710604856437912, 'samples': 4779456, 'steps': 24892, 'loss/train': 1.8135350942611694} -11/07/2021 00:43:31 - INFO - __main__ - Step 24894: {'lr': 0.00047105800718991343, 'samples': 4779648, 'steps': 24893, 'loss/train': 2.8847551345825195} -11/07/2021 00:43:32 - INFO - __main__ - Step 24895: {'lr': 0.0004710555286364303, 'samples': 4779840, 'steps': 24894, 'loss/train': 2.1138551235198975} -11/07/2021 00:43:32 - INFO - __main__ - Step 24896: {'lr': 0.000471053049983343, 'samples': 4780032, 'steps': 24895, 'loss/train': 0.3590337634086609} -11/07/2021 00:43:32 - INFO - __main__ - Step 24897: {'lr': 0.0004710505712306526, 'samples': 4780224, 'steps': 24896, 'loss/train': 1.4603281021118164} -11/07/2021 00:43:33 - INFO - __main__ - Step 24898: {'lr': 0.00047104809237836023, 'samples': 4780416, 'steps': 24897, 'loss/train': 1.2135181427001953} -11/07/2021 00:43:34 - INFO - __main__ - Step 24899: {'lr': 0.0004710456134264669, 'samples': 4780608, 'steps': 24898, 'loss/train': 1.645835518836975} -11/07/2021 00:43:34 - INFO - __main__ - Step 24900: {'lr': 0.0004710431343749739, 'samples': 4780800, 'steps': 24899, 'loss/train': 1.6387699842453003} -11/07/2021 00:43:35 - INFO - __main__ - Step 24901: {'lr': 0.0004710406552238823, 'samples': 4780992, 'steps': 24900, 'loss/train': 1.8654963970184326} -11/07/2021 00:43:35 - INFO - __main__ - Step 24902: {'lr': 0.0004710381759731932, 'samples': 4781184, 'steps': 24901, 'loss/train': 1.5616538524627686} -11/07/2021 00:43:35 - INFO - __main__ - Step 24903: {'lr': 0.0004710356966229077, 'samples': 4781376, 'steps': 24902, 'loss/train': 0.9458338022232056} -11/07/2021 00:43:36 - INFO - __main__ - Step 24904: {'lr': 0.00047103321717302684, 'samples': 4781568, 'steps': 24903, 'loss/train': 1.0792574882507324} -11/07/2021 00:43:37 - INFO - __main__ - Step 24905: {'lr': 0.00047103073762355186, 'samples': 4781760, 'steps': 24904, 'loss/train': 1.4467488527297974} -11/07/2021 00:43:37 - INFO - __main__ - Step 24906: {'lr': 0.0004710282579744839, 'samples': 4781952, 'steps': 24905, 'loss/train': 2.028386116027832} -11/07/2021 00:43:38 - INFO - __main__ - Step 24907: {'lr': 0.000471025778225824, 'samples': 4782144, 'steps': 24906, 'loss/train': 1.469319462776184} -11/07/2021 00:43:38 - INFO - __main__ - Step 24908: {'lr': 0.0004710232983775733, 'samples': 4782336, 'steps': 24907, 'loss/train': 1.626294493675232} -11/07/2021 00:43:39 - INFO - __main__ - Step 24909: {'lr': 0.0004710208184297329, 'samples': 4782528, 'steps': 24908, 'loss/train': 0.9432609677314758} -11/07/2021 00:43:39 - INFO - __main__ - Step 24910: {'lr': 0.0004710183383823039, 'samples': 4782720, 'steps': 24909, 'loss/train': 1.1606712341308594} -11/07/2021 00:43:40 - INFO - __main__ - Step 24911: {'lr': 0.00047101585823528745, 'samples': 4782912, 'steps': 24910, 'loss/train': 1.397504210472107} -11/07/2021 00:43:40 - INFO - __main__ - Step 24912: {'lr': 0.0004710133779886847, 'samples': 4783104, 'steps': 24911, 'loss/train': 1.5968561172485352} -11/07/2021 00:43:40 - INFO - __main__ - Step 24913: {'lr': 0.00047101089764249674, 'samples': 4783296, 'steps': 24912, 'loss/train': 1.6054977178573608} -11/07/2021 00:43:42 - INFO - __main__ - Step 24914: {'lr': 0.0004710084171967246, 'samples': 4783488, 'steps': 24913, 'loss/train': 1.6846996545791626} -11/07/2021 00:43:42 - INFO - __main__ - Step 24915: {'lr': 0.00047100593665136946, 'samples': 4783680, 'steps': 24914, 'loss/train': 1.5156437158584595} -11/07/2021 00:43:42 - INFO - __main__ - Step 24916: {'lr': 0.0004710034560064326, 'samples': 4783872, 'steps': 24915, 'loss/train': 1.3427435159683228} -11/07/2021 00:43:43 - INFO - __main__ - Step 24917: {'lr': 0.00047100097526191486, 'samples': 4784064, 'steps': 24916, 'loss/train': 0.7655185461044312} -11/07/2021 00:43:43 - INFO - __main__ - Step 24918: {'lr': 0.0004709984944178176, 'samples': 4784256, 'steps': 24917, 'loss/train': 1.5302414894104004} -11/07/2021 00:43:43 - INFO - __main__ - Step 24919: {'lr': 0.0004709960134741418, 'samples': 4784448, 'steps': 24918, 'loss/train': 1.8170706033706665} -11/07/2021 00:43:44 - INFO - __main__ - Step 24920: {'lr': 0.00047099353243088856, 'samples': 4784640, 'steps': 24919, 'loss/train': 1.6895228624343872} -11/07/2021 00:43:45 - INFO - __main__ - Step 24921: {'lr': 0.00047099105128805906, 'samples': 4784832, 'steps': 24920, 'loss/train': 1.7223882675170898} -11/07/2021 00:43:45 - INFO - __main__ - Step 24922: {'lr': 0.00047098857004565444, 'samples': 4785024, 'steps': 24921, 'loss/train': 2.0453617572784424} -11/07/2021 00:43:45 - INFO - __main__ - Step 24923: {'lr': 0.00047098608870367576, 'samples': 4785216, 'steps': 24922, 'loss/train': 1.4374672174453735} -11/07/2021 00:43:46 - INFO - __main__ - Step 24924: {'lr': 0.00047098360726212406, 'samples': 4785408, 'steps': 24923, 'loss/train': 1.454687237739563} -11/07/2021 00:43:47 - INFO - __main__ - Step 24925: {'lr': 0.0004709811257210007, 'samples': 4785600, 'steps': 24924, 'loss/train': 1.4822044372558594} -11/07/2021 00:43:47 - INFO - __main__ - Step 24926: {'lr': 0.0004709786440803066, 'samples': 4785792, 'steps': 24925, 'loss/train': 2.3867578506469727} -11/07/2021 00:43:48 - INFO - __main__ - Step 24927: {'lr': 0.00047097616234004295, 'samples': 4785984, 'steps': 24926, 'loss/train': 4.5228352546691895} -11/07/2021 00:43:48 - INFO - __main__ - Step 24928: {'lr': 0.00047097368050021083, 'samples': 4786176, 'steps': 24927, 'loss/train': 2.299553394317627} -11/07/2021 00:43:48 - INFO - __main__ - Step 24929: {'lr': 0.0004709711985608114, 'samples': 4786368, 'steps': 24928, 'loss/train': 1.8573694229125977} -11/07/2021 00:43:49 - INFO - __main__ - Step 24930: {'lr': 0.0004709687165218457, 'samples': 4786560, 'steps': 24929, 'loss/train': 5.637241363525391} -11/07/2021 00:43:50 - INFO - __main__ - Step 24931: {'lr': 0.00047096623438331497, 'samples': 4786752, 'steps': 24930, 'loss/train': 0.7219381332397461} -11/07/2021 00:43:50 - INFO - __main__ - Step 24932: {'lr': 0.00047096375214522026, 'samples': 4786944, 'steps': 24931, 'loss/train': 1.7461594343185425} -11/07/2021 00:43:50 - INFO - __main__ - Step 24933: {'lr': 0.0004709612698075627, 'samples': 4787136, 'steps': 24932, 'loss/train': 2.014444351196289} -11/07/2021 00:43:51 - INFO - __main__ - Step 24934: {'lr': 0.00047095878737034335, 'samples': 4787328, 'steps': 24933, 'loss/train': 1.3692693710327148} -11/07/2021 00:43:51 - INFO - __main__ - Step 24935: {'lr': 0.00047095630483356336, 'samples': 4787520, 'steps': 24934, 'loss/train': 1.5486135482788086} -11/07/2021 00:43:52 - INFO - __main__ - Step 24936: {'lr': 0.00047095382219722396, 'samples': 4787712, 'steps': 24935, 'loss/train': 1.3866608142852783} -11/07/2021 00:43:52 - INFO - __main__ - Step 24937: {'lr': 0.0004709513394613261, 'samples': 4787904, 'steps': 24936, 'loss/train': 1.516735315322876} -11/07/2021 00:43:53 - INFO - __main__ - Step 24938: {'lr': 0.00047094885662587104, 'samples': 4788096, 'steps': 24937, 'loss/train': 1.4386154413223267} -11/07/2021 00:43:53 - INFO - __main__ - Step 24939: {'lr': 0.0004709463736908598, 'samples': 4788288, 'steps': 24938, 'loss/train': 2.102384090423584} -11/07/2021 00:43:53 - INFO - __main__ - Step 24940: {'lr': 0.0004709438906562935, 'samples': 4788480, 'steps': 24939, 'loss/train': 1.9339085817337036} -11/07/2021 00:43:55 - INFO - __main__ - Step 24941: {'lr': 0.0004709414075221734, 'samples': 4788672, 'steps': 24940, 'loss/train': 1.0070801973342896} -11/07/2021 00:43:55 - INFO - __main__ - Step 24942: {'lr': 0.0004709389242885004, 'samples': 4788864, 'steps': 24941, 'loss/train': 1.6432303190231323} -11/07/2021 00:43:55 - INFO - __main__ - Step 24943: {'lr': 0.00047093644095527574, 'samples': 4789056, 'steps': 24942, 'loss/train': 1.5137380361557007} -11/07/2021 00:43:56 - INFO - __main__ - Step 24944: {'lr': 0.00047093395752250056, 'samples': 4789248, 'steps': 24943, 'loss/train': 1.3559476137161255} -11/07/2021 00:43:56 - INFO - __main__ - Step 24945: {'lr': 0.000470931473990176, 'samples': 4789440, 'steps': 24944, 'loss/train': 0.49037522077560425} -11/07/2021 00:43:58 - INFO - __main__ - Step 24946: {'lr': 0.00047092899035830303, 'samples': 4789632, 'steps': 24945, 'loss/train': 1.1880199909210205} -11/07/2021 00:43:58 - INFO - __main__ - Step 24947: {'lr': 0.00047092650662688295, 'samples': 4789824, 'steps': 24946, 'loss/train': 2.1021833419799805} -11/07/2021 00:43:58 - INFO - __main__ - Step 24948: {'lr': 0.00047092402279591674, 'samples': 4790016, 'steps': 24947, 'loss/train': 1.6405055522918701} -11/07/2021 00:43:59 - INFO - __main__ - Step 24949: {'lr': 0.00047092153886540554, 'samples': 4790208, 'steps': 24948, 'loss/train': 0.7883797883987427} -11/07/2021 00:43:59 - INFO - __main__ - Step 24950: {'lr': 0.0004709190548353506, 'samples': 4790400, 'steps': 24949, 'loss/train': 1.515425205230713} -11/07/2021 00:43:59 - INFO - __main__ - Step 24951: {'lr': 0.0004709165707057529, 'samples': 4790592, 'steps': 24950, 'loss/train': 1.6825127601623535} -11/07/2021 00:44:00 - INFO - __main__ - Step 24952: {'lr': 0.0004709140864766136, 'samples': 4790784, 'steps': 24951, 'loss/train': 1.4859381914138794} -11/07/2021 00:44:01 - INFO - __main__ - Step 24953: {'lr': 0.0004709116021479338, 'samples': 4790976, 'steps': 24952, 'loss/train': 1.4513448476791382} -11/07/2021 00:44:01 - INFO - __main__ - Step 24954: {'lr': 0.00047090911771971466, 'samples': 4791168, 'steps': 24953, 'loss/train': 1.3714603185653687} -11/07/2021 00:44:02 - INFO - __main__ - Step 24955: {'lr': 0.0004709066331919573, 'samples': 4791360, 'steps': 24954, 'loss/train': 1.8338035345077515} -11/07/2021 00:44:02 - INFO - __main__ - Step 24956: {'lr': 0.0004709041485646628, 'samples': 4791552, 'steps': 24955, 'loss/train': 1.6190221309661865} -11/07/2021 00:44:02 - INFO - __main__ - Step 24957: {'lr': 0.0004709016638378323, 'samples': 4791744, 'steps': 24956, 'loss/train': 1.393989086151123} -11/07/2021 00:44:03 - INFO - __main__ - Step 24958: {'lr': 0.00047089917901146694, 'samples': 4791936, 'steps': 24957, 'loss/train': 1.3725248575210571} -11/07/2021 00:44:04 - INFO - __main__ - Step 24959: {'lr': 0.0004708966940855678, 'samples': 4792128, 'steps': 24958, 'loss/train': 1.7774754762649536} -11/07/2021 00:44:04 - INFO - __main__ - Step 24960: {'lr': 0.00047089420906013603, 'samples': 4792320, 'steps': 24959, 'loss/train': 1.6581379175186157} -11/07/2021 00:44:04 - INFO - __main__ - Step 24961: {'lr': 0.0004708917239351727, 'samples': 4792512, 'steps': 24960, 'loss/train': 1.5697776079177856} -11/07/2021 00:44:05 - INFO - __main__ - Step 24962: {'lr': 0.000470889238710679, 'samples': 4792704, 'steps': 24961, 'loss/train': 1.5028849840164185} -11/07/2021 00:44:06 - INFO - __main__ - Step 24963: {'lr': 0.00047088675338665596, 'samples': 4792896, 'steps': 24962, 'loss/train': 1.3876596689224243} -11/07/2021 00:44:06 - INFO - __main__ - Step 24964: {'lr': 0.00047088426796310486, 'samples': 4793088, 'steps': 24963, 'loss/train': 1.650161862373352} -11/07/2021 00:44:06 - INFO - __main__ - Step 24965: {'lr': 0.00047088178244002665, 'samples': 4793280, 'steps': 24964, 'loss/train': 1.6179430484771729} -11/07/2021 00:44:07 - INFO - __main__ - Step 24966: {'lr': 0.00047087929681742253, 'samples': 4793472, 'steps': 24965, 'loss/train': 1.5869165658950806} -11/07/2021 00:44:07 - INFO - __main__ - Step 24967: {'lr': 0.00047087681109529364, 'samples': 4793664, 'steps': 24966, 'loss/train': 2.0685853958129883} -11/07/2021 00:44:08 - INFO - __main__ - Step 24968: {'lr': 0.00047087432527364106, 'samples': 4793856, 'steps': 24967, 'loss/train': 1.5191277265548706} -11/07/2021 00:44:08 - INFO - __main__ - Step 24969: {'lr': 0.0004708718393524659, 'samples': 4794048, 'steps': 24968, 'loss/train': 1.5035487413406372} -11/07/2021 00:44:09 - INFO - __main__ - Step 24970: {'lr': 0.0004708693533317693, 'samples': 4794240, 'steps': 24969, 'loss/train': 1.6295180320739746} -11/07/2021 00:44:09 - INFO - __main__ - Step 24971: {'lr': 0.00047086686721155237, 'samples': 4794432, 'steps': 24970, 'loss/train': 1.0224506855010986} -11/07/2021 00:44:10 - INFO - __main__ - Step 24972: {'lr': 0.00047086438099181615, 'samples': 4794624, 'steps': 24971, 'loss/train': 1.4066888093948364} -11/07/2021 00:44:10 - INFO - __main__ - Step 24973: {'lr': 0.00047086189467256194, 'samples': 4794816, 'steps': 24972, 'loss/train': 1.5826265811920166} -11/07/2021 00:44:11 - INFO - __main__ - Step 24974: {'lr': 0.0004708594082537908, 'samples': 4795008, 'steps': 24973, 'loss/train': 1.7132618427276611} -11/07/2021 00:44:11 - INFO - __main__ - Step 24975: {'lr': 0.00047085692173550375, 'samples': 4795200, 'steps': 24974, 'loss/train': 0.9648758769035339} -11/07/2021 00:44:12 - INFO - __main__ - Step 24976: {'lr': 0.00047085443511770206, 'samples': 4795392, 'steps': 24975, 'loss/train': 1.7411245107650757} -11/07/2021 00:44:12 - INFO - __main__ - Step 24977: {'lr': 0.0004708519484003867, 'samples': 4795584, 'steps': 24976, 'loss/train': 1.4710562229156494} -11/07/2021 00:44:12 - INFO - __main__ - Step 24978: {'lr': 0.0004708494615835589, 'samples': 4795776, 'steps': 24977, 'loss/train': 1.6182292699813843} -11/07/2021 00:44:13 - INFO - __main__ - Step 24979: {'lr': 0.00047084697466721973, 'samples': 4795968, 'steps': 24978, 'loss/train': 1.6603829860687256} -11/07/2021 00:44:14 - INFO - __main__ - Step 24980: {'lr': 0.0004708444876513703, 'samples': 4796160, 'steps': 24979, 'loss/train': 1.8253313302993774} -11/07/2021 00:44:14 - INFO - __main__ - Step 24981: {'lr': 0.0004708420005360118, 'samples': 4796352, 'steps': 24980, 'loss/train': 1.5156065225601196} -11/07/2021 00:44:14 - INFO - __main__ - Step 24982: {'lr': 0.0004708395133211452, 'samples': 4796544, 'steps': 24981, 'loss/train': 1.6060330867767334} -11/07/2021 00:44:15 - INFO - __main__ - Step 24983: {'lr': 0.0004708370260067718, 'samples': 4796736, 'steps': 24982, 'loss/train': 1.74071204662323} -11/07/2021 00:44:16 - INFO - __main__ - Step 24984: {'lr': 0.00047083453859289267, 'samples': 4796928, 'steps': 24983, 'loss/train': 1.570011019706726} -11/07/2021 00:44:16 - INFO - __main__ - Step 24985: {'lr': 0.00047083205107950886, 'samples': 4797120, 'steps': 24984, 'loss/train': 2.2700695991516113} -11/07/2021 00:44:16 - INFO - __main__ - Step 24986: {'lr': 0.00047082956346662153, 'samples': 4797312, 'steps': 24985, 'loss/train': 2.238264799118042} -11/07/2021 00:44:17 - INFO - __main__ - Step 24987: {'lr': 0.00047082707575423177, 'samples': 4797504, 'steps': 24986, 'loss/train': 1.502872109413147} -11/07/2021 00:44:17 - INFO - __main__ - Step 24988: {'lr': 0.00047082458794234087, 'samples': 4797696, 'steps': 24987, 'loss/train': 1.5819875001907349} -11/07/2021 00:44:18 - INFO - __main__ - Step 24989: {'lr': 0.0004708221000309497, 'samples': 4797888, 'steps': 24988, 'loss/train': 1.5078585147857666} -11/07/2021 00:44:18 - INFO - __main__ - Step 24990: {'lr': 0.0004708196120200595, 'samples': 4798080, 'steps': 24989, 'loss/train': 1.8042079210281372} -11/07/2021 00:44:19 - INFO - __main__ - Step 24991: {'lr': 0.0004708171239096715, 'samples': 4798272, 'steps': 24990, 'loss/train': 3.638201951980591} -11/07/2021 00:44:19 - INFO - __main__ - Step 24992: {'lr': 0.00047081463569978655, 'samples': 4798464, 'steps': 24991, 'loss/train': 1.200833797454834} -11/07/2021 00:44:20 - INFO - __main__ - Step 24993: {'lr': 0.00047081214739040606, 'samples': 4798656, 'steps': 24992, 'loss/train': 1.1243364810943604} -11/07/2021 00:44:21 - INFO - __main__ - Step 24994: {'lr': 0.000470809658981531, 'samples': 4798848, 'steps': 24993, 'loss/train': 1.4025392532348633} -11/07/2021 00:44:21 - INFO - __main__ - Step 24995: {'lr': 0.00047080717047316245, 'samples': 4799040, 'steps': 24994, 'loss/train': 1.8197518587112427} -11/07/2021 00:44:21 - INFO - __main__ - Step 24996: {'lr': 0.0004708046818653017, 'samples': 4799232, 'steps': 24995, 'loss/train': 1.973433256149292} -11/07/2021 00:44:22 - INFO - __main__ - Step 24997: {'lr': 0.0004708021931579497, 'samples': 4799424, 'steps': 24996, 'loss/train': 1.774387001991272} -11/07/2021 00:44:22 - INFO - __main__ - Step 24998: {'lr': 0.00047079970435110765, 'samples': 4799616, 'steps': 24997, 'loss/train': 1.645456314086914} -11/07/2021 00:44:24 - INFO - __main__ - Step 24999: {'lr': 0.0004707972154447766, 'samples': 4799808, 'steps': 24998, 'loss/train': 1.5165650844573975} -11/07/2021 00:44:24 - INFO - __main__ - Step 25000: {'lr': 0.00047079472643895784, 'samples': 4800000, 'steps': 24999, 'loss/train': 1.743245005607605} -11/07/2021 00:44:24 - INFO - __main__ - Step 25001: {'lr': 0.00047079223733365234, 'samples': 4800192, 'steps': 25000, 'loss/train': 2.0800983905792236} -11/07/2021 00:44:25 - INFO - __main__ - Step 25002: {'lr': 0.0004707897481288612, 'samples': 4800384, 'steps': 25001, 'loss/train': 1.7442258596420288} -11/07/2021 00:44:25 - INFO - __main__ - Step 25003: {'lr': 0.00047078725882458575, 'samples': 4800576, 'steps': 25002, 'loss/train': 1.497467279434204} -11/07/2021 00:44:25 - INFO - __main__ - Step 25004: {'lr': 0.0004707847694208269, 'samples': 4800768, 'steps': 25003, 'loss/train': 2.7911336421966553} -11/07/2021 00:44:26 - INFO - __main__ - Step 25005: {'lr': 0.0004707822799175858, 'samples': 4800960, 'steps': 25004, 'loss/train': 2.8122925758361816} -11/07/2021 00:44:27 - INFO - __main__ - Step 25006: {'lr': 0.00047077979031486363, 'samples': 4801152, 'steps': 25005, 'loss/train': 1.652961015701294} -11/07/2021 00:44:27 - INFO - __main__ - Step 25007: {'lr': 0.0004707773006126615, 'samples': 4801344, 'steps': 25006, 'loss/train': 1.2835978269577026} -11/07/2021 00:44:28 - INFO - __main__ - Step 25008: {'lr': 0.0004707748108109805, 'samples': 4801536, 'steps': 25007, 'loss/train': 1.211061716079712} -11/07/2021 00:44:28 - INFO - __main__ - Step 25009: {'lr': 0.0004707723209098218, 'samples': 4801728, 'steps': 25008, 'loss/train': 1.343076229095459} -11/07/2021 00:44:28 - INFO - __main__ - Step 25010: {'lr': 0.0004707698309091865, 'samples': 4801920, 'steps': 25009, 'loss/train': 1.59666109085083} -11/07/2021 00:44:29 - INFO - __main__ - Step 25011: {'lr': 0.00047076734080907576, 'samples': 4802112, 'steps': 25010, 'loss/train': 2.856903314590454} -11/07/2021 00:44:30 - INFO - __main__ - Step 25012: {'lr': 0.0004707648506094906, 'samples': 4802304, 'steps': 25011, 'loss/train': 1.2666581869125366} -11/07/2021 00:44:30 - INFO - __main__ - Step 25013: {'lr': 0.0004707623603104322, 'samples': 4802496, 'steps': 25012, 'loss/train': 1.4336587190628052} -11/07/2021 00:44:30 - INFO - __main__ - Step 25014: {'lr': 0.0004707598699119018, 'samples': 4802688, 'steps': 25013, 'loss/train': 1.6630597114562988} -11/07/2021 00:44:31 - INFO - __main__ - Step 25015: {'lr': 0.0004707573794139003, 'samples': 4802880, 'steps': 25014, 'loss/train': 1.6455538272857666} -11/07/2021 00:44:31 - INFO - __main__ - Step 25016: {'lr': 0.0004707548888164289, 'samples': 4803072, 'steps': 25015, 'loss/train': 1.7798850536346436} -11/07/2021 00:44:32 - INFO - __main__ - Step 25017: {'lr': 0.0004707523981194889, 'samples': 4803264, 'steps': 25016, 'loss/train': 1.1420173645019531} -11/07/2021 00:44:32 - INFO - __main__ - Step 25018: {'lr': 0.00047074990732308116, 'samples': 4803456, 'steps': 25017, 'loss/train': 1.7825181484222412} -11/07/2021 00:44:33 - INFO - __main__ - Step 25019: {'lr': 0.00047074741642720694, 'samples': 4803648, 'steps': 25018, 'loss/train': 1.617344856262207} -11/07/2021 00:44:33 - INFO - __main__ - Step 25020: {'lr': 0.0004707449254318673, 'samples': 4803840, 'steps': 25019, 'loss/train': 1.0126532316207886} -11/07/2021 00:44:34 - INFO - __main__ - Step 25021: {'lr': 0.0004707424343370635, 'samples': 4804032, 'steps': 25020, 'loss/train': 1.3363791704177856} -11/07/2021 00:44:35 - INFO - __main__ - Step 25022: {'lr': 0.00047073994314279647, 'samples': 4804224, 'steps': 25021, 'loss/train': 1.4168652296066284} -11/07/2021 00:44:35 - INFO - __main__ - Step 25023: {'lr': 0.0004707374518490675, 'samples': 4804416, 'steps': 25022, 'loss/train': 1.7937602996826172} -11/07/2021 00:44:35 - INFO - __main__ - Step 25024: {'lr': 0.0004707349604558776, 'samples': 4804608, 'steps': 25023, 'loss/train': 0.8730416893959045} -11/07/2021 00:44:36 - INFO - __main__ - Step 25025: {'lr': 0.00047073246896322797, 'samples': 4804800, 'steps': 25024, 'loss/train': 1.6327455043792725} -11/07/2021 00:44:36 - INFO - __main__ - Step 25026: {'lr': 0.00047072997737111966, 'samples': 4804992, 'steps': 25025, 'loss/train': 1.2765804529190063} -11/07/2021 00:44:37 - INFO - __main__ - Step 25027: {'lr': 0.0004707274856795538, 'samples': 4805184, 'steps': 25026, 'loss/train': 1.6824760437011719} -11/07/2021 00:44:37 - INFO - __main__ - Step 25028: {'lr': 0.00047072499388853164, 'samples': 4805376, 'steps': 25027, 'loss/train': 1.6089210510253906} -11/07/2021 00:44:38 - INFO - __main__ - Step 25029: {'lr': 0.0004707225019980541, 'samples': 4805568, 'steps': 25028, 'loss/train': 1.705112338066101} -11/07/2021 00:44:38 - INFO - __main__ - Step 25030: {'lr': 0.00047072001000812247, 'samples': 4805760, 'steps': 25029, 'loss/train': 2.295302391052246} -11/07/2021 00:44:38 - INFO - __main__ - Step 25031: {'lr': 0.00047071751791873774, 'samples': 4805952, 'steps': 25030, 'loss/train': 1.5089826583862305} -11/07/2021 00:44:39 - INFO - __main__ - Step 25032: {'lr': 0.0004707150257299012, 'samples': 4806144, 'steps': 25031, 'loss/train': 1.7053147554397583} -11/07/2021 00:44:40 - INFO - __main__ - Step 25033: {'lr': 0.0004707125334416138, 'samples': 4806336, 'steps': 25032, 'loss/train': 1.095575213432312} -11/07/2021 00:44:40 - INFO - __main__ - Step 25034: {'lr': 0.00047071004105387677, 'samples': 4806528, 'steps': 25033, 'loss/train': 1.6223604679107666} -11/07/2021 00:44:40 - INFO - __main__ - Step 25035: {'lr': 0.00047070754856669115, 'samples': 4806720, 'steps': 25034, 'loss/train': 1.5200324058532715} -11/07/2021 00:44:41 - INFO - __main__ - Step 25036: {'lr': 0.0004707050559800582, 'samples': 4806912, 'steps': 25035, 'loss/train': 1.3381532430648804} -11/07/2021 00:44:42 - INFO - __main__ - Step 25037: {'lr': 0.00047070256329397893, 'samples': 4807104, 'steps': 25036, 'loss/train': 1.9821909666061401} -11/07/2021 00:44:42 - INFO - __main__ - Step 25038: {'lr': 0.0004707000705084545, 'samples': 4807296, 'steps': 25037, 'loss/train': 0.9232311248779297} -11/07/2021 00:44:43 - INFO - __main__ - Step 25039: {'lr': 0.000470697577623486, 'samples': 4807488, 'steps': 25038, 'loss/train': 1.5496188402175903} -11/07/2021 00:44:43 - INFO - __main__ - Step 25040: {'lr': 0.0004706950846390746, 'samples': 4807680, 'steps': 25039, 'loss/train': 1.9020907878875732} -11/07/2021 00:44:43 - INFO - __main__ - Step 25041: {'lr': 0.00047069259155522135, 'samples': 4807872, 'steps': 25040, 'loss/train': 1.5948377847671509} -11/07/2021 00:44:44 - INFO - __main__ - Step 25042: {'lr': 0.0004706900983719274, 'samples': 4808064, 'steps': 25041, 'loss/train': 1.7538772821426392} -11/07/2021 00:44:45 - INFO - __main__ - Step 25043: {'lr': 0.000470687605089194, 'samples': 4808256, 'steps': 25042, 'loss/train': 1.5355638265609741} -11/07/2021 00:44:45 - INFO - __main__ - Step 25044: {'lr': 0.0004706851117070221, 'samples': 4808448, 'steps': 25043, 'loss/train': 1.604849100112915} -11/07/2021 00:44:45 - INFO - __main__ - Step 25045: {'lr': 0.0004706826182254129, 'samples': 4808640, 'steps': 25044, 'loss/train': 1.7193337678909302} -11/07/2021 00:44:46 - INFO - __main__ - Step 25046: {'lr': 0.0004706801246443676, 'samples': 4808832, 'steps': 25045, 'loss/train': 1.6934117078781128} -11/07/2021 00:44:46 - INFO - __main__ - Step 25047: {'lr': 0.00047067763096388717, 'samples': 4809024, 'steps': 25046, 'loss/train': 1.499121069908142} -11/07/2021 00:44:47 - INFO - __main__ - Step 25048: {'lr': 0.00047067513718397283, 'samples': 4809216, 'steps': 25047, 'loss/train': 1.7033010721206665} -11/07/2021 00:44:47 - INFO - __main__ - Step 25049: {'lr': 0.0004706726433046256, 'samples': 4809408, 'steps': 25048, 'loss/train': 1.6697512865066528} -11/07/2021 00:44:48 - INFO - __main__ - Step 25050: {'lr': 0.00047067014932584674, 'samples': 4809600, 'steps': 25049, 'loss/train': 2.169337272644043} -11/07/2021 00:44:48 - INFO - __main__ - Step 25051: {'lr': 0.0004706676552476373, 'samples': 4809792, 'steps': 25050, 'loss/train': 1.871291995048523} -11/07/2021 00:44:48 - INFO - __main__ - Step 25052: {'lr': 0.0004706651610699985, 'samples': 4809984, 'steps': 25051, 'loss/train': 1.3978254795074463} -11/07/2021 00:44:49 - INFO - __main__ - Step 25053: {'lr': 0.00047066266679293125, 'samples': 4810176, 'steps': 25052, 'loss/train': 1.6824945211410522} -11/07/2021 00:44:50 - INFO - __main__ - Step 25054: {'lr': 0.0004706601724164369, 'samples': 4810368, 'steps': 25053, 'loss/train': 4.329379558563232} -11/07/2021 00:44:50 - INFO - __main__ - Step 25055: {'lr': 0.0004706576779405165, 'samples': 4810560, 'steps': 25054, 'loss/train': 1.64674973487854} -11/07/2021 00:44:50 - INFO - __main__ - Step 25056: {'lr': 0.0004706551833651711, 'samples': 4810752, 'steps': 25055, 'loss/train': 1.7119991779327393} -11/07/2021 00:44:51 - INFO - __main__ - Step 25057: {'lr': 0.0004706526886904019, 'samples': 4810944, 'steps': 25056, 'loss/train': 1.7684483528137207} -11/07/2021 00:44:51 - INFO - __main__ - Step 25058: {'lr': 0.00047065019391621, 'samples': 4811136, 'steps': 25057, 'loss/train': 2.1801724433898926} -11/07/2021 00:44:52 - INFO - __main__ - Step 25059: {'lr': 0.0004706476990425965, 'samples': 4811328, 'steps': 25058, 'loss/train': 1.6123212575912476} -11/07/2021 00:44:52 - INFO - __main__ - Step 25060: {'lr': 0.0004706452040695626, 'samples': 4811520, 'steps': 25059, 'loss/train': 1.2272355556488037} -11/07/2021 00:44:53 - INFO - __main__ - Step 25061: {'lr': 0.0004706427089971093, 'samples': 4811712, 'steps': 25060, 'loss/train': 1.624558448791504} -11/07/2021 00:44:53 - INFO - __main__ - Step 25062: {'lr': 0.0004706402138252379, 'samples': 4811904, 'steps': 25061, 'loss/train': 1.537904143333435} -11/07/2021 00:44:54 - INFO - __main__ - Step 25063: {'lr': 0.00047063771855394935, 'samples': 4812096, 'steps': 25062, 'loss/train': 1.5233983993530273} -11/07/2021 00:44:55 - INFO - __main__ - Step 25064: {'lr': 0.00047063522318324484, 'samples': 4812288, 'steps': 25063, 'loss/train': 1.688103199005127} -11/07/2021 00:44:55 - INFO - __main__ - Step 25065: {'lr': 0.00047063272771312556, 'samples': 4812480, 'steps': 25064, 'loss/train': 2.031040668487549} -11/07/2021 00:44:55 - INFO - __main__ - Step 25066: {'lr': 0.0004706302321435926, 'samples': 4812672, 'steps': 25065, 'loss/train': 1.943956971168518} -11/07/2021 00:44:56 - INFO - __main__ - Step 25067: {'lr': 0.00047062773647464694, 'samples': 4812864, 'steps': 25066, 'loss/train': 2.0383780002593994} -11/07/2021 00:44:56 - INFO - __main__ - Step 25068: {'lr': 0.00047062524070628993, 'samples': 4813056, 'steps': 25067, 'loss/train': 0.8462532162666321} -11/07/2021 00:44:57 - INFO - __main__ - Step 25069: {'lr': 0.00047062274483852253, 'samples': 4813248, 'steps': 25068, 'loss/train': 1.6836276054382324} -11/07/2021 00:44:57 - INFO - __main__ - Step 25070: {'lr': 0.000470620248871346, 'samples': 4813440, 'steps': 25069, 'loss/train': 2.15901517868042} -11/07/2021 00:44:58 - INFO - __main__ - Step 25071: {'lr': 0.00047061775280476134, 'samples': 4813632, 'steps': 25070, 'loss/train': 2.193253993988037} -11/07/2021 00:44:58 - INFO - __main__ - Step 25072: {'lr': 0.0004706152566387697, 'samples': 4813824, 'steps': 25071, 'loss/train': 1.4540574550628662} -11/07/2021 00:44:58 - INFO - __main__ - Step 25073: {'lr': 0.0004706127603733723, 'samples': 4814016, 'steps': 25072, 'loss/train': 1.4969120025634766} -11/07/2021 00:44:59 - INFO - __main__ - Step 25074: {'lr': 0.00047061026400857015, 'samples': 4814208, 'steps': 25073, 'loss/train': 1.4810075759887695} -11/07/2021 00:45:00 - INFO - __main__ - Step 25075: {'lr': 0.0004706077675443644, 'samples': 4814400, 'steps': 25074, 'loss/train': 1.5527960062026978} -11/07/2021 00:45:00 - INFO - __main__ - Step 25076: {'lr': 0.00047060527098075625, 'samples': 4814592, 'steps': 25075, 'loss/train': 0.34231331944465637} -11/07/2021 00:45:00 - INFO - __main__ - Step 25077: {'lr': 0.0004706027743177467, 'samples': 4814784, 'steps': 25076, 'loss/train': 1.1344234943389893} -11/07/2021 00:45:01 - INFO - __main__ - Step 25078: {'lr': 0.000470600277555337, 'samples': 4814976, 'steps': 25077, 'loss/train': 1.5538222789764404} -11/07/2021 00:45:01 - INFO - __main__ - Step 25079: {'lr': 0.0004705977806935282, 'samples': 4815168, 'steps': 25078, 'loss/train': 1.3463051319122314} -11/07/2021 00:45:02 - INFO - __main__ - Step 25080: {'lr': 0.00047059528373232147, 'samples': 4815360, 'steps': 25079, 'loss/train': 1.8053596019744873} -11/07/2021 00:45:03 - INFO - __main__ - Step 25081: {'lr': 0.0004705927866717179, 'samples': 4815552, 'steps': 25080, 'loss/train': 0.673611044883728} -11/07/2021 00:45:03 - INFO - __main__ - Step 25082: {'lr': 0.0004705902895117186, 'samples': 4815744, 'steps': 25081, 'loss/train': 2.0037245750427246} -11/07/2021 00:45:03 - INFO - __main__ - Step 25083: {'lr': 0.00047058779225232474, 'samples': 4815936, 'steps': 25082, 'loss/train': 1.377502679824829} -11/07/2021 00:45:04 - INFO - __main__ - Step 25084: {'lr': 0.0004705852948935374, 'samples': 4816128, 'steps': 25083, 'loss/train': 2.0240447521209717} -11/07/2021 00:45:05 - INFO - __main__ - Step 25085: {'lr': 0.00047058279743535775, 'samples': 4816320, 'steps': 25084, 'loss/train': 1.436004877090454} -11/07/2021 00:45:05 - INFO - __main__ - Step 25086: {'lr': 0.0004705802998777869, 'samples': 4816512, 'steps': 25085, 'loss/train': 1.718674898147583} -11/07/2021 00:45:05 - INFO - __main__ - Step 25087: {'lr': 0.0004705778022208259, 'samples': 4816704, 'steps': 25086, 'loss/train': 1.7859622240066528} -11/07/2021 00:45:06 - INFO - __main__ - Step 25088: {'lr': 0.000470575304464476, 'samples': 4816896, 'steps': 25087, 'loss/train': 1.8729404211044312} -11/07/2021 00:45:06 - INFO - __main__ - Step 25089: {'lr': 0.00047057280660873835, 'samples': 4817088, 'steps': 25088, 'loss/train': 1.590794563293457} -11/07/2021 00:45:07 - INFO - __main__ - Step 25090: {'lr': 0.00047057030865361397, 'samples': 4817280, 'steps': 25089, 'loss/train': 1.306519627571106} -11/07/2021 00:45:07 - INFO - __main__ - Step 25091: {'lr': 0.0004705678105991039, 'samples': 4817472, 'steps': 25090, 'loss/train': 1.7953321933746338} -11/07/2021 00:45:08 - INFO - __main__ - Step 25092: {'lr': 0.00047056531244520945, 'samples': 4817664, 'steps': 25091, 'loss/train': 1.5451993942260742} -11/07/2021 00:45:08 - INFO - __main__ - Step 25093: {'lr': 0.0004705628141919317, 'samples': 4817856, 'steps': 25092, 'loss/train': 1.4345879554748535} -11/07/2021 00:45:09 - INFO - __main__ - Step 25094: {'lr': 0.00047056031583927175, 'samples': 4818048, 'steps': 25093, 'loss/train': 1.4095795154571533} -11/07/2021 00:45:10 - INFO - __main__ - Step 25095: {'lr': 0.00047055781738723063, 'samples': 4818240, 'steps': 25094, 'loss/train': 1.395472526550293} -11/07/2021 00:45:10 - INFO - __main__ - Step 25096: {'lr': 0.0004705553188358096, 'samples': 4818432, 'steps': 25095, 'loss/train': 1.569098711013794} -11/07/2021 00:45:10 - INFO - __main__ - Step 25097: {'lr': 0.00047055282018500976, 'samples': 4818624, 'steps': 25096, 'loss/train': 1.5912185907363892} -11/07/2021 00:45:11 - INFO - __main__ - Step 25098: {'lr': 0.0004705503214348323, 'samples': 4818816, 'steps': 25097, 'loss/train': 1.6429988145828247} -11/07/2021 00:45:11 - INFO - __main__ - Step 25099: {'lr': 0.0004705478225852782, 'samples': 4819008, 'steps': 25098, 'loss/train': 1.2610902786254883} -11/07/2021 00:45:12 - INFO - __main__ - Step 25100: {'lr': 0.0004705453236363486, 'samples': 4819200, 'steps': 25099, 'loss/train': 1.843684434890747} -11/07/2021 00:45:12 - INFO - __main__ - Step 25101: {'lr': 0.00047054282458804477, 'samples': 4819392, 'steps': 25100, 'loss/train': 1.653101921081543} -11/07/2021 00:45:13 - INFO - __main__ - Step 25102: {'lr': 0.0004705403254403677, 'samples': 4819584, 'steps': 25101, 'loss/train': 1.8327016830444336} -11/07/2021 00:45:13 - INFO - __main__ - Step 25103: {'lr': 0.0004705378261933186, 'samples': 4819776, 'steps': 25102, 'loss/train': 1.6882308721542358} -11/07/2021 00:45:13 - INFO - __main__ - Step 25104: {'lr': 0.0004705353268468985, 'samples': 4819968, 'steps': 25103, 'loss/train': 1.575581431388855} -11/07/2021 00:45:14 - INFO - __main__ - Step 25105: {'lr': 0.00047053282740110863, 'samples': 4820160, 'steps': 25104, 'loss/train': 1.2449451684951782} -11/07/2021 00:45:15 - INFO - __main__ - Step 25106: {'lr': 0.00047053032785595005, 'samples': 4820352, 'steps': 25105, 'loss/train': 1.3807636499404907} -11/07/2021 00:45:15 - INFO - __main__ - Step 25107: {'lr': 0.0004705278282114239, 'samples': 4820544, 'steps': 25106, 'loss/train': 1.588875651359558} -11/07/2021 00:45:15 - INFO - __main__ - Step 25108: {'lr': 0.0004705253284675314, 'samples': 4820736, 'steps': 25107, 'loss/train': 1.394099473953247} -11/07/2021 00:45:16 - INFO - __main__ - Step 25109: {'lr': 0.00047052282862427355, 'samples': 4820928, 'steps': 25108, 'loss/train': 1.948533058166504} -11/07/2021 00:45:16 - INFO - __main__ - Step 25110: {'lr': 0.0004705203286816514, 'samples': 4821120, 'steps': 25109, 'loss/train': 1.3867086172103882} -11/07/2021 00:45:17 - INFO - __main__ - Step 25111: {'lr': 0.0004705178286396663, 'samples': 4821312, 'steps': 25110, 'loss/train': 1.4365869760513306} -11/07/2021 00:45:17 - INFO - __main__ - Step 25112: {'lr': 0.0004705153284983192, 'samples': 4821504, 'steps': 25111, 'loss/train': 1.374193787574768} -11/07/2021 00:45:18 - INFO - __main__ - Step 25113: {'lr': 0.00047051282825761145, 'samples': 4821696, 'steps': 25112, 'loss/train': 1.4067364931106567} -11/07/2021 00:45:18 - INFO - __main__ - Step 25114: {'lr': 0.0004705103279175439, 'samples': 4821888, 'steps': 25113, 'loss/train': 1.631029725074768} -11/07/2021 00:45:19 - INFO - __main__ - Step 25115: {'lr': 0.0004705078274781178, 'samples': 4822080, 'steps': 25114, 'loss/train': 1.4061105251312256} -11/07/2021 00:45:20 - INFO - __main__ - Step 25116: {'lr': 0.0004705053269393343, 'samples': 4822272, 'steps': 25115, 'loss/train': 1.379422664642334} -11/07/2021 00:45:20 - INFO - __main__ - Step 25117: {'lr': 0.00047050282630119444, 'samples': 4822464, 'steps': 25116, 'loss/train': 1.5515828132629395} -11/07/2021 00:45:20 - INFO - __main__ - Step 25118: {'lr': 0.0004705003255636995, 'samples': 4822656, 'steps': 25117, 'loss/train': 1.743276596069336} -11/07/2021 00:45:21 - INFO - __main__ - Step 25119: {'lr': 0.0004704978247268505, 'samples': 4822848, 'steps': 25118, 'loss/train': 1.158705472946167} -11/07/2021 00:45:21 - INFO - __main__ - Step 25120: {'lr': 0.0004704953237906485, 'samples': 4823040, 'steps': 25119, 'loss/train': 1.197891354560852} -11/07/2021 00:45:22 - INFO - __main__ - Step 25121: {'lr': 0.0004704928227550949, 'samples': 4823232, 'steps': 25120, 'loss/train': 1.9623627662658691} -11/07/2021 00:45:22 - INFO - __main__ - Step 25122: {'lr': 0.00047049032162019044, 'samples': 4823424, 'steps': 25121, 'loss/train': 1.642743468284607} -11/07/2021 00:45:23 - INFO - __main__ - Step 25123: {'lr': 0.0004704878203859365, 'samples': 4823616, 'steps': 25122, 'loss/train': 1.1424055099487305} -11/07/2021 00:45:23 - INFO - __main__ - Step 25124: {'lr': 0.0004704853190523342, 'samples': 4823808, 'steps': 25123, 'loss/train': 0.8902316093444824} -11/07/2021 00:45:23 - INFO - __main__ - Step 25125: {'lr': 0.00047048281761938456, 'samples': 4824000, 'steps': 25124, 'loss/train': 1.7656041383743286} -11/07/2021 00:45:24 - INFO - __main__ - Step 25126: {'lr': 0.00047048031608708875, 'samples': 4824192, 'steps': 25125, 'loss/train': 1.437725305557251} -11/07/2021 00:45:25 - INFO - __main__ - Step 25127: {'lr': 0.000470477814455448, 'samples': 4824384, 'steps': 25126, 'loss/train': 1.609181523323059} -11/07/2021 00:45:25 - INFO - __main__ - Step 25128: {'lr': 0.0004704753127244633, 'samples': 4824576, 'steps': 25127, 'loss/train': 1.2707256078720093} -11/07/2021 00:45:25 - INFO - __main__ - Step 25129: {'lr': 0.0004704728108941358, 'samples': 4824768, 'steps': 25128, 'loss/train': 1.8579035997390747} -11/07/2021 00:45:26 - INFO - __main__ - Step 25130: {'lr': 0.00047047030896446665, 'samples': 4824960, 'steps': 25129, 'loss/train': 1.7406295537948608} -11/07/2021 00:45:27 - INFO - __main__ - Step 25131: {'lr': 0.000470467806935457, 'samples': 4825152, 'steps': 25130, 'loss/train': 1.0406829118728638} -11/07/2021 00:45:27 - INFO - __main__ - Step 25132: {'lr': 0.000470465304807108, 'samples': 4825344, 'steps': 25131, 'loss/train': 1.3713059425354004} -11/07/2021 00:45:28 - INFO - __main__ - Step 25133: {'lr': 0.00047046280257942067, 'samples': 4825536, 'steps': 25132, 'loss/train': 1.7930819988250732} -11/07/2021 00:45:28 - INFO - __main__ - Step 25134: {'lr': 0.0004704603002523962, 'samples': 4825728, 'steps': 25133, 'loss/train': 2.26041579246521} -11/07/2021 00:45:28 - INFO - __main__ - Step 25135: {'lr': 0.00047045779782603584, 'samples': 4825920, 'steps': 25134, 'loss/train': 1.8254454135894775} -11/07/2021 00:45:29 - INFO - __main__ - Step 25136: {'lr': 0.0004704552953003405, 'samples': 4826112, 'steps': 25135, 'loss/train': 1.814273715019226} -11/07/2021 00:45:30 - INFO - __main__ - Step 25137: {'lr': 0.0004704527926753114, 'samples': 4826304, 'steps': 25136, 'loss/train': 1.6575398445129395} -11/07/2021 00:45:30 - INFO - __main__ - Step 25138: {'lr': 0.00047045028995094967, 'samples': 4826496, 'steps': 25137, 'loss/train': 1.343518853187561} -11/07/2021 00:45:30 - INFO - __main__ - Step 25139: {'lr': 0.0004704477871272564, 'samples': 4826688, 'steps': 25138, 'loss/train': 1.4930167198181152} -11/07/2021 00:45:31 - INFO - __main__ - Step 25140: {'lr': 0.0004704452842042329, 'samples': 4826880, 'steps': 25139, 'loss/train': 1.235864520072937} -11/07/2021 00:45:32 - INFO - __main__ - Step 25141: {'lr': 0.00047044278118188004, 'samples': 4827072, 'steps': 25140, 'loss/train': 1.7771896123886108} -11/07/2021 00:45:32 - INFO - __main__ - Step 25142: {'lr': 0.00047044027806019914, 'samples': 4827264, 'steps': 25141, 'loss/train': 0.8156598210334778} -11/07/2021 00:45:32 - INFO - __main__ - Step 25143: {'lr': 0.0004704377748391912, 'samples': 4827456, 'steps': 25142, 'loss/train': 1.9012995958328247} -11/07/2021 00:45:33 - INFO - __main__ - Step 25144: {'lr': 0.0004704352715188574, 'samples': 4827648, 'steps': 25143, 'loss/train': 1.625672698020935} -11/07/2021 00:45:33 - INFO - __main__ - Step 25145: {'lr': 0.0004704327680991989, 'samples': 4827840, 'steps': 25144, 'loss/train': 1.3845484256744385} -11/07/2021 00:45:34 - INFO - __main__ - Step 25146: {'lr': 0.00047043026458021677, 'samples': 4828032, 'steps': 25145, 'loss/train': 1.3643563985824585} -11/07/2021 00:45:34 - INFO - __main__ - Step 25147: {'lr': 0.0004704277609619122, 'samples': 4828224, 'steps': 25146, 'loss/train': 0.5338404178619385} -11/07/2021 00:45:35 - INFO - __main__ - Step 25148: {'lr': 0.0004704252572442862, 'samples': 4828416, 'steps': 25147, 'loss/train': 1.316985845565796} -11/07/2021 00:45:35 - INFO - __main__ - Step 25149: {'lr': 0.00047042275342734006, 'samples': 4828608, 'steps': 25148, 'loss/train': 1.718420147895813} -11/07/2021 00:45:35 - INFO - __main__ - Step 25150: {'lr': 0.0004704202495110748, 'samples': 4828800, 'steps': 25149, 'loss/train': 1.6761091947555542} -11/07/2021 00:45:36 - INFO - __main__ - Step 25151: {'lr': 0.00047041774549549156, 'samples': 4828992, 'steps': 25150, 'loss/train': 1.5337203741073608} -11/07/2021 00:45:37 - INFO - __main__ - Step 25152: {'lr': 0.00047041524138059153, 'samples': 4829184, 'steps': 25151, 'loss/train': 0.9986521601676941} -11/07/2021 00:45:37 - INFO - __main__ - Step 25153: {'lr': 0.00047041273716637576, 'samples': 4829376, 'steps': 25152, 'loss/train': 2.1026737689971924} -11/07/2021 00:45:37 - INFO - __main__ - Step 25154: {'lr': 0.00047041023285284545, 'samples': 4829568, 'steps': 25153, 'loss/train': 1.5758517980575562} -11/07/2021 00:45:38 - INFO - __main__ - Step 25155: {'lr': 0.0004704077284400017, 'samples': 4829760, 'steps': 25154, 'loss/train': 1.3530430793762207} -11/07/2021 00:45:39 - INFO - __main__ - Step 25156: {'lr': 0.0004704052239278456, 'samples': 4829952, 'steps': 25155, 'loss/train': 1.5704340934753418} -11/07/2021 00:45:39 - INFO - __main__ - Step 25157: {'lr': 0.00047040271931637824, 'samples': 4830144, 'steps': 25156, 'loss/train': 1.4760314226150513} -11/07/2021 00:45:40 - INFO - __main__ - Step 25158: {'lr': 0.0004704002146056009, 'samples': 4830336, 'steps': 25157, 'loss/train': 1.5786726474761963} -11/07/2021 00:45:40 - INFO - __main__ - Step 25159: {'lr': 0.0004703977097955146, 'samples': 4830528, 'steps': 25158, 'loss/train': 1.7212551832199097} -11/07/2021 00:45:40 - INFO - __main__ - Step 25160: {'lr': 0.0004703952048861204, 'samples': 4830720, 'steps': 25159, 'loss/train': 1.3970686197280884} -11/07/2021 00:45:41 - INFO - __main__ - Step 25161: {'lr': 0.00047039269987741967, 'samples': 4830912, 'steps': 25160, 'loss/train': 1.5743192434310913} -11/07/2021 00:45:42 - INFO - __main__ - Step 25162: {'lr': 0.0004703901947694134, 'samples': 4831104, 'steps': 25161, 'loss/train': 1.6837447881698608} -11/07/2021 00:45:42 - INFO - __main__ - Step 25163: {'lr': 0.0004703876895621025, 'samples': 4831296, 'steps': 25162, 'loss/train': 1.656884789466858} -11/07/2021 00:45:42 - INFO - __main__ - Step 25164: {'lr': 0.0004703851842554885, 'samples': 4831488, 'steps': 25163, 'loss/train': 1.3900341987609863} -11/07/2021 00:45:43 - INFO - __main__ - Step 25165: {'lr': 0.0004703826788495723, 'samples': 4831680, 'steps': 25164, 'loss/train': 1.7015156745910645} -11/07/2021 00:45:43 - INFO - __main__ - Step 25166: {'lr': 0.00047038017334435504, 'samples': 4831872, 'steps': 25165, 'loss/train': 1.4276436567306519} -11/07/2021 00:45:44 - INFO - __main__ - Step 25167: {'lr': 0.00047037766773983794, 'samples': 4832064, 'steps': 25166, 'loss/train': 1.9233454465866089} -11/07/2021 00:45:44 - INFO - __main__ - Step 25168: {'lr': 0.00047037516203602195, 'samples': 4832256, 'steps': 25167, 'loss/train': 0.7028411626815796} -11/07/2021 00:45:45 - INFO - __main__ - Step 25169: {'lr': 0.0004703726562329084, 'samples': 4832448, 'steps': 25168, 'loss/train': 1.5089735984802246} -11/07/2021 00:45:45 - INFO - __main__ - Step 25170: {'lr': 0.0004703701503304983, 'samples': 4832640, 'steps': 25169, 'loss/train': 1.633947491645813} -11/07/2021 00:45:45 - INFO - __main__ - Step 25171: {'lr': 0.0004703676443287928, 'samples': 4832832, 'steps': 25170, 'loss/train': 1.2644140720367432} -11/07/2021 00:45:47 - INFO - __main__ - Step 25172: {'lr': 0.000470365138227793, 'samples': 4833024, 'steps': 25171, 'loss/train': 1.6214765310287476} -11/07/2021 00:45:47 - INFO - __main__ - Step 25173: {'lr': 0.0004703626320275002, 'samples': 4833216, 'steps': 25172, 'loss/train': 1.574013352394104} -11/07/2021 00:45:47 - INFO - __main__ - Step 25174: {'lr': 0.0004703601257279153, 'samples': 4833408, 'steps': 25173, 'loss/train': 1.7189385890960693} -11/07/2021 00:45:48 - INFO - __main__ - Step 25175: {'lr': 0.0004703576193290395, 'samples': 4833600, 'steps': 25174, 'loss/train': 0.7705118060112} -11/07/2021 00:45:48 - INFO - __main__ - Step 25176: {'lr': 0.0004703551128308741, 'samples': 4833792, 'steps': 25175, 'loss/train': 1.8714972734451294} -11/07/2021 00:45:49 - INFO - __main__ - Step 25177: {'lr': 0.00047035260623341996, 'samples': 4833984, 'steps': 25176, 'loss/train': 2.0388734340667725} -11/07/2021 00:45:49 - INFO - __main__ - Step 25178: {'lr': 0.0004703500995366784, 'samples': 4834176, 'steps': 25177, 'loss/train': 1.363921046257019} -11/07/2021 00:45:50 - INFO - __main__ - Step 25179: {'lr': 0.00047034759274065043, 'samples': 4834368, 'steps': 25178, 'loss/train': 1.8861095905303955} -11/07/2021 00:45:50 - INFO - __main__ - Step 25180: {'lr': 0.00047034508584533724, 'samples': 4834560, 'steps': 25179, 'loss/train': 1.4527485370635986} -11/07/2021 00:45:50 - INFO - __main__ - Step 25181: {'lr': 0.00047034257885074, 'samples': 4834752, 'steps': 25180, 'loss/train': 1.6563856601715088} -11/07/2021 00:45:51 - INFO - __main__ - Step 25182: {'lr': 0.00047034007175685976, 'samples': 4834944, 'steps': 25181, 'loss/train': 1.1298303604125977} -11/07/2021 00:45:52 - INFO - __main__ - Step 25183: {'lr': 0.0004703375645636977, 'samples': 4835136, 'steps': 25182, 'loss/train': 1.9646518230438232} -11/07/2021 00:45:52 - INFO - __main__ - Step 25184: {'lr': 0.0004703350572712549, 'samples': 4835328, 'steps': 25183, 'loss/train': 1.3798952102661133} -11/07/2021 00:45:52 - INFO - __main__ - Step 25185: {'lr': 0.00047033254987953254, 'samples': 4835520, 'steps': 25184, 'loss/train': 2.0689175128936768} -11/07/2021 00:45:53 - INFO - __main__ - Step 25186: {'lr': 0.0004703300423885318, 'samples': 4835712, 'steps': 25185, 'loss/train': 1.8879923820495605} -11/07/2021 00:45:54 - INFO - __main__ - Step 25187: {'lr': 0.0004703275347982536, 'samples': 4835904, 'steps': 25186, 'loss/train': 0.9834343194961548} -11/07/2021 00:45:54 - INFO - __main__ - Step 25188: {'lr': 0.00047032502710869935, 'samples': 4836096, 'steps': 25187, 'loss/train': 1.7398415803909302} -11/07/2021 00:45:55 - INFO - __main__ - Step 25189: {'lr': 0.00047032251931987, 'samples': 4836288, 'steps': 25188, 'loss/train': 1.4668735265731812} -11/07/2021 00:45:55 - INFO - __main__ - Step 25190: {'lr': 0.0004703200114317667, 'samples': 4836480, 'steps': 25189, 'loss/train': 1.608988881111145} -11/07/2021 00:45:55 - INFO - __main__ - Step 25191: {'lr': 0.0004703175034443906, 'samples': 4836672, 'steps': 25190, 'loss/train': 1.460955262184143} -11/07/2021 00:45:56 - INFO - __main__ - Step 25192: {'lr': 0.00047031499535774284, 'samples': 4836864, 'steps': 25191, 'loss/train': 1.9606585502624512} -11/07/2021 00:45:57 - INFO - __main__ - Step 25193: {'lr': 0.00047031248717182455, 'samples': 4837056, 'steps': 25192, 'loss/train': 1.4068056344985962} -11/07/2021 00:45:57 - INFO - __main__ - Step 25194: {'lr': 0.00047030997888663687, 'samples': 4837248, 'steps': 25193, 'loss/train': 1.0019291639328003} -11/07/2021 00:45:57 - INFO - __main__ - Step 25195: {'lr': 0.00047030747050218094, 'samples': 4837440, 'steps': 25194, 'loss/train': 1.4449735879898071} -11/07/2021 00:45:58 - INFO - __main__ - Step 25196: {'lr': 0.0004703049620184578, 'samples': 4837632, 'steps': 25195, 'loss/train': 1.705001711845398} -11/07/2021 00:45:58 - INFO - __main__ - Step 25197: {'lr': 0.0004703024534354686, 'samples': 4837824, 'steps': 25196, 'loss/train': 2.5124318599700928} -11/07/2021 00:45:59 - INFO - __main__ - Step 25198: {'lr': 0.0004702999447532146, 'samples': 4838016, 'steps': 25197, 'loss/train': 2.303138494491577} -11/07/2021 00:45:59 - INFO - __main__ - Step 25199: {'lr': 0.00047029743597169684, 'samples': 4838208, 'steps': 25198, 'loss/train': 1.051732063293457} -11/07/2021 00:46:00 - INFO - __main__ - Step 25200: {'lr': 0.0004702949270909164, 'samples': 4838400, 'steps': 25199, 'loss/train': 1.731921672821045} -11/07/2021 00:46:00 - INFO - __main__ - Step 25201: {'lr': 0.0004702924181108745, 'samples': 4838592, 'steps': 25200, 'loss/train': 1.6654285192489624} -11/07/2021 00:46:00 - INFO - __main__ - Step 25202: {'lr': 0.00047028990903157233, 'samples': 4838784, 'steps': 25201, 'loss/train': 1.3601429462432861} -11/07/2021 00:46:02 - INFO - __main__ - Step 25203: {'lr': 0.0004702873998530108, 'samples': 4838976, 'steps': 25202, 'loss/train': 1.6603739261627197} -11/07/2021 00:46:02 - INFO - __main__ - Step 25204: {'lr': 0.0004702848905751912, 'samples': 4839168, 'steps': 25203, 'loss/train': 1.4916635751724243} -11/07/2021 00:46:02 - INFO - __main__ - Step 25205: {'lr': 0.0004702823811981146, 'samples': 4839360, 'steps': 25204, 'loss/train': 1.0334322452545166} -11/07/2021 00:46:03 - INFO - __main__ - Step 25206: {'lr': 0.0004702798717217822, 'samples': 4839552, 'steps': 25205, 'loss/train': 1.5200536251068115} -11/07/2021 00:46:03 - INFO - __main__ - Step 25207: {'lr': 0.0004702773621461951, 'samples': 4839744, 'steps': 25206, 'loss/train': 1.2788139581680298} -11/07/2021 00:46:04 - INFO - __main__ - Step 25208: {'lr': 0.0004702748524713544, 'samples': 4839936, 'steps': 25207, 'loss/train': 1.8211277723312378} -11/07/2021 00:46:04 - INFO - __main__ - Step 25209: {'lr': 0.00047027234269726123, 'samples': 4840128, 'steps': 25208, 'loss/train': 1.4257100820541382} -11/07/2021 00:46:05 - INFO - __main__ - Step 25210: {'lr': 0.0004702698328239167, 'samples': 4840320, 'steps': 25209, 'loss/train': 1.4680659770965576} -11/07/2021 00:46:05 - INFO - __main__ - Step 25211: {'lr': 0.0004702673228513221, 'samples': 4840512, 'steps': 25210, 'loss/train': 0.9686245322227478} -11/07/2021 00:46:05 - INFO - __main__ - Step 25212: {'lr': 0.00047026481277947835, 'samples': 4840704, 'steps': 25211, 'loss/train': 1.9399867057800293} -11/07/2021 00:46:06 - INFO - __main__ - Step 25213: {'lr': 0.0004702623026083867, 'samples': 4840896, 'steps': 25212, 'loss/train': 1.4516819715499878} -11/07/2021 00:46:07 - INFO - __main__ - Step 25214: {'lr': 0.00047025979233804825, 'samples': 4841088, 'steps': 25213, 'loss/train': 1.4941320419311523} -11/07/2021 00:46:07 - INFO - __main__ - Step 25215: {'lr': 0.00047025728196846417, 'samples': 4841280, 'steps': 25214, 'loss/train': 1.2123286724090576} -11/07/2021 00:46:07 - INFO - __main__ - Step 25216: {'lr': 0.0004702547714996355, 'samples': 4841472, 'steps': 25215, 'loss/train': 1.6218972206115723} -11/07/2021 00:46:08 - INFO - __main__ - Step 25217: {'lr': 0.00047025226093156346, 'samples': 4841664, 'steps': 25216, 'loss/train': 1.8326835632324219} -11/07/2021 00:46:09 - INFO - __main__ - Step 25218: {'lr': 0.0004702497502642492, 'samples': 4841856, 'steps': 25217, 'loss/train': 1.7213815450668335} -11/07/2021 00:46:09 - INFO - __main__ - Step 25219: {'lr': 0.0004702472394976938, 'samples': 4842048, 'steps': 25218, 'loss/train': 1.4464116096496582} -11/07/2021 00:46:09 - INFO - __main__ - Step 25220: {'lr': 0.0004702447286318983, 'samples': 4842240, 'steps': 25219, 'loss/train': 1.173579454421997} -11/07/2021 00:46:10 - INFO - __main__ - Step 25221: {'lr': 0.0004702422176668639, 'samples': 4842432, 'steps': 25220, 'loss/train': 0.8121039867401123} -11/07/2021 00:46:10 - INFO - __main__ - Step 25222: {'lr': 0.00047023970660259193, 'samples': 4842624, 'steps': 25221, 'loss/train': 1.5761325359344482} -11/07/2021 00:46:11 - INFO - __main__ - Step 25223: {'lr': 0.0004702371954390832, 'samples': 4842816, 'steps': 25222, 'loss/train': 1.708838939666748} -11/07/2021 00:46:12 - INFO - __main__ - Step 25224: {'lr': 0.00047023468417633905, 'samples': 4843008, 'steps': 25223, 'loss/train': 1.512524962425232} -11/07/2021 00:46:12 - INFO - __main__ - Step 25225: {'lr': 0.0004702321728143605, 'samples': 4843200, 'steps': 25224, 'loss/train': 1.0887199640274048} -11/07/2021 00:46:12 - INFO - __main__ - Step 25226: {'lr': 0.0004702296613531488, 'samples': 4843392, 'steps': 25225, 'loss/train': 1.1451746225357056} -11/07/2021 00:46:13 - INFO - __main__ - Step 25227: {'lr': 0.00047022714979270497, 'samples': 4843584, 'steps': 25226, 'loss/train': 1.372851848602295} -11/07/2021 00:46:14 - INFO - __main__ - Step 25228: {'lr': 0.0004702246381330302, 'samples': 4843776, 'steps': 25227, 'loss/train': 1.5111043453216553} -11/07/2021 00:46:14 - INFO - __main__ - Step 25229: {'lr': 0.00047022212637412553, 'samples': 4843968, 'steps': 25228, 'loss/train': 1.1899921894073486} -11/07/2021 00:46:14 - INFO - __main__ - Step 25230: {'lr': 0.00047021961451599226, 'samples': 4844160, 'steps': 25229, 'loss/train': 1.3683167695999146} -11/07/2021 00:46:15 - INFO - __main__ - Step 25231: {'lr': 0.00047021710255863144, 'samples': 4844352, 'steps': 25230, 'loss/train': 1.5361984968185425} -11/07/2021 00:46:15 - INFO - __main__ - Step 25232: {'lr': 0.0004702145905020442, 'samples': 4844544, 'steps': 25231, 'loss/train': 1.7946422100067139} -11/07/2021 00:46:15 - INFO - __main__ - Step 25233: {'lr': 0.0004702120783462316, 'samples': 4844736, 'steps': 25232, 'loss/train': 1.4184598922729492} -11/07/2021 00:46:16 - INFO - __main__ - Step 25234: {'lr': 0.00047020956609119483, 'samples': 4844928, 'steps': 25233, 'loss/train': 3.4014549255371094} -11/07/2021 00:46:17 - INFO - __main__ - Step 25235: {'lr': 0.0004702070537369351, 'samples': 4845120, 'steps': 25234, 'loss/train': 1.3262993097305298} -11/07/2021 00:46:17 - INFO - __main__ - Step 25236: {'lr': 0.00047020454128345333, 'samples': 4845312, 'steps': 25235, 'loss/train': 1.4103611707687378} -11/07/2021 00:46:17 - INFO - __main__ - Step 25237: {'lr': 0.00047020202873075093, 'samples': 4845504, 'steps': 25236, 'loss/train': 1.9136335849761963} -11/07/2021 00:46:18 - INFO - __main__ - Step 25238: {'lr': 0.00047019951607882884, 'samples': 4845696, 'steps': 25237, 'loss/train': 1.7273340225219727} -11/07/2021 00:46:19 - INFO - __main__ - Step 25239: {'lr': 0.0004701970033276882, 'samples': 4845888, 'steps': 25238, 'loss/train': 1.530830979347229} -11/07/2021 00:46:19 - INFO - __main__ - Step 25240: {'lr': 0.0004701944904773303, 'samples': 4846080, 'steps': 25239, 'loss/train': 1.5841394662857056} -11/07/2021 00:46:20 - INFO - __main__ - Step 25241: {'lr': 0.0004701919775277561, 'samples': 4846272, 'steps': 25240, 'loss/train': 1.6559784412384033} -11/07/2021 00:46:20 - INFO - __main__ - Step 25242: {'lr': 0.0004701894644789668, 'samples': 4846464, 'steps': 25241, 'loss/train': 1.7496247291564941} -11/07/2021 00:46:20 - INFO - __main__ - Step 25243: {'lr': 0.0004701869513309635, 'samples': 4846656, 'steps': 25242, 'loss/train': 1.0005935430526733} -11/07/2021 00:46:21 - INFO - __main__ - Step 25244: {'lr': 0.0004701844380837474, 'samples': 4846848, 'steps': 25243, 'loss/train': 1.9548184871673584} -11/07/2021 00:46:22 - INFO - __main__ - Step 25245: {'lr': 0.00047018192473731956, 'samples': 4847040, 'steps': 25244, 'loss/train': 1.5735375881195068} -11/07/2021 00:46:22 - INFO - __main__ - Step 25246: {'lr': 0.0004701794112916812, 'samples': 4847232, 'steps': 25245, 'loss/train': 0.7068080306053162} -11/07/2021 00:46:22 - INFO - __main__ - Step 25247: {'lr': 0.00047017689774683325, 'samples': 4847424, 'steps': 25246, 'loss/train': 2.1233181953430176} -11/07/2021 00:46:23 - INFO - __main__ - Step 25248: {'lr': 0.0004701743841027771, 'samples': 4847616, 'steps': 25247, 'loss/train': 1.7109966278076172} -11/07/2021 00:46:24 - INFO - __main__ - Step 25249: {'lr': 0.0004701718703595138, 'samples': 4847808, 'steps': 25248, 'loss/train': 1.3317124843597412} -11/07/2021 00:46:24 - INFO - __main__ - Step 25250: {'lr': 0.0004701693565170444, 'samples': 4848000, 'steps': 25249, 'loss/train': 1.6570696830749512} -11/07/2021 00:46:24 - INFO - __main__ - Step 25251: {'lr': 0.0004701668425753701, 'samples': 4848192, 'steps': 25250, 'loss/train': 1.3250230550765991} -11/07/2021 00:46:25 - INFO - __main__ - Step 25252: {'lr': 0.000470164328534492, 'samples': 4848384, 'steps': 25251, 'loss/train': 1.9276931285858154} -11/07/2021 00:46:25 - INFO - __main__ - Step 25253: {'lr': 0.00047016181439441126, 'samples': 4848576, 'steps': 25252, 'loss/train': 2.1577646732330322} -11/07/2021 00:46:26 - INFO - __main__ - Step 25254: {'lr': 0.000470159300155129, 'samples': 4848768, 'steps': 25253, 'loss/train': 1.3344687223434448} -11/07/2021 00:46:27 - INFO - __main__ - Step 25255: {'lr': 0.00047015678581664635, 'samples': 4848960, 'steps': 25254, 'loss/train': 1.5740892887115479} -11/07/2021 00:46:27 - INFO - __main__ - Step 25256: {'lr': 0.00047015427137896446, 'samples': 4849152, 'steps': 25255, 'loss/train': 1.5407794713974} -11/07/2021 00:46:27 - INFO - __main__ - Step 25257: {'lr': 0.0004701517568420844, 'samples': 4849344, 'steps': 25256, 'loss/train': 1.5174570083618164} -11/07/2021 00:46:28 - INFO - __main__ - Step 25258: {'lr': 0.0004701492422060074, 'samples': 4849536, 'steps': 25257, 'loss/train': 1.896033525466919} -11/07/2021 00:46:28 - INFO - __main__ - Step 25259: {'lr': 0.0004701467274707346, 'samples': 4849728, 'steps': 25258, 'loss/train': 1.2070672512054443} -11/07/2021 00:46:29 - INFO - __main__ - Step 25260: {'lr': 0.0004701442126362671, 'samples': 4849920, 'steps': 25259, 'loss/train': 1.9618362188339233} -11/07/2021 00:46:29 - INFO - __main__ - Step 25261: {'lr': 0.0004701416977026059, 'samples': 4850112, 'steps': 25260, 'loss/train': 1.8493741750717163} -11/07/2021 00:46:30 - INFO - __main__ - Step 25262: {'lr': 0.0004701391826697523, 'samples': 4850304, 'steps': 25261, 'loss/train': 2.0049753189086914} -11/07/2021 00:46:30 - INFO - __main__ - Step 25263: {'lr': 0.00047013666753770736, 'samples': 4850496, 'steps': 25262, 'loss/train': 1.62056303024292} -11/07/2021 00:46:30 - INFO - __main__ - Step 25264: {'lr': 0.00047013415230647227, 'samples': 4850688, 'steps': 25263, 'loss/train': 0.6673987507820129} -11/07/2021 00:46:32 - INFO - __main__ - Step 25265: {'lr': 0.0004701316369760481, 'samples': 4850880, 'steps': 25264, 'loss/train': 1.8424373865127563} -11/07/2021 00:46:32 - INFO - __main__ - Step 25266: {'lr': 0.00047012912154643607, 'samples': 4851072, 'steps': 25265, 'loss/train': 1.5502065420150757} -11/07/2021 00:46:32 - INFO - __main__ - Step 25267: {'lr': 0.0004701266060176372, 'samples': 4851264, 'steps': 25266, 'loss/train': 2.0707805156707764} -11/07/2021 00:46:33 - INFO - __main__ - Step 25268: {'lr': 0.00047012409038965267, 'samples': 4851456, 'steps': 25267, 'loss/train': 1.219706416130066} -11/07/2021 00:46:33 - INFO - __main__ - Step 25269: {'lr': 0.0004701215746624836, 'samples': 4851648, 'steps': 25268, 'loss/train': 1.712836503982544} -11/07/2021 00:46:34 - INFO - __main__ - Step 25270: {'lr': 0.0004701190588361312, 'samples': 4851840, 'steps': 25269, 'loss/train': 1.7841097116470337} -11/07/2021 00:46:34 - INFO - __main__ - Step 25271: {'lr': 0.0004701165429105966, 'samples': 4852032, 'steps': 25270, 'loss/train': 1.5034170150756836} -11/07/2021 00:46:35 - INFO - __main__ - Step 25272: {'lr': 0.0004701140268858808, 'samples': 4852224, 'steps': 25271, 'loss/train': 3.784604787826538} -11/07/2021 00:46:35 - INFO - __main__ - Step 25273: {'lr': 0.000470111510761985, 'samples': 4852416, 'steps': 25272, 'loss/train': 1.329630970954895} -11/07/2021 00:46:35 - INFO - __main__ - Step 25274: {'lr': 0.0004701089945389104, 'samples': 4852608, 'steps': 25273, 'loss/train': 0.9505113959312439} -11/07/2021 00:46:36 - INFO - __main__ - Step 25275: {'lr': 0.00047010647821665803, 'samples': 4852800, 'steps': 25274, 'loss/train': 1.4187085628509521} -11/07/2021 00:46:37 - INFO - __main__ - Step 25276: {'lr': 0.0004701039617952291, 'samples': 4852992, 'steps': 25275, 'loss/train': 0.9424089193344116} -11/07/2021 00:46:37 - INFO - __main__ - Step 25277: {'lr': 0.00047010144527462474, 'samples': 4853184, 'steps': 25276, 'loss/train': 2.3901946544647217} -11/07/2021 00:46:37 - INFO - __main__ - Step 25278: {'lr': 0.00047009892865484607, 'samples': 4853376, 'steps': 25277, 'loss/train': 1.3440847396850586} -11/07/2021 00:46:38 - INFO - __main__ - Step 25279: {'lr': 0.00047009641193589423, 'samples': 4853568, 'steps': 25278, 'loss/train': 1.3197660446166992} -11/07/2021 00:46:38 - INFO - __main__ - Step 25280: {'lr': 0.00047009389511777036, 'samples': 4853760, 'steps': 25279, 'loss/train': 1.6327497959136963} -11/07/2021 00:46:39 - INFO - __main__ - Step 25281: {'lr': 0.0004700913782004755, 'samples': 4853952, 'steps': 25280, 'loss/train': 1.8389418125152588} -11/07/2021 00:46:40 - INFO - __main__ - Step 25282: {'lr': 0.00047008886118401084, 'samples': 4854144, 'steps': 25281, 'loss/train': 1.55793297290802} -11/07/2021 00:46:40 - INFO - __main__ - Step 25283: {'lr': 0.0004700863440683776, 'samples': 4854336, 'steps': 25282, 'loss/train': 1.6414594650268555} -11/07/2021 00:46:40 - INFO - __main__ - Step 25284: {'lr': 0.00047008382685357686, 'samples': 4854528, 'steps': 25283, 'loss/train': 1.131192684173584} -11/07/2021 00:46:41 - INFO - __main__ - Step 25285: {'lr': 0.0004700813095396098, 'samples': 4854720, 'steps': 25284, 'loss/train': 1.6616283655166626} -11/07/2021 00:46:42 - INFO - __main__ - Step 25286: {'lr': 0.00047007879212647744, 'samples': 4854912, 'steps': 25285, 'loss/train': 1.4370410442352295} -11/07/2021 00:46:42 - INFO - __main__ - Step 25287: {'lr': 0.0004700762746141809, 'samples': 4855104, 'steps': 25286, 'loss/train': 1.078500509262085} -11/07/2021 00:46:42 - INFO - __main__ - Step 25288: {'lr': 0.0004700737570027214, 'samples': 4855296, 'steps': 25287, 'loss/train': 1.5888121128082275} -11/07/2021 00:46:43 - INFO - __main__ - Step 25289: {'lr': 0.00047007123929210015, 'samples': 4855488, 'steps': 25288, 'loss/train': 1.627748966217041} -11/07/2021 00:46:43 - INFO - __main__ - Step 25290: {'lr': 0.00047006872148231814, 'samples': 4855680, 'steps': 25289, 'loss/train': 1.8425540924072266} -11/07/2021 00:46:44 - INFO - __main__ - Step 25291: {'lr': 0.0004700662035733766, 'samples': 4855872, 'steps': 25290, 'loss/train': 1.4199053049087524} -11/07/2021 00:46:44 - INFO - __main__ - Step 25292: {'lr': 0.0004700636855652766, 'samples': 4856064, 'steps': 25291, 'loss/train': 1.9728237390518188} -11/07/2021 00:46:45 - INFO - __main__ - Step 25293: {'lr': 0.0004700611674580193, 'samples': 4856256, 'steps': 25292, 'loss/train': 1.901063323020935} -11/07/2021 00:46:45 - INFO - __main__ - Step 25294: {'lr': 0.0004700586492516058, 'samples': 4856448, 'steps': 25293, 'loss/train': 1.5009207725524902} -11/07/2021 00:46:45 - INFO - __main__ - Step 25295: {'lr': 0.00047005613094603727, 'samples': 4856640, 'steps': 25294, 'loss/train': 1.6654140949249268} -11/07/2021 00:46:46 - INFO - __main__ - Step 25296: {'lr': 0.0004700536125413149, 'samples': 4856832, 'steps': 25295, 'loss/train': 1.5214890241622925} -11/07/2021 00:46:47 - INFO - __main__ - Step 25297: {'lr': 0.00047005109403743976, 'samples': 4857024, 'steps': 25296, 'loss/train': 1.6599291563034058} -11/07/2021 00:46:47 - INFO - __main__ - Step 25298: {'lr': 0.00047004857543441294, 'samples': 4857216, 'steps': 25297, 'loss/train': 1.448982834815979} -11/07/2021 00:46:47 - INFO - __main__ - Step 25299: {'lr': 0.00047004605673223567, 'samples': 4857408, 'steps': 25298, 'loss/train': 1.1666847467422485} -11/07/2021 00:46:48 - INFO - __main__ - Step 25300: {'lr': 0.00047004353793090903, 'samples': 4857600, 'steps': 25299, 'loss/train': 1.232759714126587} -11/07/2021 00:46:48 - INFO - __main__ - Step 25301: {'lr': 0.00047004101903043416, 'samples': 4857792, 'steps': 25300, 'loss/train': 0.6032378673553467} -11/07/2021 00:46:49 - INFO - __main__ - Step 25302: {'lr': 0.00047003850003081215, 'samples': 4857984, 'steps': 25301, 'loss/train': 1.9542654752731323} -11/07/2021 00:46:50 - INFO - __main__ - Step 25303: {'lr': 0.0004700359809320443, 'samples': 4858176, 'steps': 25302, 'loss/train': 1.7449018955230713} -11/07/2021 00:46:50 - INFO - __main__ - Step 25304: {'lr': 0.0004700334617341316, 'samples': 4858368, 'steps': 25303, 'loss/train': 1.4991850852966309} -11/07/2021 00:46:50 - INFO - __main__ - Step 25305: {'lr': 0.0004700309424370752, 'samples': 4858560, 'steps': 25304, 'loss/train': 1.3455928564071655} -11/07/2021 00:46:51 - INFO - __main__ - Step 25306: {'lr': 0.00047002842304087625, 'samples': 4858752, 'steps': 25305, 'loss/train': 0.9700114130973816} -11/07/2021 00:46:52 - INFO - __main__ - Step 25307: {'lr': 0.00047002590354553586, 'samples': 4858944, 'steps': 25306, 'loss/train': 0.09950239956378937} -11/07/2021 00:46:52 - INFO - __main__ - Step 25308: {'lr': 0.00047002338395105527, 'samples': 4859136, 'steps': 25307, 'loss/train': 2.488790988922119} -11/07/2021 00:46:53 - INFO - __main__ - Step 25309: {'lr': 0.00047002086425743545, 'samples': 4859328, 'steps': 25308, 'loss/train': 1.6912132501602173} -11/07/2021 00:46:53 - INFO - __main__ - Step 25310: {'lr': 0.0004700183444646776, 'samples': 4859520, 'steps': 25309, 'loss/train': 1.379109263420105} -11/07/2021 00:46:53 - INFO - __main__ - Step 25311: {'lr': 0.000470015824572783, 'samples': 4859712, 'steps': 25310, 'loss/train': 1.4917999505996704} -11/07/2021 00:46:54 - INFO - __main__ - Step 25312: {'lr': 0.00047001330458175264, 'samples': 4859904, 'steps': 25311, 'loss/train': 1.5213574171066284} -11/07/2021 00:46:55 - INFO - __main__ - Step 25313: {'lr': 0.0004700107844915876, 'samples': 4860096, 'steps': 25312, 'loss/train': 0.6688195466995239} -11/07/2021 00:46:55 - INFO - __main__ - Step 25314: {'lr': 0.00047000826430228915, 'samples': 4860288, 'steps': 25313, 'loss/train': 1.4643245935440063} -11/07/2021 00:46:55 - INFO - __main__ - Step 25315: {'lr': 0.00047000574401385835, 'samples': 4860480, 'steps': 25314, 'loss/train': 1.6544361114501953} -11/07/2021 00:46:56 - INFO - __main__ - Step 25316: {'lr': 0.0004700032236262964, 'samples': 4860672, 'steps': 25315, 'loss/train': 1.5297194719314575} -11/07/2021 00:46:57 - INFO - __main__ - Step 25317: {'lr': 0.00047000070313960436, 'samples': 4860864, 'steps': 25316, 'loss/train': 1.2998043298721313} -11/07/2021 00:46:57 - INFO - __main__ - Step 25318: {'lr': 0.00046999818255378335, 'samples': 4861056, 'steps': 25317, 'loss/train': 1.546887755393982} -11/07/2021 00:46:57 - INFO - __main__ - Step 25319: {'lr': 0.00046999566186883466, 'samples': 4861248, 'steps': 25318, 'loss/train': 1.403463363647461} -11/07/2021 00:46:58 - INFO - __main__ - Step 25320: {'lr': 0.0004699931410847592, 'samples': 4861440, 'steps': 25319, 'loss/train': 1.6991873979568481} -11/07/2021 00:46:58 - INFO - __main__ - Step 25321: {'lr': 0.00046999062020155834, 'samples': 4861632, 'steps': 25320, 'loss/train': 1.4992635250091553} -11/07/2021 00:46:59 - INFO - __main__ - Step 25322: {'lr': 0.00046998809921923305, 'samples': 4861824, 'steps': 25321, 'loss/train': 1.5245031118392944} -11/07/2021 00:46:59 - INFO - __main__ - Step 25323: {'lr': 0.0004699855781377845, 'samples': 4862016, 'steps': 25322, 'loss/train': 0.9190696477890015} -11/07/2021 00:47:00 - INFO - __main__ - Step 25324: {'lr': 0.0004699830569572139, 'samples': 4862208, 'steps': 25323, 'loss/train': 1.7949877977371216} -11/07/2021 00:47:00 - INFO - __main__ - Step 25325: {'lr': 0.00046998053567752225, 'samples': 4862400, 'steps': 25324, 'loss/train': 1.261948585510254} -11/07/2021 00:47:01 - INFO - __main__ - Step 25326: {'lr': 0.0004699780142987108, 'samples': 4862592, 'steps': 25325, 'loss/train': 1.4420384168624878} -11/07/2021 00:47:01 - INFO - __main__ - Step 25327: {'lr': 0.0004699754928207807, 'samples': 4862784, 'steps': 25326, 'loss/train': 1.365442156791687} -11/07/2021 00:47:02 - INFO - __main__ - Step 25328: {'lr': 0.00046997297124373293, 'samples': 4862976, 'steps': 25327, 'loss/train': 1.9386059045791626} -11/07/2021 00:47:02 - INFO - __main__ - Step 25329: {'lr': 0.00046997044956756883, 'samples': 4863168, 'steps': 25328, 'loss/train': 1.3372117280960083} -11/07/2021 00:47:03 - INFO - __main__ - Step 25330: {'lr': 0.00046996792779228935, 'samples': 4863360, 'steps': 25329, 'loss/train': 1.326066255569458} -11/07/2021 00:47:03 - INFO - __main__ - Step 25331: {'lr': 0.00046996540591789584, 'samples': 4863552, 'steps': 25330, 'loss/train': 1.7588785886764526} -11/07/2021 00:47:03 - INFO - __main__ - Step 25332: {'lr': 0.00046996288394438924, 'samples': 4863744, 'steps': 25331, 'loss/train': 1.963739275932312} -11/07/2021 00:47:06 - INFO - __main__ - Step 25333: {'lr': 0.00046996036187177073, 'samples': 4863936, 'steps': 25332, 'loss/train': 1.4010385274887085} -11/07/2021 00:47:06 - INFO - __main__ - Step 25334: {'lr': 0.0004699578397000415, 'samples': 4864128, 'steps': 25333, 'loss/train': 1.7472310066223145} -11/07/2021 00:47:06 - INFO - __main__ - Step 25335: {'lr': 0.00046995531742920264, 'samples': 4864320, 'steps': 25334, 'loss/train': 1.6207789182662964} -11/07/2021 00:47:07 - INFO - __main__ - Step 25336: {'lr': 0.00046995279505925535, 'samples': 4864512, 'steps': 25335, 'loss/train': 1.2272355556488037} -11/07/2021 00:47:07 - INFO - __main__ - Step 25337: {'lr': 0.00046995027259020075, 'samples': 4864704, 'steps': 25336, 'loss/train': 1.8280538320541382} -11/07/2021 00:47:07 - INFO - __main__ - Step 25338: {'lr': 0.00046994775002203994, 'samples': 4864896, 'steps': 25337, 'loss/train': 1.7909228801727295} -11/07/2021 00:47:08 - INFO - __main__ - Step 25339: {'lr': 0.000469945227354774, 'samples': 4865088, 'steps': 25338, 'loss/train': 0.8646075129508972} -11/07/2021 00:47:08 - INFO - __main__ - Step 25340: {'lr': 0.00046994270458840416, 'samples': 4865280, 'steps': 25339, 'loss/train': 1.7977173328399658} -11/07/2021 00:47:09 - INFO - __main__ - Step 25341: {'lr': 0.0004699401817229316, 'samples': 4865472, 'steps': 25340, 'loss/train': 0.9084984064102173} -11/07/2021 00:47:09 - INFO - __main__ - Step 25342: {'lr': 0.0004699376587583573, 'samples': 4865664, 'steps': 25341, 'loss/train': 1.1019365787506104} -11/07/2021 00:47:10 - INFO - __main__ - Step 25343: {'lr': 0.0004699351356946825, 'samples': 4865856, 'steps': 25342, 'loss/train': 1.4869623184204102} -11/07/2021 00:47:10 - INFO - __main__ - Step 25344: {'lr': 0.00046993261253190833, 'samples': 4866048, 'steps': 25343, 'loss/train': 1.684993863105774} -11/07/2021 00:47:10 - INFO - __main__ - Step 25345: {'lr': 0.000469930089270036, 'samples': 4866240, 'steps': 25344, 'loss/train': 1.3853352069854736} -11/07/2021 00:47:12 - INFO - __main__ - Step 25346: {'lr': 0.0004699275659090665, 'samples': 4866432, 'steps': 25345, 'loss/train': 1.6964845657348633} -11/07/2021 00:47:12 - INFO - __main__ - Step 25347: {'lr': 0.000469925042449001, 'samples': 4866624, 'steps': 25346, 'loss/train': 1.242707371711731} -11/07/2021 00:47:12 - INFO - __main__ - Step 25348: {'lr': 0.0004699225188898407, 'samples': 4866816, 'steps': 25347, 'loss/train': 1.0095255374908447} -11/07/2021 00:47:13 - INFO - __main__ - Step 25349: {'lr': 0.00046991999523158666, 'samples': 4867008, 'steps': 25348, 'loss/train': 1.6084877252578735} -11/07/2021 00:47:13 - INFO - __main__ - Step 25350: {'lr': 0.0004699174714742401, 'samples': 4867200, 'steps': 25349, 'loss/train': 1.6201637983322144} -11/07/2021 00:47:14 - INFO - __main__ - Step 25351: {'lr': 0.0004699149476178022, 'samples': 4867392, 'steps': 25350, 'loss/train': 1.87870192527771} -11/07/2021 00:47:14 - INFO - __main__ - Step 25352: {'lr': 0.00046991242366227395, 'samples': 4867584, 'steps': 25351, 'loss/train': 0.11543884128332138} -11/07/2021 00:47:15 - INFO - __main__ - Step 25353: {'lr': 0.0004699098996076565, 'samples': 4867776, 'steps': 25352, 'loss/train': 1.4073505401611328} -11/07/2021 00:47:15 - INFO - __main__ - Step 25354: {'lr': 0.0004699073754539511, 'samples': 4867968, 'steps': 25353, 'loss/train': 1.281815767288208} -11/07/2021 00:47:15 - INFO - __main__ - Step 25355: {'lr': 0.0004699048512011588, 'samples': 4868160, 'steps': 25354, 'loss/train': 2.1738197803497314} -11/07/2021 00:47:17 - INFO - __main__ - Step 25356: {'lr': 0.0004699023268492808, 'samples': 4868352, 'steps': 25355, 'loss/train': 1.910334587097168} -11/07/2021 00:47:17 - INFO - __main__ - Step 25357: {'lr': 0.0004698998023983182, 'samples': 4868544, 'steps': 25356, 'loss/train': 1.4859049320220947} -11/07/2021 00:47:17 - INFO - __main__ - Step 25358: {'lr': 0.0004698972778482722, 'samples': 4868736, 'steps': 25357, 'loss/train': 1.4127469062805176} -11/07/2021 00:47:18 - INFO - __main__ - Step 25359: {'lr': 0.0004698947531991438, 'samples': 4868928, 'steps': 25358, 'loss/train': 1.5658401250839233} -11/07/2021 00:47:18 - INFO - __main__ - Step 25360: {'lr': 0.0004698922284509342, 'samples': 4869120, 'steps': 25359, 'loss/train': 1.7960599660873413} -11/07/2021 00:47:19 - INFO - __main__ - Step 25361: {'lr': 0.00046988970360364456, 'samples': 4869312, 'steps': 25360, 'loss/train': 1.8280835151672363} -11/07/2021 00:47:19 - INFO - __main__ - Step 25362: {'lr': 0.0004698871786572761, 'samples': 4869504, 'steps': 25361, 'loss/train': 1.5560333728790283} -11/07/2021 00:47:20 - INFO - __main__ - Step 25363: {'lr': 0.0004698846536118298, 'samples': 4869696, 'steps': 25362, 'loss/train': 1.4659595489501953} -11/07/2021 00:47:20 - INFO - __main__ - Step 25364: {'lr': 0.00046988212846730686, 'samples': 4869888, 'steps': 25363, 'loss/train': 1.324087142944336} -11/07/2021 00:47:21 - INFO - __main__ - Step 25365: {'lr': 0.0004698796032237085, 'samples': 4870080, 'steps': 25364, 'loss/train': 1.577052354812622} -11/07/2021 00:47:22 - INFO - __main__ - Step 25366: {'lr': 0.0004698770778810357, 'samples': 4870272, 'steps': 25365, 'loss/train': 1.8698196411132812} -11/07/2021 00:47:22 - INFO - __main__ - Step 25367: {'lr': 0.00046987455243928974, 'samples': 4870464, 'steps': 25366, 'loss/train': 1.6207579374313354} -11/07/2021 00:47:22 - INFO - __main__ - Step 25368: {'lr': 0.00046987202689847165, 'samples': 4870656, 'steps': 25367, 'loss/train': 1.9728107452392578} -11/07/2021 00:47:23 - INFO - __main__ - Step 25369: {'lr': 0.00046986950125858264, 'samples': 4870848, 'steps': 25368, 'loss/train': 1.1386518478393555} -11/07/2021 00:47:23 - INFO - __main__ - Step 25370: {'lr': 0.0004698669755196239, 'samples': 4871040, 'steps': 25369, 'loss/train': 1.3435550928115845} -11/07/2021 00:47:24 - INFO - __main__ - Step 25371: {'lr': 0.0004698644496815964, 'samples': 4871232, 'steps': 25370, 'loss/train': 1.5909816026687622} -11/07/2021 00:47:24 - INFO - __main__ - Step 25372: {'lr': 0.0004698619237445013, 'samples': 4871424, 'steps': 25371, 'loss/train': 1.7607204914093018} -11/07/2021 00:47:25 - INFO - __main__ - Step 25373: {'lr': 0.00046985939770834, 'samples': 4871616, 'steps': 25372, 'loss/train': 1.651863932609558} -11/07/2021 00:47:25 - INFO - __main__ - Step 25374: {'lr': 0.0004698568715731133, 'samples': 4871808, 'steps': 25373, 'loss/train': 1.8538455963134766} -11/07/2021 00:47:25 - INFO - __main__ - Step 25375: {'lr': 0.00046985434533882255, 'samples': 4872000, 'steps': 25374, 'loss/train': 1.5987008810043335} -11/07/2021 00:47:27 - INFO - __main__ - Step 25376: {'lr': 0.00046985181900546883, 'samples': 4872192, 'steps': 25375, 'loss/train': 1.637808084487915} -11/07/2021 00:47:27 - INFO - __main__ - Step 25377: {'lr': 0.0004698492925730532, 'samples': 4872384, 'steps': 25376, 'loss/train': 1.5053311586380005} -11/07/2021 00:47:27 - INFO - __main__ - Step 25378: {'lr': 0.00046984676604157696, 'samples': 4872576, 'steps': 25377, 'loss/train': 1.6534550189971924} -11/07/2021 00:47:28 - INFO - __main__ - Step 25379: {'lr': 0.0004698442394110411, 'samples': 4872768, 'steps': 25378, 'loss/train': 1.3638150691986084} -11/07/2021 00:47:28 - INFO - __main__ - Step 25380: {'lr': 0.0004698417126814468, 'samples': 4872960, 'steps': 25379, 'loss/train': 1.1215922832489014} -11/07/2021 00:47:28 - INFO - __main__ - Step 25381: {'lr': 0.0004698391858527953, 'samples': 4873152, 'steps': 25380, 'loss/train': 1.7826118469238281} -11/07/2021 00:47:29 - INFO - __main__ - Step 25382: {'lr': 0.0004698366589250876, 'samples': 4873344, 'steps': 25381, 'loss/train': 1.8529301881790161} -11/07/2021 00:47:30 - INFO - __main__ - Step 25383: {'lr': 0.0004698341318983249, 'samples': 4873536, 'steps': 25382, 'loss/train': 0.7573006749153137} -11/07/2021 00:47:30 - INFO - __main__ - Step 25384: {'lr': 0.00046983160477250837, 'samples': 4873728, 'steps': 25383, 'loss/train': 1.7131630182266235} -11/07/2021 00:47:30 - INFO - __main__ - Step 25385: {'lr': 0.00046982907754763905, 'samples': 4873920, 'steps': 25384, 'loss/train': 1.6886578798294067} -11/07/2021 00:47:31 - INFO - __main__ - Step 25386: {'lr': 0.0004698265502237182, 'samples': 4874112, 'steps': 25385, 'loss/train': 1.656398892402649} -11/07/2021 00:47:32 - INFO - __main__ - Step 25387: {'lr': 0.0004698240228007469, 'samples': 4874304, 'steps': 25386, 'loss/train': 1.6194496154785156} -11/07/2021 00:47:32 - INFO - __main__ - Step 25388: {'lr': 0.0004698214952787262, 'samples': 4874496, 'steps': 25387, 'loss/train': 1.8319562673568726} -11/07/2021 00:47:33 - INFO - __main__ - Step 25389: {'lr': 0.0004698189676576574, 'samples': 4874688, 'steps': 25388, 'loss/train': 0.9109418988227844} -11/07/2021 00:47:33 - INFO - __main__ - Step 25390: {'lr': 0.00046981643993754155, 'samples': 4874880, 'steps': 25389, 'loss/train': 1.946299433708191} -11/07/2021 00:47:33 - INFO - __main__ - Step 25391: {'lr': 0.0004698139121183798, 'samples': 4875072, 'steps': 25390, 'loss/train': 1.7080029249191284} -11/07/2021 00:47:34 - INFO - __main__ - Step 25392: {'lr': 0.00046981138420017335, 'samples': 4875264, 'steps': 25391, 'loss/train': 1.9860248565673828} -11/07/2021 00:47:35 - INFO - __main__ - Step 25393: {'lr': 0.00046980885618292317, 'samples': 4875456, 'steps': 25392, 'loss/train': 1.5345799922943115} -11/07/2021 00:47:35 - INFO - __main__ - Step 25394: {'lr': 0.0004698063280666306, 'samples': 4875648, 'steps': 25393, 'loss/train': 1.693505883216858} -11/07/2021 00:47:35 - INFO - __main__ - Step 25395: {'lr': 0.0004698037998512966, 'samples': 4875840, 'steps': 25394, 'loss/train': 1.2428244352340698} -11/07/2021 00:47:36 - INFO - __main__ - Step 25396: {'lr': 0.00046980127153692256, 'samples': 4876032, 'steps': 25395, 'loss/train': 1.3942155838012695} -11/07/2021 00:47:36 - INFO - __main__ - Step 25397: {'lr': 0.00046979874312350935, 'samples': 4876224, 'steps': 25396, 'loss/train': 1.598301887512207} -11/07/2021 00:47:37 - INFO - __main__ - Step 25398: {'lr': 0.00046979621461105817, 'samples': 4876416, 'steps': 25397, 'loss/train': 1.7649084329605103} -11/07/2021 00:47:37 - INFO - __main__ - Step 25399: {'lr': 0.0004697936859995703, 'samples': 4876608, 'steps': 25398, 'loss/train': 1.5303013324737549} -11/07/2021 00:47:38 - INFO - __main__ - Step 25400: {'lr': 0.00046979115728904675, 'samples': 4876800, 'steps': 25399, 'loss/train': 1.4458239078521729} -11/07/2021 00:47:38 - INFO - __main__ - Step 25401: {'lr': 0.0004697886284794887, 'samples': 4876992, 'steps': 25400, 'loss/train': 1.4247881174087524} -11/07/2021 00:47:38 - INFO - __main__ - Step 25402: {'lr': 0.00046978609957089724, 'samples': 4877184, 'steps': 25401, 'loss/train': 1.2821444272994995} -11/07/2021 00:47:40 - INFO - __main__ - Step 25403: {'lr': 0.0004697835705632736, 'samples': 4877376, 'steps': 25402, 'loss/train': 1.5100736618041992} -11/07/2021 00:47:40 - INFO - __main__ - Step 25404: {'lr': 0.00046978104145661885, 'samples': 4877568, 'steps': 25403, 'loss/train': 1.4307785034179688} -11/07/2021 00:47:40 - INFO - __main__ - Step 25405: {'lr': 0.00046977851225093423, 'samples': 4877760, 'steps': 25404, 'loss/train': 2.60892915725708} -11/07/2021 00:47:41 - INFO - __main__ - Step 25406: {'lr': 0.0004697759829462207, 'samples': 4877952, 'steps': 25405, 'loss/train': 1.7201303243637085} -11/07/2021 00:47:41 - INFO - __main__ - Step 25407: {'lr': 0.0004697734535424796, 'samples': 4878144, 'steps': 25406, 'loss/train': 1.4767811298370361} -11/07/2021 00:47:42 - INFO - __main__ - Step 25408: {'lr': 0.0004697709240397119, 'samples': 4878336, 'steps': 25407, 'loss/train': 1.5929255485534668} -11/07/2021 00:47:42 - INFO - __main__ - Step 25409: {'lr': 0.00046976839443791887, 'samples': 4878528, 'steps': 25408, 'loss/train': 1.598000168800354} -11/07/2021 00:47:43 - INFO - __main__ - Step 25410: {'lr': 0.00046976586473710156, 'samples': 4878720, 'steps': 25409, 'loss/train': 1.6824252605438232} -11/07/2021 00:47:43 - INFO - __main__ - Step 25411: {'lr': 0.0004697633349372611, 'samples': 4878912, 'steps': 25410, 'loss/train': 1.4303624629974365} -11/07/2021 00:47:43 - INFO - __main__ - Step 25412: {'lr': 0.00046976080503839874, 'samples': 4879104, 'steps': 25411, 'loss/train': 1.5920426845550537} -11/07/2021 00:47:44 - INFO - __main__ - Step 25413: {'lr': 0.0004697582750405155, 'samples': 4879296, 'steps': 25412, 'loss/train': 1.718862771987915} -11/07/2021 00:47:45 - INFO - __main__ - Step 25414: {'lr': 0.00046975574494361263, 'samples': 4879488, 'steps': 25413, 'loss/train': 1.545186996459961} -11/07/2021 00:47:45 - INFO - __main__ - Step 25415: {'lr': 0.00046975321474769115, 'samples': 4879680, 'steps': 25414, 'loss/train': 1.6828172206878662} -11/07/2021 00:47:45 - INFO - __main__ - Step 25416: {'lr': 0.0004697506844527523, 'samples': 4879872, 'steps': 25415, 'loss/train': 1.047653079032898} -11/07/2021 00:47:46 - INFO - __main__ - Step 25417: {'lr': 0.0004697481540587972, 'samples': 4880064, 'steps': 25416, 'loss/train': 1.7983813285827637} -11/07/2021 00:47:47 - INFO - __main__ - Step 25418: {'lr': 0.00046974562356582694, 'samples': 4880256, 'steps': 25417, 'loss/train': 1.5987099409103394} -11/07/2021 00:47:47 - INFO - __main__ - Step 25419: {'lr': 0.0004697430929738427, 'samples': 4880448, 'steps': 25418, 'loss/train': 1.3499351739883423} -11/07/2021 00:47:48 - INFO - __main__ - Step 25420: {'lr': 0.0004697405622828456, 'samples': 4880640, 'steps': 25419, 'loss/train': 1.1702313423156738} -11/07/2021 00:47:48 - INFO - __main__ - Step 25421: {'lr': 0.00046973803149283686, 'samples': 4880832, 'steps': 25420, 'loss/train': 1.7239376306533813} -11/07/2021 00:47:48 - INFO - __main__ - Step 25422: {'lr': 0.0004697355006038175, 'samples': 4881024, 'steps': 25421, 'loss/train': 1.0425162315368652} -11/07/2021 00:47:49 - INFO - __main__ - Step 25423: {'lr': 0.0004697329696157887, 'samples': 4881216, 'steps': 25422, 'loss/train': 0.6917325854301453} -11/07/2021 00:47:50 - INFO - __main__ - Step 25424: {'lr': 0.00046973043852875163, 'samples': 4881408, 'steps': 25423, 'loss/train': 1.6703858375549316} -11/07/2021 00:47:50 - INFO - __main__ - Step 25425: {'lr': 0.00046972790734270745, 'samples': 4881600, 'steps': 25424, 'loss/train': 1.1467617750167847} -11/07/2021 00:47:50 - INFO - __main__ - Step 25426: {'lr': 0.0004697253760576572, 'samples': 4881792, 'steps': 25425, 'loss/train': 1.9418889284133911} -11/07/2021 00:47:51 - INFO - __main__ - Step 25427: {'lr': 0.00046972284467360217, 'samples': 4881984, 'steps': 25426, 'loss/train': 1.6337294578552246} -11/07/2021 00:47:52 - INFO - __main__ - Step 25428: {'lr': 0.0004697203131905433, 'samples': 4882176, 'steps': 25427, 'loss/train': 1.8798770904541016} -11/07/2021 00:47:52 - INFO - __main__ - Step 25429: {'lr': 0.00046971778160848196, 'samples': 4882368, 'steps': 25428, 'loss/train': 1.0612508058547974} -11/07/2021 00:47:52 - INFO - __main__ - Step 25430: {'lr': 0.0004697152499274191, 'samples': 4882560, 'steps': 25429, 'loss/train': 1.4720540046691895} -11/07/2021 00:47:53 - INFO - __main__ - Step 25431: {'lr': 0.00046971271814735593, 'samples': 4882752, 'steps': 25430, 'loss/train': 1.638587236404419} -11/07/2021 00:47:53 - INFO - __main__ - Step 25432: {'lr': 0.0004697101862682936, 'samples': 4882944, 'steps': 25431, 'loss/train': 1.127353310585022} -11/07/2021 00:47:54 - INFO - __main__ - Step 25433: {'lr': 0.00046970765429023336, 'samples': 4883136, 'steps': 25432, 'loss/train': 1.723750352859497} -11/07/2021 00:47:54 - INFO - __main__ - Step 25434: {'lr': 0.00046970512221317616, 'samples': 4883328, 'steps': 25433, 'loss/train': 1.5742734670639038} -11/07/2021 00:47:55 - INFO - __main__ - Step 25435: {'lr': 0.00046970259003712323, 'samples': 4883520, 'steps': 25434, 'loss/train': 1.4120583534240723} -11/07/2021 00:47:55 - INFO - __main__ - Step 25436: {'lr': 0.00046970005776207575, 'samples': 4883712, 'steps': 25435, 'loss/train': 1.7156976461410522} -11/07/2021 00:47:55 - INFO - __main__ - Step 25437: {'lr': 0.00046969752538803477, 'samples': 4883904, 'steps': 25436, 'loss/train': 1.1509177684783936} -11/07/2021 00:47:57 - INFO - __main__ - Step 25438: {'lr': 0.0004696949929150015, 'samples': 4884096, 'steps': 25437, 'loss/train': 1.466771125793457} -11/07/2021 00:47:57 - INFO - __main__ - Step 25439: {'lr': 0.00046969246034297697, 'samples': 4884288, 'steps': 25438, 'loss/train': 1.768174171447754} -11/07/2021 00:47:57 - INFO - __main__ - Step 25440: {'lr': 0.0004696899276719625, 'samples': 4884480, 'steps': 25439, 'loss/train': 1.7499266862869263} -11/07/2021 00:47:58 - INFO - __main__ - Step 25441: {'lr': 0.0004696873949019591, 'samples': 4884672, 'steps': 25440, 'loss/train': 1.9094892740249634} -11/07/2021 00:47:58 - INFO - __main__ - Step 25442: {'lr': 0.000469684862032968, 'samples': 4884864, 'steps': 25441, 'loss/train': 1.8627663850784302} -11/07/2021 00:47:58 - INFO - __main__ - Step 25443: {'lr': 0.0004696823290649902, 'samples': 4885056, 'steps': 25442, 'loss/train': 1.0269948244094849} -11/07/2021 00:48:00 - INFO - __main__ - Step 25444: {'lr': 0.000469679795998027, 'samples': 4885248, 'steps': 25443, 'loss/train': 2.533825635910034} -11/07/2021 00:48:00 - INFO - __main__ - Step 25445: {'lr': 0.00046967726283207945, 'samples': 4885440, 'steps': 25444, 'loss/train': 0.38005244731903076} -11/07/2021 00:48:00 - INFO - __main__ - Step 25446: {'lr': 0.0004696747295671487, 'samples': 4885632, 'steps': 25445, 'loss/train': 1.8956398963928223} -11/07/2021 00:48:01 - INFO - __main__ - Step 25447: {'lr': 0.000469672196203236, 'samples': 4885824, 'steps': 25446, 'loss/train': 1.2691547870635986} -11/07/2021 00:48:01 - INFO - __main__ - Step 25448: {'lr': 0.0004696696627403423, 'samples': 4886016, 'steps': 25447, 'loss/train': 1.8741952180862427} -11/07/2021 00:48:01 - INFO - __main__ - Step 25449: {'lr': 0.00046966712917846887, 'samples': 4886208, 'steps': 25448, 'loss/train': 1.662883996963501} -11/07/2021 00:48:02 - INFO - __main__ - Step 25450: {'lr': 0.00046966459551761684, 'samples': 4886400, 'steps': 25449, 'loss/train': 0.8091161847114563} -11/07/2021 00:48:03 - INFO - __main__ - Step 25451: {'lr': 0.00046966206175778723, 'samples': 4886592, 'steps': 25450, 'loss/train': 1.5671682357788086} -11/07/2021 00:48:03 - INFO - __main__ - Step 25452: {'lr': 0.0004696595278989814, 'samples': 4886784, 'steps': 25451, 'loss/train': 1.5331019163131714} -11/07/2021 00:48:03 - INFO - __main__ - Step 25453: {'lr': 0.00046965699394120033, 'samples': 4886976, 'steps': 25452, 'loss/train': 1.3922358751296997} -11/07/2021 00:48:04 - INFO - __main__ - Step 25454: {'lr': 0.0004696544598844452, 'samples': 4887168, 'steps': 25453, 'loss/train': 1.3637266159057617} -11/07/2021 00:48:05 - INFO - __main__ - Step 25455: {'lr': 0.00046965192572871723, 'samples': 4887360, 'steps': 25454, 'loss/train': 2.091482400894165} -11/07/2021 00:48:05 - INFO - __main__ - Step 25456: {'lr': 0.0004696493914740174, 'samples': 4887552, 'steps': 25455, 'loss/train': 1.694266676902771} -11/07/2021 00:48:05 - INFO - __main__ - Step 25457: {'lr': 0.00046964685712034697, 'samples': 4887744, 'steps': 25456, 'loss/train': 1.2359060049057007} -11/07/2021 00:48:06 - INFO - __main__ - Step 25458: {'lr': 0.00046964432266770713, 'samples': 4887936, 'steps': 25457, 'loss/train': 2.6210789680480957} -11/07/2021 00:48:06 - INFO - __main__ - Step 25459: {'lr': 0.0004696417881160989, 'samples': 4888128, 'steps': 25458, 'loss/train': 1.7765331268310547} -11/07/2021 00:48:07 - INFO - __main__ - Step 25460: {'lr': 0.0004696392534655234, 'samples': 4888320, 'steps': 25459, 'loss/train': 1.8273237943649292} -11/07/2021 00:48:07 - INFO - __main__ - Step 25461: {'lr': 0.0004696367187159819, 'samples': 4888512, 'steps': 25460, 'loss/train': 0.9927650094032288} -11/07/2021 00:48:08 - INFO - __main__ - Step 25462: {'lr': 0.00046963418386747547, 'samples': 4888704, 'steps': 25461, 'loss/train': 0.6545084118843079} -11/07/2021 00:48:08 - INFO - __main__ - Step 25463: {'lr': 0.0004696316489200053, 'samples': 4888896, 'steps': 25462, 'loss/train': 1.4440584182739258} -11/07/2021 00:48:08 - INFO - __main__ - Step 25464: {'lr': 0.00046962911387357246, 'samples': 4889088, 'steps': 25463, 'loss/train': 1.741220474243164} -11/07/2021 00:48:09 - INFO - __main__ - Step 25465: {'lr': 0.0004696265787281782, 'samples': 4889280, 'steps': 25464, 'loss/train': 1.5621095895767212} -11/07/2021 00:48:10 - INFO - __main__ - Step 25466: {'lr': 0.0004696240434838235, 'samples': 4889472, 'steps': 25465, 'loss/train': 1.0889923572540283} -11/07/2021 00:48:10 - INFO - __main__ - Step 25467: {'lr': 0.00046962150814050963, 'samples': 4889664, 'steps': 25466, 'loss/train': 1.4495553970336914} -11/07/2021 00:48:10 - INFO - __main__ - Step 25468: {'lr': 0.0004696189726982377, 'samples': 4889856, 'steps': 25467, 'loss/train': 1.2441531419754028} -11/07/2021 00:48:11 - INFO - __main__ - Step 25469: {'lr': 0.00046961643715700885, 'samples': 4890048, 'steps': 25468, 'loss/train': 1.3702870607376099} -11/07/2021 00:48:12 - INFO - __main__ - Step 25470: {'lr': 0.00046961390151682426, 'samples': 4890240, 'steps': 25469, 'loss/train': 1.9373600482940674} -11/07/2021 00:48:12 - INFO - __main__ - Step 25471: {'lr': 0.000469611365777685, 'samples': 4890432, 'steps': 25470, 'loss/train': 1.69800865650177} -11/07/2021 00:48:13 - INFO - __main__ - Step 25472: {'lr': 0.0004696088299395922, 'samples': 4890624, 'steps': 25471, 'loss/train': 0.9789637923240662} -11/07/2021 00:48:13 - INFO - __main__ - Step 25473: {'lr': 0.0004696062940025471, 'samples': 4890816, 'steps': 25472, 'loss/train': 1.6684023141860962} -11/07/2021 00:48:13 - INFO - __main__ - Step 25474: {'lr': 0.0004696037579665509, 'samples': 4891008, 'steps': 25473, 'loss/train': 1.4424618482589722} -11/07/2021 00:48:14 - INFO - __main__ - Step 25475: {'lr': 0.00046960122183160446, 'samples': 4891200, 'steps': 25474, 'loss/train': 1.417409062385559} -11/07/2021 00:48:15 - INFO - __main__ - Step 25476: {'lr': 0.00046959868559770914, 'samples': 4891392, 'steps': 25475, 'loss/train': 1.8746399879455566} -11/07/2021 00:48:15 - INFO - __main__ - Step 25477: {'lr': 0.00046959614926486606, 'samples': 4891584, 'steps': 25476, 'loss/train': 1.3747764825820923} -11/07/2021 00:48:16 - INFO - __main__ - Step 25478: {'lr': 0.00046959361283307636, 'samples': 4891776, 'steps': 25477, 'loss/train': 2.681973457336426} -11/07/2021 00:48:16 - INFO - __main__ - Step 25479: {'lr': 0.0004695910763023412, 'samples': 4891968, 'steps': 25478, 'loss/train': 1.392314076423645} -11/07/2021 00:48:16 - INFO - __main__ - Step 25480: {'lr': 0.0004695885396726616, 'samples': 4892160, 'steps': 25479, 'loss/train': 1.7377015352249146} -11/07/2021 00:48:17 - INFO - __main__ - Step 25481: {'lr': 0.00046958600294403887, 'samples': 4892352, 'steps': 25480, 'loss/train': 1.588399887084961} -11/07/2021 00:48:18 - INFO - __main__ - Step 25482: {'lr': 0.000469583466116474, 'samples': 4892544, 'steps': 25481, 'loss/train': 1.237380862236023} -11/07/2021 00:48:18 - INFO - __main__ - Step 25483: {'lr': 0.00046958092918996823, 'samples': 4892736, 'steps': 25482, 'loss/train': 1.4674667119979858} -11/07/2021 00:48:18 - INFO - __main__ - Step 25484: {'lr': 0.0004695783921645227, 'samples': 4892928, 'steps': 25483, 'loss/train': 2.004992961883545} -11/07/2021 00:48:19 - INFO - __main__ - Step 25485: {'lr': 0.00046957585504013853, 'samples': 4893120, 'steps': 25484, 'loss/train': 1.6140029430389404} -11/07/2021 00:48:20 - INFO - __main__ - Step 25486: {'lr': 0.0004695733178168169, 'samples': 4893312, 'steps': 25485, 'loss/train': 2.1163148880004883} -11/07/2021 00:48:20 - INFO - __main__ - Step 25487: {'lr': 0.00046957078049455895, 'samples': 4893504, 'steps': 25486, 'loss/train': 1.0973618030548096} -11/07/2021 00:48:21 - INFO - __main__ - Step 25488: {'lr': 0.00046956824307336565, 'samples': 4893696, 'steps': 25487, 'loss/train': 1.2262341976165771} -11/07/2021 00:48:21 - INFO - __main__ - Step 25489: {'lr': 0.0004695657055532384, 'samples': 4893888, 'steps': 25488, 'loss/train': 1.464012622833252} -11/07/2021 00:48:21 - INFO - __main__ - Step 25490: {'lr': 0.0004695631679341782, 'samples': 4894080, 'steps': 25489, 'loss/train': 1.6566625833511353} -11/07/2021 00:48:23 - INFO - __main__ - Step 25491: {'lr': 0.0004695606302161862, 'samples': 4894272, 'steps': 25490, 'loss/train': 1.4544919729232788} -11/07/2021 00:48:24 - INFO - __main__ - Step 25492: {'lr': 0.0004695580923992636, 'samples': 4894464, 'steps': 25491, 'loss/train': 5.552804946899414} -11/07/2021 00:48:24 - INFO - __main__ - Step 25493: {'lr': 0.0004695555544834116, 'samples': 4894656, 'steps': 25492, 'loss/train': 5.530755043029785} -11/07/2021 00:48:24 - INFO - __main__ - Step 25494: {'lr': 0.00046955301646863114, 'samples': 4894848, 'steps': 25493, 'loss/train': 5.656627178192139} -11/07/2021 00:48:25 - INFO - __main__ - Step 25495: {'lr': 0.0004695504783549235, 'samples': 4895040, 'steps': 25494, 'loss/train': 5.666793346405029} -11/07/2021 00:48:25 - INFO - __main__ - Step 25496: {'lr': 0.0004695479401422898, 'samples': 4895232, 'steps': 25495, 'loss/train': 1.751136302947998} -11/07/2021 00:48:25 - INFO - __main__ - Step 25497: {'lr': 0.0004695454018307312, 'samples': 4895424, 'steps': 25496, 'loss/train': 1.942580223083496} -11/07/2021 00:48:26 - INFO - __main__ - Step 25498: {'lr': 0.0004695428634202488, 'samples': 4895616, 'steps': 25497, 'loss/train': 1.7638825178146362} -11/07/2021 00:48:27 - INFO - __main__ - Step 25499: {'lr': 0.0004695403249108438, 'samples': 4895808, 'steps': 25498, 'loss/train': 1.5841854810714722} -11/07/2021 00:48:27 - INFO - __main__ - Step 25500: {'lr': 0.0004695377863025173, 'samples': 4896000, 'steps': 25499, 'loss/train': 1.8827564716339111} -11/07/2021 00:48:28 - INFO - __main__ - Step 25501: {'lr': 0.00046953524759527055, 'samples': 4896192, 'steps': 25500, 'loss/train': 1.5366376638412476} -11/07/2021 00:48:28 - INFO - __main__ - Step 25502: {'lr': 0.0004695327087891045, 'samples': 4896384, 'steps': 25501, 'loss/train': 1.039491891860962} -11/07/2021 00:48:28 - INFO - __main__ - Step 25503: {'lr': 0.00046953016988402044, 'samples': 4896576, 'steps': 25502, 'loss/train': 1.6493101119995117} -11/07/2021 00:48:29 - INFO - __main__ - Step 25504: {'lr': 0.0004695276308800194, 'samples': 4896768, 'steps': 25503, 'loss/train': 1.5515714883804321} -11/07/2021 00:48:30 - INFO - __main__ - Step 25505: {'lr': 0.00046952509177710267, 'samples': 4896960, 'steps': 25504, 'loss/train': 1.435947299003601} -11/07/2021 00:48:30 - INFO - __main__ - Step 25506: {'lr': 0.00046952255257527134, 'samples': 4897152, 'steps': 25505, 'loss/train': 1.8032622337341309} -11/07/2021 00:48:31 - INFO - __main__ - Step 25507: {'lr': 0.0004695200132745265, 'samples': 4897344, 'steps': 25506, 'loss/train': 1.7287282943725586} -11/07/2021 00:48:31 - INFO - __main__ - Step 25508: {'lr': 0.00046951747387486933, 'samples': 4897536, 'steps': 25507, 'loss/train': 1.765174388885498} -11/07/2021 00:48:32 - INFO - __main__ - Step 25509: {'lr': 0.00046951493437630097, 'samples': 4897728, 'steps': 25508, 'loss/train': 1.709006667137146} -11/07/2021 00:48:33 - INFO - __main__ - Step 25510: {'lr': 0.0004695123947788226, 'samples': 4897920, 'steps': 25509, 'loss/train': 1.191457748413086} -11/07/2021 00:48:33 - INFO - __main__ - Step 25511: {'lr': 0.0004695098550824353, 'samples': 4898112, 'steps': 25510, 'loss/train': 2.3190207481384277} -11/07/2021 00:48:33 - INFO - __main__ - Step 25512: {'lr': 0.0004695073152871403, 'samples': 4898304, 'steps': 25511, 'loss/train': 1.6699031591415405} -11/07/2021 00:48:34 - INFO - __main__ - Step 25513: {'lr': 0.00046950477539293864, 'samples': 4898496, 'steps': 25512, 'loss/train': 0.8998978734016418} -11/07/2021 00:48:35 - INFO - __main__ - Step 25514: {'lr': 0.0004695022353998315, 'samples': 4898688, 'steps': 25513, 'loss/train': 0.20698074996471405} -11/07/2021 00:48:35 - INFO - __main__ - Step 25515: {'lr': 0.0004694996953078201, 'samples': 4898880, 'steps': 25514, 'loss/train': 1.1759369373321533} -11/07/2021 00:48:35 - INFO - __main__ - Step 25516: {'lr': 0.0004694971551169055, 'samples': 4899072, 'steps': 25515, 'loss/train': 2.215197801589966} -11/07/2021 00:48:36 - INFO - __main__ - Step 25517: {'lr': 0.00046949461482708875, 'samples': 4899264, 'steps': 25516, 'loss/train': 1.4564876556396484} -11/07/2021 00:48:36 - INFO - __main__ - Step 25518: {'lr': 0.0004694920744383713, 'samples': 4899456, 'steps': 25517, 'loss/train': 1.4380667209625244} -11/07/2021 00:48:37 - INFO - __main__ - Step 25519: {'lr': 0.000469489533950754, 'samples': 4899648, 'steps': 25518, 'loss/train': 2.123898506164551} -11/07/2021 00:48:37 - INFO - __main__ - Step 25520: {'lr': 0.00046948699336423817, 'samples': 4899840, 'steps': 25519, 'loss/train': 1.817137598991394} -11/07/2021 00:48:38 - INFO - __main__ - Step 25521: {'lr': 0.0004694844526788248, 'samples': 4900032, 'steps': 25520, 'loss/train': 1.683441162109375} -11/07/2021 00:48:38 - INFO - __main__ - Step 25522: {'lr': 0.0004694819118945152, 'samples': 4900224, 'steps': 25521, 'loss/train': 1.1400400400161743} -11/07/2021 00:48:39 - INFO - __main__ - Step 25523: {'lr': 0.00046947937101131046, 'samples': 4900416, 'steps': 25522, 'loss/train': 2.1464781761169434} -11/07/2021 00:48:39 - INFO - __main__ - Step 25524: {'lr': 0.0004694768300292116, 'samples': 4900608, 'steps': 25523, 'loss/train': 6.091759204864502} -11/07/2021 00:48:40 - INFO - __main__ - Step 25525: {'lr': 0.0004694742889482199, 'samples': 4900800, 'steps': 25524, 'loss/train': 1.5668319463729858} -11/07/2021 00:48:40 - INFO - __main__ - Step 25526: {'lr': 0.0004694717477683365, 'samples': 4900992, 'steps': 25525, 'loss/train': 1.4446377754211426} -11/07/2021 00:48:41 - INFO - __main__ - Step 25527: {'lr': 0.0004694692064895625, 'samples': 4901184, 'steps': 25526, 'loss/train': 0.9974812865257263} -11/07/2021 00:48:41 - INFO - __main__ - Step 25528: {'lr': 0.0004694666651118991, 'samples': 4901376, 'steps': 25527, 'loss/train': 1.7450157403945923} -11/07/2021 00:48:41 - INFO - __main__ - Step 25529: {'lr': 0.00046946412363534735, 'samples': 4901568, 'steps': 25528, 'loss/train': 1.9022449254989624} -11/07/2021 00:48:43 - INFO - __main__ - Step 25530: {'lr': 0.0004694615820599085, 'samples': 4901760, 'steps': 25529, 'loss/train': 1.3847417831420898} -11/07/2021 00:48:43 - INFO - __main__ - Step 25531: {'lr': 0.00046945904038558364, 'samples': 4901952, 'steps': 25530, 'loss/train': 1.3199286460876465} -11/07/2021 00:48:43 - INFO - __main__ - Step 25532: {'lr': 0.00046945649861237387, 'samples': 4902144, 'steps': 25531, 'loss/train': 1.8600738048553467} -11/07/2021 00:48:44 - INFO - __main__ - Step 25533: {'lr': 0.00046945395674028047, 'samples': 4902336, 'steps': 25532, 'loss/train': 1.9562991857528687} -11/07/2021 00:48:44 - INFO - __main__ - Step 25534: {'lr': 0.0004694514147693044, 'samples': 4902528, 'steps': 25533, 'loss/train': 1.8586628437042236} -11/07/2021 00:48:45 - INFO - __main__ - Step 25535: {'lr': 0.000469448872699447, 'samples': 4902720, 'steps': 25534, 'loss/train': 1.3385511636734009} -11/07/2021 00:48:45 - INFO - __main__ - Step 25536: {'lr': 0.0004694463305307093, 'samples': 4902912, 'steps': 25535, 'loss/train': 1.7087907791137695} -11/07/2021 00:48:46 - INFO - __main__ - Step 25537: {'lr': 0.00046944378826309244, 'samples': 4903104, 'steps': 25536, 'loss/train': 1.7909225225448608} -11/07/2021 00:48:46 - INFO - __main__ - Step 25538: {'lr': 0.00046944124589659765, 'samples': 4903296, 'steps': 25537, 'loss/train': 1.7152092456817627} -11/07/2021 00:48:47 - INFO - __main__ - Step 25539: {'lr': 0.00046943870343122595, 'samples': 4903488, 'steps': 25538, 'loss/train': 1.7453871965408325} -11/07/2021 00:48:47 - INFO - __main__ - Step 25540: {'lr': 0.0004694361608669786, 'samples': 4903680, 'steps': 25539, 'loss/train': 1.4773492813110352} -11/07/2021 00:48:47 - INFO - __main__ - Step 25541: {'lr': 0.0004694336182038567, 'samples': 4903872, 'steps': 25540, 'loss/train': 1.7164955139160156} -11/07/2021 00:48:48 - INFO - __main__ - Step 25542: {'lr': 0.00046943107544186144, 'samples': 4904064, 'steps': 25541, 'loss/train': 1.448752760887146} -11/07/2021 00:48:49 - INFO - __main__ - Step 25543: {'lr': 0.0004694285325809938, 'samples': 4904256, 'steps': 25542, 'loss/train': 1.6738860607147217} -11/07/2021 00:48:49 - INFO - __main__ - Step 25544: {'lr': 0.00046942598962125515, 'samples': 4904448, 'steps': 25543, 'loss/train': 1.511159062385559} -11/07/2021 00:48:49 - INFO - __main__ - Step 25545: {'lr': 0.00046942344656264657, 'samples': 4904640, 'steps': 25544, 'loss/train': 1.6937353610992432} -11/07/2021 00:48:50 - INFO - __main__ - Step 25546: {'lr': 0.0004694209034051691, 'samples': 4904832, 'steps': 25545, 'loss/train': 1.914302945137024} -11/07/2021 00:48:51 - INFO - __main__ - Step 25547: {'lr': 0.00046941836014882394, 'samples': 4905024, 'steps': 25546, 'loss/train': 1.5163538455963135} -11/07/2021 00:48:51 - INFO - __main__ - Step 25548: {'lr': 0.00046941581679361234, 'samples': 4905216, 'steps': 25547, 'loss/train': 1.1521172523498535} -11/07/2021 00:48:51 - INFO - __main__ - Step 25549: {'lr': 0.00046941327333953526, 'samples': 4905408, 'steps': 25548, 'loss/train': 1.5841848850250244} -11/07/2021 00:48:52 - INFO - __main__ - Step 25550: {'lr': 0.00046941072978659397, 'samples': 4905600, 'steps': 25549, 'loss/train': 1.1602411270141602} -11/07/2021 00:48:52 - INFO - __main__ - Step 25551: {'lr': 0.00046940818613478964, 'samples': 4905792, 'steps': 25550, 'loss/train': 1.572580337524414} -11/07/2021 00:48:53 - INFO - __main__ - Step 25552: {'lr': 0.0004694056423841233, 'samples': 4905984, 'steps': 25551, 'loss/train': 1.8355903625488281} -11/07/2021 00:48:54 - INFO - __main__ - Step 25553: {'lr': 0.00046940309853459625, 'samples': 4906176, 'steps': 25552, 'loss/train': 1.4142526388168335} -11/07/2021 00:48:54 - INFO - __main__ - Step 25554: {'lr': 0.00046940055458620945, 'samples': 4906368, 'steps': 25553, 'loss/train': 1.5380394458770752} -11/07/2021 00:48:54 - INFO - __main__ - Step 25555: {'lr': 0.0004693980105389642, 'samples': 4906560, 'steps': 25554, 'loss/train': 1.888519287109375} -11/07/2021 00:48:55 - INFO - __main__ - Step 25556: {'lr': 0.00046939546639286156, 'samples': 4906752, 'steps': 25555, 'loss/train': 1.2919965982437134} -11/07/2021 00:48:56 - INFO - __main__ - Step 25557: {'lr': 0.00046939292214790275, 'samples': 4906944, 'steps': 25556, 'loss/train': 1.5348103046417236} -11/07/2021 00:48:56 - INFO - __main__ - Step 25558: {'lr': 0.0004693903778040889, 'samples': 4907136, 'steps': 25557, 'loss/train': 1.0258276462554932} -11/07/2021 00:48:56 - INFO - __main__ - Step 25559: {'lr': 0.0004693878333614211, 'samples': 4907328, 'steps': 25558, 'loss/train': 1.624510407447815} -11/07/2021 00:48:57 - INFO - __main__ - Step 25560: {'lr': 0.0004693852888199005, 'samples': 4907520, 'steps': 25559, 'loss/train': 1.7044670581817627} -11/07/2021 00:48:57 - INFO - __main__ - Step 25561: {'lr': 0.0004693827441795283, 'samples': 4907712, 'steps': 25560, 'loss/train': 1.3589155673980713} -11/07/2021 00:48:57 - INFO - __main__ - Step 25562: {'lr': 0.00046938019944030556, 'samples': 4907904, 'steps': 25561, 'loss/train': 1.0206115245819092} -11/07/2021 00:48:58 - INFO - __main__ - Step 25563: {'lr': 0.00046937765460223357, 'samples': 4908096, 'steps': 25562, 'loss/train': 1.426313877105713} -11/07/2021 00:48:59 - INFO - __main__ - Step 25564: {'lr': 0.0004693751096653134, 'samples': 4908288, 'steps': 25563, 'loss/train': 1.781064510345459} -11/07/2021 00:48:59 - INFO - __main__ - Step 25565: {'lr': 0.00046937256462954615, 'samples': 4908480, 'steps': 25564, 'loss/train': 0.6571682691574097} -11/07/2021 00:48:59 - INFO - __main__ - Step 25566: {'lr': 0.00046937001949493294, 'samples': 4908672, 'steps': 25565, 'loss/train': 1.5839568376541138} -11/07/2021 00:49:00 - INFO - __main__ - Step 25567: {'lr': 0.0004693674742614751, 'samples': 4908864, 'steps': 25566, 'loss/train': 1.3333218097686768} -11/07/2021 00:49:01 - INFO - __main__ - Step 25568: {'lr': 0.0004693649289291736, 'samples': 4909056, 'steps': 25567, 'loss/train': 1.342308759689331} -11/07/2021 00:49:01 - INFO - __main__ - Step 25569: {'lr': 0.0004693623834980297, 'samples': 4909248, 'steps': 25568, 'loss/train': 1.3374139070510864} -11/07/2021 00:49:02 - INFO - __main__ - Step 25570: {'lr': 0.00046935983796804443, 'samples': 4909440, 'steps': 25569, 'loss/train': 0.830653727054596} -11/07/2021 00:49:02 - INFO - __main__ - Step 25571: {'lr': 0.000469357292339219, 'samples': 4909632, 'steps': 25570, 'loss/train': 1.6451069116592407} -11/07/2021 00:49:02 - INFO - __main__ - Step 25572: {'lr': 0.00046935474661155465, 'samples': 4909824, 'steps': 25571, 'loss/train': 1.5277132987976074} -11/07/2021 00:49:03 - INFO - __main__ - Step 25573: {'lr': 0.00046935220078505235, 'samples': 4910016, 'steps': 25572, 'loss/train': 1.750598430633545} -11/07/2021 00:49:04 - INFO - __main__ - Step 25574: {'lr': 0.00046934965485971337, 'samples': 4910208, 'steps': 25573, 'loss/train': 0.6289024353027344} -11/07/2021 00:49:04 - INFO - __main__ - Step 25575: {'lr': 0.00046934710883553884, 'samples': 4910400, 'steps': 25574, 'loss/train': 1.674824595451355} -11/07/2021 00:49:04 - INFO - __main__ - Step 25576: {'lr': 0.00046934456271252985, 'samples': 4910592, 'steps': 25575, 'loss/train': 1.5637032985687256} -11/07/2021 00:49:05 - INFO - __main__ - Step 25577: {'lr': 0.0004693420164906876, 'samples': 4910784, 'steps': 25576, 'loss/train': 1.707536220550537} -11/07/2021 00:49:06 - INFO - __main__ - Step 25578: {'lr': 0.0004693394701700132, 'samples': 4910976, 'steps': 25577, 'loss/train': 1.2549412250518799} -11/07/2021 00:49:06 - INFO - __main__ - Step 25579: {'lr': 0.00046933692375050783, 'samples': 4911168, 'steps': 25578, 'loss/train': 0.6779226064682007} -11/07/2021 00:49:06 - INFO - __main__ - Step 25580: {'lr': 0.00046933437723217265, 'samples': 4911360, 'steps': 25579, 'loss/train': 1.3821730613708496} -11/07/2021 00:49:07 - INFO - __main__ - Step 25581: {'lr': 0.0004693318306150087, 'samples': 4911552, 'steps': 25580, 'loss/train': 2.004680633544922} -11/07/2021 00:49:07 - INFO - __main__ - Step 25582: {'lr': 0.0004693292838990173, 'samples': 4911744, 'steps': 25581, 'loss/train': 1.2198615074157715} -11/07/2021 00:49:08 - INFO - __main__ - Step 25583: {'lr': 0.0004693267370841995, 'samples': 4911936, 'steps': 25582, 'loss/train': 1.6979387998580933} -11/07/2021 00:49:09 - INFO - __main__ - Step 25584: {'lr': 0.00046932419017055646, 'samples': 4912128, 'steps': 25583, 'loss/train': 1.5728169679641724} -11/07/2021 00:49:09 - INFO - __main__ - Step 25585: {'lr': 0.0004693216431580893, 'samples': 4912320, 'steps': 25584, 'loss/train': 1.439206838607788} -11/07/2021 00:49:09 - INFO - __main__ - Step 25586: {'lr': 0.00046931909604679925, 'samples': 4912512, 'steps': 25585, 'loss/train': 1.6354206800460815} -11/07/2021 00:49:10 - INFO - __main__ - Step 25587: {'lr': 0.0004693165488366873, 'samples': 4912704, 'steps': 25586, 'loss/train': 1.040775179862976} -11/07/2021 00:49:11 - INFO - __main__ - Step 25588: {'lr': 0.00046931400152775473, 'samples': 4912896, 'steps': 25587, 'loss/train': 1.4883759021759033} -11/07/2021 00:49:11 - INFO - __main__ - Step 25589: {'lr': 0.00046931145412000265, 'samples': 4913088, 'steps': 25588, 'loss/train': 1.6937187910079956} -11/07/2021 00:49:11 - INFO - __main__ - Step 25590: {'lr': 0.00046930890661343226, 'samples': 4913280, 'steps': 25589, 'loss/train': 1.5540019273757935} -11/07/2021 00:49:12 - INFO - __main__ - Step 25591: {'lr': 0.00046930635900804466, 'samples': 4913472, 'steps': 25590, 'loss/train': 1.1948552131652832} -11/07/2021 00:49:12 - INFO - __main__ - Step 25592: {'lr': 0.0004693038113038409, 'samples': 4913664, 'steps': 25591, 'loss/train': 1.5493038892745972} -11/07/2021 00:49:13 - INFO - __main__ - Step 25593: {'lr': 0.0004693012635008224, 'samples': 4913856, 'steps': 25592, 'loss/train': 1.657433271408081} -11/07/2021 00:49:13 - INFO - __main__ - Step 25594: {'lr': 0.00046929871559898994, 'samples': 4914048, 'steps': 25593, 'loss/train': 1.1808425188064575} -11/07/2021 00:49:14 - INFO - __main__ - Step 25595: {'lr': 0.00046929616759834505, 'samples': 4914240, 'steps': 25594, 'loss/train': 1.7247182130813599} -11/07/2021 00:49:14 - INFO - __main__ - Step 25596: {'lr': 0.00046929361949888857, 'samples': 4914432, 'steps': 25595, 'loss/train': 1.9493794441223145} -11/07/2021 00:49:14 - INFO - __main__ - Step 25597: {'lr': 0.00046929107130062176, 'samples': 4914624, 'steps': 25596, 'loss/train': 1.5374634265899658} -11/07/2021 00:49:15 - INFO - __main__ - Step 25598: {'lr': 0.00046928852300354585, 'samples': 4914816, 'steps': 25597, 'loss/train': 1.6057541370391846} -11/07/2021 00:49:16 - INFO - __main__ - Step 25599: {'lr': 0.0004692859746076619, 'samples': 4915008, 'steps': 25598, 'loss/train': 1.3104592561721802} -11/07/2021 00:49:16 - INFO - __main__ - Step 25600: {'lr': 0.00046928342611297105, 'samples': 4915200, 'steps': 25599, 'loss/train': 1.26352059841156} -11/07/2021 00:49:16 - INFO - __main__ - Step 25601: {'lr': 0.00046928087751947444, 'samples': 4915392, 'steps': 25600, 'loss/train': 1.4352083206176758} -11/07/2021 00:49:17 - INFO - __main__ - Step 25602: {'lr': 0.00046927832882717323, 'samples': 4915584, 'steps': 25601, 'loss/train': 1.254616618156433} -11/07/2021 00:49:18 - INFO - __main__ - Step 25603: {'lr': 0.0004692757800360687, 'samples': 4915776, 'steps': 25602, 'loss/train': 1.7988314628601074} -11/07/2021 00:49:18 - INFO - __main__ - Step 25604: {'lr': 0.0004692732311461618, 'samples': 4915968, 'steps': 25603, 'loss/train': 1.255089521408081} -11/07/2021 00:49:18 - INFO - __main__ - Step 25605: {'lr': 0.0004692706821574538, 'samples': 4916160, 'steps': 25604, 'loss/train': 1.0325216054916382} -11/07/2021 00:49:19 - INFO - __main__ - Step 25606: {'lr': 0.00046926813306994586, 'samples': 4916352, 'steps': 25605, 'loss/train': 1.6360634565353394} -11/07/2021 00:49:19 - INFO - __main__ - Step 25607: {'lr': 0.00046926558388363904, 'samples': 4916544, 'steps': 25606, 'loss/train': 1.79670250415802} -11/07/2021 00:49:20 - INFO - __main__ - Step 25608: {'lr': 0.00046926303459853447, 'samples': 4916736, 'steps': 25607, 'loss/train': 1.8682706356048584} -11/07/2021 00:49:21 - INFO - __main__ - Step 25609: {'lr': 0.00046926048521463344, 'samples': 4916928, 'steps': 25608, 'loss/train': 1.3411468267440796} -11/07/2021 00:49:21 - INFO - __main__ - Step 25610: {'lr': 0.000469257935731937, 'samples': 4917120, 'steps': 25609, 'loss/train': 1.0871062278747559} -11/07/2021 00:49:21 - INFO - __main__ - Step 25611: {'lr': 0.0004692553861504463, 'samples': 4917312, 'steps': 25610, 'loss/train': 1.6056123971939087} -11/07/2021 00:49:22 - INFO - __main__ - Step 25612: {'lr': 0.00046925283647016253, 'samples': 4917504, 'steps': 25611, 'loss/train': 1.4586424827575684} -11/07/2021 00:49:23 - INFO - __main__ - Step 25613: {'lr': 0.0004692502866910868, 'samples': 4917696, 'steps': 25612, 'loss/train': 1.538058876991272} -11/07/2021 00:49:23 - INFO - __main__ - Step 25614: {'lr': 0.0004692477368132203, 'samples': 4917888, 'steps': 25613, 'loss/train': 1.575411319732666} -11/07/2021 00:49:23 - INFO - __main__ - Step 25615: {'lr': 0.0004692451868365641, 'samples': 4918080, 'steps': 25614, 'loss/train': 1.7118977308273315} -11/07/2021 00:49:24 - INFO - __main__ - Step 25616: {'lr': 0.00046924263676111945, 'samples': 4918272, 'steps': 25615, 'loss/train': 2.131321907043457} -11/07/2021 00:49:24 - INFO - __main__ - Step 25617: {'lr': 0.00046924008658688745, 'samples': 4918464, 'steps': 25616, 'loss/train': 2.023993968963623} -11/07/2021 00:49:25 - INFO - __main__ - Step 25618: {'lr': 0.00046923753631386924, 'samples': 4918656, 'steps': 25617, 'loss/train': 1.8225526809692383} -11/07/2021 00:49:25 - INFO - __main__ - Step 25619: {'lr': 0.0004692349859420659, 'samples': 4918848, 'steps': 25618, 'loss/train': 1.5940064191818237} -11/07/2021 00:49:26 - INFO - __main__ - Step 25620: {'lr': 0.00046923243547147874, 'samples': 4919040, 'steps': 25619, 'loss/train': 1.45718252658844} -11/07/2021 00:49:26 - INFO - __main__ - Step 25621: {'lr': 0.0004692298849021088, 'samples': 4919232, 'steps': 25620, 'loss/train': 1.6011896133422852} -11/07/2021 00:49:26 - INFO - __main__ - Step 25622: {'lr': 0.00046922733423395736, 'samples': 4919424, 'steps': 25621, 'loss/train': 1.3006465435028076} -11/07/2021 00:49:27 - INFO - __main__ - Step 25623: {'lr': 0.0004692247834670253, 'samples': 4919616, 'steps': 25622, 'loss/train': 1.3544636964797974} -11/07/2021 00:49:28 - INFO - __main__ - Step 25624: {'lr': 0.000469222232601314, 'samples': 4919808, 'steps': 25623, 'loss/train': 1.1881569623947144} -11/07/2021 00:49:28 - INFO - __main__ - Step 25625: {'lr': 0.0004692196816368246, 'samples': 4920000, 'steps': 25624, 'loss/train': 1.6739518642425537} -11/07/2021 00:49:28 - INFO - __main__ - Step 25626: {'lr': 0.00046921713057355817, 'samples': 4920192, 'steps': 25625, 'loss/train': 1.2167147397994995} -11/07/2021 00:49:29 - INFO - __main__ - Step 25627: {'lr': 0.0004692145794115159, 'samples': 4920384, 'steps': 25626, 'loss/train': 1.683274269104004} -11/07/2021 00:49:29 - INFO - __main__ - Step 25628: {'lr': 0.00046921202815069883, 'samples': 4920576, 'steps': 25627, 'loss/train': 1.4491691589355469} -11/07/2021 00:49:30 - INFO - __main__ - Step 25629: {'lr': 0.00046920947679110833, 'samples': 4920768, 'steps': 25628, 'loss/train': 1.2186248302459717} -11/07/2021 00:49:31 - INFO - __main__ - Step 25630: {'lr': 0.00046920692533274533, 'samples': 4920960, 'steps': 25629, 'loss/train': 1.3265304565429688} -11/07/2021 00:49:31 - INFO - __main__ - Step 25631: {'lr': 0.0004692043737756111, 'samples': 4921152, 'steps': 25630, 'loss/train': 1.4819444417953491} -11/07/2021 00:49:31 - INFO - __main__ - Step 25632: {'lr': 0.00046920182211970677, 'samples': 4921344, 'steps': 25631, 'loss/train': 0.8713647127151489} -11/07/2021 00:49:32 - INFO - __main__ - Step 25633: {'lr': 0.00046919927036503353, 'samples': 4921536, 'steps': 25632, 'loss/train': 1.6610690355300903} -11/07/2021 00:49:33 - INFO - __main__ - Step 25634: {'lr': 0.0004691967185115924, 'samples': 4921728, 'steps': 25633, 'loss/train': 1.2283509969711304} -11/07/2021 00:49:33 - INFO - __main__ - Step 25635: {'lr': 0.00046919416655938465, 'samples': 4921920, 'steps': 25634, 'loss/train': 1.736107349395752} -11/07/2021 00:49:34 - INFO - __main__ - Step 25636: {'lr': 0.0004691916145084113, 'samples': 4922112, 'steps': 25635, 'loss/train': 1.667926549911499} -11/07/2021 00:49:34 - INFO - __main__ - Step 25637: {'lr': 0.0004691890623586737, 'samples': 4922304, 'steps': 25636, 'loss/train': 0.921523928642273} -11/07/2021 00:49:35 - INFO - __main__ - Step 25638: {'lr': 0.00046918651011017287, 'samples': 4922496, 'steps': 25637, 'loss/train': 1.4885398149490356} -11/07/2021 00:49:35 - INFO - __main__ - Step 25639: {'lr': 0.00046918395776290997, 'samples': 4922688, 'steps': 25638, 'loss/train': 1.7190399169921875} -11/07/2021 00:49:36 - INFO - __main__ - Step 25640: {'lr': 0.0004691814053168861, 'samples': 4922880, 'steps': 25639, 'loss/train': 1.4409922361373901} -11/07/2021 00:49:36 - INFO - __main__ - Step 25641: {'lr': 0.0004691788527721026, 'samples': 4923072, 'steps': 25640, 'loss/train': 1.4608443975448608} -11/07/2021 00:49:36 - INFO - __main__ - Step 25642: {'lr': 0.0004691763001285604, 'samples': 4923264, 'steps': 25641, 'loss/train': 1.7773683071136475} -11/07/2021 00:49:37 - INFO - __main__ - Step 25643: {'lr': 0.0004691737473862607, 'samples': 4923456, 'steps': 25642, 'loss/train': 1.7889008522033691} -11/07/2021 00:49:38 - INFO - __main__ - Step 25644: {'lr': 0.00046917119454520487, 'samples': 4923648, 'steps': 25643, 'loss/train': 1.1047998666763306} -11/07/2021 00:49:38 - INFO - __main__ - Step 25645: {'lr': 0.00046916864160539376, 'samples': 4923840, 'steps': 25644, 'loss/train': 1.7732115983963013} -11/07/2021 00:49:38 - INFO - __main__ - Step 25646: {'lr': 0.00046916608856682865, 'samples': 4924032, 'steps': 25645, 'loss/train': 1.751808524131775} -11/07/2021 00:49:39 - INFO - __main__ - Step 25647: {'lr': 0.0004691635354295106, 'samples': 4924224, 'steps': 25646, 'loss/train': 1.6011745929718018} -11/07/2021 00:49:39 - INFO - __main__ - Step 25648: {'lr': 0.00046916098219344093, 'samples': 4924416, 'steps': 25647, 'loss/train': 1.3450523614883423} -11/07/2021 00:49:40 - INFO - __main__ - Step 25649: {'lr': 0.0004691584288586207, 'samples': 4924608, 'steps': 25648, 'loss/train': 0.7353626489639282} -11/07/2021 00:49:41 - INFO - __main__ - Step 25650: {'lr': 0.0004691558754250511, 'samples': 4924800, 'steps': 25649, 'loss/train': 0.6195133328437805} -11/07/2021 00:49:41 - INFO - __main__ - Step 25651: {'lr': 0.0004691533218927332, 'samples': 4924992, 'steps': 25650, 'loss/train': 1.8022180795669556} -11/07/2021 00:49:41 - INFO - __main__ - Step 25652: {'lr': 0.00046915076826166814, 'samples': 4925184, 'steps': 25651, 'loss/train': 1.5118467807769775} -11/07/2021 00:49:42 - INFO - __main__ - Step 25653: {'lr': 0.0004691482145318572, 'samples': 4925376, 'steps': 25652, 'loss/train': 1.5533722639083862} -11/07/2021 00:49:43 - INFO - __main__ - Step 25654: {'lr': 0.00046914566070330144, 'samples': 4925568, 'steps': 25653, 'loss/train': 2.113215446472168} -11/07/2021 00:49:43 - INFO - __main__ - Step 25655: {'lr': 0.00046914310677600204, 'samples': 4925760, 'steps': 25654, 'loss/train': 1.3403749465942383} -11/07/2021 00:49:43 - INFO - __main__ - Step 25656: {'lr': 0.00046914055274996017, 'samples': 4925952, 'steps': 25655, 'loss/train': 1.0155887603759766} -11/07/2021 00:49:44 - INFO - __main__ - Step 25657: {'lr': 0.00046913799862517686, 'samples': 4926144, 'steps': 25656, 'loss/train': 0.8465630412101746} -11/07/2021 00:49:44 - INFO - __main__ - Step 25658: {'lr': 0.0004691354444016534, 'samples': 4926336, 'steps': 25657, 'loss/train': 1.2985042333602905} -11/07/2021 00:49:45 - INFO - __main__ - Step 25659: {'lr': 0.00046913289007939087, 'samples': 4926528, 'steps': 25658, 'loss/train': 1.632158875465393} -11/07/2021 00:49:45 - INFO - __main__ - Step 25660: {'lr': 0.00046913033565839046, 'samples': 4926720, 'steps': 25659, 'loss/train': 1.7725186347961426} -11/07/2021 00:49:46 - INFO - __main__ - Step 25661: {'lr': 0.0004691277811386533, 'samples': 4926912, 'steps': 25660, 'loss/train': 1.2652547359466553} -11/07/2021 00:49:46 - INFO - __main__ - Step 25662: {'lr': 0.0004691252265201805, 'samples': 4927104, 'steps': 25661, 'loss/train': 1.4861279726028442} -11/07/2021 00:49:46 - INFO - __main__ - Step 25663: {'lr': 0.00046912267180297337, 'samples': 4927296, 'steps': 25662, 'loss/train': 1.463240385055542} -11/07/2021 00:49:47 - INFO - __main__ - Step 25664: {'lr': 0.0004691201169870328, 'samples': 4927488, 'steps': 25663, 'loss/train': 1.071416974067688} -11/07/2021 00:49:48 - INFO - __main__ - Step 25665: {'lr': 0.00046911756207236024, 'samples': 4927680, 'steps': 25664, 'loss/train': 0.5899576544761658} -11/07/2021 00:49:48 - INFO - __main__ - Step 25666: {'lr': 0.0004691150070589566, 'samples': 4927872, 'steps': 25665, 'loss/train': 1.5438692569732666} -11/07/2021 00:49:49 - INFO - __main__ - Step 25667: {'lr': 0.00046911245194682306, 'samples': 4928064, 'steps': 25666, 'loss/train': 0.9179422855377197} -11/07/2021 00:49:49 - INFO - __main__ - Step 25668: {'lr': 0.00046910989673596093, 'samples': 4928256, 'steps': 25667, 'loss/train': 1.6727534532546997} -11/07/2021 00:49:49 - INFO - __main__ - Step 25669: {'lr': 0.00046910734142637124, 'samples': 4928448, 'steps': 25668, 'loss/train': 1.525063157081604} -11/07/2021 00:49:50 - INFO - __main__ - Step 25670: {'lr': 0.00046910478601805514, 'samples': 4928640, 'steps': 25669, 'loss/train': 5.881829738616943} -11/07/2021 00:49:51 - INFO - __main__ - Step 25671: {'lr': 0.0004691022305110138, 'samples': 4928832, 'steps': 25670, 'loss/train': 1.5334299802780151} -11/07/2021 00:49:51 - INFO - __main__ - Step 25672: {'lr': 0.0004690996749052484, 'samples': 4929024, 'steps': 25671, 'loss/train': 1.8652445077896118} -11/07/2021 00:49:51 - INFO - __main__ - Step 25673: {'lr': 0.00046909711920076, 'samples': 4929216, 'steps': 25672, 'loss/train': 1.9792180061340332} -11/07/2021 00:49:52 - INFO - __main__ - Step 25674: {'lr': 0.0004690945633975499, 'samples': 4929408, 'steps': 25673, 'loss/train': 0.8824723362922668} -11/07/2021 00:49:52 - INFO - __main__ - Step 25675: {'lr': 0.00046909200749561914, 'samples': 4929600, 'steps': 25674, 'loss/train': 1.751390814781189} -11/07/2021 00:49:53 - INFO - __main__ - Step 25676: {'lr': 0.00046908945149496897, 'samples': 4929792, 'steps': 25675, 'loss/train': 1.4224282503128052} -11/07/2021 00:49:53 - INFO - __main__ - Step 25677: {'lr': 0.00046908689539560034, 'samples': 4929984, 'steps': 25676, 'loss/train': 1.8100460767745972} -11/07/2021 00:49:54 - INFO - __main__ - Step 25678: {'lr': 0.0004690843391975146, 'samples': 4930176, 'steps': 25677, 'loss/train': 1.1137361526489258} -11/07/2021 00:49:54 - INFO - __main__ - Step 25679: {'lr': 0.0004690817829007129, 'samples': 4930368, 'steps': 25678, 'loss/train': 1.2293751239776611} -11/07/2021 00:49:55 - INFO - __main__ - Step 25680: {'lr': 0.00046907922650519623, 'samples': 4930560, 'steps': 25679, 'loss/train': 1.0705848932266235} -11/07/2021 00:49:56 - INFO - __main__ - Step 25681: {'lr': 0.0004690766700109659, 'samples': 4930752, 'steps': 25680, 'loss/train': 1.33608877658844} -11/07/2021 00:49:56 - INFO - __main__ - Step 25682: {'lr': 0.00046907411341802295, 'samples': 4930944, 'steps': 25681, 'loss/train': 1.132555603981018} -11/07/2021 00:49:56 - INFO - __main__ - Step 25683: {'lr': 0.0004690715567263687, 'samples': 4931136, 'steps': 25682, 'loss/train': 1.588343858718872} -11/07/2021 00:49:57 - INFO - __main__ - Step 25684: {'lr': 0.00046906899993600406, 'samples': 4931328, 'steps': 25683, 'loss/train': 1.7066028118133545} -11/07/2021 00:49:57 - INFO - __main__ - Step 25685: {'lr': 0.00046906644304693033, 'samples': 4931520, 'steps': 25684, 'loss/train': 1.7568970918655396} -11/07/2021 00:49:58 - INFO - __main__ - Step 25686: {'lr': 0.0004690638860591487, 'samples': 4931712, 'steps': 25685, 'loss/train': 1.4653843641281128} -11/07/2021 00:49:58 - INFO - __main__ - Step 25687: {'lr': 0.00046906132897266026, 'samples': 4931904, 'steps': 25686, 'loss/train': 1.3618601560592651} -11/07/2021 00:49:59 - INFO - __main__ - Step 25688: {'lr': 0.00046905877178746614, 'samples': 4932096, 'steps': 25687, 'loss/train': 1.6840893030166626} -11/07/2021 00:49:59 - INFO - __main__ - Step 25689: {'lr': 0.0004690562145035675, 'samples': 4932288, 'steps': 25688, 'loss/train': 1.1401145458221436} -11/07/2021 00:49:59 - INFO - __main__ - Step 25690: {'lr': 0.00046905365712096553, 'samples': 4932480, 'steps': 25689, 'loss/train': 2.9032070636749268} -11/07/2021 00:50:00 - INFO - __main__ - Step 25691: {'lr': 0.0004690510996396614, 'samples': 4932672, 'steps': 25690, 'loss/train': 2.0789008140563965} -11/07/2021 00:50:01 - INFO - __main__ - Step 25692: {'lr': 0.0004690485420596561, 'samples': 4932864, 'steps': 25691, 'loss/train': 1.3529332876205444} -11/07/2021 00:50:01 - INFO - __main__ - Step 25693: {'lr': 0.000469045984380951, 'samples': 4933056, 'steps': 25692, 'loss/train': 1.932854413986206} -11/07/2021 00:50:02 - INFO - __main__ - Step 25694: {'lr': 0.0004690434266035471, 'samples': 4933248, 'steps': 25693, 'loss/train': 1.516493320465088} -11/07/2021 00:50:02 - INFO - __main__ - Step 25695: {'lr': 0.00046904086872744577, 'samples': 4933440, 'steps': 25694, 'loss/train': 1.5998808145523071} -11/07/2021 00:50:02 - INFO - __main__ - Step 25696: {'lr': 0.0004690383107526479, 'samples': 4933632, 'steps': 25695, 'loss/train': 1.5363796949386597} -11/07/2021 00:50:03 - INFO - __main__ - Step 25697: {'lr': 0.0004690357526791547, 'samples': 4933824, 'steps': 25696, 'loss/train': 1.045938491821289} -11/07/2021 00:50:04 - INFO - __main__ - Step 25698: {'lr': 0.00046903319450696744, 'samples': 4934016, 'steps': 25697, 'loss/train': 1.6437040567398071} -11/07/2021 00:50:04 - INFO - __main__ - Step 25699: {'lr': 0.00046903063623608714, 'samples': 4934208, 'steps': 25698, 'loss/train': 1.6086574792861938} -11/07/2021 00:50:04 - INFO - __main__ - Step 25700: {'lr': 0.00046902807786651507, 'samples': 4934400, 'steps': 25699, 'loss/train': 1.112980604171753} -11/07/2021 00:50:05 - INFO - __main__ - Step 25701: {'lr': 0.00046902551939825236, 'samples': 4934592, 'steps': 25700, 'loss/train': 1.9607683420181274} -11/07/2021 00:50:06 - INFO - __main__ - Step 25702: {'lr': 0.00046902296083130003, 'samples': 4934784, 'steps': 25701, 'loss/train': 1.5503727197647095} -11/07/2021 00:50:06 - INFO - __main__ - Step 25703: {'lr': 0.00046902040216565945, 'samples': 4934976, 'steps': 25702, 'loss/train': 2.105358362197876} -11/07/2021 00:50:06 - INFO - __main__ - Step 25704: {'lr': 0.0004690178434013316, 'samples': 4935168, 'steps': 25703, 'loss/train': 1.0405181646347046} -11/07/2021 00:50:07 - INFO - __main__ - Step 25705: {'lr': 0.00046901528453831764, 'samples': 4935360, 'steps': 25704, 'loss/train': 1.5190848112106323} -11/07/2021 00:50:07 - INFO - __main__ - Step 25706: {'lr': 0.0004690127255766188, 'samples': 4935552, 'steps': 25705, 'loss/train': 1.511635661125183} -11/07/2021 00:50:08 - INFO - __main__ - Step 25707: {'lr': 0.0004690101665162362, 'samples': 4935744, 'steps': 25706, 'loss/train': 1.6795202493667603} -11/07/2021 00:50:09 - INFO - __main__ - Step 25708: {'lr': 0.00046900760735717103, 'samples': 4935936, 'steps': 25707, 'loss/train': 1.828741192817688} -11/07/2021 00:50:09 - INFO - __main__ - Step 25709: {'lr': 0.00046900504809942433, 'samples': 4936128, 'steps': 25708, 'loss/train': 0.857280969619751} -11/07/2021 00:50:09 - INFO - __main__ - Step 25710: {'lr': 0.00046900248874299746, 'samples': 4936320, 'steps': 25709, 'loss/train': 1.425267219543457} -11/07/2021 00:50:10 - INFO - __main__ - Step 25711: {'lr': 0.0004689999292878914, 'samples': 4936512, 'steps': 25710, 'loss/train': 0.9910033345222473} -11/07/2021 00:50:11 - INFO - __main__ - Step 25712: {'lr': 0.00046899736973410734, 'samples': 4936704, 'steps': 25711, 'loss/train': 1.9840439558029175} -11/07/2021 00:50:11 - INFO - __main__ - Step 25713: {'lr': 0.0004689948100816465, 'samples': 4936896, 'steps': 25712, 'loss/train': 1.0799232721328735} -11/07/2021 00:50:11 - INFO - __main__ - Step 25714: {'lr': 0.00046899225033050985, 'samples': 4937088, 'steps': 25713, 'loss/train': 1.4242122173309326} -11/07/2021 00:50:12 - INFO - __main__ - Step 25715: {'lr': 0.0004689896904806987, 'samples': 4937280, 'steps': 25714, 'loss/train': 1.2976279258728027} -11/07/2021 00:50:12 - INFO - __main__ - Step 25716: {'lr': 0.0004689871305322143, 'samples': 4937472, 'steps': 25715, 'loss/train': 1.7055093050003052} -11/07/2021 00:50:13 - INFO - __main__ - Step 25717: {'lr': 0.0004689845704850576, 'samples': 4937664, 'steps': 25716, 'loss/train': 1.5551862716674805} -11/07/2021 00:50:13 - INFO - __main__ - Step 25718: {'lr': 0.0004689820103392298, 'samples': 4937856, 'steps': 25717, 'loss/train': 1.6573007106781006} -11/07/2021 00:50:14 - INFO - __main__ - Step 25719: {'lr': 0.0004689794500947321, 'samples': 4938048, 'steps': 25718, 'loss/train': 1.3254516124725342} -11/07/2021 00:50:14 - INFO - __main__ - Step 25720: {'lr': 0.0004689768897515657, 'samples': 4938240, 'steps': 25719, 'loss/train': 1.4422892332077026} -11/07/2021 00:50:15 - INFO - __main__ - Step 25721: {'lr': 0.0004689743293097316, 'samples': 4938432, 'steps': 25720, 'loss/train': 1.3288673162460327} -11/07/2021 00:50:16 - INFO - __main__ - Step 25722: {'lr': 0.0004689717687692311, 'samples': 4938624, 'steps': 25721, 'loss/train': 1.748436689376831} -11/07/2021 00:50:16 - INFO - __main__ - Step 25723: {'lr': 0.0004689692081300653, 'samples': 4938816, 'steps': 25722, 'loss/train': 1.3790818452835083} -11/07/2021 00:50:16 - INFO - __main__ - Step 25724: {'lr': 0.0004689666473922354, 'samples': 4939008, 'steps': 25723, 'loss/train': 1.511187195777893} -11/07/2021 00:50:17 - INFO - __main__ - Step 25725: {'lr': 0.0004689640865557424, 'samples': 4939200, 'steps': 25724, 'loss/train': 1.4920438528060913} -11/07/2021 00:50:17 - INFO - __main__ - Step 25726: {'lr': 0.0004689615256205876, 'samples': 4939392, 'steps': 25725, 'loss/train': 1.3425120115280151} -11/07/2021 00:50:17 - INFO - __main__ - Step 25727: {'lr': 0.0004689589645867721, 'samples': 4939584, 'steps': 25726, 'loss/train': 1.7583677768707275} -11/07/2021 00:50:18 - INFO - __main__ - Step 25728: {'lr': 0.0004689564034542971, 'samples': 4939776, 'steps': 25727, 'loss/train': 1.1632046699523926} -11/07/2021 00:50:19 - INFO - __main__ - Step 25729: {'lr': 0.00046895384222316375, 'samples': 4939968, 'steps': 25728, 'loss/train': 1.4341073036193848} -11/07/2021 00:50:19 - INFO - __main__ - Step 25730: {'lr': 0.0004689512808933731, 'samples': 4940160, 'steps': 25729, 'loss/train': 1.5172381401062012} -11/07/2021 00:50:19 - INFO - __main__ - Step 25731: {'lr': 0.0004689487194649265, 'samples': 4940352, 'steps': 25730, 'loss/train': 1.843948245048523} -11/07/2021 00:50:20 - INFO - __main__ - Step 25732: {'lr': 0.0004689461579378249, 'samples': 4940544, 'steps': 25731, 'loss/train': 1.2686885595321655} -11/07/2021 00:50:21 - INFO - __main__ - Step 25733: {'lr': 0.0004689435963120696, 'samples': 4940736, 'steps': 25732, 'loss/train': 0.15897658467292786} -11/07/2021 00:50:21 - INFO - __main__ - Step 25734: {'lr': 0.00046894103458766163, 'samples': 4940928, 'steps': 25733, 'loss/train': 1.826562523841858} -11/07/2021 00:50:22 - INFO - __main__ - Step 25735: {'lr': 0.0004689384727646022, 'samples': 4941120, 'steps': 25734, 'loss/train': 1.2627410888671875} -11/07/2021 00:50:22 - INFO - __main__ - Step 25736: {'lr': 0.00046893591084289256, 'samples': 4941312, 'steps': 25735, 'loss/train': 1.6012457609176636} -11/07/2021 00:50:22 - INFO - __main__ - Step 25737: {'lr': 0.0004689333488225337, 'samples': 4941504, 'steps': 25736, 'loss/train': 1.6334772109985352} -11/07/2021 00:50:23 - INFO - __main__ - Step 25738: {'lr': 0.00046893078670352686, 'samples': 4941696, 'steps': 25737, 'loss/train': 0.9714683294296265} -11/07/2021 00:50:24 - INFO - __main__ - Step 25739: {'lr': 0.0004689282244858732, 'samples': 4941888, 'steps': 25738, 'loss/train': 1.7057424783706665} -11/07/2021 00:50:24 - INFO - __main__ - Step 25740: {'lr': 0.00046892566216957387, 'samples': 4942080, 'steps': 25739, 'loss/train': 1.7884376049041748} -11/07/2021 00:50:24 - INFO - __main__ - Step 25741: {'lr': 0.00046892309975463, 'samples': 4942272, 'steps': 25740, 'loss/train': 1.3078798055648804} -11/07/2021 00:50:25 - INFO - __main__ - Step 25742: {'lr': 0.0004689205372410427, 'samples': 4942464, 'steps': 25741, 'loss/train': 0.8204142451286316} -11/07/2021 00:50:25 - INFO - __main__ - Step 25743: {'lr': 0.00046891797462881327, 'samples': 4942656, 'steps': 25742, 'loss/train': 1.6207472085952759} -11/07/2021 00:50:27 - INFO - __main__ - Step 25744: {'lr': 0.0004689154119179427, 'samples': 4942848, 'steps': 25743, 'loss/train': 0.8706039786338806} -11/07/2021 00:50:27 - INFO - __main__ - Step 25745: {'lr': 0.00046891284910843237, 'samples': 4943040, 'steps': 25744, 'loss/train': 1.7266850471496582} -11/07/2021 00:50:27 - INFO - __main__ - Step 25746: {'lr': 0.0004689102862002832, 'samples': 4943232, 'steps': 25745, 'loss/train': 0.45676106214523315} -11/07/2021 00:50:28 - INFO - __main__ - Step 25747: {'lr': 0.00046890772319349637, 'samples': 4943424, 'steps': 25746, 'loss/train': 0.28906792402267456} -11/07/2021 00:50:28 - INFO - __main__ - Step 25748: {'lr': 0.00046890516008807315, 'samples': 4943616, 'steps': 25747, 'loss/train': 1.7977261543273926} -11/07/2021 00:50:30 - INFO - __main__ - Step 25749: {'lr': 0.0004689025968840147, 'samples': 4943808, 'steps': 25748, 'loss/train': 1.4963880777359009} -11/07/2021 00:50:30 - INFO - __main__ - Step 25750: {'lr': 0.00046890003358132204, 'samples': 4944000, 'steps': 25749, 'loss/train': 1.0647135972976685} -11/07/2021 00:50:30 - INFO - __main__ - Step 25751: {'lr': 0.0004688974701799964, 'samples': 4944192, 'steps': 25750, 'loss/train': 1.5756062269210815} -11/07/2021 00:50:31 - INFO - __main__ - Step 25752: {'lr': 0.00046889490668003896, 'samples': 4944384, 'steps': 25751, 'loss/train': 1.8758376836776733} -11/07/2021 00:50:31 - INFO - __main__ - Step 25753: {'lr': 0.0004688923430814509, 'samples': 4944576, 'steps': 25752, 'loss/train': 1.2992342710494995} -11/07/2021 00:50:31 - INFO - __main__ - Step 25754: {'lr': 0.00046888977938423326, 'samples': 4944768, 'steps': 25753, 'loss/train': 1.5431861877441406} -11/07/2021 00:50:33 - INFO - __main__ - Step 25755: {'lr': 0.00046888721558838734, 'samples': 4944960, 'steps': 25754, 'loss/train': 1.9197421073913574} -11/07/2021 00:50:33 - INFO - __main__ - Step 25756: {'lr': 0.00046888465169391414, 'samples': 4945152, 'steps': 25755, 'loss/train': 1.1083108186721802} -11/07/2021 00:50:33 - INFO - __main__ - Step 25757: {'lr': 0.00046888208770081493, 'samples': 4945344, 'steps': 25756, 'loss/train': 1.2790623903274536} -11/07/2021 00:50:34 - INFO - __main__ - Step 25758: {'lr': 0.0004688795236090908, 'samples': 4945536, 'steps': 25757, 'loss/train': 1.6210299730300903} -11/07/2021 00:50:34 - INFO - __main__ - Step 25759: {'lr': 0.000468876959418743, 'samples': 4945728, 'steps': 25758, 'loss/train': 1.7421590089797974} -11/07/2021 00:50:35 - INFO - __main__ - Step 25760: {'lr': 0.0004688743951297726, 'samples': 4945920, 'steps': 25759, 'loss/train': 1.5871471166610718} -11/07/2021 00:50:35 - INFO - __main__ - Step 25761: {'lr': 0.0004688718307421807, 'samples': 4946112, 'steps': 25760, 'loss/train': 1.4662115573883057} -11/07/2021 00:50:36 - INFO - __main__ - Step 25762: {'lr': 0.0004688692662559686, 'samples': 4946304, 'steps': 25761, 'loss/train': 1.6176438331604004} -11/07/2021 00:50:36 - INFO - __main__ - Step 25763: {'lr': 0.00046886670167113734, 'samples': 4946496, 'steps': 25762, 'loss/train': 1.8013571500778198} -11/07/2021 00:50:36 - INFO - __main__ - Step 25764: {'lr': 0.00046886413698768816, 'samples': 4946688, 'steps': 25763, 'loss/train': 1.3539690971374512} -11/07/2021 00:50:38 - INFO - __main__ - Step 25765: {'lr': 0.0004688615722056222, 'samples': 4946880, 'steps': 25764, 'loss/train': 1.3331290483474731} -11/07/2021 00:50:38 - INFO - __main__ - Step 25766: {'lr': 0.00046885900732494053, 'samples': 4947072, 'steps': 25765, 'loss/train': 1.4751242399215698} -11/07/2021 00:50:38 - INFO - __main__ - Step 25767: {'lr': 0.0004688564423456444, 'samples': 4947264, 'steps': 25766, 'loss/train': 1.634786605834961} -11/07/2021 00:50:39 - INFO - __main__ - Step 25768: {'lr': 0.00046885387726773494, 'samples': 4947456, 'steps': 25767, 'loss/train': 0.9453241229057312} -11/07/2021 00:50:39 - INFO - __main__ - Step 25769: {'lr': 0.0004688513120912133, 'samples': 4947648, 'steps': 25768, 'loss/train': 2.193246364593506} -11/07/2021 00:50:40 - INFO - __main__ - Step 25770: {'lr': 0.0004688487468160806, 'samples': 4947840, 'steps': 25769, 'loss/train': 1.9358593225479126} -11/07/2021 00:50:40 - INFO - __main__ - Step 25771: {'lr': 0.000468846181442338, 'samples': 4948032, 'steps': 25770, 'loss/train': 1.1964941024780273} -11/07/2021 00:50:41 - INFO - __main__ - Step 25772: {'lr': 0.0004688436159699868, 'samples': 4948224, 'steps': 25771, 'loss/train': 1.4133274555206299} -11/07/2021 00:50:41 - INFO - __main__ - Step 25773: {'lr': 0.000468841050399028, 'samples': 4948416, 'steps': 25772, 'loss/train': 1.092087984085083} -11/07/2021 00:50:41 - INFO - __main__ - Step 25774: {'lr': 0.0004688384847294628, 'samples': 4948608, 'steps': 25773, 'loss/train': 2.0307538509368896} -11/07/2021 00:50:42 - INFO - __main__ - Step 25775: {'lr': 0.0004688359189612923, 'samples': 4948800, 'steps': 25774, 'loss/train': 1.6210196018218994} -11/07/2021 00:50:43 - INFO - __main__ - Step 25776: {'lr': 0.0004688333530945178, 'samples': 4948992, 'steps': 25775, 'loss/train': 1.1951122283935547} -11/07/2021 00:50:43 - INFO - __main__ - Step 25777: {'lr': 0.0004688307871291403, 'samples': 4949184, 'steps': 25776, 'loss/train': 1.7040596008300781} -11/07/2021 00:50:44 - INFO - __main__ - Step 25778: {'lr': 0.0004688282210651611, 'samples': 4949376, 'steps': 25777, 'loss/train': 1.745054841041565} -11/07/2021 00:50:44 - INFO - __main__ - Step 25779: {'lr': 0.00046882565490258125, 'samples': 4949568, 'steps': 25778, 'loss/train': 1.9911561012268066} -11/07/2021 00:50:44 - INFO - __main__ - Step 25780: {'lr': 0.0004688230886414019, 'samples': 4949760, 'steps': 25779, 'loss/train': 1.8546158075332642} -11/07/2021 00:50:45 - INFO - __main__ - Step 25781: {'lr': 0.0004688205222816242, 'samples': 4949952, 'steps': 25780, 'loss/train': 1.5687676668167114} -11/07/2021 00:50:46 - INFO - __main__ - Step 25782: {'lr': 0.00046881795582324944, 'samples': 4950144, 'steps': 25781, 'loss/train': 1.6519067287445068} -11/07/2021 00:50:46 - INFO - __main__ - Step 25783: {'lr': 0.00046881538926627864, 'samples': 4950336, 'steps': 25782, 'loss/train': 1.1861686706542969} -11/07/2021 00:50:46 - INFO - __main__ - Step 25784: {'lr': 0.000468812822610713, 'samples': 4950528, 'steps': 25783, 'loss/train': 1.4683573246002197} -11/07/2021 00:50:47 - INFO - __main__ - Step 25785: {'lr': 0.00046881025585655367, 'samples': 4950720, 'steps': 25784, 'loss/train': 1.6115069389343262} -11/07/2021 00:50:48 - INFO - __main__ - Step 25786: {'lr': 0.0004688076890038019, 'samples': 4950912, 'steps': 25785, 'loss/train': 1.5832531452178955} -11/07/2021 00:50:48 - INFO - __main__ - Step 25787: {'lr': 0.00046880512205245867, 'samples': 4951104, 'steps': 25786, 'loss/train': 1.3586066961288452} -11/07/2021 00:50:48 - INFO - __main__ - Step 25788: {'lr': 0.00046880255500252526, 'samples': 4951296, 'steps': 25787, 'loss/train': 1.8434799909591675} -11/07/2021 00:50:49 - INFO - __main__ - Step 25789: {'lr': 0.0004687999878540028, 'samples': 4951488, 'steps': 25788, 'loss/train': 1.8325769901275635} -11/07/2021 00:50:49 - INFO - __main__ - Step 25790: {'lr': 0.00046879742060689243, 'samples': 4951680, 'steps': 25789, 'loss/train': 1.702770709991455} -11/07/2021 00:50:50 - INFO - __main__ - Step 25791: {'lr': 0.0004687948532611953, 'samples': 4951872, 'steps': 25790, 'loss/train': 1.678737998008728} -11/07/2021 00:50:51 - INFO - __main__ - Step 25792: {'lr': 0.0004687922858169126, 'samples': 4952064, 'steps': 25791, 'loss/train': 1.7778791189193726} -11/07/2021 00:50:51 - INFO - __main__ - Step 25793: {'lr': 0.0004687897182740455, 'samples': 4952256, 'steps': 25792, 'loss/train': 1.9369837045669556} -11/07/2021 00:50:51 - INFO - __main__ - Step 25794: {'lr': 0.0004687871506325951, 'samples': 4952448, 'steps': 25793, 'loss/train': 1.0146952867507935} -11/07/2021 00:50:52 - INFO - __main__ - Step 25795: {'lr': 0.00046878458289256264, 'samples': 4952640, 'steps': 25794, 'loss/train': 1.5751017332077026} -11/07/2021 00:50:53 - INFO - __main__ - Step 25796: {'lr': 0.00046878201505394913, 'samples': 4952832, 'steps': 25795, 'loss/train': 1.5337727069854736} -11/07/2021 00:50:53 - INFO - __main__ - Step 25797: {'lr': 0.0004687794471167559, 'samples': 4953024, 'steps': 25796, 'loss/train': 1.672663927078247} -11/07/2021 00:50:53 - INFO - __main__ - Step 25798: {'lr': 0.00046877687908098396, 'samples': 4953216, 'steps': 25797, 'loss/train': 1.6757265329360962} -11/07/2021 00:50:54 - INFO - __main__ - Step 25799: {'lr': 0.0004687743109466346, 'samples': 4953408, 'steps': 25798, 'loss/train': 1.7293604612350464} -11/07/2021 00:50:54 - INFO - __main__ - Step 25800: {'lr': 0.00046877174271370894, 'samples': 4953600, 'steps': 25799, 'loss/train': 1.3573501110076904} -11/07/2021 00:50:55 - INFO - __main__ - Step 25801: {'lr': 0.000468769174382208, 'samples': 4953792, 'steps': 25800, 'loss/train': 1.5040295124053955} -11/07/2021 00:50:56 - INFO - __main__ - Step 25802: {'lr': 0.0004687666059521331, 'samples': 4953984, 'steps': 25801, 'loss/train': 1.2513548135757446} -11/07/2021 00:50:56 - INFO - __main__ - Step 25803: {'lr': 0.0004687640374234854, 'samples': 4954176, 'steps': 25802, 'loss/train': 0.8608061075210571} -11/07/2021 00:50:56 - INFO - __main__ - Step 25804: {'lr': 0.0004687614687962659, 'samples': 4954368, 'steps': 25803, 'loss/train': 1.5000717639923096} -11/07/2021 00:50:57 - INFO - __main__ - Step 25805: {'lr': 0.0004687589000704759, 'samples': 4954560, 'steps': 25804, 'loss/train': 1.4666575193405151} -11/07/2021 00:50:57 - INFO - __main__ - Step 25806: {'lr': 0.0004687563312461165, 'samples': 4954752, 'steps': 25805, 'loss/train': 1.379432201385498} -11/07/2021 00:50:58 - INFO - __main__ - Step 25807: {'lr': 0.00046875376232318887, 'samples': 4954944, 'steps': 25806, 'loss/train': 0.6750864386558533} -11/07/2021 00:50:59 - INFO - __main__ - Step 25808: {'lr': 0.00046875119330169426, 'samples': 4955136, 'steps': 25807, 'loss/train': 1.6305607557296753} -11/07/2021 00:50:59 - INFO - __main__ - Step 25809: {'lr': 0.00046874862418163363, 'samples': 4955328, 'steps': 25808, 'loss/train': 1.6389553546905518} -11/07/2021 00:50:59 - INFO - __main__ - Step 25810: {'lr': 0.00046874605496300824, 'samples': 4955520, 'steps': 25809, 'loss/train': 1.5285234451293945} -11/07/2021 00:51:00 - INFO - __main__ - Step 25811: {'lr': 0.00046874348564581933, 'samples': 4955712, 'steps': 25810, 'loss/train': 1.624723196029663} -11/07/2021 00:51:00 - INFO - __main__ - Step 25812: {'lr': 0.00046874091623006793, 'samples': 4955904, 'steps': 25811, 'loss/train': 1.0928027629852295} -11/07/2021 00:51:01 - INFO - __main__ - Step 25813: {'lr': 0.0004687383467157553, 'samples': 4956096, 'steps': 25812, 'loss/train': 1.514067530632019} -11/07/2021 00:51:01 - INFO - __main__ - Step 25814: {'lr': 0.0004687357771028825, 'samples': 4956288, 'steps': 25813, 'loss/train': 0.9820759296417236} -11/07/2021 00:51:02 - INFO - __main__ - Step 25815: {'lr': 0.00046873320739145073, 'samples': 4956480, 'steps': 25814, 'loss/train': 1.932958722114563} -11/07/2021 00:51:02 - INFO - __main__ - Step 25816: {'lr': 0.0004687306375814612, 'samples': 4956672, 'steps': 25815, 'loss/train': 1.3385789394378662} -11/07/2021 00:51:02 - INFO - __main__ - Step 25817: {'lr': 0.000468728067672915, 'samples': 4956864, 'steps': 25816, 'loss/train': 1.031846284866333} -11/07/2021 00:51:03 - INFO - __main__ - Step 25818: {'lr': 0.00046872549766581326, 'samples': 4957056, 'steps': 25817, 'loss/train': 1.293784737586975} -11/07/2021 00:51:04 - INFO - __main__ - Step 25819: {'lr': 0.00046872292756015724, 'samples': 4957248, 'steps': 25818, 'loss/train': 1.3724759817123413} -11/07/2021 00:51:04 - INFO - __main__ - Step 25820: {'lr': 0.000468720357355948, 'samples': 4957440, 'steps': 25819, 'loss/train': 1.1009554862976074} -11/07/2021 00:51:04 - INFO - __main__ - Step 25821: {'lr': 0.00046871778705318673, 'samples': 4957632, 'steps': 25820, 'loss/train': 1.3064281940460205} -11/07/2021 00:51:05 - INFO - __main__ - Step 25822: {'lr': 0.0004687152166518747, 'samples': 4957824, 'steps': 25821, 'loss/train': 1.665042757987976} -11/07/2021 00:51:06 - INFO - __main__ - Step 25823: {'lr': 0.0004687126461520128, 'samples': 4958016, 'steps': 25822, 'loss/train': 1.5745177268981934} -11/07/2021 00:51:06 - INFO - __main__ - Step 25824: {'lr': 0.0004687100755536025, 'samples': 4958208, 'steps': 25823, 'loss/train': 1.9364532232284546} -11/07/2021 00:51:07 - INFO - __main__ - Step 25825: {'lr': 0.00046870750485664484, 'samples': 4958400, 'steps': 25824, 'loss/train': 1.2087626457214355} -11/07/2021 00:51:07 - INFO - __main__ - Step 25826: {'lr': 0.00046870493406114084, 'samples': 4958592, 'steps': 25825, 'loss/train': 1.2004915475845337} -11/07/2021 00:51:07 - INFO - __main__ - Step 25827: {'lr': 0.0004687023631670918, 'samples': 4958784, 'steps': 25826, 'loss/train': 1.7887715101242065} -11/07/2021 00:51:08 - INFO - __main__ - Step 25828: {'lr': 0.0004686997921744989, 'samples': 4958976, 'steps': 25827, 'loss/train': 1.3411016464233398} -11/07/2021 00:51:09 - INFO - __main__ - Step 25829: {'lr': 0.0004686972210833632, 'samples': 4959168, 'steps': 25828, 'loss/train': 1.493360996246338} -11/07/2021 00:51:09 - INFO - __main__ - Step 25830: {'lr': 0.0004686946498936859, 'samples': 4959360, 'steps': 25829, 'loss/train': 1.9060460329055786} -11/07/2021 00:51:09 - INFO - __main__ - Step 25831: {'lr': 0.00046869207860546826, 'samples': 4959552, 'steps': 25830, 'loss/train': 1.3489595651626587} -11/07/2021 00:51:10 - INFO - __main__ - Step 25832: {'lr': 0.00046868950721871126, 'samples': 4959744, 'steps': 25831, 'loss/train': 1.4942917823791504} -11/07/2021 00:51:10 - INFO - __main__ - Step 25833: {'lr': 0.00046868693573341616, 'samples': 4959936, 'steps': 25832, 'loss/train': 1.5614725351333618} -11/07/2021 00:51:11 - INFO - __main__ - Step 25834: {'lr': 0.00046868436414958405, 'samples': 4960128, 'steps': 25833, 'loss/train': 1.7506455183029175} -11/07/2021 00:51:12 - INFO - __main__ - Step 25835: {'lr': 0.00046868179246721623, 'samples': 4960320, 'steps': 25834, 'loss/train': 1.282240390777588} -11/07/2021 00:51:12 - INFO - __main__ - Step 25836: {'lr': 0.00046867922068631374, 'samples': 4960512, 'steps': 25835, 'loss/train': 1.5849071741104126} -11/07/2021 00:51:12 - INFO - __main__ - Step 25837: {'lr': 0.00046867664880687775, 'samples': 4960704, 'steps': 25836, 'loss/train': 2.374248743057251} -11/07/2021 00:51:13 - INFO - __main__ - Step 25838: {'lr': 0.00046867407682890937, 'samples': 4960896, 'steps': 25837, 'loss/train': 1.8533856868743896} -11/07/2021 00:51:14 - INFO - __main__ - Step 25839: {'lr': 0.00046867150475240994, 'samples': 4961088, 'steps': 25838, 'loss/train': 1.5554496049880981} -11/07/2021 00:51:14 - INFO - __main__ - Step 25840: {'lr': 0.0004686689325773805, 'samples': 4961280, 'steps': 25839, 'loss/train': 1.4998165369033813} -11/07/2021 00:51:14 - INFO - __main__ - Step 25841: {'lr': 0.00046866636030382217, 'samples': 4961472, 'steps': 25840, 'loss/train': 1.7674634456634521} -11/07/2021 00:51:15 - INFO - __main__ - Step 25842: {'lr': 0.00046866378793173616, 'samples': 4961664, 'steps': 25841, 'loss/train': 1.5353429317474365} -11/07/2021 00:51:15 - INFO - __main__ - Step 25843: {'lr': 0.0004686612154611236, 'samples': 4961856, 'steps': 25842, 'loss/train': 2.041708469390869} -11/07/2021 00:51:16 - INFO - __main__ - Step 25844: {'lr': 0.0004686586428919857, 'samples': 4962048, 'steps': 25843, 'loss/train': 1.6728260517120361} -11/07/2021 00:51:16 - INFO - __main__ - Step 25845: {'lr': 0.00046865607022432356, 'samples': 4962240, 'steps': 25844, 'loss/train': 1.5199110507965088} -11/07/2021 00:51:17 - INFO - __main__ - Step 25846: {'lr': 0.00046865349745813835, 'samples': 4962432, 'steps': 25845, 'loss/train': 0.546825110912323} -11/07/2021 00:51:17 - INFO - __main__ - Step 25847: {'lr': 0.00046865092459343126, 'samples': 4962624, 'steps': 25846, 'loss/train': 1.6953691244125366} -11/07/2021 00:51:17 - INFO - __main__ - Step 25848: {'lr': 0.00046864835163020353, 'samples': 4962816, 'steps': 25847, 'loss/train': 1.7198363542556763} -11/07/2021 00:51:19 - INFO - __main__ - Step 25849: {'lr': 0.00046864577856845613, 'samples': 4963008, 'steps': 25848, 'loss/train': 1.6675834655761719} -11/07/2021 00:51:19 - INFO - __main__ - Step 25850: {'lr': 0.0004686432054081904, 'samples': 4963200, 'steps': 25849, 'loss/train': 1.765515685081482} -11/07/2021 00:51:19 - INFO - __main__ - Step 25851: {'lr': 0.00046864063214940735, 'samples': 4963392, 'steps': 25850, 'loss/train': 1.7096325159072876} -11/07/2021 00:51:20 - INFO - __main__ - Step 25852: {'lr': 0.0004686380587921082, 'samples': 4963584, 'steps': 25851, 'loss/train': 1.2849268913269043} -11/07/2021 00:51:20 - INFO - __main__ - Step 25853: {'lr': 0.00046863548533629406, 'samples': 4963776, 'steps': 25852, 'loss/train': 1.6374523639678955} -11/07/2021 00:51:21 - INFO - __main__ - Step 25854: {'lr': 0.00046863291178196625, 'samples': 4963968, 'steps': 25853, 'loss/train': 1.1156255006790161} -11/07/2021 00:51:21 - INFO - __main__ - Step 25855: {'lr': 0.0004686303381291258, 'samples': 4964160, 'steps': 25854, 'loss/train': 0.7119954228401184} -11/07/2021 00:51:22 - INFO - __main__ - Step 25856: {'lr': 0.00046862776437777386, 'samples': 4964352, 'steps': 25855, 'loss/train': 1.733963131904602} -11/07/2021 00:51:22 - INFO - __main__ - Step 25857: {'lr': 0.00046862519052791166, 'samples': 4964544, 'steps': 25856, 'loss/train': 1.4181243181228638} -11/07/2021 00:51:22 - INFO - __main__ - Step 25858: {'lr': 0.00046862261657954033, 'samples': 4964736, 'steps': 25857, 'loss/train': 1.3477070331573486} -11/07/2021 00:51:23 - INFO - __main__ - Step 25859: {'lr': 0.000468620042532661, 'samples': 4964928, 'steps': 25858, 'loss/train': 1.6740336418151855} -11/07/2021 00:51:24 - INFO - __main__ - Step 25860: {'lr': 0.0004686174683872748, 'samples': 4965120, 'steps': 25859, 'loss/train': 1.1245931386947632} -11/07/2021 00:51:24 - INFO - __main__ - Step 25861: {'lr': 0.00046861489414338304, 'samples': 4965312, 'steps': 25860, 'loss/train': 1.3914529085159302} -11/07/2021 00:51:24 - INFO - __main__ - Step 25862: {'lr': 0.0004686123198009867, 'samples': 4965504, 'steps': 25861, 'loss/train': 1.3693437576293945} -11/07/2021 00:51:25 - INFO - __main__ - Step 25863: {'lr': 0.00046860974536008706, 'samples': 4965696, 'steps': 25862, 'loss/train': 3.1253714561462402} -11/07/2021 00:51:25 - INFO - __main__ - Step 25864: {'lr': 0.0004686071708206853, 'samples': 4965888, 'steps': 25863, 'loss/train': 1.4004058837890625} -11/07/2021 00:51:26 - INFO - __main__ - Step 25865: {'lr': 0.0004686045961827824, 'samples': 4966080, 'steps': 25864, 'loss/train': 1.5016511678695679} -11/07/2021 00:51:26 - INFO - __main__ - Step 25866: {'lr': 0.00046860202144637976, 'samples': 4966272, 'steps': 25865, 'loss/train': 1.7874298095703125} -11/07/2021 00:51:27 - INFO - __main__ - Step 25867: {'lr': 0.00046859944661147837, 'samples': 4966464, 'steps': 25866, 'loss/train': 1.6364786624908447} -11/07/2021 00:51:27 - INFO - __main__ - Step 25868: {'lr': 0.00046859687167807943, 'samples': 4966656, 'steps': 25867, 'loss/train': 1.4097360372543335} -11/07/2021 00:51:28 - INFO - __main__ - Step 25869: {'lr': 0.0004685942966461841, 'samples': 4966848, 'steps': 25868, 'loss/train': 1.6922928094863892} -11/07/2021 00:51:29 - INFO - __main__ - Step 25870: {'lr': 0.00046859172151579354, 'samples': 4967040, 'steps': 25869, 'loss/train': 1.5949517488479614} -11/07/2021 00:51:29 - INFO - __main__ - Step 25871: {'lr': 0.00046858914628690896, 'samples': 4967232, 'steps': 25870, 'loss/train': 1.5514227151870728} -11/07/2021 00:51:29 - INFO - __main__ - Step 25872: {'lr': 0.0004685865709595315, 'samples': 4967424, 'steps': 25871, 'loss/train': 1.4934883117675781} -11/07/2021 00:51:30 - INFO - __main__ - Step 25873: {'lr': 0.00046858399553366224, 'samples': 4967616, 'steps': 25872, 'loss/train': 1.4775656461715698} -11/07/2021 00:51:30 - INFO - __main__ - Step 25874: {'lr': 0.0004685814200093025, 'samples': 4967808, 'steps': 25873, 'loss/train': 1.5905988216400146} -11/07/2021 00:51:31 - INFO - __main__ - Step 25875: {'lr': 0.00046857884438645327, 'samples': 4968000, 'steps': 25874, 'loss/train': 1.4419405460357666} -11/07/2021 00:51:31 - INFO - __main__ - Step 25876: {'lr': 0.0004685762686651158, 'samples': 4968192, 'steps': 25875, 'loss/train': 1.5453418493270874} -11/07/2021 00:51:32 - INFO - __main__ - Step 25877: {'lr': 0.0004685736928452913, 'samples': 4968384, 'steps': 25876, 'loss/train': 1.4005645513534546} -11/07/2021 00:51:32 - INFO - __main__ - Step 25878: {'lr': 0.00046857111692698083, 'samples': 4968576, 'steps': 25877, 'loss/train': 1.641775131225586} -11/07/2021 00:51:32 - INFO - __main__ - Step 25879: {'lr': 0.0004685685409101855, 'samples': 4968768, 'steps': 25878, 'loss/train': 1.3810776472091675} -11/07/2021 00:51:33 - INFO - __main__ - Step 25880: {'lr': 0.00046856596479490667, 'samples': 4968960, 'steps': 25879, 'loss/train': 1.6162208318710327} -11/07/2021 00:51:34 - INFO - __main__ - Step 25881: {'lr': 0.0004685633885811453, 'samples': 4969152, 'steps': 25880, 'loss/train': 1.7117780447006226} -11/07/2021 00:51:34 - INFO - __main__ - Step 25882: {'lr': 0.0004685608122689027, 'samples': 4969344, 'steps': 25881, 'loss/train': 1.4712426662445068} -11/07/2021 00:51:34 - INFO - __main__ - Step 25883: {'lr': 0.00046855823585818004, 'samples': 4969536, 'steps': 25882, 'loss/train': 0.21515725553035736} -11/07/2021 00:51:35 - INFO - __main__ - Step 25884: {'lr': 0.0004685556593489783, 'samples': 4969728, 'steps': 25883, 'loss/train': 1.5416388511657715} -11/07/2021 00:51:36 - INFO - __main__ - Step 25885: {'lr': 0.0004685530827412988, 'samples': 4969920, 'steps': 25884, 'loss/train': 1.395815372467041} -11/07/2021 00:51:36 - INFO - __main__ - Step 25886: {'lr': 0.0004685505060351426, 'samples': 4970112, 'steps': 25885, 'loss/train': 1.784235954284668} -11/07/2021 00:51:37 - INFO - __main__ - Step 25887: {'lr': 0.00046854792923051094, 'samples': 4970304, 'steps': 25886, 'loss/train': 0.9251062870025635} -11/07/2021 00:51:37 - INFO - __main__ - Step 25888: {'lr': 0.00046854535232740505, 'samples': 4970496, 'steps': 25887, 'loss/train': 1.6409744024276733} -11/07/2021 00:51:37 - INFO - __main__ - Step 25889: {'lr': 0.00046854277532582585, 'samples': 4970688, 'steps': 25888, 'loss/train': 1.5012282133102417} -11/07/2021 00:51:38 - INFO - __main__ - Step 25890: {'lr': 0.0004685401982257747, 'samples': 4970880, 'steps': 25889, 'loss/train': 1.4797322750091553} -11/07/2021 00:51:39 - INFO - __main__ - Step 25891: {'lr': 0.0004685376210272527, 'samples': 4971072, 'steps': 25890, 'loss/train': 1.2445049285888672} -11/07/2021 00:51:39 - INFO - __main__ - Step 25892: {'lr': 0.00046853504373026107, 'samples': 4971264, 'steps': 25891, 'loss/train': 1.618612289428711} -11/07/2021 00:51:40 - INFO - __main__ - Step 25893: {'lr': 0.00046853246633480087, 'samples': 4971456, 'steps': 25892, 'loss/train': 0.987562358379364} -11/07/2021 00:51:40 - INFO - __main__ - Step 25894: {'lr': 0.0004685298888408733, 'samples': 4971648, 'steps': 25893, 'loss/train': 1.8932851552963257} -11/07/2021 00:51:40 - INFO - __main__ - Step 25895: {'lr': 0.0004685273112484796, 'samples': 4971840, 'steps': 25894, 'loss/train': 1.9858580827713013} -11/07/2021 00:51:41 - INFO - __main__ - Step 25896: {'lr': 0.0004685247335576209, 'samples': 4972032, 'steps': 25895, 'loss/train': 0.9556924104690552} -11/07/2021 00:51:42 - INFO - __main__ - Step 25897: {'lr': 0.00046852215576829824, 'samples': 4972224, 'steps': 25896, 'loss/train': 1.6164839267730713} -11/07/2021 00:51:42 - INFO - __main__ - Step 25898: {'lr': 0.0004685195778805129, 'samples': 4972416, 'steps': 25897, 'loss/train': 1.8304446935653687} -11/07/2021 00:51:42 - INFO - __main__ - Step 25899: {'lr': 0.000468516999894266, 'samples': 4972608, 'steps': 25898, 'loss/train': 1.8032854795455933} -11/07/2021 00:51:43 - INFO - __main__ - Step 25900: {'lr': 0.0004685144218095587, 'samples': 4972800, 'steps': 25899, 'loss/train': 1.3517341613769531} -11/07/2021 00:51:44 - INFO - __main__ - Step 25901: {'lr': 0.00046851184362639223, 'samples': 4972992, 'steps': 25900, 'loss/train': 1.5504690408706665} -11/07/2021 00:51:44 - INFO - __main__ - Step 25902: {'lr': 0.0004685092653447676, 'samples': 4973184, 'steps': 25901, 'loss/train': 1.3224358558654785} -11/07/2021 00:51:45 - INFO - __main__ - Step 25903: {'lr': 0.00046850668696468614, 'samples': 4973376, 'steps': 25902, 'loss/train': 1.6287102699279785} -11/07/2021 00:51:45 - INFO - __main__ - Step 25904: {'lr': 0.0004685041084861489, 'samples': 4973568, 'steps': 25903, 'loss/train': 1.6833339929580688} -11/07/2021 00:51:45 - INFO - __main__ - Step 25905: {'lr': 0.00046850152990915705, 'samples': 4973760, 'steps': 25904, 'loss/train': 1.308502435684204} -11/07/2021 00:51:46 - INFO - __main__ - Step 25906: {'lr': 0.0004684989512337119, 'samples': 4973952, 'steps': 25905, 'loss/train': 1.5645153522491455} -11/07/2021 00:51:47 - INFO - __main__ - Step 25907: {'lr': 0.00046849637245981434, 'samples': 4974144, 'steps': 25906, 'loss/train': 0.9965031147003174} -11/07/2021 00:51:47 - INFO - __main__ - Step 25908: {'lr': 0.0004684937935874658, 'samples': 4974336, 'steps': 25907, 'loss/train': 1.4623723030090332} -11/07/2021 00:51:47 - INFO - __main__ - Step 25909: {'lr': 0.00046849121461666734, 'samples': 4974528, 'steps': 25908, 'loss/train': 1.144979476928711} -11/07/2021 00:51:48 - INFO - __main__ - Step 25910: {'lr': 0.00046848863554742006, 'samples': 4974720, 'steps': 25909, 'loss/train': 1.27719247341156} -11/07/2021 00:51:49 - INFO - __main__ - Step 25911: {'lr': 0.0004684860563797252, 'samples': 4974912, 'steps': 25910, 'loss/train': 1.6980345249176025} -11/07/2021 00:51:49 - INFO - __main__ - Step 25912: {'lr': 0.00046848347711358384, 'samples': 4975104, 'steps': 25911, 'loss/train': 1.4265433549880981} -11/07/2021 00:51:49 - INFO - __main__ - Step 25913: {'lr': 0.0004684808977489973, 'samples': 4975296, 'steps': 25912, 'loss/train': 1.625329613685608} -11/07/2021 00:51:50 - INFO - __main__ - Step 25914: {'lr': 0.00046847831828596647, 'samples': 4975488, 'steps': 25913, 'loss/train': 1.4921817779541016} -11/07/2021 00:51:50 - INFO - __main__ - Step 25915: {'lr': 0.0004684757387244928, 'samples': 4975680, 'steps': 25914, 'loss/train': 1.9082525968551636} -11/07/2021 00:51:51 - INFO - __main__ - Step 25916: {'lr': 0.00046847315906457733, 'samples': 4975872, 'steps': 25915, 'loss/train': 1.6177970170974731} -11/07/2021 00:51:52 - INFO - __main__ - Step 25917: {'lr': 0.0004684705793062212, 'samples': 4976064, 'steps': 25916, 'loss/train': 1.7028489112854004} -11/07/2021 00:51:52 - INFO - __main__ - Step 25918: {'lr': 0.00046846799944942564, 'samples': 4976256, 'steps': 25917, 'loss/train': 0.4418361485004425} -11/07/2021 00:51:52 - INFO - __main__ - Step 25919: {'lr': 0.00046846541949419177, 'samples': 4976448, 'steps': 25918, 'loss/train': 1.2632676362991333} -11/07/2021 00:51:53 - INFO - __main__ - Step 25920: {'lr': 0.00046846283944052073, 'samples': 4976640, 'steps': 25919, 'loss/train': 1.417981743812561} -11/07/2021 00:51:54 - INFO - __main__ - Step 25921: {'lr': 0.0004684602592884136, 'samples': 4976832, 'steps': 25920, 'loss/train': 2.107151985168457} -11/07/2021 00:51:54 - INFO - __main__ - Step 25922: {'lr': 0.0004684576790378718, 'samples': 4977024, 'steps': 25921, 'loss/train': 1.2924543619155884} -11/07/2021 00:51:54 - INFO - __main__ - Step 25923: {'lr': 0.00046845509868889625, 'samples': 4977216, 'steps': 25922, 'loss/train': 1.6383317708969116} -11/07/2021 00:51:55 - INFO - __main__ - Step 25924: {'lr': 0.00046845251824148825, 'samples': 4977408, 'steps': 25923, 'loss/train': 1.748632788658142} -11/07/2021 00:51:55 - INFO - __main__ - Step 25925: {'lr': 0.0004684499376956489, 'samples': 4977600, 'steps': 25924, 'loss/train': 1.5455869436264038} -11/07/2021 00:51:55 - INFO - __main__ - Step 25926: {'lr': 0.00046844735705137944, 'samples': 4977792, 'steps': 25925, 'loss/train': 1.6856175661087036} -11/07/2021 00:51:56 - INFO - __main__ - Step 25927: {'lr': 0.0004684447763086809, 'samples': 4977984, 'steps': 25926, 'loss/train': 1.0863152742385864} -11/07/2021 00:51:57 - INFO - __main__ - Step 25928: {'lr': 0.00046844219546755454, 'samples': 4978176, 'steps': 25927, 'loss/train': 1.6790918111801147} -11/07/2021 00:51:57 - INFO - __main__ - Step 25929: {'lr': 0.0004684396145280014, 'samples': 4978368, 'steps': 25928, 'loss/train': 1.7366427183151245} -11/07/2021 00:51:57 - INFO - __main__ - Step 25930: {'lr': 0.00046843703349002286, 'samples': 4978560, 'steps': 25929, 'loss/train': 1.4150608777999878} -11/07/2021 00:51:58 - INFO - __main__ - Step 25931: {'lr': 0.00046843445235361994, 'samples': 4978752, 'steps': 25930, 'loss/train': 1.5314158201217651} -11/07/2021 00:51:59 - INFO - __main__ - Step 25932: {'lr': 0.0004684318711187938, 'samples': 4978944, 'steps': 25931, 'loss/train': 1.862462043762207} -11/07/2021 00:51:59 - INFO - __main__ - Step 25933: {'lr': 0.0004684292897855457, 'samples': 4979136, 'steps': 25932, 'loss/train': 2.1105966567993164} -11/07/2021 00:52:00 - INFO - __main__ - Step 25934: {'lr': 0.00046842670835387667, 'samples': 4979328, 'steps': 25933, 'loss/train': 1.3371798992156982} -11/07/2021 00:52:00 - INFO - __main__ - Step 25935: {'lr': 0.00046842412682378796, 'samples': 4979520, 'steps': 25934, 'loss/train': 1.817678451538086} -11/07/2021 00:52:00 - INFO - __main__ - Step 25936: {'lr': 0.0004684215451952807, 'samples': 4979712, 'steps': 25935, 'loss/train': 1.6571016311645508} -11/07/2021 00:52:01 - INFO - __main__ - Step 25937: {'lr': 0.000468418963468356, 'samples': 4979904, 'steps': 25936, 'loss/train': 1.8304779529571533} -11/07/2021 00:52:02 - INFO - __main__ - Step 25938: {'lr': 0.0004684163816430152, 'samples': 4980096, 'steps': 25937, 'loss/train': 1.5367423295974731} -11/07/2021 00:52:02 - INFO - __main__ - Step 25939: {'lr': 0.00046841379971925923, 'samples': 4980288, 'steps': 25938, 'loss/train': 1.5942084789276123} -11/07/2021 00:52:02 - INFO - __main__ - Step 25940: {'lr': 0.0004684112176970895, 'samples': 4980480, 'steps': 25939, 'loss/train': 1.5396287441253662} -11/07/2021 00:52:03 - INFO - __main__ - Step 25941: {'lr': 0.0004684086355765069, 'samples': 4980672, 'steps': 25940, 'loss/train': 1.4727085828781128} -11/07/2021 00:52:04 - INFO - __main__ - Step 25942: {'lr': 0.00046840605335751284, 'samples': 4980864, 'steps': 25941, 'loss/train': 1.663288950920105} -11/07/2021 00:52:04 - INFO - __main__ - Step 25943: {'lr': 0.0004684034710401084, 'samples': 4981056, 'steps': 25942, 'loss/train': 1.538399577140808} -11/07/2021 00:52:05 - INFO - __main__ - Step 25944: {'lr': 0.00046840088862429465, 'samples': 4981248, 'steps': 25943, 'loss/train': 1.3046379089355469} -11/07/2021 00:52:05 - INFO - __main__ - Step 25945: {'lr': 0.00046839830611007297, 'samples': 4981440, 'steps': 25944, 'loss/train': 1.7420538663864136} -11/07/2021 00:52:05 - INFO - __main__ - Step 25946: {'lr': 0.00046839572349744417, 'samples': 4981632, 'steps': 25945, 'loss/train': 1.4014198780059814} -11/07/2021 00:52:06 - INFO - __main__ - Step 25947: {'lr': 0.0004683931407864098, 'samples': 4981824, 'steps': 25946, 'loss/train': 1.6909465789794922} -11/07/2021 00:52:07 - INFO - __main__ - Step 25948: {'lr': 0.0004683905579769708, 'samples': 4982016, 'steps': 25947, 'loss/train': 1.726481556892395} -11/07/2021 00:52:07 - INFO - __main__ - Step 25949: {'lr': 0.0004683879750691283, 'samples': 4982208, 'steps': 25948, 'loss/train': 1.3670543432235718} -11/07/2021 00:52:07 - INFO - __main__ - Step 25950: {'lr': 0.00046838539206288366, 'samples': 4982400, 'steps': 25949, 'loss/train': 1.9250874519348145} -11/07/2021 00:52:08 - INFO - __main__ - Step 25951: {'lr': 0.00046838280895823795, 'samples': 4982592, 'steps': 25950, 'loss/train': 1.8457273244857788} -11/07/2021 00:52:08 - INFO - __main__ - Step 25952: {'lr': 0.0004683802257551922, 'samples': 4982784, 'steps': 25951, 'loss/train': 1.3912980556488037} -11/07/2021 00:52:09 - INFO - __main__ - Step 25953: {'lr': 0.00046837764245374777, 'samples': 4982976, 'steps': 25952, 'loss/train': 1.2061102390289307} -11/07/2021 00:52:10 - INFO - __main__ - Step 25954: {'lr': 0.0004683750590539057, 'samples': 4983168, 'steps': 25953, 'loss/train': 1.2821147441864014} -11/07/2021 00:52:10 - INFO - __main__ - Step 25955: {'lr': 0.00046837247555566727, 'samples': 4983360, 'steps': 25954, 'loss/train': 1.5056250095367432} -11/07/2021 00:52:10 - INFO - __main__ - Step 25956: {'lr': 0.00046836989195903344, 'samples': 4983552, 'steps': 25955, 'loss/train': 1.6103827953338623} -11/07/2021 00:52:11 - INFO - __main__ - Step 25957: {'lr': 0.00046836730826400565, 'samples': 4983744, 'steps': 25956, 'loss/train': 2.7427055835723877} -11/07/2021 00:52:12 - INFO - __main__ - Step 25958: {'lr': 0.00046836472447058485, 'samples': 4983936, 'steps': 25957, 'loss/train': 1.5038542747497559} -11/07/2021 00:52:12 - INFO - __main__ - Step 25959: {'lr': 0.0004683621405787723, 'samples': 4984128, 'steps': 25958, 'loss/train': 1.4676628112792969} -11/07/2021 00:52:12 - INFO - __main__ - Step 25960: {'lr': 0.0004683595565885691, 'samples': 4984320, 'steps': 25959, 'loss/train': 1.1955684423446655} -11/07/2021 00:52:13 - INFO - __main__ - Step 25961: {'lr': 0.0004683569724999765, 'samples': 4984512, 'steps': 25960, 'loss/train': 1.4902448654174805} -11/07/2021 00:52:13 - INFO - __main__ - Step 25962: {'lr': 0.0004683543883129956, 'samples': 4984704, 'steps': 25961, 'loss/train': 1.6452752351760864} -11/07/2021 00:52:14 - INFO - __main__ - Step 25963: {'lr': 0.00046835180402762756, 'samples': 4984896, 'steps': 25962, 'loss/train': 1.4151829481124878} -11/07/2021 00:52:14 - INFO - __main__ - Step 25964: {'lr': 0.00046834921964387363, 'samples': 4985088, 'steps': 25963, 'loss/train': 1.4597492218017578} -11/07/2021 00:52:15 - INFO - __main__ - Step 25965: {'lr': 0.0004683466351617348, 'samples': 4985280, 'steps': 25964, 'loss/train': 1.5860645771026611} -11/07/2021 00:52:15 - INFO - __main__ - Step 25966: {'lr': 0.00046834405058121244, 'samples': 4985472, 'steps': 25965, 'loss/train': 1.5850639343261719} -11/07/2021 00:52:15 - INFO - __main__ - Step 25967: {'lr': 0.0004683414659023076, 'samples': 4985664, 'steps': 25966, 'loss/train': 1.1708070039749146} -11/07/2021 00:52:16 - INFO - __main__ - Step 25968: {'lr': 0.0004683388811250214, 'samples': 4985856, 'steps': 25967, 'loss/train': 1.4193698167800903} -11/07/2021 00:52:17 - INFO - __main__ - Step 25969: {'lr': 0.0004683362962493552, 'samples': 4986048, 'steps': 25968, 'loss/train': 1.1845221519470215} -11/07/2021 00:52:17 - INFO - __main__ - Step 25970: {'lr': 0.00046833371127530995, 'samples': 4986240, 'steps': 25969, 'loss/train': 1.4896739721298218} -11/07/2021 00:52:18 - INFO - __main__ - Step 25971: {'lr': 0.00046833112620288684, 'samples': 4986432, 'steps': 25970, 'loss/train': 1.51420259475708} -11/07/2021 00:52:18 - INFO - __main__ - Step 25972: {'lr': 0.0004683285410320872, 'samples': 4986624, 'steps': 25971, 'loss/train': 1.2518377304077148} -11/07/2021 00:52:19 - INFO - __main__ - Step 25973: {'lr': 0.000468325955762912, 'samples': 4986816, 'steps': 25972, 'loss/train': 1.53132164478302} -11/07/2021 00:52:19 - INFO - __main__ - Step 25974: {'lr': 0.0004683233703953626, 'samples': 4987008, 'steps': 25973, 'loss/train': 1.5884449481964111} -11/07/2021 00:52:20 - INFO - __main__ - Step 25975: {'lr': 0.00046832078492944, 'samples': 4987200, 'steps': 25974, 'loss/train': 1.120357871055603} -11/07/2021 00:52:20 - INFO - __main__ - Step 25976: {'lr': 0.0004683181993651454, 'samples': 4987392, 'steps': 25975, 'loss/train': 1.7608742713928223} -11/07/2021 00:52:20 - INFO - __main__ - Step 25977: {'lr': 0.0004683156137024801, 'samples': 4987584, 'steps': 25976, 'loss/train': 1.5439300537109375} -11/07/2021 00:52:21 - INFO - __main__ - Step 25978: {'lr': 0.00046831302794144504, 'samples': 4987776, 'steps': 25977, 'loss/train': 1.1016311645507812} -11/07/2021 00:52:22 - INFO - __main__ - Step 25979: {'lr': 0.00046831044208204154, 'samples': 4987968, 'steps': 25978, 'loss/train': 1.5977383852005005} -11/07/2021 00:52:22 - INFO - __main__ - Step 25980: {'lr': 0.0004683078561242707, 'samples': 4988160, 'steps': 25979, 'loss/train': 1.0856884717941284} -11/07/2021 00:52:22 - INFO - __main__ - Step 25981: {'lr': 0.00046830527006813373, 'samples': 4988352, 'steps': 25980, 'loss/train': 1.28452730178833} -11/07/2021 00:52:23 - INFO - __main__ - Step 25982: {'lr': 0.00046830268391363176, 'samples': 4988544, 'steps': 25981, 'loss/train': 1.5783252716064453} -11/07/2021 00:52:24 - INFO - __main__ - Step 25983: {'lr': 0.0004683000976607659, 'samples': 4988736, 'steps': 25982, 'loss/train': 2.0148348808288574} -11/07/2021 00:52:24 - INFO - __main__ - Step 25984: {'lr': 0.00046829751130953747, 'samples': 4988928, 'steps': 25983, 'loss/train': 2.1376888751983643} -11/07/2021 00:52:25 - INFO - __main__ - Step 25985: {'lr': 0.0004682949248599476, 'samples': 4989120, 'steps': 25984, 'loss/train': 1.2700146436691284} -11/07/2021 00:52:25 - INFO - __main__ - Step 25986: {'lr': 0.0004682923383119973, 'samples': 4989312, 'steps': 25985, 'loss/train': 1.7473276853561401} -11/07/2021 00:52:25 - INFO - __main__ - Step 25987: {'lr': 0.0004682897516656879, 'samples': 4989504, 'steps': 25986, 'loss/train': 1.577156662940979} -11/07/2021 00:52:26 - INFO - __main__ - Step 25988: {'lr': 0.00046828716492102043, 'samples': 4989696, 'steps': 25987, 'loss/train': 1.371836543083191} -11/07/2021 00:52:27 - INFO - __main__ - Step 25989: {'lr': 0.0004682845780779962, 'samples': 4989888, 'steps': 25988, 'loss/train': 1.2244542837142944} -11/07/2021 00:52:27 - INFO - __main__ - Step 25990: {'lr': 0.00046828199113661627, 'samples': 4990080, 'steps': 25989, 'loss/train': 1.1802819967269897} -11/07/2021 00:52:27 - INFO - __main__ - Step 25991: {'lr': 0.0004682794040968819, 'samples': 4990272, 'steps': 25990, 'loss/train': 1.1837917566299438} -11/07/2021 00:52:28 - INFO - __main__ - Step 25992: {'lr': 0.0004682768169587942, 'samples': 4990464, 'steps': 25991, 'loss/train': 1.503637671470642} -11/07/2021 00:52:28 - INFO - __main__ - Step 25993: {'lr': 0.0004682742297223543, 'samples': 4990656, 'steps': 25992, 'loss/train': 1.3802827596664429} -11/07/2021 00:52:29 - INFO - __main__ - Step 25994: {'lr': 0.00046827164238756337, 'samples': 4990848, 'steps': 25993, 'loss/train': 1.4477992057800293} -11/07/2021 00:52:30 - INFO - __main__ - Step 25995: {'lr': 0.00046826905495442263, 'samples': 4991040, 'steps': 25994, 'loss/train': 1.8412169218063354} -11/07/2021 00:52:30 - INFO - __main__ - Step 25996: {'lr': 0.00046826646742293326, 'samples': 4991232, 'steps': 25995, 'loss/train': 1.4182357788085938} -11/07/2021 00:52:30 - INFO - __main__ - Step 25997: {'lr': 0.00046826387979309635, 'samples': 4991424, 'steps': 25996, 'loss/train': 1.7624053955078125} -11/07/2021 00:52:31 - INFO - __main__ - Step 25998: {'lr': 0.0004682612920649131, 'samples': 4991616, 'steps': 25997, 'loss/train': 1.870514988899231} -11/07/2021 00:52:32 - INFO - __main__ - Step 25999: {'lr': 0.00046825870423838466, 'samples': 4991808, 'steps': 25998, 'loss/train': 1.5395135879516602} -11/07/2021 00:52:32 - INFO - __main__ - Step 26000: {'lr': 0.00046825611631351227, 'samples': 4992000, 'steps': 25999, 'loss/train': 1.233712911605835} -11/07/2021 00:52:32 - INFO - __main__ - Step 26001: {'lr': 0.00046825352829029705, 'samples': 4992192, 'steps': 26000, 'loss/train': 1.740976095199585} -11/07/2021 00:52:33 - INFO - __main__ - Step 26002: {'lr': 0.00046825094016874014, 'samples': 4992384, 'steps': 26001, 'loss/train': 1.8134573698043823} -11/07/2021 00:52:33 - INFO - __main__ - Step 26003: {'lr': 0.00046824835194884273, 'samples': 4992576, 'steps': 26002, 'loss/train': 1.9249521493911743} -11/07/2021 00:52:34 - INFO - __main__ - Step 26004: {'lr': 0.0004682457636306059, 'samples': 4992768, 'steps': 26003, 'loss/train': 1.6932024955749512} -11/07/2021 00:52:35 - INFO - __main__ - Step 26005: {'lr': 0.000468243175214031, 'samples': 4992960, 'steps': 26004, 'loss/train': 1.567561149597168} -11/07/2021 00:52:35 - INFO - __main__ - Step 26006: {'lr': 0.00046824058669911906, 'samples': 4993152, 'steps': 26005, 'loss/train': 1.3454017639160156} -11/07/2021 00:52:35 - INFO - __main__ - Step 26007: {'lr': 0.00046823799808587126, 'samples': 4993344, 'steps': 26006, 'loss/train': 2.0492119789123535} -11/07/2021 00:52:36 - INFO - __main__ - Step 26008: {'lr': 0.00046823540937428876, 'samples': 4993536, 'steps': 26007, 'loss/train': 1.4472533464431763} -11/07/2021 00:52:37 - INFO - __main__ - Step 26009: {'lr': 0.0004682328205643728, 'samples': 4993728, 'steps': 26008, 'loss/train': 2.2082765102386475} -11/07/2021 00:52:37 - INFO - __main__ - Step 26010: {'lr': 0.00046823023165612455, 'samples': 4993920, 'steps': 26009, 'loss/train': 1.7340260744094849} -11/07/2021 00:52:37 - INFO - __main__ - Step 26011: {'lr': 0.000468227642649545, 'samples': 4994112, 'steps': 26010, 'loss/train': 1.229740858078003} -11/07/2021 00:52:38 - INFO - __main__ - Step 26012: {'lr': 0.00046822505354463553, 'samples': 4994304, 'steps': 26011, 'loss/train': 1.5559407472610474} -11/07/2021 00:52:38 - INFO - __main__ - Step 26013: {'lr': 0.0004682224643413972, 'samples': 4994496, 'steps': 26012, 'loss/train': 1.1459075212478638} -11/07/2021 00:52:39 - INFO - __main__ - Step 26014: {'lr': 0.0004682198750398312, 'samples': 4994688, 'steps': 26013, 'loss/train': 1.929360032081604} -11/07/2021 00:52:39 - INFO - __main__ - Step 26015: {'lr': 0.00046821728563993867, 'samples': 4994880, 'steps': 26014, 'loss/train': 1.8622995615005493} -11/07/2021 00:52:40 - INFO - __main__ - Step 26016: {'lr': 0.0004682146961417208, 'samples': 4995072, 'steps': 26015, 'loss/train': 1.5445281267166138} -11/07/2021 00:52:40 - INFO - __main__ - Step 26017: {'lr': 0.00046821210654517874, 'samples': 4995264, 'steps': 26016, 'loss/train': 1.3797636032104492} -11/07/2021 00:52:40 - INFO - __main__ - Step 26018: {'lr': 0.0004682095168503137, 'samples': 4995456, 'steps': 26017, 'loss/train': 1.3731129169464111} -11/07/2021 00:52:41 - INFO - __main__ - Step 26019: {'lr': 0.00046820692705712685, 'samples': 4995648, 'steps': 26018, 'loss/train': 2.186852216720581} -11/07/2021 00:52:42 - INFO - __main__ - Step 26020: {'lr': 0.00046820433716561927, 'samples': 4995840, 'steps': 26019, 'loss/train': 1.5869444608688354} -11/07/2021 00:52:42 - INFO - __main__ - Step 26021: {'lr': 0.0004682017471757922, 'samples': 4996032, 'steps': 26020, 'loss/train': 1.7409318685531616} -11/07/2021 00:52:42 - INFO - __main__ - Step 26022: {'lr': 0.0004681991570876468, 'samples': 4996224, 'steps': 26021, 'loss/train': 1.7557164430618286} -11/07/2021 00:52:43 - INFO - __main__ - Step 26023: {'lr': 0.00046819656690118424, 'samples': 4996416, 'steps': 26022, 'loss/train': 1.6353843212127686} -11/07/2021 00:52:44 - INFO - __main__ - Step 26024: {'lr': 0.00046819397661640563, 'samples': 4996608, 'steps': 26023, 'loss/train': 1.4602898359298706} -11/07/2021 00:52:44 - INFO - __main__ - Step 26025: {'lr': 0.0004681913862333122, 'samples': 4996800, 'steps': 26024, 'loss/train': 1.1732585430145264} -11/07/2021 00:52:45 - INFO - __main__ - Step 26026: {'lr': 0.0004681887957519051, 'samples': 4996992, 'steps': 26025, 'loss/train': 1.5690240859985352} -11/07/2021 00:52:45 - INFO - __main__ - Step 26027: {'lr': 0.00046818620517218544, 'samples': 4997184, 'steps': 26026, 'loss/train': 1.5888382196426392} -11/07/2021 00:52:45 - INFO - __main__ - Step 26028: {'lr': 0.00046818361449415456, 'samples': 4997376, 'steps': 26027, 'loss/train': 1.7676751613616943} -11/07/2021 00:52:46 - INFO - __main__ - Step 26029: {'lr': 0.00046818102371781343, 'samples': 4997568, 'steps': 26028, 'loss/train': 1.2550809383392334} -11/07/2021 00:52:47 - INFO - __main__ - Step 26030: {'lr': 0.0004681784328431633, 'samples': 4997760, 'steps': 26029, 'loss/train': 1.797165036201477} -11/07/2021 00:52:47 - INFO - __main__ - Step 26031: {'lr': 0.0004681758418702054, 'samples': 4997952, 'steps': 26030, 'loss/train': 1.6159076690673828} -11/07/2021 00:52:47 - INFO - __main__ - Step 26032: {'lr': 0.0004681732507989408, 'samples': 4998144, 'steps': 26031, 'loss/train': 1.2013065814971924} -11/07/2021 00:52:48 - INFO - __main__ - Step 26033: {'lr': 0.00046817065962937067, 'samples': 4998336, 'steps': 26032, 'loss/train': 1.5733553171157837} -11/07/2021 00:52:48 - INFO - __main__ - Step 26034: {'lr': 0.00046816806836149624, 'samples': 4998528, 'steps': 26033, 'loss/train': 1.91973078250885} -11/07/2021 00:52:49 - INFO - __main__ - Step 26035: {'lr': 0.00046816547699531866, 'samples': 4998720, 'steps': 26034, 'loss/train': 1.1797672510147095} -11/07/2021 00:52:49 - INFO - __main__ - Step 26036: {'lr': 0.000468162885530839, 'samples': 4998912, 'steps': 26035, 'loss/train': 2.0054972171783447} -11/07/2021 00:52:50 - INFO - __main__ - Step 26037: {'lr': 0.00046816029396805857, 'samples': 4999104, 'steps': 26036, 'loss/train': 1.3194879293441772} -11/07/2021 00:52:50 - INFO - __main__ - Step 26038: {'lr': 0.00046815770230697844, 'samples': 4999296, 'steps': 26037, 'loss/train': 1.9048802852630615} -11/07/2021 00:52:50 - INFO - __main__ - Step 26039: {'lr': 0.0004681551105475999, 'samples': 4999488, 'steps': 26038, 'loss/train': 1.6333225965499878} -11/07/2021 00:52:51 - INFO - __main__ - Step 26040: {'lr': 0.0004681525186899239, 'samples': 4999680, 'steps': 26039, 'loss/train': 0.944560170173645} -11/07/2021 00:52:52 - INFO - __main__ - Step 26041: {'lr': 0.00046814992673395185, 'samples': 4999872, 'steps': 26040, 'loss/train': 2.0325982570648193} -11/07/2021 00:52:52 - INFO - __main__ - Step 26042: {'lr': 0.0004681473346796848, 'samples': 5000064, 'steps': 26041, 'loss/train': 1.6044882535934448} -11/07/2021 00:52:52 - INFO - __main__ - Step 26043: {'lr': 0.0004681447425271239, 'samples': 5000256, 'steps': 26042, 'loss/train': 1.1876591444015503} -11/07/2021 00:52:53 - INFO - __main__ - Step 26044: {'lr': 0.0004681421502762704, 'samples': 5000448, 'steps': 26043, 'loss/train': 1.3685396909713745} -11/07/2021 00:52:54 - INFO - __main__ - Step 26045: {'lr': 0.0004681395579271253, 'samples': 5000640, 'steps': 26044, 'loss/train': 1.4207525253295898} -11/07/2021 00:52:54 - INFO - __main__ - Step 26046: {'lr': 0.00046813696547969, 'samples': 5000832, 'steps': 26045, 'loss/train': 1.6542054414749146} -11/07/2021 00:52:55 - INFO - __main__ - Step 26047: {'lr': 0.00046813437293396543, 'samples': 5001024, 'steps': 26046, 'loss/train': 1.1289676427841187} -11/07/2021 00:52:55 - INFO - __main__ - Step 26048: {'lr': 0.000468131780289953, 'samples': 5001216, 'steps': 26047, 'loss/train': 1.707362174987793} -11/07/2021 00:52:55 - INFO - __main__ - Step 26049: {'lr': 0.00046812918754765364, 'samples': 5001408, 'steps': 26048, 'loss/train': 1.5160295963287354} -11/07/2021 00:52:57 - INFO - __main__ - Step 26050: {'lr': 0.00046812659470706877, 'samples': 5001600, 'steps': 26049, 'loss/train': 1.486424207687378} -11/07/2021 00:52:57 - INFO - __main__ - Step 26051: {'lr': 0.0004681240017681993, 'samples': 5001792, 'steps': 26050, 'loss/train': 1.995141863822937} -11/07/2021 00:52:57 - INFO - __main__ - Step 26052: {'lr': 0.00046812140873104657, 'samples': 5001984, 'steps': 26051, 'loss/train': 0.976646363735199} -11/07/2021 00:52:58 - INFO - __main__ - Step 26053: {'lr': 0.00046811881559561167, 'samples': 5002176, 'steps': 26052, 'loss/train': 1.8532328605651855} -11/07/2021 00:52:58 - INFO - __main__ - Step 26054: {'lr': 0.00046811622236189585, 'samples': 5002368, 'steps': 26053, 'loss/train': 1.7580597400665283} -11/07/2021 00:52:58 - INFO - __main__ - Step 26055: {'lr': 0.0004681136290299002, 'samples': 5002560, 'steps': 26054, 'loss/train': 1.3783228397369385} -11/07/2021 00:52:59 - INFO - __main__ - Step 26056: {'lr': 0.00046811103559962585, 'samples': 5002752, 'steps': 26055, 'loss/train': 1.3633968830108643} -11/07/2021 00:53:00 - INFO - __main__ - Step 26057: {'lr': 0.00046810844207107415, 'samples': 5002944, 'steps': 26056, 'loss/train': 1.6410704851150513} -11/07/2021 00:53:00 - INFO - __main__ - Step 26058: {'lr': 0.0004681058484442461, 'samples': 5003136, 'steps': 26057, 'loss/train': 1.8240699768066406} -11/07/2021 00:53:00 - INFO - __main__ - Step 26059: {'lr': 0.00046810325471914295, 'samples': 5003328, 'steps': 26058, 'loss/train': 1.9498460292816162} -11/07/2021 00:53:01 - INFO - __main__ - Step 26060: {'lr': 0.00046810066089576573, 'samples': 5003520, 'steps': 26059, 'loss/train': 1.6209688186645508} -11/07/2021 00:53:01 - INFO - __main__ - Step 26061: {'lr': 0.00046809806697411583, 'samples': 5003712, 'steps': 26060, 'loss/train': 1.3615363836288452} -11/07/2021 00:53:02 - INFO - __main__ - Step 26062: {'lr': 0.0004680954729541942, 'samples': 5003904, 'steps': 26061, 'loss/train': 1.435072898864746} -11/07/2021 00:53:03 - INFO - __main__ - Step 26063: {'lr': 0.00046809287883600227, 'samples': 5004096, 'steps': 26062, 'loss/train': 1.6992723941802979} -11/07/2021 00:53:03 - INFO - __main__ - Step 26064: {'lr': 0.00046809028461954093, 'samples': 5004288, 'steps': 26063, 'loss/train': 1.3957271575927734} -11/07/2021 00:53:03 - INFO - __main__ - Step 26065: {'lr': 0.00046808769030481153, 'samples': 5004480, 'steps': 26064, 'loss/train': 1.38559091091156} -11/07/2021 00:53:04 - INFO - __main__ - Step 26066: {'lr': 0.00046808509589181513, 'samples': 5004672, 'steps': 26065, 'loss/train': 1.3515117168426514} -11/07/2021 00:53:05 - INFO - __main__ - Step 26067: {'lr': 0.00046808250138055305, 'samples': 5004864, 'steps': 26066, 'loss/train': 1.3374156951904297} -11/07/2021 00:53:05 - INFO - __main__ - Step 26068: {'lr': 0.0004680799067710263, 'samples': 5005056, 'steps': 26067, 'loss/train': 1.1858316659927368} -11/07/2021 00:53:05 - INFO - __main__ - Step 26069: {'lr': 0.00046807731206323605, 'samples': 5005248, 'steps': 26068, 'loss/train': 1.3988279104232788} -11/07/2021 00:53:06 - INFO - __main__ - Step 26070: {'lr': 0.00046807471725718357, 'samples': 5005440, 'steps': 26069, 'loss/train': 1.8223246335983276} -11/07/2021 00:53:06 - INFO - __main__ - Step 26071: {'lr': 0.00046807212235287, 'samples': 5005632, 'steps': 26070, 'loss/train': 1.149131417274475} -11/07/2021 00:53:07 - INFO - __main__ - Step 26072: {'lr': 0.0004680695273502965, 'samples': 5005824, 'steps': 26071, 'loss/train': 1.7531110048294067} -11/07/2021 00:53:08 - INFO - __main__ - Step 26073: {'lr': 0.00046806693224946426, 'samples': 5006016, 'steps': 26072, 'loss/train': 1.817716121673584} -11/07/2021 00:53:08 - INFO - __main__ - Step 26074: {'lr': 0.00046806433705037445, 'samples': 5006208, 'steps': 26073, 'loss/train': 1.7162048816680908} -11/07/2021 00:53:08 - INFO - __main__ - Step 26075: {'lr': 0.00046806174175302806, 'samples': 5006400, 'steps': 26074, 'loss/train': 0.9646897912025452} -11/07/2021 00:53:09 - INFO - __main__ - Step 26076: {'lr': 0.00046805914635742656, 'samples': 5006592, 'steps': 26075, 'loss/train': 1.3818391561508179} -11/07/2021 00:53:10 - INFO - __main__ - Step 26077: {'lr': 0.0004680565508635709, 'samples': 5006784, 'steps': 26076, 'loss/train': 1.4534307718276978} -11/07/2021 00:53:10 - INFO - __main__ - Step 26078: {'lr': 0.00046805395527146237, 'samples': 5006976, 'steps': 26077, 'loss/train': 1.2013325691223145} -11/07/2021 00:53:10 - INFO - __main__ - Step 26079: {'lr': 0.0004680513595811021, 'samples': 5007168, 'steps': 26078, 'loss/train': 1.4902340173721313} -11/07/2021 00:53:11 - INFO - __main__ - Step 26080: {'lr': 0.0004680487637924912, 'samples': 5007360, 'steps': 26079, 'loss/train': 1.373033046722412} -11/07/2021 00:53:11 - INFO - __main__ - Step 26081: {'lr': 0.0004680461679056309, 'samples': 5007552, 'steps': 26080, 'loss/train': 1.8461296558380127} -11/07/2021 00:53:12 - INFO - __main__ - Step 26082: {'lr': 0.00046804357192052246, 'samples': 5007744, 'steps': 26081, 'loss/train': 1.5331897735595703} -11/07/2021 00:53:13 - INFO - __main__ - Step 26083: {'lr': 0.00046804097583716685, 'samples': 5007936, 'steps': 26082, 'loss/train': 1.252344012260437} -11/07/2021 00:53:13 - INFO - __main__ - Step 26084: {'lr': 0.0004680383796555654, 'samples': 5008128, 'steps': 26083, 'loss/train': 1.4637391567230225} -11/07/2021 00:53:13 - INFO - __main__ - Step 26085: {'lr': 0.00046803578337571917, 'samples': 5008320, 'steps': 26084, 'loss/train': 1.5039665699005127} -11/07/2021 00:53:14 - INFO - __main__ - Step 26086: {'lr': 0.00046803318699762937, 'samples': 5008512, 'steps': 26085, 'loss/train': 1.2997361421585083} -11/07/2021 00:53:15 - INFO - __main__ - Step 26087: {'lr': 0.0004680305905212972, 'samples': 5008704, 'steps': 26086, 'loss/train': 1.739014983177185} -11/07/2021 00:53:15 - INFO - __main__ - Step 26088: {'lr': 0.0004680279939467238, 'samples': 5008896, 'steps': 26087, 'loss/train': 1.3671000003814697} -11/07/2021 00:53:16 - INFO - __main__ - Step 26089: {'lr': 0.00046802539727391033, 'samples': 5009088, 'steps': 26088, 'loss/train': 1.5393263101577759} -11/07/2021 00:53:16 - INFO - __main__ - Step 26090: {'lr': 0.0004680228005028581, 'samples': 5009280, 'steps': 26089, 'loss/train': 1.33014714717865} -11/07/2021 00:53:16 - INFO - __main__ - Step 26091: {'lr': 0.000468020203633568, 'samples': 5009472, 'steps': 26090, 'loss/train': 1.4916388988494873} -11/07/2021 00:53:17 - INFO - __main__ - Step 26092: {'lr': 0.0004680176066660415, 'samples': 5009664, 'steps': 26091, 'loss/train': 1.7128859758377075} -11/07/2021 00:53:18 - INFO - __main__ - Step 26093: {'lr': 0.00046801500960027957, 'samples': 5009856, 'steps': 26092, 'loss/train': 1.4452115297317505} -11/07/2021 00:53:18 - INFO - __main__ - Step 26094: {'lr': 0.00046801241243628344, 'samples': 5010048, 'steps': 26093, 'loss/train': 1.9708287715911865} -11/07/2021 00:53:18 - INFO - __main__ - Step 26095: {'lr': 0.00046800981517405426, 'samples': 5010240, 'steps': 26094, 'loss/train': 1.3643174171447754} -11/07/2021 00:53:19 - INFO - __main__ - Step 26096: {'lr': 0.0004680072178135932, 'samples': 5010432, 'steps': 26095, 'loss/train': 2.488478899002075} -11/07/2021 00:53:19 - INFO - __main__ - Step 26097: {'lr': 0.00046800462035490156, 'samples': 5010624, 'steps': 26096, 'loss/train': 1.4790648221969604} -11/07/2021 00:53:20 - INFO - __main__ - Step 26098: {'lr': 0.0004680020227979803, 'samples': 5010816, 'steps': 26097, 'loss/train': 1.0440701246261597} -11/07/2021 00:53:20 - INFO - __main__ - Step 26099: {'lr': 0.0004679994251428308, 'samples': 5011008, 'steps': 26098, 'loss/train': 1.7082839012145996} -11/07/2021 00:53:21 - INFO - __main__ - Step 26100: {'lr': 0.00046799682738945397, 'samples': 5011200, 'steps': 26099, 'loss/train': 1.8536376953125} -11/07/2021 00:53:21 - INFO - __main__ - Step 26101: {'lr': 0.00046799422953785124, 'samples': 5011392, 'steps': 26100, 'loss/train': 1.5862019062042236} -11/07/2021 00:53:21 - INFO - __main__ - Step 26102: {'lr': 0.00046799163158802365, 'samples': 5011584, 'steps': 26101, 'loss/train': 1.9192478656768799} -11/07/2021 00:53:22 - INFO - __main__ - Step 26103: {'lr': 0.00046798903353997243, 'samples': 5011776, 'steps': 26102, 'loss/train': 1.8214565515518188} -11/07/2021 00:53:23 - INFO - __main__ - Step 26104: {'lr': 0.0004679864353936987, 'samples': 5011968, 'steps': 26103, 'loss/train': 2.0594255924224854} -11/07/2021 00:53:23 - INFO - __main__ - Step 26105: {'lr': 0.0004679838371492036, 'samples': 5012160, 'steps': 26104, 'loss/train': 1.3771926164627075} -11/07/2021 00:53:23 - INFO - __main__ - Step 26106: {'lr': 0.00046798123880648833, 'samples': 5012352, 'steps': 26105, 'loss/train': 1.7747282981872559} -11/07/2021 00:53:24 - INFO - __main__ - Step 26107: {'lr': 0.0004679786403655542, 'samples': 5012544, 'steps': 26106, 'loss/train': 1.5721908807754517} -11/07/2021 00:53:25 - INFO - __main__ - Step 26108: {'lr': 0.0004679760418264021, 'samples': 5012736, 'steps': 26107, 'loss/train': 1.555148720741272} -11/07/2021 00:53:25 - INFO - __main__ - Step 26109: {'lr': 0.00046797344318903343, 'samples': 5012928, 'steps': 26108, 'loss/train': 1.344144582748413} -11/07/2021 00:53:26 - INFO - __main__ - Step 26110: {'lr': 0.0004679708444534493, 'samples': 5013120, 'steps': 26109, 'loss/train': 0.920870304107666} -11/07/2021 00:53:26 - INFO - __main__ - Step 26111: {'lr': 0.0004679682456196509, 'samples': 5013312, 'steps': 26110, 'loss/train': 1.5601238012313843} -11/07/2021 00:53:26 - INFO - __main__ - Step 26112: {'lr': 0.0004679656466876393, 'samples': 5013504, 'steps': 26111, 'loss/train': 1.429107904434204} -11/07/2021 00:53:27 - INFO - __main__ - Step 26113: {'lr': 0.00046796304765741583, 'samples': 5013696, 'steps': 26112, 'loss/train': 1.5923376083374023} -11/07/2021 00:53:28 - INFO - __main__ - Step 26114: {'lr': 0.00046796044852898144, 'samples': 5013888, 'steps': 26113, 'loss/train': 1.8528300523757935} -11/07/2021 00:53:28 - INFO - __main__ - Step 26115: {'lr': 0.0004679578493023375, 'samples': 5014080, 'steps': 26114, 'loss/train': 1.4153774976730347} -11/07/2021 00:53:28 - INFO - __main__ - Step 26116: {'lr': 0.00046795524997748515, 'samples': 5014272, 'steps': 26115, 'loss/train': 1.7058981657028198} -11/07/2021 00:53:29 - INFO - __main__ - Step 26117: {'lr': 0.0004679526505544256, 'samples': 5014464, 'steps': 26116, 'loss/train': 1.5847781896591187} -11/07/2021 00:53:30 - INFO - __main__ - Step 26118: {'lr': 0.0004679500510331598, 'samples': 5014656, 'steps': 26117, 'loss/train': 1.441420078277588} -11/07/2021 00:53:30 - INFO - __main__ - Step 26119: {'lr': 0.00046794745141368917, 'samples': 5014848, 'steps': 26118, 'loss/train': 1.183732032775879} -11/07/2021 00:53:30 - INFO - __main__ - Step 26120: {'lr': 0.00046794485169601474, 'samples': 5015040, 'steps': 26119, 'loss/train': 1.5869964361190796} -11/07/2021 00:53:31 - INFO - __main__ - Step 26121: {'lr': 0.00046794225188013773, 'samples': 5015232, 'steps': 26120, 'loss/train': 1.3868657350540161} -11/07/2021 00:53:31 - INFO - __main__ - Step 26122: {'lr': 0.00046793965196605927, 'samples': 5015424, 'steps': 26121, 'loss/train': 1.588295817375183} -11/07/2021 00:53:31 - INFO - __main__ - Step 26123: {'lr': 0.00046793705195378066, 'samples': 5015616, 'steps': 26122, 'loss/train': 2.0373282432556152} -11/07/2021 00:53:32 - INFO - __main__ - Step 26124: {'lr': 0.0004679344518433029, 'samples': 5015808, 'steps': 26123, 'loss/train': 1.2457910776138306} -11/07/2021 00:53:33 - INFO - __main__ - Step 26125: {'lr': 0.0004679318516346273, 'samples': 5016000, 'steps': 26124, 'loss/train': 1.1270509958267212} -11/07/2021 00:53:33 - INFO - __main__ - Step 26126: {'lr': 0.0004679292513277549, 'samples': 5016192, 'steps': 26125, 'loss/train': 1.675414800643921} -11/07/2021 00:53:33 - INFO - __main__ - Step 26127: {'lr': 0.0004679266509226869, 'samples': 5016384, 'steps': 26126, 'loss/train': 1.6026920080184937} -11/07/2021 00:53:34 - INFO - __main__ - Step 26128: {'lr': 0.0004679240504194246, 'samples': 5016576, 'steps': 26127, 'loss/train': 1.3696702718734741} -11/07/2021 00:53:35 - INFO - __main__ - Step 26129: {'lr': 0.00046792144981796905, 'samples': 5016768, 'steps': 26128, 'loss/train': 1.309404969215393} -11/07/2021 00:53:35 - INFO - __main__ - Step 26130: {'lr': 0.0004679188491183215, 'samples': 5016960, 'steps': 26129, 'loss/train': 1.17288339138031} -11/07/2021 00:53:36 - INFO - __main__ - Step 26131: {'lr': 0.00046791624832048307, 'samples': 5017152, 'steps': 26130, 'loss/train': 1.457753300666809} -11/07/2021 00:53:36 - INFO - __main__ - Step 26132: {'lr': 0.0004679136474244549, 'samples': 5017344, 'steps': 26131, 'loss/train': 1.6909582614898682} -11/07/2021 00:53:36 - INFO - __main__ - Step 26133: {'lr': 0.00046791104643023823, 'samples': 5017536, 'steps': 26132, 'loss/train': 1.6915613412857056} -11/07/2021 00:53:37 - INFO - __main__ - Step 26134: {'lr': 0.0004679084453378342, 'samples': 5017728, 'steps': 26133, 'loss/train': 1.97373366355896} -11/07/2021 00:53:38 - INFO - __main__ - Step 26135: {'lr': 0.00046790584414724404, 'samples': 5017920, 'steps': 26134, 'loss/train': 1.0392847061157227} -11/07/2021 00:53:38 - INFO - __main__ - Step 26136: {'lr': 0.0004679032428584687, 'samples': 5018112, 'steps': 26135, 'loss/train': 1.4240553379058838} -11/07/2021 00:53:38 - INFO - __main__ - Step 26137: {'lr': 0.0004679006414715097, 'samples': 5018304, 'steps': 26136, 'loss/train': 1.4850119352340698} -11/07/2021 00:53:39 - INFO - __main__ - Step 26138: {'lr': 0.00046789803998636796, 'samples': 5018496, 'steps': 26137, 'loss/train': 1.529703974723816} -11/07/2021 00:53:40 - INFO - __main__ - Step 26139: {'lr': 0.0004678954384030448, 'samples': 5018688, 'steps': 26138, 'loss/train': 1.807644248008728} -11/07/2021 00:53:40 - INFO - __main__ - Step 26140: {'lr': 0.00046789283672154125, 'samples': 5018880, 'steps': 26139, 'loss/train': 1.7455646991729736} -11/07/2021 00:53:40 - INFO - __main__ - Step 26141: {'lr': 0.00046789023494185855, 'samples': 5019072, 'steps': 26140, 'loss/train': 1.525965929031372} -11/07/2021 00:53:41 - INFO - __main__ - Step 26142: {'lr': 0.0004678876330639978, 'samples': 5019264, 'steps': 26141, 'loss/train': 1.9528864622116089} -11/07/2021 00:53:41 - INFO - __main__ - Step 26143: {'lr': 0.0004678850310879604, 'samples': 5019456, 'steps': 26142, 'loss/train': 1.6074074506759644} -11/07/2021 00:53:42 - INFO - __main__ - Step 26144: {'lr': 0.0004678824290137473, 'samples': 5019648, 'steps': 26143, 'loss/train': 1.5852299928665161} -11/07/2021 00:53:43 - INFO - __main__ - Step 26145: {'lr': 0.0004678798268413597, 'samples': 5019840, 'steps': 26144, 'loss/train': 0.9158662557601929} -11/07/2021 00:53:43 - INFO - __main__ - Step 26146: {'lr': 0.00046787722457079887, 'samples': 5020032, 'steps': 26145, 'loss/train': 1.5754239559173584} -11/07/2021 00:53:43 - INFO - __main__ - Step 26147: {'lr': 0.00046787462220206587, 'samples': 5020224, 'steps': 26146, 'loss/train': 1.568524956703186} -11/07/2021 00:53:44 - INFO - __main__ - Step 26148: {'lr': 0.00046787201973516195, 'samples': 5020416, 'steps': 26147, 'loss/train': 1.5438616275787354} -11/07/2021 00:53:44 - INFO - __main__ - Step 26149: {'lr': 0.00046786941717008823, 'samples': 5020608, 'steps': 26148, 'loss/train': 1.8527145385742188} -11/07/2021 00:53:45 - INFO - __main__ - Step 26150: {'lr': 0.00046786681450684597, 'samples': 5020800, 'steps': 26149, 'loss/train': 1.8514100313186646} -11/07/2021 00:53:45 - INFO - __main__ - Step 26151: {'lr': 0.00046786421174543625, 'samples': 5020992, 'steps': 26150, 'loss/train': 0.8867548704147339} -11/07/2021 00:53:46 - INFO - __main__ - Step 26152: {'lr': 0.0004678616088858603, 'samples': 5021184, 'steps': 26151, 'loss/train': 1.5728057622909546} -11/07/2021 00:53:46 - INFO - __main__ - Step 26153: {'lr': 0.0004678590059281193, 'samples': 5021376, 'steps': 26152, 'loss/train': 1.5114586353302002} -11/07/2021 00:53:46 - INFO - __main__ - Step 26154: {'lr': 0.0004678564028722143, 'samples': 5021568, 'steps': 26153, 'loss/train': 1.5125452280044556} -11/07/2021 00:53:47 - INFO - __main__ - Step 26155: {'lr': 0.0004678537997181467, 'samples': 5021760, 'steps': 26154, 'loss/train': 1.6505911350250244} -11/07/2021 00:53:48 - INFO - __main__ - Step 26156: {'lr': 0.00046785119646591746, 'samples': 5021952, 'steps': 26155, 'loss/train': 1.7003118991851807} -11/07/2021 00:53:48 - INFO - __main__ - Step 26157: {'lr': 0.0004678485931155278, 'samples': 5022144, 'steps': 26156, 'loss/train': 1.5242116451263428} -11/07/2021 00:53:49 - INFO - __main__ - Step 26158: {'lr': 0.000467845989666979, 'samples': 5022336, 'steps': 26157, 'loss/train': 1.6533890962600708} -11/07/2021 00:53:49 - INFO - __main__ - Step 26159: {'lr': 0.0004678433861202721, 'samples': 5022528, 'steps': 26158, 'loss/train': 1.1330708265304565} -11/07/2021 00:53:50 - INFO - __main__ - Step 26160: {'lr': 0.0004678407824754083, 'samples': 5022720, 'steps': 26159, 'loss/train': 1.8086222410202026} -11/07/2021 00:53:50 - INFO - __main__ - Step 26161: {'lr': 0.00046783817873238885, 'samples': 5022912, 'steps': 26160, 'loss/train': 1.5170518159866333} -11/07/2021 00:53:51 - INFO - __main__ - Step 26162: {'lr': 0.0004678355748912149, 'samples': 5023104, 'steps': 26161, 'loss/train': 1.6570253372192383} -11/07/2021 00:53:51 - INFO - __main__ - Step 26163: {'lr': 0.0004678329709518876, 'samples': 5023296, 'steps': 26162, 'loss/train': 1.50641930103302} -11/07/2021 00:53:51 - INFO - __main__ - Step 26164: {'lr': 0.0004678303669144081, 'samples': 5023488, 'steps': 26163, 'loss/train': 1.6530953645706177} -11/07/2021 00:53:52 - INFO - __main__ - Step 26165: {'lr': 0.0004678277627787776, 'samples': 5023680, 'steps': 26164, 'loss/train': 0.966736912727356} -11/07/2021 00:53:53 - INFO - __main__ - Step 26166: {'lr': 0.0004678251585449973, 'samples': 5023872, 'steps': 26165, 'loss/train': 1.3423575162887573} -11/07/2021 00:53:53 - INFO - __main__ - Step 26167: {'lr': 0.0004678225542130683, 'samples': 5024064, 'steps': 26166, 'loss/train': 1.4492461681365967} -11/07/2021 00:53:53 - INFO - __main__ - Step 26168: {'lr': 0.0004678199497829919, 'samples': 5024256, 'steps': 26167, 'loss/train': 1.3655349016189575} -11/07/2021 00:53:54 - INFO - __main__ - Step 26169: {'lr': 0.0004678173452547691, 'samples': 5024448, 'steps': 26168, 'loss/train': 2.049821615219116} -11/07/2021 00:53:55 - INFO - __main__ - Step 26170: {'lr': 0.00046781474062840126, 'samples': 5024640, 'steps': 26169, 'loss/train': 1.5945308208465576} -11/07/2021 00:53:55 - INFO - __main__ - Step 26171: {'lr': 0.0004678121359038894, 'samples': 5024832, 'steps': 26170, 'loss/train': 2.121659994125366} -11/07/2021 00:53:56 - INFO - __main__ - Step 26172: {'lr': 0.0004678095310812347, 'samples': 5025024, 'steps': 26171, 'loss/train': 1.6644989252090454} -11/07/2021 00:53:56 - INFO - __main__ - Step 26173: {'lr': 0.0004678069261604384, 'samples': 5025216, 'steps': 26172, 'loss/train': 1.843034029006958} -11/07/2021 00:53:56 - INFO - __main__ - Step 26174: {'lr': 0.00046780432114150173, 'samples': 5025408, 'steps': 26173, 'loss/train': 1.1142686605453491} -11/07/2021 00:53:57 - INFO - __main__ - Step 26175: {'lr': 0.0004678017160244258, 'samples': 5025600, 'steps': 26174, 'loss/train': 1.3084547519683838} -11/07/2021 00:53:58 - INFO - __main__ - Step 26176: {'lr': 0.00046779911080921166, 'samples': 5025792, 'steps': 26175, 'loss/train': 1.2665361166000366} -11/07/2021 00:53:58 - INFO - __main__ - Step 26177: {'lr': 0.00046779650549586075, 'samples': 5025984, 'steps': 26176, 'loss/train': 1.6010990142822266} -11/07/2021 00:53:59 - INFO - __main__ - Step 26178: {'lr': 0.000467793900084374, 'samples': 5026176, 'steps': 26177, 'loss/train': 1.8408987522125244} -11/07/2021 00:53:59 - INFO - __main__ - Step 26179: {'lr': 0.0004677912945747527, 'samples': 5026368, 'steps': 26178, 'loss/train': 1.700212001800537} -11/07/2021 00:53:59 - INFO - __main__ - Step 26180: {'lr': 0.000467788688966998, 'samples': 5026560, 'steps': 26179, 'loss/train': 1.9452217817306519} -11/07/2021 00:54:00 - INFO - __main__ - Step 26181: {'lr': 0.00046778608326111104, 'samples': 5026752, 'steps': 26180, 'loss/train': 0.5576347708702087} -11/07/2021 00:54:01 - INFO - __main__ - Step 26182: {'lr': 0.00046778347745709317, 'samples': 5026944, 'steps': 26181, 'loss/train': 1.705079197883606} -11/07/2021 00:54:01 - INFO - __main__ - Step 26183: {'lr': 0.0004677808715549453, 'samples': 5027136, 'steps': 26182, 'loss/train': 1.4773807525634766} -11/07/2021 00:54:02 - INFO - __main__ - Step 26184: {'lr': 0.0004677782655546687, 'samples': 5027328, 'steps': 26183, 'loss/train': 1.2588014602661133} -11/07/2021 00:54:02 - INFO - __main__ - Step 26185: {'lr': 0.00046777565945626463, 'samples': 5027520, 'steps': 26184, 'loss/train': 1.3694013357162476} -11/07/2021 00:54:02 - INFO - __main__ - Step 26186: {'lr': 0.0004677730532597343, 'samples': 5027712, 'steps': 26185, 'loss/train': 0.18336506187915802} -11/07/2021 00:54:03 - INFO - __main__ - Step 26187: {'lr': 0.00046777044696507867, 'samples': 5027904, 'steps': 26186, 'loss/train': 1.2982537746429443} -11/07/2021 00:54:04 - INFO - __main__ - Step 26188: {'lr': 0.00046776784057229906, 'samples': 5028096, 'steps': 26187, 'loss/train': 1.6988948583602905} -11/07/2021 00:54:04 - INFO - __main__ - Step 26189: {'lr': 0.00046776523408139666, 'samples': 5028288, 'steps': 26188, 'loss/train': 1.8552799224853516} -11/07/2021 00:54:04 - INFO - __main__ - Step 26190: {'lr': 0.0004677626274923726, 'samples': 5028480, 'steps': 26189, 'loss/train': 1.4913320541381836} -11/07/2021 00:54:05 - INFO - __main__ - Step 26191: {'lr': 0.000467760020805228, 'samples': 5028672, 'steps': 26190, 'loss/train': 1.6391502618789673} -11/07/2021 00:54:06 - INFO - __main__ - Step 26192: {'lr': 0.0004677574140199642, 'samples': 5028864, 'steps': 26191, 'loss/train': 1.589673638343811} -11/07/2021 00:54:06 - INFO - __main__ - Step 26193: {'lr': 0.00046775480713658215, 'samples': 5029056, 'steps': 26192, 'loss/train': 1.6726784706115723} -11/07/2021 00:54:06 - INFO - __main__ - Step 26194: {'lr': 0.00046775220015508325, 'samples': 5029248, 'steps': 26193, 'loss/train': 1.3490551710128784} -11/07/2021 00:54:07 - INFO - __main__ - Step 26195: {'lr': 0.0004677495930754685, 'samples': 5029440, 'steps': 26194, 'loss/train': 1.2924178838729858} -11/07/2021 00:54:07 - INFO - __main__ - Step 26196: {'lr': 0.0004677469858977391, 'samples': 5029632, 'steps': 26195, 'loss/train': 2.0205130577087402} -11/07/2021 00:54:08 - INFO - __main__ - Step 26197: {'lr': 0.00046774437862189634, 'samples': 5029824, 'steps': 26196, 'loss/train': 1.8864357471466064} -11/07/2021 00:54:09 - INFO - __main__ - Step 26198: {'lr': 0.00046774177124794136, 'samples': 5030016, 'steps': 26197, 'loss/train': 1.3467926979064941} -11/07/2021 00:54:09 - INFO - __main__ - Step 26199: {'lr': 0.00046773916377587524, 'samples': 5030208, 'steps': 26198, 'loss/train': 1.4463247060775757} -11/07/2021 00:54:09 - INFO - __main__ - Step 26200: {'lr': 0.00046773655620569924, 'samples': 5030400, 'steps': 26199, 'loss/train': 1.1757603883743286} -11/07/2021 00:54:10 - INFO - __main__ - Step 26201: {'lr': 0.0004677339485374145, 'samples': 5030592, 'steps': 26200, 'loss/train': 1.4346240758895874} -11/07/2021 00:54:11 - INFO - __main__ - Step 26202: {'lr': 0.00046773134077102217, 'samples': 5030784, 'steps': 26201, 'loss/train': 1.732772707939148} -11/07/2021 00:54:11 - INFO - __main__ - Step 26203: {'lr': 0.00046772873290652344, 'samples': 5030976, 'steps': 26202, 'loss/train': 1.3843315839767456} -11/07/2021 00:54:11 - INFO - __main__ - Step 26204: {'lr': 0.0004677261249439196, 'samples': 5031168, 'steps': 26203, 'loss/train': 1.8565138578414917} -11/07/2021 00:54:12 - INFO - __main__ - Step 26205: {'lr': 0.0004677235168832117, 'samples': 5031360, 'steps': 26204, 'loss/train': 1.6033073663711548} -11/07/2021 00:54:12 - INFO - __main__ - Step 26206: {'lr': 0.0004677209087244009, 'samples': 5031552, 'steps': 26205, 'loss/train': 1.8159793615341187} -11/07/2021 00:54:13 - INFO - __main__ - Step 26207: {'lr': 0.0004677183004674884, 'samples': 5031744, 'steps': 26206, 'loss/train': 1.5248264074325562} -11/07/2021 00:54:13 - INFO - __main__ - Step 26208: {'lr': 0.00046771569211247546, 'samples': 5031936, 'steps': 26207, 'loss/train': 1.6858869791030884} -11/07/2021 00:54:14 - INFO - __main__ - Step 26209: {'lr': 0.00046771308365936315, 'samples': 5032128, 'steps': 26208, 'loss/train': 1.5982725620269775} -11/07/2021 00:54:14 - INFO - __main__ - Step 26210: {'lr': 0.00046771047510815267, 'samples': 5032320, 'steps': 26209, 'loss/train': 1.8095290660858154} -11/07/2021 00:54:14 - INFO - __main__ - Step 26211: {'lr': 0.0004677078664588452, 'samples': 5032512, 'steps': 26210, 'loss/train': 1.5817720890045166} -11/07/2021 00:54:16 - INFO - __main__ - Step 26212: {'lr': 0.000467705257711442, 'samples': 5032704, 'steps': 26211, 'loss/train': 1.801270842552185} -11/07/2021 00:54:16 - INFO - __main__ - Step 26213: {'lr': 0.0004677026488659441, 'samples': 5032896, 'steps': 26212, 'loss/train': 1.433125376701355} -11/07/2021 00:54:16 - INFO - __main__ - Step 26214: {'lr': 0.0004677000399223528, 'samples': 5033088, 'steps': 26213, 'loss/train': 1.7132267951965332} -11/07/2021 00:54:17 - INFO - __main__ - Step 26215: {'lr': 0.0004676974308806692, 'samples': 5033280, 'steps': 26214, 'loss/train': 1.7332468032836914} -11/07/2021 00:54:17 - INFO - __main__ - Step 26216: {'lr': 0.00046769482174089446, 'samples': 5033472, 'steps': 26215, 'loss/train': 1.8117945194244385} -11/07/2021 00:54:17 - INFO - __main__ - Step 26217: {'lr': 0.00046769221250302984, 'samples': 5033664, 'steps': 26216, 'loss/train': 1.13893723487854} -11/07/2021 00:54:18 - INFO - __main__ - Step 26218: {'lr': 0.0004676896031670764, 'samples': 5033856, 'steps': 26217, 'loss/train': 1.3056902885437012} -11/07/2021 00:54:19 - INFO - __main__ - Step 26219: {'lr': 0.00046768699373303546, 'samples': 5034048, 'steps': 26218, 'loss/train': 2.4533538818359375} -11/07/2021 00:54:19 - INFO - __main__ - Step 26220: {'lr': 0.00046768438420090807, 'samples': 5034240, 'steps': 26219, 'loss/train': 1.8676079511642456} -11/07/2021 00:54:19 - INFO - __main__ - Step 26221: {'lr': 0.0004676817745706955, 'samples': 5034432, 'steps': 26220, 'loss/train': 1.638798475265503} -11/07/2021 00:54:20 - INFO - __main__ - Step 26222: {'lr': 0.0004676791648423989, 'samples': 5034624, 'steps': 26221, 'loss/train': 0.4636261761188507} -11/07/2021 00:54:21 - INFO - __main__ - Step 26223: {'lr': 0.00046767655501601935, 'samples': 5034816, 'steps': 26222, 'loss/train': 1.136460542678833} -11/07/2021 00:54:21 - INFO - __main__ - Step 26224: {'lr': 0.0004676739450915581, 'samples': 5035008, 'steps': 26223, 'loss/train': 1.7114912271499634} -11/07/2021 00:54:22 - INFO - __main__ - Step 26225: {'lr': 0.0004676713350690164, 'samples': 5035200, 'steps': 26224, 'loss/train': 1.770675778388977} -11/07/2021 00:54:22 - INFO - __main__ - Step 26226: {'lr': 0.0004676687249483953, 'samples': 5035392, 'steps': 26225, 'loss/train': 1.5932910442352295} -11/07/2021 00:54:22 - INFO - __main__ - Step 26227: {'lr': 0.0004676661147296961, 'samples': 5035584, 'steps': 26226, 'loss/train': 1.6483561992645264} -11/07/2021 00:54:23 - INFO - __main__ - Step 26228: {'lr': 0.00046766350441291985, 'samples': 5035776, 'steps': 26227, 'loss/train': 1.5081048011779785} -11/07/2021 00:54:24 - INFO - __main__ - Step 26229: {'lr': 0.00046766089399806775, 'samples': 5035968, 'steps': 26228, 'loss/train': 1.5878859758377075} -11/07/2021 00:54:24 - INFO - __main__ - Step 26230: {'lr': 0.0004676582834851411, 'samples': 5036160, 'steps': 26229, 'loss/train': 1.6839022636413574} -11/07/2021 00:54:24 - INFO - __main__ - Step 26231: {'lr': 0.0004676556728741409, 'samples': 5036352, 'steps': 26230, 'loss/train': 1.9797955751419067} -11/07/2021 00:54:25 - INFO - __main__ - Step 26232: {'lr': 0.0004676530621650685, 'samples': 5036544, 'steps': 26231, 'loss/train': 1.775161862373352} -11/07/2021 00:54:25 - INFO - __main__ - Step 26233: {'lr': 0.00046765045135792495, 'samples': 5036736, 'steps': 26232, 'loss/train': 1.5758485794067383} -11/07/2021 00:54:26 - INFO - __main__ - Step 26234: {'lr': 0.00046764784045271146, 'samples': 5036928, 'steps': 26233, 'loss/train': 1.1304795742034912} -11/07/2021 00:54:26 - INFO - __main__ - Step 26235: {'lr': 0.0004676452294494292, 'samples': 5037120, 'steps': 26234, 'loss/train': 1.6500743627548218} -11/07/2021 00:54:27 - INFO - __main__ - Step 26236: {'lr': 0.00046764261834807944, 'samples': 5037312, 'steps': 26235, 'loss/train': 1.3043909072875977} -11/07/2021 00:54:27 - INFO - __main__ - Step 26237: {'lr': 0.0004676400071486632, 'samples': 5037504, 'steps': 26236, 'loss/train': 1.1312769651412964} -11/07/2021 00:54:27 - INFO - __main__ - Step 26238: {'lr': 0.0004676373958511817, 'samples': 5037696, 'steps': 26237, 'loss/train': 1.7899938821792603} -11/07/2021 00:54:28 - INFO - __main__ - Step 26239: {'lr': 0.00046763478445563617, 'samples': 5037888, 'steps': 26238, 'loss/train': 1.2193043231964111} -11/07/2021 00:54:29 - INFO - __main__ - Step 26240: {'lr': 0.0004676321729620278, 'samples': 5038080, 'steps': 26239, 'loss/train': 1.5249736309051514} -11/07/2021 00:54:29 - INFO - __main__ - Step 26241: {'lr': 0.0004676295613703577, 'samples': 5038272, 'steps': 26240, 'loss/train': 1.710008978843689} -11/07/2021 00:54:30 - INFO - __main__ - Step 26242: {'lr': 0.00046762694968062706, 'samples': 5038464, 'steps': 26241, 'loss/train': 1.24952232837677} -11/07/2021 00:54:30 - INFO - __main__ - Step 26243: {'lr': 0.0004676243378928371, 'samples': 5038656, 'steps': 26242, 'loss/train': 2.338625431060791} -11/07/2021 00:54:31 - INFO - __main__ - Step 26244: {'lr': 0.000467621726006989, 'samples': 5038848, 'steps': 26243, 'loss/train': 1.184955358505249} -11/07/2021 00:54:31 - INFO - __main__ - Step 26245: {'lr': 0.0004676191140230839, 'samples': 5039040, 'steps': 26244, 'loss/train': 1.1319618225097656} -11/07/2021 00:54:32 - INFO - __main__ - Step 26246: {'lr': 0.0004676165019411229, 'samples': 5039232, 'steps': 26245, 'loss/train': 1.7131967544555664} -11/07/2021 00:54:32 - INFO - __main__ - Step 26247: {'lr': 0.00046761388976110737, 'samples': 5039424, 'steps': 26246, 'loss/train': 1.0271192789077759} -11/07/2021 00:54:32 - INFO - __main__ - Step 26248: {'lr': 0.00046761127748303833, 'samples': 5039616, 'steps': 26247, 'loss/train': 1.5839369297027588} -11/07/2021 00:54:33 - INFO - __main__ - Step 26249: {'lr': 0.000467608665106917, 'samples': 5039808, 'steps': 26248, 'loss/train': 1.4229629039764404} -11/07/2021 00:54:34 - INFO - __main__ - Step 26250: {'lr': 0.0004676060526327446, 'samples': 5040000, 'steps': 26249, 'loss/train': 1.781359314918518} -11/07/2021 00:54:34 - INFO - __main__ - Step 26251: {'lr': 0.00046760344006052223, 'samples': 5040192, 'steps': 26250, 'loss/train': 1.8070279359817505} -11/07/2021 00:54:34 - INFO - __main__ - Step 26252: {'lr': 0.00046760082739025113, 'samples': 5040384, 'steps': 26251, 'loss/train': 1.6231582164764404} -11/07/2021 00:54:35 - INFO - __main__ - Step 26253: {'lr': 0.0004675982146219324, 'samples': 5040576, 'steps': 26252, 'loss/train': 1.6634784936904907} -11/07/2021 00:54:36 - INFO - __main__ - Step 26254: {'lr': 0.00046759560175556737, 'samples': 5040768, 'steps': 26253, 'loss/train': 1.4208816289901733} -11/07/2021 00:54:36 - INFO - __main__ - Step 26255: {'lr': 0.0004675929887911571, 'samples': 5040960, 'steps': 26254, 'loss/train': 1.548449993133545} -11/07/2021 00:54:36 - INFO - __main__ - Step 26256: {'lr': 0.0004675903757287027, 'samples': 5041152, 'steps': 26255, 'loss/train': 1.503303050994873} -11/07/2021 00:54:37 - INFO - __main__ - Step 26257: {'lr': 0.0004675877625682055, 'samples': 5041344, 'steps': 26256, 'loss/train': 1.5762418508529663} -11/07/2021 00:54:37 - INFO - __main__ - Step 26258: {'lr': 0.00046758514930966664, 'samples': 5041536, 'steps': 26257, 'loss/train': 1.1812611818313599} -11/07/2021 00:54:38 - INFO - __main__ - Step 26259: {'lr': 0.0004675825359530872, 'samples': 5041728, 'steps': 26258, 'loss/train': 1.4623467922210693} -11/07/2021 00:54:38 - INFO - __main__ - Step 26260: {'lr': 0.0004675799224984685, 'samples': 5041920, 'steps': 26259, 'loss/train': 0.653400182723999} -11/07/2021 00:54:39 - INFO - __main__ - Step 26261: {'lr': 0.00046757730894581164, 'samples': 5042112, 'steps': 26260, 'loss/train': 1.5049389600753784} -11/07/2021 00:54:39 - INFO - __main__ - Step 26262: {'lr': 0.00046757469529511777, 'samples': 5042304, 'steps': 26261, 'loss/train': 1.2047209739685059} -11/07/2021 00:54:40 - INFO - __main__ - Step 26263: {'lr': 0.0004675720815463881, 'samples': 5042496, 'steps': 26262, 'loss/train': 1.4288592338562012} -11/07/2021 00:54:41 - INFO - __main__ - Step 26264: {'lr': 0.00046756946769962375, 'samples': 5042688, 'steps': 26263, 'loss/train': 1.3080549240112305} -11/07/2021 00:54:41 - INFO - __main__ - Step 26265: {'lr': 0.000467566853754826, 'samples': 5042880, 'steps': 26264, 'loss/train': 1.5261808633804321} -11/07/2021 00:54:41 - INFO - __main__ - Step 26266: {'lr': 0.00046756423971199603, 'samples': 5043072, 'steps': 26265, 'loss/train': 1.3504849672317505} -11/07/2021 00:54:42 - INFO - __main__ - Step 26267: {'lr': 0.0004675616255711349, 'samples': 5043264, 'steps': 26266, 'loss/train': 1.8957056999206543} -11/07/2021 00:54:42 - INFO - __main__ - Step 26268: {'lr': 0.0004675590113322439, 'samples': 5043456, 'steps': 26267, 'loss/train': 2.033751964569092} -11/07/2021 00:54:43 - INFO - __main__ - Step 26269: {'lr': 0.00046755639699532414, 'samples': 5043648, 'steps': 26268, 'loss/train': 1.4890309572219849} -11/07/2021 00:54:43 - INFO - __main__ - Step 26270: {'lr': 0.00046755378256037685, 'samples': 5043840, 'steps': 26269, 'loss/train': 1.3406038284301758} -11/07/2021 00:54:44 - INFO - __main__ - Step 26271: {'lr': 0.00046755116802740316, 'samples': 5044032, 'steps': 26270, 'loss/train': 1.4244365692138672} -11/07/2021 00:54:44 - INFO - __main__ - Step 26272: {'lr': 0.00046754855339640436, 'samples': 5044224, 'steps': 26271, 'loss/train': 1.261167287826538} -11/07/2021 00:54:44 - INFO - __main__ - Step 26273: {'lr': 0.00046754593866738144, 'samples': 5044416, 'steps': 26272, 'loss/train': 1.2437100410461426} -11/07/2021 00:54:45 - INFO - __main__ - Step 26274: {'lr': 0.0004675433238403357, 'samples': 5044608, 'steps': 26273, 'loss/train': 1.7398239374160767} -11/07/2021 00:54:46 - INFO - __main__ - Step 26275: {'lr': 0.0004675407089152683, 'samples': 5044800, 'steps': 26274, 'loss/train': 1.3467254638671875} -11/07/2021 00:54:46 - INFO - __main__ - Step 26276: {'lr': 0.00046753809389218036, 'samples': 5044992, 'steps': 26275, 'loss/train': 1.356188178062439} -11/07/2021 00:54:46 - INFO - __main__ - Step 26277: {'lr': 0.0004675354787710732, 'samples': 5045184, 'steps': 26276, 'loss/train': 1.1773614883422852} -11/07/2021 00:54:47 - INFO - __main__ - Step 26278: {'lr': 0.0004675328635519479, 'samples': 5045376, 'steps': 26277, 'loss/train': 1.1977851390838623} -11/07/2021 00:54:47 - INFO - __main__ - Step 26279: {'lr': 0.0004675302482348056, 'samples': 5045568, 'steps': 26278, 'loss/train': 1.286010980606079} -11/07/2021 00:54:48 - INFO - __main__ - Step 26280: {'lr': 0.00046752763281964757, 'samples': 5045760, 'steps': 26279, 'loss/train': 1.3089194297790527} -11/07/2021 00:54:49 - INFO - __main__ - Step 26281: {'lr': 0.0004675250173064749, 'samples': 5045952, 'steps': 26280, 'loss/train': 1.6992191076278687} -11/07/2021 00:54:49 - INFO - __main__ - Step 26282: {'lr': 0.0004675224016952888, 'samples': 5046144, 'steps': 26281, 'loss/train': 1.4516578912734985} -11/07/2021 00:54:49 - INFO - __main__ - Step 26283: {'lr': 0.00046751978598609056, 'samples': 5046336, 'steps': 26282, 'loss/train': 1.43919837474823} -11/07/2021 00:54:50 - INFO - __main__ - Step 26284: {'lr': 0.00046751717017888116, 'samples': 5046528, 'steps': 26283, 'loss/train': 1.5895462036132812} -11/07/2021 00:54:51 - INFO - __main__ - Step 26285: {'lr': 0.00046751455427366194, 'samples': 5046720, 'steps': 26284, 'loss/train': 0.6971876621246338} -11/07/2021 00:54:51 - INFO - __main__ - Step 26286: {'lr': 0.00046751193827043405, 'samples': 5046912, 'steps': 26285, 'loss/train': 1.4004305601119995} -11/07/2021 00:54:51 - INFO - __main__ - Step 26287: {'lr': 0.0004675093221691985, 'samples': 5047104, 'steps': 26286, 'loss/train': 1.6197659969329834} -11/07/2021 00:54:52 - INFO - __main__ - Step 26288: {'lr': 0.0004675067059699567, 'samples': 5047296, 'steps': 26287, 'loss/train': 1.8886771202087402} -11/07/2021 00:54:52 - INFO - __main__ - Step 26289: {'lr': 0.00046750408967270973, 'samples': 5047488, 'steps': 26288, 'loss/train': 1.566393256187439} -11/07/2021 00:54:53 - INFO - __main__ - Step 26290: {'lr': 0.0004675014732774588, 'samples': 5047680, 'steps': 26289, 'loss/train': 1.660553216934204} -11/07/2021 00:54:54 - INFO - __main__ - Step 26291: {'lr': 0.000467498856784205, 'samples': 5047872, 'steps': 26290, 'loss/train': 1.9005926847457886} -11/07/2021 00:54:54 - INFO - __main__ - Step 26292: {'lr': 0.0004674962401929496, 'samples': 5048064, 'steps': 26291, 'loss/train': 0.9089964628219604} -11/07/2021 00:54:54 - INFO - __main__ - Step 26293: {'lr': 0.0004674936235036938, 'samples': 5048256, 'steps': 26292, 'loss/train': 1.5952370166778564} -11/07/2021 00:54:55 - INFO - __main__ - Step 26294: {'lr': 0.00046749100671643866, 'samples': 5048448, 'steps': 26293, 'loss/train': 1.6620838642120361} -11/07/2021 00:54:56 - INFO - __main__ - Step 26295: {'lr': 0.00046748838983118546, 'samples': 5048640, 'steps': 26294, 'loss/train': 1.4640512466430664} -11/07/2021 00:54:56 - INFO - __main__ - Step 26296: {'lr': 0.00046748577284793535, 'samples': 5048832, 'steps': 26295, 'loss/train': 1.491481065750122} -11/07/2021 00:54:56 - INFO - __main__ - Step 26297: {'lr': 0.00046748315576668946, 'samples': 5049024, 'steps': 26296, 'loss/train': 1.6581768989562988} -11/07/2021 00:54:57 - INFO - __main__ - Step 26298: {'lr': 0.0004674805385874491, 'samples': 5049216, 'steps': 26297, 'loss/train': 1.7091991901397705} -11/07/2021 00:54:57 - INFO - __main__ - Step 26299: {'lr': 0.0004674779213102153, 'samples': 5049408, 'steps': 26298, 'loss/train': 0.7105774283409119} -11/07/2021 00:54:58 - INFO - __main__ - Step 26300: {'lr': 0.00046747530393498934, 'samples': 5049600, 'steps': 26299, 'loss/train': 0.5618196129798889} -11/07/2021 00:54:58 - INFO - __main__ - Step 26301: {'lr': 0.0004674726864617723, 'samples': 5049792, 'steps': 26300, 'loss/train': 1.4105170965194702} -11/07/2021 00:54:59 - INFO - __main__ - Step 26302: {'lr': 0.00046747006889056556, 'samples': 5049984, 'steps': 26301, 'loss/train': 1.1258419752120972} -11/07/2021 00:54:59 - INFO - __main__ - Step 26303: {'lr': 0.00046746745122137, 'samples': 5050176, 'steps': 26302, 'loss/train': 1.513561725616455} -11/07/2021 00:55:00 - INFO - __main__ - Step 26304: {'lr': 0.000467464833454187, 'samples': 5050368, 'steps': 26303, 'loss/train': 1.7200157642364502} -11/07/2021 00:55:01 - INFO - __main__ - Step 26305: {'lr': 0.0004674622155890178, 'samples': 5050560, 'steps': 26304, 'loss/train': 1.6631202697753906} -11/07/2021 00:55:01 - INFO - __main__ - Step 26306: {'lr': 0.00046745959762586344, 'samples': 5050752, 'steps': 26305, 'loss/train': 1.888162612915039} -11/07/2021 00:55:01 - INFO - __main__ - Step 26307: {'lr': 0.0004674569795647251, 'samples': 5050944, 'steps': 26306, 'loss/train': 1.8183954954147339} -11/07/2021 00:55:02 - INFO - __main__ - Step 26308: {'lr': 0.00046745436140560397, 'samples': 5051136, 'steps': 26307, 'loss/train': 1.4250584840774536} -11/07/2021 00:55:02 - INFO - __main__ - Step 26309: {'lr': 0.00046745174314850136, 'samples': 5051328, 'steps': 26308, 'loss/train': 0.5985563397407532} -11/07/2021 00:55:03 - INFO - __main__ - Step 26310: {'lr': 0.00046744912479341826, 'samples': 5051520, 'steps': 26309, 'loss/train': 1.5755923986434937} -11/07/2021 00:55:03 - INFO - __main__ - Step 26311: {'lr': 0.00046744650634035603, 'samples': 5051712, 'steps': 26310, 'loss/train': 1.6963415145874023} -11/07/2021 00:55:04 - INFO - __main__ - Step 26312: {'lr': 0.0004674438877893157, 'samples': 5051904, 'steps': 26311, 'loss/train': 1.540200114250183} -11/07/2021 00:55:04 - INFO - __main__ - Step 26313: {'lr': 0.0004674412691402985, 'samples': 5052096, 'steps': 26312, 'loss/train': 1.536624789237976} -11/07/2021 00:55:04 - INFO - __main__ - Step 26314: {'lr': 0.00046743865039330565, 'samples': 5052288, 'steps': 26313, 'loss/train': 1.3715239763259888} -11/07/2021 00:55:05 - INFO - __main__ - Step 26315: {'lr': 0.00046743603154833827, 'samples': 5052480, 'steps': 26314, 'loss/train': 1.5983755588531494} -11/07/2021 00:55:06 - INFO - __main__ - Step 26316: {'lr': 0.00046743341260539756, 'samples': 5052672, 'steps': 26315, 'loss/train': 1.4672774076461792} -11/07/2021 00:55:06 - INFO - __main__ - Step 26317: {'lr': 0.00046743079356448476, 'samples': 5052864, 'steps': 26316, 'loss/train': 1.2478556632995605} -11/07/2021 00:55:06 - INFO - __main__ - Step 26318: {'lr': 0.000467428174425601, 'samples': 5053056, 'steps': 26317, 'loss/train': 1.39298415184021} -11/07/2021 00:55:07 - INFO - __main__ - Step 26319: {'lr': 0.0004674255551887474, 'samples': 5053248, 'steps': 26318, 'loss/train': 1.4729957580566406} -11/07/2021 00:55:07 - INFO - __main__ - Step 26320: {'lr': 0.0004674229358539253, 'samples': 5053440, 'steps': 26319, 'loss/train': 1.4828534126281738} -11/07/2021 00:55:09 - INFO - __main__ - Step 26321: {'lr': 0.0004674203164211357, 'samples': 5053632, 'steps': 26320, 'loss/train': 1.4319690465927124} -11/07/2021 00:55:09 - INFO - __main__ - Step 26322: {'lr': 0.00046741769689037985, 'samples': 5053824, 'steps': 26321, 'loss/train': 1.4296718835830688} -11/07/2021 00:55:09 - INFO - __main__ - Step 26323: {'lr': 0.0004674150772616589, 'samples': 5054016, 'steps': 26322, 'loss/train': 1.5283063650131226} -11/07/2021 00:55:10 - INFO - __main__ - Step 26324: {'lr': 0.0004674124575349742, 'samples': 5054208, 'steps': 26323, 'loss/train': 1.8238298892974854} -11/07/2021 00:55:10 - INFO - __main__ - Step 26325: {'lr': 0.00046740983771032674, 'samples': 5054400, 'steps': 26324, 'loss/train': 1.7715691328048706} -11/07/2021 00:55:11 - INFO - __main__ - Step 26326: {'lr': 0.0004674072177877178, 'samples': 5054592, 'steps': 26325, 'loss/train': 1.4993889331817627} -11/07/2021 00:55:12 - INFO - __main__ - Step 26327: {'lr': 0.0004674045977671484, 'samples': 5054784, 'steps': 26326, 'loss/train': 1.3500524759292603} -11/07/2021 00:55:12 - INFO - __main__ - Step 26328: {'lr': 0.00046740197764862, 'samples': 5054976, 'steps': 26327, 'loss/train': 1.5933117866516113} -11/07/2021 00:55:12 - INFO - __main__ - Step 26329: {'lr': 0.00046739935743213344, 'samples': 5055168, 'steps': 26328, 'loss/train': 1.496039628982544} -11/07/2021 00:55:13 - INFO - __main__ - Step 26330: {'lr': 0.00046739673711769026, 'samples': 5055360, 'steps': 26329, 'loss/train': 2.607337474822998} -11/07/2021 00:55:13 - INFO - __main__ - Step 26331: {'lr': 0.0004673941167052914, 'samples': 5055552, 'steps': 26330, 'loss/train': 1.002419114112854} -11/07/2021 00:55:13 - INFO - __main__ - Step 26332: {'lr': 0.0004673914961949381, 'samples': 5055744, 'steps': 26331, 'loss/train': 1.1333625316619873} -11/07/2021 00:55:14 - INFO - __main__ - Step 26333: {'lr': 0.0004673888755866316, 'samples': 5055936, 'steps': 26332, 'loss/train': 1.761634111404419} -11/07/2021 00:55:15 - INFO - __main__ - Step 26334: {'lr': 0.0004673862548803729, 'samples': 5056128, 'steps': 26333, 'loss/train': 1.6359180212020874} -11/07/2021 00:55:15 - INFO - __main__ - Step 26335: {'lr': 0.0004673836340761634, 'samples': 5056320, 'steps': 26334, 'loss/train': 1.7028871774673462} -11/07/2021 00:55:15 - INFO - __main__ - Step 26336: {'lr': 0.00046738101317400415, 'samples': 5056512, 'steps': 26335, 'loss/train': 1.6568629741668701} -11/07/2021 00:55:16 - INFO - __main__ - Step 26337: {'lr': 0.00046737839217389645, 'samples': 5056704, 'steps': 26336, 'loss/train': 1.5187630653381348} -11/07/2021 00:55:17 - INFO - __main__ - Step 26338: {'lr': 0.0004673757710758413, 'samples': 5056896, 'steps': 26337, 'loss/train': 1.3679804801940918} -11/07/2021 00:55:17 - INFO - __main__ - Step 26339: {'lr': 0.00046737314987984, 'samples': 5057088, 'steps': 26338, 'loss/train': 1.8160271644592285} -11/07/2021 00:55:17 - INFO - __main__ - Step 26340: {'lr': 0.0004673705285858938, 'samples': 5057280, 'steps': 26339, 'loss/train': 1.5020647048950195} -11/07/2021 00:55:18 - INFO - __main__ - Step 26341: {'lr': 0.00046736790719400373, 'samples': 5057472, 'steps': 26340, 'loss/train': 1.307187557220459} -11/07/2021 00:55:18 - INFO - __main__ - Step 26342: {'lr': 0.000467365285704171, 'samples': 5057664, 'steps': 26341, 'loss/train': 1.7790440320968628} -11/07/2021 00:55:19 - INFO - __main__ - Step 26343: {'lr': 0.00046736266411639694, 'samples': 5057856, 'steps': 26342, 'loss/train': 1.3135005235671997} -11/07/2021 00:55:20 - INFO - __main__ - Step 26344: {'lr': 0.00046736004243068255, 'samples': 5058048, 'steps': 26343, 'loss/train': 0.7145043611526489} -11/07/2021 00:55:20 - INFO - __main__ - Step 26345: {'lr': 0.00046735742064702904, 'samples': 5058240, 'steps': 26344, 'loss/train': 1.4895724058151245} -11/07/2021 00:55:20 - INFO - __main__ - Step 26346: {'lr': 0.00046735479876543765, 'samples': 5058432, 'steps': 26345, 'loss/train': 1.4524718523025513} -11/07/2021 00:55:21 - INFO - __main__ - Step 26347: {'lr': 0.00046735217678590957, 'samples': 5058624, 'steps': 26346, 'loss/train': 0.29512056708335876} -11/07/2021 00:55:22 - INFO - __main__ - Step 26348: {'lr': 0.00046734955470844594, 'samples': 5058816, 'steps': 26347, 'loss/train': 1.5119823217391968} -11/07/2021 00:55:22 - INFO - __main__ - Step 26349: {'lr': 0.00046734693253304795, 'samples': 5059008, 'steps': 26348, 'loss/train': 1.7592660188674927} -11/07/2021 00:55:23 - INFO - __main__ - Step 26350: {'lr': 0.0004673443102597168, 'samples': 5059200, 'steps': 26349, 'loss/train': 1.5248686075210571} -11/07/2021 00:55:23 - INFO - __main__ - Step 26351: {'lr': 0.00046734168788845363, 'samples': 5059392, 'steps': 26350, 'loss/train': 1.859383463859558} -11/07/2021 00:55:23 - INFO - __main__ - Step 26352: {'lr': 0.00046733906541925963, 'samples': 5059584, 'steps': 26351, 'loss/train': 1.4118645191192627} -11/07/2021 00:55:24 - INFO - __main__ - Step 26353: {'lr': 0.00046733644285213604, 'samples': 5059776, 'steps': 26352, 'loss/train': 1.3316917419433594} -11/07/2021 00:55:25 - INFO - __main__ - Step 26354: {'lr': 0.00046733382018708405, 'samples': 5059968, 'steps': 26353, 'loss/train': 1.6919605731964111} -11/07/2021 00:55:25 - INFO - __main__ - Step 26355: {'lr': 0.00046733119742410476, 'samples': 5060160, 'steps': 26354, 'loss/train': 1.5889085531234741} -11/07/2021 00:55:25 - INFO - __main__ - Step 26356: {'lr': 0.0004673285745631993, 'samples': 5060352, 'steps': 26355, 'loss/train': 1.95510995388031} -11/07/2021 00:55:26 - INFO - __main__ - Step 26357: {'lr': 0.000467325951604369, 'samples': 5060544, 'steps': 26356, 'loss/train': 2.011507034301758} -11/07/2021 00:55:26 - INFO - __main__ - Step 26358: {'lr': 0.00046732332854761507, 'samples': 5060736, 'steps': 26357, 'loss/train': 1.6759419441223145} -11/07/2021 00:55:27 - INFO - __main__ - Step 26359: {'lr': 0.00046732070539293847, 'samples': 5060928, 'steps': 26358, 'loss/train': 1.350864052772522} -11/07/2021 00:55:28 - INFO - __main__ - Step 26360: {'lr': 0.0004673180821403405, 'samples': 5061120, 'steps': 26359, 'loss/train': 1.483938455581665} -11/07/2021 00:55:28 - INFO - __main__ - Step 26361: {'lr': 0.00046731545878982253, 'samples': 5061312, 'steps': 26360, 'loss/train': 2.304304361343384} -11/07/2021 00:55:28 - INFO - __main__ - Step 26362: {'lr': 0.0004673128353413854, 'samples': 5061504, 'steps': 26361, 'loss/train': 1.9996891021728516} -11/07/2021 00:55:29 - INFO - __main__ - Step 26363: {'lr': 0.00046731021179503054, 'samples': 5061696, 'steps': 26362, 'loss/train': 1.1960369348526} -11/07/2021 00:55:30 - INFO - __main__ - Step 26364: {'lr': 0.00046730758815075903, 'samples': 5061888, 'steps': 26363, 'loss/train': 1.8923099040985107} -11/07/2021 00:55:30 - INFO - __main__ - Step 26365: {'lr': 0.0004673049644085721, 'samples': 5062080, 'steps': 26364, 'loss/train': 1.914736032485962} -11/07/2021 00:55:31 - INFO - __main__ - Step 26366: {'lr': 0.00046730234056847084, 'samples': 5062272, 'steps': 26365, 'loss/train': 1.7014739513397217} -11/07/2021 00:55:31 - INFO - __main__ - Step 26367: {'lr': 0.00046729971663045654, 'samples': 5062464, 'steps': 26366, 'loss/train': 1.6129825115203857} -11/07/2021 00:55:31 - INFO - __main__ - Step 26368: {'lr': 0.00046729709259453033, 'samples': 5062656, 'steps': 26367, 'loss/train': 0.9432440996170044} -11/07/2021 00:55:32 - INFO - __main__ - Step 26369: {'lr': 0.0004672944684606934, 'samples': 5062848, 'steps': 26368, 'loss/train': 1.4223899841308594} -11/07/2021 00:55:33 - INFO - __main__ - Step 26370: {'lr': 0.000467291844228947, 'samples': 5063040, 'steps': 26369, 'loss/train': 1.867058277130127} -11/07/2021 00:55:33 - INFO - __main__ - Step 26371: {'lr': 0.00046728921989929215, 'samples': 5063232, 'steps': 26370, 'loss/train': 1.4381300210952759} -11/07/2021 00:55:33 - INFO - __main__ - Step 26372: {'lr': 0.0004672865954717301, 'samples': 5063424, 'steps': 26371, 'loss/train': 1.4920525550842285} -11/07/2021 00:55:34 - INFO - __main__ - Step 26373: {'lr': 0.00046728397094626217, 'samples': 5063616, 'steps': 26372, 'loss/train': 1.6166425943374634} -11/07/2021 00:55:34 - INFO - __main__ - Step 26374: {'lr': 0.0004672813463228894, 'samples': 5063808, 'steps': 26373, 'loss/train': 1.3579533100128174} -11/07/2021 00:55:35 - INFO - __main__ - Step 26375: {'lr': 0.00046727872160161305, 'samples': 5064000, 'steps': 26374, 'loss/train': 1.3808456659317017} -11/07/2021 00:55:35 - INFO - __main__ - Step 26376: {'lr': 0.0004672760967824342, 'samples': 5064192, 'steps': 26375, 'loss/train': 1.6732211112976074} -11/07/2021 00:55:36 - INFO - __main__ - Step 26377: {'lr': 0.0004672734718653541, 'samples': 5064384, 'steps': 26376, 'loss/train': 2.095519781112671} -11/07/2021 00:55:36 - INFO - __main__ - Step 26378: {'lr': 0.00046727084685037394, 'samples': 5064576, 'steps': 26377, 'loss/train': 1.7713539600372314} -11/07/2021 00:55:37 - INFO - __main__ - Step 26379: {'lr': 0.00046726822173749497, 'samples': 5064768, 'steps': 26378, 'loss/train': 1.264957070350647} -11/07/2021 00:55:38 - INFO - __main__ - Step 26380: {'lr': 0.0004672655965267182, 'samples': 5064960, 'steps': 26379, 'loss/train': 1.3401517868041992} -11/07/2021 00:55:38 - INFO - __main__ - Step 26381: {'lr': 0.0004672629712180448, 'samples': 5065152, 'steps': 26380, 'loss/train': 5.758746147155762} -11/07/2021 00:55:38 - INFO - __main__ - Step 26382: {'lr': 0.00046726034581147624, 'samples': 5065344, 'steps': 26381, 'loss/train': 1.748800277709961} -11/07/2021 00:55:39 - INFO - __main__ - Step 26383: {'lr': 0.0004672577203070135, 'samples': 5065536, 'steps': 26382, 'loss/train': 1.6716623306274414} -11/07/2021 00:55:39 - INFO - __main__ - Step 26384: {'lr': 0.0004672550947046577, 'samples': 5065728, 'steps': 26383, 'loss/train': 1.507440209388733} -11/07/2021 00:55:39 - INFO - __main__ - Step 26385: {'lr': 0.0004672524690044102, 'samples': 5065920, 'steps': 26384, 'loss/train': 1.4670366048812866} -11/07/2021 00:55:40 - INFO - __main__ - Step 26386: {'lr': 0.000467249843206272, 'samples': 5066112, 'steps': 26385, 'loss/train': 1.9021941423416138} -11/07/2021 00:55:41 - INFO - __main__ - Step 26387: {'lr': 0.00046724721731024446, 'samples': 5066304, 'steps': 26386, 'loss/train': 2.118704080581665} -11/07/2021 00:55:41 - INFO - __main__ - Step 26388: {'lr': 0.00046724459131632854, 'samples': 5066496, 'steps': 26387, 'loss/train': 1.3493355512619019} -11/07/2021 00:55:42 - INFO - __main__ - Step 26389: {'lr': 0.00046724196522452565, 'samples': 5066688, 'steps': 26388, 'loss/train': 0.40509405732154846} -11/07/2021 00:55:42 - INFO - __main__ - Step 26390: {'lr': 0.00046723933903483687, 'samples': 5066880, 'steps': 26389, 'loss/train': 1.8364577293395996} -11/07/2021 00:55:43 - INFO - __main__ - Step 26391: {'lr': 0.00046723671274726344, 'samples': 5067072, 'steps': 26390, 'loss/train': 1.6346997022628784} -11/07/2021 00:55:43 - INFO - __main__ - Step 26392: {'lr': 0.00046723408636180645, 'samples': 5067264, 'steps': 26391, 'loss/train': 1.1927516460418701} -11/07/2021 00:55:43 - INFO - __main__ - Step 26393: {'lr': 0.00046723145987846715, 'samples': 5067456, 'steps': 26392, 'loss/train': 1.2922899723052979} -11/07/2021 00:55:44 - INFO - __main__ - Step 26394: {'lr': 0.00046722883329724667, 'samples': 5067648, 'steps': 26393, 'loss/train': 1.5836986303329468} -11/07/2021 00:55:44 - INFO - __main__ - Step 26395: {'lr': 0.0004672262066181463, 'samples': 5067840, 'steps': 26394, 'loss/train': 1.281071662902832} -11/07/2021 00:55:45 - INFO - __main__ - Step 26396: {'lr': 0.00046722357984116717, 'samples': 5068032, 'steps': 26395, 'loss/train': 1.5925194025039673} -11/07/2021 00:55:46 - INFO - __main__ - Step 26397: {'lr': 0.0004672209529663103, 'samples': 5068224, 'steps': 26396, 'loss/train': 1.9649863243103027} -11/07/2021 00:55:46 - INFO - __main__ - Step 26398: {'lr': 0.00046721832599357717, 'samples': 5068416, 'steps': 26397, 'loss/train': 1.9178727865219116} -11/07/2021 00:55:46 - INFO - __main__ - Step 26399: {'lr': 0.00046721569892296875, 'samples': 5068608, 'steps': 26398, 'loss/train': 1.6494786739349365} -11/07/2021 00:55:47 - INFO - __main__ - Step 26400: {'lr': 0.00046721307175448626, 'samples': 5068800, 'steps': 26399, 'loss/train': 1.4572476148605347} -11/07/2021 00:55:47 - INFO - __main__ - Step 26401: {'lr': 0.000467210444488131, 'samples': 5068992, 'steps': 26400, 'loss/train': 1.1953966617584229} -11/07/2021 00:55:48 - INFO - __main__ - Step 26402: {'lr': 0.000467207817123904, 'samples': 5069184, 'steps': 26401, 'loss/train': 1.564107894897461} -11/07/2021 00:55:49 - INFO - __main__ - Step 26403: {'lr': 0.0004672051896618065, 'samples': 5069376, 'steps': 26402, 'loss/train': 1.5417752265930176} -11/07/2021 00:55:49 - INFO - __main__ - Step 26404: {'lr': 0.0004672025621018397, 'samples': 5069568, 'steps': 26403, 'loss/train': 1.4741133451461792} -11/07/2021 00:55:49 - INFO - __main__ - Step 26405: {'lr': 0.00046719993444400477, 'samples': 5069760, 'steps': 26404, 'loss/train': 1.48698890209198} -11/07/2021 00:55:50 - INFO - __main__ - Step 26406: {'lr': 0.00046719730668830293, 'samples': 5069952, 'steps': 26405, 'loss/train': 1.4376373291015625} -11/07/2021 00:55:51 - INFO - __main__ - Step 26407: {'lr': 0.0004671946788347353, 'samples': 5070144, 'steps': 26406, 'loss/train': 1.4625463485717773} -11/07/2021 00:55:51 - INFO - __main__ - Step 26408: {'lr': 0.00046719205088330317, 'samples': 5070336, 'steps': 26407, 'loss/train': 1.9800376892089844} -11/07/2021 00:55:51 - INFO - __main__ - Step 26409: {'lr': 0.0004671894228340076, 'samples': 5070528, 'steps': 26408, 'loss/train': 1.3407139778137207} -11/07/2021 00:55:52 - INFO - __main__ - Step 26410: {'lr': 0.0004671867946868499, 'samples': 5070720, 'steps': 26409, 'loss/train': 1.9088515043258667} -11/07/2021 00:55:52 - INFO - __main__ - Step 26411: {'lr': 0.000467184166441831, 'samples': 5070912, 'steps': 26410, 'loss/train': 2.3126955032348633} -11/07/2021 00:55:53 - INFO - __main__ - Step 26412: {'lr': 0.0004671815380989525, 'samples': 5071104, 'steps': 26411, 'loss/train': 1.4580514430999756} -11/07/2021 00:55:53 - INFO - __main__ - Step 26413: {'lr': 0.0004671789096582152, 'samples': 5071296, 'steps': 26412, 'loss/train': 1.5600773096084595} -11/07/2021 00:55:54 - INFO - __main__ - Step 26414: {'lr': 0.00046717628111962045, 'samples': 5071488, 'steps': 26413, 'loss/train': 1.7384356260299683} -11/07/2021 00:55:54 - INFO - __main__ - Step 26415: {'lr': 0.00046717365248316947, 'samples': 5071680, 'steps': 26414, 'loss/train': 1.0957757234573364} -11/07/2021 00:55:54 - INFO - __main__ - Step 26416: {'lr': 0.00046717102374886334, 'samples': 5071872, 'steps': 26415, 'loss/train': 0.904839813709259} -11/07/2021 00:55:55 - INFO - __main__ - Step 26417: {'lr': 0.0004671683949167033, 'samples': 5072064, 'steps': 26416, 'loss/train': 1.6241687536239624} -11/07/2021 00:55:56 - INFO - __main__ - Step 26418: {'lr': 0.0004671657659866906, 'samples': 5072256, 'steps': 26417, 'loss/train': 1.8980976343154907} -11/07/2021 00:55:56 - INFO - __main__ - Step 26419: {'lr': 0.00046716313695882626, 'samples': 5072448, 'steps': 26418, 'loss/train': 1.2110810279846191} -11/07/2021 00:55:56 - INFO - __main__ - Step 26420: {'lr': 0.00046716050783311166, 'samples': 5072640, 'steps': 26419, 'loss/train': 1.319366693496704} -11/07/2021 00:55:57 - INFO - __main__ - Step 26421: {'lr': 0.00046715787860954785, 'samples': 5072832, 'steps': 26420, 'loss/train': 1.9053850173950195} -11/07/2021 00:55:58 - INFO - __main__ - Step 26422: {'lr': 0.000467155249288136, 'samples': 5073024, 'steps': 26421, 'loss/train': 1.293556809425354} -11/07/2021 00:55:58 - INFO - __main__ - Step 26423: {'lr': 0.00046715261986887734, 'samples': 5073216, 'steps': 26422, 'loss/train': 1.701919674873352} -11/07/2021 00:55:58 - INFO - __main__ - Step 26424: {'lr': 0.0004671499903517732, 'samples': 5073408, 'steps': 26423, 'loss/train': 1.5245121717453003} -11/07/2021 00:55:59 - INFO - __main__ - Step 26425: {'lr': 0.00046714736073682453, 'samples': 5073600, 'steps': 26424, 'loss/train': 1.1771432161331177} -11/07/2021 00:55:59 - INFO - __main__ - Step 26426: {'lr': 0.00046714473102403255, 'samples': 5073792, 'steps': 26425, 'loss/train': 1.4140645265579224} -11/07/2021 00:56:00 - INFO - __main__ - Step 26427: {'lr': 0.0004671421012133986, 'samples': 5073984, 'steps': 26426, 'loss/train': 1.5135844945907593} -11/07/2021 00:56:01 - INFO - __main__ - Step 26428: {'lr': 0.00046713947130492373, 'samples': 5074176, 'steps': 26427, 'loss/train': 1.628362774848938} -11/07/2021 00:56:01 - INFO - __main__ - Step 26429: {'lr': 0.0004671368412986091, 'samples': 5074368, 'steps': 26428, 'loss/train': 1.2044190168380737} -11/07/2021 00:56:01 - INFO - __main__ - Step 26430: {'lr': 0.0004671342111944561, 'samples': 5074560, 'steps': 26429, 'loss/train': 1.845758318901062} -11/07/2021 00:56:02 - INFO - __main__ - Step 26431: {'lr': 0.00046713158099246564, 'samples': 5074752, 'steps': 26430, 'loss/train': 1.8170115947723389} -11/07/2021 00:56:02 - INFO - __main__ - Step 26432: {'lr': 0.00046712895069263917, 'samples': 5074944, 'steps': 26431, 'loss/train': 1.7663159370422363} -11/07/2021 00:56:03 - INFO - __main__ - Step 26433: {'lr': 0.00046712632029497766, 'samples': 5075136, 'steps': 26432, 'loss/train': 1.277019739151001} -11/07/2021 00:56:03 - INFO - __main__ - Step 26434: {'lr': 0.0004671236897994824, 'samples': 5075328, 'steps': 26433, 'loss/train': 1.7203088998794556} -11/07/2021 00:56:04 - INFO - __main__ - Step 26435: {'lr': 0.00046712105920615455, 'samples': 5075520, 'steps': 26434, 'loss/train': 1.7292240858078003} -11/07/2021 00:56:04 - INFO - __main__ - Step 26436: {'lr': 0.00046711842851499533, 'samples': 5075712, 'steps': 26435, 'loss/train': 1.3361963033676147} -11/07/2021 00:56:04 - INFO - __main__ - Step 26437: {'lr': 0.0004671157977260059, 'samples': 5075904, 'steps': 26436, 'loss/train': 1.5535763502120972} -11/07/2021 00:56:06 - INFO - __main__ - Step 26438: {'lr': 0.0004671131668391874, 'samples': 5076096, 'steps': 26437, 'loss/train': 1.8279119729995728} -11/07/2021 00:56:06 - INFO - __main__ - Step 26439: {'lr': 0.00046711053585454104, 'samples': 5076288, 'steps': 26438, 'loss/train': 1.0926793813705444} -11/07/2021 00:56:06 - INFO - __main__ - Step 26440: {'lr': 0.0004671079047720681, 'samples': 5076480, 'steps': 26439, 'loss/train': 4.682829856872559} -11/07/2021 00:56:07 - INFO - __main__ - Step 26441: {'lr': 0.00046710527359176957, 'samples': 5076672, 'steps': 26440, 'loss/train': 1.4131914377212524} -11/07/2021 00:56:07 - INFO - __main__ - Step 26442: {'lr': 0.0004671026423136469, 'samples': 5076864, 'steps': 26441, 'loss/train': 1.6354575157165527} -11/07/2021 00:56:08 - INFO - __main__ - Step 26443: {'lr': 0.00046710001093770107, 'samples': 5077056, 'steps': 26442, 'loss/train': 1.4998884201049805} -11/07/2021 00:56:08 - INFO - __main__ - Step 26444: {'lr': 0.0004670973794639333, 'samples': 5077248, 'steps': 26443, 'loss/train': 1.4020780324935913} -11/07/2021 00:56:09 - INFO - __main__ - Step 26445: {'lr': 0.0004670947478923447, 'samples': 5077440, 'steps': 26444, 'loss/train': 1.4827768802642822} -11/07/2021 00:56:09 - INFO - __main__ - Step 26446: {'lr': 0.00046709211622293677, 'samples': 5077632, 'steps': 26445, 'loss/train': 1.532038927078247} -11/07/2021 00:56:10 - INFO - __main__ - Step 26447: {'lr': 0.00046708948445571037, 'samples': 5077824, 'steps': 26446, 'loss/train': 1.4269554615020752} -11/07/2021 00:56:10 - INFO - __main__ - Step 26448: {'lr': 0.0004670868525906668, 'samples': 5078016, 'steps': 26447, 'loss/train': 2.0321922302246094} -11/07/2021 00:56:11 - INFO - __main__ - Step 26449: {'lr': 0.00046708422062780725, 'samples': 5078208, 'steps': 26448, 'loss/train': 1.5487173795700073} -11/07/2021 00:56:11 - INFO - __main__ - Step 26450: {'lr': 0.0004670815885671329, 'samples': 5078400, 'steps': 26449, 'loss/train': 1.6052219867706299} -11/07/2021 00:56:12 - INFO - __main__ - Step 26451: {'lr': 0.00046707895640864494, 'samples': 5078592, 'steps': 26450, 'loss/train': 1.3936687707901} -11/07/2021 00:56:12 - INFO - __main__ - Step 26452: {'lr': 0.0004670763241523446, 'samples': 5078784, 'steps': 26451, 'loss/train': 1.4854100942611694} -11/07/2021 00:56:13 - INFO - __main__ - Step 26453: {'lr': 0.00046707369179823294, 'samples': 5078976, 'steps': 26452, 'loss/train': 1.4796305894851685} -11/07/2021 00:56:13 - INFO - __main__ - Step 26454: {'lr': 0.00046707105934631123, 'samples': 5079168, 'steps': 26453, 'loss/train': 1.150570034980774} -11/07/2021 00:56:14 - INFO - __main__ - Step 26455: {'lr': 0.00046706842679658067, 'samples': 5079360, 'steps': 26454, 'loss/train': 1.8077322244644165} -11/07/2021 00:56:14 - INFO - __main__ - Step 26456: {'lr': 0.0004670657941490425, 'samples': 5079552, 'steps': 26455, 'loss/train': 1.230172038078308} -11/07/2021 00:56:14 - INFO - __main__ - Step 26457: {'lr': 0.00046706316140369774, 'samples': 5079744, 'steps': 26456, 'loss/train': 1.8720364570617676} -11/07/2021 00:56:15 - INFO - __main__ - Step 26458: {'lr': 0.0004670605285605477, 'samples': 5079936, 'steps': 26457, 'loss/train': 1.4917019605636597} -11/07/2021 00:56:16 - INFO - __main__ - Step 26459: {'lr': 0.0004670578956195935, 'samples': 5080128, 'steps': 26458, 'loss/train': 1.4443360567092896} -11/07/2021 00:56:16 - INFO - __main__ - Step 26460: {'lr': 0.00046705526258083643, 'samples': 5080320, 'steps': 26459, 'loss/train': 1.5752904415130615} -11/07/2021 00:56:16 - INFO - __main__ - Step 26461: {'lr': 0.0004670526294442775, 'samples': 5080512, 'steps': 26460, 'loss/train': 1.234046459197998} -11/07/2021 00:56:17 - INFO - __main__ - Step 26462: {'lr': 0.0004670499962099181, 'samples': 5080704, 'steps': 26461, 'loss/train': 1.3155179023742676} -11/07/2021 00:56:17 - INFO - __main__ - Step 26463: {'lr': 0.0004670473628777593, 'samples': 5080896, 'steps': 26462, 'loss/train': 1.976694107055664} -11/07/2021 00:56:18 - INFO - __main__ - Step 26464: {'lr': 0.0004670447294478023, 'samples': 5081088, 'steps': 26463, 'loss/train': 1.5602601766586304} -11/07/2021 00:56:18 - INFO - __main__ - Step 26465: {'lr': 0.0004670420959200483, 'samples': 5081280, 'steps': 26464, 'loss/train': 1.194366693496704} -11/07/2021 00:56:19 - INFO - __main__ - Step 26466: {'lr': 0.00046703946229449846, 'samples': 5081472, 'steps': 26465, 'loss/train': 1.8380380868911743} -11/07/2021 00:56:19 - INFO - __main__ - Step 26467: {'lr': 0.00046703682857115406, 'samples': 5081664, 'steps': 26466, 'loss/train': 1.755829095840454} -11/07/2021 00:56:19 - INFO - __main__ - Step 26468: {'lr': 0.0004670341947500161, 'samples': 5081856, 'steps': 26467, 'loss/train': 0.9049766063690186} -11/07/2021 00:56:21 - INFO - __main__ - Step 26469: {'lr': 0.00046703156083108597, 'samples': 5082048, 'steps': 26468, 'loss/train': 1.4993257522583008} -11/07/2021 00:56:21 - INFO - __main__ - Step 26470: {'lr': 0.0004670289268143647, 'samples': 5082240, 'steps': 26469, 'loss/train': 1.6964185237884521} -11/07/2021 00:56:21 - INFO - __main__ - Step 26471: {'lr': 0.0004670262926998536, 'samples': 5082432, 'steps': 26470, 'loss/train': 1.3337154388427734} -11/07/2021 00:56:22 - INFO - __main__ - Step 26472: {'lr': 0.00046702365848755377, 'samples': 5082624, 'steps': 26471, 'loss/train': 1.2978936433792114} -11/07/2021 00:56:22 - INFO - __main__ - Step 26473: {'lr': 0.0004670210241774664, 'samples': 5082816, 'steps': 26472, 'loss/train': 1.5517992973327637} -11/07/2021 00:56:23 - INFO - __main__ - Step 26474: {'lr': 0.0004670183897695928, 'samples': 5083008, 'steps': 26473, 'loss/train': 1.5308436155319214} -11/07/2021 00:56:23 - INFO - __main__ - Step 26475: {'lr': 0.00046701575526393395, 'samples': 5083200, 'steps': 26474, 'loss/train': 1.3590461015701294} -11/07/2021 00:56:24 - INFO - __main__ - Step 26476: {'lr': 0.00046701312066049126, 'samples': 5083392, 'steps': 26475, 'loss/train': 1.4693495035171509} -11/07/2021 00:56:24 - INFO - __main__ - Step 26477: {'lr': 0.00046701048595926574, 'samples': 5083584, 'steps': 26476, 'loss/train': 1.6932660341262817} -11/07/2021 00:56:24 - INFO - __main__ - Step 26478: {'lr': 0.00046700785116025867, 'samples': 5083776, 'steps': 26477, 'loss/train': 1.4177215099334717} -11/07/2021 00:56:25 - INFO - __main__ - Step 26479: {'lr': 0.0004670052162634712, 'samples': 5083968, 'steps': 26478, 'loss/train': 2.0390894412994385} -11/07/2021 00:56:26 - INFO - __main__ - Step 26480: {'lr': 0.0004670025812689045, 'samples': 5084160, 'steps': 26479, 'loss/train': 1.4703865051269531} -11/07/2021 00:56:27 - INFO - __main__ - Step 26481: {'lr': 0.00046699994617655985, 'samples': 5084352, 'steps': 26480, 'loss/train': 1.6275564432144165} -11/07/2021 00:56:27 - INFO - __main__ - Step 26482: {'lr': 0.0004669973109864383, 'samples': 5084544, 'steps': 26481, 'loss/train': 0.5352272987365723} -11/07/2021 00:56:27 - INFO - __main__ - Step 26483: {'lr': 0.00046699467569854115, 'samples': 5084736, 'steps': 26482, 'loss/train': 1.8470903635025024} -11/07/2021 00:56:28 - INFO - __main__ - Step 26484: {'lr': 0.0004669920403128696, 'samples': 5084928, 'steps': 26483, 'loss/train': 1.5987228155136108} -11/07/2021 00:56:29 - INFO - __main__ - Step 26485: {'lr': 0.00046698940482942466, 'samples': 5085120, 'steps': 26484, 'loss/train': 1.9088078737258911} -11/07/2021 00:56:29 - INFO - __main__ - Step 26486: {'lr': 0.0004669867692482077, 'samples': 5085312, 'steps': 26485, 'loss/train': 1.6015602350234985} -11/07/2021 00:56:30 - INFO - __main__ - Step 26487: {'lr': 0.00046698413356921985, 'samples': 5085504, 'steps': 26486, 'loss/train': 1.708426594734192} -11/07/2021 00:56:30 - INFO - __main__ - Step 26488: {'lr': 0.00046698149779246235, 'samples': 5085696, 'steps': 26487, 'loss/train': 1.7259870767593384} -11/07/2021 00:56:30 - INFO - __main__ - Step 26489: {'lr': 0.0004669788619179363, 'samples': 5085888, 'steps': 26488, 'loss/train': 1.945603609085083} -11/07/2021 00:56:32 - INFO - __main__ - Step 26490: {'lr': 0.0004669762259456429, 'samples': 5086080, 'steps': 26489, 'loss/train': 0.9242888689041138} -11/07/2021 00:56:32 - INFO - __main__ - Step 26491: {'lr': 0.00046697358987558336, 'samples': 5086272, 'steps': 26490, 'loss/train': 2.0681726932525635} -11/07/2021 00:56:32 - INFO - __main__ - Step 26492: {'lr': 0.0004669709537077589, 'samples': 5086464, 'steps': 26491, 'loss/train': 1.5688045024871826} -11/07/2021 00:56:33 - INFO - __main__ - Step 26493: {'lr': 0.00046696831744217065, 'samples': 5086656, 'steps': 26492, 'loss/train': 1.3535728454589844} -11/07/2021 00:56:33 - INFO - __main__ - Step 26494: {'lr': 0.0004669656810788199, 'samples': 5086848, 'steps': 26493, 'loss/train': 1.0657094717025757} -11/07/2021 00:56:33 - INFO - __main__ - Step 26495: {'lr': 0.0004669630446177077, 'samples': 5087040, 'steps': 26494, 'loss/train': 1.4741947650909424} -11/07/2021 00:56:34 - INFO - __main__ - Step 26496: {'lr': 0.0004669604080588352, 'samples': 5087232, 'steps': 26495, 'loss/train': 1.8306576013565063} -11/07/2021 00:56:35 - INFO - __main__ - Step 26497: {'lr': 0.0004669577714022039, 'samples': 5087424, 'steps': 26496, 'loss/train': 1.7917108535766602} -11/07/2021 00:56:35 - INFO - __main__ - Step 26498: {'lr': 0.00046695513464781456, 'samples': 5087616, 'steps': 26497, 'loss/train': 1.7983497381210327} -11/07/2021 00:56:36 - INFO - __main__ - Step 26499: {'lr': 0.00046695249779566875, 'samples': 5087808, 'steps': 26498, 'loss/train': 1.3506072759628296} -11/07/2021 00:56:36 - INFO - __main__ - Step 26500: {'lr': 0.0004669498608457674, 'samples': 5088000, 'steps': 26499, 'loss/train': 1.5733281373977661} -11/07/2021 00:56:36 - INFO - __main__ - Step 26501: {'lr': 0.0004669472237981118, 'samples': 5088192, 'steps': 26500, 'loss/train': 1.33139169216156} -11/07/2021 00:56:37 - INFO - __main__ - Step 26502: {'lr': 0.00046694458665270315, 'samples': 5088384, 'steps': 26501, 'loss/train': 1.685796856880188} -11/07/2021 00:56:38 - INFO - __main__ - Step 26503: {'lr': 0.0004669419494095426, 'samples': 5088576, 'steps': 26502, 'loss/train': 1.5072300434112549} -11/07/2021 00:56:38 - INFO - __main__ - Step 26504: {'lr': 0.0004669393120686314, 'samples': 5088768, 'steps': 26503, 'loss/train': 1.6246660947799683} -11/07/2021 00:56:38 - INFO - __main__ - Step 26505: {'lr': 0.0004669366746299707, 'samples': 5088960, 'steps': 26504, 'loss/train': 1.5311013460159302} -11/07/2021 00:56:39 - INFO - __main__ - Step 26506: {'lr': 0.00046693403709356163, 'samples': 5089152, 'steps': 26505, 'loss/train': 1.2966697216033936} -11/07/2021 00:56:40 - INFO - __main__ - Step 26507: {'lr': 0.00046693139945940546, 'samples': 5089344, 'steps': 26506, 'loss/train': 1.573506236076355} -11/07/2021 00:56:40 - INFO - __main__ - Step 26508: {'lr': 0.0004669287617275033, 'samples': 5089536, 'steps': 26507, 'loss/train': 1.7121988534927368} -11/07/2021 00:56:41 - INFO - __main__ - Step 26509: {'lr': 0.0004669261238978564, 'samples': 5089728, 'steps': 26508, 'loss/train': 1.489428997039795} -11/07/2021 00:56:41 - INFO - __main__ - Step 26510: {'lr': 0.00046692348597046596, 'samples': 5089920, 'steps': 26509, 'loss/train': 1.5976169109344482} -11/07/2021 00:56:41 - INFO - __main__ - Step 26511: {'lr': 0.0004669208479453332, 'samples': 5090112, 'steps': 26510, 'loss/train': 1.6850656270980835} -11/07/2021 00:56:42 - INFO - __main__ - Step 26512: {'lr': 0.00046691820982245913, 'samples': 5090304, 'steps': 26511, 'loss/train': 1.530301809310913} -11/07/2021 00:56:43 - INFO - __main__ - Step 26513: {'lr': 0.00046691557160184516, 'samples': 5090496, 'steps': 26512, 'loss/train': 1.611854910850525} -11/07/2021 00:56:43 - INFO - __main__ - Step 26514: {'lr': 0.0004669129332834923, 'samples': 5090688, 'steps': 26513, 'loss/train': 1.6495177745819092} -11/07/2021 00:56:43 - INFO - __main__ - Step 26515: {'lr': 0.0004669102948674019, 'samples': 5090880, 'steps': 26514, 'loss/train': 1.213331699371338} -11/07/2021 00:56:44 - INFO - __main__ - Step 26516: {'lr': 0.000466907656353575, 'samples': 5091072, 'steps': 26515, 'loss/train': 1.4162719249725342} -11/07/2021 00:56:44 - INFO - __main__ - Step 26517: {'lr': 0.0004669050177420129, 'samples': 5091264, 'steps': 26516, 'loss/train': 1.6753724813461304} -11/07/2021 00:56:45 - INFO - __main__ - Step 26518: {'lr': 0.0004669023790327168, 'samples': 5091456, 'steps': 26517, 'loss/train': 1.3420944213867188} -11/07/2021 00:56:45 - INFO - __main__ - Step 26519: {'lr': 0.0004668997402256877, 'samples': 5091648, 'steps': 26518, 'loss/train': 1.114307165145874} -11/07/2021 00:56:46 - INFO - __main__ - Step 26520: {'lr': 0.00046689710132092704, 'samples': 5091840, 'steps': 26519, 'loss/train': 1.227500557899475} -11/07/2021 00:56:46 - INFO - __main__ - Step 26521: {'lr': 0.00046689446231843585, 'samples': 5092032, 'steps': 26520, 'loss/train': 5.975055694580078} -11/07/2021 00:56:47 - INFO - __main__ - Step 26522: {'lr': 0.0004668918232182153, 'samples': 5092224, 'steps': 26521, 'loss/train': 1.521012306213379} -11/07/2021 00:56:47 - INFO - __main__ - Step 26523: {'lr': 0.0004668891840202668, 'samples': 5092416, 'steps': 26522, 'loss/train': 1.4542280435562134} -11/07/2021 00:56:48 - INFO - __main__ - Step 26524: {'lr': 0.00046688654472459124, 'samples': 5092608, 'steps': 26523, 'loss/train': 1.7532317638397217} -11/07/2021 00:56:48 - INFO - __main__ - Step 26525: {'lr': 0.00046688390533119003, 'samples': 5092800, 'steps': 26524, 'loss/train': 1.5033717155456543} -11/07/2021 00:56:49 - INFO - __main__ - Step 26526: {'lr': 0.00046688126584006425, 'samples': 5092992, 'steps': 26525, 'loss/train': 1.1880830526351929} -11/07/2021 00:56:49 - INFO - __main__ - Step 26527: {'lr': 0.00046687862625121505, 'samples': 5093184, 'steps': 26526, 'loss/train': 1.5129117965698242} -11/07/2021 00:56:49 - INFO - __main__ - Step 26528: {'lr': 0.0004668759865646438, 'samples': 5093376, 'steps': 26527, 'loss/train': 1.808837652206421} -11/07/2021 00:56:50 - INFO - __main__ - Step 26529: {'lr': 0.00046687334678035153, 'samples': 5093568, 'steps': 26528, 'loss/train': 1.3349472284317017} -11/07/2021 00:56:51 - INFO - __main__ - Step 26530: {'lr': 0.00046687070689833943, 'samples': 5093760, 'steps': 26529, 'loss/train': 1.699949026107788} -11/07/2021 00:56:51 - INFO - __main__ - Step 26531: {'lr': 0.00046686806691860884, 'samples': 5093952, 'steps': 26530, 'loss/train': 1.6412250995635986} -11/07/2021 00:56:51 - INFO - __main__ - Step 26532: {'lr': 0.00046686542684116073, 'samples': 5094144, 'steps': 26531, 'loss/train': 1.5748305320739746} -11/07/2021 00:56:52 - INFO - __main__ - Step 26533: {'lr': 0.00046686278666599647, 'samples': 5094336, 'steps': 26532, 'loss/train': 1.6863652467727661} -11/07/2021 00:56:53 - INFO - __main__ - Step 26534: {'lr': 0.0004668601463931172, 'samples': 5094528, 'steps': 26533, 'loss/train': 1.5847936868667603} -11/07/2021 00:56:53 - INFO - __main__ - Step 26535: {'lr': 0.00046685750602252406, 'samples': 5094720, 'steps': 26534, 'loss/train': 1.4715627431869507} -11/07/2021 00:56:53 - INFO - __main__ - Step 26536: {'lr': 0.0004668548655542183, 'samples': 5094912, 'steps': 26535, 'loss/train': 1.1541719436645508} -11/07/2021 00:56:54 - INFO - __main__ - Step 26537: {'lr': 0.000466852224988201, 'samples': 5095104, 'steps': 26536, 'loss/train': 1.6187621355056763} -11/07/2021 00:56:54 - INFO - __main__ - Step 26538: {'lr': 0.00046684958432447355, 'samples': 5095296, 'steps': 26537, 'loss/train': 1.0727238655090332} -11/07/2021 00:56:55 - INFO - __main__ - Step 26539: {'lr': 0.00046684694356303693, 'samples': 5095488, 'steps': 26538, 'loss/train': 1.1763319969177246} -11/07/2021 00:56:56 - INFO - __main__ - Step 26540: {'lr': 0.0004668443027038925, 'samples': 5095680, 'steps': 26539, 'loss/train': 2.1044039726257324} -11/07/2021 00:56:56 - INFO - __main__ - Step 26541: {'lr': 0.00046684166174704134, 'samples': 5095872, 'steps': 26540, 'loss/train': 2.556725025177002} -11/07/2021 00:56:56 - INFO - __main__ - Step 26542: {'lr': 0.00046683902069248465, 'samples': 5096064, 'steps': 26541, 'loss/train': 1.3768486976623535} -11/07/2021 00:56:57 - INFO - __main__ - Step 26543: {'lr': 0.0004668363795402237, 'samples': 5096256, 'steps': 26542, 'loss/train': 1.3912994861602783} -11/07/2021 00:56:58 - INFO - __main__ - Step 26544: {'lr': 0.00046683373829025954, 'samples': 5096448, 'steps': 26543, 'loss/train': 1.4116778373718262} -11/07/2021 00:56:58 - INFO - __main__ - Step 26545: {'lr': 0.0004668310969425935, 'samples': 5096640, 'steps': 26544, 'loss/train': 1.3927422761917114} -11/07/2021 00:56:58 - INFO - __main__ - Step 26546: {'lr': 0.00046682845549722677, 'samples': 5096832, 'steps': 26545, 'loss/train': 1.552696943283081} -11/07/2021 00:56:59 - INFO - __main__ - Step 26547: {'lr': 0.0004668258139541604, 'samples': 5097024, 'steps': 26546, 'loss/train': 1.2917490005493164} -11/07/2021 00:56:59 - INFO - __main__ - Step 26548: {'lr': 0.00046682317231339565, 'samples': 5097216, 'steps': 26547, 'loss/train': 5.877769470214844} -11/07/2021 00:56:59 - INFO - __main__ - Step 26549: {'lr': 0.00046682053057493377, 'samples': 5097408, 'steps': 26548, 'loss/train': 0.9490289688110352} -11/07/2021 00:57:01 - INFO - __main__ - Step 26550: {'lr': 0.00046681788873877595, 'samples': 5097600, 'steps': 26549, 'loss/train': 1.548933982849121} -11/07/2021 00:57:01 - INFO - __main__ - Step 26551: {'lr': 0.00046681524680492327, 'samples': 5097792, 'steps': 26550, 'loss/train': 1.545667052268982} -11/07/2021 00:57:01 - INFO - __main__ - Step 26552: {'lr': 0.00046681260477337693, 'samples': 5097984, 'steps': 26551, 'loss/train': 1.4085031747817993} -11/07/2021 00:57:02 - INFO - __main__ - Step 26553: {'lr': 0.0004668099626441383, 'samples': 5098176, 'steps': 26552, 'loss/train': 1.656846523284912} -11/07/2021 00:57:02 - INFO - __main__ - Step 26554: {'lr': 0.00046680732041720836, 'samples': 5098368, 'steps': 26553, 'loss/train': 1.8511707782745361} -11/07/2021 00:57:03 - INFO - __main__ - Step 26555: {'lr': 0.0004668046780925884, 'samples': 5098560, 'steps': 26554, 'loss/train': 1.1346396207809448} -11/07/2021 00:57:03 - INFO - __main__ - Step 26556: {'lr': 0.0004668020356702796, 'samples': 5098752, 'steps': 26555, 'loss/train': 1.6512269973754883} -11/07/2021 00:57:04 - INFO - __main__ - Step 26557: {'lr': 0.0004667993931502832, 'samples': 5098944, 'steps': 26556, 'loss/train': 1.944300889968872} -11/07/2021 00:57:04 - INFO - __main__ - Step 26558: {'lr': 0.00046679675053260027, 'samples': 5099136, 'steps': 26557, 'loss/train': 1.6029387712478638} -11/07/2021 00:57:04 - INFO - __main__ - Step 26559: {'lr': 0.00046679410781723206, 'samples': 5099328, 'steps': 26558, 'loss/train': 1.526893973350525} -11/07/2021 00:57:05 - INFO - __main__ - Step 26560: {'lr': 0.0004667914650041799, 'samples': 5099520, 'steps': 26559, 'loss/train': 1.6373034715652466} -11/07/2021 00:57:06 - INFO - __main__ - Step 26561: {'lr': 0.00046678882209344474, 'samples': 5099712, 'steps': 26560, 'loss/train': 1.3498308658599854} -11/07/2021 00:57:06 - INFO - __main__ - Step 26562: {'lr': 0.00046678617908502785, 'samples': 5099904, 'steps': 26561, 'loss/train': 1.223779559135437} -11/07/2021 00:57:06 - INFO - __main__ - Step 26563: {'lr': 0.00046678353597893053, 'samples': 5100096, 'steps': 26562, 'loss/train': 1.7865734100341797} -11/07/2021 00:57:07 - INFO - __main__ - Step 26564: {'lr': 0.0004667808927751539, 'samples': 5100288, 'steps': 26563, 'loss/train': 1.7990397214889526} -11/07/2021 00:57:08 - INFO - __main__ - Step 26565: {'lr': 0.00046677824947369907, 'samples': 5100480, 'steps': 26564, 'loss/train': 1.9247980117797852} -11/07/2021 00:57:08 - INFO - __main__ - Step 26566: {'lr': 0.0004667756060745674, 'samples': 5100672, 'steps': 26565, 'loss/train': 1.6731843948364258} -11/07/2021 00:57:08 - INFO - __main__ - Step 26567: {'lr': 0.0004667729625777599, 'samples': 5100864, 'steps': 26566, 'loss/train': 1.8321985006332397} -11/07/2021 00:57:09 - INFO - __main__ - Step 26568: {'lr': 0.0004667703189832779, 'samples': 5101056, 'steps': 26567, 'loss/train': 1.3584908246994019} -11/07/2021 00:57:09 - INFO - __main__ - Step 26569: {'lr': 0.00046676767529112254, 'samples': 5101248, 'steps': 26568, 'loss/train': 1.4127012491226196} -11/07/2021 00:57:10 - INFO - __main__ - Step 26570: {'lr': 0.000466765031501295, 'samples': 5101440, 'steps': 26569, 'loss/train': 0.9467480182647705} -11/07/2021 00:57:10 - INFO - __main__ - Step 26571: {'lr': 0.0004667623876137965, 'samples': 5101632, 'steps': 26570, 'loss/train': 0.8069031238555908} -11/07/2021 00:57:11 - INFO - __main__ - Step 26572: {'lr': 0.00046675974362862815, 'samples': 5101824, 'steps': 26571, 'loss/train': 1.582007884979248} -11/07/2021 00:57:11 - INFO - __main__ - Step 26573: {'lr': 0.00046675709954579125, 'samples': 5102016, 'steps': 26572, 'loss/train': 1.6229231357574463} -11/07/2021 00:57:12 - INFO - __main__ - Step 26574: {'lr': 0.0004667544553652869, 'samples': 5102208, 'steps': 26573, 'loss/train': 1.5536285638809204} -11/07/2021 00:57:12 - INFO - __main__ - Step 26575: {'lr': 0.0004667518110871164, 'samples': 5102400, 'steps': 26574, 'loss/train': 1.0139391422271729} -11/07/2021 00:57:13 - INFO - __main__ - Step 26576: {'lr': 0.0004667491667112809, 'samples': 5102592, 'steps': 26575, 'loss/train': 1.362045168876648} -11/07/2021 00:57:13 - INFO - __main__ - Step 26577: {'lr': 0.0004667465222377815, 'samples': 5102784, 'steps': 26576, 'loss/train': 1.0441974401474} -11/07/2021 00:57:14 - INFO - __main__ - Step 26578: {'lr': 0.0004667438776666195, 'samples': 5102976, 'steps': 26577, 'loss/train': 1.6765360832214355} -11/07/2021 00:57:14 - INFO - __main__ - Step 26579: {'lr': 0.00046674123299779603, 'samples': 5103168, 'steps': 26578, 'loss/train': 0.872469961643219} -11/07/2021 00:57:14 - INFO - __main__ - Step 26580: {'lr': 0.0004667385882313123, 'samples': 5103360, 'steps': 26579, 'loss/train': 0.9930628538131714} -11/07/2021 00:57:15 - INFO - __main__ - Step 26581: {'lr': 0.0004667359433671695, 'samples': 5103552, 'steps': 26580, 'loss/train': 1.233246922492981} -11/07/2021 00:57:16 - INFO - __main__ - Step 26582: {'lr': 0.0004667332984053689, 'samples': 5103744, 'steps': 26581, 'loss/train': 1.1279759407043457} -11/07/2021 00:57:16 - INFO - __main__ - Step 26583: {'lr': 0.00046673065334591155, 'samples': 5103936, 'steps': 26582, 'loss/train': 1.609163522720337} -11/07/2021 00:57:16 - INFO - __main__ - Step 26584: {'lr': 0.00046672800818879873, 'samples': 5104128, 'steps': 26583, 'loss/train': 1.5642935037612915} -11/07/2021 00:57:17 - INFO - __main__ - Step 26585: {'lr': 0.0004667253629340316, 'samples': 5104320, 'steps': 26584, 'loss/train': 1.6174025535583496} -11/07/2021 00:57:18 - INFO - __main__ - Step 26586: {'lr': 0.0004667227175816114, 'samples': 5104512, 'steps': 26585, 'loss/train': 2.0503993034362793} -11/07/2021 00:57:18 - INFO - __main__ - Step 26587: {'lr': 0.0004667200721315393, 'samples': 5104704, 'steps': 26586, 'loss/train': 1.585839033126831} -11/07/2021 00:57:18 - INFO - __main__ - Step 26588: {'lr': 0.00046671742658381646, 'samples': 5104896, 'steps': 26587, 'loss/train': 1.4367401599884033} -11/07/2021 00:57:19 - INFO - __main__ - Step 26589: {'lr': 0.000466714780938444, 'samples': 5105088, 'steps': 26588, 'loss/train': 1.3386892080307007} -11/07/2021 00:57:19 - INFO - __main__ - Step 26590: {'lr': 0.0004667121351954233, 'samples': 5105280, 'steps': 26589, 'loss/train': 1.768083930015564} -11/07/2021 00:57:20 - INFO - __main__ - Step 26591: {'lr': 0.00046670948935475544, 'samples': 5105472, 'steps': 26590, 'loss/train': 1.9811300039291382} -11/07/2021 00:57:21 - INFO - __main__ - Step 26592: {'lr': 0.00046670684341644167, 'samples': 5105664, 'steps': 26591, 'loss/train': 0.7801468968391418} -11/07/2021 00:57:21 - INFO - __main__ - Step 26593: {'lr': 0.0004667041973804831, 'samples': 5105856, 'steps': 26592, 'loss/train': 0.811613142490387} -11/07/2021 00:57:22 - INFO - __main__ - Step 26594: {'lr': 0.00046670155124688096, 'samples': 5106048, 'steps': 26593, 'loss/train': 1.5572509765625} -11/07/2021 00:57:22 - INFO - __main__ - Step 26595: {'lr': 0.00046669890501563636, 'samples': 5106240, 'steps': 26594, 'loss/train': 1.732027292251587} -11/07/2021 00:57:22 - INFO - __main__ - Step 26596: {'lr': 0.0004666962586867507, 'samples': 5106432, 'steps': 26595, 'loss/train': 1.4996187686920166} -11/07/2021 00:57:23 - INFO - __main__ - Step 26597: {'lr': 0.000466693612260225, 'samples': 5106624, 'steps': 26596, 'loss/train': 1.6806252002716064} -11/07/2021 00:57:23 - INFO - __main__ - Step 26598: {'lr': 0.00046669096573606053, 'samples': 5106816, 'steps': 26597, 'loss/train': 1.095277190208435} -11/07/2021 00:57:24 - INFO - __main__ - Step 26599: {'lr': 0.00046668831911425844, 'samples': 5107008, 'steps': 26598, 'loss/train': 1.8940539360046387} -11/07/2021 00:57:24 - INFO - __main__ - Step 26600: {'lr': 0.00046668567239481994, 'samples': 5107200, 'steps': 26599, 'loss/train': 1.3034520149230957} -11/07/2021 00:57:25 - INFO - __main__ - Step 26601: {'lr': 0.0004666830255777462, 'samples': 5107392, 'steps': 26600, 'loss/train': 1.082856297492981} -11/07/2021 00:57:26 - INFO - __main__ - Step 26602: {'lr': 0.00046668037866303845, 'samples': 5107584, 'steps': 26601, 'loss/train': 1.5188623666763306} -11/07/2021 00:57:26 - INFO - __main__ - Step 26603: {'lr': 0.0004666777316506979, 'samples': 5107776, 'steps': 26602, 'loss/train': 1.660784363746643} -11/07/2021 00:57:26 - INFO - __main__ - Step 26604: {'lr': 0.00046667508454072566, 'samples': 5107968, 'steps': 26603, 'loss/train': 1.7365378141403198} -11/07/2021 00:57:27 - INFO - __main__ - Step 26605: {'lr': 0.00046667243733312296, 'samples': 5108160, 'steps': 26604, 'loss/train': 1.6284083127975464} -11/07/2021 00:57:27 - INFO - __main__ - Step 26606: {'lr': 0.000466669790027891, 'samples': 5108352, 'steps': 26605, 'loss/train': 1.1745686531066895} -11/07/2021 00:57:28 - INFO - __main__ - Step 26607: {'lr': 0.00046666714262503107, 'samples': 5108544, 'steps': 26606, 'loss/train': 1.6178178787231445} -11/07/2021 00:57:29 - INFO - __main__ - Step 26608: {'lr': 0.00046666449512454416, 'samples': 5108736, 'steps': 26607, 'loss/train': 1.1699672937393188} -11/07/2021 00:57:29 - INFO - __main__ - Step 26609: {'lr': 0.0004666618475264316, 'samples': 5108928, 'steps': 26608, 'loss/train': 1.7242342233657837} -11/07/2021 00:57:29 - INFO - __main__ - Step 26610: {'lr': 0.0004666591998306946, 'samples': 5109120, 'steps': 26609, 'loss/train': 1.758998155593872} -11/07/2021 00:57:30 - INFO - __main__ - Step 26611: {'lr': 0.0004666565520373343, 'samples': 5109312, 'steps': 26610, 'loss/train': 1.7067108154296875} -11/07/2021 00:57:31 - INFO - __main__ - Step 26612: {'lr': 0.00046665390414635184, 'samples': 5109504, 'steps': 26611, 'loss/train': 1.829398274421692} -11/07/2021 00:57:31 - INFO - __main__ - Step 26613: {'lr': 0.0004666512561577485, 'samples': 5109696, 'steps': 26612, 'loss/train': 1.667002558708191} -11/07/2021 00:57:31 - INFO - __main__ - Step 26614: {'lr': 0.0004666486080715255, 'samples': 5109888, 'steps': 26613, 'loss/train': 1.830881118774414} -11/07/2021 00:57:32 - INFO - __main__ - Step 26615: {'lr': 0.0004666459598876839, 'samples': 5110080, 'steps': 26614, 'loss/train': 0.904382050037384} -11/07/2021 00:57:32 - INFO - __main__ - Step 26616: {'lr': 0.000466643311606225, 'samples': 5110272, 'steps': 26615, 'loss/train': 1.795561671257019} -11/07/2021 00:57:33 - INFO - __main__ - Step 26617: {'lr': 0.00046664066322715006, 'samples': 5110464, 'steps': 26616, 'loss/train': 1.5816446542739868} -11/07/2021 00:57:34 - INFO - __main__ - Step 26618: {'lr': 0.00046663801475046004, 'samples': 5110656, 'steps': 26617, 'loss/train': 1.3576115369796753} -11/07/2021 00:57:34 - INFO - __main__ - Step 26619: {'lr': 0.0004666353661761563, 'samples': 5110848, 'steps': 26618, 'loss/train': 1.2115764617919922} -11/07/2021 00:57:34 - INFO - __main__ - Step 26620: {'lr': 0.0004666327175042401, 'samples': 5111040, 'steps': 26619, 'loss/train': 1.1487702131271362} -11/07/2021 00:57:35 - INFO - __main__ - Step 26621: {'lr': 0.00046663006873471247, 'samples': 5111232, 'steps': 26620, 'loss/train': 1.5510127544403076} -11/07/2021 00:57:35 - INFO - __main__ - Step 26622: {'lr': 0.00046662741986757463, 'samples': 5111424, 'steps': 26621, 'loss/train': 1.8322904109954834} -11/07/2021 00:57:36 - INFO - __main__ - Step 26623: {'lr': 0.0004666247709028279, 'samples': 5111616, 'steps': 26622, 'loss/train': 1.5032947063446045} -11/07/2021 00:57:36 - INFO - __main__ - Step 26624: {'lr': 0.00046662212184047334, 'samples': 5111808, 'steps': 26623, 'loss/train': 1.4322452545166016} -11/07/2021 00:57:37 - INFO - __main__ - Step 26625: {'lr': 0.0004666194726805122, 'samples': 5112000, 'steps': 26624, 'loss/train': 1.82273268699646} -11/07/2021 00:57:37 - INFO - __main__ - Step 26626: {'lr': 0.0004666168234229457, 'samples': 5112192, 'steps': 26625, 'loss/train': 0.9876610040664673} -11/07/2021 00:57:37 - INFO - __main__ - Step 26627: {'lr': 0.000466614174067775, 'samples': 5112384, 'steps': 26626, 'loss/train': 1.672943353652954} -11/07/2021 00:57:38 - INFO - __main__ - Step 26628: {'lr': 0.00046661152461500126, 'samples': 5112576, 'steps': 26627, 'loss/train': 1.9646693468093872} -11/07/2021 00:57:39 - INFO - __main__ - Step 26629: {'lr': 0.0004666088750646257, 'samples': 5112768, 'steps': 26628, 'loss/train': 1.5872939825057983} -11/07/2021 00:57:39 - INFO - __main__ - Step 26630: {'lr': 0.0004666062254166496, 'samples': 5112960, 'steps': 26629, 'loss/train': 1.6622138023376465} -11/07/2021 00:57:39 - INFO - __main__ - Step 26631: {'lr': 0.000466603575671074, 'samples': 5113152, 'steps': 26630, 'loss/train': 1.4871768951416016} -11/07/2021 00:57:40 - INFO - __main__ - Step 26632: {'lr': 0.00046660092582790025, 'samples': 5113344, 'steps': 26631, 'loss/train': 1.6067029237747192} -11/07/2021 00:57:41 - INFO - __main__ - Step 26633: {'lr': 0.0004665982758871294, 'samples': 5113536, 'steps': 26632, 'loss/train': 1.1848700046539307} -11/07/2021 00:57:41 - INFO - __main__ - Step 26634: {'lr': 0.0004665956258487627, 'samples': 5113728, 'steps': 26633, 'loss/train': 1.102095365524292} -11/07/2021 00:57:42 - INFO - __main__ - Step 26635: {'lr': 0.0004665929757128014, 'samples': 5113920, 'steps': 26634, 'loss/train': 1.3685040473937988} -11/07/2021 00:57:42 - INFO - __main__ - Step 26636: {'lr': 0.0004665903254792466, 'samples': 5114112, 'steps': 26635, 'loss/train': 2.0076229572296143} -11/07/2021 00:57:42 - INFO - __main__ - Step 26637: {'lr': 0.0004665876751480996, 'samples': 5114304, 'steps': 26636, 'loss/train': 1.8105500936508179} -11/07/2021 00:57:43 - INFO - __main__ - Step 26638: {'lr': 0.0004665850247193615, 'samples': 5114496, 'steps': 26637, 'loss/train': 1.4529505968093872} -11/07/2021 00:57:44 - INFO - __main__ - Step 26639: {'lr': 0.0004665823741930335, 'samples': 5114688, 'steps': 26638, 'loss/train': 1.054864764213562} -11/07/2021 00:57:44 - INFO - __main__ - Step 26640: {'lr': 0.00046657972356911696, 'samples': 5114880, 'steps': 26639, 'loss/train': 1.6424245834350586} -11/07/2021 00:57:44 - INFO - __main__ - Step 26641: {'lr': 0.00046657707284761274, 'samples': 5115072, 'steps': 26640, 'loss/train': 1.2736396789550781} -11/07/2021 00:57:45 - INFO - __main__ - Step 26642: {'lr': 0.0004665744220285224, 'samples': 5115264, 'steps': 26641, 'loss/train': 0.37159693241119385} -11/07/2021 00:57:45 - INFO - __main__ - Step 26643: {'lr': 0.0004665717711118469, 'samples': 5115456, 'steps': 26642, 'loss/train': 1.5933653116226196} -11/07/2021 00:57:46 - INFO - __main__ - Step 26644: {'lr': 0.00046656912009758743, 'samples': 5115648, 'steps': 26643, 'loss/train': 1.0128573179244995} -11/07/2021 00:57:46 - INFO - __main__ - Step 26645: {'lr': 0.0004665664689857454, 'samples': 5115840, 'steps': 26644, 'loss/train': 1.5813493728637695} -11/07/2021 00:57:47 - INFO - __main__ - Step 26646: {'lr': 0.00046656381777632173, 'samples': 5116032, 'steps': 26645, 'loss/train': 1.6319818496704102} -11/07/2021 00:57:47 - INFO - __main__ - Step 26647: {'lr': 0.0004665611664693178, 'samples': 5116224, 'steps': 26646, 'loss/train': 1.7234327793121338} -11/07/2021 00:57:48 - INFO - __main__ - Step 26648: {'lr': 0.0004665585150647348, 'samples': 5116416, 'steps': 26647, 'loss/train': 1.7393739223480225} -11/07/2021 00:57:49 - INFO - __main__ - Step 26649: {'lr': 0.0004665558635625738, 'samples': 5116608, 'steps': 26648, 'loss/train': 1.6047013998031616} -11/07/2021 00:57:49 - INFO - __main__ - Step 26650: {'lr': 0.00046655321196283604, 'samples': 5116800, 'steps': 26649, 'loss/train': 1.8685024976730347} -11/07/2021 00:57:49 - INFO - __main__ - Step 26651: {'lr': 0.00046655056026552287, 'samples': 5116992, 'steps': 26650, 'loss/train': 0.18996243178844452} -11/07/2021 00:57:50 - INFO - __main__ - Step 26652: {'lr': 0.0004665479084706353, 'samples': 5117184, 'steps': 26651, 'loss/train': 1.8232330083847046} -11/07/2021 00:57:50 - INFO - __main__ - Step 26653: {'lr': 0.00046654525657817457, 'samples': 5117376, 'steps': 26652, 'loss/train': 1.292604923248291} -11/07/2021 00:57:51 - INFO - __main__ - Step 26654: {'lr': 0.0004665426045881419, 'samples': 5117568, 'steps': 26653, 'loss/train': 1.6663436889648438} -11/07/2021 00:57:51 - INFO - __main__ - Step 26655: {'lr': 0.00046653995250053843, 'samples': 5117760, 'steps': 26654, 'loss/train': 1.220912218093872} -11/07/2021 00:57:52 - INFO - __main__ - Step 26656: {'lr': 0.00046653730031536545, 'samples': 5117952, 'steps': 26655, 'loss/train': 1.6533703804016113} -11/07/2021 00:57:52 - INFO - __main__ - Step 26657: {'lr': 0.0004665346480326241, 'samples': 5118144, 'steps': 26656, 'loss/train': 1.6312495470046997} -11/07/2021 00:57:53 - INFO - __main__ - Step 26658: {'lr': 0.00046653199565231554, 'samples': 5118336, 'steps': 26657, 'loss/train': 1.40569007396698} -11/07/2021 00:57:54 - INFO - __main__ - Step 26659: {'lr': 0.00046652934317444104, 'samples': 5118528, 'steps': 26658, 'loss/train': 1.6105440855026245} -11/07/2021 00:57:54 - INFO - __main__ - Step 26660: {'lr': 0.00046652669059900174, 'samples': 5118720, 'steps': 26659, 'loss/train': 1.2899856567382812} -11/07/2021 00:57:54 - INFO - __main__ - Step 26661: {'lr': 0.0004665240379259989, 'samples': 5118912, 'steps': 26660, 'loss/train': 1.2735904455184937} -11/07/2021 00:57:55 - INFO - __main__ - Step 26662: {'lr': 0.00046652138515543366, 'samples': 5119104, 'steps': 26661, 'loss/train': 1.6175771951675415} -11/07/2021 00:57:55 - INFO - __main__ - Step 26663: {'lr': 0.00046651873228730715, 'samples': 5119296, 'steps': 26662, 'loss/train': 1.0031540393829346} -11/07/2021 00:57:56 - INFO - __main__ - Step 26664: {'lr': 0.0004665160793216207, 'samples': 5119488, 'steps': 26663, 'loss/train': 1.4231845140457153} -11/07/2021 00:57:57 - INFO - __main__ - Step 26665: {'lr': 0.00046651342625837544, 'samples': 5119680, 'steps': 26664, 'loss/train': 1.0525844097137451} -11/07/2021 00:57:57 - INFO - __main__ - Step 26666: {'lr': 0.00046651077309757256, 'samples': 5119872, 'steps': 26665, 'loss/train': 0.7705839276313782} -11/07/2021 00:57:57 - INFO - __main__ - Step 26667: {'lr': 0.0004665081198392133, 'samples': 5120064, 'steps': 26666, 'loss/train': 1.1075023412704468} -11/07/2021 00:57:58 - INFO - __main__ - Step 26668: {'lr': 0.0004665054664832988, 'samples': 5120256, 'steps': 26667, 'loss/train': 1.461146354675293} -11/07/2021 00:57:58 - INFO - __main__ - Step 26669: {'lr': 0.00046650281302983024, 'samples': 5120448, 'steps': 26668, 'loss/train': 1.7595139741897583} -11/07/2021 00:57:59 - INFO - __main__ - Step 26670: {'lr': 0.00046650015947880886, 'samples': 5120640, 'steps': 26669, 'loss/train': 1.0714360475540161} -11/07/2021 00:58:00 - INFO - __main__ - Step 26671: {'lr': 0.00046649750583023595, 'samples': 5120832, 'steps': 26670, 'loss/train': 1.328011155128479} -11/07/2021 00:58:00 - INFO - __main__ - Step 26672: {'lr': 0.00046649485208411244, 'samples': 5121024, 'steps': 26671, 'loss/train': 1.5091999769210815} -11/07/2021 00:58:00 - INFO - __main__ - Step 26673: {'lr': 0.00046649219824043984, 'samples': 5121216, 'steps': 26672, 'loss/train': 1.622520089149475} -11/07/2021 00:58:01 - INFO - __main__ - Step 26674: {'lr': 0.00046648954429921914, 'samples': 5121408, 'steps': 26673, 'loss/train': 1.4281224012374878} -11/07/2021 00:58:02 - INFO - __main__ - Step 26675: {'lr': 0.00046648689026045157, 'samples': 5121600, 'steps': 26674, 'loss/train': 1.4314370155334473} -11/07/2021 00:58:02 - INFO - __main__ - Step 26676: {'lr': 0.0004664842361241384, 'samples': 5121792, 'steps': 26675, 'loss/train': 1.8390313386917114} -11/07/2021 00:58:02 - INFO - __main__ - Step 26677: {'lr': 0.00046648158189028073, 'samples': 5121984, 'steps': 26676, 'loss/train': 1.6365265846252441} -11/07/2021 00:58:03 - INFO - __main__ - Step 26678: {'lr': 0.0004664789275588798, 'samples': 5122176, 'steps': 26677, 'loss/train': 1.651261806488037} -11/07/2021 00:58:03 - INFO - __main__ - Step 26679: {'lr': 0.0004664762731299368, 'samples': 5122368, 'steps': 26678, 'loss/train': 1.6249920129776} -11/07/2021 00:58:04 - INFO - __main__ - Step 26680: {'lr': 0.00046647361860345293, 'samples': 5122560, 'steps': 26679, 'loss/train': 2.140415668487549} -11/07/2021 00:58:04 - INFO - __main__ - Step 26681: {'lr': 0.00046647096397942945, 'samples': 5122752, 'steps': 26680, 'loss/train': 2.295044183731079} -11/07/2021 00:58:05 - INFO - __main__ - Step 26682: {'lr': 0.0004664683092578674, 'samples': 5122944, 'steps': 26681, 'loss/train': 1.655160665512085} -11/07/2021 00:58:05 - INFO - __main__ - Step 26683: {'lr': 0.00046646565443876815, 'samples': 5123136, 'steps': 26682, 'loss/train': 1.6432113647460938} -11/07/2021 00:58:05 - INFO - __main__ - Step 26684: {'lr': 0.00046646299952213277, 'samples': 5123328, 'steps': 26683, 'loss/train': 1.8974426984786987} -11/07/2021 00:58:06 - INFO - __main__ - Step 26685: {'lr': 0.00046646034450796255, 'samples': 5123520, 'steps': 26684, 'loss/train': 1.5197091102600098} -11/07/2021 00:58:07 - INFO - __main__ - Step 26686: {'lr': 0.0004664576893962586, 'samples': 5123712, 'steps': 26685, 'loss/train': 1.4399789571762085} -11/07/2021 00:58:07 - INFO - __main__ - Step 26687: {'lr': 0.0004664550341870222, 'samples': 5123904, 'steps': 26686, 'loss/train': 1.472825050354004} -11/07/2021 00:58:07 - INFO - __main__ - Step 26688: {'lr': 0.00046645237888025444, 'samples': 5124096, 'steps': 26687, 'loss/train': 1.816226601600647} -11/07/2021 00:58:08 - INFO - __main__ - Step 26689: {'lr': 0.0004664497234759566, 'samples': 5124288, 'steps': 26688, 'loss/train': 1.6909376382827759} -11/07/2021 00:58:09 - INFO - __main__ - Step 26690: {'lr': 0.00046644706797412984, 'samples': 5124480, 'steps': 26689, 'loss/train': 1.7982065677642822} -11/07/2021 00:58:09 - INFO - __main__ - Step 26691: {'lr': 0.00046644441237477544, 'samples': 5124672, 'steps': 26690, 'loss/train': 0.9981279373168945} -11/07/2021 00:58:10 - INFO - __main__ - Step 26692: {'lr': 0.00046644175667789444, 'samples': 5124864, 'steps': 26691, 'loss/train': 1.3450186252593994} -11/07/2021 00:58:10 - INFO - __main__ - Step 26693: {'lr': 0.00046643910088348817, 'samples': 5125056, 'steps': 26692, 'loss/train': 1.7120623588562012} -11/07/2021 00:58:10 - INFO - __main__ - Step 26694: {'lr': 0.0004664364449915578, 'samples': 5125248, 'steps': 26693, 'loss/train': 1.2893990278244019} -11/07/2021 00:58:11 - INFO - __main__ - Step 26695: {'lr': 0.0004664337890021044, 'samples': 5125440, 'steps': 26694, 'loss/train': 1.5590112209320068} -11/07/2021 00:58:12 - INFO - __main__ - Step 26696: {'lr': 0.0004664311329151294, 'samples': 5125632, 'steps': 26695, 'loss/train': 1.4270391464233398} -11/07/2021 00:58:12 - INFO - __main__ - Step 26697: {'lr': 0.0004664284767306338, 'samples': 5125824, 'steps': 26696, 'loss/train': 1.45754075050354} -11/07/2021 00:58:12 - INFO - __main__ - Step 26698: {'lr': 0.0004664258204486189, 'samples': 5126016, 'steps': 26697, 'loss/train': 1.4459261894226074} -11/07/2021 00:58:13 - INFO - __main__ - Step 26699: {'lr': 0.0004664231640690859, 'samples': 5126208, 'steps': 26698, 'loss/train': 1.7300431728363037} -11/07/2021 00:58:13 - INFO - __main__ - Step 26700: {'lr': 0.0004664205075920359, 'samples': 5126400, 'steps': 26699, 'loss/train': 2.156492233276367} -11/07/2021 00:58:14 - INFO - __main__ - Step 26701: {'lr': 0.0004664178510174702, 'samples': 5126592, 'steps': 26700, 'loss/train': 1.6679294109344482} -11/07/2021 00:58:14 - INFO - __main__ - Step 26702: {'lr': 0.0004664151943453899, 'samples': 5126784, 'steps': 26701, 'loss/train': 1.5192807912826538} -11/07/2021 00:58:15 - INFO - __main__ - Step 26703: {'lr': 0.0004664125375757963, 'samples': 5126976, 'steps': 26702, 'loss/train': 1.510108470916748} -11/07/2021 00:58:15 - INFO - __main__ - Step 26704: {'lr': 0.00046640988070869053, 'samples': 5127168, 'steps': 26703, 'loss/train': 1.4754691123962402} -11/07/2021 00:58:16 - INFO - __main__ - Step 26705: {'lr': 0.00046640722374407384, 'samples': 5127360, 'steps': 26704, 'loss/train': 1.5549184083938599} -11/07/2021 00:58:17 - INFO - __main__ - Step 26706: {'lr': 0.00046640456668194737, 'samples': 5127552, 'steps': 26705, 'loss/train': 1.417669653892517} -11/07/2021 00:58:17 - INFO - __main__ - Step 26707: {'lr': 0.0004664019095223123, 'samples': 5127744, 'steps': 26706, 'loss/train': 1.262236475944519} -11/07/2021 00:58:17 - INFO - __main__ - Step 26708: {'lr': 0.00046639925226517, 'samples': 5127936, 'steps': 26707, 'loss/train': 1.6880942583084106} -11/07/2021 00:58:18 - INFO - __main__ - Step 26709: {'lr': 0.0004663965949105214, 'samples': 5128128, 'steps': 26708, 'loss/train': 1.3780642747879028} -11/07/2021 00:58:18 - INFO - __main__ - Step 26710: {'lr': 0.0004663939374583679, 'samples': 5128320, 'steps': 26709, 'loss/train': 1.3778291940689087} -11/07/2021 00:58:19 - INFO - __main__ - Step 26711: {'lr': 0.00046639127990871055, 'samples': 5128512, 'steps': 26710, 'loss/train': 1.5793744325637817} -11/07/2021 00:58:19 - INFO - __main__ - Step 26712: {'lr': 0.00046638862226155075, 'samples': 5128704, 'steps': 26711, 'loss/train': 1.086185336112976} -11/07/2021 00:58:20 - INFO - __main__ - Step 26713: {'lr': 0.0004663859645168895, 'samples': 5128896, 'steps': 26712, 'loss/train': 1.713158369064331} -11/07/2021 00:58:20 - INFO - __main__ - Step 26714: {'lr': 0.00046638330667472805, 'samples': 5129088, 'steps': 26713, 'loss/train': 1.4040732383728027} -11/07/2021 00:58:21 - INFO - __main__ - Step 26715: {'lr': 0.0004663806487350677, 'samples': 5129280, 'steps': 26714, 'loss/train': 1.3665399551391602} -11/07/2021 00:58:21 - INFO - __main__ - Step 26716: {'lr': 0.00046637799069790953, 'samples': 5129472, 'steps': 26715, 'loss/train': 1.311948299407959} -11/07/2021 00:58:22 - INFO - __main__ - Step 26717: {'lr': 0.00046637533256325476, 'samples': 5129664, 'steps': 26716, 'loss/train': 1.5316460132598877} -11/07/2021 00:58:22 - INFO - __main__ - Step 26718: {'lr': 0.0004663726743311046, 'samples': 5129856, 'steps': 26717, 'loss/train': 1.1193568706512451} -11/07/2021 00:58:23 - INFO - __main__ - Step 26719: {'lr': 0.00046637001600146027, 'samples': 5130048, 'steps': 26718, 'loss/train': 1.4479613304138184} -11/07/2021 00:58:23 - INFO - __main__ - Step 26720: {'lr': 0.000466367357574323, 'samples': 5130240, 'steps': 26719, 'loss/train': 1.812766671180725} -11/07/2021 00:58:24 - INFO - __main__ - Step 26721: {'lr': 0.00046636469904969387, 'samples': 5130432, 'steps': 26720, 'loss/train': 1.200969934463501} -11/07/2021 00:58:24 - INFO - __main__ - Step 26722: {'lr': 0.0004663620404275741, 'samples': 5130624, 'steps': 26721, 'loss/train': 1.617827296257019} -11/07/2021 00:58:25 - INFO - __main__ - Step 26723: {'lr': 0.00046635938170796505, 'samples': 5130816, 'steps': 26722, 'loss/train': 1.5450035333633423} -11/07/2021 00:58:25 - INFO - __main__ - Step 26724: {'lr': 0.00046635672289086774, 'samples': 5131008, 'steps': 26723, 'loss/train': 1.504841923713684} -11/07/2021 00:58:25 - INFO - __main__ - Step 26725: {'lr': 0.00046635406397628346, 'samples': 5131200, 'steps': 26724, 'loss/train': 1.0579419136047363} -11/07/2021 00:58:26 - INFO - __main__ - Step 26726: {'lr': 0.00046635140496421336, 'samples': 5131392, 'steps': 26725, 'loss/train': 1.883946418762207} -11/07/2021 00:58:27 - INFO - __main__ - Step 26727: {'lr': 0.0004663487458546586, 'samples': 5131584, 'steps': 26726, 'loss/train': 2.128173351287842} -11/07/2021 00:58:27 - INFO - __main__ - Step 26728: {'lr': 0.0004663460866476205, 'samples': 5131776, 'steps': 26727, 'loss/train': 1.4596672058105469} -11/07/2021 00:58:27 - INFO - __main__ - Step 26729: {'lr': 0.00046634342734310023, 'samples': 5131968, 'steps': 26728, 'loss/train': 1.3028556108474731} -11/07/2021 00:58:28 - INFO - __main__ - Step 26730: {'lr': 0.0004663407679410988, 'samples': 5132160, 'steps': 26729, 'loss/train': 1.107367992401123} -11/07/2021 00:58:29 - INFO - __main__ - Step 26731: {'lr': 0.0004663381084416177, 'samples': 5132352, 'steps': 26730, 'loss/train': 0.9006083607673645} -11/07/2021 00:58:29 - INFO - __main__ - Step 26732: {'lr': 0.00046633544884465796, 'samples': 5132544, 'steps': 26731, 'loss/train': 1.004862904548645} -11/07/2021 00:58:30 - INFO - __main__ - Step 26733: {'lr': 0.0004663327891502208, 'samples': 5132736, 'steps': 26732, 'loss/train': 1.9089033603668213} -11/07/2021 00:58:30 - INFO - __main__ - Step 26734: {'lr': 0.0004663301293583073, 'samples': 5132928, 'steps': 26733, 'loss/train': 1.0407803058624268} -11/07/2021 00:58:30 - INFO - __main__ - Step 26735: {'lr': 0.000466327469468919, 'samples': 5133120, 'steps': 26734, 'loss/train': 1.420594573020935} -11/07/2021 00:58:31 - INFO - __main__ - Step 26736: {'lr': 0.0004663248094820567, 'samples': 5133312, 'steps': 26735, 'loss/train': 1.2276805639266968} -11/07/2021 00:58:32 - INFO - __main__ - Step 26737: {'lr': 0.00046632214939772187, 'samples': 5133504, 'steps': 26736, 'loss/train': 1.0551986694335938} -11/07/2021 00:58:32 - INFO - __main__ - Step 26738: {'lr': 0.0004663194892159156, 'samples': 5133696, 'steps': 26737, 'loss/train': 1.1808747053146362} -11/07/2021 00:58:32 - INFO - __main__ - Step 26739: {'lr': 0.0004663168289366391, 'samples': 5133888, 'steps': 26738, 'loss/train': 1.6448155641555786} -11/07/2021 00:58:33 - INFO - __main__ - Step 26740: {'lr': 0.0004663141685598936, 'samples': 5134080, 'steps': 26739, 'loss/train': 1.2650645971298218} -11/07/2021 00:58:34 - INFO - __main__ - Step 26741: {'lr': 0.00046631150808568026, 'samples': 5134272, 'steps': 26740, 'loss/train': 1.4323738813400269} -11/07/2021 00:58:34 - INFO - __main__ - Step 26742: {'lr': 0.00046630884751400024, 'samples': 5134464, 'steps': 26741, 'loss/train': 1.3132368326187134} -11/07/2021 00:58:34 - INFO - __main__ - Step 26743: {'lr': 0.0004663061868448548, 'samples': 5134656, 'steps': 26742, 'loss/train': 1.777282476425171} -11/07/2021 00:58:35 - INFO - __main__ - Step 26744: {'lr': 0.0004663035260782452, 'samples': 5134848, 'steps': 26743, 'loss/train': 1.5186762809753418} -11/07/2021 00:58:35 - INFO - __main__ - Step 26745: {'lr': 0.0004663008652141726, 'samples': 5135040, 'steps': 26744, 'loss/train': 1.3067575693130493} -11/07/2021 00:58:36 - INFO - __main__ - Step 26746: {'lr': 0.00046629820425263805, 'samples': 5135232, 'steps': 26745, 'loss/train': 1.5075962543487549} -11/07/2021 00:58:37 - INFO - __main__ - Step 26747: {'lr': 0.00046629554319364293, 'samples': 5135424, 'steps': 26746, 'loss/train': 1.64328932762146} -11/07/2021 00:58:37 - INFO - __main__ - Step 26748: {'lr': 0.00046629288203718834, 'samples': 5135616, 'steps': 26747, 'loss/train': 1.1373062133789062} -11/07/2021 00:58:37 - INFO - __main__ - Step 26749: {'lr': 0.00046629022078327557, 'samples': 5135808, 'steps': 26748, 'loss/train': 1.623582124710083} -11/07/2021 00:58:38 - INFO - __main__ - Step 26750: {'lr': 0.0004662875594319057, 'samples': 5136000, 'steps': 26749, 'loss/train': 0.9610598683357239} -11/07/2021 00:58:38 - INFO - __main__ - Step 26751: {'lr': 0.00046628489798308006, 'samples': 5136192, 'steps': 26750, 'loss/train': 1.5221467018127441} -11/07/2021 00:58:39 - INFO - __main__ - Step 26752: {'lr': 0.0004662822364367997, 'samples': 5136384, 'steps': 26751, 'loss/train': 1.4284276962280273} -11/07/2021 00:58:39 - INFO - __main__ - Step 26753: {'lr': 0.000466279574793066, 'samples': 5136576, 'steps': 26752, 'loss/train': 1.580201268196106} -11/07/2021 00:58:40 - INFO - __main__ - Step 26754: {'lr': 0.00046627691305188004, 'samples': 5136768, 'steps': 26753, 'loss/train': 1.4526443481445312} -11/07/2021 00:58:40 - INFO - __main__ - Step 26755: {'lr': 0.00046627425121324294, 'samples': 5136960, 'steps': 26754, 'loss/train': 0.7486782670021057} -11/07/2021 00:58:40 - INFO - __main__ - Step 26756: {'lr': 0.0004662715892771561, 'samples': 5137152, 'steps': 26755, 'loss/train': 1.6319177150726318} -11/07/2021 00:58:42 - INFO - __main__ - Step 26757: {'lr': 0.0004662689272436206, 'samples': 5137344, 'steps': 26756, 'loss/train': 1.4941084384918213} -11/07/2021 00:58:42 - INFO - __main__ - Step 26758: {'lr': 0.00046626626511263764, 'samples': 5137536, 'steps': 26757, 'loss/train': 1.7254610061645508} -11/07/2021 00:58:42 - INFO - __main__ - Step 26759: {'lr': 0.00046626360288420845, 'samples': 5137728, 'steps': 26758, 'loss/train': 1.5891088247299194} -11/07/2021 00:58:43 - INFO - __main__ - Step 26760: {'lr': 0.00046626094055833426, 'samples': 5137920, 'steps': 26759, 'loss/train': 1.6341724395751953} -11/07/2021 00:58:43 - INFO - __main__ - Step 26761: {'lr': 0.0004662582781350161, 'samples': 5138112, 'steps': 26760, 'loss/train': 1.5685557126998901} -11/07/2021 00:58:44 - INFO - __main__ - Step 26762: {'lr': 0.00046625561561425543, 'samples': 5138304, 'steps': 26761, 'loss/train': 0.4045870006084442} -11/07/2021 00:58:44 - INFO - __main__ - Step 26763: {'lr': 0.00046625295299605323, 'samples': 5138496, 'steps': 26762, 'loss/train': 1.108884334564209} -11/07/2021 00:58:45 - INFO - __main__ - Step 26764: {'lr': 0.0004662502902804109, 'samples': 5138688, 'steps': 26763, 'loss/train': 1.5114766359329224} -11/07/2021 00:58:45 - INFO - __main__ - Step 26765: {'lr': 0.0004662476274673294, 'samples': 5138880, 'steps': 26764, 'loss/train': 0.9535731077194214} -11/07/2021 00:58:46 - INFO - __main__ - Step 26766: {'lr': 0.00046624496455681006, 'samples': 5139072, 'steps': 26765, 'loss/train': 0.9992877244949341} -11/07/2021 00:58:46 - INFO - __main__ - Step 26767: {'lr': 0.00046624230154885415, 'samples': 5139264, 'steps': 26766, 'loss/train': 0.9134907722473145} -11/07/2021 00:58:47 - INFO - __main__ - Step 26768: {'lr': 0.0004662396384434627, 'samples': 5139456, 'steps': 26767, 'loss/train': 1.1533561944961548} -11/07/2021 00:58:47 - INFO - __main__ - Step 26769: {'lr': 0.00046623697524063713, 'samples': 5139648, 'steps': 26768, 'loss/train': 1.5940784215927124} -11/07/2021 00:58:48 - INFO - __main__ - Step 26770: {'lr': 0.00046623431194037847, 'samples': 5139840, 'steps': 26769, 'loss/train': 1.6589995622634888} -11/07/2021 00:58:48 - INFO - __main__ - Step 26771: {'lr': 0.000466231648542688, 'samples': 5140032, 'steps': 26770, 'loss/train': 1.7405768632888794} -11/07/2021 00:58:48 - INFO - __main__ - Step 26772: {'lr': 0.0004662289850475668, 'samples': 5140224, 'steps': 26771, 'loss/train': 1.5431126356124878} -11/07/2021 00:58:49 - INFO - __main__ - Step 26773: {'lr': 0.0004662263214550162, 'samples': 5140416, 'steps': 26772, 'loss/train': 1.5235966444015503} -11/07/2021 00:58:50 - INFO - __main__ - Step 26774: {'lr': 0.00046622365776503735, 'samples': 5140608, 'steps': 26773, 'loss/train': 1.3490772247314453} -11/07/2021 00:58:50 - INFO - __main__ - Step 26775: {'lr': 0.0004662209939776315, 'samples': 5140800, 'steps': 26774, 'loss/train': 1.6184896230697632} -11/07/2021 00:58:50 - INFO - __main__ - Step 26776: {'lr': 0.0004662183300927997, 'samples': 5140992, 'steps': 26775, 'loss/train': 1.5121411085128784} -11/07/2021 00:58:51 - INFO - __main__ - Step 26777: {'lr': 0.0004662156661105433, 'samples': 5141184, 'steps': 26776, 'loss/train': 1.5256009101867676} -11/07/2021 00:58:52 - INFO - __main__ - Step 26778: {'lr': 0.0004662130020308635, 'samples': 5141376, 'steps': 26777, 'loss/train': 1.8537344932556152} -11/07/2021 00:58:52 - INFO - __main__ - Step 26779: {'lr': 0.00046621033785376146, 'samples': 5141568, 'steps': 26778, 'loss/train': 1.7795383930206299} -11/07/2021 00:58:53 - INFO - __main__ - Step 26780: {'lr': 0.00046620767357923834, 'samples': 5141760, 'steps': 26779, 'loss/train': 1.3969024419784546} -11/07/2021 00:58:53 - INFO - __main__ - Step 26781: {'lr': 0.0004662050092072954, 'samples': 5141952, 'steps': 26780, 'loss/train': 1.4966504573822021} -11/07/2021 00:58:53 - INFO - __main__ - Step 26782: {'lr': 0.0004662023447379338, 'samples': 5142144, 'steps': 26781, 'loss/train': 1.615160584449768} -11/07/2021 00:58:54 - INFO - __main__ - Step 26783: {'lr': 0.0004661996801711548, 'samples': 5142336, 'steps': 26782, 'loss/train': 1.3632062673568726} -11/07/2021 00:58:55 - INFO - __main__ - Step 26784: {'lr': 0.0004661970155069595, 'samples': 5142528, 'steps': 26783, 'loss/train': 1.2376118898391724} -11/07/2021 00:58:55 - INFO - __main__ - Step 26785: {'lr': 0.00046619435074534923, 'samples': 5142720, 'steps': 26784, 'loss/train': 1.4335567951202393} -11/07/2021 00:58:55 - INFO - __main__ - Step 26786: {'lr': 0.0004661916858863251, 'samples': 5142912, 'steps': 26785, 'loss/train': 1.4138081073760986} -11/07/2021 00:58:56 - INFO - __main__ - Step 26787: {'lr': 0.00046618902092988824, 'samples': 5143104, 'steps': 26786, 'loss/train': 1.8235607147216797} -11/07/2021 00:58:57 - INFO - __main__ - Step 26788: {'lr': 0.00046618635587604006, 'samples': 5143296, 'steps': 26787, 'loss/train': 1.5318324565887451} -11/07/2021 00:58:57 - INFO - __main__ - Step 26789: {'lr': 0.00046618369072478163, 'samples': 5143488, 'steps': 26788, 'loss/train': 1.4976593255996704} -11/07/2021 00:58:58 - INFO - __main__ - Step 26790: {'lr': 0.0004661810254761141, 'samples': 5143680, 'steps': 26789, 'loss/train': 1.76413893699646} -11/07/2021 00:58:58 - INFO - __main__ - Step 26791: {'lr': 0.0004661783601300388, 'samples': 5143872, 'steps': 26790, 'loss/train': 1.2355625629425049} -11/07/2021 00:58:58 - INFO - __main__ - Step 26792: {'lr': 0.00046617569468655686, 'samples': 5144064, 'steps': 26791, 'loss/train': 1.8549610376358032} -11/07/2021 00:58:59 - INFO - __main__ - Step 26793: {'lr': 0.00046617302914566945, 'samples': 5144256, 'steps': 26792, 'loss/train': 1.5732007026672363} -11/07/2021 00:59:00 - INFO - __main__ - Step 26794: {'lr': 0.00046617036350737786, 'samples': 5144448, 'steps': 26793, 'loss/train': 1.8792085647583008} -11/07/2021 00:59:00 - INFO - __main__ - Step 26795: {'lr': 0.0004661676977716832, 'samples': 5144640, 'steps': 26794, 'loss/train': 0.6580197215080261} -11/07/2021 00:59:00 - INFO - __main__ - Step 26796: {'lr': 0.0004661650319385867, 'samples': 5144832, 'steps': 26795, 'loss/train': 1.1191657781600952} -11/07/2021 00:59:01 - INFO - __main__ - Step 26797: {'lr': 0.0004661623660080896, 'samples': 5145024, 'steps': 26796, 'loss/train': 1.5374164581298828} -11/07/2021 00:59:01 - INFO - __main__ - Step 26798: {'lr': 0.000466159699980193, 'samples': 5145216, 'steps': 26797, 'loss/train': 1.153203010559082} -11/07/2021 00:59:02 - INFO - __main__ - Step 26799: {'lr': 0.0004661570338548983, 'samples': 5145408, 'steps': 26798, 'loss/train': 1.4095265865325928} -11/07/2021 00:59:02 - INFO - __main__ - Step 26800: {'lr': 0.00046615436763220645, 'samples': 5145600, 'steps': 26799, 'loss/train': 1.2437288761138916} -11/07/2021 00:59:03 - INFO - __main__ - Step 26801: {'lr': 0.0004661517013121189, 'samples': 5145792, 'steps': 26800, 'loss/train': 1.4183251857757568} -11/07/2021 00:59:03 - INFO - __main__ - Step 26802: {'lr': 0.00046614903489463667, 'samples': 5145984, 'steps': 26801, 'loss/train': 1.6035794019699097} -11/07/2021 00:59:04 - INFO - __main__ - Step 26803: {'lr': 0.000466146368379761, 'samples': 5146176, 'steps': 26802, 'loss/train': 1.5024195909500122} -11/07/2021 00:59:05 - INFO - __main__ - Step 26804: {'lr': 0.0004661437017674931, 'samples': 5146368, 'steps': 26803, 'loss/train': 1.229723572731018} -11/07/2021 00:59:05 - INFO - __main__ - Step 26805: {'lr': 0.00046614103505783423, 'samples': 5146560, 'steps': 26804, 'loss/train': 1.6293288469314575} -11/07/2021 00:59:05 - INFO - __main__ - Step 26806: {'lr': 0.0004661383682507856, 'samples': 5146752, 'steps': 26805, 'loss/train': 1.8361610174179077} -11/07/2021 00:59:06 - INFO - __main__ - Step 26807: {'lr': 0.00046613570134634825, 'samples': 5146944, 'steps': 26806, 'loss/train': 1.4449939727783203} -11/07/2021 00:59:06 - INFO - __main__ - Step 26808: {'lr': 0.00046613303434452346, 'samples': 5147136, 'steps': 26807, 'loss/train': 1.5649182796478271} -11/07/2021 00:59:07 - INFO - __main__ - Step 26809: {'lr': 0.00046613036724531254, 'samples': 5147328, 'steps': 26808, 'loss/train': 1.4508755207061768} -11/07/2021 00:59:07 - INFO - __main__ - Step 26810: {'lr': 0.00046612770004871663, 'samples': 5147520, 'steps': 26809, 'loss/train': 0.7488903403282166} -11/07/2021 00:59:08 - INFO - __main__ - Step 26811: {'lr': 0.00046612503275473687, 'samples': 5147712, 'steps': 26810, 'loss/train': 1.3369272947311401} -11/07/2021 00:59:08 - INFO - __main__ - Step 26812: {'lr': 0.00046612236536337456, 'samples': 5147904, 'steps': 26811, 'loss/train': 1.7601577043533325} -11/07/2021 00:59:08 - INFO - __main__ - Step 26813: {'lr': 0.00046611969787463083, 'samples': 5148096, 'steps': 26812, 'loss/train': 1.4340001344680786} -11/07/2021 00:59:10 - INFO - __main__ - Step 26814: {'lr': 0.00046611703028850683, 'samples': 5148288, 'steps': 26813, 'loss/train': 1.94196617603302} -11/07/2021 00:59:10 - INFO - __main__ - Step 26815: {'lr': 0.00046611436260500386, 'samples': 5148480, 'steps': 26814, 'loss/train': 1.50175142288208} -11/07/2021 00:59:10 - INFO - __main__ - Step 26816: {'lr': 0.00046611169482412305, 'samples': 5148672, 'steps': 26815, 'loss/train': 1.3230130672454834} -11/07/2021 00:59:11 - INFO - __main__ - Step 26817: {'lr': 0.00046610902694586576, 'samples': 5148864, 'steps': 26816, 'loss/train': 1.762872338294983} -11/07/2021 00:59:11 - INFO - __main__ - Step 26818: {'lr': 0.00046610635897023303, 'samples': 5149056, 'steps': 26817, 'loss/train': 0.9505210518836975} -11/07/2021 00:59:11 - INFO - __main__ - Step 26819: {'lr': 0.0004661036908972261, 'samples': 5149248, 'steps': 26818, 'loss/train': 1.371229648590088} -11/07/2021 00:59:12 - INFO - __main__ - Step 26820: {'lr': 0.0004661010227268462, 'samples': 5149440, 'steps': 26819, 'loss/train': 1.170758605003357} -11/07/2021 00:59:13 - INFO - __main__ - Step 26821: {'lr': 0.0004660983544590944, 'samples': 5149632, 'steps': 26820, 'loss/train': 1.5897732973098755} -11/07/2021 00:59:13 - INFO - __main__ - Step 26822: {'lr': 0.0004660956860939722, 'samples': 5149824, 'steps': 26821, 'loss/train': 1.6550143957138062} -11/07/2021 00:59:13 - INFO - __main__ - Step 26823: {'lr': 0.0004660930176314805, 'samples': 5150016, 'steps': 26822, 'loss/train': 1.2598298788070679} -11/07/2021 00:59:14 - INFO - __main__ - Step 26824: {'lr': 0.0004660903490716206, 'samples': 5150208, 'steps': 26823, 'loss/train': 1.2444219589233398} -11/07/2021 00:59:15 - INFO - __main__ - Step 26825: {'lr': 0.0004660876804143938, 'samples': 5150400, 'steps': 26824, 'loss/train': 1.2991782426834106} -11/07/2021 00:59:15 - INFO - __main__ - Step 26826: {'lr': 0.0004660850116598012, 'samples': 5150592, 'steps': 26825, 'loss/train': 2.0060222148895264} -11/07/2021 00:59:16 - INFO - __main__ - Step 26827: {'lr': 0.00046608234280784406, 'samples': 5150784, 'steps': 26826, 'loss/train': 1.3262913227081299} -11/07/2021 00:59:16 - INFO - __main__ - Step 26828: {'lr': 0.0004660796738585235, 'samples': 5150976, 'steps': 26827, 'loss/train': 1.8722556829452515} -11/07/2021 00:59:16 - INFO - __main__ - Step 26829: {'lr': 0.0004660770048118408, 'samples': 5151168, 'steps': 26828, 'loss/train': 1.2325032949447632} -11/07/2021 00:59:18 - INFO - __main__ - Step 26830: {'lr': 0.00046607433566779713, 'samples': 5151360, 'steps': 26829, 'loss/train': 0.7690796256065369} -11/07/2021 00:59:18 - INFO - __main__ - Step 26831: {'lr': 0.00046607166642639365, 'samples': 5151552, 'steps': 26830, 'loss/train': 1.4862192869186401} -11/07/2021 00:59:18 - INFO - __main__ - Step 26832: {'lr': 0.00046606899708763174, 'samples': 5151744, 'steps': 26831, 'loss/train': 1.6997482776641846} -11/07/2021 00:59:19 - INFO - __main__ - Step 26833: {'lr': 0.0004660663276515124, 'samples': 5151936, 'steps': 26832, 'loss/train': 1.7106437683105469} -11/07/2021 00:59:19 - INFO - __main__ - Step 26834: {'lr': 0.00046606365811803686, 'samples': 5152128, 'steps': 26833, 'loss/train': 1.5306406021118164} -11/07/2021 00:59:20 - INFO - __main__ - Step 26835: {'lr': 0.0004660609884872064, 'samples': 5152320, 'steps': 26834, 'loss/train': 1.4699666500091553} -11/07/2021 00:59:20 - INFO - __main__ - Step 26836: {'lr': 0.00046605831875902215, 'samples': 5152512, 'steps': 26835, 'loss/train': 1.2721798419952393} -11/07/2021 00:59:21 - INFO - __main__ - Step 26837: {'lr': 0.00046605564893348545, 'samples': 5152704, 'steps': 26836, 'loss/train': 1.8770490884780884} -11/07/2021 00:59:21 - INFO - __main__ - Step 26838: {'lr': 0.0004660529790105974, 'samples': 5152896, 'steps': 26837, 'loss/train': 1.1704834699630737} -11/07/2021 00:59:21 - INFO - __main__ - Step 26839: {'lr': 0.00046605030899035915, 'samples': 5153088, 'steps': 26838, 'loss/train': 1.6779916286468506} -11/07/2021 00:59:23 - INFO - __main__ - Step 26840: {'lr': 0.000466047638872772, 'samples': 5153280, 'steps': 26839, 'loss/train': 1.5715537071228027} -11/07/2021 00:59:23 - INFO - __main__ - Step 26841: {'lr': 0.0004660449686578371, 'samples': 5153472, 'steps': 26840, 'loss/train': 1.7219822406768799} -11/07/2021 00:59:23 - INFO - __main__ - Step 26842: {'lr': 0.0004660422983455557, 'samples': 5153664, 'steps': 26841, 'loss/train': 1.8314694166183472} -11/07/2021 00:59:24 - INFO - __main__ - Step 26843: {'lr': 0.0004660396279359289, 'samples': 5153856, 'steps': 26842, 'loss/train': 1.2206279039382935} -11/07/2021 00:59:24 - INFO - __main__ - Step 26844: {'lr': 0.000466036957428958, 'samples': 5154048, 'steps': 26843, 'loss/train': 1.7041361331939697} -11/07/2021 00:59:25 - INFO - __main__ - Step 26845: {'lr': 0.0004660342868246442, 'samples': 5154240, 'steps': 26844, 'loss/train': 2.0032145977020264} -11/07/2021 00:59:26 - INFO - __main__ - Step 26846: {'lr': 0.0004660316161229887, 'samples': 5154432, 'steps': 26845, 'loss/train': 0.9417108297348022} -11/07/2021 00:59:26 - INFO - __main__ - Step 26847: {'lr': 0.00046602894532399275, 'samples': 5154624, 'steps': 26846, 'loss/train': 1.3233318328857422} -11/07/2021 00:59:26 - INFO - __main__ - Step 26848: {'lr': 0.00046602627442765744, 'samples': 5154816, 'steps': 26847, 'loss/train': 1.4452942609786987} -11/07/2021 00:59:27 - INFO - __main__ - Step 26849: {'lr': 0.00046602360343398397, 'samples': 5155008, 'steps': 26848, 'loss/train': 1.0663906335830688} -11/07/2021 00:59:27 - INFO - __main__ - Step 26850: {'lr': 0.0004660209323429736, 'samples': 5155200, 'steps': 26849, 'loss/train': 1.239379644393921} -11/07/2021 00:59:27 - INFO - __main__ - Step 26851: {'lr': 0.0004660182611546276, 'samples': 5155392, 'steps': 26850, 'loss/train': 1.7812410593032837} -11/07/2021 00:59:28 - INFO - __main__ - Step 26852: {'lr': 0.0004660155898689471, 'samples': 5155584, 'steps': 26851, 'loss/train': 1.6919243335723877} -11/07/2021 00:59:29 - INFO - __main__ - Step 26853: {'lr': 0.0004660129184859332, 'samples': 5155776, 'steps': 26852, 'loss/train': 2.3535852432250977} -11/07/2021 00:59:29 - INFO - __main__ - Step 26854: {'lr': 0.00046601024700558736, 'samples': 5155968, 'steps': 26853, 'loss/train': 1.173360824584961} -11/07/2021 00:59:30 - INFO - __main__ - Step 26855: {'lr': 0.0004660075754279105, 'samples': 5156160, 'steps': 26854, 'loss/train': 1.432096242904663} -11/07/2021 00:59:30 - INFO - __main__ - Step 26856: {'lr': 0.00046600490375290406, 'samples': 5156352, 'steps': 26855, 'loss/train': 1.6817970275878906} -11/07/2021 00:59:31 - INFO - __main__ - Step 26857: {'lr': 0.0004660022319805691, 'samples': 5156544, 'steps': 26856, 'loss/train': 1.6581238508224487} -11/07/2021 00:59:31 - INFO - __main__ - Step 26858: {'lr': 0.0004659995601109069, 'samples': 5156736, 'steps': 26857, 'loss/train': 1.334643006324768} -11/07/2021 00:59:32 - INFO - __main__ - Step 26859: {'lr': 0.0004659968881439186, 'samples': 5156928, 'steps': 26858, 'loss/train': 1.651904582977295} -11/07/2021 00:59:32 - INFO - __main__ - Step 26860: {'lr': 0.00046599421607960545, 'samples': 5157120, 'steps': 26859, 'loss/train': 1.7464357614517212} -11/07/2021 00:59:32 - INFO - __main__ - Step 26861: {'lr': 0.0004659915439179686, 'samples': 5157312, 'steps': 26860, 'loss/train': 1.5475162267684937} -11/07/2021 00:59:33 - INFO - __main__ - Step 26862: {'lr': 0.0004659888716590094, 'samples': 5157504, 'steps': 26861, 'loss/train': 1.158503770828247} -11/07/2021 00:59:34 - INFO - __main__ - Step 26863: {'lr': 0.00046598619930272883, 'samples': 5157696, 'steps': 26862, 'loss/train': 1.7206814289093018} -11/07/2021 00:59:34 - INFO - __main__ - Step 26864: {'lr': 0.00046598352684912824, 'samples': 5157888, 'steps': 26863, 'loss/train': 1.4895248413085938} -11/07/2021 00:59:34 - INFO - __main__ - Step 26865: {'lr': 0.0004659808542982088, 'samples': 5158080, 'steps': 26864, 'loss/train': 1.326369047164917} -11/07/2021 00:59:35 - INFO - __main__ - Step 26866: {'lr': 0.0004659781816499718, 'samples': 5158272, 'steps': 26865, 'loss/train': 1.5209534168243408} -11/07/2021 00:59:36 - INFO - __main__ - Step 26867: {'lr': 0.0004659755089044183, 'samples': 5158464, 'steps': 26866, 'loss/train': 1.605056643486023} -11/07/2021 00:59:36 - INFO - __main__ - Step 26868: {'lr': 0.00046597283606154957, 'samples': 5158656, 'steps': 26867, 'loss/train': 0.6222965121269226} -11/07/2021 00:59:37 - INFO - __main__ - Step 26869: {'lr': 0.0004659701631213668, 'samples': 5158848, 'steps': 26868, 'loss/train': 1.559769868850708} -11/07/2021 00:59:37 - INFO - __main__ - Step 26870: {'lr': 0.00046596749008387124, 'samples': 5159040, 'steps': 26869, 'loss/train': 1.3670252561569214} -11/07/2021 00:59:37 - INFO - __main__ - Step 26871: {'lr': 0.00046596481694906403, 'samples': 5159232, 'steps': 26870, 'loss/train': 0.9740362763404846} -11/07/2021 00:59:38 - INFO - __main__ - Step 26872: {'lr': 0.00046596214371694643, 'samples': 5159424, 'steps': 26871, 'loss/train': 1.776827335357666} -11/07/2021 00:59:39 - INFO - __main__ - Step 26873: {'lr': 0.00046595947038751963, 'samples': 5159616, 'steps': 26872, 'loss/train': 1.6072895526885986} -11/07/2021 00:59:39 - INFO - __main__ - Step 26874: {'lr': 0.00046595679696078476, 'samples': 5159808, 'steps': 26873, 'loss/train': 1.5575486421585083} -11/07/2021 00:59:39 - INFO - __main__ - Step 26875: {'lr': 0.00046595412343674317, 'samples': 5160000, 'steps': 26874, 'loss/train': 1.6973767280578613} -11/07/2021 00:59:40 - INFO - __main__ - Step 26876: {'lr': 0.00046595144981539596, 'samples': 5160192, 'steps': 26875, 'loss/train': 1.2691295146942139} -11/07/2021 00:59:41 - INFO - __main__ - Step 26877: {'lr': 0.00046594877609674437, 'samples': 5160384, 'steps': 26876, 'loss/train': 1.1658782958984375} -11/07/2021 00:59:41 - INFO - __main__ - Step 26878: {'lr': 0.00046594610228078954, 'samples': 5160576, 'steps': 26877, 'loss/train': 1.6623400449752808} -11/07/2021 00:59:41 - INFO - __main__ - Step 26879: {'lr': 0.00046594342836753276, 'samples': 5160768, 'steps': 26878, 'loss/train': 2.1451001167297363} -11/07/2021 00:59:42 - INFO - __main__ - Step 26880: {'lr': 0.0004659407543569752, 'samples': 5160960, 'steps': 26879, 'loss/train': 1.7946914434432983} -11/07/2021 00:59:42 - INFO - __main__ - Step 26881: {'lr': 0.0004659380802491181, 'samples': 5161152, 'steps': 26880, 'loss/train': 1.3722161054611206} -11/07/2021 00:59:43 - INFO - __main__ - Step 26882: {'lr': 0.00046593540604396256, 'samples': 5161344, 'steps': 26881, 'loss/train': 0.8809364438056946} -11/07/2021 00:59:44 - INFO - __main__ - Step 26883: {'lr': 0.00046593273174150995, 'samples': 5161536, 'steps': 26882, 'loss/train': 1.5647692680358887} -11/07/2021 00:59:44 - INFO - __main__ - Step 26884: {'lr': 0.0004659300573417613, 'samples': 5161728, 'steps': 26883, 'loss/train': 1.522611141204834} -11/07/2021 00:59:44 - INFO - __main__ - Step 26885: {'lr': 0.00046592738284471794, 'samples': 5161920, 'steps': 26884, 'loss/train': 1.2077406644821167} -11/07/2021 00:59:45 - INFO - __main__ - Step 26886: {'lr': 0.000465924708250381, 'samples': 5162112, 'steps': 26885, 'loss/train': 1.7725774049758911} -11/07/2021 00:59:45 - INFO - __main__ - Step 26887: {'lr': 0.00046592203355875177, 'samples': 5162304, 'steps': 26886, 'loss/train': 1.3362911939620972} -11/07/2021 00:59:46 - INFO - __main__ - Step 26888: {'lr': 0.00046591935876983136, 'samples': 5162496, 'steps': 26887, 'loss/train': 1.8308025598526} -11/07/2021 00:59:46 - INFO - __main__ - Step 26889: {'lr': 0.0004659166838836211, 'samples': 5162688, 'steps': 26888, 'loss/train': 1.39945650100708} -11/07/2021 00:59:47 - INFO - __main__ - Step 26890: {'lr': 0.000465914008900122, 'samples': 5162880, 'steps': 26889, 'loss/train': 1.7456254959106445} -11/07/2021 00:59:47 - INFO - __main__ - Step 26891: {'lr': 0.00046591133381933546, 'samples': 5163072, 'steps': 26890, 'loss/train': 1.739495038986206} -11/07/2021 00:59:47 - INFO - __main__ - Step 26892: {'lr': 0.0004659086586412626, 'samples': 5163264, 'steps': 26891, 'loss/train': 1.6727256774902344} -11/07/2021 00:59:49 - INFO - __main__ - Step 26893: {'lr': 0.0004659059833659046, 'samples': 5163456, 'steps': 26892, 'loss/train': 1.331292748451233} -11/07/2021 00:59:49 - INFO - __main__ - Step 26894: {'lr': 0.0004659033079932627, 'samples': 5163648, 'steps': 26893, 'loss/train': 1.4414929151535034} -11/07/2021 00:59:49 - INFO - __main__ - Step 26895: {'lr': 0.00046590063252333806, 'samples': 5163840, 'steps': 26894, 'loss/train': 5.165720462799072} -11/07/2021 00:59:50 - INFO - __main__ - Step 26896: {'lr': 0.000465897956956132, 'samples': 5164032, 'steps': 26895, 'loss/train': 1.4558935165405273} -11/07/2021 00:59:50 - INFO - __main__ - Step 26897: {'lr': 0.0004658952812916456, 'samples': 5164224, 'steps': 26896, 'loss/train': 1.7362563610076904} -11/07/2021 00:59:51 - INFO - __main__ - Step 26898: {'lr': 0.0004658926055298802, 'samples': 5164416, 'steps': 26897, 'loss/train': 1.4366354942321777} -11/07/2021 00:59:52 - INFO - __main__ - Step 26899: {'lr': 0.0004658899296708369, 'samples': 5164608, 'steps': 26898, 'loss/train': 1.7091032266616821} -11/07/2021 00:59:52 - INFO - __main__ - Step 26900: {'lr': 0.00046588725371451685, 'samples': 5164800, 'steps': 26899, 'loss/train': 1.7321528196334839} -11/07/2021 00:59:52 - INFO - __main__ - Step 26901: {'lr': 0.00046588457766092134, 'samples': 5164992, 'steps': 26900, 'loss/train': 1.428074836730957} -11/07/2021 00:59:53 - INFO - __main__ - Step 26902: {'lr': 0.00046588190151005163, 'samples': 5165184, 'steps': 26901, 'loss/train': 1.7397880554199219} -11/07/2021 00:59:54 - INFO - __main__ - Step 26903: {'lr': 0.00046587922526190883, 'samples': 5165376, 'steps': 26902, 'loss/train': 1.7550833225250244} -11/07/2021 00:59:54 - INFO - __main__ - Step 26904: {'lr': 0.00046587654891649423, 'samples': 5165568, 'steps': 26903, 'loss/train': 1.6489547491073608} -11/07/2021 00:59:54 - INFO - __main__ - Step 26905: {'lr': 0.00046587387247380897, 'samples': 5165760, 'steps': 26904, 'loss/train': 1.046838641166687} -11/07/2021 00:59:55 - INFO - __main__ - Step 26906: {'lr': 0.00046587119593385424, 'samples': 5165952, 'steps': 26905, 'loss/train': 1.820117473602295} -11/07/2021 00:59:55 - INFO - __main__ - Step 26907: {'lr': 0.00046586851929663134, 'samples': 5166144, 'steps': 26906, 'loss/train': 1.7989552021026611} -11/07/2021 00:59:56 - INFO - __main__ - Step 26908: {'lr': 0.00046586584256214135, 'samples': 5166336, 'steps': 26907, 'loss/train': 1.5433944463729858} -11/07/2021 00:59:56 - INFO - __main__ - Step 26909: {'lr': 0.0004658631657303856, 'samples': 5166528, 'steps': 26908, 'loss/train': 2.116696834564209} -11/07/2021 00:59:57 - INFO - __main__ - Step 26910: {'lr': 0.0004658604888013652, 'samples': 5166720, 'steps': 26909, 'loss/train': 1.8567917346954346} -11/07/2021 00:59:57 - INFO - __main__ - Step 26911: {'lr': 0.00046585781177508137, 'samples': 5166912, 'steps': 26910, 'loss/train': 1.115211009979248} -11/07/2021 00:59:58 - INFO - __main__ - Step 26912: {'lr': 0.0004658551346515354, 'samples': 5167104, 'steps': 26911, 'loss/train': 1.6359246969223022} -11/07/2021 00:59:59 - INFO - __main__ - Step 26913: {'lr': 0.00046585245743072833, 'samples': 5167296, 'steps': 26912, 'loss/train': 2.238630533218384} -11/07/2021 00:59:59 - INFO - __main__ - Step 26914: {'lr': 0.0004658497801126616, 'samples': 5167488, 'steps': 26913, 'loss/train': 1.3893851041793823} -11/07/2021 00:59:59 - INFO - __main__ - Step 26915: {'lr': 0.00046584710269733623, 'samples': 5167680, 'steps': 26914, 'loss/train': 1.373899221420288} -11/07/2021 01:00:00 - INFO - __main__ - Step 26916: {'lr': 0.00046584442518475354, 'samples': 5167872, 'steps': 26915, 'loss/train': 1.1140812635421753} -11/07/2021 01:00:00 - INFO - __main__ - Step 26917: {'lr': 0.0004658417475749146, 'samples': 5168064, 'steps': 26916, 'loss/train': 1.7710485458374023} -11/07/2021 01:00:01 - INFO - __main__ - Step 26918: {'lr': 0.00046583906986782074, 'samples': 5168256, 'steps': 26917, 'loss/train': 1.4844192266464233} -11/07/2021 01:00:01 - INFO - __main__ - Step 26919: {'lr': 0.0004658363920634732, 'samples': 5168448, 'steps': 26918, 'loss/train': 1.3179831504821777} -11/07/2021 01:00:02 - INFO - __main__ - Step 26920: {'lr': 0.000465833714161873, 'samples': 5168640, 'steps': 26919, 'loss/train': 1.7123818397521973} -11/07/2021 01:00:02 - INFO - __main__ - Step 26921: {'lr': 0.00046583103616302146, 'samples': 5168832, 'steps': 26920, 'loss/train': 1.5609678030014038} -11/07/2021 01:00:02 - INFO - __main__ - Step 26922: {'lr': 0.0004658283580669198, 'samples': 5169024, 'steps': 26921, 'loss/train': 1.2969560623168945} -11/07/2021 01:00:03 - INFO - __main__ - Step 26923: {'lr': 0.0004658256798735693, 'samples': 5169216, 'steps': 26922, 'loss/train': 1.5124496221542358} -11/07/2021 01:00:04 - INFO - __main__ - Step 26924: {'lr': 0.000465823001582971, 'samples': 5169408, 'steps': 26923, 'loss/train': 1.7385716438293457} -11/07/2021 01:00:04 - INFO - __main__ - Step 26925: {'lr': 0.00046582032319512624, 'samples': 5169600, 'steps': 26924, 'loss/train': 1.0073723793029785} -11/07/2021 01:00:05 - INFO - __main__ - Step 26926: {'lr': 0.00046581764471003605, 'samples': 5169792, 'steps': 26925, 'loss/train': 1.363101840019226} -11/07/2021 01:00:05 - INFO - __main__ - Step 26927: {'lr': 0.0004658149661277019, 'samples': 5169984, 'steps': 26926, 'loss/train': 1.4179913997650146} -11/07/2021 01:00:05 - INFO - __main__ - Step 26928: {'lr': 0.0004658122874481248, 'samples': 5170176, 'steps': 26927, 'loss/train': 1.6892448663711548} -11/07/2021 01:00:07 - INFO - __main__ - Step 26929: {'lr': 0.000465809608671306, 'samples': 5170368, 'steps': 26928, 'loss/train': 1.7115468978881836} -11/07/2021 01:00:08 - INFO - __main__ - Step 26930: {'lr': 0.0004658069297972467, 'samples': 5170560, 'steps': 26929, 'loss/train': 2.0289013385772705} -11/07/2021 01:00:08 - INFO - __main__ - Step 26931: {'lr': 0.00046580425082594823, 'samples': 5170752, 'steps': 26930, 'loss/train': 2.270247220993042} -11/07/2021 01:00:08 - INFO - __main__ - Step 26932: {'lr': 0.00046580157175741155, 'samples': 5170944, 'steps': 26931, 'loss/train': 2.732706308364868} -11/07/2021 01:00:09 - INFO - __main__ - Step 26933: {'lr': 0.0004657988925916381, 'samples': 5171136, 'steps': 26932, 'loss/train': 1.691531777381897} -11/07/2021 01:00:09 - INFO - __main__ - Step 26934: {'lr': 0.000465796213328629, 'samples': 5171328, 'steps': 26933, 'loss/train': 1.6522505283355713} -11/07/2021 01:00:10 - INFO - __main__ - Step 26935: {'lr': 0.00046579353396838545, 'samples': 5171520, 'steps': 26934, 'loss/train': 2.0361757278442383} -11/07/2021 01:00:10 - INFO - __main__ - Step 26936: {'lr': 0.00046579085451090864, 'samples': 5171712, 'steps': 26935, 'loss/train': 1.6468123197555542} -11/07/2021 01:00:11 - INFO - __main__ - Step 26937: {'lr': 0.00046578817495619983, 'samples': 5171904, 'steps': 26936, 'loss/train': 1.5967553853988647} -11/07/2021 01:00:11 - INFO - __main__ - Step 26938: {'lr': 0.0004657854953042602, 'samples': 5172096, 'steps': 26937, 'loss/train': 2.384519577026367} -11/07/2021 01:00:12 - INFO - __main__ - Step 26939: {'lr': 0.00046578281555509094, 'samples': 5172288, 'steps': 26938, 'loss/train': 1.3857241868972778} -11/07/2021 01:00:12 - INFO - __main__ - Step 26940: {'lr': 0.00046578013570869325, 'samples': 5172480, 'steps': 26939, 'loss/train': 1.522921085357666} -11/07/2021 01:00:13 - INFO - __main__ - Step 26941: {'lr': 0.00046577745576506844, 'samples': 5172672, 'steps': 26940, 'loss/train': 2.2995705604553223} -11/07/2021 01:00:13 - INFO - __main__ - Step 26942: {'lr': 0.00046577477572421757, 'samples': 5172864, 'steps': 26941, 'loss/train': 1.364117980003357} -11/07/2021 01:00:14 - INFO - __main__ - Step 26943: {'lr': 0.0004657720955861419, 'samples': 5173056, 'steps': 26942, 'loss/train': 1.8198291063308716} -11/07/2021 01:00:14 - INFO - __main__ - Step 26944: {'lr': 0.00046576941535084274, 'samples': 5173248, 'steps': 26943, 'loss/train': 1.622612714767456} -11/07/2021 01:00:14 - INFO - __main__ - Step 26945: {'lr': 0.0004657667350183211, 'samples': 5173440, 'steps': 26944, 'loss/train': 1.3657492399215698} -11/07/2021 01:00:15 - INFO - __main__ - Step 26946: {'lr': 0.00046576405458857836, 'samples': 5173632, 'steps': 26945, 'loss/train': 1.5600732564926147} -11/07/2021 01:00:16 - INFO - __main__ - Step 26947: {'lr': 0.0004657613740616157, 'samples': 5173824, 'steps': 26946, 'loss/train': 1.2829210758209229} -11/07/2021 01:00:16 - INFO - __main__ - Step 26948: {'lr': 0.0004657586934374342, 'samples': 5174016, 'steps': 26947, 'loss/train': 1.333815336227417} -11/07/2021 01:00:17 - INFO - __main__ - Step 26949: {'lr': 0.0004657560127160352, 'samples': 5174208, 'steps': 26948, 'loss/train': 1.4350104331970215} -11/07/2021 01:00:17 - INFO - __main__ - Step 26950: {'lr': 0.00046575333189741993, 'samples': 5174400, 'steps': 26949, 'loss/train': 1.6693968772888184} -11/07/2021 01:00:18 - INFO - __main__ - Step 26951: {'lr': 0.00046575065098158945, 'samples': 5174592, 'steps': 26950, 'loss/train': 1.3539212942123413} -11/07/2021 01:00:18 - INFO - __main__ - Step 26952: {'lr': 0.0004657479699685451, 'samples': 5174784, 'steps': 26951, 'loss/train': 1.4676611423492432} -11/07/2021 01:00:19 - INFO - __main__ - Step 26953: {'lr': 0.00046574528885828803, 'samples': 5174976, 'steps': 26952, 'loss/train': 1.1450750827789307} -11/07/2021 01:00:19 - INFO - __main__ - Step 26954: {'lr': 0.0004657426076508195, 'samples': 5175168, 'steps': 26953, 'loss/train': 1.5569909811019897} -11/07/2021 01:00:19 - INFO - __main__ - Step 26955: {'lr': 0.00046573992634614064, 'samples': 5175360, 'steps': 26954, 'loss/train': 1.4932307004928589} -11/07/2021 01:00:20 - INFO - __main__ - Step 26956: {'lr': 0.00046573724494425274, 'samples': 5175552, 'steps': 26955, 'loss/train': 1.704939842224121} -11/07/2021 01:00:21 - INFO - __main__ - Step 26957: {'lr': 0.00046573456344515694, 'samples': 5175744, 'steps': 26956, 'loss/train': 2.1936867237091064} -11/07/2021 01:00:21 - INFO - __main__ - Step 26958: {'lr': 0.00046573188184885445, 'samples': 5175936, 'steps': 26957, 'loss/train': 1.7155307531356812} -11/07/2021 01:00:21 - INFO - __main__ - Step 26959: {'lr': 0.0004657292001553465, 'samples': 5176128, 'steps': 26958, 'loss/train': 0.9837502837181091} -11/07/2021 01:00:22 - INFO - __main__ - Step 26960: {'lr': 0.0004657265183646344, 'samples': 5176320, 'steps': 26959, 'loss/train': 0.9638455510139465} -11/07/2021 01:00:24 - INFO - __main__ - Step 26961: {'lr': 0.00046572383647671913, 'samples': 5176512, 'steps': 26960, 'loss/train': 1.653584361076355} -11/07/2021 01:00:24 - INFO - __main__ - Step 26962: {'lr': 0.0004657211544916021, 'samples': 5176704, 'steps': 26961, 'loss/train': 1.24321711063385} -11/07/2021 01:00:25 - INFO - __main__ - Step 26963: {'lr': 0.00046571847240928444, 'samples': 5176896, 'steps': 26962, 'loss/train': 1.4641504287719727} -11/07/2021 01:00:25 - INFO - __main__ - Step 26964: {'lr': 0.0004657157902297674, 'samples': 5177088, 'steps': 26963, 'loss/train': 1.522215723991394} -11/07/2021 01:00:25 - INFO - __main__ - Step 26965: {'lr': 0.00046571310795305213, 'samples': 5177280, 'steps': 26964, 'loss/train': 1.6530050039291382} -11/07/2021 01:00:26 - INFO - __main__ - Step 26966: {'lr': 0.0004657104255791398, 'samples': 5177472, 'steps': 26965, 'loss/train': 1.2860393524169922} -11/07/2021 01:00:26 - INFO - __main__ - Step 26967: {'lr': 0.0004657077431080317, 'samples': 5177664, 'steps': 26966, 'loss/train': 1.0747127532958984} -11/07/2021 01:00:26 - INFO - __main__ - Step 26968: {'lr': 0.00046570506053972906, 'samples': 5177856, 'steps': 26967, 'loss/train': 1.3991793394088745} -11/07/2021 01:00:27 - INFO - __main__ - Step 26969: {'lr': 0.000465702377874233, 'samples': 5178048, 'steps': 26968, 'loss/train': 1.2089049816131592} -11/07/2021 01:00:28 - INFO - __main__ - Step 26970: {'lr': 0.00046569969511154485, 'samples': 5178240, 'steps': 26969, 'loss/train': 1.4461259841918945} -11/07/2021 01:00:28 - INFO - __main__ - Step 26971: {'lr': 0.0004656970122516657, 'samples': 5178432, 'steps': 26970, 'loss/train': 1.7595458030700684} -11/07/2021 01:00:28 - INFO - __main__ - Step 26972: {'lr': 0.0004656943292945968, 'samples': 5178624, 'steps': 26971, 'loss/train': 1.6467506885528564} -11/07/2021 01:00:29 - INFO - __main__ - Step 26973: {'lr': 0.0004656916462403394, 'samples': 5178816, 'steps': 26972, 'loss/train': 1.8223869800567627} -11/07/2021 01:00:30 - INFO - __main__ - Step 26974: {'lr': 0.0004656889630888946, 'samples': 5179008, 'steps': 26973, 'loss/train': 1.9120339155197144} -11/07/2021 01:00:30 - INFO - __main__ - Step 26975: {'lr': 0.0004656862798402638, 'samples': 5179200, 'steps': 26974, 'loss/train': 1.7358126640319824} -11/07/2021 01:00:30 - INFO - __main__ - Step 26976: {'lr': 0.00046568359649444796, 'samples': 5179392, 'steps': 26975, 'loss/train': 1.541935920715332} -11/07/2021 01:00:31 - INFO - __main__ - Step 26977: {'lr': 0.0004656809130514485, 'samples': 5179584, 'steps': 26976, 'loss/train': 1.5258926153182983} -11/07/2021 01:00:31 - INFO - __main__ - Step 26978: {'lr': 0.00046567822951126646, 'samples': 5179776, 'steps': 26977, 'loss/train': 0.8509805798530579} -11/07/2021 01:00:32 - INFO - __main__ - Step 26979: {'lr': 0.00046567554587390324, 'samples': 5179968, 'steps': 26978, 'loss/train': 1.5014252662658691} -11/07/2021 01:00:33 - INFO - __main__ - Step 26980: {'lr': 0.00046567286213935994, 'samples': 5180160, 'steps': 26979, 'loss/train': 1.6096993684768677} -11/07/2021 01:00:33 - INFO - __main__ - Step 26981: {'lr': 0.00046567017830763776, 'samples': 5180352, 'steps': 26980, 'loss/train': 1.5932661294937134} -11/07/2021 01:00:33 - INFO - __main__ - Step 26982: {'lr': 0.0004656674943787379, 'samples': 5180544, 'steps': 26981, 'loss/train': 1.6337497234344482} -11/07/2021 01:00:34 - INFO - __main__ - Step 26983: {'lr': 0.0004656648103526616, 'samples': 5180736, 'steps': 26982, 'loss/train': 1.1553945541381836} -11/07/2021 01:00:34 - INFO - __main__ - Step 26984: {'lr': 0.00046566212622941005, 'samples': 5180928, 'steps': 26983, 'loss/train': 1.3024195432662964} -11/07/2021 01:00:35 - INFO - __main__ - Step 26985: {'lr': 0.00046565944200898453, 'samples': 5181120, 'steps': 26984, 'loss/train': 1.115247130393982} -11/07/2021 01:00:35 - INFO - __main__ - Step 26986: {'lr': 0.00046565675769138614, 'samples': 5181312, 'steps': 26985, 'loss/train': 1.7781128883361816} -11/07/2021 01:00:36 - INFO - __main__ - Step 26987: {'lr': 0.00046565407327661614, 'samples': 5181504, 'steps': 26986, 'loss/train': 1.3278738260269165} -11/07/2021 01:00:36 - INFO - __main__ - Step 26988: {'lr': 0.0004656513887646758, 'samples': 5181696, 'steps': 26987, 'loss/train': 1.3004204034805298} -11/07/2021 01:00:37 - INFO - __main__ - Step 26989: {'lr': 0.00046564870415556625, 'samples': 5181888, 'steps': 26988, 'loss/train': 1.5969914197921753} -11/07/2021 01:00:38 - INFO - __main__ - Step 26990: {'lr': 0.0004656460194492887, 'samples': 5182080, 'steps': 26989, 'loss/train': 1.6689649820327759} -11/07/2021 01:00:38 - INFO - __main__ - Step 26991: {'lr': 0.0004656433346458444, 'samples': 5182272, 'steps': 26990, 'loss/train': 1.328795075416565} -11/07/2021 01:00:38 - INFO - __main__ - Step 26992: {'lr': 0.0004656406497452345, 'samples': 5182464, 'steps': 26991, 'loss/train': 1.5303890705108643} -11/07/2021 01:00:39 - INFO - __main__ - Step 26993: {'lr': 0.0004656379647474603, 'samples': 5182656, 'steps': 26992, 'loss/train': 1.785988211631775} -11/07/2021 01:00:39 - INFO - __main__ - Step 26994: {'lr': 0.0004656352796525229, 'samples': 5182848, 'steps': 26993, 'loss/train': 1.4376311302185059} -11/07/2021 01:00:39 - INFO - __main__ - Step 26995: {'lr': 0.0004656325944604236, 'samples': 5183040, 'steps': 26994, 'loss/train': 1.5736900568008423} -11/07/2021 01:00:40 - INFO - __main__ - Step 26996: {'lr': 0.00046562990917116366, 'samples': 5183232, 'steps': 26995, 'loss/train': 1.916595697402954} -11/07/2021 01:00:41 - INFO - __main__ - Step 26997: {'lr': 0.0004656272237847441, 'samples': 5183424, 'steps': 26996, 'loss/train': 1.01767098903656} -11/07/2021 01:00:41 - INFO - __main__ - Step 26998: {'lr': 0.0004656245383011663, 'samples': 5183616, 'steps': 26997, 'loss/train': 1.6805261373519897} -11/07/2021 01:00:42 - INFO - __main__ - Step 26999: {'lr': 0.00046562185272043137, 'samples': 5183808, 'steps': 26998, 'loss/train': 1.7131564617156982} -11/07/2021 01:00:42 - INFO - __main__ - Step 27000: {'lr': 0.00046561916704254057, 'samples': 5184000, 'steps': 26999, 'loss/train': 1.855010986328125} -11/07/2021 01:00:43 - INFO - __main__ - Step 27001: {'lr': 0.0004656164812674951, 'samples': 5184192, 'steps': 27000, 'loss/train': 1.456249475479126} -11/07/2021 01:00:43 - INFO - __main__ - Step 27002: {'lr': 0.00046561379539529626, 'samples': 5184384, 'steps': 27001, 'loss/train': 0.16935046017169952} -11/07/2021 01:00:44 - INFO - __main__ - Step 27003: {'lr': 0.0004656111094259451, 'samples': 5184576, 'steps': 27002, 'loss/train': 1.3302737474441528} -11/07/2021 01:00:44 - INFO - __main__ - Step 27004: {'lr': 0.0004656084233594429, 'samples': 5184768, 'steps': 27003, 'loss/train': 1.6964117288589478} -11/07/2021 01:00:44 - INFO - __main__ - Step 27005: {'lr': 0.0004656057371957908, 'samples': 5184960, 'steps': 27004, 'loss/train': 1.0182842016220093} -11/07/2021 01:00:45 - INFO - __main__ - Step 27006: {'lr': 0.00046560305093499015, 'samples': 5185152, 'steps': 27005, 'loss/train': 1.4617400169372559} -11/07/2021 01:00:46 - INFO - __main__ - Step 27007: {'lr': 0.00046560036457704215, 'samples': 5185344, 'steps': 27006, 'loss/train': 1.2601394653320312} -11/07/2021 01:00:46 - INFO - __main__ - Step 27008: {'lr': 0.00046559767812194786, 'samples': 5185536, 'steps': 27007, 'loss/train': 1.5308825969696045} -11/07/2021 01:00:46 - INFO - __main__ - Step 27009: {'lr': 0.0004655949915697086, 'samples': 5185728, 'steps': 27008, 'loss/train': 1.6513859033584595} -11/07/2021 01:00:47 - INFO - __main__ - Step 27010: {'lr': 0.0004655923049203256, 'samples': 5185920, 'steps': 27009, 'loss/train': 1.715781807899475} -11/07/2021 01:00:48 - INFO - __main__ - Step 27011: {'lr': 0.00046558961817380005, 'samples': 5186112, 'steps': 27010, 'loss/train': 1.478920578956604} -11/07/2021 01:00:48 - INFO - __main__ - Step 27012: {'lr': 0.00046558693133013306, 'samples': 5186304, 'steps': 27011, 'loss/train': 1.7847849130630493} -11/07/2021 01:00:49 - INFO - __main__ - Step 27013: {'lr': 0.000465584244389326, 'samples': 5186496, 'steps': 27012, 'loss/train': 1.8046079874038696} -11/07/2021 01:00:49 - INFO - __main__ - Step 27014: {'lr': 0.00046558155735137996, 'samples': 5186688, 'steps': 27013, 'loss/train': 1.7372362613677979} -11/07/2021 01:00:49 - INFO - __main__ - Step 27015: {'lr': 0.00046557887021629623, 'samples': 5186880, 'steps': 27014, 'loss/train': 1.6177726984024048} -11/07/2021 01:00:50 - INFO - __main__ - Step 27016: {'lr': 0.000465576182984076, 'samples': 5187072, 'steps': 27015, 'loss/train': 1.7490988969802856} -11/07/2021 01:00:51 - INFO - __main__ - Step 27017: {'lr': 0.0004655734956547204, 'samples': 5187264, 'steps': 27016, 'loss/train': 1.8980671167373657} -11/07/2021 01:00:51 - INFO - __main__ - Step 27018: {'lr': 0.00046557080822823076, 'samples': 5187456, 'steps': 27017, 'loss/train': 1.4750101566314697} -11/07/2021 01:00:52 - INFO - __main__ - Step 27019: {'lr': 0.0004655681207046083, 'samples': 5187648, 'steps': 27018, 'loss/train': 1.6902590990066528} -11/07/2021 01:00:52 - INFO - __main__ - Step 27020: {'lr': 0.0004655654330838541, 'samples': 5187840, 'steps': 27019, 'loss/train': 0.45184364914894104} -11/07/2021 01:00:53 - INFO - __main__ - Step 27021: {'lr': 0.00046556274536596945, 'samples': 5188032, 'steps': 27020, 'loss/train': 1.976624846458435} -11/07/2021 01:00:53 - INFO - __main__ - Step 27022: {'lr': 0.00046556005755095555, 'samples': 5188224, 'steps': 27021, 'loss/train': 1.4296730756759644} -11/07/2021 01:00:54 - INFO - __main__ - Step 27023: {'lr': 0.00046555736963881355, 'samples': 5188416, 'steps': 27022, 'loss/train': 1.521439552307129} -11/07/2021 01:00:54 - INFO - __main__ - Step 27024: {'lr': 0.0004655546816295448, 'samples': 5188608, 'steps': 27023, 'loss/train': 1.745589256286621} -11/07/2021 01:00:54 - INFO - __main__ - Step 27025: {'lr': 0.0004655519935231505, 'samples': 5188800, 'steps': 27024, 'loss/train': 1.2226965427398682} -11/07/2021 01:00:55 - INFO - __main__ - Step 27026: {'lr': 0.00046554930531963166, 'samples': 5188992, 'steps': 27025, 'loss/train': 1.0397146940231323} -11/07/2021 01:00:56 - INFO - __main__ - Step 27027: {'lr': 0.0004655466170189897, 'samples': 5189184, 'steps': 27026, 'loss/train': 1.48588228225708} -11/07/2021 01:00:56 - INFO - __main__ - Step 27028: {'lr': 0.0004655439286212257, 'samples': 5189376, 'steps': 27027, 'loss/train': 2.311471939086914} -11/07/2021 01:00:57 - INFO - __main__ - Step 27029: {'lr': 0.00046554124012634105, 'samples': 5189568, 'steps': 27028, 'loss/train': 1.452401876449585} -11/07/2021 01:00:57 - INFO - __main__ - Step 27030: {'lr': 0.0004655385515343368, 'samples': 5189760, 'steps': 27029, 'loss/train': 2.314892530441284} -11/07/2021 01:00:57 - INFO - __main__ - Step 27031: {'lr': 0.0004655358628452142, 'samples': 5189952, 'steps': 27030, 'loss/train': 1.920503854751587} -11/07/2021 01:00:58 - INFO - __main__ - Step 27032: {'lr': 0.00046553317405897444, 'samples': 5190144, 'steps': 27031, 'loss/train': 1.8143914937973022} -11/07/2021 01:00:59 - INFO - __main__ - Step 27033: {'lr': 0.0004655304851756188, 'samples': 5190336, 'steps': 27032, 'loss/train': 1.876479983329773} -11/07/2021 01:00:59 - INFO - __main__ - Step 27034: {'lr': 0.0004655277961951484, 'samples': 5190528, 'steps': 27033, 'loss/train': 1.343095302581787} -11/07/2021 01:00:59 - INFO - __main__ - Step 27035: {'lr': 0.00046552510711756444, 'samples': 5190720, 'steps': 27034, 'loss/train': 1.8001316785812378} -11/07/2021 01:01:00 - INFO - __main__ - Step 27036: {'lr': 0.0004655224179428683, 'samples': 5190912, 'steps': 27035, 'loss/train': 1.749971628189087} -11/07/2021 01:01:01 - INFO - __main__ - Step 27037: {'lr': 0.00046551972867106106, 'samples': 5191104, 'steps': 27036, 'loss/train': 1.6416561603546143} -11/07/2021 01:01:01 - INFO - __main__ - Step 27038: {'lr': 0.00046551703930214393, 'samples': 5191296, 'steps': 27037, 'loss/train': 1.3201777935028076} -11/07/2021 01:01:02 - INFO - __main__ - Step 27039: {'lr': 0.00046551434983611823, 'samples': 5191488, 'steps': 27038, 'loss/train': 1.6423300504684448} -11/07/2021 01:01:02 - INFO - __main__ - Step 27040: {'lr': 0.00046551166027298505, 'samples': 5191680, 'steps': 27039, 'loss/train': 2.7235004901885986} -11/07/2021 01:01:02 - INFO - __main__ - Step 27041: {'lr': 0.0004655089706127456, 'samples': 5191872, 'steps': 27040, 'loss/train': 1.454121470451355} -11/07/2021 01:01:03 - INFO - __main__ - Step 27042: {'lr': 0.00046550628085540114, 'samples': 5192064, 'steps': 27041, 'loss/train': 1.6096910238265991} -11/07/2021 01:01:04 - INFO - __main__ - Step 27043: {'lr': 0.0004655035910009529, 'samples': 5192256, 'steps': 27042, 'loss/train': 1.7329154014587402} -11/07/2021 01:01:04 - INFO - __main__ - Step 27044: {'lr': 0.00046550090104940207, 'samples': 5192448, 'steps': 27043, 'loss/train': 1.8347967863082886} -11/07/2021 01:01:04 - INFO - __main__ - Step 27045: {'lr': 0.00046549821100074987, 'samples': 5192640, 'steps': 27044, 'loss/train': 1.4639747142791748} -11/07/2021 01:01:05 - INFO - __main__ - Step 27046: {'lr': 0.0004654955208549975, 'samples': 5192832, 'steps': 27045, 'loss/train': 1.7632167339324951} -11/07/2021 01:01:05 - INFO - __main__ - Step 27047: {'lr': 0.0004654928306121461, 'samples': 5193024, 'steps': 27046, 'loss/train': 1.101479172706604} -11/07/2021 01:01:07 - INFO - __main__ - Step 27048: {'lr': 0.000465490140272197, 'samples': 5193216, 'steps': 27047, 'loss/train': 1.7649903297424316} -11/07/2021 01:01:07 - INFO - __main__ - Step 27049: {'lr': 0.00046548744983515133, 'samples': 5193408, 'steps': 27048, 'loss/train': 1.3125827312469482} -11/07/2021 01:01:07 - INFO - __main__ - Step 27050: {'lr': 0.0004654847593010104, 'samples': 5193600, 'steps': 27049, 'loss/train': 1.8120845556259155} -11/07/2021 01:01:08 - INFO - __main__ - Step 27051: {'lr': 0.0004654820686697754, 'samples': 5193792, 'steps': 27050, 'loss/train': 0.23133371770381927} -11/07/2021 01:01:08 - INFO - __main__ - Step 27052: {'lr': 0.00046547937794144743, 'samples': 5193984, 'steps': 27051, 'loss/train': 1.9630906581878662} -11/07/2021 01:01:09 - INFO - __main__ - Step 27053: {'lr': 0.00046547668711602774, 'samples': 5194176, 'steps': 27052, 'loss/train': 1.4378554821014404} -11/07/2021 01:01:09 - INFO - __main__ - Step 27054: {'lr': 0.0004654739961935177, 'samples': 5194368, 'steps': 27053, 'loss/train': 1.6807277202606201} -11/07/2021 01:01:10 - INFO - __main__ - Step 27055: {'lr': 0.0004654713051739183, 'samples': 5194560, 'steps': 27054, 'loss/train': 1.4902753829956055} -11/07/2021 01:01:10 - INFO - __main__ - Step 27056: {'lr': 0.000465468614057231, 'samples': 5194752, 'steps': 27055, 'loss/train': 1.6699409484863281} -11/07/2021 01:01:10 - INFO - __main__ - Step 27057: {'lr': 0.0004654659228434567, 'samples': 5194944, 'steps': 27056, 'loss/train': 1.7816848754882812} -11/07/2021 01:01:11 - INFO - __main__ - Step 27058: {'lr': 0.00046546323153259686, 'samples': 5195136, 'steps': 27057, 'loss/train': 1.823567509651184} -11/07/2021 01:01:12 - INFO - __main__ - Step 27059: {'lr': 0.00046546054012465253, 'samples': 5195328, 'steps': 27058, 'loss/train': 1.432388186454773} -11/07/2021 01:01:12 - INFO - __main__ - Step 27060: {'lr': 0.00046545784861962516, 'samples': 5195520, 'steps': 27059, 'loss/train': 1.312885046005249} -11/07/2021 01:01:12 - INFO - __main__ - Step 27061: {'lr': 0.00046545515701751567, 'samples': 5195712, 'steps': 27060, 'loss/train': 1.9596468210220337} -11/07/2021 01:01:13 - INFO - __main__ - Step 27062: {'lr': 0.00046545246531832547, 'samples': 5195904, 'steps': 27061, 'loss/train': 1.8299909830093384} -11/07/2021 01:01:14 - INFO - __main__ - Step 27063: {'lr': 0.0004654497735220557, 'samples': 5196096, 'steps': 27062, 'loss/train': 1.0981870889663696} -11/07/2021 01:01:14 - INFO - __main__ - Step 27064: {'lr': 0.0004654470816287076, 'samples': 5196288, 'steps': 27063, 'loss/train': 1.9853992462158203} -11/07/2021 01:01:15 - INFO - __main__ - Step 27065: {'lr': 0.0004654443896382824, 'samples': 5196480, 'steps': 27064, 'loss/train': 2.3117482662200928} -11/07/2021 01:01:15 - INFO - __main__ - Step 27066: {'lr': 0.0004654416975507812, 'samples': 5196672, 'steps': 27065, 'loss/train': 1.6154303550720215} -11/07/2021 01:01:15 - INFO - __main__ - Step 27067: {'lr': 0.0004654390053662053, 'samples': 5196864, 'steps': 27066, 'loss/train': 1.7417590618133545} -11/07/2021 01:01:16 - INFO - __main__ - Step 27068: {'lr': 0.000465436313084556, 'samples': 5197056, 'steps': 27067, 'loss/train': 1.621261477470398} -11/07/2021 01:01:17 - INFO - __main__ - Step 27069: {'lr': 0.0004654336207058344, 'samples': 5197248, 'steps': 27068, 'loss/train': 1.588318943977356} -11/07/2021 01:01:17 - INFO - __main__ - Step 27070: {'lr': 0.0004654309282300416, 'samples': 5197440, 'steps': 27069, 'loss/train': 1.6834807395935059} -11/07/2021 01:01:17 - INFO - __main__ - Step 27071: {'lr': 0.00046542823565717914, 'samples': 5197632, 'steps': 27070, 'loss/train': 1.6977858543395996} -11/07/2021 01:01:18 - INFO - __main__ - Step 27072: {'lr': 0.00046542554298724793, 'samples': 5197824, 'steps': 27071, 'loss/train': 1.3400862216949463} -11/07/2021 01:01:19 - INFO - __main__ - Step 27073: {'lr': 0.00046542285022024935, 'samples': 5198016, 'steps': 27072, 'loss/train': 1.7301197052001953} -11/07/2021 01:01:19 - INFO - __main__ - Step 27074: {'lr': 0.0004654201573561845, 'samples': 5198208, 'steps': 27073, 'loss/train': 1.090531587600708} -11/07/2021 01:01:20 - INFO - __main__ - Step 27075: {'lr': 0.00046541746439505467, 'samples': 5198400, 'steps': 27074, 'loss/train': 1.289291501045227} -11/07/2021 01:01:20 - INFO - __main__ - Step 27076: {'lr': 0.00046541477133686107, 'samples': 5198592, 'steps': 27075, 'loss/train': 1.4234788417816162} -11/07/2021 01:01:20 - INFO - __main__ - Step 27077: {'lr': 0.0004654120781816049, 'samples': 5198784, 'steps': 27076, 'loss/train': 1.8242205381393433} -11/07/2021 01:01:21 - INFO - __main__ - Step 27078: {'lr': 0.00046540938492928735, 'samples': 5198976, 'steps': 27077, 'loss/train': 2.2250328063964844} -11/07/2021 01:01:22 - INFO - __main__ - Step 27079: {'lr': 0.0004654066915799097, 'samples': 5199168, 'steps': 27078, 'loss/train': 1.3047109842300415} -11/07/2021 01:01:22 - INFO - __main__ - Step 27080: {'lr': 0.000465403998133473, 'samples': 5199360, 'steps': 27079, 'loss/train': 1.8516128063201904} -11/07/2021 01:01:22 - INFO - __main__ - Step 27081: {'lr': 0.0004654013045899788, 'samples': 5199552, 'steps': 27080, 'loss/train': 1.7745814323425293} -11/07/2021 01:01:23 - INFO - __main__ - Step 27082: {'lr': 0.00046539861094942794, 'samples': 5199744, 'steps': 27081, 'loss/train': 1.7650301456451416} -11/07/2021 01:01:24 - INFO - __main__ - Step 27083: {'lr': 0.00046539591721182175, 'samples': 5199936, 'steps': 27082, 'loss/train': 1.4061222076416016} -11/07/2021 01:01:24 - INFO - __main__ - Step 27084: {'lr': 0.00046539322337716153, 'samples': 5200128, 'steps': 27083, 'loss/train': 2.0047829151153564} -11/07/2021 01:01:24 - INFO - __main__ - Step 27085: {'lr': 0.00046539052944544846, 'samples': 5200320, 'steps': 27084, 'loss/train': 1.4529653787612915} -11/07/2021 01:01:25 - INFO - __main__ - Step 27086: {'lr': 0.0004653878354166838, 'samples': 5200512, 'steps': 27085, 'loss/train': 1.6772856712341309} -11/07/2021 01:01:25 - INFO - __main__ - Step 27087: {'lr': 0.0004653851412908686, 'samples': 5200704, 'steps': 27086, 'loss/train': 1.6235452890396118} -11/07/2021 01:01:25 - INFO - __main__ - Step 27088: {'lr': 0.0004653824470680043, 'samples': 5200896, 'steps': 27087, 'loss/train': 1.2486436367034912} -11/07/2021 01:01:27 - INFO - __main__ - Step 27089: {'lr': 0.00046537975274809186, 'samples': 5201088, 'steps': 27088, 'loss/train': 1.7086710929870605} -11/07/2021 01:01:27 - INFO - __main__ - Step 27090: {'lr': 0.0004653770583311327, 'samples': 5201280, 'steps': 27089, 'loss/train': 1.279076099395752} -11/07/2021 01:01:27 - INFO - __main__ - Step 27091: {'lr': 0.00046537436381712796, 'samples': 5201472, 'steps': 27090, 'loss/train': 0.8488227725028992} -11/07/2021 01:01:28 - INFO - __main__ - Step 27092: {'lr': 0.00046537166920607886, 'samples': 5201664, 'steps': 27091, 'loss/train': 2.424959897994995} -11/07/2021 01:01:28 - INFO - __main__ - Step 27093: {'lr': 0.00046536897449798656, 'samples': 5201856, 'steps': 27092, 'loss/train': 1.0911108255386353} -11/07/2021 01:01:29 - INFO - __main__ - Step 27094: {'lr': 0.00046536627969285236, 'samples': 5202048, 'steps': 27093, 'loss/train': 1.772316813468933} -11/07/2021 01:01:29 - INFO - __main__ - Step 27095: {'lr': 0.0004653635847906774, 'samples': 5202240, 'steps': 27094, 'loss/train': 0.8457456231117249} -11/07/2021 01:01:30 - INFO - __main__ - Step 27096: {'lr': 0.000465360889791463, 'samples': 5202432, 'steps': 27095, 'loss/train': 1.7497080564498901} -11/07/2021 01:01:30 - INFO - __main__ - Step 27097: {'lr': 0.0004653581946952103, 'samples': 5202624, 'steps': 27096, 'loss/train': 1.5715991258621216} -11/07/2021 01:01:30 - INFO - __main__ - Step 27098: {'lr': 0.0004653554995019205, 'samples': 5202816, 'steps': 27097, 'loss/train': 1.6218191385269165} -11/07/2021 01:01:31 - INFO - __main__ - Step 27099: {'lr': 0.0004653528042115948, 'samples': 5203008, 'steps': 27098, 'loss/train': 1.8767164945602417} -11/07/2021 01:01:32 - INFO - __main__ - Step 27100: {'lr': 0.0004653501088242345, 'samples': 5203200, 'steps': 27099, 'loss/train': 1.2835679054260254} -11/07/2021 01:01:32 - INFO - __main__ - Step 27101: {'lr': 0.0004653474133398408, 'samples': 5203392, 'steps': 27100, 'loss/train': 1.3385190963745117} -11/07/2021 01:01:32 - INFO - __main__ - Step 27102: {'lr': 0.00046534471775841474, 'samples': 5203584, 'steps': 27101, 'loss/train': 1.365417718887329} -11/07/2021 01:01:33 - INFO - __main__ - Step 27103: {'lr': 0.0004653420220799578, 'samples': 5203776, 'steps': 27102, 'loss/train': 1.6177514791488647} -11/07/2021 01:01:34 - INFO - __main__ - Step 27104: {'lr': 0.000465339326304471, 'samples': 5203968, 'steps': 27103, 'loss/train': 1.4537159204483032} -11/07/2021 01:01:34 - INFO - __main__ - Step 27105: {'lr': 0.0004653366304319556, 'samples': 5204160, 'steps': 27104, 'loss/train': 1.086722493171692} -11/07/2021 01:01:35 - INFO - __main__ - Step 27106: {'lr': 0.0004653339344624129, 'samples': 5204352, 'steps': 27105, 'loss/train': 1.5146363973617554} -11/07/2021 01:01:35 - INFO - __main__ - Step 27107: {'lr': 0.00046533123839584406, 'samples': 5204544, 'steps': 27106, 'loss/train': 1.4945223331451416} -11/07/2021 01:01:35 - INFO - __main__ - Step 27108: {'lr': 0.0004653285422322503, 'samples': 5204736, 'steps': 27107, 'loss/train': 1.6637580394744873} -11/07/2021 01:01:36 - INFO - __main__ - Step 27109: {'lr': 0.00046532584597163275, 'samples': 5204928, 'steps': 27108, 'loss/train': 1.4501129388809204} -11/07/2021 01:01:37 - INFO - __main__ - Step 27110: {'lr': 0.0004653231496139927, 'samples': 5205120, 'steps': 27109, 'loss/train': 1.5620125532150269} -11/07/2021 01:01:37 - INFO - __main__ - Step 27111: {'lr': 0.0004653204531593315, 'samples': 5205312, 'steps': 27110, 'loss/train': 1.3244616985321045} -11/07/2021 01:01:38 - INFO - __main__ - Step 27112: {'lr': 0.0004653177566076501, 'samples': 5205504, 'steps': 27111, 'loss/train': 1.5549123287200928} -11/07/2021 01:01:38 - INFO - __main__ - Step 27113: {'lr': 0.0004653150599589498, 'samples': 5205696, 'steps': 27112, 'loss/train': 1.4433401823043823} -11/07/2021 01:01:38 - INFO - __main__ - Step 27114: {'lr': 0.0004653123632132319, 'samples': 5205888, 'steps': 27113, 'loss/train': 1.7523740530014038} -11/07/2021 01:01:39 - INFO - __main__ - Step 27115: {'lr': 0.0004653096663704976, 'samples': 5206080, 'steps': 27114, 'loss/train': 1.6249898672103882} -11/07/2021 01:01:40 - INFO - __main__ - Step 27116: {'lr': 0.0004653069694307481, 'samples': 5206272, 'steps': 27115, 'loss/train': 1.8098299503326416} -11/07/2021 01:01:40 - INFO - __main__ - Step 27117: {'lr': 0.00046530427239398453, 'samples': 5206464, 'steps': 27116, 'loss/train': 0.9234550595283508} -11/07/2021 01:01:40 - INFO - __main__ - Step 27118: {'lr': 0.0004653015752602082, 'samples': 5206656, 'steps': 27117, 'loss/train': 1.5943477153778076} -11/07/2021 01:01:41 - INFO - __main__ - Step 27119: {'lr': 0.0004652988780294204, 'samples': 5206848, 'steps': 27118, 'loss/train': 1.3826004266738892} -11/07/2021 01:01:42 - INFO - __main__ - Step 27120: {'lr': 0.00046529618070162215, 'samples': 5207040, 'steps': 27119, 'loss/train': 1.474747896194458} -11/07/2021 01:01:42 - INFO - __main__ - Step 27121: {'lr': 0.00046529348327681476, 'samples': 5207232, 'steps': 27120, 'loss/train': 1.324153184890747} -11/07/2021 01:01:42 - INFO - __main__ - Step 27122: {'lr': 0.0004652907857549995, 'samples': 5207424, 'steps': 27121, 'loss/train': 1.472080945968628} -11/07/2021 01:01:43 - INFO - __main__ - Step 27123: {'lr': 0.0004652880881361775, 'samples': 5207616, 'steps': 27122, 'loss/train': 1.215911626815796} -11/07/2021 01:01:43 - INFO - __main__ - Step 27124: {'lr': 0.00046528539042035, 'samples': 5207808, 'steps': 27123, 'loss/train': 1.5094414949417114} -11/07/2021 01:01:44 - INFO - __main__ - Step 27125: {'lr': 0.0004652826926075183, 'samples': 5208000, 'steps': 27124, 'loss/train': 1.5033190250396729} -11/07/2021 01:01:45 - INFO - __main__ - Step 27126: {'lr': 0.00046527999469768346, 'samples': 5208192, 'steps': 27125, 'loss/train': 1.8493744134902954} -11/07/2021 01:01:45 - INFO - __main__ - Step 27127: {'lr': 0.0004652772966908468, 'samples': 5208384, 'steps': 27126, 'loss/train': 1.2037136554718018} -11/07/2021 01:01:45 - INFO - __main__ - Step 27128: {'lr': 0.0004652745985870095, 'samples': 5208576, 'steps': 27127, 'loss/train': 1.5834203958511353} -11/07/2021 01:01:46 - INFO - __main__ - Step 27129: {'lr': 0.0004652719003861728, 'samples': 5208768, 'steps': 27128, 'loss/train': 1.11555016040802} -11/07/2021 01:01:46 - INFO - __main__ - Step 27130: {'lr': 0.0004652692020883379, 'samples': 5208960, 'steps': 27129, 'loss/train': 1.6084431409835815} -11/07/2021 01:01:47 - INFO - __main__ - Step 27131: {'lr': 0.00046526650369350605, 'samples': 5209152, 'steps': 27130, 'loss/train': 1.3682796955108643} -11/07/2021 01:01:47 - INFO - __main__ - Step 27132: {'lr': 0.0004652638052016784, 'samples': 5209344, 'steps': 27131, 'loss/train': 1.5609694719314575} -11/07/2021 01:01:48 - INFO - __main__ - Step 27133: {'lr': 0.00046526110661285615, 'samples': 5209536, 'steps': 27132, 'loss/train': 1.7686269283294678} -11/07/2021 01:01:48 - INFO - __main__ - Step 27134: {'lr': 0.00046525840792704064, 'samples': 5209728, 'steps': 27133, 'loss/train': 1.5374583005905151} -11/07/2021 01:01:49 - INFO - __main__ - Step 27135: {'lr': 0.000465255709144233, 'samples': 5209920, 'steps': 27134, 'loss/train': 1.4260269403457642} -11/07/2021 01:01:49 - INFO - __main__ - Step 27136: {'lr': 0.00046525301026443443, 'samples': 5210112, 'steps': 27135, 'loss/train': 1.6430789232254028} -11/07/2021 01:01:50 - INFO - __main__ - Step 27137: {'lr': 0.0004652503112876463, 'samples': 5210304, 'steps': 27136, 'loss/train': 1.476821780204773} -11/07/2021 01:01:50 - INFO - __main__ - Step 27138: {'lr': 0.00046524761221386956, 'samples': 5210496, 'steps': 27137, 'loss/train': 1.0227559804916382} -11/07/2021 01:01:51 - INFO - __main__ - Step 27139: {'lr': 0.0004652449130431056, 'samples': 5210688, 'steps': 27138, 'loss/train': 1.1180068254470825} -11/07/2021 01:01:51 - INFO - __main__ - Step 27140: {'lr': 0.00046524221377535564, 'samples': 5210880, 'steps': 27139, 'loss/train': 1.7611134052276611} -11/07/2021 01:01:52 - INFO - __main__ - Step 27141: {'lr': 0.00046523951441062087, 'samples': 5211072, 'steps': 27140, 'loss/train': 1.591782569885254} -11/07/2021 01:01:52 - INFO - __main__ - Step 27142: {'lr': 0.0004652368149489024, 'samples': 5211264, 'steps': 27141, 'loss/train': 1.1209391355514526} -11/07/2021 01:01:53 - INFO - __main__ - Step 27143: {'lr': 0.0004652341153902016, 'samples': 5211456, 'steps': 27142, 'loss/train': 1.741696834564209} -11/07/2021 01:01:53 - INFO - __main__ - Step 27144: {'lr': 0.00046523141573451965, 'samples': 5211648, 'steps': 27143, 'loss/train': 1.4735972881317139} -11/07/2021 01:01:53 - INFO - __main__ - Step 27145: {'lr': 0.0004652287159818577, 'samples': 5211840, 'steps': 27144, 'loss/train': 1.5447921752929688} -11/07/2021 01:01:54 - INFO - __main__ - Step 27146: {'lr': 0.00046522601613221704, 'samples': 5212032, 'steps': 27145, 'loss/train': 1.7040530443191528} -11/07/2021 01:01:55 - INFO - __main__ - Step 27147: {'lr': 0.0004652233161855989, 'samples': 5212224, 'steps': 27146, 'loss/train': 1.7633503675460815} -11/07/2021 01:01:55 - INFO - __main__ - Step 27148: {'lr': 0.0004652206161420044, 'samples': 5212416, 'steps': 27147, 'loss/train': 1.4151040315628052} -11/07/2021 01:01:55 - INFO - __main__ - Step 27149: {'lr': 0.00046521791600143483, 'samples': 5212608, 'steps': 27148, 'loss/train': 1.2859762907028198} -11/07/2021 01:01:56 - INFO - __main__ - Step 27150: {'lr': 0.00046521521576389134, 'samples': 5212800, 'steps': 27149, 'loss/train': 1.3248544931411743} -11/07/2021 01:01:57 - INFO - __main__ - Step 27151: {'lr': 0.00046521251542937524, 'samples': 5212992, 'steps': 27150, 'loss/train': 1.7026891708374023} -11/07/2021 01:01:57 - INFO - __main__ - Step 27152: {'lr': 0.0004652098149978877, 'samples': 5213184, 'steps': 27151, 'loss/train': 1.7094151973724365} -11/07/2021 01:01:57 - INFO - __main__ - Step 27153: {'lr': 0.00046520711446943, 'samples': 5213376, 'steps': 27152, 'loss/train': 1.3547008037567139} -11/07/2021 01:01:58 - INFO - __main__ - Step 27154: {'lr': 0.0004652044138440032, 'samples': 5213568, 'steps': 27153, 'loss/train': 1.6012340784072876} -11/07/2021 01:01:58 - INFO - __main__ - Step 27155: {'lr': 0.00046520171312160863, 'samples': 5213760, 'steps': 27154, 'loss/train': 1.2679134607315063} -11/07/2021 01:01:59 - INFO - __main__ - Step 27156: {'lr': 0.00046519901230224756, 'samples': 5213952, 'steps': 27155, 'loss/train': 1.0411334037780762} -11/07/2021 01:02:00 - INFO - __main__ - Step 27157: {'lr': 0.000465196311385921, 'samples': 5214144, 'steps': 27156, 'loss/train': 0.4594906270503998} -11/07/2021 01:02:00 - INFO - __main__ - Step 27158: {'lr': 0.0004651936103726304, 'samples': 5214336, 'steps': 27157, 'loss/train': 1.5192071199417114} -11/07/2021 01:02:00 - INFO - __main__ - Step 27159: {'lr': 0.0004651909092623769, 'samples': 5214528, 'steps': 27158, 'loss/train': 1.6818640232086182} -11/07/2021 01:02:01 - INFO - __main__ - Step 27160: {'lr': 0.00046518820805516165, 'samples': 5214720, 'steps': 27159, 'loss/train': 1.5658918619155884} -11/07/2021 01:02:02 - INFO - __main__ - Step 27161: {'lr': 0.0004651855067509859, 'samples': 5214912, 'steps': 27160, 'loss/train': 1.4818499088287354} -11/07/2021 01:02:02 - INFO - __main__ - Step 27162: {'lr': 0.0004651828053498509, 'samples': 5215104, 'steps': 27161, 'loss/train': 1.4773788452148438} -11/07/2021 01:02:02 - INFO - __main__ - Step 27163: {'lr': 0.0004651801038517579, 'samples': 5215296, 'steps': 27162, 'loss/train': 1.1611590385437012} -11/07/2021 01:02:03 - INFO - __main__ - Step 27164: {'lr': 0.000465177402256708, 'samples': 5215488, 'steps': 27163, 'loss/train': 1.544758677482605} -11/07/2021 01:02:03 - INFO - __main__ - Step 27165: {'lr': 0.00046517470056470244, 'samples': 5215680, 'steps': 27164, 'loss/train': 1.5025895833969116} -11/07/2021 01:02:05 - INFO - __main__ - Step 27166: {'lr': 0.00046517199877574257, 'samples': 5215872, 'steps': 27165, 'loss/train': 1.3345242738723755} -11/07/2021 01:02:05 - INFO - __main__ - Step 27167: {'lr': 0.0004651692968898295, 'samples': 5216064, 'steps': 27166, 'loss/train': 1.942888617515564} -11/07/2021 01:02:05 - INFO - __main__ - Step 27168: {'lr': 0.00046516659490696444, 'samples': 5216256, 'steps': 27167, 'loss/train': 1.3459722995758057} -11/07/2021 01:02:06 - INFO - __main__ - Step 27169: {'lr': 0.0004651638928271487, 'samples': 5216448, 'steps': 27168, 'loss/train': 1.6680691242218018} -11/07/2021 01:02:06 - INFO - __main__ - Step 27170: {'lr': 0.00046516119065038335, 'samples': 5216640, 'steps': 27169, 'loss/train': 0.6846105456352234} -11/07/2021 01:02:07 - INFO - __main__ - Step 27171: {'lr': 0.00046515848837666975, 'samples': 5216832, 'steps': 27170, 'loss/train': 0.5701700448989868} -11/07/2021 01:02:08 - INFO - __main__ - Step 27172: {'lr': 0.00046515578600600895, 'samples': 5217024, 'steps': 27171, 'loss/train': 1.4467335939407349} -11/07/2021 01:02:08 - INFO - __main__ - Step 27173: {'lr': 0.0004651530835384024, 'samples': 5217216, 'steps': 27172, 'loss/train': 1.3392056226730347} -11/07/2021 01:02:08 - INFO - __main__ - Step 27174: {'lr': 0.0004651503809738511, 'samples': 5217408, 'steps': 27173, 'loss/train': 1.2066261768341064} -11/07/2021 01:02:09 - INFO - __main__ - Step 27175: {'lr': 0.0004651476783123564, 'samples': 5217600, 'steps': 27174, 'loss/train': 1.503208875656128} -11/07/2021 01:02:09 - INFO - __main__ - Step 27176: {'lr': 0.00046514497555391946, 'samples': 5217792, 'steps': 27175, 'loss/train': 1.1453332901000977} -11/07/2021 01:02:10 - INFO - __main__ - Step 27177: {'lr': 0.0004651422726985415, 'samples': 5217984, 'steps': 27176, 'loss/train': 1.8215045928955078} -11/07/2021 01:02:10 - INFO - __main__ - Step 27178: {'lr': 0.00046513956974622377, 'samples': 5218176, 'steps': 27177, 'loss/train': 2.074622631072998} -11/07/2021 01:02:11 - INFO - __main__ - Step 27179: {'lr': 0.00046513686669696756, 'samples': 5218368, 'steps': 27178, 'loss/train': 1.3883646726608276} -11/07/2021 01:02:11 - INFO - __main__ - Step 27180: {'lr': 0.00046513416355077386, 'samples': 5218560, 'steps': 27179, 'loss/train': 1.4552028179168701} -11/07/2021 01:02:12 - INFO - __main__ - Step 27181: {'lr': 0.0004651314603076441, 'samples': 5218752, 'steps': 27180, 'loss/train': 1.4661346673965454} -11/07/2021 01:02:13 - INFO - __main__ - Step 27182: {'lr': 0.00046512875696757937, 'samples': 5218944, 'steps': 27181, 'loss/train': 1.8287869691848755} -11/07/2021 01:02:13 - INFO - __main__ - Step 27183: {'lr': 0.00046512605353058096, 'samples': 5219136, 'steps': 27182, 'loss/train': 0.7925441265106201} -11/07/2021 01:02:13 - INFO - __main__ - Step 27184: {'lr': 0.00046512334999665006, 'samples': 5219328, 'steps': 27183, 'loss/train': 1.6642957925796509} -11/07/2021 01:02:14 - INFO - __main__ - Step 27185: {'lr': 0.000465120646365788, 'samples': 5219520, 'steps': 27184, 'loss/train': 1.2242282629013062} -11/07/2021 01:02:14 - INFO - __main__ - Step 27186: {'lr': 0.0004651179426379958, 'samples': 5219712, 'steps': 27185, 'loss/train': 1.9081281423568726} -11/07/2021 01:02:15 - INFO - __main__ - Step 27187: {'lr': 0.00046511523881327476, 'samples': 5219904, 'steps': 27186, 'loss/train': 1.7007331848144531} -11/07/2021 01:02:16 - INFO - __main__ - Step 27188: {'lr': 0.00046511253489162616, 'samples': 5220096, 'steps': 27187, 'loss/train': 1.0498052835464478} -11/07/2021 01:02:16 - INFO - __main__ - Step 27189: {'lr': 0.00046510983087305114, 'samples': 5220288, 'steps': 27188, 'loss/train': 1.450149655342102} -11/07/2021 01:02:16 - INFO - __main__ - Step 27190: {'lr': 0.00046510712675755094, 'samples': 5220480, 'steps': 27189, 'loss/train': 1.5899168252944946} -11/07/2021 01:02:17 - INFO - __main__ - Step 27191: {'lr': 0.00046510442254512686, 'samples': 5220672, 'steps': 27190, 'loss/train': 1.399792194366455} -11/07/2021 01:02:18 - INFO - __main__ - Step 27192: {'lr': 0.00046510171823578, 'samples': 5220864, 'steps': 27191, 'loss/train': 1.7889716625213623} -11/07/2021 01:02:18 - INFO - __main__ - Step 27193: {'lr': 0.0004650990138295116, 'samples': 5221056, 'steps': 27192, 'loss/train': 1.8554221391677856} -11/07/2021 01:02:18 - INFO - __main__ - Step 27194: {'lr': 0.00046509630932632293, 'samples': 5221248, 'steps': 27193, 'loss/train': 1.738891839981079} -11/07/2021 01:02:19 - INFO - __main__ - Step 27195: {'lr': 0.0004650936047262152, 'samples': 5221440, 'steps': 27194, 'loss/train': 1.9472607374191284} -11/07/2021 01:02:19 - INFO - __main__ - Step 27196: {'lr': 0.0004650909000291895, 'samples': 5221632, 'steps': 27195, 'loss/train': 1.299528956413269} -11/07/2021 01:02:19 - INFO - __main__ - Step 27197: {'lr': 0.00046508819523524724, 'samples': 5221824, 'steps': 27196, 'loss/train': 1.4237334728240967} -11/07/2021 01:02:21 - INFO - __main__ - Step 27198: {'lr': 0.0004650854903443896, 'samples': 5222016, 'steps': 27197, 'loss/train': 2.340219497680664} -11/07/2021 01:02:21 - INFO - __main__ - Step 27199: {'lr': 0.00046508278535661775, 'samples': 5222208, 'steps': 27198, 'loss/train': 1.6890065670013428} -11/07/2021 01:02:22 - INFO - __main__ - Step 27200: {'lr': 0.00046508008027193286, 'samples': 5222400, 'steps': 27199, 'loss/train': 1.5595864057540894} -11/07/2021 01:02:22 - INFO - __main__ - Step 27201: {'lr': 0.0004650773750903363, 'samples': 5222592, 'steps': 27200, 'loss/train': 2.2038509845733643} -11/07/2021 01:02:22 - INFO - __main__ - Step 27202: {'lr': 0.0004650746698118291, 'samples': 5222784, 'steps': 27201, 'loss/train': 1.0606508255004883} -11/07/2021 01:02:23 - INFO - __main__ - Step 27203: {'lr': 0.0004650719644364126, 'samples': 5222976, 'steps': 27202, 'loss/train': 1.355365514755249} -11/07/2021 01:02:24 - INFO - __main__ - Step 27204: {'lr': 0.000465069258964088, 'samples': 5223168, 'steps': 27203, 'loss/train': 1.6440300941467285} -11/07/2021 01:02:24 - INFO - __main__ - Step 27205: {'lr': 0.0004650665533948565, 'samples': 5223360, 'steps': 27204, 'loss/train': 1.5045417547225952} -11/07/2021 01:02:24 - INFO - __main__ - Step 27206: {'lr': 0.00046506384772871935, 'samples': 5223552, 'steps': 27205, 'loss/train': 1.5792165994644165} -11/07/2021 01:02:25 - INFO - __main__ - Step 27207: {'lr': 0.0004650611419656777, 'samples': 5223744, 'steps': 27206, 'loss/train': 1.613562822341919} -11/07/2021 01:02:26 - INFO - __main__ - Step 27208: {'lr': 0.0004650584361057328, 'samples': 5223936, 'steps': 27207, 'loss/train': 1.467961311340332} -11/07/2021 01:02:26 - INFO - __main__ - Step 27209: {'lr': 0.00046505573014888604, 'samples': 5224128, 'steps': 27208, 'loss/train': 1.6682863235473633} -11/07/2021 01:02:26 - INFO - __main__ - Step 27210: {'lr': 0.0004650530240951383, 'samples': 5224320, 'steps': 27209, 'loss/train': 1.2404732704162598} -11/07/2021 01:02:27 - INFO - __main__ - Step 27211: {'lr': 0.0004650503179444911, 'samples': 5224512, 'steps': 27210, 'loss/train': 1.53238046169281} -11/07/2021 01:02:27 - INFO - __main__ - Step 27212: {'lr': 0.00046504761169694555, 'samples': 5224704, 'steps': 27211, 'loss/train': 1.7771190404891968} -11/07/2021 01:02:28 - INFO - __main__ - Step 27213: {'lr': 0.0004650449053525028, 'samples': 5224896, 'steps': 27212, 'loss/train': 1.3833065032958984} -11/07/2021 01:02:29 - INFO - __main__ - Step 27214: {'lr': 0.00046504219891116416, 'samples': 5225088, 'steps': 27213, 'loss/train': 1.3884916305541992} -11/07/2021 01:02:29 - INFO - __main__ - Step 27215: {'lr': 0.0004650394923729309, 'samples': 5225280, 'steps': 27214, 'loss/train': 1.773545742034912} -11/07/2021 01:02:29 - INFO - __main__ - Step 27216: {'lr': 0.00046503678573780403, 'samples': 5225472, 'steps': 27215, 'loss/train': 1.5457409620285034} -11/07/2021 01:02:30 - INFO - __main__ - Step 27217: {'lr': 0.000465034079005785, 'samples': 5225664, 'steps': 27216, 'loss/train': 1.5216282606124878} -11/07/2021 01:02:31 - INFO - __main__ - Step 27218: {'lr': 0.00046503137217687485, 'samples': 5225856, 'steps': 27217, 'loss/train': 1.4964834451675415} -11/07/2021 01:02:31 - INFO - __main__ - Step 27219: {'lr': 0.0004650286652510749, 'samples': 5226048, 'steps': 27218, 'loss/train': 1.5795546770095825} -11/07/2021 01:02:31 - INFO - __main__ - Step 27220: {'lr': 0.0004650259582283864, 'samples': 5226240, 'steps': 27219, 'loss/train': 1.4796018600463867} -11/07/2021 01:02:32 - INFO - __main__ - Step 27221: {'lr': 0.0004650232511088105, 'samples': 5226432, 'steps': 27220, 'loss/train': 1.6209487915039062} -11/07/2021 01:02:32 - INFO - __main__ - Step 27222: {'lr': 0.00046502054389234844, 'samples': 5226624, 'steps': 27221, 'loss/train': 0.906596302986145} -11/07/2021 01:02:33 - INFO - __main__ - Step 27223: {'lr': 0.0004650178365790014, 'samples': 5226816, 'steps': 27222, 'loss/train': 1.618649959564209} -11/07/2021 01:02:33 - INFO - __main__ - Step 27224: {'lr': 0.0004650151291687707, 'samples': 5227008, 'steps': 27223, 'loss/train': 1.4684704542160034} -11/07/2021 01:02:34 - INFO - __main__ - Step 27225: {'lr': 0.00046501242166165747, 'samples': 5227200, 'steps': 27224, 'loss/train': 1.6474354267120361} -11/07/2021 01:02:34 - INFO - __main__ - Step 27226: {'lr': 0.000465009714057663, 'samples': 5227392, 'steps': 27225, 'loss/train': 1.7976675033569336} -11/07/2021 01:02:34 - INFO - __main__ - Step 27227: {'lr': 0.00046500700635678844, 'samples': 5227584, 'steps': 27226, 'loss/train': 1.836778163909912} -11/07/2021 01:02:36 - INFO - __main__ - Step 27228: {'lr': 0.000465004298559035, 'samples': 5227776, 'steps': 27227, 'loss/train': 1.5999199151992798} -11/07/2021 01:02:36 - INFO - __main__ - Step 27229: {'lr': 0.00046500159066440404, 'samples': 5227968, 'steps': 27228, 'loss/train': 1.2133694887161255} -11/07/2021 01:02:36 - INFO - __main__ - Step 27230: {'lr': 0.0004649988826728966, 'samples': 5228160, 'steps': 27229, 'loss/train': 1.2805842161178589} -11/07/2021 01:02:37 - INFO - __main__ - Step 27231: {'lr': 0.000464996174584514, 'samples': 5228352, 'steps': 27230, 'loss/train': 1.5810779333114624} -11/07/2021 01:02:37 - INFO - __main__ - Step 27232: {'lr': 0.00046499346639925746, 'samples': 5228544, 'steps': 27231, 'loss/train': 1.931288242340088} -11/07/2021 01:02:38 - INFO - __main__ - Step 27233: {'lr': 0.0004649907581171282, 'samples': 5228736, 'steps': 27232, 'loss/train': 1.3784176111221313} -11/07/2021 01:02:38 - INFO - __main__ - Step 27234: {'lr': 0.00046498804973812735, 'samples': 5228928, 'steps': 27233, 'loss/train': 5.008947372436523} -11/07/2021 01:02:39 - INFO - __main__ - Step 27235: {'lr': 0.00046498534126225625, 'samples': 5229120, 'steps': 27234, 'loss/train': 1.4662317037582397} -11/07/2021 01:02:39 - INFO - __main__ - Step 27236: {'lr': 0.0004649826326895161, 'samples': 5229312, 'steps': 27235, 'loss/train': 1.7126282453536987} -11/07/2021 01:02:39 - INFO - __main__ - Step 27237: {'lr': 0.0004649799240199081, 'samples': 5229504, 'steps': 27236, 'loss/train': 1.5118376016616821} -11/07/2021 01:02:41 - INFO - __main__ - Step 27238: {'lr': 0.0004649772152534334, 'samples': 5229696, 'steps': 27237, 'loss/train': 2.3526248931884766} -11/07/2021 01:02:41 - INFO - __main__ - Step 27239: {'lr': 0.0004649745063900933, 'samples': 5229888, 'steps': 27238, 'loss/train': 1.6515519618988037} -11/07/2021 01:02:41 - INFO - __main__ - Step 27240: {'lr': 0.000464971797429889, 'samples': 5230080, 'steps': 27239, 'loss/train': 1.2007354497909546} -11/07/2021 01:02:42 - INFO - __main__ - Step 27241: {'lr': 0.00046496908837282173, 'samples': 5230272, 'steps': 27240, 'loss/train': 1.9977402687072754} -11/07/2021 01:02:42 - INFO - __main__ - Step 27242: {'lr': 0.00046496637921889276, 'samples': 5230464, 'steps': 27241, 'loss/train': 1.0261619091033936} -11/07/2021 01:02:42 - INFO - __main__ - Step 27243: {'lr': 0.0004649636699681031, 'samples': 5230656, 'steps': 27242, 'loss/train': 1.638994812965393} -11/07/2021 01:02:43 - INFO - __main__ - Step 27244: {'lr': 0.00046496096062045427, 'samples': 5230848, 'steps': 27243, 'loss/train': 1.7429476976394653} -11/07/2021 01:02:44 - INFO - __main__ - Step 27245: {'lr': 0.00046495825117594735, 'samples': 5231040, 'steps': 27244, 'loss/train': 1.555149793624878} -11/07/2021 01:02:44 - INFO - __main__ - Step 27246: {'lr': 0.0004649555416345835, 'samples': 5231232, 'steps': 27245, 'loss/train': 1.261429786682129} -11/07/2021 01:02:44 - INFO - __main__ - Step 27247: {'lr': 0.0004649528319963641, 'samples': 5231424, 'steps': 27246, 'loss/train': 1.4237511157989502} -11/07/2021 01:02:45 - INFO - __main__ - Step 27248: {'lr': 0.0004649501222612901, 'samples': 5231616, 'steps': 27247, 'loss/train': 2.1382250785827637} -11/07/2021 01:02:46 - INFO - __main__ - Step 27249: {'lr': 0.000464947412429363, 'samples': 5231808, 'steps': 27248, 'loss/train': 1.8834290504455566} -11/07/2021 01:02:46 - INFO - __main__ - Step 27250: {'lr': 0.000464944702500584, 'samples': 5232000, 'steps': 27249, 'loss/train': 1.60459303855896} -11/07/2021 01:02:47 - INFO - __main__ - Step 27251: {'lr': 0.0004649419924749541, 'samples': 5232192, 'steps': 27250, 'loss/train': 1.6707024574279785} -11/07/2021 01:02:47 - INFO - __main__ - Step 27252: {'lr': 0.0004649392823524746, 'samples': 5232384, 'steps': 27251, 'loss/train': 2.083890676498413} -11/07/2021 01:02:47 - INFO - __main__ - Step 27253: {'lr': 0.0004649365721331469, 'samples': 5232576, 'steps': 27252, 'loss/train': 1.1771005392074585} -11/07/2021 01:02:48 - INFO - __main__ - Step 27254: {'lr': 0.00046493386181697206, 'samples': 5232768, 'steps': 27253, 'loss/train': 1.486518144607544} -11/07/2021 01:02:49 - INFO - __main__ - Step 27255: {'lr': 0.00046493115140395136, 'samples': 5232960, 'steps': 27254, 'loss/train': 1.6178797483444214} -11/07/2021 01:02:49 - INFO - __main__ - Step 27256: {'lr': 0.000464928440894086, 'samples': 5233152, 'steps': 27255, 'loss/train': 1.117812156677246} -11/07/2021 01:02:49 - INFO - __main__ - Step 27257: {'lr': 0.00046492573028737716, 'samples': 5233344, 'steps': 27256, 'loss/train': 1.468658208847046} -11/07/2021 01:02:50 - INFO - __main__ - Step 27258: {'lr': 0.0004649230195838261, 'samples': 5233536, 'steps': 27257, 'loss/train': 1.4425030946731567} -11/07/2021 01:02:51 - INFO - __main__ - Step 27259: {'lr': 0.00046492030878343406, 'samples': 5233728, 'steps': 27258, 'loss/train': 1.1143912076950073} -11/07/2021 01:02:51 - INFO - __main__ - Step 27260: {'lr': 0.00046491759788620227, 'samples': 5233920, 'steps': 27259, 'loss/train': 1.2509312629699707} -11/07/2021 01:02:51 - INFO - __main__ - Step 27261: {'lr': 0.0004649148868921319, 'samples': 5234112, 'steps': 27260, 'loss/train': 1.6943997144699097} -11/07/2021 01:02:52 - INFO - __main__ - Step 27262: {'lr': 0.00046491217580122427, 'samples': 5234304, 'steps': 27261, 'loss/train': 1.703986644744873} -11/07/2021 01:02:52 - INFO - __main__ - Step 27263: {'lr': 0.00046490946461348045, 'samples': 5234496, 'steps': 27262, 'loss/train': 1.753912329673767} -11/07/2021 01:02:53 - INFO - __main__ - Step 27264: {'lr': 0.00046490675332890177, 'samples': 5234688, 'steps': 27263, 'loss/train': 1.8319761753082275} -11/07/2021 01:02:54 - INFO - __main__ - Step 27265: {'lr': 0.00046490404194748935, 'samples': 5234880, 'steps': 27264, 'loss/train': 1.6805005073547363} -11/07/2021 01:02:54 - INFO - __main__ - Step 27266: {'lr': 0.00046490133046924457, 'samples': 5235072, 'steps': 27265, 'loss/train': 1.169919729232788} -11/07/2021 01:02:54 - INFO - __main__ - Step 27267: {'lr': 0.0004648986188941685, 'samples': 5235264, 'steps': 27266, 'loss/train': 1.7877448797225952} -11/07/2021 01:02:55 - INFO - __main__ - Step 27268: {'lr': 0.0004648959072222625, 'samples': 5235456, 'steps': 27267, 'loss/train': 2.4874370098114014} -11/07/2021 01:02:56 - INFO - __main__ - Step 27269: {'lr': 0.0004648931954535277, 'samples': 5235648, 'steps': 27268, 'loss/train': 1.5646990537643433} -11/07/2021 01:02:56 - INFO - __main__ - Step 27270: {'lr': 0.0004648904835879654, 'samples': 5235840, 'steps': 27269, 'loss/train': 1.285988450050354} -11/07/2021 01:02:56 - INFO - __main__ - Step 27271: {'lr': 0.0004648877716255766, 'samples': 5236032, 'steps': 27270, 'loss/train': 1.7725143432617188} -11/07/2021 01:02:57 - INFO - __main__ - Step 27272: {'lr': 0.00046488505956636286, 'samples': 5236224, 'steps': 27271, 'loss/train': 1.777441143989563} -11/07/2021 01:02:57 - INFO - __main__ - Step 27273: {'lr': 0.0004648823474103251, 'samples': 5236416, 'steps': 27272, 'loss/train': 1.489535927772522} -11/07/2021 01:02:58 - INFO - __main__ - Step 27274: {'lr': 0.0004648796351574648, 'samples': 5236608, 'steps': 27273, 'loss/train': 1.0099929571151733} -11/07/2021 01:02:58 - INFO - __main__ - Step 27275: {'lr': 0.0004648769228077829, 'samples': 5236800, 'steps': 27274, 'loss/train': 1.5548713207244873} -11/07/2021 01:02:59 - INFO - __main__ - Step 27276: {'lr': 0.00046487421036128085, 'samples': 5236992, 'steps': 27275, 'loss/train': 1.2483229637145996} -11/07/2021 01:02:59 - INFO - __main__ - Step 27277: {'lr': 0.00046487149781795976, 'samples': 5237184, 'steps': 27276, 'loss/train': 1.5984280109405518} -11/07/2021 01:02:59 - INFO - __main__ - Step 27278: {'lr': 0.00046486878517782094, 'samples': 5237376, 'steps': 27277, 'loss/train': 1.1107038259506226} -11/07/2021 01:03:01 - INFO - __main__ - Step 27279: {'lr': 0.0004648660724408656, 'samples': 5237568, 'steps': 27278, 'loss/train': 1.5515042543411255} -11/07/2021 01:03:01 - INFO - __main__ - Step 27280: {'lr': 0.00046486335960709485, 'samples': 5237760, 'steps': 27279, 'loss/train': 1.8898242712020874} -11/07/2021 01:03:01 - INFO - __main__ - Step 27281: {'lr': 0.00046486064667651, 'samples': 5237952, 'steps': 27280, 'loss/train': 1.912441372871399} -11/07/2021 01:03:02 - INFO - __main__ - Step 27282: {'lr': 0.0004648579336491123, 'samples': 5238144, 'steps': 27281, 'loss/train': 1.492627739906311} -11/07/2021 01:03:02 - INFO - __main__ - Step 27283: {'lr': 0.0004648552205249029, 'samples': 5238336, 'steps': 27282, 'loss/train': 1.3607357740402222} -11/07/2021 01:03:02 - INFO - __main__ - Step 27284: {'lr': 0.000464852507303883, 'samples': 5238528, 'steps': 27283, 'loss/train': 1.754043698310852} -11/07/2021 01:03:03 - INFO - __main__ - Step 27285: {'lr': 0.0004648497939860539, 'samples': 5238720, 'steps': 27284, 'loss/train': 1.7543745040893555} -11/07/2021 01:03:04 - INFO - __main__ - Step 27286: {'lr': 0.0004648470805714169, 'samples': 5238912, 'steps': 27285, 'loss/train': 1.300349235534668} -11/07/2021 01:03:04 - INFO - __main__ - Step 27287: {'lr': 0.00046484436705997303, 'samples': 5239104, 'steps': 27286, 'loss/train': 1.2074387073516846} -11/07/2021 01:03:04 - INFO - __main__ - Step 27288: {'lr': 0.0004648416534517236, 'samples': 5239296, 'steps': 27287, 'loss/train': 1.1679052114486694} -11/07/2021 01:03:05 - INFO - __main__ - Step 27289: {'lr': 0.00046483893974666983, 'samples': 5239488, 'steps': 27288, 'loss/train': 1.7679553031921387} -11/07/2021 01:03:06 - INFO - __main__ - Step 27290: {'lr': 0.000464836225944813, 'samples': 5239680, 'steps': 27289, 'loss/train': 0.6809923648834229} -11/07/2021 01:03:06 - INFO - __main__ - Step 27291: {'lr': 0.00046483351204615423, 'samples': 5239872, 'steps': 27290, 'loss/train': 1.628966212272644} -11/07/2021 01:03:07 - INFO - __main__ - Step 27292: {'lr': 0.0004648307980506948, 'samples': 5240064, 'steps': 27291, 'loss/train': 1.4171942472457886} -11/07/2021 01:03:07 - INFO - __main__ - Step 27293: {'lr': 0.00046482808395843594, 'samples': 5240256, 'steps': 27292, 'loss/train': 2.384295701980591} -11/07/2021 01:03:07 - INFO - __main__ - Step 27294: {'lr': 0.0004648253697693789, 'samples': 5240448, 'steps': 27293, 'loss/train': 1.6184483766555786} -11/07/2021 01:03:08 - INFO - __main__ - Step 27295: {'lr': 0.0004648226554835248, 'samples': 5240640, 'steps': 27294, 'loss/train': 1.4949777126312256} -11/07/2021 01:03:09 - INFO - __main__ - Step 27296: {'lr': 0.000464819941100875, 'samples': 5240832, 'steps': 27295, 'loss/train': 1.562004566192627} -11/07/2021 01:03:09 - INFO - __main__ - Step 27297: {'lr': 0.00046481722662143057, 'samples': 5241024, 'steps': 27296, 'loss/train': 1.9358444213867188} -11/07/2021 01:03:09 - INFO - __main__ - Step 27298: {'lr': 0.0004648145120451929, 'samples': 5241216, 'steps': 27297, 'loss/train': 1.275517463684082} -11/07/2021 01:03:10 - INFO - __main__ - Step 27299: {'lr': 0.000464811797372163, 'samples': 5241408, 'steps': 27298, 'loss/train': 1.4358162879943848} -11/07/2021 01:03:11 - INFO - __main__ - Step 27300: {'lr': 0.00046480908260234234, 'samples': 5241600, 'steps': 27299, 'loss/train': 1.7115789651870728} -11/07/2021 01:03:12 - INFO - __main__ - Step 27301: {'lr': 0.0004648063677357319, 'samples': 5241792, 'steps': 27300, 'loss/train': 2.180518865585327} -11/07/2021 01:03:12 - INFO - __main__ - Step 27302: {'lr': 0.00046480365277233316, 'samples': 5241984, 'steps': 27301, 'loss/train': 2.0012290477752686} -11/07/2021 01:03:12 - INFO - __main__ - Step 27303: {'lr': 0.00046480093771214716, 'samples': 5242176, 'steps': 27302, 'loss/train': 1.8879752159118652} -11/07/2021 01:03:13 - INFO - __main__ - Step 27304: {'lr': 0.0004647982225551751, 'samples': 5242368, 'steps': 27303, 'loss/train': 0.4549408257007599} -11/07/2021 01:03:14 - INFO - __main__ - Step 27305: {'lr': 0.0004647955073014184, 'samples': 5242560, 'steps': 27304, 'loss/train': 2.0891189575195312} -11/07/2021 01:03:14 - INFO - __main__ - Step 27306: {'lr': 0.00046479279195087804, 'samples': 5242752, 'steps': 27305, 'loss/train': 1.5999822616577148} -11/07/2021 01:03:15 - INFO - __main__ - Step 27307: {'lr': 0.0004647900765035554, 'samples': 5242944, 'steps': 27306, 'loss/train': 1.7527434825897217} -11/07/2021 01:03:15 - INFO - __main__ - Step 27308: {'lr': 0.0004647873609594517, 'samples': 5243136, 'steps': 27307, 'loss/train': 1.2198915481567383} -11/07/2021 01:03:15 - INFO - __main__ - Step 27309: {'lr': 0.0004647846453185681, 'samples': 5243328, 'steps': 27308, 'loss/train': 1.5550477504730225} -11/07/2021 01:03:16 - INFO - __main__ - Step 27310: {'lr': 0.0004647819295809059, 'samples': 5243520, 'steps': 27309, 'loss/train': 1.791429877281189} -11/07/2021 01:03:17 - INFO - __main__ - Step 27311: {'lr': 0.00046477921374646624, 'samples': 5243712, 'steps': 27310, 'loss/train': 1.506710410118103} -11/07/2021 01:03:17 - INFO - __main__ - Step 27312: {'lr': 0.0004647764978152503, 'samples': 5243904, 'steps': 27311, 'loss/train': 1.6585369110107422} -11/07/2021 01:03:17 - INFO - __main__ - Step 27313: {'lr': 0.0004647737817872595, 'samples': 5244096, 'steps': 27312, 'loss/train': 1.6855876445770264} -11/07/2021 01:03:18 - INFO - __main__ - Step 27314: {'lr': 0.0004647710656624949, 'samples': 5244288, 'steps': 27313, 'loss/train': 1.1921801567077637} -11/07/2021 01:03:18 - INFO - __main__ - Step 27315: {'lr': 0.0004647683494409578, 'samples': 5244480, 'steps': 27314, 'loss/train': 1.5598256587982178} -11/07/2021 01:03:19 - INFO - __main__ - Step 27316: {'lr': 0.0004647656331226494, 'samples': 5244672, 'steps': 27315, 'loss/train': 1.3678679466247559} -11/07/2021 01:03:19 - INFO - __main__ - Step 27317: {'lr': 0.0004647629167075709, 'samples': 5244864, 'steps': 27316, 'loss/train': 1.58489191532135} -11/07/2021 01:03:20 - INFO - __main__ - Step 27318: {'lr': 0.00046476020019572354, 'samples': 5245056, 'steps': 27317, 'loss/train': 1.6443164348602295} -11/07/2021 01:03:20 - INFO - __main__ - Step 27319: {'lr': 0.00046475748358710856, 'samples': 5245248, 'steps': 27318, 'loss/train': 1.410498023033142} -11/07/2021 01:03:20 - INFO - __main__ - Step 27320: {'lr': 0.0004647547668817271, 'samples': 5245440, 'steps': 27319, 'loss/train': 1.5386722087860107} -11/07/2021 01:03:22 - INFO - __main__ - Step 27321: {'lr': 0.00046475205007958054, 'samples': 5245632, 'steps': 27320, 'loss/train': 1.3879882097244263} -11/07/2021 01:03:22 - INFO - __main__ - Step 27322: {'lr': 0.00046474933318067004, 'samples': 5245824, 'steps': 27321, 'loss/train': 1.2655384540557861} -11/07/2021 01:03:22 - INFO - __main__ - Step 27323: {'lr': 0.0004647466161849968, 'samples': 5246016, 'steps': 27322, 'loss/train': 1.598747730255127} -11/07/2021 01:03:23 - INFO - __main__ - Step 27324: {'lr': 0.000464743899092562, 'samples': 5246208, 'steps': 27323, 'loss/train': 1.4427452087402344} -11/07/2021 01:03:23 - INFO - __main__ - Step 27325: {'lr': 0.0004647411819033669, 'samples': 5246400, 'steps': 27324, 'loss/train': 1.6169787645339966} -11/07/2021 01:03:24 - INFO - __main__ - Step 27326: {'lr': 0.00046473846461741276, 'samples': 5246592, 'steps': 27325, 'loss/train': 1.5075080394744873} -11/07/2021 01:03:24 - INFO - __main__ - Step 27327: {'lr': 0.0004647357472347008, 'samples': 5246784, 'steps': 27326, 'loss/train': 1.5084218978881836} -11/07/2021 01:03:25 - INFO - __main__ - Step 27328: {'lr': 0.00046473302975523224, 'samples': 5246976, 'steps': 27327, 'loss/train': 1.3807927370071411} -11/07/2021 01:03:25 - INFO - __main__ - Step 27329: {'lr': 0.0004647303121790082, 'samples': 5247168, 'steps': 27328, 'loss/train': 1.8661872148513794} -11/07/2021 01:03:25 - INFO - __main__ - Step 27330: {'lr': 0.0004647275945060301, 'samples': 5247360, 'steps': 27329, 'loss/train': 1.6493861675262451} -11/07/2021 01:03:27 - INFO - __main__ - Step 27331: {'lr': 0.000464724876736299, 'samples': 5247552, 'steps': 27330, 'loss/train': 1.5648044347763062} -11/07/2021 01:03:27 - INFO - __main__ - Step 27332: {'lr': 0.00046472215886981616, 'samples': 5247744, 'steps': 27331, 'loss/train': 0.851533055305481} -11/07/2021 01:03:27 - INFO - __main__ - Step 27333: {'lr': 0.00046471944090658294, 'samples': 5247936, 'steps': 27332, 'loss/train': 1.6356053352355957} -11/07/2021 01:03:28 - INFO - __main__ - Step 27334: {'lr': 0.0004647167228466004, 'samples': 5248128, 'steps': 27333, 'loss/train': 1.8776708841323853} -11/07/2021 01:03:28 - INFO - __main__ - Step 27335: {'lr': 0.0004647140046898697, 'samples': 5248320, 'steps': 27334, 'loss/train': 1.3127461671829224} -11/07/2021 01:03:29 - INFO - __main__ - Step 27336: {'lr': 0.0004647112864363923, 'samples': 5248512, 'steps': 27335, 'loss/train': 1.7084875106811523} -11/07/2021 01:03:30 - INFO - __main__ - Step 27337: {'lr': 0.00046470856808616934, 'samples': 5248704, 'steps': 27336, 'loss/train': 1.421209454536438} -11/07/2021 01:03:30 - INFO - __main__ - Step 27338: {'lr': 0.0004647058496392019, 'samples': 5248896, 'steps': 27337, 'loss/train': 1.2902867794036865} -11/07/2021 01:03:30 - INFO - __main__ - Step 27339: {'lr': 0.0004647031310954914, 'samples': 5249088, 'steps': 27338, 'loss/train': 1.4306479692459106} -11/07/2021 01:03:31 - INFO - __main__ - Step 27340: {'lr': 0.00046470041245503895, 'samples': 5249280, 'steps': 27339, 'loss/train': 1.445697546005249} -11/07/2021 01:03:31 - INFO - __main__ - Step 27341: {'lr': 0.0004646976937178459, 'samples': 5249472, 'steps': 27340, 'loss/train': 1.2455345392227173} -11/07/2021 01:03:32 - INFO - __main__ - Step 27342: {'lr': 0.0004646949748839132, 'samples': 5249664, 'steps': 27341, 'loss/train': 1.1632879972457886} -11/07/2021 01:03:33 - INFO - __main__ - Step 27343: {'lr': 0.0004646922559532424, 'samples': 5249856, 'steps': 27342, 'loss/train': 1.8211750984191895} -11/07/2021 01:03:33 - INFO - __main__ - Step 27344: {'lr': 0.0004646895369258345, 'samples': 5250048, 'steps': 27343, 'loss/train': 1.6821507215499878} -11/07/2021 01:03:33 - INFO - __main__ - Step 27345: {'lr': 0.00046468681780169086, 'samples': 5250240, 'steps': 27344, 'loss/train': 1.6495689153671265} -11/07/2021 01:03:34 - INFO - __main__ - Step 27346: {'lr': 0.0004646840985808126, 'samples': 5250432, 'steps': 27345, 'loss/train': 1.566925287246704} -11/07/2021 01:03:35 - INFO - __main__ - Step 27347: {'lr': 0.0004646813792632011, 'samples': 5250624, 'steps': 27346, 'loss/train': 1.3244365453720093} -11/07/2021 01:03:35 - INFO - __main__ - Step 27348: {'lr': 0.00046467865984885736, 'samples': 5250816, 'steps': 27347, 'loss/train': 1.6940046548843384} -11/07/2021 01:03:35 - INFO - __main__ - Step 27349: {'lr': 0.0004646759403377828, 'samples': 5251008, 'steps': 27348, 'loss/train': 1.6910820007324219} -11/07/2021 01:03:36 - INFO - __main__ - Step 27350: {'lr': 0.00046467322072997865, 'samples': 5251200, 'steps': 27349, 'loss/train': 1.679405689239502} -11/07/2021 01:03:36 - INFO - __main__ - Step 27351: {'lr': 0.00046467050102544594, 'samples': 5251392, 'steps': 27350, 'loss/train': 1.8179465532302856} -11/07/2021 01:03:37 - INFO - __main__ - Step 27352: {'lr': 0.0004646677812241861, 'samples': 5251584, 'steps': 27351, 'loss/train': 1.789126992225647} -11/07/2021 01:03:37 - INFO - __main__ - Step 27353: {'lr': 0.0004646650613262001, 'samples': 5251776, 'steps': 27352, 'loss/train': 1.3540021181106567} -11/07/2021 01:03:38 - INFO - __main__ - Step 27354: {'lr': 0.00046466234133148957, 'samples': 5251968, 'steps': 27353, 'loss/train': 1.5730952024459839} -11/07/2021 01:03:38 - INFO - __main__ - Step 27355: {'lr': 0.00046465962124005535, 'samples': 5252160, 'steps': 27354, 'loss/train': 1.4978750944137573} -11/07/2021 01:03:38 - INFO - __main__ - Step 27356: {'lr': 0.0004646569010518988, 'samples': 5252352, 'steps': 27355, 'loss/train': 1.8019400835037231} -11/07/2021 01:03:40 - INFO - __main__ - Step 27357: {'lr': 0.00046465418076702125, 'samples': 5252544, 'steps': 27356, 'loss/train': 1.7005836963653564} -11/07/2021 01:03:40 - INFO - __main__ - Step 27358: {'lr': 0.00046465146038542375, 'samples': 5252736, 'steps': 27357, 'loss/train': 1.577629566192627} -11/07/2021 01:03:40 - INFO - __main__ - Step 27359: {'lr': 0.0004646487399071077, 'samples': 5252928, 'steps': 27358, 'loss/train': 1.6958972215652466} -11/07/2021 01:03:41 - INFO - __main__ - Step 27360: {'lr': 0.00046464601933207417, 'samples': 5253120, 'steps': 27359, 'loss/train': 1.4246464967727661} -11/07/2021 01:03:41 - INFO - __main__ - Step 27361: {'lr': 0.0004646432986603245, 'samples': 5253312, 'steps': 27360, 'loss/train': 1.8367726802825928} -11/07/2021 01:03:41 - INFO - __main__ - Step 27362: {'lr': 0.00046464057789185985, 'samples': 5253504, 'steps': 27361, 'loss/train': 1.778257966041565} -11/07/2021 01:03:42 - INFO - __main__ - Step 27363: {'lr': 0.00046463785702668156, 'samples': 5253696, 'steps': 27362, 'loss/train': 1.8035478591918945} -11/07/2021 01:03:43 - INFO - __main__ - Step 27364: {'lr': 0.0004646351360647907, 'samples': 5253888, 'steps': 27363, 'loss/train': 1.9287103414535522} -11/07/2021 01:03:43 - INFO - __main__ - Step 27365: {'lr': 0.00046463241500618846, 'samples': 5254080, 'steps': 27364, 'loss/train': 1.322129249572754} -11/07/2021 01:03:43 - INFO - __main__ - Step 27366: {'lr': 0.00046462969385087626, 'samples': 5254272, 'steps': 27365, 'loss/train': 1.7644007205963135} -11/07/2021 01:03:44 - INFO - __main__ - Step 27367: {'lr': 0.00046462697259885523, 'samples': 5254464, 'steps': 27366, 'loss/train': 2.6626901626586914} -11/07/2021 01:03:45 - INFO - __main__ - Step 27368: {'lr': 0.0004646242512501266, 'samples': 5254656, 'steps': 27367, 'loss/train': 1.7474702596664429} -11/07/2021 01:03:45 - INFO - __main__ - Step 27369: {'lr': 0.0004646215298046916, 'samples': 5254848, 'steps': 27368, 'loss/train': 1.823857307434082} -11/07/2021 01:03:45 - INFO - __main__ - Step 27370: {'lr': 0.00046461880826255143, 'samples': 5255040, 'steps': 27369, 'loss/train': 1.2764437198638916} -11/07/2021 01:03:46 - INFO - __main__ - Step 27371: {'lr': 0.00046461608662370734, 'samples': 5255232, 'steps': 27370, 'loss/train': 1.5031490325927734} -11/07/2021 01:03:46 - INFO - __main__ - Step 27372: {'lr': 0.0004646133648881606, 'samples': 5255424, 'steps': 27371, 'loss/train': 1.596226692199707} -11/07/2021 01:03:47 - INFO - __main__ - Step 27373: {'lr': 0.00046461064305591235, 'samples': 5255616, 'steps': 27372, 'loss/train': 1.7974703311920166} -11/07/2021 01:03:48 - INFO - __main__ - Step 27374: {'lr': 0.00046460792112696384, 'samples': 5255808, 'steps': 27373, 'loss/train': 1.4550420045852661} -11/07/2021 01:03:48 - INFO - __main__ - Step 27375: {'lr': 0.0004646051991013163, 'samples': 5256000, 'steps': 27374, 'loss/train': 2.2443268299102783} -11/07/2021 01:03:48 - INFO - __main__ - Step 27376: {'lr': 0.000464602476978971, 'samples': 5256192, 'steps': 27375, 'loss/train': 1.6068828105926514} -11/07/2021 01:03:49 - INFO - __main__ - Step 27377: {'lr': 0.00046459975475992914, 'samples': 5256384, 'steps': 27376, 'loss/train': 1.4636454582214355} -11/07/2021 01:03:50 - INFO - __main__ - Step 27378: {'lr': 0.00046459703244419194, 'samples': 5256576, 'steps': 27377, 'loss/train': 1.7761300802230835} -11/07/2021 01:03:50 - INFO - __main__ - Step 27379: {'lr': 0.0004645943100317606, 'samples': 5256768, 'steps': 27378, 'loss/train': 1.193964958190918} -11/07/2021 01:03:50 - INFO - __main__ - Step 27380: {'lr': 0.00046459158752263643, 'samples': 5256960, 'steps': 27379, 'loss/train': 1.663011908531189} -11/07/2021 01:03:51 - INFO - __main__ - Step 27381: {'lr': 0.0004645888649168205, 'samples': 5257152, 'steps': 27380, 'loss/train': 1.6378246545791626} -11/07/2021 01:03:51 - INFO - __main__ - Step 27382: {'lr': 0.0004645861422143143, 'samples': 5257344, 'steps': 27381, 'loss/train': 2.5152504444122314} -11/07/2021 01:03:52 - INFO - __main__ - Step 27383: {'lr': 0.0004645834194151187, 'samples': 5257536, 'steps': 27382, 'loss/train': 1.734678030014038} -11/07/2021 01:03:53 - INFO - __main__ - Step 27384: {'lr': 0.0004645806965192353, 'samples': 5257728, 'steps': 27383, 'loss/train': 0.6871659159660339} -11/07/2021 01:03:53 - INFO - __main__ - Step 27385: {'lr': 0.000464577973526665, 'samples': 5257920, 'steps': 27384, 'loss/train': 1.138061761856079} -11/07/2021 01:03:53 - INFO - __main__ - Step 27386: {'lr': 0.00046457525043740926, 'samples': 5258112, 'steps': 27385, 'loss/train': 1.6762138605117798} -11/07/2021 01:03:54 - INFO - __main__ - Step 27387: {'lr': 0.0004645725272514693, 'samples': 5258304, 'steps': 27386, 'loss/train': 1.5222851037979126} -11/07/2021 01:03:55 - INFO - __main__ - Step 27388: {'lr': 0.0004645698039688461, 'samples': 5258496, 'steps': 27387, 'loss/train': 1.952163815498352} -11/07/2021 01:03:55 - INFO - __main__ - Step 27389: {'lr': 0.00046456708058954116, 'samples': 5258688, 'steps': 27388, 'loss/train': 1.1741615533828735} -11/07/2021 01:03:55 - INFO - __main__ - Step 27390: {'lr': 0.0004645643571135556, 'samples': 5258880, 'steps': 27389, 'loss/train': 1.7031134366989136} -11/07/2021 01:03:56 - INFO - __main__ - Step 27391: {'lr': 0.00046456163354089065, 'samples': 5259072, 'steps': 27390, 'loss/train': 1.7008723020553589} -11/07/2021 01:03:56 - INFO - __main__ - Step 27392: {'lr': 0.00046455890987154747, 'samples': 5259264, 'steps': 27391, 'loss/train': 1.5040371417999268} -11/07/2021 01:03:56 - INFO - __main__ - Step 27393: {'lr': 0.0004645561861055274, 'samples': 5259456, 'steps': 27392, 'loss/train': 0.9468610882759094} -11/07/2021 01:03:58 - INFO - __main__ - Step 27394: {'lr': 0.00046455346224283167, 'samples': 5259648, 'steps': 27393, 'loss/train': 1.3570585250854492} -11/07/2021 01:03:58 - INFO - __main__ - Step 27395: {'lr': 0.00046455073828346137, 'samples': 5259840, 'steps': 27394, 'loss/train': 1.878167748451233} -11/07/2021 01:03:58 - INFO - __main__ - Step 27396: {'lr': 0.0004645480142274179, 'samples': 5260032, 'steps': 27395, 'loss/train': 1.4309208393096924} -11/07/2021 01:03:59 - INFO - __main__ - Step 27397: {'lr': 0.0004645452900747024, 'samples': 5260224, 'steps': 27396, 'loss/train': 0.8551251888275146} -11/07/2021 01:03:59 - INFO - __main__ - Step 27398: {'lr': 0.00046454256582531604, 'samples': 5260416, 'steps': 27397, 'loss/train': 1.6647512912750244} -11/07/2021 01:04:00 - INFO - __main__ - Step 27399: {'lr': 0.0004645398414792602, 'samples': 5260608, 'steps': 27398, 'loss/train': 1.1795614957809448} -11/07/2021 01:04:00 - INFO - __main__ - Step 27400: {'lr': 0.000464537117036536, 'samples': 5260800, 'steps': 27399, 'loss/train': 1.4849789142608643} -11/07/2021 01:04:01 - INFO - __main__ - Step 27401: {'lr': 0.00046453439249714466, 'samples': 5260992, 'steps': 27400, 'loss/train': 1.4565329551696777} -11/07/2021 01:04:01 - INFO - __main__ - Step 27402: {'lr': 0.00046453166786108736, 'samples': 5261184, 'steps': 27401, 'loss/train': 1.5868231058120728} -11/07/2021 01:04:01 - INFO - __main__ - Step 27403: {'lr': 0.00046452894312836547, 'samples': 5261376, 'steps': 27402, 'loss/train': 1.570541501045227} -11/07/2021 01:04:03 - INFO - __main__ - Step 27404: {'lr': 0.0004645262182989802, 'samples': 5261568, 'steps': 27403, 'loss/train': 1.6559795141220093} -11/07/2021 01:04:03 - INFO - __main__ - Step 27405: {'lr': 0.0004645234933729327, 'samples': 5261760, 'steps': 27404, 'loss/train': 4.920253753662109} -11/07/2021 01:04:03 - INFO - __main__ - Step 27406: {'lr': 0.00046452076835022416, 'samples': 5261952, 'steps': 27405, 'loss/train': 2.2183635234832764} -11/07/2021 01:04:04 - INFO - __main__ - Step 27407: {'lr': 0.0004645180432308559, 'samples': 5262144, 'steps': 27406, 'loss/train': 1.607749104499817} -11/07/2021 01:04:04 - INFO - __main__ - Step 27408: {'lr': 0.00046451531801482913, 'samples': 5262336, 'steps': 27407, 'loss/train': 1.6804707050323486} -11/07/2021 01:04:04 - INFO - __main__ - Step 27409: {'lr': 0.00046451259270214505, 'samples': 5262528, 'steps': 27408, 'loss/train': 1.7157375812530518} -11/07/2021 01:04:05 - INFO - __main__ - Step 27410: {'lr': 0.00046450986729280495, 'samples': 5262720, 'steps': 27409, 'loss/train': 0.6833308339118958} -11/07/2021 01:04:06 - INFO - __main__ - Step 27411: {'lr': 0.00046450714178680996, 'samples': 5262912, 'steps': 27410, 'loss/train': 1.1192928552627563} -11/07/2021 01:04:06 - INFO - __main__ - Step 27412: {'lr': 0.0004645044161841614, 'samples': 5263104, 'steps': 27411, 'loss/train': 1.5120153427124023} -11/07/2021 01:04:07 - INFO - __main__ - Step 27413: {'lr': 0.00046450169048486045, 'samples': 5263296, 'steps': 27412, 'loss/train': 1.5773380994796753} -11/07/2021 01:04:07 - INFO - __main__ - Step 27414: {'lr': 0.0004644989646889084, 'samples': 5263488, 'steps': 27413, 'loss/train': 1.3461500406265259} -11/07/2021 01:04:08 - INFO - __main__ - Step 27415: {'lr': 0.0004644962387963063, 'samples': 5263680, 'steps': 27414, 'loss/train': 1.4467198848724365} -11/07/2021 01:04:08 - INFO - __main__ - Step 27416: {'lr': 0.0004644935128070556, 'samples': 5263872, 'steps': 27415, 'loss/train': 0.9525635242462158} -11/07/2021 01:04:09 - INFO - __main__ - Step 27417: {'lr': 0.0004644907867211574, 'samples': 5264064, 'steps': 27416, 'loss/train': 2.4026198387145996} -11/07/2021 01:04:09 - INFO - __main__ - Step 27418: {'lr': 0.000464488060538613, 'samples': 5264256, 'steps': 27417, 'loss/train': 1.6511754989624023} -11/07/2021 01:04:09 - INFO - __main__ - Step 27419: {'lr': 0.0004644853342594235, 'samples': 5264448, 'steps': 27418, 'loss/train': 1.9703359603881836} -11/07/2021 01:04:10 - INFO - __main__ - Step 27420: {'lr': 0.0004644826078835903, 'samples': 5264640, 'steps': 27419, 'loss/train': 1.7109949588775635} -11/07/2021 01:04:11 - INFO - __main__ - Step 27421: {'lr': 0.00046447988141111457, 'samples': 5264832, 'steps': 27420, 'loss/train': 1.3898118734359741} -11/07/2021 01:04:11 - INFO - __main__ - Step 27422: {'lr': 0.0004644771548419975, 'samples': 5265024, 'steps': 27421, 'loss/train': 1.4866039752960205} -11/07/2021 01:04:11 - INFO - __main__ - Step 27423: {'lr': 0.0004644744281762403, 'samples': 5265216, 'steps': 27422, 'loss/train': 1.669671893119812} -11/07/2021 01:04:12 - INFO - __main__ - Step 27424: {'lr': 0.0004644717014138442, 'samples': 5265408, 'steps': 27423, 'loss/train': 2.594538450241089} -11/07/2021 01:04:13 - INFO - __main__ - Step 27425: {'lr': 0.0004644689745548105, 'samples': 5265600, 'steps': 27424, 'loss/train': 1.887316346168518} -11/07/2021 01:04:13 - INFO - __main__ - Step 27426: {'lr': 0.00046446624759914043, 'samples': 5265792, 'steps': 27425, 'loss/train': 1.6005641222000122} -11/07/2021 01:04:14 - INFO - __main__ - Step 27427: {'lr': 0.0004644635205468351, 'samples': 5265984, 'steps': 27426, 'loss/train': 1.8438071012496948} -11/07/2021 01:04:14 - INFO - __main__ - Step 27428: {'lr': 0.00046446079339789587, 'samples': 5266176, 'steps': 27427, 'loss/train': 1.7589665651321411} -11/07/2021 01:04:14 - INFO - __main__ - Step 27429: {'lr': 0.0004644580661523239, 'samples': 5266368, 'steps': 27428, 'loss/train': 1.9420253038406372} -11/07/2021 01:04:15 - INFO - __main__ - Step 27430: {'lr': 0.00046445533881012043, 'samples': 5266560, 'steps': 27429, 'loss/train': 1.7142422199249268} -11/07/2021 01:04:16 - INFO - __main__ - Step 27431: {'lr': 0.0004644526113712867, 'samples': 5266752, 'steps': 27430, 'loss/train': 1.6149872541427612} -11/07/2021 01:04:16 - INFO - __main__ - Step 27432: {'lr': 0.00046444988383582394, 'samples': 5266944, 'steps': 27431, 'loss/train': 1.6525791883468628} -11/07/2021 01:04:16 - INFO - __main__ - Step 27433: {'lr': 0.0004644471562037333, 'samples': 5267136, 'steps': 27432, 'loss/train': 1.556830644607544} -11/07/2021 01:04:17 - INFO - __main__ - Step 27434: {'lr': 0.0004644444284750162, 'samples': 5267328, 'steps': 27433, 'loss/train': 1.8048747777938843} -11/07/2021 01:04:17 - INFO - __main__ - Step 27435: {'lr': 0.0004644417006496737, 'samples': 5267520, 'steps': 27434, 'loss/train': 1.553612470626831} -11/07/2021 01:04:18 - INFO - __main__ - Step 27436: {'lr': 0.0004644389727277071, 'samples': 5267712, 'steps': 27435, 'loss/train': 1.6055339574813843} -11/07/2021 01:04:19 - INFO - __main__ - Step 27437: {'lr': 0.00046443624470911754, 'samples': 5267904, 'steps': 27436, 'loss/train': 1.7883402109146118} -11/07/2021 01:04:19 - INFO - __main__ - Step 27438: {'lr': 0.00046443351659390637, 'samples': 5268096, 'steps': 27437, 'loss/train': 1.3733422756195068} -11/07/2021 01:04:19 - INFO - __main__ - Step 27439: {'lr': 0.00046443078838207474, 'samples': 5268288, 'steps': 27438, 'loss/train': 1.651326298713684} -11/07/2021 01:04:20 - INFO - __main__ - Step 27440: {'lr': 0.00046442806007362394, 'samples': 5268480, 'steps': 27439, 'loss/train': 1.7419207096099854} -11/07/2021 01:04:21 - INFO - __main__ - Step 27441: {'lr': 0.00046442533166855517, 'samples': 5268672, 'steps': 27440, 'loss/train': 1.782727837562561} -11/07/2021 01:04:21 - INFO - __main__ - Step 27442: {'lr': 0.00046442260316686957, 'samples': 5268864, 'steps': 27441, 'loss/train': 1.3582515716552734} -11/07/2021 01:04:22 - INFO - __main__ - Step 27443: {'lr': 0.0004644198745685685, 'samples': 5269056, 'steps': 27442, 'loss/train': 1.7487573623657227} -11/07/2021 01:04:22 - INFO - __main__ - Step 27444: {'lr': 0.00046441714587365317, 'samples': 5269248, 'steps': 27443, 'loss/train': 1.5707968473434448} -11/07/2021 01:04:22 - INFO - __main__ - Step 27445: {'lr': 0.00046441441708212477, 'samples': 5269440, 'steps': 27444, 'loss/train': 1.8958215713500977} -11/07/2021 01:04:23 - INFO - __main__ - Step 27446: {'lr': 0.00046441168819398457, 'samples': 5269632, 'steps': 27445, 'loss/train': 1.5987136363983154} -11/07/2021 01:04:24 - INFO - __main__ - Step 27447: {'lr': 0.0004644089592092338, 'samples': 5269824, 'steps': 27446, 'loss/train': 1.5505801439285278} -11/07/2021 01:04:24 - INFO - __main__ - Step 27448: {'lr': 0.0004644062301278735, 'samples': 5270016, 'steps': 27447, 'loss/train': 1.6309155225753784} -11/07/2021 01:04:24 - INFO - __main__ - Step 27449: {'lr': 0.0004644035009499052, 'samples': 5270208, 'steps': 27448, 'loss/train': 1.9587770700454712} -11/07/2021 01:04:25 - INFO - __main__ - Step 27450: {'lr': 0.0004644007716753299, 'samples': 5270400, 'steps': 27449, 'loss/train': 2.0377914905548096} -11/07/2021 01:04:26 - INFO - __main__ - Step 27451: {'lr': 0.00046439804230414904, 'samples': 5270592, 'steps': 27450, 'loss/train': 1.4115687608718872} -11/07/2021 01:04:26 - INFO - __main__ - Step 27452: {'lr': 0.0004643953128363637, 'samples': 5270784, 'steps': 27451, 'loss/train': 1.5786956548690796} -11/07/2021 01:04:27 - INFO - __main__ - Step 27453: {'lr': 0.0004643925832719751, 'samples': 5270976, 'steps': 27452, 'loss/train': 1.5803961753845215} -11/07/2021 01:04:27 - INFO - __main__ - Step 27454: {'lr': 0.0004643898536109845, 'samples': 5271168, 'steps': 27453, 'loss/train': 1.38846755027771} -11/07/2021 01:04:27 - INFO - __main__ - Step 27455: {'lr': 0.0004643871238533931, 'samples': 5271360, 'steps': 27454, 'loss/train': 1.9401226043701172} -11/07/2021 01:04:28 - INFO - __main__ - Step 27456: {'lr': 0.0004643843939992022, 'samples': 5271552, 'steps': 27455, 'loss/train': 1.8082693815231323} -11/07/2021 01:04:29 - INFO - __main__ - Step 27457: {'lr': 0.0004643816640484131, 'samples': 5271744, 'steps': 27456, 'loss/train': 1.6021026372909546} -11/07/2021 01:04:29 - INFO - __main__ - Step 27458: {'lr': 0.0004643789340010268, 'samples': 5271936, 'steps': 27457, 'loss/train': 1.9755364656448364} -11/07/2021 01:04:29 - INFO - __main__ - Step 27459: {'lr': 0.00046437620385704476, 'samples': 5272128, 'steps': 27458, 'loss/train': 0.6707550287246704} -11/07/2021 01:04:30 - INFO - __main__ - Step 27460: {'lr': 0.0004643734736164681, 'samples': 5272320, 'steps': 27459, 'loss/train': 2.275068998336792} -11/07/2021 01:04:30 - INFO - __main__ - Step 27461: {'lr': 0.00046437074327929795, 'samples': 5272512, 'steps': 27460, 'loss/train': 1.1870478391647339} -11/07/2021 01:04:31 - INFO - __main__ - Step 27462: {'lr': 0.0004643680128455358, 'samples': 5272704, 'steps': 27461, 'loss/train': 1.5905396938323975} -11/07/2021 01:04:31 - INFO - __main__ - Step 27463: {'lr': 0.00046436528231518263, 'samples': 5272896, 'steps': 27462, 'loss/train': 1.551306128501892} -11/07/2021 01:04:32 - INFO - __main__ - Step 27464: {'lr': 0.0004643625516882398, 'samples': 5273088, 'steps': 27463, 'loss/train': 1.5059658288955688} -11/07/2021 01:04:32 - INFO - __main__ - Step 27465: {'lr': 0.0004643598209647085, 'samples': 5273280, 'steps': 27464, 'loss/train': 1.6166335344314575} -11/07/2021 01:04:32 - INFO - __main__ - Step 27466: {'lr': 0.00046435709014459, 'samples': 5273472, 'steps': 27465, 'loss/train': 1.4816384315490723} -11/07/2021 01:04:34 - INFO - __main__ - Step 27467: {'lr': 0.0004643543592278855, 'samples': 5273664, 'steps': 27466, 'loss/train': 0.9950994253158569} -11/07/2021 01:04:34 - INFO - __main__ - Step 27468: {'lr': 0.0004643516282145962, 'samples': 5273856, 'steps': 27467, 'loss/train': 2.083305835723877} -11/07/2021 01:04:34 - INFO - __main__ - Step 27469: {'lr': 0.0004643488971047234, 'samples': 5274048, 'steps': 27468, 'loss/train': 1.0330928564071655} -11/07/2021 01:04:35 - INFO - __main__ - Step 27470: {'lr': 0.0004643461658982683, 'samples': 5274240, 'steps': 27469, 'loss/train': 1.721252202987671} -11/07/2021 01:04:35 - INFO - __main__ - Step 27471: {'lr': 0.00046434343459523207, 'samples': 5274432, 'steps': 27470, 'loss/train': 1.5718274116516113} -11/07/2021 01:04:36 - INFO - __main__ - Step 27472: {'lr': 0.00046434070319561604, 'samples': 5274624, 'steps': 27471, 'loss/train': 1.4991551637649536} -11/07/2021 01:04:36 - INFO - __main__ - Step 27473: {'lr': 0.0004643379716994214, 'samples': 5274816, 'steps': 27472, 'loss/train': 1.754794955253601} -11/07/2021 01:04:37 - INFO - __main__ - Step 27474: {'lr': 0.0004643352401066494, 'samples': 5275008, 'steps': 27473, 'loss/train': 1.6142194271087646} -11/07/2021 01:04:37 - INFO - __main__ - Step 27475: {'lr': 0.00046433250841730123, 'samples': 5275200, 'steps': 27474, 'loss/train': 1.5695093870162964} -11/07/2021 01:04:37 - INFO - __main__ - Step 27476: {'lr': 0.0004643297766313781, 'samples': 5275392, 'steps': 27475, 'loss/train': 0.8923225402832031} -11/07/2021 01:04:39 - INFO - __main__ - Step 27477: {'lr': 0.0004643270447488813, 'samples': 5275584, 'steps': 27476, 'loss/train': 1.443546175956726} -11/07/2021 01:04:39 - INFO - __main__ - Step 27478: {'lr': 0.000464324312769812, 'samples': 5275776, 'steps': 27477, 'loss/train': 1.7197577953338623} -11/07/2021 01:04:39 - INFO - __main__ - Step 27479: {'lr': 0.0004643215806941716, 'samples': 5275968, 'steps': 27478, 'loss/train': 1.650207281112671} -11/07/2021 01:04:40 - INFO - __main__ - Step 27480: {'lr': 0.00046431884852196105, 'samples': 5276160, 'steps': 27479, 'loss/train': 1.3830845355987549} -11/07/2021 01:04:40 - INFO - __main__ - Step 27481: {'lr': 0.0004643161162531818, 'samples': 5276352, 'steps': 27480, 'loss/train': 1.2445502281188965} -11/07/2021 01:04:41 - INFO - __main__ - Step 27482: {'lr': 0.00046431338388783504, 'samples': 5276544, 'steps': 27481, 'loss/train': 0.7495806813240051} -11/07/2021 01:04:41 - INFO - __main__ - Step 27483: {'lr': 0.000464310651425922, 'samples': 5276736, 'steps': 27482, 'loss/train': 1.5686403512954712} -11/07/2021 01:04:42 - INFO - __main__ - Step 27484: {'lr': 0.00046430791886744384, 'samples': 5276928, 'steps': 27483, 'loss/train': 1.2439922094345093} -11/07/2021 01:04:42 - INFO - __main__ - Step 27485: {'lr': 0.0004643051862124018, 'samples': 5277120, 'steps': 27484, 'loss/train': 1.5504546165466309} -11/07/2021 01:04:42 - INFO - __main__ - Step 27486: {'lr': 0.0004643024534607973, 'samples': 5277312, 'steps': 27485, 'loss/train': 1.6598097085952759} -11/07/2021 01:04:43 - INFO - __main__ - Step 27487: {'lr': 0.00046429972061263125, 'samples': 5277504, 'steps': 27486, 'loss/train': 1.5114681720733643} -11/07/2021 01:04:44 - INFO - __main__ - Step 27488: {'lr': 0.0004642969876679051, 'samples': 5277696, 'steps': 27487, 'loss/train': 1.344405174255371} -11/07/2021 01:04:44 - INFO - __main__ - Step 27489: {'lr': 0.00046429425462662, 'samples': 5277888, 'steps': 27488, 'loss/train': 1.8302743434906006} -11/07/2021 01:04:44 - INFO - __main__ - Step 27490: {'lr': 0.00046429152148877727, 'samples': 5278080, 'steps': 27489, 'loss/train': 1.5790754556655884} -11/07/2021 01:04:45 - INFO - __main__ - Step 27491: {'lr': 0.00046428878825437815, 'samples': 5278272, 'steps': 27490, 'loss/train': 1.4722696542739868} -11/07/2021 01:04:45 - INFO - __main__ - Step 27492: {'lr': 0.00046428605492342367, 'samples': 5278464, 'steps': 27491, 'loss/train': 1.368982195854187} -11/07/2021 01:04:46 - INFO - __main__ - Step 27493: {'lr': 0.00046428332149591535, 'samples': 5278656, 'steps': 27492, 'loss/train': 1.5615782737731934} -11/07/2021 01:04:47 - INFO - __main__ - Step 27494: {'lr': 0.0004642805879718541, 'samples': 5278848, 'steps': 27493, 'loss/train': 0.2677178680896759} -11/07/2021 01:04:47 - INFO - __main__ - Step 27495: {'lr': 0.00046427785435124147, 'samples': 5279040, 'steps': 27494, 'loss/train': 1.5332293510437012} -11/07/2021 01:04:47 - INFO - __main__ - Step 27496: {'lr': 0.0004642751206340785, 'samples': 5279232, 'steps': 27495, 'loss/train': 1.7823522090911865} -11/07/2021 01:04:48 - INFO - __main__ - Step 27497: {'lr': 0.00046427238682036643, 'samples': 5279424, 'steps': 27496, 'loss/train': 1.2205898761749268} -11/07/2021 01:04:49 - INFO - __main__ - Step 27498: {'lr': 0.0004642696529101066, 'samples': 5279616, 'steps': 27497, 'loss/train': 1.7394107580184937} -11/07/2021 01:04:49 - INFO - __main__ - Step 27499: {'lr': 0.0004642669189033001, 'samples': 5279808, 'steps': 27498, 'loss/train': 1.6603978872299194} -11/07/2021 01:04:49 - INFO - __main__ - Step 27500: {'lr': 0.0004642641847999483, 'samples': 5280000, 'steps': 27499, 'loss/train': 1.5572772026062012} -11/07/2021 01:04:50 - INFO - __main__ - Step 27501: {'lr': 0.0004642614506000523, 'samples': 5280192, 'steps': 27500, 'loss/train': 1.5926954746246338} -11/07/2021 01:04:50 - INFO - __main__ - Step 27502: {'lr': 0.00046425871630361343, 'samples': 5280384, 'steps': 27501, 'loss/train': 1.7171363830566406} -11/07/2021 01:04:51 - INFO - __main__ - Step 27503: {'lr': 0.0004642559819106329, 'samples': 5280576, 'steps': 27502, 'loss/train': 1.238904595375061} -11/07/2021 01:04:51 - INFO - __main__ - Step 27504: {'lr': 0.0004642532474211119, 'samples': 5280768, 'steps': 27503, 'loss/train': 1.410136103630066} -11/07/2021 01:04:52 - INFO - __main__ - Step 27505: {'lr': 0.0004642505128350517, 'samples': 5280960, 'steps': 27504, 'loss/train': 1.3256465196609497} -11/07/2021 01:04:52 - INFO - __main__ - Step 27506: {'lr': 0.00046424777815245354, 'samples': 5281152, 'steps': 27505, 'loss/train': 3.3891711235046387} -11/07/2021 01:04:52 - INFO - __main__ - Step 27507: {'lr': 0.0004642450433733186, 'samples': 5281344, 'steps': 27506, 'loss/train': 1.6674591302871704} -11/07/2021 01:04:54 - INFO - __main__ - Step 27508: {'lr': 0.0004642423084976482, 'samples': 5281536, 'steps': 27507, 'loss/train': 1.3353351354599} -11/07/2021 01:04:54 - INFO - __main__ - Step 27509: {'lr': 0.0004642395735254435, 'samples': 5281728, 'steps': 27508, 'loss/train': 1.587765097618103} -11/07/2021 01:04:54 - INFO - __main__ - Step 27510: {'lr': 0.0004642368384567058, 'samples': 5281920, 'steps': 27509, 'loss/train': 1.5925922393798828} -11/07/2021 01:04:55 - INFO - __main__ - Step 27511: {'lr': 0.0004642341032914362, 'samples': 5282112, 'steps': 27510, 'loss/train': 1.5339746475219727} -11/07/2021 01:04:55 - INFO - __main__ - Step 27512: {'lr': 0.00046423136802963607, 'samples': 5282304, 'steps': 27511, 'loss/train': 1.8380541801452637} -11/07/2021 01:04:56 - INFO - __main__ - Step 27513: {'lr': 0.0004642286326713065, 'samples': 5282496, 'steps': 27512, 'loss/train': 1.510982871055603} -11/07/2021 01:04:56 - INFO - __main__ - Step 27514: {'lr': 0.000464225897216449, 'samples': 5282688, 'steps': 27513, 'loss/train': 1.748958945274353} -11/07/2021 01:04:57 - INFO - __main__ - Step 27515: {'lr': 0.0004642231616650645, 'samples': 5282880, 'steps': 27514, 'loss/train': 1.3821334838867188} -11/07/2021 01:04:57 - INFO - __main__ - Step 27516: {'lr': 0.00046422042601715433, 'samples': 5283072, 'steps': 27515, 'loss/train': 1.5916210412979126} -11/07/2021 01:04:57 - INFO - __main__ - Step 27517: {'lr': 0.00046421769027271974, 'samples': 5283264, 'steps': 27516, 'loss/train': 1.6284141540527344} -11/07/2021 01:04:58 - INFO - __main__ - Step 27518: {'lr': 0.00046421495443176204, 'samples': 5283456, 'steps': 27517, 'loss/train': 1.2993590831756592} -11/07/2021 01:04:59 - INFO - __main__ - Step 27519: {'lr': 0.0004642122184942824, 'samples': 5283648, 'steps': 27518, 'loss/train': 1.648287296295166} -11/07/2021 01:04:59 - INFO - __main__ - Step 27520: {'lr': 0.00046420948246028194, 'samples': 5283840, 'steps': 27519, 'loss/train': 1.5649181604385376} -11/07/2021 01:05:00 - INFO - __main__ - Step 27521: {'lr': 0.000464206746329762, 'samples': 5284032, 'steps': 27520, 'loss/train': 1.5230170488357544} -11/07/2021 01:05:00 - INFO - __main__ - Step 27522: {'lr': 0.00046420401010272385, 'samples': 5284224, 'steps': 27521, 'loss/train': 1.478598952293396} -11/07/2021 01:05:00 - INFO - __main__ - Step 27523: {'lr': 0.00046420127377916863, 'samples': 5284416, 'steps': 27522, 'loss/train': 1.6656675338745117} -11/07/2021 01:05:01 - INFO - __main__ - Step 27524: {'lr': 0.0004641985373590977, 'samples': 5284608, 'steps': 27523, 'loss/train': 0.9977850914001465} -11/07/2021 01:05:02 - INFO - __main__ - Step 27525: {'lr': 0.00046419580084251224, 'samples': 5284800, 'steps': 27524, 'loss/train': 1.8102953433990479} -11/07/2021 01:05:02 - INFO - __main__ - Step 27526: {'lr': 0.0004641930642294133, 'samples': 5284992, 'steps': 27525, 'loss/train': 1.6369602680206299} -11/07/2021 01:05:02 - INFO - __main__ - Step 27527: {'lr': 0.0004641903275198024, 'samples': 5285184, 'steps': 27526, 'loss/train': 0.6573544144630432} -11/07/2021 01:05:03 - INFO - __main__ - Step 27528: {'lr': 0.0004641875907136806, 'samples': 5285376, 'steps': 27527, 'loss/train': 1.3041669130325317} -11/07/2021 01:05:04 - INFO - __main__ - Step 27529: {'lr': 0.0004641848538110492, 'samples': 5285568, 'steps': 27528, 'loss/train': 1.6319307088851929} -11/07/2021 01:05:04 - INFO - __main__ - Step 27530: {'lr': 0.00046418211681190937, 'samples': 5285760, 'steps': 27529, 'loss/train': 1.5995657444000244} -11/07/2021 01:05:05 - INFO - __main__ - Step 27531: {'lr': 0.00046417937971626245, 'samples': 5285952, 'steps': 27530, 'loss/train': 1.3074729442596436} -11/07/2021 01:05:05 - INFO - __main__ - Step 27532: {'lr': 0.0004641766425241095, 'samples': 5286144, 'steps': 27531, 'loss/train': 1.555513858795166} -11/07/2021 01:05:05 - INFO - __main__ - Step 27533: {'lr': 0.000464173905235452, 'samples': 5286336, 'steps': 27532, 'loss/train': 1.5921692848205566} -11/07/2021 01:05:06 - INFO - __main__ - Step 27534: {'lr': 0.0004641711678502909, 'samples': 5286528, 'steps': 27533, 'loss/train': 1.369351863861084} -11/07/2021 01:05:07 - INFO - __main__ - Step 27535: {'lr': 0.00046416843036862766, 'samples': 5286720, 'steps': 27534, 'loss/train': 1.361032485961914} -11/07/2021 01:05:07 - INFO - __main__ - Step 27536: {'lr': 0.0004641656927904634, 'samples': 5286912, 'steps': 27535, 'loss/train': 1.411777377128601} -11/07/2021 01:05:07 - INFO - __main__ - Step 27537: {'lr': 0.00046416295511579944, 'samples': 5287104, 'steps': 27536, 'loss/train': 2.0430092811584473} -11/07/2021 01:05:08 - INFO - __main__ - Step 27538: {'lr': 0.0004641602173446369, 'samples': 5287296, 'steps': 27537, 'loss/train': 1.117910623550415} -11/07/2021 01:05:09 - INFO - __main__ - Step 27539: {'lr': 0.00046415747947697704, 'samples': 5287488, 'steps': 27538, 'loss/train': 1.8439534902572632} -11/07/2021 01:05:09 - INFO - __main__ - Step 27540: {'lr': 0.00046415474151282124, 'samples': 5287680, 'steps': 27539, 'loss/train': 2.1135165691375732} -11/07/2021 01:05:10 - INFO - __main__ - Step 27541: {'lr': 0.0004641520034521705, 'samples': 5287872, 'steps': 27540, 'loss/train': 1.5234469175338745} -11/07/2021 01:05:10 - INFO - __main__ - Step 27542: {'lr': 0.0004641492652950262, 'samples': 5288064, 'steps': 27541, 'loss/train': 1.8389887809753418} -11/07/2021 01:05:10 - INFO - __main__ - Step 27543: {'lr': 0.0004641465270413896, 'samples': 5288256, 'steps': 27542, 'loss/train': 0.9904304146766663} -11/07/2021 01:05:12 - INFO - __main__ - Step 27544: {'lr': 0.00046414378869126185, 'samples': 5288448, 'steps': 27543, 'loss/train': 0.8239241242408752} -11/07/2021 01:05:12 - INFO - __main__ - Step 27545: {'lr': 0.0004641410502446442, 'samples': 5288640, 'steps': 27544, 'loss/train': 1.446048378944397} -11/07/2021 01:05:12 - INFO - __main__ - Step 27546: {'lr': 0.00046413831170153785, 'samples': 5288832, 'steps': 27545, 'loss/train': 1.452160358428955} -11/07/2021 01:05:13 - INFO - __main__ - Step 27547: {'lr': 0.0004641355730619442, 'samples': 5289024, 'steps': 27546, 'loss/train': 1.589703917503357} -11/07/2021 01:05:13 - INFO - __main__ - Step 27548: {'lr': 0.0004641328343258643, 'samples': 5289216, 'steps': 27547, 'loss/train': 1.2328104972839355} -11/07/2021 01:05:13 - INFO - __main__ - Step 27549: {'lr': 0.00046413009549329946, 'samples': 5289408, 'steps': 27548, 'loss/train': 1.5615376234054565} -11/07/2021 01:05:15 - INFO - __main__ - Step 27550: {'lr': 0.0004641273565642509, 'samples': 5289600, 'steps': 27549, 'loss/train': 1.6135731935501099} -11/07/2021 01:05:15 - INFO - __main__ - Step 27551: {'lr': 0.0004641246175387198, 'samples': 5289792, 'steps': 27550, 'loss/train': 1.5954854488372803} -11/07/2021 01:05:15 - INFO - __main__ - Step 27552: {'lr': 0.0004641218784167075, 'samples': 5289984, 'steps': 27551, 'loss/train': 1.8309478759765625} -11/07/2021 01:05:16 - INFO - __main__ - Step 27553: {'lr': 0.0004641191391982152, 'samples': 5290176, 'steps': 27552, 'loss/train': 1.3916101455688477} -11/07/2021 01:05:16 - INFO - __main__ - Step 27554: {'lr': 0.00046411639988324407, 'samples': 5290368, 'steps': 27553, 'loss/train': 1.8725727796554565} -11/07/2021 01:05:17 - INFO - __main__ - Step 27555: {'lr': 0.00046411366047179547, 'samples': 5290560, 'steps': 27554, 'loss/train': 1.6179206371307373} -11/07/2021 01:05:17 - INFO - __main__ - Step 27556: {'lr': 0.00046411092096387054, 'samples': 5290752, 'steps': 27555, 'loss/train': 1.7249908447265625} -11/07/2021 01:05:18 - INFO - __main__ - Step 27557: {'lr': 0.0004641081813594705, 'samples': 5290944, 'steps': 27556, 'loss/train': 1.6517274379730225} -11/07/2021 01:05:18 - INFO - __main__ - Step 27558: {'lr': 0.0004641054416585966, 'samples': 5291136, 'steps': 27557, 'loss/train': 1.313826084136963} -11/07/2021 01:05:18 - INFO - __main__ - Step 27559: {'lr': 0.00046410270186125014, 'samples': 5291328, 'steps': 27558, 'loss/train': 1.542672038078308} -11/07/2021 01:05:21 - INFO - __main__ - Step 27560: {'lr': 0.0004640999619674323, 'samples': 5291520, 'steps': 27559, 'loss/train': 1.4132981300354004} -11/07/2021 01:05:21 - INFO - __main__ - Step 27561: {'lr': 0.0004640972219771443, 'samples': 5291712, 'steps': 27560, 'loss/train': 1.1761044263839722} -11/07/2021 01:05:22 - INFO - __main__ - Step 27562: {'lr': 0.00046409448189038737, 'samples': 5291904, 'steps': 27561, 'loss/train': 0.558796226978302} -11/07/2021 01:05:22 - INFO - __main__ - Step 27563: {'lr': 0.00046409174170716284, 'samples': 5292096, 'steps': 27562, 'loss/train': 1.4939899444580078} -11/07/2021 01:05:22 - INFO - __main__ - Step 27564: {'lr': 0.0004640890014274718, 'samples': 5292288, 'steps': 27563, 'loss/train': 1.3283414840698242} -11/07/2021 01:05:23 - INFO - __main__ - Step 27565: {'lr': 0.0004640862610513156, 'samples': 5292480, 'steps': 27564, 'loss/train': 2.123770236968994} -11/07/2021 01:05:23 - INFO - __main__ - Step 27566: {'lr': 0.00046408352057869545, 'samples': 5292672, 'steps': 27565, 'loss/train': 1.8661320209503174} -11/07/2021 01:05:23 - INFO - __main__ - Step 27567: {'lr': 0.0004640807800096126, 'samples': 5292864, 'steps': 27566, 'loss/train': 1.7928009033203125} -11/07/2021 01:05:24 - INFO - __main__ - Step 27568: {'lr': 0.0004640780393440682, 'samples': 5293056, 'steps': 27567, 'loss/train': 1.7955752611160278} -11/07/2021 01:05:25 - INFO - __main__ - Step 27569: {'lr': 0.0004640752985820635, 'samples': 5293248, 'steps': 27568, 'loss/train': 1.5294089317321777} -11/07/2021 01:05:25 - INFO - __main__ - Step 27570: {'lr': 0.0004640725577235998, 'samples': 5293440, 'steps': 27569, 'loss/train': 1.3322672843933105} -11/07/2021 01:05:25 - INFO - __main__ - Step 27571: {'lr': 0.00046406981676867836, 'samples': 5293632, 'steps': 27570, 'loss/train': 1.7561861276626587} -11/07/2021 01:05:26 - INFO - __main__ - Step 27572: {'lr': 0.00046406707571730035, 'samples': 5293824, 'steps': 27571, 'loss/train': 2.1232874393463135} -11/07/2021 01:05:26 - INFO - __main__ - Step 27573: {'lr': 0.000464064334569467, 'samples': 5294016, 'steps': 27572, 'loss/train': 1.5122051239013672} -11/07/2021 01:05:27 - INFO - __main__ - Step 27574: {'lr': 0.00046406159332517956, 'samples': 5294208, 'steps': 27573, 'loss/train': 0.921796977519989} -11/07/2021 01:05:28 - INFO - __main__ - Step 27575: {'lr': 0.00046405885198443926, 'samples': 5294400, 'steps': 27574, 'loss/train': 1.4629522562026978} -11/07/2021 01:05:28 - INFO - __main__ - Step 27576: {'lr': 0.00046405611054724737, 'samples': 5294592, 'steps': 27575, 'loss/train': 1.4078749418258667} -11/07/2021 01:05:28 - INFO - __main__ - Step 27577: {'lr': 0.00046405336901360507, 'samples': 5294784, 'steps': 27576, 'loss/train': 1.6363303661346436} -11/07/2021 01:05:29 - INFO - __main__ - Step 27578: {'lr': 0.00046405062738351366, 'samples': 5294976, 'steps': 27577, 'loss/train': 1.8103362321853638} -11/07/2021 01:05:30 - INFO - __main__ - Step 27579: {'lr': 0.00046404788565697434, 'samples': 5295168, 'steps': 27578, 'loss/train': 1.8461319208145142} -11/07/2021 01:05:30 - INFO - __main__ - Step 27580: {'lr': 0.00046404514383398835, 'samples': 5295360, 'steps': 27579, 'loss/train': 1.24917471408844} -11/07/2021 01:05:30 - INFO - __main__ - Step 27581: {'lr': 0.0004640424019145568, 'samples': 5295552, 'steps': 27580, 'loss/train': 1.6586353778839111} -11/07/2021 01:05:31 - INFO - __main__ - Step 27582: {'lr': 0.00046403965989868124, 'samples': 5295744, 'steps': 27581, 'loss/train': 1.3456676006317139} -11/07/2021 01:05:31 - INFO - __main__ - Step 27583: {'lr': 0.0004640369177863626, 'samples': 5295936, 'steps': 27582, 'loss/train': 1.9105370044708252} -11/07/2021 01:05:32 - INFO - __main__ - Step 27584: {'lr': 0.00046403417557760226, 'samples': 5296128, 'steps': 27583, 'loss/train': 1.5361580848693848} -11/07/2021 01:05:32 - INFO - __main__ - Step 27585: {'lr': 0.00046403143327240136, 'samples': 5296320, 'steps': 27584, 'loss/train': 1.2893943786621094} -11/07/2021 01:05:33 - INFO - __main__ - Step 27586: {'lr': 0.00046402869087076127, 'samples': 5296512, 'steps': 27585, 'loss/train': 1.3101916313171387} -11/07/2021 01:05:33 - INFO - __main__ - Step 27587: {'lr': 0.00046402594837268314, 'samples': 5296704, 'steps': 27586, 'loss/train': 1.1525654792785645} -11/07/2021 01:05:33 - INFO - __main__ - Step 27588: {'lr': 0.0004640232057781682, 'samples': 5296896, 'steps': 27587, 'loss/train': 1.3633612394332886} -11/07/2021 01:05:35 - INFO - __main__ - Step 27589: {'lr': 0.00046402046308721776, 'samples': 5297088, 'steps': 27588, 'loss/train': 1.827514886856079} -11/07/2021 01:05:35 - INFO - __main__ - Step 27590: {'lr': 0.0004640177202998329, 'samples': 5297280, 'steps': 27589, 'loss/train': 1.6969636678695679} -11/07/2021 01:05:35 - INFO - __main__ - Step 27591: {'lr': 0.00046401497741601505, 'samples': 5297472, 'steps': 27590, 'loss/train': 1.3765476942062378} -11/07/2021 01:05:36 - INFO - __main__ - Step 27592: {'lr': 0.00046401223443576537, 'samples': 5297664, 'steps': 27591, 'loss/train': 1.5166794061660767} -11/07/2021 01:05:36 - INFO - __main__ - Step 27593: {'lr': 0.00046400949135908497, 'samples': 5297856, 'steps': 27592, 'loss/train': 1.599624514579773} -11/07/2021 01:05:37 - INFO - __main__ - Step 27594: {'lr': 0.0004640067481859753, 'samples': 5298048, 'steps': 27593, 'loss/train': 1.871532917022705} -11/07/2021 01:05:37 - INFO - __main__ - Step 27595: {'lr': 0.00046400400491643744, 'samples': 5298240, 'steps': 27594, 'loss/train': 1.5986907482147217} -11/07/2021 01:05:38 - INFO - __main__ - Step 27596: {'lr': 0.00046400126155047265, 'samples': 5298432, 'steps': 27595, 'loss/train': 0.5922433733940125} -11/07/2021 01:05:38 - INFO - __main__ - Step 27597: {'lr': 0.0004639985180880822, 'samples': 5298624, 'steps': 27596, 'loss/train': 1.390427827835083} -11/07/2021 01:05:38 - INFO - __main__ - Step 27598: {'lr': 0.0004639957745292674, 'samples': 5298816, 'steps': 27597, 'loss/train': 1.2177232503890991} -11/07/2021 01:05:40 - INFO - __main__ - Step 27599: {'lr': 0.00046399303087402935, 'samples': 5299008, 'steps': 27598, 'loss/train': 1.1444631814956665} -11/07/2021 01:05:40 - INFO - __main__ - Step 27600: {'lr': 0.00046399028712236935, 'samples': 5299200, 'steps': 27599, 'loss/train': 0.8689119815826416} -11/07/2021 01:05:40 - INFO - __main__ - Step 27601: {'lr': 0.0004639875432742886, 'samples': 5299392, 'steps': 27600, 'loss/train': 1.5241239070892334} -11/07/2021 01:05:41 - INFO - __main__ - Step 27602: {'lr': 0.0004639847993297884, 'samples': 5299584, 'steps': 27601, 'loss/train': 1.5791829824447632} -11/07/2021 01:05:41 - INFO - __main__ - Step 27603: {'lr': 0.00046398205528886994, 'samples': 5299776, 'steps': 27602, 'loss/train': 0.9915977120399475} -11/07/2021 01:05:42 - INFO - __main__ - Step 27604: {'lr': 0.00046397931115153444, 'samples': 5299968, 'steps': 27603, 'loss/train': 1.067671775817871} -11/07/2021 01:05:42 - INFO - __main__ - Step 27605: {'lr': 0.0004639765669177833, 'samples': 5300160, 'steps': 27604, 'loss/train': 1.4505391120910645} -11/07/2021 01:05:43 - INFO - __main__ - Step 27606: {'lr': 0.00046397382258761744, 'samples': 5300352, 'steps': 27605, 'loss/train': 1.1855945587158203} -11/07/2021 01:05:43 - INFO - __main__ - Step 27607: {'lr': 0.0004639710781610384, 'samples': 5300544, 'steps': 27606, 'loss/train': 0.813217043876648} -11/07/2021 01:05:43 - INFO - __main__ - Step 27608: {'lr': 0.00046396833363804724, 'samples': 5300736, 'steps': 27607, 'loss/train': 1.563719391822815} -11/07/2021 01:05:44 - INFO - __main__ - Step 27609: {'lr': 0.00046396558901864527, 'samples': 5300928, 'steps': 27608, 'loss/train': 0.7621616125106812} -11/07/2021 01:05:45 - INFO - __main__ - Step 27610: {'lr': 0.0004639628443028337, 'samples': 5301120, 'steps': 27609, 'loss/train': 1.638516902923584} -11/07/2021 01:05:45 - INFO - __main__ - Step 27611: {'lr': 0.0004639600994906138, 'samples': 5301312, 'steps': 27610, 'loss/train': 1.7831859588623047} -11/07/2021 01:05:46 - INFO - __main__ - Step 27612: {'lr': 0.00046395735458198674, 'samples': 5301504, 'steps': 27611, 'loss/train': 2.2419371604919434} -11/07/2021 01:05:46 - INFO - __main__ - Step 27613: {'lr': 0.0004639546095769538, 'samples': 5301696, 'steps': 27612, 'loss/train': 1.0362420082092285} -11/07/2021 01:05:46 - INFO - __main__ - Step 27614: {'lr': 0.00046395186447551617, 'samples': 5301888, 'steps': 27613, 'loss/train': 1.3505686521530151} -11/07/2021 01:05:47 - INFO - __main__ - Step 27615: {'lr': 0.00046394911927767526, 'samples': 5302080, 'steps': 27614, 'loss/train': 1.3175309896469116} -11/07/2021 01:05:48 - INFO - __main__ - Step 27616: {'lr': 0.0004639463739834321, 'samples': 5302272, 'steps': 27615, 'loss/train': 1.468790054321289} -11/07/2021 01:05:48 - INFO - __main__ - Step 27617: {'lr': 0.00046394362859278793, 'samples': 5302464, 'steps': 27616, 'loss/train': 1.662192702293396} -11/07/2021 01:05:48 - INFO - __main__ - Step 27618: {'lr': 0.00046394088310574416, 'samples': 5302656, 'steps': 27617, 'loss/train': 1.2508586645126343} -11/07/2021 01:05:49 - INFO - __main__ - Step 27619: {'lr': 0.000463938137522302, 'samples': 5302848, 'steps': 27618, 'loss/train': 1.403387188911438} -11/07/2021 01:05:50 - INFO - __main__ - Step 27620: {'lr': 0.00046393539184246246, 'samples': 5303040, 'steps': 27619, 'loss/train': 1.3286373615264893} -11/07/2021 01:05:50 - INFO - __main__ - Step 27621: {'lr': 0.000463932646066227, 'samples': 5303232, 'steps': 27620, 'loss/train': 1.2126948833465576} -11/07/2021 01:05:50 - INFO - __main__ - Step 27622: {'lr': 0.0004639299001935968, 'samples': 5303424, 'steps': 27621, 'loss/train': 1.6715281009674072} -11/07/2021 01:05:51 - INFO - __main__ - Step 27623: {'lr': 0.0004639271542245731, 'samples': 5303616, 'steps': 27622, 'loss/train': 1.7359400987625122} -11/07/2021 01:05:51 - INFO - __main__ - Step 27624: {'lr': 0.000463924408159157, 'samples': 5303808, 'steps': 27623, 'loss/train': 1.3238176107406616} -11/07/2021 01:05:52 - INFO - __main__ - Step 27625: {'lr': 0.00046392166199735, 'samples': 5304000, 'steps': 27624, 'loss/train': 1.7469561100006104} -11/07/2021 01:05:53 - INFO - __main__ - Step 27626: {'lr': 0.00046391891573915325, 'samples': 5304192, 'steps': 27625, 'loss/train': 1.4644496440887451} -11/07/2021 01:05:53 - INFO - __main__ - Step 27627: {'lr': 0.0004639161693845678, 'samples': 5304384, 'steps': 27626, 'loss/train': 1.8536758422851562} -11/07/2021 01:05:53 - INFO - __main__ - Step 27628: {'lr': 0.0004639134229335951, 'samples': 5304576, 'steps': 27627, 'loss/train': 1.0943701267242432} -11/07/2021 01:05:54 - INFO - __main__ - Step 27629: {'lr': 0.0004639106763862363, 'samples': 5304768, 'steps': 27628, 'loss/train': 1.6058448553085327} -11/07/2021 01:05:55 - INFO - __main__ - Step 27630: {'lr': 0.00046390792974249263, 'samples': 5304960, 'steps': 27629, 'loss/train': 1.5895884037017822} -11/07/2021 01:05:55 - INFO - __main__ - Step 27631: {'lr': 0.00046390518300236535, 'samples': 5305152, 'steps': 27630, 'loss/train': 1.5727344751358032} -11/07/2021 01:05:55 - INFO - __main__ - Step 27632: {'lr': 0.0004639024361658557, 'samples': 5305344, 'steps': 27631, 'loss/train': 1.2182259559631348} -11/07/2021 01:05:56 - INFO - __main__ - Step 27633: {'lr': 0.00046389968923296496, 'samples': 5305536, 'steps': 27632, 'loss/train': 2.014322519302368} -11/07/2021 01:05:56 - INFO - __main__ - Step 27634: {'lr': 0.0004638969422036943, 'samples': 5305728, 'steps': 27633, 'loss/train': 1.4085277318954468} -11/07/2021 01:05:57 - INFO - __main__ - Step 27635: {'lr': 0.00046389419507804493, 'samples': 5305920, 'steps': 27634, 'loss/train': 1.580593466758728} -11/07/2021 01:05:57 - INFO - __main__ - Step 27636: {'lr': 0.00046389144785601813, 'samples': 5306112, 'steps': 27635, 'loss/train': 1.948710560798645} -11/07/2021 01:05:58 - INFO - __main__ - Step 27637: {'lr': 0.0004638887005376152, 'samples': 5306304, 'steps': 27636, 'loss/train': 1.4450467824935913} -11/07/2021 01:05:58 - INFO - __main__ - Step 27638: {'lr': 0.0004638859531228373, 'samples': 5306496, 'steps': 27637, 'loss/train': 1.8315891027450562} -11/07/2021 01:05:58 - INFO - __main__ - Step 27639: {'lr': 0.00046388320561168567, 'samples': 5306688, 'steps': 27638, 'loss/train': 1.0632545948028564} -11/07/2021 01:06:00 - INFO - __main__ - Step 27640: {'lr': 0.00046388045800416157, 'samples': 5306880, 'steps': 27639, 'loss/train': 1.5780152082443237} -11/07/2021 01:06:00 - INFO - __main__ - Step 27641: {'lr': 0.00046387771030026627, 'samples': 5307072, 'steps': 27640, 'loss/train': 1.3077924251556396} -11/07/2021 01:06:00 - INFO - __main__ - Step 27642: {'lr': 0.00046387496250000095, 'samples': 5307264, 'steps': 27641, 'loss/train': 1.3584179878234863} -11/07/2021 01:06:01 - INFO - __main__ - Step 27643: {'lr': 0.0004638722146033669, 'samples': 5307456, 'steps': 27642, 'loss/train': 1.375866174697876} -11/07/2021 01:06:01 - INFO - __main__ - Step 27644: {'lr': 0.0004638694666103653, 'samples': 5307648, 'steps': 27643, 'loss/train': 1.599300742149353} -11/07/2021 01:06:02 - INFO - __main__ - Step 27645: {'lr': 0.00046386671852099743, 'samples': 5307840, 'steps': 27644, 'loss/train': 1.7007393836975098} -11/07/2021 01:06:02 - INFO - __main__ - Step 27646: {'lr': 0.0004638639703352645, 'samples': 5308032, 'steps': 27645, 'loss/train': 1.2627149820327759} -11/07/2021 01:06:03 - INFO - __main__ - Step 27647: {'lr': 0.00046386122205316783, 'samples': 5308224, 'steps': 27646, 'loss/train': 1.877655029296875} -11/07/2021 01:06:03 - INFO - __main__ - Step 27648: {'lr': 0.0004638584736747085, 'samples': 5308416, 'steps': 27647, 'loss/train': 1.1750167608261108} -11/07/2021 01:06:03 - INFO - __main__ - Step 27649: {'lr': 0.00046385572519988793, 'samples': 5308608, 'steps': 27648, 'loss/train': 1.7251285314559937} -11/07/2021 01:06:04 - INFO - __main__ - Step 27650: {'lr': 0.00046385297662870716, 'samples': 5308800, 'steps': 27649, 'loss/train': 1.1966801881790161} -11/07/2021 01:06:05 - INFO - __main__ - Step 27651: {'lr': 0.00046385022796116766, 'samples': 5308992, 'steps': 27650, 'loss/train': 1.1399863958358765} -11/07/2021 01:06:05 - INFO - __main__ - Step 27652: {'lr': 0.0004638474791972705, 'samples': 5309184, 'steps': 27651, 'loss/train': 1.7064568996429443} -11/07/2021 01:06:06 - INFO - __main__ - Step 27653: {'lr': 0.000463844730337017, 'samples': 5309376, 'steps': 27652, 'loss/train': 1.5111110210418701} -11/07/2021 01:06:06 - INFO - __main__ - Step 27654: {'lr': 0.00046384198138040825, 'samples': 5309568, 'steps': 27653, 'loss/train': 1.664940595626831} -11/07/2021 01:06:06 - INFO - __main__ - Step 27655: {'lr': 0.00046383923232744565, 'samples': 5309760, 'steps': 27654, 'loss/train': 1.659050464630127} -11/07/2021 01:06:07 - INFO - __main__ - Step 27656: {'lr': 0.00046383648317813045, 'samples': 5309952, 'steps': 27655, 'loss/train': 1.68919837474823} -11/07/2021 01:06:08 - INFO - __main__ - Step 27657: {'lr': 0.0004638337339324638, 'samples': 5310144, 'steps': 27656, 'loss/train': 1.3775867223739624} -11/07/2021 01:06:08 - INFO - __main__ - Step 27658: {'lr': 0.00046383098459044697, 'samples': 5310336, 'steps': 27657, 'loss/train': 1.3585413694381714} -11/07/2021 01:06:08 - INFO - __main__ - Step 27659: {'lr': 0.0004638282351520812, 'samples': 5310528, 'steps': 27658, 'loss/train': 0.984664261341095} -11/07/2021 01:06:09 - INFO - __main__ - Step 27660: {'lr': 0.00046382548561736773, 'samples': 5310720, 'steps': 27659, 'loss/train': 1.7749240398406982} -11/07/2021 01:06:10 - INFO - __main__ - Step 27661: {'lr': 0.0004638227359863078, 'samples': 5310912, 'steps': 27660, 'loss/train': 1.3609564304351807} -11/07/2021 01:06:10 - INFO - __main__ - Step 27662: {'lr': 0.0004638199862589026, 'samples': 5311104, 'steps': 27661, 'loss/train': 1.6411045789718628} -11/07/2021 01:06:10 - INFO - __main__ - Step 27663: {'lr': 0.0004638172364351535, 'samples': 5311296, 'steps': 27662, 'loss/train': 1.0792185068130493} -11/07/2021 01:06:11 - INFO - __main__ - Step 27664: {'lr': 0.00046381448651506153, 'samples': 5311488, 'steps': 27663, 'loss/train': 1.6429427862167358} -11/07/2021 01:06:11 - INFO - __main__ - Step 27665: {'lr': 0.00046381173649862815, 'samples': 5311680, 'steps': 27664, 'loss/train': 1.6976220607757568} -11/07/2021 01:06:12 - INFO - __main__ - Step 27666: {'lr': 0.00046380898638585447, 'samples': 5311872, 'steps': 27665, 'loss/train': 1.4528379440307617} -11/07/2021 01:06:13 - INFO - __main__ - Step 27667: {'lr': 0.0004638062361767418, 'samples': 5312064, 'steps': 27666, 'loss/train': 1.2322639226913452} -11/07/2021 01:06:13 - INFO - __main__ - Step 27668: {'lr': 0.00046380348587129127, 'samples': 5312256, 'steps': 27667, 'loss/train': 1.549231767654419} -11/07/2021 01:06:13 - INFO - __main__ - Step 27669: {'lr': 0.0004638007354695042, 'samples': 5312448, 'steps': 27668, 'loss/train': 1.3693461418151855} -11/07/2021 01:06:14 - INFO - __main__ - Step 27670: {'lr': 0.0004637979849713818, 'samples': 5312640, 'steps': 27669, 'loss/train': 0.9689860343933105} -11/07/2021 01:06:15 - INFO - __main__ - Step 27671: {'lr': 0.0004637952343769254, 'samples': 5312832, 'steps': 27670, 'loss/train': 1.2298322916030884} -11/07/2021 01:06:15 - INFO - __main__ - Step 27672: {'lr': 0.00046379248368613615, 'samples': 5313024, 'steps': 27671, 'loss/train': 1.229887843132019} -11/07/2021 01:06:15 - INFO - __main__ - Step 27673: {'lr': 0.0004637897328990153, 'samples': 5313216, 'steps': 27672, 'loss/train': 1.0177441835403442} -11/07/2021 01:06:16 - INFO - __main__ - Step 27674: {'lr': 0.000463786982015564, 'samples': 5313408, 'steps': 27673, 'loss/train': 1.730981707572937} -11/07/2021 01:06:16 - INFO - __main__ - Step 27675: {'lr': 0.00046378423103578373, 'samples': 5313600, 'steps': 27674, 'loss/train': 1.2419869899749756} -11/07/2021 01:06:17 - INFO - __main__ - Step 27676: {'lr': 0.0004637814799596755, 'samples': 5313792, 'steps': 27675, 'loss/train': 2.1071531772613525} -11/07/2021 01:06:18 - INFO - __main__ - Step 27677: {'lr': 0.00046377872878724066, 'samples': 5313984, 'steps': 27676, 'loss/train': 1.697929859161377} -11/07/2021 01:06:18 - INFO - __main__ - Step 27678: {'lr': 0.0004637759775184804, 'samples': 5314176, 'steps': 27677, 'loss/train': 1.393756628036499} -11/07/2021 01:06:18 - INFO - __main__ - Step 27679: {'lr': 0.000463773226153396, 'samples': 5314368, 'steps': 27678, 'loss/train': 0.9993812441825867} -11/07/2021 01:06:19 - INFO - __main__ - Step 27680: {'lr': 0.00046377047469198875, 'samples': 5314560, 'steps': 27679, 'loss/train': 1.5201777219772339} -11/07/2021 01:06:20 - INFO - __main__ - Step 27681: {'lr': 0.00046376772313425974, 'samples': 5314752, 'steps': 27680, 'loss/train': 1.6973458528518677} -11/07/2021 01:06:20 - INFO - __main__ - Step 27682: {'lr': 0.0004637649714802102, 'samples': 5314944, 'steps': 27681, 'loss/train': 1.1721813678741455} -11/07/2021 01:06:20 - INFO - __main__ - Step 27683: {'lr': 0.0004637622197298417, 'samples': 5315136, 'steps': 27682, 'loss/train': 1.7788022756576538} -11/07/2021 01:06:21 - INFO - __main__ - Step 27684: {'lr': 0.000463759467883155, 'samples': 5315328, 'steps': 27683, 'loss/train': 1.6087898015975952} -11/07/2021 01:06:21 - INFO - __main__ - Step 27685: {'lr': 0.0004637567159401518, 'samples': 5315520, 'steps': 27684, 'loss/train': 1.1776622533798218} -11/07/2021 01:06:23 - INFO - __main__ - Step 27686: {'lr': 0.00046375396390083303, 'samples': 5315712, 'steps': 27685, 'loss/train': 1.6208345890045166} -11/07/2021 01:06:23 - INFO - __main__ - Step 27687: {'lr': 0.0004637512117652, 'samples': 5315904, 'steps': 27686, 'loss/train': 1.5504517555236816} -11/07/2021 01:06:23 - INFO - __main__ - Step 27688: {'lr': 0.00046374845953325394, 'samples': 5316096, 'steps': 27687, 'loss/train': 1.558203935623169} -11/07/2021 01:06:24 - INFO - __main__ - Step 27689: {'lr': 0.0004637457072049962, 'samples': 5316288, 'steps': 27688, 'loss/train': 2.274839162826538} -11/07/2021 01:06:24 - INFO - __main__ - Step 27690: {'lr': 0.0004637429547804279, 'samples': 5316480, 'steps': 27689, 'loss/train': 2.026301383972168} -11/07/2021 01:06:24 - INFO - __main__ - Step 27691: {'lr': 0.0004637402022595503, 'samples': 5316672, 'steps': 27690, 'loss/train': 1.0505366325378418} -11/07/2021 01:06:25 - INFO - __main__ - Step 27692: {'lr': 0.0004637374496423647, 'samples': 5316864, 'steps': 27691, 'loss/train': 1.7772705554962158} -11/07/2021 01:06:26 - INFO - __main__ - Step 27693: {'lr': 0.0004637346969288723, 'samples': 5317056, 'steps': 27692, 'loss/train': 0.7610371708869934} -11/07/2021 01:06:26 - INFO - __main__ - Step 27694: {'lr': 0.0004637319441190743, 'samples': 5317248, 'steps': 27693, 'loss/train': 0.8985799551010132} -11/07/2021 01:06:26 - INFO - __main__ - Step 27695: {'lr': 0.00046372919121297207, 'samples': 5317440, 'steps': 27694, 'loss/train': 1.4711743593215942} -11/07/2021 01:06:27 - INFO - __main__ - Step 27696: {'lr': 0.0004637264382105667, 'samples': 5317632, 'steps': 27695, 'loss/train': 1.6593880653381348} -11/07/2021 01:06:28 - INFO - __main__ - Step 27697: {'lr': 0.00046372368511185953, 'samples': 5317824, 'steps': 27696, 'loss/train': 1.6002044677734375} -11/07/2021 01:06:28 - INFO - __main__ - Step 27698: {'lr': 0.0004637209319168517, 'samples': 5318016, 'steps': 27697, 'loss/train': 1.400031566619873} -11/07/2021 01:06:29 - INFO - __main__ - Step 27699: {'lr': 0.0004637181786255446, 'samples': 5318208, 'steps': 27698, 'loss/train': 1.4328306913375854} -11/07/2021 01:06:29 - INFO - __main__ - Step 27700: {'lr': 0.0004637154252379394, 'samples': 5318400, 'steps': 27699, 'loss/train': 1.6177538633346558} -11/07/2021 01:06:29 - INFO - __main__ - Step 27701: {'lr': 0.00046371267175403724, 'samples': 5318592, 'steps': 27700, 'loss/train': 1.7811652421951294} -11/07/2021 01:06:31 - INFO - __main__ - Step 27702: {'lr': 0.0004637099181738395, 'samples': 5318784, 'steps': 27701, 'loss/train': 1.770586371421814} -11/07/2021 01:06:32 - INFO - __main__ - Step 27703: {'lr': 0.00046370716449734733, 'samples': 5318976, 'steps': 27702, 'loss/train': 1.5121160745620728} -11/07/2021 01:06:32 - INFO - __main__ - Step 27704: {'lr': 0.00046370441072456206, 'samples': 5319168, 'steps': 27703, 'loss/train': 1.7021570205688477} -11/07/2021 01:06:32 - INFO - __main__ - Step 27705: {'lr': 0.00046370165685548484, 'samples': 5319360, 'steps': 27704, 'loss/train': 1.472056269645691} -11/07/2021 01:06:33 - INFO - __main__ - Step 27706: {'lr': 0.00046369890289011696, 'samples': 5319552, 'steps': 27705, 'loss/train': 1.6031389236450195} -11/07/2021 01:06:33 - INFO - __main__ - Step 27707: {'lr': 0.0004636961488284597, 'samples': 5319744, 'steps': 27706, 'loss/train': 1.5327539443969727} -11/07/2021 01:06:33 - INFO - __main__ - Step 27708: {'lr': 0.0004636933946705142, 'samples': 5319936, 'steps': 27707, 'loss/train': 0.7630791664123535} -11/07/2021 01:06:34 - INFO - __main__ - Step 27709: {'lr': 0.00046369064041628175, 'samples': 5320128, 'steps': 27708, 'loss/train': 0.810263991355896} -11/07/2021 01:06:35 - INFO - __main__ - Step 27710: {'lr': 0.00046368788606576363, 'samples': 5320320, 'steps': 27709, 'loss/train': 1.462875247001648} -11/07/2021 01:06:35 - INFO - __main__ - Step 27711: {'lr': 0.00046368513161896104, 'samples': 5320512, 'steps': 27710, 'loss/train': 1.803904414176941} -11/07/2021 01:06:36 - INFO - __main__ - Step 27712: {'lr': 0.0004636823770758752, 'samples': 5320704, 'steps': 27711, 'loss/train': 2.0148212909698486} -11/07/2021 01:06:36 - INFO - __main__ - Step 27713: {'lr': 0.0004636796224365074, 'samples': 5320896, 'steps': 27712, 'loss/train': 1.991600751876831} -11/07/2021 01:06:37 - INFO - __main__ - Step 27714: {'lr': 0.0004636768677008588, 'samples': 5321088, 'steps': 27713, 'loss/train': 1.4234155416488647} -11/07/2021 01:06:37 - INFO - __main__ - Step 27715: {'lr': 0.0004636741128689308, 'samples': 5321280, 'steps': 27714, 'loss/train': 2.0229625701904297} -11/07/2021 01:06:38 - INFO - __main__ - Step 27716: {'lr': 0.00046367135794072445, 'samples': 5321472, 'steps': 27715, 'loss/train': 1.2980085611343384} -11/07/2021 01:06:38 - INFO - __main__ - Step 27717: {'lr': 0.0004636686029162411, 'samples': 5321664, 'steps': 27716, 'loss/train': 1.2549235820770264} -11/07/2021 01:06:38 - INFO - __main__ - Step 27718: {'lr': 0.000463665847795482, 'samples': 5321856, 'steps': 27717, 'loss/train': 1.4861565828323364} -11/07/2021 01:06:39 - INFO - __main__ - Step 27719: {'lr': 0.0004636630925784484, 'samples': 5322048, 'steps': 27718, 'loss/train': 1.936221957206726} -11/07/2021 01:06:40 - INFO - __main__ - Step 27720: {'lr': 0.0004636603372651415, 'samples': 5322240, 'steps': 27719, 'loss/train': 1.259960412979126} -11/07/2021 01:06:40 - INFO - __main__ - Step 27721: {'lr': 0.0004636575818555625, 'samples': 5322432, 'steps': 27720, 'loss/train': 1.568810224533081} -11/07/2021 01:06:40 - INFO - __main__ - Step 27722: {'lr': 0.00046365482634971275, 'samples': 5322624, 'steps': 27721, 'loss/train': 1.6244637966156006} -11/07/2021 01:06:41 - INFO - __main__ - Step 27723: {'lr': 0.00046365207074759344, 'samples': 5322816, 'steps': 27722, 'loss/train': 1.82841157913208} -11/07/2021 01:06:41 - INFO - __main__ - Step 27724: {'lr': 0.0004636493150492057, 'samples': 5323008, 'steps': 27723, 'loss/train': 0.8045539855957031} -11/07/2021 01:06:42 - INFO - __main__ - Step 27725: {'lr': 0.00046364655925455094, 'samples': 5323200, 'steps': 27724, 'loss/train': 1.3680577278137207} -11/07/2021 01:06:43 - INFO - __main__ - Step 27726: {'lr': 0.0004636438033636303, 'samples': 5323392, 'steps': 27725, 'loss/train': 1.5489109754562378} -11/07/2021 01:06:43 - INFO - __main__ - Step 27727: {'lr': 0.00046364104737644515, 'samples': 5323584, 'steps': 27726, 'loss/train': 1.6654754877090454} -11/07/2021 01:06:43 - INFO - __main__ - Step 27728: {'lr': 0.00046363829129299655, 'samples': 5323776, 'steps': 27727, 'loss/train': 1.5989880561828613} -11/07/2021 01:06:44 - INFO - __main__ - Step 27729: {'lr': 0.0004636355351132859, 'samples': 5323968, 'steps': 27728, 'loss/train': 1.1280689239501953} -11/07/2021 01:06:45 - INFO - __main__ - Step 27730: {'lr': 0.00046363277883731437, 'samples': 5324160, 'steps': 27729, 'loss/train': 1.599190354347229} -11/07/2021 01:06:45 - INFO - __main__ - Step 27731: {'lr': 0.0004636300224650831, 'samples': 5324352, 'steps': 27730, 'loss/train': 1.2962560653686523} -11/07/2021 01:06:45 - INFO - __main__ - Step 27732: {'lr': 0.00046362726599659355, 'samples': 5324544, 'steps': 27731, 'loss/train': 1.2981113195419312} -11/07/2021 01:06:46 - INFO - __main__ - Step 27733: {'lr': 0.0004636245094318468, 'samples': 5324736, 'steps': 27732, 'loss/train': 1.5841000080108643} -11/07/2021 01:06:46 - INFO - __main__ - Step 27734: {'lr': 0.0004636217527708442, 'samples': 5324928, 'steps': 27733, 'loss/train': 1.590748906135559} -11/07/2021 01:06:47 - INFO - __main__ - Step 27735: {'lr': 0.0004636189960135869, 'samples': 5325120, 'steps': 27734, 'loss/train': 1.6335985660552979} -11/07/2021 01:06:48 - INFO - __main__ - Step 27736: {'lr': 0.0004636162391600761, 'samples': 5325312, 'steps': 27735, 'loss/train': 1.3171145915985107} -11/07/2021 01:06:48 - INFO - __main__ - Step 27737: {'lr': 0.00046361348221031316, 'samples': 5325504, 'steps': 27736, 'loss/train': 1.492238998413086} -11/07/2021 01:06:48 - INFO - __main__ - Step 27738: {'lr': 0.00046361072516429936, 'samples': 5325696, 'steps': 27737, 'loss/train': 1.0480579137802124} -11/07/2021 01:06:49 - INFO - __main__ - Step 27739: {'lr': 0.0004636079680220358, 'samples': 5325888, 'steps': 27738, 'loss/train': 1.7593157291412354} -11/07/2021 01:06:50 - INFO - __main__ - Step 27740: {'lr': 0.0004636052107835238, 'samples': 5326080, 'steps': 27739, 'loss/train': 1.6487047672271729} -11/07/2021 01:06:50 - INFO - __main__ - Step 27741: {'lr': 0.0004636024534487646, 'samples': 5326272, 'steps': 27740, 'loss/train': 1.5217450857162476} -11/07/2021 01:06:51 - INFO - __main__ - Step 27742: {'lr': 0.0004635996960177594, 'samples': 5326464, 'steps': 27741, 'loss/train': 1.5599013566970825} -11/07/2021 01:06:51 - INFO - __main__ - Step 27743: {'lr': 0.0004635969384905095, 'samples': 5326656, 'steps': 27742, 'loss/train': 1.571807622909546} -11/07/2021 01:06:51 - INFO - __main__ - Step 27744: {'lr': 0.0004635941808670161, 'samples': 5326848, 'steps': 27743, 'loss/train': 1.3286199569702148} -11/07/2021 01:06:52 - INFO - __main__ - Step 27745: {'lr': 0.00046359142314728047, 'samples': 5327040, 'steps': 27744, 'loss/train': 1.714626431465149} -11/07/2021 01:06:53 - INFO - __main__ - Step 27746: {'lr': 0.00046358866533130385, 'samples': 5327232, 'steps': 27745, 'loss/train': 1.262636423110962} -11/07/2021 01:06:53 - INFO - __main__ - Step 27747: {'lr': 0.00046358590741908744, 'samples': 5327424, 'steps': 27746, 'loss/train': 1.909021258354187} -11/07/2021 01:06:53 - INFO - __main__ - Step 27748: {'lr': 0.0004635831494106325, 'samples': 5327616, 'steps': 27747, 'loss/train': 1.4999247789382935} -11/07/2021 01:06:54 - INFO - __main__ - Step 27749: {'lr': 0.0004635803913059404, 'samples': 5327808, 'steps': 27748, 'loss/train': 1.1166845560073853} -11/07/2021 01:06:54 - INFO - __main__ - Step 27750: {'lr': 0.00046357763310501216, 'samples': 5328000, 'steps': 27749, 'loss/train': 1.756516456604004} -11/07/2021 01:06:55 - INFO - __main__ - Step 27751: {'lr': 0.0004635748748078492, 'samples': 5328192, 'steps': 27750, 'loss/train': 1.2605432271957397} -11/07/2021 01:06:55 - INFO - __main__ - Step 27752: {'lr': 0.0004635721164144526, 'samples': 5328384, 'steps': 27751, 'loss/train': 1.455724835395813} -11/07/2021 01:06:56 - INFO - __main__ - Step 27753: {'lr': 0.0004635693579248238, 'samples': 5328576, 'steps': 27752, 'loss/train': 1.5267298221588135} -11/07/2021 01:06:56 - INFO - __main__ - Step 27754: {'lr': 0.00046356659933896393, 'samples': 5328768, 'steps': 27753, 'loss/train': 1.2926586866378784} -11/07/2021 01:06:56 - INFO - __main__ - Step 27755: {'lr': 0.0004635638406568742, 'samples': 5328960, 'steps': 27754, 'loss/train': 1.6973003149032593} -11/07/2021 01:06:57 - INFO - __main__ - Step 27756: {'lr': 0.00046356108187855594, 'samples': 5329152, 'steps': 27755, 'loss/train': 1.769636869430542} -11/07/2021 01:06:58 - INFO - __main__ - Step 27757: {'lr': 0.00046355832300401035, 'samples': 5329344, 'steps': 27756, 'loss/train': 1.4013556241989136} -11/07/2021 01:06:58 - INFO - __main__ - Step 27758: {'lr': 0.0004635555640332386, 'samples': 5329536, 'steps': 27757, 'loss/train': 1.6594982147216797} -11/07/2021 01:06:59 - INFO - __main__ - Step 27759: {'lr': 0.0004635528049662421, 'samples': 5329728, 'steps': 27758, 'loss/train': 1.3016235828399658} -11/07/2021 01:06:59 - INFO - __main__ - Step 27760: {'lr': 0.000463550045803022, 'samples': 5329920, 'steps': 27759, 'loss/train': 1.2639565467834473} -11/07/2021 01:07:00 - INFO - __main__ - Step 27761: {'lr': 0.00046354728654357947, 'samples': 5330112, 'steps': 27760, 'loss/train': 2.085947275161743} -11/07/2021 01:07:01 - INFO - __main__ - Step 27762: {'lr': 0.00046354452718791586, 'samples': 5330304, 'steps': 27761, 'loss/train': 0.21334145963191986} -11/07/2021 01:07:01 - INFO - __main__ - Step 27763: {'lr': 0.0004635417677360324, 'samples': 5330496, 'steps': 27762, 'loss/train': 1.1936448812484741} -11/07/2021 01:07:01 - INFO - __main__ - Step 27764: {'lr': 0.0004635390081879303, 'samples': 5330688, 'steps': 27763, 'loss/train': 1.293779730796814} -11/07/2021 01:07:02 - INFO - __main__ - Step 27765: {'lr': 0.0004635362485436109, 'samples': 5330880, 'steps': 27764, 'loss/train': 1.78763747215271} -11/07/2021 01:07:03 - INFO - __main__ - Step 27766: {'lr': 0.00046353348880307524, 'samples': 5331072, 'steps': 27765, 'loss/train': 1.6645318269729614} -11/07/2021 01:07:03 - INFO - __main__ - Step 27767: {'lr': 0.0004635307289663248, 'samples': 5331264, 'steps': 27766, 'loss/train': 0.7043894529342651} -11/07/2021 01:07:03 - INFO - __main__ - Step 27768: {'lr': 0.0004635279690333606, 'samples': 5331456, 'steps': 27767, 'loss/train': 1.8142160177230835} -11/07/2021 01:07:04 - INFO - __main__ - Step 27769: {'lr': 0.00046352520900418403, 'samples': 5331648, 'steps': 27768, 'loss/train': 1.401672124862671} -11/07/2021 01:07:04 - INFO - __main__ - Step 27770: {'lr': 0.00046352244887879623, 'samples': 5331840, 'steps': 27769, 'loss/train': 1.6772185564041138} -11/07/2021 01:07:05 - INFO - __main__ - Step 27771: {'lr': 0.0004635196886571986, 'samples': 5332032, 'steps': 27770, 'loss/train': 1.560492753982544} -11/07/2021 01:07:06 - INFO - __main__ - Step 27772: {'lr': 0.0004635169283393923, 'samples': 5332224, 'steps': 27771, 'loss/train': 1.3133739233016968} -11/07/2021 01:07:06 - INFO - __main__ - Step 27773: {'lr': 0.0004635141679253785, 'samples': 5332416, 'steps': 27772, 'loss/train': 1.5891863107681274} -11/07/2021 01:07:06 - INFO - __main__ - Step 27774: {'lr': 0.0004635114074151586, 'samples': 5332608, 'steps': 27773, 'loss/train': 1.5065265893936157} -11/07/2021 01:07:07 - INFO - __main__ - Step 27775: {'lr': 0.00046350864680873375, 'samples': 5332800, 'steps': 27774, 'loss/train': 1.1675381660461426} -11/07/2021 01:07:08 - INFO - __main__ - Step 27776: {'lr': 0.0004635058861061051, 'samples': 5332992, 'steps': 27775, 'loss/train': 1.5662585496902466} -11/07/2021 01:07:08 - INFO - __main__ - Step 27777: {'lr': 0.00046350312530727403, 'samples': 5333184, 'steps': 27776, 'loss/train': 1.0655912160873413} -11/07/2021 01:07:08 - INFO - __main__ - Step 27778: {'lr': 0.00046350036441224175, 'samples': 5333376, 'steps': 27777, 'loss/train': 1.738042950630188} -11/07/2021 01:07:09 - INFO - __main__ - Step 27779: {'lr': 0.00046349760342100955, 'samples': 5333568, 'steps': 27778, 'loss/train': 1.7702325582504272} -11/07/2021 01:07:09 - INFO - __main__ - Step 27780: {'lr': 0.00046349484233357854, 'samples': 5333760, 'steps': 27779, 'loss/train': 1.5026328563690186} -11/07/2021 01:07:09 - INFO - __main__ - Step 27781: {'lr': 0.0004634920811499501, 'samples': 5333952, 'steps': 27780, 'loss/train': 1.67792546749115} -11/07/2021 01:07:11 - INFO - __main__ - Step 27782: {'lr': 0.00046348931987012543, 'samples': 5334144, 'steps': 27781, 'loss/train': 0.21696703135967255} -11/07/2021 01:07:11 - INFO - __main__ - Step 27783: {'lr': 0.00046348655849410577, 'samples': 5334336, 'steps': 27782, 'loss/train': 1.6288264989852905} -11/07/2021 01:07:11 - INFO - __main__ - Step 27784: {'lr': 0.0004634837970218924, 'samples': 5334528, 'steps': 27783, 'loss/train': 0.30237165093421936} -11/07/2021 01:07:12 - INFO - __main__ - Step 27785: {'lr': 0.0004634810354534864, 'samples': 5334720, 'steps': 27784, 'loss/train': 1.7129555940628052} -11/07/2021 01:07:12 - INFO - __main__ - Step 27786: {'lr': 0.0004634782737888892, 'samples': 5334912, 'steps': 27785, 'loss/train': 0.9289341568946838} -11/07/2021 01:07:13 - INFO - __main__ - Step 27787: {'lr': 0.000463475512028102, 'samples': 5335104, 'steps': 27786, 'loss/train': 1.6294125318527222} -11/07/2021 01:07:14 - INFO - __main__ - Step 27788: {'lr': 0.000463472750171126, 'samples': 5335296, 'steps': 27787, 'loss/train': 1.5533576011657715} -11/07/2021 01:07:14 - INFO - __main__ - Step 27789: {'lr': 0.0004634699882179625, 'samples': 5335488, 'steps': 27788, 'loss/train': 1.5945382118225098} -11/07/2021 01:07:14 - INFO - __main__ - Step 27790: {'lr': 0.0004634672261686127, 'samples': 5335680, 'steps': 27789, 'loss/train': 1.3665266036987305} -11/07/2021 01:07:15 - INFO - __main__ - Step 27791: {'lr': 0.0004634644640230779, 'samples': 5335872, 'steps': 27790, 'loss/train': 1.4442942142486572} -11/07/2021 01:07:16 - INFO - __main__ - Step 27792: {'lr': 0.0004634617017813593, 'samples': 5336064, 'steps': 27791, 'loss/train': 1.4849623441696167} -11/07/2021 01:07:16 - INFO - __main__ - Step 27793: {'lr': 0.00046345893944345806, 'samples': 5336256, 'steps': 27792, 'loss/train': 1.4545289278030396} -11/07/2021 01:07:16 - INFO - __main__ - Step 27794: {'lr': 0.00046345617700937564, 'samples': 5336448, 'steps': 27793, 'loss/train': 1.5662834644317627} -11/07/2021 01:07:17 - INFO - __main__ - Step 27795: {'lr': 0.0004634534144791131, 'samples': 5336640, 'steps': 27794, 'loss/train': 1.4726775884628296} -11/07/2021 01:07:17 - INFO - __main__ - Step 27796: {'lr': 0.0004634506518526718, 'samples': 5336832, 'steps': 27795, 'loss/train': 1.4754371643066406} -11/07/2021 01:07:18 - INFO - __main__ - Step 27797: {'lr': 0.00046344788913005286, 'samples': 5337024, 'steps': 27796, 'loss/train': 1.5549851655960083} -11/07/2021 01:07:19 - INFO - __main__ - Step 27798: {'lr': 0.00046344512631125756, 'samples': 5337216, 'steps': 27797, 'loss/train': 1.6476571559906006} -11/07/2021 01:07:19 - INFO - __main__ - Step 27799: {'lr': 0.00046344236339628724, 'samples': 5337408, 'steps': 27798, 'loss/train': 1.7478976249694824} -11/07/2021 01:07:19 - INFO - __main__ - Step 27800: {'lr': 0.0004634396003851431, 'samples': 5337600, 'steps': 27799, 'loss/train': 1.513837456703186} -11/07/2021 01:07:20 - INFO - __main__ - Step 27801: {'lr': 0.00046343683727782635, 'samples': 5337792, 'steps': 27800, 'loss/train': 0.918851375579834} -11/07/2021 01:07:21 - INFO - __main__ - Step 27802: {'lr': 0.0004634340740743382, 'samples': 5337984, 'steps': 27801, 'loss/train': 1.074940800666809} -11/07/2021 01:07:21 - INFO - __main__ - Step 27803: {'lr': 0.00046343131077468, 'samples': 5338176, 'steps': 27802, 'loss/train': 1.383703589439392} -11/07/2021 01:07:22 - INFO - __main__ - Step 27804: {'lr': 0.00046342854737885296, 'samples': 5338368, 'steps': 27803, 'loss/train': 0.3601319193840027} -11/07/2021 01:07:22 - INFO - __main__ - Step 27805: {'lr': 0.00046342578388685837, 'samples': 5338560, 'steps': 27804, 'loss/train': 1.6942323446273804} -11/07/2021 01:07:22 - INFO - __main__ - Step 27806: {'lr': 0.0004634230202986973, 'samples': 5338752, 'steps': 27805, 'loss/train': 1.3652087450027466} -11/07/2021 01:07:23 - INFO - __main__ - Step 27807: {'lr': 0.0004634202566143712, 'samples': 5338944, 'steps': 27806, 'loss/train': 1.6079967021942139} -11/07/2021 01:07:23 - INFO - __main__ - Step 27808: {'lr': 0.00046341749283388117, 'samples': 5339136, 'steps': 27807, 'loss/train': 1.3260587453842163} -11/07/2021 01:07:24 - INFO - __main__ - Step 27809: {'lr': 0.0004634147289572285, 'samples': 5339328, 'steps': 27808, 'loss/train': 1.6334463357925415} -11/07/2021 01:07:24 - INFO - __main__ - Step 27810: {'lr': 0.00046341196498441453, 'samples': 5339520, 'steps': 27809, 'loss/train': 1.769137978553772} -11/07/2021 01:07:25 - INFO - __main__ - Step 27811: {'lr': 0.0004634092009154403, 'samples': 5339712, 'steps': 27810, 'loss/train': 1.2536112070083618} -11/07/2021 01:07:25 - INFO - __main__ - Step 27812: {'lr': 0.0004634064367503072, 'samples': 5339904, 'steps': 27811, 'loss/train': 1.5238810777664185} -11/07/2021 01:07:26 - INFO - __main__ - Step 27813: {'lr': 0.00046340367248901655, 'samples': 5340096, 'steps': 27812, 'loss/train': 1.3737224340438843} -11/07/2021 01:07:27 - INFO - __main__ - Step 27814: {'lr': 0.00046340090813156944, 'samples': 5340288, 'steps': 27813, 'loss/train': 1.1866050958633423} -11/07/2021 01:07:27 - INFO - __main__ - Step 27815: {'lr': 0.00046339814367796716, 'samples': 5340480, 'steps': 27814, 'loss/train': 1.5412652492523193} -11/07/2021 01:07:28 - INFO - __main__ - Step 27816: {'lr': 0.00046339537912821094, 'samples': 5340672, 'steps': 27815, 'loss/train': 1.8829264640808105} -11/07/2021 01:07:28 - INFO - __main__ - Step 27817: {'lr': 0.0004633926144823022, 'samples': 5340864, 'steps': 27816, 'loss/train': 1.5201081037521362} -11/07/2021 01:07:28 - INFO - __main__ - Step 27818: {'lr': 0.0004633898497402419, 'samples': 5341056, 'steps': 27817, 'loss/train': 0.9563632607460022} -11/07/2021 01:07:29 - INFO - __main__ - Step 27819: {'lr': 0.0004633870849020314, 'samples': 5341248, 'steps': 27818, 'loss/train': 1.2424542903900146} -11/07/2021 01:07:30 - INFO - __main__ - Step 27820: {'lr': 0.00046338431996767205, 'samples': 5341440, 'steps': 27819, 'loss/train': 1.699521780014038} -11/07/2021 01:07:30 - INFO - __main__ - Step 27821: {'lr': 0.00046338155493716503, 'samples': 5341632, 'steps': 27820, 'loss/train': 1.3380119800567627} -11/07/2021 01:07:30 - INFO - __main__ - Step 27822: {'lr': 0.0004633787898105115, 'samples': 5341824, 'steps': 27821, 'loss/train': 2.1813955307006836} -11/07/2021 01:07:31 - INFO - __main__ - Step 27823: {'lr': 0.0004633760245877129, 'samples': 5342016, 'steps': 27822, 'loss/train': 1.960642695426941} -11/07/2021 01:07:31 - INFO - __main__ - Step 27824: {'lr': 0.0004633732592687703, 'samples': 5342208, 'steps': 27823, 'loss/train': 1.445009469985962} -11/07/2021 01:07:32 - INFO - __main__ - Step 27825: {'lr': 0.00046337049385368495, 'samples': 5342400, 'steps': 27824, 'loss/train': 1.9721317291259766} -11/07/2021 01:07:33 - INFO - __main__ - Step 27826: {'lr': 0.00046336772834245824, 'samples': 5342592, 'steps': 27825, 'loss/train': 1.5805824995040894} -11/07/2021 01:07:33 - INFO - __main__ - Step 27827: {'lr': 0.0004633649627350912, 'samples': 5342784, 'steps': 27826, 'loss/train': 1.6834359169006348} -11/07/2021 01:07:33 - INFO - __main__ - Step 27828: {'lr': 0.00046336219703158526, 'samples': 5342976, 'steps': 27827, 'loss/train': 1.6386125087738037} -11/07/2021 01:07:34 - INFO - __main__ - Step 27829: {'lr': 0.00046335943123194164, 'samples': 5343168, 'steps': 27828, 'loss/train': 1.5754843950271606} -11/07/2021 01:07:35 - INFO - __main__ - Step 27830: {'lr': 0.0004633566653361615, 'samples': 5343360, 'steps': 27829, 'loss/train': 1.437250018119812} -11/07/2021 01:07:35 - INFO - __main__ - Step 27831: {'lr': 0.0004633538993442462, 'samples': 5343552, 'steps': 27830, 'loss/train': 1.7498289346694946} -11/07/2021 01:07:35 - INFO - __main__ - Step 27832: {'lr': 0.00046335113325619685, 'samples': 5343744, 'steps': 27831, 'loss/train': 1.5722873210906982} -11/07/2021 01:07:36 - INFO - __main__ - Step 27833: {'lr': 0.00046334836707201486, 'samples': 5343936, 'steps': 27832, 'loss/train': 1.515210509300232} -11/07/2021 01:07:36 - INFO - __main__ - Step 27834: {'lr': 0.0004633456007917013, 'samples': 5344128, 'steps': 27833, 'loss/train': 1.1740343570709229} -11/07/2021 01:07:37 - INFO - __main__ - Step 27835: {'lr': 0.0004633428344152576, 'samples': 5344320, 'steps': 27834, 'loss/train': 1.6871955394744873} -11/07/2021 01:07:38 - INFO - __main__ - Step 27836: {'lr': 0.0004633400679426848, 'samples': 5344512, 'steps': 27835, 'loss/train': 1.7944591045379639} -11/07/2021 01:07:38 - INFO - __main__ - Step 27837: {'lr': 0.00046333730137398433, 'samples': 5344704, 'steps': 27836, 'loss/train': 1.3786191940307617} -11/07/2021 01:07:38 - INFO - __main__ - Step 27838: {'lr': 0.00046333453470915736, 'samples': 5344896, 'steps': 27837, 'loss/train': 1.5384540557861328} -11/07/2021 01:07:39 - INFO - __main__ - Step 27839: {'lr': 0.0004633317679482051, 'samples': 5345088, 'steps': 27838, 'loss/train': 1.5437536239624023} -11/07/2021 01:07:39 - INFO - __main__ - Step 27840: {'lr': 0.00046332900109112893, 'samples': 5345280, 'steps': 27839, 'loss/train': 1.3671104907989502} -11/07/2021 01:07:40 - INFO - __main__ - Step 27841: {'lr': 0.0004633262341379299, 'samples': 5345472, 'steps': 27840, 'loss/train': 1.2937971353530884} -11/07/2021 01:07:41 - INFO - __main__ - Step 27842: {'lr': 0.0004633234670886094, 'samples': 5345664, 'steps': 27841, 'loss/train': 1.469732642173767} -11/07/2021 01:07:41 - INFO - __main__ - Step 27843: {'lr': 0.0004633206999431686, 'samples': 5345856, 'steps': 27842, 'loss/train': 1.695931077003479} -11/07/2021 01:07:41 - INFO - __main__ - Step 27844: {'lr': 0.00046331793270160885, 'samples': 5346048, 'steps': 27843, 'loss/train': 1.369606614112854} -11/07/2021 01:07:42 - INFO - __main__ - Step 27845: {'lr': 0.0004633151653639314, 'samples': 5346240, 'steps': 27844, 'loss/train': 1.5834770202636719} -11/07/2021 01:07:43 - INFO - __main__ - Step 27846: {'lr': 0.00046331239793013726, 'samples': 5346432, 'steps': 27845, 'loss/train': 1.5611268281936646} -11/07/2021 01:07:43 - INFO - __main__ - Step 27847: {'lr': 0.0004633096304002279, 'samples': 5346624, 'steps': 27846, 'loss/train': 1.500084638595581} -11/07/2021 01:07:43 - INFO - __main__ - Step 27848: {'lr': 0.00046330686277420454, 'samples': 5346816, 'steps': 27847, 'loss/train': 2.1239893436431885} -11/07/2021 01:07:44 - INFO - __main__ - Step 27849: {'lr': 0.00046330409505206837, 'samples': 5347008, 'steps': 27848, 'loss/train': 1.8391716480255127} -11/07/2021 01:07:45 - INFO - __main__ - Step 27850: {'lr': 0.00046330132723382066, 'samples': 5347200, 'steps': 27849, 'loss/train': 1.156402349472046} -11/07/2021 01:07:45 - INFO - __main__ - Step 27851: {'lr': 0.0004632985593194627, 'samples': 5347392, 'steps': 27850, 'loss/train': 1.3428056240081787} -11/07/2021 01:07:46 - INFO - __main__ - Step 27852: {'lr': 0.00046329579130899567, 'samples': 5347584, 'steps': 27851, 'loss/train': 1.7555490732192993} -11/07/2021 01:07:46 - INFO - __main__ - Step 27853: {'lr': 0.0004632930232024209, 'samples': 5347776, 'steps': 27852, 'loss/train': 1.594679832458496} -11/07/2021 01:07:46 - INFO - __main__ - Step 27854: {'lr': 0.0004632902549997395, 'samples': 5347968, 'steps': 27853, 'loss/train': 1.824711799621582} -11/07/2021 01:07:47 - INFO - __main__ - Step 27855: {'lr': 0.00046328748670095287, 'samples': 5348160, 'steps': 27854, 'loss/train': 1.6588963270187378} -11/07/2021 01:07:48 - INFO - __main__ - Step 27856: {'lr': 0.0004632847183060622, 'samples': 5348352, 'steps': 27855, 'loss/train': 1.4669275283813477} -11/07/2021 01:07:48 - INFO - __main__ - Step 27857: {'lr': 0.0004632819498150688, 'samples': 5348544, 'steps': 27856, 'loss/train': 1.2879362106323242} -11/07/2021 01:07:48 - INFO - __main__ - Step 27858: {'lr': 0.00046327918122797363, 'samples': 5348736, 'steps': 27857, 'loss/train': 1.6480536460876465} -11/07/2021 01:07:49 - INFO - __main__ - Step 27859: {'lr': 0.00046327641254477833, 'samples': 5348928, 'steps': 27858, 'loss/train': 1.6864488124847412} -11/07/2021 01:07:49 - INFO - __main__ - Step 27860: {'lr': 0.00046327364376548384, 'samples': 5349120, 'steps': 27859, 'loss/train': 1.5656856298446655} -11/07/2021 01:07:50 - INFO - __main__ - Step 27861: {'lr': 0.0004632708748900917, 'samples': 5349312, 'steps': 27860, 'loss/train': 0.713880717754364} -11/07/2021 01:07:50 - INFO - __main__ - Step 27862: {'lr': 0.00046326810591860285, 'samples': 5349504, 'steps': 27861, 'loss/train': 1.2501379251480103} -11/07/2021 01:07:51 - INFO - __main__ - Step 27863: {'lr': 0.0004632653368510187, 'samples': 5349696, 'steps': 27862, 'loss/train': 1.0524699687957764} -11/07/2021 01:07:51 - INFO - __main__ - Step 27864: {'lr': 0.00046326256768734053, 'samples': 5349888, 'steps': 27863, 'loss/train': 1.8845356702804565} -11/07/2021 01:07:51 - INFO - __main__ - Step 27865: {'lr': 0.0004632597984275695, 'samples': 5350080, 'steps': 27864, 'loss/train': 1.9486255645751953} -11/07/2021 01:07:53 - INFO - __main__ - Step 27866: {'lr': 0.00046325702907170697, 'samples': 5350272, 'steps': 27865, 'loss/train': 1.428919792175293} -11/07/2021 01:07:53 - INFO - __main__ - Step 27867: {'lr': 0.000463254259619754, 'samples': 5350464, 'steps': 27866, 'loss/train': 1.1179231405258179} -11/07/2021 01:07:53 - INFO - __main__ - Step 27868: {'lr': 0.000463251490071712, 'samples': 5350656, 'steps': 27867, 'loss/train': 0.8844492435455322} -11/07/2021 01:07:54 - INFO - __main__ - Step 27869: {'lr': 0.0004632487204275822, 'samples': 5350848, 'steps': 27868, 'loss/train': 2.0191144943237305} -11/07/2021 01:07:54 - INFO - __main__ - Step 27870: {'lr': 0.0004632459506873658, 'samples': 5351040, 'steps': 27869, 'loss/train': 1.6613689661026} -11/07/2021 01:07:54 - INFO - __main__ - Step 27871: {'lr': 0.0004632431808510641, 'samples': 5351232, 'steps': 27870, 'loss/train': 1.1953953504562378} -11/07/2021 01:07:55 - INFO - __main__ - Step 27872: {'lr': 0.0004632404109186782, 'samples': 5351424, 'steps': 27871, 'loss/train': 1.4809138774871826} -11/07/2021 01:07:56 - INFO - __main__ - Step 27873: {'lr': 0.0004632376408902096, 'samples': 5351616, 'steps': 27872, 'loss/train': 1.6379996538162231} -11/07/2021 01:07:56 - INFO - __main__ - Step 27874: {'lr': 0.0004632348707656593, 'samples': 5351808, 'steps': 27873, 'loss/train': 0.8251739740371704} -11/07/2021 01:07:56 - INFO - __main__ - Step 27875: {'lr': 0.00046323210054502874, 'samples': 5352000, 'steps': 27874, 'loss/train': 1.391992211341858} -11/07/2021 01:07:57 - INFO - __main__ - Step 27876: {'lr': 0.00046322933022831903, 'samples': 5352192, 'steps': 27875, 'loss/train': 1.0245487689971924} -11/07/2021 01:07:58 - INFO - __main__ - Step 27877: {'lr': 0.0004632265598155315, 'samples': 5352384, 'steps': 27876, 'loss/train': 1.4199742078781128} -11/07/2021 01:07:58 - INFO - __main__ - Step 27878: {'lr': 0.00046322378930666736, 'samples': 5352576, 'steps': 27877, 'loss/train': 2.1536476612091064} -11/07/2021 01:07:59 - INFO - __main__ - Step 27879: {'lr': 0.0004632210187017278, 'samples': 5352768, 'steps': 27878, 'loss/train': 1.9955917596817017} -11/07/2021 01:07:59 - INFO - __main__ - Step 27880: {'lr': 0.00046321824800071425, 'samples': 5352960, 'steps': 27879, 'loss/train': 1.3227732181549072} -11/07/2021 01:07:59 - INFO - __main__ - Step 27881: {'lr': 0.0004632154772036279, 'samples': 5353152, 'steps': 27880, 'loss/train': 1.6037013530731201} -11/07/2021 01:08:00 - INFO - __main__ - Step 27882: {'lr': 0.0004632127063104698, 'samples': 5353344, 'steps': 27881, 'loss/train': 1.2945456504821777} -11/07/2021 01:08:01 - INFO - __main__ - Step 27883: {'lr': 0.00046320993532124137, 'samples': 5353536, 'steps': 27882, 'loss/train': 1.5950944423675537} -11/07/2021 01:08:01 - INFO - __main__ - Step 27884: {'lr': 0.0004632071642359439, 'samples': 5353728, 'steps': 27883, 'loss/train': 1.419105052947998} -11/07/2021 01:08:01 - INFO - __main__ - Step 27885: {'lr': 0.0004632043930545785, 'samples': 5353920, 'steps': 27884, 'loss/train': 1.512109398841858} -11/07/2021 01:08:02 - INFO - __main__ - Step 27886: {'lr': 0.00046320162177714653, 'samples': 5354112, 'steps': 27885, 'loss/train': 1.366862416267395} -11/07/2021 01:08:03 - INFO - __main__ - Step 27887: {'lr': 0.00046319885040364925, 'samples': 5354304, 'steps': 27886, 'loss/train': 1.5487957000732422} -11/07/2021 01:08:04 - INFO - __main__ - Step 27888: {'lr': 0.00046319607893408776, 'samples': 5354496, 'steps': 27887, 'loss/train': 2.327791452407837} -11/07/2021 01:08:04 - INFO - __main__ - Step 27889: {'lr': 0.0004631933073684635, 'samples': 5354688, 'steps': 27888, 'loss/train': 1.4284238815307617} -11/07/2021 01:08:04 - INFO - __main__ - Step 27890: {'lr': 0.00046319053570677754, 'samples': 5354880, 'steps': 27889, 'loss/train': 1.7574843168258667} -11/07/2021 01:08:05 - INFO - __main__ - Step 27891: {'lr': 0.0004631877639490313, 'samples': 5355072, 'steps': 27890, 'loss/train': 1.6959110498428345} -11/07/2021 01:08:05 - INFO - __main__ - Step 27892: {'lr': 0.0004631849920952259, 'samples': 5355264, 'steps': 27891, 'loss/train': 1.7205824851989746} -11/07/2021 01:08:06 - INFO - __main__ - Step 27893: {'lr': 0.0004631822201453626, 'samples': 5355456, 'steps': 27892, 'loss/train': 1.7389143705368042} -11/07/2021 01:08:06 - INFO - __main__ - Step 27894: {'lr': 0.0004631794480994427, 'samples': 5355648, 'steps': 27893, 'loss/train': 1.2902930974960327} -11/07/2021 01:08:07 - INFO - __main__ - Step 27895: {'lr': 0.0004631766759574675, 'samples': 5355840, 'steps': 27894, 'loss/train': 1.7765417098999023} -11/07/2021 01:08:07 - INFO - __main__ - Step 27896: {'lr': 0.0004631739037194381, 'samples': 5356032, 'steps': 27895, 'loss/train': 1.2097101211547852} -11/07/2021 01:08:08 - INFO - __main__ - Step 27897: {'lr': 0.00046317113138535584, 'samples': 5356224, 'steps': 27896, 'loss/train': 1.501318097114563} -11/07/2021 01:08:08 - INFO - __main__ - Step 27898: {'lr': 0.0004631683589552219, 'samples': 5356416, 'steps': 27897, 'loss/train': 1.8397634029388428} -11/07/2021 01:08:09 - INFO - __main__ - Step 27899: {'lr': 0.00046316558642903774, 'samples': 5356608, 'steps': 27898, 'loss/train': 1.658473014831543} -11/07/2021 01:08:10 - INFO - __main__ - Step 27900: {'lr': 0.0004631628138068043, 'samples': 5356800, 'steps': 27899, 'loss/train': 1.2211940288543701} -11/07/2021 01:08:10 - INFO - __main__ - Step 27901: {'lr': 0.00046316004108852305, 'samples': 5356992, 'steps': 27900, 'loss/train': 1.6784851551055908} -11/07/2021 01:08:10 - INFO - __main__ - Step 27902: {'lr': 0.0004631572682741952, 'samples': 5357184, 'steps': 27901, 'loss/train': 1.5503257513046265} -11/07/2021 01:08:11 - INFO - __main__ - Step 27903: {'lr': 0.0004631544953638219, 'samples': 5357376, 'steps': 27902, 'loss/train': 2.5688607692718506} -11/07/2021 01:08:12 - INFO - __main__ - Step 27904: {'lr': 0.00046315172235740455, 'samples': 5357568, 'steps': 27903, 'loss/train': 1.378450632095337} -11/07/2021 01:08:12 - INFO - __main__ - Step 27905: {'lr': 0.0004631489492549443, 'samples': 5357760, 'steps': 27904, 'loss/train': 1.9023025035858154} -11/07/2021 01:08:12 - INFO - __main__ - Step 27906: {'lr': 0.00046314617605644243, 'samples': 5357952, 'steps': 27905, 'loss/train': 1.4637824296951294} -11/07/2021 01:08:13 - INFO - __main__ - Step 27907: {'lr': 0.0004631434027619001, 'samples': 5358144, 'steps': 27906, 'loss/train': 0.5341514945030212} -11/07/2021 01:08:13 - INFO - __main__ - Step 27908: {'lr': 0.0004631406293713188, 'samples': 5358336, 'steps': 27907, 'loss/train': 0.705164909362793} -11/07/2021 01:08:14 - INFO - __main__ - Step 27909: {'lr': 0.0004631378558846995, 'samples': 5358528, 'steps': 27908, 'loss/train': 1.9466551542282104} -11/07/2021 01:08:15 - INFO - __main__ - Step 27910: {'lr': 0.00046313508230204364, 'samples': 5358720, 'steps': 27909, 'loss/train': 1.1565824747085571} -11/07/2021 01:08:15 - INFO - __main__ - Step 27911: {'lr': 0.00046313230862335235, 'samples': 5358912, 'steps': 27910, 'loss/train': 1.4948753118515015} -11/07/2021 01:08:15 - INFO - __main__ - Step 27912: {'lr': 0.000463129534848627, 'samples': 5359104, 'steps': 27911, 'loss/train': 1.0003376007080078} -11/07/2021 01:08:16 - INFO - __main__ - Step 27913: {'lr': 0.0004631267609778687, 'samples': 5359296, 'steps': 27912, 'loss/train': 1.6802488565444946} -11/07/2021 01:08:17 - INFO - __main__ - Step 27914: {'lr': 0.0004631239870110788, 'samples': 5359488, 'steps': 27913, 'loss/train': 1.7102736234664917} -11/07/2021 01:08:17 - INFO - __main__ - Step 27915: {'lr': 0.00046312121294825846, 'samples': 5359680, 'steps': 27914, 'loss/train': 1.6894041299819946} -11/07/2021 01:08:17 - INFO - __main__ - Step 27916: {'lr': 0.00046311843878940904, 'samples': 5359872, 'steps': 27915, 'loss/train': 1.746033787727356} -11/07/2021 01:08:18 - INFO - __main__ - Step 27917: {'lr': 0.0004631156645345318, 'samples': 5360064, 'steps': 27916, 'loss/train': 1.992263674736023} -11/07/2021 01:08:18 - INFO - __main__ - Step 27918: {'lr': 0.0004631128901836278, 'samples': 5360256, 'steps': 27917, 'loss/train': 1.7350739240646362} -11/07/2021 01:08:19 - INFO - __main__ - Step 27919: {'lr': 0.0004631101157366985, 'samples': 5360448, 'steps': 27918, 'loss/train': 1.9519680738449097} -11/07/2021 01:08:19 - INFO - __main__ - Step 27920: {'lr': 0.0004631073411937451, 'samples': 5360640, 'steps': 27919, 'loss/train': 1.4760541915893555} -11/07/2021 01:08:20 - INFO - __main__ - Step 27921: {'lr': 0.00046310456655476875, 'samples': 5360832, 'steps': 27920, 'loss/train': 0.7511192560195923} -11/07/2021 01:08:20 - INFO - __main__ - Step 27922: {'lr': 0.0004631017918197709, 'samples': 5361024, 'steps': 27921, 'loss/train': 1.594227910041809} -11/07/2021 01:08:20 - INFO - __main__ - Step 27923: {'lr': 0.00046309901698875244, 'samples': 5361216, 'steps': 27922, 'loss/train': 1.0119025707244873} -11/07/2021 01:08:21 - INFO - __main__ - Step 27924: {'lr': 0.00046309624206171505, 'samples': 5361408, 'steps': 27923, 'loss/train': 1.7466933727264404} -11/07/2021 01:08:22 - INFO - __main__ - Step 27925: {'lr': 0.00046309346703865973, 'samples': 5361600, 'steps': 27924, 'loss/train': 1.556564211845398} -11/07/2021 01:08:22 - INFO - __main__ - Step 27926: {'lr': 0.00046309069191958775, 'samples': 5361792, 'steps': 27925, 'loss/train': 1.549757957458496} -11/07/2021 01:08:23 - INFO - __main__ - Step 27927: {'lr': 0.00046308791670450033, 'samples': 5361984, 'steps': 27926, 'loss/train': 1.4141809940338135} -11/07/2021 01:08:23 - INFO - __main__ - Step 27928: {'lr': 0.00046308514139339896, 'samples': 5362176, 'steps': 27927, 'loss/train': 1.1684983968734741} -11/07/2021 01:08:24 - INFO - __main__ - Step 27929: {'lr': 0.0004630823659862846, 'samples': 5362368, 'steps': 27928, 'loss/train': 1.5739498138427734} -11/07/2021 01:08:24 - INFO - __main__ - Step 27930: {'lr': 0.0004630795904831586, 'samples': 5362560, 'steps': 27929, 'loss/train': 1.2718456983566284} -11/07/2021 01:08:25 - INFO - __main__ - Step 27931: {'lr': 0.0004630768148840223, 'samples': 5362752, 'steps': 27930, 'loss/train': 1.2361918687820435} -11/07/2021 01:08:25 - INFO - __main__ - Step 27932: {'lr': 0.0004630740391888768, 'samples': 5362944, 'steps': 27931, 'loss/train': 1.6679351329803467} -11/07/2021 01:08:25 - INFO - __main__ - Step 27933: {'lr': 0.0004630712633977234, 'samples': 5363136, 'steps': 27932, 'loss/train': 1.3536804914474487} -11/07/2021 01:08:26 - INFO - __main__ - Step 27934: {'lr': 0.00046306848751056346, 'samples': 5363328, 'steps': 27933, 'loss/train': 1.3461530208587646} -11/07/2021 01:08:27 - INFO - __main__ - Step 27935: {'lr': 0.0004630657115273981, 'samples': 5363520, 'steps': 27934, 'loss/train': 1.6294420957565308} -11/07/2021 01:08:27 - INFO - __main__ - Step 27936: {'lr': 0.0004630629354482286, 'samples': 5363712, 'steps': 27935, 'loss/train': 1.4199550151824951} -11/07/2021 01:08:27 - INFO - __main__ - Step 27937: {'lr': 0.00046306015927305633, 'samples': 5363904, 'steps': 27936, 'loss/train': 1.5213775634765625} -11/07/2021 01:08:28 - INFO - __main__ - Step 27938: {'lr': 0.0004630573830018824, 'samples': 5364096, 'steps': 27937, 'loss/train': 1.4308301210403442} -11/07/2021 01:08:28 - INFO - __main__ - Step 27939: {'lr': 0.00046305460663470803, 'samples': 5364288, 'steps': 27938, 'loss/train': 1.7389413118362427} -11/07/2021 01:08:29 - INFO - __main__ - Step 27940: {'lr': 0.0004630518301715346, 'samples': 5364480, 'steps': 27939, 'loss/train': 1.478661060333252} -11/07/2021 01:08:29 - INFO - __main__ - Step 27941: {'lr': 0.00046304905361236335, 'samples': 5364672, 'steps': 27940, 'loss/train': 1.7717012166976929} -11/07/2021 01:08:30 - INFO - __main__ - Step 27942: {'lr': 0.00046304627695719535, 'samples': 5364864, 'steps': 27941, 'loss/train': 1.5955733060836792} -11/07/2021 01:08:30 - INFO - __main__ - Step 27943: {'lr': 0.0004630435002060321, 'samples': 5365056, 'steps': 27942, 'loss/train': 1.272430419921875} -11/07/2021 01:08:30 - INFO - __main__ - Step 27944: {'lr': 0.0004630407233588747, 'samples': 5365248, 'steps': 27943, 'loss/train': 1.54817533493042} -11/07/2021 01:08:31 - INFO - __main__ - Step 27945: {'lr': 0.00046303794641572445, 'samples': 5365440, 'steps': 27944, 'loss/train': 1.4762077331542969} -11/07/2021 01:08:32 - INFO - __main__ - Step 27946: {'lr': 0.0004630351693765825, 'samples': 5365632, 'steps': 27945, 'loss/train': 1.6068906784057617} -11/07/2021 01:08:32 - INFO - __main__ - Step 27947: {'lr': 0.0004630323922414503, 'samples': 5365824, 'steps': 27946, 'loss/train': 1.3695404529571533} -11/07/2021 01:08:32 - INFO - __main__ - Step 27948: {'lr': 0.00046302961501032896, 'samples': 5366016, 'steps': 27947, 'loss/train': 1.3957011699676514} -11/07/2021 01:08:33 - INFO - __main__ - Step 27949: {'lr': 0.00046302683768321973, 'samples': 5366208, 'steps': 27948, 'loss/train': 1.190190076828003} -11/07/2021 01:08:34 - INFO - __main__ - Step 27950: {'lr': 0.00046302406026012396, 'samples': 5366400, 'steps': 27949, 'loss/train': 1.5490968227386475} -11/07/2021 01:08:34 - INFO - __main__ - Step 27951: {'lr': 0.0004630212827410428, 'samples': 5366592, 'steps': 27950, 'loss/train': 1.3641514778137207} -11/07/2021 01:08:35 - INFO - __main__ - Step 27952: {'lr': 0.00046301850512597755, 'samples': 5366784, 'steps': 27951, 'loss/train': 1.511609435081482} -11/07/2021 01:08:35 - INFO - __main__ - Step 27953: {'lr': 0.0004630157274149294, 'samples': 5366976, 'steps': 27952, 'loss/train': 1.105630874633789} -11/07/2021 01:08:35 - INFO - __main__ - Step 27954: {'lr': 0.0004630129496078997, 'samples': 5367168, 'steps': 27953, 'loss/train': 1.6662789583206177} -11/07/2021 01:08:36 - INFO - __main__ - Step 27955: {'lr': 0.00046301017170488965, 'samples': 5367360, 'steps': 27954, 'loss/train': 1.4889657497406006} -11/07/2021 01:08:37 - INFO - __main__ - Step 27956: {'lr': 0.0004630073937059005, 'samples': 5367552, 'steps': 27955, 'loss/train': 0.7831249833106995} -11/07/2021 01:08:37 - INFO - __main__ - Step 27957: {'lr': 0.0004630046156109334, 'samples': 5367744, 'steps': 27956, 'loss/train': 1.9498980045318604} -11/07/2021 01:08:37 - INFO - __main__ - Step 27958: {'lr': 0.0004630018374199899, 'samples': 5367936, 'steps': 27957, 'loss/train': 1.4369566440582275} -11/07/2021 01:08:38 - INFO - __main__ - Step 27959: {'lr': 0.00046299905913307096, 'samples': 5368128, 'steps': 27958, 'loss/train': 1.1461580991744995} -11/07/2021 01:08:39 - INFO - __main__ - Step 27960: {'lr': 0.00046299628075017785, 'samples': 5368320, 'steps': 27959, 'loss/train': 1.9767727851867676} -11/07/2021 01:08:39 - INFO - __main__ - Step 27961: {'lr': 0.000462993502271312, 'samples': 5368512, 'steps': 27960, 'loss/train': 1.7098110914230347} -11/07/2021 01:08:40 - INFO - __main__ - Step 27962: {'lr': 0.00046299072369647453, 'samples': 5368704, 'steps': 27961, 'loss/train': 1.5643975734710693} -11/07/2021 01:08:40 - INFO - __main__ - Step 27963: {'lr': 0.00046298794502566676, 'samples': 5368896, 'steps': 27962, 'loss/train': 1.5460844039916992} -11/07/2021 01:08:40 - INFO - __main__ - Step 27964: {'lr': 0.0004629851662588899, 'samples': 5369088, 'steps': 27963, 'loss/train': 2.0571935176849365} -11/07/2021 01:08:41 - INFO - __main__ - Step 27965: {'lr': 0.00046298238739614524, 'samples': 5369280, 'steps': 27964, 'loss/train': 1.5529454946517944} -11/07/2021 01:08:42 - INFO - __main__ - Step 27966: {'lr': 0.0004629796084374339, 'samples': 5369472, 'steps': 27965, 'loss/train': 1.4575004577636719} -11/07/2021 01:08:42 - INFO - __main__ - Step 27967: {'lr': 0.00046297682938275733, 'samples': 5369664, 'steps': 27966, 'loss/train': 1.5414485931396484} -11/07/2021 01:08:42 - INFO - __main__ - Step 27968: {'lr': 0.0004629740502321167, 'samples': 5369856, 'steps': 27967, 'loss/train': 1.659104585647583} -11/07/2021 01:08:43 - INFO - __main__ - Step 27969: {'lr': 0.00046297127098551317, 'samples': 5370048, 'steps': 27968, 'loss/train': 0.7998484373092651} -11/07/2021 01:08:43 - INFO - __main__ - Step 27970: {'lr': 0.00046296849164294816, 'samples': 5370240, 'steps': 27969, 'loss/train': 1.6854795217514038} -11/07/2021 01:08:44 - INFO - __main__ - Step 27971: {'lr': 0.00046296571220442274, 'samples': 5370432, 'steps': 27970, 'loss/train': 1.4134701490402222} -11/07/2021 01:08:45 - INFO - __main__ - Step 27972: {'lr': 0.00046296293266993833, 'samples': 5370624, 'steps': 27971, 'loss/train': 1.8665457963943481} -11/07/2021 01:08:45 - INFO - __main__ - Step 27973: {'lr': 0.00046296015303949606, 'samples': 5370816, 'steps': 27972, 'loss/train': 1.2247053384780884} -11/07/2021 01:08:45 - INFO - __main__ - Step 27974: {'lr': 0.0004629573733130973, 'samples': 5371008, 'steps': 27973, 'loss/train': 1.5885862112045288} -11/07/2021 01:08:46 - INFO - __main__ - Step 27975: {'lr': 0.00046295459349074316, 'samples': 5371200, 'steps': 27974, 'loss/train': 1.613280177116394} -11/07/2021 01:08:47 - INFO - __main__ - Step 27976: {'lr': 0.000462951813572435, 'samples': 5371392, 'steps': 27975, 'loss/train': 1.2622509002685547} -11/07/2021 01:08:47 - INFO - __main__ - Step 27977: {'lr': 0.00046294903355817397, 'samples': 5371584, 'steps': 27976, 'loss/train': 1.672298789024353} -11/07/2021 01:08:47 - INFO - __main__ - Step 27978: {'lr': 0.0004629462534479615, 'samples': 5371776, 'steps': 27977, 'loss/train': 1.6013282537460327} -11/07/2021 01:08:48 - INFO - __main__ - Step 27979: {'lr': 0.0004629434732417986, 'samples': 5371968, 'steps': 27978, 'loss/train': 1.2018623352050781} -11/07/2021 01:08:48 - INFO - __main__ - Step 27980: {'lr': 0.0004629406929396868, 'samples': 5372160, 'steps': 27979, 'loss/train': 1.450639247894287} -11/07/2021 01:08:49 - INFO - __main__ - Step 27981: {'lr': 0.00046293791254162713, 'samples': 5372352, 'steps': 27980, 'loss/train': 1.7362723350524902} -11/07/2021 01:08:49 - INFO - __main__ - Step 27982: {'lr': 0.0004629351320476209, 'samples': 5372544, 'steps': 27981, 'loss/train': 1.3867053985595703} -11/07/2021 01:08:50 - INFO - __main__ - Step 27983: {'lr': 0.00046293235145766955, 'samples': 5372736, 'steps': 27982, 'loss/train': 1.4130687713623047} -11/07/2021 01:08:50 - INFO - __main__ - Step 27984: {'lr': 0.000462929570771774, 'samples': 5372928, 'steps': 27983, 'loss/train': 0.9213356375694275} -11/07/2021 01:08:50 - INFO - __main__ - Step 27985: {'lr': 0.0004629267899899358, 'samples': 5373120, 'steps': 27984, 'loss/train': 0.8098600506782532} -11/07/2021 01:08:51 - INFO - __main__ - Step 27986: {'lr': 0.00046292400911215594, 'samples': 5373312, 'steps': 27985, 'loss/train': 1.0836659669876099} -11/07/2021 01:08:52 - INFO - __main__ - Step 27987: {'lr': 0.00046292122813843586, 'samples': 5373504, 'steps': 27986, 'loss/train': 1.5532180070877075} -11/07/2021 01:08:52 - INFO - __main__ - Step 27988: {'lr': 0.00046291844706877674, 'samples': 5373696, 'steps': 27987, 'loss/train': 1.2126308679580688} -11/07/2021 01:08:52 - INFO - __main__ - Step 27989: {'lr': 0.0004629156659031799, 'samples': 5373888, 'steps': 27988, 'loss/train': 1.552217721939087} -11/07/2021 01:08:53 - INFO - __main__ - Step 27990: {'lr': 0.0004629128846416465, 'samples': 5374080, 'steps': 27989, 'loss/train': 1.5919543504714966} -11/07/2021 01:08:54 - INFO - __main__ - Step 27991: {'lr': 0.00046291010328417784, 'samples': 5374272, 'steps': 27990, 'loss/train': 1.7490825653076172} -11/07/2021 01:08:54 - INFO - __main__ - Step 27992: {'lr': 0.0004629073218307752, 'samples': 5374464, 'steps': 27991, 'loss/train': 1.7721277475357056} -11/07/2021 01:08:55 - INFO - __main__ - Step 27993: {'lr': 0.0004629045402814398, 'samples': 5374656, 'steps': 27992, 'loss/train': 1.260655403137207} -11/07/2021 01:08:55 - INFO - __main__ - Step 27994: {'lr': 0.0004629017586361729, 'samples': 5374848, 'steps': 27993, 'loss/train': 1.638946533203125} -11/07/2021 01:08:55 - INFO - __main__ - Step 27995: {'lr': 0.0004628989768949757, 'samples': 5375040, 'steps': 27994, 'loss/train': 1.3483721017837524} -11/07/2021 01:08:56 - INFO - __main__ - Step 27996: {'lr': 0.0004628961950578496, 'samples': 5375232, 'steps': 27995, 'loss/train': 1.5386420488357544} -11/07/2021 01:08:57 - INFO - __main__ - Step 27997: {'lr': 0.00046289341312479574, 'samples': 5375424, 'steps': 27996, 'loss/train': 1.6511589288711548} -11/07/2021 01:08:57 - INFO - __main__ - Step 27998: {'lr': 0.0004628906310958153, 'samples': 5375616, 'steps': 27997, 'loss/train': 1.5828850269317627} -11/07/2021 01:08:57 - INFO - __main__ - Step 27999: {'lr': 0.00046288784897090973, 'samples': 5375808, 'steps': 27998, 'loss/train': 1.1882143020629883} -11/07/2021 01:08:58 - INFO - __main__ - Step 28000: {'lr': 0.00046288506675008014, 'samples': 5376000, 'steps': 27999, 'loss/train': 1.262174367904663} -11/07/2021 01:08:59 - INFO - __main__ - Step 28001: {'lr': 0.0004628822844333278, 'samples': 5376192, 'steps': 28000, 'loss/train': 1.8064054250717163} -11/07/2021 01:08:59 - INFO - __main__ - Step 28002: {'lr': 0.0004628795020206541, 'samples': 5376384, 'steps': 28001, 'loss/train': 2.0902321338653564} -11/07/2021 01:09:00 - INFO - __main__ - Step 28003: {'lr': 0.00046287671951206004, 'samples': 5376576, 'steps': 28002, 'loss/train': 1.5915676355361938} -11/07/2021 01:09:00 - INFO - __main__ - Step 28004: {'lr': 0.0004628739369075471, 'samples': 5376768, 'steps': 28003, 'loss/train': 1.1522947549819946} -11/07/2021 01:09:00 - INFO - __main__ - Step 28005: {'lr': 0.00046287115420711643, 'samples': 5376960, 'steps': 28004, 'loss/train': 1.939139723777771} -11/07/2021 01:09:01 - INFO - __main__ - Step 28006: {'lr': 0.00046286837141076934, 'samples': 5377152, 'steps': 28005, 'loss/train': 1.4172292947769165} -11/07/2021 01:09:02 - INFO - __main__ - Step 28007: {'lr': 0.0004628655885185069, 'samples': 5377344, 'steps': 28006, 'loss/train': 0.7986924648284912} -11/07/2021 01:09:02 - INFO - __main__ - Step 28008: {'lr': 0.00046286280553033067, 'samples': 5377536, 'steps': 28007, 'loss/train': 1.7829539775848389} -11/07/2021 01:09:02 - INFO - __main__ - Step 28009: {'lr': 0.0004628600224462417, 'samples': 5377728, 'steps': 28008, 'loss/train': 2.08845853805542} -11/07/2021 01:09:03 - INFO - __main__ - Step 28010: {'lr': 0.00046285723926624126, 'samples': 5377920, 'steps': 28009, 'loss/train': 0.8777673244476318} -11/07/2021 01:09:03 - INFO - __main__ - Step 28011: {'lr': 0.00046285445599033063, 'samples': 5378112, 'steps': 28010, 'loss/train': 1.582600712776184} -11/07/2021 01:09:04 - INFO - __main__ - Step 28012: {'lr': 0.00046285167261851114, 'samples': 5378304, 'steps': 28011, 'loss/train': 1.723099708557129} -11/07/2021 01:09:04 - INFO - __main__ - Step 28013: {'lr': 0.00046284888915078384, 'samples': 5378496, 'steps': 28012, 'loss/train': 1.5498576164245605} -11/07/2021 01:09:05 - INFO - __main__ - Step 28014: {'lr': 0.00046284610558715024, 'samples': 5378688, 'steps': 28013, 'loss/train': 1.2753721475601196} -11/07/2021 01:09:05 - INFO - __main__ - Step 28015: {'lr': 0.00046284332192761136, 'samples': 5378880, 'steps': 28014, 'loss/train': 1.680116891860962} -11/07/2021 01:09:05 - INFO - __main__ - Step 28016: {'lr': 0.0004628405381721686, 'samples': 5379072, 'steps': 28015, 'loss/train': 1.4995726346969604} -11/07/2021 01:09:07 - INFO - __main__ - Step 28017: {'lr': 0.00046283775432082327, 'samples': 5379264, 'steps': 28016, 'loss/train': 1.733219027519226} -11/07/2021 01:09:07 - INFO - __main__ - Step 28018: {'lr': 0.0004628349703735765, 'samples': 5379456, 'steps': 28017, 'loss/train': 1.6560436487197876} -11/07/2021 01:09:07 - INFO - __main__ - Step 28019: {'lr': 0.0004628321863304295, 'samples': 5379648, 'steps': 28018, 'loss/train': 1.7639132738113403} -11/07/2021 01:09:08 - INFO - __main__ - Step 28020: {'lr': 0.00046282940219138366, 'samples': 5379840, 'steps': 28019, 'loss/train': 1.337292194366455} -11/07/2021 01:09:08 - INFO - __main__ - Step 28021: {'lr': 0.0004628266179564401, 'samples': 5380032, 'steps': 28020, 'loss/train': 0.2998325824737549} -11/07/2021 01:09:08 - INFO - __main__ - Step 28022: {'lr': 0.0004628238336256002, 'samples': 5380224, 'steps': 28021, 'loss/train': 1.5005648136138916} -11/07/2021 01:09:09 - INFO - __main__ - Step 28023: {'lr': 0.0004628210491988652, 'samples': 5380416, 'steps': 28022, 'loss/train': 1.5982273817062378} -11/07/2021 01:09:10 - INFO - __main__ - Step 28024: {'lr': 0.0004628182646762363, 'samples': 5380608, 'steps': 28023, 'loss/train': 1.552241325378418} -11/07/2021 01:09:10 - INFO - __main__ - Step 28025: {'lr': 0.00046281548005771476, 'samples': 5380800, 'steps': 28024, 'loss/train': 1.9095693826675415} -11/07/2021 01:09:10 - INFO - __main__ - Step 28026: {'lr': 0.0004628126953433018, 'samples': 5380992, 'steps': 28025, 'loss/train': 1.3487874269485474} -11/07/2021 01:09:11 - INFO - __main__ - Step 28027: {'lr': 0.00046280991053299883, 'samples': 5381184, 'steps': 28026, 'loss/train': 1.3562543392181396} -11/07/2021 01:09:12 - INFO - __main__ - Step 28028: {'lr': 0.00046280712562680695, 'samples': 5381376, 'steps': 28027, 'loss/train': 1.626530408859253} -11/07/2021 01:09:12 - INFO - __main__ - Step 28029: {'lr': 0.0004628043406247274, 'samples': 5381568, 'steps': 28028, 'loss/train': 2.292478084564209} -11/07/2021 01:09:12 - INFO - __main__ - Step 28030: {'lr': 0.0004628015555267616, 'samples': 5381760, 'steps': 28029, 'loss/train': 1.692482352256775} -11/07/2021 01:09:13 - INFO - __main__ - Step 28031: {'lr': 0.00046279877033291063, 'samples': 5381952, 'steps': 28030, 'loss/train': 1.5280697345733643} -11/07/2021 01:09:13 - INFO - __main__ - Step 28032: {'lr': 0.0004627959850431759, 'samples': 5382144, 'steps': 28031, 'loss/train': 2.019195318222046} -11/07/2021 01:09:14 - INFO - __main__ - Step 28033: {'lr': 0.0004627931996575585, 'samples': 5382336, 'steps': 28032, 'loss/train': 1.5592269897460938} -11/07/2021 01:09:15 - INFO - __main__ - Step 28034: {'lr': 0.0004627904141760598, 'samples': 5382528, 'steps': 28033, 'loss/train': 1.290827751159668} -11/07/2021 01:09:15 - INFO - __main__ - Step 28035: {'lr': 0.000462787628598681, 'samples': 5382720, 'steps': 28034, 'loss/train': 1.722243070602417} -11/07/2021 01:09:15 - INFO - __main__ - Step 28036: {'lr': 0.00046278484292542346, 'samples': 5382912, 'steps': 28035, 'loss/train': 1.1731336116790771} -11/07/2021 01:09:16 - INFO - __main__ - Step 28037: {'lr': 0.0004627820571562883, 'samples': 5383104, 'steps': 28036, 'loss/train': 1.524124026298523} -11/07/2021 01:09:17 - INFO - __main__ - Step 28038: {'lr': 0.0004627792712912768, 'samples': 5383296, 'steps': 28037, 'loss/train': 2.1107864379882812} -11/07/2021 01:09:17 - INFO - __main__ - Step 28039: {'lr': 0.0004627764853303902, 'samples': 5383488, 'steps': 28038, 'loss/train': 1.5921052694320679} -11/07/2021 01:09:17 - INFO - __main__ - Step 28040: {'lr': 0.00046277369927362987, 'samples': 5383680, 'steps': 28039, 'loss/train': 1.7127749919891357} -11/07/2021 01:09:18 - INFO - __main__ - Step 28041: {'lr': 0.00046277091312099704, 'samples': 5383872, 'steps': 28040, 'loss/train': 1.6613887548446655} -11/07/2021 01:09:18 - INFO - __main__ - Step 28042: {'lr': 0.00046276812687249283, 'samples': 5384064, 'steps': 28041, 'loss/train': 1.9463579654693604} -11/07/2021 01:09:19 - INFO - __main__ - Step 28043: {'lr': 0.00046276534052811863, 'samples': 5384256, 'steps': 28042, 'loss/train': 1.6028937101364136} -11/07/2021 01:09:20 - INFO - __main__ - Step 28044: {'lr': 0.00046276255408787565, 'samples': 5384448, 'steps': 28043, 'loss/train': 1.499482274055481} -11/07/2021 01:09:20 - INFO - __main__ - Step 28045: {'lr': 0.0004627597675517652, 'samples': 5384640, 'steps': 28044, 'loss/train': 0.9538659453392029} -11/07/2021 01:09:20 - INFO - __main__ - Step 28046: {'lr': 0.00046275698091978836, 'samples': 5384832, 'steps': 28045, 'loss/train': 1.4438320398330688} -11/07/2021 01:09:21 - INFO - __main__ - Step 28047: {'lr': 0.0004627541941919466, 'samples': 5385024, 'steps': 28046, 'loss/train': 1.389336109161377} -11/07/2021 01:09:22 - INFO - __main__ - Step 28048: {'lr': 0.00046275140736824104, 'samples': 5385216, 'steps': 28047, 'loss/train': 1.7338414192199707} -11/07/2021 01:09:22 - INFO - __main__ - Step 28049: {'lr': 0.000462748620448673, 'samples': 5385408, 'steps': 28048, 'loss/train': 1.335105061531067} -11/07/2021 01:09:22 - INFO - __main__ - Step 28050: {'lr': 0.0004627458334332437, 'samples': 5385600, 'steps': 28049, 'loss/train': 1.6704505681991577} -11/07/2021 01:09:23 - INFO - __main__ - Step 28051: {'lr': 0.0004627430463219544, 'samples': 5385792, 'steps': 28050, 'loss/train': 1.591986060142517} -11/07/2021 01:09:23 - INFO - __main__ - Step 28052: {'lr': 0.0004627402591148064, 'samples': 5385984, 'steps': 28051, 'loss/train': 1.5422168970108032} -11/07/2021 01:09:23 - INFO - __main__ - Step 28053: {'lr': 0.0004627374718118009, 'samples': 5386176, 'steps': 28052, 'loss/train': 1.6419172286987305} -11/07/2021 01:09:24 - INFO - __main__ - Step 28054: {'lr': 0.0004627346844129392, 'samples': 5386368, 'steps': 28053, 'loss/train': 1.4023685455322266} -11/07/2021 01:09:25 - INFO - __main__ - Step 28055: {'lr': 0.0004627318969182225, 'samples': 5386560, 'steps': 28054, 'loss/train': 1.5047255754470825} -11/07/2021 01:09:25 - INFO - __main__ - Step 28056: {'lr': 0.0004627291093276521, 'samples': 5386752, 'steps': 28055, 'loss/train': 1.5556131601333618} -11/07/2021 01:09:25 - INFO - __main__ - Step 28057: {'lr': 0.0004627263216412292, 'samples': 5386944, 'steps': 28056, 'loss/train': 2.0487048625946045} -11/07/2021 01:09:26 - INFO - __main__ - Step 28058: {'lr': 0.00046272353385895515, 'samples': 5387136, 'steps': 28057, 'loss/train': 1.6594773530960083} -11/07/2021 01:09:27 - INFO - __main__ - Step 28059: {'lr': 0.0004627207459808312, 'samples': 5387328, 'steps': 28058, 'loss/train': 1.4510393142700195} -11/07/2021 01:09:27 - INFO - __main__ - Step 28060: {'lr': 0.00046271795800685854, 'samples': 5387520, 'steps': 28059, 'loss/train': 1.6694095134735107} -11/07/2021 01:09:27 - INFO - __main__ - Step 28061: {'lr': 0.00046271516993703844, 'samples': 5387712, 'steps': 28060, 'loss/train': 1.4473903179168701} -11/07/2021 01:09:28 - INFO - __main__ - Step 28062: {'lr': 0.00046271238177137216, 'samples': 5387904, 'steps': 28061, 'loss/train': 1.3745687007904053} -11/07/2021 01:09:28 - INFO - __main__ - Step 28063: {'lr': 0.00046270959350986095, 'samples': 5388096, 'steps': 28062, 'loss/train': 1.5512062311172485} -11/07/2021 01:09:29 - INFO - __main__ - Step 28064: {'lr': 0.0004627068051525061, 'samples': 5388288, 'steps': 28063, 'loss/train': 1.3083319664001465} -11/07/2021 01:09:29 - INFO - __main__ - Step 28065: {'lr': 0.00046270401669930885, 'samples': 5388480, 'steps': 28064, 'loss/train': 1.5867365598678589} -11/07/2021 01:09:30 - INFO - __main__ - Step 28066: {'lr': 0.0004627012281502704, 'samples': 5388672, 'steps': 28065, 'loss/train': 1.640199065208435} -11/07/2021 01:09:30 - INFO - __main__ - Step 28067: {'lr': 0.00046269843950539214, 'samples': 5388864, 'steps': 28066, 'loss/train': 1.7950187921524048} -11/07/2021 01:09:31 - INFO - __main__ - Step 28068: {'lr': 0.00046269565076467517, 'samples': 5389056, 'steps': 28067, 'loss/train': 1.6963131427764893} -11/07/2021 01:09:32 - INFO - __main__ - Step 28069: {'lr': 0.0004626928619281209, 'samples': 5389248, 'steps': 28068, 'loss/train': 1.6827151775360107} -11/07/2021 01:09:32 - INFO - __main__ - Step 28070: {'lr': 0.0004626900729957305, 'samples': 5389440, 'steps': 28069, 'loss/train': 1.433807611465454} -11/07/2021 01:09:32 - INFO - __main__ - Step 28071: {'lr': 0.00046268728396750515, 'samples': 5389632, 'steps': 28070, 'loss/train': 1.8343700170516968} -11/07/2021 01:09:33 - INFO - __main__ - Step 28072: {'lr': 0.0004626844948434462, 'samples': 5389824, 'steps': 28071, 'loss/train': 1.6992357969284058} -11/07/2021 01:09:33 - INFO - __main__ - Step 28073: {'lr': 0.00046268170562355497, 'samples': 5390016, 'steps': 28072, 'loss/train': 1.352782964706421} -11/07/2021 01:09:34 - INFO - __main__ - Step 28074: {'lr': 0.0004626789163078327, 'samples': 5390208, 'steps': 28073, 'loss/train': 1.7138376235961914} -11/07/2021 01:09:35 - INFO - __main__ - Step 28075: {'lr': 0.00046267612689628046, 'samples': 5390400, 'steps': 28074, 'loss/train': 1.884217381477356} -11/07/2021 01:09:35 - INFO - __main__ - Step 28076: {'lr': 0.00046267333738889973, 'samples': 5390592, 'steps': 28075, 'loss/train': 0.8912597894668579} -11/07/2021 01:09:35 - INFO - __main__ - Step 28077: {'lr': 0.00046267054778569163, 'samples': 5390784, 'steps': 28076, 'loss/train': 1.3834558725357056} -11/07/2021 01:09:36 - INFO - __main__ - Step 28078: {'lr': 0.0004626677580866574, 'samples': 5390976, 'steps': 28077, 'loss/train': 1.657981514930725} -11/07/2021 01:09:37 - INFO - __main__ - Step 28079: {'lr': 0.00046266496829179847, 'samples': 5391168, 'steps': 28078, 'loss/train': 1.483892560005188} -11/07/2021 01:09:37 - INFO - __main__ - Step 28080: {'lr': 0.0004626621784011159, 'samples': 5391360, 'steps': 28079, 'loss/train': 1.7254626750946045} -11/07/2021 01:09:37 - INFO - __main__ - Step 28081: {'lr': 0.0004626593884146111, 'samples': 5391552, 'steps': 28080, 'loss/train': 1.7378684282302856} -11/07/2021 01:09:38 - INFO - __main__ - Step 28082: {'lr': 0.00046265659833228523, 'samples': 5391744, 'steps': 28081, 'loss/train': 1.5451849699020386} -11/07/2021 01:09:38 - INFO - __main__ - Step 28083: {'lr': 0.0004626538081541396, 'samples': 5391936, 'steps': 28082, 'loss/train': 1.3562519550323486} -11/07/2021 01:09:38 - INFO - __main__ - Step 28084: {'lr': 0.00046265101788017543, 'samples': 5392128, 'steps': 28083, 'loss/train': 1.4944548606872559} -11/07/2021 01:09:39 - INFO - __main__ - Step 28085: {'lr': 0.00046264822751039406, 'samples': 5392320, 'steps': 28084, 'loss/train': 1.656470775604248} -11/07/2021 01:09:40 - INFO - __main__ - Step 28086: {'lr': 0.00046264543704479654, 'samples': 5392512, 'steps': 28085, 'loss/train': 1.6204808950424194} -11/07/2021 01:09:40 - INFO - __main__ - Step 28087: {'lr': 0.0004626426464833844, 'samples': 5392704, 'steps': 28086, 'loss/train': 1.1907124519348145} -11/07/2021 01:09:40 - INFO - __main__ - Step 28088: {'lr': 0.0004626398558261586, 'samples': 5392896, 'steps': 28087, 'loss/train': 1.611730694770813} -11/07/2021 01:09:41 - INFO - __main__ - Step 28089: {'lr': 0.00046263706507312073, 'samples': 5393088, 'steps': 28088, 'loss/train': 1.4733778238296509} -11/07/2021 01:09:42 - INFO - __main__ - Step 28090: {'lr': 0.00046263427422427183, 'samples': 5393280, 'steps': 28089, 'loss/train': 1.566117525100708} -11/07/2021 01:09:42 - INFO - __main__ - Step 28091: {'lr': 0.00046263148327961324, 'samples': 5393472, 'steps': 28090, 'loss/train': 1.3886053562164307} -11/07/2021 01:09:43 - INFO - __main__ - Step 28092: {'lr': 0.00046262869223914613, 'samples': 5393664, 'steps': 28091, 'loss/train': 1.5615581274032593} -11/07/2021 01:09:43 - INFO - __main__ - Step 28093: {'lr': 0.00046262590110287183, 'samples': 5393856, 'steps': 28092, 'loss/train': 1.5337178707122803} -11/07/2021 01:09:43 - INFO - __main__ - Step 28094: {'lr': 0.00046262310987079156, 'samples': 5394048, 'steps': 28093, 'loss/train': 1.2868162393569946} -11/07/2021 01:09:44 - INFO - __main__ - Step 28095: {'lr': 0.0004626203185429066, 'samples': 5394240, 'steps': 28094, 'loss/train': 1.0722566843032837} -11/07/2021 01:09:45 - INFO - __main__ - Step 28096: {'lr': 0.00046261752711921825, 'samples': 5394432, 'steps': 28095, 'loss/train': 1.422263503074646} -11/07/2021 01:09:45 - INFO - __main__ - Step 28097: {'lr': 0.00046261473559972764, 'samples': 5394624, 'steps': 28096, 'loss/train': 1.1242746114730835} -11/07/2021 01:09:45 - INFO - __main__ - Step 28098: {'lr': 0.00046261194398443617, 'samples': 5394816, 'steps': 28097, 'loss/train': 1.7802011966705322} -11/07/2021 01:09:46 - INFO - __main__ - Step 28099: {'lr': 0.00046260915227334503, 'samples': 5395008, 'steps': 28098, 'loss/train': 1.442736029624939} -11/07/2021 01:09:47 - INFO - __main__ - Step 28100: {'lr': 0.0004626063604664555, 'samples': 5395200, 'steps': 28099, 'loss/train': 1.458739995956421} -11/07/2021 01:09:47 - INFO - __main__ - Step 28101: {'lr': 0.00046260356856376884, 'samples': 5395392, 'steps': 28100, 'loss/train': 1.3972065448760986} -11/07/2021 01:09:47 - INFO - __main__ - Step 28102: {'lr': 0.0004626007765652862, 'samples': 5395584, 'steps': 28101, 'loss/train': 1.6531623601913452} -11/07/2021 01:09:48 - INFO - __main__ - Step 28103: {'lr': 0.00046259798447100903, 'samples': 5395776, 'steps': 28102, 'loss/train': 0.6677843332290649} -11/07/2021 01:09:48 - INFO - __main__ - Step 28104: {'lr': 0.0004625951922809385, 'samples': 5395968, 'steps': 28103, 'loss/train': 1.4591470956802368} -11/07/2021 01:09:49 - INFO - __main__ - Step 28105: {'lr': 0.0004625923999950758, 'samples': 5396160, 'steps': 28104, 'loss/train': 1.812696933746338} -11/07/2021 01:09:50 - INFO - __main__ - Step 28106: {'lr': 0.0004625896076134222, 'samples': 5396352, 'steps': 28105, 'loss/train': 1.6228306293487549} -11/07/2021 01:09:50 - INFO - __main__ - Step 28107: {'lr': 0.00046258681513597913, 'samples': 5396544, 'steps': 28106, 'loss/train': 1.282670497894287} -11/07/2021 01:09:50 - INFO - __main__ - Step 28108: {'lr': 0.0004625840225627476, 'samples': 5396736, 'steps': 28107, 'loss/train': 1.8279814720153809} -11/07/2021 01:09:51 - INFO - __main__ - Step 28109: {'lr': 0.0004625812298937291, 'samples': 5396928, 'steps': 28108, 'loss/train': 1.9043680429458618} -11/07/2021 01:09:51 - INFO - __main__ - Step 28110: {'lr': 0.0004625784371289247, 'samples': 5397120, 'steps': 28109, 'loss/train': 1.7655878067016602} -11/07/2021 01:09:52 - INFO - __main__ - Step 28111: {'lr': 0.00046257564426833574, 'samples': 5397312, 'steps': 28110, 'loss/train': 0.7204713225364685} -11/07/2021 01:09:52 - INFO - __main__ - Step 28112: {'lr': 0.0004625728513119635, 'samples': 5397504, 'steps': 28111, 'loss/train': 1.454695463180542} -11/07/2021 01:09:53 - INFO - __main__ - Step 28113: {'lr': 0.0004625700582598092, 'samples': 5397696, 'steps': 28112, 'loss/train': 0.9713383316993713} -11/07/2021 01:09:53 - INFO - __main__ - Step 28114: {'lr': 0.00046256726511187407, 'samples': 5397888, 'steps': 28113, 'loss/train': 1.6995383501052856} -11/07/2021 01:09:53 - INFO - __main__ - Step 28115: {'lr': 0.0004625644718681595, 'samples': 5398080, 'steps': 28114, 'loss/train': 0.9354874491691589} -11/07/2021 01:09:54 - INFO - __main__ - Step 28116: {'lr': 0.0004625616785286666, 'samples': 5398272, 'steps': 28115, 'loss/train': 1.810640573501587} -11/07/2021 01:09:55 - INFO - __main__ - Step 28117: {'lr': 0.0004625588850933967, 'samples': 5398464, 'steps': 28116, 'loss/train': 1.472623348236084} -11/07/2021 01:09:55 - INFO - __main__ - Step 28118: {'lr': 0.00046255609156235105, 'samples': 5398656, 'steps': 28117, 'loss/train': 1.1488120555877686} -11/07/2021 01:09:55 - INFO - __main__ - Step 28119: {'lr': 0.0004625532979355309, 'samples': 5398848, 'steps': 28118, 'loss/train': 1.590772271156311} -11/07/2021 01:09:56 - INFO - __main__ - Step 28120: {'lr': 0.00046255050421293756, 'samples': 5399040, 'steps': 28119, 'loss/train': 1.3995095491409302} -11/07/2021 01:09:57 - INFO - __main__ - Step 28121: {'lr': 0.0004625477103945722, 'samples': 5399232, 'steps': 28120, 'loss/train': 0.9050951600074768} -11/07/2021 01:09:57 - INFO - __main__ - Step 28122: {'lr': 0.00046254491648043604, 'samples': 5399424, 'steps': 28121, 'loss/train': 0.5893778800964355} -11/07/2021 01:09:57 - INFO - __main__ - Step 28123: {'lr': 0.00046254212247053055, 'samples': 5399616, 'steps': 28122, 'loss/train': 1.2392082214355469} -11/07/2021 01:09:58 - INFO - __main__ - Step 28124: {'lr': 0.0004625393283648568, 'samples': 5399808, 'steps': 28123, 'loss/train': 1.4818974733352661} -11/07/2021 01:09:58 - INFO - __main__ - Step 28125: {'lr': 0.0004625365341634161, 'samples': 5400000, 'steps': 28124, 'loss/train': 1.5307754278182983} -11/07/2021 01:09:59 - INFO - __main__ - Step 28126: {'lr': 0.00046253373986620985, 'samples': 5400192, 'steps': 28125, 'loss/train': 1.4790600538253784} -11/07/2021 01:10:00 - INFO - __main__ - Step 28127: {'lr': 0.00046253094547323904, 'samples': 5400384, 'steps': 28126, 'loss/train': 1.7845100164413452} -11/07/2021 01:10:00 - INFO - __main__ - Step 28128: {'lr': 0.0004625281509845051, 'samples': 5400576, 'steps': 28127, 'loss/train': 2.040771961212158} -11/07/2021 01:10:00 - INFO - __main__ - Step 28129: {'lr': 0.0004625253564000092, 'samples': 5400768, 'steps': 28128, 'loss/train': 2.1188430786132812} -11/07/2021 01:10:01 - INFO - __main__ - Step 28130: {'lr': 0.00046252256171975273, 'samples': 5400960, 'steps': 28129, 'loss/train': 1.036460518836975} -11/07/2021 01:10:02 - INFO - __main__ - Step 28131: {'lr': 0.0004625197669437368, 'samples': 5401152, 'steps': 28130, 'loss/train': 1.5945188999176025} -11/07/2021 01:10:02 - INFO - __main__ - Step 28132: {'lr': 0.0004625169720719628, 'samples': 5401344, 'steps': 28131, 'loss/train': 1.317168951034546} -11/07/2021 01:10:02 - INFO - __main__ - Step 28133: {'lr': 0.0004625141771044319, 'samples': 5401536, 'steps': 28132, 'loss/train': 2.130425453186035} -11/07/2021 01:10:03 - INFO - __main__ - Step 28134: {'lr': 0.0004625113820411454, 'samples': 5401728, 'steps': 28133, 'loss/train': 2.2005603313446045} -11/07/2021 01:10:03 - INFO - __main__ - Step 28135: {'lr': 0.0004625085868821046, 'samples': 5401920, 'steps': 28134, 'loss/train': 2.0499491691589355} -11/07/2021 01:10:04 - INFO - __main__ - Step 28136: {'lr': 0.0004625057916273107, 'samples': 5402112, 'steps': 28135, 'loss/train': 1.384974479675293} -11/07/2021 01:10:04 - INFO - __main__ - Step 28137: {'lr': 0.00046250299627676486, 'samples': 5402304, 'steps': 28136, 'loss/train': 1.0415135622024536} -11/07/2021 01:10:05 - INFO - __main__ - Step 28138: {'lr': 0.0004625002008304685, 'samples': 5402496, 'steps': 28137, 'loss/train': 1.3801599740982056} -11/07/2021 01:10:05 - INFO - __main__ - Step 28139: {'lr': 0.00046249740528842286, 'samples': 5402688, 'steps': 28138, 'loss/train': 1.7484960556030273} -11/07/2021 01:10:06 - INFO - __main__ - Step 28140: {'lr': 0.00046249460965062917, 'samples': 5402880, 'steps': 28139, 'loss/train': 0.8357280492782593} -11/07/2021 01:10:06 - INFO - __main__ - Step 28141: {'lr': 0.0004624918139170887, 'samples': 5403072, 'steps': 28140, 'loss/train': 1.7102713584899902} -11/07/2021 01:10:07 - INFO - __main__ - Step 28142: {'lr': 0.0004624890180878027, 'samples': 5403264, 'steps': 28141, 'loss/train': 1.3664212226867676} -11/07/2021 01:10:07 - INFO - __main__ - Step 28143: {'lr': 0.00046248622216277235, 'samples': 5403456, 'steps': 28142, 'loss/train': 0.8420030474662781} -11/07/2021 01:10:08 - INFO - __main__ - Step 28144: {'lr': 0.0004624834261419991, 'samples': 5403648, 'steps': 28143, 'loss/train': 1.5578577518463135} -11/07/2021 01:10:08 - INFO - __main__ - Step 28145: {'lr': 0.000462480630025484, 'samples': 5403840, 'steps': 28144, 'loss/train': 1.7505838871002197} -11/07/2021 01:10:08 - INFO - __main__ - Step 28146: {'lr': 0.0004624778338132285, 'samples': 5404032, 'steps': 28145, 'loss/train': 1.77066171169281} -11/07/2021 01:10:09 - INFO - __main__ - Step 28147: {'lr': 0.0004624750375052337, 'samples': 5404224, 'steps': 28146, 'loss/train': 1.6351187229156494} -11/07/2021 01:10:10 - INFO - __main__ - Step 28148: {'lr': 0.0004624722411015009, 'samples': 5404416, 'steps': 28147, 'loss/train': 1.363378643989563} -11/07/2021 01:10:10 - INFO - __main__ - Step 28149: {'lr': 0.0004624694446020314, 'samples': 5404608, 'steps': 28148, 'loss/train': 1.5831588506698608} -11/07/2021 01:10:10 - INFO - __main__ - Step 28150: {'lr': 0.0004624666480068265, 'samples': 5404800, 'steps': 28149, 'loss/train': 1.492389440536499} -11/07/2021 01:10:11 - INFO - __main__ - Step 28151: {'lr': 0.0004624638513158874, 'samples': 5404992, 'steps': 28150, 'loss/train': 1.449171543121338} -11/07/2021 01:10:12 - INFO - __main__ - Step 28152: {'lr': 0.0004624610545292154, 'samples': 5405184, 'steps': 28151, 'loss/train': 1.6068949699401855} -11/07/2021 01:10:12 - INFO - __main__ - Step 28153: {'lr': 0.00046245825764681166, 'samples': 5405376, 'steps': 28152, 'loss/train': 1.152055263519287} -11/07/2021 01:10:13 - INFO - __main__ - Step 28154: {'lr': 0.0004624554606686775, 'samples': 5405568, 'steps': 28153, 'loss/train': 1.5159696340560913} -11/07/2021 01:10:13 - INFO - __main__ - Step 28155: {'lr': 0.0004624526635948142, 'samples': 5405760, 'steps': 28154, 'loss/train': 1.4149354696273804} -11/07/2021 01:10:13 - INFO - __main__ - Step 28156: {'lr': 0.000462449866425223, 'samples': 5405952, 'steps': 28155, 'loss/train': 1.441688060760498} -11/07/2021 01:10:14 - INFO - __main__ - Step 28157: {'lr': 0.0004624470691599052, 'samples': 5406144, 'steps': 28156, 'loss/train': 1.7866506576538086} -11/07/2021 01:10:15 - INFO - __main__ - Step 28158: {'lr': 0.00046244427179886207, 'samples': 5406336, 'steps': 28157, 'loss/train': 1.7607122659683228} -11/07/2021 01:10:15 - INFO - __main__ - Step 28159: {'lr': 0.0004624414743420947, 'samples': 5406528, 'steps': 28158, 'loss/train': 0.31811484694480896} -11/07/2021 01:10:15 - INFO - __main__ - Step 28160: {'lr': 0.00046243867678960463, 'samples': 5406720, 'steps': 28159, 'loss/train': 1.0300776958465576} -11/07/2021 01:10:16 - INFO - __main__ - Step 28161: {'lr': 0.00046243587914139285, 'samples': 5406912, 'steps': 28160, 'loss/train': 1.6217018365859985} -11/07/2021 01:10:16 - INFO - __main__ - Step 28162: {'lr': 0.00046243308139746076, 'samples': 5407104, 'steps': 28161, 'loss/train': 1.4089314937591553} -11/07/2021 01:10:17 - INFO - __main__ - Step 28163: {'lr': 0.00046243028355780967, 'samples': 5407296, 'steps': 28162, 'loss/train': 1.966225028038025} -11/07/2021 01:10:18 - INFO - __main__ - Step 28164: {'lr': 0.00046242748562244076, 'samples': 5407488, 'steps': 28163, 'loss/train': 1.695816159248352} -11/07/2021 01:10:18 - INFO - __main__ - Step 28165: {'lr': 0.00046242468759135523, 'samples': 5407680, 'steps': 28164, 'loss/train': 0.20627062022686005} -11/07/2021 01:10:18 - INFO - __main__ - Step 28166: {'lr': 0.00046242188946455444, 'samples': 5407872, 'steps': 28165, 'loss/train': 1.6223536729812622} -11/07/2021 01:10:19 - INFO - __main__ - Step 28167: {'lr': 0.0004624190912420397, 'samples': 5408064, 'steps': 28166, 'loss/train': 1.5699890851974487} -11/07/2021 01:10:20 - INFO - __main__ - Step 28168: {'lr': 0.0004624162929238121, 'samples': 5408256, 'steps': 28167, 'loss/train': 1.6369304656982422} -11/07/2021 01:10:20 - INFO - __main__ - Step 28169: {'lr': 0.000462413494509873, 'samples': 5408448, 'steps': 28168, 'loss/train': 1.537266731262207} -11/07/2021 01:10:20 - INFO - __main__ - Step 28170: {'lr': 0.0004624106960002237, 'samples': 5408640, 'steps': 28169, 'loss/train': 1.0919755697250366} -11/07/2021 01:10:21 - INFO - __main__ - Step 28171: {'lr': 0.0004624078973948654, 'samples': 5408832, 'steps': 28170, 'loss/train': 1.5566425323486328} -11/07/2021 01:10:21 - INFO - __main__ - Step 28172: {'lr': 0.00046240509869379943, 'samples': 5409024, 'steps': 28171, 'loss/train': 1.5323331356048584} -11/07/2021 01:10:22 - INFO - __main__ - Step 28173: {'lr': 0.00046240229989702697, 'samples': 5409216, 'steps': 28172, 'loss/train': 1.5322365760803223} -11/07/2021 01:10:22 - INFO - __main__ - Step 28174: {'lr': 0.0004623995010045493, 'samples': 5409408, 'steps': 28173, 'loss/train': 0.9593502879142761} -11/07/2021 01:10:23 - INFO - __main__ - Step 28175: {'lr': 0.0004623967020163677, 'samples': 5409600, 'steps': 28174, 'loss/train': 1.6781811714172363} -11/07/2021 01:10:23 - INFO - __main__ - Step 28176: {'lr': 0.0004623939029324834, 'samples': 5409792, 'steps': 28175, 'loss/train': 1.395211935043335} -11/07/2021 01:10:23 - INFO - __main__ - Step 28177: {'lr': 0.0004623911037528977, 'samples': 5409984, 'steps': 28176, 'loss/train': 1.3277342319488525} -11/07/2021 01:10:25 - INFO - __main__ - Step 28178: {'lr': 0.00046238830447761184, 'samples': 5410176, 'steps': 28177, 'loss/train': 1.2456005811691284} -11/07/2021 01:10:25 - INFO - __main__ - Step 28179: {'lr': 0.0004623855051066271, 'samples': 5410368, 'steps': 28178, 'loss/train': 1.7877765893936157} -11/07/2021 01:10:25 - INFO - __main__ - Step 28180: {'lr': 0.00046238270563994465, 'samples': 5410560, 'steps': 28179, 'loss/train': 1.342936635017395} -11/07/2021 01:10:26 - INFO - __main__ - Step 28181: {'lr': 0.00046237990607756596, 'samples': 5410752, 'steps': 28180, 'loss/train': 1.268366813659668} -11/07/2021 01:10:26 - INFO - __main__ - Step 28182: {'lr': 0.0004623771064194921, 'samples': 5410944, 'steps': 28181, 'loss/train': 1.347800612449646} -11/07/2021 01:10:27 - INFO - __main__ - Step 28183: {'lr': 0.0004623743066657244, 'samples': 5411136, 'steps': 28182, 'loss/train': 0.17466305196285248} -11/07/2021 01:10:27 - INFO - __main__ - Step 28184: {'lr': 0.00046237150681626414, 'samples': 5411328, 'steps': 28183, 'loss/train': 1.1365277767181396} -11/07/2021 01:10:28 - INFO - __main__ - Step 28185: {'lr': 0.00046236870687111254, 'samples': 5411520, 'steps': 28184, 'loss/train': 0.9038922786712646} -11/07/2021 01:10:28 - INFO - __main__ - Step 28186: {'lr': 0.0004623659068302708, 'samples': 5411712, 'steps': 28185, 'loss/train': 1.4337131977081299} -11/07/2021 01:10:28 - INFO - __main__ - Step 28187: {'lr': 0.00046236310669374035, 'samples': 5411904, 'steps': 28186, 'loss/train': 2.480987071990967} -11/07/2021 01:10:30 - INFO - __main__ - Step 28188: {'lr': 0.0004623603064615223, 'samples': 5412096, 'steps': 28187, 'loss/train': 1.4874110221862793} -11/07/2021 01:10:30 - INFO - __main__ - Step 28189: {'lr': 0.000462357506133618, 'samples': 5412288, 'steps': 28188, 'loss/train': 2.2280004024505615} -11/07/2021 01:10:30 - INFO - __main__ - Step 28190: {'lr': 0.00046235470571002877, 'samples': 5412480, 'steps': 28189, 'loss/train': 1.6419894695281982} -11/07/2021 01:10:31 - INFO - __main__ - Step 28191: {'lr': 0.00046235190519075564, 'samples': 5412672, 'steps': 28190, 'loss/train': 1.4072515964508057} -11/07/2021 01:10:31 - INFO - __main__ - Step 28192: {'lr': 0.00046234910457580014, 'samples': 5412864, 'steps': 28191, 'loss/train': 1.2326654195785522} -11/07/2021 01:10:31 - INFO - __main__ - Step 28193: {'lr': 0.0004623463038651633, 'samples': 5413056, 'steps': 28192, 'loss/train': 5.861023902893066} -11/07/2021 01:10:32 - INFO - __main__ - Step 28194: {'lr': 0.0004623435030588466, 'samples': 5413248, 'steps': 28193, 'loss/train': 5.822354316711426} -11/07/2021 01:10:33 - INFO - __main__ - Step 28195: {'lr': 0.00046234070215685116, 'samples': 5413440, 'steps': 28194, 'loss/train': 0.5922368168830872} -11/07/2021 01:10:33 - INFO - __main__ - Step 28196: {'lr': 0.0004623379011591782, 'samples': 5413632, 'steps': 28195, 'loss/train': 1.4715194702148438} -11/07/2021 01:10:33 - INFO - __main__ - Step 28197: {'lr': 0.00046233510006582913, 'samples': 5413824, 'steps': 28196, 'loss/train': 1.698293924331665} -11/07/2021 01:10:34 - INFO - __main__ - Step 28198: {'lr': 0.00046233229887680517, 'samples': 5414016, 'steps': 28197, 'loss/train': 1.3359768390655518} -11/07/2021 01:10:34 - INFO - __main__ - Step 28199: {'lr': 0.00046232949759210753, 'samples': 5414208, 'steps': 28198, 'loss/train': 1.5249158143997192} -11/07/2021 01:10:35 - INFO - __main__ - Step 28200: {'lr': 0.00046232669621173745, 'samples': 5414400, 'steps': 28199, 'loss/train': 1.369057297706604} -11/07/2021 01:10:36 - INFO - __main__ - Step 28201: {'lr': 0.00046232389473569623, 'samples': 5414592, 'steps': 28200, 'loss/train': 1.5750991106033325} -11/07/2021 01:10:36 - INFO - __main__ - Step 28202: {'lr': 0.0004623210931639852, 'samples': 5414784, 'steps': 28201, 'loss/train': 1.4961779117584229} -11/07/2021 01:10:36 - INFO - __main__ - Step 28203: {'lr': 0.00046231829149660553, 'samples': 5414976, 'steps': 28202, 'loss/train': 1.7517107725143433} -11/07/2021 01:10:37 - INFO - __main__ - Step 28204: {'lr': 0.00046231548973355854, 'samples': 5415168, 'steps': 28203, 'loss/train': 1.505367398262024} -11/07/2021 01:10:38 - INFO - __main__ - Step 28205: {'lr': 0.00046231268787484545, 'samples': 5415360, 'steps': 28204, 'loss/train': 1.7063173055648804} -11/07/2021 01:10:38 - INFO - __main__ - Step 28206: {'lr': 0.0004623098859204675, 'samples': 5415552, 'steps': 28205, 'loss/train': 1.0347256660461426} -11/07/2021 01:10:39 - INFO - __main__ - Step 28207: {'lr': 0.00046230708387042603, 'samples': 5415744, 'steps': 28206, 'loss/train': 1.5646445751190186} -11/07/2021 01:10:39 - INFO - __main__ - Step 28208: {'lr': 0.0004623042817247223, 'samples': 5415936, 'steps': 28207, 'loss/train': 1.6940830945968628} -11/07/2021 01:10:39 - INFO - __main__ - Step 28209: {'lr': 0.00046230147948335746, 'samples': 5416128, 'steps': 28208, 'loss/train': 0.8263731598854065} -11/07/2021 01:10:40 - INFO - __main__ - Step 28210: {'lr': 0.0004622986771463329, 'samples': 5416320, 'steps': 28209, 'loss/train': 0.4169537127017975} -11/07/2021 01:10:41 - INFO - __main__ - Step 28211: {'lr': 0.0004622958747136498, 'samples': 5416512, 'steps': 28210, 'loss/train': 1.35165536403656} -11/07/2021 01:10:41 - INFO - __main__ - Step 28212: {'lr': 0.00046229307218530945, 'samples': 5416704, 'steps': 28211, 'loss/train': 1.235717535018921} -11/07/2021 01:10:41 - INFO - __main__ - Step 28213: {'lr': 0.0004622902695613131, 'samples': 5416896, 'steps': 28212, 'loss/train': 0.730085551738739} -11/07/2021 01:10:42 - INFO - __main__ - Step 28214: {'lr': 0.00046228746684166214, 'samples': 5417088, 'steps': 28213, 'loss/train': 1.573953628540039} -11/07/2021 01:10:43 - INFO - __main__ - Step 28215: {'lr': 0.00046228466402635764, 'samples': 5417280, 'steps': 28214, 'loss/train': 1.9090080261230469} -11/07/2021 01:10:43 - INFO - __main__ - Step 28216: {'lr': 0.0004622818611154009, 'samples': 5417472, 'steps': 28215, 'loss/train': 0.8026754856109619} -11/07/2021 01:10:43 - INFO - __main__ - Step 28217: {'lr': 0.00046227905810879334, 'samples': 5417664, 'steps': 28216, 'loss/train': 1.769519329071045} -11/07/2021 01:10:44 - INFO - __main__ - Step 28218: {'lr': 0.0004622762550065361, 'samples': 5417856, 'steps': 28217, 'loss/train': 1.2289551496505737} -11/07/2021 01:10:44 - INFO - __main__ - Step 28219: {'lr': 0.0004622734518086304, 'samples': 5418048, 'steps': 28218, 'loss/train': 1.9097330570220947} -11/07/2021 01:10:45 - INFO - __main__ - Step 28220: {'lr': 0.0004622706485150776, 'samples': 5418240, 'steps': 28219, 'loss/train': 1.358104944229126} -11/07/2021 01:10:46 - INFO - __main__ - Step 28221: {'lr': 0.0004622678451258788, 'samples': 5418432, 'steps': 28220, 'loss/train': 1.5007022619247437} -11/07/2021 01:10:46 - INFO - __main__ - Step 28222: {'lr': 0.00046226504164103557, 'samples': 5418624, 'steps': 28221, 'loss/train': 1.2808752059936523} -11/07/2021 01:10:46 - INFO - __main__ - Step 28223: {'lr': 0.0004622622380605489, 'samples': 5418816, 'steps': 28222, 'loss/train': 1.0220810174942017} -11/07/2021 01:10:47 - INFO - __main__ - Step 28224: {'lr': 0.0004622594343844201, 'samples': 5419008, 'steps': 28223, 'loss/train': 1.1426414251327515} -11/07/2021 01:10:47 - INFO - __main__ - Step 28225: {'lr': 0.00046225663061265056, 'samples': 5419200, 'steps': 28224, 'loss/train': 1.3588509559631348} -11/07/2021 01:10:48 - INFO - __main__ - Step 28226: {'lr': 0.0004622538267452414, 'samples': 5419392, 'steps': 28225, 'loss/train': 1.5352381467819214} -11/07/2021 01:10:48 - INFO - __main__ - Step 28227: {'lr': 0.00046225102278219394, 'samples': 5419584, 'steps': 28226, 'loss/train': 1.7459994554519653} -11/07/2021 01:10:49 - INFO - __main__ - Step 28228: {'lr': 0.0004622482187235094, 'samples': 5419776, 'steps': 28227, 'loss/train': 1.6979622840881348} -11/07/2021 01:10:49 - INFO - __main__ - Step 28229: {'lr': 0.00046224541456918916, 'samples': 5419968, 'steps': 28228, 'loss/train': 1.3146947622299194} -11/07/2021 01:10:49 - INFO - __main__ - Step 28230: {'lr': 0.0004622426103192344, 'samples': 5420160, 'steps': 28229, 'loss/train': 1.72724187374115} -11/07/2021 01:10:50 - INFO - __main__ - Step 28231: {'lr': 0.00046223980597364647, 'samples': 5420352, 'steps': 28230, 'loss/train': 1.4171353578567505} -11/07/2021 01:10:51 - INFO - __main__ - Step 28232: {'lr': 0.0004622370015324264, 'samples': 5420544, 'steps': 28231, 'loss/train': 1.5277044773101807} -11/07/2021 01:10:51 - INFO - __main__ - Step 28233: {'lr': 0.0004622341969955757, 'samples': 5420736, 'steps': 28232, 'loss/train': 1.284793734550476} -11/07/2021 01:10:51 - INFO - __main__ - Step 28234: {'lr': 0.00046223139236309553, 'samples': 5420928, 'steps': 28233, 'loss/train': 1.54947030544281} -11/07/2021 01:10:52 - INFO - __main__ - Step 28235: {'lr': 0.0004622285876349872, 'samples': 5421120, 'steps': 28234, 'loss/train': 2.010934591293335} -11/07/2021 01:10:53 - INFO - __main__ - Step 28236: {'lr': 0.00046222578281125194, 'samples': 5421312, 'steps': 28235, 'loss/train': 1.3534091711044312} -11/07/2021 01:10:53 - INFO - __main__ - Step 28237: {'lr': 0.0004622229778918909, 'samples': 5421504, 'steps': 28236, 'loss/train': 1.2735710144042969} -11/07/2021 01:10:53 - INFO - __main__ - Step 28238: {'lr': 0.00046222017287690566, 'samples': 5421696, 'steps': 28237, 'loss/train': 1.203763484954834} -11/07/2021 01:10:54 - INFO - __main__ - Step 28239: {'lr': 0.00046221736776629713, 'samples': 5421888, 'steps': 28238, 'loss/train': 2.086308002471924} -11/07/2021 01:10:54 - INFO - __main__ - Step 28240: {'lr': 0.0004622145625600668, 'samples': 5422080, 'steps': 28239, 'loss/train': 1.3777828216552734} -11/07/2021 01:10:55 - INFO - __main__ - Step 28241: {'lr': 0.00046221175725821585, 'samples': 5422272, 'steps': 28240, 'loss/train': 1.2123701572418213} -11/07/2021 01:10:55 - INFO - __main__ - Step 28242: {'lr': 0.00046220895186074553, 'samples': 5422464, 'steps': 28241, 'loss/train': 1.9083006381988525} -11/07/2021 01:10:56 - INFO - __main__ - Step 28243: {'lr': 0.0004622061463676572, 'samples': 5422656, 'steps': 28242, 'loss/train': 1.196201205253601} -11/07/2021 01:10:56 - INFO - __main__ - Step 28244: {'lr': 0.000462203340778952, 'samples': 5422848, 'steps': 28243, 'loss/train': 1.1842589378356934} -11/07/2021 01:10:57 - INFO - __main__ - Step 28245: {'lr': 0.0004622005350946312, 'samples': 5423040, 'steps': 28244, 'loss/train': 1.2179888486862183} -11/07/2021 01:10:57 - INFO - __main__ - Step 28246: {'lr': 0.00046219772931469617, 'samples': 5423232, 'steps': 28245, 'loss/train': 1.2169467210769653} -11/07/2021 01:10:58 - INFO - __main__ - Step 28247: {'lr': 0.00046219492343914815, 'samples': 5423424, 'steps': 28246, 'loss/train': 1.2924308776855469} -11/07/2021 01:10:58 - INFO - __main__ - Step 28248: {'lr': 0.00046219211746798835, 'samples': 5423616, 'steps': 28247, 'loss/train': 1.3133745193481445} -11/07/2021 01:10:59 - INFO - __main__ - Step 28249: {'lr': 0.000462189311401218, 'samples': 5423808, 'steps': 28248, 'loss/train': 0.5545594096183777} -11/07/2021 01:10:59 - INFO - __main__ - Step 28250: {'lr': 0.0004621865052388385, 'samples': 5424000, 'steps': 28249, 'loss/train': 1.7208218574523926} -11/07/2021 01:11:00 - INFO - __main__ - Step 28251: {'lr': 0.00046218369898085097, 'samples': 5424192, 'steps': 28250, 'loss/train': 1.277891755104065} -11/07/2021 01:11:00 - INFO - __main__ - Step 28252: {'lr': 0.0004621808926272568, 'samples': 5424384, 'steps': 28251, 'loss/train': 1.8041847944259644} -11/07/2021 01:11:01 - INFO - __main__ - Step 28253: {'lr': 0.0004621780861780572, 'samples': 5424576, 'steps': 28252, 'loss/train': 1.4097659587860107} -11/07/2021 01:11:01 - INFO - __main__ - Step 28254: {'lr': 0.00046217527963325335, 'samples': 5424768, 'steps': 28253, 'loss/train': 1.9377212524414062} -11/07/2021 01:11:01 - INFO - __main__ - Step 28255: {'lr': 0.00046217247299284666, 'samples': 5424960, 'steps': 28254, 'loss/train': 2.2206597328186035} -11/07/2021 01:11:02 - INFO - __main__ - Step 28256: {'lr': 0.00046216966625683834, 'samples': 5425152, 'steps': 28255, 'loss/train': 0.9910633563995361} -11/07/2021 01:11:03 - INFO - __main__ - Step 28257: {'lr': 0.00046216685942522957, 'samples': 5425344, 'steps': 28256, 'loss/train': 1.0055487155914307} -11/07/2021 01:11:03 - INFO - __main__ - Step 28258: {'lr': 0.00046216405249802176, 'samples': 5425536, 'steps': 28257, 'loss/train': 1.5653692483901978} -11/07/2021 01:11:04 - INFO - __main__ - Step 28259: {'lr': 0.000462161245475216, 'samples': 5425728, 'steps': 28258, 'loss/train': 2.771857976913452} -11/07/2021 01:11:04 - INFO - __main__ - Step 28260: {'lr': 0.0004621584383568137, 'samples': 5425920, 'steps': 28259, 'loss/train': 0.6507758498191833} -11/07/2021 01:11:04 - INFO - __main__ - Step 28261: {'lr': 0.00046215563114281613, 'samples': 5426112, 'steps': 28260, 'loss/train': 1.4386929273605347} -11/07/2021 01:11:06 - INFO - __main__ - Step 28262: {'lr': 0.0004621528238332245, 'samples': 5426304, 'steps': 28261, 'loss/train': 1.5386488437652588} -11/07/2021 01:11:06 - INFO - __main__ - Step 28263: {'lr': 0.00046215001642804, 'samples': 5426496, 'steps': 28262, 'loss/train': 1.4531859159469604} -11/07/2021 01:11:06 - INFO - __main__ - Step 28264: {'lr': 0.0004621472089272641, 'samples': 5426688, 'steps': 28263, 'loss/train': 1.2668935060501099} -11/07/2021 01:11:07 - INFO - __main__ - Step 28265: {'lr': 0.0004621444013308979, 'samples': 5426880, 'steps': 28264, 'loss/train': 1.032285451889038} -11/07/2021 01:11:07 - INFO - __main__ - Step 28266: {'lr': 0.00046214159363894264, 'samples': 5427072, 'steps': 28265, 'loss/train': 1.93840491771698} -11/07/2021 01:11:08 - INFO - __main__ - Step 28267: {'lr': 0.0004621387858513997, 'samples': 5427264, 'steps': 28266, 'loss/train': 0.8712663650512695} -11/07/2021 01:11:08 - INFO - __main__ - Step 28268: {'lr': 0.0004621359779682703, 'samples': 5427456, 'steps': 28267, 'loss/train': 1.6369661092758179} -11/07/2021 01:11:09 - INFO - __main__ - Step 28269: {'lr': 0.0004621331699895557, 'samples': 5427648, 'steps': 28268, 'loss/train': 1.922584056854248} -11/07/2021 01:11:09 - INFO - __main__ - Step 28270: {'lr': 0.00046213036191525714, 'samples': 5427840, 'steps': 28269, 'loss/train': 1.4946922063827515} -11/07/2021 01:11:09 - INFO - __main__ - Step 28271: {'lr': 0.00046212755374537594, 'samples': 5428032, 'steps': 28270, 'loss/train': 1.5393568277359009} -11/07/2021 01:11:10 - INFO - __main__ - Step 28272: {'lr': 0.0004621247454799133, 'samples': 5428224, 'steps': 28271, 'loss/train': 1.8413314819335938} -11/07/2021 01:11:11 - INFO - __main__ - Step 28273: {'lr': 0.0004621219371188706, 'samples': 5428416, 'steps': 28272, 'loss/train': 1.6785149574279785} -11/07/2021 01:11:11 - INFO - __main__ - Step 28274: {'lr': 0.0004621191286622489, 'samples': 5428608, 'steps': 28273, 'loss/train': 1.8030606508255005} -11/07/2021 01:11:11 - INFO - __main__ - Step 28275: {'lr': 0.00046211632011004973, 'samples': 5428800, 'steps': 28274, 'loss/train': 1.560758113861084} -11/07/2021 01:11:12 - INFO - __main__ - Step 28276: {'lr': 0.0004621135114622742, 'samples': 5428992, 'steps': 28275, 'loss/train': 1.2767295837402344} -11/07/2021 01:11:13 - INFO - __main__ - Step 28277: {'lr': 0.00046211070271892353, 'samples': 5429184, 'steps': 28276, 'loss/train': 1.8365651369094849} -11/07/2021 01:11:13 - INFO - __main__ - Step 28278: {'lr': 0.00046210789387999906, 'samples': 5429376, 'steps': 28277, 'loss/train': 1.224928379058838} -11/07/2021 01:11:13 - INFO - __main__ - Step 28279: {'lr': 0.00046210508494550206, 'samples': 5429568, 'steps': 28278, 'loss/train': 1.620279312133789} -11/07/2021 01:11:14 - INFO - __main__ - Step 28280: {'lr': 0.0004621022759154338, 'samples': 5429760, 'steps': 28279, 'loss/train': 1.5172548294067383} -11/07/2021 01:11:14 - INFO - __main__ - Step 28281: {'lr': 0.0004620994667897955, 'samples': 5429952, 'steps': 28280, 'loss/train': 1.7610883712768555} -11/07/2021 01:11:15 - INFO - __main__ - Step 28282: {'lr': 0.0004620966575685885, 'samples': 5430144, 'steps': 28281, 'loss/train': 1.4005475044250488} -11/07/2021 01:11:16 - INFO - __main__ - Step 28283: {'lr': 0.000462093848251814, 'samples': 5430336, 'steps': 28282, 'loss/train': 1.6726186275482178} -11/07/2021 01:11:16 - INFO - __main__ - Step 28284: {'lr': 0.00046209103883947323, 'samples': 5430528, 'steps': 28283, 'loss/train': 1.5743645429611206} -11/07/2021 01:11:16 - INFO - __main__ - Step 28285: {'lr': 0.00046208822933156756, 'samples': 5430720, 'steps': 28284, 'loss/train': 1.523167371749878} -11/07/2021 01:11:17 - INFO - __main__ - Step 28286: {'lr': 0.00046208541972809824, 'samples': 5430912, 'steps': 28285, 'loss/train': 1.5007579326629639} -11/07/2021 01:11:17 - INFO - __main__ - Step 28287: {'lr': 0.00046208261002906643, 'samples': 5431104, 'steps': 28286, 'loss/train': 1.5673551559448242} -11/07/2021 01:11:18 - INFO - __main__ - Step 28288: {'lr': 0.00046207980023447347, 'samples': 5431296, 'steps': 28287, 'loss/train': 1.0199003219604492} -11/07/2021 01:11:18 - INFO - __main__ - Step 28289: {'lr': 0.0004620769903443207, 'samples': 5431488, 'steps': 28288, 'loss/train': 1.2680659294128418} -11/07/2021 01:11:19 - INFO - __main__ - Step 28290: {'lr': 0.00046207418035860927, 'samples': 5431680, 'steps': 28289, 'loss/train': 1.4011750221252441} -11/07/2021 01:11:19 - INFO - __main__ - Step 28291: {'lr': 0.00046207137027734046, 'samples': 5431872, 'steps': 28290, 'loss/train': 1.3798640966415405} -11/07/2021 01:11:19 - INFO - __main__ - Step 28292: {'lr': 0.00046206856010051555, 'samples': 5432064, 'steps': 28291, 'loss/train': 1.6333099603652954} -11/07/2021 01:11:20 - INFO - __main__ - Step 28293: {'lr': 0.0004620657498281359, 'samples': 5432256, 'steps': 28292, 'loss/train': 1.6269264221191406} -11/07/2021 01:11:21 - INFO - __main__ - Step 28294: {'lr': 0.0004620629394602027, 'samples': 5432448, 'steps': 28293, 'loss/train': 1.6605522632598877} -11/07/2021 01:11:21 - INFO - __main__ - Step 28295: {'lr': 0.00046206012899671715, 'samples': 5432640, 'steps': 28294, 'loss/train': 1.629433035850525} -11/07/2021 01:11:21 - INFO - __main__ - Step 28296: {'lr': 0.00046205731843768056, 'samples': 5432832, 'steps': 28295, 'loss/train': 1.2553709745407104} -11/07/2021 01:11:22 - INFO - __main__ - Step 28297: {'lr': 0.0004620545077830942, 'samples': 5433024, 'steps': 28296, 'loss/train': 1.2244160175323486} -11/07/2021 01:11:23 - INFO - __main__ - Step 28298: {'lr': 0.00046205169703295945, 'samples': 5433216, 'steps': 28297, 'loss/train': 1.3817449808120728} -11/07/2021 01:11:24 - INFO - __main__ - Step 28299: {'lr': 0.00046204888618727743, 'samples': 5433408, 'steps': 28298, 'loss/train': 2.1621477603912354} -11/07/2021 01:11:24 - INFO - __main__ - Step 28300: {'lr': 0.00046204607524604944, 'samples': 5433600, 'steps': 28299, 'loss/train': 1.4274929761886597} -11/07/2021 01:11:24 - INFO - __main__ - Step 28301: {'lr': 0.0004620432642092768, 'samples': 5433792, 'steps': 28300, 'loss/train': 0.30110833048820496} -11/07/2021 01:11:25 - INFO - __main__ - Step 28302: {'lr': 0.00046204045307696065, 'samples': 5433984, 'steps': 28301, 'loss/train': 1.907424807548523} -11/07/2021 01:11:26 - INFO - __main__ - Step 28303: {'lr': 0.0004620376418491024, 'samples': 5434176, 'steps': 28302, 'loss/train': 1.513163447380066} -11/07/2021 01:11:26 - INFO - __main__ - Step 28304: {'lr': 0.0004620348305257033, 'samples': 5434368, 'steps': 28303, 'loss/train': 1.9480259418487549} -11/07/2021 01:11:27 - INFO - __main__ - Step 28305: {'lr': 0.00046203201910676453, 'samples': 5434560, 'steps': 28304, 'loss/train': 1.8017507791519165} -11/07/2021 01:11:27 - INFO - __main__ - Step 28306: {'lr': 0.0004620292075922874, 'samples': 5434752, 'steps': 28305, 'loss/train': 1.4269638061523438} -11/07/2021 01:11:27 - INFO - __main__ - Step 28307: {'lr': 0.0004620263959822732, 'samples': 5434944, 'steps': 28306, 'loss/train': 1.9615912437438965} -11/07/2021 01:11:28 - INFO - __main__ - Step 28308: {'lr': 0.00046202358427672313, 'samples': 5435136, 'steps': 28307, 'loss/train': 1.8395740985870361} -11/07/2021 01:11:29 - INFO - __main__ - Step 28309: {'lr': 0.0004620207724756386, 'samples': 5435328, 'steps': 28308, 'loss/train': 0.8543437719345093} -11/07/2021 01:11:29 - INFO - __main__ - Step 28310: {'lr': 0.0004620179605790207, 'samples': 5435520, 'steps': 28309, 'loss/train': 1.6621850728988647} -11/07/2021 01:11:29 - INFO - __main__ - Step 28311: {'lr': 0.00046201514858687075, 'samples': 5435712, 'steps': 28310, 'loss/train': 1.4606200456619263} -11/07/2021 01:11:30 - INFO - __main__ - Step 28312: {'lr': 0.00046201233649919015, 'samples': 5435904, 'steps': 28311, 'loss/train': 2.1351730823516846} -11/07/2021 01:11:31 - INFO - __main__ - Step 28313: {'lr': 0.00046200952431598, 'samples': 5436096, 'steps': 28312, 'loss/train': 1.5596314668655396} -11/07/2021 01:11:31 - INFO - __main__ - Step 28314: {'lr': 0.00046200671203724166, 'samples': 5436288, 'steps': 28313, 'loss/train': 1.620673418045044} -11/07/2021 01:11:31 - INFO - __main__ - Step 28315: {'lr': 0.00046200389966297633, 'samples': 5436480, 'steps': 28314, 'loss/train': 1.219846248626709} -11/07/2021 01:11:32 - INFO - __main__ - Step 28316: {'lr': 0.00046200108719318537, 'samples': 5436672, 'steps': 28315, 'loss/train': 1.4547991752624512} -11/07/2021 01:11:32 - INFO - __main__ - Step 28317: {'lr': 0.0004619982746278699, 'samples': 5436864, 'steps': 28316, 'loss/train': 1.4756008386611938} -11/07/2021 01:11:33 - INFO - __main__ - Step 28318: {'lr': 0.00046199546196703134, 'samples': 5437056, 'steps': 28317, 'loss/train': 1.5366729497909546} -11/07/2021 01:11:34 - INFO - __main__ - Step 28319: {'lr': 0.0004619926492106709, 'samples': 5437248, 'steps': 28318, 'loss/train': 1.4585894346237183} -11/07/2021 01:11:34 - INFO - __main__ - Step 28320: {'lr': 0.0004619898363587899, 'samples': 5437440, 'steps': 28319, 'loss/train': 1.9013971090316772} -11/07/2021 01:11:34 - INFO - __main__ - Step 28321: {'lr': 0.00046198702341138944, 'samples': 5437632, 'steps': 28320, 'loss/train': 1.7438561916351318} -11/07/2021 01:11:35 - INFO - __main__ - Step 28322: {'lr': 0.00046198421036847093, 'samples': 5437824, 'steps': 28321, 'loss/train': 1.4920424222946167} -11/07/2021 01:11:35 - INFO - __main__ - Step 28323: {'lr': 0.00046198139723003563, 'samples': 5438016, 'steps': 28322, 'loss/train': 0.998529851436615} -11/07/2021 01:11:36 - INFO - __main__ - Step 28324: {'lr': 0.00046197858399608477, 'samples': 5438208, 'steps': 28323, 'loss/train': 1.9227137565612793} -11/07/2021 01:11:36 - INFO - __main__ - Step 28325: {'lr': 0.00046197577066661965, 'samples': 5438400, 'steps': 28324, 'loss/train': 1.6951842308044434} -11/07/2021 01:11:37 - INFO - __main__ - Step 28326: {'lr': 0.0004619729572416415, 'samples': 5438592, 'steps': 28325, 'loss/train': 1.8733631372451782} -11/07/2021 01:11:37 - INFO - __main__ - Step 28327: {'lr': 0.0004619701437211516, 'samples': 5438784, 'steps': 28326, 'loss/train': 1.6878166198730469} -11/07/2021 01:11:37 - INFO - __main__ - Step 28328: {'lr': 0.00046196733010515125, 'samples': 5438976, 'steps': 28327, 'loss/train': 1.9754751920700073} -11/07/2021 01:11:38 - INFO - __main__ - Step 28329: {'lr': 0.0004619645163936417, 'samples': 5439168, 'steps': 28328, 'loss/train': 1.7113882303237915} -11/07/2021 01:11:39 - INFO - __main__ - Step 28330: {'lr': 0.0004619617025866242, 'samples': 5439360, 'steps': 28329, 'loss/train': 0.6419276595115662} -11/07/2021 01:11:39 - INFO - __main__ - Step 28331: {'lr': 0.00046195888868409994, 'samples': 5439552, 'steps': 28330, 'loss/train': 1.6990545988082886} -11/07/2021 01:11:39 - INFO - __main__ - Step 28332: {'lr': 0.0004619560746860704, 'samples': 5439744, 'steps': 28331, 'loss/train': 1.4887057542800903} -11/07/2021 01:11:40 - INFO - __main__ - Step 28333: {'lr': 0.0004619532605925366, 'samples': 5439936, 'steps': 28332, 'loss/train': 1.4601359367370605} -11/07/2021 01:11:41 - INFO - __main__ - Step 28334: {'lr': 0.00046195044640350003, 'samples': 5440128, 'steps': 28333, 'loss/train': 1.3070403337478638} -11/07/2021 01:11:41 - INFO - __main__ - Step 28335: {'lr': 0.00046194763211896187, 'samples': 5440320, 'steps': 28334, 'loss/train': 1.5026382207870483} -11/07/2021 01:11:42 - INFO - __main__ - Step 28336: {'lr': 0.0004619448177389233, 'samples': 5440512, 'steps': 28335, 'loss/train': 1.9780086278915405} -11/07/2021 01:11:42 - INFO - __main__ - Step 28337: {'lr': 0.0004619420032633857, 'samples': 5440704, 'steps': 28336, 'loss/train': 1.5093754529953003} -11/07/2021 01:11:42 - INFO - __main__ - Step 28338: {'lr': 0.0004619391886923503, 'samples': 5440896, 'steps': 28337, 'loss/train': 1.0746419429779053} -11/07/2021 01:11:43 - INFO - __main__ - Step 28339: {'lr': 0.0004619363740258184, 'samples': 5441088, 'steps': 28338, 'loss/train': 1.0466197729110718} -11/07/2021 01:11:44 - INFO - __main__ - Step 28340: {'lr': 0.00046193355926379124, 'samples': 5441280, 'steps': 28339, 'loss/train': 1.5124543905258179} -11/07/2021 01:11:44 - INFO - __main__ - Step 28341: {'lr': 0.00046193074440627, 'samples': 5441472, 'steps': 28340, 'loss/train': 1.259055733680725} -11/07/2021 01:11:44 - INFO - __main__ - Step 28342: {'lr': 0.0004619279294532561, 'samples': 5441664, 'steps': 28341, 'loss/train': 1.285418152809143} -11/07/2021 01:11:45 - INFO - __main__ - Step 28343: {'lr': 0.00046192511440475083, 'samples': 5441856, 'steps': 28342, 'loss/train': 1.717706561088562} -11/07/2021 01:11:46 - INFO - __main__ - Step 28344: {'lr': 0.00046192229926075526, 'samples': 5442048, 'steps': 28343, 'loss/train': 1.809889316558838} -11/07/2021 01:11:46 - INFO - __main__ - Step 28345: {'lr': 0.0004619194840212708, 'samples': 5442240, 'steps': 28344, 'loss/train': 1.3425153493881226} -11/07/2021 01:11:47 - INFO - __main__ - Step 28346: {'lr': 0.0004619166686862987, 'samples': 5442432, 'steps': 28345, 'loss/train': 1.6994646787643433} -11/07/2021 01:11:47 - INFO - __main__ - Step 28347: {'lr': 0.0004619138532558402, 'samples': 5442624, 'steps': 28346, 'loss/train': 1.3344404697418213} -11/07/2021 01:11:47 - INFO - __main__ - Step 28348: {'lr': 0.00046191103772989664, 'samples': 5442816, 'steps': 28347, 'loss/train': 2.1455984115600586} -11/07/2021 01:11:48 - INFO - __main__ - Step 28349: {'lr': 0.00046190822210846917, 'samples': 5443008, 'steps': 28348, 'loss/train': 1.6893006563186646} -11/07/2021 01:11:49 - INFO - __main__ - Step 28350: {'lr': 0.0004619054063915592, 'samples': 5443200, 'steps': 28349, 'loss/train': 2.1755573749542236} -11/07/2021 01:11:49 - INFO - __main__ - Step 28351: {'lr': 0.00046190259057916786, 'samples': 5443392, 'steps': 28350, 'loss/train': 1.812320351600647} -11/07/2021 01:11:49 - INFO - __main__ - Step 28352: {'lr': 0.0004618997746712965, 'samples': 5443584, 'steps': 28351, 'loss/train': 1.5001801252365112} -11/07/2021 01:11:50 - INFO - __main__ - Step 28353: {'lr': 0.00046189695866794635, 'samples': 5443776, 'steps': 28352, 'loss/train': 1.3247753381729126} -11/07/2021 01:11:50 - INFO - __main__ - Step 28354: {'lr': 0.00046189414256911875, 'samples': 5443968, 'steps': 28353, 'loss/train': 1.6866405010223389} -11/07/2021 01:11:51 - INFO - __main__ - Step 28355: {'lr': 0.0004618913263748149, 'samples': 5444160, 'steps': 28354, 'loss/train': 1.6076704263687134} -11/07/2021 01:11:52 - INFO - __main__ - Step 28356: {'lr': 0.0004618885100850361, 'samples': 5444352, 'steps': 28355, 'loss/train': 1.0575443506240845} -11/07/2021 01:11:52 - INFO - __main__ - Step 28357: {'lr': 0.0004618856936997836, 'samples': 5444544, 'steps': 28356, 'loss/train': 1.492514729499817} -11/07/2021 01:11:52 - INFO - __main__ - Step 28358: {'lr': 0.0004618828772190586, 'samples': 5444736, 'steps': 28357, 'loss/train': 0.2902561128139496} -11/07/2021 01:11:53 - INFO - __main__ - Step 28359: {'lr': 0.0004618800606428626, 'samples': 5444928, 'steps': 28358, 'loss/train': 1.3694254159927368} -11/07/2021 01:11:53 - INFO - __main__ - Step 28360: {'lr': 0.00046187724397119657, 'samples': 5445120, 'steps': 28359, 'loss/train': 1.4556535482406616} -11/07/2021 01:11:54 - INFO - __main__ - Step 28361: {'lr': 0.000461874427204062, 'samples': 5445312, 'steps': 28360, 'loss/train': 1.813988447189331} -11/07/2021 01:11:55 - INFO - __main__ - Step 28362: {'lr': 0.00046187161034146, 'samples': 5445504, 'steps': 28361, 'loss/train': 0.8661501407623291} -11/07/2021 01:11:55 - INFO - __main__ - Step 28363: {'lr': 0.00046186879338339207, 'samples': 5445696, 'steps': 28362, 'loss/train': 1.7381328344345093} -11/07/2021 01:11:55 - INFO - __main__ - Step 28364: {'lr': 0.0004618659763298592, 'samples': 5445888, 'steps': 28363, 'loss/train': 1.5734864473342896} -11/07/2021 01:11:56 - INFO - __main__ - Step 28365: {'lr': 0.00046186315918086285, 'samples': 5446080, 'steps': 28364, 'loss/train': 1.5111933946609497} -11/07/2021 01:11:57 - INFO - __main__ - Step 28366: {'lr': 0.0004618603419364042, 'samples': 5446272, 'steps': 28365, 'loss/train': 1.3224831819534302} -11/07/2021 01:11:57 - INFO - __main__ - Step 28367: {'lr': 0.00046185752459648456, 'samples': 5446464, 'steps': 28366, 'loss/train': 1.7753583192825317} -11/07/2021 01:11:57 - INFO - __main__ - Step 28368: {'lr': 0.00046185470716110516, 'samples': 5446656, 'steps': 28367, 'loss/train': 1.8063596487045288} -11/07/2021 01:11:58 - INFO - __main__ - Step 28369: {'lr': 0.00046185188963026734, 'samples': 5446848, 'steps': 28368, 'loss/train': 1.3005485534667969} -11/07/2021 01:11:58 - INFO - __main__ - Step 28370: {'lr': 0.0004618490720039723, 'samples': 5447040, 'steps': 28369, 'loss/train': 1.5186891555786133} -11/07/2021 01:11:59 - INFO - __main__ - Step 28371: {'lr': 0.0004618462542822214, 'samples': 5447232, 'steps': 28370, 'loss/train': 1.5141217708587646} -11/07/2021 01:12:00 - INFO - __main__ - Step 28372: {'lr': 0.0004618434364650158, 'samples': 5447424, 'steps': 28371, 'loss/train': 1.753641963005066} -11/07/2021 01:12:00 - INFO - __main__ - Step 28373: {'lr': 0.00046184061855235683, 'samples': 5447616, 'steps': 28372, 'loss/train': 1.5009593963623047} -11/07/2021 01:12:00 - INFO - __main__ - Step 28374: {'lr': 0.00046183780054424574, 'samples': 5447808, 'steps': 28373, 'loss/train': 1.1196340322494507} -11/07/2021 01:12:01 - INFO - __main__ - Step 28375: {'lr': 0.00046183498244068376, 'samples': 5448000, 'steps': 28374, 'loss/train': 1.3198537826538086} -11/07/2021 01:12:02 - INFO - __main__ - Step 28376: {'lr': 0.00046183216424167226, 'samples': 5448192, 'steps': 28375, 'loss/train': 1.1616865396499634} -11/07/2021 01:12:02 - INFO - __main__ - Step 28377: {'lr': 0.0004618293459472124, 'samples': 5448384, 'steps': 28376, 'loss/train': 1.6450309753417969} -11/07/2021 01:12:02 - INFO - __main__ - Step 28378: {'lr': 0.0004618265275573056, 'samples': 5448576, 'steps': 28377, 'loss/train': 1.5486198663711548} -11/07/2021 01:12:03 - INFO - __main__ - Step 28379: {'lr': 0.00046182370907195294, 'samples': 5448768, 'steps': 28378, 'loss/train': 1.7771023511886597} -11/07/2021 01:12:03 - INFO - __main__ - Step 28380: {'lr': 0.00046182089049115585, 'samples': 5448960, 'steps': 28379, 'loss/train': 1.8674331903457642} -11/07/2021 01:12:03 - INFO - __main__ - Step 28381: {'lr': 0.0004618180718149155, 'samples': 5449152, 'steps': 28380, 'loss/train': 2.1471502780914307} -11/07/2021 01:12:05 - INFO - __main__ - Step 28382: {'lr': 0.00046181525304323325, 'samples': 5449344, 'steps': 28381, 'loss/train': 1.8558167219161987} -11/07/2021 01:12:05 - INFO - __main__ - Step 28383: {'lr': 0.0004618124341761102, 'samples': 5449536, 'steps': 28382, 'loss/train': 1.9591509103775024} -11/07/2021 01:12:05 - INFO - __main__ - Step 28384: {'lr': 0.0004618096152135478, 'samples': 5449728, 'steps': 28383, 'loss/train': 1.861006736755371} -11/07/2021 01:12:06 - INFO - __main__ - Step 28385: {'lr': 0.00046180679615554735, 'samples': 5449920, 'steps': 28384, 'loss/train': 1.9714553356170654} -11/07/2021 01:12:06 - INFO - __main__ - Step 28386: {'lr': 0.00046180397700210985, 'samples': 5450112, 'steps': 28385, 'loss/train': 1.4372633695602417} -11/07/2021 01:12:07 - INFO - __main__ - Step 28387: {'lr': 0.0004618011577532368, 'samples': 5450304, 'steps': 28386, 'loss/train': 1.5484124422073364} -11/07/2021 01:12:07 - INFO - __main__ - Step 28388: {'lr': 0.0004617983384089295, 'samples': 5450496, 'steps': 28387, 'loss/train': 1.984816074371338} -11/07/2021 01:12:08 - INFO - __main__ - Step 28389: {'lr': 0.00046179551896918916, 'samples': 5450688, 'steps': 28388, 'loss/train': 1.4153586626052856} -11/07/2021 01:12:08 - INFO - __main__ - Step 28390: {'lr': 0.00046179269943401693, 'samples': 5450880, 'steps': 28389, 'loss/train': 1.8363102674484253} -11/07/2021 01:12:08 - INFO - __main__ - Step 28391: {'lr': 0.00046178987980341414, 'samples': 5451072, 'steps': 28390, 'loss/train': 1.4534401893615723} -11/07/2021 01:12:10 - INFO - __main__ - Step 28392: {'lr': 0.00046178706007738227, 'samples': 5451264, 'steps': 28391, 'loss/train': 1.542893648147583} -11/07/2021 01:12:10 - INFO - __main__ - Step 28393: {'lr': 0.0004617842402559223, 'samples': 5451456, 'steps': 28392, 'loss/train': 1.431994915008545} -11/07/2021 01:12:10 - INFO - __main__ - Step 28394: {'lr': 0.0004617814203390356, 'samples': 5451648, 'steps': 28393, 'loss/train': 2.0125787258148193} -11/07/2021 01:12:11 - INFO - __main__ - Step 28395: {'lr': 0.0004617786003267235, 'samples': 5451840, 'steps': 28394, 'loss/train': 1.5543104410171509} -11/07/2021 01:12:11 - INFO - __main__ - Step 28396: {'lr': 0.00046177578021898717, 'samples': 5452032, 'steps': 28395, 'loss/train': 1.5467292070388794} -11/07/2021 01:12:12 - INFO - __main__ - Step 28397: {'lr': 0.000461772960015828, 'samples': 5452224, 'steps': 28396, 'loss/train': 1.1211336851119995} -11/07/2021 01:12:12 - INFO - __main__ - Step 28398: {'lr': 0.00046177013971724723, 'samples': 5452416, 'steps': 28397, 'loss/train': 1.3289721012115479} -11/07/2021 01:12:13 - INFO - __main__ - Step 28399: {'lr': 0.00046176731932324604, 'samples': 5452608, 'steps': 28398, 'loss/train': 1.5812649726867676} -11/07/2021 01:12:13 - INFO - __main__ - Step 28400: {'lr': 0.0004617644988338258, 'samples': 5452800, 'steps': 28399, 'loss/train': 1.628312110900879} -11/07/2021 01:12:13 - INFO - __main__ - Step 28401: {'lr': 0.0004617616782489877, 'samples': 5452992, 'steps': 28400, 'loss/train': 1.4269146919250488} -11/07/2021 01:12:14 - INFO - __main__ - Step 28402: {'lr': 0.00046175885756873314, 'samples': 5453184, 'steps': 28401, 'loss/train': 1.520078420639038} -11/07/2021 01:12:15 - INFO - __main__ - Step 28403: {'lr': 0.00046175603679306324, 'samples': 5453376, 'steps': 28402, 'loss/train': 1.4348992109298706} -11/07/2021 01:12:15 - INFO - __main__ - Step 28404: {'lr': 0.0004617532159219794, 'samples': 5453568, 'steps': 28403, 'loss/train': 1.6966314315795898} -11/07/2021 01:12:15 - INFO - __main__ - Step 28405: {'lr': 0.0004617503949554828, 'samples': 5453760, 'steps': 28404, 'loss/train': 1.50644052028656} -11/07/2021 01:12:16 - INFO - __main__ - Step 28406: {'lr': 0.0004617475738935747, 'samples': 5453952, 'steps': 28405, 'loss/train': 1.5906078815460205} -11/07/2021 01:12:17 - INFO - __main__ - Step 28407: {'lr': 0.0004617447527362564, 'samples': 5454144, 'steps': 28406, 'loss/train': 1.3887377977371216} -11/07/2021 01:12:17 - INFO - __main__ - Step 28408: {'lr': 0.00046174193148352914, 'samples': 5454336, 'steps': 28407, 'loss/train': 2.1632323265075684} -11/07/2021 01:12:18 - INFO - __main__ - Step 28409: {'lr': 0.00046173911013539437, 'samples': 5454528, 'steps': 28408, 'loss/train': 1.411903977394104} -11/07/2021 01:12:18 - INFO - __main__ - Step 28410: {'lr': 0.0004617362886918531, 'samples': 5454720, 'steps': 28409, 'loss/train': 1.8714888095855713} -11/07/2021 01:12:19 - INFO - __main__ - Step 28411: {'lr': 0.0004617334671529069, 'samples': 5454912, 'steps': 28410, 'loss/train': 1.2680634260177612} -11/07/2021 01:12:19 - INFO - __main__ - Step 28412: {'lr': 0.0004617306455185567, 'samples': 5455104, 'steps': 28411, 'loss/train': 2.167773962020874} -11/07/2021 01:12:20 - INFO - __main__ - Step 28413: {'lr': 0.00046172782378880404, 'samples': 5455296, 'steps': 28412, 'loss/train': 1.7435532808303833} -11/07/2021 01:12:20 - INFO - __main__ - Step 28414: {'lr': 0.00046172500196364996, 'samples': 5455488, 'steps': 28413, 'loss/train': 0.7721033692359924} -11/07/2021 01:12:21 - INFO - __main__ - Step 28415: {'lr': 0.000461722180043096, 'samples': 5455680, 'steps': 28414, 'loss/train': 1.5514968633651733} -11/07/2021 01:12:21 - INFO - __main__ - Step 28416: {'lr': 0.0004617193580271433, 'samples': 5455872, 'steps': 28415, 'loss/train': 3.148294687271118} -11/07/2021 01:12:21 - INFO - __main__ - Step 28417: {'lr': 0.000461716535915793, 'samples': 5456064, 'steps': 28416, 'loss/train': 1.618602991104126} -11/07/2021 01:12:22 - INFO - __main__ - Step 28418: {'lr': 0.0004617137137090466, 'samples': 5456256, 'steps': 28417, 'loss/train': 1.428109884262085} -11/07/2021 01:12:23 - INFO - __main__ - Step 28419: {'lr': 0.0004617108914069052, 'samples': 5456448, 'steps': 28418, 'loss/train': 1.310810923576355} -11/07/2021 01:12:23 - INFO - __main__ - Step 28420: {'lr': 0.0004617080690093701, 'samples': 5456640, 'steps': 28419, 'loss/train': 1.2667416334152222} -11/07/2021 01:12:23 - INFO - __main__ - Step 28421: {'lr': 0.00046170524651644276, 'samples': 5456832, 'steps': 28420, 'loss/train': 1.5690606832504272} -11/07/2021 01:12:24 - INFO - __main__ - Step 28422: {'lr': 0.00046170242392812425, 'samples': 5457024, 'steps': 28421, 'loss/train': 1.829864501953125} -11/07/2021 01:12:25 - INFO - __main__ - Step 28423: {'lr': 0.0004616996012444158, 'samples': 5457216, 'steps': 28422, 'loss/train': 1.873397707939148} -11/07/2021 01:12:25 - INFO - __main__ - Step 28424: {'lr': 0.00046169677846531884, 'samples': 5457408, 'steps': 28423, 'loss/train': 1.3015440702438354} -11/07/2021 01:12:26 - INFO - __main__ - Step 28425: {'lr': 0.0004616939555908346, 'samples': 5457600, 'steps': 28424, 'loss/train': 0.9528545141220093} -11/07/2021 01:12:26 - INFO - __main__ - Step 28426: {'lr': 0.0004616911326209643, 'samples': 5457792, 'steps': 28425, 'loss/train': 2.169158935546875} -11/07/2021 01:12:26 - INFO - __main__ - Step 28427: {'lr': 0.0004616883095557092, 'samples': 5457984, 'steps': 28426, 'loss/train': 1.5702557563781738} -11/07/2021 01:12:27 - INFO - __main__ - Step 28428: {'lr': 0.0004616854863950707, 'samples': 5458176, 'steps': 28427, 'loss/train': 1.5576798915863037} -11/07/2021 01:12:28 - INFO - __main__ - Step 28429: {'lr': 0.00046168266313904995, 'samples': 5458368, 'steps': 28428, 'loss/train': 1.4445343017578125} -11/07/2021 01:12:28 - INFO - __main__ - Step 28430: {'lr': 0.00046167983978764827, 'samples': 5458560, 'steps': 28429, 'loss/train': 5.771895408630371} -11/07/2021 01:12:28 - INFO - __main__ - Step 28431: {'lr': 0.0004616770163408669, 'samples': 5458752, 'steps': 28430, 'loss/train': 1.5220882892608643} -11/07/2021 01:12:29 - INFO - __main__ - Step 28432: {'lr': 0.00046167419279870715, 'samples': 5458944, 'steps': 28431, 'loss/train': 2.1063215732574463} -11/07/2021 01:12:29 - INFO - __main__ - Step 28433: {'lr': 0.00046167136916117025, 'samples': 5459136, 'steps': 28432, 'loss/train': 1.3773339986801147} -11/07/2021 01:12:30 - INFO - __main__ - Step 28434: {'lr': 0.00046166854542825756, 'samples': 5459328, 'steps': 28433, 'loss/train': 1.733251929283142} -11/07/2021 01:12:31 - INFO - __main__ - Step 28435: {'lr': 0.0004616657215999702, 'samples': 5459520, 'steps': 28434, 'loss/train': 1.6719069480895996} -11/07/2021 01:12:31 - INFO - __main__ - Step 28436: {'lr': 0.0004616628976763096, 'samples': 5459712, 'steps': 28435, 'loss/train': 1.5270695686340332} -11/07/2021 01:12:31 - INFO - __main__ - Step 28437: {'lr': 0.0004616600736572769, 'samples': 5459904, 'steps': 28436, 'loss/train': 1.066251516342163} -11/07/2021 01:12:32 - INFO - __main__ - Step 28438: {'lr': 0.0004616572495428735, 'samples': 5460096, 'steps': 28437, 'loss/train': 1.0775712728500366} -11/07/2021 01:12:32 - INFO - __main__ - Step 28439: {'lr': 0.0004616544253331006, 'samples': 5460288, 'steps': 28438, 'loss/train': 1.4521342515945435} -11/07/2021 01:12:33 - INFO - __main__ - Step 28440: {'lr': 0.00046165160102795943, 'samples': 5460480, 'steps': 28439, 'loss/train': 0.8910706639289856} -11/07/2021 01:12:33 - INFO - __main__ - Step 28441: {'lr': 0.0004616487766274514, 'samples': 5460672, 'steps': 28440, 'loss/train': 1.8507764339447021} -11/07/2021 01:12:34 - INFO - __main__ - Step 28442: {'lr': 0.0004616459521315777, 'samples': 5460864, 'steps': 28441, 'loss/train': 1.7701815366744995} -11/07/2021 01:12:34 - INFO - __main__ - Step 28443: {'lr': 0.0004616431275403395, 'samples': 5461056, 'steps': 28442, 'loss/train': 1.6071275472640991} -11/07/2021 01:12:34 - INFO - __main__ - Step 28444: {'lr': 0.0004616403028537382, 'samples': 5461248, 'steps': 28443, 'loss/train': 1.9984899759292603} -11/07/2021 01:12:36 - INFO - __main__ - Step 28445: {'lr': 0.0004616374780717751, 'samples': 5461440, 'steps': 28444, 'loss/train': 1.3097763061523438} -11/07/2021 01:12:36 - INFO - __main__ - Step 28446: {'lr': 0.0004616346531944514, 'samples': 5461632, 'steps': 28445, 'loss/train': 1.804141640663147} -11/07/2021 01:12:36 - INFO - __main__ - Step 28447: {'lr': 0.00046163182822176835, 'samples': 5461824, 'steps': 28446, 'loss/train': 1.2777339220046997} -11/07/2021 01:12:37 - INFO - __main__ - Step 28448: {'lr': 0.0004616290031537273, 'samples': 5462016, 'steps': 28447, 'loss/train': 1.434464454650879} -11/07/2021 01:12:37 - INFO - __main__ - Step 28449: {'lr': 0.0004616261779903295, 'samples': 5462208, 'steps': 28448, 'loss/train': 2.0488641262054443} -11/07/2021 01:12:38 - INFO - __main__ - Step 28450: {'lr': 0.0004616233527315762, 'samples': 5462400, 'steps': 28449, 'loss/train': 2.1894938945770264} -11/07/2021 01:12:38 - INFO - __main__ - Step 28451: {'lr': 0.0004616205273774686, 'samples': 5462592, 'steps': 28450, 'loss/train': 1.64618718624115} -11/07/2021 01:12:39 - INFO - __main__ - Step 28452: {'lr': 0.00046161770192800817, 'samples': 5462784, 'steps': 28451, 'loss/train': 1.3208832740783691} -11/07/2021 01:12:39 - INFO - __main__ - Step 28453: {'lr': 0.000461614876383196, 'samples': 5462976, 'steps': 28452, 'loss/train': 1.8666967153549194} -11/07/2021 01:12:40 - INFO - __main__ - Step 28454: {'lr': 0.0004616120507430335, 'samples': 5463168, 'steps': 28453, 'loss/train': 1.324458360671997} -11/07/2021 01:12:40 - INFO - __main__ - Step 28455: {'lr': 0.00046160922500752176, 'samples': 5463360, 'steps': 28454, 'loss/train': 1.936042308807373} -11/07/2021 01:12:41 - INFO - __main__ - Step 28456: {'lr': 0.0004616063991766623, 'samples': 5463552, 'steps': 28455, 'loss/train': 1.9124518632888794} -11/07/2021 01:12:41 - INFO - __main__ - Step 28457: {'lr': 0.0004616035732504562, 'samples': 5463744, 'steps': 28456, 'loss/train': 1.5295157432556152} -11/07/2021 01:12:42 - INFO - __main__ - Step 28458: {'lr': 0.0004616007472289048, 'samples': 5463936, 'steps': 28457, 'loss/train': 1.5819324254989624} -11/07/2021 01:12:42 - INFO - __main__ - Step 28459: {'lr': 0.00046159792111200937, 'samples': 5464128, 'steps': 28458, 'loss/train': 1.3726308345794678} -11/07/2021 01:12:43 - INFO - __main__ - Step 28460: {'lr': 0.0004615950948997711, 'samples': 5464320, 'steps': 28459, 'loss/train': 1.8839472532272339} -11/07/2021 01:12:43 - INFO - __main__ - Step 28461: {'lr': 0.0004615922685921915, 'samples': 5464512, 'steps': 28460, 'loss/train': 1.636143445968628} -11/07/2021 01:12:44 - INFO - __main__ - Step 28462: {'lr': 0.0004615894421892716, 'samples': 5464704, 'steps': 28461, 'loss/train': 1.6835225820541382} -11/07/2021 01:12:44 - INFO - __main__ - Step 28463: {'lr': 0.0004615866156910128, 'samples': 5464896, 'steps': 28462, 'loss/train': 1.6727573871612549} -11/07/2021 01:12:44 - INFO - __main__ - Step 28464: {'lr': 0.00046158378909741626, 'samples': 5465088, 'steps': 28463, 'loss/train': 1.4402834177017212} -11/07/2021 01:12:45 - INFO - __main__ - Step 28465: {'lr': 0.00046158096240848343, 'samples': 5465280, 'steps': 28464, 'loss/train': 1.9877482652664185} -11/07/2021 01:12:46 - INFO - __main__ - Step 28466: {'lr': 0.00046157813562421545, 'samples': 5465472, 'steps': 28465, 'loss/train': 1.5668485164642334} -11/07/2021 01:12:46 - INFO - __main__ - Step 28467: {'lr': 0.0004615753087446136, 'samples': 5465664, 'steps': 28466, 'loss/train': 1.9259995222091675} -11/07/2021 01:12:47 - INFO - __main__ - Step 28468: {'lr': 0.00046157248176967915, 'samples': 5465856, 'steps': 28467, 'loss/train': 1.5455939769744873} -11/07/2021 01:12:47 - INFO - __main__ - Step 28469: {'lr': 0.0004615696546994135, 'samples': 5466048, 'steps': 28468, 'loss/train': 1.7399810552597046} -11/07/2021 01:12:48 - INFO - __main__ - Step 28470: {'lr': 0.00046156682753381774, 'samples': 5466240, 'steps': 28469, 'loss/train': 1.6447303295135498} -11/07/2021 01:12:48 - INFO - __main__ - Step 28471: {'lr': 0.0004615640002728932, 'samples': 5466432, 'steps': 28470, 'loss/train': 1.3740919828414917} -11/07/2021 01:12:49 - INFO - __main__ - Step 28472: {'lr': 0.00046156117291664133, 'samples': 5466624, 'steps': 28471, 'loss/train': 1.115888237953186} -11/07/2021 01:12:49 - INFO - __main__ - Step 28473: {'lr': 0.0004615583454650632, 'samples': 5466816, 'steps': 28472, 'loss/train': 1.3618167638778687} -11/07/2021 01:12:49 - INFO - __main__ - Step 28474: {'lr': 0.00046155551791816007, 'samples': 5467008, 'steps': 28473, 'loss/train': 1.1851608753204346} -11/07/2021 01:12:50 - INFO - __main__ - Step 28475: {'lr': 0.00046155269027593337, 'samples': 5467200, 'steps': 28474, 'loss/train': 1.7829506397247314} -11/07/2021 01:12:51 - INFO - __main__ - Step 28476: {'lr': 0.00046154986253838426, 'samples': 5467392, 'steps': 28475, 'loss/train': 1.390133023262024} -11/07/2021 01:12:51 - INFO - __main__ - Step 28477: {'lr': 0.00046154703470551405, 'samples': 5467584, 'steps': 28476, 'loss/train': 2.0066704750061035} -11/07/2021 01:12:51 - INFO - __main__ - Step 28478: {'lr': 0.000461544206777324, 'samples': 5467776, 'steps': 28477, 'loss/train': 1.3123130798339844} -11/07/2021 01:12:52 - INFO - __main__ - Step 28479: {'lr': 0.00046154137875381547, 'samples': 5467968, 'steps': 28478, 'loss/train': 1.2928277254104614} -11/07/2021 01:12:52 - INFO - __main__ - Step 28480: {'lr': 0.00046153855063498964, 'samples': 5468160, 'steps': 28479, 'loss/train': 1.7671639919281006} -11/07/2021 01:12:53 - INFO - __main__ - Step 28481: {'lr': 0.00046153572242084776, 'samples': 5468352, 'steps': 28480, 'loss/train': 0.9786882400512695} -11/07/2021 01:12:53 - INFO - __main__ - Step 28482: {'lr': 0.0004615328941113911, 'samples': 5468544, 'steps': 28481, 'loss/train': 1.719839334487915} -11/07/2021 01:12:54 - INFO - __main__ - Step 28483: {'lr': 0.00046153006570662106, 'samples': 5468736, 'steps': 28482, 'loss/train': 1.1868432760238647} -11/07/2021 01:12:54 - INFO - __main__ - Step 28484: {'lr': 0.0004615272372065388, 'samples': 5468928, 'steps': 28483, 'loss/train': 1.8249025344848633} -11/07/2021 01:12:55 - INFO - __main__ - Step 28485: {'lr': 0.0004615244086111456, 'samples': 5469120, 'steps': 28484, 'loss/train': 1.76587975025177} -11/07/2021 01:12:56 - INFO - __main__ - Step 28486: {'lr': 0.00046152157992044283, 'samples': 5469312, 'steps': 28485, 'loss/train': 1.6965020895004272} -11/07/2021 01:12:56 - INFO - __main__ - Step 28487: {'lr': 0.0004615187511344316, 'samples': 5469504, 'steps': 28486, 'loss/train': 1.5689350366592407} -11/07/2021 01:12:56 - INFO - __main__ - Step 28488: {'lr': 0.00046151592225311347, 'samples': 5469696, 'steps': 28487, 'loss/train': 1.4092538356781006} -11/07/2021 01:12:57 - INFO - __main__ - Step 28489: {'lr': 0.0004615130932764894, 'samples': 5469888, 'steps': 28488, 'loss/train': 1.659226655960083} -11/07/2021 01:12:57 - INFO - __main__ - Step 28490: {'lr': 0.0004615102642045608, 'samples': 5470080, 'steps': 28489, 'loss/train': 1.4775367975234985} -11/07/2021 01:12:58 - INFO - __main__ - Step 28491: {'lr': 0.00046150743503732897, 'samples': 5470272, 'steps': 28490, 'loss/train': 1.2291374206542969} -11/07/2021 01:12:58 - INFO - __main__ - Step 28492: {'lr': 0.0004615046057747951, 'samples': 5470464, 'steps': 28491, 'loss/train': 1.5803325176239014} -11/07/2021 01:12:59 - INFO - __main__ - Step 28493: {'lr': 0.0004615017764169606, 'samples': 5470656, 'steps': 28492, 'loss/train': 1.3385908603668213} -11/07/2021 01:12:59 - INFO - __main__ - Step 28494: {'lr': 0.00046149894696382655, 'samples': 5470848, 'steps': 28493, 'loss/train': 1.8293430805206299} -11/07/2021 01:12:59 - INFO - __main__ - Step 28495: {'lr': 0.00046149611741539445, 'samples': 5471040, 'steps': 28494, 'loss/train': 2.066129684448242} -11/07/2021 01:13:00 - INFO - __main__ - Step 28496: {'lr': 0.00046149328777166543, 'samples': 5471232, 'steps': 28495, 'loss/train': 1.5534108877182007} -11/07/2021 01:13:01 - INFO - __main__ - Step 28497: {'lr': 0.0004614904580326408, 'samples': 5471424, 'steps': 28496, 'loss/train': 1.92973792552948} -11/07/2021 01:13:01 - INFO - __main__ - Step 28498: {'lr': 0.0004614876281983218, 'samples': 5471616, 'steps': 28497, 'loss/train': 1.3637464046478271} -11/07/2021 01:13:01 - INFO - __main__ - Step 28499: {'lr': 0.0004614847982687097, 'samples': 5471808, 'steps': 28498, 'loss/train': 1.5086700916290283} -11/07/2021 01:13:02 - INFO - __main__ - Step 28500: {'lr': 0.0004614819682438059, 'samples': 5472000, 'steps': 28499, 'loss/train': 1.41326105594635} -11/07/2021 01:13:03 - INFO - __main__ - Step 28501: {'lr': 0.00046147913812361155, 'samples': 5472192, 'steps': 28500, 'loss/train': 1.4224140644073486} -11/07/2021 01:13:03 - INFO - __main__ - Step 28502: {'lr': 0.000461476307908128, 'samples': 5472384, 'steps': 28501, 'loss/train': 1.9110409021377563} -11/07/2021 01:13:04 - INFO - __main__ - Step 28503: {'lr': 0.00046147347759735647, 'samples': 5472576, 'steps': 28502, 'loss/train': 2.035921573638916} -11/07/2021 01:13:04 - INFO - __main__ - Step 28504: {'lr': 0.00046147064719129823, 'samples': 5472768, 'steps': 28503, 'loss/train': 1.4053170680999756} -11/07/2021 01:13:04 - INFO - __main__ - Step 28505: {'lr': 0.00046146781668995456, 'samples': 5472960, 'steps': 28504, 'loss/train': 1.5621429681777954} -11/07/2021 01:13:05 - INFO - __main__ - Step 28506: {'lr': 0.0004614649860933268, 'samples': 5473152, 'steps': 28505, 'loss/train': 1.4961036443710327} -11/07/2021 01:13:06 - INFO - __main__ - Step 28507: {'lr': 0.0004614621554014162, 'samples': 5473344, 'steps': 28506, 'loss/train': 1.6253371238708496} -11/07/2021 01:13:06 - INFO - __main__ - Step 28508: {'lr': 0.00046145932461422396, 'samples': 5473536, 'steps': 28507, 'loss/train': 1.7970013618469238} -11/07/2021 01:13:06 - INFO - __main__ - Step 28509: {'lr': 0.00046145649373175145, 'samples': 5473728, 'steps': 28508, 'loss/train': 1.8721892833709717} -11/07/2021 01:13:07 - INFO - __main__ - Step 28510: {'lr': 0.0004614536627539999, 'samples': 5473920, 'steps': 28509, 'loss/train': 1.5840485095977783} -11/07/2021 01:13:08 - INFO - __main__ - Step 28511: {'lr': 0.0004614508316809706, 'samples': 5474112, 'steps': 28510, 'loss/train': 1.2819918394088745} -11/07/2021 01:13:08 - INFO - __main__ - Step 28512: {'lr': 0.00046144800051266477, 'samples': 5474304, 'steps': 28511, 'loss/train': 1.383216142654419} -11/07/2021 01:13:09 - INFO - __main__ - Step 28513: {'lr': 0.00046144516924908377, 'samples': 5474496, 'steps': 28512, 'loss/train': 1.5542588233947754} -11/07/2021 01:13:09 - INFO - __main__ - Step 28514: {'lr': 0.0004614423378902289, 'samples': 5474688, 'steps': 28513, 'loss/train': 1.4837170839309692} -11/07/2021 01:13:09 - INFO - __main__ - Step 28515: {'lr': 0.0004614395064361013, 'samples': 5474880, 'steps': 28514, 'loss/train': 1.7974506616592407} -11/07/2021 01:13:11 - INFO - __main__ - Step 28516: {'lr': 0.00046143667488670226, 'samples': 5475072, 'steps': 28515, 'loss/train': 1.2926692962646484} -11/07/2021 01:13:11 - INFO - __main__ - Step 28517: {'lr': 0.00046143384324203325, 'samples': 5475264, 'steps': 28516, 'loss/train': 1.5892486572265625} -11/07/2021 01:13:12 - INFO - __main__ - Step 28518: {'lr': 0.00046143101150209533, 'samples': 5475456, 'steps': 28517, 'loss/train': 1.1255959272384644} -11/07/2021 01:13:12 - INFO - __main__ - Step 28519: {'lr': 0.0004614281796668899, 'samples': 5475648, 'steps': 28518, 'loss/train': 0.5575433373451233} -11/07/2021 01:13:12 - INFO - __main__ - Step 28520: {'lr': 0.0004614253477364182, 'samples': 5475840, 'steps': 28519, 'loss/train': 1.642098069190979} -11/07/2021 01:13:13 - INFO - __main__ - Step 28521: {'lr': 0.0004614225157106815, 'samples': 5476032, 'steps': 28520, 'loss/train': 1.7778156995773315} -11/07/2021 01:13:14 - INFO - __main__ - Step 28522: {'lr': 0.00046141968358968103, 'samples': 5476224, 'steps': 28521, 'loss/train': 1.1304028034210205} -11/07/2021 01:13:14 - INFO - __main__ - Step 28523: {'lr': 0.00046141685137341814, 'samples': 5476416, 'steps': 28522, 'loss/train': 1.6093932390213013} -11/07/2021 01:13:14 - INFO - __main__ - Step 28524: {'lr': 0.00046141401906189404, 'samples': 5476608, 'steps': 28523, 'loss/train': 1.4824190139770508} -11/07/2021 01:13:15 - INFO - __main__ - Step 28525: {'lr': 0.0004614111866551101, 'samples': 5476800, 'steps': 28524, 'loss/train': 1.7257108688354492} -11/07/2021 01:13:15 - INFO - __main__ - Step 28526: {'lr': 0.0004614083541530675, 'samples': 5476992, 'steps': 28525, 'loss/train': 1.8572736978530884} -11/07/2021 01:13:16 - INFO - __main__ - Step 28527: {'lr': 0.00046140552155576767, 'samples': 5477184, 'steps': 28526, 'loss/train': 1.5072067975997925} -11/07/2021 01:13:17 - INFO - __main__ - Step 28528: {'lr': 0.0004614026888632116, 'samples': 5477376, 'steps': 28527, 'loss/train': 1.8376927375793457} -11/07/2021 01:13:17 - INFO - __main__ - Step 28529: {'lr': 0.00046139985607540087, 'samples': 5477568, 'steps': 28528, 'loss/train': 1.7291768789291382} -11/07/2021 01:13:17 - INFO - __main__ - Step 28530: {'lr': 0.00046139702319233656, 'samples': 5477760, 'steps': 28529, 'loss/train': 1.209162712097168} -11/07/2021 01:13:18 - INFO - __main__ - Step 28531: {'lr': 0.00046139419021402005, 'samples': 5477952, 'steps': 28530, 'loss/train': 0.9393748641014099} -11/07/2021 01:13:18 - INFO - __main__ - Step 28532: {'lr': 0.00046139135714045253, 'samples': 5478144, 'steps': 28531, 'loss/train': 2.0351850986480713} -11/07/2021 01:13:19 - INFO - __main__ - Step 28533: {'lr': 0.00046138852397163547, 'samples': 5478336, 'steps': 28532, 'loss/train': 1.5962907075881958} -11/07/2021 01:13:19 - INFO - __main__ - Step 28534: {'lr': 0.00046138569070756984, 'samples': 5478528, 'steps': 28533, 'loss/train': 1.830586552619934} -11/07/2021 01:13:20 - INFO - __main__ - Step 28535: {'lr': 0.00046138285734825715, 'samples': 5478720, 'steps': 28534, 'loss/train': 1.1147873401641846} -11/07/2021 01:13:20 - INFO - __main__ - Step 28536: {'lr': 0.0004613800238936986, 'samples': 5478912, 'steps': 28535, 'loss/train': 1.8073807954788208} -11/07/2021 01:13:20 - INFO - __main__ - Step 28537: {'lr': 0.0004613771903438955, 'samples': 5479104, 'steps': 28536, 'loss/train': 1.6306997537612915} -11/07/2021 01:13:22 - INFO - __main__ - Step 28538: {'lr': 0.00046137435669884897, 'samples': 5479296, 'steps': 28537, 'loss/train': 1.6193535327911377} -11/07/2021 01:13:23 - INFO - __main__ - Step 28539: {'lr': 0.00046137152295856054, 'samples': 5479488, 'steps': 28538, 'loss/train': 0.4254659116268158} -11/07/2021 01:13:23 - INFO - __main__ - Step 28540: {'lr': 0.0004613686891230313, 'samples': 5479680, 'steps': 28539, 'loss/train': 1.918066382408142} -11/07/2021 01:13:23 - INFO - __main__ - Step 28541: {'lr': 0.0004613658551922627, 'samples': 5479872, 'steps': 28540, 'loss/train': 1.661318063735962} -11/07/2021 01:13:24 - INFO - __main__ - Step 28542: {'lr': 0.0004613630211662558, 'samples': 5480064, 'steps': 28541, 'loss/train': 1.55586576461792} -11/07/2021 01:13:24 - INFO - __main__ - Step 28543: {'lr': 0.00046136018704501203, 'samples': 5480256, 'steps': 28542, 'loss/train': 1.6200159788131714} -11/07/2021 01:13:25 - INFO - __main__ - Step 28544: {'lr': 0.00046135735282853263, 'samples': 5480448, 'steps': 28543, 'loss/train': 1.8351638317108154} -11/07/2021 01:13:25 - INFO - __main__ - Step 28545: {'lr': 0.0004613545185168188, 'samples': 5480640, 'steps': 28544, 'loss/train': 1.0412639379501343} -11/07/2021 01:13:26 - INFO - __main__ - Step 28546: {'lr': 0.0004613516841098719, 'samples': 5480832, 'steps': 28545, 'loss/train': 1.9801928997039795} -11/07/2021 01:13:26 - INFO - __main__ - Step 28547: {'lr': 0.0004613488496076933, 'samples': 5481024, 'steps': 28546, 'loss/train': 1.2984365224838257} -11/07/2021 01:13:26 - INFO - __main__ - Step 28548: {'lr': 0.00046134601501028404, 'samples': 5481216, 'steps': 28547, 'loss/train': 1.278522253036499} -11/07/2021 01:13:28 - INFO - __main__ - Step 28549: {'lr': 0.0004613431803176456, 'samples': 5481408, 'steps': 28548, 'loss/train': 1.4743411540985107} -11/07/2021 01:13:28 - INFO - __main__ - Step 28550: {'lr': 0.00046134034552977924, 'samples': 5481600, 'steps': 28549, 'loss/train': 1.5944483280181885} -11/07/2021 01:13:28 - INFO - __main__ - Step 28551: {'lr': 0.00046133751064668605, 'samples': 5481792, 'steps': 28550, 'loss/train': 1.5976324081420898} -11/07/2021 01:13:29 - INFO - __main__ - Step 28552: {'lr': 0.0004613346756683675, 'samples': 5481984, 'steps': 28551, 'loss/train': 1.5659213066101074} -11/07/2021 01:13:29 - INFO - __main__ - Step 28553: {'lr': 0.0004613318405948248, 'samples': 5482176, 'steps': 28552, 'loss/train': 1.5147918462753296} -11/07/2021 01:13:29 - INFO - __main__ - Step 28554: {'lr': 0.00046132900542605925, 'samples': 5482368, 'steps': 28553, 'loss/train': 2.00808048248291} -11/07/2021 01:13:31 - INFO - __main__ - Step 28555: {'lr': 0.0004613261701620721, 'samples': 5482560, 'steps': 28554, 'loss/train': 2.5371766090393066} -11/07/2021 01:13:31 - INFO - __main__ - Step 28556: {'lr': 0.0004613233348028646, 'samples': 5482752, 'steps': 28555, 'loss/train': 1.2087116241455078} -11/07/2021 01:13:31 - INFO - __main__ - Step 28557: {'lr': 0.0004613204993484381, 'samples': 5482944, 'steps': 28556, 'loss/train': 1.5834543704986572} -11/07/2021 01:13:32 - INFO - __main__ - Step 28558: {'lr': 0.00046131766379879386, 'samples': 5483136, 'steps': 28557, 'loss/train': 1.4561253786087036} -11/07/2021 01:13:32 - INFO - __main__ - Step 28559: {'lr': 0.0004613148281539331, 'samples': 5483328, 'steps': 28558, 'loss/train': 1.8825464248657227} -11/07/2021 01:13:33 - INFO - __main__ - Step 28560: {'lr': 0.00046131199241385726, 'samples': 5483520, 'steps': 28559, 'loss/train': 1.786787986755371} -11/07/2021 01:13:33 - INFO - __main__ - Step 28561: {'lr': 0.0004613091565785673, 'samples': 5483712, 'steps': 28560, 'loss/train': 1.2102888822555542} -11/07/2021 01:13:34 - INFO - __main__ - Step 28562: {'lr': 0.0004613063206480649, 'samples': 5483904, 'steps': 28561, 'loss/train': 2.037170886993408} -11/07/2021 01:13:34 - INFO - __main__ - Step 28563: {'lr': 0.000461303484622351, 'samples': 5484096, 'steps': 28562, 'loss/train': 1.8780871629714966} -11/07/2021 01:13:34 - INFO - __main__ - Step 28564: {'lr': 0.00046130064850142703, 'samples': 5484288, 'steps': 28563, 'loss/train': 1.3572795391082764} -11/07/2021 01:13:35 - INFO - __main__ - Step 28565: {'lr': 0.0004612978122852942, 'samples': 5484480, 'steps': 28564, 'loss/train': 1.3927767276763916} -11/07/2021 01:13:36 - INFO - __main__ - Step 28566: {'lr': 0.000461294975973954, 'samples': 5484672, 'steps': 28565, 'loss/train': 2.1032114028930664} -11/07/2021 01:13:36 - INFO - __main__ - Step 28567: {'lr': 0.0004612921395674074, 'samples': 5484864, 'steps': 28566, 'loss/train': 1.9771486520767212} -11/07/2021 01:13:36 - INFO - __main__ - Step 28568: {'lr': 0.0004612893030656559, 'samples': 5485056, 'steps': 28567, 'loss/train': 1.6528112888336182} -11/07/2021 01:13:37 - INFO - __main__ - Step 28569: {'lr': 0.0004612864664687007, 'samples': 5485248, 'steps': 28568, 'loss/train': 1.4817839860916138} -11/07/2021 01:13:38 - INFO - __main__ - Step 28570: {'lr': 0.0004612836297765429, 'samples': 5485440, 'steps': 28569, 'loss/train': 1.3428547382354736} -11/07/2021 01:13:38 - INFO - __main__ - Step 28571: {'lr': 0.00046128079298918414, 'samples': 5485632, 'steps': 28570, 'loss/train': 1.592185616493225} -11/07/2021 01:13:39 - INFO - __main__ - Step 28572: {'lr': 0.00046127795610662547, 'samples': 5485824, 'steps': 28571, 'loss/train': 2.0489470958709717} -11/07/2021 01:13:39 - INFO - __main__ - Step 28573: {'lr': 0.0004612751191288682, 'samples': 5486016, 'steps': 28572, 'loss/train': 1.5951439142227173} -11/07/2021 01:13:39 - INFO - __main__ - Step 28574: {'lr': 0.00046127228205591366, 'samples': 5486208, 'steps': 28573, 'loss/train': 1.285809874534607} -11/07/2021 01:13:40 - INFO - __main__ - Step 28575: {'lr': 0.0004612694448877631, 'samples': 5486400, 'steps': 28574, 'loss/train': 1.5925551652908325} -11/07/2021 01:13:41 - INFO - __main__ - Step 28576: {'lr': 0.00046126660762441774, 'samples': 5486592, 'steps': 28575, 'loss/train': 0.4271937906742096} -11/07/2021 01:13:41 - INFO - __main__ - Step 28577: {'lr': 0.00046126377026587897, 'samples': 5486784, 'steps': 28576, 'loss/train': 1.7694735527038574} -11/07/2021 01:13:41 - INFO - __main__ - Step 28578: {'lr': 0.0004612609328121479, 'samples': 5486976, 'steps': 28577, 'loss/train': 1.6860110759735107} -11/07/2021 01:13:42 - INFO - __main__ - Step 28579: {'lr': 0.000461258095263226, 'samples': 5487168, 'steps': 28578, 'loss/train': 1.9026232957839966} -11/07/2021 01:13:43 - INFO - __main__ - Step 28580: {'lr': 0.00046125525761911445, 'samples': 5487360, 'steps': 28579, 'loss/train': 1.164626955986023} -11/07/2021 01:13:43 - INFO - __main__ - Step 28581: {'lr': 0.00046125241987981445, 'samples': 5487552, 'steps': 28580, 'loss/train': 1.4468891620635986} -11/07/2021 01:13:43 - INFO - __main__ - Step 28582: {'lr': 0.0004612495820453275, 'samples': 5487744, 'steps': 28581, 'loss/train': 1.3925243616104126} -11/07/2021 01:13:44 - INFO - __main__ - Step 28583: {'lr': 0.0004612467441156547, 'samples': 5487936, 'steps': 28582, 'loss/train': 1.0571708679199219} -11/07/2021 01:13:44 - INFO - __main__ - Step 28584: {'lr': 0.00046124390609079735, 'samples': 5488128, 'steps': 28583, 'loss/train': 1.5288128852844238} -11/07/2021 01:13:45 - INFO - __main__ - Step 28585: {'lr': 0.00046124106797075683, 'samples': 5488320, 'steps': 28584, 'loss/train': 1.6580777168273926} -11/07/2021 01:13:45 - INFO - __main__ - Step 28586: {'lr': 0.00046123822975553425, 'samples': 5488512, 'steps': 28585, 'loss/train': 1.5447169542312622} -11/07/2021 01:13:46 - INFO - __main__ - Step 28587: {'lr': 0.00046123539144513103, 'samples': 5488704, 'steps': 28586, 'loss/train': 1.0325883626937866} -11/07/2021 01:13:46 - INFO - __main__ - Step 28588: {'lr': 0.00046123255303954835, 'samples': 5488896, 'steps': 28587, 'loss/train': 0.9563302397727966} -11/07/2021 01:13:46 - INFO - __main__ - Step 28589: {'lr': 0.0004612297145387876, 'samples': 5489088, 'steps': 28588, 'loss/train': 2.1595003604888916} -11/07/2021 01:13:47 - INFO - __main__ - Step 28590: {'lr': 0.00046122687594285, 'samples': 5489280, 'steps': 28589, 'loss/train': 1.2853444814682007} -11/07/2021 01:13:48 - INFO - __main__ - Step 28591: {'lr': 0.0004612240372517368, 'samples': 5489472, 'steps': 28590, 'loss/train': 1.3485485315322876} -11/07/2021 01:13:48 - INFO - __main__ - Step 28592: {'lr': 0.00046122119846544936, 'samples': 5489664, 'steps': 28591, 'loss/train': 1.4400455951690674} -11/07/2021 01:13:48 - INFO - __main__ - Step 28593: {'lr': 0.00046121835958398883, 'samples': 5489856, 'steps': 28592, 'loss/train': 1.4383652210235596} -11/07/2021 01:13:49 - INFO - __main__ - Step 28594: {'lr': 0.0004612155206073566, 'samples': 5490048, 'steps': 28593, 'loss/train': 1.3600523471832275} -11/07/2021 01:13:49 - INFO - __main__ - Step 28595: {'lr': 0.000461212681535554, 'samples': 5490240, 'steps': 28594, 'loss/train': 1.7095885276794434} -11/07/2021 01:13:50 - INFO - __main__ - Step 28596: {'lr': 0.0004612098423685821, 'samples': 5490432, 'steps': 28595, 'loss/train': 1.767296314239502} -11/07/2021 01:13:51 - INFO - __main__ - Step 28597: {'lr': 0.0004612070031064424, 'samples': 5490624, 'steps': 28596, 'loss/train': 1.2135729789733887} -11/07/2021 01:13:51 - INFO - __main__ - Step 28598: {'lr': 0.000461204163749136, 'samples': 5490816, 'steps': 28597, 'loss/train': 1.7606945037841797} -11/07/2021 01:13:51 - INFO - __main__ - Step 28599: {'lr': 0.0004612013242966643, 'samples': 5491008, 'steps': 28598, 'loss/train': 1.0029528141021729} -11/07/2021 01:13:52 - INFO - __main__ - Step 28600: {'lr': 0.0004611984847490285, 'samples': 5491200, 'steps': 28599, 'loss/train': 1.3767914772033691} -11/07/2021 01:13:53 - INFO - __main__ - Step 28601: {'lr': 0.00046119564510623, 'samples': 5491392, 'steps': 28600, 'loss/train': 1.7137017250061035} -11/07/2021 01:13:53 - INFO - __main__ - Step 28602: {'lr': 0.00046119280536827, 'samples': 5491584, 'steps': 28601, 'loss/train': 1.4423989057540894} -11/07/2021 01:13:54 - INFO - __main__ - Step 28603: {'lr': 0.0004611899655351497, 'samples': 5491776, 'steps': 28602, 'loss/train': 1.636980652809143} -11/07/2021 01:13:54 - INFO - __main__ - Step 28604: {'lr': 0.0004611871256068705, 'samples': 5491968, 'steps': 28603, 'loss/train': 1.7325501441955566} -11/07/2021 01:13:54 - INFO - __main__ - Step 28605: {'lr': 0.0004611842855834336, 'samples': 5492160, 'steps': 28604, 'loss/train': 1.6320688724517822} -11/07/2021 01:13:55 - INFO - __main__ - Step 28606: {'lr': 0.00046118144546484043, 'samples': 5492352, 'steps': 28605, 'loss/train': 1.2296459674835205} -11/07/2021 01:13:56 - INFO - __main__ - Step 28607: {'lr': 0.0004611786052510921, 'samples': 5492544, 'steps': 28606, 'loss/train': 0.447788268327713} -11/07/2021 01:13:56 - INFO - __main__ - Step 28608: {'lr': 0.0004611757649421899, 'samples': 5492736, 'steps': 28607, 'loss/train': 1.6928179264068604} -11/07/2021 01:13:57 - INFO - __main__ - Step 28609: {'lr': 0.0004611729245381352, 'samples': 5492928, 'steps': 28608, 'loss/train': 2.53912615776062} -11/07/2021 01:13:57 - INFO - __main__ - Step 28610: {'lr': 0.00046117008403892925, 'samples': 5493120, 'steps': 28609, 'loss/train': 1.485178828239441} -11/07/2021 01:13:57 - INFO - __main__ - Step 28611: {'lr': 0.0004611672434445733, 'samples': 5493312, 'steps': 28610, 'loss/train': 1.8342007398605347} -11/07/2021 01:13:58 - INFO - __main__ - Step 28612: {'lr': 0.0004611644027550687, 'samples': 5493504, 'steps': 28611, 'loss/train': 4.171876907348633} -11/07/2021 01:13:59 - INFO - __main__ - Step 28613: {'lr': 0.00046116156197041657, 'samples': 5493696, 'steps': 28612, 'loss/train': 1.8307241201400757} -11/07/2021 01:13:59 - INFO - __main__ - Step 28614: {'lr': 0.0004611587210906184, 'samples': 5493888, 'steps': 28613, 'loss/train': 0.7530031204223633} -11/07/2021 01:14:00 - INFO - __main__ - Step 28615: {'lr': 0.0004611558801156753, 'samples': 5494080, 'steps': 28614, 'loss/train': 1.3507496118545532} -11/07/2021 01:14:00 - INFO - __main__ - Step 28616: {'lr': 0.0004611530390455887, 'samples': 5494272, 'steps': 28615, 'loss/train': 1.4227341413497925} -11/07/2021 01:14:01 - INFO - __main__ - Step 28617: {'lr': 0.00046115019788035974, 'samples': 5494464, 'steps': 28616, 'loss/train': 0.9620317816734314} -11/07/2021 01:14:01 - INFO - __main__ - Step 28618: {'lr': 0.00046114735661998975, 'samples': 5494656, 'steps': 28617, 'loss/train': 0.9758543372154236} -11/07/2021 01:14:02 - INFO - __main__ - Step 28619: {'lr': 0.0004611445152644801, 'samples': 5494848, 'steps': 28618, 'loss/train': 0.5890863537788391} -11/07/2021 01:14:02 - INFO - __main__ - Step 28620: {'lr': 0.00046114167381383186, 'samples': 5495040, 'steps': 28619, 'loss/train': 2.1583333015441895} -11/07/2021 01:14:02 - INFO - __main__ - Step 28621: {'lr': 0.0004611388322680465, 'samples': 5495232, 'steps': 28620, 'loss/train': 1.5053393840789795} -11/07/2021 01:14:03 - INFO - __main__ - Step 28622: {'lr': 0.0004611359906271253, 'samples': 5495424, 'steps': 28621, 'loss/train': 1.5294830799102783} -11/07/2021 01:14:04 - INFO - __main__ - Step 28623: {'lr': 0.0004611331488910694, 'samples': 5495616, 'steps': 28622, 'loss/train': 1.6916823387145996} -11/07/2021 01:14:04 - INFO - __main__ - Step 28624: {'lr': 0.00046113030705988026, 'samples': 5495808, 'steps': 28623, 'loss/train': 1.8420982360839844} -11/07/2021 01:14:04 - INFO - __main__ - Step 28625: {'lr': 0.000461127465133559, 'samples': 5496000, 'steps': 28624, 'loss/train': 1.3573448657989502} -11/07/2021 01:14:05 - INFO - __main__ - Step 28626: {'lr': 0.0004611246231121069, 'samples': 5496192, 'steps': 28625, 'loss/train': 1.6356327533721924} -11/07/2021 01:14:05 - INFO - __main__ - Step 28627: {'lr': 0.00046112178099552535, 'samples': 5496384, 'steps': 28626, 'loss/train': 1.0614502429962158} -11/07/2021 01:14:06 - INFO - __main__ - Step 28628: {'lr': 0.0004611189387838156, 'samples': 5496576, 'steps': 28627, 'loss/train': 1.4590609073638916} -11/07/2021 01:14:06 - INFO - __main__ - Step 28629: {'lr': 0.00046111609647697893, 'samples': 5496768, 'steps': 28628, 'loss/train': 1.7812243700027466} -11/07/2021 01:14:07 - INFO - __main__ - Step 28630: {'lr': 0.0004611132540750166, 'samples': 5496960, 'steps': 28629, 'loss/train': 1.6481937170028687} -11/07/2021 01:14:07 - INFO - __main__ - Step 28631: {'lr': 0.00046111041157792987, 'samples': 5497152, 'steps': 28630, 'loss/train': 2.1358513832092285} -11/07/2021 01:14:08 - INFO - __main__ - Step 28632: {'lr': 0.00046110756898572, 'samples': 5497344, 'steps': 28631, 'loss/train': 1.7727172374725342} -11/07/2021 01:14:09 - INFO - __main__ - Step 28633: {'lr': 0.0004611047262983884, 'samples': 5497536, 'steps': 28632, 'loss/train': 1.3694134950637817} -11/07/2021 01:14:09 - INFO - __main__ - Step 28634: {'lr': 0.00046110188351593625, 'samples': 5497728, 'steps': 28633, 'loss/train': 1.2695839405059814} -11/07/2021 01:14:09 - INFO - __main__ - Step 28635: {'lr': 0.0004610990406383648, 'samples': 5497920, 'steps': 28634, 'loss/train': 1.223016619682312} -11/07/2021 01:14:10 - INFO - __main__ - Step 28636: {'lr': 0.00046109619766567547, 'samples': 5498112, 'steps': 28635, 'loss/train': 0.545827329158783} -11/07/2021 01:14:10 - INFO - __main__ - Step 28637: {'lr': 0.0004610933545978694, 'samples': 5498304, 'steps': 28636, 'loss/train': 2.735299587249756} -11/07/2021 01:14:11 - INFO - __main__ - Step 28638: {'lr': 0.0004610905114349478, 'samples': 5498496, 'steps': 28637, 'loss/train': 1.3574023246765137} -11/07/2021 01:14:12 - INFO - __main__ - Step 28639: {'lr': 0.0004610876681769123, 'samples': 5498688, 'steps': 28638, 'loss/train': 1.8435614109039307} -11/07/2021 01:14:12 - INFO - __main__ - Step 28640: {'lr': 0.0004610848248237638, 'samples': 5498880, 'steps': 28639, 'loss/train': 1.2343521118164062} -11/07/2021 01:14:12 - INFO - __main__ - Step 28641: {'lr': 0.00046108198137550377, 'samples': 5499072, 'steps': 28640, 'loss/train': 1.4320803880691528} -11/07/2021 01:14:13 - INFO - __main__ - Step 28642: {'lr': 0.0004610791378321335, 'samples': 5499264, 'steps': 28641, 'loss/train': 1.575751543045044} -11/07/2021 01:14:13 - INFO - __main__ - Step 28643: {'lr': 0.0004610762941936542, 'samples': 5499456, 'steps': 28642, 'loss/train': 1.3416160345077515} -11/07/2021 01:14:14 - INFO - __main__ - Step 28644: {'lr': 0.0004610734504600671, 'samples': 5499648, 'steps': 28643, 'loss/train': 1.591726541519165} -11/07/2021 01:14:14 - INFO - __main__ - Step 28645: {'lr': 0.00046107060663137366, 'samples': 5499840, 'steps': 28644, 'loss/train': 1.678292989730835} -11/07/2021 01:14:15 - INFO - __main__ - Step 28646: {'lr': 0.00046106776270757506, 'samples': 5500032, 'steps': 28645, 'loss/train': 1.7594455480575562} -11/07/2021 01:14:15 - INFO - __main__ - Step 28647: {'lr': 0.0004610649186886725, 'samples': 5500224, 'steps': 28646, 'loss/train': 1.5664775371551514} -11/07/2021 01:14:16 - INFO - __main__ - Step 28648: {'lr': 0.00046106207457466744, 'samples': 5500416, 'steps': 28647, 'loss/train': 1.4586031436920166} -11/07/2021 01:14:17 - INFO - __main__ - Step 28649: {'lr': 0.0004610592303655611, 'samples': 5500608, 'steps': 28648, 'loss/train': 1.7166132926940918} -11/07/2021 01:14:17 - INFO - __main__ - Step 28650: {'lr': 0.0004610563860613546, 'samples': 5500800, 'steps': 28649, 'loss/train': 5.587038516998291} -11/07/2021 01:14:17 - INFO - __main__ - Step 28651: {'lr': 0.00046105354166204937, 'samples': 5500992, 'steps': 28650, 'loss/train': 1.741302251815796} -11/07/2021 01:14:18 - INFO - __main__ - Step 28652: {'lr': 0.00046105069716764676, 'samples': 5501184, 'steps': 28651, 'loss/train': 0.7651360630989075} -11/07/2021 01:14:18 - INFO - __main__ - Step 28653: {'lr': 0.00046104785257814786, 'samples': 5501376, 'steps': 28652, 'loss/train': 1.889872431755066} -11/07/2021 01:14:19 - INFO - __main__ - Step 28654: {'lr': 0.0004610450078935541, 'samples': 5501568, 'steps': 28653, 'loss/train': 1.3259265422821045} -11/07/2021 01:14:20 - INFO - __main__ - Step 28655: {'lr': 0.00046104216311386676, 'samples': 5501760, 'steps': 28654, 'loss/train': 1.460955023765564} -11/07/2021 01:14:20 - INFO - __main__ - Step 28656: {'lr': 0.000461039318239087, 'samples': 5501952, 'steps': 28655, 'loss/train': 1.2348376512527466} -11/07/2021 01:14:21 - INFO - __main__ - Step 28657: {'lr': 0.00046103647326921625, 'samples': 5502144, 'steps': 28656, 'loss/train': 2.395113945007324} -11/07/2021 01:14:21 - INFO - __main__ - Step 28658: {'lr': 0.00046103362820425567, 'samples': 5502336, 'steps': 28657, 'loss/train': 1.311152696609497} -11/07/2021 01:14:21 - INFO - __main__ - Step 28659: {'lr': 0.00046103078304420665, 'samples': 5502528, 'steps': 28658, 'loss/train': 1.4987415075302124} -11/07/2021 01:14:22 - INFO - __main__ - Step 28660: {'lr': 0.0004610279377890704, 'samples': 5502720, 'steps': 28659, 'loss/train': 0.693972647190094} -11/07/2021 01:14:23 - INFO - __main__ - Step 28661: {'lr': 0.00046102509243884813, 'samples': 5502912, 'steps': 28660, 'loss/train': 1.4814105033874512} -11/07/2021 01:14:23 - INFO - __main__ - Step 28662: {'lr': 0.0004610222469935413, 'samples': 5503104, 'steps': 28661, 'loss/train': 1.6567411422729492} -11/07/2021 01:14:23 - INFO - __main__ - Step 28663: {'lr': 0.000461019401453151, 'samples': 5503296, 'steps': 28662, 'loss/train': 2.106566905975342} -11/07/2021 01:14:24 - INFO - __main__ - Step 28664: {'lr': 0.00046101655581767874, 'samples': 5503488, 'steps': 28663, 'loss/train': 0.5619341731071472} -11/07/2021 01:14:25 - INFO - __main__ - Step 28665: {'lr': 0.0004610137100871257, 'samples': 5503680, 'steps': 28664, 'loss/train': 1.7786967754364014} -11/07/2021 01:14:25 - INFO - __main__ - Step 28666: {'lr': 0.00046101086426149297, 'samples': 5503872, 'steps': 28665, 'loss/train': 1.7782741785049438} -11/07/2021 01:14:26 - INFO - __main__ - Step 28667: {'lr': 0.0004610080183407821, 'samples': 5504064, 'steps': 28666, 'loss/train': 1.60888671875} -11/07/2021 01:14:26 - INFO - __main__ - Step 28668: {'lr': 0.0004610051723249943, 'samples': 5504256, 'steps': 28667, 'loss/train': 1.6466768980026245} -11/07/2021 01:14:26 - INFO - __main__ - Step 28669: {'lr': 0.0004610023262141308, 'samples': 5504448, 'steps': 28668, 'loss/train': 2.1476855278015137} -11/07/2021 01:14:27 - INFO - __main__ - Step 28670: {'lr': 0.00046099948000819294, 'samples': 5504640, 'steps': 28669, 'loss/train': 2.24654483795166} -11/07/2021 01:14:28 - INFO - __main__ - Step 28671: {'lr': 0.0004609966337071819, 'samples': 5504832, 'steps': 28670, 'loss/train': 1.561232089996338} -11/07/2021 01:14:28 - INFO - __main__ - Step 28672: {'lr': 0.00046099378731109906, 'samples': 5505024, 'steps': 28671, 'loss/train': 0.2538740634918213} -11/07/2021 01:14:28 - INFO - __main__ - Step 28673: {'lr': 0.00046099094081994565, 'samples': 5505216, 'steps': 28672, 'loss/train': 1.683111310005188} -11/07/2021 01:14:29 - INFO - __main__ - Step 28674: {'lr': 0.000460988094233723, 'samples': 5505408, 'steps': 28673, 'loss/train': 0.622854471206665} -11/07/2021 01:14:29 - INFO - __main__ - Step 28675: {'lr': 0.00046098524755243246, 'samples': 5505600, 'steps': 28674, 'loss/train': 1.3095825910568237} -11/07/2021 01:14:30 - INFO - __main__ - Step 28676: {'lr': 0.0004609824007760751, 'samples': 5505792, 'steps': 28675, 'loss/train': 1.7884206771850586} -11/07/2021 01:14:31 - INFO - __main__ - Step 28677: {'lr': 0.0004609795539046524, 'samples': 5505984, 'steps': 28676, 'loss/train': 0.9840785264968872} -11/07/2021 01:14:31 - INFO - __main__ - Step 28678: {'lr': 0.0004609767069381655, 'samples': 5506176, 'steps': 28677, 'loss/train': 1.2989946603775024} -11/07/2021 01:14:31 - INFO - __main__ - Step 28679: {'lr': 0.00046097385987661576, 'samples': 5506368, 'steps': 28678, 'loss/train': 0.7278133630752563} -11/07/2021 01:14:32 - INFO - __main__ - Step 28680: {'lr': 0.00046097101272000454, 'samples': 5506560, 'steps': 28679, 'loss/train': 2.0719168186187744} -11/07/2021 01:14:33 - INFO - __main__ - Step 28681: {'lr': 0.0004609681654683329, 'samples': 5506752, 'steps': 28680, 'loss/train': 1.3236138820648193} -11/07/2021 01:14:33 - INFO - __main__ - Step 28682: {'lr': 0.0004609653181216024, 'samples': 5506944, 'steps': 28681, 'loss/train': 1.3993245363235474} -11/07/2021 01:14:33 - INFO - __main__ - Step 28683: {'lr': 0.0004609624706798141, 'samples': 5507136, 'steps': 28682, 'loss/train': 1.698938250541687} -11/07/2021 01:14:34 - INFO - __main__ - Step 28684: {'lr': 0.00046095962314296934, 'samples': 5507328, 'steps': 28683, 'loss/train': 1.4753496646881104} -11/07/2021 01:14:34 - INFO - __main__ - Step 28685: {'lr': 0.00046095677551106953, 'samples': 5507520, 'steps': 28684, 'loss/train': 1.476138710975647} -11/07/2021 01:14:35 - INFO - __main__ - Step 28686: {'lr': 0.00046095392778411576, 'samples': 5507712, 'steps': 28685, 'loss/train': 2.1143760681152344} -11/07/2021 01:14:35 - INFO - __main__ - Step 28687: {'lr': 0.0004609510799621095, 'samples': 5507904, 'steps': 28686, 'loss/train': 1.7127150297164917} -11/07/2021 01:14:36 - INFO - __main__ - Step 28688: {'lr': 0.0004609482320450519, 'samples': 5508096, 'steps': 28687, 'loss/train': 1.77858567237854} -11/07/2021 01:14:36 - INFO - __main__ - Step 28689: {'lr': 0.00046094538403294416, 'samples': 5508288, 'steps': 28688, 'loss/train': 1.3900631666183472} -11/07/2021 01:14:36 - INFO - __main__ - Step 28690: {'lr': 0.00046094253592578784, 'samples': 5508480, 'steps': 28689, 'loss/train': 1.9384557008743286} -11/07/2021 01:14:37 - INFO - __main__ - Step 28691: {'lr': 0.000460939687723584, 'samples': 5508672, 'steps': 28690, 'loss/train': 1.296342134475708} -11/07/2021 01:14:38 - INFO - __main__ - Step 28692: {'lr': 0.000460936839426334, 'samples': 5508864, 'steps': 28691, 'loss/train': 2.038013458251953} -11/07/2021 01:14:38 - INFO - __main__ - Step 28693: {'lr': 0.00046093399103403913, 'samples': 5509056, 'steps': 28692, 'loss/train': 1.3611464500427246} -11/07/2021 01:14:39 - INFO - __main__ - Step 28694: {'lr': 0.00046093114254670066, 'samples': 5509248, 'steps': 28693, 'loss/train': 0.881278395652771} -11/07/2021 01:14:39 - INFO - __main__ - Step 28695: {'lr': 0.0004609282939643199, 'samples': 5509440, 'steps': 28694, 'loss/train': 1.3509044647216797} -11/07/2021 01:14:39 - INFO - __main__ - Step 28696: {'lr': 0.00046092544528689806, 'samples': 5509632, 'steps': 28695, 'loss/train': 1.7343835830688477} -11/07/2021 01:14:40 - INFO - __main__ - Step 28697: {'lr': 0.0004609225965144365, 'samples': 5509824, 'steps': 28696, 'loss/train': 1.621491551399231} -11/07/2021 01:14:41 - INFO - __main__ - Step 28698: {'lr': 0.00046091974764693645, 'samples': 5510016, 'steps': 28697, 'loss/train': 1.771262764930725} -11/07/2021 01:14:41 - INFO - __main__ - Step 28699: {'lr': 0.0004609168986843992, 'samples': 5510208, 'steps': 28698, 'loss/train': 1.3424490690231323} -11/07/2021 01:14:41 - INFO - __main__ - Step 28700: {'lr': 0.000460914049626826, 'samples': 5510400, 'steps': 28699, 'loss/train': 1.46780526638031} -11/07/2021 01:14:42 - INFO - __main__ - Step 28701: {'lr': 0.0004609112004742183, 'samples': 5510592, 'steps': 28700, 'loss/train': 1.7891309261322021} -11/07/2021 01:14:43 - INFO - __main__ - Step 28702: {'lr': 0.0004609083512265773, 'samples': 5510784, 'steps': 28701, 'loss/train': 1.23452889919281} -11/07/2021 01:14:43 - INFO - __main__ - Step 28703: {'lr': 0.0004609055018839041, 'samples': 5510976, 'steps': 28702, 'loss/train': 1.4976916313171387} -11/07/2021 01:14:43 - INFO - __main__ - Step 28704: {'lr': 0.0004609026524462002, 'samples': 5511168, 'steps': 28703, 'loss/train': 1.540532112121582} -11/07/2021 01:14:44 - INFO - __main__ - Step 28705: {'lr': 0.00046089980291346685, 'samples': 5511360, 'steps': 28704, 'loss/train': 1.2702617645263672} -11/07/2021 01:14:44 - INFO - __main__ - Step 28706: {'lr': 0.00046089695328570523, 'samples': 5511552, 'steps': 28705, 'loss/train': 1.664182186126709} -11/07/2021 01:14:45 - INFO - __main__ - Step 28707: {'lr': 0.0004608941035629168, 'samples': 5511744, 'steps': 28706, 'loss/train': 1.796590805053711} -11/07/2021 01:14:45 - INFO - __main__ - Step 28708: {'lr': 0.0004608912537451027, 'samples': 5511936, 'steps': 28707, 'loss/train': 1.765599012374878} -11/07/2021 01:14:46 - INFO - __main__ - Step 28709: {'lr': 0.0004608884038322642, 'samples': 5512128, 'steps': 28708, 'loss/train': 1.7580174207687378} -11/07/2021 01:14:46 - INFO - __main__ - Step 28710: {'lr': 0.00046088555382440275, 'samples': 5512320, 'steps': 28709, 'loss/train': 1.446540117263794} -11/07/2021 01:14:46 - INFO - __main__ - Step 28711: {'lr': 0.0004608827037215194, 'samples': 5512512, 'steps': 28710, 'loss/train': 1.4470421075820923} -11/07/2021 01:14:47 - INFO - __main__ - Step 28712: {'lr': 0.0004608798535236156, 'samples': 5512704, 'steps': 28711, 'loss/train': 1.5437874794006348} -11/07/2021 01:14:48 - INFO - __main__ - Step 28713: {'lr': 0.0004608770032306926, 'samples': 5512896, 'steps': 28712, 'loss/train': 1.2525914907455444} -11/07/2021 01:14:48 - INFO - __main__ - Step 28714: {'lr': 0.0004608741528427517, 'samples': 5513088, 'steps': 28713, 'loss/train': 1.7943804264068604} -11/07/2021 01:14:48 - INFO - __main__ - Step 28715: {'lr': 0.0004608713023597941, 'samples': 5513280, 'steps': 28714, 'loss/train': 1.7214324474334717} -11/07/2021 01:14:49 - INFO - __main__ - Step 28716: {'lr': 0.00046086845178182123, 'samples': 5513472, 'steps': 28715, 'loss/train': 1.343458652496338} -11/07/2021 01:14:49 - INFO - __main__ - Step 28717: {'lr': 0.00046086560110883423, 'samples': 5513664, 'steps': 28716, 'loss/train': 1.327499270439148} -11/07/2021 01:14:50 - INFO - __main__ - Step 28718: {'lr': 0.00046086275034083453, 'samples': 5513856, 'steps': 28717, 'loss/train': 1.1367992162704468} -11/07/2021 01:14:51 - INFO - __main__ - Step 28719: {'lr': 0.00046085989947782327, 'samples': 5514048, 'steps': 28718, 'loss/train': 1.0489040613174438} -11/07/2021 01:14:51 - INFO - __main__ - Step 28720: {'lr': 0.00046085704851980174, 'samples': 5514240, 'steps': 28719, 'loss/train': 1.5698318481445312} -11/07/2021 01:14:51 - INFO - __main__ - Step 28721: {'lr': 0.00046085419746677136, 'samples': 5514432, 'steps': 28720, 'loss/train': 1.8643708229064941} -11/07/2021 01:14:52 - INFO - __main__ - Step 28722: {'lr': 0.00046085134631873326, 'samples': 5514624, 'steps': 28721, 'loss/train': 0.3820008933544159} -11/07/2021 01:14:53 - INFO - __main__ - Step 28723: {'lr': 0.0004608484950756888, 'samples': 5514816, 'steps': 28722, 'loss/train': 1.9114362001419067} -11/07/2021 01:14:53 - INFO - __main__ - Step 28724: {'lr': 0.0004608456437376393, 'samples': 5515008, 'steps': 28723, 'loss/train': 1.7168536186218262} -11/07/2021 01:14:54 - INFO - __main__ - Step 28725: {'lr': 0.000460842792304586, 'samples': 5515200, 'steps': 28724, 'loss/train': 1.5014718770980835} -11/07/2021 01:14:54 - INFO - __main__ - Step 28726: {'lr': 0.00046083994077653024, 'samples': 5515392, 'steps': 28725, 'loss/train': 1.781377911567688} -11/07/2021 01:14:54 - INFO - __main__ - Step 28727: {'lr': 0.0004608370891534732, 'samples': 5515584, 'steps': 28726, 'loss/train': 1.7531365156173706} -11/07/2021 01:14:55 - INFO - __main__ - Step 28728: {'lr': 0.0004608342374354162, 'samples': 5515776, 'steps': 28727, 'loss/train': 1.8156870603561401} -11/07/2021 01:14:56 - INFO - __main__ - Step 28729: {'lr': 0.0004608313856223606, 'samples': 5515968, 'steps': 28728, 'loss/train': 1.3125196695327759} -11/07/2021 01:14:56 - INFO - __main__ - Step 28730: {'lr': 0.00046082853371430754, 'samples': 5516160, 'steps': 28729, 'loss/train': 0.5172771215438843} -11/07/2021 01:14:56 - INFO - __main__ - Step 28731: {'lr': 0.0004608256817112585, 'samples': 5516352, 'steps': 28730, 'loss/train': 1.6598970890045166} -11/07/2021 01:14:57 - INFO - __main__ - Step 28732: {'lr': 0.00046082282961321466, 'samples': 5516544, 'steps': 28731, 'loss/train': 1.5800282955169678} -11/07/2021 01:14:57 - INFO - __main__ - Step 28733: {'lr': 0.00046081997742017725, 'samples': 5516736, 'steps': 28732, 'loss/train': 1.9237587451934814} -11/07/2021 01:14:58 - INFO - __main__ - Step 28734: {'lr': 0.00046081712513214757, 'samples': 5516928, 'steps': 28733, 'loss/train': 1.1939243078231812} -11/07/2021 01:14:59 - INFO - __main__ - Step 28735: {'lr': 0.0004608142727491271, 'samples': 5517120, 'steps': 28734, 'loss/train': 1.5787652730941772} -11/07/2021 01:14:59 - INFO - __main__ - Step 28736: {'lr': 0.00046081142027111683, 'samples': 5517312, 'steps': 28735, 'loss/train': 1.1781924962997437} -11/07/2021 01:14:59 - INFO - __main__ - Step 28737: {'lr': 0.0004608085676981182, 'samples': 5517504, 'steps': 28736, 'loss/train': 1.891564965248108} -11/07/2021 01:15:00 - INFO - __main__ - Step 28738: {'lr': 0.0004608057150301326, 'samples': 5517696, 'steps': 28737, 'loss/train': 0.9074145555496216} -11/07/2021 01:15:01 - INFO - __main__ - Step 28739: {'lr': 0.00046080286226716106, 'samples': 5517888, 'steps': 28738, 'loss/train': 1.5400950908660889} -11/07/2021 01:15:01 - INFO - __main__ - Step 28740: {'lr': 0.00046080000940920506, 'samples': 5518080, 'steps': 28739, 'loss/train': 1.1455605030059814} -11/07/2021 01:15:02 - INFO - __main__ - Step 28741: {'lr': 0.00046079715645626584, 'samples': 5518272, 'steps': 28740, 'loss/train': 1.4673417806625366} -11/07/2021 01:15:02 - INFO - __main__ - Step 28742: {'lr': 0.00046079430340834467, 'samples': 5518464, 'steps': 28741, 'loss/train': 1.6762181520462036} -11/07/2021 01:15:03 - INFO - __main__ - Step 28743: {'lr': 0.00046079145026544277, 'samples': 5518656, 'steps': 28742, 'loss/train': 1.453457236289978} -11/07/2021 01:15:04 - INFO - __main__ - Step 28744: {'lr': 0.0004607885970275616, 'samples': 5518848, 'steps': 28743, 'loss/train': 0.2404089868068695} -11/07/2021 01:15:04 - INFO - __main__ - Step 28745: {'lr': 0.0004607857436947023, 'samples': 5519040, 'steps': 28744, 'loss/train': 1.8219144344329834} -11/07/2021 01:15:04 - INFO - __main__ - Step 28746: {'lr': 0.00046078289026686616, 'samples': 5519232, 'steps': 28745, 'loss/train': 1.8101202249526978} -11/07/2021 01:15:05 - INFO - __main__ - Step 28747: {'lr': 0.00046078003674405457, 'samples': 5519424, 'steps': 28746, 'loss/train': 1.357011079788208} -11/07/2021 01:15:05 - INFO - __main__ - Step 28748: {'lr': 0.0004607771831262687, 'samples': 5519616, 'steps': 28747, 'loss/train': 1.8157292604446411} -11/07/2021 01:15:06 - INFO - __main__ - Step 28749: {'lr': 0.00046077432941350993, 'samples': 5519808, 'steps': 28748, 'loss/train': 1.8717877864837646} -11/07/2021 01:15:06 - INFO - __main__ - Step 28750: {'lr': 0.00046077147560577943, 'samples': 5520000, 'steps': 28749, 'loss/train': 1.5922538042068481} -11/07/2021 01:15:07 - INFO - __main__ - Step 28751: {'lr': 0.0004607686217030786, 'samples': 5520192, 'steps': 28750, 'loss/train': 2.1468424797058105} -11/07/2021 01:15:07 - INFO - __main__ - Step 28752: {'lr': 0.00046076576770540865, 'samples': 5520384, 'steps': 28751, 'loss/train': 1.7125825881958008} -11/07/2021 01:15:08 - INFO - __main__ - Step 28753: {'lr': 0.00046076291361277097, 'samples': 5520576, 'steps': 28752, 'loss/train': 1.5815342664718628} -11/07/2021 01:15:08 - INFO - __main__ - Step 28754: {'lr': 0.00046076005942516666, 'samples': 5520768, 'steps': 28753, 'loss/train': 1.7074263095855713} -11/07/2021 01:15:09 - INFO - __main__ - Step 28755: {'lr': 0.0004607572051425972, 'samples': 5520960, 'steps': 28754, 'loss/train': 2.52258563041687} -11/07/2021 01:15:09 - INFO - __main__ - Step 28756: {'lr': 0.00046075435076506376, 'samples': 5521152, 'steps': 28755, 'loss/train': 1.4358375072479248} -11/07/2021 01:15:10 - INFO - __main__ - Step 28757: {'lr': 0.0004607514962925677, 'samples': 5521344, 'steps': 28756, 'loss/train': 1.3483976125717163} -11/07/2021 01:15:10 - INFO - __main__ - Step 28758: {'lr': 0.00046074864172511025, 'samples': 5521536, 'steps': 28757, 'loss/train': 1.3330392837524414} -11/07/2021 01:15:10 - INFO - __main__ - Step 28759: {'lr': 0.0004607457870626928, 'samples': 5521728, 'steps': 28758, 'loss/train': 2.126948118209839} -11/07/2021 01:15:11 - INFO - __main__ - Step 28760: {'lr': 0.0004607429323053164, 'samples': 5521920, 'steps': 28759, 'loss/train': 1.9364488124847412} -11/07/2021 01:15:12 - INFO - __main__ - Step 28761: {'lr': 0.0004607400774529825, 'samples': 5522112, 'steps': 28760, 'loss/train': 1.7834445238113403} -11/07/2021 01:15:12 - INFO - __main__ - Step 28762: {'lr': 0.0004607372225056925, 'samples': 5522304, 'steps': 28761, 'loss/train': 1.589208960533142} -11/07/2021 01:15:12 - INFO - __main__ - Step 28763: {'lr': 0.00046073436746344744, 'samples': 5522496, 'steps': 28762, 'loss/train': 1.5198677778244019} -11/07/2021 01:15:13 - INFO - __main__ - Step 28764: {'lr': 0.0004607315123262488, 'samples': 5522688, 'steps': 28763, 'loss/train': 1.6237186193466187} -11/07/2021 01:15:14 - INFO - __main__ - Step 28765: {'lr': 0.0004607286570940977, 'samples': 5522880, 'steps': 28764, 'loss/train': 0.8403159379959106} -11/07/2021 01:15:14 - INFO - __main__ - Step 28766: {'lr': 0.0004607258017669956, 'samples': 5523072, 'steps': 28765, 'loss/train': 1.419538140296936} -11/07/2021 01:15:15 - INFO - __main__ - Step 28767: {'lr': 0.0004607229463449437, 'samples': 5523264, 'steps': 28766, 'loss/train': 1.5430967807769775} -11/07/2021 01:15:15 - INFO - __main__ - Step 28768: {'lr': 0.00046072009082794333, 'samples': 5523456, 'steps': 28767, 'loss/train': 1.846705436706543} -11/07/2021 01:15:15 - INFO - __main__ - Step 28769: {'lr': 0.00046071723521599563, 'samples': 5523648, 'steps': 28768, 'loss/train': 1.8131253719329834} -11/07/2021 01:15:16 - INFO - __main__ - Step 28770: {'lr': 0.000460714379509102, 'samples': 5523840, 'steps': 28769, 'loss/train': 1.3720142841339111} -11/07/2021 01:15:17 - INFO - __main__ - Step 28771: {'lr': 0.0004607115237072638, 'samples': 5524032, 'steps': 28770, 'loss/train': 1.7073737382888794} -11/07/2021 01:15:17 - INFO - __main__ - Step 28772: {'lr': 0.00046070866781048225, 'samples': 5524224, 'steps': 28771, 'loss/train': 1.6079767942428589} -11/07/2021 01:15:17 - INFO - __main__ - Step 28773: {'lr': 0.0004607058118187586, 'samples': 5524416, 'steps': 28772, 'loss/train': 1.6379915475845337} -11/07/2021 01:15:18 - INFO - __main__ - Step 28774: {'lr': 0.00046070295573209406, 'samples': 5524608, 'steps': 28773, 'loss/train': 1.3397719860076904} -11/07/2021 01:15:18 - INFO - __main__ - Step 28775: {'lr': 0.00046070009955049017, 'samples': 5524800, 'steps': 28774, 'loss/train': 1.4922139644622803} -11/07/2021 01:15:19 - INFO - __main__ - Step 28776: {'lr': 0.000460697243273948, 'samples': 5524992, 'steps': 28775, 'loss/train': 1.7376784086227417} -11/07/2021 01:15:19 - INFO - __main__ - Step 28777: {'lr': 0.0004606943869024689, 'samples': 5525184, 'steps': 28776, 'loss/train': 1.3660744428634644} -11/07/2021 01:15:20 - INFO - __main__ - Step 28778: {'lr': 0.0004606915304360542, 'samples': 5525376, 'steps': 28777, 'loss/train': 1.768597960472107} -11/07/2021 01:15:20 - INFO - __main__ - Step 28779: {'lr': 0.00046068867387470507, 'samples': 5525568, 'steps': 28778, 'loss/train': 1.5304911136627197} -11/07/2021 01:15:20 - INFO - __main__ - Step 28780: {'lr': 0.00046068581721842294, 'samples': 5525760, 'steps': 28779, 'loss/train': 1.5088049173355103} -11/07/2021 01:15:22 - INFO - __main__ - Step 28781: {'lr': 0.00046068296046720904, 'samples': 5525952, 'steps': 28780, 'loss/train': 1.3194479942321777} -11/07/2021 01:15:22 - INFO - __main__ - Step 28782: {'lr': 0.0004606801036210646, 'samples': 5526144, 'steps': 28781, 'loss/train': 1.318917155265808} -11/07/2021 01:15:22 - INFO - __main__ - Step 28783: {'lr': 0.000460677246679991, 'samples': 5526336, 'steps': 28782, 'loss/train': 1.745903491973877} -11/07/2021 01:15:23 - INFO - __main__ - Step 28784: {'lr': 0.00046067438964398944, 'samples': 5526528, 'steps': 28783, 'loss/train': 1.8044811487197876} -11/07/2021 01:15:23 - INFO - __main__ - Step 28785: {'lr': 0.00046067153251306127, 'samples': 5526720, 'steps': 28784, 'loss/train': 1.8561345338821411} -11/07/2021 01:15:23 - INFO - __main__ - Step 28786: {'lr': 0.0004606686752872078, 'samples': 5526912, 'steps': 28785, 'loss/train': 0.1970166563987732} -11/07/2021 01:15:24 - INFO - __main__ - Step 28787: {'lr': 0.0004606658179664302, 'samples': 5527104, 'steps': 28786, 'loss/train': 1.122194528579712} -11/07/2021 01:15:25 - INFO - __main__ - Step 28788: {'lr': 0.00046066296055072986, 'samples': 5527296, 'steps': 28787, 'loss/train': 1.4112536907196045} -11/07/2021 01:15:25 - INFO - __main__ - Step 28789: {'lr': 0.0004606601030401081, 'samples': 5527488, 'steps': 28788, 'loss/train': 1.6186010837554932} -11/07/2021 01:15:26 - INFO - __main__ - Step 28790: {'lr': 0.0004606572454345661, 'samples': 5527680, 'steps': 28789, 'loss/train': 1.6745975017547607} -11/07/2021 01:15:26 - INFO - __main__ - Step 28791: {'lr': 0.0004606543877341052, 'samples': 5527872, 'steps': 28790, 'loss/train': 1.5834710597991943} -11/07/2021 01:15:27 - INFO - __main__ - Step 28792: {'lr': 0.00046065152993872665, 'samples': 5528064, 'steps': 28791, 'loss/train': 1.9523475170135498} -11/07/2021 01:15:27 - INFO - __main__ - Step 28793: {'lr': 0.0004606486720484318, 'samples': 5528256, 'steps': 28792, 'loss/train': 1.4230964183807373} -11/07/2021 01:15:28 - INFO - __main__ - Step 28794: {'lr': 0.0004606458140632219, 'samples': 5528448, 'steps': 28793, 'loss/train': 1.6033148765563965} -11/07/2021 01:15:28 - INFO - __main__ - Step 28795: {'lr': 0.0004606429559830982, 'samples': 5528640, 'steps': 28794, 'loss/train': 1.8930948972702026} -11/07/2021 01:15:28 - INFO - __main__ - Step 28796: {'lr': 0.00046064009780806217, 'samples': 5528832, 'steps': 28795, 'loss/train': 1.2086946964263916} -11/07/2021 01:15:29 - INFO - __main__ - Step 28797: {'lr': 0.0004606372395381149, 'samples': 5529024, 'steps': 28796, 'loss/train': 1.422204852104187} -11/07/2021 01:15:30 - INFO - __main__ - Step 28798: {'lr': 0.0004606343811732577, 'samples': 5529216, 'steps': 28797, 'loss/train': 1.636315941810608} -11/07/2021 01:15:30 - INFO - __main__ - Step 28799: {'lr': 0.0004606315227134919, 'samples': 5529408, 'steps': 28798, 'loss/train': 1.4297635555267334} -11/07/2021 01:15:30 - INFO - __main__ - Step 28800: {'lr': 0.0004606286641588188, 'samples': 5529600, 'steps': 28799, 'loss/train': 1.58151113986969} -11/07/2021 01:15:31 - INFO - __main__ - Step 28801: {'lr': 0.0004606258055092397, 'samples': 5529792, 'steps': 28800, 'loss/train': 1.6272387504577637} -11/07/2021 01:15:32 - INFO - __main__ - Step 28802: {'lr': 0.00046062294676475584, 'samples': 5529984, 'steps': 28801, 'loss/train': 1.5560965538024902} -11/07/2021 01:15:32 - INFO - __main__ - Step 28803: {'lr': 0.0004606200879253685, 'samples': 5530176, 'steps': 28802, 'loss/train': 1.6053823232650757} -11/07/2021 01:15:33 - INFO - __main__ - Step 28804: {'lr': 0.00046061722899107905, 'samples': 5530368, 'steps': 28803, 'loss/train': 0.8932515978813171} -11/07/2021 01:15:33 - INFO - __main__ - Step 28805: {'lr': 0.0004606143699618888, 'samples': 5530560, 'steps': 28804, 'loss/train': 0.1487438976764679} -11/07/2021 01:15:33 - INFO - __main__ - Step 28806: {'lr': 0.00046061151083779886, 'samples': 5530752, 'steps': 28805, 'loss/train': 1.1285860538482666} -11/07/2021 01:15:34 - INFO - __main__ - Step 28807: {'lr': 0.0004606086516188106, 'samples': 5530944, 'steps': 28806, 'loss/train': 0.792855441570282} -11/07/2021 01:15:35 - INFO - __main__ - Step 28808: {'lr': 0.00046060579230492533, 'samples': 5531136, 'steps': 28807, 'loss/train': 1.6321196556091309} -11/07/2021 01:15:35 - INFO - __main__ - Step 28809: {'lr': 0.0004606029328961444, 'samples': 5531328, 'steps': 28808, 'loss/train': 0.44900208711624146} -11/07/2021 01:15:36 - INFO - __main__ - Step 28810: {'lr': 0.000460600073392469, 'samples': 5531520, 'steps': 28809, 'loss/train': 0.22598089277744293} -11/07/2021 01:15:36 - INFO - __main__ - Step 28811: {'lr': 0.00046059721379390053, 'samples': 5531712, 'steps': 28810, 'loss/train': 2.1848089694976807} -11/07/2021 01:15:36 - INFO - __main__ - Step 28812: {'lr': 0.0004605943541004401, 'samples': 5531904, 'steps': 28811, 'loss/train': 2.273839235305786} -11/07/2021 01:15:38 - INFO - __main__ - Step 28813: {'lr': 0.00046059149431208914, 'samples': 5532096, 'steps': 28812, 'loss/train': 1.8862618207931519} -11/07/2021 01:15:38 - INFO - __main__ - Step 28814: {'lr': 0.0004605886344288489, 'samples': 5532288, 'steps': 28813, 'loss/train': 1.0264168977737427} -11/07/2021 01:15:38 - INFO - __main__ - Step 28815: {'lr': 0.0004605857744507207, 'samples': 5532480, 'steps': 28814, 'loss/train': 1.2002111673355103} -11/07/2021 01:15:39 - INFO - __main__ - Step 28816: {'lr': 0.00046058291437770584, 'samples': 5532672, 'steps': 28815, 'loss/train': 1.7769715785980225} -11/07/2021 01:15:39 - INFO - __main__ - Step 28817: {'lr': 0.0004605800542098054, 'samples': 5532864, 'steps': 28816, 'loss/train': 1.6534240245819092} -11/07/2021 01:15:40 - INFO - __main__ - Step 28818: {'lr': 0.00046057719394702103, 'samples': 5533056, 'steps': 28817, 'loss/train': 1.4326366186141968} -11/07/2021 01:15:40 - INFO - __main__ - Step 28819: {'lr': 0.00046057433358935373, 'samples': 5533248, 'steps': 28818, 'loss/train': 1.4733604192733765} -11/07/2021 01:15:41 - INFO - __main__ - Step 28820: {'lr': 0.0004605714731368049, 'samples': 5533440, 'steps': 28819, 'loss/train': 1.6320061683654785} -11/07/2021 01:15:41 - INFO - __main__ - Step 28821: {'lr': 0.0004605686125893758, 'samples': 5533632, 'steps': 28820, 'loss/train': 1.660555124282837} -11/07/2021 01:15:41 - INFO - __main__ - Step 28822: {'lr': 0.00046056575194706773, 'samples': 5533824, 'steps': 28821, 'loss/train': 1.3864659070968628} -11/07/2021 01:15:42 - INFO - __main__ - Step 28823: {'lr': 0.000460562891209882, 'samples': 5534016, 'steps': 28822, 'loss/train': 1.2763863801956177} -11/07/2021 01:15:43 - INFO - __main__ - Step 28824: {'lr': 0.0004605600303778199, 'samples': 5534208, 'steps': 28823, 'loss/train': 1.6745431423187256} -11/07/2021 01:15:43 - INFO - __main__ - Step 28825: {'lr': 0.0004605571694508827, 'samples': 5534400, 'steps': 28824, 'loss/train': 1.4444369077682495} -11/07/2021 01:15:44 - INFO - __main__ - Step 28826: {'lr': 0.0004605543084290716, 'samples': 5534592, 'steps': 28825, 'loss/train': 1.4224810600280762} -11/07/2021 01:15:44 - INFO - __main__ - Step 28827: {'lr': 0.00046055144731238805, 'samples': 5534784, 'steps': 28826, 'loss/train': 1.407976746559143} -11/07/2021 01:15:45 - INFO - __main__ - Step 28828: {'lr': 0.00046054858610083325, 'samples': 5534976, 'steps': 28827, 'loss/train': 3.1830976009368896} -11/07/2021 01:15:45 - INFO - __main__ - Step 28829: {'lr': 0.0004605457247944086, 'samples': 5535168, 'steps': 28828, 'loss/train': 1.439624309539795} -11/07/2021 01:15:46 - INFO - __main__ - Step 28830: {'lr': 0.0004605428633931152, 'samples': 5535360, 'steps': 28829, 'loss/train': 1.4871230125427246} -11/07/2021 01:15:46 - INFO - __main__ - Step 28831: {'lr': 0.00046054000189695444, 'samples': 5535552, 'steps': 28830, 'loss/train': 1.4554721117019653} -11/07/2021 01:15:46 - INFO - __main__ - Step 28832: {'lr': 0.00046053714030592764, 'samples': 5535744, 'steps': 28831, 'loss/train': 1.7599273920059204} -11/07/2021 01:15:47 - INFO - __main__ - Step 28833: {'lr': 0.0004605342786200359, 'samples': 5535936, 'steps': 28832, 'loss/train': 1.0530322790145874} -11/07/2021 01:15:48 - INFO - __main__ - Step 28834: {'lr': 0.0004605314168392809, 'samples': 5536128, 'steps': 28833, 'loss/train': 1.3571157455444336} -11/07/2021 01:15:48 - INFO - __main__ - Step 28835: {'lr': 0.00046052855496366354, 'samples': 5536320, 'steps': 28834, 'loss/train': 1.7880867719650269} -11/07/2021 01:15:48 - INFO - __main__ - Step 28836: {'lr': 0.0004605256929931853, 'samples': 5536512, 'steps': 28835, 'loss/train': 1.3933273553848267} -11/07/2021 01:15:49 - INFO - __main__ - Step 28837: {'lr': 0.0004605228309278474, 'samples': 5536704, 'steps': 28836, 'loss/train': 1.5931357145309448} -11/07/2021 01:15:49 - INFO - __main__ - Step 28838: {'lr': 0.0004605199687676512, 'samples': 5536896, 'steps': 28837, 'loss/train': 1.2500851154327393} -11/07/2021 01:15:50 - INFO - __main__ - Step 28839: {'lr': 0.00046051710651259797, 'samples': 5537088, 'steps': 28838, 'loss/train': 1.5644257068634033} -11/07/2021 01:15:51 - INFO - __main__ - Step 28840: {'lr': 0.00046051424416268896, 'samples': 5537280, 'steps': 28839, 'loss/train': 1.6065336465835571} -11/07/2021 01:15:51 - INFO - __main__ - Step 28841: {'lr': 0.0004605113817179255, 'samples': 5537472, 'steps': 28840, 'loss/train': 1.748841404914856} -11/07/2021 01:15:51 - INFO - __main__ - Step 28842: {'lr': 0.00046050851917830884, 'samples': 5537664, 'steps': 28841, 'loss/train': 1.69772207736969} -11/07/2021 01:15:52 - INFO - __main__ - Step 28843: {'lr': 0.00046050565654384023, 'samples': 5537856, 'steps': 28842, 'loss/train': 1.5625964403152466} -11/07/2021 01:15:53 - INFO - __main__ - Step 28844: {'lr': 0.0004605027938145211, 'samples': 5538048, 'steps': 28843, 'loss/train': 0.6934532523155212} -11/07/2021 01:15:53 - INFO - __main__ - Step 28845: {'lr': 0.0004604999309903526, 'samples': 5538240, 'steps': 28844, 'loss/train': 1.4595178365707397} -11/07/2021 01:15:53 - INFO - __main__ - Step 28846: {'lr': 0.0004604970680713362, 'samples': 5538432, 'steps': 28845, 'loss/train': 1.1132322549819946} -11/07/2021 01:15:54 - INFO - __main__ - Step 28847: {'lr': 0.00046049420505747294, 'samples': 5538624, 'steps': 28846, 'loss/train': 1.3030951023101807} -11/07/2021 01:15:54 - INFO - __main__ - Step 28848: {'lr': 0.0004604913419487643, 'samples': 5538816, 'steps': 28847, 'loss/train': 1.7613273859024048} -11/07/2021 01:15:55 - INFO - __main__ - Step 28849: {'lr': 0.00046048847874521144, 'samples': 5539008, 'steps': 28848, 'loss/train': 1.3294694423675537} -11/07/2021 01:15:56 - INFO - __main__ - Step 28850: {'lr': 0.00046048561544681575, 'samples': 5539200, 'steps': 28849, 'loss/train': 1.4349967241287231} -11/07/2021 01:15:56 - INFO - __main__ - Step 28851: {'lr': 0.00046048275205357855, 'samples': 5539392, 'steps': 28850, 'loss/train': 0.1284380406141281} -11/07/2021 01:15:56 - INFO - __main__ - Step 28852: {'lr': 0.00046047988856550104, 'samples': 5539584, 'steps': 28851, 'loss/train': 1.5595612525939941} -11/07/2021 01:15:57 - INFO - __main__ - Step 28853: {'lr': 0.00046047702498258446, 'samples': 5539776, 'steps': 28852, 'loss/train': 1.5112496614456177} -11/07/2021 01:15:58 - INFO - __main__ - Step 28854: {'lr': 0.00046047416130483033, 'samples': 5539968, 'steps': 28853, 'loss/train': 1.659077525138855} -11/07/2021 01:15:58 - INFO - __main__ - Step 28855: {'lr': 0.00046047129753223973, 'samples': 5540160, 'steps': 28854, 'loss/train': 1.7341511249542236} -11/07/2021 01:15:59 - INFO - __main__ - Step 28856: {'lr': 0.0004604684336648139, 'samples': 5540352, 'steps': 28855, 'loss/train': 1.5935263633728027} -11/07/2021 01:15:59 - INFO - __main__ - Step 28857: {'lr': 0.00046046556970255435, 'samples': 5540544, 'steps': 28856, 'loss/train': 1.6662061214447021} -11/07/2021 01:15:59 - INFO - __main__ - Step 28858: {'lr': 0.0004604627056454622, 'samples': 5540736, 'steps': 28857, 'loss/train': 1.6770565509796143} -11/07/2021 01:16:00 - INFO - __main__ - Step 28859: {'lr': 0.00046045984149353894, 'samples': 5540928, 'steps': 28858, 'loss/train': 1.8274426460266113} -11/07/2021 01:16:01 - INFO - __main__ - Step 28860: {'lr': 0.0004604569772467856, 'samples': 5541120, 'steps': 28859, 'loss/train': 1.324919581413269} -11/07/2021 01:16:01 - INFO - __main__ - Step 28861: {'lr': 0.00046045411290520364, 'samples': 5541312, 'steps': 28860, 'loss/train': 1.090241551399231} -11/07/2021 01:16:01 - INFO - __main__ - Step 28862: {'lr': 0.00046045124846879427, 'samples': 5541504, 'steps': 28861, 'loss/train': 1.5456140041351318} -11/07/2021 01:16:02 - INFO - __main__ - Step 28863: {'lr': 0.00046044838393755885, 'samples': 5541696, 'steps': 28862, 'loss/train': 1.5965884923934937} -11/07/2021 01:16:02 - INFO - __main__ - Step 28864: {'lr': 0.00046044551931149856, 'samples': 5541888, 'steps': 28863, 'loss/train': 1.7188166379928589} -11/07/2021 01:16:03 - INFO - __main__ - Step 28865: {'lr': 0.0004604426545906149, 'samples': 5542080, 'steps': 28864, 'loss/train': 1.2183637619018555} -11/07/2021 01:16:03 - INFO - __main__ - Step 28866: {'lr': 0.0004604397897749089, 'samples': 5542272, 'steps': 28865, 'loss/train': 0.32164669036865234} -11/07/2021 01:16:04 - INFO - __main__ - Step 28867: {'lr': 0.00046043692486438207, 'samples': 5542464, 'steps': 28866, 'loss/train': 1.7163790464401245} -11/07/2021 01:16:04 - INFO - __main__ - Step 28868: {'lr': 0.00046043405985903555, 'samples': 5542656, 'steps': 28867, 'loss/train': 1.8655368089675903} -11/07/2021 01:16:04 - INFO - __main__ - Step 28869: {'lr': 0.00046043119475887073, 'samples': 5542848, 'steps': 28868, 'loss/train': 1.7012056112289429} -11/07/2021 01:16:06 - INFO - __main__ - Step 28870: {'lr': 0.0004604283295638888, 'samples': 5543040, 'steps': 28869, 'loss/train': 3.340463638305664} -11/07/2021 01:16:06 - INFO - __main__ - Step 28871: {'lr': 0.00046042546427409116, 'samples': 5543232, 'steps': 28870, 'loss/train': 1.3275420665740967} -11/07/2021 01:16:06 - INFO - __main__ - Step 28872: {'lr': 0.000460422598889479, 'samples': 5543424, 'steps': 28871, 'loss/train': 1.4772756099700928} -11/07/2021 01:16:07 - INFO - __main__ - Step 28873: {'lr': 0.0004604197334100537, 'samples': 5543616, 'steps': 28872, 'loss/train': 1.8350965976715088} -11/07/2021 01:16:07 - INFO - __main__ - Step 28874: {'lr': 0.0004604168678358166, 'samples': 5543808, 'steps': 28873, 'loss/train': 1.100998044013977} -11/07/2021 01:16:08 - INFO - __main__ - Step 28875: {'lr': 0.00046041400216676874, 'samples': 5544000, 'steps': 28874, 'loss/train': 1.4697104692459106} -11/07/2021 01:16:08 - INFO - __main__ - Step 28876: {'lr': 0.0004604111364029118, 'samples': 5544192, 'steps': 28875, 'loss/train': 1.0781641006469727} -11/07/2021 01:16:09 - INFO - __main__ - Step 28877: {'lr': 0.0004604082705442466, 'samples': 5544384, 'steps': 28876, 'loss/train': 1.4803532361984253} -11/07/2021 01:16:09 - INFO - __main__ - Step 28878: {'lr': 0.00046040540459077483, 'samples': 5544576, 'steps': 28877, 'loss/train': 1.636860966682434} -11/07/2021 01:16:09 - INFO - __main__ - Step 28879: {'lr': 0.0004604025385424976, 'samples': 5544768, 'steps': 28878, 'loss/train': 1.2803477048873901} -11/07/2021 01:16:10 - INFO - __main__ - Step 28880: {'lr': 0.00046039967239941626, 'samples': 5544960, 'steps': 28879, 'loss/train': 1.3108853101730347} -11/07/2021 01:16:11 - INFO - __main__ - Step 28881: {'lr': 0.000460396806161532, 'samples': 5545152, 'steps': 28880, 'loss/train': 1.2313545942306519} -11/07/2021 01:16:11 - INFO - __main__ - Step 28882: {'lr': 0.0004603939398288463, 'samples': 5545344, 'steps': 28881, 'loss/train': 1.4944992065429688} -11/07/2021 01:16:11 - INFO - __main__ - Step 28883: {'lr': 0.00046039107340136023, 'samples': 5545536, 'steps': 28882, 'loss/train': 1.5530414581298828} -11/07/2021 01:16:12 - INFO - __main__ - Step 28884: {'lr': 0.00046038820687907523, 'samples': 5545728, 'steps': 28883, 'loss/train': 1.3977794647216797} -11/07/2021 01:16:13 - INFO - __main__ - Step 28885: {'lr': 0.0004603853402619925, 'samples': 5545920, 'steps': 28884, 'loss/train': 1.6549947261810303} -11/07/2021 01:16:13 - INFO - __main__ - Step 28886: {'lr': 0.00046038247355011347, 'samples': 5546112, 'steps': 28885, 'loss/train': 1.4465737342834473} -11/07/2021 01:16:14 - INFO - __main__ - Step 28887: {'lr': 0.00046037960674343925, 'samples': 5546304, 'steps': 28886, 'loss/train': 1.5918290615081787} -11/07/2021 01:16:14 - INFO - __main__ - Step 28888: {'lr': 0.0004603767398419713, 'samples': 5546496, 'steps': 28887, 'loss/train': 1.016764760017395} -11/07/2021 01:16:14 - INFO - __main__ - Step 28889: {'lr': 0.0004603738728457109, 'samples': 5546688, 'steps': 28888, 'loss/train': 1.5167356729507446} -11/07/2021 01:16:15 - INFO - __main__ - Step 28890: {'lr': 0.0004603710057546592, 'samples': 5546880, 'steps': 28889, 'loss/train': 1.4391789436340332} -11/07/2021 01:16:16 - INFO - __main__ - Step 28891: {'lr': 0.0004603681385688175, 'samples': 5547072, 'steps': 28890, 'loss/train': 1.2934634685516357} -11/07/2021 01:16:16 - INFO - __main__ - Step 28892: {'lr': 0.00046036527128818724, 'samples': 5547264, 'steps': 28891, 'loss/train': 1.4205087423324585} -11/07/2021 01:16:16 - INFO - __main__ - Step 28893: {'lr': 0.0004603624039127696, 'samples': 5547456, 'steps': 28892, 'loss/train': 2.161067008972168} -11/07/2021 01:16:17 - INFO - __main__ - Step 28894: {'lr': 0.00046035953644256596, 'samples': 5547648, 'steps': 28893, 'loss/train': 1.1943391561508179} -11/07/2021 01:16:18 - INFO - __main__ - Step 28895: {'lr': 0.00046035666887757755, 'samples': 5547840, 'steps': 28894, 'loss/train': 1.3796454668045044} -11/07/2021 01:16:18 - INFO - __main__ - Step 28896: {'lr': 0.00046035380121780563, 'samples': 5548032, 'steps': 28895, 'loss/train': 1.6449450254440308} -11/07/2021 01:16:18 - INFO - __main__ - Step 28897: {'lr': 0.0004603509334632515, 'samples': 5548224, 'steps': 28896, 'loss/train': 1.3734986782073975} -11/07/2021 01:16:19 - INFO - __main__ - Step 28898: {'lr': 0.00046034806561391655, 'samples': 5548416, 'steps': 28897, 'loss/train': 1.2445614337921143} -11/07/2021 01:16:19 - INFO - __main__ - Step 28899: {'lr': 0.000460345197669802, 'samples': 5548608, 'steps': 28898, 'loss/train': 1.8080830574035645} -11/07/2021 01:16:20 - INFO - __main__ - Step 28900: {'lr': 0.0004603423296309092, 'samples': 5548800, 'steps': 28899, 'loss/train': 1.0341877937316895} -11/07/2021 01:16:21 - INFO - __main__ - Step 28901: {'lr': 0.0004603394614972393, 'samples': 5548992, 'steps': 28900, 'loss/train': 0.27347704768180847} -11/07/2021 01:16:21 - INFO - __main__ - Step 28902: {'lr': 0.00046033659326879373, 'samples': 5549184, 'steps': 28901, 'loss/train': 1.4428738355636597} -11/07/2021 01:16:21 - INFO - __main__ - Step 28903: {'lr': 0.00046033372494557373, 'samples': 5549376, 'steps': 28902, 'loss/train': 0.5731782913208008} -11/07/2021 01:16:22 - INFO - __main__ - Step 28904: {'lr': 0.00046033085652758053, 'samples': 5549568, 'steps': 28903, 'loss/train': 1.4512176513671875} -11/07/2021 01:16:22 - INFO - __main__ - Step 28905: {'lr': 0.00046032798801481564, 'samples': 5549760, 'steps': 28904, 'loss/train': 1.1815423965454102} -11/07/2021 01:16:23 - INFO - __main__ - Step 28906: {'lr': 0.0004603251194072801, 'samples': 5549952, 'steps': 28905, 'loss/train': 1.6696475744247437} -11/07/2021 01:16:23 - INFO - __main__ - Step 28907: {'lr': 0.0004603222507049754, 'samples': 5550144, 'steps': 28906, 'loss/train': 1.1920045614242554} -11/07/2021 01:16:24 - INFO - __main__ - Step 28908: {'lr': 0.00046031938190790254, 'samples': 5550336, 'steps': 28907, 'loss/train': 1.7647217512130737} -11/07/2021 01:16:24 - INFO - __main__ - Step 28909: {'lr': 0.0004603165130160633, 'samples': 5550528, 'steps': 28908, 'loss/train': 0.8402041792869568} -11/07/2021 01:16:24 - INFO - __main__ - Step 28910: {'lr': 0.0004603136440294584, 'samples': 5550720, 'steps': 28909, 'loss/train': 1.6364444494247437} -11/07/2021 01:16:25 - INFO - __main__ - Step 28911: {'lr': 0.0004603107749480896, 'samples': 5550912, 'steps': 28910, 'loss/train': 2.21443510055542} -11/07/2021 01:16:26 - INFO - __main__ - Step 28912: {'lr': 0.0004603079057719579, 'samples': 5551104, 'steps': 28911, 'loss/train': 1.697066068649292} -11/07/2021 01:16:26 - INFO - __main__ - Step 28913: {'lr': 0.0004603050365010648, 'samples': 5551296, 'steps': 28912, 'loss/train': 1.8834847211837769} -11/07/2021 01:16:26 - INFO - __main__ - Step 28914: {'lr': 0.00046030216713541147, 'samples': 5551488, 'steps': 28913, 'loss/train': 0.9854968786239624} -11/07/2021 01:16:27 - INFO - __main__ - Step 28915: {'lr': 0.00046029929767499924, 'samples': 5551680, 'steps': 28914, 'loss/train': 1.711262822151184} -11/07/2021 01:16:28 - INFO - __main__ - Step 28916: {'lr': 0.0004602964281198293, 'samples': 5551872, 'steps': 28915, 'loss/train': 1.4778679609298706} -11/07/2021 01:16:28 - INFO - __main__ - Step 28917: {'lr': 0.0004602935584699031, 'samples': 5552064, 'steps': 28916, 'loss/train': 1.2499537467956543} -11/07/2021 01:16:29 - INFO - __main__ - Step 28918: {'lr': 0.00046029068872522185, 'samples': 5552256, 'steps': 28917, 'loss/train': 1.4326282739639282} -11/07/2021 01:16:29 - INFO - __main__ - Step 28919: {'lr': 0.0004602878188857869, 'samples': 5552448, 'steps': 28918, 'loss/train': 1.5676058530807495} -11/07/2021 01:16:29 - INFO - __main__ - Step 28920: {'lr': 0.0004602849489515995, 'samples': 5552640, 'steps': 28919, 'loss/train': 1.5974217653274536} -11/07/2021 01:16:30 - INFO - __main__ - Step 28921: {'lr': 0.00046028207892266095, 'samples': 5552832, 'steps': 28920, 'loss/train': 1.2199342250823975} -11/07/2021 01:16:31 - INFO - __main__ - Step 28922: {'lr': 0.00046027920879897243, 'samples': 5553024, 'steps': 28921, 'loss/train': 1.4522511959075928} -11/07/2021 01:16:31 - INFO - __main__ - Step 28923: {'lr': 0.00046027633858053554, 'samples': 5553216, 'steps': 28922, 'loss/train': 2.157140016555786} -11/07/2021 01:16:31 - INFO - __main__ - Step 28924: {'lr': 0.0004602734682673512, 'samples': 5553408, 'steps': 28923, 'loss/train': 1.2557610273361206} -11/07/2021 01:16:32 - INFO - __main__ - Step 28925: {'lr': 0.0004602705978594209, 'samples': 5553600, 'steps': 28924, 'loss/train': 1.552826166152954} -11/07/2021 01:16:33 - INFO - __main__ - Step 28926: {'lr': 0.00046026772735674606, 'samples': 5553792, 'steps': 28925, 'loss/train': 1.3594396114349365} -11/07/2021 01:16:33 - INFO - __main__ - Step 28927: {'lr': 0.00046026485675932765, 'samples': 5553984, 'steps': 28926, 'loss/train': 1.2299970388412476} -11/07/2021 01:16:33 - INFO - __main__ - Step 28928: {'lr': 0.0004602619860671672, 'samples': 5554176, 'steps': 28927, 'loss/train': 1.5360386371612549} -11/07/2021 01:16:34 - INFO - __main__ - Step 28929: {'lr': 0.000460259115280266, 'samples': 5554368, 'steps': 28928, 'loss/train': 1.3246605396270752} -11/07/2021 01:16:34 - INFO - __main__ - Step 28930: {'lr': 0.00046025624439862523, 'samples': 5554560, 'steps': 28929, 'loss/train': 1.4679009914398193} -11/07/2021 01:16:35 - INFO - __main__ - Step 28931: {'lr': 0.0004602533734222463, 'samples': 5554752, 'steps': 28930, 'loss/train': 1.6778373718261719} -11/07/2021 01:16:35 - INFO - __main__ - Step 28932: {'lr': 0.00046025050235113036, 'samples': 5554944, 'steps': 28931, 'loss/train': 1.3062094449996948} -11/07/2021 01:16:36 - INFO - __main__ - Step 28933: {'lr': 0.00046024763118527885, 'samples': 5555136, 'steps': 28932, 'loss/train': 1.3774343729019165} -11/07/2021 01:16:36 - INFO - __main__ - Step 28934: {'lr': 0.00046024475992469295, 'samples': 5555328, 'steps': 28933, 'loss/train': 1.7465287446975708} -11/07/2021 01:16:36 - INFO - __main__ - Step 28935: {'lr': 0.0004602418885693741, 'samples': 5555520, 'steps': 28934, 'loss/train': 1.3427748680114746} -11/07/2021 01:16:38 - INFO - __main__ - Step 28936: {'lr': 0.0004602390171193234, 'samples': 5555712, 'steps': 28935, 'loss/train': 1.4913746118545532} -11/07/2021 01:16:38 - INFO - __main__ - Step 28937: {'lr': 0.0004602361455745423, 'samples': 5555904, 'steps': 28936, 'loss/train': 1.596330165863037} -11/07/2021 01:16:38 - INFO - __main__ - Step 28938: {'lr': 0.000460233273935032, 'samples': 5556096, 'steps': 28937, 'loss/train': 1.6190026998519897} -11/07/2021 01:16:39 - INFO - __main__ - Step 28939: {'lr': 0.00046023040220079383, 'samples': 5556288, 'steps': 28938, 'loss/train': 0.8826161026954651} -11/07/2021 01:16:39 - INFO - __main__ - Step 28940: {'lr': 0.00046022753037182915, 'samples': 5556480, 'steps': 28939, 'loss/train': 1.280436635017395} -11/07/2021 01:16:39 - INFO - __main__ - Step 28941: {'lr': 0.0004602246584481391, 'samples': 5556672, 'steps': 28940, 'loss/train': 1.4741681814193726} -11/07/2021 01:16:41 - INFO - __main__ - Step 28942: {'lr': 0.00046022178642972513, 'samples': 5556864, 'steps': 28941, 'loss/train': 1.4609594345092773} -11/07/2021 01:16:41 - INFO - __main__ - Step 28943: {'lr': 0.00046021891431658845, 'samples': 5557056, 'steps': 28942, 'loss/train': 1.2200900316238403} -11/07/2021 01:16:41 - INFO - __main__ - Step 28944: {'lr': 0.00046021604210873035, 'samples': 5557248, 'steps': 28943, 'loss/train': 1.5990513563156128} -11/07/2021 01:16:42 - INFO - __main__ - Step 28945: {'lr': 0.0004602131698061521, 'samples': 5557440, 'steps': 28944, 'loss/train': 2.0704479217529297} -11/07/2021 01:16:42 - INFO - __main__ - Step 28946: {'lr': 0.0004602102974088551, 'samples': 5557632, 'steps': 28945, 'loss/train': 1.6211740970611572} -11/07/2021 01:16:42 - INFO - __main__ - Step 28947: {'lr': 0.00046020742491684067, 'samples': 5557824, 'steps': 28946, 'loss/train': 1.4822145700454712} -11/07/2021 01:16:45 - INFO - __main__ - Step 28948: {'lr': 0.0004602045523301099, 'samples': 5558016, 'steps': 28947, 'loss/train': 0.5823309421539307} -11/07/2021 01:16:45 - INFO - __main__ - Step 28949: {'lr': 0.0004602016796486642, 'samples': 5558208, 'steps': 28948, 'loss/train': 1.7212554216384888} -11/07/2021 01:16:45 - INFO - __main__ - Step 28950: {'lr': 0.00046019880687250494, 'samples': 5558400, 'steps': 28949, 'loss/train': 1.8272355794906616} -11/07/2021 01:16:46 - INFO - __main__ - Step 28951: {'lr': 0.0004601959340016333, 'samples': 5558592, 'steps': 28950, 'loss/train': 1.1154563426971436} -11/07/2021 01:16:46 - INFO - __main__ - Step 28952: {'lr': 0.0004601930610360506, 'samples': 5558784, 'steps': 28951, 'loss/train': 1.3865123987197876} -11/07/2021 01:16:47 - INFO - __main__ - Step 28953: {'lr': 0.0004601901879757582, 'samples': 5558976, 'steps': 28952, 'loss/train': 1.8884626626968384} -11/07/2021 01:16:47 - INFO - __main__ - Step 28954: {'lr': 0.0004601873148207573, 'samples': 5559168, 'steps': 28953, 'loss/train': 1.8347766399383545} -11/07/2021 01:16:47 - INFO - __main__ - Step 28955: {'lr': 0.00046018444157104924, 'samples': 5559360, 'steps': 28954, 'loss/train': 1.8239595890045166} -11/07/2021 01:16:48 - INFO - __main__ - Step 28956: {'lr': 0.0004601815682266353, 'samples': 5559552, 'steps': 28955, 'loss/train': 1.7957842350006104} -11/07/2021 01:16:49 - INFO - __main__ - Step 28957: {'lr': 0.00046017869478751685, 'samples': 5559744, 'steps': 28956, 'loss/train': 2.1072323322296143} -11/07/2021 01:16:49 - INFO - __main__ - Step 28958: {'lr': 0.00046017582125369505, 'samples': 5559936, 'steps': 28957, 'loss/train': 1.7136385440826416} -11/07/2021 01:16:49 - INFO - __main__ - Step 28959: {'lr': 0.00046017294762517127, 'samples': 5560128, 'steps': 28958, 'loss/train': 1.5811877250671387} -11/07/2021 01:16:50 - INFO - __main__ - Step 28960: {'lr': 0.0004601700739019469, 'samples': 5560320, 'steps': 28959, 'loss/train': 1.454060673713684} -11/07/2021 01:16:51 - INFO - __main__ - Step 28961: {'lr': 0.000460167200084023, 'samples': 5560512, 'steps': 28960, 'loss/train': 1.2183918952941895} -11/07/2021 01:16:51 - INFO - __main__ - Step 28962: {'lr': 0.00046016432617140113, 'samples': 5560704, 'steps': 28961, 'loss/train': 1.2029508352279663} -11/07/2021 01:16:52 - INFO - __main__ - Step 28963: {'lr': 0.0004601614521640824, 'samples': 5560896, 'steps': 28962, 'loss/train': 0.5521527528762817} -11/07/2021 01:16:52 - INFO - __main__ - Step 28964: {'lr': 0.00046015857806206816, 'samples': 5561088, 'steps': 28963, 'loss/train': 1.4131869077682495} -11/07/2021 01:16:52 - INFO - __main__ - Step 28965: {'lr': 0.0004601557038653597, 'samples': 5561280, 'steps': 28964, 'loss/train': 1.6671829223632812} -11/07/2021 01:16:54 - INFO - __main__ - Step 28966: {'lr': 0.0004601528295739583, 'samples': 5561472, 'steps': 28965, 'loss/train': 1.7216248512268066} -11/07/2021 01:16:54 - INFO - __main__ - Step 28967: {'lr': 0.00046014995518786536, 'samples': 5561664, 'steps': 28966, 'loss/train': 1.4837855100631714} -11/07/2021 01:16:54 - INFO - __main__ - Step 28968: {'lr': 0.000460147080707082, 'samples': 5561856, 'steps': 28967, 'loss/train': 1.7088741064071655} -11/07/2021 01:16:55 - INFO - __main__ - Step 28969: {'lr': 0.00046014420613160967, 'samples': 5562048, 'steps': 28968, 'loss/train': 1.698925256729126} -11/07/2021 01:16:55 - INFO - __main__ - Step 28970: {'lr': 0.00046014133146144966, 'samples': 5562240, 'steps': 28969, 'loss/train': 2.0839052200317383} -11/07/2021 01:16:55 - INFO - __main__ - Step 28971: {'lr': 0.0004601384566966031, 'samples': 5562432, 'steps': 28970, 'loss/train': 2.054642915725708} -11/07/2021 01:16:57 - INFO - __main__ - Step 28972: {'lr': 0.0004601355818370714, 'samples': 5562624, 'steps': 28971, 'loss/train': 1.8072031736373901} -11/07/2021 01:16:57 - INFO - __main__ - Step 28973: {'lr': 0.0004601327068828559, 'samples': 5562816, 'steps': 28972, 'loss/train': 1.22524893283844} -11/07/2021 01:16:57 - INFO - __main__ - Step 28974: {'lr': 0.0004601298318339578, 'samples': 5563008, 'steps': 28973, 'loss/train': 1.5835840702056885} -11/07/2021 01:16:58 - INFO - __main__ - Step 28975: {'lr': 0.0004601269566903785, 'samples': 5563200, 'steps': 28974, 'loss/train': 1.7203696966171265} -11/07/2021 01:16:58 - INFO - __main__ - Step 28976: {'lr': 0.0004601240814521192, 'samples': 5563392, 'steps': 28975, 'loss/train': 1.3847191333770752} -11/07/2021 01:16:59 - INFO - __main__ - Step 28977: {'lr': 0.00046012120611918126, 'samples': 5563584, 'steps': 28976, 'loss/train': 1.4361244440078735} -11/07/2021 01:16:59 - INFO - __main__ - Step 28978: {'lr': 0.0004601183306915659, 'samples': 5563776, 'steps': 28977, 'loss/train': 1.4285329580307007} -11/07/2021 01:17:00 - INFO - __main__ - Step 28979: {'lr': 0.0004601154551692745, 'samples': 5563968, 'steps': 28978, 'loss/train': 1.5221688747406006} -11/07/2021 01:17:00 - INFO - __main__ - Step 28980: {'lr': 0.00046011257955230826, 'samples': 5564160, 'steps': 28979, 'loss/train': 1.8839620351791382} -11/07/2021 01:17:00 - INFO - __main__ - Step 28981: {'lr': 0.00046010970384066863, 'samples': 5564352, 'steps': 28980, 'loss/train': 1.4196536540985107} -11/07/2021 01:17:02 - INFO - __main__ - Step 28982: {'lr': 0.00046010682803435674, 'samples': 5564544, 'steps': 28981, 'loss/train': 1.8078101873397827} -11/07/2021 01:17:02 - INFO - __main__ - Step 28983: {'lr': 0.000460103952133374, 'samples': 5564736, 'steps': 28982, 'loss/train': 1.357619285583496} -11/07/2021 01:17:02 - INFO - __main__ - Step 28984: {'lr': 0.00046010107613772154, 'samples': 5564928, 'steps': 28983, 'loss/train': 1.4675019979476929} -11/07/2021 01:17:03 - INFO - __main__ - Step 28985: {'lr': 0.0004600982000474009, 'samples': 5565120, 'steps': 28984, 'loss/train': 1.3713990449905396} -11/07/2021 01:17:03 - INFO - __main__ - Step 28986: {'lr': 0.0004600953238624133, 'samples': 5565312, 'steps': 28985, 'loss/train': 1.625765323638916} -11/07/2021 01:17:04 - INFO - __main__ - Step 28987: {'lr': 0.00046009244758275986, 'samples': 5565504, 'steps': 28986, 'loss/train': 1.4445399045944214} -11/07/2021 01:17:04 - INFO - __main__ - Step 28988: {'lr': 0.0004600895712084421, 'samples': 5565696, 'steps': 28987, 'loss/train': 2.432183265686035} -11/07/2021 01:17:05 - INFO - __main__ - Step 28989: {'lr': 0.0004600866947394611, 'samples': 5565888, 'steps': 28988, 'loss/train': 1.3554515838623047} -11/07/2021 01:17:05 - INFO - __main__ - Step 28990: {'lr': 0.0004600838181758184, 'samples': 5566080, 'steps': 28989, 'loss/train': 0.8822077512741089} -11/07/2021 01:17:05 - INFO - __main__ - Step 28991: {'lr': 0.00046008094151751513, 'samples': 5566272, 'steps': 28990, 'loss/train': 0.9555196166038513} -11/07/2021 01:17:07 - INFO - __main__ - Step 28992: {'lr': 0.0004600780647645526, 'samples': 5566464, 'steps': 28991, 'loss/train': 1.7758179903030396} -11/07/2021 01:17:07 - INFO - __main__ - Step 28993: {'lr': 0.0004600751879169321, 'samples': 5566656, 'steps': 28992, 'loss/train': 1.2778682708740234} -11/07/2021 01:17:07 - INFO - __main__ - Step 28994: {'lr': 0.00046007231097465505, 'samples': 5566848, 'steps': 28993, 'loss/train': 1.7804596424102783} -11/07/2021 01:17:08 - INFO - __main__ - Step 28995: {'lr': 0.00046006943393772274, 'samples': 5567040, 'steps': 28994, 'loss/train': 1.4568381309509277} -11/07/2021 01:17:08 - INFO - __main__ - Step 28996: {'lr': 0.00046006655680613616, 'samples': 5567232, 'steps': 28995, 'loss/train': 1.5894285440444946} -11/07/2021 01:17:08 - INFO - __main__ - Step 28997: {'lr': 0.00046006367957989705, 'samples': 5567424, 'steps': 28996, 'loss/train': 1.3978854417800903} -11/07/2021 01:17:09 - INFO - __main__ - Step 28998: {'lr': 0.0004600608022590064, 'samples': 5567616, 'steps': 28997, 'loss/train': 1.5449564456939697} -11/07/2021 01:17:10 - INFO - __main__ - Step 28999: {'lr': 0.0004600579248434655, 'samples': 5567808, 'steps': 28998, 'loss/train': 1.7216355800628662} -11/07/2021 01:17:10 - INFO - __main__ - Step 29000: {'lr': 0.0004600550473332759, 'samples': 5568000, 'steps': 28999, 'loss/train': 1.7568962574005127} -11/07/2021 01:17:10 - INFO - __main__ - Step 29001: {'lr': 0.0004600521697284386, 'samples': 5568192, 'steps': 29000, 'loss/train': 1.4287441968917847} -11/07/2021 01:17:11 - INFO - __main__ - Step 29002: {'lr': 0.0004600492920289551, 'samples': 5568384, 'steps': 29001, 'loss/train': 2.267775535583496} -11/07/2021 01:17:12 - INFO - __main__ - Step 29003: {'lr': 0.00046004641423482665, 'samples': 5568576, 'steps': 29002, 'loss/train': 1.5189000368118286} -11/07/2021 01:17:12 - INFO - __main__ - Step 29004: {'lr': 0.00046004353634605447, 'samples': 5568768, 'steps': 29003, 'loss/train': 1.6470844745635986} -11/07/2021 01:17:12 - INFO - __main__ - Step 29005: {'lr': 0.00046004065836263995, 'samples': 5568960, 'steps': 29004, 'loss/train': 1.8419655561447144} -11/07/2021 01:17:13 - INFO - __main__ - Step 29006: {'lr': 0.00046003778028458434, 'samples': 5569152, 'steps': 29005, 'loss/train': 1.6046967506408691} -11/07/2021 01:17:13 - INFO - __main__ - Step 29007: {'lr': 0.00046003490211188894, 'samples': 5569344, 'steps': 29006, 'loss/train': 1.4088990688323975} -11/07/2021 01:17:14 - INFO - __main__ - Step 29008: {'lr': 0.00046003202384455505, 'samples': 5569536, 'steps': 29007, 'loss/train': 1.0364364385604858} -11/07/2021 01:17:15 - INFO - __main__ - Step 29009: {'lr': 0.000460029145482584, 'samples': 5569728, 'steps': 29008, 'loss/train': 1.6944390535354614} -11/07/2021 01:17:15 - INFO - __main__ - Step 29010: {'lr': 0.00046002626702597706, 'samples': 5569920, 'steps': 29009, 'loss/train': 1.6687331199645996} -11/07/2021 01:17:15 - INFO - __main__ - Step 29011: {'lr': 0.00046002338847473545, 'samples': 5570112, 'steps': 29010, 'loss/train': 1.7623625993728638} -11/07/2021 01:17:16 - INFO - __main__ - Step 29012: {'lr': 0.0004600205098288606, 'samples': 5570304, 'steps': 29011, 'loss/train': 1.7710977792739868} -11/07/2021 01:17:17 - INFO - __main__ - Step 29013: {'lr': 0.00046001763108835384, 'samples': 5570496, 'steps': 29012, 'loss/train': 1.4041374921798706} -11/07/2021 01:17:17 - INFO - __main__ - Step 29014: {'lr': 0.0004600147522532162, 'samples': 5570688, 'steps': 29013, 'loss/train': 1.6077314615249634} -11/07/2021 01:17:17 - INFO - __main__ - Step 29015: {'lr': 0.0004600118733234493, 'samples': 5570880, 'steps': 29014, 'loss/train': 1.8222843408584595} -11/07/2021 01:17:18 - INFO - __main__ - Step 29016: {'lr': 0.0004600089942990542, 'samples': 5571072, 'steps': 29015, 'loss/train': 1.5851895809173584} -11/07/2021 01:17:18 - INFO - __main__ - Step 29017: {'lr': 0.00046000611518003234, 'samples': 5571264, 'steps': 29016, 'loss/train': 1.1701395511627197} -11/07/2021 01:17:19 - INFO - __main__ - Step 29018: {'lr': 0.00046000323596638495, 'samples': 5571456, 'steps': 29017, 'loss/train': 2.0442075729370117} -11/07/2021 01:17:19 - INFO - __main__ - Step 29019: {'lr': 0.0004600003566581133, 'samples': 5571648, 'steps': 29018, 'loss/train': 1.799600601196289} -11/07/2021 01:17:20 - INFO - __main__ - Step 29020: {'lr': 0.00045999747725521876, 'samples': 5571840, 'steps': 29019, 'loss/train': 1.7369462251663208} -11/07/2021 01:17:20 - INFO - __main__ - Step 29021: {'lr': 0.0004599945977577026, 'samples': 5572032, 'steps': 29020, 'loss/train': 1.4682435989379883} -11/07/2021 01:17:21 - INFO - __main__ - Step 29022: {'lr': 0.0004599917181655661, 'samples': 5572224, 'steps': 29021, 'loss/train': 1.2437880039215088} -11/07/2021 01:17:21 - INFO - __main__ - Step 29023: {'lr': 0.00045998883847881057, 'samples': 5572416, 'steps': 29022, 'loss/train': 1.7971512079238892} -11/07/2021 01:17:22 - INFO - __main__ - Step 29024: {'lr': 0.00045998595869743735, 'samples': 5572608, 'steps': 29023, 'loss/train': 1.206907868385315} -11/07/2021 01:17:22 - INFO - __main__ - Step 29025: {'lr': 0.0004599830788214477, 'samples': 5572800, 'steps': 29024, 'loss/train': 0.9922259449958801} -11/07/2021 01:17:23 - INFO - __main__ - Step 29026: {'lr': 0.0004599801988508429, 'samples': 5572992, 'steps': 29025, 'loss/train': 1.8546106815338135} -11/07/2021 01:17:23 - INFO - __main__ - Step 29027: {'lr': 0.00045997731878562423, 'samples': 5573184, 'steps': 29026, 'loss/train': 1.5244265794754028} -11/07/2021 01:17:24 - INFO - __main__ - Step 29028: {'lr': 0.000459974438625793, 'samples': 5573376, 'steps': 29027, 'loss/train': 2.1775026321411133} -11/07/2021 01:17:24 - INFO - __main__ - Step 29029: {'lr': 0.0004599715583713506, 'samples': 5573568, 'steps': 29028, 'loss/train': 1.9676076173782349} -11/07/2021 01:17:25 - INFO - __main__ - Step 29030: {'lr': 0.00045996867802229824, 'samples': 5573760, 'steps': 29029, 'loss/train': 1.1934735774993896} -11/07/2021 01:17:25 - INFO - __main__ - Step 29031: {'lr': 0.0004599657975786372, 'samples': 5573952, 'steps': 29030, 'loss/train': 1.431510329246521} -11/07/2021 01:17:25 - INFO - __main__ - Step 29032: {'lr': 0.00045996291704036884, 'samples': 5574144, 'steps': 29031, 'loss/train': 1.6111900806427002} -11/07/2021 01:17:27 - INFO - __main__ - Step 29033: {'lr': 0.00045996003640749446, 'samples': 5574336, 'steps': 29032, 'loss/train': 1.6642199754714966} -11/07/2021 01:17:27 - INFO - __main__ - Step 29034: {'lr': 0.0004599571556800153, 'samples': 5574528, 'steps': 29033, 'loss/train': 0.855462372303009} -11/07/2021 01:17:27 - INFO - __main__ - Step 29035: {'lr': 0.00045995427485793263, 'samples': 5574720, 'steps': 29034, 'loss/train': 1.7289525270462036} -11/07/2021 01:17:28 - INFO - __main__ - Step 29036: {'lr': 0.00045995139394124784, 'samples': 5574912, 'steps': 29035, 'loss/train': 1.251185417175293} -11/07/2021 01:17:28 - INFO - __main__ - Step 29037: {'lr': 0.0004599485129299622, 'samples': 5575104, 'steps': 29036, 'loss/train': 1.4728577136993408} -11/07/2021 01:17:29 - INFO - __main__ - Step 29038: {'lr': 0.000459945631824077, 'samples': 5575296, 'steps': 29037, 'loss/train': 1.2936763763427734} -11/07/2021 01:17:29 - INFO - __main__ - Step 29039: {'lr': 0.0004599427506235936, 'samples': 5575488, 'steps': 29038, 'loss/train': 0.8940146565437317} -11/07/2021 01:17:30 - INFO - __main__ - Step 29040: {'lr': 0.0004599398693285132, 'samples': 5575680, 'steps': 29039, 'loss/train': 0.8102036118507385} -11/07/2021 01:17:30 - INFO - __main__ - Step 29041: {'lr': 0.0004599369879388371, 'samples': 5575872, 'steps': 29040, 'loss/train': 0.8322492241859436} -11/07/2021 01:17:30 - INFO - __main__ - Step 29042: {'lr': 0.0004599341064545666, 'samples': 5576064, 'steps': 29041, 'loss/train': 1.413248896598816} -11/07/2021 01:17:31 - INFO - __main__ - Step 29043: {'lr': 0.00045993122487570303, 'samples': 5576256, 'steps': 29042, 'loss/train': 1.6776422262191772} -11/07/2021 01:17:32 - INFO - __main__ - Step 29044: {'lr': 0.00045992834320224773, 'samples': 5576448, 'steps': 29043, 'loss/train': 1.8192821741104126} -11/07/2021 01:17:32 - INFO - __main__ - Step 29045: {'lr': 0.000459925461434202, 'samples': 5576640, 'steps': 29044, 'loss/train': 1.0544776916503906} -11/07/2021 01:17:33 - INFO - __main__ - Step 29046: {'lr': 0.00045992257957156704, 'samples': 5576832, 'steps': 29045, 'loss/train': 1.755774736404419} -11/07/2021 01:17:33 - INFO - __main__ - Step 29047: {'lr': 0.00045991969761434426, 'samples': 5577024, 'steps': 29046, 'loss/train': 1.1235843896865845} -11/07/2021 01:17:33 - INFO - __main__ - Step 29048: {'lr': 0.0004599168155625348, 'samples': 5577216, 'steps': 29047, 'loss/train': 1.1373010873794556} -11/07/2021 01:17:34 - INFO - __main__ - Step 29049: {'lr': 0.00045991393341614017, 'samples': 5577408, 'steps': 29048, 'loss/train': 2.1169443130493164} -11/07/2021 01:17:35 - INFO - __main__ - Step 29050: {'lr': 0.0004599110511751615, 'samples': 5577600, 'steps': 29049, 'loss/train': 1.5747123956680298} -11/07/2021 01:17:35 - INFO - __main__ - Step 29051: {'lr': 0.0004599081688396002, 'samples': 5577792, 'steps': 29050, 'loss/train': 1.0253344774246216} -11/07/2021 01:17:35 - INFO - __main__ - Step 29052: {'lr': 0.0004599052864094575, 'samples': 5577984, 'steps': 29051, 'loss/train': 1.7327574491500854} -11/07/2021 01:17:36 - INFO - __main__ - Step 29053: {'lr': 0.0004599024038847347, 'samples': 5578176, 'steps': 29052, 'loss/train': 1.7626140117645264} -11/07/2021 01:17:37 - INFO - __main__ - Step 29054: {'lr': 0.0004598995212654331, 'samples': 5578368, 'steps': 29053, 'loss/train': 1.4643959999084473} -11/07/2021 01:17:37 - INFO - __main__ - Step 29055: {'lr': 0.0004598966385515541, 'samples': 5578560, 'steps': 29054, 'loss/train': 1.8471664190292358} -11/07/2021 01:17:37 - INFO - __main__ - Step 29056: {'lr': 0.00045989375574309875, 'samples': 5578752, 'steps': 29055, 'loss/train': 2.308751106262207} -11/07/2021 01:17:38 - INFO - __main__ - Step 29057: {'lr': 0.00045989087284006863, 'samples': 5578944, 'steps': 29056, 'loss/train': 1.551805019378662} -11/07/2021 01:17:38 - INFO - __main__ - Step 29058: {'lr': 0.00045988798984246496, 'samples': 5579136, 'steps': 29057, 'loss/train': 1.2563121318817139} -11/07/2021 01:17:39 - INFO - __main__ - Step 29059: {'lr': 0.0004598851067502889, 'samples': 5579328, 'steps': 29058, 'loss/train': 1.0828661918640137} -11/07/2021 01:17:39 - INFO - __main__ - Step 29060: {'lr': 0.00045988222356354186, 'samples': 5579520, 'steps': 29059, 'loss/train': 1.0682960748672485} -11/07/2021 01:17:40 - INFO - __main__ - Step 29061: {'lr': 0.00045987934028222515, 'samples': 5579712, 'steps': 29060, 'loss/train': 1.3602944612503052} -11/07/2021 01:17:40 - INFO - __main__ - Step 29062: {'lr': 0.00045987645690634003, 'samples': 5579904, 'steps': 29061, 'loss/train': 1.555138349533081} -11/07/2021 01:17:41 - INFO - __main__ - Step 29063: {'lr': 0.0004598735734358879, 'samples': 5580096, 'steps': 29062, 'loss/train': 1.8989344835281372} -11/07/2021 01:17:41 - INFO - __main__ - Step 29064: {'lr': 0.0004598706898708699, 'samples': 5580288, 'steps': 29063, 'loss/train': 1.1886340379714966} -11/07/2021 01:17:42 - INFO - __main__ - Step 29065: {'lr': 0.00045986780621128743, 'samples': 5580480, 'steps': 29064, 'loss/train': 1.308013677597046} -11/07/2021 01:17:42 - INFO - __main__ - Step 29066: {'lr': 0.00045986492245714175, 'samples': 5580672, 'steps': 29065, 'loss/train': 1.5125694274902344} -11/07/2021 01:17:43 - INFO - __main__ - Step 29067: {'lr': 0.0004598620386084342, 'samples': 5580864, 'steps': 29066, 'loss/train': 1.6981607675552368} -11/07/2021 01:17:43 - INFO - __main__ - Step 29068: {'lr': 0.00045985915466516605, 'samples': 5581056, 'steps': 29067, 'loss/train': 0.809975802898407} -11/07/2021 01:17:43 - INFO - __main__ - Step 29069: {'lr': 0.0004598562706273386, 'samples': 5581248, 'steps': 29068, 'loss/train': 1.6589301824569702} -11/07/2021 01:17:44 - INFO - __main__ - Step 29070: {'lr': 0.0004598533864949531, 'samples': 5581440, 'steps': 29069, 'loss/train': 1.6808274984359741} -11/07/2021 01:17:45 - INFO - __main__ - Step 29071: {'lr': 0.00045985050226801097, 'samples': 5581632, 'steps': 29070, 'loss/train': 1.6667805910110474} -11/07/2021 01:17:45 - INFO - __main__ - Step 29072: {'lr': 0.0004598476179465134, 'samples': 5581824, 'steps': 29071, 'loss/train': 0.8117663264274597} -11/07/2021 01:17:46 - INFO - __main__ - Step 29073: {'lr': 0.00045984473353046174, 'samples': 5582016, 'steps': 29072, 'loss/train': 1.6126930713653564} -11/07/2021 01:17:46 - INFO - __main__ - Step 29074: {'lr': 0.00045984184901985735, 'samples': 5582208, 'steps': 29073, 'loss/train': 1.5174460411071777} -11/07/2021 01:17:47 - INFO - __main__ - Step 29075: {'lr': 0.00045983896441470143, 'samples': 5582400, 'steps': 29074, 'loss/train': 1.7275384664535522} -11/07/2021 01:17:47 - INFO - __main__ - Step 29076: {'lr': 0.00045983607971499527, 'samples': 5582592, 'steps': 29075, 'loss/train': 1.643984317779541} -11/07/2021 01:17:48 - INFO - __main__ - Step 29077: {'lr': 0.0004598331949207402, 'samples': 5582784, 'steps': 29076, 'loss/train': 1.5335731506347656} -11/07/2021 01:17:48 - INFO - __main__ - Step 29078: {'lr': 0.00045983031003193756, 'samples': 5582976, 'steps': 29077, 'loss/train': 1.7958552837371826} -11/07/2021 01:17:48 - INFO - __main__ - Step 29079: {'lr': 0.0004598274250485886, 'samples': 5583168, 'steps': 29078, 'loss/train': 1.3020613193511963} -11/07/2021 01:17:49 - INFO - __main__ - Step 29080: {'lr': 0.00045982453997069463, 'samples': 5583360, 'steps': 29079, 'loss/train': 1.7859662771224976} -11/07/2021 01:17:50 - INFO - __main__ - Step 29081: {'lr': 0.00045982165479825697, 'samples': 5583552, 'steps': 29080, 'loss/train': 1.3405777215957642} -11/07/2021 01:17:50 - INFO - __main__ - Step 29082: {'lr': 0.000459818769531277, 'samples': 5583744, 'steps': 29081, 'loss/train': 1.7002794742584229} -11/07/2021 01:17:50 - INFO - __main__ - Step 29083: {'lr': 0.00045981588416975583, 'samples': 5583936, 'steps': 29082, 'loss/train': 1.580579161643982} -11/07/2021 01:17:51 - INFO - __main__ - Step 29084: {'lr': 0.00045981299871369484, 'samples': 5584128, 'steps': 29083, 'loss/train': 0.7894611358642578} -11/07/2021 01:17:51 - INFO - __main__ - Step 29085: {'lr': 0.0004598101131630954, 'samples': 5584320, 'steps': 29084, 'loss/train': 1.9372822046279907} -11/07/2021 01:17:52 - INFO - __main__ - Step 29086: {'lr': 0.0004598072275179588, 'samples': 5584512, 'steps': 29085, 'loss/train': 1.543207049369812} -11/07/2021 01:17:52 - INFO - __main__ - Step 29087: {'lr': 0.00045980434177828625, 'samples': 5584704, 'steps': 29086, 'loss/train': 1.4375332593917847} -11/07/2021 01:17:53 - INFO - __main__ - Step 29088: {'lr': 0.00045980145594407907, 'samples': 5584896, 'steps': 29087, 'loss/train': 2.165194511413574} -11/07/2021 01:17:53 - INFO - __main__ - Step 29089: {'lr': 0.00045979857001533867, 'samples': 5585088, 'steps': 29088, 'loss/train': 1.6920965909957886} -11/07/2021 01:17:53 - INFO - __main__ - Step 29090: {'lr': 0.0004597956839920662, 'samples': 5585280, 'steps': 29089, 'loss/train': 0.8672987818717957} -11/07/2021 01:17:54 - INFO - __main__ - Step 29091: {'lr': 0.00045979279787426307, 'samples': 5585472, 'steps': 29090, 'loss/train': 1.85176420211792} -11/07/2021 01:17:55 - INFO - __main__ - Step 29092: {'lr': 0.00045978991166193057, 'samples': 5585664, 'steps': 29091, 'loss/train': 1.672255516052246} -11/07/2021 01:17:55 - INFO - __main__ - Step 29093: {'lr': 0.0004597870253550699, 'samples': 5585856, 'steps': 29092, 'loss/train': 1.3873833417892456} -11/07/2021 01:17:55 - INFO - __main__ - Step 29094: {'lr': 0.0004597841389536825, 'samples': 5586048, 'steps': 29093, 'loss/train': 1.0229157209396362} -11/07/2021 01:17:56 - INFO - __main__ - Step 29095: {'lr': 0.00045978125245776957, 'samples': 5586240, 'steps': 29094, 'loss/train': 1.6391146183013916} -11/07/2021 01:17:57 - INFO - __main__ - Step 29096: {'lr': 0.00045977836586733246, 'samples': 5586432, 'steps': 29095, 'loss/train': 1.6857407093048096} -11/07/2021 01:17:57 - INFO - __main__ - Step 29097: {'lr': 0.00045977547918237243, 'samples': 5586624, 'steps': 29096, 'loss/train': 1.3226008415222168} -11/07/2021 01:17:58 - INFO - __main__ - Step 29098: {'lr': 0.0004597725924028908, 'samples': 5586816, 'steps': 29097, 'loss/train': 1.9238613843917847} -11/07/2021 01:17:58 - INFO - __main__ - Step 29099: {'lr': 0.00045976970552888896, 'samples': 5587008, 'steps': 29098, 'loss/train': 1.1772266626358032} -11/07/2021 01:17:58 - INFO - __main__ - Step 29100: {'lr': 0.00045976681856036805, 'samples': 5587200, 'steps': 29099, 'loss/train': 1.3465580940246582} -11/07/2021 01:17:59 - INFO - __main__ - Step 29101: {'lr': 0.00045976393149732943, 'samples': 5587392, 'steps': 29100, 'loss/train': 1.9874027967453003} -11/07/2021 01:18:00 - INFO - __main__ - Step 29102: {'lr': 0.0004597610443397745, 'samples': 5587584, 'steps': 29101, 'loss/train': 1.2521934509277344} -11/07/2021 01:18:00 - INFO - __main__ - Step 29103: {'lr': 0.0004597581570877044, 'samples': 5587776, 'steps': 29102, 'loss/train': 1.4241652488708496} -11/07/2021 01:18:00 - INFO - __main__ - Step 29104: {'lr': 0.00045975526974112056, 'samples': 5587968, 'steps': 29103, 'loss/train': 2.0824873447418213} -11/07/2021 01:18:01 - INFO - __main__ - Step 29105: {'lr': 0.0004597523823000243, 'samples': 5588160, 'steps': 29104, 'loss/train': 1.5525542497634888} -11/07/2021 01:18:01 - INFO - __main__ - Step 29106: {'lr': 0.0004597494947644167, 'samples': 5588352, 'steps': 29105, 'loss/train': 1.7280526161193848} -11/07/2021 01:18:02 - INFO - __main__ - Step 29107: {'lr': 0.0004597466071342993, 'samples': 5588544, 'steps': 29106, 'loss/train': 0.9949897527694702} -11/07/2021 01:18:03 - INFO - __main__ - Step 29108: {'lr': 0.0004597437194096733, 'samples': 5588736, 'steps': 29107, 'loss/train': 1.6158809661865234} -11/07/2021 01:18:03 - INFO - __main__ - Step 29109: {'lr': 0.00045974083159054, 'samples': 5588928, 'steps': 29108, 'loss/train': 1.43483567237854} -11/07/2021 01:18:03 - INFO - __main__ - Step 29110: {'lr': 0.0004597379436769008, 'samples': 5589120, 'steps': 29109, 'loss/train': 1.5917630195617676} -11/07/2021 01:18:04 - INFO - __main__ - Step 29111: {'lr': 0.00045973505566875684, 'samples': 5589312, 'steps': 29110, 'loss/train': 2.0971126556396484} -11/07/2021 01:18:05 - INFO - __main__ - Step 29112: {'lr': 0.00045973216756610945, 'samples': 5589504, 'steps': 29111, 'loss/train': 1.5469576120376587} -11/07/2021 01:18:05 - INFO - __main__ - Step 29113: {'lr': 0.00045972927936896007, 'samples': 5589696, 'steps': 29112, 'loss/train': 1.5790016651153564} -11/07/2021 01:18:05 - INFO - __main__ - Step 29114: {'lr': 0.0004597263910773099, 'samples': 5589888, 'steps': 29113, 'loss/train': 1.2219035625457764} -11/07/2021 01:18:06 - INFO - __main__ - Step 29115: {'lr': 0.0004597235026911603, 'samples': 5590080, 'steps': 29114, 'loss/train': 1.5206252336502075} -11/07/2021 01:18:06 - INFO - __main__ - Step 29116: {'lr': 0.0004597206142105124, 'samples': 5590272, 'steps': 29115, 'loss/train': 1.6539644002914429} -11/07/2021 01:18:07 - INFO - __main__ - Step 29117: {'lr': 0.0004597177256353677, 'samples': 5590464, 'steps': 29116, 'loss/train': 1.8472036123275757} -11/07/2021 01:18:07 - INFO - __main__ - Step 29118: {'lr': 0.0004597148369657275, 'samples': 5590656, 'steps': 29117, 'loss/train': 1.2005980014801025} -11/07/2021 01:18:08 - INFO - __main__ - Step 29119: {'lr': 0.0004597119482015929, 'samples': 5590848, 'steps': 29118, 'loss/train': 1.5274251699447632} -11/07/2021 01:18:08 - INFO - __main__ - Step 29120: {'lr': 0.00045970905934296537, 'samples': 5591040, 'steps': 29119, 'loss/train': 1.3336411714553833} -11/07/2021 01:18:08 - INFO - __main__ - Step 29121: {'lr': 0.0004597061703898462, 'samples': 5591232, 'steps': 29120, 'loss/train': 1.4341195821762085} -11/07/2021 01:18:10 - INFO - __main__ - Step 29122: {'lr': 0.0004597032813422367, 'samples': 5591424, 'steps': 29121, 'loss/train': 1.2545655965805054} -11/07/2021 01:18:10 - INFO - __main__ - Step 29123: {'lr': 0.00045970039220013804, 'samples': 5591616, 'steps': 29122, 'loss/train': 1.6790838241577148} -11/07/2021 01:18:10 - INFO - __main__ - Step 29124: {'lr': 0.00045969750296355173, 'samples': 5591808, 'steps': 29123, 'loss/train': 1.3595398664474487} -11/07/2021 01:18:11 - INFO - __main__ - Step 29125: {'lr': 0.0004596946136324789, 'samples': 5592000, 'steps': 29124, 'loss/train': 1.5711055994033813} -11/07/2021 01:18:11 - INFO - __main__ - Step 29126: {'lr': 0.0004596917242069209, 'samples': 5592192, 'steps': 29125, 'loss/train': 1.3224055767059326} -11/07/2021 01:18:12 - INFO - __main__ - Step 29127: {'lr': 0.00045968883468687906, 'samples': 5592384, 'steps': 29126, 'loss/train': 1.640031099319458} -11/07/2021 01:18:12 - INFO - __main__ - Step 29128: {'lr': 0.00045968594507235467, 'samples': 5592576, 'steps': 29127, 'loss/train': 1.769572138786316} -11/07/2021 01:18:13 - INFO - __main__ - Step 29129: {'lr': 0.00045968305536334906, 'samples': 5592768, 'steps': 29128, 'loss/train': 1.6369398832321167} -11/07/2021 01:18:13 - INFO - __main__ - Step 29130: {'lr': 0.00045968016555986347, 'samples': 5592960, 'steps': 29129, 'loss/train': 1.5712953805923462} -11/07/2021 01:18:13 - INFO - __main__ - Step 29131: {'lr': 0.0004596772756618992, 'samples': 5593152, 'steps': 29130, 'loss/train': 1.609351634979248} -11/07/2021 01:18:14 - INFO - __main__ - Step 29132: {'lr': 0.0004596743856694576, 'samples': 5593344, 'steps': 29131, 'loss/train': 0.9651497602462769} -11/07/2021 01:18:15 - INFO - __main__ - Step 29133: {'lr': 0.00045967149558254, 'samples': 5593536, 'steps': 29132, 'loss/train': 1.5109275579452515} -11/07/2021 01:18:15 - INFO - __main__ - Step 29134: {'lr': 0.0004596686054011476, 'samples': 5593728, 'steps': 29133, 'loss/train': 1.9324721097946167} -11/07/2021 01:18:15 - INFO - __main__ - Step 29135: {'lr': 0.0004596657151252819, 'samples': 5593920, 'steps': 29134, 'loss/train': 1.8306808471679688} -11/07/2021 01:18:16 - INFO - __main__ - Step 29136: {'lr': 0.0004596628247549439, 'samples': 5594112, 'steps': 29135, 'loss/train': 1.4166126251220703} -11/07/2021 01:18:16 - INFO - __main__ - Step 29137: {'lr': 0.00045965993429013507, 'samples': 5594304, 'steps': 29136, 'loss/train': 1.7979376316070557} -11/07/2021 01:18:17 - INFO - __main__ - Step 29138: {'lr': 0.0004596570437308568, 'samples': 5594496, 'steps': 29137, 'loss/train': 1.7460390329360962} -11/07/2021 01:18:18 - INFO - __main__ - Step 29139: {'lr': 0.0004596541530771103, 'samples': 5594688, 'steps': 29138, 'loss/train': 1.9361435174942017} -11/07/2021 01:18:18 - INFO - __main__ - Step 29140: {'lr': 0.0004596512623288969, 'samples': 5594880, 'steps': 29139, 'loss/train': 1.3820250034332275} -11/07/2021 01:18:18 - INFO - __main__ - Step 29141: {'lr': 0.00045964837148621776, 'samples': 5595072, 'steps': 29140, 'loss/train': 1.4857066869735718} -11/07/2021 01:18:19 - INFO - __main__ - Step 29142: {'lr': 0.00045964548054907434, 'samples': 5595264, 'steps': 29141, 'loss/train': 1.4133851528167725} -11/07/2021 01:18:20 - INFO - __main__ - Step 29143: {'lr': 0.00045964258951746795, 'samples': 5595456, 'steps': 29142, 'loss/train': 2.953083038330078} -11/07/2021 01:18:20 - INFO - __main__ - Step 29144: {'lr': 0.0004596396983913998, 'samples': 5595648, 'steps': 29143, 'loss/train': 1.48224675655365} -11/07/2021 01:18:20 - INFO - __main__ - Step 29145: {'lr': 0.00045963680717087124, 'samples': 5595840, 'steps': 29144, 'loss/train': 1.531014323234558} -11/07/2021 01:18:21 - INFO - __main__ - Step 29146: {'lr': 0.0004596339158558835, 'samples': 5596032, 'steps': 29145, 'loss/train': 1.592858910560608} -11/07/2021 01:18:21 - INFO - __main__ - Step 29147: {'lr': 0.0004596310244464381, 'samples': 5596224, 'steps': 29146, 'loss/train': 0.8829703330993652} -11/07/2021 01:18:22 - INFO - __main__ - Step 29148: {'lr': 0.0004596281329425361, 'samples': 5596416, 'steps': 29147, 'loss/train': 1.290963888168335} -11/07/2021 01:18:23 - INFO - __main__ - Step 29149: {'lr': 0.0004596252413441789, 'samples': 5596608, 'steps': 29148, 'loss/train': 0.9775720834732056} -11/07/2021 01:18:23 - INFO - __main__ - Step 29150: {'lr': 0.00045962234965136783, 'samples': 5596800, 'steps': 29149, 'loss/train': 1.0753238201141357} -11/07/2021 01:18:23 - INFO - __main__ - Step 29151: {'lr': 0.0004596194578641042, 'samples': 5596992, 'steps': 29150, 'loss/train': 1.0315475463867188} -11/07/2021 01:18:24 - INFO - __main__ - Step 29152: {'lr': 0.00045961656598238925, 'samples': 5597184, 'steps': 29151, 'loss/train': 1.5725375413894653} -11/07/2021 01:18:24 - INFO - __main__ - Step 29153: {'lr': 0.00045961367400622436, 'samples': 5597376, 'steps': 29152, 'loss/train': 1.589746356010437} -11/07/2021 01:18:25 - INFO - __main__ - Step 29154: {'lr': 0.00045961078193561066, 'samples': 5597568, 'steps': 29153, 'loss/train': 1.2909806966781616} -11/07/2021 01:18:26 - INFO - __main__ - Step 29155: {'lr': 0.00045960788977054967, 'samples': 5597760, 'steps': 29154, 'loss/train': 1.0973178148269653} -11/07/2021 01:18:26 - INFO - __main__ - Step 29156: {'lr': 0.0004596049975110426, 'samples': 5597952, 'steps': 29155, 'loss/train': 1.581822156906128} -11/07/2021 01:18:26 - INFO - __main__ - Step 29157: {'lr': 0.00045960210515709064, 'samples': 5598144, 'steps': 29156, 'loss/train': 1.6044692993164062} -11/07/2021 01:18:27 - INFO - __main__ - Step 29158: {'lr': 0.0004595992127086953, 'samples': 5598336, 'steps': 29157, 'loss/train': 1.4625189304351807} -11/07/2021 01:18:28 - INFO - __main__ - Step 29159: {'lr': 0.00045959632016585774, 'samples': 5598528, 'steps': 29158, 'loss/train': 1.1689990758895874} -11/07/2021 01:18:28 - INFO - __main__ - Step 29160: {'lr': 0.0004595934275285794, 'samples': 5598720, 'steps': 29159, 'loss/train': 1.17728853225708} -11/07/2021 01:18:28 - INFO - __main__ - Step 29161: {'lr': 0.00045959053479686143, 'samples': 5598912, 'steps': 29160, 'loss/train': 1.8568990230560303} -11/07/2021 01:18:29 - INFO - __main__ - Step 29162: {'lr': 0.0004595876419707052, 'samples': 5599104, 'steps': 29161, 'loss/train': 1.5310627222061157} -11/07/2021 01:18:29 - INFO - __main__ - Step 29163: {'lr': 0.00045958474905011205, 'samples': 5599296, 'steps': 29162, 'loss/train': 1.558485984802246} -11/07/2021 01:18:30 - INFO - __main__ - Step 29164: {'lr': 0.0004595818560350832, 'samples': 5599488, 'steps': 29163, 'loss/train': 1.6781156063079834} -11/07/2021 01:18:30 - INFO - __main__ - Step 29165: {'lr': 0.00045957896292562003, 'samples': 5599680, 'steps': 29164, 'loss/train': 1.1443002223968506} -11/07/2021 01:18:31 - INFO - __main__ - Step 29166: {'lr': 0.0004595760697217238, 'samples': 5599872, 'steps': 29165, 'loss/train': 1.450128436088562} -11/07/2021 01:18:31 - INFO - __main__ - Step 29167: {'lr': 0.0004595731764233958, 'samples': 5600064, 'steps': 29166, 'loss/train': 1.574720859527588} -11/07/2021 01:18:31 - INFO - __main__ - Step 29168: {'lr': 0.0004595702830306374, 'samples': 5600256, 'steps': 29167, 'loss/train': 1.3746927976608276} -11/07/2021 01:18:32 - INFO - __main__ - Step 29169: {'lr': 0.0004595673895434498, 'samples': 5600448, 'steps': 29168, 'loss/train': 1.7352036237716675} -11/07/2021 01:18:33 - INFO - __main__ - Step 29170: {'lr': 0.00045956449596183446, 'samples': 5600640, 'steps': 29169, 'loss/train': 1.508607268333435} -11/07/2021 01:18:33 - INFO - __main__ - Step 29171: {'lr': 0.00045956160228579257, 'samples': 5600832, 'steps': 29170, 'loss/train': 1.5599982738494873} -11/07/2021 01:18:33 - INFO - __main__ - Step 29172: {'lr': 0.00045955870851532545, 'samples': 5601024, 'steps': 29171, 'loss/train': 1.8760854005813599} -11/07/2021 01:18:34 - INFO - __main__ - Step 29173: {'lr': 0.0004595558146504344, 'samples': 5601216, 'steps': 29172, 'loss/train': 1.5260308980941772} -11/07/2021 01:18:35 - INFO - __main__ - Step 29174: {'lr': 0.0004595529206911207, 'samples': 5601408, 'steps': 29173, 'loss/train': 2.0422980785369873} -11/07/2021 01:18:35 - INFO - __main__ - Step 29175: {'lr': 0.00045955002663738574, 'samples': 5601600, 'steps': 29174, 'loss/train': 1.5203852653503418} -11/07/2021 01:18:36 - INFO - __main__ - Step 29176: {'lr': 0.0004595471324892307, 'samples': 5601792, 'steps': 29175, 'loss/train': 1.7010663747787476} -11/07/2021 01:18:36 - INFO - __main__ - Step 29177: {'lr': 0.00045954423824665704, 'samples': 5601984, 'steps': 29176, 'loss/train': 1.3339821100234985} -11/07/2021 01:18:36 - INFO - __main__ - Step 29178: {'lr': 0.00045954134390966593, 'samples': 5602176, 'steps': 29177, 'loss/train': 1.674849033355713} -11/07/2021 01:18:37 - INFO - __main__ - Step 29179: {'lr': 0.00045953844947825876, 'samples': 5602368, 'steps': 29178, 'loss/train': 1.3179696798324585} -11/07/2021 01:18:38 - INFO - __main__ - Step 29180: {'lr': 0.0004595355549524368, 'samples': 5602560, 'steps': 29179, 'loss/train': 1.878377079963684} -11/07/2021 01:18:38 - INFO - __main__ - Step 29181: {'lr': 0.0004595326603322013, 'samples': 5602752, 'steps': 29180, 'loss/train': 1.4170050621032715} -11/07/2021 01:18:38 - INFO - __main__ - Step 29182: {'lr': 0.00045952976561755365, 'samples': 5602944, 'steps': 29181, 'loss/train': 1.6162670850753784} -11/07/2021 01:18:39 - INFO - __main__ - Step 29183: {'lr': 0.00045952687080849517, 'samples': 5603136, 'steps': 29182, 'loss/train': 1.6467374563217163} -11/07/2021 01:18:39 - INFO - __main__ - Step 29184: {'lr': 0.000459523975905027, 'samples': 5603328, 'steps': 29183, 'loss/train': 1.4982033967971802} -11/07/2021 01:18:40 - INFO - __main__ - Step 29185: {'lr': 0.0004595210809071506, 'samples': 5603520, 'steps': 29184, 'loss/train': 1.130165934562683} -11/07/2021 01:18:41 - INFO - __main__ - Step 29186: {'lr': 0.0004595181858148673, 'samples': 5603712, 'steps': 29185, 'loss/train': 1.5109838247299194} -11/07/2021 01:18:41 - INFO - __main__ - Step 29187: {'lr': 0.00045951529062817834, 'samples': 5603904, 'steps': 29186, 'loss/train': 1.0921766757965088} -11/07/2021 01:18:41 - INFO - __main__ - Step 29188: {'lr': 0.00045951239534708496, 'samples': 5604096, 'steps': 29187, 'loss/train': 1.9147355556488037} -11/07/2021 01:18:42 - INFO - __main__ - Step 29189: {'lr': 0.0004595094999715885, 'samples': 5604288, 'steps': 29188, 'loss/train': 1.8540912866592407} -11/07/2021 01:18:43 - INFO - __main__ - Step 29190: {'lr': 0.00045950660450169034, 'samples': 5604480, 'steps': 29189, 'loss/train': 1.7768203020095825} -11/07/2021 01:18:43 - INFO - __main__ - Step 29191: {'lr': 0.0004595037089373918, 'samples': 5604672, 'steps': 29190, 'loss/train': 2.194700241088867} -11/07/2021 01:18:43 - INFO - __main__ - Step 29192: {'lr': 0.000459500813278694, 'samples': 5604864, 'steps': 29191, 'loss/train': 0.8722490072250366} -11/07/2021 01:18:44 - INFO - __main__ - Step 29193: {'lr': 0.0004594979175255984, 'samples': 5605056, 'steps': 29192, 'loss/train': 1.1617752313613892} -11/07/2021 01:18:44 - INFO - __main__ - Step 29194: {'lr': 0.0004594950216781063, 'samples': 5605248, 'steps': 29193, 'loss/train': 1.210199236869812} -11/07/2021 01:18:45 - INFO - __main__ - Step 29195: {'lr': 0.000459492125736219, 'samples': 5605440, 'steps': 29194, 'loss/train': 1.6432205438613892} -11/07/2021 01:18:45 - INFO - __main__ - Step 29196: {'lr': 0.00045948922969993777, 'samples': 5605632, 'steps': 29195, 'loss/train': 0.8898891806602478} -11/07/2021 01:18:46 - INFO - __main__ - Step 29197: {'lr': 0.0004594863335692639, 'samples': 5605824, 'steps': 29196, 'loss/train': 1.2649930715560913} -11/07/2021 01:18:46 - INFO - __main__ - Step 29198: {'lr': 0.00045948343734419873, 'samples': 5606016, 'steps': 29197, 'loss/train': 1.6112602949142456} -11/07/2021 01:18:47 - INFO - __main__ - Step 29199: {'lr': 0.00045948054102474357, 'samples': 5606208, 'steps': 29198, 'loss/train': 1.6902039051055908} -11/07/2021 01:18:48 - INFO - __main__ - Step 29200: {'lr': 0.00045947764461089967, 'samples': 5606400, 'steps': 29199, 'loss/train': 1.480944275856018} -11/07/2021 01:18:48 - INFO - __main__ - Step 29201: {'lr': 0.00045947474810266844, 'samples': 5606592, 'steps': 29200, 'loss/train': 0.9518805146217346} -11/07/2021 01:18:48 - INFO - __main__ - Step 29202: {'lr': 0.00045947185150005106, 'samples': 5606784, 'steps': 29201, 'loss/train': 1.26365065574646} -11/07/2021 01:18:49 - INFO - __main__ - Step 29203: {'lr': 0.0004594689548030489, 'samples': 5606976, 'steps': 29202, 'loss/train': 1.0666319131851196} -11/07/2021 01:18:49 - INFO - __main__ - Step 29204: {'lr': 0.0004594660580116633, 'samples': 5607168, 'steps': 29203, 'loss/train': 0.9265233874320984} -11/07/2021 01:18:49 - INFO - __main__ - Step 29205: {'lr': 0.00045946316112589546, 'samples': 5607360, 'steps': 29204, 'loss/train': 1.244853138923645} -11/07/2021 01:18:51 - INFO - __main__ - Step 29206: {'lr': 0.0004594602641457468, 'samples': 5607552, 'steps': 29205, 'loss/train': 1.705867052078247} -11/07/2021 01:18:51 - INFO - __main__ - Step 29207: {'lr': 0.0004594573670712186, 'samples': 5607744, 'steps': 29206, 'loss/train': 1.5587643384933472} -11/07/2021 01:18:51 - INFO - __main__ - Step 29208: {'lr': 0.0004594544699023121, 'samples': 5607936, 'steps': 29207, 'loss/train': 1.1340076923370361} -11/07/2021 01:18:52 - INFO - __main__ - Step 29209: {'lr': 0.0004594515726390287, 'samples': 5608128, 'steps': 29208, 'loss/train': 1.416571855545044} -11/07/2021 01:18:52 - INFO - __main__ - Step 29210: {'lr': 0.00045944867528136956, 'samples': 5608320, 'steps': 29209, 'loss/train': 1.8951489925384521} -11/07/2021 01:18:53 - INFO - __main__ - Step 29211: {'lr': 0.00045944577782933615, 'samples': 5608512, 'steps': 29210, 'loss/train': 1.3687822818756104} -11/07/2021 01:18:53 - INFO - __main__ - Step 29212: {'lr': 0.0004594428802829297, 'samples': 5608704, 'steps': 29211, 'loss/train': 1.7491780519485474} -11/07/2021 01:18:54 - INFO - __main__ - Step 29213: {'lr': 0.00045943998264215153, 'samples': 5608896, 'steps': 29212, 'loss/train': 1.585396409034729} -11/07/2021 01:18:54 - INFO - __main__ - Step 29214: {'lr': 0.0004594370849070029, 'samples': 5609088, 'steps': 29213, 'loss/train': 1.8933584690093994} -11/07/2021 01:18:54 - INFO - __main__ - Step 29215: {'lr': 0.00045943418707748517, 'samples': 5609280, 'steps': 29214, 'loss/train': 1.7437858581542969} -11/07/2021 01:18:56 - INFO - __main__ - Step 29216: {'lr': 0.00045943128915359966, 'samples': 5609472, 'steps': 29215, 'loss/train': 1.339712381362915} -11/07/2021 01:18:56 - INFO - __main__ - Step 29217: {'lr': 0.0004594283911353476, 'samples': 5609664, 'steps': 29216, 'loss/train': 1.498565673828125} -11/07/2021 01:18:56 - INFO - __main__ - Step 29218: {'lr': 0.0004594254930227303, 'samples': 5609856, 'steps': 29217, 'loss/train': 1.5219602584838867} -11/07/2021 01:18:57 - INFO - __main__ - Step 29219: {'lr': 0.0004594225948157492, 'samples': 5610048, 'steps': 29218, 'loss/train': 1.590041160583496} -11/07/2021 01:18:57 - INFO - __main__ - Step 29220: {'lr': 0.0004594196965144054, 'samples': 5610240, 'steps': 29219, 'loss/train': 1.4370402097702026} -11/07/2021 01:18:58 - INFO - __main__ - Step 29221: {'lr': 0.0004594167981187004, 'samples': 5610432, 'steps': 29220, 'loss/train': 1.6703990697860718} -11/07/2021 01:18:58 - INFO - __main__ - Step 29222: {'lr': 0.00045941389962863546, 'samples': 5610624, 'steps': 29221, 'loss/train': 1.4225343465805054} -11/07/2021 01:18:59 - INFO - __main__ - Step 29223: {'lr': 0.00045941100104421176, 'samples': 5610816, 'steps': 29222, 'loss/train': 0.5798635482788086} -11/07/2021 01:18:59 - INFO - __main__ - Step 29224: {'lr': 0.0004594081023654307, 'samples': 5611008, 'steps': 29223, 'loss/train': 1.542803406715393} -11/07/2021 01:18:59 - INFO - __main__ - Step 29225: {'lr': 0.00045940520359229366, 'samples': 5611200, 'steps': 29224, 'loss/train': 2.027190923690796} -11/07/2021 01:19:00 - INFO - __main__ - Step 29226: {'lr': 0.0004594023047248018, 'samples': 5611392, 'steps': 29225, 'loss/train': 1.4777716398239136} -11/07/2021 01:19:01 - INFO - __main__ - Step 29227: {'lr': 0.0004593994057629565, 'samples': 5611584, 'steps': 29226, 'loss/train': 2.0218591690063477} -11/07/2021 01:19:01 - INFO - __main__ - Step 29228: {'lr': 0.000459396506706759, 'samples': 5611776, 'steps': 29227, 'loss/train': 1.5503898859024048} -11/07/2021 01:19:02 - INFO - __main__ - Step 29229: {'lr': 0.00045939360755621074, 'samples': 5611968, 'steps': 29228, 'loss/train': 1.5109821557998657} -11/07/2021 01:19:02 - INFO - __main__ - Step 29230: {'lr': 0.00045939070831131293, 'samples': 5612160, 'steps': 29229, 'loss/train': 1.4671088457107544} -11/07/2021 01:19:02 - INFO - __main__ - Step 29231: {'lr': 0.00045938780897206686, 'samples': 5612352, 'steps': 29230, 'loss/train': 1.9293100833892822} -11/07/2021 01:19:03 - INFO - __main__ - Step 29232: {'lr': 0.000459384909538474, 'samples': 5612544, 'steps': 29231, 'loss/train': 1.5910476446151733} -11/07/2021 01:19:04 - INFO - __main__ - Step 29233: {'lr': 0.00045938201001053546, 'samples': 5612736, 'steps': 29232, 'loss/train': 1.4884496927261353} -11/07/2021 01:19:04 - INFO - __main__ - Step 29234: {'lr': 0.00045937911038825257, 'samples': 5612928, 'steps': 29233, 'loss/train': 2.0655133724212646} -11/07/2021 01:19:04 - INFO - __main__ - Step 29235: {'lr': 0.00045937621067162674, 'samples': 5613120, 'steps': 29234, 'loss/train': 1.460890293121338} -11/07/2021 01:19:05 - INFO - __main__ - Step 29236: {'lr': 0.0004593733108606592, 'samples': 5613312, 'steps': 29235, 'loss/train': 1.3662402629852295} -11/07/2021 01:19:06 - INFO - __main__ - Step 29237: {'lr': 0.00045937041095535125, 'samples': 5613504, 'steps': 29236, 'loss/train': 2.0695712566375732} -11/07/2021 01:19:06 - INFO - __main__ - Step 29238: {'lr': 0.00045936751095570426, 'samples': 5613696, 'steps': 29237, 'loss/train': 0.9652360081672668} -11/07/2021 01:19:06 - INFO - __main__ - Step 29239: {'lr': 0.0004593646108617195, 'samples': 5613888, 'steps': 29238, 'loss/train': 1.482219934463501} -11/07/2021 01:19:07 - INFO - __main__ - Step 29240: {'lr': 0.00045936171067339826, 'samples': 5614080, 'steps': 29239, 'loss/train': 1.7664074897766113} -11/07/2021 01:19:07 - INFO - __main__ - Step 29241: {'lr': 0.0004593588103907419, 'samples': 5614272, 'steps': 29240, 'loss/train': 2.0414185523986816} -11/07/2021 01:19:09 - INFO - __main__ - Step 29242: {'lr': 0.00045935591001375163, 'samples': 5614464, 'steps': 29241, 'loss/train': 1.3956793546676636} -11/07/2021 01:19:09 - INFO - __main__ - Step 29243: {'lr': 0.0004593530095424289, 'samples': 5614656, 'steps': 29242, 'loss/train': 0.9382502436637878} -11/07/2021 01:19:09 - INFO - __main__ - Step 29244: {'lr': 0.0004593501089767749, 'samples': 5614848, 'steps': 29243, 'loss/train': 0.818658173084259} -11/07/2021 01:19:10 - INFO - __main__ - Step 29245: {'lr': 0.00045934720831679093, 'samples': 5615040, 'steps': 29244, 'loss/train': 0.30459633469581604} -11/07/2021 01:19:10 - INFO - __main__ - Step 29246: {'lr': 0.00045934430756247835, 'samples': 5615232, 'steps': 29245, 'loss/train': 0.5222163796424866} -11/07/2021 01:19:10 - INFO - __main__ - Step 29247: {'lr': 0.0004593414067138385, 'samples': 5615424, 'steps': 29246, 'loss/train': 2.345348596572876} -11/07/2021 01:19:12 - INFO - __main__ - Step 29248: {'lr': 0.0004593385057708726, 'samples': 5615616, 'steps': 29247, 'loss/train': 1.585673451423645} -11/07/2021 01:19:12 - INFO - __main__ - Step 29249: {'lr': 0.00045933560473358206, 'samples': 5615808, 'steps': 29248, 'loss/train': 1.8178879022598267} -11/07/2021 01:19:12 - INFO - __main__ - Step 29250: {'lr': 0.00045933270360196804, 'samples': 5616000, 'steps': 29249, 'loss/train': 0.9683892130851746} -11/07/2021 01:19:13 - INFO - __main__ - Step 29251: {'lr': 0.00045932980237603196, 'samples': 5616192, 'steps': 29250, 'loss/train': 1.3415101766586304} -11/07/2021 01:19:13 - INFO - __main__ - Step 29252: {'lr': 0.0004593269010557751, 'samples': 5616384, 'steps': 29251, 'loss/train': 1.6597208976745605} -11/07/2021 01:19:13 - INFO - __main__ - Step 29253: {'lr': 0.00045932399964119884, 'samples': 5616576, 'steps': 29252, 'loss/train': 1.457929253578186} -11/07/2021 01:19:14 - INFO - __main__ - Step 29254: {'lr': 0.00045932109813230437, 'samples': 5616768, 'steps': 29253, 'loss/train': 1.772652506828308} -11/07/2021 01:19:15 - INFO - __main__ - Step 29255: {'lr': 0.00045931819652909303, 'samples': 5616960, 'steps': 29254, 'loss/train': 1.9733912944793701} -11/07/2021 01:19:15 - INFO - __main__ - Step 29256: {'lr': 0.0004593152948315661, 'samples': 5617152, 'steps': 29255, 'loss/train': 1.6951172351837158} -11/07/2021 01:19:15 - INFO - __main__ - Step 29257: {'lr': 0.000459312393039725, 'samples': 5617344, 'steps': 29256, 'loss/train': 1.5540403127670288} -11/07/2021 01:19:16 - INFO - __main__ - Step 29258: {'lr': 0.0004593094911535709, 'samples': 5617536, 'steps': 29257, 'loss/train': 2.5532915592193604} -11/07/2021 01:19:17 - INFO - __main__ - Step 29259: {'lr': 0.00045930658917310525, 'samples': 5617728, 'steps': 29258, 'loss/train': 1.8263392448425293} -11/07/2021 01:19:17 - INFO - __main__ - Step 29260: {'lr': 0.0004593036870983293, 'samples': 5617920, 'steps': 29259, 'loss/train': 1.6476937532424927} -11/07/2021 01:19:18 - INFO - __main__ - Step 29261: {'lr': 0.0004593007849292442, 'samples': 5618112, 'steps': 29260, 'loss/train': 1.4127036333084106} -11/07/2021 01:19:18 - INFO - __main__ - Step 29262: {'lr': 0.0004592978826658515, 'samples': 5618304, 'steps': 29261, 'loss/train': 1.454675555229187} -11/07/2021 01:19:18 - INFO - __main__ - Step 29263: {'lr': 0.0004592949803081524, 'samples': 5618496, 'steps': 29262, 'loss/train': 1.6450902223587036} -11/07/2021 01:19:19 - INFO - __main__ - Step 29264: {'lr': 0.0004592920778561481, 'samples': 5618688, 'steps': 29263, 'loss/train': 1.128226637840271} -11/07/2021 01:19:20 - INFO - __main__ - Step 29265: {'lr': 0.00045928917530984014, 'samples': 5618880, 'steps': 29264, 'loss/train': 1.5634617805480957} -11/07/2021 01:19:20 - INFO - __main__ - Step 29266: {'lr': 0.00045928627266922974, 'samples': 5619072, 'steps': 29265, 'loss/train': 1.4417423009872437} -11/07/2021 01:19:20 - INFO - __main__ - Step 29267: {'lr': 0.0004592833699343181, 'samples': 5619264, 'steps': 29266, 'loss/train': 1.5430980920791626} -11/07/2021 01:19:21 - INFO - __main__ - Step 29268: {'lr': 0.0004592804671051066, 'samples': 5619456, 'steps': 29267, 'loss/train': 1.0452214479446411} -11/07/2021 01:19:22 - INFO - __main__ - Step 29269: {'lr': 0.0004592775641815966, 'samples': 5619648, 'steps': 29268, 'loss/train': 1.6853535175323486} -11/07/2021 01:19:22 - INFO - __main__ - Step 29270: {'lr': 0.0004592746611637893, 'samples': 5619840, 'steps': 29269, 'loss/train': 1.5771098136901855} -11/07/2021 01:19:23 - INFO - __main__ - Step 29271: {'lr': 0.00045927175805168607, 'samples': 5620032, 'steps': 29270, 'loss/train': 1.4390790462493896} -11/07/2021 01:19:23 - INFO - __main__ - Step 29272: {'lr': 0.00045926885484528823, 'samples': 5620224, 'steps': 29271, 'loss/train': 1.9551517963409424} -11/07/2021 01:19:23 - INFO - __main__ - Step 29273: {'lr': 0.0004592659515445971, 'samples': 5620416, 'steps': 29272, 'loss/train': 1.2658156156539917} -11/07/2021 01:19:24 - INFO - __main__ - Step 29274: {'lr': 0.00045926304814961397, 'samples': 5620608, 'steps': 29273, 'loss/train': 1.2549620866775513} -11/07/2021 01:19:25 - INFO - __main__ - Step 29275: {'lr': 0.00045926014466034004, 'samples': 5620800, 'steps': 29274, 'loss/train': 1.371767282485962} -11/07/2021 01:19:25 - INFO - __main__ - Step 29276: {'lr': 0.0004592572410767768, 'samples': 5620992, 'steps': 29275, 'loss/train': 1.3488487005233765} -11/07/2021 01:19:25 - INFO - __main__ - Step 29277: {'lr': 0.0004592543373989255, 'samples': 5621184, 'steps': 29276, 'loss/train': 1.4339321851730347} -11/07/2021 01:19:26 - INFO - __main__ - Step 29278: {'lr': 0.0004592514336267874, 'samples': 5621376, 'steps': 29277, 'loss/train': 1.396821141242981} -11/07/2021 01:19:26 - INFO - __main__ - Step 29279: {'lr': 0.0004592485297603638, 'samples': 5621568, 'steps': 29278, 'loss/train': 1.555566668510437} -11/07/2021 01:19:27 - INFO - __main__ - Step 29280: {'lr': 0.0004592456257996561, 'samples': 5621760, 'steps': 29279, 'loss/train': 1.6349639892578125} -11/07/2021 01:19:28 - INFO - __main__ - Step 29281: {'lr': 0.0004592427217446655, 'samples': 5621952, 'steps': 29280, 'loss/train': 1.6176657676696777} -11/07/2021 01:19:28 - INFO - __main__ - Step 29282: {'lr': 0.00045923981759539336, 'samples': 5622144, 'steps': 29281, 'loss/train': 1.900167465209961} -11/07/2021 01:19:28 - INFO - __main__ - Step 29283: {'lr': 0.000459236913351841, 'samples': 5622336, 'steps': 29282, 'loss/train': 2.1861953735351562} -11/07/2021 01:19:29 - INFO - __main__ - Step 29284: {'lr': 0.0004592340090140097, 'samples': 5622528, 'steps': 29283, 'loss/train': 1.3462752103805542} -11/07/2021 01:19:30 - INFO - __main__ - Step 29285: {'lr': 0.0004592311045819008, 'samples': 5622720, 'steps': 29284, 'loss/train': 1.4200493097305298} -11/07/2021 01:19:31 - INFO - __main__ - Step 29286: {'lr': 0.00045922820005551556, 'samples': 5622912, 'steps': 29285, 'loss/train': 1.8635931015014648} -11/07/2021 01:19:31 - INFO - __main__ - Step 29287: {'lr': 0.0004592252954348554, 'samples': 5623104, 'steps': 29286, 'loss/train': 1.6215516328811646} -11/07/2021 01:19:31 - INFO - __main__ - Step 29288: {'lr': 0.0004592223907199215, 'samples': 5623296, 'steps': 29287, 'loss/train': 1.471245527267456} -11/07/2021 01:19:32 - INFO - __main__ - Step 29289: {'lr': 0.0004592194859107153, 'samples': 5623488, 'steps': 29288, 'loss/train': 0.9702801704406738} -11/07/2021 01:19:33 - INFO - __main__ - Step 29290: {'lr': 0.0004592165810072379, 'samples': 5623680, 'steps': 29289, 'loss/train': 1.7796401977539062} -11/07/2021 01:19:33 - INFO - __main__ - Step 29291: {'lr': 0.00045921367600949077, 'samples': 5623872, 'steps': 29290, 'loss/train': 1.4581795930862427} -11/07/2021 01:19:33 - INFO - __main__ - Step 29292: {'lr': 0.0004592107709174752, 'samples': 5624064, 'steps': 29291, 'loss/train': 1.3144384622573853} -11/07/2021 01:19:34 - INFO - __main__ - Step 29293: {'lr': 0.0004592078657311925, 'samples': 5624256, 'steps': 29292, 'loss/train': 1.609805703163147} -11/07/2021 01:19:34 - INFO - __main__ - Step 29294: {'lr': 0.000459204960450644, 'samples': 5624448, 'steps': 29293, 'loss/train': 1.7830214500427246} -11/07/2021 01:19:35 - INFO - __main__ - Step 29295: {'lr': 0.0004592020550758309, 'samples': 5624640, 'steps': 29294, 'loss/train': 1.4547706842422485} -11/07/2021 01:19:35 - INFO - __main__ - Step 29296: {'lr': 0.0004591991496067546, 'samples': 5624832, 'steps': 29295, 'loss/train': 2.029094696044922} -11/07/2021 01:19:36 - INFO - __main__ - Step 29297: {'lr': 0.00045919624404341643, 'samples': 5625024, 'steps': 29296, 'loss/train': 0.851370632648468} -11/07/2021 01:19:36 - INFO - __main__ - Step 29298: {'lr': 0.00045919333838581757, 'samples': 5625216, 'steps': 29297, 'loss/train': 1.4973098039627075} -11/07/2021 01:19:37 - INFO - __main__ - Step 29299: {'lr': 0.00045919043263395953, 'samples': 5625408, 'steps': 29298, 'loss/train': 1.7972590923309326} -11/07/2021 01:19:37 - INFO - __main__ - Step 29300: {'lr': 0.00045918752678784344, 'samples': 5625600, 'steps': 29299, 'loss/train': 1.6929970979690552} -11/07/2021 01:19:38 - INFO - __main__ - Step 29301: {'lr': 0.0004591846208474707, 'samples': 5625792, 'steps': 29300, 'loss/train': 1.6178035736083984} -11/07/2021 01:19:38 - INFO - __main__ - Step 29302: {'lr': 0.00045918171481284256, 'samples': 5625984, 'steps': 29301, 'loss/train': 1.3055503368377686} -11/07/2021 01:19:39 - INFO - __main__ - Step 29303: {'lr': 0.0004591788086839604, 'samples': 5626176, 'steps': 29302, 'loss/train': 1.4833933115005493} -11/07/2021 01:19:39 - INFO - __main__ - Step 29304: {'lr': 0.0004591759024608255, 'samples': 5626368, 'steps': 29303, 'loss/train': 1.6076900959014893} -11/07/2021 01:19:39 - INFO - __main__ - Step 29305: {'lr': 0.0004591729961434392, 'samples': 5626560, 'steps': 29304, 'loss/train': 1.6441346406936646} -11/07/2021 01:19:40 - INFO - __main__ - Step 29306: {'lr': 0.00045917008973180273, 'samples': 5626752, 'steps': 29305, 'loss/train': 1.4150656461715698} -11/07/2021 01:19:41 - INFO - __main__ - Step 29307: {'lr': 0.0004591671832259174, 'samples': 5626944, 'steps': 29306, 'loss/train': 1.6857331991195679} -11/07/2021 01:19:41 - INFO - __main__ - Step 29308: {'lr': 0.00045916427662578464, 'samples': 5627136, 'steps': 29307, 'loss/train': 1.3254634141921997} -11/07/2021 01:19:41 - INFO - __main__ - Step 29309: {'lr': 0.00045916136993140574, 'samples': 5627328, 'steps': 29308, 'loss/train': 2.0325093269348145} -11/07/2021 01:19:42 - INFO - __main__ - Step 29310: {'lr': 0.00045915846314278187, 'samples': 5627520, 'steps': 29309, 'loss/train': 1.971750020980835} -11/07/2021 01:19:43 - INFO - __main__ - Step 29311: {'lr': 0.0004591555562599144, 'samples': 5627712, 'steps': 29310, 'loss/train': 1.5656483173370361} -11/07/2021 01:19:43 - INFO - __main__ - Step 29312: {'lr': 0.00045915264928280476, 'samples': 5627904, 'steps': 29311, 'loss/train': 1.7062572240829468} -11/07/2021 01:19:44 - INFO - __main__ - Step 29313: {'lr': 0.00045914974221145403, 'samples': 5628096, 'steps': 29312, 'loss/train': 1.6548060178756714} -11/07/2021 01:19:44 - INFO - __main__ - Step 29314: {'lr': 0.00045914683504586374, 'samples': 5628288, 'steps': 29313, 'loss/train': 1.8358749151229858} -11/07/2021 01:19:44 - INFO - __main__ - Step 29315: {'lr': 0.0004591439277860351, 'samples': 5628480, 'steps': 29314, 'loss/train': 1.781209945678711} -11/07/2021 01:19:45 - INFO - __main__ - Step 29316: {'lr': 0.00045914102043196947, 'samples': 5628672, 'steps': 29315, 'loss/train': 0.8205442428588867} -11/07/2021 01:19:46 - INFO - __main__ - Step 29317: {'lr': 0.00045913811298366804, 'samples': 5628864, 'steps': 29316, 'loss/train': 1.5368036031723022} -11/07/2021 01:19:46 - INFO - __main__ - Step 29318: {'lr': 0.0004591352054411323, 'samples': 5629056, 'steps': 29317, 'loss/train': 1.600978970527649} -11/07/2021 01:19:46 - INFO - __main__ - Step 29319: {'lr': 0.00045913229780436337, 'samples': 5629248, 'steps': 29318, 'loss/train': 0.5395891070365906} -11/07/2021 01:19:47 - INFO - __main__ - Step 29320: {'lr': 0.00045912939007336273, 'samples': 5629440, 'steps': 29319, 'loss/train': 1.9441035985946655} -11/07/2021 01:19:47 - INFO - __main__ - Step 29321: {'lr': 0.0004591264822481316, 'samples': 5629632, 'steps': 29320, 'loss/train': 1.6170451641082764} -11/07/2021 01:19:48 - INFO - __main__ - Step 29322: {'lr': 0.00045912357432867124, 'samples': 5629824, 'steps': 29321, 'loss/train': 0.8419768214225769} -11/07/2021 01:19:49 - INFO - __main__ - Step 29323: {'lr': 0.00045912066631498304, 'samples': 5630016, 'steps': 29322, 'loss/train': 1.2050539255142212} -11/07/2021 01:19:49 - INFO - __main__ - Step 29324: {'lr': 0.00045911775820706835, 'samples': 5630208, 'steps': 29323, 'loss/train': 1.4944329261779785} -11/07/2021 01:19:49 - INFO - __main__ - Step 29325: {'lr': 0.0004591148500049284, 'samples': 5630400, 'steps': 29324, 'loss/train': 1.7582799196243286} -11/07/2021 01:19:50 - INFO - __main__ - Step 29326: {'lr': 0.00045911194170856454, 'samples': 5630592, 'steps': 29325, 'loss/train': 2.302961826324463} -11/07/2021 01:19:51 - INFO - __main__ - Step 29327: {'lr': 0.00045910903331797807, 'samples': 5630784, 'steps': 29326, 'loss/train': 1.354048252105713} -11/07/2021 01:19:51 - INFO - __main__ - Step 29328: {'lr': 0.00045910612483317025, 'samples': 5630976, 'steps': 29327, 'loss/train': 1.7314233779907227} -11/07/2021 01:19:51 - INFO - __main__ - Step 29329: {'lr': 0.00045910321625414245, 'samples': 5631168, 'steps': 29328, 'loss/train': 1.6378663778305054} -11/07/2021 01:19:52 - INFO - __main__ - Step 29330: {'lr': 0.00045910030758089597, 'samples': 5631360, 'steps': 29329, 'loss/train': 1.2831581830978394} -11/07/2021 01:19:52 - INFO - __main__ - Step 29331: {'lr': 0.00045909739881343215, 'samples': 5631552, 'steps': 29330, 'loss/train': 1.3802523612976074} -11/07/2021 01:19:53 - INFO - __main__ - Step 29332: {'lr': 0.00045909448995175224, 'samples': 5631744, 'steps': 29331, 'loss/train': 1.3257133960723877} -11/07/2021 01:19:54 - INFO - __main__ - Step 29333: {'lr': 0.00045909158099585756, 'samples': 5631936, 'steps': 29332, 'loss/train': 1.4882980585098267} -11/07/2021 01:19:54 - INFO - __main__ - Step 29334: {'lr': 0.00045908867194574955, 'samples': 5632128, 'steps': 29333, 'loss/train': 1.4736945629119873} -11/07/2021 01:19:54 - INFO - __main__ - Step 29335: {'lr': 0.00045908576280142925, 'samples': 5632320, 'steps': 29334, 'loss/train': 1.6490302085876465} -11/07/2021 01:19:55 - INFO - __main__ - Step 29336: {'lr': 0.00045908285356289824, 'samples': 5632512, 'steps': 29335, 'loss/train': 1.8033547401428223} -11/07/2021 01:19:56 - INFO - __main__ - Step 29337: {'lr': 0.0004590799442301577, 'samples': 5632704, 'steps': 29336, 'loss/train': 1.8330843448638916} -11/07/2021 01:19:56 - INFO - __main__ - Step 29338: {'lr': 0.00045907703480320894, 'samples': 5632896, 'steps': 29337, 'loss/train': 1.6994603872299194} -11/07/2021 01:19:56 - INFO - __main__ - Step 29339: {'lr': 0.0004590741252820533, 'samples': 5633088, 'steps': 29338, 'loss/train': 1.590700387954712} -11/07/2021 01:19:57 - INFO - __main__ - Step 29340: {'lr': 0.00045907121566669216, 'samples': 5633280, 'steps': 29339, 'loss/train': 1.7707066535949707} -11/07/2021 01:19:57 - INFO - __main__ - Step 29341: {'lr': 0.0004590683059571267, 'samples': 5633472, 'steps': 29340, 'loss/train': 1.6956660747528076} -11/07/2021 01:19:58 - INFO - __main__ - Step 29342: {'lr': 0.0004590653961533582, 'samples': 5633664, 'steps': 29341, 'loss/train': 1.455352544784546} -11/07/2021 01:19:58 - INFO - __main__ - Step 29343: {'lr': 0.00045906248625538816, 'samples': 5633856, 'steps': 29342, 'loss/train': 1.6896904706954956} -11/07/2021 01:19:59 - INFO - __main__ - Step 29344: {'lr': 0.00045905957626321775, 'samples': 5634048, 'steps': 29343, 'loss/train': 1.7443041801452637} -11/07/2021 01:19:59 - INFO - __main__ - Step 29345: {'lr': 0.0004590566661768484, 'samples': 5634240, 'steps': 29344, 'loss/train': 1.7320188283920288} -11/07/2021 01:19:59 - INFO - __main__ - Step 29346: {'lr': 0.00045905375599628127, 'samples': 5634432, 'steps': 29345, 'loss/train': 1.636330246925354} -11/07/2021 01:20:01 - INFO - __main__ - Step 29347: {'lr': 0.00045905084572151774, 'samples': 5634624, 'steps': 29346, 'loss/train': 1.3468916416168213} -11/07/2021 01:20:01 - INFO - __main__ - Step 29348: {'lr': 0.0004590479353525591, 'samples': 5634816, 'steps': 29347, 'loss/train': 1.354005217552185} -11/07/2021 01:20:01 - INFO - __main__ - Step 29349: {'lr': 0.00045904502488940677, 'samples': 5635008, 'steps': 29348, 'loss/train': 1.5239914655685425} -11/07/2021 01:20:02 - INFO - __main__ - Step 29350: {'lr': 0.0004590421143320619, 'samples': 5635200, 'steps': 29349, 'loss/train': 0.6602169871330261} -11/07/2021 01:20:02 - INFO - __main__ - Step 29351: {'lr': 0.0004590392036805259, 'samples': 5635392, 'steps': 29350, 'loss/train': 1.3653275966644287} -11/07/2021 01:20:02 - INFO - __main__ - Step 29352: {'lr': 0.0004590362929348001, 'samples': 5635584, 'steps': 29351, 'loss/train': 1.6804929971694946} -11/07/2021 01:20:03 - INFO - __main__ - Step 29353: {'lr': 0.00045903338209488575, 'samples': 5635776, 'steps': 29352, 'loss/train': 1.9492771625518799} -11/07/2021 01:20:04 - INFO - __main__ - Step 29354: {'lr': 0.0004590304711607842, 'samples': 5635968, 'steps': 29353, 'loss/train': 1.5898215770721436} -11/07/2021 01:20:04 - INFO - __main__ - Step 29355: {'lr': 0.0004590275601324967, 'samples': 5636160, 'steps': 29354, 'loss/train': 2.0531885623931885} -11/07/2021 01:20:05 - INFO - __main__ - Step 29356: {'lr': 0.0004590246490100246, 'samples': 5636352, 'steps': 29355, 'loss/train': 0.7158932089805603} -11/07/2021 01:20:05 - INFO - __main__ - Step 29357: {'lr': 0.00045902173779336925, 'samples': 5636544, 'steps': 29356, 'loss/train': 0.8776659965515137} -11/07/2021 01:20:06 - INFO - __main__ - Step 29358: {'lr': 0.0004590188264825319, 'samples': 5636736, 'steps': 29357, 'loss/train': 1.6090434789657593} -11/07/2021 01:20:06 - INFO - __main__ - Step 29359: {'lr': 0.00045901591507751393, 'samples': 5636928, 'steps': 29358, 'loss/train': 1.2736858129501343} -11/07/2021 01:20:07 - INFO - __main__ - Step 29360: {'lr': 0.00045901300357831666, 'samples': 5637120, 'steps': 29359, 'loss/train': 0.9557590484619141} -11/07/2021 01:20:07 - INFO - __main__ - Step 29361: {'lr': 0.00045901009198494124, 'samples': 5637312, 'steps': 29360, 'loss/train': 1.6712108850479126} -11/07/2021 01:20:07 - INFO - __main__ - Step 29362: {'lr': 0.0004590071802973892, 'samples': 5637504, 'steps': 29361, 'loss/train': 1.7179455757141113} -11/07/2021 01:20:08 - INFO - __main__ - Step 29363: {'lr': 0.0004590042685156617, 'samples': 5637696, 'steps': 29362, 'loss/train': 2.0271809101104736} -11/07/2021 01:20:09 - INFO - __main__ - Step 29364: {'lr': 0.0004590013566397601, 'samples': 5637888, 'steps': 29363, 'loss/train': 1.2667248249053955} -11/07/2021 01:20:09 - INFO - __main__ - Step 29365: {'lr': 0.00045899844466968574, 'samples': 5638080, 'steps': 29364, 'loss/train': 1.6341489553451538} -11/07/2021 01:20:09 - INFO - __main__ - Step 29366: {'lr': 0.00045899553260543986, 'samples': 5638272, 'steps': 29365, 'loss/train': 1.4595669507980347} -11/07/2021 01:20:10 - INFO - __main__ - Step 29367: {'lr': 0.0004589926204470238, 'samples': 5638464, 'steps': 29366, 'loss/train': 1.6928445100784302} -11/07/2021 01:20:11 - INFO - __main__ - Step 29368: {'lr': 0.000458989708194439, 'samples': 5638656, 'steps': 29367, 'loss/train': 1.4349541664123535} -11/07/2021 01:20:11 - INFO - __main__ - Step 29369: {'lr': 0.0004589867958476866, 'samples': 5638848, 'steps': 29368, 'loss/train': 1.667285680770874} -11/07/2021 01:20:11 - INFO - __main__ - Step 29370: {'lr': 0.000458983883406768, 'samples': 5639040, 'steps': 29369, 'loss/train': 1.657423734664917} -11/07/2021 01:20:12 - INFO - __main__ - Step 29371: {'lr': 0.0004589809708716844, 'samples': 5639232, 'steps': 29370, 'loss/train': 1.6851989030838013} -11/07/2021 01:20:12 - INFO - __main__ - Step 29372: {'lr': 0.0004589780582424373, 'samples': 5639424, 'steps': 29371, 'loss/train': 1.1141544580459595} -11/07/2021 01:20:13 - INFO - __main__ - Step 29373: {'lr': 0.00045897514551902785, 'samples': 5639616, 'steps': 29372, 'loss/train': 1.305080771446228} -11/07/2021 01:20:14 - INFO - __main__ - Step 29374: {'lr': 0.0004589722327014575, 'samples': 5639808, 'steps': 29373, 'loss/train': 1.4186768531799316} -11/07/2021 01:20:14 - INFO - __main__ - Step 29375: {'lr': 0.0004589693197897274, 'samples': 5640000, 'steps': 29374, 'loss/train': 1.5759755373001099} -11/07/2021 01:20:15 - INFO - __main__ - Step 29376: {'lr': 0.0004589664067838389, 'samples': 5640192, 'steps': 29375, 'loss/train': 1.7532117366790771} -11/07/2021 01:20:15 - INFO - __main__ - Step 29377: {'lr': 0.00045896349368379356, 'samples': 5640384, 'steps': 29376, 'loss/train': 1.5392422676086426} -11/07/2021 01:20:16 - INFO - __main__ - Step 29378: {'lr': 0.00045896058048959233, 'samples': 5640576, 'steps': 29377, 'loss/train': 0.8304669857025146} -11/07/2021 01:20:16 - INFO - __main__ - Step 29379: {'lr': 0.00045895766720123677, 'samples': 5640768, 'steps': 29378, 'loss/train': 1.7094236612319946} -11/07/2021 01:20:17 - INFO - __main__ - Step 29380: {'lr': 0.0004589547538187281, 'samples': 5640960, 'steps': 29379, 'loss/train': 1.5307104587554932} -11/07/2021 01:20:17 - INFO - __main__ - Step 29381: {'lr': 0.0004589518403420676, 'samples': 5641152, 'steps': 29380, 'loss/train': 1.6963664293289185} -11/07/2021 01:20:17 - INFO - __main__ - Step 29382: {'lr': 0.00045894892677125667, 'samples': 5641344, 'steps': 29381, 'loss/train': 1.6436216831207275} -11/07/2021 01:20:18 - INFO - __main__ - Step 29383: {'lr': 0.0004589460131062965, 'samples': 5641536, 'steps': 29382, 'loss/train': 1.7731062173843384} -11/07/2021 01:20:19 - INFO - __main__ - Step 29384: {'lr': 0.00045894309934718853, 'samples': 5641728, 'steps': 29383, 'loss/train': 1.121886134147644} -11/07/2021 01:20:19 - INFO - __main__ - Step 29385: {'lr': 0.00045894018549393404, 'samples': 5641920, 'steps': 29384, 'loss/train': 1.575050711631775} -11/07/2021 01:20:19 - INFO - __main__ - Step 29386: {'lr': 0.0004589372715465343, 'samples': 5642112, 'steps': 29385, 'loss/train': 1.6603325605392456} -11/07/2021 01:20:20 - INFO - __main__ - Step 29387: {'lr': 0.0004589343575049907, 'samples': 5642304, 'steps': 29386, 'loss/train': 1.5052731037139893} -11/07/2021 01:20:21 - INFO - __main__ - Step 29388: {'lr': 0.0004589314433693044, 'samples': 5642496, 'steps': 29387, 'loss/train': 1.483961820602417} -11/07/2021 01:20:21 - INFO - __main__ - Step 29389: {'lr': 0.0004589285291394769, 'samples': 5642688, 'steps': 29388, 'loss/train': 1.6082696914672852} -11/07/2021 01:20:22 - INFO - __main__ - Step 29390: {'lr': 0.00045892561481550943, 'samples': 5642880, 'steps': 29389, 'loss/train': 0.4304291605949402} -11/07/2021 01:20:22 - INFO - __main__ - Step 29391: {'lr': 0.0004589227003974032, 'samples': 5643072, 'steps': 29390, 'loss/train': 2.2525391578674316} -11/07/2021 01:20:22 - INFO - __main__ - Step 29392: {'lr': 0.00045891978588515975, 'samples': 5643264, 'steps': 29391, 'loss/train': 1.5738767385482788} -11/07/2021 01:20:23 - INFO - __main__ - Step 29393: {'lr': 0.0004589168712787802, 'samples': 5643456, 'steps': 29392, 'loss/train': 0.9495261907577515} -11/07/2021 01:20:24 - INFO - __main__ - Step 29394: {'lr': 0.00045891395657826595, 'samples': 5643648, 'steps': 29393, 'loss/train': 1.761458158493042} -11/07/2021 01:20:24 - INFO - __main__ - Step 29395: {'lr': 0.0004589110417836183, 'samples': 5643840, 'steps': 29394, 'loss/train': 1.4254180192947388} -11/07/2021 01:20:24 - INFO - __main__ - Step 29396: {'lr': 0.0004589081268948386, 'samples': 5644032, 'steps': 29395, 'loss/train': 0.7713015675544739} -11/07/2021 01:20:25 - INFO - __main__ - Step 29397: {'lr': 0.00045890521191192807, 'samples': 5644224, 'steps': 29396, 'loss/train': 1.3440076112747192} -11/07/2021 01:20:26 - INFO - __main__ - Step 29398: {'lr': 0.0004589022968348881, 'samples': 5644416, 'steps': 29397, 'loss/train': 1.3670624494552612} -11/07/2021 01:20:26 - INFO - __main__ - Step 29399: {'lr': 0.0004588993816637199, 'samples': 5644608, 'steps': 29398, 'loss/train': 1.271843433380127} -11/07/2021 01:20:26 - INFO - __main__ - Step 29400: {'lr': 0.00045889646639842496, 'samples': 5644800, 'steps': 29399, 'loss/train': 1.7491928339004517} -11/07/2021 01:20:27 - INFO - __main__ - Step 29401: {'lr': 0.0004588935510390045, 'samples': 5644992, 'steps': 29400, 'loss/train': 1.18025541305542} -11/07/2021 01:20:27 - INFO - __main__ - Step 29402: {'lr': 0.00045889063558545974, 'samples': 5645184, 'steps': 29401, 'loss/train': 1.5742133855819702} -11/07/2021 01:20:28 - INFO - __main__ - Step 29403: {'lr': 0.0004588877200377921, 'samples': 5645376, 'steps': 29402, 'loss/train': 1.396234154701233} -11/07/2021 01:20:29 - INFO - __main__ - Step 29404: {'lr': 0.000458884804396003, 'samples': 5645568, 'steps': 29403, 'loss/train': 1.0069153308868408} -11/07/2021 01:20:29 - INFO - __main__ - Step 29405: {'lr': 0.0004588818886600935, 'samples': 5645760, 'steps': 29404, 'loss/train': 1.5877037048339844} -11/07/2021 01:20:29 - INFO - __main__ - Step 29406: {'lr': 0.00045887897283006506, 'samples': 5645952, 'steps': 29405, 'loss/train': 1.3609683513641357} -11/07/2021 01:20:30 - INFO - __main__ - Step 29407: {'lr': 0.00045887605690591904, 'samples': 5646144, 'steps': 29406, 'loss/train': 1.4616987705230713} -11/07/2021 01:20:30 - INFO - __main__ - Step 29408: {'lr': 0.0004588731408876566, 'samples': 5646336, 'steps': 29407, 'loss/train': 1.570209264755249} -11/07/2021 01:20:31 - INFO - __main__ - Step 29409: {'lr': 0.00045887022477527923, 'samples': 5646528, 'steps': 29408, 'loss/train': 1.9197208881378174} -11/07/2021 01:20:32 - INFO - __main__ - Step 29410: {'lr': 0.0004588673085687881, 'samples': 5646720, 'steps': 29409, 'loss/train': 1.5169775485992432} -11/07/2021 01:20:32 - INFO - __main__ - Step 29411: {'lr': 0.00045886439226818464, 'samples': 5646912, 'steps': 29410, 'loss/train': 1.6643450260162354} -11/07/2021 01:20:32 - INFO - __main__ - Step 29412: {'lr': 0.0004588614758734701, 'samples': 5647104, 'steps': 29411, 'loss/train': 1.5076509714126587} -11/07/2021 01:20:33 - INFO - __main__ - Step 29413: {'lr': 0.0004588585593846458, 'samples': 5647296, 'steps': 29412, 'loss/train': 0.8832883834838867} -11/07/2021 01:20:33 - INFO - __main__ - Step 29414: {'lr': 0.000458855642801713, 'samples': 5647488, 'steps': 29413, 'loss/train': 1.680592656135559} -11/07/2021 01:20:34 - INFO - __main__ - Step 29415: {'lr': 0.00045885272612467313, 'samples': 5647680, 'steps': 29414, 'loss/train': 1.6815725564956665} -11/07/2021 01:20:34 - INFO - __main__ - Step 29416: {'lr': 0.0004588498093535274, 'samples': 5647872, 'steps': 29415, 'loss/train': 1.485547423362732} -11/07/2021 01:20:35 - INFO - __main__ - Step 29417: {'lr': 0.0004588468924882772, 'samples': 5648064, 'steps': 29416, 'loss/train': 1.5461474657058716} -11/07/2021 01:20:35 - INFO - __main__ - Step 29418: {'lr': 0.0004588439755289238, 'samples': 5648256, 'steps': 29417, 'loss/train': 1.3511896133422852} -11/07/2021 01:20:35 - INFO - __main__ - Step 29419: {'lr': 0.00045884105847546853, 'samples': 5648448, 'steps': 29418, 'loss/train': 2.118772506713867} -11/07/2021 01:20:37 - INFO - __main__ - Step 29420: {'lr': 0.00045883814132791274, 'samples': 5648640, 'steps': 29419, 'loss/train': 1.338430643081665} -11/07/2021 01:20:37 - INFO - __main__ - Step 29421: {'lr': 0.0004588352240862577, 'samples': 5648832, 'steps': 29420, 'loss/train': 1.2146153450012207} -11/07/2021 01:20:37 - INFO - __main__ - Step 29422: {'lr': 0.0004588323067505047, 'samples': 5649024, 'steps': 29421, 'loss/train': 1.3759852647781372} -11/07/2021 01:20:38 - INFO - __main__ - Step 29423: {'lr': 0.00045882938932065504, 'samples': 5649216, 'steps': 29422, 'loss/train': 1.1928725242614746} -11/07/2021 01:20:38 - INFO - __main__ - Step 29424: {'lr': 0.0004588264717967101, 'samples': 5649408, 'steps': 29423, 'loss/train': 1.5485185384750366} -11/07/2021 01:20:39 - INFO - __main__ - Step 29425: {'lr': 0.00045882355417867124, 'samples': 5649600, 'steps': 29424, 'loss/train': 1.6709578037261963} -11/07/2021 01:20:39 - INFO - __main__ - Step 29426: {'lr': 0.00045882063646653966, 'samples': 5649792, 'steps': 29425, 'loss/train': 1.5203857421875} -11/07/2021 01:20:40 - INFO - __main__ - Step 29427: {'lr': 0.00045881771866031673, 'samples': 5649984, 'steps': 29426, 'loss/train': 1.921944260597229} -11/07/2021 01:20:40 - INFO - __main__ - Step 29428: {'lr': 0.00045881480076000376, 'samples': 5650176, 'steps': 29427, 'loss/train': 1.3370532989501953} -11/07/2021 01:20:40 - INFO - __main__ - Step 29429: {'lr': 0.00045881188276560204, 'samples': 5650368, 'steps': 29428, 'loss/train': 2.0083775520324707} -11/07/2021 01:20:42 - INFO - __main__ - Step 29430: {'lr': 0.000458808964677113, 'samples': 5650560, 'steps': 29429, 'loss/train': 1.303795576095581} -11/07/2021 01:20:42 - INFO - __main__ - Step 29431: {'lr': 0.00045880604649453774, 'samples': 5650752, 'steps': 29430, 'loss/train': 1.9484096765518188} -11/07/2021 01:20:42 - INFO - __main__ - Step 29432: {'lr': 0.00045880312821787775, 'samples': 5650944, 'steps': 29431, 'loss/train': 1.3311874866485596} -11/07/2021 01:20:43 - INFO - __main__ - Step 29433: {'lr': 0.00045880020984713434, 'samples': 5651136, 'steps': 29432, 'loss/train': 1.860125184059143} -11/07/2021 01:20:43 - INFO - __main__ - Step 29434: {'lr': 0.0004587972913823087, 'samples': 5651328, 'steps': 29433, 'loss/train': 1.5912048816680908} -11/07/2021 01:20:43 - INFO - __main__ - Step 29435: {'lr': 0.00045879437282340225, 'samples': 5651520, 'steps': 29434, 'loss/train': 1.089166522026062} -11/07/2021 01:20:44 - INFO - __main__ - Step 29436: {'lr': 0.00045879145417041623, 'samples': 5651712, 'steps': 29435, 'loss/train': 1.9212347269058228} -11/07/2021 01:20:45 - INFO - __main__ - Step 29437: {'lr': 0.0004587885354233521, 'samples': 5651904, 'steps': 29436, 'loss/train': 1.658786416053772} -11/07/2021 01:20:45 - INFO - __main__ - Step 29438: {'lr': 0.0004587856165822111, 'samples': 5652096, 'steps': 29437, 'loss/train': 1.6033729314804077} -11/07/2021 01:20:45 - INFO - __main__ - Step 29439: {'lr': 0.0004587826976469944, 'samples': 5652288, 'steps': 29438, 'loss/train': 1.6085463762283325} -11/07/2021 01:20:46 - INFO - __main__ - Step 29440: {'lr': 0.0004587797786177035, 'samples': 5652480, 'steps': 29439, 'loss/train': 2.093695640563965} -11/07/2021 01:20:46 - INFO - __main__ - Step 29441: {'lr': 0.0004587768594943396, 'samples': 5652672, 'steps': 29440, 'loss/train': 1.3613848686218262} -11/07/2021 01:20:47 - INFO - __main__ - Step 29442: {'lr': 0.00045877394027690413, 'samples': 5652864, 'steps': 29441, 'loss/train': 1.7916233539581299} -11/07/2021 01:20:47 - INFO - __main__ - Step 29443: {'lr': 0.0004587710209653984, 'samples': 5653056, 'steps': 29442, 'loss/train': 1.3992745876312256} -11/07/2021 01:20:48 - INFO - __main__ - Step 29444: {'lr': 0.0004587681015598235, 'samples': 5653248, 'steps': 29443, 'loss/train': 1.518426775932312} -11/07/2021 01:20:48 - INFO - __main__ - Step 29445: {'lr': 0.00045876518206018103, 'samples': 5653440, 'steps': 29444, 'loss/train': 1.5235440731048584} -11/07/2021 01:20:48 - INFO - __main__ - Step 29446: {'lr': 0.00045876226246647226, 'samples': 5653632, 'steps': 29445, 'loss/train': 1.6063261032104492} -11/07/2021 01:20:50 - INFO - __main__ - Step 29447: {'lr': 0.0004587593427786983, 'samples': 5653824, 'steps': 29446, 'loss/train': 1.4011942148208618} -11/07/2021 01:20:50 - INFO - __main__ - Step 29448: {'lr': 0.0004587564229968606, 'samples': 5654016, 'steps': 29447, 'loss/train': 1.538805603981018} -11/07/2021 01:20:50 - INFO - __main__ - Step 29449: {'lr': 0.00045875350312096053, 'samples': 5654208, 'steps': 29448, 'loss/train': 1.532183289527893} -11/07/2021 01:20:51 - INFO - __main__ - Step 29450: {'lr': 0.0004587505831509994, 'samples': 5654400, 'steps': 29449, 'loss/train': 1.8191397190093994} -11/07/2021 01:20:51 - INFO - __main__ - Step 29451: {'lr': 0.0004587476630869784, 'samples': 5654592, 'steps': 29450, 'loss/train': 1.310355305671692} -11/07/2021 01:20:52 - INFO - __main__ - Step 29452: {'lr': 0.000458744742928899, 'samples': 5654784, 'steps': 29451, 'loss/train': 0.8070980906486511} -11/07/2021 01:20:52 - INFO - __main__ - Step 29453: {'lr': 0.00045874182267676236, 'samples': 5654976, 'steps': 29452, 'loss/train': 2.1116678714752197} -11/07/2021 01:20:53 - INFO - __main__ - Step 29454: {'lr': 0.0004587389023305699, 'samples': 5655168, 'steps': 29453, 'loss/train': 1.662084698677063} -11/07/2021 01:20:53 - INFO - __main__ - Step 29455: {'lr': 0.00045873598189032295, 'samples': 5655360, 'steps': 29454, 'loss/train': 0.8377273082733154} -11/07/2021 01:20:53 - INFO - __main__ - Step 29456: {'lr': 0.00045873306135602276, 'samples': 5655552, 'steps': 29455, 'loss/train': 1.3423774242401123} -11/07/2021 01:20:55 - INFO - __main__ - Step 29457: {'lr': 0.00045873014072767064, 'samples': 5655744, 'steps': 29456, 'loss/train': 1.6420247554779053} -11/07/2021 01:20:55 - INFO - __main__ - Step 29458: {'lr': 0.000458727220005268, 'samples': 5655936, 'steps': 29457, 'loss/train': 1.5810794830322266} -11/07/2021 01:20:55 - INFO - __main__ - Step 29459: {'lr': 0.00045872429918881606, 'samples': 5656128, 'steps': 29458, 'loss/train': 1.1572012901306152} -11/07/2021 01:20:56 - INFO - __main__ - Step 29460: {'lr': 0.00045872137827831616, 'samples': 5656320, 'steps': 29459, 'loss/train': 0.9177290797233582} -11/07/2021 01:20:56 - INFO - __main__ - Step 29461: {'lr': 0.00045871845727376973, 'samples': 5656512, 'steps': 29460, 'loss/train': 1.4853347539901733} -11/07/2021 01:20:57 - INFO - __main__ - Step 29462: {'lr': 0.0004587155361751778, 'samples': 5656704, 'steps': 29461, 'loss/train': 1.3394935131072998} -11/07/2021 01:20:57 - INFO - __main__ - Step 29463: {'lr': 0.000458712614982542, 'samples': 5656896, 'steps': 29462, 'loss/train': 1.614371418952942} -11/07/2021 01:20:58 - INFO - __main__ - Step 29464: {'lr': 0.00045870969369586346, 'samples': 5657088, 'steps': 29463, 'loss/train': 1.7958014011383057} -11/07/2021 01:20:58 - INFO - __main__ - Step 29465: {'lr': 0.00045870677231514356, 'samples': 5657280, 'steps': 29464, 'loss/train': 1.4317177534103394} -11/07/2021 01:20:59 - INFO - __main__ - Step 29466: {'lr': 0.0004587038508403837, 'samples': 5657472, 'steps': 29465, 'loss/train': 1.5790847539901733} -11/07/2021 01:21:00 - INFO - __main__ - Step 29467: {'lr': 0.000458700929271585, 'samples': 5657664, 'steps': 29466, 'loss/train': 1.7337079048156738} -11/07/2021 01:21:00 - INFO - __main__ - Step 29468: {'lr': 0.0004586980076087489, 'samples': 5657856, 'steps': 29467, 'loss/train': 1.7457712888717651} -11/07/2021 01:21:00 - INFO - __main__ - Step 29469: {'lr': 0.0004586950858518767, 'samples': 5658048, 'steps': 29468, 'loss/train': 1.7356659173965454} -11/07/2021 01:21:01 - INFO - __main__ - Step 29470: {'lr': 0.0004586921640009697, 'samples': 5658240, 'steps': 29469, 'loss/train': 1.5608547925949097} -11/07/2021 01:21:01 - INFO - __main__ - Step 29471: {'lr': 0.0004586892420560294, 'samples': 5658432, 'steps': 29470, 'loss/train': 1.1268757581710815} -11/07/2021 01:21:02 - INFO - __main__ - Step 29472: {'lr': 0.0004586863200170567, 'samples': 5658624, 'steps': 29471, 'loss/train': 0.8702432513237} -11/07/2021 01:21:03 - INFO - __main__ - Step 29473: {'lr': 0.00045868339788405333, 'samples': 5658816, 'steps': 29472, 'loss/train': 1.633955955505371} -11/07/2021 01:21:03 - INFO - __main__ - Step 29474: {'lr': 0.0004586804756570204, 'samples': 5659008, 'steps': 29473, 'loss/train': 1.199129343032837} -11/07/2021 01:21:03 - INFO - __main__ - Step 29475: {'lr': 0.0004586775533359592, 'samples': 5659200, 'steps': 29474, 'loss/train': 2.014317750930786} -11/07/2021 01:21:04 - INFO - __main__ - Step 29476: {'lr': 0.00045867463092087116, 'samples': 5659392, 'steps': 29475, 'loss/train': 1.0253338813781738} -11/07/2021 01:21:05 - INFO - __main__ - Step 29477: {'lr': 0.00045867170841175755, 'samples': 5659584, 'steps': 29476, 'loss/train': 0.2625601887702942} -11/07/2021 01:21:05 - INFO - __main__ - Step 29478: {'lr': 0.0004586687858086197, 'samples': 5659776, 'steps': 29477, 'loss/train': 1.3529233932495117} -11/07/2021 01:21:05 - INFO - __main__ - Step 29479: {'lr': 0.0004586658631114589, 'samples': 5659968, 'steps': 29478, 'loss/train': 1.5325437784194946} -11/07/2021 01:21:06 - INFO - __main__ - Step 29480: {'lr': 0.0004586629403202765, 'samples': 5660160, 'steps': 29479, 'loss/train': 1.3387819528579712} -11/07/2021 01:21:06 - INFO - __main__ - Step 29481: {'lr': 0.0004586600174350738, 'samples': 5660352, 'steps': 29480, 'loss/train': 2.0539634227752686} -11/07/2021 01:21:07 - INFO - __main__ - Step 29482: {'lr': 0.0004586570944558521, 'samples': 5660544, 'steps': 29481, 'loss/train': 0.8757557272911072} -11/07/2021 01:21:08 - INFO - __main__ - Step 29483: {'lr': 0.00045865417138261276, 'samples': 5660736, 'steps': 29482, 'loss/train': 1.633339762687683} -11/07/2021 01:21:08 - INFO - __main__ - Step 29484: {'lr': 0.00045865124821535704, 'samples': 5660928, 'steps': 29483, 'loss/train': 1.6316306591033936} -11/07/2021 01:21:08 - INFO - __main__ - Step 29485: {'lr': 0.00045864832495408624, 'samples': 5661120, 'steps': 29484, 'loss/train': 2.1339690685272217} -11/07/2021 01:21:09 - INFO - __main__ - Step 29486: {'lr': 0.0004586454015988019, 'samples': 5661312, 'steps': 29485, 'loss/train': 1.2461416721343994} -11/07/2021 01:21:09 - INFO - __main__ - Step 29487: {'lr': 0.000458642478149505, 'samples': 5661504, 'steps': 29486, 'loss/train': 1.9071553945541382} -11/07/2021 01:21:11 - INFO - __main__ - Step 29488: {'lr': 0.00045863955460619707, 'samples': 5661696, 'steps': 29487, 'loss/train': 1.6638797521591187} -11/07/2021 01:21:12 - INFO - __main__ - Step 29489: {'lr': 0.0004586366309688793, 'samples': 5661888, 'steps': 29488, 'loss/train': 0.8595585823059082} -11/07/2021 01:21:12 - INFO - __main__ - Step 29490: {'lr': 0.00045863370723755315, 'samples': 5662080, 'steps': 29489, 'loss/train': 1.6457905769348145} -11/07/2021 01:21:12 - INFO - __main__ - Step 29491: {'lr': 0.00045863078341221993, 'samples': 5662272, 'steps': 29490, 'loss/train': 1.3534252643585205} -11/07/2021 01:21:13 - INFO - __main__ - Step 29492: {'lr': 0.0004586278594928808, 'samples': 5662464, 'steps': 29491, 'loss/train': 1.8189722299575806} -11/07/2021 01:21:13 - INFO - __main__ - Step 29493: {'lr': 0.0004586249354795372, 'samples': 5662656, 'steps': 29492, 'loss/train': 1.8026632070541382} -11/07/2021 01:21:13 - INFO - __main__ - Step 29494: {'lr': 0.0004586220113721905, 'samples': 5662848, 'steps': 29493, 'loss/train': 1.0064070224761963} -11/07/2021 01:21:14 - INFO - __main__ - Step 29495: {'lr': 0.0004586190871708419, 'samples': 5663040, 'steps': 29494, 'loss/train': 1.061107873916626} -11/07/2021 01:21:15 - INFO - __main__ - Step 29496: {'lr': 0.0004586161628754927, 'samples': 5663232, 'steps': 29495, 'loss/train': 1.4288783073425293} -11/07/2021 01:21:15 - INFO - __main__ - Step 29497: {'lr': 0.0004586132384861443, 'samples': 5663424, 'steps': 29496, 'loss/train': 0.9088807106018066} -11/07/2021 01:21:16 - INFO - __main__ - Step 29498: {'lr': 0.000458610314002798, 'samples': 5663616, 'steps': 29497, 'loss/train': 1.5161337852478027} -11/07/2021 01:21:16 - INFO - __main__ - Step 29499: {'lr': 0.0004586073894254551, 'samples': 5663808, 'steps': 29498, 'loss/train': 2.5317184925079346} -11/07/2021 01:21:16 - INFO - __main__ - Step 29500: {'lr': 0.000458604464754117, 'samples': 5664000, 'steps': 29499, 'loss/train': 1.939312219619751} -11/07/2021 01:21:18 - INFO - __main__ - Step 29501: {'lr': 0.0004586015399887849, 'samples': 5664192, 'steps': 29500, 'loss/train': 1.8874361515045166} -11/07/2021 01:21:18 - INFO - __main__ - Step 29502: {'lr': 0.0004585986151294602, 'samples': 5664384, 'steps': 29501, 'loss/train': 1.2751479148864746} -11/07/2021 01:21:18 - INFO - __main__ - Step 29503: {'lr': 0.0004585956901761441, 'samples': 5664576, 'steps': 29502, 'loss/train': 1.4074900150299072} -11/07/2021 01:21:19 - INFO - __main__ - Step 29504: {'lr': 0.00045859276512883807, 'samples': 5664768, 'steps': 29503, 'loss/train': 1.9444576501846313} -11/07/2021 01:21:19 - INFO - __main__ - Step 29505: {'lr': 0.00045858983998754336, 'samples': 5664960, 'steps': 29504, 'loss/train': 1.9173896312713623} -11/07/2021 01:21:20 - INFO - __main__ - Step 29506: {'lr': 0.0004585869147522612, 'samples': 5665152, 'steps': 29505, 'loss/train': 1.8542300462722778} -11/07/2021 01:21:20 - INFO - __main__ - Step 29507: {'lr': 0.00045858398942299306, 'samples': 5665344, 'steps': 29506, 'loss/train': 1.4023475646972656} -11/07/2021 01:21:21 - INFO - __main__ - Step 29508: {'lr': 0.0004585810639997402, 'samples': 5665536, 'steps': 29507, 'loss/train': 1.542800784111023} -11/07/2021 01:21:21 - INFO - __main__ - Step 29509: {'lr': 0.0004585781384825039, 'samples': 5665728, 'steps': 29508, 'loss/train': 2.0159964561462402} -11/07/2021 01:21:21 - INFO - __main__ - Step 29510: {'lr': 0.00045857521287128556, 'samples': 5665920, 'steps': 29509, 'loss/train': 1.922012448310852} -11/07/2021 01:21:22 - INFO - __main__ - Step 29511: {'lr': 0.0004585722871660864, 'samples': 5666112, 'steps': 29510, 'loss/train': 1.5604584217071533} -11/07/2021 01:21:23 - INFO - __main__ - Step 29512: {'lr': 0.0004585693613669078, 'samples': 5666304, 'steps': 29511, 'loss/train': 2.035801887512207} -11/07/2021 01:21:23 - INFO - __main__ - Step 29513: {'lr': 0.0004585664354737511, 'samples': 5666496, 'steps': 29512, 'loss/train': 1.9828746318817139} -11/07/2021 01:21:23 - INFO - __main__ - Step 29514: {'lr': 0.0004585635094866175, 'samples': 5666688, 'steps': 29513, 'loss/train': 1.7652790546417236} -11/07/2021 01:21:24 - INFO - __main__ - Step 29515: {'lr': 0.0004585605834055084, 'samples': 5666880, 'steps': 29514, 'loss/train': 2.0004334449768066} -11/07/2021 01:21:24 - INFO - __main__ - Step 29516: {'lr': 0.00045855765723042526, 'samples': 5667072, 'steps': 29515, 'loss/train': 1.1060426235198975} -11/07/2021 01:21:26 - INFO - __main__ - Step 29517: {'lr': 0.00045855473096136914, 'samples': 5667264, 'steps': 29516, 'loss/train': 1.4863965511322021} -11/07/2021 01:21:26 - INFO - __main__ - Step 29518: {'lr': 0.00045855180459834153, 'samples': 5667456, 'steps': 29517, 'loss/train': 1.6433055400848389} -11/07/2021 01:21:26 - INFO - __main__ - Step 29519: {'lr': 0.0004585488781413437, 'samples': 5667648, 'steps': 29518, 'loss/train': 1.927058219909668} -11/07/2021 01:21:27 - INFO - __main__ - Step 29520: {'lr': 0.00045854595159037695, 'samples': 5667840, 'steps': 29519, 'loss/train': 1.3411040306091309} -11/07/2021 01:21:27 - INFO - __main__ - Step 29521: {'lr': 0.0004585430249454425, 'samples': 5668032, 'steps': 29520, 'loss/train': 0.4509488046169281} -11/07/2021 01:21:28 - INFO - __main__ - Step 29522: {'lr': 0.000458540098206542, 'samples': 5668224, 'steps': 29521, 'loss/train': 1.7586899995803833} -11/07/2021 01:21:28 - INFO - __main__ - Step 29523: {'lr': 0.00045853717137367634, 'samples': 5668416, 'steps': 29522, 'loss/train': 1.6397231817245483} -11/07/2021 01:21:29 - INFO - __main__ - Step 29524: {'lr': 0.0004585342444468471, 'samples': 5668608, 'steps': 29523, 'loss/train': 1.4895061254501343} -11/07/2021 01:21:29 - INFO - __main__ - Step 29525: {'lr': 0.00045853131742605563, 'samples': 5668800, 'steps': 29524, 'loss/train': 1.8235915899276733} -11/07/2021 01:21:29 - INFO - __main__ - Step 29526: {'lr': 0.0004585283903113031, 'samples': 5668992, 'steps': 29525, 'loss/train': 1.258795142173767} -11/07/2021 01:21:30 - INFO - __main__ - Step 29527: {'lr': 0.00045852546310259093, 'samples': 5669184, 'steps': 29526, 'loss/train': 1.4527385234832764} -11/07/2021 01:21:31 - INFO - __main__ - Step 29528: {'lr': 0.00045852253579992043, 'samples': 5669376, 'steps': 29527, 'loss/train': 1.888344168663025} -11/07/2021 01:21:31 - INFO - __main__ - Step 29529: {'lr': 0.0004585196084032928, 'samples': 5669568, 'steps': 29528, 'loss/train': 1.6944209337234497} -11/07/2021 01:21:32 - INFO - __main__ - Step 29530: {'lr': 0.0004585166809127095, 'samples': 5669760, 'steps': 29529, 'loss/train': 1.6376452445983887} -11/07/2021 01:21:32 - INFO - __main__ - Step 29531: {'lr': 0.0004585137533281718, 'samples': 5669952, 'steps': 29530, 'loss/train': 1.8920257091522217} -11/07/2021 01:21:33 - INFO - __main__ - Step 29532: {'lr': 0.00045851082564968103, 'samples': 5670144, 'steps': 29531, 'loss/train': 1.875730276107788} -11/07/2021 01:21:33 - INFO - __main__ - Step 29533: {'lr': 0.0004585078978772385, 'samples': 5670336, 'steps': 29532, 'loss/train': 1.7644169330596924} -11/07/2021 01:21:34 - INFO - __main__ - Step 29534: {'lr': 0.0004585049700108455, 'samples': 5670528, 'steps': 29533, 'loss/train': 1.3630928993225098} -11/07/2021 01:21:34 - INFO - __main__ - Step 29535: {'lr': 0.00045850204205050344, 'samples': 5670720, 'steps': 29534, 'loss/train': 1.7111839056015015} -11/07/2021 01:21:34 - INFO - __main__ - Step 29536: {'lr': 0.0004584991139962135, 'samples': 5670912, 'steps': 29535, 'loss/train': 1.4443424940109253} -11/07/2021 01:21:35 - INFO - __main__ - Step 29537: {'lr': 0.00045849618584797717, 'samples': 5671104, 'steps': 29536, 'loss/train': 1.442642092704773} -11/07/2021 01:21:36 - INFO - __main__ - Step 29538: {'lr': 0.0004584932576057956, 'samples': 5671296, 'steps': 29537, 'loss/train': 1.4730128049850464} -11/07/2021 01:21:36 - INFO - __main__ - Step 29539: {'lr': 0.00045849032926967016, 'samples': 5671488, 'steps': 29538, 'loss/train': 1.708472728729248} -11/07/2021 01:21:36 - INFO - __main__ - Step 29540: {'lr': 0.0004584874008396023, 'samples': 5671680, 'steps': 29539, 'loss/train': 1.5613409280776978} -11/07/2021 01:21:37 - INFO - __main__ - Step 29541: {'lr': 0.00045848447231559315, 'samples': 5671872, 'steps': 29540, 'loss/train': 1.6380871534347534} -11/07/2021 01:21:38 - INFO - __main__ - Step 29542: {'lr': 0.00045848154369764415, 'samples': 5672064, 'steps': 29541, 'loss/train': 1.8458172082901} -11/07/2021 01:21:38 - INFO - __main__ - Step 29543: {'lr': 0.0004584786149857566, 'samples': 5672256, 'steps': 29542, 'loss/train': 1.5878684520721436} -11/07/2021 01:21:39 - INFO - __main__ - Step 29544: {'lr': 0.00045847568617993174, 'samples': 5672448, 'steps': 29543, 'loss/train': 1.3373163938522339} -11/07/2021 01:21:39 - INFO - __main__ - Step 29545: {'lr': 0.000458472757280171, 'samples': 5672640, 'steps': 29544, 'loss/train': 1.7970337867736816} -11/07/2021 01:21:39 - INFO - __main__ - Step 29546: {'lr': 0.0004584698282864757, 'samples': 5672832, 'steps': 29545, 'loss/train': 1.8570822477340698} -11/07/2021 01:21:40 - INFO - __main__ - Step 29547: {'lr': 0.000458466899198847, 'samples': 5673024, 'steps': 29546, 'loss/train': 1.45450758934021} -11/07/2021 01:21:41 - INFO - __main__ - Step 29548: {'lr': 0.0004584639700172863, 'samples': 5673216, 'steps': 29547, 'loss/train': 1.361185073852539} -11/07/2021 01:21:41 - INFO - __main__ - Step 29549: {'lr': 0.00045846104074179504, 'samples': 5673408, 'steps': 29548, 'loss/train': 1.5456278324127197} -11/07/2021 01:21:41 - INFO - __main__ - Step 29550: {'lr': 0.00045845811137237445, 'samples': 5673600, 'steps': 29549, 'loss/train': 2.0732905864715576} -11/07/2021 01:21:42 - INFO - __main__ - Step 29551: {'lr': 0.0004584551819090259, 'samples': 5673792, 'steps': 29550, 'loss/train': 1.9945400953292847} -11/07/2021 01:21:42 - INFO - __main__ - Step 29552: {'lr': 0.0004584522523517506, 'samples': 5673984, 'steps': 29551, 'loss/train': 1.3577299118041992} -11/07/2021 01:21:43 - INFO - __main__ - Step 29553: {'lr': 0.00045844932270054997, 'samples': 5674176, 'steps': 29552, 'loss/train': 2.1527366638183594} -11/07/2021 01:21:43 - INFO - __main__ - Step 29554: {'lr': 0.00045844639295542525, 'samples': 5674368, 'steps': 29553, 'loss/train': 1.4013590812683105} -11/07/2021 01:21:44 - INFO - __main__ - Step 29555: {'lr': 0.0004584434631163779, 'samples': 5674560, 'steps': 29554, 'loss/train': 1.350577712059021} -11/07/2021 01:21:44 - INFO - __main__ - Step 29556: {'lr': 0.000458440533183409, 'samples': 5674752, 'steps': 29555, 'loss/train': 1.1925235986709595} -11/07/2021 01:21:44 - INFO - __main__ - Step 29557: {'lr': 0.0004584376031565201, 'samples': 5674944, 'steps': 29556, 'loss/train': 1.6832846403121948} -11/07/2021 01:21:46 - INFO - __main__ - Step 29558: {'lr': 0.0004584346730357124, 'samples': 5675136, 'steps': 29557, 'loss/train': 1.5070879459381104} -11/07/2021 01:21:46 - INFO - __main__ - Step 29559: {'lr': 0.0004584317428209872, 'samples': 5675328, 'steps': 29558, 'loss/train': 1.5490034818649292} -11/07/2021 01:21:46 - INFO - __main__ - Step 29560: {'lr': 0.0004584288125123459, 'samples': 5675520, 'steps': 29559, 'loss/train': 1.1577174663543701} -11/07/2021 01:21:47 - INFO - __main__ - Step 29561: {'lr': 0.0004584258821097899, 'samples': 5675712, 'steps': 29560, 'loss/train': 1.5316812992095947} -11/07/2021 01:21:47 - INFO - __main__ - Step 29562: {'lr': 0.0004584229516133203, 'samples': 5675904, 'steps': 29561, 'loss/train': 1.6711317300796509} -11/07/2021 01:21:48 - INFO - __main__ - Step 29563: {'lr': 0.00045842002102293856, 'samples': 5676096, 'steps': 29562, 'loss/train': 1.4156216382980347} -11/07/2021 01:21:48 - INFO - __main__ - Step 29564: {'lr': 0.000458417090338646, 'samples': 5676288, 'steps': 29563, 'loss/train': 1.5477793216705322} -11/07/2021 01:21:49 - INFO - __main__ - Step 29565: {'lr': 0.00045841415956044394, 'samples': 5676480, 'steps': 29564, 'loss/train': 0.47286054491996765} -11/07/2021 01:21:49 - INFO - __main__ - Step 29566: {'lr': 0.0004584112286883336, 'samples': 5676672, 'steps': 29565, 'loss/train': 1.372520089149475} -11/07/2021 01:21:49 - INFO - __main__ - Step 29567: {'lr': 0.0004584082977223164, 'samples': 5676864, 'steps': 29566, 'loss/train': 1.6289653778076172} -11/07/2021 01:21:51 - INFO - __main__ - Step 29568: {'lr': 0.0004584053666623937, 'samples': 5677056, 'steps': 29567, 'loss/train': 1.2834872007369995} -11/07/2021 01:21:51 - INFO - __main__ - Step 29569: {'lr': 0.00045840243550856666, 'samples': 5677248, 'steps': 29568, 'loss/train': 1.9355740547180176} -11/07/2021 01:21:51 - INFO - __main__ - Step 29570: {'lr': 0.00045839950426083677, 'samples': 5677440, 'steps': 29569, 'loss/train': 1.7786345481872559} -11/07/2021 01:21:52 - INFO - __main__ - Step 29571: {'lr': 0.0004583965729192052, 'samples': 5677632, 'steps': 29570, 'loss/train': 1.6350317001342773} -11/07/2021 01:21:52 - INFO - __main__ - Step 29572: {'lr': 0.00045839364148367345, 'samples': 5677824, 'steps': 29571, 'loss/train': 1.5409319400787354} -11/07/2021 01:21:52 - INFO - __main__ - Step 29573: {'lr': 0.00045839070995424273, 'samples': 5678016, 'steps': 29572, 'loss/train': 1.367226004600525} -11/07/2021 01:21:53 - INFO - __main__ - Step 29574: {'lr': 0.00045838777833091425, 'samples': 5678208, 'steps': 29573, 'loss/train': 1.731628656387329} -11/07/2021 01:21:54 - INFO - __main__ - Step 29575: {'lr': 0.00045838484661368963, 'samples': 5678400, 'steps': 29574, 'loss/train': 1.5066232681274414} -11/07/2021 01:21:54 - INFO - __main__ - Step 29576: {'lr': 0.00045838191480256985, 'samples': 5678592, 'steps': 29575, 'loss/train': 1.3395975828170776} -11/07/2021 01:21:54 - INFO - __main__ - Step 29577: {'lr': 0.00045837898289755654, 'samples': 5678784, 'steps': 29576, 'loss/train': 1.3253049850463867} -11/07/2021 01:21:55 - INFO - __main__ - Step 29578: {'lr': 0.0004583760508986508, 'samples': 5678976, 'steps': 29577, 'loss/train': 1.2868000268936157} -11/07/2021 01:21:56 - INFO - __main__ - Step 29579: {'lr': 0.000458373118805854, 'samples': 5679168, 'steps': 29578, 'loss/train': 1.4119806289672852} -11/07/2021 01:21:56 - INFO - __main__ - Step 29580: {'lr': 0.00045837018661916754, 'samples': 5679360, 'steps': 29579, 'loss/train': 1.2361005544662476} -11/07/2021 01:21:56 - INFO - __main__ - Step 29581: {'lr': 0.00045836725433859266, 'samples': 5679552, 'steps': 29580, 'loss/train': 2.188758611679077} -11/07/2021 01:21:57 - INFO - __main__ - Step 29582: {'lr': 0.0004583643219641307, 'samples': 5679744, 'steps': 29581, 'loss/train': 1.2891649007797241} -11/07/2021 01:21:57 - INFO - __main__ - Step 29583: {'lr': 0.00045836138949578297, 'samples': 5679936, 'steps': 29582, 'loss/train': 1.5164471864700317} -11/07/2021 01:21:58 - INFO - __main__ - Step 29584: {'lr': 0.00045835845693355096, 'samples': 5680128, 'steps': 29583, 'loss/train': 1.9012441635131836} -11/07/2021 01:21:59 - INFO - __main__ - Step 29585: {'lr': 0.00045835552427743567, 'samples': 5680320, 'steps': 29584, 'loss/train': 1.8651920557022095} -11/07/2021 01:21:59 - INFO - __main__ - Step 29586: {'lr': 0.00045835259152743866, 'samples': 5680512, 'steps': 29585, 'loss/train': 1.9096503257751465} -11/07/2021 01:21:59 - INFO - __main__ - Step 29587: {'lr': 0.0004583496586835612, 'samples': 5680704, 'steps': 29586, 'loss/train': 1.5053143501281738} -11/07/2021 01:22:00 - INFO - __main__ - Step 29588: {'lr': 0.0004583467257458046, 'samples': 5680896, 'steps': 29587, 'loss/train': 0.6775304079055786} -11/07/2021 01:22:01 - INFO - __main__ - Step 29589: {'lr': 0.00045834379271417013, 'samples': 5681088, 'steps': 29588, 'loss/train': 1.7188389301300049} -11/07/2021 01:22:02 - INFO - __main__ - Step 29590: {'lr': 0.0004583408595886592, 'samples': 5681280, 'steps': 29589, 'loss/train': 1.8896228075027466} -11/07/2021 01:22:02 - INFO - __main__ - Step 29591: {'lr': 0.0004583379263692732, 'samples': 5681472, 'steps': 29590, 'loss/train': 1.986293077468872} -11/07/2021 01:22:02 - INFO - __main__ - Step 29592: {'lr': 0.0004583349930560132, 'samples': 5681664, 'steps': 29591, 'loss/train': 0.1942824423313141} -11/07/2021 01:22:03 - INFO - __main__ - Step 29593: {'lr': 0.0004583320596488807, 'samples': 5681856, 'steps': 29592, 'loss/train': 1.5070799589157104} -11/07/2021 01:22:04 - INFO - __main__ - Step 29594: {'lr': 0.000458329126147877, 'samples': 5682048, 'steps': 29593, 'loss/train': 2.0239007472991943} -11/07/2021 01:22:04 - INFO - __main__ - Step 29595: {'lr': 0.00045832619255300344, 'samples': 5682240, 'steps': 29594, 'loss/train': 1.57216215133667} -11/07/2021 01:22:05 - INFO - __main__ - Step 29596: {'lr': 0.00045832325886426125, 'samples': 5682432, 'steps': 29595, 'loss/train': 1.732596755027771} -11/07/2021 01:22:05 - INFO - __main__ - Step 29597: {'lr': 0.0004583203250816518, 'samples': 5682624, 'steps': 29596, 'loss/train': 1.4190809726715088} -11/07/2021 01:22:05 - INFO - __main__ - Step 29598: {'lr': 0.0004583173912051765, 'samples': 5682816, 'steps': 29597, 'loss/train': 0.721015989780426} -11/07/2021 01:22:06 - INFO - __main__ - Step 29599: {'lr': 0.00045831445723483656, 'samples': 5683008, 'steps': 29598, 'loss/train': 1.7590328454971313} -11/07/2021 01:22:07 - INFO - __main__ - Step 29600: {'lr': 0.0004583115231706334, 'samples': 5683200, 'steps': 29599, 'loss/train': 1.3749176263809204} -11/07/2021 01:22:07 - INFO - __main__ - Step 29601: {'lr': 0.0004583085890125682, 'samples': 5683392, 'steps': 29600, 'loss/train': 1.6116366386413574} -11/07/2021 01:22:07 - INFO - __main__ - Step 29602: {'lr': 0.0004583056547606424, 'samples': 5683584, 'steps': 29601, 'loss/train': 1.6327733993530273} -11/07/2021 01:22:08 - INFO - __main__ - Step 29603: {'lr': 0.0004583027204148573, 'samples': 5683776, 'steps': 29602, 'loss/train': 1.0818742513656616} -11/07/2021 01:22:08 - INFO - __main__ - Step 29604: {'lr': 0.0004582997859752142, 'samples': 5683968, 'steps': 29603, 'loss/train': 1.9879107475280762} -11/07/2021 01:22:09 - INFO - __main__ - Step 29605: {'lr': 0.0004582968514417144, 'samples': 5684160, 'steps': 29604, 'loss/train': 1.4256826639175415} -11/07/2021 01:22:10 - INFO - __main__ - Step 29606: {'lr': 0.00045829391681435926, 'samples': 5684352, 'steps': 29605, 'loss/train': 1.6640363931655884} -11/07/2021 01:22:10 - INFO - __main__ - Step 29607: {'lr': 0.0004582909820931501, 'samples': 5684544, 'steps': 29606, 'loss/train': 1.8146600723266602} -11/07/2021 01:22:10 - INFO - __main__ - Step 29608: {'lr': 0.00045828804727808824, 'samples': 5684736, 'steps': 29607, 'loss/train': 1.7391760349273682} -11/07/2021 01:22:11 - INFO - __main__ - Step 29609: {'lr': 0.000458285112369175, 'samples': 5684928, 'steps': 29608, 'loss/train': 1.596211314201355} -11/07/2021 01:22:12 - INFO - __main__ - Step 29610: {'lr': 0.0004582821773664118, 'samples': 5685120, 'steps': 29609, 'loss/train': 1.5998541116714478} -11/07/2021 01:22:12 - INFO - __main__ - Step 29611: {'lr': 0.0004582792422697997, 'samples': 5685312, 'steps': 29610, 'loss/train': 1.378007173538208} -11/07/2021 01:22:12 - INFO - __main__ - Step 29612: {'lr': 0.0004582763070793403, 'samples': 5685504, 'steps': 29611, 'loss/train': 1.8445258140563965} -11/07/2021 01:22:13 - INFO - __main__ - Step 29613: {'lr': 0.0004582733717950347, 'samples': 5685696, 'steps': 29612, 'loss/train': 1.6518462896347046} -11/07/2021 01:22:13 - INFO - __main__ - Step 29614: {'lr': 0.00045827043641688444, 'samples': 5685888, 'steps': 29613, 'loss/train': 1.6120516061782837} -11/07/2021 01:22:14 - INFO - __main__ - Step 29615: {'lr': 0.00045826750094489065, 'samples': 5686080, 'steps': 29614, 'loss/train': 1.4761862754821777} -11/07/2021 01:22:15 - INFO - __main__ - Step 29616: {'lr': 0.00045826456537905483, 'samples': 5686272, 'steps': 29615, 'loss/train': 1.6258699893951416} -11/07/2021 01:22:15 - INFO - __main__ - Step 29617: {'lr': 0.0004582616297193781, 'samples': 5686464, 'steps': 29616, 'loss/train': 1.48533296585083} -11/07/2021 01:22:15 - INFO - __main__ - Step 29618: {'lr': 0.000458258693965862, 'samples': 5686656, 'steps': 29617, 'loss/train': 1.9197696447372437} -11/07/2021 01:22:16 - INFO - __main__ - Step 29619: {'lr': 0.0004582557581185077, 'samples': 5686848, 'steps': 29618, 'loss/train': 0.8355976343154907} -11/07/2021 01:22:17 - INFO - __main__ - Step 29620: {'lr': 0.00045825282217731655, 'samples': 5687040, 'steps': 29619, 'loss/train': 1.4850707054138184} -11/07/2021 01:22:17 - INFO - __main__ - Step 29621: {'lr': 0.00045824988614228995, 'samples': 5687232, 'steps': 29620, 'loss/train': 0.415968120098114} -11/07/2021 01:22:17 - INFO - __main__ - Step 29622: {'lr': 0.0004582469500134292, 'samples': 5687424, 'steps': 29621, 'loss/train': 1.5455137491226196} -11/07/2021 01:22:18 - INFO - __main__ - Step 29623: {'lr': 0.00045824401379073544, 'samples': 5687616, 'steps': 29622, 'loss/train': 2.0614051818847656} -11/07/2021 01:22:18 - INFO - __main__ - Step 29624: {'lr': 0.0004582410774742103, 'samples': 5687808, 'steps': 29623, 'loss/train': 1.6692601442337036} -11/07/2021 01:22:20 - INFO - __main__ - Step 29625: {'lr': 0.00045823814106385485, 'samples': 5688000, 'steps': 29624, 'loss/train': 1.550163984298706} -11/07/2021 01:22:20 - INFO - __main__ - Step 29626: {'lr': 0.0004582352045596705, 'samples': 5688192, 'steps': 29625, 'loss/train': 1.4578899145126343} -11/07/2021 01:22:20 - INFO - __main__ - Step 29627: {'lr': 0.0004582322679616586, 'samples': 5688384, 'steps': 29626, 'loss/train': 2.6318256855010986} -11/07/2021 01:22:21 - INFO - __main__ - Step 29628: {'lr': 0.0004582293312698205, 'samples': 5688576, 'steps': 29627, 'loss/train': 1.6896731853485107} -11/07/2021 01:22:21 - INFO - __main__ - Step 29629: {'lr': 0.00045822639448415736, 'samples': 5688768, 'steps': 29628, 'loss/train': 1.2518410682678223} -11/07/2021 01:22:21 - INFO - __main__ - Step 29630: {'lr': 0.0004582234576046707, 'samples': 5688960, 'steps': 29629, 'loss/train': 1.666911005973816} -11/07/2021 01:22:23 - INFO - __main__ - Step 29631: {'lr': 0.00045822052063136177, 'samples': 5689152, 'steps': 29630, 'loss/train': 1.9199504852294922} -11/07/2021 01:22:23 - INFO - __main__ - Step 29632: {'lr': 0.0004582175835642319, 'samples': 5689344, 'steps': 29631, 'loss/train': 1.5861963033676147} -11/07/2021 01:22:23 - INFO - __main__ - Step 29633: {'lr': 0.0004582146464032824, 'samples': 5689536, 'steps': 29632, 'loss/train': 1.229762077331543} -11/07/2021 01:22:24 - INFO - __main__ - Step 29634: {'lr': 0.0004582117091485145, 'samples': 5689728, 'steps': 29633, 'loss/train': 1.304877758026123} -11/07/2021 01:22:24 - INFO - __main__ - Step 29635: {'lr': 0.0004582087717999297, 'samples': 5689920, 'steps': 29634, 'loss/train': 1.5370056629180908} -11/07/2021 01:22:24 - INFO - __main__ - Step 29636: {'lr': 0.0004582058343575292, 'samples': 5690112, 'steps': 29635, 'loss/train': 1.7247610092163086} -11/07/2021 01:22:25 - INFO - __main__ - Step 29637: {'lr': 0.00045820289682131437, 'samples': 5690304, 'steps': 29636, 'loss/train': 0.6707466840744019} -11/07/2021 01:22:26 - INFO - __main__ - Step 29638: {'lr': 0.0004581999591912865, 'samples': 5690496, 'steps': 29637, 'loss/train': 1.200347900390625} -11/07/2021 01:22:26 - INFO - __main__ - Step 29639: {'lr': 0.000458197021467447, 'samples': 5690688, 'steps': 29638, 'loss/train': 1.260533094406128} -11/07/2021 01:22:27 - INFO - __main__ - Step 29640: {'lr': 0.00045819408364979714, 'samples': 5690880, 'steps': 29639, 'loss/train': 0.8662011623382568} -11/07/2021 01:22:27 - INFO - __main__ - Step 29641: {'lr': 0.0004581911457383382, 'samples': 5691072, 'steps': 29640, 'loss/train': 1.6379077434539795} -11/07/2021 01:22:28 - INFO - __main__ - Step 29642: {'lr': 0.0004581882077330716, 'samples': 5691264, 'steps': 29641, 'loss/train': 1.6704963445663452} -11/07/2021 01:22:28 - INFO - __main__ - Step 29643: {'lr': 0.0004581852696339985, 'samples': 5691456, 'steps': 29642, 'loss/train': 1.9362915754318237} -11/07/2021 01:22:29 - INFO - __main__ - Step 29644: {'lr': 0.00045818233144112044, 'samples': 5691648, 'steps': 29643, 'loss/train': 1.3519880771636963} -11/07/2021 01:22:29 - INFO - __main__ - Step 29645: {'lr': 0.00045817939315443855, 'samples': 5691840, 'steps': 29644, 'loss/train': 1.4004114866256714} -11/07/2021 01:22:29 - INFO - __main__ - Step 29646: {'lr': 0.0004581764547739543, 'samples': 5692032, 'steps': 29645, 'loss/train': 1.1390637159347534} -11/07/2021 01:22:30 - INFO - __main__ - Step 29647: {'lr': 0.00045817351629966896, 'samples': 5692224, 'steps': 29646, 'loss/train': 1.4488816261291504} -11/07/2021 01:22:31 - INFO - __main__ - Step 29648: {'lr': 0.00045817057773158375, 'samples': 5692416, 'steps': 29647, 'loss/train': 1.579978346824646} -11/07/2021 01:22:31 - INFO - __main__ - Step 29649: {'lr': 0.0004581676390697002, 'samples': 5692608, 'steps': 29648, 'loss/train': 0.9321296811103821} -11/07/2021 01:22:31 - INFO - __main__ - Step 29650: {'lr': 0.00045816470031401945, 'samples': 5692800, 'steps': 29649, 'loss/train': 1.462112307548523} -11/07/2021 01:22:32 - INFO - __main__ - Step 29651: {'lr': 0.00045816176146454296, 'samples': 5692992, 'steps': 29650, 'loss/train': 1.399960994720459} -11/07/2021 01:22:32 - INFO - __main__ - Step 29652: {'lr': 0.00045815882252127197, 'samples': 5693184, 'steps': 29651, 'loss/train': 1.866282343864441} -11/07/2021 01:22:34 - INFO - __main__ - Step 29653: {'lr': 0.0004581558834842078, 'samples': 5693376, 'steps': 29652, 'loss/train': 1.5247520208358765} -11/07/2021 01:22:34 - INFO - __main__ - Step 29654: {'lr': 0.00045815294435335184, 'samples': 5693568, 'steps': 29653, 'loss/train': 1.0651295185089111} -11/07/2021 01:22:34 - INFO - __main__ - Step 29655: {'lr': 0.0004581500051287053, 'samples': 5693760, 'steps': 29654, 'loss/train': 0.4343424439430237} -11/07/2021 01:22:35 - INFO - __main__ - Step 29656: {'lr': 0.00045814706581026967, 'samples': 5693952, 'steps': 29655, 'loss/train': 1.4132171869277954} -11/07/2021 01:22:35 - INFO - __main__ - Step 29657: {'lr': 0.0004581441263980461, 'samples': 5694144, 'steps': 29656, 'loss/train': 1.448478102684021} -11/07/2021 01:22:36 - INFO - __main__ - Step 29658: {'lr': 0.0004581411868920361, 'samples': 5694336, 'steps': 29657, 'loss/train': 0.7318187952041626} -11/07/2021 01:22:36 - INFO - __main__ - Step 29659: {'lr': 0.00045813824729224085, 'samples': 5694528, 'steps': 29658, 'loss/train': 1.9026389122009277} -11/07/2021 01:22:37 - INFO - __main__ - Step 29660: {'lr': 0.0004581353075986617, 'samples': 5694720, 'steps': 29659, 'loss/train': 1.1821388006210327} -11/07/2021 01:22:37 - INFO - __main__ - Step 29661: {'lr': 0.00045813236781129996, 'samples': 5694912, 'steps': 29660, 'loss/train': 1.7136733531951904} -11/07/2021 01:22:37 - INFO - __main__ - Step 29662: {'lr': 0.00045812942793015707, 'samples': 5695104, 'steps': 29661, 'loss/train': 0.9536595940589905} -11/07/2021 01:22:38 - INFO - __main__ - Step 29663: {'lr': 0.0004581264879552342, 'samples': 5695296, 'steps': 29662, 'loss/train': 1.8095760345458984} -11/07/2021 01:22:39 - INFO - __main__ - Step 29664: {'lr': 0.00045812354788653275, 'samples': 5695488, 'steps': 29663, 'loss/train': 2.0689356327056885} -11/07/2021 01:22:39 - INFO - __main__ - Step 29665: {'lr': 0.00045812060772405403, 'samples': 5695680, 'steps': 29664, 'loss/train': 1.4600616693496704} -11/07/2021 01:22:40 - INFO - __main__ - Step 29666: {'lr': 0.0004581176674677995, 'samples': 5695872, 'steps': 29665, 'loss/train': 1.7237344980239868} -11/07/2021 01:22:40 - INFO - __main__ - Step 29667: {'lr': 0.00045811472711777026, 'samples': 5696064, 'steps': 29666, 'loss/train': 1.4242371320724487} -11/07/2021 01:22:41 - INFO - __main__ - Step 29668: {'lr': 0.0004581117866739677, 'samples': 5696256, 'steps': 29667, 'loss/train': 1.5728676319122314} -11/07/2021 01:22:41 - INFO - __main__ - Step 29669: {'lr': 0.00045810884613639325, 'samples': 5696448, 'steps': 29668, 'loss/train': 1.5524414777755737} -11/07/2021 01:22:42 - INFO - __main__ - Step 29670: {'lr': 0.00045810590550504816, 'samples': 5696640, 'steps': 29669, 'loss/train': 1.336570382118225} -11/07/2021 01:22:42 - INFO - __main__ - Step 29671: {'lr': 0.0004581029647799337, 'samples': 5696832, 'steps': 29670, 'loss/train': 1.8532898426055908} -11/07/2021 01:22:42 - INFO - __main__ - Step 29672: {'lr': 0.0004581000239610513, 'samples': 5697024, 'steps': 29671, 'loss/train': 1.6476597785949707} -11/07/2021 01:22:43 - INFO - __main__ - Step 29673: {'lr': 0.0004580970830484023, 'samples': 5697216, 'steps': 29672, 'loss/train': 1.576622486114502} -11/07/2021 01:22:44 - INFO - __main__ - Step 29674: {'lr': 0.00045809414204198785, 'samples': 5697408, 'steps': 29673, 'loss/train': 0.773138701915741} -11/07/2021 01:22:44 - INFO - __main__ - Step 29675: {'lr': 0.00045809120094180946, 'samples': 5697600, 'steps': 29674, 'loss/train': 1.7726764678955078} -11/07/2021 01:22:44 - INFO - __main__ - Step 29676: {'lr': 0.00045808825974786834, 'samples': 5697792, 'steps': 29675, 'loss/train': 1.6256364583969116} -11/07/2021 01:22:45 - INFO - __main__ - Step 29677: {'lr': 0.0004580853184601659, 'samples': 5697984, 'steps': 29676, 'loss/train': 1.227905511856079} -11/07/2021 01:22:46 - INFO - __main__ - Step 29678: {'lr': 0.0004580823770787034, 'samples': 5698176, 'steps': 29677, 'loss/train': 1.5438227653503418} -11/07/2021 01:22:46 - INFO - __main__ - Step 29679: {'lr': 0.0004580794356034822, 'samples': 5698368, 'steps': 29678, 'loss/train': 1.741622805595398} -11/07/2021 01:22:46 - INFO - __main__ - Step 29680: {'lr': 0.0004580764940345036, 'samples': 5698560, 'steps': 29679, 'loss/train': 1.3502264022827148} -11/07/2021 01:22:47 - INFO - __main__ - Step 29681: {'lr': 0.00045807355237176896, 'samples': 5698752, 'steps': 29680, 'loss/train': 1.0882927179336548} -11/07/2021 01:22:47 - INFO - __main__ - Step 29682: {'lr': 0.0004580706106152796, 'samples': 5698944, 'steps': 29681, 'loss/train': 1.5208772420883179} -11/07/2021 01:22:48 - INFO - __main__ - Step 29683: {'lr': 0.00045806766876503683, 'samples': 5699136, 'steps': 29682, 'loss/train': 1.5638811588287354} -11/07/2021 01:22:49 - INFO - __main__ - Step 29684: {'lr': 0.000458064726821042, 'samples': 5699328, 'steps': 29683, 'loss/train': 2.4141056537628174} -11/07/2021 01:22:49 - INFO - __main__ - Step 29685: {'lr': 0.0004580617847832964, 'samples': 5699520, 'steps': 29684, 'loss/train': 1.8928292989730835} -11/07/2021 01:22:49 - INFO - __main__ - Step 29686: {'lr': 0.0004580588426518013, 'samples': 5699712, 'steps': 29685, 'loss/train': 1.3639895915985107} -11/07/2021 01:22:50 - INFO - __main__ - Step 29687: {'lr': 0.0004580559004265582, 'samples': 5699904, 'steps': 29686, 'loss/train': 1.5898321866989136} -11/07/2021 01:22:51 - INFO - __main__ - Step 29688: {'lr': 0.0004580529581075683, 'samples': 5700096, 'steps': 29687, 'loss/train': 1.2457053661346436} -11/07/2021 01:22:51 - INFO - __main__ - Step 29689: {'lr': 0.0004580500156948329, 'samples': 5700288, 'steps': 29688, 'loss/train': 1.5697243213653564} -11/07/2021 01:22:51 - INFO - __main__ - Step 29690: {'lr': 0.0004580470731883534, 'samples': 5700480, 'steps': 29689, 'loss/train': 1.5891913175582886} -11/07/2021 01:22:52 - INFO - __main__ - Step 29691: {'lr': 0.0004580441305881311, 'samples': 5700672, 'steps': 29690, 'loss/train': 1.4484436511993408} -11/07/2021 01:22:52 - INFO - __main__ - Step 29692: {'lr': 0.0004580411878941673, 'samples': 5700864, 'steps': 29691, 'loss/train': 1.649519681930542} -11/07/2021 01:22:53 - INFO - __main__ - Step 29693: {'lr': 0.0004580382451064634, 'samples': 5701056, 'steps': 29692, 'loss/train': 1.3619575500488281} -11/07/2021 01:22:53 - INFO - __main__ - Step 29694: {'lr': 0.00045803530222502065, 'samples': 5701248, 'steps': 29693, 'loss/train': 1.5870784521102905} -11/07/2021 01:22:54 - INFO - __main__ - Step 29695: {'lr': 0.0004580323592498404, 'samples': 5701440, 'steps': 29694, 'loss/train': 1.6245121955871582} -11/07/2021 01:22:54 - INFO - __main__ - Step 29696: {'lr': 0.00045802941618092397, 'samples': 5701632, 'steps': 29695, 'loss/train': 1.578203797340393} -11/07/2021 01:22:55 - INFO - __main__ - Step 29697: {'lr': 0.0004580264730182727, 'samples': 5701824, 'steps': 29696, 'loss/train': 1.8025213479995728} -11/07/2021 01:22:55 - INFO - __main__ - Step 29698: {'lr': 0.000458023529761888, 'samples': 5702016, 'steps': 29697, 'loss/train': 1.5820423364639282} -11/07/2021 01:22:56 - INFO - __main__ - Step 29699: {'lr': 0.00045802058641177104, 'samples': 5702208, 'steps': 29698, 'loss/train': 1.6937873363494873} -11/07/2021 01:22:56 - INFO - __main__ - Step 29700: {'lr': 0.00045801764296792317, 'samples': 5702400, 'steps': 29699, 'loss/train': 1.8489793539047241} -11/07/2021 01:22:57 - INFO - __main__ - Step 29701: {'lr': 0.0004580146994303458, 'samples': 5702592, 'steps': 29700, 'loss/train': 1.885706901550293} -11/07/2021 01:22:57 - INFO - __main__ - Step 29702: {'lr': 0.0004580117557990402, 'samples': 5702784, 'steps': 29701, 'loss/train': 1.9294558763504028} -11/07/2021 01:22:57 - INFO - __main__ - Step 29703: {'lr': 0.0004580088120740077, 'samples': 5702976, 'steps': 29702, 'loss/train': 1.8159981966018677} -11/07/2021 01:22:58 - INFO - __main__ - Step 29704: {'lr': 0.0004580058682552497, 'samples': 5703168, 'steps': 29703, 'loss/train': 1.570683479309082} -11/07/2021 01:22:59 - INFO - __main__ - Step 29705: {'lr': 0.00045800292434276736, 'samples': 5703360, 'steps': 29704, 'loss/train': 1.5014185905456543} -11/07/2021 01:22:59 - INFO - __main__ - Step 29706: {'lr': 0.0004579999803365622, 'samples': 5703552, 'steps': 29705, 'loss/train': 1.7709827423095703} -11/07/2021 01:23:00 - INFO - __main__ - Step 29707: {'lr': 0.00045799703623663546, 'samples': 5703744, 'steps': 29706, 'loss/train': 1.4139878749847412} -11/07/2021 01:23:00 - INFO - __main__ - Step 29708: {'lr': 0.00045799409204298844, 'samples': 5703936, 'steps': 29707, 'loss/train': 1.8164315223693848} -11/07/2021 01:23:00 - INFO - __main__ - Step 29709: {'lr': 0.00045799114775562245, 'samples': 5704128, 'steps': 29708, 'loss/train': 1.409840703010559} -11/07/2021 01:23:01 - INFO - __main__ - Step 29710: {'lr': 0.00045798820337453894, 'samples': 5704320, 'steps': 29709, 'loss/train': 1.6338276863098145} -11/07/2021 01:23:02 - INFO - __main__ - Step 29711: {'lr': 0.00045798525889973905, 'samples': 5704512, 'steps': 29710, 'loss/train': 1.4953669309616089} -11/07/2021 01:23:02 - INFO - __main__ - Step 29712: {'lr': 0.00045798231433122436, 'samples': 5704704, 'steps': 29711, 'loss/train': 1.7392159700393677} -11/07/2021 01:23:02 - INFO - __main__ - Step 29713: {'lr': 0.00045797936966899595, 'samples': 5704896, 'steps': 29712, 'loss/train': 1.2416294813156128} -11/07/2021 01:23:03 - INFO - __main__ - Step 29714: {'lr': 0.00045797642491305523, 'samples': 5705088, 'steps': 29713, 'loss/train': 1.5721782445907593} -11/07/2021 01:23:04 - INFO - __main__ - Step 29715: {'lr': 0.0004579734800634036, 'samples': 5705280, 'steps': 29714, 'loss/train': 1.1889970302581787} -11/07/2021 01:23:04 - INFO - __main__ - Step 29716: {'lr': 0.0004579705351200423, 'samples': 5705472, 'steps': 29715, 'loss/train': 1.799396276473999} -11/07/2021 01:23:04 - INFO - __main__ - Step 29717: {'lr': 0.0004579675900829727, 'samples': 5705664, 'steps': 29716, 'loss/train': 0.6931185126304626} -11/07/2021 01:23:05 - INFO - __main__ - Step 29718: {'lr': 0.00045796464495219614, 'samples': 5705856, 'steps': 29717, 'loss/train': 0.6500502824783325} -11/07/2021 01:23:05 - INFO - __main__ - Step 29719: {'lr': 0.00045796169972771387, 'samples': 5706048, 'steps': 29718, 'loss/train': 1.6350395679473877} -11/07/2021 01:23:05 - INFO - __main__ - Step 29720: {'lr': 0.00045795875440952726, 'samples': 5706240, 'steps': 29719, 'loss/train': 1.9400047063827515} -11/07/2021 01:23:07 - INFO - __main__ - Step 29721: {'lr': 0.00045795580899763767, 'samples': 5706432, 'steps': 29720, 'loss/train': 5.601465225219727} -11/07/2021 01:23:07 - INFO - __main__ - Step 29722: {'lr': 0.00045795286349204633, 'samples': 5706624, 'steps': 29721, 'loss/train': 1.3674595355987549} -11/07/2021 01:23:07 - INFO - __main__ - Step 29723: {'lr': 0.0004579499178927547, 'samples': 5706816, 'steps': 29722, 'loss/train': 1.397915005683899} -11/07/2021 01:23:08 - INFO - __main__ - Step 29724: {'lr': 0.0004579469721997641, 'samples': 5707008, 'steps': 29723, 'loss/train': 1.326294183731079} -11/07/2021 01:23:08 - INFO - __main__ - Step 29725: {'lr': 0.0004579440264130758, 'samples': 5707200, 'steps': 29724, 'loss/train': 1.4774163961410522} -11/07/2021 01:23:09 - INFO - __main__ - Step 29726: {'lr': 0.000457941080532691, 'samples': 5707392, 'steps': 29725, 'loss/train': 1.7879488468170166} -11/07/2021 01:23:09 - INFO - __main__ - Step 29727: {'lr': 0.0004579381345586113, 'samples': 5707584, 'steps': 29726, 'loss/train': 1.5059592723846436} -11/07/2021 01:23:10 - INFO - __main__ - Step 29728: {'lr': 0.0004579351884908378, 'samples': 5707776, 'steps': 29727, 'loss/train': 1.71578848361969} -11/07/2021 01:23:10 - INFO - __main__ - Step 29729: {'lr': 0.00045793224232937193, 'samples': 5707968, 'steps': 29728, 'loss/train': 1.545784831047058} -11/07/2021 01:23:10 - INFO - __main__ - Step 29730: {'lr': 0.0004579292960742151, 'samples': 5708160, 'steps': 29729, 'loss/train': 1.4610202312469482} -11/07/2021 01:23:11 - INFO - __main__ - Step 29731: {'lr': 0.0004579263497253684, 'samples': 5708352, 'steps': 29730, 'loss/train': 1.483440637588501} -11/07/2021 01:23:12 - INFO - __main__ - Step 29732: {'lr': 0.00045792340328283334, 'samples': 5708544, 'steps': 29731, 'loss/train': 1.6959503889083862} -11/07/2021 01:23:12 - INFO - __main__ - Step 29733: {'lr': 0.0004579204567466112, 'samples': 5708736, 'steps': 29732, 'loss/train': 1.0574575662612915} -11/07/2021 01:23:12 - INFO - __main__ - Step 29734: {'lr': 0.0004579175101167033, 'samples': 5708928, 'steps': 29733, 'loss/train': 1.4164676666259766} -11/07/2021 01:23:13 - INFO - __main__ - Step 29735: {'lr': 0.000457914563393111, 'samples': 5709120, 'steps': 29734, 'loss/train': 1.6582592725753784} -11/07/2021 01:23:13 - INFO - __main__ - Step 29736: {'lr': 0.00045791161657583555, 'samples': 5709312, 'steps': 29735, 'loss/train': 1.8787389993667603} -11/07/2021 01:23:14 - INFO - __main__ - Step 29737: {'lr': 0.00045790866966487843, 'samples': 5709504, 'steps': 29736, 'loss/train': 1.2307028770446777} -11/07/2021 01:23:15 - INFO - __main__ - Step 29738: {'lr': 0.0004579057226602408, 'samples': 5709696, 'steps': 29737, 'loss/train': 1.615642786026001} -11/07/2021 01:23:15 - INFO - __main__ - Step 29739: {'lr': 0.00045790277556192414, 'samples': 5709888, 'steps': 29738, 'loss/train': 1.572300910949707} -11/07/2021 01:23:15 - INFO - __main__ - Step 29740: {'lr': 0.0004578998283699296, 'samples': 5710080, 'steps': 29739, 'loss/train': 1.4859967231750488} -11/07/2021 01:23:16 - INFO - __main__ - Step 29741: {'lr': 0.0004578968810842586, 'samples': 5710272, 'steps': 29740, 'loss/train': 1.0473401546478271} -11/07/2021 01:23:17 - INFO - __main__ - Step 29742: {'lr': 0.0004578939337049126, 'samples': 5710464, 'steps': 29741, 'loss/train': 1.2427921295166016} -11/07/2021 01:23:17 - INFO - __main__ - Step 29743: {'lr': 0.0004578909862318927, 'samples': 5710656, 'steps': 29742, 'loss/train': 2.206838369369507} -11/07/2021 01:23:17 - INFO - __main__ - Step 29744: {'lr': 0.00045788803866520037, 'samples': 5710848, 'steps': 29743, 'loss/train': 1.1564019918441772} -11/07/2021 01:23:18 - INFO - __main__ - Step 29745: {'lr': 0.0004578850910048369, 'samples': 5711040, 'steps': 29744, 'loss/train': 0.6552532315254211} -11/07/2021 01:23:18 - INFO - __main__ - Step 29746: {'lr': 0.0004578821432508036, 'samples': 5711232, 'steps': 29745, 'loss/train': 1.3801320791244507} -11/07/2021 01:23:19 - INFO - __main__ - Step 29747: {'lr': 0.00045787919540310175, 'samples': 5711424, 'steps': 29746, 'loss/train': 1.7450164556503296} -11/07/2021 01:23:20 - INFO - __main__ - Step 29748: {'lr': 0.0004578762474617328, 'samples': 5711616, 'steps': 29747, 'loss/train': 1.2243391275405884} -11/07/2021 01:23:20 - INFO - __main__ - Step 29749: {'lr': 0.00045787329942669803, 'samples': 5711808, 'steps': 29748, 'loss/train': 1.2877225875854492} -11/07/2021 01:23:20 - INFO - __main__ - Step 29750: {'lr': 0.0004578703512979988, 'samples': 5712000, 'steps': 29749, 'loss/train': 1.1598126888275146} -11/07/2021 01:23:21 - INFO - __main__ - Step 29751: {'lr': 0.00045786740307563633, 'samples': 5712192, 'steps': 29750, 'loss/train': 1.3428281545639038} -11/07/2021 01:23:22 - INFO - __main__ - Step 29752: {'lr': 0.000457864454759612, 'samples': 5712384, 'steps': 29751, 'loss/train': 1.5730271339416504} -11/07/2021 01:23:22 - INFO - __main__ - Step 29753: {'lr': 0.00045786150634992716, 'samples': 5712576, 'steps': 29752, 'loss/train': 1.583794355392456} -11/07/2021 01:23:22 - INFO - __main__ - Step 29754: {'lr': 0.0004578585578465833, 'samples': 5712768, 'steps': 29753, 'loss/train': 1.4892146587371826} -11/07/2021 01:23:23 - INFO - __main__ - Step 29755: {'lr': 0.00045785560924958135, 'samples': 5712960, 'steps': 29754, 'loss/train': 1.5873689651489258} -11/07/2021 01:23:23 - INFO - __main__ - Step 29756: {'lr': 0.00045785266055892296, 'samples': 5713152, 'steps': 29755, 'loss/train': 1.9628443717956543} -11/07/2021 01:23:23 - INFO - __main__ - Step 29757: {'lr': 0.0004578497117746094, 'samples': 5713344, 'steps': 29756, 'loss/train': 1.3814347982406616} -11/07/2021 01:23:24 - INFO - __main__ - Step 29758: {'lr': 0.00045784676289664194, 'samples': 5713536, 'steps': 29757, 'loss/train': 1.3554935455322266} -11/07/2021 01:23:25 - INFO - __main__ - Step 29759: {'lr': 0.00045784381392502193, 'samples': 5713728, 'steps': 29758, 'loss/train': 1.3909201622009277} -11/07/2021 01:23:25 - INFO - __main__ - Step 29760: {'lr': 0.00045784086485975076, 'samples': 5713920, 'steps': 29759, 'loss/train': 1.44081449508667} -11/07/2021 01:23:26 - INFO - __main__ - Step 29761: {'lr': 0.00045783791570082956, 'samples': 5714112, 'steps': 29760, 'loss/train': 1.479193091392517} -11/07/2021 01:23:26 - INFO - __main__ - Step 29762: {'lr': 0.00045783496644825997, 'samples': 5714304, 'steps': 29761, 'loss/train': 1.6843669414520264} -11/07/2021 01:23:27 - INFO - __main__ - Step 29763: {'lr': 0.000457832017102043, 'samples': 5714496, 'steps': 29762, 'loss/train': 1.9135608673095703} -11/07/2021 01:23:27 - INFO - __main__ - Step 29764: {'lr': 0.00045782906766218026, 'samples': 5714688, 'steps': 29763, 'loss/train': 1.373593807220459} -11/07/2021 01:23:28 - INFO - __main__ - Step 29765: {'lr': 0.00045782611812867285, 'samples': 5714880, 'steps': 29764, 'loss/train': 1.7488089799880981} -11/07/2021 01:23:28 - INFO - __main__ - Step 29766: {'lr': 0.0004578231685015223, 'samples': 5715072, 'steps': 29765, 'loss/train': 1.6487336158752441} -11/07/2021 01:23:28 - INFO - __main__ - Step 29767: {'lr': 0.00045782021878072976, 'samples': 5715264, 'steps': 29766, 'loss/train': 1.114486575126648} -11/07/2021 01:23:30 - INFO - __main__ - Step 29768: {'lr': 0.0004578172689662967, 'samples': 5715456, 'steps': 29767, 'loss/train': 1.9899827241897583} -11/07/2021 01:23:30 - INFO - __main__ - Step 29769: {'lr': 0.0004578143190582243, 'samples': 5715648, 'steps': 29768, 'loss/train': 1.4738233089447021} -11/07/2021 01:23:31 - INFO - __main__ - Step 29770: {'lr': 0.000457811369056514, 'samples': 5715840, 'steps': 29769, 'loss/train': 1.630418300628662} -11/07/2021 01:23:31 - INFO - __main__ - Step 29771: {'lr': 0.0004578084189611671, 'samples': 5716032, 'steps': 29770, 'loss/train': 2.4739456176757812} -11/07/2021 01:23:31 - INFO - __main__ - Step 29772: {'lr': 0.000457805468772185, 'samples': 5716224, 'steps': 29771, 'loss/train': 1.9433209896087646} -11/07/2021 01:23:32 - INFO - __main__ - Step 29773: {'lr': 0.00045780251848956887, 'samples': 5716416, 'steps': 29772, 'loss/train': 1.7320784330368042} -11/07/2021 01:23:33 - INFO - __main__ - Step 29774: {'lr': 0.0004577995681133202, 'samples': 5716608, 'steps': 29773, 'loss/train': 1.7899585962295532} -11/07/2021 01:23:33 - INFO - __main__ - Step 29775: {'lr': 0.00045779661764344025, 'samples': 5716800, 'steps': 29774, 'loss/train': 1.639638900756836} -11/07/2021 01:23:34 - INFO - __main__ - Step 29776: {'lr': 0.0004577936670799303, 'samples': 5716992, 'steps': 29775, 'loss/train': 1.1416207551956177} -11/07/2021 01:23:34 - INFO - __main__ - Step 29777: {'lr': 0.00045779071642279177, 'samples': 5717184, 'steps': 29776, 'loss/train': 1.4320186376571655} -11/07/2021 01:23:34 - INFO - __main__ - Step 29778: {'lr': 0.00045778776567202597, 'samples': 5717376, 'steps': 29777, 'loss/train': 0.19236861169338226} -11/07/2021 01:23:35 - INFO - __main__ - Step 29779: {'lr': 0.0004577848148276341, 'samples': 5717568, 'steps': 29778, 'loss/train': 1.3992671966552734} -11/07/2021 01:23:36 - INFO - __main__ - Step 29780: {'lr': 0.00045778186388961776, 'samples': 5717760, 'steps': 29779, 'loss/train': 0.9883819818496704} -11/07/2021 01:23:36 - INFO - __main__ - Step 29781: {'lr': 0.000457778912857978, 'samples': 5717952, 'steps': 29780, 'loss/train': 1.4643261432647705} -11/07/2021 01:23:36 - INFO - __main__ - Step 29782: {'lr': 0.0004577759617327163, 'samples': 5718144, 'steps': 29781, 'loss/train': 0.6966073513031006} -11/07/2021 01:23:37 - INFO - __main__ - Step 29783: {'lr': 0.000457773010513834, 'samples': 5718336, 'steps': 29782, 'loss/train': 1.7028216123580933} -11/07/2021 01:23:38 - INFO - __main__ - Step 29784: {'lr': 0.0004577700592013323, 'samples': 5718528, 'steps': 29783, 'loss/train': 1.820124864578247} -11/07/2021 01:23:38 - INFO - __main__ - Step 29785: {'lr': 0.0004577671077952127, 'samples': 5718720, 'steps': 29784, 'loss/train': 1.080474853515625} -11/07/2021 01:23:38 - INFO - __main__ - Step 29786: {'lr': 0.0004577641562954764, 'samples': 5718912, 'steps': 29785, 'loss/train': 1.6864469051361084} -11/07/2021 01:23:39 - INFO - __main__ - Step 29787: {'lr': 0.00045776120470212477, 'samples': 5719104, 'steps': 29786, 'loss/train': 1.9222395420074463} -11/07/2021 01:23:39 - INFO - __main__ - Step 29788: {'lr': 0.00045775825301515923, 'samples': 5719296, 'steps': 29787, 'loss/train': 1.5662935972213745} -11/07/2021 01:23:40 - INFO - __main__ - Step 29789: {'lr': 0.00045775530123458096, 'samples': 5719488, 'steps': 29788, 'loss/train': 1.7799813747406006} -11/07/2021 01:23:41 - INFO - __main__ - Step 29790: {'lr': 0.00045775234936039133, 'samples': 5719680, 'steps': 29789, 'loss/train': 1.6136198043823242} -11/07/2021 01:23:41 - INFO - __main__ - Step 29791: {'lr': 0.00045774939739259173, 'samples': 5719872, 'steps': 29790, 'loss/train': 1.7736300230026245} -11/07/2021 01:23:41 - INFO - __main__ - Step 29792: {'lr': 0.0004577464453311835, 'samples': 5720064, 'steps': 29791, 'loss/train': 1.390116572380066} -11/07/2021 01:23:42 - INFO - __main__ - Step 29793: {'lr': 0.00045774349317616786, 'samples': 5720256, 'steps': 29792, 'loss/train': 1.5883327722549438} -11/07/2021 01:23:43 - INFO - __main__ - Step 29794: {'lr': 0.00045774054092754624, 'samples': 5720448, 'steps': 29793, 'loss/train': 1.7770684957504272} -11/07/2021 01:23:43 - INFO - __main__ - Step 29795: {'lr': 0.00045773758858531997, 'samples': 5720640, 'steps': 29794, 'loss/train': 1.6819716691970825} -11/07/2021 01:23:43 - INFO - __main__ - Step 29796: {'lr': 0.0004577346361494903, 'samples': 5720832, 'steps': 29795, 'loss/train': 1.8606592416763306} -11/07/2021 01:23:44 - INFO - __main__ - Step 29797: {'lr': 0.0004577316836200586, 'samples': 5721024, 'steps': 29796, 'loss/train': 1.347123146057129} -11/07/2021 01:23:44 - INFO - __main__ - Step 29798: {'lr': 0.0004577287309970262, 'samples': 5721216, 'steps': 29797, 'loss/train': 1.5793622732162476} -11/07/2021 01:23:46 - INFO - __main__ - Step 29799: {'lr': 0.0004577257782803945, 'samples': 5721408, 'steps': 29798, 'loss/train': 1.1619411706924438} -11/07/2021 01:23:47 - INFO - __main__ - Step 29800: {'lr': 0.00045772282547016475, 'samples': 5721600, 'steps': 29799, 'loss/train': 1.731318712234497} -11/07/2021 01:23:47 - INFO - __main__ - Step 29801: {'lr': 0.0004577198725663383, 'samples': 5721792, 'steps': 29800, 'loss/train': 1.8544946908950806} -11/07/2021 01:23:47 - INFO - __main__ - Step 29802: {'lr': 0.00045771691956891645, 'samples': 5721984, 'steps': 29801, 'loss/train': 1.3345541954040527} -11/07/2021 01:23:48 - INFO - __main__ - Step 29803: {'lr': 0.00045771396647790053, 'samples': 5722176, 'steps': 29802, 'loss/train': 1.8053834438323975} -11/07/2021 01:23:48 - INFO - __main__ - Step 29804: {'lr': 0.00045771101329329195, 'samples': 5722368, 'steps': 29803, 'loss/train': 1.8068797588348389} -11/07/2021 01:23:48 - INFO - __main__ - Step 29805: {'lr': 0.00045770806001509205, 'samples': 5722560, 'steps': 29804, 'loss/train': 1.7853294610977173} -11/07/2021 01:23:49 - INFO - __main__ - Step 29806: {'lr': 0.00045770510664330203, 'samples': 5722752, 'steps': 29805, 'loss/train': 1.2462117671966553} -11/07/2021 01:23:50 - INFO - __main__ - Step 29807: {'lr': 0.0004577021531779233, 'samples': 5722944, 'steps': 29806, 'loss/train': 1.5601024627685547} -11/07/2021 01:23:50 - INFO - __main__ - Step 29808: {'lr': 0.00045769919961895716, 'samples': 5723136, 'steps': 29807, 'loss/train': 1.5851486921310425} -11/07/2021 01:23:50 - INFO - __main__ - Step 29809: {'lr': 0.000457696245966405, 'samples': 5723328, 'steps': 29808, 'loss/train': 1.6994768381118774} -11/07/2021 01:23:51 - INFO - __main__ - Step 29810: {'lr': 0.0004576932922202681, 'samples': 5723520, 'steps': 29809, 'loss/train': 1.0932499170303345} -11/07/2021 01:23:51 - INFO - __main__ - Step 29811: {'lr': 0.00045769033838054783, 'samples': 5723712, 'steps': 29810, 'loss/train': 1.7573410272598267} -11/07/2021 01:23:52 - INFO - __main__ - Step 29812: {'lr': 0.0004576873844472455, 'samples': 5723904, 'steps': 29811, 'loss/train': 1.5087987184524536} -11/07/2021 01:23:52 - INFO - __main__ - Step 29813: {'lr': 0.00045768443042036247, 'samples': 5724096, 'steps': 29812, 'loss/train': 1.4405393600463867} -11/07/2021 01:23:53 - INFO - __main__ - Step 29814: {'lr': 0.0004576814762999, 'samples': 5724288, 'steps': 29813, 'loss/train': 1.6026747226715088} -11/07/2021 01:23:53 - INFO - __main__ - Step 29815: {'lr': 0.00045767852208585945, 'samples': 5724480, 'steps': 29814, 'loss/train': 1.3455612659454346} -11/07/2021 01:23:53 - INFO - __main__ - Step 29816: {'lr': 0.00045767556777824217, 'samples': 5724672, 'steps': 29815, 'loss/train': 1.5217554569244385} -11/07/2021 01:23:55 - INFO - __main__ - Step 29817: {'lr': 0.00045767261337704946, 'samples': 5724864, 'steps': 29816, 'loss/train': 2.1377294063568115} -11/07/2021 01:23:55 - INFO - __main__ - Step 29818: {'lr': 0.00045766965888228273, 'samples': 5725056, 'steps': 29817, 'loss/train': 1.8070579767227173} -11/07/2021 01:23:55 - INFO - __main__ - Step 29819: {'lr': 0.00045766670429394317, 'samples': 5725248, 'steps': 29818, 'loss/train': 1.0186076164245605} -11/07/2021 01:23:56 - INFO - __main__ - Step 29820: {'lr': 0.00045766374961203236, 'samples': 5725440, 'steps': 29819, 'loss/train': 1.401145100593567} -11/07/2021 01:23:56 - INFO - __main__ - Step 29821: {'lr': 0.0004576607948365513, 'samples': 5725632, 'steps': 29820, 'loss/train': 1.6666818857192993} -11/07/2021 01:23:57 - INFO - __main__ - Step 29822: {'lr': 0.0004576578399675015, 'samples': 5725824, 'steps': 29821, 'loss/train': 1.4097083806991577} -11/07/2021 01:23:57 - INFO - __main__ - Step 29823: {'lr': 0.00045765488500488437, 'samples': 5726016, 'steps': 29822, 'loss/train': 1.3067562580108643} -11/07/2021 01:23:58 - INFO - __main__ - Step 29824: {'lr': 0.0004576519299487012, 'samples': 5726208, 'steps': 29823, 'loss/train': 1.5579853057861328} -11/07/2021 01:23:58 - INFO - __main__ - Step 29825: {'lr': 0.00045764897479895315, 'samples': 5726400, 'steps': 29824, 'loss/train': 1.7080674171447754} -11/07/2021 01:23:58 - INFO - __main__ - Step 29826: {'lr': 0.0004576460195556418, 'samples': 5726592, 'steps': 29825, 'loss/train': 1.8079490661621094} -11/07/2021 01:23:59 - INFO - __main__ - Step 29827: {'lr': 0.0004576430642187682, 'samples': 5726784, 'steps': 29826, 'loss/train': 1.7533303499221802} -11/07/2021 01:24:00 - INFO - __main__ - Step 29828: {'lr': 0.00045764010878833396, 'samples': 5726976, 'steps': 29827, 'loss/train': 1.6237348318099976} -11/07/2021 01:24:00 - INFO - __main__ - Step 29829: {'lr': 0.00045763715326434023, 'samples': 5727168, 'steps': 29828, 'loss/train': 1.3736622333526611} -11/07/2021 01:24:00 - INFO - __main__ - Step 29830: {'lr': 0.0004576341976467884, 'samples': 5727360, 'steps': 29829, 'loss/train': 1.267899990081787} -11/07/2021 01:24:01 - INFO - __main__ - Step 29831: {'lr': 0.00045763124193567983, 'samples': 5727552, 'steps': 29830, 'loss/train': 0.6706776022911072} -11/07/2021 01:24:02 - INFO - __main__ - Step 29832: {'lr': 0.0004576282861310158, 'samples': 5727744, 'steps': 29831, 'loss/train': 1.6785303354263306} -11/07/2021 01:24:02 - INFO - __main__ - Step 29833: {'lr': 0.00045762533023279773, 'samples': 5727936, 'steps': 29832, 'loss/train': 1.4475414752960205} -11/07/2021 01:24:02 - INFO - __main__ - Step 29834: {'lr': 0.00045762237424102687, 'samples': 5728128, 'steps': 29833, 'loss/train': 1.6399792432785034} -11/07/2021 01:24:03 - INFO - __main__ - Step 29835: {'lr': 0.0004576194181557045, 'samples': 5728320, 'steps': 29834, 'loss/train': 1.3964948654174805} -11/07/2021 01:24:03 - INFO - __main__ - Step 29836: {'lr': 0.00045761646197683216, 'samples': 5728512, 'steps': 29835, 'loss/train': 2.0420026779174805} -11/07/2021 01:24:04 - INFO - __main__ - Step 29837: {'lr': 0.00045761350570441096, 'samples': 5728704, 'steps': 29836, 'loss/train': 1.8259185552597046} -11/07/2021 01:24:05 - INFO - __main__ - Step 29838: {'lr': 0.0004576105493384423, 'samples': 5728896, 'steps': 29837, 'loss/train': 1.2299456596374512} -11/07/2021 01:24:05 - INFO - __main__ - Step 29839: {'lr': 0.00045760759287892755, 'samples': 5729088, 'steps': 29838, 'loss/train': 0.7691632509231567} -11/07/2021 01:24:05 - INFO - __main__ - Step 29840: {'lr': 0.000457604636325868, 'samples': 5729280, 'steps': 29839, 'loss/train': 1.6238632202148438} -11/07/2021 01:24:06 - INFO - __main__ - Step 29841: {'lr': 0.00045760167967926504, 'samples': 5729472, 'steps': 29840, 'loss/train': 1.3403931856155396} -11/07/2021 01:24:07 - INFO - __main__ - Step 29842: {'lr': 0.00045759872293911995, 'samples': 5729664, 'steps': 29841, 'loss/train': 1.3798387050628662} -11/07/2021 01:24:07 - INFO - __main__ - Step 29843: {'lr': 0.00045759576610543407, 'samples': 5729856, 'steps': 29842, 'loss/train': 1.6725951433181763} -11/07/2021 01:24:07 - INFO - __main__ - Step 29844: {'lr': 0.0004575928091782088, 'samples': 5730048, 'steps': 29843, 'loss/train': 1.3758196830749512} -11/07/2021 01:24:08 - INFO - __main__ - Step 29845: {'lr': 0.00045758985215744536, 'samples': 5730240, 'steps': 29844, 'loss/train': 1.447424292564392} -11/07/2021 01:24:08 - INFO - __main__ - Step 29846: {'lr': 0.0004575868950431452, 'samples': 5730432, 'steps': 29845, 'loss/train': 1.807071328163147} -11/07/2021 01:24:08 - INFO - __main__ - Step 29847: {'lr': 0.0004575839378353095, 'samples': 5730624, 'steps': 29846, 'loss/train': 1.5199185609817505} -11/07/2021 01:24:09 - INFO - __main__ - Step 29848: {'lr': 0.0004575809805339397, 'samples': 5730816, 'steps': 29847, 'loss/train': 1.3373128175735474} -11/07/2021 01:24:10 - INFO - __main__ - Step 29849: {'lr': 0.0004575780231390371, 'samples': 5731008, 'steps': 29848, 'loss/train': 1.7042051553726196} -11/07/2021 01:24:10 - INFO - __main__ - Step 29850: {'lr': 0.0004575750656506031, 'samples': 5731200, 'steps': 29849, 'loss/train': 1.6827337741851807} -11/07/2021 01:24:11 - INFO - __main__ - Step 29851: {'lr': 0.00045757210806863895, 'samples': 5731392, 'steps': 29850, 'loss/train': 1.5924853086471558} -11/07/2021 01:24:11 - INFO - __main__ - Step 29852: {'lr': 0.0004575691503931461, 'samples': 5731584, 'steps': 29851, 'loss/train': 1.6998484134674072} -11/07/2021 01:24:12 - INFO - __main__ - Step 29853: {'lr': 0.00045756619262412565, 'samples': 5731776, 'steps': 29852, 'loss/train': 1.5841456651687622} -11/07/2021 01:24:12 - INFO - __main__ - Step 29854: {'lr': 0.0004575632347615791, 'samples': 5731968, 'steps': 29853, 'loss/train': 1.5362069606781006} -11/07/2021 01:24:13 - INFO - __main__ - Step 29855: {'lr': 0.0004575602768055078, 'samples': 5732160, 'steps': 29854, 'loss/train': 2.408329963684082} -11/07/2021 01:24:13 - INFO - __main__ - Step 29856: {'lr': 0.00045755731875591303, 'samples': 5732352, 'steps': 29855, 'loss/train': 1.5316470861434937} -11/07/2021 01:24:13 - INFO - __main__ - Step 29857: {'lr': 0.0004575543606127961, 'samples': 5732544, 'steps': 29856, 'loss/train': 1.3378548622131348} -11/07/2021 01:24:14 - INFO - __main__ - Step 29858: {'lr': 0.0004575514023761585, 'samples': 5732736, 'steps': 29857, 'loss/train': 1.5171469449996948} -11/07/2021 01:24:15 - INFO - __main__ - Step 29859: {'lr': 0.00045754844404600136, 'samples': 5732928, 'steps': 29858, 'loss/train': 1.53959059715271} -11/07/2021 01:24:15 - INFO - __main__ - Step 29860: {'lr': 0.00045754548562232605, 'samples': 5733120, 'steps': 29859, 'loss/train': 1.0466532707214355} -11/07/2021 01:24:16 - INFO - __main__ - Step 29861: {'lr': 0.00045754252710513397, 'samples': 5733312, 'steps': 29860, 'loss/train': 1.539314866065979} -11/07/2021 01:24:16 - INFO - __main__ - Step 29862: {'lr': 0.00045753956849442647, 'samples': 5733504, 'steps': 29861, 'loss/train': 1.9545060396194458} -11/07/2021 01:24:17 - INFO - __main__ - Step 29863: {'lr': 0.00045753660979020485, 'samples': 5733696, 'steps': 29862, 'loss/train': 1.7656947374343872} -11/07/2021 01:24:17 - INFO - __main__ - Step 29864: {'lr': 0.0004575336509924704, 'samples': 5733888, 'steps': 29863, 'loss/train': 1.5456066131591797} -11/07/2021 01:24:18 - INFO - __main__ - Step 29865: {'lr': 0.0004575306921012245, 'samples': 5734080, 'steps': 29864, 'loss/train': 1.8647871017456055} -11/07/2021 01:24:18 - INFO - __main__ - Step 29866: {'lr': 0.00045752773311646846, 'samples': 5734272, 'steps': 29865, 'loss/train': 1.4891483783721924} -11/07/2021 01:24:18 - INFO - __main__ - Step 29867: {'lr': 0.0004575247740382037, 'samples': 5734464, 'steps': 29866, 'loss/train': 1.5018141269683838} -11/07/2021 01:24:20 - INFO - __main__ - Step 29868: {'lr': 0.0004575218148664314, 'samples': 5734656, 'steps': 29867, 'loss/train': 1.6410999298095703} -11/07/2021 01:24:20 - INFO - __main__ - Step 29869: {'lr': 0.00045751885560115294, 'samples': 5734848, 'steps': 29868, 'loss/train': 1.5205363035202026} -11/07/2021 01:24:20 - INFO - __main__ - Step 29870: {'lr': 0.0004575158962423698, 'samples': 5735040, 'steps': 29869, 'loss/train': 1.8936104774475098} -11/07/2021 01:24:21 - INFO - __main__ - Step 29871: {'lr': 0.0004575129367900831, 'samples': 5735232, 'steps': 29870, 'loss/train': 1.8289682865142822} -11/07/2021 01:24:21 - INFO - __main__ - Step 29872: {'lr': 0.0004575099772442943, 'samples': 5735424, 'steps': 29871, 'loss/train': 1.6737574338912964} -11/07/2021 01:24:21 - INFO - __main__ - Step 29873: {'lr': 0.0004575070176050047, 'samples': 5735616, 'steps': 29872, 'loss/train': 1.4331068992614746} -11/07/2021 01:24:22 - INFO - __main__ - Step 29874: {'lr': 0.00045750405787221566, 'samples': 5735808, 'steps': 29873, 'loss/train': 1.4061284065246582} -11/07/2021 01:24:23 - INFO - __main__ - Step 29875: {'lr': 0.0004575010980459285, 'samples': 5736000, 'steps': 29874, 'loss/train': 1.251508355140686} -11/07/2021 01:24:23 - INFO - __main__ - Step 29876: {'lr': 0.0004574981381261445, 'samples': 5736192, 'steps': 29875, 'loss/train': 1.3016911745071411} -11/07/2021 01:24:23 - INFO - __main__ - Step 29877: {'lr': 0.0004574951781128651, 'samples': 5736384, 'steps': 29876, 'loss/train': 1.335336446762085} -11/07/2021 01:24:24 - INFO - __main__ - Step 29878: {'lr': 0.0004574922180060915, 'samples': 5736576, 'steps': 29877, 'loss/train': 1.3123310804367065} -11/07/2021 01:24:25 - INFO - __main__ - Step 29879: {'lr': 0.0004574892578058252, 'samples': 5736768, 'steps': 29878, 'loss/train': 0.9599051475524902} -11/07/2021 01:24:25 - INFO - __main__ - Step 29880: {'lr': 0.0004574862975120674, 'samples': 5736960, 'steps': 29879, 'loss/train': 1.6392614841461182} -11/07/2021 01:24:25 - INFO - __main__ - Step 29881: {'lr': 0.0004574833371248195, 'samples': 5737152, 'steps': 29880, 'loss/train': 1.8147220611572266} -11/07/2021 01:24:26 - INFO - __main__ - Step 29882: {'lr': 0.00045748037664408275, 'samples': 5737344, 'steps': 29881, 'loss/train': 1.6705900430679321} -11/07/2021 01:24:26 - INFO - __main__ - Step 29883: {'lr': 0.0004574774160698586, 'samples': 5737536, 'steps': 29882, 'loss/train': 1.6094480752944946} -11/07/2021 01:24:27 - INFO - __main__ - Step 29884: {'lr': 0.00045747445540214826, 'samples': 5737728, 'steps': 29883, 'loss/train': 1.6537147760391235} -11/07/2021 01:24:28 - INFO - __main__ - Step 29885: {'lr': 0.00045747149464095324, 'samples': 5737920, 'steps': 29884, 'loss/train': 1.493760347366333} -11/07/2021 01:24:28 - INFO - __main__ - Step 29886: {'lr': 0.00045746853378627467, 'samples': 5738112, 'steps': 29885, 'loss/train': 1.9688208103179932} -11/07/2021 01:24:28 - INFO - __main__ - Step 29887: {'lr': 0.000457465572838114, 'samples': 5738304, 'steps': 29886, 'loss/train': 0.6421449184417725} -11/07/2021 01:24:29 - INFO - __main__ - Step 29888: {'lr': 0.0004574626117964726, 'samples': 5738496, 'steps': 29887, 'loss/train': 2.212495803833008} -11/07/2021 01:24:30 - INFO - __main__ - Step 29889: {'lr': 0.00045745965066135163, 'samples': 5738688, 'steps': 29888, 'loss/train': 0.825211763381958} -11/07/2021 01:24:30 - INFO - __main__ - Step 29890: {'lr': 0.00045745668943275266, 'samples': 5738880, 'steps': 29889, 'loss/train': 1.9920496940612793} -11/07/2021 01:24:30 - INFO - __main__ - Step 29891: {'lr': 0.00045745372811067687, 'samples': 5739072, 'steps': 29890, 'loss/train': 1.0584920644760132} -11/07/2021 01:24:31 - INFO - __main__ - Step 29892: {'lr': 0.00045745076669512566, 'samples': 5739264, 'steps': 29891, 'loss/train': 1.6357108354568481} -11/07/2021 01:24:31 - INFO - __main__ - Step 29893: {'lr': 0.0004574478051861003, 'samples': 5739456, 'steps': 29892, 'loss/train': 1.5066235065460205} -11/07/2021 01:24:32 - INFO - __main__ - Step 29894: {'lr': 0.00045744484358360216, 'samples': 5739648, 'steps': 29893, 'loss/train': 1.6722524166107178} -11/07/2021 01:24:33 - INFO - __main__ - Step 29895: {'lr': 0.0004574418818876326, 'samples': 5739840, 'steps': 29894, 'loss/train': 1.4991633892059326} -11/07/2021 01:24:33 - INFO - __main__ - Step 29896: {'lr': 0.0004574389200981929, 'samples': 5740032, 'steps': 29895, 'loss/train': 1.4193624258041382} -11/07/2021 01:24:33 - INFO - __main__ - Step 29897: {'lr': 0.00045743595821528437, 'samples': 5740224, 'steps': 29896, 'loss/train': 1.590252161026001} -11/07/2021 01:24:34 - INFO - __main__ - Step 29898: {'lr': 0.0004574329962389085, 'samples': 5740416, 'steps': 29897, 'loss/train': 1.6737258434295654} -11/07/2021 01:24:34 - INFO - __main__ - Step 29899: {'lr': 0.0004574300341690665, 'samples': 5740608, 'steps': 29898, 'loss/train': 1.7634446620941162} -11/07/2021 01:24:35 - INFO - __main__ - Step 29900: {'lr': 0.00045742707200575975, 'samples': 5740800, 'steps': 29899, 'loss/train': 1.6548808813095093} -11/07/2021 01:24:35 - INFO - __main__ - Step 29901: {'lr': 0.00045742410974898947, 'samples': 5740992, 'steps': 29900, 'loss/train': 1.6476119756698608} -11/07/2021 01:24:36 - INFO - __main__ - Step 29902: {'lr': 0.0004574211473987571, 'samples': 5741184, 'steps': 29901, 'loss/train': 1.7704423666000366} -11/07/2021 01:24:36 - INFO - __main__ - Step 29903: {'lr': 0.00045741818495506403, 'samples': 5741376, 'steps': 29902, 'loss/train': 1.6585086584091187} -11/07/2021 01:24:36 - INFO - __main__ - Step 29904: {'lr': 0.0004574152224179115, 'samples': 5741568, 'steps': 29903, 'loss/train': 1.849440097808838} -11/07/2021 01:24:37 - INFO - __main__ - Step 29905: {'lr': 0.0004574122597873008, 'samples': 5741760, 'steps': 29904, 'loss/train': 1.5148991346359253} -11/07/2021 01:24:38 - INFO - __main__ - Step 29906: {'lr': 0.0004574092970632335, 'samples': 5741952, 'steps': 29905, 'loss/train': 1.5750218629837036} -11/07/2021 01:24:38 - INFO - __main__ - Step 29907: {'lr': 0.00045740633424571064, 'samples': 5742144, 'steps': 29906, 'loss/train': 1.9244686365127563} -11/07/2021 01:24:39 - INFO - __main__ - Step 29908: {'lr': 0.00045740337133473374, 'samples': 5742336, 'steps': 29907, 'loss/train': 1.775071620941162} -11/07/2021 01:24:39 - INFO - __main__ - Step 29909: {'lr': 0.00045740040833030404, 'samples': 5742528, 'steps': 29908, 'loss/train': 1.9028395414352417} -11/07/2021 01:24:40 - INFO - __main__ - Step 29910: {'lr': 0.00045739744523242294, 'samples': 5742720, 'steps': 29909, 'loss/train': 1.3661624193191528} -11/07/2021 01:24:40 - INFO - __main__ - Step 29911: {'lr': 0.0004573944820410918, 'samples': 5742912, 'steps': 29910, 'loss/train': 1.7625046968460083} -11/07/2021 01:24:41 - INFO - __main__ - Step 29912: {'lr': 0.0004573915187563118, 'samples': 5743104, 'steps': 29911, 'loss/train': 1.7702594995498657} -11/07/2021 01:24:41 - INFO - __main__ - Step 29913: {'lr': 0.00045738855537808443, 'samples': 5743296, 'steps': 29912, 'loss/train': 1.0329153537750244} -11/07/2021 01:24:41 - INFO - __main__ - Step 29914: {'lr': 0.000457385591906411, 'samples': 5743488, 'steps': 29913, 'loss/train': 1.6367841958999634} -11/07/2021 01:24:42 - INFO - __main__ - Step 29915: {'lr': 0.00045738262834129283, 'samples': 5743680, 'steps': 29914, 'loss/train': 1.5828520059585571} -11/07/2021 01:24:43 - INFO - __main__ - Step 29916: {'lr': 0.0004573796646827312, 'samples': 5743872, 'steps': 29915, 'loss/train': 1.8843293190002441} -11/07/2021 01:24:43 - INFO - __main__ - Step 29917: {'lr': 0.0004573767009307276, 'samples': 5744064, 'steps': 29916, 'loss/train': 1.4333949089050293} -11/07/2021 01:24:44 - INFO - __main__ - Step 29918: {'lr': 0.0004573737370852831, 'samples': 5744256, 'steps': 29917, 'loss/train': 1.7710152864456177} -11/07/2021 01:24:44 - INFO - __main__ - Step 29919: {'lr': 0.0004573707731463993, 'samples': 5744448, 'steps': 29918, 'loss/train': 1.1830955743789673} -11/07/2021 01:24:45 - INFO - __main__ - Step 29920: {'lr': 0.00045736780911407736, 'samples': 5744640, 'steps': 29919, 'loss/train': 1.6793465614318848} -11/07/2021 01:24:45 - INFO - __main__ - Step 29921: {'lr': 0.00045736484498831877, 'samples': 5744832, 'steps': 29920, 'loss/train': 1.932478427886963} -11/07/2021 01:24:46 - INFO - __main__ - Step 29922: {'lr': 0.0004573618807691248, 'samples': 5745024, 'steps': 29921, 'loss/train': 1.56174635887146} -11/07/2021 01:24:46 - INFO - __main__ - Step 29923: {'lr': 0.0004573589164564966, 'samples': 5745216, 'steps': 29922, 'loss/train': 1.684158205986023} -11/07/2021 01:24:46 - INFO - __main__ - Step 29924: {'lr': 0.00045735595205043583, 'samples': 5745408, 'steps': 29923, 'loss/train': 1.9968838691711426} -11/07/2021 01:24:47 - INFO - __main__ - Step 29925: {'lr': 0.00045735298755094364, 'samples': 5745600, 'steps': 29924, 'loss/train': 1.8304612636566162} -11/07/2021 01:24:48 - INFO - __main__ - Step 29926: {'lr': 0.00045735002295802137, 'samples': 5745792, 'steps': 29925, 'loss/train': 1.8053874969482422} -11/07/2021 01:24:48 - INFO - __main__ - Step 29927: {'lr': 0.00045734705827167035, 'samples': 5745984, 'steps': 29926, 'loss/train': 1.7693537473678589} -11/07/2021 01:24:48 - INFO - __main__ - Step 29928: {'lr': 0.000457344093491892, 'samples': 5746176, 'steps': 29927, 'loss/train': 1.6845461130142212} -11/07/2021 01:24:49 - INFO - __main__ - Step 29929: {'lr': 0.00045734112861868753, 'samples': 5746368, 'steps': 29928, 'loss/train': 0.90385502576828} -11/07/2021 01:24:49 - INFO - __main__ - Step 29930: {'lr': 0.0004573381636520584, 'samples': 5746560, 'steps': 29929, 'loss/train': 1.354880690574646} -11/07/2021 01:24:50 - INFO - __main__ - Step 29931: {'lr': 0.0004573351985920059, 'samples': 5746752, 'steps': 29930, 'loss/train': 1.7663991451263428} -11/07/2021 01:24:51 - INFO - __main__ - Step 29932: {'lr': 0.0004573322334385314, 'samples': 5746944, 'steps': 29931, 'loss/train': 0.8987229466438293} -11/07/2021 01:24:51 - INFO - __main__ - Step 29933: {'lr': 0.0004573292681916361, 'samples': 5747136, 'steps': 29932, 'loss/train': 1.6049652099609375} -11/07/2021 01:24:51 - INFO - __main__ - Step 29934: {'lr': 0.0004573263028513214, 'samples': 5747328, 'steps': 29933, 'loss/train': 1.4241623878479004} -11/07/2021 01:24:52 - INFO - __main__ - Step 29935: {'lr': 0.0004573233374175888, 'samples': 5747520, 'steps': 29934, 'loss/train': 1.8239710330963135} -11/07/2021 01:24:53 - INFO - __main__ - Step 29936: {'lr': 0.0004573203718904394, 'samples': 5747712, 'steps': 29935, 'loss/train': 1.6157418489456177} -11/07/2021 01:24:53 - INFO - __main__ - Step 29937: {'lr': 0.00045731740626987473, 'samples': 5747904, 'steps': 29936, 'loss/train': 1.3402079343795776} -11/07/2021 01:24:53 - INFO - __main__ - Step 29938: {'lr': 0.00045731444055589597, 'samples': 5748096, 'steps': 29937, 'loss/train': 1.3002804517745972} -11/07/2021 01:24:54 - INFO - __main__ - Step 29939: {'lr': 0.0004573114747485045, 'samples': 5748288, 'steps': 29938, 'loss/train': 1.498435139656067} -11/07/2021 01:24:54 - INFO - __main__ - Step 29940: {'lr': 0.0004573085088477017, 'samples': 5748480, 'steps': 29939, 'loss/train': 1.1412640810012817} -11/07/2021 01:24:55 - INFO - __main__ - Step 29941: {'lr': 0.0004573055428534889, 'samples': 5748672, 'steps': 29940, 'loss/train': 1.5386608839035034} -11/07/2021 01:24:56 - INFO - __main__ - Step 29942: {'lr': 0.00045730257676586747, 'samples': 5748864, 'steps': 29941, 'loss/train': 0.6990121603012085} -11/07/2021 01:24:56 - INFO - __main__ - Step 29943: {'lr': 0.0004572996105848386, 'samples': 5749056, 'steps': 29942, 'loss/train': 1.4737290143966675} -11/07/2021 01:24:56 - INFO - __main__ - Step 29944: {'lr': 0.0004572966443104038, 'samples': 5749248, 'steps': 29943, 'loss/train': 1.4378646612167358} -11/07/2021 01:24:57 - INFO - __main__ - Step 29945: {'lr': 0.00045729367794256434, 'samples': 5749440, 'steps': 29944, 'loss/train': 1.599612832069397} -11/07/2021 01:24:58 - INFO - __main__ - Step 29946: {'lr': 0.0004572907114813215, 'samples': 5749632, 'steps': 29945, 'loss/train': 1.34317946434021} -11/07/2021 01:24:58 - INFO - __main__ - Step 29947: {'lr': 0.0004572877449266767, 'samples': 5749824, 'steps': 29946, 'loss/train': 1.4258098602294922} -11/07/2021 01:24:58 - INFO - __main__ - Step 29948: {'lr': 0.0004572847782786312, 'samples': 5750016, 'steps': 29947, 'loss/train': 1.0848888158798218} -11/07/2021 01:24:59 - INFO - __main__ - Step 29949: {'lr': 0.0004572818115371864, 'samples': 5750208, 'steps': 29948, 'loss/train': 1.4937506914138794} -11/07/2021 01:24:59 - INFO - __main__ - Step 29950: {'lr': 0.0004572788447023436, 'samples': 5750400, 'steps': 29949, 'loss/train': 1.7091032266616821} -11/07/2021 01:25:00 - INFO - __main__ - Step 29951: {'lr': 0.00045727587777410415, 'samples': 5750592, 'steps': 29950, 'loss/train': 1.3422096967697144} -11/07/2021 01:25:00 - INFO - __main__ - Step 29952: {'lr': 0.00045727291075246937, 'samples': 5750784, 'steps': 29951, 'loss/train': 1.6312906742095947} -11/07/2021 01:25:01 - INFO - __main__ - Step 29953: {'lr': 0.0004572699436374407, 'samples': 5750976, 'steps': 29952, 'loss/train': 1.4829158782958984} -11/07/2021 01:25:01 - INFO - __main__ - Step 29954: {'lr': 0.00045726697642901925, 'samples': 5751168, 'steps': 29953, 'loss/train': 1.410493016242981} -11/07/2021 01:25:01 - INFO - __main__ - Step 29955: {'lr': 0.0004572640091272066, 'samples': 5751360, 'steps': 29954, 'loss/train': 1.5101686716079712} -11/07/2021 01:25:02 - INFO - __main__ - Step 29956: {'lr': 0.000457261041732004, 'samples': 5751552, 'steps': 29955, 'loss/train': 1.3401647806167603} -11/07/2021 01:25:03 - INFO - __main__ - Step 29957: {'lr': 0.0004572580742434127, 'samples': 5751744, 'steps': 29956, 'loss/train': 1.9295035600662231} -11/07/2021 01:25:03 - INFO - __main__ - Step 29958: {'lr': 0.00045725510666143424, 'samples': 5751936, 'steps': 29957, 'loss/train': 1.5255932807922363} -11/07/2021 01:25:03 - INFO - __main__ - Step 29959: {'lr': 0.0004572521389860697, 'samples': 5752128, 'steps': 29958, 'loss/train': 1.4836983680725098} -11/07/2021 01:25:04 - INFO - __main__ - Step 29960: {'lr': 0.00045724917121732055, 'samples': 5752320, 'steps': 29959, 'loss/train': 1.8313194513320923} -11/07/2021 01:25:04 - INFO - __main__ - Step 29961: {'lr': 0.0004572462033551882, 'samples': 5752512, 'steps': 29960, 'loss/train': 1.5937235355377197} -11/07/2021 01:25:05 - INFO - __main__ - Step 29962: {'lr': 0.00045724323539967385, 'samples': 5752704, 'steps': 29961, 'loss/train': 1.5976606607437134} -11/07/2021 01:25:06 - INFO - __main__ - Step 29963: {'lr': 0.00045724026735077886, 'samples': 5752896, 'steps': 29962, 'loss/train': 1.7151837348937988} -11/07/2021 01:25:06 - INFO - __main__ - Step 29964: {'lr': 0.00045723729920850464, 'samples': 5753088, 'steps': 29963, 'loss/train': 1.3524528741836548} -11/07/2021 01:25:06 - INFO - __main__ - Step 29965: {'lr': 0.00045723433097285247, 'samples': 5753280, 'steps': 29964, 'loss/train': 1.1049710512161255} -11/07/2021 01:25:07 - INFO - __main__ - Step 29966: {'lr': 0.0004572313626438238, 'samples': 5753472, 'steps': 29965, 'loss/train': 1.2778706550598145} -11/07/2021 01:25:08 - INFO - __main__ - Step 29967: {'lr': 0.00045722839422141984, 'samples': 5753664, 'steps': 29966, 'loss/train': 1.5637139081954956} -11/07/2021 01:25:08 - INFO - __main__ - Step 29968: {'lr': 0.000457225425705642, 'samples': 5753856, 'steps': 29967, 'loss/train': 1.3151350021362305} -11/07/2021 01:25:08 - INFO - __main__ - Step 29969: {'lr': 0.0004572224570964915, 'samples': 5754048, 'steps': 29968, 'loss/train': 1.915236473083496} -11/07/2021 01:25:09 - INFO - __main__ - Step 29970: {'lr': 0.0004572194883939697, 'samples': 5754240, 'steps': 29969, 'loss/train': 1.596436619758606} -11/07/2021 01:25:09 - INFO - __main__ - Step 29971: {'lr': 0.0004572165195980781, 'samples': 5754432, 'steps': 29970, 'loss/train': 1.238713026046753} -11/07/2021 01:25:10 - INFO - __main__ - Step 29972: {'lr': 0.0004572135507088179, 'samples': 5754624, 'steps': 29971, 'loss/train': 1.2251867055892944} -11/07/2021 01:25:11 - INFO - __main__ - Step 29973: {'lr': 0.00045721058172619043, 'samples': 5754816, 'steps': 29972, 'loss/train': 1.2458912134170532} -11/07/2021 01:25:11 - INFO - __main__ - Step 29974: {'lr': 0.0004572076126501972, 'samples': 5755008, 'steps': 29973, 'loss/train': 1.693926215171814} -11/07/2021 01:25:11 - INFO - __main__ - Step 29975: {'lr': 0.00045720464348083937, 'samples': 5755200, 'steps': 29974, 'loss/train': 1.7528555393218994} -11/07/2021 01:25:12 - INFO - __main__ - Step 29976: {'lr': 0.0004572016742181182, 'samples': 5755392, 'steps': 29975, 'loss/train': 1.8526099920272827} -11/07/2021 01:25:12 - INFO - __main__ - Step 29977: {'lr': 0.0004571987048620353, 'samples': 5755584, 'steps': 29976, 'loss/train': 1.5356825590133667} -11/07/2021 01:25:13 - INFO - __main__ - Step 29978: {'lr': 0.0004571957354125918, 'samples': 5755776, 'steps': 29977, 'loss/train': 1.5769151449203491} -11/07/2021 01:25:14 - INFO - __main__ - Step 29979: {'lr': 0.00045719276586978907, 'samples': 5755968, 'steps': 29978, 'loss/train': 1.5161664485931396} -11/07/2021 01:25:14 - INFO - __main__ - Step 29980: {'lr': 0.00045718979623362855, 'samples': 5756160, 'steps': 29979, 'loss/train': 1.3842449188232422} -11/07/2021 01:25:14 - INFO - __main__ - Step 29981: {'lr': 0.00045718682650411146, 'samples': 5756352, 'steps': 29980, 'loss/train': 1.6693494319915771} -11/07/2021 01:25:15 - INFO - __main__ - Step 29982: {'lr': 0.0004571838566812392, 'samples': 5756544, 'steps': 29981, 'loss/train': 1.5294941663742065} -11/07/2021 01:25:16 - INFO - __main__ - Step 29983: {'lr': 0.00045718088676501305, 'samples': 5756736, 'steps': 29982, 'loss/train': 1.6696785688400269} -11/07/2021 01:25:16 - INFO - __main__ - Step 29984: {'lr': 0.0004571779167554344, 'samples': 5756928, 'steps': 29983, 'loss/train': 1.5812838077545166} -11/07/2021 01:25:16 - INFO - __main__ - Step 29985: {'lr': 0.0004571749466525046, 'samples': 5757120, 'steps': 29984, 'loss/train': 1.3214921951293945} -11/07/2021 01:25:17 - INFO - __main__ - Step 29986: {'lr': 0.000457171976456225, 'samples': 5757312, 'steps': 29985, 'loss/train': 1.646202802658081} -11/07/2021 01:25:17 - INFO - __main__ - Step 29987: {'lr': 0.00045716900616659686, 'samples': 5757504, 'steps': 29986, 'loss/train': 2.17270565032959} -11/07/2021 01:25:18 - INFO - __main__ - Step 29988: {'lr': 0.00045716603578362157, 'samples': 5757696, 'steps': 29987, 'loss/train': 1.8010432720184326} -11/07/2021 01:25:19 - INFO - __main__ - Step 29989: {'lr': 0.00045716306530730043, 'samples': 5757888, 'steps': 29988, 'loss/train': 1.2930711507797241} -11/07/2021 01:25:19 - INFO - __main__ - Step 29990: {'lr': 0.00045716009473763486, 'samples': 5758080, 'steps': 29989, 'loss/train': 1.630855679512024} -11/07/2021 01:25:19 - INFO - __main__ - Step 29991: {'lr': 0.0004571571240746262, 'samples': 5758272, 'steps': 29990, 'loss/train': 1.8557555675506592} -11/07/2021 01:25:20 - INFO - __main__ - Step 29992: {'lr': 0.00045715415331827564, 'samples': 5758464, 'steps': 29991, 'loss/train': 1.6086505651474} -11/07/2021 01:25:20 - INFO - __main__ - Step 29993: {'lr': 0.00045715118246858466, 'samples': 5758656, 'steps': 29992, 'loss/train': 1.5766459703445435} -11/07/2021 01:25:21 - INFO - __main__ - Step 29994: {'lr': 0.0004571482115255545, 'samples': 5758848, 'steps': 29993, 'loss/train': 1.404898762702942} -11/07/2021 01:25:21 - INFO - __main__ - Step 29995: {'lr': 0.0004571452404891866, 'samples': 5759040, 'steps': 29994, 'loss/train': 1.7848975658416748} -11/07/2021 01:25:22 - INFO - __main__ - Step 29996: {'lr': 0.0004571422693594822, 'samples': 5759232, 'steps': 29995, 'loss/train': 1.7715831995010376} -11/07/2021 01:25:22 - INFO - __main__ - Step 29997: {'lr': 0.00045713929813644274, 'samples': 5759424, 'steps': 29996, 'loss/train': 1.537301778793335} -11/07/2021 01:25:22 - INFO - __main__ - Step 29998: {'lr': 0.0004571363268200695, 'samples': 5759616, 'steps': 29997, 'loss/train': 1.6564396619796753} -11/07/2021 01:25:23 - INFO - __main__ - Step 29999: {'lr': 0.0004571333554103638, 'samples': 5759808, 'steps': 29998, 'loss/train': 1.6401314735412598} -11/07/2021 01:25:24 - INFO - __main__ - Step 30000: {'lr': 0.0004571303839073271, 'samples': 5760000, 'steps': 29999, 'loss/train': 1.3726354837417603} -11/07/2021 01:25:24 - INFO - __main__ - Evaluating and saving model checkpoint -11/07/2021 01:28:38 - INFO - __main__ - Step 30000: {'loss/eval': 1.5031383037567139, 'perplexity': 4.495776176452637} -11/07/2021 01:28:49 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20211106_211610-dtkf2u0m/logs/debug-internal.log']. This may take a bit of time if the files are large. -11/07/2021 01:28:53 - WARNING - huggingface_hub.repository - Several commits (2) will be pushed upstream. -11/07/2021 01:28:53 - WARNING - huggingface_hub.repository - The progress bars may be unreliable. -11/07/2021 01:29:19 - WARNING - huggingface_hub.repository - To https://huggingface.co/lvwerra/codeparrot-small - acc8d6f..d425b2d proud-haze-135 -> proud-haze-135 - -11/07/2021 01:29:21 - INFO - __main__ - Step 30001: {'lr': 0.00045712741231096054, 'samples': 5760192, 'steps': 30000, 'loss/train': 1.1647251844406128} -11/07/2021 01:29:21 - INFO - __main__ - Step 30002: {'lr': 0.0004571244406212656, 'samples': 5760384, 'steps': 30001, 'loss/train': 1.471921682357788} -11/07/2021 01:29:22 - INFO - __main__ - Step 30003: {'lr': 0.00045712146883824357, 'samples': 5760576, 'steps': 30002, 'loss/train': 1.4950001239776611} -11/07/2021 01:29:22 - INFO - __main__ - Step 30004: {'lr': 0.00045711849696189585, 'samples': 5760768, 'steps': 30003, 'loss/train': 1.5751121044158936} -11/07/2021 01:29:23 - INFO - __main__ - Step 30005: {'lr': 0.0004571155249922237, 'samples': 5760960, 'steps': 30004, 'loss/train': 0.9164716601371765} -11/07/2021 01:29:24 - INFO - __main__ - Step 30006: {'lr': 0.00045711255292922847, 'samples': 5761152, 'steps': 30005, 'loss/train': 1.8894248008728027} -11/07/2021 01:29:24 - INFO - __main__ - Step 30007: {'lr': 0.00045710958077291156, 'samples': 5761344, 'steps': 30006, 'loss/train': 1.6442089080810547} -11/07/2021 01:29:24 - INFO - __main__ - Step 30008: {'lr': 0.00045710660852327423, 'samples': 5761536, 'steps': 30007, 'loss/train': 1.578920841217041} -11/07/2021 01:29:25 - INFO - __main__ - Step 30009: {'lr': 0.00045710363618031783, 'samples': 5761728, 'steps': 30008, 'loss/train': 1.5235463380813599} -11/07/2021 01:29:26 - INFO - __main__ - Step 30010: {'lr': 0.0004571006637440438, 'samples': 5761920, 'steps': 30009, 'loss/train': 1.534705400466919} -11/07/2021 01:29:26 - INFO - __main__ - Step 30011: {'lr': 0.00045709769121445335, 'samples': 5762112, 'steps': 30010, 'loss/train': 1.927817463874817} -11/07/2021 01:29:26 - INFO - __main__ - Step 30012: {'lr': 0.00045709471859154793, 'samples': 5762304, 'steps': 30011, 'loss/train': 1.541087031364441} -11/07/2021 01:29:27 - INFO - __main__ - Step 30013: {'lr': 0.0004570917458753288, 'samples': 5762496, 'steps': 30012, 'loss/train': 0.8787887692451477} -11/07/2021 01:29:27 - INFO - __main__ - Step 30014: {'lr': 0.00045708877306579733, 'samples': 5762688, 'steps': 30013, 'loss/train': 1.8259247541427612} -11/07/2021 01:29:28 - INFO - __main__ - Step 30015: {'lr': 0.00045708580016295486, 'samples': 5762880, 'steps': 30014, 'loss/train': 5.611205101013184} -11/07/2021 01:29:28 - INFO - __main__ - Step 30016: {'lr': 0.0004570828271668027, 'samples': 5763072, 'steps': 30015, 'loss/train': 1.2683762311935425} -11/07/2021 01:29:29 - INFO - __main__ - Step 30017: {'lr': 0.0004570798540773422, 'samples': 5763264, 'steps': 30016, 'loss/train': 1.17982816696167} -11/07/2021 01:29:29 - INFO - __main__ - Step 30018: {'lr': 0.0004570768808945748, 'samples': 5763456, 'steps': 30017, 'loss/train': 2.3335750102996826} -11/07/2021 01:29:30 - INFO - __main__ - Step 30019: {'lr': 0.00045707390761850163, 'samples': 5763648, 'steps': 30018, 'loss/train': 1.6228090524673462} -11/07/2021 01:29:30 - INFO - __main__ - Step 30020: {'lr': 0.00045707093424912426, 'samples': 5763840, 'steps': 30019, 'loss/train': 1.74102783203125} -11/07/2021 01:29:31 - INFO - __main__ - Step 30021: {'lr': 0.00045706796078644386, 'samples': 5764032, 'steps': 30020, 'loss/train': 1.6227269172668457} -11/07/2021 01:29:32 - INFO - __main__ - Step 30022: {'lr': 0.00045706498723046185, 'samples': 5764224, 'steps': 30021, 'loss/train': 1.0815889835357666} -11/07/2021 01:29:32 - INFO - __main__ - Step 30023: {'lr': 0.0004570620135811795, 'samples': 5764416, 'steps': 30022, 'loss/train': 1.4398486614227295} -11/07/2021 01:29:32 - INFO - __main__ - Step 30024: {'lr': 0.0004570590398385983, 'samples': 5764608, 'steps': 30023, 'loss/train': 1.8302394151687622} -11/07/2021 01:29:33 - INFO - __main__ - Step 30025: {'lr': 0.0004570560660027194, 'samples': 5764800, 'steps': 30024, 'loss/train': 1.3542307615280151} -11/07/2021 01:29:34 - INFO - __main__ - Step 30026: {'lr': 0.00045705309207354433, 'samples': 5764992, 'steps': 30025, 'loss/train': 1.7640297412872314} -11/07/2021 01:29:34 - INFO - __main__ - Step 30027: {'lr': 0.00045705011805107426, 'samples': 5765184, 'steps': 30026, 'loss/train': 1.3665052652359009} -11/07/2021 01:29:35 - INFO - __main__ - Step 30028: {'lr': 0.00045704714393531064, 'samples': 5765376, 'steps': 30027, 'loss/train': 1.857277750968933} -11/07/2021 01:29:35 - INFO - __main__ - Step 30029: {'lr': 0.00045704416972625474, 'samples': 5765568, 'steps': 30028, 'loss/train': 1.743507981300354} -11/07/2021 01:29:35 - INFO - __main__ - Step 30030: {'lr': 0.000457041195423908, 'samples': 5765760, 'steps': 30029, 'loss/train': 0.26046043634414673} -11/07/2021 01:29:36 - INFO - __main__ - Step 30031: {'lr': 0.0004570382210282716, 'samples': 5765952, 'steps': 30030, 'loss/train': 1.2793536186218262} -11/07/2021 01:29:37 - INFO - __main__ - Step 30032: {'lr': 0.00045703524653934705, 'samples': 5766144, 'steps': 30031, 'loss/train': 1.660413384437561} -11/07/2021 01:29:37 - INFO - __main__ - Step 30033: {'lr': 0.0004570322719571355, 'samples': 5766336, 'steps': 30032, 'loss/train': 1.4386049509048462} -11/07/2021 01:29:37 - INFO - __main__ - Step 30034: {'lr': 0.00045702929728163845, 'samples': 5766528, 'steps': 30033, 'loss/train': 1.5465935468673706} -11/07/2021 01:29:38 - INFO - __main__ - Step 30035: {'lr': 0.00045702632251285727, 'samples': 5766720, 'steps': 30034, 'loss/train': 1.477612853050232} -11/07/2021 01:29:39 - INFO - __main__ - Step 30036: {'lr': 0.0004570233476507931, 'samples': 5766912, 'steps': 30035, 'loss/train': 1.1126904487609863} -11/07/2021 01:29:39 - INFO - __main__ - Step 30037: {'lr': 0.0004570203726954475, 'samples': 5767104, 'steps': 30036, 'loss/train': 1.389814853668213} -11/07/2021 01:29:40 - INFO - __main__ - Step 30038: {'lr': 0.0004570173976468217, 'samples': 5767296, 'steps': 30037, 'loss/train': 1.1946580410003662} -11/07/2021 01:29:40 - INFO - __main__ - Step 30039: {'lr': 0.0004570144225049171, 'samples': 5767488, 'steps': 30038, 'loss/train': 1.7716975212097168} -11/07/2021 01:29:40 - INFO - __main__ - Step 30040: {'lr': 0.00045701144726973487, 'samples': 5767680, 'steps': 30039, 'loss/train': 1.5792721509933472} -11/07/2021 01:29:41 - INFO - __main__ - Step 30041: {'lr': 0.0004570084719412766, 'samples': 5767872, 'steps': 30040, 'loss/train': 1.5281107425689697} -11/07/2021 01:29:42 - INFO - __main__ - Step 30042: {'lr': 0.00045700549651954344, 'samples': 5768064, 'steps': 30041, 'loss/train': 1.7906538248062134} -11/07/2021 01:29:42 - INFO - __main__ - Step 30043: {'lr': 0.0004570025210045368, 'samples': 5768256, 'steps': 30042, 'loss/train': 1.53825044631958} -11/07/2021 01:29:42 - INFO - __main__ - Step 30044: {'lr': 0.00045699954539625803, 'samples': 5768448, 'steps': 30043, 'loss/train': 1.9995921850204468} -11/07/2021 01:29:43 - INFO - __main__ - Step 30045: {'lr': 0.0004569965696947085, 'samples': 5768640, 'steps': 30044, 'loss/train': 1.798302173614502} -11/07/2021 01:29:44 - INFO - __main__ - Step 30046: {'lr': 0.00045699359389988944, 'samples': 5768832, 'steps': 30045, 'loss/train': 1.6981176137924194} -11/07/2021 01:29:44 - INFO - __main__ - Step 30047: {'lr': 0.0004569906180118023, 'samples': 5769024, 'steps': 30046, 'loss/train': 1.1167492866516113} -11/07/2021 01:29:45 - INFO - __main__ - Step 30048: {'lr': 0.0004569876420304484, 'samples': 5769216, 'steps': 30047, 'loss/train': 1.6173962354660034} -11/07/2021 01:29:45 - INFO - __main__ - Step 30049: {'lr': 0.000456984665955829, 'samples': 5769408, 'steps': 30048, 'loss/train': 1.273735523223877} -11/07/2021 01:29:45 - INFO - __main__ - Step 30050: {'lr': 0.00045698168978794553, 'samples': 5769600, 'steps': 30049, 'loss/train': 1.3786624670028687} -11/07/2021 01:29:46 - INFO - __main__ - Step 30051: {'lr': 0.0004569787135267993, 'samples': 5769792, 'steps': 30050, 'loss/train': 0.8889176845550537} -11/07/2021 01:29:47 - INFO - __main__ - Step 30052: {'lr': 0.00045697573717239174, 'samples': 5769984, 'steps': 30051, 'loss/train': 1.804728388786316} -11/07/2021 01:29:47 - INFO - __main__ - Step 30053: {'lr': 0.0004569727607247239, 'samples': 5770176, 'steps': 30052, 'loss/train': 1.58971107006073} -11/07/2021 01:29:47 - INFO - __main__ - Step 30054: {'lr': 0.00045696978418379754, 'samples': 5770368, 'steps': 30053, 'loss/train': 1.5156389474868774} -11/07/2021 01:29:48 - INFO - __main__ - Step 30055: {'lr': 0.0004569668075496137, 'samples': 5770560, 'steps': 30054, 'loss/train': 0.4359086751937866} -11/07/2021 01:29:48 - INFO - __main__ - Step 30056: {'lr': 0.00045696383082217387, 'samples': 5770752, 'steps': 30055, 'loss/train': 1.3137329816818237} -11/07/2021 01:29:49 - INFO - __main__ - Step 30057: {'lr': 0.00045696085400147925, 'samples': 5770944, 'steps': 30056, 'loss/train': 1.8441475629806519} -11/07/2021 01:29:50 - INFO - __main__ - Step 30058: {'lr': 0.00045695787708753126, 'samples': 5771136, 'steps': 30057, 'loss/train': 0.7664819359779358} -11/07/2021 01:29:50 - INFO - __main__ - Step 30059: {'lr': 0.0004569549000803313, 'samples': 5771328, 'steps': 30058, 'loss/train': 1.503903865814209} -11/07/2021 01:29:50 - INFO - __main__ - Step 30060: {'lr': 0.00045695192297988066, 'samples': 5771520, 'steps': 30059, 'loss/train': 1.5076161623001099} -11/07/2021 01:29:51 - INFO - __main__ - Step 30061: {'lr': 0.00045694894578618064, 'samples': 5771712, 'steps': 30060, 'loss/train': 1.1038973331451416} -11/07/2021 01:29:52 - INFO - __main__ - Step 30062: {'lr': 0.00045694596849923263, 'samples': 5771904, 'steps': 30061, 'loss/train': 2.0637073516845703} -11/07/2021 01:29:52 - INFO - __main__ - Step 30063: {'lr': 0.0004569429911190379, 'samples': 5772096, 'steps': 30062, 'loss/train': 1.0061378479003906} -11/07/2021 01:29:52 - INFO - __main__ - Step 30064: {'lr': 0.00045694001364559797, 'samples': 5772288, 'steps': 30063, 'loss/train': 1.5570694208145142} -11/07/2021 01:29:53 - INFO - __main__ - Step 30065: {'lr': 0.00045693703607891403, 'samples': 5772480, 'steps': 30064, 'loss/train': 0.8967161774635315} -11/07/2021 01:29:53 - INFO - __main__ - Step 30066: {'lr': 0.0004569340584189874, 'samples': 5772672, 'steps': 30065, 'loss/train': 1.420305609703064} -11/07/2021 01:29:54 - INFO - __main__ - Step 30067: {'lr': 0.0004569310806658195, 'samples': 5772864, 'steps': 30066, 'loss/train': 0.3159783184528351} -11/07/2021 01:29:55 - INFO - __main__ - Step 30068: {'lr': 0.0004569281028194117, 'samples': 5773056, 'steps': 30067, 'loss/train': 1.5327019691467285} -11/07/2021 01:29:55 - INFO - __main__ - Step 30069: {'lr': 0.0004569251248797652, 'samples': 5773248, 'steps': 30068, 'loss/train': 2.2474756240844727} -11/07/2021 01:29:56 - INFO - __main__ - Step 30070: {'lr': 0.0004569221468468815, 'samples': 5773440, 'steps': 30069, 'loss/train': 2.7942593097686768} -11/07/2021 01:29:56 - INFO - __main__ - Step 30071: {'lr': 0.0004569191687207618, 'samples': 5773632, 'steps': 30070, 'loss/train': 2.573376417160034} -11/07/2021 01:29:56 - INFO - __main__ - Step 30072: {'lr': 0.0004569161905014076, 'samples': 5773824, 'steps': 30071, 'loss/train': 2.012526273727417} -11/07/2021 01:29:57 - INFO - __main__ - Step 30073: {'lr': 0.0004569132121888201, 'samples': 5774016, 'steps': 30072, 'loss/train': 1.594914197921753} -11/07/2021 01:29:58 - INFO - __main__ - Step 30074: {'lr': 0.0004569102337830007, 'samples': 5774208, 'steps': 30073, 'loss/train': 1.4602880477905273} -11/07/2021 01:29:58 - INFO - __main__ - Step 30075: {'lr': 0.00045690725528395077, 'samples': 5774400, 'steps': 30074, 'loss/train': 1.65486741065979} -11/07/2021 01:29:58 - INFO - __main__ - Step 30076: {'lr': 0.0004569042766916717, 'samples': 5774592, 'steps': 30075, 'loss/train': 2.147484540939331} -11/07/2021 01:29:59 - INFO - __main__ - Step 30077: {'lr': 0.0004569012980061646, 'samples': 5774784, 'steps': 30076, 'loss/train': 1.3971514701843262} -11/07/2021 01:30:00 - INFO - __main__ - Step 30078: {'lr': 0.00045689831922743107, 'samples': 5774976, 'steps': 30077, 'loss/train': 1.5956676006317139} -11/07/2021 01:30:00 - INFO - __main__ - Step 30079: {'lr': 0.0004568953403554723, 'samples': 5775168, 'steps': 30078, 'loss/train': 2.0979011058807373} -11/07/2021 01:30:00 - INFO - __main__ - Step 30080: {'lr': 0.0004568923613902897, 'samples': 5775360, 'steps': 30079, 'loss/train': 1.4927865266799927} -11/07/2021 01:30:01 - INFO - __main__ - Step 30081: {'lr': 0.0004568893823318846, 'samples': 5775552, 'steps': 30080, 'loss/train': 1.610865592956543} -11/07/2021 01:30:01 - INFO - __main__ - Step 30082: {'lr': 0.0004568864031802583, 'samples': 5775744, 'steps': 30081, 'loss/train': 1.672869324684143} -11/07/2021 01:30:02 - INFO - __main__ - Step 30083: {'lr': 0.00045688342393541227, 'samples': 5775936, 'steps': 30082, 'loss/train': 1.5688196420669556} -11/07/2021 01:30:03 - INFO - __main__ - Step 30084: {'lr': 0.00045688044459734766, 'samples': 5776128, 'steps': 30083, 'loss/train': 0.9201650023460388} -11/07/2021 01:30:03 - INFO - __main__ - Step 30085: {'lr': 0.000456877465166066, 'samples': 5776320, 'steps': 30084, 'loss/train': 1.4790961742401123} -11/07/2021 01:30:03 - INFO - __main__ - Step 30086: {'lr': 0.0004568744856415685, 'samples': 5776512, 'steps': 30085, 'loss/train': 1.6495736837387085} -11/07/2021 01:30:04 - INFO - __main__ - Step 30087: {'lr': 0.0004568715060238565, 'samples': 5776704, 'steps': 30086, 'loss/train': 1.9113773107528687} -11/07/2021 01:30:05 - INFO - __main__ - Step 30088: {'lr': 0.0004568685263129315, 'samples': 5776896, 'steps': 30087, 'loss/train': 1.5765928030014038} -11/07/2021 01:30:05 - INFO - __main__ - Step 30089: {'lr': 0.00045686554650879464, 'samples': 5777088, 'steps': 30088, 'loss/train': 2.0161173343658447} -11/07/2021 01:30:05 - INFO - __main__ - Step 30090: {'lr': 0.0004568625666114474, 'samples': 5777280, 'steps': 30089, 'loss/train': 1.174398422241211} -11/07/2021 01:30:06 - INFO - __main__ - Step 30091: {'lr': 0.00045685958662089113, 'samples': 5777472, 'steps': 30090, 'loss/train': 2.05692195892334} -11/07/2021 01:30:06 - INFO - __main__ - Step 30092: {'lr': 0.000456856606537127, 'samples': 5777664, 'steps': 30091, 'loss/train': 1.8893474340438843} -11/07/2021 01:30:06 - INFO - __main__ - Step 30093: {'lr': 0.00045685362636015657, 'samples': 5777856, 'steps': 30092, 'loss/train': 1.5812064409255981} -11/07/2021 01:30:07 - INFO - __main__ - Step 30094: {'lr': 0.00045685064608998107, 'samples': 5778048, 'steps': 30093, 'loss/train': 1.4328776597976685} -11/07/2021 01:30:08 - INFO - __main__ - Step 30095: {'lr': 0.00045684766572660185, 'samples': 5778240, 'steps': 30094, 'loss/train': 1.4008127450942993} -11/07/2021 01:30:08 - INFO - __main__ - Step 30096: {'lr': 0.0004568446852700203, 'samples': 5778432, 'steps': 30095, 'loss/train': 1.5155335664749146} -11/07/2021 01:30:08 - INFO - __main__ - Step 30097: {'lr': 0.00045684170472023766, 'samples': 5778624, 'steps': 30096, 'loss/train': 1.069875955581665} -11/07/2021 01:30:09 - INFO - __main__ - Step 30098: {'lr': 0.00045683872407725534, 'samples': 5778816, 'steps': 30097, 'loss/train': 1.413217306137085} -11/07/2021 01:30:10 - INFO - __main__ - Step 30099: {'lr': 0.00045683574334107473, 'samples': 5779008, 'steps': 30098, 'loss/train': 1.6160032749176025} -11/07/2021 01:30:10 - INFO - __main__ - Step 30100: {'lr': 0.00045683276251169713, 'samples': 5779200, 'steps': 30099, 'loss/train': 1.3631938695907593} -11/07/2021 01:30:10 - INFO - __main__ - Step 30101: {'lr': 0.00045682978158912384, 'samples': 5779392, 'steps': 30100, 'loss/train': 1.698129653930664} -11/07/2021 01:30:11 - INFO - __main__ - Step 30102: {'lr': 0.0004568268005733562, 'samples': 5779584, 'steps': 30101, 'loss/train': 1.546492576599121} -11/07/2021 01:30:11 - INFO - __main__ - Step 30103: {'lr': 0.0004568238194643958, 'samples': 5779776, 'steps': 30102, 'loss/train': 2.1197760105133057} -11/07/2021 01:30:12 - INFO - __main__ - Step 30104: {'lr': 0.00045682083826224356, 'samples': 5779968, 'steps': 30103, 'loss/train': 1.2861956357955933} -11/07/2021 01:30:13 - INFO - __main__ - Step 30105: {'lr': 0.00045681785696690113, 'samples': 5780160, 'steps': 30104, 'loss/train': 1.3815172910690308} -11/07/2021 01:30:13 - INFO - __main__ - Step 30106: {'lr': 0.0004568148755783698, 'samples': 5780352, 'steps': 30105, 'loss/train': 1.5989118814468384} -11/07/2021 01:30:13 - INFO - __main__ - Step 30107: {'lr': 0.00045681189409665083, 'samples': 5780544, 'steps': 30106, 'loss/train': 1.6340943574905396} -11/07/2021 01:30:14 - INFO - __main__ - Step 30108: {'lr': 0.00045680891252174557, 'samples': 5780736, 'steps': 30107, 'loss/train': 0.8320098519325256} -11/07/2021 01:30:15 - INFO - __main__ - Step 30109: {'lr': 0.0004568059308536554, 'samples': 5780928, 'steps': 30108, 'loss/train': 2.0117850303649902} -11/07/2021 01:30:15 - INFO - __main__ - Step 30110: {'lr': 0.00045680294909238175, 'samples': 5781120, 'steps': 30109, 'loss/train': 1.3014116287231445} -11/07/2021 01:30:16 - INFO - __main__ - Step 30111: {'lr': 0.00045679996723792585, 'samples': 5781312, 'steps': 30110, 'loss/train': 1.8772363662719727} -11/07/2021 01:30:16 - INFO - __main__ - Step 30112: {'lr': 0.00045679698529028906, 'samples': 5781504, 'steps': 30111, 'loss/train': 1.3997163772583008} -11/07/2021 01:30:16 - INFO - __main__ - Step 30113: {'lr': 0.00045679400324947274, 'samples': 5781696, 'steps': 30112, 'loss/train': 1.5095996856689453} -11/07/2021 01:30:17 - INFO - __main__ - Step 30114: {'lr': 0.00045679102111547825, 'samples': 5781888, 'steps': 30113, 'loss/train': 1.160984754562378} -11/07/2021 01:30:18 - INFO - __main__ - Step 30115: {'lr': 0.00045678803888830687, 'samples': 5782080, 'steps': 30114, 'loss/train': 1.4564838409423828} -11/07/2021 01:30:18 - INFO - __main__ - Step 30116: {'lr': 0.0004567850565679601, 'samples': 5782272, 'steps': 30115, 'loss/train': 1.005316972732544} -11/07/2021 01:30:19 - INFO - __main__ - Step 30117: {'lr': 0.00045678207415443913, 'samples': 5782464, 'steps': 30116, 'loss/train': 1.553978443145752} -11/07/2021 01:30:19 - INFO - __main__ - Step 30118: {'lr': 0.0004567790916477453, 'samples': 5782656, 'steps': 30117, 'loss/train': 1.6825364828109741} -11/07/2021 01:30:19 - INFO - __main__ - Step 30119: {'lr': 0.00045677610904788004, 'samples': 5782848, 'steps': 30118, 'loss/train': 2.8823390007019043} -11/07/2021 01:30:20 - INFO - __main__ - Step 30120: {'lr': 0.00045677312635484466, 'samples': 5783040, 'steps': 30119, 'loss/train': 1.8276495933532715} -11/07/2021 01:30:21 - INFO - __main__ - Step 30121: {'lr': 0.00045677014356864043, 'samples': 5783232, 'steps': 30120, 'loss/train': 1.7994734048843384} -11/07/2021 01:30:21 - INFO - __main__ - Step 30122: {'lr': 0.0004567671606892688, 'samples': 5783424, 'steps': 30121, 'loss/train': 1.3283331394195557} -11/07/2021 01:30:21 - INFO - __main__ - Step 30123: {'lr': 0.00045676417771673116, 'samples': 5783616, 'steps': 30122, 'loss/train': 1.4653687477111816} -11/07/2021 01:30:22 - INFO - __main__ - Step 30124: {'lr': 0.0004567611946510287, 'samples': 5783808, 'steps': 30123, 'loss/train': 1.199395775794983} -11/07/2021 01:30:22 - INFO - __main__ - Step 30125: {'lr': 0.00045675821149216285, 'samples': 5784000, 'steps': 30124, 'loss/train': 1.7691177129745483} -11/07/2021 01:30:24 - INFO - __main__ - Step 30126: {'lr': 0.00045675522824013495, 'samples': 5784192, 'steps': 30125, 'loss/train': 1.8721429109573364} -11/07/2021 01:30:24 - INFO - __main__ - Step 30127: {'lr': 0.00045675224489494633, 'samples': 5784384, 'steps': 30126, 'loss/train': 1.6406543254852295} -11/07/2021 01:30:24 - INFO - __main__ - Step 30128: {'lr': 0.00045674926145659834, 'samples': 5784576, 'steps': 30127, 'loss/train': 2.016087293624878} -11/07/2021 01:30:25 - INFO - __main__ - Step 30129: {'lr': 0.0004567462779250923, 'samples': 5784768, 'steps': 30128, 'loss/train': 1.9647272825241089} -11/07/2021 01:30:25 - INFO - __main__ - Step 30130: {'lr': 0.0004567432943004296, 'samples': 5784960, 'steps': 30129, 'loss/train': 2.230543375015259} -11/07/2021 01:30:26 - INFO - __main__ - Step 30131: {'lr': 0.00045674031058261157, 'samples': 5785152, 'steps': 30130, 'loss/train': 1.6160472631454468} -11/07/2021 01:30:27 - INFO - __main__ - Step 30132: {'lr': 0.0004567373267716395, 'samples': 5785344, 'steps': 30131, 'loss/train': 1.335902452468872} -11/07/2021 01:30:27 - INFO - __main__ - Step 30133: {'lr': 0.0004567343428675148, 'samples': 5785536, 'steps': 30132, 'loss/train': 3.5647571086883545} -11/07/2021 01:30:27 - INFO - __main__ - Step 30134: {'lr': 0.00045673135887023874, 'samples': 5785728, 'steps': 30133, 'loss/train': 1.5163437128067017} -11/07/2021 01:30:28 - INFO - __main__ - Step 30135: {'lr': 0.0004567283747798128, 'samples': 5785920, 'steps': 30134, 'loss/train': 0.4308475852012634} -11/07/2021 01:30:28 - INFO - __main__ - Step 30136: {'lr': 0.0004567253905962383, 'samples': 5786112, 'steps': 30135, 'loss/train': 0.8566787838935852} -11/07/2021 01:30:29 - INFO - __main__ - Step 30137: {'lr': 0.00045672240631951645, 'samples': 5786304, 'steps': 30136, 'loss/train': 2.039283275604248} -11/07/2021 01:30:29 - INFO - __main__ - Step 30138: {'lr': 0.0004567194219496487, 'samples': 5786496, 'steps': 30137, 'loss/train': 2.0596466064453125} -11/07/2021 01:30:30 - INFO - __main__ - Step 30139: {'lr': 0.0004567164374866363, 'samples': 5786688, 'steps': 30138, 'loss/train': 1.325622797012329} -11/07/2021 01:30:30 - INFO - __main__ - Step 30140: {'lr': 0.00045671345293048075, 'samples': 5786880, 'steps': 30139, 'loss/train': 2.0110180377960205} -11/07/2021 01:30:30 - INFO - __main__ - Step 30141: {'lr': 0.00045671046828118324, 'samples': 5787072, 'steps': 30140, 'loss/train': 1.7381306886672974} -11/07/2021 01:30:32 - INFO - __main__ - Step 30142: {'lr': 0.0004567074835387452, 'samples': 5787264, 'steps': 30141, 'loss/train': 1.5954102277755737} -11/07/2021 01:30:32 - INFO - __main__ - Step 30143: {'lr': 0.000456704498703168, 'samples': 5787456, 'steps': 30142, 'loss/train': 1.3785072565078735} -11/07/2021 01:30:32 - INFO - __main__ - Step 30144: {'lr': 0.0004567015137744529, 'samples': 5787648, 'steps': 30143, 'loss/train': 1.4675315618515015} -11/07/2021 01:30:33 - INFO - __main__ - Step 30145: {'lr': 0.00045669852875260134, 'samples': 5787840, 'steps': 30144, 'loss/train': 1.5212641954421997} -11/07/2021 01:30:33 - INFO - __main__ - Step 30146: {'lr': 0.00045669554363761454, 'samples': 5788032, 'steps': 30145, 'loss/train': 1.521730661392212} -11/07/2021 01:30:34 - INFO - __main__ - Step 30147: {'lr': 0.0004566925584294939, 'samples': 5788224, 'steps': 30146, 'loss/train': 1.2389037609100342} -11/07/2021 01:30:34 - INFO - __main__ - Step 30148: {'lr': 0.00045668957312824086, 'samples': 5788416, 'steps': 30147, 'loss/train': 1.8396090269088745} -11/07/2021 01:30:35 - INFO - __main__ - Step 30149: {'lr': 0.00045668658773385663, 'samples': 5788608, 'steps': 30148, 'loss/train': 1.3113459348678589} -11/07/2021 01:30:35 - INFO - __main__ - Step 30150: {'lr': 0.00045668360224634263, 'samples': 5788800, 'steps': 30149, 'loss/train': 1.4173098802566528} -11/07/2021 01:30:36 - INFO - __main__ - Step 30151: {'lr': 0.00045668061666570027, 'samples': 5788992, 'steps': 30150, 'loss/train': 1.859587550163269} -11/07/2021 01:30:36 - INFO - __main__ - Step 30152: {'lr': 0.0004566776309919307, 'samples': 5789184, 'steps': 30151, 'loss/train': 1.4605780839920044} -11/07/2021 01:30:37 - INFO - __main__ - Step 30153: {'lr': 0.0004566746452250354, 'samples': 5789376, 'steps': 30152, 'loss/train': 1.5716723203659058} -11/07/2021 01:30:37 - INFO - __main__ - Step 30154: {'lr': 0.00045667165936501573, 'samples': 5789568, 'steps': 30153, 'loss/train': 1.8349000215530396} -11/07/2021 01:30:38 - INFO - __main__ - Step 30155: {'lr': 0.000456668673411873, 'samples': 5789760, 'steps': 30154, 'loss/train': 1.5699809789657593} -11/07/2021 01:30:38 - INFO - __main__ - Step 30156: {'lr': 0.00045666568736560853, 'samples': 5789952, 'steps': 30155, 'loss/train': 1.7113829851150513} -11/07/2021 01:30:38 - INFO - __main__ - Step 30157: {'lr': 0.0004566627012262238, 'samples': 5790144, 'steps': 30156, 'loss/train': 1.5282222032546997} -11/07/2021 01:30:39 - INFO - __main__ - Step 30158: {'lr': 0.0004566597149937199, 'samples': 5790336, 'steps': 30157, 'loss/train': 1.5575758218765259} -11/07/2021 01:30:40 - INFO - __main__ - Step 30159: {'lr': 0.00045665672866809835, 'samples': 5790528, 'steps': 30158, 'loss/train': 1.7184828519821167} -11/07/2021 01:30:40 - INFO - __main__ - Step 30160: {'lr': 0.0004566537422493605, 'samples': 5790720, 'steps': 30159, 'loss/train': 1.5131640434265137} -11/07/2021 01:30:40 - INFO - __main__ - Step 30161: {'lr': 0.00045665075573750764, 'samples': 5790912, 'steps': 30160, 'loss/train': 1.4869385957717896} -11/07/2021 01:30:41 - INFO - __main__ - Step 30162: {'lr': 0.00045664776913254115, 'samples': 5791104, 'steps': 30161, 'loss/train': 3.2416024208068848} -11/07/2021 01:30:42 - INFO - __main__ - Step 30163: {'lr': 0.0004566447824344624, 'samples': 5791296, 'steps': 30162, 'loss/train': 1.4250823259353638} -11/07/2021 01:30:42 - INFO - __main__ - Step 30164: {'lr': 0.00045664179564327266, 'samples': 5791488, 'steps': 30163, 'loss/train': 1.4880365133285522} -11/07/2021 01:30:42 - INFO - __main__ - Step 30165: {'lr': 0.00045663880875897325, 'samples': 5791680, 'steps': 30164, 'loss/train': 1.4041705131530762} -11/07/2021 01:30:43 - INFO - __main__ - Step 30166: {'lr': 0.00045663582178156564, 'samples': 5791872, 'steps': 30165, 'loss/train': 1.2579805850982666} -11/07/2021 01:30:43 - INFO - __main__ - Step 30167: {'lr': 0.00045663283471105115, 'samples': 5792064, 'steps': 30166, 'loss/train': 1.209857702255249} -11/07/2021 01:30:45 - INFO - __main__ - Step 30168: {'lr': 0.00045662984754743106, 'samples': 5792256, 'steps': 30167, 'loss/train': 1.6755338907241821} -11/07/2021 01:30:45 - INFO - __main__ - Step 30169: {'lr': 0.00045662686029070674, 'samples': 5792448, 'steps': 30168, 'loss/train': 1.4897969961166382} -11/07/2021 01:30:45 - INFO - __main__ - Step 30170: {'lr': 0.0004566238729408796, 'samples': 5792640, 'steps': 30169, 'loss/train': 0.8648298382759094} -11/07/2021 01:30:46 - INFO - __main__ - Step 30171: {'lr': 0.00045662088549795087, 'samples': 5792832, 'steps': 30170, 'loss/train': 1.545324444770813} -11/07/2021 01:30:46 - INFO - __main__ - Step 30172: {'lr': 0.000456617897961922, 'samples': 5793024, 'steps': 30171, 'loss/train': 1.4268949031829834} -11/07/2021 01:30:47 - INFO - __main__ - Step 30173: {'lr': 0.00045661491033279427, 'samples': 5793216, 'steps': 30172, 'loss/train': 1.5952434539794922} -11/07/2021 01:30:48 - INFO - __main__ - Step 30174: {'lr': 0.00045661192261056905, 'samples': 5793408, 'steps': 30173, 'loss/train': 1.5790772438049316} -11/07/2021 01:30:48 - INFO - __main__ - Step 30175: {'lr': 0.00045660893479524767, 'samples': 5793600, 'steps': 30174, 'loss/train': 2.000520706176758} -11/07/2021 01:30:48 - INFO - __main__ - Step 30176: {'lr': 0.00045660594688683154, 'samples': 5793792, 'steps': 30175, 'loss/train': 1.4284133911132812} -11/07/2021 01:30:49 - INFO - __main__ - Step 30177: {'lr': 0.00045660295888532196, 'samples': 5793984, 'steps': 30176, 'loss/train': 1.7523822784423828} -11/07/2021 01:30:50 - INFO - __main__ - Step 30178: {'lr': 0.00045659997079072024, 'samples': 5794176, 'steps': 30177, 'loss/train': 1.5193082094192505} -11/07/2021 01:30:50 - INFO - __main__ - Step 30179: {'lr': 0.00045659698260302773, 'samples': 5794368, 'steps': 30178, 'loss/train': 1.563475251197815} -11/07/2021 01:30:50 - INFO - __main__ - Step 30180: {'lr': 0.00045659399432224583, 'samples': 5794560, 'steps': 30179, 'loss/train': 1.3032660484313965} -11/07/2021 01:30:51 - INFO - __main__ - Step 30181: {'lr': 0.00045659100594837586, 'samples': 5794752, 'steps': 30180, 'loss/train': 1.5408105850219727} -11/07/2021 01:30:51 - INFO - __main__ - Step 30182: {'lr': 0.0004565880174814192, 'samples': 5794944, 'steps': 30181, 'loss/train': 1.7648100852966309} -11/07/2021 01:30:51 - INFO - __main__ - Step 30183: {'lr': 0.0004565850289213772, 'samples': 5795136, 'steps': 30182, 'loss/train': 1.5357639789581299} -11/07/2021 01:30:53 - INFO - __main__ - Step 30184: {'lr': 0.0004565820402682511, 'samples': 5795328, 'steps': 30183, 'loss/train': 1.9818118810653687} -11/07/2021 01:30:53 - INFO - __main__ - Step 30185: {'lr': 0.00045657905152204236, 'samples': 5795520, 'steps': 30184, 'loss/train': 0.6554961204528809} -11/07/2021 01:30:53 - INFO - __main__ - Step 30186: {'lr': 0.0004565760626827523, 'samples': 5795712, 'steps': 30185, 'loss/train': 1.025604248046875} -11/07/2021 01:30:54 - INFO - __main__ - Step 30187: {'lr': 0.00045657307375038226, 'samples': 5795904, 'steps': 30186, 'loss/train': 1.1355433464050293} -11/07/2021 01:30:54 - INFO - __main__ - Step 30188: {'lr': 0.00045657008472493356, 'samples': 5796096, 'steps': 30187, 'loss/train': 1.4717738628387451} -11/07/2021 01:30:55 - INFO - __main__ - Step 30189: {'lr': 0.0004565670956064075, 'samples': 5796288, 'steps': 30188, 'loss/train': 1.4684523344039917} -11/07/2021 01:30:55 - INFO - __main__ - Step 30190: {'lr': 0.00045656410639480563, 'samples': 5796480, 'steps': 30189, 'loss/train': 1.4059257507324219} -11/07/2021 01:30:56 - INFO - __main__ - Step 30191: {'lr': 0.00045656111709012906, 'samples': 5796672, 'steps': 30190, 'loss/train': 1.1448701620101929} -11/07/2021 01:30:56 - INFO - __main__ - Step 30192: {'lr': 0.00045655812769237927, 'samples': 5796864, 'steps': 30191, 'loss/train': 1.4939942359924316} -11/07/2021 01:30:57 - INFO - __main__ - Step 30193: {'lr': 0.00045655513820155755, 'samples': 5797056, 'steps': 30192, 'loss/train': 4.016806602478027} -11/07/2021 01:30:58 - INFO - __main__ - Step 30194: {'lr': 0.00045655214861766525, 'samples': 5797248, 'steps': 30193, 'loss/train': 1.5990046262741089} -11/07/2021 01:30:58 - INFO - __main__ - Step 30195: {'lr': 0.0004565491589407038, 'samples': 5797440, 'steps': 30194, 'loss/train': 1.4188684225082397} -11/07/2021 01:30:59 - INFO - __main__ - Step 30196: {'lr': 0.0004565461691706745, 'samples': 5797632, 'steps': 30195, 'loss/train': 1.6000747680664062} -11/07/2021 01:30:59 - INFO - __main__ - Step 30197: {'lr': 0.0004565431793075786, 'samples': 5797824, 'steps': 30196, 'loss/train': 1.141895055770874} -11/07/2021 01:30:59 - INFO - __main__ - Step 30198: {'lr': 0.0004565401893514176, 'samples': 5798016, 'steps': 30197, 'loss/train': 1.2154690027236938} -11/07/2021 01:31:00 - INFO - __main__ - Step 30199: {'lr': 0.0004565371993021927, 'samples': 5798208, 'steps': 30198, 'loss/train': 1.5073283910751343} -11/07/2021 01:31:01 - INFO - __main__ - Step 30200: {'lr': 0.00045653420915990546, 'samples': 5798400, 'steps': 30199, 'loss/train': 1.5848606824874878} -11/07/2021 01:31:01 - INFO - __main__ - Step 30201: {'lr': 0.000456531218924557, 'samples': 5798592, 'steps': 30200, 'loss/train': 1.862545371055603} -11/07/2021 01:31:01 - INFO - __main__ - Step 30202: {'lr': 0.0004565282285961488, 'samples': 5798784, 'steps': 30201, 'loss/train': 1.546978235244751} -11/07/2021 01:31:02 - INFO - __main__ - Step 30203: {'lr': 0.0004565252381746821, 'samples': 5798976, 'steps': 30202, 'loss/train': 1.5877180099487305} -11/07/2021 01:31:02 - INFO - __main__ - Step 30204: {'lr': 0.0004565222476601584, 'samples': 5799168, 'steps': 30203, 'loss/train': 1.850545883178711} -11/07/2021 01:31:03 - INFO - __main__ - Step 30205: {'lr': 0.0004565192570525789, 'samples': 5799360, 'steps': 30204, 'loss/train': 1.8471728563308716} -11/07/2021 01:31:03 - INFO - __main__ - Step 30206: {'lr': 0.00045651626635194497, 'samples': 5799552, 'steps': 30205, 'loss/train': 1.6950767040252686} -11/07/2021 01:31:04 - INFO - __main__ - Step 30207: {'lr': 0.0004565132755582581, 'samples': 5799744, 'steps': 30206, 'loss/train': 1.3628997802734375} -11/07/2021 01:31:04 - INFO - __main__ - Step 30208: {'lr': 0.0004565102846715195, 'samples': 5799936, 'steps': 30207, 'loss/train': 1.5977096557617188} -11/07/2021 01:31:04 - INFO - __main__ - Step 30209: {'lr': 0.0004565072936917305, 'samples': 5800128, 'steps': 30208, 'loss/train': 1.0420420169830322} -11/07/2021 01:31:06 - INFO - __main__ - Step 30210: {'lr': 0.0004565043026188926, 'samples': 5800320, 'steps': 30209, 'loss/train': 1.3461986780166626} -11/07/2021 01:31:06 - INFO - __main__ - Step 30211: {'lr': 0.000456501311453007, 'samples': 5800512, 'steps': 30210, 'loss/train': 1.7356064319610596} -11/07/2021 01:31:06 - INFO - __main__ - Step 30212: {'lr': 0.00045649832019407504, 'samples': 5800704, 'steps': 30211, 'loss/train': 1.5009082555770874} -11/07/2021 01:31:07 - INFO - __main__ - Step 30213: {'lr': 0.0004564953288420982, 'samples': 5800896, 'steps': 30212, 'loss/train': 1.2765473127365112} -11/07/2021 01:31:07 - INFO - __main__ - Step 30214: {'lr': 0.00045649233739707774, 'samples': 5801088, 'steps': 30213, 'loss/train': 1.5545157194137573} -11/07/2021 01:31:07 - INFO - __main__ - Step 30215: {'lr': 0.00045648934585901496, 'samples': 5801280, 'steps': 30214, 'loss/train': 1.4928683042526245} -11/07/2021 01:31:08 - INFO - __main__ - Step 30216: {'lr': 0.0004564863542279113, 'samples': 5801472, 'steps': 30215, 'loss/train': 1.6348497867584229} -11/07/2021 01:31:09 - INFO - __main__ - Step 30217: {'lr': 0.0004564833625037681, 'samples': 5801664, 'steps': 30216, 'loss/train': 1.4835448265075684} -11/07/2021 01:31:09 - INFO - __main__ - Step 30218: {'lr': 0.00045648037068658667, 'samples': 5801856, 'steps': 30217, 'loss/train': 1.124776005744934} -11/07/2021 01:31:09 - INFO - __main__ - Step 30219: {'lr': 0.00045647737877636834, 'samples': 5802048, 'steps': 30218, 'loss/train': 1.5227097272872925} -11/07/2021 01:31:10 - INFO - __main__ - Step 30220: {'lr': 0.0004564743867731145, 'samples': 5802240, 'steps': 30219, 'loss/train': 1.4747366905212402} -11/07/2021 01:31:11 - INFO - __main__ - Step 30221: {'lr': 0.0004564713946768265, 'samples': 5802432, 'steps': 30220, 'loss/train': 1.6206881999969482} -11/07/2021 01:31:11 - INFO - __main__ - Step 30222: {'lr': 0.0004564684024875057, 'samples': 5802624, 'steps': 30221, 'loss/train': 1.8404051065444946} -11/07/2021 01:31:12 - INFO - __main__ - Step 30223: {'lr': 0.0004564654102051534, 'samples': 5802816, 'steps': 30222, 'loss/train': 0.8817972540855408} -11/07/2021 01:31:12 - INFO - __main__ - Step 30224: {'lr': 0.000456462417829771, 'samples': 5803008, 'steps': 30223, 'loss/train': 1.4281342029571533} -11/07/2021 01:31:12 - INFO - __main__ - Step 30225: {'lr': 0.0004564594253613598, 'samples': 5803200, 'steps': 30224, 'loss/train': 1.5440261363983154} -11/07/2021 01:31:13 - INFO - __main__ - Step 30226: {'lr': 0.0004564564327999211, 'samples': 5803392, 'steps': 30225, 'loss/train': 1.7672604322433472} -11/07/2021 01:31:14 - INFO - __main__ - Step 30227: {'lr': 0.00045645344014545643, 'samples': 5803584, 'steps': 30226, 'loss/train': 1.117114543914795} -11/07/2021 01:31:14 - INFO - __main__ - Step 30228: {'lr': 0.00045645044739796694, 'samples': 5803776, 'steps': 30227, 'loss/train': 1.7497179508209229} -11/07/2021 01:31:14 - INFO - __main__ - Step 30229: {'lr': 0.00045644745455745414, 'samples': 5803968, 'steps': 30228, 'loss/train': 1.7879761457443237} -11/07/2021 01:31:15 - INFO - __main__ - Step 30230: {'lr': 0.0004564444616239193, 'samples': 5804160, 'steps': 30229, 'loss/train': 1.0915133953094482} -11/07/2021 01:31:16 - INFO - __main__ - Step 30231: {'lr': 0.0004564414685973637, 'samples': 5804352, 'steps': 30230, 'loss/train': 1.574084758758545} -11/07/2021 01:31:16 - INFO - __main__ - Step 30232: {'lr': 0.0004564384754777888, 'samples': 5804544, 'steps': 30231, 'loss/train': 1.618294358253479} -11/07/2021 01:31:16 - INFO - __main__ - Step 30233: {'lr': 0.00045643548226519587, 'samples': 5804736, 'steps': 30232, 'loss/train': 1.8467299938201904} -11/07/2021 01:31:17 - INFO - __main__ - Step 30234: {'lr': 0.00045643248895958636, 'samples': 5804928, 'steps': 30233, 'loss/train': 1.3164348602294922} -11/07/2021 01:31:17 - INFO - __main__ - Step 30235: {'lr': 0.00045642949556096146, 'samples': 5805120, 'steps': 30234, 'loss/train': 1.2188383340835571} -11/07/2021 01:31:17 - INFO - __main__ - Step 30236: {'lr': 0.0004564265020693227, 'samples': 5805312, 'steps': 30235, 'loss/train': 1.6616016626358032} -11/07/2021 01:31:18 - INFO - __main__ - Step 30237: {'lr': 0.0004564235084846713, 'samples': 5805504, 'steps': 30236, 'loss/train': 1.7576926946640015} -11/07/2021 01:31:19 - INFO - __main__ - Step 30238: {'lr': 0.00045642051480700873, 'samples': 5805696, 'steps': 30237, 'loss/train': 1.550876259803772} -11/07/2021 01:31:19 - INFO - __main__ - Step 30239: {'lr': 0.0004564175210363362, 'samples': 5805888, 'steps': 30238, 'loss/train': 1.633492350578308} -11/07/2021 01:31:20 - INFO - __main__ - Step 30240: {'lr': 0.00045641452717265507, 'samples': 5806080, 'steps': 30239, 'loss/train': 1.3447606563568115} -11/07/2021 01:31:20 - INFO - __main__ - Step 30241: {'lr': 0.00045641153321596687, 'samples': 5806272, 'steps': 30240, 'loss/train': 1.3774157762527466} -11/07/2021 01:31:21 - INFO - __main__ - Step 30242: {'lr': 0.0004564085391662727, 'samples': 5806464, 'steps': 30241, 'loss/train': 1.6286267042160034} -11/07/2021 01:31:21 - INFO - __main__ - Step 30243: {'lr': 0.00045640554502357413, 'samples': 5806656, 'steps': 30242, 'loss/train': 1.4465882778167725} -11/07/2021 01:31:22 - INFO - __main__ - Step 30244: {'lr': 0.0004564025507878723, 'samples': 5806848, 'steps': 30243, 'loss/train': 1.7390762567520142} -11/07/2021 01:31:22 - INFO - __main__ - Step 30245: {'lr': 0.00045639955645916875, 'samples': 5807040, 'steps': 30244, 'loss/train': 0.9178106188774109} -11/07/2021 01:31:22 - INFO - __main__ - Step 30246: {'lr': 0.0004563965620374647, 'samples': 5807232, 'steps': 30245, 'loss/train': 1.531065583229065} -11/07/2021 01:31:23 - INFO - __main__ - Step 30247: {'lr': 0.0004563935675227615, 'samples': 5807424, 'steps': 30246, 'loss/train': 1.9159185886383057} -11/07/2021 01:31:24 - INFO - __main__ - Step 30248: {'lr': 0.00045639057291506065, 'samples': 5807616, 'steps': 30247, 'loss/train': 1.6641156673431396} -11/07/2021 01:31:24 - INFO - __main__ - Step 30249: {'lr': 0.0004563875782143633, 'samples': 5807808, 'steps': 30248, 'loss/train': 1.6026545763015747} -11/07/2021 01:31:25 - INFO - __main__ - Step 30250: {'lr': 0.000456384583420671, 'samples': 5808000, 'steps': 30249, 'loss/train': 1.2319056987762451} -11/07/2021 01:31:25 - INFO - __main__ - Step 30251: {'lr': 0.0004563815885339849, 'samples': 5808192, 'steps': 30250, 'loss/train': 1.30437171459198} -11/07/2021 01:31:25 - INFO - __main__ - Step 30252: {'lr': 0.00045637859355430647, 'samples': 5808384, 'steps': 30251, 'loss/train': 1.471893548965454} -11/07/2021 01:31:26 - INFO - __main__ - Step 30253: {'lr': 0.000456375598481637, 'samples': 5808576, 'steps': 30252, 'loss/train': 1.7426419258117676} -11/07/2021 01:31:27 - INFO - __main__ - Step 30254: {'lr': 0.00045637260331597793, 'samples': 5808768, 'steps': 30253, 'loss/train': 1.6000956296920776} -11/07/2021 01:31:27 - INFO - __main__ - Step 30255: {'lr': 0.00045636960805733054, 'samples': 5808960, 'steps': 30254, 'loss/train': 1.3028124570846558} -11/07/2021 01:31:27 - INFO - __main__ - Step 30256: {'lr': 0.0004563666127056961, 'samples': 5809152, 'steps': 30255, 'loss/train': 1.526604413986206} -11/07/2021 01:31:28 - INFO - __main__ - Step 30257: {'lr': 0.0004563636172610761, 'samples': 5809344, 'steps': 30256, 'loss/train': 1.6551815271377563} -11/07/2021 01:31:29 - INFO - __main__ - Step 30258: {'lr': 0.00045636062172347186, 'samples': 5809536, 'steps': 30257, 'loss/train': 0.7848110198974609} -11/07/2021 01:31:29 - INFO - __main__ - Step 30259: {'lr': 0.0004563576260928847, 'samples': 5809728, 'steps': 30258, 'loss/train': 1.6645081043243408} -11/07/2021 01:31:30 - INFO - __main__ - Step 30260: {'lr': 0.000456354630369316, 'samples': 5809920, 'steps': 30259, 'loss/train': 1.7983936071395874} -11/07/2021 01:31:30 - INFO - __main__ - Step 30261: {'lr': 0.00045635163455276707, 'samples': 5810112, 'steps': 30260, 'loss/train': 1.5694831609725952} -11/07/2021 01:31:30 - INFO - __main__ - Step 30262: {'lr': 0.0004563486386432393, 'samples': 5810304, 'steps': 30261, 'loss/train': 1.768189549446106} -11/07/2021 01:31:31 - INFO - __main__ - Step 30263: {'lr': 0.00045634564264073396, 'samples': 5810496, 'steps': 30262, 'loss/train': 0.912808358669281} -11/07/2021 01:31:32 - INFO - __main__ - Step 30264: {'lr': 0.0004563426465452525, 'samples': 5810688, 'steps': 30263, 'loss/train': 1.8347886800765991} -11/07/2021 01:31:32 - INFO - __main__ - Step 30265: {'lr': 0.00045633965035679614, 'samples': 5810880, 'steps': 30264, 'loss/train': 1.2841131687164307} -11/07/2021 01:31:33 - INFO - __main__ - Step 30266: {'lr': 0.0004563366540753664, 'samples': 5811072, 'steps': 30265, 'loss/train': 1.7946243286132812} -11/07/2021 01:31:33 - INFO - __main__ - Step 30267: {'lr': 0.00045633365770096456, 'samples': 5811264, 'steps': 30266, 'loss/train': 1.5827088356018066} -11/07/2021 01:31:33 - INFO - __main__ - Step 30268: {'lr': 0.000456330661233592, 'samples': 5811456, 'steps': 30267, 'loss/train': 1.5512784719467163} -11/07/2021 01:31:35 - INFO - __main__ - Step 30269: {'lr': 0.00045632766467324995, 'samples': 5811648, 'steps': 30268, 'loss/train': 1.6750398874282837} -11/07/2021 01:31:35 - INFO - __main__ - Step 30270: {'lr': 0.0004563246680199398, 'samples': 5811840, 'steps': 30269, 'loss/train': 1.5613741874694824} -11/07/2021 01:31:36 - INFO - __main__ - Step 30271: {'lr': 0.000456321671273663, 'samples': 5812032, 'steps': 30270, 'loss/train': 1.44844651222229} -11/07/2021 01:31:36 - INFO - __main__ - Step 30272: {'lr': 0.00045631867443442084, 'samples': 5812224, 'steps': 30271, 'loss/train': 1.8668856620788574} -11/07/2021 01:31:36 - INFO - __main__ - Step 30273: {'lr': 0.00045631567750221465, 'samples': 5812416, 'steps': 30272, 'loss/train': 1.2790777683258057} -11/07/2021 01:31:37 - INFO - __main__ - Step 30274: {'lr': 0.0004563126804770458, 'samples': 5812608, 'steps': 30273, 'loss/train': 1.2653971910476685} -11/07/2021 01:31:38 - INFO - __main__ - Step 30275: {'lr': 0.00045630968335891564, 'samples': 5812800, 'steps': 30274, 'loss/train': 0.49572262167930603} -11/07/2021 01:31:38 - INFO - __main__ - Step 30276: {'lr': 0.00045630668614782553, 'samples': 5812992, 'steps': 30275, 'loss/train': 1.835469365119934} -11/07/2021 01:31:39 - INFO - __main__ - Step 30277: {'lr': 0.0004563036888437768, 'samples': 5813184, 'steps': 30276, 'loss/train': 1.9106202125549316} -11/07/2021 01:31:39 - INFO - __main__ - Step 30278: {'lr': 0.0004563006914467709, 'samples': 5813376, 'steps': 30277, 'loss/train': 1.3554658889770508} -11/07/2021 01:31:39 - INFO - __main__ - Step 30279: {'lr': 0.000456297693956809, 'samples': 5813568, 'steps': 30278, 'loss/train': 1.355484127998352} -11/07/2021 01:31:40 - INFO - __main__ - Step 30280: {'lr': 0.0004562946963738925, 'samples': 5813760, 'steps': 30279, 'loss/train': 1.4761924743652344} -11/07/2021 01:31:41 - INFO - __main__ - Step 30281: {'lr': 0.0004562916986980229, 'samples': 5813952, 'steps': 30280, 'loss/train': 2.2222375869750977} -11/07/2021 01:31:41 - INFO - __main__ - Step 30282: {'lr': 0.0004562887009292014, 'samples': 5814144, 'steps': 30281, 'loss/train': 1.4915366172790527} -11/07/2021 01:31:41 - INFO - __main__ - Step 30283: {'lr': 0.0004562857030674293, 'samples': 5814336, 'steps': 30282, 'loss/train': 1.5470994710922241} -11/07/2021 01:31:42 - INFO - __main__ - Step 30284: {'lr': 0.0004562827051127082, 'samples': 5814528, 'steps': 30283, 'loss/train': 1.2854667901992798} -11/07/2021 01:31:43 - INFO - __main__ - Step 30285: {'lr': 0.0004562797070650392, 'samples': 5814720, 'steps': 30284, 'loss/train': 1.4260727167129517} -11/07/2021 01:31:43 - INFO - __main__ - Step 30286: {'lr': 0.00045627670892442376, 'samples': 5814912, 'steps': 30285, 'loss/train': 1.5417121648788452} -11/07/2021 01:31:43 - INFO - __main__ - Step 30287: {'lr': 0.0004562737106908632, 'samples': 5815104, 'steps': 30286, 'loss/train': 0.8534297943115234} -11/07/2021 01:31:44 - INFO - __main__ - Step 30288: {'lr': 0.00045627071236435896, 'samples': 5815296, 'steps': 30287, 'loss/train': 1.6247920989990234} -11/07/2021 01:31:44 - INFO - __main__ - Step 30289: {'lr': 0.0004562677139449123, 'samples': 5815488, 'steps': 30288, 'loss/train': 1.485723853111267} -11/07/2021 01:31:45 - INFO - __main__ - Step 30290: {'lr': 0.0004562647154325246, 'samples': 5815680, 'steps': 30289, 'loss/train': 1.6737288236618042} -11/07/2021 01:31:45 - INFO - __main__ - Step 30291: {'lr': 0.0004562617168271971, 'samples': 5815872, 'steps': 30290, 'loss/train': 1.262340784072876} -11/07/2021 01:31:46 - INFO - __main__ - Step 30292: {'lr': 0.0004562587181289314, 'samples': 5816064, 'steps': 30291, 'loss/train': 1.1251622438430786} -11/07/2021 01:31:46 - INFO - __main__ - Step 30293: {'lr': 0.00045625571933772857, 'samples': 5816256, 'steps': 30292, 'loss/train': 1.7130277156829834} -11/07/2021 01:31:47 - INFO - __main__ - Step 30294: {'lr': 0.0004562527204535902, 'samples': 5816448, 'steps': 30293, 'loss/train': 1.5328103303909302} -11/07/2021 01:31:47 - INFO - __main__ - Step 30295: {'lr': 0.00045624972147651746, 'samples': 5816640, 'steps': 30294, 'loss/train': 1.6957600116729736} -11/07/2021 01:31:48 - INFO - __main__ - Step 30296: {'lr': 0.00045624672240651183, 'samples': 5816832, 'steps': 30295, 'loss/train': 1.4732813835144043} -11/07/2021 01:31:48 - INFO - __main__ - Step 30297: {'lr': 0.00045624372324357457, 'samples': 5817024, 'steps': 30296, 'loss/train': 1.6591161489486694} -11/07/2021 01:31:49 - INFO - __main__ - Step 30298: {'lr': 0.0004562407239877071, 'samples': 5817216, 'steps': 30297, 'loss/train': 1.7493314743041992} -11/07/2021 01:31:49 - INFO - __main__ - Step 30299: {'lr': 0.0004562377246389108, 'samples': 5817408, 'steps': 30298, 'loss/train': 1.5536787509918213} -11/07/2021 01:31:50 - INFO - __main__ - Step 30300: {'lr': 0.00045623472519718683, 'samples': 5817600, 'steps': 30299, 'loss/train': 1.7294906377792358} -11/07/2021 01:31:50 - INFO - __main__ - Step 30301: {'lr': 0.00045623172566253676, 'samples': 5817792, 'steps': 30300, 'loss/train': 1.6559518575668335} -11/07/2021 01:31:51 - INFO - __main__ - Step 30302: {'lr': 0.00045622872603496184, 'samples': 5817984, 'steps': 30301, 'loss/train': 1.169908881187439} -11/07/2021 01:31:51 - INFO - __main__ - Step 30303: {'lr': 0.0004562257263144635, 'samples': 5818176, 'steps': 30302, 'loss/train': 1.2968664169311523} -11/07/2021 01:31:51 - INFO - __main__ - Step 30304: {'lr': 0.0004562227265010429, 'samples': 5818368, 'steps': 30303, 'loss/train': 1.3897583484649658} -11/07/2021 01:31:52 - INFO - __main__ - Step 30305: {'lr': 0.00045621972659470156, 'samples': 5818560, 'steps': 30304, 'loss/train': 1.796301007270813} -11/07/2021 01:31:53 - INFO - __main__ - Step 30306: {'lr': 0.0004562167265954409, 'samples': 5818752, 'steps': 30305, 'loss/train': 1.7360395193099976} -11/07/2021 01:31:53 - INFO - __main__ - Step 30307: {'lr': 0.000456213726503262, 'samples': 5818944, 'steps': 30306, 'loss/train': 1.4913867712020874} -11/07/2021 01:31:53 - INFO - __main__ - Step 30308: {'lr': 0.0004562107263181665, 'samples': 5819136, 'steps': 30307, 'loss/train': 1.6164582967758179} -11/07/2021 01:31:54 - INFO - __main__ - Step 30309: {'lr': 0.0004562077260401556, 'samples': 5819328, 'steps': 30308, 'loss/train': 1.4213775396347046} -11/07/2021 01:31:54 - INFO - __main__ - Step 30310: {'lr': 0.00045620472566923064, 'samples': 5819520, 'steps': 30309, 'loss/train': 1.0018659830093384} -11/07/2021 01:31:55 - INFO - __main__ - Step 30311: {'lr': 0.0004562017252053931, 'samples': 5819712, 'steps': 30310, 'loss/train': 1.6342417001724243} -11/07/2021 01:31:56 - INFO - __main__ - Step 30312: {'lr': 0.0004561987246486442, 'samples': 5819904, 'steps': 30311, 'loss/train': 1.7264950275421143} -11/07/2021 01:31:56 - INFO - __main__ - Step 30313: {'lr': 0.00045619572399898534, 'samples': 5820096, 'steps': 30312, 'loss/train': 6.909998893737793} -11/07/2021 01:31:56 - INFO - __main__ - Step 30314: {'lr': 0.0004561927232564179, 'samples': 5820288, 'steps': 30313, 'loss/train': 2.314699172973633} -11/07/2021 01:31:57 - INFO - __main__ - Step 30315: {'lr': 0.00045618972242094313, 'samples': 5820480, 'steps': 30314, 'loss/train': 0.9875410199165344} -11/07/2021 01:31:58 - INFO - __main__ - Step 30316: {'lr': 0.00045618672149256244, 'samples': 5820672, 'steps': 30315, 'loss/train': 1.4033745527267456} -11/07/2021 01:31:58 - INFO - __main__ - Step 30317: {'lr': 0.0004561837204712773, 'samples': 5820864, 'steps': 30316, 'loss/train': 0.5098898410797119} -11/07/2021 01:31:59 - INFO - __main__ - Step 30318: {'lr': 0.0004561807193570888, 'samples': 5821056, 'steps': 30317, 'loss/train': 0.8450649976730347} -11/07/2021 01:31:59 - INFO - __main__ - Step 30319: {'lr': 0.0004561777181499986, 'samples': 5821248, 'steps': 30318, 'loss/train': 1.991714358329773} -11/07/2021 01:31:59 - INFO - __main__ - Step 30320: {'lr': 0.00045617471685000785, 'samples': 5821440, 'steps': 30319, 'loss/train': 0.922199547290802} -11/07/2021 01:32:00 - INFO - __main__ - Step 30321: {'lr': 0.00045617171545711793, 'samples': 5821632, 'steps': 30320, 'loss/train': 1.2312003374099731} -11/07/2021 01:32:01 - INFO - __main__ - Step 30322: {'lr': 0.0004561687139713302, 'samples': 5821824, 'steps': 30321, 'loss/train': 1.8956984281539917} -11/07/2021 01:32:01 - INFO - __main__ - Step 30323: {'lr': 0.00045616571239264614, 'samples': 5822016, 'steps': 30322, 'loss/train': 1.717467188835144} -11/07/2021 01:32:02 - INFO - __main__ - Step 30324: {'lr': 0.0004561627107210669, 'samples': 5822208, 'steps': 30323, 'loss/train': 1.844076156616211} -11/07/2021 01:32:02 - INFO - __main__ - Step 30325: {'lr': 0.00045615970895659393, 'samples': 5822400, 'steps': 30324, 'loss/train': 0.860467255115509} -11/07/2021 01:32:02 - INFO - __main__ - Step 30326: {'lr': 0.00045615670709922855, 'samples': 5822592, 'steps': 30325, 'loss/train': 2.927840232849121} -11/07/2021 01:32:03 - INFO - __main__ - Step 30327: {'lr': 0.0004561537051489722, 'samples': 5822784, 'steps': 30326, 'loss/train': 2.943389892578125} -11/07/2021 01:32:04 - INFO - __main__ - Step 30328: {'lr': 0.00045615070310582617, 'samples': 5822976, 'steps': 30327, 'loss/train': 1.597343921661377} -11/07/2021 01:32:04 - INFO - __main__ - Step 30329: {'lr': 0.00045614770096979177, 'samples': 5823168, 'steps': 30328, 'loss/train': 1.5728250741958618} -11/07/2021 01:32:05 - INFO - __main__ - Step 30330: {'lr': 0.0004561446987408704, 'samples': 5823360, 'steps': 30329, 'loss/train': 1.852549433708191} -11/07/2021 01:32:05 - INFO - __main__ - Step 30331: {'lr': 0.00045614169641906344, 'samples': 5823552, 'steps': 30330, 'loss/train': 1.5262786149978638} -11/07/2021 01:32:05 - INFO - __main__ - Step 30332: {'lr': 0.00045613869400437223, 'samples': 5823744, 'steps': 30331, 'loss/train': 1.6622519493103027} -11/07/2021 01:32:06 - INFO - __main__ - Step 30333: {'lr': 0.000456135691496798, 'samples': 5823936, 'steps': 30332, 'loss/train': 1.857367992401123} -11/07/2021 01:32:07 - INFO - __main__ - Step 30334: {'lr': 0.0004561326888963423, 'samples': 5824128, 'steps': 30333, 'loss/train': 1.3868197202682495} -11/07/2021 01:32:07 - INFO - __main__ - Step 30335: {'lr': 0.0004561296862030064, 'samples': 5824320, 'steps': 30334, 'loss/train': 1.6627488136291504} -11/07/2021 01:32:07 - INFO - __main__ - Step 30336: {'lr': 0.00045612668341679164, 'samples': 5824512, 'steps': 30335, 'loss/train': 1.669124722480774} -11/07/2021 01:32:08 - INFO - __main__ - Step 30337: {'lr': 0.0004561236805376994, 'samples': 5824704, 'steps': 30336, 'loss/train': 1.3865309953689575} -11/07/2021 01:32:09 - INFO - __main__ - Step 30338: {'lr': 0.00045612067756573097, 'samples': 5824896, 'steps': 30337, 'loss/train': 1.4449416399002075} -11/07/2021 01:32:09 - INFO - __main__ - Step 30339: {'lr': 0.0004561176745008877, 'samples': 5825088, 'steps': 30338, 'loss/train': 1.609216570854187} -11/07/2021 01:32:10 - INFO - __main__ - Step 30340: {'lr': 0.000456114671343171, 'samples': 5825280, 'steps': 30339, 'loss/train': 1.2884266376495361} -11/07/2021 01:32:10 - INFO - __main__ - Step 30341: {'lr': 0.00045611166809258227, 'samples': 5825472, 'steps': 30340, 'loss/train': 1.75202214717865} -11/07/2021 01:32:10 - INFO - __main__ - Step 30342: {'lr': 0.0004561086647491227, 'samples': 5825664, 'steps': 30341, 'loss/train': 1.4077476263046265} -11/07/2021 01:32:11 - INFO - __main__ - Step 30343: {'lr': 0.00045610566131279386, 'samples': 5825856, 'steps': 30342, 'loss/train': 1.4677209854125977} -11/07/2021 01:32:12 - INFO - __main__ - Step 30344: {'lr': 0.00045610265778359696, 'samples': 5826048, 'steps': 30343, 'loss/train': 0.9540789723396301} -11/07/2021 01:32:12 - INFO - __main__ - Step 30345: {'lr': 0.00045609965416153333, 'samples': 5826240, 'steps': 30344, 'loss/train': 1.9768776893615723} -11/07/2021 01:32:12 - INFO - __main__ - Step 30346: {'lr': 0.0004560966504466044, 'samples': 5826432, 'steps': 30345, 'loss/train': 1.844706416130066} -11/07/2021 01:32:13 - INFO - __main__ - Step 30347: {'lr': 0.00045609364663881153, 'samples': 5826624, 'steps': 30346, 'loss/train': 1.6334888935089111} -11/07/2021 01:32:14 - INFO - __main__ - Step 30348: {'lr': 0.000456090642738156, 'samples': 5826816, 'steps': 30347, 'loss/train': 1.814347505569458} -11/07/2021 01:32:14 - INFO - __main__ - Step 30349: {'lr': 0.00045608763874463925, 'samples': 5827008, 'steps': 30348, 'loss/train': 1.4767755270004272} -11/07/2021 01:32:14 - INFO - __main__ - Step 30350: {'lr': 0.00045608463465826257, 'samples': 5827200, 'steps': 30349, 'loss/train': 1.694061040878296} -11/07/2021 01:32:15 - INFO - __main__ - Step 30351: {'lr': 0.0004560816304790274, 'samples': 5827392, 'steps': 30350, 'loss/train': 1.9288541078567505} -11/07/2021 01:32:15 - INFO - __main__ - Step 30352: {'lr': 0.0004560786262069349, 'samples': 5827584, 'steps': 30351, 'loss/train': 1.5461041927337646} -11/07/2021 01:32:16 - INFO - __main__ - Step 30353: {'lr': 0.00045607562184198666, 'samples': 5827776, 'steps': 30352, 'loss/train': 1.8285548686981201} -11/07/2021 01:32:17 - INFO - __main__ - Step 30354: {'lr': 0.00045607261738418384, 'samples': 5827968, 'steps': 30353, 'loss/train': 1.6511898040771484} -11/07/2021 01:32:17 - INFO - __main__ - Step 30355: {'lr': 0.00045606961283352793, 'samples': 5828160, 'steps': 30354, 'loss/train': 1.591403603553772} -11/07/2021 01:32:17 - INFO - __main__ - Step 30356: {'lr': 0.0004560666081900202, 'samples': 5828352, 'steps': 30355, 'loss/train': 1.5361576080322266} -11/07/2021 01:32:18 - INFO - __main__ - Step 30357: {'lr': 0.00045606360345366203, 'samples': 5828544, 'steps': 30356, 'loss/train': 1.9898298978805542} -11/07/2021 01:32:18 - INFO - __main__ - Step 30358: {'lr': 0.00045606059862445485, 'samples': 5828736, 'steps': 30357, 'loss/train': 0.9508589506149292} -11/07/2021 01:32:20 - INFO - __main__ - Step 30359: {'lr': 0.0004560575937023999, 'samples': 5828928, 'steps': 30358, 'loss/train': 1.9072965383529663} -11/07/2021 01:32:20 - INFO - __main__ - Step 30360: {'lr': 0.0004560545886874986, 'samples': 5829120, 'steps': 30359, 'loss/train': 0.832706093788147} -11/07/2021 01:32:20 - INFO - __main__ - Step 30361: {'lr': 0.00045605158357975225, 'samples': 5829312, 'steps': 30360, 'loss/train': 1.1118340492248535} -11/07/2021 01:32:21 - INFO - __main__ - Step 30362: {'lr': 0.00045604857837916224, 'samples': 5829504, 'steps': 30361, 'loss/train': 1.3667658567428589} -11/07/2021 01:32:21 - INFO - __main__ - Step 30363: {'lr': 0.0004560455730857299, 'samples': 5829696, 'steps': 30362, 'loss/train': 2.0607755184173584} -11/07/2021 01:32:21 - INFO - __main__ - Step 30364: {'lr': 0.0004560425676994566, 'samples': 5829888, 'steps': 30363, 'loss/train': 1.497362732887268} -11/07/2021 01:32:22 - INFO - __main__ - Step 30365: {'lr': 0.00045603956222034384, 'samples': 5830080, 'steps': 30364, 'loss/train': 1.8845192193984985} -11/07/2021 01:32:23 - INFO - __main__ - Step 30366: {'lr': 0.0004560365566483927, 'samples': 5830272, 'steps': 30365, 'loss/train': 1.4809709787368774} -11/07/2021 01:32:23 - INFO - __main__ - Step 30367: {'lr': 0.00045603355098360466, 'samples': 5830464, 'steps': 30366, 'loss/train': 1.458250880241394} -11/07/2021 01:32:23 - INFO - __main__ - Step 30368: {'lr': 0.00045603054522598107, 'samples': 5830656, 'steps': 30367, 'loss/train': 1.8294758796691895} -11/07/2021 01:32:24 - INFO - __main__ - Step 30369: {'lr': 0.0004560275393755233, 'samples': 5830848, 'steps': 30368, 'loss/train': 1.6920772790908813} -11/07/2021 01:32:25 - INFO - __main__ - Step 30370: {'lr': 0.0004560245334322328, 'samples': 5831040, 'steps': 30369, 'loss/train': 1.7748409509658813} -11/07/2021 01:32:25 - INFO - __main__ - Step 30371: {'lr': 0.00045602152739611075, 'samples': 5831232, 'steps': 30370, 'loss/train': 1.7006174325942993} -11/07/2021 01:32:25 - INFO - __main__ - Step 30372: {'lr': 0.0004560185212671586, 'samples': 5831424, 'steps': 30371, 'loss/train': 1.10115647315979} -11/07/2021 01:32:26 - INFO - __main__ - Step 30373: {'lr': 0.00045601551504537765, 'samples': 5831616, 'steps': 30372, 'loss/train': 1.4324897527694702} -11/07/2021 01:32:26 - INFO - __main__ - Step 30374: {'lr': 0.0004560125087307693, 'samples': 5831808, 'steps': 30373, 'loss/train': 1.8265717029571533} -11/07/2021 01:32:27 - INFO - __main__ - Step 30375: {'lr': 0.00045600950232333495, 'samples': 5832000, 'steps': 30374, 'loss/train': 1.6013633012771606} -11/07/2021 01:32:28 - INFO - __main__ - Step 30376: {'lr': 0.00045600649582307586, 'samples': 5832192, 'steps': 30375, 'loss/train': 1.4706649780273438} -11/07/2021 01:32:28 - INFO - __main__ - Step 30377: {'lr': 0.00045600348922999334, 'samples': 5832384, 'steps': 30376, 'loss/train': 0.897438645362854} -11/07/2021 01:32:28 - INFO - __main__ - Step 30378: {'lr': 0.0004560004825440889, 'samples': 5832576, 'steps': 30377, 'loss/train': 1.6653149127960205} -11/07/2021 01:32:29 - INFO - __main__ - Step 30379: {'lr': 0.0004559974757653639, 'samples': 5832768, 'steps': 30378, 'loss/train': 1.7461222410202026} -11/07/2021 01:32:30 - INFO - __main__ - Step 30380: {'lr': 0.0004559944688938195, 'samples': 5832960, 'steps': 30379, 'loss/train': 1.4538600444793701} -11/07/2021 01:32:30 - INFO - __main__ - Step 30381: {'lr': 0.0004559914619294572, 'samples': 5833152, 'steps': 30380, 'loss/train': 1.8406343460083008} -11/07/2021 01:32:30 - INFO - __main__ - Step 30382: {'lr': 0.00045598845487227835, 'samples': 5833344, 'steps': 30381, 'loss/train': 2.0610239505767822} -11/07/2021 01:32:31 - INFO - __main__ - Step 30383: {'lr': 0.0004559854477222842, 'samples': 5833536, 'steps': 30382, 'loss/train': 1.8445994853973389} -11/07/2021 01:32:31 - INFO - __main__ - Step 30384: {'lr': 0.0004559824404794763, 'samples': 5833728, 'steps': 30383, 'loss/train': 1.59585702419281} -11/07/2021 01:32:32 - INFO - __main__ - Step 30385: {'lr': 0.0004559794331438558, 'samples': 5833920, 'steps': 30384, 'loss/train': 1.5763202905654907} -11/07/2021 01:32:32 - INFO - __main__ - Step 30386: {'lr': 0.0004559764257154242, 'samples': 5834112, 'steps': 30385, 'loss/train': 1.6152302026748657} -11/07/2021 01:32:33 - INFO - __main__ - Step 30387: {'lr': 0.0004559734181941828, 'samples': 5834304, 'steps': 30386, 'loss/train': 2.4096007347106934} -11/07/2021 01:32:33 - INFO - __main__ - Step 30388: {'lr': 0.0004559704105801329, 'samples': 5834496, 'steps': 30387, 'loss/train': 1.8948359489440918} -11/07/2021 01:32:34 - INFO - __main__ - Step 30389: {'lr': 0.00045596740287327597, 'samples': 5834688, 'steps': 30388, 'loss/train': 0.19201065599918365} -11/07/2021 01:32:34 - INFO - __main__ - Step 30390: {'lr': 0.0004559643950736133, 'samples': 5834880, 'steps': 30389, 'loss/train': 1.251489520072937} -11/07/2021 01:32:35 - INFO - __main__ - Step 30391: {'lr': 0.00045596138718114626, 'samples': 5835072, 'steps': 30390, 'loss/train': 1.5772721767425537} -11/07/2021 01:32:35 - INFO - __main__ - Step 30392: {'lr': 0.00045595837919587616, 'samples': 5835264, 'steps': 30391, 'loss/train': 1.3363888263702393} -11/07/2021 01:32:36 - INFO - __main__ - Step 30393: {'lr': 0.0004559553711178044, 'samples': 5835456, 'steps': 30392, 'loss/train': 0.6586275696754456} -11/07/2021 01:32:36 - INFO - __main__ - Step 30394: {'lr': 0.00045595236294693236, 'samples': 5835648, 'steps': 30393, 'loss/train': 1.7032047510147095} -11/07/2021 01:32:36 - INFO - __main__ - Step 30395: {'lr': 0.00045594935468326137, 'samples': 5835840, 'steps': 30394, 'loss/train': 1.174822211265564} -11/07/2021 01:32:37 - INFO - __main__ - Step 30396: {'lr': 0.00045594634632679275, 'samples': 5836032, 'steps': 30395, 'loss/train': 1.8963793516159058} -11/07/2021 01:32:38 - INFO - __main__ - Step 30397: {'lr': 0.0004559433378775278, 'samples': 5836224, 'steps': 30396, 'loss/train': 1.6081353425979614} -11/07/2021 01:32:38 - INFO - __main__ - Step 30398: {'lr': 0.00045594032933546813, 'samples': 5836416, 'steps': 30397, 'loss/train': 1.5449819564819336} -11/07/2021 01:32:38 - INFO - __main__ - Step 30399: {'lr': 0.00045593732070061484, 'samples': 5836608, 'steps': 30398, 'loss/train': 1.6387768983840942} -11/07/2021 01:32:39 - INFO - __main__ - Step 30400: {'lr': 0.00045593431197296934, 'samples': 5836800, 'steps': 30399, 'loss/train': 1.495215654373169} -11/07/2021 01:32:40 - INFO - __main__ - Step 30401: {'lr': 0.00045593130315253305, 'samples': 5836992, 'steps': 30400, 'loss/train': 1.1243253946304321} -11/07/2021 01:32:40 - INFO - __main__ - Step 30402: {'lr': 0.0004559282942393073, 'samples': 5837184, 'steps': 30401, 'loss/train': 2.1499686241149902} -11/07/2021 01:32:41 - INFO - __main__ - Step 30403: {'lr': 0.00045592528523329346, 'samples': 5837376, 'steps': 30402, 'loss/train': 1.4585944414138794} -11/07/2021 01:32:41 - INFO - __main__ - Step 30404: {'lr': 0.0004559222761344928, 'samples': 5837568, 'steps': 30403, 'loss/train': 1.3113209009170532} -11/07/2021 01:32:41 - INFO - __main__ - Step 30405: {'lr': 0.0004559192669429068, 'samples': 5837760, 'steps': 30404, 'loss/train': 1.6635924577713013} -11/07/2021 01:32:42 - INFO - __main__ - Step 30406: {'lr': 0.0004559162576585367, 'samples': 5837952, 'steps': 30405, 'loss/train': 1.4389300346374512} -11/07/2021 01:32:43 - INFO - __main__ - Step 30407: {'lr': 0.00045591324828138396, 'samples': 5838144, 'steps': 30406, 'loss/train': 2.16180157661438} -11/07/2021 01:32:43 - INFO - __main__ - Step 30408: {'lr': 0.0004559102388114499, 'samples': 5838336, 'steps': 30407, 'loss/train': 1.4051746129989624} -11/07/2021 01:32:43 - INFO - __main__ - Step 30409: {'lr': 0.00045590722924873585, 'samples': 5838528, 'steps': 30408, 'loss/train': 1.2232269048690796} -11/07/2021 01:32:44 - INFO - __main__ - Step 30410: {'lr': 0.00045590421959324314, 'samples': 5838720, 'steps': 30409, 'loss/train': 1.7550944089889526} -11/07/2021 01:32:44 - INFO - __main__ - Step 30411: {'lr': 0.0004559012098449732, 'samples': 5838912, 'steps': 30410, 'loss/train': 1.7170732021331787} -11/07/2021 01:32:45 - INFO - __main__ - Step 30412: {'lr': 0.00045589820000392736, 'samples': 5839104, 'steps': 30411, 'loss/train': 1.328830361366272} -11/07/2021 01:32:46 - INFO - __main__ - Step 30413: {'lr': 0.00045589519007010695, 'samples': 5839296, 'steps': 30412, 'loss/train': 1.4785791635513306} -11/07/2021 01:32:46 - INFO - __main__ - Step 30414: {'lr': 0.0004558921800435133, 'samples': 5839488, 'steps': 30413, 'loss/train': 1.152627944946289} -11/07/2021 01:32:46 - INFO - __main__ - Step 30415: {'lr': 0.00045588916992414784, 'samples': 5839680, 'steps': 30414, 'loss/train': 0.5767570734024048} -11/07/2021 01:32:47 - INFO - __main__ - Step 30416: {'lr': 0.0004558861597120119, 'samples': 5839872, 'steps': 30415, 'loss/train': 2.3084864616394043} -11/07/2021 01:32:48 - INFO - __main__ - Step 30417: {'lr': 0.00045588314940710683, 'samples': 5840064, 'steps': 30416, 'loss/train': 1.6227964162826538} -11/07/2021 01:32:48 - INFO - __main__ - Step 30418: {'lr': 0.00045588013900943404, 'samples': 5840256, 'steps': 30417, 'loss/train': 0.9265647530555725} -11/07/2021 01:32:48 - INFO - __main__ - Step 30419: {'lr': 0.0004558771285189948, 'samples': 5840448, 'steps': 30418, 'loss/train': 1.315839171409607} -11/07/2021 01:32:49 - INFO - __main__ - Step 30420: {'lr': 0.00045587411793579047, 'samples': 5840640, 'steps': 30419, 'loss/train': 1.4096364974975586} -11/07/2021 01:32:49 - INFO - __main__ - Step 30421: {'lr': 0.0004558711072598225, 'samples': 5840832, 'steps': 30420, 'loss/train': 1.443522572517395} -11/07/2021 01:32:50 - INFO - __main__ - Step 30422: {'lr': 0.0004558680964910922, 'samples': 5841024, 'steps': 30421, 'loss/train': 1.4016804695129395} -11/07/2021 01:32:50 - INFO - __main__ - Step 30423: {'lr': 0.0004558650856296008, 'samples': 5841216, 'steps': 30422, 'loss/train': 1.8984380960464478} -11/07/2021 01:32:51 - INFO - __main__ - Step 30424: {'lr': 0.0004558620746753499, 'samples': 5841408, 'steps': 30423, 'loss/train': 1.569122076034546} -11/07/2021 01:32:51 - INFO - __main__ - Step 30425: {'lr': 0.00045585906362834063, 'samples': 5841600, 'steps': 30424, 'loss/train': 1.7328251600265503} -11/07/2021 01:32:51 - INFO - __main__ - Step 30426: {'lr': 0.00045585605248857456, 'samples': 5841792, 'steps': 30425, 'loss/train': 1.608799695968628} -11/07/2021 01:32:52 - INFO - __main__ - Step 30427: {'lr': 0.00045585304125605276, 'samples': 5841984, 'steps': 30426, 'loss/train': 1.329828143119812} -11/07/2021 01:32:53 - INFO - __main__ - Step 30428: {'lr': 0.0004558500299307768, 'samples': 5842176, 'steps': 30427, 'loss/train': 1.7235779762268066} -11/07/2021 01:32:53 - INFO - __main__ - Step 30429: {'lr': 0.00045584701851274814, 'samples': 5842368, 'steps': 30428, 'loss/train': 1.8039371967315674} -11/07/2021 01:32:53 - INFO - __main__ - Step 30430: {'lr': 0.0004558440070019678, 'samples': 5842560, 'steps': 30429, 'loss/train': 0.8503919839859009} -11/07/2021 01:32:54 - INFO - __main__ - Step 30431: {'lr': 0.0004558409953984375, 'samples': 5842752, 'steps': 30430, 'loss/train': 1.530393362045288} -11/07/2021 01:32:55 - INFO - __main__ - Step 30432: {'lr': 0.00045583798370215837, 'samples': 5842944, 'steps': 30431, 'loss/train': 0.22017337381839752} -11/07/2021 01:32:55 - INFO - __main__ - Step 30433: {'lr': 0.00045583497191313175, 'samples': 5843136, 'steps': 30432, 'loss/train': 1.5525765419006348} -11/07/2021 01:32:56 - INFO - __main__ - Step 30434: {'lr': 0.00045583196003135906, 'samples': 5843328, 'steps': 30433, 'loss/train': 1.5046756267547607} -11/07/2021 01:32:56 - INFO - __main__ - Step 30435: {'lr': 0.0004558289480568417, 'samples': 5843520, 'steps': 30434, 'loss/train': 1.2534716129302979} -11/07/2021 01:32:56 - INFO - __main__ - Step 30436: {'lr': 0.00045582593598958107, 'samples': 5843712, 'steps': 30435, 'loss/train': 1.0785267353057861} -11/07/2021 01:32:57 - INFO - __main__ - Step 30437: {'lr': 0.00045582292382957836, 'samples': 5843904, 'steps': 30436, 'loss/train': 1.7116634845733643} -11/07/2021 01:32:58 - INFO - __main__ - Step 30438: {'lr': 0.000455819911576835, 'samples': 5844096, 'steps': 30437, 'loss/train': 1.413965106010437} -11/07/2021 01:32:58 - INFO - __main__ - Step 30439: {'lr': 0.00045581689923135247, 'samples': 5844288, 'steps': 30438, 'loss/train': 1.6645784378051758} -11/07/2021 01:32:58 - INFO - __main__ - Step 30440: {'lr': 0.00045581388679313194, 'samples': 5844480, 'steps': 30439, 'loss/train': 1.785849928855896} -11/07/2021 01:32:59 - INFO - __main__ - Step 30441: {'lr': 0.0004558108742621748, 'samples': 5844672, 'steps': 30440, 'loss/train': 0.9725473523139954} -11/07/2021 01:32:59 - INFO - __main__ - Step 30442: {'lr': 0.00045580786163848254, 'samples': 5844864, 'steps': 30441, 'loss/train': 1.6476956605911255} -11/07/2021 01:33:00 - INFO - __main__ - Step 30443: {'lr': 0.00045580484892205643, 'samples': 5845056, 'steps': 30442, 'loss/train': 1.4735348224639893} -11/07/2021 01:33:00 - INFO - __main__ - Step 30444: {'lr': 0.0004558018361128978, 'samples': 5845248, 'steps': 30443, 'loss/train': 1.8190598487854004} -11/07/2021 01:33:01 - INFO - __main__ - Step 30445: {'lr': 0.0004557988232110081, 'samples': 5845440, 'steps': 30444, 'loss/train': 1.864393711090088} -11/07/2021 01:33:01 - INFO - __main__ - Step 30446: {'lr': 0.00045579581021638855, 'samples': 5845632, 'steps': 30445, 'loss/train': 0.5898078083992004} -11/07/2021 01:33:01 - INFO - __main__ - Step 30447: {'lr': 0.00045579279712904057, 'samples': 5845824, 'steps': 30446, 'loss/train': 1.3282579183578491} -11/07/2021 01:33:02 - INFO - __main__ - Step 30448: {'lr': 0.00045578978394896565, 'samples': 5846016, 'steps': 30447, 'loss/train': 1.671467661857605} -11/07/2021 01:33:03 - INFO - __main__ - Step 30449: {'lr': 0.00045578677067616494, 'samples': 5846208, 'steps': 30448, 'loss/train': 1.5926649570465088} -11/07/2021 01:33:03 - INFO - __main__ - Step 30450: {'lr': 0.0004557837573106399, 'samples': 5846400, 'steps': 30449, 'loss/train': 1.6386229991912842} -11/07/2021 01:33:04 - INFO - __main__ - Step 30451: {'lr': 0.0004557807438523919, 'samples': 5846592, 'steps': 30450, 'loss/train': 1.629556655883789} -11/07/2021 01:33:04 - INFO - __main__ - Step 30452: {'lr': 0.00045577773030142224, 'samples': 5846784, 'steps': 30451, 'loss/train': 1.3279333114624023} -11/07/2021 01:33:05 - INFO - __main__ - Step 30453: {'lr': 0.0004557747166577323, 'samples': 5846976, 'steps': 30452, 'loss/train': 1.726426362991333} -11/07/2021 01:33:06 - INFO - __main__ - Step 30454: {'lr': 0.0004557717029213234, 'samples': 5847168, 'steps': 30453, 'loss/train': 1.1271165609359741} -11/07/2021 01:33:06 - INFO - __main__ - Step 30455: {'lr': 0.00045576868909219704, 'samples': 5847360, 'steps': 30454, 'loss/train': 1.4849731922149658} -11/07/2021 01:33:06 - INFO - __main__ - Step 30456: {'lr': 0.0004557656751703544, 'samples': 5847552, 'steps': 30455, 'loss/train': 1.2597217559814453} -11/07/2021 01:33:07 - INFO - __main__ - Step 30457: {'lr': 0.000455762661155797, 'samples': 5847744, 'steps': 30456, 'loss/train': 1.6121560335159302} -11/07/2021 01:33:08 - INFO - __main__ - Step 30458: {'lr': 0.0004557596470485261, 'samples': 5847936, 'steps': 30457, 'loss/train': 1.1347659826278687} -11/07/2021 01:33:08 - INFO - __main__ - Step 30459: {'lr': 0.0004557566328485431, 'samples': 5848128, 'steps': 30458, 'loss/train': 0.9545296430587769} -11/07/2021 01:33:08 - INFO - __main__ - Step 30460: {'lr': 0.00045575361855584927, 'samples': 5848320, 'steps': 30459, 'loss/train': 1.9373095035552979} -11/07/2021 01:33:09 - INFO - __main__ - Step 30461: {'lr': 0.00045575060417044614, 'samples': 5848512, 'steps': 30460, 'loss/train': 1.6543169021606445} -11/07/2021 01:33:09 - INFO - __main__ - Step 30462: {'lr': 0.0004557475896923349, 'samples': 5848704, 'steps': 30461, 'loss/train': 1.2315062284469604} -11/07/2021 01:33:10 - INFO - __main__ - Step 30463: {'lr': 0.0004557445751215169, 'samples': 5848896, 'steps': 30462, 'loss/train': 1.3893226385116577} -11/07/2021 01:33:10 - INFO - __main__ - Step 30464: {'lr': 0.00045574156045799367, 'samples': 5849088, 'steps': 30463, 'loss/train': 1.6300371885299683} -11/07/2021 01:33:11 - INFO - __main__ - Step 30465: {'lr': 0.0004557385457017664, 'samples': 5849280, 'steps': 30464, 'loss/train': 1.397165298461914} -11/07/2021 01:33:11 - INFO - __main__ - Step 30466: {'lr': 0.0004557355308528366, 'samples': 5849472, 'steps': 30465, 'loss/train': 1.7070040702819824} -11/07/2021 01:33:12 - INFO - __main__ - Step 30467: {'lr': 0.00045573251591120545, 'samples': 5849664, 'steps': 30466, 'loss/train': 0.650546133518219} -11/07/2021 01:33:12 - INFO - __main__ - Step 30468: {'lr': 0.00045572950087687447, 'samples': 5849856, 'steps': 30467, 'loss/train': 1.5740357637405396} -11/07/2021 01:33:13 - INFO - __main__ - Step 30469: {'lr': 0.0004557264857498449, 'samples': 5850048, 'steps': 30468, 'loss/train': 1.7624471187591553} -11/07/2021 01:33:13 - INFO - __main__ - Step 30470: {'lr': 0.0004557234705301182, 'samples': 5850240, 'steps': 30469, 'loss/train': 1.3435560464859009} -11/07/2021 01:33:14 - INFO - __main__ - Step 30471: {'lr': 0.0004557204552176957, 'samples': 5850432, 'steps': 30470, 'loss/train': 1.2548309564590454} -11/07/2021 01:33:14 - INFO - __main__ - Step 30472: {'lr': 0.0004557174398125786, 'samples': 5850624, 'steps': 30471, 'loss/train': 1.7051408290863037} -11/07/2021 01:33:14 - INFO - __main__ - Step 30473: {'lr': 0.00045571442431476856, 'samples': 5850816, 'steps': 30472, 'loss/train': 0.7577283382415771} -11/07/2021 01:33:15 - INFO - __main__ - Step 30474: {'lr': 0.0004557114087242667, 'samples': 5851008, 'steps': 30473, 'loss/train': 1.2576820850372314} -11/07/2021 01:33:16 - INFO - __main__ - Step 30475: {'lr': 0.0004557083930410745, 'samples': 5851200, 'steps': 30474, 'loss/train': 1.5838309526443481} -11/07/2021 01:33:16 - INFO - __main__ - Step 30476: {'lr': 0.0004557053772651932, 'samples': 5851392, 'steps': 30475, 'loss/train': 1.0980839729309082} -11/07/2021 01:33:16 - INFO - __main__ - Step 30477: {'lr': 0.00045570236139662426, 'samples': 5851584, 'steps': 30476, 'loss/train': 1.8236390352249146} -11/07/2021 01:33:17 - INFO - __main__ - Step 30478: {'lr': 0.000455699345435369, 'samples': 5851776, 'steps': 30477, 'loss/train': 1.789986252784729} -11/07/2021 01:33:18 - INFO - __main__ - Step 30479: {'lr': 0.0004556963293814288, 'samples': 5851968, 'steps': 30478, 'loss/train': 1.3823659420013428} -11/07/2021 01:33:18 - INFO - __main__ - Step 30480: {'lr': 0.000455693313234805, 'samples': 5852160, 'steps': 30479, 'loss/train': 1.5483280420303345} -11/07/2021 01:33:18 - INFO - __main__ - Step 30481: {'lr': 0.000455690296995499, 'samples': 5852352, 'steps': 30480, 'loss/train': 1.7918452024459839} -11/07/2021 01:33:19 - INFO - __main__ - Step 30482: {'lr': 0.00045568728066351205, 'samples': 5852544, 'steps': 30481, 'loss/train': 1.6299755573272705} -11/07/2021 01:33:19 - INFO - __main__ - Step 30483: {'lr': 0.0004556842642388457, 'samples': 5852736, 'steps': 30482, 'loss/train': 1.5032507181167603} -11/07/2021 01:33:20 - INFO - __main__ - Step 30484: {'lr': 0.0004556812477215011, 'samples': 5852928, 'steps': 30483, 'loss/train': 1.8862870931625366} -11/07/2021 01:33:21 - INFO - __main__ - Step 30485: {'lr': 0.0004556782311114798, 'samples': 5853120, 'steps': 30484, 'loss/train': 1.2660750150680542} -11/07/2021 01:33:21 - INFO - __main__ - Step 30486: {'lr': 0.00045567521440878294, 'samples': 5853312, 'steps': 30485, 'loss/train': 1.1814024448394775} -11/07/2021 01:33:22 - INFO - __main__ - Step 30487: {'lr': 0.000455672197613412, 'samples': 5853504, 'steps': 30486, 'loss/train': 1.257530689239502} -11/07/2021 01:33:22 - INFO - __main__ - Step 30488: {'lr': 0.00045566918072536844, 'samples': 5853696, 'steps': 30487, 'loss/train': 1.7170592546463013} -11/07/2021 01:33:23 - INFO - __main__ - Step 30489: {'lr': 0.00045566616374465355, 'samples': 5853888, 'steps': 30488, 'loss/train': 1.4508795738220215} -11/07/2021 01:33:24 - INFO - __main__ - Step 30490: {'lr': 0.0004556631466712686, 'samples': 5854080, 'steps': 30489, 'loss/train': 1.3915959596633911} -11/07/2021 01:33:24 - INFO - __main__ - Step 30491: {'lr': 0.00045566012950521497, 'samples': 5854272, 'steps': 30490, 'loss/train': 1.7133105993270874} -11/07/2021 01:33:24 - INFO - __main__ - Step 30492: {'lr': 0.0004556571122464941, 'samples': 5854464, 'steps': 30491, 'loss/train': 0.9542956948280334} -11/07/2021 01:33:25 - INFO - __main__ - Step 30493: {'lr': 0.0004556540948951073, 'samples': 5854656, 'steps': 30492, 'loss/train': 1.3986448049545288} -11/07/2021 01:33:25 - INFO - __main__ - Step 30494: {'lr': 0.00045565107745105594, 'samples': 5854848, 'steps': 30493, 'loss/train': 1.6358494758605957} -11/07/2021 01:33:26 - INFO - __main__ - Step 30495: {'lr': 0.00045564805991434135, 'samples': 5855040, 'steps': 30494, 'loss/train': 1.6779626607894897} -11/07/2021 01:33:26 - INFO - __main__ - Step 30496: {'lr': 0.00045564504228496494, 'samples': 5855232, 'steps': 30495, 'loss/train': 1.607884168624878} -11/07/2021 01:33:27 - INFO - __main__ - Step 30497: {'lr': 0.0004556420245629281, 'samples': 5855424, 'steps': 30496, 'loss/train': 1.7303855419158936} -11/07/2021 01:33:27 - INFO - __main__ - Step 30498: {'lr': 0.00045563900674823205, 'samples': 5855616, 'steps': 30497, 'loss/train': 1.3164902925491333} -11/07/2021 01:33:27 - INFO - __main__ - Step 30499: {'lr': 0.0004556359888408783, 'samples': 5855808, 'steps': 30498, 'loss/train': 1.3503849506378174} -11/07/2021 01:33:28 - INFO - __main__ - Step 30500: {'lr': 0.00045563297084086807, 'samples': 5856000, 'steps': 30499, 'loss/train': 1.9133379459381104} -11/07/2021 01:33:29 - INFO - __main__ - Step 30501: {'lr': 0.00045562995274820285, 'samples': 5856192, 'steps': 30500, 'loss/train': 1.8207396268844604} -11/07/2021 01:33:29 - INFO - __main__ - Step 30502: {'lr': 0.00045562693456288394, 'samples': 5856384, 'steps': 30501, 'loss/train': 1.9690886735916138} -11/07/2021 01:33:29 - INFO - __main__ - Step 30503: {'lr': 0.00045562391628491274, 'samples': 5856576, 'steps': 30502, 'loss/train': 1.3326011896133423} -11/07/2021 01:33:30 - INFO - __main__ - Step 30504: {'lr': 0.00045562089791429056, 'samples': 5856768, 'steps': 30503, 'loss/train': 1.9938852787017822} -11/07/2021 01:33:31 - INFO - __main__ - Step 30505: {'lr': 0.00045561787945101875, 'samples': 5856960, 'steps': 30504, 'loss/train': 1.5999820232391357} -11/07/2021 01:33:32 - INFO - __main__ - Step 30506: {'lr': 0.0004556148608950987, 'samples': 5857152, 'steps': 30505, 'loss/train': 1.660935401916504} -11/07/2021 01:33:32 - INFO - __main__ - Step 30507: {'lr': 0.0004556118422465319, 'samples': 5857344, 'steps': 30506, 'loss/train': 1.7182539701461792} -11/07/2021 01:33:32 - INFO - __main__ - Step 30508: {'lr': 0.00045560882350531936, 'samples': 5857536, 'steps': 30507, 'loss/train': 3.5188839435577393} -11/07/2021 01:33:33 - INFO - __main__ - Step 30509: {'lr': 0.00045560580467146275, 'samples': 5857728, 'steps': 30508, 'loss/train': 1.6736948490142822} -11/07/2021 01:33:33 - INFO - __main__ - Step 30510: {'lr': 0.00045560278574496334, 'samples': 5857920, 'steps': 30509, 'loss/train': 1.7277591228485107} -11/07/2021 01:33:34 - INFO - __main__ - Step 30511: {'lr': 0.0004555997667258225, 'samples': 5858112, 'steps': 30510, 'loss/train': 1.3974577188491821} -11/07/2021 01:33:34 - INFO - __main__ - Step 30512: {'lr': 0.0004555967476140416, 'samples': 5858304, 'steps': 30511, 'loss/train': 1.6479278802871704} -11/07/2021 01:33:35 - INFO - __main__ - Step 30513: {'lr': 0.00045559372840962186, 'samples': 5858496, 'steps': 30512, 'loss/train': 1.2236391305923462} -11/07/2021 01:33:35 - INFO - __main__ - Step 30514: {'lr': 0.00045559070911256486, 'samples': 5858688, 'steps': 30513, 'loss/train': 1.4619766473770142} -11/07/2021 01:33:35 - INFO - __main__ - Step 30515: {'lr': 0.00045558768972287183, 'samples': 5858880, 'steps': 30514, 'loss/train': 1.701179027557373} -11/07/2021 01:33:36 - INFO - __main__ - Step 30516: {'lr': 0.0004555846702405442, 'samples': 5859072, 'steps': 30515, 'loss/train': 1.1603152751922607} -11/07/2021 01:33:37 - INFO - __main__ - Step 30517: {'lr': 0.0004555816506655832, 'samples': 5859264, 'steps': 30516, 'loss/train': 1.6459802389144897} -11/07/2021 01:33:37 - INFO - __main__ - Step 30518: {'lr': 0.00045557863099799034, 'samples': 5859456, 'steps': 30517, 'loss/train': 1.5410176515579224} -11/07/2021 01:33:38 - INFO - __main__ - Step 30519: {'lr': 0.000455575611237767, 'samples': 5859648, 'steps': 30518, 'loss/train': 2.3247158527374268} -11/07/2021 01:33:38 - INFO - __main__ - Step 30520: {'lr': 0.00045557259138491435, 'samples': 5859840, 'steps': 30519, 'loss/train': 1.3978822231292725} -11/07/2021 01:33:38 - INFO - __main__ - Step 30521: {'lr': 0.0004555695714394339, 'samples': 5860032, 'steps': 30520, 'loss/train': 1.592763066291809} -11/07/2021 01:33:39 - INFO - __main__ - Step 30522: {'lr': 0.00045556655140132696, 'samples': 5860224, 'steps': 30521, 'loss/train': 1.1270097494125366} -11/07/2021 01:33:40 - INFO - __main__ - Step 30523: {'lr': 0.00045556353127059493, 'samples': 5860416, 'steps': 30522, 'loss/train': 1.5414197444915771} -11/07/2021 01:33:40 - INFO - __main__ - Step 30524: {'lr': 0.0004555605110472391, 'samples': 5860608, 'steps': 30523, 'loss/train': 0.3523915410041809} -11/07/2021 01:33:40 - INFO - __main__ - Step 30525: {'lr': 0.0004555574907312609, 'samples': 5860800, 'steps': 30524, 'loss/train': 1.533868670463562} -11/07/2021 01:33:41 - INFO - __main__ - Step 30526: {'lr': 0.00045555447032266167, 'samples': 5860992, 'steps': 30525, 'loss/train': 1.9231667518615723} -11/07/2021 01:33:42 - INFO - __main__ - Step 30527: {'lr': 0.0004555514498214428, 'samples': 5861184, 'steps': 30526, 'loss/train': 0.2879134714603424} -11/07/2021 01:33:42 - INFO - __main__ - Step 30528: {'lr': 0.0004555484292276055, 'samples': 5861376, 'steps': 30527, 'loss/train': 1.9613897800445557} -11/07/2021 01:33:42 - INFO - __main__ - Step 30529: {'lr': 0.0004555454085411514, 'samples': 5861568, 'steps': 30528, 'loss/train': 1.6907329559326172} -11/07/2021 01:33:43 - INFO - __main__ - Step 30530: {'lr': 0.0004555423877620817, 'samples': 5861760, 'steps': 30529, 'loss/train': 1.6974469423294067} -11/07/2021 01:33:43 - INFO - __main__ - Step 30531: {'lr': 0.00045553936689039765, 'samples': 5861952, 'steps': 30530, 'loss/train': 1.763445258140564} -11/07/2021 01:33:44 - INFO - __main__ - Step 30532: {'lr': 0.00045553634592610084, 'samples': 5862144, 'steps': 30531, 'loss/train': 1.4664535522460938} -11/07/2021 01:33:45 - INFO - __main__ - Step 30533: {'lr': 0.00045553332486919246, 'samples': 5862336, 'steps': 30532, 'loss/train': 1.4843565225601196} -11/07/2021 01:33:45 - INFO - __main__ - Step 30534: {'lr': 0.000455530303719674, 'samples': 5862528, 'steps': 30533, 'loss/train': 1.5967292785644531} -11/07/2021 01:33:45 - INFO - __main__ - Step 30535: {'lr': 0.00045552728247754673, 'samples': 5862720, 'steps': 30534, 'loss/train': 1.8246897459030151} -11/07/2021 01:33:46 - INFO - __main__ - Step 30536: {'lr': 0.000455524261142812, 'samples': 5862912, 'steps': 30535, 'loss/train': 5.765089988708496} -11/07/2021 01:33:46 - INFO - __main__ - Step 30537: {'lr': 0.00045552123971547123, 'samples': 5863104, 'steps': 30536, 'loss/train': 0.8816110491752625} -11/07/2021 01:33:47 - INFO - __main__ - Step 30538: {'lr': 0.00045551821819552575, 'samples': 5863296, 'steps': 30537, 'loss/train': 1.4403982162475586} -11/07/2021 01:33:47 - INFO - __main__ - Step 30539: {'lr': 0.0004555151965829769, 'samples': 5863488, 'steps': 30538, 'loss/train': 1.8970357179641724} -11/07/2021 01:33:48 - INFO - __main__ - Step 30540: {'lr': 0.0004555121748778261, 'samples': 5863680, 'steps': 30539, 'loss/train': 1.0221960544586182} -11/07/2021 01:33:48 - INFO - __main__ - Step 30541: {'lr': 0.0004555091530800748, 'samples': 5863872, 'steps': 30540, 'loss/train': 1.4456019401550293} -11/07/2021 01:33:49 - INFO - __main__ - Step 30542: {'lr': 0.0004555061311897241, 'samples': 5864064, 'steps': 30541, 'loss/train': 1.6158738136291504} -11/07/2021 01:33:50 - INFO - __main__ - Step 30543: {'lr': 0.0004555031092067756, 'samples': 5864256, 'steps': 30542, 'loss/train': 2.1358749866485596} -11/07/2021 01:33:50 - INFO - __main__ - Step 30544: {'lr': 0.00045550008713123047, 'samples': 5864448, 'steps': 30543, 'loss/train': 1.3832736015319824} -11/07/2021 01:33:50 - INFO - __main__ - Step 30545: {'lr': 0.00045549706496309027, 'samples': 5864640, 'steps': 30544, 'loss/train': 1.976824164390564} -11/07/2021 01:33:51 - INFO - __main__ - Step 30546: {'lr': 0.0004554940427023562, 'samples': 5864832, 'steps': 30545, 'loss/train': 1.4866725206375122} -11/07/2021 01:33:51 - INFO - __main__ - Step 30547: {'lr': 0.00045549102034902973, 'samples': 5865024, 'steps': 30546, 'loss/train': 1.2114545106887817} -11/07/2021 01:33:53 - INFO - __main__ - Step 30548: {'lr': 0.0004554879979031121, 'samples': 5865216, 'steps': 30547, 'loss/train': 1.4681395292282104} -11/07/2021 01:33:53 - INFO - __main__ - Step 30549: {'lr': 0.00045548497536460487, 'samples': 5865408, 'steps': 30548, 'loss/train': 1.0890514850616455} -11/07/2021 01:33:54 - INFO - __main__ - Step 30550: {'lr': 0.00045548195273350926, 'samples': 5865600, 'steps': 30549, 'loss/train': 1.9650791883468628} -11/07/2021 01:33:54 - INFO - __main__ - Step 30551: {'lr': 0.0004554789300098265, 'samples': 5865792, 'steps': 30550, 'loss/train': 1.7189000844955444} -11/07/2021 01:33:54 - INFO - __main__ - Step 30552: {'lr': 0.00045547590719355823, 'samples': 5865984, 'steps': 30551, 'loss/train': 1.40700364112854} -11/07/2021 01:33:55 - INFO - __main__ - Step 30553: {'lr': 0.00045547288428470574, 'samples': 5866176, 'steps': 30552, 'loss/train': 1.4973241090774536} -11/07/2021 01:33:55 - INFO - __main__ - Step 30554: {'lr': 0.0004554698612832703, 'samples': 5866368, 'steps': 30553, 'loss/train': 2.791121482849121} -11/07/2021 01:33:55 - INFO - __main__ - Step 30555: {'lr': 0.00045546683818925327, 'samples': 5866560, 'steps': 30554, 'loss/train': 2.858717918395996} -11/07/2021 01:33:56 - INFO - __main__ - Step 30556: {'lr': 0.000455463815002656, 'samples': 5866752, 'steps': 30555, 'loss/train': 2.730980634689331} -11/07/2021 01:33:57 - INFO - __main__ - Step 30557: {'lr': 0.00045546079172348, 'samples': 5866944, 'steps': 30556, 'loss/train': 1.6503729820251465} -11/07/2021 01:33:57 - INFO - __main__ - Step 30558: {'lr': 0.00045545776835172647, 'samples': 5867136, 'steps': 30557, 'loss/train': 1.6318061351776123} -11/07/2021 01:33:57 - INFO - __main__ - Step 30559: {'lr': 0.00045545474488739693, 'samples': 5867328, 'steps': 30558, 'loss/train': 1.0276840925216675} -11/07/2021 01:33:58 - INFO - __main__ - Step 30560: {'lr': 0.0004554517213304926, 'samples': 5867520, 'steps': 30559, 'loss/train': 1.5448262691497803} -11/07/2021 01:33:59 - INFO - __main__ - Step 30561: {'lr': 0.00045544869768101486, 'samples': 5867712, 'steps': 30560, 'loss/train': 1.3254529237747192} -11/07/2021 01:33:59 - INFO - __main__ - Step 30562: {'lr': 0.0004554456739389652, 'samples': 5867904, 'steps': 30561, 'loss/train': 2.473137855529785} -11/07/2021 01:34:00 - INFO - __main__ - Step 30563: {'lr': 0.00045544265010434484, 'samples': 5868096, 'steps': 30562, 'loss/train': 1.485152244567871} -11/07/2021 01:34:00 - INFO - __main__ - Step 30564: {'lr': 0.0004554396261771552, 'samples': 5868288, 'steps': 30563, 'loss/train': 1.870257019996643} -11/07/2021 01:34:00 - INFO - __main__ - Step 30565: {'lr': 0.00045543660215739755, 'samples': 5868480, 'steps': 30564, 'loss/train': 1.6671714782714844} -11/07/2021 01:34:02 - INFO - __main__ - Step 30566: {'lr': 0.00045543357804507344, 'samples': 5868672, 'steps': 30565, 'loss/train': 1.806578516960144} -11/07/2021 01:34:02 - INFO - __main__ - Step 30567: {'lr': 0.00045543055384018405, 'samples': 5868864, 'steps': 30566, 'loss/train': 1.5219746828079224} -11/07/2021 01:34:02 - INFO - __main__ - Step 30568: {'lr': 0.0004554275295427309, 'samples': 5869056, 'steps': 30567, 'loss/train': 1.6241127252578735} -11/07/2021 01:34:03 - INFO - __main__ - Step 30569: {'lr': 0.0004554245051527153, 'samples': 5869248, 'steps': 30568, 'loss/train': 4.016051292419434} -11/07/2021 01:34:03 - INFO - __main__ - Step 30570: {'lr': 0.0004554214806701384, 'samples': 5869440, 'steps': 30569, 'loss/train': 1.164947748184204} -11/07/2021 01:34:05 - INFO - __main__ - Step 30571: {'lr': 0.000455418456095002, 'samples': 5869632, 'steps': 30570, 'loss/train': 0.8092489838600159} -11/07/2021 01:34:05 - INFO - __main__ - Step 30572: {'lr': 0.000455415431427307, 'samples': 5869824, 'steps': 30571, 'loss/train': 1.6690469980239868} -11/07/2021 01:34:06 - INFO - __main__ - Step 30573: {'lr': 0.00045541240666705516, 'samples': 5870016, 'steps': 30572, 'loss/train': 2.228196144104004} -11/07/2021 01:34:06 - INFO - __main__ - Step 30574: {'lr': 0.0004554093818142475, 'samples': 5870208, 'steps': 30573, 'loss/train': 1.8303005695343018} -11/07/2021 01:34:06 - INFO - __main__ - Step 30575: {'lr': 0.0004554063568688857, 'samples': 5870400, 'steps': 30574, 'loss/train': 1.8389360904693604} -11/07/2021 01:34:07 - INFO - __main__ - Step 30576: {'lr': 0.0004554033318309708, 'samples': 5870592, 'steps': 30575, 'loss/train': 1.5906447172164917} -11/07/2021 01:34:07 - INFO - __main__ - Step 30577: {'lr': 0.00045540030670050447, 'samples': 5870784, 'steps': 30576, 'loss/train': 1.800966739654541} -11/07/2021 01:34:08 - INFO - __main__ - Step 30578: {'lr': 0.0004553972814774878, 'samples': 5870976, 'steps': 30577, 'loss/train': 1.8366080522537231} -11/07/2021 01:34:08 - INFO - __main__ - Step 30579: {'lr': 0.00045539425616192243, 'samples': 5871168, 'steps': 30578, 'loss/train': 1.4894955158233643} -11/07/2021 01:34:09 - INFO - __main__ - Step 30580: {'lr': 0.0004553912307538095, 'samples': 5871360, 'steps': 30579, 'loss/train': 1.6211987733840942} -11/07/2021 01:34:09 - INFO - __main__ - Step 30581: {'lr': 0.0004553882052531504, 'samples': 5871552, 'steps': 30580, 'loss/train': 1.6969722509384155} -11/07/2021 01:34:10 - INFO - __main__ - Step 30582: {'lr': 0.00045538517965994663, 'samples': 5871744, 'steps': 30581, 'loss/train': 1.7053320407867432} -11/07/2021 01:34:10 - INFO - __main__ - Step 30583: {'lr': 0.0004553821539741994, 'samples': 5871936, 'steps': 30582, 'loss/train': 1.3603167533874512} -11/07/2021 01:34:11 - INFO - __main__ - Step 30584: {'lr': 0.0004553791281959102, 'samples': 5872128, 'steps': 30583, 'loss/train': 1.4426591396331787} -11/07/2021 01:34:12 - INFO - __main__ - Step 30585: {'lr': 0.00045537610232508033, 'samples': 5872320, 'steps': 30584, 'loss/train': 1.5270507335662842} -11/07/2021 01:34:12 - INFO - __main__ - Step 30586: {'lr': 0.0004553730763617111, 'samples': 5872512, 'steps': 30585, 'loss/train': 1.8075188398361206} -11/07/2021 01:34:12 - INFO - __main__ - Step 30587: {'lr': 0.000455370050305804, 'samples': 5872704, 'steps': 30586, 'loss/train': 1.578984022140503} -11/07/2021 01:34:13 - INFO - __main__ - Step 30588: {'lr': 0.0004553670241573603, 'samples': 5872896, 'steps': 30587, 'loss/train': 1.416538119316101} -11/07/2021 01:34:13 - INFO - __main__ - Step 30589: {'lr': 0.00045536399791638133, 'samples': 5873088, 'steps': 30588, 'loss/train': 2.0954222679138184} -11/07/2021 01:34:14 - INFO - __main__ - Step 30590: {'lr': 0.0004553609715828686, 'samples': 5873280, 'steps': 30589, 'loss/train': 1.8816574811935425} -11/07/2021 01:34:14 - INFO - __main__ - Step 30591: {'lr': 0.00045535794515682334, 'samples': 5873472, 'steps': 30590, 'loss/train': 1.5985524654388428} -11/07/2021 01:34:15 - INFO - __main__ - Step 30592: {'lr': 0.00045535491863824695, 'samples': 5873664, 'steps': 30591, 'loss/train': 1.902991771697998} -11/07/2021 01:34:15 - INFO - __main__ - Step 30593: {'lr': 0.0004553518920271408, 'samples': 5873856, 'steps': 30592, 'loss/train': 1.2298734188079834} -11/07/2021 01:34:15 - INFO - __main__ - Step 30594: {'lr': 0.00045534886532350627, 'samples': 5874048, 'steps': 30593, 'loss/train': 1.693086862564087} -11/07/2021 01:34:16 - INFO - __main__ - Step 30595: {'lr': 0.00045534583852734474, 'samples': 5874240, 'steps': 30594, 'loss/train': 1.6848118305206299} -11/07/2021 01:34:17 - INFO - __main__ - Step 30596: {'lr': 0.00045534281163865756, 'samples': 5874432, 'steps': 30595, 'loss/train': 2.0250253677368164} -11/07/2021 01:34:17 - INFO - __main__ - Step 30597: {'lr': 0.000455339784657446, 'samples': 5874624, 'steps': 30596, 'loss/train': 1.2345815896987915} -11/07/2021 01:34:17 - INFO - __main__ - Step 30598: {'lr': 0.0004553367575837115, 'samples': 5874816, 'steps': 30597, 'loss/train': 1.6201162338256836} -11/07/2021 01:34:18 - INFO - __main__ - Step 30599: {'lr': 0.00045533373041745545, 'samples': 5875008, 'steps': 30598, 'loss/train': 1.4778693914413452} -11/07/2021 01:34:19 - INFO - __main__ - Step 30600: {'lr': 0.00045533070315867917, 'samples': 5875200, 'steps': 30599, 'loss/train': 1.1637945175170898} -11/07/2021 01:34:19 - INFO - __main__ - Step 30601: {'lr': 0.0004553276758073841, 'samples': 5875392, 'steps': 30600, 'loss/train': 0.970828115940094} -11/07/2021 01:34:20 - INFO - __main__ - Step 30602: {'lr': 0.00045532464836357155, 'samples': 5875584, 'steps': 30601, 'loss/train': 1.6925225257873535} -11/07/2021 01:34:20 - INFO - __main__ - Step 30603: {'lr': 0.0004553216208272428, 'samples': 5875776, 'steps': 30602, 'loss/train': 1.729225993156433} -11/07/2021 01:34:20 - INFO - __main__ - Step 30604: {'lr': 0.0004553185931983994, 'samples': 5875968, 'steps': 30603, 'loss/train': 1.6972366571426392} -11/07/2021 01:34:21 - INFO - __main__ - Step 30605: {'lr': 0.00045531556547704255, 'samples': 5876160, 'steps': 30604, 'loss/train': 1.6841012239456177} -11/07/2021 01:34:22 - INFO - __main__ - Step 30606: {'lr': 0.00045531253766317373, 'samples': 5876352, 'steps': 30605, 'loss/train': 1.5396567583084106} -11/07/2021 01:34:22 - INFO - __main__ - Step 30607: {'lr': 0.0004553095097567942, 'samples': 5876544, 'steps': 30606, 'loss/train': 1.3511580228805542} -11/07/2021 01:34:22 - INFO - __main__ - Step 30608: {'lr': 0.0004553064817579053, 'samples': 5876736, 'steps': 30607, 'loss/train': 1.6638671159744263} -11/07/2021 01:34:23 - INFO - __main__ - Step 30609: {'lr': 0.0004553034536665086, 'samples': 5876928, 'steps': 30608, 'loss/train': 1.478841781616211} -11/07/2021 01:34:24 - INFO - __main__ - Step 30610: {'lr': 0.0004553004254826053, 'samples': 5877120, 'steps': 30609, 'loss/train': 1.5827250480651855} -11/07/2021 01:34:24 - INFO - __main__ - Step 30611: {'lr': 0.0004552973972061967, 'samples': 5877312, 'steps': 30610, 'loss/train': 2.2319352626800537} -11/07/2021 01:34:24 - INFO - __main__ - Step 30612: {'lr': 0.00045529436883728436, 'samples': 5877504, 'steps': 30611, 'loss/train': 1.6994431018829346} -11/07/2021 01:34:25 - INFO - __main__ - Step 30613: {'lr': 0.0004552913403758695, 'samples': 5877696, 'steps': 30612, 'loss/train': 1.6245088577270508} -11/07/2021 01:34:25 - INFO - __main__ - Step 30614: {'lr': 0.00045528831182195355, 'samples': 5877888, 'steps': 30613, 'loss/train': 1.5530428886413574} -11/07/2021 01:34:26 - INFO - __main__ - Step 30615: {'lr': 0.00045528528317553786, 'samples': 5878080, 'steps': 30614, 'loss/train': 1.5801184177398682} -11/07/2021 01:34:27 - INFO - __main__ - Step 30616: {'lr': 0.0004552822544366238, 'samples': 5878272, 'steps': 30615, 'loss/train': 1.069941759109497} -11/07/2021 01:34:27 - INFO - __main__ - Step 30617: {'lr': 0.00045527922560521274, 'samples': 5878464, 'steps': 30616, 'loss/train': 1.248826265335083} -11/07/2021 01:34:27 - INFO - __main__ - Step 30618: {'lr': 0.0004552761966813059, 'samples': 5878656, 'steps': 30617, 'loss/train': 1.8219928741455078} -11/07/2021 01:34:28 - INFO - __main__ - Step 30619: {'lr': 0.00045527316766490487, 'samples': 5878848, 'steps': 30618, 'loss/train': 1.383254051208496} -11/07/2021 01:34:28 - INFO - __main__ - Step 30620: {'lr': 0.000455270138556011, 'samples': 5879040, 'steps': 30619, 'loss/train': 1.7578457593917847} -11/07/2021 01:34:29 - INFO - __main__ - Step 30621: {'lr': 0.00045526710935462543, 'samples': 5879232, 'steps': 30620, 'loss/train': 1.6432160139083862} -11/07/2021 01:34:29 - INFO - __main__ - Step 30622: {'lr': 0.00045526408006074973, 'samples': 5879424, 'steps': 30621, 'loss/train': 1.3899623155593872} -11/07/2021 01:34:30 - INFO - __main__ - Step 30623: {'lr': 0.00045526105067438525, 'samples': 5879616, 'steps': 30622, 'loss/train': 1.098164439201355} -11/07/2021 01:34:30 - INFO - __main__ - Step 30624: {'lr': 0.00045525802119553323, 'samples': 5879808, 'steps': 30623, 'loss/train': 1.6256321668624878} -11/07/2021 01:34:30 - INFO - __main__ - Step 30625: {'lr': 0.0004552549916241951, 'samples': 5880000, 'steps': 30624, 'loss/train': 1.5688073635101318} -11/07/2021 01:34:32 - INFO - __main__ - Step 30626: {'lr': 0.0004552519619603723, 'samples': 5880192, 'steps': 30625, 'loss/train': 0.8748301863670349} -11/07/2021 01:34:32 - INFO - __main__ - Step 30627: {'lr': 0.00045524893220406617, 'samples': 5880384, 'steps': 30626, 'loss/train': 1.403340220451355} -11/07/2021 01:34:32 - INFO - __main__ - Step 30628: {'lr': 0.00045524590235527796, 'samples': 5880576, 'steps': 30627, 'loss/train': 1.6631159782409668} -11/07/2021 01:34:33 - INFO - __main__ - Step 30629: {'lr': 0.0004552428724140091, 'samples': 5880768, 'steps': 30628, 'loss/train': 0.9583744406700134} -11/07/2021 01:34:33 - INFO - __main__ - Step 30630: {'lr': 0.000455239842380261, 'samples': 5880960, 'steps': 30629, 'loss/train': 0.6214451789855957} -11/07/2021 01:34:35 - INFO - __main__ - Step 30631: {'lr': 0.000455236812254035, 'samples': 5881152, 'steps': 30630, 'loss/train': 1.3606207370758057} -11/07/2021 01:34:36 - INFO - __main__ - Step 30632: {'lr': 0.0004552337820353325, 'samples': 5881344, 'steps': 30631, 'loss/train': 1.9707520008087158} -11/07/2021 01:34:36 - INFO - __main__ - Step 30633: {'lr': 0.00045523075172415476, 'samples': 5881536, 'steps': 30632, 'loss/train': 1.6842832565307617} -11/07/2021 01:34:36 - INFO - __main__ - Step 30634: {'lr': 0.0004552277213205032, 'samples': 5881728, 'steps': 30633, 'loss/train': 1.5775192975997925} -11/07/2021 01:34:37 - INFO - __main__ - Step 30635: {'lr': 0.0004552246908243792, 'samples': 5881920, 'steps': 30634, 'loss/train': 1.81877601146698} -11/07/2021 01:34:37 - INFO - __main__ - Step 30636: {'lr': 0.00045522166023578413, 'samples': 5882112, 'steps': 30635, 'loss/train': 1.7876152992248535} -11/07/2021 01:34:37 - INFO - __main__ - Step 30637: {'lr': 0.0004552186295547194, 'samples': 5882304, 'steps': 30636, 'loss/train': 1.7799782752990723} -11/07/2021 01:34:38 - INFO - __main__ - Step 30638: {'lr': 0.0004552155987811863, 'samples': 5882496, 'steps': 30637, 'loss/train': 1.8900376558303833} -11/07/2021 01:34:39 - INFO - __main__ - Step 30639: {'lr': 0.00045521256791518616, 'samples': 5882688, 'steps': 30638, 'loss/train': 1.7110861539840698} -11/07/2021 01:34:39 - INFO - __main__ - Step 30640: {'lr': 0.0004552095369567205, 'samples': 5882880, 'steps': 30639, 'loss/train': 1.56343674659729} -11/07/2021 01:34:39 - INFO - __main__ - Step 30641: {'lr': 0.00045520650590579056, 'samples': 5883072, 'steps': 30640, 'loss/train': 1.666163444519043} -11/07/2021 01:34:40 - INFO - __main__ - Step 30642: {'lr': 0.00045520347476239763, 'samples': 5883264, 'steps': 30641, 'loss/train': 1.7846308946609497} -11/07/2021 01:34:40 - INFO - __main__ - Step 30643: {'lr': 0.00045520044352654335, 'samples': 5883456, 'steps': 30642, 'loss/train': 1.5713022947311401} -11/07/2021 01:34:41 - INFO - __main__ - Step 30644: {'lr': 0.0004551974121982288, 'samples': 5883648, 'steps': 30643, 'loss/train': 1.5387201309204102} -11/07/2021 01:34:42 - INFO - __main__ - Step 30645: {'lr': 0.00045519438077745543, 'samples': 5883840, 'steps': 30644, 'loss/train': 1.3501056432724} -11/07/2021 01:34:42 - INFO - __main__ - Step 30646: {'lr': 0.0004551913492642248, 'samples': 5884032, 'steps': 30645, 'loss/train': 1.4950666427612305} -11/07/2021 01:34:42 - INFO - __main__ - Step 30647: {'lr': 0.00045518831765853796, 'samples': 5884224, 'steps': 30646, 'loss/train': 1.1170263290405273} -11/07/2021 01:34:43 - INFO - __main__ - Step 30648: {'lr': 0.0004551852859603965, 'samples': 5884416, 'steps': 30647, 'loss/train': 1.549283742904663} -11/07/2021 01:34:43 - INFO - __main__ - Step 30649: {'lr': 0.0004551822541698017, 'samples': 5884608, 'steps': 30648, 'loss/train': 1.6494215726852417} -11/07/2021 01:34:44 - INFO - __main__ - Step 30650: {'lr': 0.0004551792222867549, 'samples': 5884800, 'steps': 30649, 'loss/train': 1.7705411911010742} -11/07/2021 01:34:44 - INFO - __main__ - Step 30651: {'lr': 0.0004551761903112576, 'samples': 5884992, 'steps': 30650, 'loss/train': 1.90091073513031} -11/07/2021 01:34:45 - INFO - __main__ - Step 30652: {'lr': 0.000455173158243311, 'samples': 5885184, 'steps': 30651, 'loss/train': 1.9132969379425049} -11/07/2021 01:34:45 - INFO - __main__ - Step 30653: {'lr': 0.0004551701260829166, 'samples': 5885376, 'steps': 30652, 'loss/train': 1.7156943082809448} -11/07/2021 01:34:46 - INFO - __main__ - Step 30654: {'lr': 0.00045516709383007563, 'samples': 5885568, 'steps': 30653, 'loss/train': 1.2612545490264893} -11/07/2021 01:34:46 - INFO - __main__ - Step 30655: {'lr': 0.0004551640614847896, 'samples': 5885760, 'steps': 30654, 'loss/train': 0.7886247038841248} -11/07/2021 01:34:47 - INFO - __main__ - Step 30656: {'lr': 0.00045516102904705983, 'samples': 5885952, 'steps': 30655, 'loss/train': 1.3656479120254517} -11/07/2021 01:34:47 - INFO - __main__ - Step 30657: {'lr': 0.0004551579965168876, 'samples': 5886144, 'steps': 30656, 'loss/train': 1.431735634803772} -11/07/2021 01:34:47 - INFO - __main__ - Step 30658: {'lr': 0.00045515496389427433, 'samples': 5886336, 'steps': 30657, 'loss/train': 1.4148099422454834} -11/07/2021 01:34:49 - INFO - __main__ - Step 30659: {'lr': 0.0004551519311792215, 'samples': 5886528, 'steps': 30658, 'loss/train': 1.6572784185409546} -11/07/2021 01:34:49 - INFO - __main__ - Step 30660: {'lr': 0.00045514889837173025, 'samples': 5886720, 'steps': 30659, 'loss/train': 1.0424095392227173} -11/07/2021 01:34:49 - INFO - __main__ - Step 30661: {'lr': 0.00045514586547180214, 'samples': 5886912, 'steps': 30660, 'loss/train': 1.1317081451416016} -11/07/2021 01:34:50 - INFO - __main__ - Step 30662: {'lr': 0.0004551428324794385, 'samples': 5887104, 'steps': 30661, 'loss/train': 1.580672025680542} -11/07/2021 01:34:50 - INFO - __main__ - Step 30663: {'lr': 0.00045513979939464056, 'samples': 5887296, 'steps': 30662, 'loss/train': 1.5205079317092896} -11/07/2021 01:34:51 - INFO - __main__ - Step 30664: {'lr': 0.0004551367662174099, 'samples': 5887488, 'steps': 30663, 'loss/train': 1.219908595085144} -11/07/2021 01:34:52 - INFO - __main__ - Step 30665: {'lr': 0.0004551337329477477, 'samples': 5887680, 'steps': 30664, 'loss/train': 1.2398808002471924} -11/07/2021 01:34:52 - INFO - __main__ - Step 30666: {'lr': 0.00045513069958565545, 'samples': 5887872, 'steps': 30665, 'loss/train': 1.4924900531768799} -11/07/2021 01:34:52 - INFO - __main__ - Step 30667: {'lr': 0.00045512766613113457, 'samples': 5888064, 'steps': 30666, 'loss/train': 1.8135350942611694} -11/07/2021 01:34:53 - INFO - __main__ - Step 30668: {'lr': 0.00045512463258418615, 'samples': 5888256, 'steps': 30667, 'loss/train': 1.542351245880127} -11/07/2021 01:34:53 - INFO - __main__ - Step 30669: {'lr': 0.00045512159894481183, 'samples': 5888448, 'steps': 30668, 'loss/train': 1.554823637008667} -11/07/2021 01:34:55 - INFO - __main__ - Step 30670: {'lr': 0.00045511856521301286, 'samples': 5888640, 'steps': 30669, 'loss/train': 1.5602335929870605} -11/07/2021 01:34:55 - INFO - __main__ - Step 30671: {'lr': 0.0004551155313887906, 'samples': 5888832, 'steps': 30670, 'loss/train': 1.5313934087753296} -11/07/2021 01:34:55 - INFO - __main__ - Step 30672: {'lr': 0.0004551124974721465, 'samples': 5889024, 'steps': 30671, 'loss/train': 1.4817216396331787} -11/07/2021 01:34:56 - INFO - __main__ - Step 30673: {'lr': 0.00045510946346308186, 'samples': 5889216, 'steps': 30672, 'loss/train': 1.8890703916549683} -11/07/2021 01:34:56 - INFO - __main__ - Step 30674: {'lr': 0.0004551064293615981, 'samples': 5889408, 'steps': 30673, 'loss/train': 1.8428637981414795} -11/07/2021 01:34:57 - INFO - __main__ - Step 30675: {'lr': 0.00045510339516769647, 'samples': 5889600, 'steps': 30674, 'loss/train': 1.5842695236206055} -11/07/2021 01:34:57 - INFO - __main__ - Step 30676: {'lr': 0.0004551003608813784, 'samples': 5889792, 'steps': 30675, 'loss/train': 1.331461787223816} -11/07/2021 01:34:58 - INFO - __main__ - Step 30677: {'lr': 0.00045509732650264535, 'samples': 5889984, 'steps': 30676, 'loss/train': 1.6517804861068726} -11/07/2021 01:34:58 - INFO - __main__ - Step 30678: {'lr': 0.00045509429203149856, 'samples': 5890176, 'steps': 30677, 'loss/train': 1.6982057094573975} -11/07/2021 01:34:59 - INFO - __main__ - Step 30679: {'lr': 0.00045509125746793946, 'samples': 5890368, 'steps': 30678, 'loss/train': 1.3411773443222046} -11/07/2021 01:34:59 - INFO - __main__ - Step 30680: {'lr': 0.00045508822281196937, 'samples': 5890560, 'steps': 30679, 'loss/train': 1.4626752138137817} -11/07/2021 01:34:59 - INFO - __main__ - Step 30681: {'lr': 0.0004550851880635898, 'samples': 5890752, 'steps': 30680, 'loss/train': 1.4452056884765625} -11/07/2021 01:35:00 - INFO - __main__ - Step 30682: {'lr': 0.0004550821532228019, 'samples': 5890944, 'steps': 30681, 'loss/train': 1.9559125900268555} -11/07/2021 01:35:01 - INFO - __main__ - Step 30683: {'lr': 0.00045507911828960717, 'samples': 5891136, 'steps': 30682, 'loss/train': 1.2644442319869995} -11/07/2021 01:35:01 - INFO - __main__ - Step 30684: {'lr': 0.000455076083264007, 'samples': 5891328, 'steps': 30683, 'loss/train': 1.6457964181900024} -11/07/2021 01:35:01 - INFO - __main__ - Step 30685: {'lr': 0.0004550730481460027, 'samples': 5891520, 'steps': 30684, 'loss/train': 1.6096035242080688} -11/07/2021 01:35:02 - INFO - __main__ - Step 30686: {'lr': 0.0004550700129355956, 'samples': 5891712, 'steps': 30685, 'loss/train': 1.6629770994186401} -11/07/2021 01:35:03 - INFO - __main__ - Step 30687: {'lr': 0.0004550669776327871, 'samples': 5891904, 'steps': 30686, 'loss/train': 1.6891008615493774} -11/07/2021 01:35:03 - INFO - __main__ - Step 30688: {'lr': 0.00045506394223757867, 'samples': 5892096, 'steps': 30687, 'loss/train': 1.3316161632537842} -11/07/2021 01:35:03 - INFO - __main__ - Step 30689: {'lr': 0.00045506090674997157, 'samples': 5892288, 'steps': 30688, 'loss/train': 1.6416163444519043} -11/07/2021 01:35:04 - INFO - __main__ - Step 30690: {'lr': 0.00045505787116996714, 'samples': 5892480, 'steps': 30689, 'loss/train': 1.483043909072876} -11/07/2021 01:35:04 - INFO - __main__ - Step 30691: {'lr': 0.0004550548354975669, 'samples': 5892672, 'steps': 30690, 'loss/train': 1.6424208879470825} -11/07/2021 01:35:05 - INFO - __main__ - Step 30692: {'lr': 0.000455051799732772, 'samples': 5892864, 'steps': 30691, 'loss/train': 1.5616493225097656} -11/07/2021 01:35:05 - INFO - __main__ - Step 30693: {'lr': 0.000455048763875584, 'samples': 5893056, 'steps': 30692, 'loss/train': 1.2560726404190063} -11/07/2021 01:35:06 - INFO - __main__ - Step 30694: {'lr': 0.00045504572792600415, 'samples': 5893248, 'steps': 30693, 'loss/train': 1.7685329914093018} -11/07/2021 01:35:06 - INFO - __main__ - Step 30695: {'lr': 0.00045504269188403386, 'samples': 5893440, 'steps': 30694, 'loss/train': 1.0254260301589966} -11/07/2021 01:35:07 - INFO - __main__ - Step 30696: {'lr': 0.00045503965574967447, 'samples': 5893632, 'steps': 30695, 'loss/train': 1.7200754880905151} -11/07/2021 01:35:08 - INFO - __main__ - Step 30697: {'lr': 0.0004550366195229274, 'samples': 5893824, 'steps': 30696, 'loss/train': 1.283591628074646} -11/07/2021 01:35:08 - INFO - __main__ - Step 30698: {'lr': 0.00045503358320379405, 'samples': 5894016, 'steps': 30697, 'loss/train': 2.061112403869629} -11/07/2021 01:35:08 - INFO - __main__ - Step 30699: {'lr': 0.00045503054679227567, 'samples': 5894208, 'steps': 30698, 'loss/train': 0.9666875004768372} -11/07/2021 01:35:09 - INFO - __main__ - Step 30700: {'lr': 0.00045502751028837367, 'samples': 5894400, 'steps': 30699, 'loss/train': 1.7538293600082397} -11/07/2021 01:35:09 - INFO - __main__ - Step 30701: {'lr': 0.00045502447369208957, 'samples': 5894592, 'steps': 30700, 'loss/train': 0.1268743872642517} -11/07/2021 01:35:10 - INFO - __main__ - Step 30702: {'lr': 0.00045502143700342445, 'samples': 5894784, 'steps': 30701, 'loss/train': 1.3488339185714722} -11/07/2021 01:35:10 - INFO - __main__ - Step 30703: {'lr': 0.0004550184002223799, 'samples': 5894976, 'steps': 30702, 'loss/train': 1.573800802230835} -11/07/2021 01:35:11 - INFO - __main__ - Step 30704: {'lr': 0.0004550153633489572, 'samples': 5895168, 'steps': 30703, 'loss/train': 1.883345127105713} -11/07/2021 01:35:11 - INFO - __main__ - Step 30705: {'lr': 0.0004550123263831578, 'samples': 5895360, 'steps': 30704, 'loss/train': 2.1430163383483887} -11/07/2021 01:35:11 - INFO - __main__ - Step 30706: {'lr': 0.0004550092893249829, 'samples': 5895552, 'steps': 30705, 'loss/train': 1.7087527513504028} -11/07/2021 01:35:12 - INFO - __main__ - Step 30707: {'lr': 0.00045500625217443404, 'samples': 5895744, 'steps': 30706, 'loss/train': 1.6913039684295654} -11/07/2021 01:35:13 - INFO - __main__ - Step 30708: {'lr': 0.0004550032149315125, 'samples': 5895936, 'steps': 30707, 'loss/train': 1.7982276678085327} -11/07/2021 01:35:13 - INFO - __main__ - Step 30709: {'lr': 0.00045500017759621974, 'samples': 5896128, 'steps': 30708, 'loss/train': 1.4455924034118652} -11/07/2021 01:35:13 - INFO - __main__ - Step 30710: {'lr': 0.00045499714016855705, 'samples': 5896320, 'steps': 30709, 'loss/train': 1.656386137008667} -11/07/2021 01:35:14 - INFO - __main__ - Step 30711: {'lr': 0.0004549941026485258, 'samples': 5896512, 'steps': 30710, 'loss/train': 1.3936392068862915} -11/07/2021 01:35:14 - INFO - __main__ - Step 30712: {'lr': 0.00045499106503612733, 'samples': 5896704, 'steps': 30711, 'loss/train': 1.678410530090332} -11/07/2021 01:35:15 - INFO - __main__ - Step 30713: {'lr': 0.00045498802733136306, 'samples': 5896896, 'steps': 30712, 'loss/train': 1.5728613138198853} -11/07/2021 01:35:16 - INFO - __main__ - Step 30714: {'lr': 0.0004549849895342344, 'samples': 5897088, 'steps': 30713, 'loss/train': 1.51631760597229} -11/07/2021 01:35:16 - INFO - __main__ - Step 30715: {'lr': 0.00045498195164474264, 'samples': 5897280, 'steps': 30714, 'loss/train': 1.4547069072723389} -11/07/2021 01:35:16 - INFO - __main__ - Step 30716: {'lr': 0.00045497891366288914, 'samples': 5897472, 'steps': 30715, 'loss/train': 2.198493480682373} -11/07/2021 01:35:17 - INFO - __main__ - Step 30717: {'lr': 0.0004549758755886754, 'samples': 5897664, 'steps': 30716, 'loss/train': 5.7820844650268555} -11/07/2021 01:35:17 - INFO - __main__ - Step 30718: {'lr': 0.00045497283742210263, 'samples': 5897856, 'steps': 30717, 'loss/train': 1.0657594203948975} -11/07/2021 01:35:18 - INFO - __main__ - Step 30719: {'lr': 0.0004549697991631722, 'samples': 5898048, 'steps': 30718, 'loss/train': 1.59716796875} -11/07/2021 01:35:18 - INFO - __main__ - Step 30720: {'lr': 0.0004549667608118856, 'samples': 5898240, 'steps': 30719, 'loss/train': 1.0632942914962769} -11/07/2021 01:35:19 - INFO - __main__ - Step 30721: {'lr': 0.0004549637223682441, 'samples': 5898432, 'steps': 30720, 'loss/train': 1.446715235710144} -11/07/2021 01:35:19 - INFO - __main__ - Step 30722: {'lr': 0.0004549606838322492, 'samples': 5898624, 'steps': 30721, 'loss/train': 1.3796584606170654} -11/07/2021 01:35:19 - INFO - __main__ - Step 30723: {'lr': 0.00045495764520390216, 'samples': 5898816, 'steps': 30722, 'loss/train': 1.4826099872589111} -11/07/2021 01:35:21 - INFO - __main__ - Step 30724: {'lr': 0.0004549546064832043, 'samples': 5899008, 'steps': 30723, 'loss/train': 1.9744141101837158} -11/07/2021 01:35:21 - INFO - __main__ - Step 30725: {'lr': 0.0004549515676701571, 'samples': 5899200, 'steps': 30724, 'loss/train': 1.6435303688049316} -11/07/2021 01:35:21 - INFO - __main__ - Step 30726: {'lr': 0.0004549485287647619, 'samples': 5899392, 'steps': 30725, 'loss/train': 1.5569947957992554} -11/07/2021 01:35:22 - INFO - __main__ - Step 30727: {'lr': 0.00045494548976702, 'samples': 5899584, 'steps': 30726, 'loss/train': 1.3677185773849487} -11/07/2021 01:35:22 - INFO - __main__ - Step 30728: {'lr': 0.0004549424506769329, 'samples': 5899776, 'steps': 30727, 'loss/train': 1.946964144706726} -11/07/2021 01:35:23 - INFO - __main__ - Step 30729: {'lr': 0.00045493941149450185, 'samples': 5899968, 'steps': 30728, 'loss/train': 1.450317621231079} -11/07/2021 01:35:23 - INFO - __main__ - Step 30730: {'lr': 0.00045493637221972826, 'samples': 5900160, 'steps': 30729, 'loss/train': 1.8467463254928589} -11/07/2021 01:35:24 - INFO - __main__ - Step 30731: {'lr': 0.0004549333328526135, 'samples': 5900352, 'steps': 30730, 'loss/train': 1.7263344526290894} -11/07/2021 01:35:24 - INFO - __main__ - Step 30732: {'lr': 0.0004549302933931589, 'samples': 5900544, 'steps': 30731, 'loss/train': 1.9243172407150269} -11/07/2021 01:35:24 - INFO - __main__ - Step 30733: {'lr': 0.000454927253841366, 'samples': 5900736, 'steps': 30732, 'loss/train': 1.7375285625457764} -11/07/2021 01:35:26 - INFO - __main__ - Step 30734: {'lr': 0.00045492421419723595, 'samples': 5900928, 'steps': 30733, 'loss/train': 1.4696018695831299} -11/07/2021 01:35:26 - INFO - __main__ - Step 30735: {'lr': 0.00045492117446077027, 'samples': 5901120, 'steps': 30734, 'loss/train': 0.8575605154037476} -11/07/2021 01:35:26 - INFO - __main__ - Step 30736: {'lr': 0.0004549181346319702, 'samples': 5901312, 'steps': 30735, 'loss/train': 2.1260533332824707} -11/07/2021 01:35:27 - INFO - __main__ - Step 30737: {'lr': 0.00045491509471083717, 'samples': 5901504, 'steps': 30736, 'loss/train': 1.023028016090393} -11/07/2021 01:35:27 - INFO - __main__ - Step 30738: {'lr': 0.00045491205469737263, 'samples': 5901696, 'steps': 30737, 'loss/train': 1.1181199550628662} -11/07/2021 01:35:28 - INFO - __main__ - Step 30739: {'lr': 0.00045490901459157787, 'samples': 5901888, 'steps': 30738, 'loss/train': 0.6728991270065308} -11/07/2021 01:35:28 - INFO - __main__ - Step 30740: {'lr': 0.0004549059743934543, 'samples': 5902080, 'steps': 30739, 'loss/train': 1.761975884437561} -11/07/2021 01:35:29 - INFO - __main__ - Step 30741: {'lr': 0.00045490293410300315, 'samples': 5902272, 'steps': 30740, 'loss/train': 1.6367331743240356} -11/07/2021 01:35:29 - INFO - __main__ - Step 30742: {'lr': 0.000454899893720226, 'samples': 5902464, 'steps': 30741, 'loss/train': 1.7650607824325562} -11/07/2021 01:35:30 - INFO - __main__ - Step 30743: {'lr': 0.000454896853245124, 'samples': 5902656, 'steps': 30742, 'loss/train': 1.5175005197525024} -11/07/2021 01:35:30 - INFO - __main__ - Step 30744: {'lr': 0.00045489381267769873, 'samples': 5902848, 'steps': 30743, 'loss/train': 1.7161122560501099} -11/07/2021 01:35:31 - INFO - __main__ - Step 30745: {'lr': 0.00045489077201795147, 'samples': 5903040, 'steps': 30744, 'loss/train': 1.8334271907806396} -11/07/2021 01:35:31 - INFO - __main__ - Step 30746: {'lr': 0.0004548877312658836, 'samples': 5903232, 'steps': 30745, 'loss/train': 1.4619717597961426} -11/07/2021 01:35:32 - INFO - __main__ - Step 30747: {'lr': 0.0004548846904214964, 'samples': 5903424, 'steps': 30746, 'loss/train': 1.4247400760650635} -11/07/2021 01:35:32 - INFO - __main__ - Step 30748: {'lr': 0.00045488164948479144, 'samples': 5903616, 'steps': 30747, 'loss/train': 2.2171173095703125} -11/07/2021 01:35:32 - INFO - __main__ - Step 30749: {'lr': 0.0004548786084557699, 'samples': 5903808, 'steps': 30748, 'loss/train': 2.2073068618774414} -11/07/2021 01:35:33 - INFO - __main__ - Step 30750: {'lr': 0.00045487556733443327, 'samples': 5904000, 'steps': 30749, 'loss/train': 1.677097201347351} -11/07/2021 01:35:34 - INFO - __main__ - Step 30751: {'lr': 0.0004548725261207828, 'samples': 5904192, 'steps': 30750, 'loss/train': 1.304649829864502} -11/07/2021 01:35:34 - INFO - __main__ - Step 30752: {'lr': 0.0004548694848148199, 'samples': 5904384, 'steps': 30751, 'loss/train': 1.7409619092941284} -11/07/2021 01:35:34 - INFO - __main__ - Step 30753: {'lr': 0.0004548664434165461, 'samples': 5904576, 'steps': 30752, 'loss/train': 1.7309997081756592} -11/07/2021 01:35:35 - INFO - __main__ - Step 30754: {'lr': 0.0004548634019259625, 'samples': 5904768, 'steps': 30753, 'loss/train': 1.2886046171188354} -11/07/2021 01:35:36 - INFO - __main__ - Step 30755: {'lr': 0.0004548603603430708, 'samples': 5904960, 'steps': 30754, 'loss/train': 1.547845482826233} -11/07/2021 01:35:36 - INFO - __main__ - Step 30756: {'lr': 0.00045485731866787206, 'samples': 5905152, 'steps': 30755, 'loss/train': 1.908001184463501} -11/07/2021 01:35:36 - INFO - __main__ - Step 30757: {'lr': 0.00045485427690036774, 'samples': 5905344, 'steps': 30756, 'loss/train': 1.702413558959961} -11/07/2021 01:35:37 - INFO - __main__ - Step 30758: {'lr': 0.0004548512350405593, 'samples': 5905536, 'steps': 30757, 'loss/train': 2.074098587036133} -11/07/2021 01:35:37 - INFO - __main__ - Step 30759: {'lr': 0.00045484819308844806, 'samples': 5905728, 'steps': 30758, 'loss/train': 1.4840266704559326} -11/07/2021 01:35:38 - INFO - __main__ - Step 30760: {'lr': 0.00045484515104403535, 'samples': 5905920, 'steps': 30759, 'loss/train': 1.3921496868133545} -11/07/2021 01:35:38 - INFO - __main__ - Step 30761: {'lr': 0.00045484210890732257, 'samples': 5906112, 'steps': 30760, 'loss/train': 1.3195807933807373} -11/07/2021 01:35:39 - INFO - __main__ - Step 30762: {'lr': 0.0004548390666783111, 'samples': 5906304, 'steps': 30761, 'loss/train': 1.9495140314102173} -11/07/2021 01:35:39 - INFO - __main__ - Step 30763: {'lr': 0.00045483602435700233, 'samples': 5906496, 'steps': 30762, 'loss/train': 1.6819427013397217} -11/07/2021 01:35:40 - INFO - __main__ - Step 30764: {'lr': 0.0004548329819433976, 'samples': 5906688, 'steps': 30763, 'loss/train': 1.9270631074905396} -11/07/2021 01:35:41 - INFO - __main__ - Step 30765: {'lr': 0.00045482993943749835, 'samples': 5906880, 'steps': 30764, 'loss/train': 1.6744219064712524} -11/07/2021 01:35:41 - INFO - __main__ - Step 30766: {'lr': 0.0004548268968393058, 'samples': 5907072, 'steps': 30765, 'loss/train': 1.958350658416748} -11/07/2021 01:35:41 - INFO - __main__ - Step 30767: {'lr': 0.0004548238541488214, 'samples': 5907264, 'steps': 30766, 'loss/train': 1.2977490425109863} -11/07/2021 01:35:42 - INFO - __main__ - Step 30768: {'lr': 0.00045482081136604665, 'samples': 5907456, 'steps': 30767, 'loss/train': 1.6346162557601929} -11/07/2021 01:35:42 - INFO - __main__ - Step 30769: {'lr': 0.0004548177684909827, 'samples': 5907648, 'steps': 30768, 'loss/train': 0.8329635262489319} -11/07/2021 01:35:43 - INFO - __main__ - Step 30770: {'lr': 0.0004548147255236311, 'samples': 5907840, 'steps': 30769, 'loss/train': 1.6094725131988525} -11/07/2021 01:35:43 - INFO - __main__ - Step 30771: {'lr': 0.0004548116824639931, 'samples': 5908032, 'steps': 30770, 'loss/train': 1.5290954113006592} -11/07/2021 01:35:44 - INFO - __main__ - Step 30772: {'lr': 0.00045480863931207004, 'samples': 5908224, 'steps': 30771, 'loss/train': 1.5912102460861206} -11/07/2021 01:35:44 - INFO - __main__ - Step 30773: {'lr': 0.0004548055960678635, 'samples': 5908416, 'steps': 30772, 'loss/train': 2.0271196365356445} -11/07/2021 01:35:44 - INFO - __main__ - Step 30774: {'lr': 0.0004548025527313746, 'samples': 5908608, 'steps': 30773, 'loss/train': 1.5651638507843018} -11/07/2021 01:35:45 - INFO - __main__ - Step 30775: {'lr': 0.00045479950930260495, 'samples': 5908800, 'steps': 30774, 'loss/train': 1.0466399192810059} -11/07/2021 01:35:46 - INFO - __main__ - Step 30776: {'lr': 0.0004547964657815558, 'samples': 5908992, 'steps': 30775, 'loss/train': 1.261448860168457} -11/07/2021 01:35:46 - INFO - __main__ - Step 30777: {'lr': 0.0004547934221682284, 'samples': 5909184, 'steps': 30776, 'loss/train': 1.8580161333084106} -11/07/2021 01:35:46 - INFO - __main__ - Step 30778: {'lr': 0.00045479037846262436, 'samples': 5909376, 'steps': 30777, 'loss/train': 1.7419246435165405} -11/07/2021 01:35:47 - INFO - __main__ - Step 30779: {'lr': 0.00045478733466474487, 'samples': 5909568, 'steps': 30778, 'loss/train': 1.6353005170822144} -11/07/2021 01:35:47 - INFO - __main__ - Step 30780: {'lr': 0.0004547842907745914, 'samples': 5909760, 'steps': 30779, 'loss/train': 1.5967276096343994} -11/07/2021 01:35:48 - INFO - __main__ - Step 30781: {'lr': 0.00045478124679216523, 'samples': 5909952, 'steps': 30780, 'loss/train': 1.739806890487671} -11/07/2021 01:35:49 - INFO - __main__ - Step 30782: {'lr': 0.00045477820271746784, 'samples': 5910144, 'steps': 30781, 'loss/train': 1.5588977336883545} -11/07/2021 01:35:49 - INFO - __main__ - Step 30783: {'lr': 0.00045477515855050056, 'samples': 5910336, 'steps': 30782, 'loss/train': 1.5034235715866089} -11/07/2021 01:35:49 - INFO - __main__ - Step 30784: {'lr': 0.0004547721142912647, 'samples': 5910528, 'steps': 30783, 'loss/train': 1.5956065654754639} -11/07/2021 01:35:50 - INFO - __main__ - Step 30785: {'lr': 0.00045476906993976177, 'samples': 5910720, 'steps': 30784, 'loss/train': 1.606019139289856} -11/07/2021 01:35:51 - INFO - __main__ - Step 30786: {'lr': 0.000454766025495993, 'samples': 5910912, 'steps': 30785, 'loss/train': 1.5922966003417969} -11/07/2021 01:35:51 - INFO - __main__ - Step 30787: {'lr': 0.00045476298095995985, 'samples': 5911104, 'steps': 30786, 'loss/train': 5.82503604888916} -11/07/2021 01:35:51 - INFO - __main__ - Step 30788: {'lr': 0.00045475993633166357, 'samples': 5911296, 'steps': 30787, 'loss/train': 1.2205564975738525} -11/07/2021 01:35:52 - INFO - __main__ - Step 30789: {'lr': 0.00045475689161110565, 'samples': 5911488, 'steps': 30788, 'loss/train': 1.7455384731292725} -11/07/2021 01:35:52 - INFO - __main__ - Step 30790: {'lr': 0.0004547538467982876, 'samples': 5911680, 'steps': 30789, 'loss/train': 0.18178731203079224} -11/07/2021 01:35:53 - INFO - __main__ - Step 30791: {'lr': 0.00045475080189321044, 'samples': 5911872, 'steps': 30790, 'loss/train': 1.3786267042160034} -11/07/2021 01:35:53 - INFO - __main__ - Step 30792: {'lr': 0.00045474775689587576, 'samples': 5912064, 'steps': 30791, 'loss/train': 1.1766566038131714} -11/07/2021 01:35:54 - INFO - __main__ - Step 30793: {'lr': 0.00045474471180628496, 'samples': 5912256, 'steps': 30792, 'loss/train': 1.1489925384521484} -11/07/2021 01:35:54 - INFO - __main__ - Step 30794: {'lr': 0.0004547416666244393, 'samples': 5912448, 'steps': 30793, 'loss/train': 1.3420683145523071} -11/07/2021 01:35:55 - INFO - __main__ - Step 30795: {'lr': 0.00045473862135034026, 'samples': 5912640, 'steps': 30794, 'loss/train': 1.1864869594573975} -11/07/2021 01:35:55 - INFO - __main__ - Step 30796: {'lr': 0.0004547355759839891, 'samples': 5912832, 'steps': 30795, 'loss/train': 1.5019656419754028} -11/07/2021 01:35:56 - INFO - __main__ - Step 30797: {'lr': 0.00045473253052538725, 'samples': 5913024, 'steps': 30796, 'loss/train': 2.0348379611968994} -11/07/2021 01:35:56 - INFO - __main__ - Step 30798: {'lr': 0.00045472948497453613, 'samples': 5913216, 'steps': 30797, 'loss/train': 1.2545139789581299} -11/07/2021 01:35:57 - INFO - __main__ - Step 30799: {'lr': 0.00045472643933143703, 'samples': 5913408, 'steps': 30798, 'loss/train': 1.5450226068496704} -11/07/2021 01:35:57 - INFO - __main__ - Step 30800: {'lr': 0.0004547233935960914, 'samples': 5913600, 'steps': 30799, 'loss/train': 1.9017813205718994} -11/07/2021 01:35:57 - INFO - __main__ - Step 30801: {'lr': 0.00045472034776850045, 'samples': 5913792, 'steps': 30800, 'loss/train': 1.516133189201355} -11/07/2021 01:35:58 - INFO - __main__ - Step 30802: {'lr': 0.0004547173018486658, 'samples': 5913984, 'steps': 30801, 'loss/train': 1.5497409105300903} -11/07/2021 01:35:59 - INFO - __main__ - Step 30803: {'lr': 0.0004547142558365887, 'samples': 5914176, 'steps': 30802, 'loss/train': 1.4988566637039185} -11/07/2021 01:35:59 - INFO - __main__ - Step 30804: {'lr': 0.0004547112097322704, 'samples': 5914368, 'steps': 30803, 'loss/train': 1.5426658391952515} -11/07/2021 01:35:59 - INFO - __main__ - Step 30805: {'lr': 0.00045470816353571244, 'samples': 5914560, 'steps': 30804, 'loss/train': 1.770569920539856} -11/07/2021 01:36:00 - INFO - __main__ - Step 30806: {'lr': 0.00045470511724691613, 'samples': 5914752, 'steps': 30805, 'loss/train': 1.310795783996582} -11/07/2021 01:36:01 - INFO - __main__ - Step 30807: {'lr': 0.0004547020708658829, 'samples': 5914944, 'steps': 30806, 'loss/train': 1.5118852853775024} -11/07/2021 01:36:01 - INFO - __main__ - Step 30808: {'lr': 0.000454699024392614, 'samples': 5915136, 'steps': 30807, 'loss/train': 1.5655699968338013} -11/07/2021 01:36:02 - INFO - __main__ - Step 30809: {'lr': 0.0004546959778271109, 'samples': 5915328, 'steps': 30808, 'loss/train': 1.6117366552352905} -11/07/2021 01:36:02 - INFO - __main__ - Step 30810: {'lr': 0.00045469293116937504, 'samples': 5915520, 'steps': 30809, 'loss/train': 1.5515666007995605} -11/07/2021 01:36:02 - INFO - __main__ - Step 30811: {'lr': 0.0004546898844194076, 'samples': 5915712, 'steps': 30810, 'loss/train': 1.419262409210205} -11/07/2021 01:36:03 - INFO - __main__ - Step 30812: {'lr': 0.00045468683757721005, 'samples': 5915904, 'steps': 30811, 'loss/train': 1.8689558506011963} -11/07/2021 01:36:04 - INFO - __main__ - Step 30813: {'lr': 0.0004546837906427839, 'samples': 5916096, 'steps': 30812, 'loss/train': 1.618916392326355} -11/07/2021 01:36:04 - INFO - __main__ - Step 30814: {'lr': 0.00045468074361613026, 'samples': 5916288, 'steps': 30813, 'loss/train': 1.5968495607376099} -11/07/2021 01:36:04 - INFO - __main__ - Step 30815: {'lr': 0.0004546776964972507, 'samples': 5916480, 'steps': 30814, 'loss/train': 1.4214028120040894} -11/07/2021 01:36:05 - INFO - __main__ - Step 30816: {'lr': 0.00045467464928614657, 'samples': 5916672, 'steps': 30815, 'loss/train': 1.8217263221740723} -11/07/2021 01:36:05 - INFO - __main__ - Step 30817: {'lr': 0.0004546716019828191, 'samples': 5916864, 'steps': 30816, 'loss/train': 1.5973073244094849} -11/07/2021 01:36:06 - INFO - __main__ - Step 30818: {'lr': 0.00045466855458726975, 'samples': 5917056, 'steps': 30817, 'loss/train': 1.2746789455413818} -11/07/2021 01:36:06 - INFO - __main__ - Step 30819: {'lr': 0.0004546655070995, 'samples': 5917248, 'steps': 30818, 'loss/train': 1.660507082939148} -11/07/2021 01:36:07 - INFO - __main__ - Step 30820: {'lr': 0.0004546624595195111, 'samples': 5917440, 'steps': 30819, 'loss/train': 1.6329345703125} -11/07/2021 01:36:07 - INFO - __main__ - Step 30821: {'lr': 0.0004546594118473044, 'samples': 5917632, 'steps': 30820, 'loss/train': 1.6678979396820068} -11/07/2021 01:36:07 - INFO - __main__ - Step 30822: {'lr': 0.0004546563640828814, 'samples': 5917824, 'steps': 30821, 'loss/train': 1.5760250091552734} -11/07/2021 01:36:08 - INFO - __main__ - Step 30823: {'lr': 0.0004546533162262434, 'samples': 5918016, 'steps': 30822, 'loss/train': 1.591220498085022} -11/07/2021 01:36:09 - INFO - __main__ - Step 30824: {'lr': 0.00045465026827739175, 'samples': 5918208, 'steps': 30823, 'loss/train': 1.3347065448760986} -11/07/2021 01:36:09 - INFO - __main__ - Step 30825: {'lr': 0.00045464722023632784, 'samples': 5918400, 'steps': 30824, 'loss/train': 1.0544623136520386} -11/07/2021 01:36:09 - INFO - __main__ - Step 30826: {'lr': 0.00045464417210305303, 'samples': 5918592, 'steps': 30825, 'loss/train': 0.868805468082428} -11/07/2021 01:36:10 - INFO - __main__ - Step 30827: {'lr': 0.0004546411238775687, 'samples': 5918784, 'steps': 30826, 'loss/train': 1.4293575286865234} -11/07/2021 01:36:11 - INFO - __main__ - Step 30828: {'lr': 0.00045463807555987633, 'samples': 5918976, 'steps': 30827, 'loss/train': 1.6750293970108032} -11/07/2021 01:36:11 - INFO - __main__ - Step 30829: {'lr': 0.0004546350271499772, 'samples': 5919168, 'steps': 30828, 'loss/train': 1.5183910131454468} -11/07/2021 01:36:12 - INFO - __main__ - Step 30830: {'lr': 0.0004546319786478726, 'samples': 5919360, 'steps': 30829, 'loss/train': 1.4833358526229858} -11/07/2021 01:36:12 - INFO - __main__ - Step 30831: {'lr': 0.000454628930053564, 'samples': 5919552, 'steps': 30830, 'loss/train': 1.5842455625534058} -11/07/2021 01:36:12 - INFO - __main__ - Step 30832: {'lr': 0.0004546258813670528, 'samples': 5919744, 'steps': 30831, 'loss/train': 1.7990853786468506} -11/07/2021 01:36:13 - INFO - __main__ - Step 30833: {'lr': 0.0004546228325883403, 'samples': 5919936, 'steps': 30832, 'loss/train': 1.3607431650161743} -11/07/2021 01:36:14 - INFO - __main__ - Step 30834: {'lr': 0.00045461978371742794, 'samples': 5920128, 'steps': 30833, 'loss/train': 2.1018025875091553} -11/07/2021 01:36:14 - INFO - __main__ - Step 30835: {'lr': 0.00045461673475431704, 'samples': 5920320, 'steps': 30834, 'loss/train': 1.1725069284439087} -11/07/2021 01:36:14 - INFO - __main__ - Step 30836: {'lr': 0.00045461368569900895, 'samples': 5920512, 'steps': 30835, 'loss/train': 1.8515321016311646} -11/07/2021 01:36:15 - INFO - __main__ - Step 30837: {'lr': 0.0004546106365515052, 'samples': 5920704, 'steps': 30836, 'loss/train': 1.7336543798446655} -11/07/2021 01:36:15 - INFO - __main__ - Step 30838: {'lr': 0.000454607587311807, 'samples': 5920896, 'steps': 30837, 'loss/train': 1.4543534517288208} -11/07/2021 01:36:16 - INFO - __main__ - Step 30839: {'lr': 0.00045460453797991577, 'samples': 5921088, 'steps': 30838, 'loss/train': 1.7454028129577637} -11/07/2021 01:36:17 - INFO - __main__ - Step 30840: {'lr': 0.00045460148855583295, 'samples': 5921280, 'steps': 30839, 'loss/train': 1.305275559425354} -11/07/2021 01:36:17 - INFO - __main__ - Step 30841: {'lr': 0.00045459843903955977, 'samples': 5921472, 'steps': 30840, 'loss/train': 0.245193749666214} -11/07/2021 01:36:17 - INFO - __main__ - Step 30842: {'lr': 0.00045459538943109774, 'samples': 5921664, 'steps': 30841, 'loss/train': 1.5130547285079956} -11/07/2021 01:36:18 - INFO - __main__ - Step 30843: {'lr': 0.0004545923397304482, 'samples': 5921856, 'steps': 30842, 'loss/train': 1.6042557954788208} -11/07/2021 01:36:19 - INFO - __main__ - Step 30844: {'lr': 0.0004545892899376125, 'samples': 5922048, 'steps': 30843, 'loss/train': 1.2996978759765625} -11/07/2021 01:36:19 - INFO - __main__ - Step 30845: {'lr': 0.000454586240052592, 'samples': 5922240, 'steps': 30844, 'loss/train': 1.932795524597168} -11/07/2021 01:36:19 - INFO - __main__ - Step 30846: {'lr': 0.00045458319007538804, 'samples': 5922432, 'steps': 30845, 'loss/train': 1.3812726736068726} -11/07/2021 01:36:20 - INFO - __main__ - Step 30847: {'lr': 0.00045458014000600213, 'samples': 5922624, 'steps': 30846, 'loss/train': 1.7849777936935425} -11/07/2021 01:36:20 - INFO - __main__ - Step 30848: {'lr': 0.00045457708984443556, 'samples': 5922816, 'steps': 30847, 'loss/train': 1.9209630489349365} -11/07/2021 01:36:21 - INFO - __main__ - Step 30849: {'lr': 0.0004545740395906897, 'samples': 5923008, 'steps': 30848, 'loss/train': 1.4414986371994019} -11/07/2021 01:36:22 - INFO - __main__ - Step 30850: {'lr': 0.0004545709892447659, 'samples': 5923200, 'steps': 30849, 'loss/train': 1.7687026262283325} -11/07/2021 01:36:22 - INFO - __main__ - Step 30851: {'lr': 0.00045456793880666556, 'samples': 5923392, 'steps': 30850, 'loss/train': 1.5331692695617676} -11/07/2021 01:36:22 - INFO - __main__ - Step 30852: {'lr': 0.0004545648882763902, 'samples': 5923584, 'steps': 30851, 'loss/train': 1.2778525352478027} -11/07/2021 01:36:23 - INFO - __main__ - Step 30853: {'lr': 0.0004545618376539409, 'samples': 5923776, 'steps': 30852, 'loss/train': 1.6304030418395996} -11/07/2021 01:36:23 - INFO - __main__ - Step 30854: {'lr': 0.0004545587869393193, 'samples': 5923968, 'steps': 30853, 'loss/train': 0.9640048742294312} -11/07/2021 01:36:24 - INFO - __main__ - Step 30855: {'lr': 0.00045455573613252667, 'samples': 5924160, 'steps': 30854, 'loss/train': 1.319207787513733} -11/07/2021 01:36:24 - INFO - __main__ - Step 30856: {'lr': 0.0004545526852335643, 'samples': 5924352, 'steps': 30855, 'loss/train': 3.6997063159942627} -11/07/2021 01:36:25 - INFO - __main__ - Step 30857: {'lr': 0.0004545496342424337, 'samples': 5924544, 'steps': 30856, 'loss/train': 1.8156380653381348} -11/07/2021 01:36:25 - INFO - __main__ - Step 30858: {'lr': 0.00045454658315913617, 'samples': 5924736, 'steps': 30857, 'loss/train': 1.4153854846954346} -11/07/2021 01:36:26 - INFO - __main__ - Step 30859: {'lr': 0.0004545435319836731, 'samples': 5924928, 'steps': 30858, 'loss/train': 1.6114808320999146} -11/07/2021 01:36:27 - INFO - __main__ - Step 30860: {'lr': 0.00045454048071604593, 'samples': 5925120, 'steps': 30859, 'loss/train': 1.5351415872573853} -11/07/2021 01:36:27 - INFO - __main__ - Step 30861: {'lr': 0.0004545374293562559, 'samples': 5925312, 'steps': 30860, 'loss/train': 1.7278437614440918} -11/07/2021 01:36:27 - INFO - __main__ - Step 30862: {'lr': 0.00045453437790430446, 'samples': 5925504, 'steps': 30861, 'loss/train': 1.910088300704956} -11/07/2021 01:36:28 - INFO - __main__ - Step 30863: {'lr': 0.000454531326360193, 'samples': 5925696, 'steps': 30862, 'loss/train': 1.8231418132781982} -11/07/2021 01:36:28 - INFO - __main__ - Step 30864: {'lr': 0.00045452827472392286, 'samples': 5925888, 'steps': 30863, 'loss/train': 1.726006269454956} -11/07/2021 01:36:29 - INFO - __main__ - Step 30865: {'lr': 0.0004545252229954955, 'samples': 5926080, 'steps': 30864, 'loss/train': 1.0793594121932983} -11/07/2021 01:36:29 - INFO - __main__ - Step 30866: {'lr': 0.00045452217117491225, 'samples': 5926272, 'steps': 30865, 'loss/train': 1.897141456604004} -11/07/2021 01:36:30 - INFO - __main__ - Step 30867: {'lr': 0.00045451911926217437, 'samples': 5926464, 'steps': 30866, 'loss/train': 1.3745735883712769} -11/07/2021 01:36:30 - INFO - __main__ - Step 30868: {'lr': 0.00045451606725728337, 'samples': 5926656, 'steps': 30867, 'loss/train': 1.2515405416488647} -11/07/2021 01:36:30 - INFO - __main__ - Step 30869: {'lr': 0.0004545130151602406, 'samples': 5926848, 'steps': 30868, 'loss/train': 2.071918249130249} -11/07/2021 01:36:31 - INFO - __main__ - Step 30870: {'lr': 0.00045450996297104743, 'samples': 5927040, 'steps': 30869, 'loss/train': 1.5846422910690308} -11/07/2021 01:36:32 - INFO - __main__ - Step 30871: {'lr': 0.00045450691068970515, 'samples': 5927232, 'steps': 30870, 'loss/train': 1.7457700967788696} -11/07/2021 01:36:32 - INFO - __main__ - Step 30872: {'lr': 0.00045450385831621534, 'samples': 5927424, 'steps': 30871, 'loss/train': 1.7874201536178589} -11/07/2021 01:36:32 - INFO - __main__ - Step 30873: {'lr': 0.0004545008058505792, 'samples': 5927616, 'steps': 30872, 'loss/train': 3.894684076309204} -11/07/2021 01:36:33 - INFO - __main__ - Step 30874: {'lr': 0.0004544977532927981, 'samples': 5927808, 'steps': 30873, 'loss/train': 1.8667088747024536} -11/07/2021 01:36:33 - INFO - __main__ - Step 30875: {'lr': 0.0004544947006428735, 'samples': 5928000, 'steps': 30874, 'loss/train': 2.0149505138397217} -11/07/2021 01:36:34 - INFO - __main__ - Step 30876: {'lr': 0.00045449164790080675, 'samples': 5928192, 'steps': 30875, 'loss/train': 1.3990708589553833} -11/07/2021 01:36:35 - INFO - __main__ - Step 30877: {'lr': 0.00045448859506659926, 'samples': 5928384, 'steps': 30876, 'loss/train': 1.3811663389205933} -11/07/2021 01:36:35 - INFO - __main__ - Step 30878: {'lr': 0.0004544855421402523, 'samples': 5928576, 'steps': 30877, 'loss/train': 1.2561410665512085} -11/07/2021 01:36:35 - INFO - __main__ - Step 30879: {'lr': 0.00045448248912176726, 'samples': 5928768, 'steps': 30878, 'loss/train': 1.218980312347412} -11/07/2021 01:36:36 - INFO - __main__ - Step 30880: {'lr': 0.00045447943601114563, 'samples': 5928960, 'steps': 30879, 'loss/train': 1.5677345991134644} -11/07/2021 01:36:37 - INFO - __main__ - Step 30881: {'lr': 0.00045447638280838877, 'samples': 5929152, 'steps': 30880, 'loss/train': 2.2396042346954346} -11/07/2021 01:36:37 - INFO - __main__ - Step 30882: {'lr': 0.000454473329513498, 'samples': 5929344, 'steps': 30881, 'loss/train': 1.402809739112854} -11/07/2021 01:36:38 - INFO - __main__ - Step 30883: {'lr': 0.0004544702761264746, 'samples': 5929536, 'steps': 30882, 'loss/train': 1.6992740631103516} -11/07/2021 01:36:38 - INFO - __main__ - Step 30884: {'lr': 0.0004544672226473201, 'samples': 5929728, 'steps': 30883, 'loss/train': 1.5864168405532837} -11/07/2021 01:36:38 - INFO - __main__ - Step 30885: {'lr': 0.00045446416907603585, 'samples': 5929920, 'steps': 30884, 'loss/train': 1.8292831182479858} -11/07/2021 01:36:39 - INFO - __main__ - Step 30886: {'lr': 0.00045446111541262317, 'samples': 5930112, 'steps': 30885, 'loss/train': 2.021177053451538} -11/07/2021 01:36:40 - INFO - __main__ - Step 30887: {'lr': 0.0004544580616570835, 'samples': 5930304, 'steps': 30886, 'loss/train': 1.7107443809509277} -11/07/2021 01:36:40 - INFO - __main__ - Step 30888: {'lr': 0.0004544550078094182, 'samples': 5930496, 'steps': 30887, 'loss/train': 1.7455068826675415} -11/07/2021 01:36:40 - INFO - __main__ - Step 30889: {'lr': 0.00045445195386962855, 'samples': 5930688, 'steps': 30888, 'loss/train': 1.7165838479995728} -11/07/2021 01:36:41 - INFO - __main__ - Step 30890: {'lr': 0.0004544488998377161, 'samples': 5930880, 'steps': 30889, 'loss/train': 1.4680341482162476} -11/07/2021 01:36:41 - INFO - __main__ - Step 30891: {'lr': 0.000454445845713682, 'samples': 5931072, 'steps': 30890, 'loss/train': 1.9559266567230225} -11/07/2021 01:36:42 - INFO - __main__ - Step 30892: {'lr': 0.0004544427914975279, 'samples': 5931264, 'steps': 30891, 'loss/train': 1.3994450569152832} -11/07/2021 01:36:42 - INFO - __main__ - Step 30893: {'lr': 0.0004544397371892549, 'samples': 5931456, 'steps': 30892, 'loss/train': 1.4075242280960083} -11/07/2021 01:36:43 - INFO - __main__ - Step 30894: {'lr': 0.00045443668278886463, 'samples': 5931648, 'steps': 30893, 'loss/train': 1.1928571462631226} -11/07/2021 01:36:43 - INFO - __main__ - Step 30895: {'lr': 0.00045443362829635826, 'samples': 5931840, 'steps': 30894, 'loss/train': 1.7529635429382324} -11/07/2021 01:36:43 - INFO - __main__ - Step 30896: {'lr': 0.00045443057371173727, 'samples': 5932032, 'steps': 30895, 'loss/train': 1.4993561506271362} -11/07/2021 01:36:44 - INFO - __main__ - Step 30897: {'lr': 0.00045442751903500305, 'samples': 5932224, 'steps': 30896, 'loss/train': 1.454590916633606} -11/07/2021 01:36:45 - INFO - __main__ - Step 30898: {'lr': 0.0004544244642661569, 'samples': 5932416, 'steps': 30897, 'loss/train': 0.9046458601951599} -11/07/2021 01:36:45 - INFO - __main__ - Step 30899: {'lr': 0.00045442140940520027, 'samples': 5932608, 'steps': 30898, 'loss/train': 1.2835602760314941} -11/07/2021 01:36:45 - INFO - __main__ - Step 30900: {'lr': 0.0004544183544521345, 'samples': 5932800, 'steps': 30899, 'loss/train': 2.022730827331543} -11/07/2021 01:36:46 - INFO - __main__ - Step 30901: {'lr': 0.00045441529940696104, 'samples': 5932992, 'steps': 30900, 'loss/train': 1.4904640913009644} -11/07/2021 01:36:47 - INFO - __main__ - Step 30902: {'lr': 0.0004544122442696811, 'samples': 5933184, 'steps': 30901, 'loss/train': 1.6012802124023438} -11/07/2021 01:36:47 - INFO - __main__ - Step 30903: {'lr': 0.0004544091890402962, 'samples': 5933376, 'steps': 30902, 'loss/train': 1.2576720714569092} -11/07/2021 01:36:48 - INFO - __main__ - Step 30904: {'lr': 0.0004544061337188077, 'samples': 5933568, 'steps': 30903, 'loss/train': 1.4356153011322021} -11/07/2021 01:36:48 - INFO - __main__ - Step 30905: {'lr': 0.0004544030783052169, 'samples': 5933760, 'steps': 30904, 'loss/train': 1.6024492979049683} -11/07/2021 01:36:48 - INFO - __main__ - Step 30906: {'lr': 0.0004544000227995253, 'samples': 5933952, 'steps': 30905, 'loss/train': 1.9224432706832886} -11/07/2021 01:36:49 - INFO - __main__ - Step 30907: {'lr': 0.00045439696720173405, 'samples': 5934144, 'steps': 30906, 'loss/train': 1.2479407787322998} -11/07/2021 01:36:50 - INFO - __main__ - Step 30908: {'lr': 0.00045439391151184483, 'samples': 5934336, 'steps': 30907, 'loss/train': 1.609938383102417} -11/07/2021 01:36:50 - INFO - __main__ - Step 30909: {'lr': 0.0004543908557298588, 'samples': 5934528, 'steps': 30908, 'loss/train': 1.8101469278335571} -11/07/2021 01:36:50 - INFO - __main__ - Step 30910: {'lr': 0.0004543877998557775, 'samples': 5934720, 'steps': 30909, 'loss/train': 0.7057313919067383} -11/07/2021 01:36:51 - INFO - __main__ - Step 30911: {'lr': 0.00045438474388960205, 'samples': 5934912, 'steps': 30910, 'loss/train': 1.4680485725402832} -11/07/2021 01:36:52 - INFO - __main__ - Step 30912: {'lr': 0.0004543816878313341, 'samples': 5935104, 'steps': 30911, 'loss/train': 1.6297519207000732} -11/07/2021 01:36:52 - INFO - __main__ - Step 30913: {'lr': 0.0004543786316809749, 'samples': 5935296, 'steps': 30912, 'loss/train': 1.6242061853408813} -11/07/2021 01:36:53 - INFO - __main__ - Step 30914: {'lr': 0.0004543755754385258, 'samples': 5935488, 'steps': 30913, 'loss/train': 1.5210531949996948} -11/07/2021 01:36:53 - INFO - __main__ - Step 30915: {'lr': 0.00045437251910398824, 'samples': 5935680, 'steps': 30914, 'loss/train': 1.4314866065979004} -11/07/2021 01:36:53 - INFO - __main__ - Step 30916: {'lr': 0.00045436946267736364, 'samples': 5935872, 'steps': 30915, 'loss/train': 1.382826805114746} -11/07/2021 01:36:54 - INFO - __main__ - Step 30917: {'lr': 0.0004543664061586532, 'samples': 5936064, 'steps': 30916, 'loss/train': 1.454323649406433} -11/07/2021 01:36:55 - INFO - __main__ - Step 30918: {'lr': 0.00045436334954785854, 'samples': 5936256, 'steps': 30917, 'loss/train': 1.7000982761383057} -11/07/2021 01:36:55 - INFO - __main__ - Step 30919: {'lr': 0.0004543602928449808, 'samples': 5936448, 'steps': 30918, 'loss/train': 1.026580810546875} -11/07/2021 01:36:55 - INFO - __main__ - Step 30920: {'lr': 0.00045435723605002156, 'samples': 5936640, 'steps': 30919, 'loss/train': 1.9266397953033447} -11/07/2021 01:36:56 - INFO - __main__ - Step 30921: {'lr': 0.00045435417916298205, 'samples': 5936832, 'steps': 30920, 'loss/train': 1.4937081336975098} -11/07/2021 01:36:57 - INFO - __main__ - Step 30922: {'lr': 0.00045435112218386364, 'samples': 5937024, 'steps': 30921, 'loss/train': 1.2779721021652222} -11/07/2021 01:36:57 - INFO - __main__ - Step 30923: {'lr': 0.00045434806511266784, 'samples': 5937216, 'steps': 30922, 'loss/train': 2.076853036880493} -11/07/2021 01:36:57 - INFO - __main__ - Step 30924: {'lr': 0.0004543450079493959, 'samples': 5937408, 'steps': 30923, 'loss/train': 1.4119458198547363} -11/07/2021 01:36:58 - INFO - __main__ - Step 30925: {'lr': 0.0004543419506940494, 'samples': 5937600, 'steps': 30924, 'loss/train': 1.425700306892395} -11/07/2021 01:36:58 - INFO - __main__ - Step 30926: {'lr': 0.0004543388933466294, 'samples': 5937792, 'steps': 30925, 'loss/train': 1.519874930381775} -11/07/2021 01:36:58 - INFO - __main__ - Step 30927: {'lr': 0.00045433583590713756, 'samples': 5937984, 'steps': 30926, 'loss/train': 1.5032317638397217} -11/07/2021 01:37:00 - INFO - __main__ - Step 30928: {'lr': 0.0004543327783755751, 'samples': 5938176, 'steps': 30927, 'loss/train': 1.0906578302383423} -11/07/2021 01:37:00 - INFO - __main__ - Step 30929: {'lr': 0.0004543297207519434, 'samples': 5938368, 'steps': 30928, 'loss/train': 1.8797330856323242} -11/07/2021 01:37:00 - INFO - __main__ - Step 30930: {'lr': 0.0004543266630362439, 'samples': 5938560, 'steps': 30929, 'loss/train': 1.2183094024658203} -11/07/2021 01:37:01 - INFO - __main__ - Step 30931: {'lr': 0.00045432360522847803, 'samples': 5938752, 'steps': 30930, 'loss/train': 1.430260419845581} -11/07/2021 01:37:01 - INFO - __main__ - Step 30932: {'lr': 0.000454320547328647, 'samples': 5938944, 'steps': 30931, 'loss/train': 1.7848718166351318} -11/07/2021 01:37:02 - INFO - __main__ - Step 30933: {'lr': 0.00045431748933675236, 'samples': 5939136, 'steps': 30932, 'loss/train': 1.704218864440918} -11/07/2021 01:37:02 - INFO - __main__ - Step 30934: {'lr': 0.00045431443125279534, 'samples': 5939328, 'steps': 30933, 'loss/train': 1.6153076887130737} -11/07/2021 01:37:03 - INFO - __main__ - Step 30935: {'lr': 0.00045431137307677753, 'samples': 5939520, 'steps': 30934, 'loss/train': 1.322769045829773} -11/07/2021 01:37:03 - INFO - __main__ - Step 30936: {'lr': 0.00045430831480870005, 'samples': 5939712, 'steps': 30935, 'loss/train': 2.219740390777588} -11/07/2021 01:37:03 - INFO - __main__ - Step 30937: {'lr': 0.0004543052564485644, 'samples': 5939904, 'steps': 30936, 'loss/train': 1.327895164489746} -11/07/2021 01:37:04 - INFO - __main__ - Step 30938: {'lr': 0.00045430219799637197, 'samples': 5940096, 'steps': 30937, 'loss/train': 1.515455722808838} -11/07/2021 01:37:05 - INFO - __main__ - Step 30939: {'lr': 0.0004542991394521241, 'samples': 5940288, 'steps': 30938, 'loss/train': 2.256800413131714} -11/07/2021 01:37:05 - INFO - __main__ - Step 30940: {'lr': 0.00045429608081582216, 'samples': 5940480, 'steps': 30939, 'loss/train': 1.5054608583450317} -11/07/2021 01:37:06 - INFO - __main__ - Step 30941: {'lr': 0.0004542930220874677, 'samples': 5940672, 'steps': 30940, 'loss/train': 1.8650132417678833} -11/07/2021 01:37:06 - INFO - __main__ - Step 30942: {'lr': 0.00045428996326706185, 'samples': 5940864, 'steps': 30941, 'loss/train': 1.4545024633407593} -11/07/2021 01:37:07 - INFO - __main__ - Step 30943: {'lr': 0.0004542869043546061, 'samples': 5941056, 'steps': 30942, 'loss/train': 1.7451108694076538} -11/07/2021 01:37:07 - INFO - __main__ - Step 30944: {'lr': 0.0004542838453501018, 'samples': 5941248, 'steps': 30943, 'loss/train': 1.6728150844573975} -11/07/2021 01:37:08 - INFO - __main__ - Step 30945: {'lr': 0.0004542807862535504, 'samples': 5941440, 'steps': 30944, 'loss/train': 1.211879014968872} -11/07/2021 01:37:08 - INFO - __main__ - Step 30946: {'lr': 0.0004542777270649533, 'samples': 5941632, 'steps': 30945, 'loss/train': 1.518599033355713} -11/07/2021 01:37:08 - INFO - __main__ - Step 30947: {'lr': 0.0004542746677843117, 'samples': 5941824, 'steps': 30946, 'loss/train': 1.4764024019241333} -11/07/2021 01:37:09 - INFO - __main__ - Step 30948: {'lr': 0.0004542716084116271, 'samples': 5942016, 'steps': 30947, 'loss/train': 1.9140671491622925} -11/07/2021 01:37:10 - INFO - __main__ - Step 30949: {'lr': 0.0004542685489469008, 'samples': 5942208, 'steps': 30948, 'loss/train': 2.9213457107543945} -11/07/2021 01:37:10 - INFO - __main__ - Step 30950: {'lr': 0.0004542654893901344, 'samples': 5942400, 'steps': 30949, 'loss/train': 1.50641667842865} -11/07/2021 01:37:10 - INFO - __main__ - Step 30951: {'lr': 0.00045426242974132904, 'samples': 5942592, 'steps': 30950, 'loss/train': 1.8398200273513794} -11/07/2021 01:37:11 - INFO - __main__ - Step 30952: {'lr': 0.0004542593700004862, 'samples': 5942784, 'steps': 30951, 'loss/train': 1.6665246486663818} -11/07/2021 01:37:11 - INFO - __main__ - Step 30953: {'lr': 0.0004542563101676072, 'samples': 5942976, 'steps': 30952, 'loss/train': 1.343689203262329} -11/07/2021 01:37:12 - INFO - __main__ - Step 30954: {'lr': 0.0004542532502426935, 'samples': 5943168, 'steps': 30953, 'loss/train': 1.6398005485534668} -11/07/2021 01:37:12 - INFO - __main__ - Step 30955: {'lr': 0.0004542501902257464, 'samples': 5943360, 'steps': 30954, 'loss/train': 1.0328978300094604} -11/07/2021 01:37:13 - INFO - __main__ - Step 30956: {'lr': 0.0004542471301167673, 'samples': 5943552, 'steps': 30955, 'loss/train': 1.7728264331817627} -11/07/2021 01:37:13 - INFO - __main__ - Step 30957: {'lr': 0.0004542440699157577, 'samples': 5943744, 'steps': 30956, 'loss/train': 1.5043604373931885} -11/07/2021 01:37:13 - INFO - __main__ - Step 30958: {'lr': 0.00045424100962271883, 'samples': 5943936, 'steps': 30957, 'loss/train': 1.5568513870239258} -11/07/2021 01:37:15 - INFO - __main__ - Step 30959: {'lr': 0.00045423794923765204, 'samples': 5944128, 'steps': 30958, 'loss/train': 1.4711169004440308} -11/07/2021 01:37:15 - INFO - __main__ - Step 30960: {'lr': 0.00045423488876055883, 'samples': 5944320, 'steps': 30959, 'loss/train': 1.6682064533233643} -11/07/2021 01:37:15 - INFO - __main__ - Step 30961: {'lr': 0.00045423182819144054, 'samples': 5944512, 'steps': 30960, 'loss/train': 1.5531412363052368} -11/07/2021 01:37:16 - INFO - __main__ - Step 30962: {'lr': 0.00045422876753029853, 'samples': 5944704, 'steps': 30961, 'loss/train': 1.60807466506958} -11/07/2021 01:37:16 - INFO - __main__ - Step 30963: {'lr': 0.0004542257067771342, 'samples': 5944896, 'steps': 30962, 'loss/train': 1.7051243782043457} -11/07/2021 01:37:17 - INFO - __main__ - Step 30964: {'lr': 0.0004542226459319489, 'samples': 5945088, 'steps': 30963, 'loss/train': 1.5874546766281128} -11/07/2021 01:37:17 - INFO - __main__ - Step 30965: {'lr': 0.000454219584994744, 'samples': 5945280, 'steps': 30964, 'loss/train': 2.2392561435699463} -11/07/2021 01:37:18 - INFO - __main__ - Step 30966: {'lr': 0.00045421652396552094, 'samples': 5945472, 'steps': 30965, 'loss/train': 1.6757169961929321} -11/07/2021 01:37:18 - INFO - __main__ - Step 30967: {'lr': 0.0004542134628442811, 'samples': 5945664, 'steps': 30966, 'loss/train': 1.6425938606262207} -11/07/2021 01:37:18 - INFO - __main__ - Step 30968: {'lr': 0.0004542104016310258, 'samples': 5945856, 'steps': 30967, 'loss/train': 1.8963409662246704} -11/07/2021 01:37:19 - INFO - __main__ - Step 30969: {'lr': 0.0004542073403257564, 'samples': 5946048, 'steps': 30968, 'loss/train': 1.6767983436584473} -11/07/2021 01:37:20 - INFO - __main__ - Step 30970: {'lr': 0.0004542042789284744, 'samples': 5946240, 'steps': 30969, 'loss/train': 1.701396107673645} -11/07/2021 01:37:20 - INFO - __main__ - Step 30971: {'lr': 0.0004542012174391811, 'samples': 5946432, 'steps': 30970, 'loss/train': 1.6189563274383545} -11/07/2021 01:37:21 - INFO - __main__ - Step 30972: {'lr': 0.0004541981558578778, 'samples': 5946624, 'steps': 30971, 'loss/train': 1.6633687019348145} -11/07/2021 01:37:21 - INFO - __main__ - Step 30973: {'lr': 0.00045419509418456603, 'samples': 5946816, 'steps': 30972, 'loss/train': 1.5318022966384888} -11/07/2021 01:37:22 - INFO - __main__ - Step 30974: {'lr': 0.00045419203241924705, 'samples': 5947008, 'steps': 30973, 'loss/train': 1.4163742065429688} -11/07/2021 01:37:22 - INFO - __main__ - Step 30975: {'lr': 0.00045418897056192234, 'samples': 5947200, 'steps': 30974, 'loss/train': 1.6730180978775024} -11/07/2021 01:37:23 - INFO - __main__ - Step 30976: {'lr': 0.00045418590861259317, 'samples': 5947392, 'steps': 30975, 'loss/train': 1.4678789377212524} -11/07/2021 01:37:23 - INFO - __main__ - Step 30977: {'lr': 0.0004541828465712611, 'samples': 5947584, 'steps': 30976, 'loss/train': 1.392598271369934} -11/07/2021 01:37:23 - INFO - __main__ - Step 30978: {'lr': 0.0004541797844379273, 'samples': 5947776, 'steps': 30977, 'loss/train': 1.4600822925567627} -11/07/2021 01:37:24 - INFO - __main__ - Step 30979: {'lr': 0.0004541767222125932, 'samples': 5947968, 'steps': 30978, 'loss/train': 1.5391762256622314} -11/07/2021 01:37:25 - INFO - __main__ - Step 30980: {'lr': 0.0004541736598952603, 'samples': 5948160, 'steps': 30979, 'loss/train': 1.474677324295044} -11/07/2021 01:37:25 - INFO - __main__ - Step 30981: {'lr': 0.0004541705974859298, 'samples': 5948352, 'steps': 30980, 'loss/train': 1.150425672531128} -11/07/2021 01:37:25 - INFO - __main__ - Step 30982: {'lr': 0.0004541675349846033, 'samples': 5948544, 'steps': 30981, 'loss/train': 1.3606353998184204} -11/07/2021 01:37:26 - INFO - __main__ - Step 30983: {'lr': 0.000454164472391282, 'samples': 5948736, 'steps': 30982, 'loss/train': 1.8952081203460693} -11/07/2021 01:37:27 - INFO - __main__ - Step 30984: {'lr': 0.00045416140970596736, 'samples': 5948928, 'steps': 30983, 'loss/train': 1.3433048725128174} -11/07/2021 01:37:27 - INFO - __main__ - Step 30985: {'lr': 0.0004541583469286607, 'samples': 5949120, 'steps': 30984, 'loss/train': 1.4420620203018188} -11/07/2021 01:37:27 - INFO - __main__ - Step 30986: {'lr': 0.00045415528405936347, 'samples': 5949312, 'steps': 30985, 'loss/train': 1.4229804277420044} -11/07/2021 01:37:28 - INFO - __main__ - Step 30987: {'lr': 0.000454152221098077, 'samples': 5949504, 'steps': 30986, 'loss/train': 1.2379319667816162} -11/07/2021 01:37:28 - INFO - __main__ - Step 30988: {'lr': 0.0004541491580448027, 'samples': 5949696, 'steps': 30987, 'loss/train': 1.443123698234558} -11/07/2021 01:37:29 - INFO - __main__ - Step 30989: {'lr': 0.00045414609489954195, 'samples': 5949888, 'steps': 30988, 'loss/train': 1.3216699361801147} -11/07/2021 01:37:29 - INFO - __main__ - Step 30990: {'lr': 0.00045414303166229616, 'samples': 5950080, 'steps': 30989, 'loss/train': 1.2806390523910522} -11/07/2021 01:37:30 - INFO - __main__ - Step 30991: {'lr': 0.0004541399683330666, 'samples': 5950272, 'steps': 30990, 'loss/train': 1.38321053981781} -11/07/2021 01:37:30 - INFO - __main__ - Step 30992: {'lr': 0.00045413690491185476, 'samples': 5950464, 'steps': 30991, 'loss/train': 1.6959577798843384} -11/07/2021 01:37:30 - INFO - __main__ - Step 30993: {'lr': 0.00045413384139866196, 'samples': 5950656, 'steps': 30992, 'loss/train': 1.4465599060058594} -11/07/2021 01:37:31 - INFO - __main__ - Step 30994: {'lr': 0.0004541307777934896, 'samples': 5950848, 'steps': 30993, 'loss/train': 1.340911626815796} -11/07/2021 01:37:32 - INFO - __main__ - Step 30995: {'lr': 0.00045412771409633905, 'samples': 5951040, 'steps': 30994, 'loss/train': 1.0903595685958862} -11/07/2021 01:37:32 - INFO - __main__ - Step 30996: {'lr': 0.0004541246503072117, 'samples': 5951232, 'steps': 30995, 'loss/train': 1.2522296905517578} -11/07/2021 01:37:33 - INFO - __main__ - Step 30997: {'lr': 0.000454121586426109, 'samples': 5951424, 'steps': 30996, 'loss/train': 1.7061339616775513} -11/07/2021 01:37:33 - INFO - __main__ - Step 30998: {'lr': 0.0004541185224530322, 'samples': 5951616, 'steps': 30997, 'loss/train': 1.4970251321792603} -11/07/2021 01:37:33 - INFO - __main__ - Step 30999: {'lr': 0.00045411545838798273, 'samples': 5951808, 'steps': 30998, 'loss/train': 1.1896541118621826} -11/07/2021 01:37:34 - INFO - __main__ - Step 31000: {'lr': 0.00045411239423096206, 'samples': 5952000, 'steps': 30999, 'loss/train': 1.9125195741653442} -11/07/2021 01:37:35 - INFO - __main__ - Step 31001: {'lr': 0.0004541093299819714, 'samples': 5952192, 'steps': 31000, 'loss/train': 1.6603349447250366} -11/07/2021 01:37:35 - INFO - __main__ - Step 31002: {'lr': 0.0004541062656410123, 'samples': 5952384, 'steps': 31001, 'loss/train': 5.856283187866211} -11/07/2021 01:37:35 - INFO - __main__ - Step 31003: {'lr': 0.000454103201208086, 'samples': 5952576, 'steps': 31002, 'loss/train': 1.9771652221679688} -11/07/2021 01:37:36 - INFO - __main__ - Step 31004: {'lr': 0.00045410013668319404, 'samples': 5952768, 'steps': 31003, 'loss/train': 0.9490795135498047} -11/07/2021 01:37:37 - INFO - __main__ - Step 31005: {'lr': 0.00045409707206633764, 'samples': 5952960, 'steps': 31004, 'loss/train': 1.821311354637146} -11/07/2021 01:37:37 - INFO - __main__ - Step 31006: {'lr': 0.0004540940073575183, 'samples': 5953152, 'steps': 31005, 'loss/train': 1.4057084321975708} -11/07/2021 01:37:38 - INFO - __main__ - Step 31007: {'lr': 0.00045409094255673734, 'samples': 5953344, 'steps': 31006, 'loss/train': 1.750818133354187} -11/07/2021 01:37:38 - INFO - __main__ - Step 31008: {'lr': 0.00045408787766399605, 'samples': 5953536, 'steps': 31007, 'loss/train': 1.7356077432632446} -11/07/2021 01:37:38 - INFO - __main__ - Step 31009: {'lr': 0.00045408481267929604, 'samples': 5953728, 'steps': 31008, 'loss/train': 3.454223155975342} -11/07/2021 01:37:39 - INFO - __main__ - Step 31010: {'lr': 0.0004540817476026385, 'samples': 5953920, 'steps': 31009, 'loss/train': 1.6089481115341187} -11/07/2021 01:37:40 - INFO - __main__ - Step 31011: {'lr': 0.00045407868243402483, 'samples': 5954112, 'steps': 31010, 'loss/train': 1.8852707147598267} -11/07/2021 01:37:40 - INFO - __main__ - Step 31012: {'lr': 0.0004540756171734565, 'samples': 5954304, 'steps': 31011, 'loss/train': 1.0137343406677246} -11/07/2021 01:37:40 - INFO - __main__ - Step 31013: {'lr': 0.0004540725518209349, 'samples': 5954496, 'steps': 31012, 'loss/train': 1.3237601518630981} -11/07/2021 01:37:41 - INFO - __main__ - Step 31014: {'lr': 0.0004540694863764613, 'samples': 5954688, 'steps': 31013, 'loss/train': 1.5047588348388672} -11/07/2021 01:37:41 - INFO - __main__ - Step 31015: {'lr': 0.0004540664208400371, 'samples': 5954880, 'steps': 31014, 'loss/train': 1.7855403423309326} -11/07/2021 01:37:42 - INFO - __main__ - Step 31016: {'lr': 0.0004540633552116638, 'samples': 5955072, 'steps': 31015, 'loss/train': 1.128483772277832} -11/07/2021 01:37:43 - INFO - __main__ - Step 31017: {'lr': 0.0004540602894913427, 'samples': 5955264, 'steps': 31016, 'loss/train': 1.2099534273147583} -11/07/2021 01:37:43 - INFO - __main__ - Step 31018: {'lr': 0.0004540572236790751, 'samples': 5955456, 'steps': 31017, 'loss/train': 1.6549265384674072} -11/07/2021 01:37:43 - INFO - __main__ - Step 31019: {'lr': 0.0004540541577748625, 'samples': 5955648, 'steps': 31018, 'loss/train': 1.7200446128845215} -11/07/2021 01:37:44 - INFO - __main__ - Step 31020: {'lr': 0.0004540510917787063, 'samples': 5955840, 'steps': 31019, 'loss/train': 1.4873820543289185} -11/07/2021 01:37:45 - INFO - __main__ - Step 31021: {'lr': 0.00045404802569060776, 'samples': 5956032, 'steps': 31020, 'loss/train': 1.7632642984390259} -11/07/2021 01:37:45 - INFO - __main__ - Step 31022: {'lr': 0.00045404495951056835, 'samples': 5956224, 'steps': 31021, 'loss/train': 1.854540228843689} -11/07/2021 01:37:45 - INFO - __main__ - Step 31023: {'lr': 0.00045404189323858946, 'samples': 5956416, 'steps': 31022, 'loss/train': 1.431431770324707} -11/07/2021 01:37:46 - INFO - __main__ - Step 31024: {'lr': 0.0004540388268746724, 'samples': 5956608, 'steps': 31023, 'loss/train': 1.7353435754776} -11/07/2021 01:37:46 - INFO - __main__ - Step 31025: {'lr': 0.0004540357604188186, 'samples': 5956800, 'steps': 31024, 'loss/train': 1.3156670331954956} -11/07/2021 01:37:47 - INFO - __main__ - Step 31026: {'lr': 0.0004540326938710295, 'samples': 5956992, 'steps': 31025, 'loss/train': 1.1969841718673706} -11/07/2021 01:37:47 - INFO - __main__ - Step 31027: {'lr': 0.0004540296272313064, 'samples': 5957184, 'steps': 31026, 'loss/train': 1.8228636980056763} -11/07/2021 01:37:48 - INFO - __main__ - Step 31028: {'lr': 0.00045402656049965055, 'samples': 5957376, 'steps': 31027, 'loss/train': 1.6666202545166016} -11/07/2021 01:37:48 - INFO - __main__ - Step 31029: {'lr': 0.0004540234936760636, 'samples': 5957568, 'steps': 31028, 'loss/train': 1.6700613498687744} -11/07/2021 01:37:48 - INFO - __main__ - Step 31030: {'lr': 0.00045402042676054684, 'samples': 5957760, 'steps': 31029, 'loss/train': 1.8225733041763306} -11/07/2021 01:37:49 - INFO - __main__ - Step 31031: {'lr': 0.0004540173597531015, 'samples': 5957952, 'steps': 31030, 'loss/train': 1.4744887351989746} -11/07/2021 01:37:50 - INFO - __main__ - Step 31032: {'lr': 0.00045401429265372925, 'samples': 5958144, 'steps': 31031, 'loss/train': 1.3476732969284058} -11/07/2021 01:37:50 - INFO - __main__ - Step 31033: {'lr': 0.0004540112254624312, 'samples': 5958336, 'steps': 31032, 'loss/train': 1.4836091995239258} -11/07/2021 01:37:51 - INFO - __main__ - Step 31034: {'lr': 0.0004540081581792089, 'samples': 5958528, 'steps': 31033, 'loss/train': 1.074027180671692} -11/07/2021 01:37:51 - INFO - __main__ - Step 31035: {'lr': 0.0004540050908040636, 'samples': 5958720, 'steps': 31034, 'loss/train': 1.2955214977264404} -11/07/2021 01:37:51 - INFO - __main__ - Step 31036: {'lr': 0.0004540020233369968, 'samples': 5958912, 'steps': 31035, 'loss/train': 1.5886207818984985} -11/07/2021 01:37:52 - INFO - __main__ - Step 31037: {'lr': 0.00045399895577800985, 'samples': 5959104, 'steps': 31036, 'loss/train': 1.8249047994613647} -11/07/2021 01:37:53 - INFO - __main__ - Step 31038: {'lr': 0.00045399588812710415, 'samples': 5959296, 'steps': 31037, 'loss/train': 1.6218334436416626} -11/07/2021 01:37:53 - INFO - __main__ - Step 31039: {'lr': 0.0004539928203842809, 'samples': 5959488, 'steps': 31038, 'loss/train': 1.527317762374878} -11/07/2021 01:37:53 - INFO - __main__ - Step 31040: {'lr': 0.0004539897525495418, 'samples': 5959680, 'steps': 31039, 'loss/train': 1.6444486379623413} -11/07/2021 01:37:54 - INFO - __main__ - Step 31041: {'lr': 0.0004539866846228879, 'samples': 5959872, 'steps': 31040, 'loss/train': 1.0026158094406128} -11/07/2021 01:37:55 - INFO - __main__ - Step 31042: {'lr': 0.0004539836166043209, 'samples': 5960064, 'steps': 31041, 'loss/train': 1.2307610511779785} -11/07/2021 01:37:55 - INFO - __main__ - Step 31043: {'lr': 0.00045398054849384197, 'samples': 5960256, 'steps': 31042, 'loss/train': 2.5408263206481934} -11/07/2021 01:37:55 - INFO - __main__ - Step 31044: {'lr': 0.0004539774802914526, 'samples': 5960448, 'steps': 31043, 'loss/train': 1.5283260345458984} -11/07/2021 01:37:56 - INFO - __main__ - Step 31045: {'lr': 0.00045397441199715406, 'samples': 5960640, 'steps': 31044, 'loss/train': 1.871448040008545} -11/07/2021 01:37:56 - INFO - __main__ - Step 31046: {'lr': 0.0004539713436109478, 'samples': 5960832, 'steps': 31045, 'loss/train': 2.1768293380737305} -11/07/2021 01:37:57 - INFO - __main__ - Step 31047: {'lr': 0.0004539682751328352, 'samples': 5961024, 'steps': 31046, 'loss/train': 1.7534023523330688} -11/07/2021 01:37:57 - INFO - __main__ - Step 31048: {'lr': 0.0004539652065628177, 'samples': 5961216, 'steps': 31047, 'loss/train': 1.5624446868896484} -11/07/2021 01:37:58 - INFO - __main__ - Step 31049: {'lr': 0.00045396213790089657, 'samples': 5961408, 'steps': 31048, 'loss/train': 2.0577123165130615} -11/07/2021 01:37:58 - INFO - __main__ - Step 31050: {'lr': 0.0004539590691470733, 'samples': 5961600, 'steps': 31049, 'loss/train': 1.3571999073028564} -11/07/2021 01:37:59 - INFO - __main__ - Step 31051: {'lr': 0.0004539560003013492, 'samples': 5961792, 'steps': 31050, 'loss/train': 1.3011759519577026} -11/07/2021 01:38:00 - INFO - __main__ - Step 31052: {'lr': 0.0004539529313637256, 'samples': 5961984, 'steps': 31051, 'loss/train': 1.3227177858352661} -11/07/2021 01:38:00 - INFO - __main__ - Step 31053: {'lr': 0.0004539498623342041, 'samples': 5962176, 'steps': 31052, 'loss/train': 1.3051633834838867} -11/07/2021 01:38:00 - INFO - __main__ - Step 31054: {'lr': 0.0004539467932127858, 'samples': 5962368, 'steps': 31053, 'loss/train': 1.5299521684646606} -11/07/2021 01:38:01 - INFO - __main__ - Step 31055: {'lr': 0.00045394372399947225, 'samples': 5962560, 'steps': 31054, 'loss/train': 1.6661772727966309} -11/07/2021 01:38:01 - INFO - __main__ - Step 31056: {'lr': 0.0004539406546942649, 'samples': 5962752, 'steps': 31055, 'loss/train': 0.8315156102180481} -11/07/2021 01:38:02 - INFO - __main__ - Step 31057: {'lr': 0.00045393758529716497, 'samples': 5962944, 'steps': 31056, 'loss/train': 1.5746870040893555} -11/07/2021 01:38:02 - INFO - __main__ - Step 31058: {'lr': 0.0004539345158081739, 'samples': 5963136, 'steps': 31057, 'loss/train': 1.131955862045288} -11/07/2021 01:38:03 - INFO - __main__ - Step 31059: {'lr': 0.0004539314462272931, 'samples': 5963328, 'steps': 31058, 'loss/train': 5.825372695922852} -11/07/2021 01:38:03 - INFO - __main__ - Step 31060: {'lr': 0.0004539283765545239, 'samples': 5963520, 'steps': 31059, 'loss/train': 1.8322217464447021} -11/07/2021 01:38:03 - INFO - __main__ - Step 31061: {'lr': 0.00045392530678986775, 'samples': 5963712, 'steps': 31060, 'loss/train': 1.517366647720337} -11/07/2021 01:38:04 - INFO - __main__ - Step 31062: {'lr': 0.00045392223693332604, 'samples': 5963904, 'steps': 31061, 'loss/train': 1.5481271743774414} -11/07/2021 01:38:05 - INFO - __main__ - Step 31063: {'lr': 0.0004539191669849001, 'samples': 5964096, 'steps': 31062, 'loss/train': 1.5892140865325928} -11/07/2021 01:38:05 - INFO - __main__ - Step 31064: {'lr': 0.0004539160969445913, 'samples': 5964288, 'steps': 31063, 'loss/train': 1.6205822229385376} -11/07/2021 01:38:06 - INFO - __main__ - Step 31065: {'lr': 0.0004539130268124011, 'samples': 5964480, 'steps': 31064, 'loss/train': 1.731955885887146} -11/07/2021 01:38:06 - INFO - __main__ - Step 31066: {'lr': 0.0004539099565883308, 'samples': 5964672, 'steps': 31065, 'loss/train': 1.4995030164718628} -11/07/2021 01:38:06 - INFO - __main__ - Step 31067: {'lr': 0.0004539068862723818, 'samples': 5964864, 'steps': 31066, 'loss/train': 1.1494752168655396} -11/07/2021 01:38:07 - INFO - __main__ - Step 31068: {'lr': 0.0004539038158645555, 'samples': 5965056, 'steps': 31067, 'loss/train': 1.4408982992172241} -11/07/2021 01:38:08 - INFO - __main__ - Step 31069: {'lr': 0.00045390074536485336, 'samples': 5965248, 'steps': 31068, 'loss/train': 1.6689640283584595} -11/07/2021 01:38:08 - INFO - __main__ - Step 31070: {'lr': 0.00045389767477327657, 'samples': 5965440, 'steps': 31069, 'loss/train': 2.307602643966675} -11/07/2021 01:38:08 - INFO - __main__ - Step 31071: {'lr': 0.00045389460408982676, 'samples': 5965632, 'steps': 31070, 'loss/train': 1.3233267068862915} -11/07/2021 01:38:09 - INFO - __main__ - Step 31072: {'lr': 0.0004538915333145052, 'samples': 5965824, 'steps': 31071, 'loss/train': 1.5080645084381104} -11/07/2021 01:38:09 - INFO - __main__ - Step 31073: {'lr': 0.00045388846244731314, 'samples': 5966016, 'steps': 31072, 'loss/train': 1.944614052772522} -11/07/2021 01:38:10 - INFO - __main__ - Step 31074: {'lr': 0.00045388539148825214, 'samples': 5966208, 'steps': 31073, 'loss/train': 1.272490382194519} -11/07/2021 01:38:10 - INFO - __main__ - Step 31075: {'lr': 0.0004538823204373235, 'samples': 5966400, 'steps': 31074, 'loss/train': 2.0401172637939453} -11/07/2021 01:38:11 - INFO - __main__ - Step 31076: {'lr': 0.00045387924929452873, 'samples': 5966592, 'steps': 31075, 'loss/train': 1.6341118812561035} -11/07/2021 01:38:11 - INFO - __main__ - Step 31077: {'lr': 0.000453876178059869, 'samples': 5966784, 'steps': 31076, 'loss/train': 1.3141553401947021} -11/07/2021 01:38:12 - INFO - __main__ - Step 31078: {'lr': 0.0004538731067333459, 'samples': 5966976, 'steps': 31077, 'loss/train': 1.8784071207046509} -11/07/2021 01:38:13 - INFO - __main__ - Step 31079: {'lr': 0.00045387003531496064, 'samples': 5967168, 'steps': 31078, 'loss/train': 1.3279436826705933} -11/07/2021 01:38:13 - INFO - __main__ - Step 31080: {'lr': 0.00045386696380471473, 'samples': 5967360, 'steps': 31079, 'loss/train': 1.4521465301513672} -11/07/2021 01:38:13 - INFO - __main__ - Step 31081: {'lr': 0.0004538638922026095, 'samples': 5967552, 'steps': 31080, 'loss/train': 1.4966466426849365} -11/07/2021 01:38:14 - INFO - __main__ - Step 31082: {'lr': 0.0004538608205086464, 'samples': 5967744, 'steps': 31081, 'loss/train': 1.457392692565918} -11/07/2021 01:38:14 - INFO - __main__ - Step 31083: {'lr': 0.0004538577487228267, 'samples': 5967936, 'steps': 31082, 'loss/train': 1.7701526880264282} -11/07/2021 01:38:15 - INFO - __main__ - Step 31084: {'lr': 0.00045385467684515193, 'samples': 5968128, 'steps': 31083, 'loss/train': 1.5525671243667603} -11/07/2021 01:38:16 - INFO - __main__ - Step 31085: {'lr': 0.0004538516048756233, 'samples': 5968320, 'steps': 31084, 'loss/train': 1.4492534399032593} -11/07/2021 01:38:16 - INFO - __main__ - Step 31086: {'lr': 0.00045384853281424235, 'samples': 5968512, 'steps': 31085, 'loss/train': 1.1388990879058838} -11/07/2021 01:38:16 - INFO - __main__ - Step 31087: {'lr': 0.0004538454606610103, 'samples': 5968704, 'steps': 31086, 'loss/train': 1.311660647392273} -11/07/2021 01:38:17 - INFO - __main__ - Step 31088: {'lr': 0.0004538423884159287, 'samples': 5968896, 'steps': 31087, 'loss/train': 1.760115146636963} -11/07/2021 01:38:18 - INFO - __main__ - Step 31089: {'lr': 0.0004538393160789988, 'samples': 5969088, 'steps': 31088, 'loss/train': 2.212783098220825} -11/07/2021 01:38:18 - INFO - __main__ - Step 31090: {'lr': 0.0004538362436502221, 'samples': 5969280, 'steps': 31089, 'loss/train': 0.6168873310089111} -11/07/2021 01:38:19 - INFO - __main__ - Step 31091: {'lr': 0.00045383317112959997, 'samples': 5969472, 'steps': 31090, 'loss/train': 0.956122636795044} -11/07/2021 01:38:19 - INFO - __main__ - Step 31092: {'lr': 0.0004538300985171337, 'samples': 5969664, 'steps': 31091, 'loss/train': 1.3800127506256104} -11/07/2021 01:38:19 - INFO - __main__ - Step 31093: {'lr': 0.00045382702581282477, 'samples': 5969856, 'steps': 31092, 'loss/train': 1.537808895111084} -11/07/2021 01:38:20 - INFO - __main__ - Step 31094: {'lr': 0.0004538239530166745, 'samples': 5970048, 'steps': 31093, 'loss/train': 1.8231440782546997} -11/07/2021 01:38:21 - INFO - __main__ - Step 31095: {'lr': 0.0004538208801286843, 'samples': 5970240, 'steps': 31094, 'loss/train': 1.6640911102294922} -11/07/2021 01:38:21 - INFO - __main__ - Step 31096: {'lr': 0.0004538178071488556, 'samples': 5970432, 'steps': 31095, 'loss/train': 0.9510982036590576} -11/07/2021 01:38:21 - INFO - __main__ - Step 31097: {'lr': 0.00045381473407718963, 'samples': 5970624, 'steps': 31096, 'loss/train': 2.8618736267089844} -11/07/2021 01:38:22 - INFO - __main__ - Step 31098: {'lr': 0.000453811660913688, 'samples': 5970816, 'steps': 31097, 'loss/train': 1.8852229118347168} -11/07/2021 01:38:22 - INFO - __main__ - Step 31099: {'lr': 0.000453808587658352, 'samples': 5971008, 'steps': 31098, 'loss/train': 1.3138790130615234} -11/07/2021 01:38:23 - INFO - __main__ - Step 31100: {'lr': 0.0004538055143111829, 'samples': 5971200, 'steps': 31099, 'loss/train': 1.3649941682815552} -11/07/2021 01:38:23 - INFO - __main__ - Step 31101: {'lr': 0.00045380244087218224, 'samples': 5971392, 'steps': 31100, 'loss/train': 1.3116509914398193} -11/07/2021 01:38:24 - INFO - __main__ - Step 31102: {'lr': 0.0004537993673413513, 'samples': 5971584, 'steps': 31101, 'loss/train': 1.72334885597229} -11/07/2021 01:38:24 - INFO - __main__ - Step 31103: {'lr': 0.0004537962937186916, 'samples': 5971776, 'steps': 31102, 'loss/train': 1.065061092376709} -11/07/2021 01:38:24 - INFO - __main__ - Step 31104: {'lr': 0.00045379322000420433, 'samples': 5971968, 'steps': 31103, 'loss/train': 1.550279140472412} -11/07/2021 01:38:25 - INFO - __main__ - Step 31105: {'lr': 0.00045379014619789106, 'samples': 5972160, 'steps': 31104, 'loss/train': 1.6130434274673462} -11/07/2021 01:38:26 - INFO - __main__ - Step 31106: {'lr': 0.00045378707229975303, 'samples': 5972352, 'steps': 31105, 'loss/train': 1.2381612062454224} -11/07/2021 01:38:26 - INFO - __main__ - Step 31107: {'lr': 0.0004537839983097917, 'samples': 5972544, 'steps': 31106, 'loss/train': 1.5743529796600342} -11/07/2021 01:38:26 - INFO - __main__ - Step 31108: {'lr': 0.0004537809242280085, 'samples': 5972736, 'steps': 31107, 'loss/train': 1.7774684429168701} -11/07/2021 01:38:27 - INFO - __main__ - Step 31109: {'lr': 0.0004537778500544047, 'samples': 5972928, 'steps': 31108, 'loss/train': 1.7018706798553467} -11/07/2021 01:38:28 - INFO - __main__ - Step 31110: {'lr': 0.0004537747757889817, 'samples': 5973120, 'steps': 31109, 'loss/train': 1.1860202550888062} -11/07/2021 01:38:28 - INFO - __main__ - Step 31111: {'lr': 0.0004537717014317411, 'samples': 5973312, 'steps': 31110, 'loss/train': 1.3271428346633911} -11/07/2021 01:38:28 - INFO - __main__ - Step 31112: {'lr': 0.00045376862698268393, 'samples': 5973504, 'steps': 31111, 'loss/train': 1.6374403238296509} -11/07/2021 01:38:29 - INFO - __main__ - Step 31113: {'lr': 0.0004537655524418119, 'samples': 5973696, 'steps': 31112, 'loss/train': 1.679964303970337} -11/07/2021 01:38:29 - INFO - __main__ - Step 31114: {'lr': 0.00045376247780912616, 'samples': 5973888, 'steps': 31113, 'loss/train': 1.6255829334259033} -11/07/2021 01:38:30 - INFO - __main__ - Step 31115: {'lr': 0.00045375940308462826, 'samples': 5974080, 'steps': 31114, 'loss/train': 1.6915082931518555} -11/07/2021 01:38:31 - INFO - __main__ - Step 31116: {'lr': 0.00045375632826831947, 'samples': 5974272, 'steps': 31115, 'loss/train': 1.3882372379302979} -11/07/2021 01:38:31 - INFO - __main__ - Step 31117: {'lr': 0.00045375325336020124, 'samples': 5974464, 'steps': 31116, 'loss/train': 1.4284358024597168} -11/07/2021 01:38:31 - INFO - __main__ - Step 31118: {'lr': 0.000453750178360275, 'samples': 5974656, 'steps': 31117, 'loss/train': 1.585280418395996} -11/07/2021 01:38:32 - INFO - __main__ - Step 31119: {'lr': 0.00045374710326854194, 'samples': 5974848, 'steps': 31118, 'loss/train': 1.8023872375488281} -11/07/2021 01:38:33 - INFO - __main__ - Step 31120: {'lr': 0.0004537440280850037, 'samples': 5975040, 'steps': 31119, 'loss/train': 1.4168965816497803} -11/07/2021 01:38:33 - INFO - __main__ - Step 31121: {'lr': 0.00045374095280966147, 'samples': 5975232, 'steps': 31120, 'loss/train': 2.086824417114258} -11/07/2021 01:38:33 - INFO - __main__ - Step 31122: {'lr': 0.00045373787744251677, 'samples': 5975424, 'steps': 31121, 'loss/train': 1.2819502353668213} -11/07/2021 01:38:34 - INFO - __main__ - Step 31123: {'lr': 0.0004537348019835709, 'samples': 5975616, 'steps': 31122, 'loss/train': 1.7239537239074707} -11/07/2021 01:38:34 - INFO - __main__ - Step 31124: {'lr': 0.0004537317264328252, 'samples': 5975808, 'steps': 31123, 'loss/train': 1.7349528074264526} -11/07/2021 01:38:35 - INFO - __main__ - Step 31125: {'lr': 0.00045372865079028123, 'samples': 5976000, 'steps': 31124, 'loss/train': 1.5164841413497925} -11/07/2021 01:38:36 - INFO - __main__ - Step 31126: {'lr': 0.00045372557505594024, 'samples': 5976192, 'steps': 31125, 'loss/train': 1.804694652557373} -11/07/2021 01:38:36 - INFO - __main__ - Step 31127: {'lr': 0.0004537224992298037, 'samples': 5976384, 'steps': 31126, 'loss/train': 1.4712467193603516} -11/07/2021 01:38:36 - INFO - __main__ - Step 31128: {'lr': 0.00045371942331187286, 'samples': 5976576, 'steps': 31127, 'loss/train': 1.8973110914230347} -11/07/2021 01:38:37 - INFO - __main__ - Step 31129: {'lr': 0.00045371634730214923, 'samples': 5976768, 'steps': 31128, 'loss/train': 1.736704707145691} -11/07/2021 01:38:37 - INFO - __main__ - Step 31130: {'lr': 0.00045371327120063417, 'samples': 5976960, 'steps': 31129, 'loss/train': 1.9374653100967407} -11/07/2021 01:38:38 - INFO - __main__ - Step 31131: {'lr': 0.00045371019500732904, 'samples': 5977152, 'steps': 31130, 'loss/train': 1.2832658290863037} -11/07/2021 01:38:39 - INFO - __main__ - Step 31132: {'lr': 0.00045370711872223525, 'samples': 5977344, 'steps': 31131, 'loss/train': 1.8077436685562134} -11/07/2021 01:38:39 - INFO - __main__ - Step 31133: {'lr': 0.00045370404234535414, 'samples': 5977536, 'steps': 31132, 'loss/train': 0.6687050461769104} -11/07/2021 01:38:40 - INFO - __main__ - Step 31134: {'lr': 0.00045370096587668714, 'samples': 5977728, 'steps': 31133, 'loss/train': 1.3561971187591553} -11/07/2021 01:38:40 - INFO - __main__ - Step 31135: {'lr': 0.0004536978893162357, 'samples': 5977920, 'steps': 31134, 'loss/train': 1.6032251119613647} -11/07/2021 01:38:40 - INFO - __main__ - Step 31136: {'lr': 0.000453694812664001, 'samples': 5978112, 'steps': 31135, 'loss/train': 1.2463250160217285} -11/07/2021 01:38:42 - INFO - __main__ - Step 31137: {'lr': 0.00045369173591998466, 'samples': 5978304, 'steps': 31136, 'loss/train': 1.5777970552444458} -11/07/2021 01:38:42 - INFO - __main__ - Step 31138: {'lr': 0.00045368865908418794, 'samples': 5978496, 'steps': 31137, 'loss/train': 1.6632001399993896} -11/07/2021 01:38:42 - INFO - __main__ - Step 31139: {'lr': 0.00045368558215661225, 'samples': 5978688, 'steps': 31138, 'loss/train': 1.4597536325454712} -11/07/2021 01:38:43 - INFO - __main__ - Step 31140: {'lr': 0.00045368250513725896, 'samples': 5978880, 'steps': 31139, 'loss/train': 5.873146057128906} -11/07/2021 01:38:43 - INFO - __main__ - Step 31141: {'lr': 0.00045367942802612953, 'samples': 5979072, 'steps': 31140, 'loss/train': 1.5452513694763184} -11/07/2021 01:38:43 - INFO - __main__ - Step 31142: {'lr': 0.0004536763508232252, 'samples': 5979264, 'steps': 31141, 'loss/train': 1.6367824077606201} -11/07/2021 01:38:44 - INFO - __main__ - Step 31143: {'lr': 0.0004536732735285476, 'samples': 5979456, 'steps': 31142, 'loss/train': 1.359701156616211} -11/07/2021 01:38:46 - INFO - __main__ - Step 31144: {'lr': 0.00045367019614209783, 'samples': 5979648, 'steps': 31143, 'loss/train': 1.3247382640838623} -11/07/2021 01:38:46 - INFO - __main__ - Step 31145: {'lr': 0.0004536671186638775, 'samples': 5979840, 'steps': 31144, 'loss/train': 1.2860476970672607} -11/07/2021 01:38:46 - INFO - __main__ - Step 31146: {'lr': 0.0004536640410938879, 'samples': 5980032, 'steps': 31145, 'loss/train': 0.5325157046318054} -11/07/2021 01:38:47 - INFO - __main__ - Step 31147: {'lr': 0.00045366096343213034, 'samples': 5980224, 'steps': 31146, 'loss/train': 1.368627667427063} -11/07/2021 01:38:47 - INFO - __main__ - Step 31148: {'lr': 0.0004536578856786064, 'samples': 5980416, 'steps': 31147, 'loss/train': 1.343773365020752} -11/07/2021 01:38:48 - INFO - __main__ - Step 31149: {'lr': 0.0004536548078333172, 'samples': 5980608, 'steps': 31148, 'loss/train': 1.6496331691741943} -11/07/2021 01:38:48 - INFO - __main__ - Step 31150: {'lr': 0.0004536517298962645, 'samples': 5980800, 'steps': 31149, 'loss/train': 2.274333953857422} -11/07/2021 01:38:49 - INFO - __main__ - Step 31151: {'lr': 0.00045364865186744936, 'samples': 5980992, 'steps': 31150, 'loss/train': 1.941991925239563} -11/07/2021 01:38:49 - INFO - __main__ - Step 31152: {'lr': 0.0004536455737468733, 'samples': 5981184, 'steps': 31151, 'loss/train': 1.501450538635254} -11/07/2021 01:38:49 - INFO - __main__ - Step 31153: {'lr': 0.00045364249553453764, 'samples': 5981376, 'steps': 31152, 'loss/train': 1.7700766324996948} -11/07/2021 01:38:50 - INFO - __main__ - Step 31154: {'lr': 0.00045363941723044386, 'samples': 5981568, 'steps': 31153, 'loss/train': 1.6942732334136963} -11/07/2021 01:38:51 - INFO - __main__ - Step 31155: {'lr': 0.0004536363388345933, 'samples': 5981760, 'steps': 31154, 'loss/train': 1.6029417514801025} -11/07/2021 01:38:51 - INFO - __main__ - Step 31156: {'lr': 0.0004536332603469873, 'samples': 5981952, 'steps': 31155, 'loss/train': 1.394454836845398} -11/07/2021 01:38:51 - INFO - __main__ - Step 31157: {'lr': 0.0004536301817676274, 'samples': 5982144, 'steps': 31156, 'loss/train': 1.6801949739456177} -11/07/2021 01:38:52 - INFO - __main__ - Step 31158: {'lr': 0.0004536271030965148, 'samples': 5982336, 'steps': 31157, 'loss/train': 1.5780308246612549} -11/07/2021 01:38:53 - INFO - __main__ - Step 31159: {'lr': 0.00045362402433365094, 'samples': 5982528, 'steps': 31158, 'loss/train': 1.2975704669952393} -11/07/2021 01:38:53 - INFO - __main__ - Step 31160: {'lr': 0.0004536209454790373, 'samples': 5982720, 'steps': 31159, 'loss/train': 1.505381464958191} -11/07/2021 01:38:53 - INFO - __main__ - Step 31161: {'lr': 0.00045361786653267517, 'samples': 5982912, 'steps': 31160, 'loss/train': 1.8381296396255493} -11/07/2021 01:38:54 - INFO - __main__ - Step 31162: {'lr': 0.00045361478749456595, 'samples': 5983104, 'steps': 31161, 'loss/train': 1.8032037019729614} -11/07/2021 01:38:54 - INFO - __main__ - Step 31163: {'lr': 0.0004536117083647111, 'samples': 5983296, 'steps': 31162, 'loss/train': 1.577376127243042} -11/07/2021 01:38:54 - INFO - __main__ - Step 31164: {'lr': 0.00045360862914311194, 'samples': 5983488, 'steps': 31163, 'loss/train': 1.6728628873825073} -11/07/2021 01:38:55 - INFO - __main__ - Step 31165: {'lr': 0.0004536055498297699, 'samples': 5983680, 'steps': 31164, 'loss/train': 1.7613489627838135} -11/07/2021 01:38:56 - INFO - __main__ - Step 31166: {'lr': 0.00045360247042468635, 'samples': 5983872, 'steps': 31165, 'loss/train': 1.4214516878128052} -11/07/2021 01:38:56 - INFO - __main__ - Step 31167: {'lr': 0.0004535993909278626, 'samples': 5984064, 'steps': 31166, 'loss/train': 1.4152767658233643} -11/07/2021 01:38:56 - INFO - __main__ - Step 31168: {'lr': 0.00045359631133930016, 'samples': 5984256, 'steps': 31167, 'loss/train': 1.7573238611221313} -11/07/2021 01:38:57 - INFO - __main__ - Step 31169: {'lr': 0.0004535932316590003, 'samples': 5984448, 'steps': 31168, 'loss/train': 1.2462897300720215} -11/07/2021 01:38:58 - INFO - __main__ - Step 31170: {'lr': 0.00045359015188696457, 'samples': 5984640, 'steps': 31169, 'loss/train': 1.7859525680541992} -11/07/2021 01:38:58 - INFO - __main__ - Step 31171: {'lr': 0.00045358707202319414, 'samples': 5984832, 'steps': 31170, 'loss/train': 1.3356480598449707} -11/07/2021 01:38:59 - INFO - __main__ - Step 31172: {'lr': 0.0004535839920676906, 'samples': 5985024, 'steps': 31171, 'loss/train': 1.5641802549362183} -11/07/2021 01:38:59 - INFO - __main__ - Step 31173: {'lr': 0.0004535809120204553, 'samples': 5985216, 'steps': 31172, 'loss/train': 2.0797674655914307} -11/07/2021 01:38:59 - INFO - __main__ - Step 31174: {'lr': 0.0004535778318814895, 'samples': 5985408, 'steps': 31173, 'loss/train': 1.4527065753936768} -11/07/2021 01:39:01 - INFO - __main__ - Step 31175: {'lr': 0.0004535747516507947, 'samples': 5985600, 'steps': 31174, 'loss/train': 1.1287404298782349} -11/07/2021 01:39:01 - INFO - __main__ - Step 31176: {'lr': 0.00045357167132837223, 'samples': 5985792, 'steps': 31175, 'loss/train': 1.2972478866577148} -11/07/2021 01:39:01 - INFO - __main__ - Step 31177: {'lr': 0.00045356859091422354, 'samples': 5985984, 'steps': 31176, 'loss/train': 1.5784897804260254} -11/07/2021 01:39:02 - INFO - __main__ - Step 31178: {'lr': 0.00045356551040835, 'samples': 5986176, 'steps': 31177, 'loss/train': 1.3720043897628784} -11/07/2021 01:39:02 - INFO - __main__ - Step 31179: {'lr': 0.0004535624298107529, 'samples': 5986368, 'steps': 31178, 'loss/train': 1.567328929901123} -11/07/2021 01:39:03 - INFO - __main__ - Step 31180: {'lr': 0.00045355934912143383, 'samples': 5986560, 'steps': 31179, 'loss/train': 1.5847002267837524} -11/07/2021 01:39:03 - INFO - __main__ - Step 31181: {'lr': 0.00045355626834039394, 'samples': 5986752, 'steps': 31180, 'loss/train': 1.4634809494018555} -11/07/2021 01:39:04 - INFO - __main__ - Step 31182: {'lr': 0.00045355318746763477, 'samples': 5986944, 'steps': 31181, 'loss/train': 0.7799688577651978} -11/07/2021 01:39:04 - INFO - __main__ - Step 31183: {'lr': 0.0004535501065031577, 'samples': 5987136, 'steps': 31182, 'loss/train': 1.4410059452056885} -11/07/2021 01:39:04 - INFO - __main__ - Step 31184: {'lr': 0.0004535470254469641, 'samples': 5987328, 'steps': 31183, 'loss/train': 1.0951820611953735} -11/07/2021 01:39:05 - INFO - __main__ - Step 31185: {'lr': 0.00045354394429905534, 'samples': 5987520, 'steps': 31184, 'loss/train': 1.872873306274414} -11/07/2021 01:39:06 - INFO - __main__ - Step 31186: {'lr': 0.0004535408630594328, 'samples': 5987712, 'steps': 31185, 'loss/train': 1.5808696746826172} -11/07/2021 01:39:06 - INFO - __main__ - Step 31187: {'lr': 0.0004535377817280979, 'samples': 5987904, 'steps': 31186, 'loss/train': 1.2969399690628052} -11/07/2021 01:39:06 - INFO - __main__ - Step 31188: {'lr': 0.0004535347003050521, 'samples': 5988096, 'steps': 31187, 'loss/train': 1.254632592201233} -11/07/2021 01:39:07 - INFO - __main__ - Step 31189: {'lr': 0.0004535316187902966, 'samples': 5988288, 'steps': 31188, 'loss/train': 1.425153136253357} -11/07/2021 01:39:07 - INFO - __main__ - Step 31190: {'lr': 0.00045352853718383287, 'samples': 5988480, 'steps': 31189, 'loss/train': 1.2327990531921387} -11/07/2021 01:39:08 - INFO - __main__ - Step 31191: {'lr': 0.00045352545548566235, 'samples': 5988672, 'steps': 31190, 'loss/train': 1.3700438737869263} -11/07/2021 01:39:08 - INFO - __main__ - Step 31192: {'lr': 0.00045352237369578643, 'samples': 5988864, 'steps': 31191, 'loss/train': 1.604499340057373} -11/07/2021 01:39:09 - INFO - __main__ - Step 31193: {'lr': 0.00045351929181420647, 'samples': 5989056, 'steps': 31192, 'loss/train': 1.962519645690918} -11/07/2021 01:39:09 - INFO - __main__ - Step 31194: {'lr': 0.0004535162098409238, 'samples': 5989248, 'steps': 31193, 'loss/train': 2.144946575164795} -11/07/2021 01:39:09 - INFO - __main__ - Step 31195: {'lr': 0.00045351312777593995, 'samples': 5989440, 'steps': 31194, 'loss/train': 1.7803518772125244} -11/07/2021 01:39:11 - INFO - __main__ - Step 31196: {'lr': 0.0004535100456192562, 'samples': 5989632, 'steps': 31195, 'loss/train': 1.4107824563980103} -11/07/2021 01:39:11 - INFO - __main__ - Step 31197: {'lr': 0.00045350696337087396, 'samples': 5989824, 'steps': 31196, 'loss/train': 1.4641228914260864} -11/07/2021 01:39:11 - INFO - __main__ - Step 31198: {'lr': 0.0004535038810307946, 'samples': 5990016, 'steps': 31197, 'loss/train': 0.8417909741401672} -11/07/2021 01:39:12 - INFO - __main__ - Step 31199: {'lr': 0.00045350079859901956, 'samples': 5990208, 'steps': 31198, 'loss/train': 1.6086115837097168} -11/07/2021 01:39:12 - INFO - __main__ - Step 31200: {'lr': 0.00045349771607555017, 'samples': 5990400, 'steps': 31199, 'loss/train': 1.4114199876785278} -11/07/2021 01:39:13 - INFO - __main__ - Step 31201: {'lr': 0.0004534946334603879, 'samples': 5990592, 'steps': 31200, 'loss/train': 1.380301833152771} -11/07/2021 01:39:13 - INFO - __main__ - Step 31202: {'lr': 0.000453491550753534, 'samples': 5990784, 'steps': 31201, 'loss/train': 1.8243534564971924} -11/07/2021 01:39:14 - INFO - __main__ - Step 31203: {'lr': 0.00045348846795499, 'samples': 5990976, 'steps': 31202, 'loss/train': 1.5747188329696655} -11/07/2021 01:39:14 - INFO - __main__ - Step 31204: {'lr': 0.0004534853850647572, 'samples': 5991168, 'steps': 31203, 'loss/train': 0.8451942205429077} -11/07/2021 01:39:14 - INFO - __main__ - Step 31205: {'lr': 0.00045348230208283716, 'samples': 5991360, 'steps': 31204, 'loss/train': 1.8767951726913452} -11/07/2021 01:39:15 - INFO - __main__ - Step 31206: {'lr': 0.000453479219009231, 'samples': 5991552, 'steps': 31205, 'loss/train': 1.5493534803390503} -11/07/2021 01:39:16 - INFO - __main__ - Step 31207: {'lr': 0.00045347613584394034, 'samples': 5991744, 'steps': 31206, 'loss/train': 1.2486952543258667} -11/07/2021 01:39:16 - INFO - __main__ - Step 31208: {'lr': 0.0004534730525869664, 'samples': 5991936, 'steps': 31207, 'loss/train': 0.9741658568382263} -11/07/2021 01:39:17 - INFO - __main__ - Step 31209: {'lr': 0.0004534699692383106, 'samples': 5992128, 'steps': 31208, 'loss/train': 2.1556811332702637} -11/07/2021 01:39:17 - INFO - __main__ - Step 31210: {'lr': 0.00045346688579797444, 'samples': 5992320, 'steps': 31209, 'loss/train': 1.6638199090957642} -11/07/2021 01:39:17 - INFO - __main__ - Step 31211: {'lr': 0.0004534638022659592, 'samples': 5992512, 'steps': 31210, 'loss/train': 2.4656479358673096} -11/07/2021 01:39:18 - INFO - __main__ - Step 31212: {'lr': 0.00045346071864226634, 'samples': 5992704, 'steps': 31211, 'loss/train': 1.1677452325820923} -11/07/2021 01:39:19 - INFO - __main__ - Step 31213: {'lr': 0.0004534576349268973, 'samples': 5992896, 'steps': 31212, 'loss/train': 1.6039478778839111} -11/07/2021 01:39:19 - INFO - __main__ - Step 31214: {'lr': 0.00045345455111985326, 'samples': 5993088, 'steps': 31213, 'loss/train': 2.0135111808776855} -11/07/2021 01:39:19 - INFO - __main__ - Step 31215: {'lr': 0.0004534514672211358, 'samples': 5993280, 'steps': 31214, 'loss/train': 1.1419930458068848} -11/07/2021 01:39:20 - INFO - __main__ - Step 31216: {'lr': 0.0004534483832307462, 'samples': 5993472, 'steps': 31215, 'loss/train': 1.2015453577041626} -11/07/2021 01:39:21 - INFO - __main__ - Step 31217: {'lr': 0.00045344529914868593, 'samples': 5993664, 'steps': 31216, 'loss/train': 1.2807214260101318} -11/07/2021 01:39:21 - INFO - __main__ - Step 31218: {'lr': 0.0004534422149749564, 'samples': 5993856, 'steps': 31217, 'loss/train': 1.241632342338562} -11/07/2021 01:39:22 - INFO - __main__ - Step 31219: {'lr': 0.0004534391307095589, 'samples': 5994048, 'steps': 31218, 'loss/train': 1.4084670543670654} -11/07/2021 01:39:22 - INFO - __main__ - Step 31220: {'lr': 0.0004534360463524948, 'samples': 5994240, 'steps': 31219, 'loss/train': 1.3927873373031616} -11/07/2021 01:39:22 - INFO - __main__ - Step 31221: {'lr': 0.00045343296190376566, 'samples': 5994432, 'steps': 31220, 'loss/train': 1.400227665901184} -11/07/2021 01:39:23 - INFO - __main__ - Step 31222: {'lr': 0.0004534298773633727, 'samples': 5994624, 'steps': 31221, 'loss/train': 1.4523824453353882} -11/07/2021 01:39:24 - INFO - __main__ - Step 31223: {'lr': 0.00045342679273131743, 'samples': 5994816, 'steps': 31222, 'loss/train': 1.671177864074707} -11/07/2021 01:39:24 - INFO - __main__ - Step 31224: {'lr': 0.0004534237080076011, 'samples': 5995008, 'steps': 31223, 'loss/train': 1.8985406160354614} -11/07/2021 01:39:24 - INFO - __main__ - Step 31225: {'lr': 0.0004534206231922253, 'samples': 5995200, 'steps': 31224, 'loss/train': 1.1981773376464844} -11/07/2021 01:39:25 - INFO - __main__ - Step 31226: {'lr': 0.0004534175382851913, 'samples': 5995392, 'steps': 31225, 'loss/train': 1.4175541400909424} -11/07/2021 01:39:26 - INFO - __main__ - Step 31227: {'lr': 0.0004534144532865004, 'samples': 5995584, 'steps': 31226, 'loss/train': 1.29689621925354} -11/07/2021 01:39:26 - INFO - __main__ - Step 31228: {'lr': 0.00045341136819615415, 'samples': 5995776, 'steps': 31227, 'loss/train': 1.5480940341949463} -11/07/2021 01:39:26 - INFO - __main__ - Step 31229: {'lr': 0.0004534082830141538, 'samples': 5995968, 'steps': 31228, 'loss/train': 0.43363645672798157} -11/07/2021 01:39:27 - INFO - __main__ - Step 31230: {'lr': 0.00045340519774050093, 'samples': 5996160, 'steps': 31229, 'loss/train': 1.1463749408721924} -11/07/2021 01:39:27 - INFO - __main__ - Step 31231: {'lr': 0.0004534021123751968, 'samples': 5996352, 'steps': 31230, 'loss/train': 1.552856206893921} -11/07/2021 01:39:29 - INFO - __main__ - Step 31232: {'lr': 0.00045339902691824275, 'samples': 5996544, 'steps': 31231, 'loss/train': 1.4515273571014404} -11/07/2021 01:39:29 - INFO - __main__ - Step 31233: {'lr': 0.0004533959413696402, 'samples': 5996736, 'steps': 31232, 'loss/train': 1.795810341835022} -11/07/2021 01:39:29 - INFO - __main__ - Step 31234: {'lr': 0.0004533928557293907, 'samples': 5996928, 'steps': 31233, 'loss/train': 1.6251254081726074} -11/07/2021 01:39:30 - INFO - __main__ - Step 31235: {'lr': 0.00045338976999749546, 'samples': 5997120, 'steps': 31234, 'loss/train': 0.5078571438789368} -11/07/2021 01:39:30 - INFO - __main__ - Step 31236: {'lr': 0.00045338668417395595, 'samples': 5997312, 'steps': 31235, 'loss/train': 0.497263103723526} -11/07/2021 01:39:30 - INFO - __main__ - Step 31237: {'lr': 0.0004533835982587735, 'samples': 5997504, 'steps': 31236, 'loss/train': 1.6334309577941895} -11/07/2021 01:39:32 - INFO - __main__ - Step 31238: {'lr': 0.00045338051225194954, 'samples': 5997696, 'steps': 31237, 'loss/train': 1.2597155570983887} -11/07/2021 01:39:32 - INFO - __main__ - Step 31239: {'lr': 0.0004533774261534855, 'samples': 5997888, 'steps': 31238, 'loss/train': 1.2250351905822754} -11/07/2021 01:39:32 - INFO - __main__ - Step 31240: {'lr': 0.00045337433996338274, 'samples': 5998080, 'steps': 31239, 'loss/train': 1.5766150951385498} -11/07/2021 01:39:33 - INFO - __main__ - Step 31241: {'lr': 0.0004533712536816426, 'samples': 5998272, 'steps': 31240, 'loss/train': 1.227736234664917} -11/07/2021 01:39:33 - INFO - __main__ - Step 31242: {'lr': 0.0004533681673082665, 'samples': 5998464, 'steps': 31241, 'loss/train': 1.553439974784851} -11/07/2021 01:39:34 - INFO - __main__ - Step 31243: {'lr': 0.00045336508084325587, 'samples': 5998656, 'steps': 31242, 'loss/train': 1.0459153652191162} -11/07/2021 01:39:34 - INFO - __main__ - Step 31244: {'lr': 0.0004533619942866121, 'samples': 5998848, 'steps': 31243, 'loss/train': 1.800862193107605} -11/07/2021 01:39:35 - INFO - __main__ - Step 31245: {'lr': 0.00045335890763833646, 'samples': 5999040, 'steps': 31244, 'loss/train': 2.0331690311431885} -11/07/2021 01:39:35 - INFO - __main__ - Step 31246: {'lr': 0.0004533558208984305, 'samples': 5999232, 'steps': 31245, 'loss/train': 1.387972354888916} -11/07/2021 01:39:35 - INFO - __main__ - Step 31247: {'lr': 0.0004533527340668956, 'samples': 5999424, 'steps': 31246, 'loss/train': 1.293097972869873} -11/07/2021 01:39:36 - INFO - __main__ - Step 31248: {'lr': 0.000453349647143733, 'samples': 5999616, 'steps': 31247, 'loss/train': 0.2818108797073364} -11/07/2021 01:39:37 - INFO - __main__ - Step 31249: {'lr': 0.00045334656012894424, 'samples': 5999808, 'steps': 31248, 'loss/train': 1.0691889524459839} -11/07/2021 01:39:37 - INFO - __main__ - Step 31250: {'lr': 0.00045334347302253064, 'samples': 6000000, 'steps': 31249, 'loss/train': 1.497523307800293} -11/07/2021 01:39:37 - INFO - __main__ - Step 31251: {'lr': 0.00045334038582449355, 'samples': 6000192, 'steps': 31250, 'loss/train': 1.2824853658676147} -11/07/2021 01:39:38 - INFO - __main__ - Step 31252: {'lr': 0.0004533372985348345, 'samples': 6000384, 'steps': 31251, 'loss/train': 1.5305395126342773} -11/07/2021 01:39:39 - INFO - __main__ - Step 31253: {'lr': 0.00045333421115355477, 'samples': 6000576, 'steps': 31252, 'loss/train': 1.006943702697754} -11/07/2021 01:39:39 - INFO - __main__ - Step 31254: {'lr': 0.00045333112368065585, 'samples': 6000768, 'steps': 31253, 'loss/train': 1.5808206796646118} -11/07/2021 01:39:40 - INFO - __main__ - Step 31255: {'lr': 0.00045332803611613896, 'samples': 6000960, 'steps': 31254, 'loss/train': 1.7644098997116089} -11/07/2021 01:39:40 - INFO - __main__ - Step 31256: {'lr': 0.00045332494846000564, 'samples': 6001152, 'steps': 31255, 'loss/train': 1.4161990880966187} -11/07/2021 01:39:40 - INFO - __main__ - Step 31257: {'lr': 0.00045332186071225724, 'samples': 6001344, 'steps': 31256, 'loss/train': 1.2591632604599} -11/07/2021 01:39:41 - INFO - __main__ - Step 31258: {'lr': 0.00045331877287289516, 'samples': 6001536, 'steps': 31257, 'loss/train': 1.2635985612869263} -11/07/2021 01:39:42 - INFO - __main__ - Step 31259: {'lr': 0.00045331568494192076, 'samples': 6001728, 'steps': 31258, 'loss/train': 1.3842456340789795} -11/07/2021 01:39:42 - INFO - __main__ - Step 31260: {'lr': 0.00045331259691933545, 'samples': 6001920, 'steps': 31259, 'loss/train': 1.3079363107681274} -11/07/2021 01:39:42 - INFO - __main__ - Step 31261: {'lr': 0.00045330950880514065, 'samples': 6002112, 'steps': 31260, 'loss/train': 1.3240946531295776} -11/07/2021 01:39:43 - INFO - __main__ - Step 31262: {'lr': 0.0004533064205993377, 'samples': 6002304, 'steps': 31261, 'loss/train': 1.4610227346420288} -11/07/2021 01:39:43 - INFO - __main__ - Step 31263: {'lr': 0.000453303332301928, 'samples': 6002496, 'steps': 31262, 'loss/train': 1.0992581844329834} -11/07/2021 01:39:44 - INFO - __main__ - Step 31264: {'lr': 0.00045330024391291294, 'samples': 6002688, 'steps': 31263, 'loss/train': 1.1758882999420166} -11/07/2021 01:39:44 - INFO - __main__ - Step 31265: {'lr': 0.00045329715543229396, 'samples': 6002880, 'steps': 31264, 'loss/train': 1.224266767501831} -11/07/2021 01:39:45 - INFO - __main__ - Step 31266: {'lr': 0.0004532940668600724, 'samples': 6003072, 'steps': 31265, 'loss/train': 0.8703139424324036} -11/07/2021 01:39:45 - INFO - __main__ - Step 31267: {'lr': 0.00045329097819624966, 'samples': 6003264, 'steps': 31266, 'loss/train': 1.3362345695495605} -11/07/2021 01:39:45 - INFO - __main__ - Step 31268: {'lr': 0.00045328788944082717, 'samples': 6003456, 'steps': 31267, 'loss/train': 1.6372350454330444} -11/07/2021 01:39:46 - INFO - __main__ - Step 31269: {'lr': 0.0004532848005938063, 'samples': 6003648, 'steps': 31268, 'loss/train': 1.5215959548950195} -11/07/2021 01:39:47 - INFO - __main__ - Step 31270: {'lr': 0.0004532817116551884, 'samples': 6003840, 'steps': 31269, 'loss/train': 1.169777512550354} -11/07/2021 01:39:47 - INFO - __main__ - Step 31271: {'lr': 0.00045327862262497495, 'samples': 6004032, 'steps': 31270, 'loss/train': 1.9799604415893555} -11/07/2021 01:39:47 - INFO - __main__ - Step 31272: {'lr': 0.00045327553350316726, 'samples': 6004224, 'steps': 31271, 'loss/train': 1.4954971075057983} -11/07/2021 01:39:48 - INFO - __main__ - Step 31273: {'lr': 0.00045327244428976677, 'samples': 6004416, 'steps': 31272, 'loss/train': 1.5546213388442993} -11/07/2021 01:39:49 - INFO - __main__ - Step 31274: {'lr': 0.00045326935498477477, 'samples': 6004608, 'steps': 31273, 'loss/train': 1.14182448387146} -11/07/2021 01:39:49 - INFO - __main__ - Step 31275: {'lr': 0.00045326626558819284, 'samples': 6004800, 'steps': 31274, 'loss/train': 1.727343201637268} -11/07/2021 01:39:49 - INFO - __main__ - Step 31276: {'lr': 0.00045326317610002223, 'samples': 6004992, 'steps': 31275, 'loss/train': 1.546411395072937} -11/07/2021 01:39:50 - INFO - __main__ - Step 31277: {'lr': 0.00045326008652026435, 'samples': 6005184, 'steps': 31276, 'loss/train': 1.3291178941726685} -11/07/2021 01:39:50 - INFO - __main__ - Step 31278: {'lr': 0.00045325699684892065, 'samples': 6005376, 'steps': 31277, 'loss/train': 1.491533875465393} -11/07/2021 01:39:51 - INFO - __main__ - Step 31279: {'lr': 0.00045325390708599245, 'samples': 6005568, 'steps': 31278, 'loss/train': 1.7529364824295044} -11/07/2021 01:39:52 - INFO - __main__ - Step 31280: {'lr': 0.0004532508172314812, 'samples': 6005760, 'steps': 31279, 'loss/train': 2.064553737640381} -11/07/2021 01:39:52 - INFO - __main__ - Step 31281: {'lr': 0.0004532477272853882, 'samples': 6005952, 'steps': 31280, 'loss/train': 1.5577925443649292} -11/07/2021 01:39:52 - INFO - __main__ - Step 31282: {'lr': 0.000453244637247715, 'samples': 6006144, 'steps': 31281, 'loss/train': 0.903304934501648} -11/07/2021 01:39:53 - INFO - __main__ - Step 31283: {'lr': 0.0004532415471184629, 'samples': 6006336, 'steps': 31282, 'loss/train': 1.596295952796936} -11/07/2021 01:39:54 - INFO - __main__ - Step 31284: {'lr': 0.0004532384568976332, 'samples': 6006528, 'steps': 31283, 'loss/train': 1.7317078113555908} -11/07/2021 01:39:54 - INFO - __main__ - Step 31285: {'lr': 0.00045323536658522747, 'samples': 6006720, 'steps': 31284, 'loss/train': 1.4143906831741333} -11/07/2021 01:39:55 - INFO - __main__ - Step 31286: {'lr': 0.00045323227618124695, 'samples': 6006912, 'steps': 31285, 'loss/train': 1.4001790285110474} -11/07/2021 01:39:55 - INFO - __main__ - Step 31287: {'lr': 0.00045322918568569315, 'samples': 6007104, 'steps': 31286, 'loss/train': 1.453641414642334} -11/07/2021 01:39:55 - INFO - __main__ - Step 31288: {'lr': 0.0004532260950985675, 'samples': 6007296, 'steps': 31287, 'loss/train': 1.6401914358139038} -11/07/2021 01:39:56 - INFO - __main__ - Step 31289: {'lr': 0.0004532230044198712, 'samples': 6007488, 'steps': 31288, 'loss/train': 1.590362787246704} -11/07/2021 01:39:57 - INFO - __main__ - Step 31290: {'lr': 0.00045321991364960577, 'samples': 6007680, 'steps': 31289, 'loss/train': 1.0576629638671875} -11/07/2021 01:39:57 - INFO - __main__ - Step 31291: {'lr': 0.00045321682278777253, 'samples': 6007872, 'steps': 31290, 'loss/train': 1.9191278219223022} -11/07/2021 01:39:57 - INFO - __main__ - Step 31292: {'lr': 0.00045321373183437305, 'samples': 6008064, 'steps': 31291, 'loss/train': 1.0246641635894775} -11/07/2021 01:39:58 - INFO - __main__ - Step 31293: {'lr': 0.0004532106407894085, 'samples': 6008256, 'steps': 31292, 'loss/train': 2.011497974395752} -11/07/2021 01:39:59 - INFO - __main__ - Step 31294: {'lr': 0.0004532075496528804, 'samples': 6008448, 'steps': 31293, 'loss/train': 1.4250741004943848} -11/07/2021 01:39:59 - INFO - __main__ - Step 31295: {'lr': 0.0004532044584247901, 'samples': 6008640, 'steps': 31294, 'loss/train': 1.4246947765350342} -11/07/2021 01:39:59 - INFO - __main__ - Step 31296: {'lr': 0.00045320136710513907, 'samples': 6008832, 'steps': 31295, 'loss/train': 1.3835338354110718} -11/07/2021 01:40:00 - INFO - __main__ - Step 31297: {'lr': 0.00045319827569392855, 'samples': 6009024, 'steps': 31296, 'loss/train': 1.537290096282959} -11/07/2021 01:40:00 - INFO - __main__ - Step 31298: {'lr': 0.00045319518419116014, 'samples': 6009216, 'steps': 31297, 'loss/train': 1.195200800895691} -11/07/2021 01:40:00 - INFO - __main__ - Step 31299: {'lr': 0.00045319209259683503, 'samples': 6009408, 'steps': 31298, 'loss/train': 1.696137547492981} -11/07/2021 01:40:02 - INFO - __main__ - Step 31300: {'lr': 0.0004531890009109547, 'samples': 6009600, 'steps': 31299, 'loss/train': 1.2820237874984741} -11/07/2021 01:40:02 - INFO - __main__ - Step 31301: {'lr': 0.0004531859091335205, 'samples': 6009792, 'steps': 31300, 'loss/train': 1.8485389947891235} -11/07/2021 01:40:02 - INFO - __main__ - Step 31302: {'lr': 0.00045318281726453393, 'samples': 6009984, 'steps': 31301, 'loss/train': 2.0493111610412598} -11/07/2021 01:40:03 - INFO - __main__ - Step 31303: {'lr': 0.00045317972530399634, 'samples': 6010176, 'steps': 31302, 'loss/train': 1.545304536819458} -11/07/2021 01:40:03 - INFO - __main__ - Step 31304: {'lr': 0.00045317663325190904, 'samples': 6010368, 'steps': 31303, 'loss/train': 1.0387685298919678} -11/07/2021 01:40:04 - INFO - __main__ - Step 31305: {'lr': 0.00045317354110827344, 'samples': 6010560, 'steps': 31304, 'loss/train': 1.1423134803771973} -11/07/2021 01:40:05 - INFO - __main__ - Step 31306: {'lr': 0.0004531704488730911, 'samples': 6010752, 'steps': 31305, 'loss/train': 1.5734665393829346} -11/07/2021 01:40:05 - INFO - __main__ - Step 31307: {'lr': 0.0004531673565463632, 'samples': 6010944, 'steps': 31306, 'loss/train': 1.2878657579421997} -11/07/2021 01:40:05 - INFO - __main__ - Step 31308: {'lr': 0.0004531642641280913, 'samples': 6011136, 'steps': 31307, 'loss/train': 1.762477159500122} -11/07/2021 01:40:06 - INFO - __main__ - Step 31309: {'lr': 0.0004531611716182767, 'samples': 6011328, 'steps': 31308, 'loss/train': 1.5436822175979614} -11/07/2021 01:40:07 - INFO - __main__ - Step 31310: {'lr': 0.0004531580790169207, 'samples': 6011520, 'steps': 31309, 'loss/train': 1.662217140197754} -11/07/2021 01:40:07 - INFO - __main__ - Step 31311: {'lr': 0.00045315498632402494, 'samples': 6011712, 'steps': 31310, 'loss/train': 1.181226372718811} -11/07/2021 01:40:07 - INFO - __main__ - Step 31312: {'lr': 0.0004531518935395906, 'samples': 6011904, 'steps': 31311, 'loss/train': 1.003279685974121} -11/07/2021 01:40:08 - INFO - __main__ - Step 31313: {'lr': 0.00045314880066361923, 'samples': 6012096, 'steps': 31312, 'loss/train': 1.1623375415802002} -11/07/2021 01:40:08 - INFO - __main__ - Step 31314: {'lr': 0.00045314570769611207, 'samples': 6012288, 'steps': 31313, 'loss/train': 3.8758158683776855} -11/07/2021 01:40:09 - INFO - __main__ - Step 31315: {'lr': 0.00045314261463707064, 'samples': 6012480, 'steps': 31314, 'loss/train': 0.8304257392883301} -11/07/2021 01:40:10 - INFO - __main__ - Step 31316: {'lr': 0.00045313952148649626, 'samples': 6012672, 'steps': 31315, 'loss/train': 1.7472083568572998} -11/07/2021 01:40:10 - INFO - __main__ - Step 31317: {'lr': 0.0004531364282443904, 'samples': 6012864, 'steps': 31316, 'loss/train': 1.6921648979187012} -11/07/2021 01:40:10 - INFO - __main__ - Step 31318: {'lr': 0.00045313333491075433, 'samples': 6013056, 'steps': 31317, 'loss/train': 1.840403437614441} -11/07/2021 01:40:11 - INFO - __main__ - Step 31319: {'lr': 0.0004531302414855895, 'samples': 6013248, 'steps': 31318, 'loss/train': 1.498241662979126} -11/07/2021 01:40:11 - INFO - __main__ - Step 31320: {'lr': 0.0004531271479688974, 'samples': 6013440, 'steps': 31319, 'loss/train': 1.4011257886886597} -11/07/2021 01:40:12 - INFO - __main__ - Step 31321: {'lr': 0.00045312405436067927, 'samples': 6013632, 'steps': 31320, 'loss/train': 1.671433687210083} -11/07/2021 01:40:12 - INFO - __main__ - Step 31322: {'lr': 0.00045312096066093654, 'samples': 6013824, 'steps': 31321, 'loss/train': 1.430420994758606} -11/07/2021 01:40:13 - INFO - __main__ - Step 31323: {'lr': 0.0004531178668696707, 'samples': 6014016, 'steps': 31322, 'loss/train': 1.492526650428772} -11/07/2021 01:40:13 - INFO - __main__ - Step 31324: {'lr': 0.00045311477298688306, 'samples': 6014208, 'steps': 31323, 'loss/train': 1.6847875118255615} -11/07/2021 01:40:14 - INFO - __main__ - Step 31325: {'lr': 0.0004531116790125751, 'samples': 6014400, 'steps': 31324, 'loss/train': 1.22118079662323} -11/07/2021 01:40:15 - INFO - __main__ - Step 31326: {'lr': 0.00045310858494674813, 'samples': 6014592, 'steps': 31325, 'loss/train': 1.5117628574371338} -11/07/2021 01:40:15 - INFO - __main__ - Step 31327: {'lr': 0.00045310549078940356, 'samples': 6014784, 'steps': 31326, 'loss/train': 1.5198588371276855} -11/07/2021 01:40:15 - INFO - __main__ - Step 31328: {'lr': 0.00045310239654054274, 'samples': 6014976, 'steps': 31327, 'loss/train': 1.6896679401397705} -11/07/2021 01:40:16 - INFO - __main__ - Step 31329: {'lr': 0.0004530993022001672, 'samples': 6015168, 'steps': 31328, 'loss/train': 2.6464505195617676} -11/07/2021 01:40:16 - INFO - __main__ - Step 31330: {'lr': 0.00045309620776827817, 'samples': 6015360, 'steps': 31329, 'loss/train': 1.5829106569290161} -11/07/2021 01:40:17 - INFO - __main__ - Step 31331: {'lr': 0.00045309311324487713, 'samples': 6015552, 'steps': 31330, 'loss/train': 1.3637856245040894} -11/07/2021 01:40:17 - INFO - __main__ - Step 31332: {'lr': 0.0004530900186299655, 'samples': 6015744, 'steps': 31331, 'loss/train': 1.5064327716827393} -11/07/2021 01:40:18 - INFO - __main__ - Step 31333: {'lr': 0.0004530869239235446, 'samples': 6015936, 'steps': 31332, 'loss/train': 1.8033262491226196} -11/07/2021 01:40:18 - INFO - __main__ - Step 31334: {'lr': 0.0004530838291256159, 'samples': 6016128, 'steps': 31333, 'loss/train': 1.8291977643966675} -11/07/2021 01:40:18 - INFO - __main__ - Step 31335: {'lr': 0.0004530807342361807, 'samples': 6016320, 'steps': 31334, 'loss/train': 2.119213581085205} -11/07/2021 01:40:19 - INFO - __main__ - Step 31336: {'lr': 0.0004530776392552406, 'samples': 6016512, 'steps': 31335, 'loss/train': 1.0838651657104492} -11/07/2021 01:40:20 - INFO - __main__ - Step 31337: {'lr': 0.0004530745441827967, 'samples': 6016704, 'steps': 31336, 'loss/train': 1.8087306022644043} -11/07/2021 01:40:20 - INFO - __main__ - Step 31338: {'lr': 0.0004530714490188506, 'samples': 6016896, 'steps': 31337, 'loss/train': 1.5076483488082886} -11/07/2021 01:40:21 - INFO - __main__ - Step 31339: {'lr': 0.00045306835376340366, 'samples': 6017088, 'steps': 31338, 'loss/train': 1.6746957302093506} -11/07/2021 01:40:21 - INFO - __main__ - Step 31340: {'lr': 0.00045306525841645723, 'samples': 6017280, 'steps': 31339, 'loss/train': 1.0600357055664062} -11/07/2021 01:40:21 - INFO - __main__ - Step 31341: {'lr': 0.0004530621629780127, 'samples': 6017472, 'steps': 31340, 'loss/train': 1.423075795173645} -11/07/2021 01:40:22 - INFO - __main__ - Step 31342: {'lr': 0.00045305906744807156, 'samples': 6017664, 'steps': 31341, 'loss/train': 1.7189316749572754} -11/07/2021 01:40:23 - INFO - __main__ - Step 31343: {'lr': 0.0004530559718266351, 'samples': 6017856, 'steps': 31342, 'loss/train': 1.5785162448883057} -11/07/2021 01:40:23 - INFO - __main__ - Step 31344: {'lr': 0.0004530528761137047, 'samples': 6018048, 'steps': 31343, 'loss/train': 1.2819000482559204} -11/07/2021 01:40:23 - INFO - __main__ - Step 31345: {'lr': 0.0004530497803092819, 'samples': 6018240, 'steps': 31344, 'loss/train': 1.6384159326553345} -11/07/2021 01:40:24 - INFO - __main__ - Step 31346: {'lr': 0.000453046684413368, 'samples': 6018432, 'steps': 31345, 'loss/train': 1.8902775049209595} -11/07/2021 01:40:25 - INFO - __main__ - Step 31347: {'lr': 0.0004530435884259644, 'samples': 6018624, 'steps': 31346, 'loss/train': 1.60947847366333} -11/07/2021 01:40:25 - INFO - __main__ - Step 31348: {'lr': 0.0004530404923470724, 'samples': 6018816, 'steps': 31347, 'loss/train': 1.114456295967102} -11/07/2021 01:40:25 - INFO - __main__ - Step 31349: {'lr': 0.0004530373961766935, 'samples': 6019008, 'steps': 31348, 'loss/train': 1.5226140022277832} -11/07/2021 01:40:26 - INFO - __main__ - Step 31350: {'lr': 0.00045303429991482914, 'samples': 6019200, 'steps': 31349, 'loss/train': 1.4229016304016113} -11/07/2021 01:40:26 - INFO - __main__ - Step 31351: {'lr': 0.00045303120356148067, 'samples': 6019392, 'steps': 31350, 'loss/train': 1.539341688156128} -11/07/2021 01:40:27 - INFO - __main__ - Step 31352: {'lr': 0.00045302810711664944, 'samples': 6019584, 'steps': 31351, 'loss/train': 1.164172649383545} -11/07/2021 01:40:27 - INFO - __main__ - Step 31353: {'lr': 0.00045302501058033687, 'samples': 6019776, 'steps': 31352, 'loss/train': 1.0640827417373657} -11/07/2021 01:40:28 - INFO - __main__ - Step 31354: {'lr': 0.0004530219139525444, 'samples': 6019968, 'steps': 31353, 'loss/train': 1.6237752437591553} -11/07/2021 01:40:28 - INFO - __main__ - Step 31355: {'lr': 0.0004530188172332733, 'samples': 6020160, 'steps': 31354, 'loss/train': 1.6850532293319702} -11/07/2021 01:40:28 - INFO - __main__ - Step 31356: {'lr': 0.00045301572042252516, 'samples': 6020352, 'steps': 31355, 'loss/train': 0.7566108703613281} -11/07/2021 01:40:30 - INFO - __main__ - Step 31357: {'lr': 0.00045301262352030123, 'samples': 6020544, 'steps': 31356, 'loss/train': 1.6130330562591553} -11/07/2021 01:40:30 - INFO - __main__ - Step 31358: {'lr': 0.00045300952652660296, 'samples': 6020736, 'steps': 31357, 'loss/train': 2.542454481124878} -11/07/2021 01:40:30 - INFO - __main__ - Step 31359: {'lr': 0.0004530064294414317, 'samples': 6020928, 'steps': 31358, 'loss/train': 1.5415786504745483} -11/07/2021 01:40:31 - INFO - __main__ - Step 31360: {'lr': 0.00045300333226478887, 'samples': 6021120, 'steps': 31359, 'loss/train': 1.4599359035491943} -11/07/2021 01:40:31 - INFO - __main__ - Step 31361: {'lr': 0.0004530002349966759, 'samples': 6021312, 'steps': 31360, 'loss/train': 1.840524435043335} -11/07/2021 01:40:31 - INFO - __main__ - Step 31362: {'lr': 0.0004529971376370941, 'samples': 6021504, 'steps': 31361, 'loss/train': 2.0179741382598877} -11/07/2021 01:40:32 - INFO - __main__ - Step 31363: {'lr': 0.00045299404018604494, 'samples': 6021696, 'steps': 31362, 'loss/train': 1.009627103805542} -11/07/2021 01:40:33 - INFO - __main__ - Step 31364: {'lr': 0.00045299094264352987, 'samples': 6021888, 'steps': 31363, 'loss/train': 1.5297051668167114} -11/07/2021 01:40:33 - INFO - __main__ - Step 31365: {'lr': 0.00045298784500955014, 'samples': 6022080, 'steps': 31364, 'loss/train': 1.5274115800857544} -11/07/2021 01:40:33 - INFO - __main__ - Step 31366: {'lr': 0.0004529847472841073, 'samples': 6022272, 'steps': 31365, 'loss/train': 1.376988410949707} -11/07/2021 01:40:34 - INFO - __main__ - Step 31367: {'lr': 0.00045298164946720254, 'samples': 6022464, 'steps': 31366, 'loss/train': 1.6952353715896606} -11/07/2021 01:40:35 - INFO - __main__ - Step 31368: {'lr': 0.0004529785515588375, 'samples': 6022656, 'steps': 31367, 'loss/train': 1.6672512292861938} -11/07/2021 01:40:35 - INFO - __main__ - Step 31369: {'lr': 0.00045297545355901336, 'samples': 6022848, 'steps': 31368, 'loss/train': 1.4154484272003174} -11/07/2021 01:40:35 - INFO - __main__ - Step 31370: {'lr': 0.00045297235546773175, 'samples': 6023040, 'steps': 31369, 'loss/train': 1.7862539291381836} -11/07/2021 01:40:36 - INFO - __main__ - Step 31371: {'lr': 0.0004529692572849938, 'samples': 6023232, 'steps': 31370, 'loss/train': 1.7392520904541016} -11/07/2021 01:40:36 - INFO - __main__ - Step 31372: {'lr': 0.00045296615901080107, 'samples': 6023424, 'steps': 31371, 'loss/train': 1.8784608840942383} -11/07/2021 01:40:37 - INFO - __main__ - Step 31373: {'lr': 0.00045296306064515493, 'samples': 6023616, 'steps': 31372, 'loss/train': 1.1499531269073486} -11/07/2021 01:40:38 - INFO - __main__ - Step 31374: {'lr': 0.0004529599621880567, 'samples': 6023808, 'steps': 31373, 'loss/train': 2.2191970348358154} -11/07/2021 01:40:38 - INFO - __main__ - Step 31375: {'lr': 0.00045295686363950796, 'samples': 6024000, 'steps': 31374, 'loss/train': 1.522124171257019} -11/07/2021 01:40:38 - INFO - __main__ - Step 31376: {'lr': 0.0004529537649995099, 'samples': 6024192, 'steps': 31375, 'loss/train': 1.51448392868042} -11/07/2021 01:40:39 - INFO - __main__ - Step 31377: {'lr': 0.0004529506662680641, 'samples': 6024384, 'steps': 31376, 'loss/train': 1.0709054470062256} -11/07/2021 01:40:40 - INFO - __main__ - Step 31378: {'lr': 0.00045294756744517173, 'samples': 6024576, 'steps': 31377, 'loss/train': 1.801628828048706} -11/07/2021 01:40:40 - INFO - __main__ - Step 31379: {'lr': 0.00045294446853083446, 'samples': 6024768, 'steps': 31378, 'loss/train': 1.7513327598571777} -11/07/2021 01:40:41 - INFO - __main__ - Step 31380: {'lr': 0.00045294136952505346, 'samples': 6024960, 'steps': 31379, 'loss/train': 1.8567157983779907} -11/07/2021 01:40:41 - INFO - __main__ - Step 31381: {'lr': 0.0004529382704278302, 'samples': 6025152, 'steps': 31380, 'loss/train': 1.5834095478057861} -11/07/2021 01:40:41 - INFO - __main__ - Step 31382: {'lr': 0.0004529351712391661, 'samples': 6025344, 'steps': 31381, 'loss/train': 1.2147400379180908} -11/07/2021 01:40:42 - INFO - __main__ - Step 31383: {'lr': 0.0004529320719590626, 'samples': 6025536, 'steps': 31382, 'loss/train': 1.2692679166793823} -11/07/2021 01:40:43 - INFO - __main__ - Step 31384: {'lr': 0.00045292897258752095, 'samples': 6025728, 'steps': 31383, 'loss/train': 5.561633110046387} -11/07/2021 01:40:43 - INFO - __main__ - Step 31385: {'lr': 0.0004529258731245427, 'samples': 6025920, 'steps': 31384, 'loss/train': 0.9220340847969055} -11/07/2021 01:40:43 - INFO - __main__ - Step 31386: {'lr': 0.0004529227735701291, 'samples': 6026112, 'steps': 31385, 'loss/train': 1.5717658996582031} -11/07/2021 01:40:44 - INFO - __main__ - Step 31387: {'lr': 0.00045291967392428175, 'samples': 6026304, 'steps': 31386, 'loss/train': 1.629934310913086} -11/07/2021 01:40:44 - INFO - __main__ - Step 31388: {'lr': 0.0004529165741870018, 'samples': 6026496, 'steps': 31387, 'loss/train': 1.2687602043151855} -11/07/2021 01:40:45 - INFO - __main__ - Step 31389: {'lr': 0.00045291347435829087, 'samples': 6026688, 'steps': 31388, 'loss/train': 1.2830164432525635} -11/07/2021 01:40:45 - INFO - __main__ - Step 31390: {'lr': 0.0004529103744381503, 'samples': 6026880, 'steps': 31389, 'loss/train': 1.6968694925308228} -11/07/2021 01:40:46 - INFO - __main__ - Step 31391: {'lr': 0.0004529072744265813, 'samples': 6027072, 'steps': 31390, 'loss/train': 1.6593273878097534} -11/07/2021 01:40:46 - INFO - __main__ - Step 31392: {'lr': 0.00045290417432358553, 'samples': 6027264, 'steps': 31391, 'loss/train': 1.7551089525222778} -11/07/2021 01:40:46 - INFO - __main__ - Step 31393: {'lr': 0.00045290107412916425, 'samples': 6027456, 'steps': 31392, 'loss/train': 1.7737340927124023} -11/07/2021 01:40:47 - INFO - __main__ - Step 31394: {'lr': 0.0004528979738433189, 'samples': 6027648, 'steps': 31393, 'loss/train': 1.4928796291351318} -11/07/2021 01:40:48 - INFO - __main__ - Step 31395: {'lr': 0.00045289487346605075, 'samples': 6027840, 'steps': 31394, 'loss/train': 1.5345834493637085} -11/07/2021 01:40:48 - INFO - __main__ - Step 31396: {'lr': 0.0004528917729973614, 'samples': 6028032, 'steps': 31395, 'loss/train': 1.5296452045440674} -11/07/2021 01:40:49 - INFO - __main__ - Step 31397: {'lr': 0.00045288867243725207, 'samples': 6028224, 'steps': 31396, 'loss/train': 0.6855195760726929} -11/07/2021 01:40:49 - INFO - __main__ - Step 31398: {'lr': 0.00045288557178572433, 'samples': 6028416, 'steps': 31397, 'loss/train': 1.5773770809173584} -11/07/2021 01:40:50 - INFO - __main__ - Step 31399: {'lr': 0.00045288247104277937, 'samples': 6028608, 'steps': 31398, 'loss/train': 1.0291240215301514} -11/07/2021 01:40:50 - INFO - __main__ - Step 31400: {'lr': 0.0004528793702084187, 'samples': 6028800, 'steps': 31399, 'loss/train': 1.807216763496399} -11/07/2021 01:40:51 - INFO - __main__ - Step 31401: {'lr': 0.0004528762692826439, 'samples': 6028992, 'steps': 31400, 'loss/train': 1.1373130083084106} -11/07/2021 01:40:51 - INFO - __main__ - Step 31402: {'lr': 0.000452873168265456, 'samples': 6029184, 'steps': 31401, 'loss/train': 1.3746041059494019} -11/07/2021 01:40:51 - INFO - __main__ - Step 31403: {'lr': 0.00045287006715685665, 'samples': 6029376, 'steps': 31402, 'loss/train': 1.6347107887268066} -11/07/2021 01:40:52 - INFO - __main__ - Step 31404: {'lr': 0.0004528669659568472, 'samples': 6029568, 'steps': 31403, 'loss/train': 1.9266588687896729} -11/07/2021 01:40:53 - INFO - __main__ - Step 31405: {'lr': 0.00045286386466542896, 'samples': 6029760, 'steps': 31404, 'loss/train': 0.9506607055664062} -11/07/2021 01:40:53 - INFO - __main__ - Step 31406: {'lr': 0.0004528607632826034, 'samples': 6029952, 'steps': 31405, 'loss/train': 1.502123236656189} -11/07/2021 01:40:53 - INFO - __main__ - Step 31407: {'lr': 0.00045285766180837197, 'samples': 6030144, 'steps': 31406, 'loss/train': 1.4770770072937012} -11/07/2021 01:40:54 - INFO - __main__ - Step 31408: {'lr': 0.000452854560242736, 'samples': 6030336, 'steps': 31407, 'loss/train': 1.152550458908081} -11/07/2021 01:40:54 - INFO - __main__ - Step 31409: {'lr': 0.0004528514585856968, 'samples': 6030528, 'steps': 31408, 'loss/train': 1.5592893362045288} -11/07/2021 01:40:55 - INFO - __main__ - Step 31410: {'lr': 0.0004528483568372559, 'samples': 6030720, 'steps': 31409, 'loss/train': 1.3015888929367065} -11/07/2021 01:40:55 - INFO - __main__ - Step 31411: {'lr': 0.00045284525499741474, 'samples': 6030912, 'steps': 31410, 'loss/train': 1.7930604219436646} -11/07/2021 01:40:56 - INFO - __main__ - Step 31412: {'lr': 0.0004528421530661746, 'samples': 6031104, 'steps': 31411, 'loss/train': 1.5233491659164429} -11/07/2021 01:40:56 - INFO - __main__ - Step 31413: {'lr': 0.0004528390510435368, 'samples': 6031296, 'steps': 31412, 'loss/train': 1.2986992597579956} -11/07/2021 01:40:56 - INFO - __main__ - Step 31414: {'lr': 0.0004528359489295031, 'samples': 6031488, 'steps': 31413, 'loss/train': 1.3755381107330322} -11/07/2021 01:40:58 - INFO - __main__ - Step 31415: {'lr': 0.00045283284672407444, 'samples': 6031680, 'steps': 31414, 'loss/train': 1.8881810903549194} -11/07/2021 01:40:58 - INFO - __main__ - Step 31416: {'lr': 0.0004528297444272525, 'samples': 6031872, 'steps': 31415, 'loss/train': 1.3041670322418213} -11/07/2021 01:40:58 - INFO - __main__ - Step 31417: {'lr': 0.0004528266420390386, 'samples': 6032064, 'steps': 31416, 'loss/train': 2.038400650024414} -11/07/2021 01:40:59 - INFO - __main__ - Step 31418: {'lr': 0.00045282353955943417, 'samples': 6032256, 'steps': 31417, 'loss/train': 1.755852222442627} -11/07/2021 01:40:59 - INFO - __main__ - Step 31419: {'lr': 0.00045282043698844054, 'samples': 6032448, 'steps': 31418, 'loss/train': 1.505255103111267} -11/07/2021 01:41:00 - INFO - __main__ - Step 31420: {'lr': 0.0004528173343260592, 'samples': 6032640, 'steps': 31419, 'loss/train': 1.8033087253570557} -11/07/2021 01:41:00 - INFO - __main__ - Step 31421: {'lr': 0.0004528142315722915, 'samples': 6032832, 'steps': 31420, 'loss/train': 1.9411840438842773} -11/07/2021 01:41:01 - INFO - __main__ - Step 31422: {'lr': 0.0004528111287271388, 'samples': 6033024, 'steps': 31421, 'loss/train': 1.262176752090454} -11/07/2021 01:41:01 - INFO - __main__ - Step 31423: {'lr': 0.00045280802579060253, 'samples': 6033216, 'steps': 31422, 'loss/train': 1.6663079261779785} -11/07/2021 01:41:01 - INFO - __main__ - Step 31424: {'lr': 0.00045280492276268414, 'samples': 6033408, 'steps': 31423, 'loss/train': 1.670093059539795} -11/07/2021 01:41:02 - INFO - __main__ - Step 31425: {'lr': 0.0004528018196433849, 'samples': 6033600, 'steps': 31424, 'loss/train': 1.385120153427124} -11/07/2021 01:41:03 - INFO - __main__ - Step 31426: {'lr': 0.0004527987164327063, 'samples': 6033792, 'steps': 31425, 'loss/train': 1.0587403774261475} -11/07/2021 01:41:03 - INFO - __main__ - Step 31427: {'lr': 0.0004527956131306498, 'samples': 6033984, 'steps': 31426, 'loss/train': 1.2909725904464722} -11/07/2021 01:41:03 - INFO - __main__ - Step 31428: {'lr': 0.0004527925097372168, 'samples': 6034176, 'steps': 31427, 'loss/train': 1.6139020919799805} -11/07/2021 01:41:04 - INFO - __main__ - Step 31429: {'lr': 0.0004527894062524084, 'samples': 6034368, 'steps': 31428, 'loss/train': 1.4685879945755005} -11/07/2021 01:41:05 - INFO - __main__ - Step 31430: {'lr': 0.00045278630267622637, 'samples': 6034560, 'steps': 31429, 'loss/train': 1.514011263847351} -11/07/2021 01:41:05 - INFO - __main__ - Step 31431: {'lr': 0.0004527831990086719, 'samples': 6034752, 'steps': 31430, 'loss/train': 1.653131127357483} -11/07/2021 01:41:06 - INFO - __main__ - Step 31432: {'lr': 0.0004527800952497465, 'samples': 6034944, 'steps': 31431, 'loss/train': 1.4159690141677856} -11/07/2021 01:41:06 - INFO - __main__ - Step 31433: {'lr': 0.0004527769913994515, 'samples': 6035136, 'steps': 31432, 'loss/train': 1.1822314262390137} -11/07/2021 01:41:06 - INFO - __main__ - Step 31434: {'lr': 0.00045277388745778836, 'samples': 6035328, 'steps': 31433, 'loss/train': 1.4472757577896118} -11/07/2021 01:41:07 - INFO - __main__ - Step 31435: {'lr': 0.00045277078342475835, 'samples': 6035520, 'steps': 31434, 'loss/train': 1.4460768699645996} -11/07/2021 01:41:08 - INFO - __main__ - Step 31436: {'lr': 0.000452767679300363, 'samples': 6035712, 'steps': 31435, 'loss/train': 0.7411298155784607} -11/07/2021 01:41:08 - INFO - __main__ - Step 31437: {'lr': 0.00045276457508460367, 'samples': 6035904, 'steps': 31436, 'loss/train': 1.0947308540344238} -11/07/2021 01:41:08 - INFO - __main__ - Step 31438: {'lr': 0.00045276147077748176, 'samples': 6036096, 'steps': 31437, 'loss/train': 1.8609302043914795} -11/07/2021 01:41:09 - INFO - __main__ - Step 31439: {'lr': 0.0004527583663789986, 'samples': 6036288, 'steps': 31438, 'loss/train': 0.918387770652771} -11/07/2021 01:41:09 - INFO - __main__ - Step 31440: {'lr': 0.0004527552618891557, 'samples': 6036480, 'steps': 31439, 'loss/train': 1.2426555156707764} -11/07/2021 01:41:10 - INFO - __main__ - Step 31441: {'lr': 0.0004527521573079544, 'samples': 6036672, 'steps': 31440, 'loss/train': 1.590278148651123} -11/07/2021 01:41:11 - INFO - __main__ - Step 31442: {'lr': 0.0004527490526353961, 'samples': 6036864, 'steps': 31441, 'loss/train': 1.5419851541519165} -11/07/2021 01:41:11 - INFO - __main__ - Step 31443: {'lr': 0.0004527459478714822, 'samples': 6037056, 'steps': 31442, 'loss/train': 1.2262630462646484} -11/07/2021 01:41:11 - INFO - __main__ - Step 31444: {'lr': 0.00045274284301621414, 'samples': 6037248, 'steps': 31443, 'loss/train': 1.4954262971878052} -11/07/2021 01:41:12 - INFO - __main__ - Step 31445: {'lr': 0.00045273973806959325, 'samples': 6037440, 'steps': 31444, 'loss/train': 1.7720775604248047} -11/07/2021 01:41:13 - INFO - __main__ - Step 31446: {'lr': 0.00045273663303162096, 'samples': 6037632, 'steps': 31445, 'loss/train': 1.8512814044952393} -11/07/2021 01:41:13 - INFO - __main__ - Step 31447: {'lr': 0.00045273352790229873, 'samples': 6037824, 'steps': 31446, 'loss/train': 1.5024912357330322} -11/07/2021 01:41:13 - INFO - __main__ - Step 31448: {'lr': 0.0004527304226816278, 'samples': 6038016, 'steps': 31447, 'loss/train': 1.6347882747650146} -11/07/2021 01:41:14 - INFO - __main__ - Step 31449: {'lr': 0.0004527273173696097, 'samples': 6038208, 'steps': 31448, 'loss/train': 1.7430769205093384} -11/07/2021 01:41:14 - INFO - __main__ - Step 31450: {'lr': 0.0004527242119662458, 'samples': 6038400, 'steps': 31449, 'loss/train': 2.1880335807800293} -11/07/2021 01:41:14 - INFO - __main__ - Step 31451: {'lr': 0.00045272110647153754, 'samples': 6038592, 'steps': 31450, 'loss/train': 1.2813395261764526} -11/07/2021 01:41:15 - INFO - __main__ - Step 31452: {'lr': 0.00045271800088548625, 'samples': 6038784, 'steps': 31451, 'loss/train': 1.6504584550857544} -11/07/2021 01:41:16 - INFO - __main__ - Step 31453: {'lr': 0.00045271489520809337, 'samples': 6038976, 'steps': 31452, 'loss/train': 1.8255902528762817} -11/07/2021 01:41:16 - INFO - __main__ - Step 31454: {'lr': 0.0004527117894393603, 'samples': 6039168, 'steps': 31453, 'loss/train': 1.3392289876937866} -11/07/2021 01:41:17 - INFO - __main__ - Step 31455: {'lr': 0.0004527086835792884, 'samples': 6039360, 'steps': 31454, 'loss/train': 1.391819715499878} -11/07/2021 01:41:17 - INFO - __main__ - Step 31456: {'lr': 0.0004527055776278791, 'samples': 6039552, 'steps': 31455, 'loss/train': 1.526758074760437} -11/07/2021 01:41:18 - INFO - __main__ - Step 31457: {'lr': 0.00045270247158513377, 'samples': 6039744, 'steps': 31456, 'loss/train': 1.5195149183273315} -11/07/2021 01:41:18 - INFO - __main__ - Step 31458: {'lr': 0.00045269936545105384, 'samples': 6039936, 'steps': 31457, 'loss/train': 1.703020453453064} -11/07/2021 01:41:19 - INFO - __main__ - Step 31459: {'lr': 0.0004526962592256407, 'samples': 6040128, 'steps': 31458, 'loss/train': 1.6962475776672363} -11/07/2021 01:41:19 - INFO - __main__ - Step 31460: {'lr': 0.00045269315290889583, 'samples': 6040320, 'steps': 31459, 'loss/train': 1.5722194910049438} -11/07/2021 01:41:19 - INFO - __main__ - Step 31461: {'lr': 0.00045269004650082045, 'samples': 6040512, 'steps': 31460, 'loss/train': 2.1078343391418457} -11/07/2021 01:41:20 - INFO - __main__ - Step 31462: {'lr': 0.0004526869400014162, 'samples': 6040704, 'steps': 31461, 'loss/train': 1.6594512462615967} -11/07/2021 01:41:21 - INFO - __main__ - Step 31463: {'lr': 0.0004526838334106842, 'samples': 6040896, 'steps': 31462, 'loss/train': 1.9305704832077026} -11/07/2021 01:41:21 - INFO - __main__ - Step 31464: {'lr': 0.000452680726728626, 'samples': 6041088, 'steps': 31463, 'loss/train': 1.2269365787506104} -11/07/2021 01:41:21 - INFO - __main__ - Step 31465: {'lr': 0.00045267761995524314, 'samples': 6041280, 'steps': 31464, 'loss/train': 1.296766996383667} -11/07/2021 01:41:22 - INFO - __main__ - Step 31466: {'lr': 0.00045267451309053677, 'samples': 6041472, 'steps': 31465, 'loss/train': 0.952112078666687} -11/07/2021 01:41:23 - INFO - __main__ - Step 31467: {'lr': 0.0004526714061345084, 'samples': 6041664, 'steps': 31466, 'loss/train': 0.7781227231025696} -11/07/2021 01:41:23 - INFO - __main__ - Step 31468: {'lr': 0.0004526682990871593, 'samples': 6041856, 'steps': 31467, 'loss/train': 1.4286562204360962} -11/07/2021 01:41:23 - INFO - __main__ - Step 31469: {'lr': 0.0004526651919484912, 'samples': 6042048, 'steps': 31468, 'loss/train': 1.330336332321167} -11/07/2021 01:41:24 - INFO - __main__ - Step 31470: {'lr': 0.00045266208471850516, 'samples': 6042240, 'steps': 31469, 'loss/train': 0.9660208821296692} -11/07/2021 01:41:24 - INFO - __main__ - Step 31471: {'lr': 0.00045265897739720277, 'samples': 6042432, 'steps': 31470, 'loss/train': 1.2458423376083374} -11/07/2021 01:41:25 - INFO - __main__ - Step 31472: {'lr': 0.00045265586998458534, 'samples': 6042624, 'steps': 31471, 'loss/train': 1.4908545017242432} -11/07/2021 01:41:25 - INFO - __main__ - Step 31473: {'lr': 0.00045265276248065436, 'samples': 6042816, 'steps': 31472, 'loss/train': 1.8791873455047607} -11/07/2021 01:41:26 - INFO - __main__ - Step 31474: {'lr': 0.0004526496548854111, 'samples': 6043008, 'steps': 31473, 'loss/train': 1.3738685846328735} -11/07/2021 01:41:26 - INFO - __main__ - Step 31475: {'lr': 0.000452646547198857, 'samples': 6043200, 'steps': 31474, 'loss/train': 1.3974919319152832} -11/07/2021 01:41:27 - INFO - __main__ - Step 31476: {'lr': 0.0004526434394209936, 'samples': 6043392, 'steps': 31475, 'loss/train': 1.493938684463501} -11/07/2021 01:41:27 - INFO - __main__ - Step 31477: {'lr': 0.00045264033155182216, 'samples': 6043584, 'steps': 31476, 'loss/train': 1.66843581199646} -11/07/2021 01:41:28 - INFO - __main__ - Step 31478: {'lr': 0.0004526372235913441, 'samples': 6043776, 'steps': 31477, 'loss/train': 1.3735740184783936} -11/07/2021 01:41:28 - INFO - __main__ - Step 31479: {'lr': 0.0004526341155395608, 'samples': 6043968, 'steps': 31478, 'loss/train': 1.2243516445159912} -11/07/2021 01:41:29 - INFO - __main__ - Step 31480: {'lr': 0.00045263100739647373, 'samples': 6044160, 'steps': 31479, 'loss/train': 1.4764176607131958} -11/07/2021 01:41:29 - INFO - __main__ - Step 31481: {'lr': 0.00045262789916208424, 'samples': 6044352, 'steps': 31480, 'loss/train': 1.6852359771728516} -11/07/2021 01:41:30 - INFO - __main__ - Step 31482: {'lr': 0.00045262479083639376, 'samples': 6044544, 'steps': 31481, 'loss/train': 1.6857291460037231} -11/07/2021 01:41:30 - INFO - __main__ - Step 31483: {'lr': 0.0004526216824194037, 'samples': 6044736, 'steps': 31482, 'loss/train': 0.5070812106132507} -11/07/2021 01:41:31 - INFO - __main__ - Step 31484: {'lr': 0.00045261857391111536, 'samples': 6044928, 'steps': 31483, 'loss/train': 0.8546400666236877} -11/07/2021 01:41:31 - INFO - __main__ - Step 31485: {'lr': 0.0004526154653115303, 'samples': 6045120, 'steps': 31484, 'loss/train': 1.9318288564682007} -11/07/2021 01:41:31 - INFO - __main__ - Step 31486: {'lr': 0.0004526123566206498, 'samples': 6045312, 'steps': 31485, 'loss/train': 1.4708870649337769} -11/07/2021 01:41:32 - INFO - __main__ - Step 31487: {'lr': 0.0004526092478384753, 'samples': 6045504, 'steps': 31486, 'loss/train': 1.7455925941467285} -11/07/2021 01:41:33 - INFO - __main__ - Step 31488: {'lr': 0.00045260613896500827, 'samples': 6045696, 'steps': 31487, 'loss/train': 1.8832435607910156} -11/07/2021 01:41:33 - INFO - __main__ - Step 31489: {'lr': 0.00045260303000024994, 'samples': 6045888, 'steps': 31488, 'loss/train': 1.7852832078933716} -11/07/2021 01:41:33 - INFO - __main__ - Step 31490: {'lr': 0.0004525999209442018, 'samples': 6046080, 'steps': 31489, 'loss/train': 1.0340776443481445} -11/07/2021 01:41:34 - INFO - __main__ - Step 31491: {'lr': 0.0004525968117968653, 'samples': 6046272, 'steps': 31490, 'loss/train': 1.484983205795288} -11/07/2021 01:41:34 - INFO - __main__ - Step 31492: {'lr': 0.00045259370255824183, 'samples': 6046464, 'steps': 31491, 'loss/train': 1.6369127035140991} -11/07/2021 01:41:35 - INFO - __main__ - Step 31493: {'lr': 0.0004525905932283327, 'samples': 6046656, 'steps': 31492, 'loss/train': 1.3930445909500122} -11/07/2021 01:41:36 - INFO - __main__ - Step 31494: {'lr': 0.00045258748380713943, 'samples': 6046848, 'steps': 31493, 'loss/train': 1.0716495513916016} -11/07/2021 01:41:36 - INFO - __main__ - Step 31495: {'lr': 0.00045258437429466337, 'samples': 6047040, 'steps': 31494, 'loss/train': 0.8319592475891113} -11/07/2021 01:41:36 - INFO - __main__ - Step 31496: {'lr': 0.0004525812646909059, 'samples': 6047232, 'steps': 31495, 'loss/train': 1.5362430810928345} -11/07/2021 01:41:37 - INFO - __main__ - Step 31497: {'lr': 0.0004525781549958684, 'samples': 6047424, 'steps': 31496, 'loss/train': 0.8949344754219055} -11/07/2021 01:41:38 - INFO - __main__ - Step 31498: {'lr': 0.0004525750452095524, 'samples': 6047616, 'steps': 31497, 'loss/train': 2.0039658546447754} -11/07/2021 01:41:38 - INFO - __main__ - Step 31499: {'lr': 0.00045257193533195916, 'samples': 6047808, 'steps': 31498, 'loss/train': 1.5422204732894897} -11/07/2021 01:41:38 - INFO - __main__ - Step 31500: {'lr': 0.0004525688253630901, 'samples': 6048000, 'steps': 31499, 'loss/train': 2.1831295490264893} -11/07/2021 01:41:39 - INFO - __main__ - Step 31501: {'lr': 0.00045256571530294664, 'samples': 6048192, 'steps': 31500, 'loss/train': 1.1621021032333374} -11/07/2021 01:41:39 - INFO - __main__ - Step 31502: {'lr': 0.0004525626051515302, 'samples': 6048384, 'steps': 31501, 'loss/train': 1.3157600164413452} -11/07/2021 01:41:40 - INFO - __main__ - Step 31503: {'lr': 0.0004525594949088423, 'samples': 6048576, 'steps': 31502, 'loss/train': 0.9412500262260437} -11/07/2021 01:41:40 - INFO - __main__ - Step 31504: {'lr': 0.00045255638457488415, 'samples': 6048768, 'steps': 31503, 'loss/train': 0.45820948481559753} -11/07/2021 01:41:41 - INFO - __main__ - Step 31505: {'lr': 0.0004525532741496572, 'samples': 6048960, 'steps': 31504, 'loss/train': 1.6507850885391235} -11/07/2021 01:41:41 - INFO - __main__ - Step 31506: {'lr': 0.0004525501636331628, 'samples': 6049152, 'steps': 31505, 'loss/train': 1.6992638111114502} -11/07/2021 01:41:41 - INFO - __main__ - Step 31507: {'lr': 0.00045254705302540257, 'samples': 6049344, 'steps': 31506, 'loss/train': 1.7947462797164917} -11/07/2021 01:41:43 - INFO - __main__ - Step 31508: {'lr': 0.00045254394232637765, 'samples': 6049536, 'steps': 31507, 'loss/train': 1.3244881629943848} -11/07/2021 01:41:43 - INFO - __main__ - Step 31509: {'lr': 0.0004525408315360896, 'samples': 6049728, 'steps': 31508, 'loss/train': 2.219317674636841} -11/07/2021 01:41:43 - INFO - __main__ - Step 31510: {'lr': 0.00045253772065453977, 'samples': 6049920, 'steps': 31509, 'loss/train': 1.6535799503326416} -11/07/2021 01:41:44 - INFO - __main__ - Step 31511: {'lr': 0.00045253460968172957, 'samples': 6050112, 'steps': 31510, 'loss/train': 1.5129849910736084} -11/07/2021 01:41:44 - INFO - __main__ - Step 31512: {'lr': 0.0004525314986176604, 'samples': 6050304, 'steps': 31511, 'loss/train': 1.443256139755249} -11/07/2021 01:41:45 - INFO - __main__ - Step 31513: {'lr': 0.0004525283874623336, 'samples': 6050496, 'steps': 31512, 'loss/train': 1.5510832071304321} -11/07/2021 01:41:45 - INFO - __main__ - Step 31514: {'lr': 0.00045252527621575075, 'samples': 6050688, 'steps': 31513, 'loss/train': 1.423369288444519} -11/07/2021 01:41:46 - INFO - __main__ - Step 31515: {'lr': 0.0004525221648779131, 'samples': 6050880, 'steps': 31514, 'loss/train': 0.9893391132354736} -11/07/2021 01:41:46 - INFO - __main__ - Step 31516: {'lr': 0.00045251905344882205, 'samples': 6051072, 'steps': 31515, 'loss/train': 1.3399033546447754} -11/07/2021 01:41:46 - INFO - __main__ - Step 31517: {'lr': 0.000452515941928479, 'samples': 6051264, 'steps': 31516, 'loss/train': 1.4280192852020264} -11/07/2021 01:41:47 - INFO - __main__ - Step 31518: {'lr': 0.0004525128303168855, 'samples': 6051456, 'steps': 31517, 'loss/train': 1.543757677078247} -11/07/2021 01:41:48 - INFO - __main__ - Step 31519: {'lr': 0.00045250971861404276, 'samples': 6051648, 'steps': 31518, 'loss/train': 1.4377233982086182} -11/07/2021 01:41:48 - INFO - __main__ - Step 31520: {'lr': 0.0004525066068199523, 'samples': 6051840, 'steps': 31519, 'loss/train': 1.5889067649841309} -11/07/2021 01:41:48 - INFO - __main__ - Step 31521: {'lr': 0.0004525034949346155, 'samples': 6052032, 'steps': 31520, 'loss/train': 1.63162100315094} -11/07/2021 01:41:49 - INFO - __main__ - Step 31522: {'lr': 0.0004525003829580337, 'samples': 6052224, 'steps': 31521, 'loss/train': 1.91524076461792} -11/07/2021 01:41:49 - INFO - __main__ - Step 31523: {'lr': 0.0004524972708902084, 'samples': 6052416, 'steps': 31522, 'loss/train': 1.4860838651657104} -11/07/2021 01:41:50 - INFO - __main__ - Step 31524: {'lr': 0.0004524941587311409, 'samples': 6052608, 'steps': 31523, 'loss/train': 1.5862531661987305} -11/07/2021 01:41:50 - INFO - __main__ - Step 31525: {'lr': 0.0004524910464808327, 'samples': 6052800, 'steps': 31524, 'loss/train': 1.6125633716583252} -11/07/2021 01:41:51 - INFO - __main__ - Step 31526: {'lr': 0.00045248793413928514, 'samples': 6052992, 'steps': 31525, 'loss/train': 1.2867863178253174} -11/07/2021 01:41:51 - INFO - __main__ - Step 31527: {'lr': 0.0004524848217064997, 'samples': 6053184, 'steps': 31526, 'loss/train': 1.5448814630508423} -11/07/2021 01:41:51 - INFO - __main__ - Step 31528: {'lr': 0.0004524817091824777, 'samples': 6053376, 'steps': 31527, 'loss/train': 1.3339594602584839} -11/07/2021 01:41:52 - INFO - __main__ - Step 31529: {'lr': 0.00045247859656722056, 'samples': 6053568, 'steps': 31528, 'loss/train': 1.3554816246032715} -11/07/2021 01:41:53 - INFO - __main__ - Step 31530: {'lr': 0.0004524754838607297, 'samples': 6053760, 'steps': 31529, 'loss/train': 1.2281231880187988} -11/07/2021 01:41:53 - INFO - __main__ - Step 31531: {'lr': 0.0004524723710630064, 'samples': 6053952, 'steps': 31530, 'loss/train': 1.370402455329895} -11/07/2021 01:41:53 - INFO - __main__ - Step 31532: {'lr': 0.0004524692581740523, 'samples': 6054144, 'steps': 31531, 'loss/train': 1.7626378536224365} -11/07/2021 01:41:54 - INFO - __main__ - Step 31533: {'lr': 0.00045246614519386865, 'samples': 6054336, 'steps': 31532, 'loss/train': 1.6262603998184204} -11/07/2021 01:41:55 - INFO - __main__ - Step 31534: {'lr': 0.0004524630321224569, 'samples': 6054528, 'steps': 31533, 'loss/train': 1.3756903409957886} -11/07/2021 01:41:55 - INFO - __main__ - Step 31535: {'lr': 0.0004524599189598183, 'samples': 6054720, 'steps': 31534, 'loss/train': 2.3842573165893555} -11/07/2021 01:41:56 - INFO - __main__ - Step 31536: {'lr': 0.0004524568057059545, 'samples': 6054912, 'steps': 31535, 'loss/train': 1.2920001745224} -11/07/2021 01:41:56 - INFO - __main__ - Step 31537: {'lr': 0.00045245369236086673, 'samples': 6055104, 'steps': 31536, 'loss/train': 1.7213891744613647} -11/07/2021 01:41:56 - INFO - __main__ - Step 31538: {'lr': 0.00045245057892455653, 'samples': 6055296, 'steps': 31537, 'loss/train': 1.6329360008239746} -11/07/2021 01:41:57 - INFO - __main__ - Step 31539: {'lr': 0.0004524474653970252, 'samples': 6055488, 'steps': 31538, 'loss/train': 1.9639887809753418} -11/07/2021 01:41:58 - INFO - __main__ - Step 31540: {'lr': 0.00045244435177827413, 'samples': 6055680, 'steps': 31539, 'loss/train': 1.7359849214553833} -11/07/2021 01:41:58 - INFO - __main__ - Step 31541: {'lr': 0.00045244123806830486, 'samples': 6055872, 'steps': 31540, 'loss/train': 1.2768898010253906} -11/07/2021 01:41:59 - INFO - __main__ - Step 31542: {'lr': 0.00045243812426711856, 'samples': 6056064, 'steps': 31541, 'loss/train': 1.4651298522949219} -11/07/2021 01:41:59 - INFO - __main__ - Step 31543: {'lr': 0.0004524350103747168, 'samples': 6056256, 'steps': 31542, 'loss/train': 1.398427128791809} -11/07/2021 01:42:00 - INFO - __main__ - Step 31544: {'lr': 0.00045243189639110093, 'samples': 6056448, 'steps': 31543, 'loss/train': 1.791009783744812} -11/07/2021 01:42:01 - INFO - __main__ - Step 31545: {'lr': 0.00045242878231627247, 'samples': 6056640, 'steps': 31544, 'loss/train': 1.4630930423736572} -11/07/2021 01:42:01 - INFO - __main__ - Step 31546: {'lr': 0.0004524256681502327, 'samples': 6056832, 'steps': 31545, 'loss/train': 1.5687968730926514} -11/07/2021 01:42:01 - INFO - __main__ - Step 31547: {'lr': 0.0004524225538929829, 'samples': 6057024, 'steps': 31546, 'loss/train': 1.714564323425293} -11/07/2021 01:42:02 - INFO - __main__ - Step 31548: {'lr': 0.0004524194395445248, 'samples': 6057216, 'steps': 31547, 'loss/train': 0.513561487197876} -11/07/2021 01:42:03 - INFO - __main__ - Step 31549: {'lr': 0.0004524163251048595, 'samples': 6057408, 'steps': 31548, 'loss/train': 1.0790307521820068} -11/07/2021 01:42:03 - INFO - __main__ - Step 31550: {'lr': 0.0004524132105739886, 'samples': 6057600, 'steps': 31549, 'loss/train': 1.5847446918487549} -11/07/2021 01:42:03 - INFO - __main__ - Step 31551: {'lr': 0.0004524100959519134, 'samples': 6057792, 'steps': 31550, 'loss/train': 1.0553903579711914} -11/07/2021 01:42:04 - INFO - __main__ - Step 31552: {'lr': 0.00045240698123863535, 'samples': 6057984, 'steps': 31551, 'loss/train': 1.499010443687439} -11/07/2021 01:42:04 - INFO - __main__ - Step 31553: {'lr': 0.0004524038664341558, 'samples': 6058176, 'steps': 31552, 'loss/train': 1.598149299621582} -11/07/2021 01:42:05 - INFO - __main__ - Step 31554: {'lr': 0.00045240075153847625, 'samples': 6058368, 'steps': 31553, 'loss/train': 1.6579509973526} -11/07/2021 01:42:05 - INFO - __main__ - Step 31555: {'lr': 0.00045239763655159805, 'samples': 6058560, 'steps': 31554, 'loss/train': 1.8098655939102173} -11/07/2021 01:42:06 - INFO - __main__ - Step 31556: {'lr': 0.00045239452147352257, 'samples': 6058752, 'steps': 31555, 'loss/train': 1.4907845258712769} -11/07/2021 01:42:06 - INFO - __main__ - Step 31557: {'lr': 0.0004523914063042512, 'samples': 6058944, 'steps': 31556, 'loss/train': 1.4728018045425415} -11/07/2021 01:42:07 - INFO - __main__ - Step 31558: {'lr': 0.00045238829104378545, 'samples': 6059136, 'steps': 31557, 'loss/train': 1.4942617416381836} -11/07/2021 01:42:07 - INFO - __main__ - Step 31559: {'lr': 0.0004523851756921266, 'samples': 6059328, 'steps': 31558, 'loss/train': 1.0715967416763306} -11/07/2021 01:42:08 - INFO - __main__ - Step 31560: {'lr': 0.00045238206024927614, 'samples': 6059520, 'steps': 31559, 'loss/train': 1.5499707460403442} -11/07/2021 01:42:08 - INFO - __main__ - Step 31561: {'lr': 0.00045237894471523543, 'samples': 6059712, 'steps': 31560, 'loss/train': 1.5776026248931885} -11/07/2021 01:42:09 - INFO - __main__ - Step 31562: {'lr': 0.00045237582909000594, 'samples': 6059904, 'steps': 31561, 'loss/train': 1.4897489547729492} -11/07/2021 01:42:09 - INFO - __main__ - Step 31563: {'lr': 0.00045237271337358897, 'samples': 6060096, 'steps': 31562, 'loss/train': 1.5823599100112915} -11/07/2021 01:42:09 - INFO - __main__ - Step 31564: {'lr': 0.00045236959756598605, 'samples': 6060288, 'steps': 31563, 'loss/train': 1.4825657606124878} -11/07/2021 01:42:10 - INFO - __main__ - Step 31565: {'lr': 0.0004523664816671985, 'samples': 6060480, 'steps': 31564, 'loss/train': 1.520081639289856} -11/07/2021 01:42:11 - INFO - __main__ - Step 31566: {'lr': 0.0004523633656772277, 'samples': 6060672, 'steps': 31565, 'loss/train': 1.5277254581451416} -11/07/2021 01:42:11 - INFO - __main__ - Step 31567: {'lr': 0.00045236024959607505, 'samples': 6060864, 'steps': 31566, 'loss/train': 1.4078350067138672} -11/07/2021 01:42:11 - INFO - __main__ - Step 31568: {'lr': 0.00045235713342374207, 'samples': 6061056, 'steps': 31567, 'loss/train': 1.245788812637329} -11/07/2021 01:42:12 - INFO - __main__ - Step 31569: {'lr': 0.00045235401716023, 'samples': 6061248, 'steps': 31568, 'loss/train': 1.6251945495605469} -11/07/2021 01:42:13 - INFO - __main__ - Step 31570: {'lr': 0.0004523509008055404, 'samples': 6061440, 'steps': 31569, 'loss/train': 0.8039262890815735} -11/07/2021 01:42:13 - INFO - __main__ - Step 31571: {'lr': 0.0004523477843596746, 'samples': 6061632, 'steps': 31570, 'loss/train': 1.3582419157028198} -11/07/2021 01:42:13 - INFO - __main__ - Step 31572: {'lr': 0.00045234466782263403, 'samples': 6061824, 'steps': 31571, 'loss/train': 1.2797014713287354} -11/07/2021 01:42:14 - INFO - __main__ - Step 31573: {'lr': 0.00045234155119442, 'samples': 6062016, 'steps': 31572, 'loss/train': 1.9971174001693726} -11/07/2021 01:42:14 - INFO - __main__ - Step 31574: {'lr': 0.00045233843447503407, 'samples': 6062208, 'steps': 31573, 'loss/train': 1.3037500381469727} -11/07/2021 01:42:15 - INFO - __main__ - Step 31575: {'lr': 0.00045233531766447757, 'samples': 6062400, 'steps': 31574, 'loss/train': 1.8818330764770508} -11/07/2021 01:42:16 - INFO - __main__ - Step 31576: {'lr': 0.00045233220076275186, 'samples': 6062592, 'steps': 31575, 'loss/train': 1.2794921398162842} -11/07/2021 01:42:16 - INFO - __main__ - Step 31577: {'lr': 0.0004523290837698583, 'samples': 6062784, 'steps': 31576, 'loss/train': 1.7762749195098877} -11/07/2021 01:42:17 - INFO - __main__ - Step 31578: {'lr': 0.0004523259666857985, 'samples': 6062976, 'steps': 31577, 'loss/train': 0.7119866013526917} -11/07/2021 01:42:17 - INFO - __main__ - Step 31579: {'lr': 0.00045232284951057366, 'samples': 6063168, 'steps': 31578, 'loss/train': 1.141363263130188} -11/07/2021 01:42:17 - INFO - __main__ - Step 31580: {'lr': 0.00045231973224418533, 'samples': 6063360, 'steps': 31579, 'loss/train': 1.2381643056869507} -11/07/2021 01:42:18 - INFO - __main__ - Step 31581: {'lr': 0.00045231661488663485, 'samples': 6063552, 'steps': 31580, 'loss/train': 1.0016676187515259} -11/07/2021 01:42:19 - INFO - __main__ - Step 31582: {'lr': 0.0004523134974379236, 'samples': 6063744, 'steps': 31581, 'loss/train': 1.7150145769119263} -11/07/2021 01:42:19 - INFO - __main__ - Step 31583: {'lr': 0.000452310379898053, 'samples': 6063936, 'steps': 31582, 'loss/train': 1.178554654121399} -11/07/2021 01:42:19 - INFO - __main__ - Step 31584: {'lr': 0.00045230726226702444, 'samples': 6064128, 'steps': 31583, 'loss/train': 1.5771918296813965} -11/07/2021 01:42:20 - INFO - __main__ - Step 31585: {'lr': 0.0004523041445448394, 'samples': 6064320, 'steps': 31584, 'loss/train': 1.6697421073913574} -11/07/2021 01:42:21 - INFO - __main__ - Step 31586: {'lr': 0.00045230102673149923, 'samples': 6064512, 'steps': 31585, 'loss/train': 1.4931589365005493} -11/07/2021 01:42:21 - INFO - __main__ - Step 31587: {'lr': 0.00045229790882700535, 'samples': 6064704, 'steps': 31586, 'loss/train': 1.292038917541504} -11/07/2021 01:42:21 - INFO - __main__ - Step 31588: {'lr': 0.00045229479083135917, 'samples': 6064896, 'steps': 31587, 'loss/train': 2.3265585899353027} -11/07/2021 01:42:22 - INFO - __main__ - Step 31589: {'lr': 0.000452291672744562, 'samples': 6065088, 'steps': 31588, 'loss/train': 0.961132824420929} -11/07/2021 01:42:22 - INFO - __main__ - Step 31590: {'lr': 0.0004522885545666153, 'samples': 6065280, 'steps': 31589, 'loss/train': 0.4769384562969208} -11/07/2021 01:42:24 - INFO - __main__ - Step 31591: {'lr': 0.0004522854362975206, 'samples': 6065472, 'steps': 31590, 'loss/train': 0.729523241519928} -11/07/2021 01:42:24 - INFO - __main__ - Step 31592: {'lr': 0.00045228231793727924, 'samples': 6065664, 'steps': 31591, 'loss/train': 0.5749496221542358} -11/07/2021 01:42:24 - INFO - __main__ - Step 31593: {'lr': 0.00045227919948589247, 'samples': 6065856, 'steps': 31592, 'loss/train': 1.5208745002746582} -11/07/2021 01:42:25 - INFO - __main__ - Step 31594: {'lr': 0.0004522760809433619, 'samples': 6066048, 'steps': 31593, 'loss/train': 5.449794292449951} -11/07/2021 01:42:25 - INFO - __main__ - Step 31595: {'lr': 0.0004522729623096888, 'samples': 6066240, 'steps': 31594, 'loss/train': 5.459228038787842} -11/07/2021 01:42:25 - INFO - __main__ - Step 31596: {'lr': 0.0004522698435848747, 'samples': 6066432, 'steps': 31595, 'loss/train': 1.2829856872558594} -11/07/2021 01:42:26 - INFO - __main__ - Step 31597: {'lr': 0.0004522667247689208, 'samples': 6066624, 'steps': 31596, 'loss/train': 1.6735295057296753} -11/07/2021 01:42:27 - INFO - __main__ - Step 31598: {'lr': 0.0004522636058618287, 'samples': 6066816, 'steps': 31597, 'loss/train': 0.953147828578949} -11/07/2021 01:42:27 - INFO - __main__ - Step 31599: {'lr': 0.0004522604868635998, 'samples': 6067008, 'steps': 31598, 'loss/train': 1.3888795375823975} -11/07/2021 01:42:27 - INFO - __main__ - Step 31600: {'lr': 0.0004522573677742353, 'samples': 6067200, 'steps': 31599, 'loss/train': 1.8566700220108032} -11/07/2021 01:42:28 - INFO - __main__ - Step 31601: {'lr': 0.0004522542485937369, 'samples': 6067392, 'steps': 31600, 'loss/train': 1.5361170768737793} -11/07/2021 01:42:28 - INFO - __main__ - Step 31602: {'lr': 0.0004522511293221058, 'samples': 6067584, 'steps': 31601, 'loss/train': 1.6162889003753662} -11/07/2021 01:42:29 - INFO - __main__ - Step 31603: {'lr': 0.00045224800995934345, 'samples': 6067776, 'steps': 31602, 'loss/train': 1.435838222503662} -11/07/2021 01:42:30 - INFO - __main__ - Step 31604: {'lr': 0.00045224489050545125, 'samples': 6067968, 'steps': 31603, 'loss/train': 1.3735251426696777} -11/07/2021 01:42:30 - INFO - __main__ - Step 31605: {'lr': 0.0004522417709604306, 'samples': 6068160, 'steps': 31604, 'loss/train': 1.6512362957000732} -11/07/2021 01:42:30 - INFO - __main__ - Step 31606: {'lr': 0.000452238651324283, 'samples': 6068352, 'steps': 31605, 'loss/train': 1.6479780673980713} -11/07/2021 01:42:31 - INFO - __main__ - Step 31607: {'lr': 0.0004522355315970098, 'samples': 6068544, 'steps': 31606, 'loss/train': 1.9048182964324951} -11/07/2021 01:42:32 - INFO - __main__ - Step 31608: {'lr': 0.0004522324117786123, 'samples': 6068736, 'steps': 31607, 'loss/train': 1.587449073791504} -11/07/2021 01:42:32 - INFO - __main__ - Step 31609: {'lr': 0.0004522292918690921, 'samples': 6068928, 'steps': 31608, 'loss/train': 1.3543143272399902} -11/07/2021 01:42:32 - INFO - __main__ - Step 31610: {'lr': 0.0004522261718684504, 'samples': 6069120, 'steps': 31609, 'loss/train': 1.546761393547058} -11/07/2021 01:42:33 - INFO - __main__ - Step 31611: {'lr': 0.00045222305177668875, 'samples': 6069312, 'steps': 31610, 'loss/train': 0.9692068696022034} -11/07/2021 01:42:33 - INFO - __main__ - Step 31612: {'lr': 0.00045221993159380857, 'samples': 6069504, 'steps': 31611, 'loss/train': 1.5525907278060913} -11/07/2021 01:42:34 - INFO - __main__ - Step 31613: {'lr': 0.00045221681131981116, 'samples': 6069696, 'steps': 31612, 'loss/train': 1.702857494354248} -11/07/2021 01:42:34 - INFO - __main__ - Step 31614: {'lr': 0.00045221369095469795, 'samples': 6069888, 'steps': 31613, 'loss/train': 0.9163973927497864} -11/07/2021 01:42:35 - INFO - __main__ - Step 31615: {'lr': 0.00045221057049847044, 'samples': 6070080, 'steps': 31614, 'loss/train': 1.3347078561782837} -11/07/2021 01:42:35 - INFO - __main__ - Step 31616: {'lr': 0.0004522074499511299, 'samples': 6070272, 'steps': 31615, 'loss/train': 1.5862935781478882} -11/07/2021 01:42:35 - INFO - __main__ - Step 31617: {'lr': 0.0004522043293126778, 'samples': 6070464, 'steps': 31616, 'loss/train': 2.0183849334716797} -11/07/2021 01:42:37 - INFO - __main__ - Step 31618: {'lr': 0.00045220120858311557, 'samples': 6070656, 'steps': 31617, 'loss/train': 1.6048452854156494} -11/07/2021 01:42:37 - INFO - __main__ - Step 31619: {'lr': 0.0004521980877624446, 'samples': 6070848, 'steps': 31618, 'loss/train': 1.529024362564087} -11/07/2021 01:42:37 - INFO - __main__ - Step 31620: {'lr': 0.0004521949668506663, 'samples': 6071040, 'steps': 31619, 'loss/train': 1.7623778581619263} -11/07/2021 01:42:38 - INFO - __main__ - Step 31621: {'lr': 0.00045219184584778207, 'samples': 6071232, 'steps': 31620, 'loss/train': 1.584256887435913} -11/07/2021 01:42:38 - INFO - __main__ - Step 31622: {'lr': 0.0004521887247537933, 'samples': 6071424, 'steps': 31621, 'loss/train': 1.4615974426269531} -11/07/2021 01:42:38 - INFO - __main__ - Step 31623: {'lr': 0.00045218560356870144, 'samples': 6071616, 'steps': 31622, 'loss/train': 1.1545277833938599} -11/07/2021 01:42:39 - INFO - __main__ - Step 31624: {'lr': 0.0004521824822925078, 'samples': 6071808, 'steps': 31623, 'loss/train': 1.0066297054290771} -11/07/2021 01:42:40 - INFO - __main__ - Step 31625: {'lr': 0.00045217936092521396, 'samples': 6072000, 'steps': 31624, 'loss/train': 1.429289698600769} -11/07/2021 01:42:40 - INFO - __main__ - Step 31626: {'lr': 0.00045217623946682114, 'samples': 6072192, 'steps': 31625, 'loss/train': 1.3774598836898804} -11/07/2021 01:42:40 - INFO - __main__ - Step 31627: {'lr': 0.00045217311791733084, 'samples': 6072384, 'steps': 31626, 'loss/train': 1.5545233488082886} -11/07/2021 01:42:41 - INFO - __main__ - Step 31628: {'lr': 0.00045216999627674436, 'samples': 6072576, 'steps': 31627, 'loss/train': 1.5675814151763916} -11/07/2021 01:42:42 - INFO - __main__ - Step 31629: {'lr': 0.0004521668745450633, 'samples': 6072768, 'steps': 31628, 'loss/train': 1.2844632863998413} -11/07/2021 01:42:42 - INFO - __main__ - Step 31630: {'lr': 0.00045216375272228907, 'samples': 6072960, 'steps': 31629, 'loss/train': 1.017756700515747} -11/07/2021 01:42:42 - INFO - __main__ - Step 31631: {'lr': 0.00045216063080842287, 'samples': 6073152, 'steps': 31630, 'loss/train': 1.531299114227295} -11/07/2021 01:42:43 - INFO - __main__ - Step 31632: {'lr': 0.00045215750880346617, 'samples': 6073344, 'steps': 31631, 'loss/train': 1.265383243560791} -11/07/2021 01:42:43 - INFO - __main__ - Step 31633: {'lr': 0.00045215438670742045, 'samples': 6073536, 'steps': 31632, 'loss/train': 1.9258782863616943} -11/07/2021 01:42:44 - INFO - __main__ - Step 31634: {'lr': 0.00045215126452028705, 'samples': 6073728, 'steps': 31633, 'loss/train': 1.5267999172210693} -11/07/2021 01:42:44 - INFO - __main__ - Step 31635: {'lr': 0.00045214814224206744, 'samples': 6073920, 'steps': 31634, 'loss/train': 1.5844289064407349} -11/07/2021 01:42:45 - INFO - __main__ - Step 31636: {'lr': 0.00045214501987276304, 'samples': 6074112, 'steps': 31635, 'loss/train': 1.2692776918411255} -11/07/2021 01:42:45 - INFO - __main__ - Step 31637: {'lr': 0.0004521418974123751, 'samples': 6074304, 'steps': 31636, 'loss/train': 1.620078682899475} -11/07/2021 01:42:45 - INFO - __main__ - Step 31638: {'lr': 0.00045213877486090524, 'samples': 6074496, 'steps': 31637, 'loss/train': 2.1654961109161377} -11/07/2021 01:42:47 - INFO - __main__ - Step 31639: {'lr': 0.00045213565221835473, 'samples': 6074688, 'steps': 31638, 'loss/train': 1.277814507484436} -11/07/2021 01:42:48 - INFO - __main__ - Step 31640: {'lr': 0.00045213252948472505, 'samples': 6074880, 'steps': 31639, 'loss/train': 1.407594919204712} -11/07/2021 01:42:48 - INFO - __main__ - Step 31641: {'lr': 0.0004521294066600175, 'samples': 6075072, 'steps': 31640, 'loss/train': 1.788429617881775} -11/07/2021 01:42:48 - INFO - __main__ - Step 31642: {'lr': 0.0004521262837442336, 'samples': 6075264, 'steps': 31641, 'loss/train': 1.7870267629623413} -11/07/2021 01:42:49 - INFO - __main__ - Step 31643: {'lr': 0.0004521231607373747, 'samples': 6075456, 'steps': 31642, 'loss/train': 1.7724577188491821} -11/07/2021 01:42:49 - INFO - __main__ - Step 31644: {'lr': 0.00045212003763944226, 'samples': 6075648, 'steps': 31643, 'loss/train': 1.35056734085083} -11/07/2021 01:42:50 - INFO - __main__ - Step 31645: {'lr': 0.00045211691445043765, 'samples': 6075840, 'steps': 31644, 'loss/train': 1.589632511138916} -11/07/2021 01:42:51 - INFO - __main__ - Step 31646: {'lr': 0.0004521137911703622, 'samples': 6076032, 'steps': 31645, 'loss/train': 1.411072015762329} -11/07/2021 01:42:51 - INFO - __main__ - Step 31647: {'lr': 0.0004521106677992175, 'samples': 6076224, 'steps': 31646, 'loss/train': 1.1863641738891602} -11/07/2021 01:42:51 - INFO - __main__ - Step 31648: {'lr': 0.0004521075443370048, 'samples': 6076416, 'steps': 31647, 'loss/train': 1.4727528095245361} -11/07/2021 01:42:52 - INFO - __main__ - Step 31649: {'lr': 0.0004521044207837256, 'samples': 6076608, 'steps': 31648, 'loss/train': 1.6370353698730469} -11/07/2021 01:42:52 - INFO - __main__ - Step 31650: {'lr': 0.0004521012971393812, 'samples': 6076800, 'steps': 31649, 'loss/train': 1.5181607007980347} -11/07/2021 01:42:52 - INFO - __main__ - Step 31651: {'lr': 0.0004520981734039731, 'samples': 6076992, 'steps': 31650, 'loss/train': 1.3422218561172485} -11/07/2021 01:42:53 - INFO - __main__ - Step 31652: {'lr': 0.0004520950495775027, 'samples': 6077184, 'steps': 31651, 'loss/train': 1.3841309547424316} -11/07/2021 01:42:54 - INFO - __main__ - Step 31653: {'lr': 0.00045209192565997137, 'samples': 6077376, 'steps': 31652, 'loss/train': 1.6002979278564453} -11/07/2021 01:42:54 - INFO - __main__ - Step 31654: {'lr': 0.00045208880165138054, 'samples': 6077568, 'steps': 31653, 'loss/train': 1.987862229347229} -11/07/2021 01:42:54 - INFO - __main__ - Step 31655: {'lr': 0.0004520856775517316, 'samples': 6077760, 'steps': 31654, 'loss/train': 1.7040534019470215} -11/07/2021 01:42:55 - INFO - __main__ - Step 31656: {'lr': 0.00045208255336102597, 'samples': 6077952, 'steps': 31655, 'loss/train': 1.6022289991378784} -11/07/2021 01:42:56 - INFO - __main__ - Step 31657: {'lr': 0.0004520794290792651, 'samples': 6078144, 'steps': 31656, 'loss/train': 1.529978632926941} -11/07/2021 01:42:56 - INFO - __main__ - Step 31658: {'lr': 0.0004520763047064503, 'samples': 6078336, 'steps': 31657, 'loss/train': 1.1939507722854614} -11/07/2021 01:42:57 - INFO - __main__ - Step 31659: {'lr': 0.0004520731802425831, 'samples': 6078528, 'steps': 31658, 'loss/train': 1.6138416528701782} -11/07/2021 01:42:57 - INFO - __main__ - Step 31660: {'lr': 0.0004520700556876648, 'samples': 6078720, 'steps': 31659, 'loss/train': 1.4073563814163208} -11/07/2021 01:42:57 - INFO - __main__ - Step 31661: {'lr': 0.0004520669310416969, 'samples': 6078912, 'steps': 31660, 'loss/train': 1.5274254083633423} -11/07/2021 01:42:59 - INFO - __main__ - Step 31662: {'lr': 0.0004520638063046807, 'samples': 6079104, 'steps': 31661, 'loss/train': 1.4219837188720703} -11/07/2021 01:42:59 - INFO - __main__ - Step 31663: {'lr': 0.0004520606814766177, 'samples': 6079296, 'steps': 31662, 'loss/train': 1.5876414775848389} -11/07/2021 01:42:59 - INFO - __main__ - Step 31664: {'lr': 0.00045205755655750924, 'samples': 6079488, 'steps': 31663, 'loss/train': 1.267156958580017} -11/07/2021 01:43:00 - INFO - __main__ - Step 31665: {'lr': 0.0004520544315473568, 'samples': 6079680, 'steps': 31664, 'loss/train': 1.715897798538208} -11/07/2021 01:43:00 - INFO - __main__ - Step 31666: {'lr': 0.00045205130644616177, 'samples': 6079872, 'steps': 31665, 'loss/train': 1.593644618988037} -11/07/2021 01:43:01 - INFO - __main__ - Step 31667: {'lr': 0.0004520481812539255, 'samples': 6080064, 'steps': 31666, 'loss/train': 1.4776939153671265} -11/07/2021 01:43:01 - INFO - __main__ - Step 31668: {'lr': 0.00045204505597064943, 'samples': 6080256, 'steps': 31667, 'loss/train': 1.5776082277297974} -11/07/2021 01:43:02 - INFO - __main__ - Step 31669: {'lr': 0.00045204193059633505, 'samples': 6080448, 'steps': 31668, 'loss/train': 1.3004459142684937} -11/07/2021 01:43:02 - INFO - __main__ - Step 31670: {'lr': 0.0004520388051309836, 'samples': 6080640, 'steps': 31669, 'loss/train': 1.5337731838226318} -11/07/2021 01:43:03 - INFO - __main__ - Step 31671: {'lr': 0.00045203567957459657, 'samples': 6080832, 'steps': 31670, 'loss/train': 1.2069718837738037} -11/07/2021 01:43:03 - INFO - __main__ - Step 31672: {'lr': 0.00045203255392717545, 'samples': 6081024, 'steps': 31671, 'loss/train': 5.560124397277832} -11/07/2021 01:43:04 - INFO - __main__ - Step 31673: {'lr': 0.00045202942818872157, 'samples': 6081216, 'steps': 31672, 'loss/train': 1.22538161277771} -11/07/2021 01:43:04 - INFO - __main__ - Step 31674: {'lr': 0.0004520263023592363, 'samples': 6081408, 'steps': 31673, 'loss/train': 1.615771770477295} -11/07/2021 01:43:05 - INFO - __main__ - Step 31675: {'lr': 0.00045202317643872113, 'samples': 6081600, 'steps': 31674, 'loss/train': 1.6662970781326294} -11/07/2021 01:43:05 - INFO - __main__ - Step 31676: {'lr': 0.00045202005042717743, 'samples': 6081792, 'steps': 31675, 'loss/train': 1.475319266319275} -11/07/2021 01:43:05 - INFO - __main__ - Step 31677: {'lr': 0.0004520169243246066, 'samples': 6081984, 'steps': 31676, 'loss/train': 1.3714836835861206} -11/07/2021 01:43:06 - INFO - __main__ - Step 31678: {'lr': 0.0004520137981310101, 'samples': 6082176, 'steps': 31677, 'loss/train': 1.3201550245285034} -11/07/2021 01:43:07 - INFO - __main__ - Step 31679: {'lr': 0.0004520106718463893, 'samples': 6082368, 'steps': 31678, 'loss/train': 1.5420702695846558} -11/07/2021 01:43:07 - INFO - __main__ - Step 31680: {'lr': 0.0004520075454707456, 'samples': 6082560, 'steps': 31679, 'loss/train': 1.2182254791259766} -11/07/2021 01:43:07 - INFO - __main__ - Step 31681: {'lr': 0.0004520044190040804, 'samples': 6082752, 'steps': 31680, 'loss/train': 1.6463545560836792} -11/07/2021 01:43:08 - INFO - __main__ - Step 31682: {'lr': 0.0004520012924463951, 'samples': 6082944, 'steps': 31681, 'loss/train': 1.6987247467041016} -11/07/2021 01:43:09 - INFO - __main__ - Step 31683: {'lr': 0.0004519981657976912, 'samples': 6083136, 'steps': 31682, 'loss/train': 1.5654196739196777} -11/07/2021 01:43:09 - INFO - __main__ - Step 31684: {'lr': 0.00045199503905797, 'samples': 6083328, 'steps': 31683, 'loss/train': 1.4091193675994873} -11/07/2021 01:43:10 - INFO - __main__ - Step 31685: {'lr': 0.0004519919122272329, 'samples': 6083520, 'steps': 31684, 'loss/train': 0.2060466855764389} -11/07/2021 01:43:10 - INFO - __main__ - Step 31686: {'lr': 0.00045198878530548146, 'samples': 6083712, 'steps': 31685, 'loss/train': 1.2138254642486572} -11/07/2021 01:43:10 - INFO - __main__ - Step 31687: {'lr': 0.0004519856582927169, 'samples': 6083904, 'steps': 31686, 'loss/train': 0.8990980982780457} -11/07/2021 01:43:11 - INFO - __main__ - Step 31688: {'lr': 0.00045198253118894084, 'samples': 6084096, 'steps': 31687, 'loss/train': 1.5900429487228394} -11/07/2021 01:43:12 - INFO - __main__ - Step 31689: {'lr': 0.0004519794039941545, 'samples': 6084288, 'steps': 31688, 'loss/train': 1.7415271997451782} -11/07/2021 01:43:12 - INFO - __main__ - Step 31690: {'lr': 0.0004519762767083593, 'samples': 6084480, 'steps': 31689, 'loss/train': 1.670418620109558} -11/07/2021 01:43:12 - INFO - __main__ - Step 31691: {'lr': 0.00045197314933155677, 'samples': 6084672, 'steps': 31690, 'loss/train': 1.6502057313919067} -11/07/2021 01:43:13 - INFO - __main__ - Step 31692: {'lr': 0.0004519700218637482, 'samples': 6084864, 'steps': 31691, 'loss/train': 1.5056148767471313} -11/07/2021 01:43:13 - INFO - __main__ - Step 31693: {'lr': 0.00045196689430493516, 'samples': 6085056, 'steps': 31692, 'loss/train': 1.3275924921035767} -11/07/2021 01:43:14 - INFO - __main__ - Step 31694: {'lr': 0.00045196376665511883, 'samples': 6085248, 'steps': 31693, 'loss/train': 1.2099881172180176} -11/07/2021 01:43:14 - INFO - __main__ - Step 31695: {'lr': 0.00045196063891430086, 'samples': 6085440, 'steps': 31694, 'loss/train': 1.4326869249343872} -11/07/2021 01:43:15 - INFO - __main__ - Step 31696: {'lr': 0.0004519575110824825, 'samples': 6085632, 'steps': 31695, 'loss/train': 1.1381953954696655} -11/07/2021 01:43:15 - INFO - __main__ - Step 31697: {'lr': 0.0004519543831596652, 'samples': 6085824, 'steps': 31696, 'loss/train': 1.0026839971542358} -11/07/2021 01:43:15 - INFO - __main__ - Step 31698: {'lr': 0.0004519512551458503, 'samples': 6086016, 'steps': 31697, 'loss/train': 1.536896824836731} -11/07/2021 01:43:17 - INFO - __main__ - Step 31699: {'lr': 0.0004519481270410394, 'samples': 6086208, 'steps': 31698, 'loss/train': 1.6450562477111816} -11/07/2021 01:43:17 - INFO - __main__ - Step 31700: {'lr': 0.00045194499884523376, 'samples': 6086400, 'steps': 31699, 'loss/train': 1.4656116962432861} -11/07/2021 01:43:17 - INFO - __main__ - Step 31701: {'lr': 0.0004519418705584348, 'samples': 6086592, 'steps': 31700, 'loss/train': 1.449439525604248} -11/07/2021 01:43:18 - INFO - __main__ - Step 31702: {'lr': 0.0004519387421806439, 'samples': 6086784, 'steps': 31701, 'loss/train': 1.4537426233291626} -11/07/2021 01:43:18 - INFO - __main__ - Step 31703: {'lr': 0.0004519356137118625, 'samples': 6086976, 'steps': 31702, 'loss/train': 1.1907501220703125} -11/07/2021 01:43:20 - INFO - __main__ - Step 31704: {'lr': 0.00045193248515209216, 'samples': 6087168, 'steps': 31703, 'loss/train': 1.3883063793182373} -11/07/2021 01:43:20 - INFO - __main__ - Step 31705: {'lr': 0.0004519293565013341, 'samples': 6087360, 'steps': 31704, 'loss/train': 1.6694093942642212} -11/07/2021 01:43:20 - INFO - __main__ - Step 31706: {'lr': 0.0004519262277595898, 'samples': 6087552, 'steps': 31705, 'loss/train': 1.9630138874053955} -11/07/2021 01:43:21 - INFO - __main__ - Step 31707: {'lr': 0.0004519230989268606, 'samples': 6087744, 'steps': 31706, 'loss/train': 1.0818159580230713} -11/07/2021 01:43:21 - INFO - __main__ - Step 31708: {'lr': 0.000451919970003148, 'samples': 6087936, 'steps': 31707, 'loss/train': 1.182492971420288} -11/07/2021 01:43:21 - INFO - __main__ - Step 31709: {'lr': 0.0004519168409884534, 'samples': 6088128, 'steps': 31708, 'loss/train': 0.6430357098579407} -11/07/2021 01:43:23 - INFO - __main__ - Step 31710: {'lr': 0.00045191371188277817, 'samples': 6088320, 'steps': 31709, 'loss/train': 1.2160098552703857} -11/07/2021 01:43:23 - INFO - __main__ - Step 31711: {'lr': 0.0004519105826861237, 'samples': 6088512, 'steps': 31710, 'loss/train': 2.0542500019073486} -11/07/2021 01:43:23 - INFO - __main__ - Step 31712: {'lr': 0.0004519074533984915, 'samples': 6088704, 'steps': 31711, 'loss/train': 1.3618507385253906} -11/07/2021 01:43:24 - INFO - __main__ - Step 31713: {'lr': 0.0004519043240198829, 'samples': 6088896, 'steps': 31712, 'loss/train': 1.457452654838562} -11/07/2021 01:43:24 - INFO - __main__ - Step 31714: {'lr': 0.0004519011945502993, 'samples': 6089088, 'steps': 31713, 'loss/train': 0.8872636556625366} -11/07/2021 01:43:26 - INFO - __main__ - Step 31715: {'lr': 0.00045189806498974216, 'samples': 6089280, 'steps': 31714, 'loss/train': 1.2994664907455444} -11/07/2021 01:43:26 - INFO - __main__ - Step 31716: {'lr': 0.00045189493533821285, 'samples': 6089472, 'steps': 31715, 'loss/train': 1.7757633924484253} -11/07/2021 01:43:26 - INFO - __main__ - Step 31717: {'lr': 0.0004518918055957128, 'samples': 6089664, 'steps': 31716, 'loss/train': 2.037893056869507} -11/07/2021 01:43:27 - INFO - __main__ - Step 31718: {'lr': 0.0004518886757622435, 'samples': 6089856, 'steps': 31717, 'loss/train': 1.869469165802002} -11/07/2021 01:43:27 - INFO - __main__ - Step 31719: {'lr': 0.0004518855458378062, 'samples': 6090048, 'steps': 31718, 'loss/train': 1.8262141942977905} -11/07/2021 01:43:27 - INFO - __main__ - Step 31720: {'lr': 0.0004518824158224023, 'samples': 6090240, 'steps': 31719, 'loss/train': 1.5757958889007568} -11/07/2021 01:43:28 - INFO - __main__ - Step 31721: {'lr': 0.00045187928571603343, 'samples': 6090432, 'steps': 31720, 'loss/train': 1.4796817302703857} -11/07/2021 01:43:29 - INFO - __main__ - Step 31722: {'lr': 0.0004518761555187008, 'samples': 6090624, 'steps': 31721, 'loss/train': 1.763049840927124} -11/07/2021 01:43:29 - INFO - __main__ - Step 31723: {'lr': 0.00045187302523040597, 'samples': 6090816, 'steps': 31722, 'loss/train': 1.7150776386260986} -11/07/2021 01:43:29 - INFO - __main__ - Step 31724: {'lr': 0.00045186989485115014, 'samples': 6091008, 'steps': 31723, 'loss/train': 1.8566874265670776} -11/07/2021 01:43:30 - INFO - __main__ - Step 31725: {'lr': 0.000451866764380935, 'samples': 6091200, 'steps': 31724, 'loss/train': 0.8527278900146484} -11/07/2021 01:43:30 - INFO - __main__ - Step 31726: {'lr': 0.0004518636338197617, 'samples': 6091392, 'steps': 31725, 'loss/train': 0.79350346326828} -11/07/2021 01:43:31 - INFO - __main__ - Step 31727: {'lr': 0.00045186050316763186, 'samples': 6091584, 'steps': 31726, 'loss/train': 1.8084723949432373} -11/07/2021 01:43:32 - INFO - __main__ - Step 31728: {'lr': 0.0004518573724245467, 'samples': 6091776, 'steps': 31727, 'loss/train': 1.43443763256073} -11/07/2021 01:43:32 - INFO - __main__ - Step 31729: {'lr': 0.00045185424159050776, 'samples': 6091968, 'steps': 31728, 'loss/train': 0.6599883437156677} -11/07/2021 01:43:32 - INFO - __main__ - Step 31730: {'lr': 0.00045185111066551643, 'samples': 6092160, 'steps': 31729, 'loss/train': 1.3211134672164917} -11/07/2021 01:43:33 - INFO - __main__ - Step 31731: {'lr': 0.0004518479796495741, 'samples': 6092352, 'steps': 31730, 'loss/train': 1.319759488105774} -11/07/2021 01:43:33 - INFO - __main__ - Step 31732: {'lr': 0.00045184484854268216, 'samples': 6092544, 'steps': 31731, 'loss/train': 2.2386746406555176} -11/07/2021 01:43:34 - INFO - __main__ - Step 31733: {'lr': 0.00045184171734484203, 'samples': 6092736, 'steps': 31732, 'loss/train': 1.6354384422302246} -11/07/2021 01:43:34 - INFO - __main__ - Step 31734: {'lr': 0.00045183858605605517, 'samples': 6092928, 'steps': 31733, 'loss/train': 1.3734209537506104} -11/07/2021 01:43:35 - INFO - __main__ - Step 31735: {'lr': 0.00045183545467632295, 'samples': 6093120, 'steps': 31734, 'loss/train': 1.4117457866668701} -11/07/2021 01:43:35 - INFO - __main__ - Step 31736: {'lr': 0.0004518323232056468, 'samples': 6093312, 'steps': 31735, 'loss/train': 1.3299400806427002} -11/07/2021 01:43:35 - INFO - __main__ - Step 31737: {'lr': 0.0004518291916440281, 'samples': 6093504, 'steps': 31736, 'loss/train': 1.7732288837432861} -11/07/2021 01:43:36 - INFO - __main__ - Step 31738: {'lr': 0.0004518260599914683, 'samples': 6093696, 'steps': 31737, 'loss/train': 1.7293723821640015} -11/07/2021 01:43:37 - INFO - __main__ - Step 31739: {'lr': 0.0004518229282479688, 'samples': 6093888, 'steps': 31738, 'loss/train': 1.130365252494812} -11/07/2021 01:43:37 - INFO - __main__ - Step 31740: {'lr': 0.000451819796413531, 'samples': 6094080, 'steps': 31739, 'loss/train': 1.5491985082626343} -11/07/2021 01:43:37 - INFO - __main__ - Step 31741: {'lr': 0.0004518166644881563, 'samples': 6094272, 'steps': 31740, 'loss/train': 1.8045982122421265} -11/07/2021 01:43:38 - INFO - __main__ - Step 31742: {'lr': 0.0004518135324718461, 'samples': 6094464, 'steps': 31741, 'loss/train': 1.6794017553329468} -11/07/2021 01:43:39 - INFO - __main__ - Step 31743: {'lr': 0.00045181040036460185, 'samples': 6094656, 'steps': 31742, 'loss/train': 1.4577114582061768} -11/07/2021 01:43:39 - INFO - __main__ - Step 31744: {'lr': 0.0004518072681664249, 'samples': 6094848, 'steps': 31743, 'loss/train': 1.1413843631744385} -11/07/2021 01:43:40 - INFO - __main__ - Step 31745: {'lr': 0.0004518041358773168, 'samples': 6095040, 'steps': 31744, 'loss/train': 1.9787827730178833} -11/07/2021 01:43:40 - INFO - __main__ - Step 31746: {'lr': 0.0004518010034972788, 'samples': 6095232, 'steps': 31745, 'loss/train': 0.9560813903808594} -11/07/2021 01:43:40 - INFO - __main__ - Step 31747: {'lr': 0.0004517978710263124, 'samples': 6095424, 'steps': 31746, 'loss/train': 2.453749179840088} -11/07/2021 01:43:42 - INFO - __main__ - Step 31748: {'lr': 0.0004517947384644191, 'samples': 6095616, 'steps': 31747, 'loss/train': 1.4488246440887451} -11/07/2021 01:43:42 - INFO - __main__ - Step 31749: {'lr': 0.00045179160581160005, 'samples': 6095808, 'steps': 31748, 'loss/train': 1.95890212059021} -11/07/2021 01:43:42 - INFO - __main__ - Step 31750: {'lr': 0.0004517884730678569, 'samples': 6096000, 'steps': 31749, 'loss/train': 2.0341854095458984} -11/07/2021 01:43:43 - INFO - __main__ - Step 31751: {'lr': 0.00045178534023319097, 'samples': 6096192, 'steps': 31750, 'loss/train': 1.2793896198272705} -11/07/2021 01:43:43 - INFO - __main__ - Step 31752: {'lr': 0.00045178220730760367, 'samples': 6096384, 'steps': 31751, 'loss/train': 1.2757604122161865} -11/07/2021 01:43:43 - INFO - __main__ - Step 31753: {'lr': 0.0004517790742910964, 'samples': 6096576, 'steps': 31752, 'loss/train': 1.3032244443893433} -11/07/2021 01:43:44 - INFO - __main__ - Step 31754: {'lr': 0.0004517759411836706, 'samples': 6096768, 'steps': 31753, 'loss/train': 1.0655202865600586} -11/07/2021 01:43:45 - INFO - __main__ - Step 31755: {'lr': 0.0004517728079853277, 'samples': 6096960, 'steps': 31754, 'loss/train': 1.4300718307495117} -11/07/2021 01:43:45 - INFO - __main__ - Step 31756: {'lr': 0.0004517696746960691, 'samples': 6097152, 'steps': 31755, 'loss/train': 1.6231884956359863} -11/07/2021 01:43:45 - INFO - __main__ - Step 31757: {'lr': 0.00045176654131589617, 'samples': 6097344, 'steps': 31756, 'loss/train': 1.2734031677246094} -11/07/2021 01:43:46 - INFO - __main__ - Step 31758: {'lr': 0.0004517634078448103, 'samples': 6097536, 'steps': 31757, 'loss/train': 1.4724065065383911} -11/07/2021 01:43:46 - INFO - __main__ - Step 31759: {'lr': 0.0004517602742828131, 'samples': 6097728, 'steps': 31758, 'loss/train': 1.2505757808685303} -11/07/2021 01:43:47 - INFO - __main__ - Step 31760: {'lr': 0.0004517571406299057, 'samples': 6097920, 'steps': 31759, 'loss/train': 1.5878269672393799} -11/07/2021 01:43:47 - INFO - __main__ - Step 31761: {'lr': 0.0004517540068860897, 'samples': 6098112, 'steps': 31760, 'loss/train': 1.867502212524414} -11/07/2021 01:43:48 - INFO - __main__ - Step 31762: {'lr': 0.0004517508730513664, 'samples': 6098304, 'steps': 31761, 'loss/train': 1.4676836729049683} -11/07/2021 01:43:48 - INFO - __main__ - Step 31763: {'lr': 0.00045174773912573735, 'samples': 6098496, 'steps': 31762, 'loss/train': 1.7907060384750366} -11/07/2021 01:43:49 - INFO - __main__ - Step 31764: {'lr': 0.00045174460510920386, 'samples': 6098688, 'steps': 31763, 'loss/train': 1.3359169960021973} -11/07/2021 01:43:49 - INFO - __main__ - Step 31765: {'lr': 0.00045174147100176734, 'samples': 6098880, 'steps': 31764, 'loss/train': 1.377150535583496} -11/07/2021 01:43:50 - INFO - __main__ - Step 31766: {'lr': 0.00045173833680342925, 'samples': 6099072, 'steps': 31765, 'loss/train': 1.5649809837341309} -11/07/2021 01:43:50 - INFO - __main__ - Step 31767: {'lr': 0.00045173520251419095, 'samples': 6099264, 'steps': 31766, 'loss/train': 1.931465983390808} -11/07/2021 01:43:51 - INFO - __main__ - Step 31768: {'lr': 0.0004517320681340539, 'samples': 6099456, 'steps': 31767, 'loss/train': 1.7786474227905273} -11/07/2021 01:43:51 - INFO - __main__ - Step 31769: {'lr': 0.0004517289336630195, 'samples': 6099648, 'steps': 31768, 'loss/train': 1.407793641090393} -11/07/2021 01:43:52 - INFO - __main__ - Step 31770: {'lr': 0.0004517257991010891, 'samples': 6099840, 'steps': 31769, 'loss/train': 1.3097972869873047} -11/07/2021 01:43:52 - INFO - __main__ - Step 31771: {'lr': 0.0004517226644482642, 'samples': 6100032, 'steps': 31770, 'loss/train': 1.1694785356521606} -11/07/2021 01:43:53 - INFO - __main__ - Step 31772: {'lr': 0.00045171952970454623, 'samples': 6100224, 'steps': 31771, 'loss/train': 1.6580748558044434} -11/07/2021 01:43:53 - INFO - __main__ - Step 31773: {'lr': 0.0004517163948699365, 'samples': 6100416, 'steps': 31772, 'loss/train': 1.575675129890442} -11/07/2021 01:43:53 - INFO - __main__ - Step 31774: {'lr': 0.00045171325994443644, 'samples': 6100608, 'steps': 31773, 'loss/train': 1.6436625719070435} -11/07/2021 01:43:54 - INFO - __main__ - Step 31775: {'lr': 0.00045171012492804753, 'samples': 6100800, 'steps': 31774, 'loss/train': 0.5877825021743774} -11/07/2021 01:43:55 - INFO - __main__ - Step 31776: {'lr': 0.0004517069898207712, 'samples': 6100992, 'steps': 31775, 'loss/train': 1.739137053489685} -11/07/2021 01:43:55 - INFO - __main__ - Step 31777: {'lr': 0.00045170385462260876, 'samples': 6101184, 'steps': 31776, 'loss/train': 1.6380271911621094} -11/07/2021 01:43:55 - INFO - __main__ - Step 31778: {'lr': 0.0004517007193335617, 'samples': 6101376, 'steps': 31777, 'loss/train': 1.0152171850204468} -11/07/2021 01:43:56 - INFO - __main__ - Step 31779: {'lr': 0.0004516975839536314, 'samples': 6101568, 'steps': 31778, 'loss/train': 1.0910487174987793} -11/07/2021 01:43:57 - INFO - __main__ - Step 31780: {'lr': 0.0004516944484828193, 'samples': 6101760, 'steps': 31779, 'loss/train': 1.5282224416732788} -11/07/2021 01:43:57 - INFO - __main__ - Step 31781: {'lr': 0.0004516913129211268, 'samples': 6101952, 'steps': 31780, 'loss/train': 0.6756600141525269} -11/07/2021 01:43:57 - INFO - __main__ - Step 31782: {'lr': 0.00045168817726855525, 'samples': 6102144, 'steps': 31781, 'loss/train': 0.26307106018066406} -11/07/2021 01:43:58 - INFO - __main__ - Step 31783: {'lr': 0.0004516850415251061, 'samples': 6102336, 'steps': 31782, 'loss/train': 1.4687156677246094} -11/07/2021 01:43:58 - INFO - __main__ - Step 31784: {'lr': 0.0004516819056907809, 'samples': 6102528, 'steps': 31783, 'loss/train': 1.848503589630127} -11/07/2021 01:43:59 - INFO - __main__ - Step 31785: {'lr': 0.0004516787697655809, 'samples': 6102720, 'steps': 31784, 'loss/train': 0.48024705052375793} -11/07/2021 01:44:00 - INFO - __main__ - Step 31786: {'lr': 0.0004516756337495075, 'samples': 6102912, 'steps': 31785, 'loss/train': 1.448751449584961} -11/07/2021 01:44:00 - INFO - __main__ - Step 31787: {'lr': 0.0004516724976425622, 'samples': 6103104, 'steps': 31786, 'loss/train': 1.7140107154846191} -11/07/2021 01:44:00 - INFO - __main__ - Step 31788: {'lr': 0.0004516693614447464, 'samples': 6103296, 'steps': 31787, 'loss/train': 1.5359638929367065} -11/07/2021 01:44:01 - INFO - __main__ - Step 31789: {'lr': 0.0004516662251560615, 'samples': 6103488, 'steps': 31788, 'loss/train': 1.5012446641921997} -11/07/2021 01:44:01 - INFO - __main__ - Step 31790: {'lr': 0.0004516630887765089, 'samples': 6103680, 'steps': 31789, 'loss/train': 1.7036118507385254} -11/07/2021 01:44:02 - INFO - __main__ - Step 31791: {'lr': 0.00045165995230609003, 'samples': 6103872, 'steps': 31790, 'loss/train': 1.1799037456512451} -11/07/2021 01:44:02 - INFO - __main__ - Step 31792: {'lr': 0.0004516568157448063, 'samples': 6104064, 'steps': 31791, 'loss/train': 1.6661583185195923} -11/07/2021 01:44:03 - INFO - __main__ - Step 31793: {'lr': 0.00045165367909265916, 'samples': 6104256, 'steps': 31792, 'loss/train': 0.8608067631721497} -11/07/2021 01:44:03 - INFO - __main__ - Step 31794: {'lr': 0.00045165054234964984, 'samples': 6104448, 'steps': 31793, 'loss/train': 1.4671131372451782} -11/07/2021 01:44:03 - INFO - __main__ - Step 31795: {'lr': 0.0004516474055157801, 'samples': 6104640, 'steps': 31794, 'loss/train': 1.7963557243347168} -11/07/2021 01:44:04 - INFO - __main__ - Step 31796: {'lr': 0.000451644268591051, 'samples': 6104832, 'steps': 31795, 'loss/train': 1.595018982887268} -11/07/2021 01:44:05 - INFO - __main__ - Step 31797: {'lr': 0.00045164113157546414, 'samples': 6105024, 'steps': 31796, 'loss/train': 1.6584199666976929} -11/07/2021 01:44:05 - INFO - __main__ - Step 31798: {'lr': 0.0004516379944690209, 'samples': 6105216, 'steps': 31797, 'loss/train': 1.519771933555603} -11/07/2021 01:44:05 - INFO - __main__ - Step 31799: {'lr': 0.0004516348572717227, 'samples': 6105408, 'steps': 31798, 'loss/train': 1.4903631210327148} -11/07/2021 01:44:06 - INFO - __main__ - Step 31800: {'lr': 0.000451631719983571, 'samples': 6105600, 'steps': 31799, 'loss/train': 1.4289230108261108} -11/07/2021 01:44:07 - INFO - __main__ - Step 31801: {'lr': 0.00045162858260456705, 'samples': 6105792, 'steps': 31800, 'loss/train': 1.5293996334075928} -11/07/2021 01:44:07 - INFO - __main__ - Step 31802: {'lr': 0.0004516254451347125, 'samples': 6105984, 'steps': 31801, 'loss/train': 1.545749306678772} -11/07/2021 01:44:08 - INFO - __main__ - Step 31803: {'lr': 0.0004516223075740085, 'samples': 6106176, 'steps': 31802, 'loss/train': 0.7313265204429626} -11/07/2021 01:44:08 - INFO - __main__ - Step 31804: {'lr': 0.00045161916992245664, 'samples': 6106368, 'steps': 31803, 'loss/train': 1.424360990524292} -11/07/2021 01:44:08 - INFO - __main__ - Step 31805: {'lr': 0.0004516160321800584, 'samples': 6106560, 'steps': 31804, 'loss/train': 1.6591503620147705} -11/07/2021 01:44:09 - INFO - __main__ - Step 31806: {'lr': 0.000451612894346815, 'samples': 6106752, 'steps': 31805, 'loss/train': 1.6420533657073975} -11/07/2021 01:44:10 - INFO - __main__ - Step 31807: {'lr': 0.00045160975642272795, 'samples': 6106944, 'steps': 31806, 'loss/train': 1.7411733865737915} -11/07/2021 01:44:10 - INFO - __main__ - Step 31808: {'lr': 0.0004516066184077986, 'samples': 6107136, 'steps': 31807, 'loss/train': 0.8653108477592468} -11/07/2021 01:44:10 - INFO - __main__ - Step 31809: {'lr': 0.0004516034803020285, 'samples': 6107328, 'steps': 31808, 'loss/train': 1.52175772190094} -11/07/2021 01:44:11 - INFO - __main__ - Step 31810: {'lr': 0.0004516003421054189, 'samples': 6107520, 'steps': 31809, 'loss/train': 1.6941521167755127} -11/07/2021 01:44:12 - INFO - __main__ - Step 31811: {'lr': 0.0004515972038179714, 'samples': 6107712, 'steps': 31810, 'loss/train': 1.3670642375946045} -11/07/2021 01:44:12 - INFO - __main__ - Step 31812: {'lr': 0.0004515940654396872, 'samples': 6107904, 'steps': 31811, 'loss/train': 2.074129581451416} -11/07/2021 01:44:13 - INFO - __main__ - Step 31813: {'lr': 0.00045159092697056794, 'samples': 6108096, 'steps': 31812, 'loss/train': 1.4383933544158936} -11/07/2021 01:44:13 - INFO - __main__ - Step 31814: {'lr': 0.00045158778841061483, 'samples': 6108288, 'steps': 31813, 'loss/train': 1.4272984266281128} -11/07/2021 01:44:13 - INFO - __main__ - Step 31815: {'lr': 0.0004515846497598294, 'samples': 6108480, 'steps': 31814, 'loss/train': 1.7123581171035767} -11/07/2021 01:44:14 - INFO - __main__ - Step 31816: {'lr': 0.000451581511018213, 'samples': 6108672, 'steps': 31815, 'loss/train': 1.681820034980774} -11/07/2021 01:44:15 - INFO - __main__ - Step 31817: {'lr': 0.00045157837218576713, 'samples': 6108864, 'steps': 31816, 'loss/train': 1.696065068244934} -11/07/2021 01:44:15 - INFO - __main__ - Step 31818: {'lr': 0.00045157523326249316, 'samples': 6109056, 'steps': 31817, 'loss/train': 1.6681617498397827} -11/07/2021 01:44:15 - INFO - __main__ - Step 31819: {'lr': 0.00045157209424839253, 'samples': 6109248, 'steps': 31818, 'loss/train': 1.529592752456665} -11/07/2021 01:44:16 - INFO - __main__ - Step 31820: {'lr': 0.0004515689551434665, 'samples': 6109440, 'steps': 31819, 'loss/train': 1.5102119445800781} -11/07/2021 01:44:17 - INFO - __main__ - Step 31821: {'lr': 0.00045156581594771675, 'samples': 6109632, 'steps': 31820, 'loss/train': 1.5752092599868774} -11/07/2021 01:44:17 - INFO - __main__ - Step 31822: {'lr': 0.00045156267666114446, 'samples': 6109824, 'steps': 31821, 'loss/train': 1.095093846321106} -11/07/2021 01:44:17 - INFO - __main__ - Step 31823: {'lr': 0.0004515595372837512, 'samples': 6110016, 'steps': 31822, 'loss/train': 1.6193000078201294} -11/07/2021 01:44:18 - INFO - __main__ - Step 31824: {'lr': 0.00045155639781553825, 'samples': 6110208, 'steps': 31823, 'loss/train': 1.6955679655075073} -11/07/2021 01:44:18 - INFO - __main__ - Step 31825: {'lr': 0.00045155325825650715, 'samples': 6110400, 'steps': 31824, 'loss/train': 1.2122478485107422} -11/07/2021 01:44:18 - INFO - __main__ - Step 31826: {'lr': 0.00045155011860665927, 'samples': 6110592, 'steps': 31825, 'loss/train': 1.2631003856658936} -11/07/2021 01:44:20 - INFO - __main__ - Step 31827: {'lr': 0.00045154697886599606, 'samples': 6110784, 'steps': 31826, 'loss/train': 0.4462384581565857} -11/07/2021 01:44:20 - INFO - __main__ - Step 31828: {'lr': 0.0004515438390345188, 'samples': 6110976, 'steps': 31827, 'loss/train': 1.3006891012191772} -11/07/2021 01:44:20 - INFO - __main__ - Step 31829: {'lr': 0.00045154069911222905, 'samples': 6111168, 'steps': 31828, 'loss/train': 1.6836390495300293} -11/07/2021 01:44:21 - INFO - __main__ - Step 31830: {'lr': 0.0004515375590991281, 'samples': 6111360, 'steps': 31829, 'loss/train': 1.4358208179473877} -11/07/2021 01:44:21 - INFO - __main__ - Step 31831: {'lr': 0.0004515344189952175, 'samples': 6111552, 'steps': 31830, 'loss/train': 1.475838541984558} -11/07/2021 01:44:22 - INFO - __main__ - Step 31832: {'lr': 0.0004515312788004986, 'samples': 6111744, 'steps': 31831, 'loss/train': 1.4673216342926025} -11/07/2021 01:44:22 - INFO - __main__ - Step 31833: {'lr': 0.00045152813851497274, 'samples': 6111936, 'steps': 31832, 'loss/train': 1.525496006011963} -11/07/2021 01:44:23 - INFO - __main__ - Step 31834: {'lr': 0.0004515249981386416, 'samples': 6112128, 'steps': 31833, 'loss/train': 1.4047716856002808} -11/07/2021 01:44:23 - INFO - __main__ - Step 31835: {'lr': 0.0004515218576715062, 'samples': 6112320, 'steps': 31834, 'loss/train': 1.6120771169662476} -11/07/2021 01:44:23 - INFO - __main__ - Step 31836: {'lr': 0.00045151871711356827, 'samples': 6112512, 'steps': 31835, 'loss/train': 0.9932732582092285} -11/07/2021 01:44:25 - INFO - __main__ - Step 31837: {'lr': 0.0004515155764648291, 'samples': 6112704, 'steps': 31836, 'loss/train': 1.6056442260742188} -11/07/2021 01:44:25 - INFO - __main__ - Step 31838: {'lr': 0.0004515124357252901, 'samples': 6112896, 'steps': 31837, 'loss/train': 0.9801680445671082} -11/07/2021 01:44:25 - INFO - __main__ - Step 31839: {'lr': 0.0004515092948949527, 'samples': 6113088, 'steps': 31838, 'loss/train': 1.792125940322876} -11/07/2021 01:44:26 - INFO - __main__ - Step 31840: {'lr': 0.00045150615397381835, 'samples': 6113280, 'steps': 31839, 'loss/train': 1.0138678550720215} -11/07/2021 01:44:26 - INFO - __main__ - Step 31841: {'lr': 0.0004515030129618884, 'samples': 6113472, 'steps': 31840, 'loss/train': 1.8094062805175781} -11/07/2021 01:44:27 - INFO - __main__ - Step 31842: {'lr': 0.0004514998718591643, 'samples': 6113664, 'steps': 31841, 'loss/train': 1.5744199752807617} -11/07/2021 01:44:27 - INFO - __main__ - Step 31843: {'lr': 0.0004514967306656475, 'samples': 6113856, 'steps': 31842, 'loss/train': 1.845720648765564} -11/07/2021 01:44:28 - INFO - __main__ - Step 31844: {'lr': 0.0004514935893813394, 'samples': 6114048, 'steps': 31843, 'loss/train': 1.3678845167160034} -11/07/2021 01:44:28 - INFO - __main__ - Step 31845: {'lr': 0.00045149044800624135, 'samples': 6114240, 'steps': 31844, 'loss/train': 1.5553712844848633} -11/07/2021 01:44:28 - INFO - __main__ - Step 31846: {'lr': 0.0004514873065403549, 'samples': 6114432, 'steps': 31845, 'loss/train': 1.1362268924713135} -11/07/2021 01:44:29 - INFO - __main__ - Step 31847: {'lr': 0.0004514841649836813, 'samples': 6114624, 'steps': 31846, 'loss/train': 1.644763708114624} -11/07/2021 01:44:30 - INFO - __main__ - Step 31848: {'lr': 0.000451481023336222, 'samples': 6114816, 'steps': 31847, 'loss/train': 1.5752571821212769} -11/07/2021 01:44:30 - INFO - __main__ - Step 31849: {'lr': 0.0004514778815979785, 'samples': 6115008, 'steps': 31848, 'loss/train': 1.764130711555481} -11/07/2021 01:44:30 - INFO - __main__ - Step 31850: {'lr': 0.0004514747397689522, 'samples': 6115200, 'steps': 31849, 'loss/train': 1.4945341348648071} -11/07/2021 01:44:31 - INFO - __main__ - Step 31851: {'lr': 0.0004514715978491445, 'samples': 6115392, 'steps': 31850, 'loss/train': 1.451790452003479} -11/07/2021 01:44:31 - INFO - __main__ - Step 31852: {'lr': 0.0004514684558385568, 'samples': 6115584, 'steps': 31851, 'loss/train': 1.7369520664215088} -11/07/2021 01:44:32 - INFO - __main__ - Step 31853: {'lr': 0.0004514653137371905, 'samples': 6115776, 'steps': 31852, 'loss/train': 1.2488102912902832} -11/07/2021 01:44:33 - INFO - __main__ - Step 31854: {'lr': 0.000451462171545047, 'samples': 6115968, 'steps': 31853, 'loss/train': 1.4568167924880981} -11/07/2021 01:44:33 - INFO - __main__ - Step 31855: {'lr': 0.00045145902926212785, 'samples': 6116160, 'steps': 31854, 'loss/train': 2.047454357147217} -11/07/2021 01:44:33 - INFO - __main__ - Step 31856: {'lr': 0.0004514558868884343, 'samples': 6116352, 'steps': 31855, 'loss/train': 1.3141847848892212} -11/07/2021 01:44:34 - INFO - __main__ - Step 31857: {'lr': 0.00045145274442396786, 'samples': 6116544, 'steps': 31856, 'loss/train': 1.307631015777588} -11/07/2021 01:44:35 - INFO - __main__ - Step 31858: {'lr': 0.00045144960186872996, 'samples': 6116736, 'steps': 31857, 'loss/train': 1.6855310201644897} -11/07/2021 01:44:35 - INFO - __main__ - Step 31859: {'lr': 0.0004514464592227219, 'samples': 6116928, 'steps': 31858, 'loss/train': 1.911537528038025} -11/07/2021 01:44:35 - INFO - __main__ - Step 31860: {'lr': 0.0004514433164859453, 'samples': 6117120, 'steps': 31859, 'loss/train': 1.107447862625122} -11/07/2021 01:44:36 - INFO - __main__ - Step 31861: {'lr': 0.0004514401736584013, 'samples': 6117312, 'steps': 31860, 'loss/train': 1.288212537765503} -11/07/2021 01:44:36 - INFO - __main__ - Step 31862: {'lr': 0.0004514370307400916, 'samples': 6117504, 'steps': 31861, 'loss/train': 2.230525016784668} -11/07/2021 01:44:36 - INFO - __main__ - Step 31863: {'lr': 0.00045143388773101733, 'samples': 6117696, 'steps': 31862, 'loss/train': 1.853481411933899} -11/07/2021 01:44:37 - INFO - __main__ - Step 31864: {'lr': 0.0004514307446311802, 'samples': 6117888, 'steps': 31863, 'loss/train': 1.6902889013290405} -11/07/2021 01:44:38 - INFO - __main__ - Step 31865: {'lr': 0.0004514276014405814, 'samples': 6118080, 'steps': 31864, 'loss/train': 0.38764888048171997} -11/07/2021 01:44:38 - INFO - __main__ - Step 31866: {'lr': 0.00045142445815922244, 'samples': 6118272, 'steps': 31865, 'loss/train': 1.5117849111557007} -11/07/2021 01:44:38 - INFO - __main__ - Step 31867: {'lr': 0.0004514213147871047, 'samples': 6118464, 'steps': 31866, 'loss/train': 1.4329771995544434} -11/07/2021 01:44:39 - INFO - __main__ - Step 31868: {'lr': 0.00045141817132422974, 'samples': 6118656, 'steps': 31867, 'loss/train': 1.3428623676300049} -11/07/2021 01:44:40 - INFO - __main__ - Step 31869: {'lr': 0.0004514150277705988, 'samples': 6118848, 'steps': 31868, 'loss/train': 1.7656563520431519} -11/07/2021 01:44:40 - INFO - __main__ - Step 31870: {'lr': 0.0004514118841262133, 'samples': 6119040, 'steps': 31869, 'loss/train': 1.6058647632598877} -11/07/2021 01:44:41 - INFO - __main__ - Step 31871: {'lr': 0.0004514087403910748, 'samples': 6119232, 'steps': 31870, 'loss/train': 1.6545133590698242} -11/07/2021 01:44:41 - INFO - __main__ - Step 31872: {'lr': 0.00045140559656518456, 'samples': 6119424, 'steps': 31871, 'loss/train': 1.609268069267273} -11/07/2021 01:44:41 - INFO - __main__ - Step 31873: {'lr': 0.0004514024526485441, 'samples': 6119616, 'steps': 31872, 'loss/train': 1.8082526922225952} -11/07/2021 01:44:43 - INFO - __main__ - Step 31874: {'lr': 0.0004513993086411548, 'samples': 6119808, 'steps': 31873, 'loss/train': 1.2211987972259521} -11/07/2021 01:44:43 - INFO - __main__ - Step 31875: {'lr': 0.00045139616454301806, 'samples': 6120000, 'steps': 31874, 'loss/train': 0.29446327686309814} -11/07/2021 01:44:43 - INFO - __main__ - Step 31876: {'lr': 0.00045139302035413534, 'samples': 6120192, 'steps': 31875, 'loss/train': 1.5343080759048462} -11/07/2021 01:44:44 - INFO - __main__ - Step 31877: {'lr': 0.00045138987607450803, 'samples': 6120384, 'steps': 31876, 'loss/train': 2.0093131065368652} -11/07/2021 01:44:44 - INFO - __main__ - Step 31878: {'lr': 0.00045138673170413756, 'samples': 6120576, 'steps': 31877, 'loss/train': 1.5735539197921753} -11/07/2021 01:44:45 - INFO - __main__ - Step 31879: {'lr': 0.0004513835872430253, 'samples': 6120768, 'steps': 31878, 'loss/train': 1.7831584215164185} -11/07/2021 01:44:46 - INFO - __main__ - Step 31880: {'lr': 0.0004513804426911727, 'samples': 6120960, 'steps': 31879, 'loss/train': 1.510374665260315} -11/07/2021 01:44:46 - INFO - __main__ - Step 31881: {'lr': 0.00045137729804858124, 'samples': 6121152, 'steps': 31880, 'loss/train': 1.622793436050415} -11/07/2021 01:44:46 - INFO - __main__ - Step 31882: {'lr': 0.00045137415331525225, 'samples': 6121344, 'steps': 31881, 'loss/train': 1.7737555503845215} -11/07/2021 01:44:47 - INFO - __main__ - Step 31883: {'lr': 0.0004513710084911872, 'samples': 6121536, 'steps': 31882, 'loss/train': 1.6020547151565552} -11/07/2021 01:44:48 - INFO - __main__ - Step 31884: {'lr': 0.00045136786357638736, 'samples': 6121728, 'steps': 31883, 'loss/train': 0.3957446217536926} -11/07/2021 01:44:48 - INFO - __main__ - Step 31885: {'lr': 0.00045136471857085435, 'samples': 6121920, 'steps': 31884, 'loss/train': 1.7443677186965942} -11/07/2021 01:44:48 - INFO - __main__ - Step 31886: {'lr': 0.0004513615734745895, 'samples': 6122112, 'steps': 31885, 'loss/train': 1.861700415611267} -11/07/2021 01:44:49 - INFO - __main__ - Step 31887: {'lr': 0.00045135842828759426, 'samples': 6122304, 'steps': 31886, 'loss/train': 1.7172307968139648} -11/07/2021 01:44:49 - INFO - __main__ - Step 31888: {'lr': 0.00045135528300987006, 'samples': 6122496, 'steps': 31887, 'loss/train': 1.388944149017334} -11/07/2021 01:44:50 - INFO - __main__ - Step 31889: {'lr': 0.00045135213764141814, 'samples': 6122688, 'steps': 31888, 'loss/train': 1.505753993988037} -11/07/2021 01:44:50 - INFO - __main__ - Step 31890: {'lr': 0.00045134899218224014, 'samples': 6122880, 'steps': 31889, 'loss/train': 1.5831694602966309} -11/07/2021 01:44:51 - INFO - __main__ - Step 31891: {'lr': 0.0004513458466323374, 'samples': 6123072, 'steps': 31890, 'loss/train': 1.688417673110962} -11/07/2021 01:44:51 - INFO - __main__ - Step 31892: {'lr': 0.0004513427009917113, 'samples': 6123264, 'steps': 31891, 'loss/train': 1.3869106769561768} -11/07/2021 01:44:52 - INFO - __main__ - Step 31893: {'lr': 0.0004513395552603633, 'samples': 6123456, 'steps': 31892, 'loss/train': 1.3275775909423828} -11/07/2021 01:44:52 - INFO - __main__ - Step 31894: {'lr': 0.0004513364094382948, 'samples': 6123648, 'steps': 31893, 'loss/train': 1.7369481325149536} -11/07/2021 01:44:53 - INFO - __main__ - Step 31895: {'lr': 0.00045133326352550724, 'samples': 6123840, 'steps': 31894, 'loss/train': 2.2003068923950195} -11/07/2021 01:44:53 - INFO - __main__ - Step 31896: {'lr': 0.000451330117522002, 'samples': 6124032, 'steps': 31895, 'loss/train': 1.3032506704330444} -11/07/2021 01:44:54 - INFO - __main__ - Step 31897: {'lr': 0.00045132697142778044, 'samples': 6124224, 'steps': 31896, 'loss/train': 1.6254322528839111} -11/07/2021 01:44:54 - INFO - __main__ - Step 31898: {'lr': 0.0004513238252428442, 'samples': 6124416, 'steps': 31897, 'loss/train': 1.728275179862976} -11/07/2021 01:44:54 - INFO - __main__ - Step 31899: {'lr': 0.0004513206789671945, 'samples': 6124608, 'steps': 31898, 'loss/train': 1.701587438583374} -11/07/2021 01:44:55 - INFO - __main__ - Step 31900: {'lr': 0.00045131753260083276, 'samples': 6124800, 'steps': 31899, 'loss/train': 1.1780604124069214} -11/07/2021 01:44:56 - INFO - __main__ - Step 31901: {'lr': 0.0004513143861437605, 'samples': 6124992, 'steps': 31900, 'loss/train': 1.972902536392212} -11/07/2021 01:44:56 - INFO - __main__ - Step 31902: {'lr': 0.00045131123959597905, 'samples': 6125184, 'steps': 31901, 'loss/train': 1.482000708580017} -11/07/2021 01:44:56 - INFO - __main__ - Step 31903: {'lr': 0.0004513080929574899, 'samples': 6125376, 'steps': 31902, 'loss/train': 1.3008524179458618} -11/07/2021 01:44:57 - INFO - __main__ - Step 31904: {'lr': 0.0004513049462282943, 'samples': 6125568, 'steps': 31903, 'loss/train': 1.3399587869644165} -11/07/2021 01:44:58 - INFO - __main__ - Step 31905: {'lr': 0.00045130179940839395, 'samples': 6125760, 'steps': 31904, 'loss/train': 1.515134334564209} -11/07/2021 01:44:58 - INFO - __main__ - Step 31906: {'lr': 0.00045129865249779, 'samples': 6125952, 'steps': 31905, 'loss/train': 1.4602670669555664} -11/07/2021 01:44:59 - INFO - __main__ - Step 31907: {'lr': 0.0004512955054964841, 'samples': 6126144, 'steps': 31906, 'loss/train': 1.7514537572860718} -11/07/2021 01:44:59 - INFO - __main__ - Step 31908: {'lr': 0.0004512923584044775, 'samples': 6126336, 'steps': 31907, 'loss/train': 2.1205618381500244} -11/07/2021 01:44:59 - INFO - __main__ - Step 31909: {'lr': 0.0004512892112217717, 'samples': 6126528, 'steps': 31908, 'loss/train': 1.4181747436523438} -11/07/2021 01:45:00 - INFO - __main__ - Step 31910: {'lr': 0.00045128606394836805, 'samples': 6126720, 'steps': 31909, 'loss/train': 1.6861112117767334} -11/07/2021 01:45:01 - INFO - __main__ - Step 31911: {'lr': 0.00045128291658426796, 'samples': 6126912, 'steps': 31910, 'loss/train': 2.197659492492676} -11/07/2021 01:45:01 - INFO - __main__ - Step 31912: {'lr': 0.00045127976912947296, 'samples': 6127104, 'steps': 31911, 'loss/train': 1.7058151960372925} -11/07/2021 01:45:01 - INFO - __main__ - Step 31913: {'lr': 0.00045127662158398434, 'samples': 6127296, 'steps': 31912, 'loss/train': 2.1316757202148438} -11/07/2021 01:45:02 - INFO - __main__ - Step 31914: {'lr': 0.00045127347394780367, 'samples': 6127488, 'steps': 31913, 'loss/train': 1.6989363431930542} -11/07/2021 01:45:02 - INFO - __main__ - Step 31915: {'lr': 0.00045127032622093225, 'samples': 6127680, 'steps': 31914, 'loss/train': 1.6610476970672607} -11/07/2021 01:45:03 - INFO - __main__ - Step 31916: {'lr': 0.0004512671784033715, 'samples': 6127872, 'steps': 31915, 'loss/train': 1.3292311429977417} -11/07/2021 01:45:03 - INFO - __main__ - Step 31917: {'lr': 0.00045126403049512286, 'samples': 6128064, 'steps': 31916, 'loss/train': 1.2609515190124512} -11/07/2021 01:45:04 - INFO - __main__ - Step 31918: {'lr': 0.0004512608824961878, 'samples': 6128256, 'steps': 31917, 'loss/train': 1.5588932037353516} -11/07/2021 01:45:04 - INFO - __main__ - Step 31919: {'lr': 0.00045125773440656756, 'samples': 6128448, 'steps': 31918, 'loss/train': 1.2627248764038086} -11/07/2021 01:45:05 - INFO - __main__ - Step 31920: {'lr': 0.0004512545862262638, 'samples': 6128640, 'steps': 31919, 'loss/train': 1.905514121055603} -11/07/2021 01:45:06 - INFO - __main__ - Step 31921: {'lr': 0.0004512514379552779, 'samples': 6128832, 'steps': 31920, 'loss/train': 1.595982313156128} -11/07/2021 01:45:06 - INFO - __main__ - Step 31922: {'lr': 0.0004512482895936111, 'samples': 6129024, 'steps': 31921, 'loss/train': 1.3344855308532715} -11/07/2021 01:45:06 - INFO - __main__ - Step 31923: {'lr': 0.00045124514114126493, 'samples': 6129216, 'steps': 31922, 'loss/train': 1.5508592128753662} -11/07/2021 01:45:07 - INFO - __main__ - Step 31924: {'lr': 0.0004512419925982408, 'samples': 6129408, 'steps': 31923, 'loss/train': 1.8285584449768066} -11/07/2021 01:45:07 - INFO - __main__ - Step 31925: {'lr': 0.0004512388439645402, 'samples': 6129600, 'steps': 31924, 'loss/train': 1.5829516649246216} -11/07/2021 01:45:08 - INFO - __main__ - Step 31926: {'lr': 0.00045123569524016446, 'samples': 6129792, 'steps': 31925, 'loss/train': 1.6425074338912964} -11/07/2021 01:45:09 - INFO - __main__ - Step 31927: {'lr': 0.00045123254642511504, 'samples': 6129984, 'steps': 31926, 'loss/train': 1.4603376388549805} -11/07/2021 01:45:09 - INFO - __main__ - Step 31928: {'lr': 0.0004512293975193933, 'samples': 6130176, 'steps': 31927, 'loss/train': 1.7124818563461304} -11/07/2021 01:45:09 - INFO - __main__ - Step 31929: {'lr': 0.0004512262485230007, 'samples': 6130368, 'steps': 31928, 'loss/train': 1.0703651905059814} -11/07/2021 01:45:10 - INFO - __main__ - Step 31930: {'lr': 0.00045122309943593865, 'samples': 6130560, 'steps': 31929, 'loss/train': 1.5126354694366455} -11/07/2021 01:45:11 - INFO - __main__ - Step 31931: {'lr': 0.0004512199502582086, 'samples': 6130752, 'steps': 31930, 'loss/train': 1.3348126411437988} -11/07/2021 01:45:11 - INFO - __main__ - Step 31932: {'lr': 0.00045121680098981186, 'samples': 6130944, 'steps': 31931, 'loss/train': 1.4302009344100952} -11/07/2021 01:45:11 - INFO - __main__ - Step 31933: {'lr': 0.00045121365163075007, 'samples': 6131136, 'steps': 31932, 'loss/train': 1.6032031774520874} -11/07/2021 01:45:12 - INFO - __main__ - Step 31934: {'lr': 0.0004512105021810244, 'samples': 6131328, 'steps': 31933, 'loss/train': 1.6673365831375122} -11/07/2021 01:45:12 - INFO - __main__ - Step 31935: {'lr': 0.0004512073526406365, 'samples': 6131520, 'steps': 31934, 'loss/train': 1.3719717264175415} -11/07/2021 01:45:12 - INFO - __main__ - Step 31936: {'lr': 0.0004512042030095876, 'samples': 6131712, 'steps': 31935, 'loss/train': 1.7193927764892578} -11/07/2021 01:45:13 - INFO - __main__ - Step 31937: {'lr': 0.0004512010532878792, 'samples': 6131904, 'steps': 31936, 'loss/train': 1.2810825109481812} -11/07/2021 01:45:14 - INFO - __main__ - Step 31938: {'lr': 0.0004511979034755127, 'samples': 6132096, 'steps': 31937, 'loss/train': 1.3766365051269531} -11/07/2021 01:45:14 - INFO - __main__ - Step 31939: {'lr': 0.0004511947535724895, 'samples': 6132288, 'steps': 31938, 'loss/train': 1.246138334274292} -11/07/2021 01:45:15 - INFO - __main__ - Step 31940: {'lr': 0.00045119160357881105, 'samples': 6132480, 'steps': 31939, 'loss/train': 1.8165699243545532} -11/07/2021 01:45:15 - INFO - __main__ - Step 31941: {'lr': 0.0004511884534944789, 'samples': 6132672, 'steps': 31940, 'loss/train': 1.4489672183990479} -11/07/2021 01:45:16 - INFO - __main__ - Step 31942: {'lr': 0.0004511853033194942, 'samples': 6132864, 'steps': 31941, 'loss/train': 0.7833683490753174} -11/07/2021 01:45:16 - INFO - __main__ - Step 31943: {'lr': 0.00045118215305385855, 'samples': 6133056, 'steps': 31942, 'loss/train': 1.383625864982605} -11/07/2021 01:45:16 - INFO - __main__ - Step 31944: {'lr': 0.0004511790026975733, 'samples': 6133248, 'steps': 31943, 'loss/train': 1.392366886138916} -11/07/2021 01:45:17 - INFO - __main__ - Step 31945: {'lr': 0.00045117585225063996, 'samples': 6133440, 'steps': 31944, 'loss/train': 1.6650818586349487} -11/07/2021 01:45:17 - INFO - __main__ - Step 31946: {'lr': 0.0004511727017130598, 'samples': 6133632, 'steps': 31945, 'loss/train': 1.8258341550827026} -11/07/2021 01:45:18 - INFO - __main__ - Step 31947: {'lr': 0.00045116955108483436, 'samples': 6133824, 'steps': 31946, 'loss/train': 1.6164908409118652} -11/07/2021 01:45:19 - INFO - __main__ - Step 31948: {'lr': 0.00045116640036596507, 'samples': 6134016, 'steps': 31947, 'loss/train': 1.5087451934814453} -11/07/2021 01:45:19 - INFO - __main__ - Step 31949: {'lr': 0.0004511632495564533, 'samples': 6134208, 'steps': 31948, 'loss/train': 1.5558593273162842} -11/07/2021 01:45:19 - INFO - __main__ - Step 31950: {'lr': 0.00045116009865630034, 'samples': 6134400, 'steps': 31949, 'loss/train': 1.8072712421417236} -11/07/2021 01:45:20 - INFO - __main__ - Step 31951: {'lr': 0.0004511569476655079, 'samples': 6134592, 'steps': 31950, 'loss/train': 1.579148530960083} -11/07/2021 01:45:21 - INFO - __main__ - Step 31952: {'lr': 0.00045115379658407717, 'samples': 6134784, 'steps': 31951, 'loss/train': 0.6126420497894287} -11/07/2021 01:45:21 - INFO - __main__ - Step 31953: {'lr': 0.0004511506454120097, 'samples': 6134976, 'steps': 31952, 'loss/train': 1.2280786037445068} -11/07/2021 01:45:21 - INFO - __main__ - Step 31954: {'lr': 0.00045114749414930676, 'samples': 6135168, 'steps': 31953, 'loss/train': 1.9271167516708374} -11/07/2021 01:45:22 - INFO - __main__ - Step 31955: {'lr': 0.00045114434279596994, 'samples': 6135360, 'steps': 31954, 'loss/train': 1.5438740253448486} -11/07/2021 01:45:22 - INFO - __main__ - Step 31956: {'lr': 0.0004511411913520006, 'samples': 6135552, 'steps': 31955, 'loss/train': 1.3665361404418945} -11/07/2021 01:45:23 - INFO - __main__ - Step 31957: {'lr': 0.0004511380398174001, 'samples': 6135744, 'steps': 31956, 'loss/train': 1.552093505859375} -11/07/2021 01:45:24 - INFO - __main__ - Step 31958: {'lr': 0.00045113488819216983, 'samples': 6135936, 'steps': 31957, 'loss/train': 1.0456637144088745} -11/07/2021 01:45:24 - INFO - __main__ - Step 31959: {'lr': 0.00045113173647631143, 'samples': 6136128, 'steps': 31958, 'loss/train': 0.6969603896141052} -11/07/2021 01:45:24 - INFO - __main__ - Step 31960: {'lr': 0.0004511285846698261, 'samples': 6136320, 'steps': 31959, 'loss/train': 1.286709189414978} -11/07/2021 01:45:25 - INFO - __main__ - Step 31961: {'lr': 0.0004511254327727153, 'samples': 6136512, 'steps': 31960, 'loss/train': 1.1964833736419678} -11/07/2021 01:45:25 - INFO - __main__ - Step 31962: {'lr': 0.00045112228078498053, 'samples': 6136704, 'steps': 31961, 'loss/train': 1.115088701248169} -11/07/2021 01:45:26 - INFO - __main__ - Step 31963: {'lr': 0.0004511191287066232, 'samples': 6136896, 'steps': 31962, 'loss/train': 1.9909965991973877} -11/07/2021 01:45:27 - INFO - __main__ - Step 31964: {'lr': 0.00045111597653764456, 'samples': 6137088, 'steps': 31963, 'loss/train': 1.7869207859039307} -11/07/2021 01:45:27 - INFO - __main__ - Step 31965: {'lr': 0.00045111282427804636, 'samples': 6137280, 'steps': 31964, 'loss/train': 3.042821168899536} -11/07/2021 01:45:27 - INFO - __main__ - Step 31966: {'lr': 0.0004511096719278297, 'samples': 6137472, 'steps': 31965, 'loss/train': 1.2482612133026123} -11/07/2021 01:45:28 - INFO - __main__ - Step 31967: {'lr': 0.0004511065194869961, 'samples': 6137664, 'steps': 31966, 'loss/train': 1.316340446472168} -11/07/2021 01:45:29 - INFO - __main__ - Step 31968: {'lr': 0.00045110336695554707, 'samples': 6137856, 'steps': 31967, 'loss/train': 1.5354576110839844} -11/07/2021 01:45:29 - INFO - __main__ - Step 31969: {'lr': 0.0004511002143334839, 'samples': 6138048, 'steps': 31968, 'loss/train': 5.773683071136475} -11/07/2021 01:45:29 - INFO - __main__ - Step 31970: {'lr': 0.0004510970616208081, 'samples': 6138240, 'steps': 31969, 'loss/train': 1.477264642715454} -11/07/2021 01:45:30 - INFO - __main__ - Step 31971: {'lr': 0.0004510939088175211, 'samples': 6138432, 'steps': 31970, 'loss/train': 1.5126852989196777} -11/07/2021 01:45:30 - INFO - __main__ - Step 31972: {'lr': 0.00045109075592362433, 'samples': 6138624, 'steps': 31971, 'loss/train': 1.9196875095367432} -11/07/2021 01:45:31 - INFO - __main__ - Step 31973: {'lr': 0.0004510876029391191, 'samples': 6138816, 'steps': 31972, 'loss/train': 1.5249228477478027} -11/07/2021 01:45:32 - INFO - __main__ - Step 31974: {'lr': 0.00045108444986400687, 'samples': 6139008, 'steps': 31973, 'loss/train': 1.2626824378967285} -11/07/2021 01:45:32 - INFO - __main__ - Step 31975: {'lr': 0.0004510812966982892, 'samples': 6139200, 'steps': 31974, 'loss/train': 1.2591478824615479} -11/07/2021 01:45:32 - INFO - __main__ - Step 31976: {'lr': 0.0004510781434419673, 'samples': 6139392, 'steps': 31975, 'loss/train': 2.4961934089660645} -11/07/2021 01:45:33 - INFO - __main__ - Step 31977: {'lr': 0.0004510749900950427, 'samples': 6139584, 'steps': 31976, 'loss/train': 1.5184125900268555} -11/07/2021 01:45:33 - INFO - __main__ - Step 31978: {'lr': 0.00045107183665751686, 'samples': 6139776, 'steps': 31977, 'loss/train': 1.482326865196228} -11/07/2021 01:45:34 - INFO - __main__ - Step 31979: {'lr': 0.00045106868312939116, 'samples': 6139968, 'steps': 31978, 'loss/train': 0.6979764103889465} -11/07/2021 01:45:34 - INFO - __main__ - Step 31980: {'lr': 0.0004510655295106669, 'samples': 6140160, 'steps': 31979, 'loss/train': 0.9233061671257019} -11/07/2021 01:45:35 - INFO - __main__ - Step 31981: {'lr': 0.00045106237580134573, 'samples': 6140352, 'steps': 31980, 'loss/train': 1.0737470388412476} -11/07/2021 01:45:35 - INFO - __main__ - Step 31982: {'lr': 0.000451059222001429, 'samples': 6140544, 'steps': 31981, 'loss/train': 1.8268646001815796} -11/07/2021 01:45:35 - INFO - __main__ - Step 31983: {'lr': 0.0004510560681109179, 'samples': 6140736, 'steps': 31982, 'loss/train': 1.8358553647994995} -11/07/2021 01:45:37 - INFO - __main__ - Step 31984: {'lr': 0.0004510529141298142, 'samples': 6140928, 'steps': 31983, 'loss/train': 1.2324832677841187} -11/07/2021 01:45:37 - INFO - __main__ - Step 31985: {'lr': 0.00045104976005811917, 'samples': 6141120, 'steps': 31984, 'loss/train': 1.5840585231781006} -11/07/2021 01:45:37 - INFO - __main__ - Step 31986: {'lr': 0.00045104660589583413, 'samples': 6141312, 'steps': 31985, 'loss/train': 1.898639440536499} -11/07/2021 01:45:38 - INFO - __main__ - Step 31987: {'lr': 0.0004510434516429606, 'samples': 6141504, 'steps': 31986, 'loss/train': 3.6436564922332764} -11/07/2021 01:45:38 - INFO - __main__ - Step 31988: {'lr': 0.0004510402972995, 'samples': 6141696, 'steps': 31987, 'loss/train': 1.653199553489685} -11/07/2021 01:45:39 - INFO - __main__ - Step 31989: {'lr': 0.0004510371428654538, 'samples': 6141888, 'steps': 31988, 'loss/train': 1.620031476020813} -11/07/2021 01:45:39 - INFO - __main__ - Step 31990: {'lr': 0.00045103398834082334, 'samples': 6142080, 'steps': 31989, 'loss/train': 1.748823642730713} -11/07/2021 01:45:40 - INFO - __main__ - Step 31991: {'lr': 0.00045103083372561003, 'samples': 6142272, 'steps': 31990, 'loss/train': 1.3456593751907349} -11/07/2021 01:45:40 - INFO - __main__ - Step 31992: {'lr': 0.0004510276790198153, 'samples': 6142464, 'steps': 31991, 'loss/train': 1.7565659284591675} -11/07/2021 01:45:40 - INFO - __main__ - Step 31993: {'lr': 0.00045102452422344065, 'samples': 6142656, 'steps': 31992, 'loss/train': 1.65485680103302} -11/07/2021 01:45:41 - INFO - __main__ - Step 31994: {'lr': 0.0004510213693364875, 'samples': 6142848, 'steps': 31993, 'loss/train': 1.589545488357544} -11/07/2021 01:45:42 - INFO - __main__ - Step 31995: {'lr': 0.0004510182143589572, 'samples': 6143040, 'steps': 31994, 'loss/train': 1.8118722438812256} -11/07/2021 01:45:42 - INFO - __main__ - Step 31996: {'lr': 0.0004510150592908511, 'samples': 6143232, 'steps': 31995, 'loss/train': 0.27138158679008484} -11/07/2021 01:45:42 - INFO - __main__ - Step 31997: {'lr': 0.00045101190413217085, 'samples': 6143424, 'steps': 31996, 'loss/train': 1.6206790208816528} -11/07/2021 01:45:43 - INFO - __main__ - Step 31998: {'lr': 0.0004510087488829177, 'samples': 6143616, 'steps': 31997, 'loss/train': 1.502052664756775} -11/07/2021 01:45:44 - INFO - __main__ - Step 31999: {'lr': 0.000451005593543093, 'samples': 6143808, 'steps': 31998, 'loss/train': 1.7499158382415771} -11/07/2021 01:45:44 - INFO - __main__ - Step 32000: {'lr': 0.00045100243811269834, 'samples': 6144000, 'steps': 31999, 'loss/train': 1.2587133646011353} -11/07/2021 01:45:45 - INFO - __main__ - Step 32001: {'lr': 0.00045099928259173516, 'samples': 6144192, 'steps': 32000, 'loss/train': 1.6135326623916626} -11/07/2021 01:45:45 - INFO - __main__ - Step 32002: {'lr': 0.0004509961269802048, 'samples': 6144384, 'steps': 32001, 'loss/train': 1.5403943061828613} -11/07/2021 01:45:45 - INFO - __main__ - Step 32003: {'lr': 0.00045099297127810855, 'samples': 6144576, 'steps': 32002, 'loss/train': 0.7216783165931702} -11/07/2021 01:45:46 - INFO - __main__ - Step 32004: {'lr': 0.0004509898154854481, 'samples': 6144768, 'steps': 32003, 'loss/train': 1.133880615234375} -11/07/2021 01:45:47 - INFO - __main__ - Step 32005: {'lr': 0.00045098665960222474, 'samples': 6144960, 'steps': 32004, 'loss/train': 1.5767760276794434} -11/07/2021 01:45:47 - INFO - __main__ - Step 32006: {'lr': 0.00045098350362843975, 'samples': 6145152, 'steps': 32005, 'loss/train': 1.8912142515182495} -11/07/2021 01:45:47 - INFO - __main__ - Step 32007: {'lr': 0.0004509803475640948, 'samples': 6145344, 'steps': 32006, 'loss/train': 1.3936712741851807} -11/07/2021 01:45:48 - INFO - __main__ - Step 32008: {'lr': 0.00045097719140919126, 'samples': 6145536, 'steps': 32007, 'loss/train': 1.929354190826416} -11/07/2021 01:45:48 - INFO - __main__ - Step 32009: {'lr': 0.0004509740351637304, 'samples': 6145728, 'steps': 32008, 'loss/train': 0.8071759939193726} -11/07/2021 01:45:49 - INFO - __main__ - Step 32010: {'lr': 0.0004509708788277138, 'samples': 6145920, 'steps': 32009, 'loss/train': 1.3026527166366577} -11/07/2021 01:45:50 - INFO - __main__ - Step 32011: {'lr': 0.0004509677224011428, 'samples': 6146112, 'steps': 32010, 'loss/train': 1.4915457963943481} -11/07/2021 01:45:50 - INFO - __main__ - Step 32012: {'lr': 0.00045096456588401883, 'samples': 6146304, 'steps': 32011, 'loss/train': 1.9986481666564941} -11/07/2021 01:45:50 - INFO - __main__ - Step 32013: {'lr': 0.0004509614092763434, 'samples': 6146496, 'steps': 32012, 'loss/train': 1.2444761991500854} -11/07/2021 01:45:51 - INFO - __main__ - Step 32014: {'lr': 0.00045095825257811776, 'samples': 6146688, 'steps': 32013, 'loss/train': 1.3719403743743896} -11/07/2021 01:45:52 - INFO - __main__ - Step 32015: {'lr': 0.00045095509578934353, 'samples': 6146880, 'steps': 32014, 'loss/train': 1.5320340394973755} -11/07/2021 01:45:52 - INFO - __main__ - Step 32016: {'lr': 0.00045095193891002194, 'samples': 6147072, 'steps': 32015, 'loss/train': 1.5162948369979858} -11/07/2021 01:45:53 - INFO - __main__ - Step 32017: {'lr': 0.00045094878194015456, 'samples': 6147264, 'steps': 32016, 'loss/train': 1.094167947769165} -11/07/2021 01:45:53 - INFO - __main__ - Step 32018: {'lr': 0.0004509456248797428, 'samples': 6147456, 'steps': 32017, 'loss/train': 2.1765406131744385} -11/07/2021 01:45:53 - INFO - __main__ - Step 32019: {'lr': 0.000450942467728788, 'samples': 6147648, 'steps': 32018, 'loss/train': 1.4130141735076904} -11/07/2021 01:45:54 - INFO - __main__ - Step 32020: {'lr': 0.00045093931048729156, 'samples': 6147840, 'steps': 32019, 'loss/train': 1.719070315361023} -11/07/2021 01:45:55 - INFO - __main__ - Step 32021: {'lr': 0.00045093615315525506, 'samples': 6148032, 'steps': 32020, 'loss/train': 1.7311382293701172} -11/07/2021 01:45:55 - INFO - __main__ - Step 32022: {'lr': 0.00045093299573267977, 'samples': 6148224, 'steps': 32021, 'loss/train': 1.6059623956680298} -11/07/2021 01:45:55 - INFO - __main__ - Step 32023: {'lr': 0.00045092983821956725, 'samples': 6148416, 'steps': 32022, 'loss/train': 1.6733207702636719} -11/07/2021 01:45:56 - INFO - __main__ - Step 32024: {'lr': 0.00045092668061591875, 'samples': 6148608, 'steps': 32023, 'loss/train': 1.3829171657562256} -11/07/2021 01:45:56 - INFO - __main__ - Step 32025: {'lr': 0.00045092352292173585, 'samples': 6148800, 'steps': 32024, 'loss/train': 0.8372914791107178} -11/07/2021 01:45:57 - INFO - __main__ - Step 32026: {'lr': 0.00045092036513701985, 'samples': 6148992, 'steps': 32025, 'loss/train': 1.7354086637496948} -11/07/2021 01:45:57 - INFO - __main__ - Step 32027: {'lr': 0.0004509172072617723, 'samples': 6149184, 'steps': 32026, 'loss/train': 2.015341281890869} -11/07/2021 01:45:58 - INFO - __main__ - Step 32028: {'lr': 0.00045091404929599455, 'samples': 6149376, 'steps': 32027, 'loss/train': 1.555013656616211} -11/07/2021 01:45:58 - INFO - __main__ - Step 32029: {'lr': 0.00045091089123968796, 'samples': 6149568, 'steps': 32028, 'loss/train': 1.7335764169692993} -11/07/2021 01:45:59 - INFO - __main__ - Step 32030: {'lr': 0.0004509077330928541, 'samples': 6149760, 'steps': 32029, 'loss/train': 1.2832915782928467} -11/07/2021 01:45:59 - INFO - __main__ - Step 32031: {'lr': 0.0004509045748554943, 'samples': 6149952, 'steps': 32030, 'loss/train': 1.601660132408142} -11/07/2021 01:46:00 - INFO - __main__ - Step 32032: {'lr': 0.00045090141652760995, 'samples': 6150144, 'steps': 32031, 'loss/train': 1.7143197059631348} -11/07/2021 01:46:00 - INFO - __main__ - Step 32033: {'lr': 0.0004508982581092026, 'samples': 6150336, 'steps': 32032, 'loss/train': 0.9741845726966858} -11/07/2021 01:46:01 - INFO - __main__ - Step 32034: {'lr': 0.00045089509960027354, 'samples': 6150528, 'steps': 32033, 'loss/train': 1.5302150249481201} -11/07/2021 01:46:01 - INFO - __main__ - Step 32035: {'lr': 0.00045089194100082433, 'samples': 6150720, 'steps': 32034, 'loss/train': 1.5801377296447754} -11/07/2021 01:46:02 - INFO - __main__ - Step 32036: {'lr': 0.00045088878231085616, 'samples': 6150912, 'steps': 32035, 'loss/train': 1.6848492622375488} -11/07/2021 01:46:02 - INFO - __main__ - Step 32037: {'lr': 0.00045088562353037077, 'samples': 6151104, 'steps': 32036, 'loss/train': 1.8636360168457031} -11/07/2021 01:46:02 - INFO - __main__ - Step 32038: {'lr': 0.00045088246465936936, 'samples': 6151296, 'steps': 32037, 'loss/train': 1.515488862991333} -11/07/2021 01:46:03 - INFO - __main__ - Step 32039: {'lr': 0.0004508793056978534, 'samples': 6151488, 'steps': 32038, 'loss/train': 1.8291229009628296} -11/07/2021 01:46:03 - INFO - __main__ - Step 32040: {'lr': 0.00045087614664582424, 'samples': 6151680, 'steps': 32039, 'loss/train': 1.4584295749664307} -11/07/2021 01:46:04 - INFO - __main__ - Step 32041: {'lr': 0.0004508729875032834, 'samples': 6151872, 'steps': 32040, 'loss/train': 1.70821213722229} -11/07/2021 01:46:05 - INFO - __main__ - Step 32042: {'lr': 0.0004508698282702324, 'samples': 6152064, 'steps': 32041, 'loss/train': 1.9895410537719727} -11/07/2021 01:46:05 - INFO - __main__ - Step 32043: {'lr': 0.0004508666689466725, 'samples': 6152256, 'steps': 32042, 'loss/train': 1.8032820224761963} -11/07/2021 01:46:05 - INFO - __main__ - Step 32044: {'lr': 0.00045086350953260526, 'samples': 6152448, 'steps': 32043, 'loss/train': 1.8391896486282349} -11/07/2021 01:46:06 - INFO - __main__ - Step 32045: {'lr': 0.0004508603500280319, 'samples': 6152640, 'steps': 32044, 'loss/train': 1.5459450483322144} -11/07/2021 01:46:07 - INFO - __main__ - Step 32046: {'lr': 0.00045085719043295406, 'samples': 6152832, 'steps': 32045, 'loss/train': 1.458228349685669} -11/07/2021 01:46:07 - INFO - __main__ - Step 32047: {'lr': 0.00045085403074737295, 'samples': 6153024, 'steps': 32046, 'loss/train': 1.8259520530700684} -11/07/2021 01:46:07 - INFO - __main__ - Step 32048: {'lr': 0.0004508508709712902, 'samples': 6153216, 'steps': 32047, 'loss/train': 1.78195321559906} -11/07/2021 01:46:08 - INFO - __main__ - Step 32049: {'lr': 0.00045084771110470717, 'samples': 6153408, 'steps': 32048, 'loss/train': 1.6490238904953003} -11/07/2021 01:46:08 - INFO - __main__ - Step 32050: {'lr': 0.00045084455114762525, 'samples': 6153600, 'steps': 32049, 'loss/train': 1.6333950757980347} -11/07/2021 01:46:09 - INFO - __main__ - Step 32051: {'lr': 0.00045084139110004585, 'samples': 6153792, 'steps': 32050, 'loss/train': 1.9807506799697876} -11/07/2021 01:46:10 - INFO - __main__ - Step 32052: {'lr': 0.0004508382309619704, 'samples': 6153984, 'steps': 32051, 'loss/train': 1.0197628736495972} -11/07/2021 01:46:10 - INFO - __main__ - Step 32053: {'lr': 0.0004508350707334004, 'samples': 6154176, 'steps': 32052, 'loss/train': 1.282412052154541} -11/07/2021 01:46:10 - INFO - __main__ - Step 32054: {'lr': 0.00045083191041433713, 'samples': 6154368, 'steps': 32053, 'loss/train': 0.9735081791877747} -11/07/2021 01:46:11 - INFO - __main__ - Step 32055: {'lr': 0.00045082875000478214, 'samples': 6154560, 'steps': 32054, 'loss/train': 1.6473565101623535} -11/07/2021 01:46:12 - INFO - __main__ - Step 32056: {'lr': 0.0004508255895047368, 'samples': 6154752, 'steps': 32055, 'loss/train': 1.4841833114624023} -11/07/2021 01:46:12 - INFO - __main__ - Step 32057: {'lr': 0.0004508224289142026, 'samples': 6154944, 'steps': 32056, 'loss/train': 1.6833237409591675} -11/07/2021 01:46:12 - INFO - __main__ - Step 32058: {'lr': 0.0004508192682331809, 'samples': 6155136, 'steps': 32057, 'loss/train': 1.6849783658981323} -11/07/2021 01:46:13 - INFO - __main__ - Step 32059: {'lr': 0.0004508161074616731, 'samples': 6155328, 'steps': 32058, 'loss/train': 1.8919442892074585} -11/07/2021 01:46:13 - INFO - __main__ - Step 32060: {'lr': 0.0004508129465996806, 'samples': 6155520, 'steps': 32059, 'loss/train': 1.4205477237701416} -11/07/2021 01:46:14 - INFO - __main__ - Step 32061: {'lr': 0.00045080978564720505, 'samples': 6155712, 'steps': 32060, 'loss/train': 1.436179757118225} -11/07/2021 01:46:15 - INFO - __main__ - Step 32062: {'lr': 0.0004508066246042476, 'samples': 6155904, 'steps': 32061, 'loss/train': 1.7141095399856567} -11/07/2021 01:46:15 - INFO - __main__ - Step 32063: {'lr': 0.0004508034634708098, 'samples': 6156096, 'steps': 32062, 'loss/train': 1.0422805547714233} -11/07/2021 01:46:15 - INFO - __main__ - Step 32064: {'lr': 0.0004508003022468931, 'samples': 6156288, 'steps': 32063, 'loss/train': 1.554802417755127} -11/07/2021 01:46:16 - INFO - __main__ - Step 32065: {'lr': 0.00045079714093249887, 'samples': 6156480, 'steps': 32064, 'loss/train': 1.9286205768585205} -11/07/2021 01:46:16 - INFO - __main__ - Step 32066: {'lr': 0.00045079397952762845, 'samples': 6156672, 'steps': 32065, 'loss/train': 1.645257830619812} -11/07/2021 01:46:17 - INFO - __main__ - Step 32067: {'lr': 0.0004507908180322835, 'samples': 6156864, 'steps': 32066, 'loss/train': 1.5263566970825195} -11/07/2021 01:46:17 - INFO - __main__ - Step 32068: {'lr': 0.00045078765644646524, 'samples': 6157056, 'steps': 32067, 'loss/train': 1.6802290678024292} -11/07/2021 01:46:18 - INFO - __main__ - Step 32069: {'lr': 0.00045078449477017516, 'samples': 6157248, 'steps': 32068, 'loss/train': 0.8311300277709961} -11/07/2021 01:46:18 - INFO - __main__ - Step 32070: {'lr': 0.0004507813330034147, 'samples': 6157440, 'steps': 32069, 'loss/train': 1.153349757194519} -11/07/2021 01:46:19 - INFO - __main__ - Step 32071: {'lr': 0.00045077817114618526, 'samples': 6157632, 'steps': 32070, 'loss/train': 1.3929682970046997} -11/07/2021 01:46:19 - INFO - __main__ - Step 32072: {'lr': 0.00045077500919848826, 'samples': 6157824, 'steps': 32071, 'loss/train': 1.6842589378356934} -11/07/2021 01:46:20 - INFO - __main__ - Step 32073: {'lr': 0.00045077184716032516, 'samples': 6158016, 'steps': 32072, 'loss/train': 1.767591118812561} -11/07/2021 01:46:20 - INFO - __main__ - Step 32074: {'lr': 0.0004507686850316973, 'samples': 6158208, 'steps': 32073, 'loss/train': 1.6692560911178589} -11/07/2021 01:46:21 - INFO - __main__ - Step 32075: {'lr': 0.00045076552281260625, 'samples': 6158400, 'steps': 32074, 'loss/train': 1.4434971809387207} -11/07/2021 01:46:21 - INFO - __main__ - Step 32076: {'lr': 0.0004507623605030533, 'samples': 6158592, 'steps': 32075, 'loss/train': 1.3661025762557983} -11/07/2021 01:46:22 - INFO - __main__ - Step 32077: {'lr': 0.00045075919810304, 'samples': 6158784, 'steps': 32076, 'loss/train': 1.3306758403778076} -11/07/2021 01:46:22 - INFO - __main__ - Step 32078: {'lr': 0.0004507560356125676, 'samples': 6158976, 'steps': 32077, 'loss/train': 1.8561049699783325} -11/07/2021 01:46:23 - INFO - __main__ - Step 32079: {'lr': 0.0004507528730316377, 'samples': 6159168, 'steps': 32078, 'loss/train': 1.629477858543396} -11/07/2021 01:46:23 - INFO - __main__ - Step 32080: {'lr': 0.0004507497103602517, 'samples': 6159360, 'steps': 32079, 'loss/train': 1.2134417295455933} -11/07/2021 01:46:23 - INFO - __main__ - Step 32081: {'lr': 0.00045074654759841087, 'samples': 6159552, 'steps': 32080, 'loss/train': 1.6609727144241333} -11/07/2021 01:46:24 - INFO - __main__ - Step 32082: {'lr': 0.00045074338474611683, 'samples': 6159744, 'steps': 32081, 'loss/train': 5.802849769592285} -11/07/2021 01:46:25 - INFO - __main__ - Step 32083: {'lr': 0.00045074022180337085, 'samples': 6159936, 'steps': 32082, 'loss/train': 1.6034067869186401} -11/07/2021 01:46:25 - INFO - __main__ - Step 32084: {'lr': 0.0004507370587701745, 'samples': 6160128, 'steps': 32083, 'loss/train': 1.6937822103500366} -11/07/2021 01:46:25 - INFO - __main__ - Step 32085: {'lr': 0.000450733895646529, 'samples': 6160320, 'steps': 32084, 'loss/train': 1.17350172996521} -11/07/2021 01:46:26 - INFO - __main__ - Step 32086: {'lr': 0.00045073073243243603, 'samples': 6160512, 'steps': 32085, 'loss/train': 1.0529669523239136} -11/07/2021 01:46:26 - INFO - __main__ - Step 32087: {'lr': 0.0004507275691278968, 'samples': 6160704, 'steps': 32086, 'loss/train': 1.3048980236053467} -11/07/2021 01:46:27 - INFO - __main__ - Step 32088: {'lr': 0.00045072440573291293, 'samples': 6160896, 'steps': 32087, 'loss/train': 1.3754926919937134} -11/07/2021 01:46:28 - INFO - __main__ - Step 32089: {'lr': 0.0004507212422474857, 'samples': 6161088, 'steps': 32088, 'loss/train': 1.2092654705047607} -11/07/2021 01:46:28 - INFO - __main__ - Step 32090: {'lr': 0.0004507180786716165, 'samples': 6161280, 'steps': 32089, 'loss/train': 1.558481216430664} -11/07/2021 01:46:28 - INFO - __main__ - Step 32091: {'lr': 0.00045071491500530694, 'samples': 6161472, 'steps': 32090, 'loss/train': 0.4279614984989166} -11/07/2021 01:46:29 - INFO - __main__ - Step 32092: {'lr': 0.0004507117512485582, 'samples': 6161664, 'steps': 32091, 'loss/train': 0.9977620244026184} -11/07/2021 01:46:30 - INFO - __main__ - Step 32093: {'lr': 0.000450708587401372, 'samples': 6161856, 'steps': 32092, 'loss/train': 1.0190815925598145} -11/07/2021 01:46:30 - INFO - __main__ - Step 32094: {'lr': 0.0004507054234637495, 'samples': 6162048, 'steps': 32093, 'loss/train': 1.9626078605651855} -11/07/2021 01:46:31 - INFO - __main__ - Step 32095: {'lr': 0.0004507022594356922, 'samples': 6162240, 'steps': 32094, 'loss/train': 1.7547073364257812} -11/07/2021 01:46:31 - INFO - __main__ - Step 32096: {'lr': 0.00045069909531720166, 'samples': 6162432, 'steps': 32095, 'loss/train': 1.469717025756836} -11/07/2021 01:46:31 - INFO - __main__ - Step 32097: {'lr': 0.0004506959311082792, 'samples': 6162624, 'steps': 32096, 'loss/train': 0.25666314363479614} -11/07/2021 01:46:33 - INFO - __main__ - Step 32098: {'lr': 0.00045069276680892624, 'samples': 6162816, 'steps': 32097, 'loss/train': 1.6708344221115112} -11/07/2021 01:46:33 - INFO - __main__ - Step 32099: {'lr': 0.00045068960241914413, 'samples': 6163008, 'steps': 32098, 'loss/train': 1.4840983152389526} -11/07/2021 01:46:33 - INFO - __main__ - Step 32100: {'lr': 0.00045068643793893447, 'samples': 6163200, 'steps': 32099, 'loss/train': 1.1935482025146484} -11/07/2021 01:46:34 - INFO - __main__ - Step 32101: {'lr': 0.0004506832733682986, 'samples': 6163392, 'steps': 32100, 'loss/train': 1.4337197542190552} -11/07/2021 01:46:34 - INFO - __main__ - Step 32102: {'lr': 0.00045068010870723783, 'samples': 6163584, 'steps': 32101, 'loss/train': 1.115096092224121} -11/07/2021 01:46:34 - INFO - __main__ - Step 32103: {'lr': 0.00045067694395575385, 'samples': 6163776, 'steps': 32102, 'loss/train': 1.8311907052993774} -11/07/2021 01:46:35 - INFO - __main__ - Step 32104: {'lr': 0.0004506737791138479, 'samples': 6163968, 'steps': 32103, 'loss/train': 1.3427801132202148} -11/07/2021 01:46:36 - INFO - __main__ - Step 32105: {'lr': 0.00045067061418152136, 'samples': 6164160, 'steps': 32104, 'loss/train': 1.3438457250595093} -11/07/2021 01:46:36 - INFO - __main__ - Step 32106: {'lr': 0.00045066744915877585, 'samples': 6164352, 'steps': 32105, 'loss/train': 1.156517744064331} -11/07/2021 01:46:36 - INFO - __main__ - Step 32107: {'lr': 0.0004506642840456126, 'samples': 6164544, 'steps': 32106, 'loss/train': 1.7105660438537598} -11/07/2021 01:46:37 - INFO - __main__ - Step 32108: {'lr': 0.00045066111884203315, 'samples': 6164736, 'steps': 32107, 'loss/train': 1.4578814506530762} -11/07/2021 01:46:38 - INFO - __main__ - Step 32109: {'lr': 0.0004506579535480389, 'samples': 6164928, 'steps': 32108, 'loss/train': 1.5972881317138672} -11/07/2021 01:46:38 - INFO - __main__ - Step 32110: {'lr': 0.00045065478816363124, 'samples': 6165120, 'steps': 32109, 'loss/train': 2.4207537174224854} -11/07/2021 01:46:38 - INFO - __main__ - Step 32111: {'lr': 0.00045065162268881164, 'samples': 6165312, 'steps': 32110, 'loss/train': 1.431797981262207} -11/07/2021 01:46:39 - INFO - __main__ - Step 32112: {'lr': 0.0004506484571235816, 'samples': 6165504, 'steps': 32111, 'loss/train': 1.3394352197647095} -11/07/2021 01:46:39 - INFO - __main__ - Step 32113: {'lr': 0.00045064529146794234, 'samples': 6165696, 'steps': 32112, 'loss/train': 2.1921451091766357} -11/07/2021 01:46:40 - INFO - __main__ - Step 32114: {'lr': 0.0004506421257218955, 'samples': 6165888, 'steps': 32113, 'loss/train': 1.3960522413253784} -11/07/2021 01:46:40 - INFO - __main__ - Step 32115: {'lr': 0.00045063895988544235, 'samples': 6166080, 'steps': 32114, 'loss/train': 1.5505790710449219} -11/07/2021 01:46:41 - INFO - __main__ - Step 32116: {'lr': 0.00045063579395858444, 'samples': 6166272, 'steps': 32115, 'loss/train': 1.7635595798492432} -11/07/2021 01:46:41 - INFO - __main__ - Step 32117: {'lr': 0.0004506326279413231, 'samples': 6166464, 'steps': 32116, 'loss/train': 1.816580891609192} -11/07/2021 01:46:41 - INFO - __main__ - Step 32118: {'lr': 0.0004506294618336598, 'samples': 6166656, 'steps': 32117, 'loss/train': 1.704832911491394} -11/07/2021 01:46:43 - INFO - __main__ - Step 32119: {'lr': 0.00045062629563559595, 'samples': 6166848, 'steps': 32118, 'loss/train': 1.7365407943725586} -11/07/2021 01:46:43 - INFO - __main__ - Step 32120: {'lr': 0.00045062312934713303, 'samples': 6167040, 'steps': 32119, 'loss/train': 1.4368287324905396} -11/07/2021 01:46:43 - INFO - __main__ - Step 32121: {'lr': 0.00045061996296827237, 'samples': 6167232, 'steps': 32120, 'loss/train': 1.7316168546676636} -11/07/2021 01:46:44 - INFO - __main__ - Step 32122: {'lr': 0.00045061679649901543, 'samples': 6167424, 'steps': 32121, 'loss/train': 1.6725994348526} -11/07/2021 01:46:44 - INFO - __main__ - Step 32123: {'lr': 0.00045061362993936374, 'samples': 6167616, 'steps': 32122, 'loss/train': 1.4833842515945435} -11/07/2021 01:46:45 - INFO - __main__ - Step 32124: {'lr': 0.0004506104632893185, 'samples': 6167808, 'steps': 32123, 'loss/train': 1.17832612991333} -11/07/2021 01:46:45 - INFO - __main__ - Step 32125: {'lr': 0.00045060729654888143, 'samples': 6168000, 'steps': 32124, 'loss/train': 0.9483261108398438} -11/07/2021 01:46:46 - INFO - __main__ - Step 32126: {'lr': 0.00045060412971805375, 'samples': 6168192, 'steps': 32125, 'loss/train': 1.0364069938659668} -11/07/2021 01:46:46 - INFO - __main__ - Step 32127: {'lr': 0.00045060096279683694, 'samples': 6168384, 'steps': 32126, 'loss/train': 1.4542152881622314} -11/07/2021 01:46:46 - INFO - __main__ - Step 32128: {'lr': 0.0004505977957852325, 'samples': 6168576, 'steps': 32127, 'loss/train': 1.5777549743652344} -11/07/2021 01:46:47 - INFO - __main__ - Step 32129: {'lr': 0.00045059462868324177, 'samples': 6168768, 'steps': 32128, 'loss/train': 1.4561687707901} -11/07/2021 01:46:48 - INFO - __main__ - Step 32130: {'lr': 0.00045059146149086605, 'samples': 6168960, 'steps': 32129, 'loss/train': 1.6465238332748413} -11/07/2021 01:46:48 - INFO - __main__ - Step 32131: {'lr': 0.00045058829420810707, 'samples': 6169152, 'steps': 32130, 'loss/train': 1.500243902206421} -11/07/2021 01:46:48 - INFO - __main__ - Step 32132: {'lr': 0.00045058512683496607, 'samples': 6169344, 'steps': 32131, 'loss/train': 1.505821943283081} -11/07/2021 01:46:49 - INFO - __main__ - Step 32133: {'lr': 0.00045058195937144446, 'samples': 6169536, 'steps': 32132, 'loss/train': 1.2399656772613525} -11/07/2021 01:46:50 - INFO - __main__ - Step 32134: {'lr': 0.00045057879181754375, 'samples': 6169728, 'steps': 32133, 'loss/train': 1.7505378723144531} -11/07/2021 01:46:50 - INFO - __main__ - Step 32135: {'lr': 0.0004505756241732653, 'samples': 6169920, 'steps': 32134, 'loss/train': 1.483353614807129} -11/07/2021 01:46:51 - INFO - __main__ - Step 32136: {'lr': 0.0004505724564386106, 'samples': 6170112, 'steps': 32135, 'loss/train': 1.8550945520401} -11/07/2021 01:46:51 - INFO - __main__ - Step 32137: {'lr': 0.00045056928861358106, 'samples': 6170304, 'steps': 32136, 'loss/train': 1.6168700456619263} -11/07/2021 01:46:51 - INFO - __main__ - Step 32138: {'lr': 0.000450566120698178, 'samples': 6170496, 'steps': 32137, 'loss/train': 1.487418293952942} -11/07/2021 01:46:52 - INFO - __main__ - Step 32139: {'lr': 0.0004505629526924031, 'samples': 6170688, 'steps': 32138, 'loss/train': 1.502426028251648} -11/07/2021 01:46:53 - INFO - __main__ - Step 32140: {'lr': 0.0004505597845962575, 'samples': 6170880, 'steps': 32139, 'loss/train': 1.7972909212112427} -11/07/2021 01:46:53 - INFO - __main__ - Step 32141: {'lr': 0.0004505566164097428, 'samples': 6171072, 'steps': 32140, 'loss/train': 2.0394623279571533} -11/07/2021 01:46:53 - INFO - __main__ - Step 32142: {'lr': 0.0004505534481328604, 'samples': 6171264, 'steps': 32141, 'loss/train': 1.7296563386917114} -11/07/2021 01:46:54 - INFO - __main__ - Step 32143: {'lr': 0.0004505502797656117, 'samples': 6171456, 'steps': 32142, 'loss/train': 1.802706003189087} -11/07/2021 01:46:55 - INFO - __main__ - Step 32144: {'lr': 0.00045054711130799806, 'samples': 6171648, 'steps': 32143, 'loss/train': 1.3463897705078125} -11/07/2021 01:46:55 - INFO - __main__ - Step 32145: {'lr': 0.00045054394276002106, 'samples': 6171840, 'steps': 32144, 'loss/train': 1.841357946395874} -11/07/2021 01:46:55 - INFO - __main__ - Step 32146: {'lr': 0.00045054077412168215, 'samples': 6172032, 'steps': 32145, 'loss/train': 1.4753705263137817} -11/07/2021 01:46:56 - INFO - __main__ - Step 32147: {'lr': 0.0004505376053929825, 'samples': 6172224, 'steps': 32146, 'loss/train': 1.3590627908706665} -11/07/2021 01:46:56 - INFO - __main__ - Step 32148: {'lr': 0.0004505344365739238, 'samples': 6172416, 'steps': 32147, 'loss/train': 1.6588155031204224} -11/07/2021 01:46:57 - INFO - __main__ - Step 32149: {'lr': 0.0004505312676645073, 'samples': 6172608, 'steps': 32148, 'loss/train': 1.8488324880599976} -11/07/2021 01:46:57 - INFO - __main__ - Step 32150: {'lr': 0.00045052809866473454, 'samples': 6172800, 'steps': 32149, 'loss/train': 2.2110037803649902} -11/07/2021 01:46:58 - INFO - __main__ - Step 32151: {'lr': 0.00045052492957460696, 'samples': 6172992, 'steps': 32150, 'loss/train': 1.240863561630249} -11/07/2021 01:46:58 - INFO - __main__ - Step 32152: {'lr': 0.00045052176039412587, 'samples': 6173184, 'steps': 32151, 'loss/train': 1.3574669361114502} -11/07/2021 01:46:58 - INFO - __main__ - Step 32153: {'lr': 0.0004505185911232928, 'samples': 6173376, 'steps': 32152, 'loss/train': 1.5875046253204346} -11/07/2021 01:47:00 - INFO - __main__ - Step 32154: {'lr': 0.00045051542176210914, 'samples': 6173568, 'steps': 32153, 'loss/train': 1.974134922027588} -11/07/2021 01:47:00 - INFO - __main__ - Step 32155: {'lr': 0.0004505122523105764, 'samples': 6173760, 'steps': 32154, 'loss/train': 1.2119091749191284} -11/07/2021 01:47:00 - INFO - __main__ - Step 32156: {'lr': 0.00045050908276869585, 'samples': 6173952, 'steps': 32155, 'loss/train': 2.0083765983581543} -11/07/2021 01:47:01 - INFO - __main__ - Step 32157: {'lr': 0.0004505059131364689, 'samples': 6174144, 'steps': 32156, 'loss/train': 1.6518559455871582} -11/07/2021 01:47:01 - INFO - __main__ - Step 32158: {'lr': 0.00045050274341389726, 'samples': 6174336, 'steps': 32157, 'loss/train': 1.3425853252410889} -11/07/2021 01:47:01 - INFO - __main__ - Step 32159: {'lr': 0.00045049957360098207, 'samples': 6174528, 'steps': 32158, 'loss/train': 5.946632385253906} -11/07/2021 01:47:02 - INFO - __main__ - Step 32160: {'lr': 0.0004504964036977249, 'samples': 6174720, 'steps': 32159, 'loss/train': 1.4935715198516846} -11/07/2021 01:47:03 - INFO - __main__ - Step 32161: {'lr': 0.00045049323370412723, 'samples': 6174912, 'steps': 32160, 'loss/train': 1.4618717432022095} -11/07/2021 01:47:03 - INFO - __main__ - Step 32162: {'lr': 0.0004504900636201903, 'samples': 6175104, 'steps': 32161, 'loss/train': 1.820804476737976} -11/07/2021 01:47:03 - INFO - __main__ - Step 32163: {'lr': 0.00045048689344591566, 'samples': 6175296, 'steps': 32162, 'loss/train': 1.4637774229049683} -11/07/2021 01:47:04 - INFO - __main__ - Step 32164: {'lr': 0.0004504837231813047, 'samples': 6175488, 'steps': 32163, 'loss/train': 1.688586711883545} -11/07/2021 01:47:05 - INFO - __main__ - Step 32165: {'lr': 0.0004504805528263589, 'samples': 6175680, 'steps': 32164, 'loss/train': 1.6876972913742065} -11/07/2021 01:47:05 - INFO - __main__ - Step 32166: {'lr': 0.00045047738238107967, 'samples': 6175872, 'steps': 32165, 'loss/train': 1.708917260169983} -11/07/2021 01:47:05 - INFO - __main__ - Step 32167: {'lr': 0.00045047421184546844, 'samples': 6176064, 'steps': 32166, 'loss/train': 1.567901611328125} -11/07/2021 01:47:06 - INFO - __main__ - Step 32168: {'lr': 0.0004504710412195265, 'samples': 6176256, 'steps': 32167, 'loss/train': 1.5221161842346191} -11/07/2021 01:47:06 - INFO - __main__ - Step 32169: {'lr': 0.00045046787050325555, 'samples': 6176448, 'steps': 32168, 'loss/train': 0.7906864285469055} -11/07/2021 01:47:07 - INFO - __main__ - Step 32170: {'lr': 0.0004504646996966568, 'samples': 6176640, 'steps': 32169, 'loss/train': 1.4437230825424194} -11/07/2021 01:47:07 - INFO - __main__ - Step 32171: {'lr': 0.0004504615287997318, 'samples': 6176832, 'steps': 32170, 'loss/train': 1.4785854816436768} -11/07/2021 01:47:08 - INFO - __main__ - Step 32172: {'lr': 0.00045045835781248184, 'samples': 6177024, 'steps': 32171, 'loss/train': 1.773765206336975} -11/07/2021 01:47:08 - INFO - __main__ - Step 32173: {'lr': 0.0004504551867349085, 'samples': 6177216, 'steps': 32172, 'loss/train': 1.5836315155029297} -11/07/2021 01:47:09 - INFO - __main__ - Step 32174: {'lr': 0.0004504520155670131, 'samples': 6177408, 'steps': 32173, 'loss/train': 1.4165898561477661} -11/07/2021 01:47:09 - INFO - __main__ - Step 32175: {'lr': 0.0004504488443087972, 'samples': 6177600, 'steps': 32174, 'loss/train': 1.5395853519439697} -11/07/2021 01:47:10 - INFO - __main__ - Step 32176: {'lr': 0.00045044567296026206, 'samples': 6177792, 'steps': 32175, 'loss/train': 1.4260025024414062} -11/07/2021 01:47:10 - INFO - __main__ - Step 32177: {'lr': 0.0004504425015214092, 'samples': 6177984, 'steps': 32176, 'loss/train': 1.4530431032180786} -11/07/2021 01:47:11 - INFO - __main__ - Step 32178: {'lr': 0.00045043932999224015, 'samples': 6178176, 'steps': 32177, 'loss/train': 1.5154881477355957} -11/07/2021 01:47:11 - INFO - __main__ - Step 32179: {'lr': 0.00045043615837275607, 'samples': 6178368, 'steps': 32178, 'loss/train': 1.7684738636016846} -11/07/2021 01:47:12 - INFO - __main__ - Step 32180: {'lr': 0.0004504329866629586, 'samples': 6178560, 'steps': 32179, 'loss/train': 1.756452202796936} -11/07/2021 01:47:13 - INFO - __main__ - Step 32181: {'lr': 0.0004504298148628492, 'samples': 6178752, 'steps': 32180, 'loss/train': 0.48151570558547974} -11/07/2021 01:47:13 - INFO - __main__ - Step 32182: {'lr': 0.0004504266429724292, 'samples': 6178944, 'steps': 32181, 'loss/train': 1.5893335342407227} -11/07/2021 01:47:13 - INFO - __main__ - Step 32183: {'lr': 0.0004504234709917, 'samples': 6179136, 'steps': 32182, 'loss/train': 1.4612712860107422} -11/07/2021 01:47:14 - INFO - __main__ - Step 32184: {'lr': 0.00045042029892066306, 'samples': 6179328, 'steps': 32183, 'loss/train': 1.3556455373764038} -11/07/2021 01:47:14 - INFO - __main__ - Step 32185: {'lr': 0.00045041712675931983, 'samples': 6179520, 'steps': 32184, 'loss/train': 1.6092675924301147} -11/07/2021 01:47:15 - INFO - __main__ - Step 32186: {'lr': 0.0004504139545076717, 'samples': 6179712, 'steps': 32185, 'loss/train': 1.374077320098877} -11/07/2021 01:47:15 - INFO - __main__ - Step 32187: {'lr': 0.0004504107821657203, 'samples': 6179904, 'steps': 32186, 'loss/train': 1.4730110168457031} -11/07/2021 01:47:16 - INFO - __main__ - Step 32188: {'lr': 0.00045040760973346673, 'samples': 6180096, 'steps': 32187, 'loss/train': 1.5549176931381226} -11/07/2021 01:47:16 - INFO - __main__ - Step 32189: {'lr': 0.00045040443721091266, 'samples': 6180288, 'steps': 32188, 'loss/train': 1.3511254787445068} -11/07/2021 01:47:16 - INFO - __main__ - Step 32190: {'lr': 0.0004504012645980594, 'samples': 6180480, 'steps': 32189, 'loss/train': 1.49689519405365} -11/07/2021 01:47:17 - INFO - __main__ - Step 32191: {'lr': 0.0004503980918949085, 'samples': 6180672, 'steps': 32190, 'loss/train': 1.4713667631149292} -11/07/2021 01:47:18 - INFO - __main__ - Step 32192: {'lr': 0.00045039491910146124, 'samples': 6180864, 'steps': 32191, 'loss/train': 1.3565356731414795} -11/07/2021 01:47:18 - INFO - __main__ - Step 32193: {'lr': 0.00045039174621771915, 'samples': 6181056, 'steps': 32192, 'loss/train': 2.052945852279663} -11/07/2021 01:47:18 - INFO - __main__ - Step 32194: {'lr': 0.00045038857324368367, 'samples': 6181248, 'steps': 32193, 'loss/train': 1.5134190320968628} -11/07/2021 01:47:19 - INFO - __main__ - Step 32195: {'lr': 0.0004503854001793561, 'samples': 6181440, 'steps': 32194, 'loss/train': 1.8116105794906616} -11/07/2021 01:47:20 - INFO - __main__ - Step 32196: {'lr': 0.00045038222702473797, 'samples': 6181632, 'steps': 32195, 'loss/train': 1.4274109601974487} -11/07/2021 01:47:20 - INFO - __main__ - Step 32197: {'lr': 0.0004503790537798308, 'samples': 6181824, 'steps': 32196, 'loss/train': 1.777016520500183} -11/07/2021 01:47:21 - INFO - __main__ - Step 32198: {'lr': 0.00045037588044463586, 'samples': 6182016, 'steps': 32197, 'loss/train': 1.5776311159133911} -11/07/2021 01:47:21 - INFO - __main__ - Step 32199: {'lr': 0.00045037270701915464, 'samples': 6182208, 'steps': 32198, 'loss/train': 1.589194655418396} -11/07/2021 01:47:21 - INFO - __main__ - Step 32200: {'lr': 0.0004503695335033885, 'samples': 6182400, 'steps': 32199, 'loss/train': 3.5294759273529053} -11/07/2021 01:47:22 - INFO - __main__ - Step 32201: {'lr': 0.00045036635989733904, 'samples': 6182592, 'steps': 32200, 'loss/train': 0.16695256531238556} -11/07/2021 01:47:22 - INFO - __main__ - Step 32202: {'lr': 0.0004503631862010076, 'samples': 6182784, 'steps': 32201, 'loss/train': 1.8757727146148682} -11/07/2021 01:47:23 - INFO - __main__ - Step 32203: {'lr': 0.0004503600124143955, 'samples': 6182976, 'steps': 32202, 'loss/train': 1.8070666790008545} -11/07/2021 01:47:24 - INFO - __main__ - Step 32204: {'lr': 0.0004503568385375043, 'samples': 6183168, 'steps': 32203, 'loss/train': 1.2195488214492798} -11/07/2021 01:47:24 - INFO - __main__ - Step 32205: {'lr': 0.00045035366457033546, 'samples': 6183360, 'steps': 32204, 'loss/train': 1.3440762758255005} -11/07/2021 01:47:24 - INFO - __main__ - Step 32206: {'lr': 0.00045035049051289037, 'samples': 6183552, 'steps': 32205, 'loss/train': 1.389227032661438} -11/07/2021 01:47:25 - INFO - __main__ - Step 32207: {'lr': 0.00045034731636517036, 'samples': 6183744, 'steps': 32206, 'loss/train': 1.765787959098816} -11/07/2021 01:47:26 - INFO - __main__ - Step 32208: {'lr': 0.0004503441421271769, 'samples': 6183936, 'steps': 32207, 'loss/train': 1.577767014503479} -11/07/2021 01:47:26 - INFO - __main__ - Step 32209: {'lr': 0.0004503409677989115, 'samples': 6184128, 'steps': 32208, 'loss/train': 1.5536357164382935} -11/07/2021 01:47:27 - INFO - __main__ - Step 32210: {'lr': 0.00045033779338037565, 'samples': 6184320, 'steps': 32209, 'loss/train': 3.0786328315734863} -11/07/2021 01:47:27 - INFO - __main__ - Step 32211: {'lr': 0.0004503346188715706, 'samples': 6184512, 'steps': 32210, 'loss/train': 1.5683656930923462} -11/07/2021 01:47:27 - INFO - __main__ - Step 32212: {'lr': 0.0004503314442724979, 'samples': 6184704, 'steps': 32211, 'loss/train': 1.1409876346588135} -11/07/2021 01:47:28 - INFO - __main__ - Step 32213: {'lr': 0.0004503282695831589, 'samples': 6184896, 'steps': 32212, 'loss/train': 2.376875400543213} -11/07/2021 01:47:29 - INFO - __main__ - Step 32214: {'lr': 0.0004503250948035551, 'samples': 6185088, 'steps': 32213, 'loss/train': 1.9134149551391602} -11/07/2021 01:47:29 - INFO - __main__ - Step 32215: {'lr': 0.0004503219199336879, 'samples': 6185280, 'steps': 32214, 'loss/train': 0.9256809949874878} -11/07/2021 01:47:30 - INFO - __main__ - Step 32216: {'lr': 0.00045031874497355876, 'samples': 6185472, 'steps': 32215, 'loss/train': 1.794251799583435} -11/07/2021 01:47:30 - INFO - __main__ - Step 32217: {'lr': 0.000450315569923169, 'samples': 6185664, 'steps': 32216, 'loss/train': 1.9647176265716553} -11/07/2021 01:47:30 - INFO - __main__ - Step 32218: {'lr': 0.00045031239478252017, 'samples': 6185856, 'steps': 32217, 'loss/train': 1.6685179471969604} -11/07/2021 01:47:31 - INFO - __main__ - Step 32219: {'lr': 0.00045030921955161373, 'samples': 6186048, 'steps': 32218, 'loss/train': 1.7403217554092407} -11/07/2021 01:47:32 - INFO - __main__ - Step 32220: {'lr': 0.000450306044230451, 'samples': 6186240, 'steps': 32219, 'loss/train': 1.0186405181884766} -11/07/2021 01:47:32 - INFO - __main__ - Step 32221: {'lr': 0.0004503028688190335, 'samples': 6186432, 'steps': 32220, 'loss/train': 1.6435362100601196} -11/07/2021 01:47:32 - INFO - __main__ - Step 32222: {'lr': 0.00045029969331736254, 'samples': 6186624, 'steps': 32221, 'loss/train': 1.9964864253997803} -11/07/2021 01:47:33 - INFO - __main__ - Step 32223: {'lr': 0.00045029651772543965, 'samples': 6186816, 'steps': 32222, 'loss/train': 1.9309375286102295} -11/07/2021 01:47:34 - INFO - __main__ - Step 32224: {'lr': 0.0004502933420432662, 'samples': 6187008, 'steps': 32223, 'loss/train': 1.053402304649353} -11/07/2021 01:47:34 - INFO - __main__ - Step 32225: {'lr': 0.0004502901662708437, 'samples': 6187200, 'steps': 32224, 'loss/train': 1.0154645442962646} -11/07/2021 01:47:34 - INFO - __main__ - Step 32226: {'lr': 0.0004502869904081736, 'samples': 6187392, 'steps': 32225, 'loss/train': 1.5956135988235474} -11/07/2021 01:47:35 - INFO - __main__ - Step 32227: {'lr': 0.00045028381445525725, 'samples': 6187584, 'steps': 32226, 'loss/train': 1.768977403640747} -11/07/2021 01:47:35 - INFO - __main__ - Step 32228: {'lr': 0.0004502806384120961, 'samples': 6187776, 'steps': 32227, 'loss/train': 1.180979609489441} -11/07/2021 01:47:36 - INFO - __main__ - Step 32229: {'lr': 0.0004502774622786915, 'samples': 6187968, 'steps': 32228, 'loss/train': 1.636723518371582} -11/07/2021 01:47:36 - INFO - __main__ - Step 32230: {'lr': 0.00045027428605504507, 'samples': 6188160, 'steps': 32229, 'loss/train': 1.6560455560684204} -11/07/2021 01:47:37 - INFO - __main__ - Step 32231: {'lr': 0.00045027110974115814, 'samples': 6188352, 'steps': 32230, 'loss/train': 1.9419082403182983} -11/07/2021 01:47:37 - INFO - __main__ - Step 32232: {'lr': 0.0004502679333370321, 'samples': 6188544, 'steps': 32231, 'loss/train': 1.2935874462127686} -11/07/2021 01:47:37 - INFO - __main__ - Step 32233: {'lr': 0.0004502647568426684, 'samples': 6188736, 'steps': 32232, 'loss/train': 1.598137378692627} -11/07/2021 01:47:38 - INFO - __main__ - Step 32234: {'lr': 0.0004502615802580685, 'samples': 6188928, 'steps': 32233, 'loss/train': 1.5005950927734375} -11/07/2021 01:47:39 - INFO - __main__ - Step 32235: {'lr': 0.0004502584035832338, 'samples': 6189120, 'steps': 32234, 'loss/train': 1.0328993797302246} -11/07/2021 01:47:39 - INFO - __main__ - Step 32236: {'lr': 0.00045025522681816586, 'samples': 6189312, 'steps': 32235, 'loss/train': 1.4519612789154053} -11/07/2021 01:47:39 - INFO - __main__ - Step 32237: {'lr': 0.0004502520499628659, 'samples': 6189504, 'steps': 32236, 'loss/train': 1.620317816734314} -11/07/2021 01:47:40 - INFO - __main__ - Step 32238: {'lr': 0.00045024887301733555, 'samples': 6189696, 'steps': 32237, 'loss/train': 1.6385005712509155} -11/07/2021 01:47:41 - INFO - __main__ - Step 32239: {'lr': 0.0004502456959815761, 'samples': 6189888, 'steps': 32238, 'loss/train': 1.7109335660934448} -11/07/2021 01:47:41 - INFO - __main__ - Step 32240: {'lr': 0.000450242518855589, 'samples': 6190080, 'steps': 32239, 'loss/train': 0.9207674860954285} -11/07/2021 01:47:42 - INFO - __main__ - Step 32241: {'lr': 0.00045023934163937565, 'samples': 6190272, 'steps': 32240, 'loss/train': 1.6926556825637817} -11/07/2021 01:47:42 - INFO - __main__ - Step 32242: {'lr': 0.00045023616433293763, 'samples': 6190464, 'steps': 32241, 'loss/train': 1.55082106590271} -11/07/2021 01:47:42 - INFO - __main__ - Step 32243: {'lr': 0.00045023298693627626, 'samples': 6190656, 'steps': 32242, 'loss/train': 1.2392164468765259} -11/07/2021 01:47:43 - INFO - __main__ - Step 32244: {'lr': 0.000450229809449393, 'samples': 6190848, 'steps': 32243, 'loss/train': 1.5431742668151855} -11/07/2021 01:47:44 - INFO - __main__ - Step 32245: {'lr': 0.00045022663187228927, 'samples': 6191040, 'steps': 32244, 'loss/train': 1.3102967739105225} -11/07/2021 01:47:44 - INFO - __main__ - Step 32246: {'lr': 0.0004502234542049666, 'samples': 6191232, 'steps': 32245, 'loss/train': 1.9321751594543457} -11/07/2021 01:47:44 - INFO - __main__ - Step 32247: {'lr': 0.00045022027644742624, 'samples': 6191424, 'steps': 32246, 'loss/train': 1.9687552452087402} -11/07/2021 01:47:45 - INFO - __main__ - Step 32248: {'lr': 0.0004502170985996697, 'samples': 6191616, 'steps': 32247, 'loss/train': 1.6017018556594849} -11/07/2021 01:47:45 - INFO - __main__ - Step 32249: {'lr': 0.00045021392066169844, 'samples': 6191808, 'steps': 32248, 'loss/train': 1.8045872449874878} -11/07/2021 01:47:46 - INFO - __main__ - Step 32250: {'lr': 0.0004502107426335139, 'samples': 6192000, 'steps': 32249, 'loss/train': 1.603269338607788} -11/07/2021 01:47:47 - INFO - __main__ - Step 32251: {'lr': 0.0004502075645151175, 'samples': 6192192, 'steps': 32250, 'loss/train': 1.9542632102966309} -11/07/2021 01:47:47 - INFO - __main__ - Step 32252: {'lr': 0.0004502043863065106, 'samples': 6192384, 'steps': 32251, 'loss/train': 1.8218039274215698} -11/07/2021 01:47:47 - INFO - __main__ - Step 32253: {'lr': 0.00045020120800769474, 'samples': 6192576, 'steps': 32252, 'loss/train': 1.427304744720459} -11/07/2021 01:47:48 - INFO - __main__ - Step 32254: {'lr': 0.0004501980296186713, 'samples': 6192768, 'steps': 32253, 'loss/train': 1.3513579368591309} -11/07/2021 01:47:48 - INFO - __main__ - Step 32255: {'lr': 0.0004501948511394417, 'samples': 6192960, 'steps': 32254, 'loss/train': 1.3751741647720337} -11/07/2021 01:47:49 - INFO - __main__ - Step 32256: {'lr': 0.0004501916725700074, 'samples': 6193152, 'steps': 32255, 'loss/train': 1.3976471424102783} -11/07/2021 01:47:50 - INFO - __main__ - Step 32257: {'lr': 0.00045018849391036987, 'samples': 6193344, 'steps': 32256, 'loss/train': 1.300757646560669} -11/07/2021 01:47:50 - INFO - __main__ - Step 32258: {'lr': 0.00045018531516053046, 'samples': 6193536, 'steps': 32257, 'loss/train': 1.3747690916061401} -11/07/2021 01:47:50 - INFO - __main__ - Step 32259: {'lr': 0.0004501821363204906, 'samples': 6193728, 'steps': 32258, 'loss/train': 1.2249864339828491} -11/07/2021 01:47:51 - INFO - __main__ - Step 32260: {'lr': 0.00045017895739025185, 'samples': 6193920, 'steps': 32259, 'loss/train': 0.8205302357673645} -11/07/2021 01:47:52 - INFO - __main__ - Step 32261: {'lr': 0.0004501757783698154, 'samples': 6194112, 'steps': 32260, 'loss/train': 1.5389779806137085} -11/07/2021 01:47:52 - INFO - __main__ - Step 32262: {'lr': 0.00045017259925918295, 'samples': 6194304, 'steps': 32261, 'loss/train': 1.7591694593429565} -11/07/2021 01:47:52 - INFO - __main__ - Step 32263: {'lr': 0.0004501694200583558, 'samples': 6194496, 'steps': 32262, 'loss/train': 1.3185373544692993} -11/07/2021 01:47:53 - INFO - __main__ - Step 32264: {'lr': 0.0004501662407673354, 'samples': 6194688, 'steps': 32263, 'loss/train': 1.338904857635498} -11/07/2021 01:47:53 - INFO - __main__ - Step 32265: {'lr': 0.00045016306138612313, 'samples': 6194880, 'steps': 32264, 'loss/train': 1.3383913040161133} -11/07/2021 01:47:54 - INFO - __main__ - Step 32266: {'lr': 0.0004501598819147205, 'samples': 6195072, 'steps': 32265, 'loss/train': 2.0385541915893555} -11/07/2021 01:47:54 - INFO - __main__ - Step 32267: {'lr': 0.00045015670235312895, 'samples': 6195264, 'steps': 32266, 'loss/train': 1.398764729499817} -11/07/2021 01:47:55 - INFO - __main__ - Step 32268: {'lr': 0.0004501535227013498, 'samples': 6195456, 'steps': 32267, 'loss/train': 1.4296706914901733} -11/07/2021 01:47:55 - INFO - __main__ - Step 32269: {'lr': 0.0004501503429593846, 'samples': 6195648, 'steps': 32268, 'loss/train': 2.022183418273926} -11/07/2021 01:47:55 - INFO - __main__ - Step 32270: {'lr': 0.0004501471631272348, 'samples': 6195840, 'steps': 32269, 'loss/train': 1.373524785041809} -11/07/2021 01:47:57 - INFO - __main__ - Step 32271: {'lr': 0.00045014398320490173, 'samples': 6196032, 'steps': 32270, 'loss/train': 1.0820329189300537} -11/07/2021 01:47:57 - INFO - __main__ - Step 32272: {'lr': 0.00045014080319238686, 'samples': 6196224, 'steps': 32271, 'loss/train': 1.12027907371521} -11/07/2021 01:47:57 - INFO - __main__ - Step 32273: {'lr': 0.00045013762308969164, 'samples': 6196416, 'steps': 32272, 'loss/train': 1.7232547998428345} -11/07/2021 01:47:58 - INFO - __main__ - Step 32274: {'lr': 0.00045013444289681757, 'samples': 6196608, 'steps': 32273, 'loss/train': 1.3769302368164062} -11/07/2021 01:47:58 - INFO - __main__ - Step 32275: {'lr': 0.0004501312626137659, 'samples': 6196800, 'steps': 32274, 'loss/train': 1.300300121307373} -11/07/2021 01:47:59 - INFO - __main__ - Step 32276: {'lr': 0.0004501280822405382, 'samples': 6196992, 'steps': 32275, 'loss/train': 1.6742898225784302} -11/07/2021 01:47:59 - INFO - __main__ - Step 32277: {'lr': 0.00045012490177713586, 'samples': 6197184, 'steps': 32276, 'loss/train': 1.5575422048568726} -11/07/2021 01:48:00 - INFO - __main__ - Step 32278: {'lr': 0.00045012172122356036, 'samples': 6197376, 'steps': 32277, 'loss/train': 1.6483980417251587} -11/07/2021 01:48:00 - INFO - __main__ - Step 32279: {'lr': 0.0004501185405798131, 'samples': 6197568, 'steps': 32278, 'loss/train': 1.6229832172393799} -11/07/2021 01:48:00 - INFO - __main__ - Step 32280: {'lr': 0.00045011535984589544, 'samples': 6197760, 'steps': 32279, 'loss/train': 1.3071985244750977} -11/07/2021 01:48:01 - INFO - __main__ - Step 32281: {'lr': 0.000450112179021809, 'samples': 6197952, 'steps': 32280, 'loss/train': 1.3725543022155762} -11/07/2021 01:48:02 - INFO - __main__ - Step 32282: {'lr': 0.00045010899810755506, 'samples': 6198144, 'steps': 32281, 'loss/train': 1.4773143529891968} -11/07/2021 01:48:02 - INFO - __main__ - Step 32283: {'lr': 0.00045010581710313506, 'samples': 6198336, 'steps': 32282, 'loss/train': 1.4009032249450684} -11/07/2021 01:48:02 - INFO - __main__ - Step 32284: {'lr': 0.0004501026360085505, 'samples': 6198528, 'steps': 32283, 'loss/train': 1.030112624168396} -11/07/2021 01:48:03 - INFO - __main__ - Step 32285: {'lr': 0.0004500994548238028, 'samples': 6198720, 'steps': 32284, 'loss/train': 1.2472800016403198} -11/07/2021 01:48:03 - INFO - __main__ - Step 32286: {'lr': 0.00045009627354889337, 'samples': 6198912, 'steps': 32285, 'loss/train': 1.8431708812713623} -11/07/2021 01:48:04 - INFO - __main__ - Step 32287: {'lr': 0.0004500930921838236, 'samples': 6199104, 'steps': 32286, 'loss/train': 1.1655179262161255} -11/07/2021 01:48:05 - INFO - __main__ - Step 32288: {'lr': 0.000450089910728595, 'samples': 6199296, 'steps': 32287, 'loss/train': 0.7153118252754211} -11/07/2021 01:48:05 - INFO - __main__ - Step 32289: {'lr': 0.0004500867291832089, 'samples': 6199488, 'steps': 32288, 'loss/train': 1.3063770532608032} -11/07/2021 01:48:05 - INFO - __main__ - Step 32290: {'lr': 0.00045008354754766687, 'samples': 6199680, 'steps': 32289, 'loss/train': 1.4782352447509766} -11/07/2021 01:48:06 - INFO - __main__ - Step 32291: {'lr': 0.0004500803658219703, 'samples': 6199872, 'steps': 32290, 'loss/train': 1.7052644491195679} -11/07/2021 01:48:07 - INFO - __main__ - Step 32292: {'lr': 0.0004500771840061206, 'samples': 6200064, 'steps': 32291, 'loss/train': 1.9112358093261719} -11/07/2021 01:48:07 - INFO - __main__ - Step 32293: {'lr': 0.00045007400210011925, 'samples': 6200256, 'steps': 32292, 'loss/train': 2.1962902545928955} -11/07/2021 01:48:07 - INFO - __main__ - Step 32294: {'lr': 0.0004500708201039676, 'samples': 6200448, 'steps': 32293, 'loss/train': 1.5316219329833984} -11/07/2021 01:48:08 - INFO - __main__ - Step 32295: {'lr': 0.0004500676380176671, 'samples': 6200640, 'steps': 32294, 'loss/train': 1.7628265619277954} -11/07/2021 01:48:08 - INFO - __main__ - Step 32296: {'lr': 0.00045006445584121923, 'samples': 6200832, 'steps': 32295, 'loss/train': 1.9976251125335693} -11/07/2021 01:48:09 - INFO - __main__ - Step 32297: {'lr': 0.00045006127357462533, 'samples': 6201024, 'steps': 32296, 'loss/train': 1.5440441370010376} -11/07/2021 01:48:09 - INFO - __main__ - Step 32298: {'lr': 0.000450058091217887, 'samples': 6201216, 'steps': 32297, 'loss/train': 1.672995924949646} -11/07/2021 01:48:10 - INFO - __main__ - Step 32299: {'lr': 0.0004500549087710056, 'samples': 6201408, 'steps': 32298, 'loss/train': 1.8858267068862915} -11/07/2021 01:48:10 - INFO - __main__ - Step 32300: {'lr': 0.0004500517262339825, 'samples': 6201600, 'steps': 32299, 'loss/train': 1.860845685005188} -11/07/2021 01:48:11 - INFO - __main__ - Step 32301: {'lr': 0.0004500485436068191, 'samples': 6201792, 'steps': 32300, 'loss/train': 1.3300939798355103} -11/07/2021 01:48:12 - INFO - __main__ - Step 32302: {'lr': 0.0004500453608895171, 'samples': 6201984, 'steps': 32301, 'loss/train': 1.4846974611282349} -11/07/2021 01:48:12 - INFO - __main__ - Step 32303: {'lr': 0.00045004217808207757, 'samples': 6202176, 'steps': 32302, 'loss/train': 1.9711004495620728} -11/07/2021 01:48:12 - INFO - __main__ - Step 32304: {'lr': 0.0004500389951845022, 'samples': 6202368, 'steps': 32303, 'loss/train': 0.865800678730011} -11/07/2021 01:48:13 - INFO - __main__ - Step 32305: {'lr': 0.00045003581219679235, 'samples': 6202560, 'steps': 32304, 'loss/train': 1.3765199184417725} -11/07/2021 01:48:13 - INFO - __main__ - Step 32306: {'lr': 0.00045003262911894943, 'samples': 6202752, 'steps': 32305, 'loss/train': 1.862096905708313} -11/07/2021 01:48:14 - INFO - __main__ - Step 32307: {'lr': 0.00045002944595097494, 'samples': 6202944, 'steps': 32306, 'loss/train': 1.1746426820755005} -11/07/2021 01:48:14 - INFO - __main__ - Step 32308: {'lr': 0.00045002626269287024, 'samples': 6203136, 'steps': 32307, 'loss/train': 1.4557210206985474} -11/07/2021 01:48:15 - INFO - __main__ - Step 32309: {'lr': 0.00045002307934463673, 'samples': 6203328, 'steps': 32308, 'loss/train': 1.4870140552520752} -11/07/2021 01:48:15 - INFO - __main__ - Step 32310: {'lr': 0.000450019895906276, 'samples': 6203520, 'steps': 32309, 'loss/train': 1.0892274379730225} -11/07/2021 01:48:15 - INFO - __main__ - Step 32311: {'lr': 0.0004500167123777894, 'samples': 6203712, 'steps': 32310, 'loss/train': 1.544129729270935} -11/07/2021 01:48:16 - INFO - __main__ - Step 32312: {'lr': 0.00045001352875917824, 'samples': 6203904, 'steps': 32311, 'loss/train': 1.6808295249938965} -11/07/2021 01:48:17 - INFO - __main__ - Step 32313: {'lr': 0.00045001034505044415, 'samples': 6204096, 'steps': 32312, 'loss/train': 1.686047077178955} -11/07/2021 01:48:17 - INFO - __main__ - Step 32314: {'lr': 0.00045000716125158846, 'samples': 6204288, 'steps': 32313, 'loss/train': 1.6952117681503296} -11/07/2021 01:48:18 - INFO - __main__ - Step 32315: {'lr': 0.0004500039773626127, 'samples': 6204480, 'steps': 32314, 'loss/train': 1.413800835609436} -11/07/2021 01:48:18 - INFO - __main__ - Step 32316: {'lr': 0.00045000079338351805, 'samples': 6204672, 'steps': 32315, 'loss/train': 1.6651508808135986} -11/07/2021 01:48:19 - INFO - __main__ - Step 32317: {'lr': 0.0004499976093143063, 'samples': 6204864, 'steps': 32316, 'loss/train': 1.5840280055999756} -11/07/2021 01:48:19 - INFO - __main__ - Step 32318: {'lr': 0.00044999442515497866, 'samples': 6205056, 'steps': 32317, 'loss/train': 1.7664008140563965} -11/07/2021 01:48:20 - INFO - __main__ - Step 32319: {'lr': 0.0004499912409055367, 'samples': 6205248, 'steps': 32318, 'loss/train': 1.6453135013580322} -11/07/2021 01:48:20 - INFO - __main__ - Step 32320: {'lr': 0.0004499880565659816, 'samples': 6205440, 'steps': 32319, 'loss/train': 1.4619554281234741} -11/07/2021 01:48:20 - INFO - __main__ - Step 32321: {'lr': 0.0004499848721363151, 'samples': 6205632, 'steps': 32320, 'loss/train': 2.0209126472473145} -11/07/2021 01:48:21 - INFO - __main__ - Step 32322: {'lr': 0.0004499816876165385, 'samples': 6205824, 'steps': 32321, 'loss/train': 1.6794594526290894} -11/07/2021 01:48:22 - INFO - __main__ - Step 32323: {'lr': 0.0004499785030066532, 'samples': 6206016, 'steps': 32322, 'loss/train': 1.405039668083191} -11/07/2021 01:48:22 - INFO - __main__ - Step 32324: {'lr': 0.00044997531830666073, 'samples': 6206208, 'steps': 32323, 'loss/train': 0.8761853575706482} -11/07/2021 01:48:23 - INFO - __main__ - Step 32325: {'lr': 0.00044997213351656237, 'samples': 6206400, 'steps': 32324, 'loss/train': 1.3782182931900024} -11/07/2021 01:48:23 - INFO - __main__ - Step 32326: {'lr': 0.00044996894863635965, 'samples': 6206592, 'steps': 32325, 'loss/train': 1.345014214515686} -11/07/2021 01:48:23 - INFO - __main__ - Step 32327: {'lr': 0.00044996576366605415, 'samples': 6206784, 'steps': 32326, 'loss/train': 1.9174363613128662} -11/07/2021 01:48:24 - INFO - __main__ - Step 32328: {'lr': 0.00044996257860564705, 'samples': 6206976, 'steps': 32327, 'loss/train': 1.2590142488479614} -11/07/2021 01:48:25 - INFO - __main__ - Step 32329: {'lr': 0.0004499593934551399, 'samples': 6207168, 'steps': 32328, 'loss/train': 3.155000686645508} -11/07/2021 01:48:25 - INFO - __main__ - Step 32330: {'lr': 0.00044995620821453416, 'samples': 6207360, 'steps': 32329, 'loss/train': 1.9484862089157104} -11/07/2021 01:48:25 - INFO - __main__ - Step 32331: {'lr': 0.00044995302288383123, 'samples': 6207552, 'steps': 32330, 'loss/train': 1.1827287673950195} -11/07/2021 01:48:26 - INFO - __main__ - Step 32332: {'lr': 0.0004499498374630325, 'samples': 6207744, 'steps': 32331, 'loss/train': 0.9975447654724121} -11/07/2021 01:48:26 - INFO - __main__ - Step 32333: {'lr': 0.0004499466519521396, 'samples': 6207936, 'steps': 32332, 'loss/train': 1.891614556312561} -11/07/2021 01:48:27 - INFO - __main__ - Step 32334: {'lr': 0.00044994346635115367, 'samples': 6208128, 'steps': 32333, 'loss/train': 1.2407118082046509} -11/07/2021 01:48:28 - INFO - __main__ - Step 32335: {'lr': 0.00044994028066007636, 'samples': 6208320, 'steps': 32334, 'loss/train': 0.8754911422729492} -11/07/2021 01:48:28 - INFO - __main__ - Step 32336: {'lr': 0.00044993709487890906, 'samples': 6208512, 'steps': 32335, 'loss/train': 1.402904748916626} -11/07/2021 01:48:28 - INFO - __main__ - Step 32337: {'lr': 0.0004499339090076532, 'samples': 6208704, 'steps': 32336, 'loss/train': 2.068150520324707} -11/07/2021 01:48:29 - INFO - __main__ - Step 32338: {'lr': 0.0004499307230463102, 'samples': 6208896, 'steps': 32337, 'loss/train': 1.460711121559143} -11/07/2021 01:48:30 - INFO - __main__ - Step 32339: {'lr': 0.0004499275369948814, 'samples': 6209088, 'steps': 32338, 'loss/train': 1.7848551273345947} -11/07/2021 01:48:30 - INFO - __main__ - Step 32340: {'lr': 0.0004499243508533685, 'samples': 6209280, 'steps': 32339, 'loss/train': 1.4753457307815552} -11/07/2021 01:48:30 - INFO - __main__ - Step 32341: {'lr': 0.0004499211646217727, 'samples': 6209472, 'steps': 32340, 'loss/train': 1.7661265134811401} -11/07/2021 01:48:31 - INFO - __main__ - Step 32342: {'lr': 0.00044991797830009543, 'samples': 6209664, 'steps': 32341, 'loss/train': 2.685377597808838} -11/07/2021 01:48:31 - INFO - __main__ - Step 32343: {'lr': 0.00044991479188833826, 'samples': 6209856, 'steps': 32342, 'loss/train': 1.4869948625564575} -11/07/2021 01:48:32 - INFO - __main__ - Step 32344: {'lr': 0.0004499116053865026, 'samples': 6210048, 'steps': 32343, 'loss/train': 1.4335551261901855} -11/07/2021 01:48:32 - INFO - __main__ - Step 32345: {'lr': 0.0004499084187945899, 'samples': 6210240, 'steps': 32344, 'loss/train': 1.3646057844161987} -11/07/2021 01:48:33 - INFO - __main__ - Step 32346: {'lr': 0.0004499052321126015, 'samples': 6210432, 'steps': 32345, 'loss/train': 1.448341965675354} -11/07/2021 01:48:33 - INFO - __main__ - Step 32347: {'lr': 0.0004499020453405388, 'samples': 6210624, 'steps': 32346, 'loss/train': 1.9387210607528687} -11/07/2021 01:48:33 - INFO - __main__ - Step 32348: {'lr': 0.00044989885847840344, 'samples': 6210816, 'steps': 32347, 'loss/train': 1.3974018096923828} -11/07/2021 01:48:35 - INFO - __main__ - Step 32349: {'lr': 0.0004498956715261967, 'samples': 6211008, 'steps': 32348, 'loss/train': 0.2207542210817337} -11/07/2021 01:48:35 - INFO - __main__ - Step 32350: {'lr': 0.00044989248448392007, 'samples': 6211200, 'steps': 32349, 'loss/train': 1.630966305732727} -11/07/2021 01:48:35 - INFO - __main__ - Step 32351: {'lr': 0.000449889297351575, 'samples': 6211392, 'steps': 32350, 'loss/train': 1.0773181915283203} -11/07/2021 01:48:36 - INFO - __main__ - Step 32352: {'lr': 0.0004498861101291628, 'samples': 6211584, 'steps': 32351, 'loss/train': 1.5037585496902466} -11/07/2021 01:48:36 - INFO - __main__ - Step 32353: {'lr': 0.0004498829228166851, 'samples': 6211776, 'steps': 32352, 'loss/train': 1.4931249618530273} -11/07/2021 01:48:37 - INFO - __main__ - Step 32354: {'lr': 0.0004498797354141432, 'samples': 6211968, 'steps': 32353, 'loss/train': 1.459004521369934} -11/07/2021 01:48:37 - INFO - __main__ - Step 32355: {'lr': 0.00044987654792153853, 'samples': 6212160, 'steps': 32354, 'loss/train': 1.4395281076431274} -11/07/2021 01:48:38 - INFO - __main__ - Step 32356: {'lr': 0.0004498733603388726, 'samples': 6212352, 'steps': 32355, 'loss/train': 1.4898239374160767} -11/07/2021 01:48:38 - INFO - __main__ - Step 32357: {'lr': 0.00044987017266614684, 'samples': 6212544, 'steps': 32356, 'loss/train': 1.539486289024353} -11/07/2021 01:48:38 - INFO - __main__ - Step 32358: {'lr': 0.00044986698490336263, 'samples': 6212736, 'steps': 32357, 'loss/train': 0.8823086023330688} -11/07/2021 01:48:39 - INFO - __main__ - Step 32359: {'lr': 0.0004498637970505215, 'samples': 6212928, 'steps': 32358, 'loss/train': 1.9765815734863281} -11/07/2021 01:48:40 - INFO - __main__ - Step 32360: {'lr': 0.0004498606091076248, 'samples': 6213120, 'steps': 32359, 'loss/train': 1.6369905471801758} -11/07/2021 01:48:40 - INFO - __main__ - Step 32361: {'lr': 0.000449857421074674, 'samples': 6213312, 'steps': 32360, 'loss/train': 1.4293484687805176} -11/07/2021 01:48:40 - INFO - __main__ - Step 32362: {'lr': 0.0004498542329516705, 'samples': 6213504, 'steps': 32361, 'loss/train': 1.5993635654449463} -11/07/2021 01:48:41 - INFO - __main__ - Step 32363: {'lr': 0.00044985104473861583, 'samples': 6213696, 'steps': 32362, 'loss/train': 1.6762796640396118} -11/07/2021 01:48:41 - INFO - __main__ - Step 32364: {'lr': 0.0004498478564355113, 'samples': 6213888, 'steps': 32363, 'loss/train': 1.624647617340088} -11/07/2021 01:48:42 - INFO - __main__ - Step 32365: {'lr': 0.0004498446680423584, 'samples': 6214080, 'steps': 32364, 'loss/train': 1.441513180732727} -11/07/2021 01:48:42 - INFO - __main__ - Step 32366: {'lr': 0.0004498414795591586, 'samples': 6214272, 'steps': 32365, 'loss/train': 1.322672963142395} -11/07/2021 01:48:43 - INFO - __main__ - Step 32367: {'lr': 0.00044983829098591336, 'samples': 6214464, 'steps': 32366, 'loss/train': 0.8546894788742065} -11/07/2021 01:48:43 - INFO - __main__ - Step 32368: {'lr': 0.00044983510232262405, 'samples': 6214656, 'steps': 32367, 'loss/train': 1.2581473588943481} -11/07/2021 01:48:43 - INFO - __main__ - Step 32369: {'lr': 0.0004498319135692921, 'samples': 6214848, 'steps': 32368, 'loss/train': 1.3132758140563965} -11/07/2021 01:48:44 - INFO - __main__ - Step 32370: {'lr': 0.00044982872472591897, 'samples': 6215040, 'steps': 32369, 'loss/train': 1.441627025604248} -11/07/2021 01:48:45 - INFO - __main__ - Step 32371: {'lr': 0.00044982553579250606, 'samples': 6215232, 'steps': 32370, 'loss/train': 1.1300324201583862} -11/07/2021 01:48:45 - INFO - __main__ - Step 32372: {'lr': 0.0004498223467690549, 'samples': 6215424, 'steps': 32371, 'loss/train': 1.257175087928772} -11/07/2021 01:48:45 - INFO - __main__ - Step 32373: {'lr': 0.0004498191576555669, 'samples': 6215616, 'steps': 32372, 'loss/train': 0.9374439120292664} -11/07/2021 01:48:46 - INFO - __main__ - Step 32374: {'lr': 0.00044981596845204344, 'samples': 6215808, 'steps': 32373, 'loss/train': 1.484535813331604} -11/07/2021 01:48:47 - INFO - __main__ - Step 32375: {'lr': 0.00044981277915848595, 'samples': 6216000, 'steps': 32374, 'loss/train': 1.8038363456726074} -11/07/2021 01:48:47 - INFO - __main__ - Step 32376: {'lr': 0.00044980958977489593, 'samples': 6216192, 'steps': 32375, 'loss/train': 1.2944344282150269} -11/07/2021 01:48:48 - INFO - __main__ - Step 32377: {'lr': 0.00044980640030127484, 'samples': 6216384, 'steps': 32376, 'loss/train': 1.5786190032958984} -11/07/2021 01:48:48 - INFO - __main__ - Step 32378: {'lr': 0.00044980321073762405, 'samples': 6216576, 'steps': 32377, 'loss/train': 1.259092926979065} -11/07/2021 01:48:48 - INFO - __main__ - Step 32379: {'lr': 0.00044980002108394496, 'samples': 6216768, 'steps': 32378, 'loss/train': 1.260203242301941} -11/07/2021 01:48:49 - INFO - __main__ - Step 32380: {'lr': 0.0004497968313402391, 'samples': 6216960, 'steps': 32379, 'loss/train': 1.7739508152008057} -11/07/2021 01:48:50 - INFO - __main__ - Step 32381: {'lr': 0.00044979364150650794, 'samples': 6217152, 'steps': 32380, 'loss/train': 1.782575011253357} -11/07/2021 01:48:50 - INFO - __main__ - Step 32382: {'lr': 0.00044979045158275273, 'samples': 6217344, 'steps': 32381, 'loss/train': 1.9300806522369385} -11/07/2021 01:48:51 - INFO - __main__ - Step 32383: {'lr': 0.0004497872615689751, 'samples': 6217536, 'steps': 32382, 'loss/train': 0.8333058953285217} -11/07/2021 01:48:51 - INFO - __main__ - Step 32384: {'lr': 0.00044978407146517634, 'samples': 6217728, 'steps': 32383, 'loss/train': 0.957953155040741} -11/07/2021 01:48:52 - INFO - __main__ - Step 32385: {'lr': 0.0004497808812713581, 'samples': 6217920, 'steps': 32384, 'loss/train': 1.0447723865509033} -11/07/2021 01:48:52 - INFO - __main__ - Step 32386: {'lr': 0.00044977769098752154, 'samples': 6218112, 'steps': 32385, 'loss/train': 1.5469779968261719} -11/07/2021 01:48:53 - INFO - __main__ - Step 32387: {'lr': 0.0004497745006136683, 'samples': 6218304, 'steps': 32386, 'loss/train': 1.6424702405929565} -11/07/2021 01:48:53 - INFO - __main__ - Step 32388: {'lr': 0.00044977131014979974, 'samples': 6218496, 'steps': 32387, 'loss/train': 1.2199071645736694} -11/07/2021 01:48:53 - INFO - __main__ - Step 32389: {'lr': 0.0004497681195959173, 'samples': 6218688, 'steps': 32388, 'loss/train': 1.6586096286773682} -11/07/2021 01:48:54 - INFO - __main__ - Step 32390: {'lr': 0.0004497649289520224, 'samples': 6218880, 'steps': 32389, 'loss/train': 0.7270222902297974} -11/07/2021 01:48:55 - INFO - __main__ - Step 32391: {'lr': 0.00044976173821811654, 'samples': 6219072, 'steps': 32390, 'loss/train': 1.5894689559936523} -11/07/2021 01:48:55 - INFO - __main__ - Step 32392: {'lr': 0.0004497585473942011, 'samples': 6219264, 'steps': 32391, 'loss/train': 1.3609628677368164} -11/07/2021 01:48:55 - INFO - __main__ - Step 32393: {'lr': 0.0004497553564802776, 'samples': 6219456, 'steps': 32392, 'loss/train': 1.3615731000900269} -11/07/2021 01:48:56 - INFO - __main__ - Step 32394: {'lr': 0.0004497521654763474, 'samples': 6219648, 'steps': 32393, 'loss/train': 1.7795207500457764} -11/07/2021 01:48:57 - INFO - __main__ - Step 32395: {'lr': 0.0004497489743824119, 'samples': 6219840, 'steps': 32394, 'loss/train': 1.0525424480438232} -11/07/2021 01:48:57 - INFO - __main__ - Step 32396: {'lr': 0.0004497457831984727, 'samples': 6220032, 'steps': 32395, 'loss/train': 1.5898518562316895} -11/07/2021 01:48:57 - INFO - __main__ - Step 32397: {'lr': 0.00044974259192453103, 'samples': 6220224, 'steps': 32396, 'loss/train': 1.645259141921997} -11/07/2021 01:48:58 - INFO - __main__ - Step 32398: {'lr': 0.0004497394005605885, 'samples': 6220416, 'steps': 32397, 'loss/train': 1.6547985076904297} -11/07/2021 01:48:58 - INFO - __main__ - Step 32399: {'lr': 0.00044973620910664645, 'samples': 6220608, 'steps': 32398, 'loss/train': 1.6538923978805542} -11/07/2021 01:48:59 - INFO - __main__ - Step 32400: {'lr': 0.00044973301756270635, 'samples': 6220800, 'steps': 32399, 'loss/train': 1.4757723808288574} -11/07/2021 01:49:00 - INFO - __main__ - Step 32401: {'lr': 0.0004497298259287696, 'samples': 6220992, 'steps': 32400, 'loss/train': 1.810659646987915} -11/07/2021 01:49:00 - INFO - __main__ - Step 32402: {'lr': 0.00044972663420483774, 'samples': 6221184, 'steps': 32401, 'loss/train': 1.176303505897522} -11/07/2021 01:49:00 - INFO - __main__ - Step 32403: {'lr': 0.00044972344239091206, 'samples': 6221376, 'steps': 32402, 'loss/train': 1.7836946249008179} -11/07/2021 01:49:01 - INFO - __main__ - Step 32404: {'lr': 0.0004497202504869941, 'samples': 6221568, 'steps': 32403, 'loss/train': 1.795836091041565} -11/07/2021 01:49:01 - INFO - __main__ - Step 32405: {'lr': 0.0004497170584930853, 'samples': 6221760, 'steps': 32404, 'loss/train': 2.021099090576172} -11/07/2021 01:49:02 - INFO - __main__ - Step 32406: {'lr': 0.0004497138664091871, 'samples': 6221952, 'steps': 32405, 'loss/train': 1.593692421913147} -11/07/2021 01:49:02 - INFO - __main__ - Step 32407: {'lr': 0.00044971067423530087, 'samples': 6222144, 'steps': 32406, 'loss/train': 1.3890024423599243} -11/07/2021 01:49:03 - INFO - __main__ - Step 32408: {'lr': 0.0004497074819714281, 'samples': 6222336, 'steps': 32407, 'loss/train': 1.8967686891555786} -11/07/2021 01:49:03 - INFO - __main__ - Step 32409: {'lr': 0.00044970428961757026, 'samples': 6222528, 'steps': 32408, 'loss/train': 1.5618425607681274} -11/07/2021 01:49:03 - INFO - __main__ - Step 32410: {'lr': 0.00044970109717372864, 'samples': 6222720, 'steps': 32409, 'loss/train': 1.4434159994125366} -11/07/2021 01:49:04 - INFO - __main__ - Step 32411: {'lr': 0.0004496979046399049, 'samples': 6222912, 'steps': 32410, 'loss/train': 0.6913343071937561} -11/07/2021 01:49:05 - INFO - __main__ - Step 32412: {'lr': 0.00044969471201610037, 'samples': 6223104, 'steps': 32411, 'loss/train': 1.7394918203353882} -11/07/2021 01:49:05 - INFO - __main__ - Step 32413: {'lr': 0.00044969151930231643, 'samples': 6223296, 'steps': 32412, 'loss/train': 1.5709692239761353} -11/07/2021 01:49:06 - INFO - __main__ - Step 32414: {'lr': 0.00044968832649855455, 'samples': 6223488, 'steps': 32413, 'loss/train': 1.6851338148117065} -11/07/2021 01:49:06 - INFO - __main__ - Step 32415: {'lr': 0.00044968513360481624, 'samples': 6223680, 'steps': 32414, 'loss/train': 1.2950356006622314} -11/07/2021 01:49:07 - INFO - __main__ - Step 32416: {'lr': 0.0004496819406211029, 'samples': 6223872, 'steps': 32415, 'loss/train': 1.3438385725021362} -11/07/2021 01:49:07 - INFO - __main__ - Step 32417: {'lr': 0.0004496787475474159, 'samples': 6224064, 'steps': 32416, 'loss/train': 1.436164140701294} -11/07/2021 01:49:08 - INFO - __main__ - Step 32418: {'lr': 0.00044967555438375675, 'samples': 6224256, 'steps': 32417, 'loss/train': 1.7283543348312378} -11/07/2021 01:49:08 - INFO - __main__ - Step 32419: {'lr': 0.0004496723611301269, 'samples': 6224448, 'steps': 32418, 'loss/train': 1.2320383787155151} -11/07/2021 01:49:08 - INFO - __main__ - Step 32420: {'lr': 0.00044966916778652776, 'samples': 6224640, 'steps': 32419, 'loss/train': 1.3301286697387695} -11/07/2021 01:49:09 - INFO - __main__ - Step 32421: {'lr': 0.0004496659743529608, 'samples': 6224832, 'steps': 32420, 'loss/train': 1.5266687870025635} -11/07/2021 01:49:10 - INFO - __main__ - Step 32422: {'lr': 0.00044966278082942746, 'samples': 6225024, 'steps': 32421, 'loss/train': 0.8708489537239075} -11/07/2021 01:49:10 - INFO - __main__ - Step 32423: {'lr': 0.000449659587215929, 'samples': 6225216, 'steps': 32422, 'loss/train': 1.3048748970031738} -11/07/2021 01:49:11 - INFO - __main__ - Step 32424: {'lr': 0.0004496563935124672, 'samples': 6225408, 'steps': 32423, 'loss/train': 0.9543754458427429} -11/07/2021 01:49:11 - INFO - __main__ - Step 32425: {'lr': 0.0004496531997190432, 'samples': 6225600, 'steps': 32424, 'loss/train': 1.8037725687026978} -11/07/2021 01:49:11 - INFO - __main__ - Step 32426: {'lr': 0.0004496500058356586, 'samples': 6225792, 'steps': 32425, 'loss/train': 0.3545287847518921} -11/07/2021 01:49:13 - INFO - __main__ - Step 32427: {'lr': 0.00044964681186231473, 'samples': 6225984, 'steps': 32426, 'loss/train': 0.7700253129005432} -11/07/2021 01:49:13 - INFO - __main__ - Step 32428: {'lr': 0.0004496436177990131, 'samples': 6226176, 'steps': 32427, 'loss/train': 1.4964241981506348} -11/07/2021 01:49:13 - INFO - __main__ - Step 32429: {'lr': 0.0004496404236457552, 'samples': 6226368, 'steps': 32428, 'loss/train': 1.5284323692321777} -11/07/2021 01:49:14 - INFO - __main__ - Step 32430: {'lr': 0.0004496372294025424, 'samples': 6226560, 'steps': 32429, 'loss/train': 0.7127718329429626} -11/07/2021 01:49:14 - INFO - __main__ - Step 32431: {'lr': 0.00044963403506937603, 'samples': 6226752, 'steps': 32430, 'loss/train': 2.3373682498931885} -11/07/2021 01:49:15 - INFO - __main__ - Step 32432: {'lr': 0.00044963084064625775, 'samples': 6226944, 'steps': 32431, 'loss/train': 1.677183747291565} -11/07/2021 01:49:15 - INFO - __main__ - Step 32433: {'lr': 0.00044962764613318886, 'samples': 6227136, 'steps': 32432, 'loss/train': 2.08242130279541} -11/07/2021 01:49:16 - INFO - __main__ - Step 32434: {'lr': 0.00044962445153017087, 'samples': 6227328, 'steps': 32433, 'loss/train': 1.7830533981323242} -11/07/2021 01:49:16 - INFO - __main__ - Step 32435: {'lr': 0.00044962125683720513, 'samples': 6227520, 'steps': 32434, 'loss/train': 1.3276549577713013} -11/07/2021 01:49:16 - INFO - __main__ - Step 32436: {'lr': 0.0004496180620542931, 'samples': 6227712, 'steps': 32435, 'loss/train': 1.2223323583602905} -11/07/2021 01:49:17 - INFO - __main__ - Step 32437: {'lr': 0.00044961486718143634, 'samples': 6227904, 'steps': 32436, 'loss/train': 1.3821481466293335} -11/07/2021 01:49:18 - INFO - __main__ - Step 32438: {'lr': 0.0004496116722186362, 'samples': 6228096, 'steps': 32437, 'loss/train': 1.492997169494629} -11/07/2021 01:49:18 - INFO - __main__ - Step 32439: {'lr': 0.00044960847716589403, 'samples': 6228288, 'steps': 32438, 'loss/train': 1.5349807739257812} -11/07/2021 01:49:18 - INFO - __main__ - Step 32440: {'lr': 0.00044960528202321143, 'samples': 6228480, 'steps': 32439, 'loss/train': 1.3973376750946045} -11/07/2021 01:49:19 - INFO - __main__ - Step 32441: {'lr': 0.0004496020867905898, 'samples': 6228672, 'steps': 32440, 'loss/train': 1.4841481447219849} -11/07/2021 01:49:19 - INFO - __main__ - Step 32442: {'lr': 0.00044959889146803047, 'samples': 6228864, 'steps': 32441, 'loss/train': 1.9865716695785522} -11/07/2021 01:49:20 - INFO - __main__ - Step 32443: {'lr': 0.00044959569605553494, 'samples': 6229056, 'steps': 32442, 'loss/train': 1.5784991979599} -11/07/2021 01:49:21 - INFO - __main__ - Step 32444: {'lr': 0.00044959250055310473, 'samples': 6229248, 'steps': 32443, 'loss/train': 0.6850621700286865} -11/07/2021 01:49:21 - INFO - __main__ - Step 32445: {'lr': 0.00044958930496074125, 'samples': 6229440, 'steps': 32444, 'loss/train': 0.20532159507274628} -11/07/2021 01:49:21 - INFO - __main__ - Step 32446: {'lr': 0.0004495861092784459, 'samples': 6229632, 'steps': 32445, 'loss/train': 1.6461862325668335} -11/07/2021 01:49:22 - INFO - __main__ - Step 32447: {'lr': 0.00044958291350622007, 'samples': 6229824, 'steps': 32446, 'loss/train': 1.5703867673873901} -11/07/2021 01:49:23 - INFO - __main__ - Step 32448: {'lr': 0.0004495797176440653, 'samples': 6230016, 'steps': 32447, 'loss/train': 1.3373690843582153} -11/07/2021 01:49:23 - INFO - __main__ - Step 32449: {'lr': 0.000449576521691983, 'samples': 6230208, 'steps': 32448, 'loss/train': 1.449952244758606} -11/07/2021 01:49:23 - INFO - __main__ - Step 32450: {'lr': 0.00044957332564997453, 'samples': 6230400, 'steps': 32449, 'loss/train': 1.6825079917907715} -11/07/2021 01:49:24 - INFO - __main__ - Step 32451: {'lr': 0.0004495701295180414, 'samples': 6230592, 'steps': 32450, 'loss/train': 1.9212239980697632} -11/07/2021 01:49:24 - INFO - __main__ - Step 32452: {'lr': 0.0004495669332961852, 'samples': 6230784, 'steps': 32451, 'loss/train': 1.3632677793502808} -11/07/2021 01:49:25 - INFO - __main__ - Step 32453: {'lr': 0.0004495637369844071, 'samples': 6230976, 'steps': 32452, 'loss/train': 1.0895562171936035} -11/07/2021 01:49:25 - INFO - __main__ - Step 32454: {'lr': 0.0004495605405827087, 'samples': 6231168, 'steps': 32453, 'loss/train': 1.1377387046813965} -11/07/2021 01:49:26 - INFO - __main__ - Step 32455: {'lr': 0.00044955734409109135, 'samples': 6231360, 'steps': 32454, 'loss/train': 1.732886791229248} -11/07/2021 01:49:26 - INFO - __main__ - Step 32456: {'lr': 0.0004495541475095566, 'samples': 6231552, 'steps': 32455, 'loss/train': 1.8484389781951904} -11/07/2021 01:49:26 - INFO - __main__ - Step 32457: {'lr': 0.0004495509508381058, 'samples': 6231744, 'steps': 32456, 'loss/train': 1.1795073747634888} -11/07/2021 01:49:27 - INFO - __main__ - Step 32458: {'lr': 0.00044954775407674035, 'samples': 6231936, 'steps': 32457, 'loss/train': 1.8034723997116089} -11/07/2021 01:49:28 - INFO - __main__ - Step 32459: {'lr': 0.00044954455722546186, 'samples': 6232128, 'steps': 32458, 'loss/train': 1.6304291486740112} -11/07/2021 01:49:28 - INFO - __main__ - Step 32460: {'lr': 0.0004495413602842716, 'samples': 6232320, 'steps': 32459, 'loss/train': 1.134009838104248} -11/07/2021 01:49:28 - INFO - __main__ - Step 32461: {'lr': 0.00044953816325317116, 'samples': 6232512, 'steps': 32460, 'loss/train': 1.4539257287979126} -11/07/2021 01:49:29 - INFO - __main__ - Step 32462: {'lr': 0.0004495349661321618, 'samples': 6232704, 'steps': 32461, 'loss/train': 1.4682179689407349} -11/07/2021 01:49:30 - INFO - __main__ - Step 32463: {'lr': 0.0004495317689212452, 'samples': 6232896, 'steps': 32462, 'loss/train': 1.2072484493255615} -11/07/2021 01:49:30 - INFO - __main__ - Step 32464: {'lr': 0.0004495285716204226, 'samples': 6233088, 'steps': 32463, 'loss/train': 1.7558974027633667} -11/07/2021 01:49:30 - INFO - __main__ - Step 32465: {'lr': 0.00044952537422969545, 'samples': 6233280, 'steps': 32464, 'loss/train': 1.4803388118743896} -11/07/2021 01:49:31 - INFO - __main__ - Step 32466: {'lr': 0.0004495221767490653, 'samples': 6233472, 'steps': 32465, 'loss/train': 1.3486028909683228} -11/07/2021 01:49:31 - INFO - __main__ - Step 32467: {'lr': 0.00044951897917853355, 'samples': 6233664, 'steps': 32466, 'loss/train': 1.2698243856430054} -11/07/2021 01:49:31 - INFO - __main__ - Step 32468: {'lr': 0.0004495157815181016, 'samples': 6233856, 'steps': 32467, 'loss/train': 1.788853645324707} -11/07/2021 01:49:33 - INFO - __main__ - Step 32469: {'lr': 0.00044951258376777094, 'samples': 6234048, 'steps': 32468, 'loss/train': 0.866815447807312} -11/07/2021 01:49:33 - INFO - __main__ - Step 32470: {'lr': 0.00044950938592754297, 'samples': 6234240, 'steps': 32469, 'loss/train': 1.0849798917770386} -11/07/2021 01:49:33 - INFO - __main__ - Step 32471: {'lr': 0.00044950618799741913, 'samples': 6234432, 'steps': 32470, 'loss/train': 1.2643122673034668} -11/07/2021 01:49:34 - INFO - __main__ - Step 32472: {'lr': 0.0004495029899774009, 'samples': 6234624, 'steps': 32471, 'loss/train': 1.5671745538711548} -11/07/2021 01:49:34 - INFO - __main__ - Step 32473: {'lr': 0.00044949979186748967, 'samples': 6234816, 'steps': 32472, 'loss/train': 1.7395416498184204} -11/07/2021 01:49:35 - INFO - __main__ - Step 32474: {'lr': 0.00044949659366768697, 'samples': 6235008, 'steps': 32473, 'loss/train': 1.6390635967254639} -11/07/2021 01:49:36 - INFO - __main__ - Step 32475: {'lr': 0.00044949339537799415, 'samples': 6235200, 'steps': 32474, 'loss/train': 1.600160002708435} -11/07/2021 01:49:36 - INFO - __main__ - Step 32476: {'lr': 0.0004494901969984127, 'samples': 6235392, 'steps': 32475, 'loss/train': 1.9038304090499878} -11/07/2021 01:49:36 - INFO - __main__ - Step 32477: {'lr': 0.000449486998528944, 'samples': 6235584, 'steps': 32476, 'loss/train': 1.197152853012085} -11/07/2021 01:49:37 - INFO - __main__ - Step 32478: {'lr': 0.00044948379996958963, 'samples': 6235776, 'steps': 32477, 'loss/train': 1.706484317779541} -11/07/2021 01:49:38 - INFO - __main__ - Step 32479: {'lr': 0.00044948060132035087, 'samples': 6235968, 'steps': 32478, 'loss/train': 1.5682185888290405} -11/07/2021 01:49:38 - INFO - __main__ - Step 32480: {'lr': 0.00044947740258122925, 'samples': 6236160, 'steps': 32479, 'loss/train': 1.4988538026809692} -11/07/2021 01:49:38 - INFO - __main__ - Step 32481: {'lr': 0.00044947420375222614, 'samples': 6236352, 'steps': 32480, 'loss/train': 1.2382683753967285} -11/07/2021 01:49:39 - INFO - __main__ - Step 32482: {'lr': 0.00044947100483334315, 'samples': 6236544, 'steps': 32481, 'loss/train': 1.956660509109497} -11/07/2021 01:49:39 - INFO - __main__ - Step 32483: {'lr': 0.0004494678058245815, 'samples': 6236736, 'steps': 32482, 'loss/train': 1.8256279230117798} -11/07/2021 01:49:40 - INFO - __main__ - Step 32484: {'lr': 0.00044946460672594277, 'samples': 6236928, 'steps': 32483, 'loss/train': 1.758445143699646} -11/07/2021 01:49:41 - INFO - __main__ - Step 32485: {'lr': 0.0004494614075374283, 'samples': 6237120, 'steps': 32484, 'loss/train': 1.2483205795288086} -11/07/2021 01:49:41 - INFO - __main__ - Step 32486: {'lr': 0.0004494582082590397, 'samples': 6237312, 'steps': 32485, 'loss/train': 1.7636712789535522} -11/07/2021 01:49:41 - INFO - __main__ - Step 32487: {'lr': 0.0004494550088907783, 'samples': 6237504, 'steps': 32486, 'loss/train': 1.5964031219482422} -11/07/2021 01:49:42 - INFO - __main__ - Step 32488: {'lr': 0.00044945180943264544, 'samples': 6237696, 'steps': 32487, 'loss/train': 1.6114511489868164} -11/07/2021 01:49:43 - INFO - __main__ - Step 32489: {'lr': 0.00044944860988464276, 'samples': 6237888, 'steps': 32488, 'loss/train': 1.499119520187378} -11/07/2021 01:49:43 - INFO - __main__ - Step 32490: {'lr': 0.0004494454102467716, 'samples': 6238080, 'steps': 32489, 'loss/train': 1.1793768405914307} -11/07/2021 01:49:43 - INFO - __main__ - Step 32491: {'lr': 0.00044944221051903345, 'samples': 6238272, 'steps': 32490, 'loss/train': 1.6606731414794922} -11/07/2021 01:49:44 - INFO - __main__ - Step 32492: {'lr': 0.0004494390107014297, 'samples': 6238464, 'steps': 32491, 'loss/train': 1.3472111225128174} -11/07/2021 01:49:44 - INFO - __main__ - Step 32493: {'lr': 0.0004494358107939618, 'samples': 6238656, 'steps': 32492, 'loss/train': 1.0546207427978516} -11/07/2021 01:49:44 - INFO - __main__ - Step 32494: {'lr': 0.0004494326107966311, 'samples': 6238848, 'steps': 32493, 'loss/train': 1.3394577503204346} -11/07/2021 01:49:46 - INFO - __main__ - Step 32495: {'lr': 0.0004494294107094393, 'samples': 6239040, 'steps': 32494, 'loss/train': 1.860493779182434} -11/07/2021 01:49:46 - INFO - __main__ - Step 32496: {'lr': 0.00044942621053238764, 'samples': 6239232, 'steps': 32495, 'loss/train': 1.495239019393921} -11/07/2021 01:49:46 - INFO - __main__ - Step 32497: {'lr': 0.00044942301026547755, 'samples': 6239424, 'steps': 32496, 'loss/train': 1.4385201930999756} -11/07/2021 01:49:47 - INFO - __main__ - Step 32498: {'lr': 0.0004494198099087106, 'samples': 6239616, 'steps': 32497, 'loss/train': 1.2754056453704834} -11/07/2021 01:49:47 - INFO - __main__ - Step 32499: {'lr': 0.00044941660946208806, 'samples': 6239808, 'steps': 32498, 'loss/train': 0.22919543087482452} -11/07/2021 01:49:48 - INFO - __main__ - Step 32500: {'lr': 0.00044941340892561154, 'samples': 6240000, 'steps': 32499, 'loss/train': 1.4570839405059814} -11/07/2021 01:49:48 - INFO - __main__ - Step 32501: {'lr': 0.00044941020829928247, 'samples': 6240192, 'steps': 32500, 'loss/train': 1.5001204013824463} -11/07/2021 01:49:49 - INFO - __main__ - Step 32502: {'lr': 0.00044940700758310214, 'samples': 6240384, 'steps': 32501, 'loss/train': 1.2210010290145874} -11/07/2021 01:49:49 - INFO - __main__ - Step 32503: {'lr': 0.00044940380677707214, 'samples': 6240576, 'steps': 32502, 'loss/train': 0.6593044400215149} -11/07/2021 01:49:49 - INFO - __main__ - Step 32504: {'lr': 0.00044940060588119393, 'samples': 6240768, 'steps': 32503, 'loss/train': 1.254817008972168} -11/07/2021 01:49:50 - INFO - __main__ - Step 32505: {'lr': 0.00044939740489546875, 'samples': 6240960, 'steps': 32504, 'loss/train': 1.3713253736495972} -11/07/2021 01:49:51 - INFO - __main__ - Step 32506: {'lr': 0.0004493942038198983, 'samples': 6241152, 'steps': 32505, 'loss/train': 1.299810528755188} -11/07/2021 01:49:51 - INFO - __main__ - Step 32507: {'lr': 0.0004493910026544838, 'samples': 6241344, 'steps': 32506, 'loss/train': 1.505722999572754} -11/07/2021 01:49:51 - INFO - __main__ - Step 32508: {'lr': 0.0004493878013992268, 'samples': 6241536, 'steps': 32507, 'loss/train': 1.458335518836975} -11/07/2021 01:49:52 - INFO - __main__ - Step 32509: {'lr': 0.0004493846000541287, 'samples': 6241728, 'steps': 32508, 'loss/train': 1.7668204307556152} -11/07/2021 01:49:53 - INFO - __main__ - Step 32510: {'lr': 0.00044938139861919115, 'samples': 6241920, 'steps': 32509, 'loss/train': 1.238909363746643} -11/07/2021 01:49:53 - INFO - __main__ - Step 32511: {'lr': 0.00044937819709441523, 'samples': 6242112, 'steps': 32510, 'loss/train': 1.5238277912139893} -11/07/2021 01:49:53 - INFO - __main__ - Step 32512: {'lr': 0.00044937499547980265, 'samples': 6242304, 'steps': 32511, 'loss/train': 1.2921862602233887} -11/07/2021 01:49:54 - INFO - __main__ - Step 32513: {'lr': 0.00044937179377535475, 'samples': 6242496, 'steps': 32512, 'loss/train': 1.3551661968231201} -11/07/2021 01:49:54 - INFO - __main__ - Step 32514: {'lr': 0.00044936859198107306, 'samples': 6242688, 'steps': 32513, 'loss/train': 1.663925051689148} -11/07/2021 01:49:55 - INFO - __main__ - Step 32515: {'lr': 0.0004493653900969589, 'samples': 6242880, 'steps': 32514, 'loss/train': 1.4537755250930786} -11/07/2021 01:49:55 - INFO - __main__ - Step 32516: {'lr': 0.0004493621881230138, 'samples': 6243072, 'steps': 32515, 'loss/train': 1.0435876846313477} -11/07/2021 01:49:56 - INFO - __main__ - Step 32517: {'lr': 0.00044935898605923916, 'samples': 6243264, 'steps': 32516, 'loss/train': 1.5774314403533936} -11/07/2021 01:49:56 - INFO - __main__ - Step 32518: {'lr': 0.0004493557839056364, 'samples': 6243456, 'steps': 32517, 'loss/train': 1.5218448638916016} -11/07/2021 01:49:56 - INFO - __main__ - Step 32519: {'lr': 0.00044935258166220704, 'samples': 6243648, 'steps': 32518, 'loss/train': 1.6474796533584595} -11/07/2021 01:49:58 - INFO - __main__ - Step 32520: {'lr': 0.00044934937932895246, 'samples': 6243840, 'steps': 32519, 'loss/train': 1.3461508750915527} -11/07/2021 01:49:58 - INFO - __main__ - Step 32521: {'lr': 0.0004493461769058742, 'samples': 6244032, 'steps': 32520, 'loss/train': 1.253962516784668} -11/07/2021 01:49:59 - INFO - __main__ - Step 32522: {'lr': 0.00044934297439297357, 'samples': 6244224, 'steps': 32521, 'loss/train': 0.16634128987789154} -11/07/2021 01:49:59 - INFO - __main__ - Step 32523: {'lr': 0.0004493397717902521, 'samples': 6244416, 'steps': 32522, 'loss/train': 1.3674840927124023} -11/07/2021 01:49:59 - INFO - __main__ - Step 32524: {'lr': 0.00044933656909771117, 'samples': 6244608, 'steps': 32523, 'loss/train': 1.438563585281372} -11/07/2021 01:50:00 - INFO - __main__ - Step 32525: {'lr': 0.00044933336631535224, 'samples': 6244800, 'steps': 32524, 'loss/train': 1.3042861223220825} -11/07/2021 01:50:01 - INFO - __main__ - Step 32526: {'lr': 0.0004493301634431768, 'samples': 6244992, 'steps': 32525, 'loss/train': 1.6236354112625122} -11/07/2021 01:50:01 - INFO - __main__ - Step 32527: {'lr': 0.0004493269604811863, 'samples': 6245184, 'steps': 32526, 'loss/train': 1.4350732564926147} -11/07/2021 01:50:01 - INFO - __main__ - Step 32528: {'lr': 0.000449323757429382, 'samples': 6245376, 'steps': 32527, 'loss/train': 1.4659003019332886} -11/07/2021 01:50:02 - INFO - __main__ - Step 32529: {'lr': 0.00044932055428776566, 'samples': 6245568, 'steps': 32528, 'loss/train': 1.1015076637268066} -11/07/2021 01:50:02 - INFO - __main__ - Step 32530: {'lr': 0.00044931735105633853, 'samples': 6245760, 'steps': 32529, 'loss/train': 1.3505935668945312} -11/07/2021 01:50:03 - INFO - __main__ - Step 32531: {'lr': 0.00044931414773510207, 'samples': 6245952, 'steps': 32530, 'loss/train': 1.467262864112854} -11/07/2021 01:50:04 - INFO - __main__ - Step 32532: {'lr': 0.00044931094432405766, 'samples': 6246144, 'steps': 32531, 'loss/train': 1.387347936630249} -11/07/2021 01:50:04 - INFO - __main__ - Step 32533: {'lr': 0.00044930774082320684, 'samples': 6246336, 'steps': 32532, 'loss/train': 1.7457025051116943} -11/07/2021 01:50:04 - INFO - __main__ - Step 32534: {'lr': 0.00044930453723255107, 'samples': 6246528, 'steps': 32533, 'loss/train': 1.3946459293365479} -11/07/2021 01:50:05 - INFO - __main__ - Step 32535: {'lr': 0.0004493013335520917, 'samples': 6246720, 'steps': 32534, 'loss/train': 1.4471338987350464} -11/07/2021 01:50:06 - INFO - __main__ - Step 32536: {'lr': 0.00044929812978183024, 'samples': 6246912, 'steps': 32535, 'loss/train': 1.768898606300354} -11/07/2021 01:50:06 - INFO - __main__ - Step 32537: {'lr': 0.0004492949259217681, 'samples': 6247104, 'steps': 32536, 'loss/train': 1.1240431070327759} -11/07/2021 01:50:06 - INFO - __main__ - Step 32538: {'lr': 0.00044929172197190684, 'samples': 6247296, 'steps': 32537, 'loss/train': 1.7329168319702148} -11/07/2021 01:50:07 - INFO - __main__ - Step 32539: {'lr': 0.00044928851793224765, 'samples': 6247488, 'steps': 32538, 'loss/train': 1.605699896812439} -11/07/2021 01:50:07 - INFO - __main__ - Step 32540: {'lr': 0.00044928531380279224, 'samples': 6247680, 'steps': 32539, 'loss/train': 1.6163506507873535} -11/07/2021 01:50:09 - INFO - __main__ - Step 32541: {'lr': 0.00044928210958354196, 'samples': 6247872, 'steps': 32540, 'loss/train': 1.6673510074615479} -11/07/2021 01:50:09 - INFO - __main__ - Step 32542: {'lr': 0.0004492789052744982, 'samples': 6248064, 'steps': 32541, 'loss/train': 1.6779664754867554} -11/07/2021 01:50:10 - INFO - __main__ - Step 32543: {'lr': 0.0004492757008756624, 'samples': 6248256, 'steps': 32542, 'loss/train': 1.5406057834625244} -11/07/2021 01:50:10 - INFO - __main__ - Step 32544: {'lr': 0.0004492724963870361, 'samples': 6248448, 'steps': 32543, 'loss/train': 1.3281011581420898} -11/07/2021 01:50:10 - INFO - __main__ - Step 32545: {'lr': 0.00044926929180862064, 'samples': 6248640, 'steps': 32544, 'loss/train': 1.0876872539520264} -11/07/2021 01:50:11 - INFO - __main__ - Step 32546: {'lr': 0.00044926608714041763, 'samples': 6248832, 'steps': 32545, 'loss/train': 1.8412197828292847} -11/07/2021 01:50:11 - INFO - __main__ - Step 32547: {'lr': 0.0004492628823824282, 'samples': 6249024, 'steps': 32546, 'loss/train': 1.2169973850250244} -11/07/2021 01:50:12 - INFO - __main__ - Step 32548: {'lr': 0.0004492596775346541, 'samples': 6249216, 'steps': 32547, 'loss/train': 1.6807281970977783} -11/07/2021 01:50:13 - INFO - __main__ - Step 32549: {'lr': 0.0004492564725970967, 'samples': 6249408, 'steps': 32548, 'loss/train': 1.6871615648269653} -11/07/2021 01:50:13 - INFO - __main__ - Step 32550: {'lr': 0.00044925326756975736, 'samples': 6249600, 'steps': 32549, 'loss/train': 1.5211896896362305} -11/07/2021 01:50:13 - INFO - __main__ - Step 32551: {'lr': 0.00044925006245263757, 'samples': 6249792, 'steps': 32550, 'loss/train': 1.6064367294311523} -11/07/2021 01:50:14 - INFO - __main__ - Step 32552: {'lr': 0.0004492468572457388, 'samples': 6249984, 'steps': 32551, 'loss/train': 1.7926182746887207} -11/07/2021 01:50:14 - INFO - __main__ - Step 32553: {'lr': 0.0004492436519490625, 'samples': 6250176, 'steps': 32552, 'loss/train': 1.2677383422851562} -11/07/2021 01:50:15 - INFO - __main__ - Step 32554: {'lr': 0.00044924044656260997, 'samples': 6250368, 'steps': 32553, 'loss/train': 1.7775638103485107} -11/07/2021 01:50:15 - INFO - __main__ - Step 32555: {'lr': 0.00044923724108638285, 'samples': 6250560, 'steps': 32554, 'loss/train': 1.6647224426269531} -11/07/2021 01:50:16 - INFO - __main__ - Step 32556: {'lr': 0.00044923403552038255, 'samples': 6250752, 'steps': 32555, 'loss/train': 1.6538268327713013} -11/07/2021 01:50:16 - INFO - __main__ - Step 32557: {'lr': 0.0004492308298646104, 'samples': 6250944, 'steps': 32556, 'loss/train': 0.9958004355430603} -11/07/2021 01:50:16 - INFO - __main__ - Step 32558: {'lr': 0.0004492276241190679, 'samples': 6251136, 'steps': 32557, 'loss/train': 1.4049321413040161} -11/07/2021 01:50:17 - INFO - __main__ - Step 32559: {'lr': 0.0004492244182837565, 'samples': 6251328, 'steps': 32558, 'loss/train': 1.5362626314163208} -11/07/2021 01:50:18 - INFO - __main__ - Step 32560: {'lr': 0.00044922121235867776, 'samples': 6251520, 'steps': 32559, 'loss/train': 1.790116548538208} -11/07/2021 01:50:18 - INFO - __main__ - Step 32561: {'lr': 0.00044921800634383294, 'samples': 6251712, 'steps': 32560, 'loss/train': 2.2426087856292725} -11/07/2021 01:50:18 - INFO - __main__ - Step 32562: {'lr': 0.0004492148002392235, 'samples': 6251904, 'steps': 32561, 'loss/train': 1.8030542135238647} -11/07/2021 01:50:19 - INFO - __main__ - Step 32563: {'lr': 0.000449211594044851, 'samples': 6252096, 'steps': 32562, 'loss/train': 1.7514045238494873} -11/07/2021 01:50:20 - INFO - __main__ - Step 32564: {'lr': 0.0004492083877607168, 'samples': 6252288, 'steps': 32563, 'loss/train': 0.4884999394416809} -11/07/2021 01:50:20 - INFO - __main__ - Step 32565: {'lr': 0.00044920518138682244, 'samples': 6252480, 'steps': 32564, 'loss/train': 1.502118468284607} -11/07/2021 01:50:21 - INFO - __main__ - Step 32566: {'lr': 0.00044920197492316925, 'samples': 6252672, 'steps': 32565, 'loss/train': 1.3578180074691772} -11/07/2021 01:50:21 - INFO - __main__ - Step 32567: {'lr': 0.00044919876836975876, 'samples': 6252864, 'steps': 32566, 'loss/train': 1.298283338546753} -11/07/2021 01:50:21 - INFO - __main__ - Step 32568: {'lr': 0.0004491955617265924, 'samples': 6253056, 'steps': 32567, 'loss/train': 1.2520887851715088} -11/07/2021 01:50:22 - INFO - __main__ - Step 32569: {'lr': 0.0004491923549936715, 'samples': 6253248, 'steps': 32568, 'loss/train': 2.1562204360961914} -11/07/2021 01:50:23 - INFO - __main__ - Step 32570: {'lr': 0.0004491891481709977, 'samples': 6253440, 'steps': 32569, 'loss/train': 0.5885365605354309} -11/07/2021 01:50:23 - INFO - __main__ - Step 32571: {'lr': 0.0004491859412585723, 'samples': 6253632, 'steps': 32570, 'loss/train': 1.0534669160842896} -11/07/2021 01:50:23 - INFO - __main__ - Step 32572: {'lr': 0.0004491827342563968, 'samples': 6253824, 'steps': 32571, 'loss/train': 1.350450038909912} -11/07/2021 01:50:24 - INFO - __main__ - Step 32573: {'lr': 0.0004491795271644726, 'samples': 6254016, 'steps': 32572, 'loss/train': 1.6586860418319702} -11/07/2021 01:50:25 - INFO - __main__ - Step 32574: {'lr': 0.0004491763199828012, 'samples': 6254208, 'steps': 32573, 'loss/train': 1.730752944946289} -11/07/2021 01:50:25 - INFO - __main__ - Step 32575: {'lr': 0.00044917311271138393, 'samples': 6254400, 'steps': 32574, 'loss/train': 2.4597697257995605} -11/07/2021 01:50:25 - INFO - __main__ - Step 32576: {'lr': 0.00044916990535022244, 'samples': 6254592, 'steps': 32575, 'loss/train': 1.6362158060073853} -11/07/2021 01:50:26 - INFO - __main__ - Step 32577: {'lr': 0.00044916669789931806, 'samples': 6254784, 'steps': 32576, 'loss/train': 1.377771258354187} -11/07/2021 01:50:26 - INFO - __main__ - Step 32578: {'lr': 0.0004491634903586722, 'samples': 6254976, 'steps': 32577, 'loss/train': 2.027752637863159} -11/07/2021 01:50:27 - INFO - __main__ - Step 32579: {'lr': 0.00044916028272828636, 'samples': 6255168, 'steps': 32578, 'loss/train': 1.014981985092163} -11/07/2021 01:50:28 - INFO - __main__ - Step 32580: {'lr': 0.00044915707500816206, 'samples': 6255360, 'steps': 32579, 'loss/train': 1.317042589187622} -11/07/2021 01:50:28 - INFO - __main__ - Step 32581: {'lr': 0.0004491538671983005, 'samples': 6255552, 'steps': 32580, 'loss/train': 1.6304385662078857} -11/07/2021 01:50:28 - INFO - __main__ - Step 32582: {'lr': 0.00044915065929870335, 'samples': 6255744, 'steps': 32581, 'loss/train': 1.2867671251296997} -11/07/2021 01:50:29 - INFO - __main__ - Step 32583: {'lr': 0.00044914745130937204, 'samples': 6255936, 'steps': 32582, 'loss/train': 1.5918105840682983} -11/07/2021 01:50:29 - INFO - __main__ - Step 32584: {'lr': 0.0004491442432303079, 'samples': 6256128, 'steps': 32583, 'loss/train': 1.6612629890441895} -11/07/2021 01:50:30 - INFO - __main__ - Step 32585: {'lr': 0.0004491410350615124, 'samples': 6256320, 'steps': 32584, 'loss/train': 1.5205086469650269} -11/07/2021 01:50:30 - INFO - __main__ - Step 32586: {'lr': 0.0004491378268029871, 'samples': 6256512, 'steps': 32585, 'loss/train': 1.4549225568771362} -11/07/2021 01:50:31 - INFO - __main__ - Step 32587: {'lr': 0.00044913461845473335, 'samples': 6256704, 'steps': 32586, 'loss/train': 1.4229557514190674} -11/07/2021 01:50:31 - INFO - __main__ - Step 32588: {'lr': 0.0004491314100167526, 'samples': 6256896, 'steps': 32587, 'loss/train': 1.5734999179840088} -11/07/2021 01:50:32 - INFO - __main__ - Step 32589: {'lr': 0.00044912820148904634, 'samples': 6257088, 'steps': 32588, 'loss/train': 1.9351128339767456} -11/07/2021 01:50:33 - INFO - __main__ - Step 32590: {'lr': 0.0004491249928716159, 'samples': 6257280, 'steps': 32589, 'loss/train': 1.3977437019348145} -11/07/2021 01:50:33 - INFO - __main__ - Step 32591: {'lr': 0.0004491217841644629, 'samples': 6257472, 'steps': 32590, 'loss/train': 1.452478051185608} -11/07/2021 01:50:33 - INFO - __main__ - Step 32592: {'lr': 0.0004491185753675886, 'samples': 6257664, 'steps': 32591, 'loss/train': 1.539903163909912} -11/07/2021 01:50:34 - INFO - __main__ - Step 32593: {'lr': 0.0004491153664809947, 'samples': 6257856, 'steps': 32592, 'loss/train': 2.1112542152404785} -11/07/2021 01:50:34 - INFO - __main__ - Step 32594: {'lr': 0.00044911215750468236, 'samples': 6258048, 'steps': 32593, 'loss/train': 0.5317099094390869} -11/07/2021 01:50:35 - INFO - __main__ - Step 32595: {'lr': 0.0004491089484386531, 'samples': 6258240, 'steps': 32594, 'loss/train': 1.503760814666748} -11/07/2021 01:50:36 - INFO - __main__ - Step 32596: {'lr': 0.0004491057392829086, 'samples': 6258432, 'steps': 32595, 'loss/train': 1.5326488018035889} -11/07/2021 01:50:36 - INFO - __main__ - Step 32597: {'lr': 0.00044910253003745007, 'samples': 6258624, 'steps': 32596, 'loss/train': 1.3503015041351318} -11/07/2021 01:50:36 - INFO - __main__ - Step 32598: {'lr': 0.00044909932070227887, 'samples': 6258816, 'steps': 32597, 'loss/train': 2.20670485496521} -11/07/2021 01:50:37 - INFO - __main__ - Step 32599: {'lr': 0.00044909611127739676, 'samples': 6259008, 'steps': 32598, 'loss/train': 1.7348023653030396} -11/07/2021 01:50:38 - INFO - __main__ - Step 32600: {'lr': 0.00044909290176280495, 'samples': 6259200, 'steps': 32599, 'loss/train': 0.8739935159683228} -11/07/2021 01:50:38 - INFO - __main__ - Step 32601: {'lr': 0.00044908969215850495, 'samples': 6259392, 'steps': 32600, 'loss/train': 1.4008625745773315} -11/07/2021 01:50:38 - INFO - __main__ - Step 32602: {'lr': 0.0004490864824644982, 'samples': 6259584, 'steps': 32601, 'loss/train': 1.0510605573654175} -11/07/2021 01:50:39 - INFO - __main__ - Step 32603: {'lr': 0.0004490832726807862, 'samples': 6259776, 'steps': 32602, 'loss/train': 1.8836473226547241} -11/07/2021 01:50:39 - INFO - __main__ - Step 32604: {'lr': 0.0004490800628073703, 'samples': 6259968, 'steps': 32603, 'loss/train': 0.8565096855163574} -11/07/2021 01:50:40 - INFO - __main__ - Step 32605: {'lr': 0.000449076852844252, 'samples': 6260160, 'steps': 32604, 'loss/train': 1.799138069152832} -11/07/2021 01:50:41 - INFO - __main__ - Step 32606: {'lr': 0.0004490736427914327, 'samples': 6260352, 'steps': 32605, 'loss/train': 1.4113820791244507} -11/07/2021 01:50:41 - INFO - __main__ - Step 32607: {'lr': 0.000449070432648914, 'samples': 6260544, 'steps': 32606, 'loss/train': 2.0013928413391113} -11/07/2021 01:50:41 - INFO - __main__ - Step 32608: {'lr': 0.0004490672224166972, 'samples': 6260736, 'steps': 32607, 'loss/train': 1.7255065441131592} -11/07/2021 01:50:42 - INFO - __main__ - Step 32609: {'lr': 0.00044906401209478367, 'samples': 6260928, 'steps': 32608, 'loss/train': 1.8993556499481201} -11/07/2021 01:50:43 - INFO - __main__ - Step 32610: {'lr': 0.00044906080168317507, 'samples': 6261120, 'steps': 32609, 'loss/train': 1.6636123657226562} -11/07/2021 01:50:43 - INFO - __main__ - Step 32611: {'lr': 0.0004490575911818727, 'samples': 6261312, 'steps': 32610, 'loss/train': 1.6317161321640015} -11/07/2021 01:50:43 - INFO - __main__ - Step 32612: {'lr': 0.0004490543805908781, 'samples': 6261504, 'steps': 32611, 'loss/train': 1.4363155364990234} -11/07/2021 01:50:44 - INFO - __main__ - Step 32613: {'lr': 0.00044905116991019264, 'samples': 6261696, 'steps': 32612, 'loss/train': 1.5295449495315552} -11/07/2021 01:50:44 - INFO - __main__ - Step 32614: {'lr': 0.00044904795913981775, 'samples': 6261888, 'steps': 32613, 'loss/train': 1.0661262273788452} -11/07/2021 01:50:45 - INFO - __main__ - Step 32615: {'lr': 0.00044904474827975506, 'samples': 6262080, 'steps': 32614, 'loss/train': 1.8657482862472534} -11/07/2021 01:50:45 - INFO - __main__ - Step 32616: {'lr': 0.00044904153733000575, 'samples': 6262272, 'steps': 32615, 'loss/train': 2.3484842777252197} -11/07/2021 01:50:46 - INFO - __main__ - Step 32617: {'lr': 0.0004490383262905714, 'samples': 6262464, 'steps': 32616, 'loss/train': 1.5342575311660767} -11/07/2021 01:50:46 - INFO - __main__ - Step 32618: {'lr': 0.00044903511516145353, 'samples': 6262656, 'steps': 32617, 'loss/train': 1.6417678594589233} -11/07/2021 01:50:47 - INFO - __main__ - Step 32619: {'lr': 0.0004490319039426535, 'samples': 6262848, 'steps': 32618, 'loss/train': 1.7578563690185547} -11/07/2021 01:50:47 - INFO - __main__ - Step 32620: {'lr': 0.0004490286926341727, 'samples': 6263040, 'steps': 32619, 'loss/train': 1.2401134967803955} -11/07/2021 01:50:48 - INFO - __main__ - Step 32621: {'lr': 0.0004490254812360126, 'samples': 6263232, 'steps': 32620, 'loss/train': 1.5842281579971313} -11/07/2021 01:50:48 - INFO - __main__ - Step 32622: {'lr': 0.0004490222697481748, 'samples': 6263424, 'steps': 32621, 'loss/train': 1.4485617876052856} -11/07/2021 01:50:49 - INFO - __main__ - Step 32623: {'lr': 0.00044901905817066055, 'samples': 6263616, 'steps': 32622, 'loss/train': 1.4813716411590576} -11/07/2021 01:50:49 - INFO - __main__ - Step 32624: {'lr': 0.00044901584650347147, 'samples': 6263808, 'steps': 32623, 'loss/train': 1.515797734260559} -11/07/2021 01:50:49 - INFO - __main__ - Step 32625: {'lr': 0.00044901263474660894, 'samples': 6264000, 'steps': 32624, 'loss/train': 1.7303627729415894} -11/07/2021 01:50:50 - INFO - __main__ - Step 32626: {'lr': 0.0004490094229000743, 'samples': 6264192, 'steps': 32625, 'loss/train': 1.6219604015350342} -11/07/2021 01:50:51 - INFO - __main__ - Step 32627: {'lr': 0.00044900621096386904, 'samples': 6264384, 'steps': 32626, 'loss/train': 1.5284425020217896} -11/07/2021 01:50:51 - INFO - __main__ - Step 32628: {'lr': 0.00044900299893799476, 'samples': 6264576, 'steps': 32627, 'loss/train': 2.063946008682251} -11/07/2021 01:50:51 - INFO - __main__ - Step 32629: {'lr': 0.0004489997868224528, 'samples': 6264768, 'steps': 32628, 'loss/train': 1.539214015007019} -11/07/2021 01:50:52 - INFO - __main__ - Step 32630: {'lr': 0.00044899657461724453, 'samples': 6264960, 'steps': 32629, 'loss/train': 1.2570024728775024} -11/07/2021 01:50:53 - INFO - __main__ - Step 32631: {'lr': 0.00044899336232237156, 'samples': 6265152, 'steps': 32630, 'loss/train': 1.4593011140823364} -11/07/2021 01:50:53 - INFO - __main__ - Step 32632: {'lr': 0.0004489901499378352, 'samples': 6265344, 'steps': 32631, 'loss/train': 1.3911088705062866} -11/07/2021 01:50:54 - INFO - __main__ - Step 32633: {'lr': 0.00044898693746363695, 'samples': 6265536, 'steps': 32632, 'loss/train': 1.2107559442520142} -11/07/2021 01:50:54 - INFO - __main__ - Step 32634: {'lr': 0.00044898372489977825, 'samples': 6265728, 'steps': 32633, 'loss/train': 1.6459823846817017} -11/07/2021 01:50:54 - INFO - __main__ - Step 32635: {'lr': 0.0004489805122462606, 'samples': 6265920, 'steps': 32634, 'loss/train': 1.6577672958374023} -11/07/2021 01:50:55 - INFO - __main__ - Step 32636: {'lr': 0.0004489772995030853, 'samples': 6266112, 'steps': 32635, 'loss/train': 1.554206371307373} -11/07/2021 01:50:56 - INFO - __main__ - Step 32637: {'lr': 0.00044897408667025397, 'samples': 6266304, 'steps': 32636, 'loss/train': 1.4235544204711914} -11/07/2021 01:50:56 - INFO - __main__ - Step 32638: {'lr': 0.000448970873747768, 'samples': 6266496, 'steps': 32637, 'loss/train': 1.7344202995300293} -11/07/2021 01:50:56 - INFO - __main__ - Step 32639: {'lr': 0.0004489676607356288, 'samples': 6266688, 'steps': 32638, 'loss/train': 1.4471172094345093} -11/07/2021 01:50:57 - INFO - __main__ - Step 32640: {'lr': 0.00044896444763383787, 'samples': 6266880, 'steps': 32639, 'loss/train': 1.6442102193832397} -11/07/2021 01:50:58 - INFO - __main__ - Step 32641: {'lr': 0.00044896123444239654, 'samples': 6267072, 'steps': 32640, 'loss/train': 1.3261736631393433} -11/07/2021 01:50:58 - INFO - __main__ - Step 32642: {'lr': 0.00044895802116130644, 'samples': 6267264, 'steps': 32641, 'loss/train': 1.5865647792816162} -11/07/2021 01:50:59 - INFO - __main__ - Step 32643: {'lr': 0.0004489548077905689, 'samples': 6267456, 'steps': 32642, 'loss/train': 1.6438711881637573} -11/07/2021 01:50:59 - INFO - __main__ - Step 32644: {'lr': 0.0004489515943301854, 'samples': 6267648, 'steps': 32643, 'loss/train': 1.586187720298767} -11/07/2021 01:50:59 - INFO - __main__ - Step 32645: {'lr': 0.0004489483807801574, 'samples': 6267840, 'steps': 32644, 'loss/train': 2.010782241821289} -11/07/2021 01:51:00 - INFO - __main__ - Step 32646: {'lr': 0.00044894516714048626, 'samples': 6268032, 'steps': 32645, 'loss/train': 0.6327466368675232} -11/07/2021 01:51:01 - INFO - __main__ - Step 32647: {'lr': 0.0004489419534111736, 'samples': 6268224, 'steps': 32646, 'loss/train': 1.2490745782852173} -11/07/2021 01:51:01 - INFO - __main__ - Step 32648: {'lr': 0.0004489387395922207, 'samples': 6268416, 'steps': 32647, 'loss/train': 1.1977260112762451} -11/07/2021 01:51:02 - INFO - __main__ - Step 32649: {'lr': 0.00044893552568362903, 'samples': 6268608, 'steps': 32648, 'loss/train': 1.0430372953414917} -11/07/2021 01:51:02 - INFO - __main__ - Step 32650: {'lr': 0.0004489323116854002, 'samples': 6268800, 'steps': 32649, 'loss/train': 2.163680076599121} -11/07/2021 01:51:02 - INFO - __main__ - Step 32651: {'lr': 0.00044892909759753545, 'samples': 6268992, 'steps': 32650, 'loss/train': 1.574050784111023} -11/07/2021 01:51:03 - INFO - __main__ - Step 32652: {'lr': 0.00044892588342003637, 'samples': 6269184, 'steps': 32651, 'loss/train': 1.681310772895813} -11/07/2021 01:51:04 - INFO - __main__ - Step 32653: {'lr': 0.00044892266915290435, 'samples': 6269376, 'steps': 32652, 'loss/train': 1.147005319595337} -11/07/2021 01:51:04 - INFO - __main__ - Step 32654: {'lr': 0.00044891945479614084, 'samples': 6269568, 'steps': 32653, 'loss/train': 1.4096343517303467} -11/07/2021 01:51:04 - INFO - __main__ - Step 32655: {'lr': 0.00044891624034974726, 'samples': 6269760, 'steps': 32654, 'loss/train': 0.13647647202014923} -11/07/2021 01:51:05 - INFO - __main__ - Step 32656: {'lr': 0.00044891302581372513, 'samples': 6269952, 'steps': 32655, 'loss/train': 1.183340072631836} -11/07/2021 01:51:06 - INFO - __main__ - Step 32657: {'lr': 0.00044890981118807585, 'samples': 6270144, 'steps': 32656, 'loss/train': 2.038282871246338} -11/07/2021 01:51:06 - INFO - __main__ - Step 32658: {'lr': 0.00044890659647280084, 'samples': 6270336, 'steps': 32657, 'loss/train': 1.4143182039260864} -11/07/2021 01:51:07 - INFO - __main__ - Step 32659: {'lr': 0.0004489033816679016, 'samples': 6270528, 'steps': 32658, 'loss/train': 1.9537559747695923} -11/07/2021 01:51:07 - INFO - __main__ - Step 32660: {'lr': 0.0004489001667733796, 'samples': 6270720, 'steps': 32659, 'loss/train': 1.4231013059616089} -11/07/2021 01:51:07 - INFO - __main__ - Step 32661: {'lr': 0.0004488969517892363, 'samples': 6270912, 'steps': 32660, 'loss/train': 0.7900300025939941} -11/07/2021 01:51:08 - INFO - __main__ - Step 32662: {'lr': 0.000448893736715473, 'samples': 6271104, 'steps': 32661, 'loss/train': 0.13605500757694244} -11/07/2021 01:51:09 - INFO - __main__ - Step 32663: {'lr': 0.0004488905215520913, 'samples': 6271296, 'steps': 32662, 'loss/train': 1.8541309833526611} -11/07/2021 01:51:09 - INFO - __main__ - Step 32664: {'lr': 0.00044888730629909256, 'samples': 6271488, 'steps': 32663, 'loss/train': 1.7157195806503296} -11/07/2021 01:51:09 - INFO - __main__ - Step 32665: {'lr': 0.00044888409095647833, 'samples': 6271680, 'steps': 32664, 'loss/train': 1.3088997602462769} -11/07/2021 01:51:10 - INFO - __main__ - Step 32666: {'lr': 0.00044888087552424997, 'samples': 6271872, 'steps': 32665, 'loss/train': 2.039842128753662} -11/07/2021 01:51:11 - INFO - __main__ - Step 32667: {'lr': 0.00044887766000240893, 'samples': 6272064, 'steps': 32666, 'loss/train': 1.5708863735198975} -11/07/2021 01:51:11 - INFO - __main__ - Step 32668: {'lr': 0.0004488744443909567, 'samples': 6272256, 'steps': 32667, 'loss/train': 0.8644485473632812} -11/07/2021 01:51:12 - INFO - __main__ - Step 32669: {'lr': 0.0004488712286898947, 'samples': 6272448, 'steps': 32668, 'loss/train': 1.4932048320770264} -11/07/2021 01:51:12 - INFO - __main__ - Step 32670: {'lr': 0.0004488680128992244, 'samples': 6272640, 'steps': 32669, 'loss/train': 1.103938341140747} -11/07/2021 01:51:12 - INFO - __main__ - Step 32671: {'lr': 0.00044886479701894736, 'samples': 6272832, 'steps': 32670, 'loss/train': 1.7463362216949463} -11/07/2021 01:51:13 - INFO - __main__ - Step 32672: {'lr': 0.00044886158104906476, 'samples': 6273024, 'steps': 32671, 'loss/train': 1.4635449647903442} -11/07/2021 01:51:14 - INFO - __main__ - Step 32673: {'lr': 0.0004488583649895782, 'samples': 6273216, 'steps': 32672, 'loss/train': 1.4198908805847168} -11/07/2021 01:51:14 - INFO - __main__ - Step 32674: {'lr': 0.00044885514884048926, 'samples': 6273408, 'steps': 32673, 'loss/train': 2.2054474353790283} -11/07/2021 01:51:14 - INFO - __main__ - Step 32675: {'lr': 0.0004488519326017991, 'samples': 6273600, 'steps': 32674, 'loss/train': 0.6003201603889465} -11/07/2021 01:51:15 - INFO - __main__ - Step 32676: {'lr': 0.0004488487162735094, 'samples': 6273792, 'steps': 32675, 'loss/train': 1.483665943145752} -11/07/2021 01:51:16 - INFO - __main__ - Step 32677: {'lr': 0.00044884549985562165, 'samples': 6273984, 'steps': 32676, 'loss/train': 1.7669689655303955} -11/07/2021 01:51:16 - INFO - __main__ - Step 32678: {'lr': 0.000448842283348137, 'samples': 6274176, 'steps': 32677, 'loss/train': 1.4703480005264282} -11/07/2021 01:51:16 - INFO - __main__ - Step 32679: {'lr': 0.0004488390667510572, 'samples': 6274368, 'steps': 32678, 'loss/train': 1.728654146194458} -11/07/2021 01:51:17 - INFO - __main__ - Step 32680: {'lr': 0.00044883585006438354, 'samples': 6274560, 'steps': 32679, 'loss/train': 2.1558849811553955} -11/07/2021 01:51:17 - INFO - __main__ - Step 32681: {'lr': 0.0004488326332881175, 'samples': 6274752, 'steps': 32680, 'loss/train': 1.354612946510315} -11/07/2021 01:51:17 - INFO - __main__ - Step 32682: {'lr': 0.0004488294164222606, 'samples': 6274944, 'steps': 32681, 'loss/train': 1.248321771621704} -11/07/2021 01:51:18 - INFO - __main__ - Step 32683: {'lr': 0.0004488261994668142, 'samples': 6275136, 'steps': 32682, 'loss/train': 1.4758888483047485} -11/07/2021 01:51:19 - INFO - __main__ - Step 32684: {'lr': 0.00044882298242177976, 'samples': 6275328, 'steps': 32683, 'loss/train': 1.4852855205535889} -11/07/2021 01:51:19 - INFO - __main__ - Step 32685: {'lr': 0.00044881976528715877, 'samples': 6275520, 'steps': 32684, 'loss/train': 1.3000860214233398} -11/07/2021 01:51:20 - INFO - __main__ - Step 32686: {'lr': 0.0004488165480629527, 'samples': 6275712, 'steps': 32685, 'loss/train': 1.4111723899841309} -11/07/2021 01:51:20 - INFO - __main__ - Step 32687: {'lr': 0.00044881333074916287, 'samples': 6275904, 'steps': 32686, 'loss/train': 1.4297772645950317} -11/07/2021 01:51:21 - INFO - __main__ - Step 32688: {'lr': 0.00044881011334579093, 'samples': 6276096, 'steps': 32687, 'loss/train': 1.4350974559783936} -11/07/2021 01:51:21 - INFO - __main__ - Step 32689: {'lr': 0.0004488068958528382, 'samples': 6276288, 'steps': 32688, 'loss/train': 1.2064836025238037} -11/07/2021 01:51:22 - INFO - __main__ - Step 32690: {'lr': 0.0004488036782703061, 'samples': 6276480, 'steps': 32689, 'loss/train': 1.6409106254577637} -11/07/2021 01:51:22 - INFO - __main__ - Step 32691: {'lr': 0.00044880046059819615, 'samples': 6276672, 'steps': 32690, 'loss/train': 1.3003720045089722} -11/07/2021 01:51:22 - INFO - __main__ - Step 32692: {'lr': 0.00044879724283650976, 'samples': 6276864, 'steps': 32691, 'loss/train': 1.6657252311706543} -11/07/2021 01:51:23 - INFO - __main__ - Step 32693: {'lr': 0.0004487940249852484, 'samples': 6277056, 'steps': 32692, 'loss/train': 1.2542271614074707} -11/07/2021 01:51:24 - INFO - __main__ - Step 32694: {'lr': 0.0004487908070444136, 'samples': 6277248, 'steps': 32693, 'loss/train': 1.806897521018982} -11/07/2021 01:51:24 - INFO - __main__ - Step 32695: {'lr': 0.00044878758901400665, 'samples': 6277440, 'steps': 32694, 'loss/train': 1.5347445011138916} -11/07/2021 01:51:24 - INFO - __main__ - Step 32696: {'lr': 0.00044878437089402906, 'samples': 6277632, 'steps': 32695, 'loss/train': 2.1197705268859863} -11/07/2021 01:51:25 - INFO - __main__ - Step 32697: {'lr': 0.0004487811526844824, 'samples': 6277824, 'steps': 32696, 'loss/train': 1.1654471158981323} -11/07/2021 01:51:26 - INFO - __main__ - Step 32698: {'lr': 0.0004487779343853679, 'samples': 6278016, 'steps': 32697, 'loss/train': 1.547286868095398} -11/07/2021 01:51:26 - INFO - __main__ - Step 32699: {'lr': 0.00044877471599668716, 'samples': 6278208, 'steps': 32698, 'loss/train': 0.7873335480690002} -11/07/2021 01:51:27 - INFO - __main__ - Step 32700: {'lr': 0.00044877149751844164, 'samples': 6278400, 'steps': 32699, 'loss/train': 2.0370588302612305} -11/07/2021 01:51:27 - INFO - __main__ - Step 32701: {'lr': 0.00044876827895063277, 'samples': 6278592, 'steps': 32700, 'loss/train': 1.2202073335647583} -11/07/2021 01:51:27 - INFO - __main__ - Step 32702: {'lr': 0.0004487650602932619, 'samples': 6278784, 'steps': 32701, 'loss/train': 1.208509087562561} -11/07/2021 01:51:28 - INFO - __main__ - Step 32703: {'lr': 0.00044876184154633066, 'samples': 6278976, 'steps': 32702, 'loss/train': 1.2279237508773804} -11/07/2021 01:51:29 - INFO - __main__ - Step 32704: {'lr': 0.00044875862270984035, 'samples': 6279168, 'steps': 32703, 'loss/train': 1.2749691009521484} -11/07/2021 01:51:29 - INFO - __main__ - Step 32705: {'lr': 0.0004487554037837925, 'samples': 6279360, 'steps': 32704, 'loss/train': 1.5158764123916626} -11/07/2021 01:51:29 - INFO - __main__ - Step 32706: {'lr': 0.00044875218476818845, 'samples': 6279552, 'steps': 32705, 'loss/train': 0.7631714940071106} -11/07/2021 01:51:30 - INFO - __main__ - Step 32707: {'lr': 0.0004487489656630298, 'samples': 6279744, 'steps': 32706, 'loss/train': 1.2436619997024536} -11/07/2021 01:51:31 - INFO - __main__ - Step 32708: {'lr': 0.00044874574646831794, 'samples': 6279936, 'steps': 32707, 'loss/train': 1.5233253240585327} -11/07/2021 01:51:31 - INFO - __main__ - Step 32709: {'lr': 0.0004487425271840543, 'samples': 6280128, 'steps': 32708, 'loss/train': 1.2317440509796143} -11/07/2021 01:51:32 - INFO - __main__ - Step 32710: {'lr': 0.0004487393078102403, 'samples': 6280320, 'steps': 32709, 'loss/train': 1.1704007387161255} -11/07/2021 01:51:32 - INFO - __main__ - Step 32711: {'lr': 0.00044873608834687754, 'samples': 6280512, 'steps': 32710, 'loss/train': 0.9771917462348938} -11/07/2021 01:51:32 - INFO - __main__ - Step 32712: {'lr': 0.00044873286879396724, 'samples': 6280704, 'steps': 32711, 'loss/train': 1.4926505088806152} -11/07/2021 01:51:33 - INFO - __main__ - Step 32713: {'lr': 0.00044872964915151106, 'samples': 6280896, 'steps': 32712, 'loss/train': 1.4966946840286255} -11/07/2021 01:51:33 - INFO - __main__ - Step 32714: {'lr': 0.00044872642941951035, 'samples': 6281088, 'steps': 32713, 'loss/train': 0.7444011569023132} -11/07/2021 01:51:34 - INFO - __main__ - Step 32715: {'lr': 0.0004487232095979666, 'samples': 6281280, 'steps': 32714, 'loss/train': 0.12462414056062698} -11/07/2021 01:51:35 - INFO - __main__ - Step 32716: {'lr': 0.0004487199896868812, 'samples': 6281472, 'steps': 32715, 'loss/train': 1.3743922710418701} -11/07/2021 01:51:35 - INFO - __main__ - Step 32717: {'lr': 0.00044871676968625564, 'samples': 6281664, 'steps': 32716, 'loss/train': 0.969983696937561} -11/07/2021 01:51:35 - INFO - __main__ - Step 32718: {'lr': 0.00044871354959609135, 'samples': 6281856, 'steps': 32717, 'loss/train': 0.7198702096939087} -11/07/2021 01:51:36 - INFO - __main__ - Step 32719: {'lr': 0.00044871032941638984, 'samples': 6282048, 'steps': 32718, 'loss/train': 1.4743660688400269} -11/07/2021 01:51:37 - INFO - __main__ - Step 32720: {'lr': 0.00044870710914715254, 'samples': 6282240, 'steps': 32719, 'loss/train': 1.7300770282745361} -11/07/2021 01:51:37 - INFO - __main__ - Step 32721: {'lr': 0.00044870388878838084, 'samples': 6282432, 'steps': 32720, 'loss/train': 1.1336641311645508} -11/07/2021 01:51:37 - INFO - __main__ - Step 32722: {'lr': 0.00044870066834007627, 'samples': 6282624, 'steps': 32721, 'loss/train': 2.130664587020874} -11/07/2021 01:51:38 - INFO - __main__ - Step 32723: {'lr': 0.0004486974478022402, 'samples': 6282816, 'steps': 32722, 'loss/train': 1.418270230293274} -11/07/2021 01:51:38 - INFO - __main__ - Step 32724: {'lr': 0.0004486942271748742, 'samples': 6283008, 'steps': 32723, 'loss/train': 1.6737797260284424} -11/07/2021 01:51:39 - INFO - __main__ - Step 32725: {'lr': 0.0004486910064579796, 'samples': 6283200, 'steps': 32724, 'loss/train': 1.8791981935501099} -11/07/2021 01:51:40 - INFO - __main__ - Step 32726: {'lr': 0.00044868778565155783, 'samples': 6283392, 'steps': 32725, 'loss/train': 1.7475714683532715} -11/07/2021 01:51:40 - INFO - __main__ - Step 32727: {'lr': 0.00044868456475561047, 'samples': 6283584, 'steps': 32726, 'loss/train': 1.5137977600097656} -11/07/2021 01:51:40 - INFO - __main__ - Step 32728: {'lr': 0.0004486813437701389, 'samples': 6283776, 'steps': 32727, 'loss/train': 1.4692602157592773} -11/07/2021 01:51:41 - INFO - __main__ - Step 32729: {'lr': 0.0004486781226951446, 'samples': 6283968, 'steps': 32728, 'loss/train': 1.7525389194488525} -11/07/2021 01:51:41 - INFO - __main__ - Step 32730: {'lr': 0.000448674901530629, 'samples': 6284160, 'steps': 32729, 'loss/train': 2.4053380489349365} -11/07/2021 01:51:42 - INFO - __main__ - Step 32731: {'lr': 0.00044867168027659356, 'samples': 6284352, 'steps': 32730, 'loss/train': 0.664936900138855} -11/07/2021 01:51:42 - INFO - __main__ - Step 32732: {'lr': 0.00044866845893303973, 'samples': 6284544, 'steps': 32731, 'loss/train': 1.8049708604812622} -11/07/2021 01:51:43 - INFO - __main__ - Step 32733: {'lr': 0.00044866523749996897, 'samples': 6284736, 'steps': 32732, 'loss/train': 1.127227783203125} -11/07/2021 01:51:43 - INFO - __main__ - Step 32734: {'lr': 0.0004486620159773827, 'samples': 6284928, 'steps': 32733, 'loss/train': 1.4827308654785156} -11/07/2021 01:51:43 - INFO - __main__ - Step 32735: {'lr': 0.0004486587943652823, 'samples': 6285120, 'steps': 32734, 'loss/train': 0.731379508972168} -11/07/2021 01:51:44 - INFO - __main__ - Step 32736: {'lr': 0.00044865557266366953, 'samples': 6285312, 'steps': 32735, 'loss/train': 1.535205602645874} -11/07/2021 01:51:45 - INFO - __main__ - Step 32737: {'lr': 0.0004486523508725454, 'samples': 6285504, 'steps': 32736, 'loss/train': 0.8805704712867737} -11/07/2021 01:51:45 - INFO - __main__ - Step 32738: {'lr': 0.00044864912899191174, 'samples': 6285696, 'steps': 32737, 'loss/train': 1.415027141571045} -11/07/2021 01:51:45 - INFO - __main__ - Step 32739: {'lr': 0.00044864590702176977, 'samples': 6285888, 'steps': 32738, 'loss/train': 2.4802517890930176} -11/07/2021 01:51:46 - INFO - __main__ - Step 32740: {'lr': 0.000448642684962121, 'samples': 6286080, 'steps': 32739, 'loss/train': 0.7023144364356995} -11/07/2021 01:51:47 - INFO - __main__ - Step 32741: {'lr': 0.000448639462812967, 'samples': 6286272, 'steps': 32740, 'loss/train': 1.2147858142852783} -11/07/2021 01:51:47 - INFO - __main__ - Step 32742: {'lr': 0.0004486362405743091, 'samples': 6286464, 'steps': 32741, 'loss/train': 1.6830997467041016} -11/07/2021 01:51:47 - INFO - __main__ - Step 32743: {'lr': 0.0004486330182461487, 'samples': 6286656, 'steps': 32742, 'loss/train': 1.9115580320358276} -11/07/2021 01:51:48 - INFO - __main__ - Step 32744: {'lr': 0.0004486297958284874, 'samples': 6286848, 'steps': 32743, 'loss/train': 1.754269003868103} -11/07/2021 01:51:48 - INFO - __main__ - Step 32745: {'lr': 0.0004486265733213265, 'samples': 6287040, 'steps': 32744, 'loss/train': 1.3951165676116943} -11/07/2021 01:51:49 - INFO - __main__ - Step 32746: {'lr': 0.00044862335072466767, 'samples': 6287232, 'steps': 32745, 'loss/train': 1.4054536819458008} -11/07/2021 01:51:49 - INFO - __main__ - Step 32747: {'lr': 0.00044862012803851203, 'samples': 6287424, 'steps': 32746, 'loss/train': 1.815017819404602} -11/07/2021 01:51:50 - INFO - __main__ - Step 32748: {'lr': 0.00044861690526286135, 'samples': 6287616, 'steps': 32747, 'loss/train': 1.6497738361358643} -11/07/2021 01:51:50 - INFO - __main__ - Step 32749: {'lr': 0.00044861368239771694, 'samples': 6287808, 'steps': 32748, 'loss/train': 1.5400633811950684} -11/07/2021 01:51:51 - INFO - __main__ - Step 32750: {'lr': 0.00044861045944308026, 'samples': 6288000, 'steps': 32749, 'loss/train': 2.035322427749634} -11/07/2021 01:51:52 - INFO - __main__ - Step 32751: {'lr': 0.0004486072363989528, 'samples': 6288192, 'steps': 32750, 'loss/train': 1.2623913288116455} -11/07/2021 01:51:52 - INFO - __main__ - Step 32752: {'lr': 0.00044860401326533595, 'samples': 6288384, 'steps': 32751, 'loss/train': 1.6374726295471191} -11/07/2021 01:51:52 - INFO - __main__ - Step 32753: {'lr': 0.0004486007900422312, 'samples': 6288576, 'steps': 32752, 'loss/train': 1.5325310230255127} -11/07/2021 01:51:53 - INFO - __main__ - Step 32754: {'lr': 0.00044859756672964, 'samples': 6288768, 'steps': 32753, 'loss/train': 1.6418508291244507} -11/07/2021 01:51:53 - INFO - __main__ - Step 32755: {'lr': 0.00044859434332756383, 'samples': 6288960, 'steps': 32754, 'loss/train': 1.3992834091186523} -11/07/2021 01:51:53 - INFO - __main__ - Step 32756: {'lr': 0.0004485911198360041, 'samples': 6289152, 'steps': 32755, 'loss/train': 1.0894807577133179} -11/07/2021 01:51:55 - INFO - __main__ - Step 32757: {'lr': 0.0004485878962549622, 'samples': 6289344, 'steps': 32756, 'loss/train': 1.551389217376709} -11/07/2021 01:51:55 - INFO - __main__ - Step 32758: {'lr': 0.0004485846725844398, 'samples': 6289536, 'steps': 32757, 'loss/train': 1.5550835132598877} -11/07/2021 01:51:55 - INFO - __main__ - Step 32759: {'lr': 0.0004485814488244381, 'samples': 6289728, 'steps': 32758, 'loss/train': 1.1718662977218628} -11/07/2021 01:51:56 - INFO - __main__ - Step 32760: {'lr': 0.0004485782249749587, 'samples': 6289920, 'steps': 32759, 'loss/train': 1.6369692087173462} -11/07/2021 01:51:57 - INFO - __main__ - Step 32761: {'lr': 0.00044857500103600304, 'samples': 6290112, 'steps': 32760, 'loss/train': 1.2651540040969849} -11/07/2021 01:51:57 - INFO - __main__ - Step 32762: {'lr': 0.00044857177700757247, 'samples': 6290304, 'steps': 32761, 'loss/train': 1.0267809629440308} -11/07/2021 01:51:58 - INFO - __main__ - Step 32763: {'lr': 0.00044856855288966856, 'samples': 6290496, 'steps': 32762, 'loss/train': 1.6318790912628174} -11/07/2021 01:51:58 - INFO - __main__ - Step 32764: {'lr': 0.0004485653286822927, 'samples': 6290688, 'steps': 32763, 'loss/train': 1.508261799812317} -11/07/2021 01:51:58 - INFO - __main__ - Step 32765: {'lr': 0.0004485621043854465, 'samples': 6290880, 'steps': 32764, 'loss/train': 1.1478630304336548} -11/07/2021 01:52:00 - INFO - __main__ - Step 32766: {'lr': 0.0004485588799991311, 'samples': 6291072, 'steps': 32765, 'loss/train': 1.610480785369873} -11/07/2021 01:52:00 - INFO - __main__ - Step 32767: {'lr': 0.0004485556555233483, 'samples': 6291264, 'steps': 32766, 'loss/train': 1.4900367259979248} -11/07/2021 01:52:01 - INFO - __main__ - Step 32768: {'lr': 0.0004485524309580993, 'samples': 6291456, 'steps': 32767, 'loss/train': 1.6736993789672852} -11/07/2021 01:52:01 - INFO - __main__ - Step 32769: {'lr': 0.0004485492063033856, 'samples': 6291648, 'steps': 32768, 'loss/train': 1.2844321727752686} -11/07/2021 01:52:01 - INFO - __main__ - Step 32770: {'lr': 0.0004485459815592087, 'samples': 6291840, 'steps': 32769, 'loss/train': 0.6486344933509827} -11/07/2021 01:52:02 - INFO - __main__ - Step 32771: {'lr': 0.0004485427567255701, 'samples': 6292032, 'steps': 32770, 'loss/train': 1.6293174028396606} -11/07/2021 01:52:03 - INFO - __main__ - Step 32772: {'lr': 0.0004485395318024712, 'samples': 6292224, 'steps': 32771, 'loss/train': 0.7933187484741211} -11/07/2021 01:52:03 - INFO - __main__ - Step 32773: {'lr': 0.00044853630678991344, 'samples': 6292416, 'steps': 32772, 'loss/train': 1.568111777305603} -11/07/2021 01:52:04 - INFO - __main__ - Step 32774: {'lr': 0.00044853308168789824, 'samples': 6292608, 'steps': 32773, 'loss/train': 1.1893032789230347} -11/07/2021 01:52:04 - INFO - __main__ - Step 32775: {'lr': 0.00044852985649642714, 'samples': 6292800, 'steps': 32774, 'loss/train': 1.2858831882476807} -11/07/2021 01:52:05 - INFO - __main__ - Step 32776: {'lr': 0.0004485266312155015, 'samples': 6292992, 'steps': 32775, 'loss/train': 0.5672725439071655} -11/07/2021 01:52:05 - INFO - __main__ - Step 32777: {'lr': 0.00044852340584512285, 'samples': 6293184, 'steps': 32776, 'loss/train': 1.5529122352600098} -11/07/2021 01:52:07 - INFO - __main__ - Step 32778: {'lr': 0.00044852018038529264, 'samples': 6293376, 'steps': 32777, 'loss/train': 0.8248746395111084} -11/07/2021 01:52:07 - INFO - __main__ - Step 32779: {'lr': 0.00044851695483601227, 'samples': 6293568, 'steps': 32778, 'loss/train': 1.5078567266464233} -11/07/2021 01:52:07 - INFO - __main__ - Step 32780: {'lr': 0.0004485137291972833, 'samples': 6293760, 'steps': 32779, 'loss/train': 0.17733517289161682} -11/07/2021 01:52:08 - INFO - __main__ - Step 32781: {'lr': 0.00044851050346910706, 'samples': 6293952, 'steps': 32780, 'loss/train': 1.8087482452392578} -11/07/2021 01:52:08 - INFO - __main__ - Step 32782: {'lr': 0.00044850727765148504, 'samples': 6294144, 'steps': 32781, 'loss/train': 1.6935482025146484} -11/07/2021 01:52:08 - INFO - __main__ - Step 32783: {'lr': 0.00044850405174441866, 'samples': 6294336, 'steps': 32782, 'loss/train': 1.7380541563034058} -11/07/2021 01:52:09 - INFO - __main__ - Step 32784: {'lr': 0.00044850082574790945, 'samples': 6294528, 'steps': 32783, 'loss/train': 1.4098385572433472} -11/07/2021 01:52:10 - INFO - __main__ - Step 32785: {'lr': 0.0004484975996619589, 'samples': 6294720, 'steps': 32784, 'loss/train': 1.4865195751190186} -11/07/2021 01:52:10 - INFO - __main__ - Step 32786: {'lr': 0.0004484943734865683, 'samples': 6294912, 'steps': 32785, 'loss/train': 1.7889684438705444} -11/07/2021 01:52:10 - INFO - __main__ - Step 32787: {'lr': 0.0004484911472217392, 'samples': 6295104, 'steps': 32786, 'loss/train': 1.7738747596740723} -11/07/2021 01:52:11 - INFO - __main__ - Step 32788: {'lr': 0.0004484879208674731, 'samples': 6295296, 'steps': 32787, 'loss/train': 1.524864673614502} -11/07/2021 01:52:12 - INFO - __main__ - Step 32789: {'lr': 0.0004484846944237714, 'samples': 6295488, 'steps': 32788, 'loss/train': 1.3773404359817505} -11/07/2021 01:52:12 - INFO - __main__ - Step 32790: {'lr': 0.0004484814678906355, 'samples': 6295680, 'steps': 32789, 'loss/train': 1.2628083229064941} -11/07/2021 01:52:12 - INFO - __main__ - Step 32791: {'lr': 0.00044847824126806703, 'samples': 6295872, 'steps': 32790, 'loss/train': 1.7810370922088623} -11/07/2021 01:52:13 - INFO - __main__ - Step 32792: {'lr': 0.0004484750145560672, 'samples': 6296064, 'steps': 32791, 'loss/train': 1.3144395351409912} -11/07/2021 01:52:13 - INFO - __main__ - Step 32793: {'lr': 0.0004484717877546377, 'samples': 6296256, 'steps': 32792, 'loss/train': 1.530842900276184} -11/07/2021 01:52:14 - INFO - __main__ - Step 32794: {'lr': 0.0004484685608637798, 'samples': 6296448, 'steps': 32793, 'loss/train': 2.359969139099121} -11/07/2021 01:52:14 - INFO - __main__ - Step 32795: {'lr': 0.00044846533388349507, 'samples': 6296640, 'steps': 32794, 'loss/train': 1.4508795738220215} -11/07/2021 01:52:15 - INFO - __main__ - Step 32796: {'lr': 0.00044846210681378487, 'samples': 6296832, 'steps': 32795, 'loss/train': 1.4554624557495117} -11/07/2021 01:52:15 - INFO - __main__ - Step 32797: {'lr': 0.00044845887965465076, 'samples': 6297024, 'steps': 32796, 'loss/train': 0.6192265748977661} -11/07/2021 01:52:16 - INFO - __main__ - Step 32798: {'lr': 0.0004484556524060941, 'samples': 6297216, 'steps': 32797, 'loss/train': 1.7106328010559082} -11/07/2021 01:52:16 - INFO - __main__ - Step 32799: {'lr': 0.00044845242506811646, 'samples': 6297408, 'steps': 32798, 'loss/train': 1.029484510421753} -11/07/2021 01:52:17 - INFO - __main__ - Step 32800: {'lr': 0.0004484491976407192, 'samples': 6297600, 'steps': 32799, 'loss/train': 0.9896617531776428} -11/07/2021 01:52:17 - INFO - __main__ - Step 32801: {'lr': 0.00044844597012390374, 'samples': 6297792, 'steps': 32800, 'loss/train': 1.7723320722579956} -11/07/2021 01:52:18 - INFO - __main__ - Step 32802: {'lr': 0.0004484427425176716, 'samples': 6297984, 'steps': 32801, 'loss/train': 1.3181513547897339} -11/07/2021 01:52:18 - INFO - __main__ - Step 32803: {'lr': 0.0004484395148220243, 'samples': 6298176, 'steps': 32802, 'loss/train': 1.4404723644256592} -11/07/2021 01:52:18 - INFO - __main__ - Step 32804: {'lr': 0.000448436287036963, 'samples': 6298368, 'steps': 32803, 'loss/train': 1.3333238363265991} -11/07/2021 01:52:19 - INFO - __main__ - Step 32805: {'lr': 0.0004484330591624896, 'samples': 6298560, 'steps': 32804, 'loss/train': 1.694399118423462} -11/07/2021 01:52:20 - INFO - __main__ - Step 32806: {'lr': 0.00044842983119860525, 'samples': 6298752, 'steps': 32805, 'loss/train': 1.9107273817062378} -11/07/2021 01:52:20 - INFO - __main__ - Step 32807: {'lr': 0.00044842660314531145, 'samples': 6298944, 'steps': 32806, 'loss/train': 1.6565542221069336} -11/07/2021 01:52:20 - INFO - __main__ - Step 32808: {'lr': 0.0004484233750026098, 'samples': 6299136, 'steps': 32807, 'loss/train': 1.9830169677734375} -11/07/2021 01:52:21 - INFO - __main__ - Step 32809: {'lr': 0.00044842014677050145, 'samples': 6299328, 'steps': 32808, 'loss/train': 1.630691409111023} -11/07/2021 01:52:22 - INFO - __main__ - Step 32810: {'lr': 0.0004484169184489882, 'samples': 6299520, 'steps': 32809, 'loss/train': 1.3876402378082275} -11/07/2021 01:52:22 - INFO - __main__ - Step 32811: {'lr': 0.0004484136900380713, 'samples': 6299712, 'steps': 32810, 'loss/train': 1.570265531539917} -11/07/2021 01:52:22 - INFO - __main__ - Step 32812: {'lr': 0.00044841046153775224, 'samples': 6299904, 'steps': 32811, 'loss/train': 1.195267915725708} -11/07/2021 01:52:23 - INFO - __main__ - Step 32813: {'lr': 0.0004484072329480325, 'samples': 6300096, 'steps': 32812, 'loss/train': 1.3839094638824463} -11/07/2021 01:52:23 - INFO - __main__ - Step 32814: {'lr': 0.00044840400426891347, 'samples': 6300288, 'steps': 32813, 'loss/train': 1.3134123086929321} -11/07/2021 01:52:24 - INFO - __main__ - Step 32815: {'lr': 0.00044840077550039676, 'samples': 6300480, 'steps': 32814, 'loss/train': 1.7066586017608643} -11/07/2021 01:52:24 - INFO - __main__ - Step 32816: {'lr': 0.0004483975466424837, 'samples': 6300672, 'steps': 32815, 'loss/train': 1.567929983139038} -11/07/2021 01:52:25 - INFO - __main__ - Step 32817: {'lr': 0.0004483943176951757, 'samples': 6300864, 'steps': 32816, 'loss/train': 1.2354013919830322} -11/07/2021 01:52:25 - INFO - __main__ - Step 32818: {'lr': 0.0004483910886584743, 'samples': 6301056, 'steps': 32817, 'loss/train': 1.8153525590896606} -11/07/2021 01:52:26 - INFO - __main__ - Step 32819: {'lr': 0.00044838785953238094, 'samples': 6301248, 'steps': 32818, 'loss/train': 1.7477885484695435} -11/07/2021 01:52:27 - INFO - __main__ - Step 32820: {'lr': 0.0004483846303168971, 'samples': 6301440, 'steps': 32819, 'loss/train': 1.4585903882980347} -11/07/2021 01:52:27 - INFO - __main__ - Step 32821: {'lr': 0.0004483814010120242, 'samples': 6301632, 'steps': 32820, 'loss/train': 1.7392491102218628} -11/07/2021 01:52:27 - INFO - __main__ - Step 32822: {'lr': 0.00044837817161776366, 'samples': 6301824, 'steps': 32821, 'loss/train': 1.7412809133529663} -11/07/2021 01:52:28 - INFO - __main__ - Step 32823: {'lr': 0.000448374942134117, 'samples': 6302016, 'steps': 32822, 'loss/train': 1.758912205696106} -11/07/2021 01:52:28 - INFO - __main__ - Step 32824: {'lr': 0.0004483717125610857, 'samples': 6302208, 'steps': 32823, 'loss/train': 1.3502815961837769} -11/07/2021 01:52:29 - INFO - __main__ - Step 32825: {'lr': 0.0004483684828986712, 'samples': 6302400, 'steps': 32824, 'loss/train': 1.465355396270752} -11/07/2021 01:52:29 - INFO - __main__ - Step 32826: {'lr': 0.00044836525314687477, 'samples': 6302592, 'steps': 32825, 'loss/train': 1.514260172843933} -11/07/2021 01:52:30 - INFO - __main__ - Step 32827: {'lr': 0.0004483620233056981, 'samples': 6302784, 'steps': 32826, 'loss/train': 1.2928588390350342} -11/07/2021 01:52:30 - INFO - __main__ - Step 32828: {'lr': 0.00044835879337514254, 'samples': 6302976, 'steps': 32827, 'loss/train': 1.0733113288879395} -11/07/2021 01:52:30 - INFO - __main__ - Step 32829: {'lr': 0.0004483555633552096, 'samples': 6303168, 'steps': 32828, 'loss/train': 1.7348523139953613} -11/07/2021 01:52:32 - INFO - __main__ - Step 32830: {'lr': 0.00044835233324590077, 'samples': 6303360, 'steps': 32829, 'loss/train': 1.7591265439987183} -11/07/2021 01:52:32 - INFO - __main__ - Step 32831: {'lr': 0.0004483491030472173, 'samples': 6303552, 'steps': 32830, 'loss/train': 0.8813719749450684} -11/07/2021 01:52:33 - INFO - __main__ - Step 32832: {'lr': 0.00044834587275916084, 'samples': 6303744, 'steps': 32831, 'loss/train': 1.1142882108688354} -11/07/2021 01:52:33 - INFO - __main__ - Step 32833: {'lr': 0.00044834264238173283, 'samples': 6303936, 'steps': 32832, 'loss/train': 0.9702965617179871} -11/07/2021 01:52:33 - INFO - __main__ - Step 32834: {'lr': 0.00044833941191493463, 'samples': 6304128, 'steps': 32833, 'loss/train': 1.464808464050293} -11/07/2021 01:52:34 - INFO - __main__ - Step 32835: {'lr': 0.0004483361813587678, 'samples': 6304320, 'steps': 32834, 'loss/train': 1.6141979694366455} -11/07/2021 01:52:35 - INFO - __main__ - Step 32836: {'lr': 0.0004483329507132337, 'samples': 6304512, 'steps': 32835, 'loss/train': 0.1967136561870575} -11/07/2021 01:52:35 - INFO - __main__ - Step 32837: {'lr': 0.0004483297199783338, 'samples': 6304704, 'steps': 32836, 'loss/train': 1.5581127405166626} -11/07/2021 01:52:36 - INFO - __main__ - Step 32838: {'lr': 0.0004483264891540697, 'samples': 6304896, 'steps': 32837, 'loss/train': 1.515840768814087} -11/07/2021 01:52:36 - INFO - __main__ - Step 32839: {'lr': 0.00044832325824044274, 'samples': 6305088, 'steps': 32838, 'loss/train': 1.810701847076416} -11/07/2021 01:52:36 - INFO - __main__ - Step 32840: {'lr': 0.0004483200272374543, 'samples': 6305280, 'steps': 32839, 'loss/train': 1.9597874879837036} -11/07/2021 01:52:37 - INFO - __main__ - Step 32841: {'lr': 0.0004483167961451059, 'samples': 6305472, 'steps': 32840, 'loss/train': 1.7444734573364258} -11/07/2021 01:52:38 - INFO - __main__ - Step 32842: {'lr': 0.00044831356496339913, 'samples': 6305664, 'steps': 32841, 'loss/train': 1.6750328540802002} -11/07/2021 01:52:38 - INFO - __main__ - Step 32843: {'lr': 0.0004483103336923352, 'samples': 6305856, 'steps': 32842, 'loss/train': 1.8195252418518066} -11/07/2021 01:52:38 - INFO - __main__ - Step 32844: {'lr': 0.00044830710233191573, 'samples': 6306048, 'steps': 32843, 'loss/train': 1.419494867324829} -11/07/2021 01:52:39 - INFO - __main__ - Step 32845: {'lr': 0.0004483038708821422, 'samples': 6306240, 'steps': 32844, 'loss/train': 1.6472922563552856} -11/07/2021 01:52:40 - INFO - __main__ - Step 32846: {'lr': 0.00044830063934301603, 'samples': 6306432, 'steps': 32845, 'loss/train': 1.400617241859436} -11/07/2021 01:52:40 - INFO - __main__ - Step 32847: {'lr': 0.0004482974077145385, 'samples': 6306624, 'steps': 32846, 'loss/train': 1.5048298835754395} -11/07/2021 01:52:40 - INFO - __main__ - Step 32848: {'lr': 0.0004482941759967113, 'samples': 6306816, 'steps': 32847, 'loss/train': 1.3856581449508667} -11/07/2021 01:52:41 - INFO - __main__ - Step 32849: {'lr': 0.00044829094418953586, 'samples': 6307008, 'steps': 32848, 'loss/train': 1.4409213066101074} -11/07/2021 01:52:41 - INFO - __main__ - Step 32850: {'lr': 0.00044828771229301354, 'samples': 6307200, 'steps': 32849, 'loss/train': 1.7861766815185547} -11/07/2021 01:52:43 - INFO - __main__ - Step 32851: {'lr': 0.0004482844803071458, 'samples': 6307392, 'steps': 32850, 'loss/train': 1.4633113145828247} -11/07/2021 01:52:43 - INFO - __main__ - Step 32852: {'lr': 0.00044828124823193417, 'samples': 6307584, 'steps': 32851, 'loss/train': 1.0925400257110596} -11/07/2021 01:52:44 - INFO - __main__ - Step 32853: {'lr': 0.00044827801606738004, 'samples': 6307776, 'steps': 32852, 'loss/train': 0.734474778175354} -11/07/2021 01:52:44 - INFO - __main__ - Step 32854: {'lr': 0.00044827478381348495, 'samples': 6307968, 'steps': 32853, 'loss/train': 0.8628458976745605} -11/07/2021 01:52:44 - INFO - __main__ - Step 32855: {'lr': 0.00044827155147025025, 'samples': 6308160, 'steps': 32854, 'loss/train': 1.8457977771759033} -11/07/2021 01:52:45 - INFO - __main__ - Step 32856: {'lr': 0.00044826831903767745, 'samples': 6308352, 'steps': 32855, 'loss/train': 1.9462559223175049} -11/07/2021 01:52:45 - INFO - __main__ - Step 32857: {'lr': 0.000448265086515768, 'samples': 6308544, 'steps': 32856, 'loss/train': 1.4201304912567139} -11/07/2021 01:52:45 - INFO - __main__ - Step 32858: {'lr': 0.0004482618539045234, 'samples': 6308736, 'steps': 32857, 'loss/train': 1.3535361289978027} -11/07/2021 01:52:46 - INFO - __main__ - Step 32859: {'lr': 0.00044825862120394504, 'samples': 6308928, 'steps': 32858, 'loss/train': 2.0859124660491943} -11/07/2021 01:52:47 - INFO - __main__ - Step 32860: {'lr': 0.00044825538841403444, 'samples': 6309120, 'steps': 32859, 'loss/train': 1.2962948083877563} -11/07/2021 01:52:47 - INFO - __main__ - Step 32861: {'lr': 0.000448252155534793, 'samples': 6309312, 'steps': 32860, 'loss/train': 1.482293963432312} -11/07/2021 01:52:47 - INFO - __main__ - Step 32862: {'lr': 0.0004482489225662222, 'samples': 6309504, 'steps': 32861, 'loss/train': 1.0501551628112793} -11/07/2021 01:52:48 - INFO - __main__ - Step 32863: {'lr': 0.00044824568950832343, 'samples': 6309696, 'steps': 32862, 'loss/train': 1.8620959520339966} -11/07/2021 01:52:49 - INFO - __main__ - Step 32864: {'lr': 0.0004482424563610983, 'samples': 6309888, 'steps': 32863, 'loss/train': 1.2694894075393677} -11/07/2021 01:52:49 - INFO - __main__ - Step 32865: {'lr': 0.00044823922312454815, 'samples': 6310080, 'steps': 32864, 'loss/train': 1.4919681549072266} -11/07/2021 01:52:50 - INFO - __main__ - Step 32866: {'lr': 0.00044823598979867445, 'samples': 6310272, 'steps': 32865, 'loss/train': 1.699884295463562} -11/07/2021 01:52:50 - INFO - __main__ - Step 32867: {'lr': 0.0004482327563834787, 'samples': 6310464, 'steps': 32866, 'loss/train': 2.1392643451690674} -11/07/2021 01:52:50 - INFO - __main__ - Step 32868: {'lr': 0.00044822952287896237, 'samples': 6310656, 'steps': 32867, 'loss/train': 4.73948860168457} -11/07/2021 01:52:51 - INFO - __main__ - Step 32869: {'lr': 0.00044822628928512675, 'samples': 6310848, 'steps': 32868, 'loss/train': 1.5720044374465942} -11/07/2021 01:52:52 - INFO - __main__ - Step 32870: {'lr': 0.0004482230556019735, 'samples': 6311040, 'steps': 32869, 'loss/train': 1.441838026046753} -11/07/2021 01:52:52 - INFO - __main__ - Step 32871: {'lr': 0.00044821982182950405, 'samples': 6311232, 'steps': 32870, 'loss/train': 1.2322503328323364} -11/07/2021 01:52:52 - INFO - __main__ - Step 32872: {'lr': 0.0004482165879677197, 'samples': 6311424, 'steps': 32871, 'loss/train': 1.16120183467865} -11/07/2021 01:52:53 - INFO - __main__ - Step 32873: {'lr': 0.0004482133540166221, 'samples': 6311616, 'steps': 32872, 'loss/train': 1.548761248588562} -11/07/2021 01:52:53 - INFO - __main__ - Step 32874: {'lr': 0.00044821011997621255, 'samples': 6311808, 'steps': 32873, 'loss/train': 1.5385053157806396} -11/07/2021 01:52:54 - INFO - __main__ - Step 32875: {'lr': 0.0004482068858464926, 'samples': 6312000, 'steps': 32874, 'loss/train': 1.227051019668579} -11/07/2021 01:52:54 - INFO - __main__ - Step 32876: {'lr': 0.00044820365162746373, 'samples': 6312192, 'steps': 32875, 'loss/train': 1.523007869720459} -11/07/2021 01:52:55 - INFO - __main__ - Step 32877: {'lr': 0.00044820041731912733, 'samples': 6312384, 'steps': 32876, 'loss/train': 1.4473198652267456} -11/07/2021 01:52:55 - INFO - __main__ - Step 32878: {'lr': 0.0004481971829214848, 'samples': 6312576, 'steps': 32877, 'loss/train': 1.064133644104004} -11/07/2021 01:52:55 - INFO - __main__ - Step 32879: {'lr': 0.0004481939484345378, 'samples': 6312768, 'steps': 32878, 'loss/train': 1.7819557189941406} -11/07/2021 01:52:56 - INFO - __main__ - Step 32880: {'lr': 0.0004481907138582876, 'samples': 6312960, 'steps': 32879, 'loss/train': 1.6354236602783203} -11/07/2021 01:52:57 - INFO - __main__ - Step 32881: {'lr': 0.00044818747919273574, 'samples': 6313152, 'steps': 32880, 'loss/train': 1.5709049701690674} -11/07/2021 01:52:57 - INFO - __main__ - Step 32882: {'lr': 0.0004481842444378837, 'samples': 6313344, 'steps': 32881, 'loss/train': 1.5239031314849854} -11/07/2021 01:52:58 - INFO - __main__ - Step 32883: {'lr': 0.0004481810095937329, 'samples': 6313536, 'steps': 32882, 'loss/train': 1.4392449855804443} -11/07/2021 01:52:58 - INFO - __main__ - Step 32884: {'lr': 0.00044817777466028467, 'samples': 6313728, 'steps': 32883, 'loss/train': 0.982414960861206} -11/07/2021 01:52:59 - INFO - __main__ - Step 32885: {'lr': 0.0004481745396375407, 'samples': 6313920, 'steps': 32884, 'loss/train': 1.0925793647766113} -11/07/2021 01:52:59 - INFO - __main__ - Step 32886: {'lr': 0.0004481713045255023, 'samples': 6314112, 'steps': 32885, 'loss/train': 1.6663484573364258} -11/07/2021 01:53:00 - INFO - __main__ - Step 32887: {'lr': 0.000448168069324171, 'samples': 6314304, 'steps': 32886, 'loss/train': 1.6085951328277588} -11/07/2021 01:53:00 - INFO - __main__ - Step 32888: {'lr': 0.0004481648340335482, 'samples': 6314496, 'steps': 32887, 'loss/train': 1.4408528804779053} -11/07/2021 01:53:00 - INFO - __main__ - Step 32889: {'lr': 0.0004481615986536354, 'samples': 6314688, 'steps': 32888, 'loss/train': 2.108576536178589} -11/07/2021 01:53:01 - INFO - __main__ - Step 32890: {'lr': 0.000448158363184434, 'samples': 6314880, 'steps': 32889, 'loss/train': 1.7130979299545288} -11/07/2021 01:53:02 - INFO - __main__ - Step 32891: {'lr': 0.00044815512762594556, 'samples': 6315072, 'steps': 32890, 'loss/train': 2.199972629547119} -11/07/2021 01:53:02 - INFO - __main__ - Step 32892: {'lr': 0.00044815189197817143, 'samples': 6315264, 'steps': 32891, 'loss/train': 1.4540982246398926} -11/07/2021 01:53:03 - INFO - __main__ - Step 32893: {'lr': 0.0004481486562411131, 'samples': 6315456, 'steps': 32892, 'loss/train': 0.44139307737350464} -11/07/2021 01:53:03 - INFO - __main__ - Step 32894: {'lr': 0.0004481454204147721, 'samples': 6315648, 'steps': 32893, 'loss/train': 1.2219226360321045} -11/07/2021 01:53:04 - INFO - __main__ - Step 32895: {'lr': 0.0004481421844991498, 'samples': 6315840, 'steps': 32894, 'loss/train': 1.4876707792282104} -11/07/2021 01:53:04 - INFO - __main__ - Step 32896: {'lr': 0.00044813894849424777, 'samples': 6316032, 'steps': 32895, 'loss/train': 1.8859457969665527} -11/07/2021 01:53:05 - INFO - __main__ - Step 32897: {'lr': 0.0004481357124000672, 'samples': 6316224, 'steps': 32896, 'loss/train': 1.562057375907898} -11/07/2021 01:53:05 - INFO - __main__ - Step 32898: {'lr': 0.0004481324762166099, 'samples': 6316416, 'steps': 32897, 'loss/train': 2.0499045848846436} -11/07/2021 01:53:05 - INFO - __main__ - Step 32899: {'lr': 0.0004481292399438771, 'samples': 6316608, 'steps': 32898, 'loss/train': 1.692986249923706} -11/07/2021 01:53:06 - INFO - __main__ - Step 32900: {'lr': 0.0004481260035818704, 'samples': 6316800, 'steps': 32899, 'loss/train': 0.8094185590744019} -11/07/2021 01:53:07 - INFO - __main__ - Step 32901: {'lr': 0.00044812276713059106, 'samples': 6316992, 'steps': 32900, 'loss/train': 1.7495591640472412} -11/07/2021 01:53:07 - INFO - __main__ - Step 32902: {'lr': 0.00044811953059004073, 'samples': 6317184, 'steps': 32901, 'loss/train': 1.744451880455017} -11/07/2021 01:53:07 - INFO - __main__ - Step 32903: {'lr': 0.0004481162939602208, 'samples': 6317376, 'steps': 32902, 'loss/train': 0.218343123793602} -11/07/2021 01:53:08 - INFO - __main__ - Step 32904: {'lr': 0.0004481130572411327, 'samples': 6317568, 'steps': 32903, 'loss/train': 1.5772401094436646} -11/07/2021 01:53:08 - INFO - __main__ - Step 32905: {'lr': 0.00044810982043277795, 'samples': 6317760, 'steps': 32904, 'loss/train': 1.4718493223190308} -11/07/2021 01:53:09 - INFO - __main__ - Step 32906: {'lr': 0.0004481065835351579, 'samples': 6317952, 'steps': 32905, 'loss/train': 1.7350021600723267} -11/07/2021 01:53:10 - INFO - __main__ - Step 32907: {'lr': 0.0004481033465482741, 'samples': 6318144, 'steps': 32906, 'loss/train': 1.5972042083740234} -11/07/2021 01:53:10 - INFO - __main__ - Step 32908: {'lr': 0.00044810010947212803, 'samples': 6318336, 'steps': 32907, 'loss/train': 1.625590443611145} -11/07/2021 01:53:10 - INFO - __main__ - Step 32909: {'lr': 0.00044809687230672115, 'samples': 6318528, 'steps': 32908, 'loss/train': 1.201430320739746} -11/07/2021 01:53:11 - INFO - __main__ - Step 32910: {'lr': 0.0004480936350520548, 'samples': 6318720, 'steps': 32909, 'loss/train': 1.5031765699386597} -11/07/2021 01:53:12 - INFO - __main__ - Step 32911: {'lr': 0.0004480903977081305, 'samples': 6318912, 'steps': 32910, 'loss/train': 1.6832504272460938} -11/07/2021 01:53:12 - INFO - __main__ - Step 32912: {'lr': 0.00044808716027494973, 'samples': 6319104, 'steps': 32911, 'loss/train': 1.54212486743927} -11/07/2021 01:53:13 - INFO - __main__ - Step 32913: {'lr': 0.000448083922752514, 'samples': 6319296, 'steps': 32912, 'loss/train': 1.823056936264038} -11/07/2021 01:53:13 - INFO - __main__ - Step 32914: {'lr': 0.00044808068514082467, 'samples': 6319488, 'steps': 32913, 'loss/train': 2.00506854057312} -11/07/2021 01:53:13 - INFO - __main__ - Step 32915: {'lr': 0.0004480774474398832, 'samples': 6319680, 'steps': 32914, 'loss/train': 1.3997207880020142} -11/07/2021 01:53:14 - INFO - __main__ - Step 32916: {'lr': 0.00044807420964969113, 'samples': 6319872, 'steps': 32915, 'loss/train': 1.5196776390075684} -11/07/2021 01:53:15 - INFO - __main__ - Step 32917: {'lr': 0.0004480709717702499, 'samples': 6320064, 'steps': 32916, 'loss/train': 1.6158102750778198} -11/07/2021 01:53:15 - INFO - __main__ - Step 32918: {'lr': 0.000448067733801561, 'samples': 6320256, 'steps': 32917, 'loss/train': 1.8232070207595825} -11/07/2021 01:53:15 - INFO - __main__ - Step 32919: {'lr': 0.00044806449574362575, 'samples': 6320448, 'steps': 32918, 'loss/train': 1.3813356161117554} -11/07/2021 01:53:16 - INFO - __main__ - Step 32920: {'lr': 0.00044806125759644567, 'samples': 6320640, 'steps': 32919, 'loss/train': 1.3492869138717651} -11/07/2021 01:53:17 - INFO - __main__ - Step 32921: {'lr': 0.00044805801936002225, 'samples': 6320832, 'steps': 32920, 'loss/train': 1.7767366170883179} -11/07/2021 01:53:17 - INFO - __main__ - Step 32922: {'lr': 0.00044805478103435707, 'samples': 6321024, 'steps': 32921, 'loss/train': 0.8150038719177246} -11/07/2021 01:53:17 - INFO - __main__ - Step 32923: {'lr': 0.0004480515426194513, 'samples': 6321216, 'steps': 32922, 'loss/train': 1.5820306539535522} -11/07/2021 01:53:18 - INFO - __main__ - Step 32924: {'lr': 0.0004480483041153066, 'samples': 6321408, 'steps': 32923, 'loss/train': 1.350351095199585} -11/07/2021 01:53:18 - INFO - __main__ - Step 32925: {'lr': 0.00044804506552192447, 'samples': 6321600, 'steps': 32924, 'loss/train': 1.5434849262237549} -11/07/2021 01:53:19 - INFO - __main__ - Step 32926: {'lr': 0.0004480418268393062, 'samples': 6321792, 'steps': 32925, 'loss/train': 1.0062862634658813} -11/07/2021 01:53:20 - INFO - __main__ - Step 32927: {'lr': 0.0004480385880674534, 'samples': 6321984, 'steps': 32926, 'loss/train': 1.7393062114715576} -11/07/2021 01:53:20 - INFO - __main__ - Step 32928: {'lr': 0.00044803534920636744, 'samples': 6322176, 'steps': 32927, 'loss/train': 2.093810796737671} -11/07/2021 01:53:20 - INFO - __main__ - Step 32929: {'lr': 0.00044803211025604985, 'samples': 6322368, 'steps': 32928, 'loss/train': 1.494863748550415} -11/07/2021 01:53:21 - INFO - __main__ - Step 32930: {'lr': 0.000448028871216502, 'samples': 6322560, 'steps': 32929, 'loss/train': 1.5068172216415405} -11/07/2021 01:53:22 - INFO - __main__ - Step 32931: {'lr': 0.0004480256320877254, 'samples': 6322752, 'steps': 32930, 'loss/train': 0.7170737385749817} -11/07/2021 01:53:22 - INFO - __main__ - Step 32932: {'lr': 0.00044802239286972147, 'samples': 6322944, 'steps': 32931, 'loss/train': 1.9031884670257568} -11/07/2021 01:53:22 - INFO - __main__ - Step 32933: {'lr': 0.0004480191535624918, 'samples': 6323136, 'steps': 32932, 'loss/train': 1.4989677667617798} -11/07/2021 01:53:23 - INFO - __main__ - Step 32934: {'lr': 0.0004480159141660377, 'samples': 6323328, 'steps': 32933, 'loss/train': 1.6413919925689697} -11/07/2021 01:53:23 - INFO - __main__ - Step 32935: {'lr': 0.00044801267468036064, 'samples': 6323520, 'steps': 32934, 'loss/train': 1.7031339406967163} -11/07/2021 01:53:23 - INFO - __main__ - Step 32936: {'lr': 0.0004480094351054622, 'samples': 6323712, 'steps': 32935, 'loss/train': 1.2702281475067139} -11/07/2021 01:53:24 - INFO - __main__ - Step 32937: {'lr': 0.00044800619544134375, 'samples': 6323904, 'steps': 32936, 'loss/train': 1.7458767890930176} -11/07/2021 01:53:25 - INFO - __main__ - Step 32938: {'lr': 0.00044800295568800673, 'samples': 6324096, 'steps': 32937, 'loss/train': 1.6693315505981445} -11/07/2021 01:53:25 - INFO - __main__ - Step 32939: {'lr': 0.0004479997158454526, 'samples': 6324288, 'steps': 32938, 'loss/train': 1.2809923887252808} -11/07/2021 01:53:25 - INFO - __main__ - Step 32940: {'lr': 0.00044799647591368296, 'samples': 6324480, 'steps': 32939, 'loss/train': 1.6685653924942017} -11/07/2021 01:53:26 - INFO - __main__ - Step 32941: {'lr': 0.00044799323589269914, 'samples': 6324672, 'steps': 32940, 'loss/train': 2.008671760559082} -11/07/2021 01:53:27 - INFO - __main__ - Step 32942: {'lr': 0.00044798999578250255, 'samples': 6324864, 'steps': 32941, 'loss/train': 1.6154990196228027} -11/07/2021 01:53:27 - INFO - __main__ - Step 32943: {'lr': 0.0004479867555830948, 'samples': 6325056, 'steps': 32942, 'loss/train': 1.376146674156189} -11/07/2021 01:53:27 - INFO - __main__ - Step 32944: {'lr': 0.0004479835152944772, 'samples': 6325248, 'steps': 32943, 'loss/train': 1.3978157043457031} -11/07/2021 01:53:28 - INFO - __main__ - Step 32945: {'lr': 0.00044798027491665135, 'samples': 6325440, 'steps': 32944, 'loss/train': 1.762140154838562} -11/07/2021 01:53:28 - INFO - __main__ - Step 32946: {'lr': 0.00044797703444961857, 'samples': 6325632, 'steps': 32945, 'loss/train': 2.225754976272583} -11/07/2021 01:53:29 - INFO - __main__ - Step 32947: {'lr': 0.00044797379389338045, 'samples': 6325824, 'steps': 32946, 'loss/train': 1.8722946643829346} -11/07/2021 01:53:29 - INFO - __main__ - Step 32948: {'lr': 0.0004479705532479384, 'samples': 6326016, 'steps': 32947, 'loss/train': 1.6617766618728638} -11/07/2021 01:53:30 - INFO - __main__ - Step 32949: {'lr': 0.0004479673125132938, 'samples': 6326208, 'steps': 32948, 'loss/train': 1.630037784576416} -11/07/2021 01:53:30 - INFO - __main__ - Step 32950: {'lr': 0.0004479640716894483, 'samples': 6326400, 'steps': 32949, 'loss/train': 1.559309720993042} -11/07/2021 01:53:31 - INFO - __main__ - Step 32951: {'lr': 0.00044796083077640314, 'samples': 6326592, 'steps': 32950, 'loss/train': 1.286965012550354} -11/07/2021 01:53:32 - INFO - __main__ - Step 32952: {'lr': 0.00044795758977416, 'samples': 6326784, 'steps': 32951, 'loss/train': 1.2813061475753784} -11/07/2021 01:53:32 - INFO - __main__ - Step 32953: {'lr': 0.0004479543486827201, 'samples': 6326976, 'steps': 32952, 'loss/train': 1.5169000625610352} -11/07/2021 01:53:32 - INFO - __main__ - Step 32954: {'lr': 0.0004479511075020851, 'samples': 6327168, 'steps': 32953, 'loss/train': 1.5031007528305054} -11/07/2021 01:53:33 - INFO - __main__ - Step 32955: {'lr': 0.00044794786623225636, 'samples': 6327360, 'steps': 32954, 'loss/train': 1.3424718379974365} -11/07/2021 01:53:33 - INFO - __main__ - Step 32956: {'lr': 0.0004479446248732354, 'samples': 6327552, 'steps': 32955, 'loss/train': 0.9912104606628418} -11/07/2021 01:53:34 - INFO - __main__ - Step 32957: {'lr': 0.00044794138342502354, 'samples': 6327744, 'steps': 32956, 'loss/train': 1.6631126403808594} -11/07/2021 01:53:35 - INFO - __main__ - Step 32958: {'lr': 0.0004479381418876225, 'samples': 6327936, 'steps': 32957, 'loss/train': 1.2141307592391968} -11/07/2021 01:53:35 - INFO - __main__ - Step 32959: {'lr': 0.00044793490026103346, 'samples': 6328128, 'steps': 32958, 'loss/train': 1.517661690711975} -11/07/2021 01:53:35 - INFO - __main__ - Step 32960: {'lr': 0.0004479316585452581, 'samples': 6328320, 'steps': 32959, 'loss/train': 1.7940460443496704} -11/07/2021 01:53:36 - INFO - __main__ - Step 32961: {'lr': 0.0004479284167402977, 'samples': 6328512, 'steps': 32960, 'loss/train': 1.6163368225097656} -11/07/2021 01:53:36 - INFO - __main__ - Step 32962: {'lr': 0.00044792517484615384, 'samples': 6328704, 'steps': 32961, 'loss/train': 1.1192171573638916} -11/07/2021 01:53:37 - INFO - __main__ - Step 32963: {'lr': 0.000447921932862828, 'samples': 6328896, 'steps': 32962, 'loss/train': 0.14294178783893585} -11/07/2021 01:53:37 - INFO - __main__ - Step 32964: {'lr': 0.00044791869079032154, 'samples': 6329088, 'steps': 32963, 'loss/train': 1.6653163433074951} -11/07/2021 01:53:38 - INFO - __main__ - Step 32965: {'lr': 0.000447915448628636, 'samples': 6329280, 'steps': 32964, 'loss/train': 1.598552942276001} -11/07/2021 01:53:38 - INFO - __main__ - Step 32966: {'lr': 0.0004479122063777728, 'samples': 6329472, 'steps': 32965, 'loss/train': 1.8037034273147583} -11/07/2021 01:53:38 - INFO - __main__ - Step 32967: {'lr': 0.0004479089640377334, 'samples': 6329664, 'steps': 32966, 'loss/train': 1.4403834342956543} -11/07/2021 01:53:39 - INFO - __main__ - Step 32968: {'lr': 0.00044790572160851926, 'samples': 6329856, 'steps': 32967, 'loss/train': 1.6658954620361328} -11/07/2021 01:53:40 - INFO - __main__ - Step 32969: {'lr': 0.00044790247909013195, 'samples': 6330048, 'steps': 32968, 'loss/train': 1.7885410785675049} -11/07/2021 01:53:40 - INFO - __main__ - Step 32970: {'lr': 0.0004478992364825728, 'samples': 6330240, 'steps': 32969, 'loss/train': 1.591148018836975} -11/07/2021 01:53:41 - INFO - __main__ - Step 32971: {'lr': 0.00044789599378584324, 'samples': 6330432, 'steps': 32970, 'loss/train': 1.7470932006835938} -11/07/2021 01:53:41 - INFO - __main__ - Step 32972: {'lr': 0.0004478927509999449, 'samples': 6330624, 'steps': 32971, 'loss/train': 1.6637678146362305} -11/07/2021 01:53:42 - INFO - __main__ - Step 32973: {'lr': 0.00044788950812487907, 'samples': 6330816, 'steps': 32972, 'loss/train': 1.8130570650100708} -11/07/2021 01:53:42 - INFO - __main__ - Step 32974: {'lr': 0.0004478862651606472, 'samples': 6331008, 'steps': 32973, 'loss/train': 1.705833077430725} -11/07/2021 01:53:43 - INFO - __main__ - Step 32975: {'lr': 0.000447883022107251, 'samples': 6331200, 'steps': 32974, 'loss/train': 1.3867896795272827} -11/07/2021 01:53:43 - INFO - __main__ - Step 32976: {'lr': 0.00044787977896469167, 'samples': 6331392, 'steps': 32975, 'loss/train': 1.3941127061843872} -11/07/2021 01:53:43 - INFO - __main__ - Step 32977: {'lr': 0.0004478765357329708, 'samples': 6331584, 'steps': 32976, 'loss/train': 1.7699060440063477} -11/07/2021 01:53:44 - INFO - __main__ - Step 32978: {'lr': 0.0004478732924120897, 'samples': 6331776, 'steps': 32977, 'loss/train': 1.2456763982772827} -11/07/2021 01:53:45 - INFO - __main__ - Step 32979: {'lr': 0.0004478700490020501, 'samples': 6331968, 'steps': 32978, 'loss/train': 1.3738280534744263} -11/07/2021 01:53:45 - INFO - __main__ - Step 32980: {'lr': 0.0004478668055028533, 'samples': 6332160, 'steps': 32979, 'loss/train': 1.2072436809539795} -11/07/2021 01:53:45 - INFO - __main__ - Step 32981: {'lr': 0.0004478635619145007, 'samples': 6332352, 'steps': 32980, 'loss/train': 1.619855284690857} -11/07/2021 01:53:46 - INFO - __main__ - Step 32982: {'lr': 0.00044786031823699384, 'samples': 6332544, 'steps': 32981, 'loss/train': 1.4322315454483032} -11/07/2021 01:53:46 - INFO - __main__ - Step 32983: {'lr': 0.0004478570744703342, 'samples': 6332736, 'steps': 32982, 'loss/train': 1.6997398138046265} -11/07/2021 01:53:47 - INFO - __main__ - Step 32984: {'lr': 0.00044785383061452324, 'samples': 6332928, 'steps': 32983, 'loss/train': 1.6025248765945435} -11/07/2021 01:53:48 - INFO - __main__ - Step 32985: {'lr': 0.00044785058666956234, 'samples': 6333120, 'steps': 32984, 'loss/train': 1.3251734972000122} -11/07/2021 01:53:48 - INFO - __main__ - Step 32986: {'lr': 0.000447847342635453, 'samples': 6333312, 'steps': 32985, 'loss/train': 2.5228066444396973} -11/07/2021 01:53:48 - INFO - __main__ - Step 32987: {'lr': 0.00044784409851219675, 'samples': 6333504, 'steps': 32986, 'loss/train': 1.1910200119018555} -11/07/2021 01:53:49 - INFO - __main__ - Step 32988: {'lr': 0.00044784085429979504, 'samples': 6333696, 'steps': 32987, 'loss/train': 1.3550323247909546} -11/07/2021 01:53:50 - INFO - __main__ - Step 32989: {'lr': 0.00044783760999824926, 'samples': 6333888, 'steps': 32988, 'loss/train': 1.6246103048324585} -11/07/2021 01:53:50 - INFO - __main__ - Step 32990: {'lr': 0.00044783436560756086, 'samples': 6334080, 'steps': 32989, 'loss/train': 1.7610799074172974} -11/07/2021 01:53:50 - INFO - __main__ - Step 32991: {'lr': 0.00044783112112773137, 'samples': 6334272, 'steps': 32990, 'loss/train': 1.7590878009796143} -11/07/2021 01:53:51 - INFO - __main__ - Step 32992: {'lr': 0.0004478278765587623, 'samples': 6334464, 'steps': 32991, 'loss/train': 1.602809190750122} -11/07/2021 01:53:51 - INFO - __main__ - Step 32993: {'lr': 0.000447824631900655, 'samples': 6334656, 'steps': 32992, 'loss/train': 1.953904151916504} -11/07/2021 01:53:52 - INFO - __main__ - Step 32994: {'lr': 0.00044782138715341094, 'samples': 6334848, 'steps': 32993, 'loss/train': 1.7642078399658203} -11/07/2021 01:53:53 - INFO - __main__ - Step 32995: {'lr': 0.00044781814231703164, 'samples': 6335040, 'steps': 32994, 'loss/train': 1.3278212547302246} -11/07/2021 01:53:53 - INFO - __main__ - Step 32996: {'lr': 0.00044781489739151856, 'samples': 6335232, 'steps': 32995, 'loss/train': 1.373674988746643} -11/07/2021 01:53:53 - INFO - __main__ - Step 32997: {'lr': 0.00044781165237687306, 'samples': 6335424, 'steps': 32996, 'loss/train': 1.150309443473816} -11/07/2021 01:53:54 - INFO - __main__ - Step 32998: {'lr': 0.00044780840727309676, 'samples': 6335616, 'steps': 32997, 'loss/train': 1.4560761451721191} -11/07/2021 01:53:54 - INFO - __main__ - Step 32999: {'lr': 0.000447805162080191, 'samples': 6335808, 'steps': 32998, 'loss/train': 0.7766704559326172} -11/07/2021 01:53:55 - INFO - __main__ - Step 33000: {'lr': 0.0004478019167981573, 'samples': 6336000, 'steps': 32999, 'loss/train': 1.489380955696106} -11/07/2021 01:53:55 - INFO - __main__ - Step 33001: {'lr': 0.00044779867142699713, 'samples': 6336192, 'steps': 33000, 'loss/train': 1.2429890632629395} -11/07/2021 01:53:56 - INFO - __main__ - Step 33002: {'lr': 0.0004477954259667119, 'samples': 6336384, 'steps': 33001, 'loss/train': 1.9934924840927124} -11/07/2021 01:53:56 - INFO - __main__ - Step 33003: {'lr': 0.00044779218041730314, 'samples': 6336576, 'steps': 33002, 'loss/train': 1.16958487033844} -11/07/2021 01:53:56 - INFO - __main__ - Step 33004: {'lr': 0.00044778893477877225, 'samples': 6336768, 'steps': 33003, 'loss/train': 1.4972314834594727} -11/07/2021 01:53:57 - INFO - __main__ - Step 33005: {'lr': 0.0004477856890511207, 'samples': 6336960, 'steps': 33004, 'loss/train': 2.1951231956481934} -11/07/2021 01:53:58 - INFO - __main__ - Step 33006: {'lr': 0.00044778244323435, 'samples': 6337152, 'steps': 33005, 'loss/train': 1.486146092414856} -11/07/2021 01:53:58 - INFO - __main__ - Step 33007: {'lr': 0.0004477791973284616, 'samples': 6337344, 'steps': 33006, 'loss/train': 1.2795722484588623} -11/07/2021 01:53:59 - INFO - __main__ - Step 33008: {'lr': 0.00044777595133345686, 'samples': 6337536, 'steps': 33007, 'loss/train': 1.5722613334655762} -11/07/2021 01:53:59 - INFO - __main__ - Step 33009: {'lr': 0.0004477727052493374, 'samples': 6337728, 'steps': 33008, 'loss/train': 1.4420450925827026} -11/07/2021 01:54:00 - INFO - __main__ - Step 33010: {'lr': 0.0004477694590761046, 'samples': 6337920, 'steps': 33009, 'loss/train': 1.5427229404449463} -11/07/2021 01:54:00 - INFO - __main__ - Step 33011: {'lr': 0.00044776621281375994, 'samples': 6338112, 'steps': 33010, 'loss/train': 1.6263377666473389} -11/07/2021 01:54:01 - INFO - __main__ - Step 33012: {'lr': 0.00044776296646230487, 'samples': 6338304, 'steps': 33011, 'loss/train': 5.8149800300598145} -11/07/2021 01:54:01 - INFO - __main__ - Step 33013: {'lr': 0.00044775972002174085, 'samples': 6338496, 'steps': 33012, 'loss/train': 1.5900511741638184} -11/07/2021 01:54:01 - INFO - __main__ - Step 33014: {'lr': 0.0004477564734920694, 'samples': 6338688, 'steps': 33013, 'loss/train': 1.2043906450271606} -11/07/2021 01:54:02 - INFO - __main__ - Step 33015: {'lr': 0.0004477532268732919, 'samples': 6338880, 'steps': 33014, 'loss/train': 0.8074337244033813} -11/07/2021 01:54:03 - INFO - __main__ - Step 33016: {'lr': 0.00044774998016540977, 'samples': 6339072, 'steps': 33015, 'loss/train': 2.2873222827911377} -11/07/2021 01:54:03 - INFO - __main__ - Step 33017: {'lr': 0.00044774673336842464, 'samples': 6339264, 'steps': 33016, 'loss/train': 1.6069782972335815} -11/07/2021 01:54:03 - INFO - __main__ - Step 33018: {'lr': 0.0004477434864823379, 'samples': 6339456, 'steps': 33017, 'loss/train': 1.5662287473678589} -11/07/2021 01:54:04 - INFO - __main__ - Step 33019: {'lr': 0.00044774023950715095, 'samples': 6339648, 'steps': 33018, 'loss/train': 1.329482078552246} -11/07/2021 01:54:05 - INFO - __main__ - Step 33020: {'lr': 0.0004477369924428653, 'samples': 6339840, 'steps': 33019, 'loss/train': 1.8639891147613525} -11/07/2021 01:54:05 - INFO - __main__ - Step 33021: {'lr': 0.0004477337452894824, 'samples': 6340032, 'steps': 33020, 'loss/train': 1.563912034034729} -11/07/2021 01:54:05 - INFO - __main__ - Step 33022: {'lr': 0.0004477304980470038, 'samples': 6340224, 'steps': 33021, 'loss/train': 1.6074427366256714} -11/07/2021 01:54:06 - INFO - __main__ - Step 33023: {'lr': 0.0004477272507154308, 'samples': 6340416, 'steps': 33022, 'loss/train': 1.5063848495483398} -11/07/2021 01:54:06 - INFO - __main__ - Step 33024: {'lr': 0.00044772400329476505, 'samples': 6340608, 'steps': 33023, 'loss/train': 1.8239989280700684} -11/07/2021 01:54:07 - INFO - __main__ - Step 33025: {'lr': 0.0004477207557850078, 'samples': 6340800, 'steps': 33024, 'loss/train': 1.4097603559494019} -11/07/2021 01:54:08 - INFO - __main__ - Step 33026: {'lr': 0.00044771750818616067, 'samples': 6340992, 'steps': 33025, 'loss/train': 1.4742379188537598} -11/07/2021 01:54:08 - INFO - __main__ - Step 33027: {'lr': 0.0004477142604982251, 'samples': 6341184, 'steps': 33026, 'loss/train': 1.2127858400344849} -11/07/2021 01:54:08 - INFO - __main__ - Step 33028: {'lr': 0.0004477110127212025, 'samples': 6341376, 'steps': 33027, 'loss/train': 1.0178325176239014} -11/07/2021 01:54:09 - INFO - __main__ - Step 33029: {'lr': 0.00044770776485509445, 'samples': 6341568, 'steps': 33028, 'loss/train': 1.7714896202087402} -11/07/2021 01:54:09 - INFO - __main__ - Step 33030: {'lr': 0.00044770451689990227, 'samples': 6341760, 'steps': 33029, 'loss/train': 1.6244250535964966} -11/07/2021 01:54:10 - INFO - __main__ - Step 33031: {'lr': 0.0004477012688556275, 'samples': 6341952, 'steps': 33030, 'loss/train': 1.3644365072250366} -11/07/2021 01:54:10 - INFO - __main__ - Step 33032: {'lr': 0.0004476980207222716, 'samples': 6342144, 'steps': 33031, 'loss/train': 1.3227752447128296} -11/07/2021 01:54:11 - INFO - __main__ - Step 33033: {'lr': 0.00044769477249983596, 'samples': 6342336, 'steps': 33032, 'loss/train': 1.5948199033737183} -11/07/2021 01:54:11 - INFO - __main__ - Step 33034: {'lr': 0.00044769152418832215, 'samples': 6342528, 'steps': 33033, 'loss/train': 1.3293739557266235} -11/07/2021 01:54:11 - INFO - __main__ - Step 33035: {'lr': 0.00044768827578773164, 'samples': 6342720, 'steps': 33034, 'loss/train': 1.208864688873291} -11/07/2021 01:54:13 - INFO - __main__ - Step 33036: {'lr': 0.00044768502729806574, 'samples': 6342912, 'steps': 33035, 'loss/train': 1.484110951423645} -11/07/2021 01:54:13 - INFO - __main__ - Step 33037: {'lr': 0.0004476817787193261, 'samples': 6343104, 'steps': 33036, 'loss/train': 1.348806381225586} -11/07/2021 01:54:13 - INFO - __main__ - Step 33038: {'lr': 0.0004476785300515141, 'samples': 6343296, 'steps': 33037, 'loss/train': 1.033874750137329} -11/07/2021 01:54:14 - INFO - __main__ - Step 33039: {'lr': 0.0004476752812946312, 'samples': 6343488, 'steps': 33038, 'loss/train': 1.3962721824645996} -11/07/2021 01:54:14 - INFO - __main__ - Step 33040: {'lr': 0.0004476720324486788, 'samples': 6343680, 'steps': 33039, 'loss/train': 1.698463797569275} -11/07/2021 01:54:15 - INFO - __main__ - Step 33041: {'lr': 0.0004476687835136585, 'samples': 6343872, 'steps': 33040, 'loss/train': 1.321233868598938} -11/07/2021 01:54:15 - INFO - __main__ - Step 33042: {'lr': 0.0004476655344895717, 'samples': 6344064, 'steps': 33041, 'loss/train': 1.7292245626449585} -11/07/2021 01:54:16 - INFO - __main__ - Step 33043: {'lr': 0.0004476622853764198, 'samples': 6344256, 'steps': 33042, 'loss/train': 1.1548570394515991} -11/07/2021 01:54:16 - INFO - __main__ - Step 33044: {'lr': 0.00044765903617420436, 'samples': 6344448, 'steps': 33043, 'loss/train': 1.1298271417617798} -11/07/2021 01:54:16 - INFO - __main__ - Step 33045: {'lr': 0.00044765578688292686, 'samples': 6344640, 'steps': 33044, 'loss/train': 1.1050087213516235} -11/07/2021 01:54:17 - INFO - __main__ - Step 33046: {'lr': 0.0004476525375025886, 'samples': 6344832, 'steps': 33045, 'loss/train': 1.1851271390914917} -11/07/2021 01:54:18 - INFO - __main__ - Step 33047: {'lr': 0.00044764928803319126, 'samples': 6345024, 'steps': 33046, 'loss/train': 1.1974475383758545} -11/07/2021 01:54:18 - INFO - __main__ - Step 33048: {'lr': 0.00044764603847473615, 'samples': 6345216, 'steps': 33047, 'loss/train': 0.9402886629104614} -11/07/2021 01:54:18 - INFO - __main__ - Step 33049: {'lr': 0.0004476427888272248, 'samples': 6345408, 'steps': 33048, 'loss/train': 1.2218657732009888} -11/07/2021 01:54:19 - INFO - __main__ - Step 33050: {'lr': 0.0004476395390906586, 'samples': 6345600, 'steps': 33049, 'loss/train': 1.2480854988098145} -11/07/2021 01:54:20 - INFO - __main__ - Step 33051: {'lr': 0.0004476362892650392, 'samples': 6345792, 'steps': 33050, 'loss/train': 1.395213007926941} -11/07/2021 01:54:20 - INFO - __main__ - Step 33052: {'lr': 0.0004476330393503678, 'samples': 6345984, 'steps': 33051, 'loss/train': 1.5939335823059082} -11/07/2021 01:54:20 - INFO - __main__ - Step 33053: {'lr': 0.0004476297893466461, 'samples': 6346176, 'steps': 33052, 'loss/train': 1.820644736289978} -11/07/2021 01:54:21 - INFO - __main__ - Step 33054: {'lr': 0.0004476265392538754, 'samples': 6346368, 'steps': 33053, 'loss/train': 1.1525547504425049} -11/07/2021 01:54:21 - INFO - __main__ - Step 33055: {'lr': 0.0004476232890720573, 'samples': 6346560, 'steps': 33054, 'loss/train': 1.3899204730987549} -11/07/2021 01:54:22 - INFO - __main__ - Step 33056: {'lr': 0.0004476200388011932, 'samples': 6346752, 'steps': 33055, 'loss/train': 1.2742310762405396} -11/07/2021 01:54:23 - INFO - __main__ - Step 33057: {'lr': 0.0004476167884412845, 'samples': 6346944, 'steps': 33056, 'loss/train': 1.7061872482299805} -11/07/2021 01:54:23 - INFO - __main__ - Step 33058: {'lr': 0.00044761353799233273, 'samples': 6347136, 'steps': 33057, 'loss/train': 1.2749007940292358} -11/07/2021 01:54:23 - INFO - __main__ - Step 33059: {'lr': 0.00044761028745433934, 'samples': 6347328, 'steps': 33058, 'loss/train': 1.2940367460250854} -11/07/2021 01:54:24 - INFO - __main__ - Step 33060: {'lr': 0.00044760703682730584, 'samples': 6347520, 'steps': 33059, 'loss/train': 3.064441680908203} -11/07/2021 01:54:25 - INFO - __main__ - Step 33061: {'lr': 0.00044760378611123365, 'samples': 6347712, 'steps': 33060, 'loss/train': 1.6477994918823242} -11/07/2021 01:54:25 - INFO - __main__ - Step 33062: {'lr': 0.0004476005353061242, 'samples': 6347904, 'steps': 33061, 'loss/train': 1.6297001838684082} -11/07/2021 01:54:25 - INFO - __main__ - Step 33063: {'lr': 0.00044759728441197904, 'samples': 6348096, 'steps': 33062, 'loss/train': 1.65060555934906} -11/07/2021 01:54:26 - INFO - __main__ - Step 33064: {'lr': 0.0004475940334287996, 'samples': 6348288, 'steps': 33063, 'loss/train': 1.500831961631775} -11/07/2021 01:54:26 - INFO - __main__ - Step 33065: {'lr': 0.0004475907823565873, 'samples': 6348480, 'steps': 33064, 'loss/train': 1.7707630395889282} -11/07/2021 01:54:27 - INFO - __main__ - Step 33066: {'lr': 0.00044758753119534373, 'samples': 6348672, 'steps': 33065, 'loss/train': 1.3939059972763062} -11/07/2021 01:54:28 - INFO - __main__ - Step 33067: {'lr': 0.0004475842799450702, 'samples': 6348864, 'steps': 33066, 'loss/train': 1.124437689781189} -11/07/2021 01:54:28 - INFO - __main__ - Step 33068: {'lr': 0.0004475810286057682, 'samples': 6349056, 'steps': 33067, 'loss/train': 1.4587339162826538} -11/07/2021 01:54:28 - INFO - __main__ - Step 33069: {'lr': 0.0004475777771774393, 'samples': 6349248, 'steps': 33068, 'loss/train': 1.1545443534851074} -11/07/2021 01:54:29 - INFO - __main__ - Step 33070: {'lr': 0.00044757452566008497, 'samples': 6349440, 'steps': 33069, 'loss/train': 0.7420926690101624} -11/07/2021 01:54:29 - INFO - __main__ - Step 33071: {'lr': 0.00044757127405370645, 'samples': 6349632, 'steps': 33070, 'loss/train': 1.7578048706054688} -11/07/2021 01:54:30 - INFO - __main__ - Step 33072: {'lr': 0.00044756802235830544, 'samples': 6349824, 'steps': 33071, 'loss/train': 1.780644416809082} -11/07/2021 01:54:30 - INFO - __main__ - Step 33073: {'lr': 0.00044756477057388336, 'samples': 6350016, 'steps': 33072, 'loss/train': 1.4639098644256592} -11/07/2021 01:54:31 - INFO - __main__ - Step 33074: {'lr': 0.0004475615187004416, 'samples': 6350208, 'steps': 33073, 'loss/train': 1.2951197624206543} -11/07/2021 01:54:31 - INFO - __main__ - Step 33075: {'lr': 0.0004475582667379817, 'samples': 6350400, 'steps': 33074, 'loss/train': 1.5856717824935913} -11/07/2021 01:54:31 - INFO - __main__ - Step 33076: {'lr': 0.0004475550146865051, 'samples': 6350592, 'steps': 33075, 'loss/train': 1.4116233587265015} -11/07/2021 01:54:33 - INFO - __main__ - Step 33077: {'lr': 0.00044755176254601323, 'samples': 6350784, 'steps': 33076, 'loss/train': 0.7812098860740662} -11/07/2021 01:54:33 - INFO - __main__ - Step 33078: {'lr': 0.00044754851031650756, 'samples': 6350976, 'steps': 33077, 'loss/train': 0.7144190073013306} -11/07/2021 01:54:33 - INFO - __main__ - Step 33079: {'lr': 0.0004475452579979896, 'samples': 6351168, 'steps': 33078, 'loss/train': 1.2214468717575073} -11/07/2021 01:54:34 - INFO - __main__ - Step 33080: {'lr': 0.00044754200559046076, 'samples': 6351360, 'steps': 33079, 'loss/train': 1.2222187519073486} -11/07/2021 01:54:34 - INFO - __main__ - Step 33081: {'lr': 0.0004475387530939226, 'samples': 6351552, 'steps': 33080, 'loss/train': 1.365666389465332} -11/07/2021 01:54:35 - INFO - __main__ - Step 33082: {'lr': 0.00044753550050837654, 'samples': 6351744, 'steps': 33081, 'loss/train': 1.3580585718154907} -11/07/2021 01:54:35 - INFO - __main__ - Step 33083: {'lr': 0.00044753224783382394, 'samples': 6351936, 'steps': 33082, 'loss/train': 1.7456175088882446} -11/07/2021 01:54:36 - INFO - __main__ - Step 33084: {'lr': 0.00044752899507026646, 'samples': 6352128, 'steps': 33083, 'loss/train': 1.4929946660995483} -11/07/2021 01:54:36 - INFO - __main__ - Step 33085: {'lr': 0.00044752574221770537, 'samples': 6352320, 'steps': 33084, 'loss/train': 1.0361472368240356} -11/07/2021 01:54:36 - INFO - __main__ - Step 33086: {'lr': 0.0004475224892761423, 'samples': 6352512, 'steps': 33085, 'loss/train': 1.3302377462387085} -11/07/2021 01:54:38 - INFO - __main__ - Step 33087: {'lr': 0.00044751923624557866, 'samples': 6352704, 'steps': 33086, 'loss/train': 1.3933597803115845} -11/07/2021 01:54:38 - INFO - __main__ - Step 33088: {'lr': 0.0004475159831260158, 'samples': 6352896, 'steps': 33087, 'loss/train': 1.3008657693862915} -11/07/2021 01:54:39 - INFO - __main__ - Step 33089: {'lr': 0.00044751272991745537, 'samples': 6353088, 'steps': 33088, 'loss/train': 1.3040766716003418} -11/07/2021 01:54:39 - INFO - __main__ - Step 33090: {'lr': 0.00044750947661989873, 'samples': 6353280, 'steps': 33089, 'loss/train': 1.4220153093338013} -11/07/2021 01:54:39 - INFO - __main__ - Step 33091: {'lr': 0.0004475062232333474, 'samples': 6353472, 'steps': 33090, 'loss/train': 1.1344974040985107} -11/07/2021 01:54:40 - INFO - __main__ - Step 33092: {'lr': 0.00044750296975780277, 'samples': 6353664, 'steps': 33091, 'loss/train': 1.87221097946167} -11/07/2021 01:54:40 - INFO - __main__ - Step 33093: {'lr': 0.00044749971619326633, 'samples': 6353856, 'steps': 33092, 'loss/train': 1.8795900344848633} -11/07/2021 01:54:41 - INFO - __main__ - Step 33094: {'lr': 0.0004474964625397396, 'samples': 6354048, 'steps': 33093, 'loss/train': 1.8172962665557861} -11/07/2021 01:54:41 - INFO - __main__ - Step 33095: {'lr': 0.000447493208797224, 'samples': 6354240, 'steps': 33094, 'loss/train': 1.0788723230361938} -11/07/2021 01:54:42 - INFO - __main__ - Step 33096: {'lr': 0.00044748995496572105, 'samples': 6354432, 'steps': 33095, 'loss/train': 1.5874394178390503} -11/07/2021 01:54:42 - INFO - __main__ - Step 33097: {'lr': 0.0004474867010452321, 'samples': 6354624, 'steps': 33096, 'loss/train': 1.044918179512024} -11/07/2021 01:54:42 - INFO - __main__ - Step 33098: {'lr': 0.0004474834470357587, 'samples': 6354816, 'steps': 33097, 'loss/train': 0.8912402987480164} -11/07/2021 01:54:43 - INFO - __main__ - Step 33099: {'lr': 0.00044748019293730236, 'samples': 6355008, 'steps': 33098, 'loss/train': 1.5409010648727417} -11/07/2021 01:54:44 - INFO - __main__ - Step 33100: {'lr': 0.0004474769387498645, 'samples': 6355200, 'steps': 33099, 'loss/train': 1.6009552478790283} -11/07/2021 01:54:44 - INFO - __main__ - Step 33101: {'lr': 0.0004474736844734465, 'samples': 6355392, 'steps': 33100, 'loss/train': 1.1920632123947144} -11/07/2021 01:54:44 - INFO - __main__ - Step 33102: {'lr': 0.00044747043010805, 'samples': 6355584, 'steps': 33101, 'loss/train': 1.7007176876068115} -11/07/2021 01:54:45 - INFO - __main__ - Step 33103: {'lr': 0.0004474671756536763, 'samples': 6355776, 'steps': 33102, 'loss/train': 1.4003307819366455} -11/07/2021 01:54:46 - INFO - __main__ - Step 33104: {'lr': 0.00044746392111032695, 'samples': 6355968, 'steps': 33103, 'loss/train': 1.2260773181915283} -11/07/2021 01:54:46 - INFO - __main__ - Step 33105: {'lr': 0.00044746066647800343, 'samples': 6356160, 'steps': 33104, 'loss/train': 1.6759220361709595} -11/07/2021 01:54:47 - INFO - __main__ - Step 33106: {'lr': 0.0004474574117567072, 'samples': 6356352, 'steps': 33105, 'loss/train': 1.1456880569458008} -11/07/2021 01:54:47 - INFO - __main__ - Step 33107: {'lr': 0.00044745415694643964, 'samples': 6356544, 'steps': 33106, 'loss/train': 1.1245477199554443} -11/07/2021 01:54:47 - INFO - __main__ - Step 33108: {'lr': 0.0004474509020472023, 'samples': 6356736, 'steps': 33107, 'loss/train': 1.9677975177764893} -11/07/2021 01:54:48 - INFO - __main__ - Step 33109: {'lr': 0.0004474476470589967, 'samples': 6356928, 'steps': 33108, 'loss/train': 1.1387183666229248} -11/07/2021 01:54:49 - INFO - __main__ - Step 33110: {'lr': 0.0004474443919818241, 'samples': 6357120, 'steps': 33109, 'loss/train': 1.4442769289016724} -11/07/2021 01:54:49 - INFO - __main__ - Step 33111: {'lr': 0.0004474411368156862, 'samples': 6357312, 'steps': 33110, 'loss/train': 1.4242744445800781} -11/07/2021 01:54:49 - INFO - __main__ - Step 33112: {'lr': 0.00044743788156058437, 'samples': 6357504, 'steps': 33111, 'loss/train': 1.6928004026412964} -11/07/2021 01:54:50 - INFO - __main__ - Step 33113: {'lr': 0.00044743462621652007, 'samples': 6357696, 'steps': 33112, 'loss/train': 1.145045518875122} -11/07/2021 01:54:51 - INFO - __main__ - Step 33114: {'lr': 0.0004474313707834947, 'samples': 6357888, 'steps': 33113, 'loss/train': 4.484914779663086} -11/07/2021 01:54:51 - INFO - __main__ - Step 33115: {'lr': 0.00044742811526150996, 'samples': 6358080, 'steps': 33114, 'loss/train': 1.396562933921814} -11/07/2021 01:54:51 - INFO - __main__ - Step 33116: {'lr': 0.000447424859650567, 'samples': 6358272, 'steps': 33115, 'loss/train': 1.4449611902236938} -11/07/2021 01:54:52 - INFO - __main__ - Step 33117: {'lr': 0.00044742160395066756, 'samples': 6358464, 'steps': 33116, 'loss/train': 1.3184423446655273} -11/07/2021 01:54:52 - INFO - __main__ - Step 33118: {'lr': 0.0004474183481618129, 'samples': 6358656, 'steps': 33117, 'loss/train': 1.3420227766036987} -11/07/2021 01:54:52 - INFO - __main__ - Step 33119: {'lr': 0.00044741509228400465, 'samples': 6358848, 'steps': 33118, 'loss/train': 5.817997932434082} -11/07/2021 01:54:54 - INFO - __main__ - Step 33120: {'lr': 0.0004474118363172441, 'samples': 6359040, 'steps': 33119, 'loss/train': 1.763843059539795} -11/07/2021 01:54:54 - INFO - __main__ - Step 33121: {'lr': 0.000447408580261533, 'samples': 6359232, 'steps': 33120, 'loss/train': 1.727284550666809} -11/07/2021 01:54:54 - INFO - __main__ - Step 33122: {'lr': 0.0004474053241168725, 'samples': 6359424, 'steps': 33121, 'loss/train': 1.9628920555114746} -11/07/2021 01:54:55 - INFO - __main__ - Step 33123: {'lr': 0.00044740206788326423, 'samples': 6359616, 'steps': 33122, 'loss/train': 1.0621058940887451} -11/07/2021 01:54:55 - INFO - __main__ - Step 33124: {'lr': 0.0004473988115607097, 'samples': 6359808, 'steps': 33123, 'loss/train': 1.2733900547027588} -11/07/2021 01:54:56 - INFO - __main__ - Step 33125: {'lr': 0.00044739555514921025, 'samples': 6360000, 'steps': 33124, 'loss/train': 1.3947138786315918} -11/07/2021 01:54:56 - INFO - __main__ - Step 33126: {'lr': 0.0004473922986487674, 'samples': 6360192, 'steps': 33125, 'loss/train': 1.3780709505081177} -11/07/2021 01:54:57 - INFO - __main__ - Step 33127: {'lr': 0.00044738904205938264, 'samples': 6360384, 'steps': 33126, 'loss/train': 1.715932846069336} -11/07/2021 01:54:57 - INFO - __main__ - Step 33128: {'lr': 0.00044738578538105746, 'samples': 6360576, 'steps': 33127, 'loss/train': 1.3106427192687988} -11/07/2021 01:54:58 - INFO - __main__ - Step 33129: {'lr': 0.0004473825286137933, 'samples': 6360768, 'steps': 33128, 'loss/train': 1.4293633699417114} -11/07/2021 01:54:58 - INFO - __main__ - Step 33130: {'lr': 0.0004473792717575915, 'samples': 6360960, 'steps': 33129, 'loss/train': 1.9495084285736084} -11/07/2021 01:54:59 - INFO - __main__ - Step 33131: {'lr': 0.00044737601481245376, 'samples': 6361152, 'steps': 33130, 'loss/train': 1.7546299695968628} -11/07/2021 01:54:59 - INFO - __main__ - Step 33132: {'lr': 0.00044737275777838136, 'samples': 6361344, 'steps': 33131, 'loss/train': 1.9084562063217163} -11/07/2021 01:55:00 - INFO - __main__ - Step 33133: {'lr': 0.0004473695006553759, 'samples': 6361536, 'steps': 33132, 'loss/train': 1.3284623622894287} -11/07/2021 01:55:00 - INFO - __main__ - Step 33134: {'lr': 0.0004473662434434388, 'samples': 6361728, 'steps': 33133, 'loss/train': 1.762020230293274} -11/07/2021 01:55:00 - INFO - __main__ - Step 33135: {'lr': 0.00044736298614257144, 'samples': 6361920, 'steps': 33134, 'loss/train': 2.226206064224243} -11/07/2021 01:55:01 - INFO - __main__ - Step 33136: {'lr': 0.0004473597287527754, 'samples': 6362112, 'steps': 33135, 'loss/train': 1.3786884546279907} -11/07/2021 01:55:02 - INFO - __main__ - Step 33137: {'lr': 0.00044735647127405216, 'samples': 6362304, 'steps': 33136, 'loss/train': 0.980176568031311} -11/07/2021 01:55:02 - INFO - __main__ - Step 33138: {'lr': 0.00044735321370640316, 'samples': 6362496, 'steps': 33137, 'loss/train': 1.749757170677185} -11/07/2021 01:55:02 - INFO - __main__ - Step 33139: {'lr': 0.00044734995604982973, 'samples': 6362688, 'steps': 33138, 'loss/train': 1.522831916809082} -11/07/2021 01:55:03 - INFO - __main__ - Step 33140: {'lr': 0.0004473466983043335, 'samples': 6362880, 'steps': 33139, 'loss/train': 1.335568904876709} -11/07/2021 01:55:04 - INFO - __main__ - Step 33141: {'lr': 0.0004473434404699159, 'samples': 6363072, 'steps': 33140, 'loss/train': 1.7207343578338623} -11/07/2021 01:55:05 - INFO - __main__ - Step 33142: {'lr': 0.00044734018254657845, 'samples': 6363264, 'steps': 33141, 'loss/train': 1.8754812479019165} -11/07/2021 01:55:05 - INFO - __main__ - Step 33143: {'lr': 0.00044733692453432253, 'samples': 6363456, 'steps': 33142, 'loss/train': 1.7550863027572632} -11/07/2021 01:55:05 - INFO - __main__ - Step 33144: {'lr': 0.00044733366643314956, 'samples': 6363648, 'steps': 33143, 'loss/train': 1.365227222442627} -11/07/2021 01:55:06 - INFO - __main__ - Step 33145: {'lr': 0.00044733040824306117, 'samples': 6363840, 'steps': 33144, 'loss/train': 1.446139931678772} -11/07/2021 01:55:07 - INFO - __main__ - Step 33146: {'lr': 0.00044732714996405866, 'samples': 6364032, 'steps': 33145, 'loss/train': 0.4527989327907562} -11/07/2021 01:55:07 - INFO - __main__ - Step 33147: {'lr': 0.0004473238915961436, 'samples': 6364224, 'steps': 33146, 'loss/train': 1.3928862810134888} -11/07/2021 01:55:08 - INFO - __main__ - Step 33148: {'lr': 0.0004473206331393175, 'samples': 6364416, 'steps': 33147, 'loss/train': 1.408677577972412} -11/07/2021 01:55:08 - INFO - __main__ - Step 33149: {'lr': 0.0004473173745935818, 'samples': 6364608, 'steps': 33148, 'loss/train': 1.4953867197036743} -11/07/2021 01:55:08 - INFO - __main__ - Step 33150: {'lr': 0.00044731411595893785, 'samples': 6364800, 'steps': 33149, 'loss/train': 0.8405914306640625} -11/07/2021 01:55:09 - INFO - __main__ - Step 33151: {'lr': 0.00044731085723538725, 'samples': 6364992, 'steps': 33150, 'loss/train': 1.1372485160827637} -11/07/2021 01:55:10 - INFO - __main__ - Step 33152: {'lr': 0.00044730759842293136, 'samples': 6365184, 'steps': 33151, 'loss/train': 0.7570802569389343} -11/07/2021 01:55:10 - INFO - __main__ - Step 33153: {'lr': 0.0004473043395215718, 'samples': 6365376, 'steps': 33152, 'loss/train': 1.256797432899475} -11/07/2021 01:55:10 - INFO - __main__ - Step 33154: {'lr': 0.00044730108053130986, 'samples': 6365568, 'steps': 33153, 'loss/train': 1.3361729383468628} -11/07/2021 01:55:11 - INFO - __main__ - Step 33155: {'lr': 0.00044729782145214717, 'samples': 6365760, 'steps': 33154, 'loss/train': 1.0276557207107544} -11/07/2021 01:55:12 - INFO - __main__ - Step 33156: {'lr': 0.00044729456228408506, 'samples': 6365952, 'steps': 33155, 'loss/train': 1.8448816537857056} -11/07/2021 01:55:12 - INFO - __main__ - Step 33157: {'lr': 0.00044729130302712504, 'samples': 6366144, 'steps': 33156, 'loss/train': 0.8225948810577393} -11/07/2021 01:55:12 - INFO - __main__ - Step 33158: {'lr': 0.00044728804368126873, 'samples': 6366336, 'steps': 33157, 'loss/train': 1.77656888961792} -11/07/2021 01:55:13 - INFO - __main__ - Step 33159: {'lr': 0.00044728478424651744, 'samples': 6366528, 'steps': 33158, 'loss/train': 0.8608505129814148} -11/07/2021 01:55:13 - INFO - __main__ - Step 33160: {'lr': 0.0004472815247228726, 'samples': 6366720, 'steps': 33159, 'loss/train': 1.0385569334030151} -11/07/2021 01:55:13 - INFO - __main__ - Step 33161: {'lr': 0.00044727826511033577, 'samples': 6366912, 'steps': 33160, 'loss/train': 1.214247226715088} -11/07/2021 01:55:15 - INFO - __main__ - Step 33162: {'lr': 0.0004472750054089084, 'samples': 6367104, 'steps': 33161, 'loss/train': 0.7041410207748413} -11/07/2021 01:55:15 - INFO - __main__ - Step 33163: {'lr': 0.00044727174561859194, 'samples': 6367296, 'steps': 33162, 'loss/train': 1.3713628053665161} -11/07/2021 01:55:15 - INFO - __main__ - Step 33164: {'lr': 0.00044726848573938796, 'samples': 6367488, 'steps': 33163, 'loss/train': 1.7455008029937744} -11/07/2021 01:55:16 - INFO - __main__ - Step 33165: {'lr': 0.0004472652257712978, 'samples': 6367680, 'steps': 33164, 'loss/train': 1.180960774421692} -11/07/2021 01:55:16 - INFO - __main__ - Step 33166: {'lr': 0.0004472619657143229, 'samples': 6367872, 'steps': 33165, 'loss/train': 1.4132847785949707} -11/07/2021 01:55:17 - INFO - __main__ - Step 33167: {'lr': 0.00044725870556846495, 'samples': 6368064, 'steps': 33166, 'loss/train': 1.4858864545822144} -11/07/2021 01:55:17 - INFO - __main__ - Step 33168: {'lr': 0.00044725544533372516, 'samples': 6368256, 'steps': 33167, 'loss/train': 1.4591635465621948} -11/07/2021 01:55:18 - INFO - __main__ - Step 33169: {'lr': 0.00044725218501010514, 'samples': 6368448, 'steps': 33168, 'loss/train': 1.80044686794281} -11/07/2021 01:55:18 - INFO - __main__ - Step 33170: {'lr': 0.0004472489245976063, 'samples': 6368640, 'steps': 33169, 'loss/train': 1.5054649114608765} -11/07/2021 01:55:18 - INFO - __main__ - Step 33171: {'lr': 0.00044724566409623013, 'samples': 6368832, 'steps': 33170, 'loss/train': 1.65577232837677} -11/07/2021 01:55:19 - INFO - __main__ - Step 33172: {'lr': 0.0004472424035059782, 'samples': 6369024, 'steps': 33171, 'loss/train': 1.4333148002624512} -11/07/2021 01:55:20 - INFO - __main__ - Step 33173: {'lr': 0.0004472391428268518, 'samples': 6369216, 'steps': 33172, 'loss/train': 1.6931020021438599} -11/07/2021 01:55:20 - INFO - __main__ - Step 33174: {'lr': 0.00044723588205885254, 'samples': 6369408, 'steps': 33173, 'loss/train': 1.4227957725524902} -11/07/2021 01:55:20 - INFO - __main__ - Step 33175: {'lr': 0.00044723262120198177, 'samples': 6369600, 'steps': 33174, 'loss/train': 1.5991913080215454} -11/07/2021 01:55:21 - INFO - __main__ - Step 33176: {'lr': 0.00044722936025624107, 'samples': 6369792, 'steps': 33175, 'loss/train': 1.453271746635437} -11/07/2021 01:55:21 - INFO - __main__ - Step 33177: {'lr': 0.00044722609922163184, 'samples': 6369984, 'steps': 33176, 'loss/train': 1.264987587928772} -11/07/2021 01:55:22 - INFO - __main__ - Step 33178: {'lr': 0.0004472228380981556, 'samples': 6370176, 'steps': 33177, 'loss/train': 2.117309093475342} -11/07/2021 01:55:23 - INFO - __main__ - Step 33179: {'lr': 0.0004472195768858138, 'samples': 6370368, 'steps': 33178, 'loss/train': 1.6110841035842896} -11/07/2021 01:55:23 - INFO - __main__ - Step 33180: {'lr': 0.0004472163155846078, 'samples': 6370560, 'steps': 33179, 'loss/train': 1.5283021926879883} -11/07/2021 01:55:23 - INFO - __main__ - Step 33181: {'lr': 0.0004472130541945393, 'samples': 6370752, 'steps': 33180, 'loss/train': 1.6061872243881226} -11/07/2021 01:55:24 - INFO - __main__ - Step 33182: {'lr': 0.00044720979271560963, 'samples': 6370944, 'steps': 33181, 'loss/train': 1.4953434467315674} -11/07/2021 01:55:25 - INFO - __main__ - Step 33183: {'lr': 0.00044720653114782024, 'samples': 6371136, 'steps': 33182, 'loss/train': 1.4750101566314697} -11/07/2021 01:55:25 - INFO - __main__ - Step 33184: {'lr': 0.0004472032694911726, 'samples': 6371328, 'steps': 33183, 'loss/train': 1.404825210571289} -11/07/2021 01:55:25 - INFO - __main__ - Step 33185: {'lr': 0.0004472000077456683, 'samples': 6371520, 'steps': 33184, 'loss/train': 1.6009184122085571} -11/07/2021 01:55:26 - INFO - __main__ - Step 33186: {'lr': 0.0004471967459113086, 'samples': 6371712, 'steps': 33185, 'loss/train': 0.953913688659668} -11/07/2021 01:55:26 - INFO - __main__ - Step 33187: {'lr': 0.0004471934839880951, 'samples': 6371904, 'steps': 33186, 'loss/train': 1.4461911916732788} -11/07/2021 01:55:27 - INFO - __main__ - Step 33188: {'lr': 0.00044719022197602933, 'samples': 6372096, 'steps': 33187, 'loss/train': 1.843044400215149} -11/07/2021 01:55:27 - INFO - __main__ - Step 33189: {'lr': 0.0004471869598751127, 'samples': 6372288, 'steps': 33188, 'loss/train': 1.5555542707443237} -11/07/2021 01:55:28 - INFO - __main__ - Step 33190: {'lr': 0.0004471836976853466, 'samples': 6372480, 'steps': 33189, 'loss/train': 1.6003851890563965} -11/07/2021 01:55:28 - INFO - __main__ - Step 33191: {'lr': 0.00044718043540673257, 'samples': 6372672, 'steps': 33190, 'loss/train': 1.7337013483047485} -11/07/2021 01:55:29 - INFO - __main__ - Step 33192: {'lr': 0.0004471771730392722, 'samples': 6372864, 'steps': 33191, 'loss/train': 1.5682861804962158} -11/07/2021 01:55:29 - INFO - __main__ - Step 33193: {'lr': 0.0004471739105829667, 'samples': 6373056, 'steps': 33192, 'loss/train': 1.4911301136016846} -11/07/2021 01:55:30 - INFO - __main__ - Step 33194: {'lr': 0.00044717064803781773, 'samples': 6373248, 'steps': 33193, 'loss/train': 1.4212634563446045} -11/07/2021 01:55:30 - INFO - __main__ - Step 33195: {'lr': 0.00044716738540382674, 'samples': 6373440, 'steps': 33194, 'loss/train': 1.1901922225952148} -11/07/2021 01:55:31 - INFO - __main__ - Step 33196: {'lr': 0.0004471641226809951, 'samples': 6373632, 'steps': 33195, 'loss/train': 1.32235848903656} -11/07/2021 01:55:31 - INFO - __main__ - Step 33197: {'lr': 0.0004471608598693244, 'samples': 6373824, 'steps': 33196, 'loss/train': 1.7602043151855469} -11/07/2021 01:55:32 - INFO - __main__ - Step 33198: {'lr': 0.000447157596968816, 'samples': 6374016, 'steps': 33197, 'loss/train': 1.5535030364990234} -11/07/2021 01:55:32 - INFO - __main__ - Step 33199: {'lr': 0.0004471543339794715, 'samples': 6374208, 'steps': 33198, 'loss/train': 1.2976843118667603} -11/07/2021 01:55:33 - INFO - __main__ - Step 33200: {'lr': 0.00044715107090129223, 'samples': 6374400, 'steps': 33199, 'loss/train': 1.5983165502548218} -11/07/2021 01:55:33 - INFO - __main__ - Step 33201: {'lr': 0.00044714780773427975, 'samples': 6374592, 'steps': 33200, 'loss/train': 1.6424078941345215} -11/07/2021 01:55:33 - INFO - __main__ - Step 33202: {'lr': 0.00044714454447843555, 'samples': 6374784, 'steps': 33201, 'loss/train': 1.4659985303878784} -11/07/2021 01:55:34 - INFO - __main__ - Step 33203: {'lr': 0.0004471412811337611, 'samples': 6374976, 'steps': 33202, 'loss/train': 1.6096456050872803} -11/07/2021 01:55:35 - INFO - __main__ - Step 33204: {'lr': 0.00044713801770025774, 'samples': 6375168, 'steps': 33203, 'loss/train': 1.6545803546905518} -11/07/2021 01:55:35 - INFO - __main__ - Step 33205: {'lr': 0.00044713475417792705, 'samples': 6375360, 'steps': 33204, 'loss/train': 1.561865210533142} -11/07/2021 01:55:36 - INFO - __main__ - Step 33206: {'lr': 0.0004471314905667705, 'samples': 6375552, 'steps': 33205, 'loss/train': 1.2108513116836548} -11/07/2021 01:55:36 - INFO - __main__ - Step 33207: {'lr': 0.00044712822686678955, 'samples': 6375744, 'steps': 33206, 'loss/train': 1.668056607246399} -11/07/2021 01:55:36 - INFO - __main__ - Step 33208: {'lr': 0.00044712496307798566, 'samples': 6375936, 'steps': 33207, 'loss/train': 1.120060682296753} -11/07/2021 01:55:37 - INFO - __main__ - Step 33209: {'lr': 0.0004471216992003603, 'samples': 6376128, 'steps': 33208, 'loss/train': 1.4917442798614502} -11/07/2021 01:55:38 - INFO - __main__ - Step 33210: {'lr': 0.0004471184352339149, 'samples': 6376320, 'steps': 33209, 'loss/train': 1.4822920560836792} -11/07/2021 01:55:38 - INFO - __main__ - Step 33211: {'lr': 0.00044711517117865105, 'samples': 6376512, 'steps': 33210, 'loss/train': 1.4753338098526} -11/07/2021 01:55:38 - INFO - __main__ - Step 33212: {'lr': 0.00044711190703457005, 'samples': 6376704, 'steps': 33211, 'loss/train': 1.2352567911148071} -11/07/2021 01:55:39 - INFO - __main__ - Step 33213: {'lr': 0.00044710864280167353, 'samples': 6376896, 'steps': 33212, 'loss/train': 1.4942405223846436} -11/07/2021 01:55:40 - INFO - __main__ - Step 33214: {'lr': 0.0004471053784799629, 'samples': 6377088, 'steps': 33213, 'loss/train': 1.5369149446487427} -11/07/2021 01:55:40 - INFO - __main__ - Step 33215: {'lr': 0.0004471021140694396, 'samples': 6377280, 'steps': 33214, 'loss/train': 1.7257037162780762} -11/07/2021 01:55:40 - INFO - __main__ - Step 33216: {'lr': 0.0004470988495701052, 'samples': 6377472, 'steps': 33215, 'loss/train': 1.591020107269287} -11/07/2021 01:55:41 - INFO - __main__ - Step 33217: {'lr': 0.00044709558498196104, 'samples': 6377664, 'steps': 33216, 'loss/train': 1.453142523765564} -11/07/2021 01:55:41 - INFO - __main__ - Step 33218: {'lr': 0.00044709232030500865, 'samples': 6377856, 'steps': 33217, 'loss/train': 1.6254675388336182} -11/07/2021 01:55:42 - INFO - __main__ - Step 33219: {'lr': 0.0004470890555392495, 'samples': 6378048, 'steps': 33218, 'loss/train': 1.5756146907806396} -11/07/2021 01:55:42 - INFO - __main__ - Step 33220: {'lr': 0.00044708579068468505, 'samples': 6378240, 'steps': 33219, 'loss/train': 1.5764384269714355} -11/07/2021 01:55:43 - INFO - __main__ - Step 33221: {'lr': 0.0004470825257413168, 'samples': 6378432, 'steps': 33220, 'loss/train': 1.4939641952514648} -11/07/2021 01:55:43 - INFO - __main__ - Step 33222: {'lr': 0.00044707926070914624, 'samples': 6378624, 'steps': 33221, 'loss/train': 1.782503604888916} -11/07/2021 01:55:43 - INFO - __main__ - Step 33223: {'lr': 0.0004470759955881748, 'samples': 6378816, 'steps': 33222, 'loss/train': 1.5841856002807617} -11/07/2021 01:55:44 - INFO - __main__ - Step 33224: {'lr': 0.0004470727303784039, 'samples': 6379008, 'steps': 33223, 'loss/train': 1.5153917074203491} -11/07/2021 01:55:45 - INFO - __main__ - Step 33225: {'lr': 0.00044706946507983513, 'samples': 6379200, 'steps': 33224, 'loss/train': 1.5163484811782837} -11/07/2021 01:55:45 - INFO - __main__ - Step 33226: {'lr': 0.00044706619969246984, 'samples': 6379392, 'steps': 33225, 'loss/train': 1.426256775856018} -11/07/2021 01:55:46 - INFO - __main__ - Step 33227: {'lr': 0.0004470629342163096, 'samples': 6379584, 'steps': 33226, 'loss/train': 1.8674992322921753} -11/07/2021 01:55:46 - INFO - __main__ - Step 33228: {'lr': 0.00044705966865135583, 'samples': 6379776, 'steps': 33227, 'loss/train': 2.1757476329803467} -11/07/2021 01:55:47 - INFO - __main__ - Step 33229: {'lr': 0.00044705640299761004, 'samples': 6379968, 'steps': 33228, 'loss/train': 1.5316298007965088} -11/07/2021 01:55:47 - INFO - __main__ - Step 33230: {'lr': 0.0004470531372550736, 'samples': 6380160, 'steps': 33229, 'loss/train': 1.7049391269683838} -11/07/2021 01:55:48 - INFO - __main__ - Step 33231: {'lr': 0.00044704987142374814, 'samples': 6380352, 'steps': 33230, 'loss/train': 1.018943428993225} -11/07/2021 01:55:48 - INFO - __main__ - Step 33232: {'lr': 0.00044704660550363507, 'samples': 6380544, 'steps': 33231, 'loss/train': 1.9485957622528076} -11/07/2021 01:55:48 - INFO - __main__ - Step 33233: {'lr': 0.00044704333949473576, 'samples': 6380736, 'steps': 33232, 'loss/train': 1.3192261457443237} -11/07/2021 01:55:49 - INFO - __main__ - Step 33234: {'lr': 0.0004470400733970518, 'samples': 6380928, 'steps': 33233, 'loss/train': 1.5830713510513306} -11/07/2021 01:55:50 - INFO - __main__ - Step 33235: {'lr': 0.0004470368072105846, 'samples': 6381120, 'steps': 33234, 'loss/train': 1.4584518671035767} -11/07/2021 01:55:50 - INFO - __main__ - Step 33236: {'lr': 0.00044703354093533564, 'samples': 6381312, 'steps': 33235, 'loss/train': 1.4330943822860718} -11/07/2021 01:55:50 - INFO - __main__ - Step 33237: {'lr': 0.0004470302745713065, 'samples': 6381504, 'steps': 33236, 'loss/train': 1.4370431900024414} -11/07/2021 01:55:51 - INFO - __main__ - Step 33238: {'lr': 0.0004470270081184985, 'samples': 6381696, 'steps': 33237, 'loss/train': 1.5408488512039185} -11/07/2021 01:55:51 - INFO - __main__ - Step 33239: {'lr': 0.00044702374157691316, 'samples': 6381888, 'steps': 33238, 'loss/train': 1.9147197008132935} -11/07/2021 01:55:52 - INFO - __main__ - Step 33240: {'lr': 0.00044702047494655194, 'samples': 6382080, 'steps': 33239, 'loss/train': 1.4002445936203003} -11/07/2021 01:55:53 - INFO - __main__ - Step 33241: {'lr': 0.0004470172082274164, 'samples': 6382272, 'steps': 33240, 'loss/train': 1.276917815208435} -11/07/2021 01:55:53 - INFO - __main__ - Step 33242: {'lr': 0.0004470139414195079, 'samples': 6382464, 'steps': 33241, 'loss/train': 1.0814828872680664} -11/07/2021 01:55:53 - INFO - __main__ - Step 33243: {'lr': 0.00044701067452282796, 'samples': 6382656, 'steps': 33242, 'loss/train': 0.8401081562042236} -11/07/2021 01:55:54 - INFO - __main__ - Step 33244: {'lr': 0.00044700740753737806, 'samples': 6382848, 'steps': 33243, 'loss/train': 1.2903378009796143} -11/07/2021 01:55:55 - INFO - __main__ - Step 33245: {'lr': 0.0004470041404631597, 'samples': 6383040, 'steps': 33244, 'loss/train': 0.9164215922355652} -11/07/2021 01:55:55 - INFO - __main__ - Step 33246: {'lr': 0.0004470008733001742, 'samples': 6383232, 'steps': 33245, 'loss/train': 1.027038335800171} -11/07/2021 01:55:55 - INFO - __main__ - Step 33247: {'lr': 0.0004469976060484233, 'samples': 6383424, 'steps': 33246, 'loss/train': 1.533467411994934} -11/07/2021 01:55:56 - INFO - __main__ - Step 33248: {'lr': 0.00044699433870790817, 'samples': 6383616, 'steps': 33247, 'loss/train': 1.3193182945251465} -11/07/2021 01:55:56 - INFO - __main__ - Step 33249: {'lr': 0.00044699107127863056, 'samples': 6383808, 'steps': 33248, 'loss/train': 1.3086721897125244} -11/07/2021 01:55:58 - INFO - __main__ - Step 33250: {'lr': 0.0004469878037605917, 'samples': 6384000, 'steps': 33249, 'loss/train': 1.1139196157455444} -11/07/2021 01:55:58 - INFO - __main__ - Step 33251: {'lr': 0.0004469845361537933, 'samples': 6384192, 'steps': 33250, 'loss/train': 1.488115668296814} -11/07/2021 01:55:58 - INFO - __main__ - Step 33252: {'lr': 0.0004469812684582366, 'samples': 6384384, 'steps': 33251, 'loss/train': 1.7786945104599} -11/07/2021 01:55:59 - INFO - __main__ - Step 33253: {'lr': 0.00044697800067392327, 'samples': 6384576, 'steps': 33252, 'loss/train': 1.573535680770874} -11/07/2021 01:55:59 - INFO - __main__ - Step 33254: {'lr': 0.00044697473280085455, 'samples': 6384768, 'steps': 33253, 'loss/train': 1.5784077644348145} -11/07/2021 01:55:59 - INFO - __main__ - Step 33255: {'lr': 0.0004469714648390322, 'samples': 6384960, 'steps': 33254, 'loss/train': 1.598545789718628} -11/07/2021 01:56:01 - INFO - __main__ - Step 33256: {'lr': 0.00044696819678845744, 'samples': 6385152, 'steps': 33255, 'loss/train': 1.2595524787902832} -11/07/2021 01:56:01 - INFO - __main__ - Step 33257: {'lr': 0.000446964928649132, 'samples': 6385344, 'steps': 33256, 'loss/train': 1.6089627742767334} -11/07/2021 01:56:01 - INFO - __main__ - Step 33258: {'lr': 0.00044696166042105704, 'samples': 6385536, 'steps': 33257, 'loss/train': 1.3691866397857666} -11/07/2021 01:56:02 - INFO - __main__ - Step 33259: {'lr': 0.0004469583921042343, 'samples': 6385728, 'steps': 33258, 'loss/train': 0.2382746934890747} -11/07/2021 01:56:02 - INFO - __main__ - Step 33260: {'lr': 0.0004469551236986651, 'samples': 6385920, 'steps': 33259, 'loss/train': 1.6525382995605469} -11/07/2021 01:56:03 - INFO - __main__ - Step 33261: {'lr': 0.00044695185520435087, 'samples': 6386112, 'steps': 33260, 'loss/train': 1.2914975881576538} -11/07/2021 01:56:03 - INFO - __main__ - Step 33262: {'lr': 0.00044694858662129333, 'samples': 6386304, 'steps': 33261, 'loss/train': 1.8371024131774902} -11/07/2021 01:56:04 - INFO - __main__ - Step 33263: {'lr': 0.0004469453179494938, 'samples': 6386496, 'steps': 33262, 'loss/train': 1.6654703617095947} -11/07/2021 01:56:04 - INFO - __main__ - Step 33264: {'lr': 0.00044694204918895367, 'samples': 6386688, 'steps': 33263, 'loss/train': 1.9074795246124268} -11/07/2021 01:56:04 - INFO - __main__ - Step 33265: {'lr': 0.0004469387803396745, 'samples': 6386880, 'steps': 33264, 'loss/train': 1.5051642656326294} -11/07/2021 01:56:05 - INFO - __main__ - Step 33266: {'lr': 0.0004469355114016577, 'samples': 6387072, 'steps': 33265, 'loss/train': 1.4132717847824097} -11/07/2021 01:56:06 - INFO - __main__ - Step 33267: {'lr': 0.00044693224237490485, 'samples': 6387264, 'steps': 33266, 'loss/train': 1.890087366104126} -11/07/2021 01:56:06 - INFO - __main__ - Step 33268: {'lr': 0.00044692897325941737, 'samples': 6387456, 'steps': 33267, 'loss/train': 1.05165433883667} -11/07/2021 01:56:06 - INFO - __main__ - Step 33269: {'lr': 0.00044692570405519683, 'samples': 6387648, 'steps': 33268, 'loss/train': 1.416410207748413} -11/07/2021 01:56:07 - INFO - __main__ - Step 33270: {'lr': 0.0004469224347622445, 'samples': 6387840, 'steps': 33269, 'loss/train': 1.4195667505264282} -11/07/2021 01:56:08 - INFO - __main__ - Step 33271: {'lr': 0.000446919165380562, 'samples': 6388032, 'steps': 33270, 'loss/train': 1.4561563730239868} -11/07/2021 01:56:08 - INFO - __main__ - Step 33272: {'lr': 0.0004469158959101507, 'samples': 6388224, 'steps': 33271, 'loss/train': 1.471016764640808} -11/07/2021 01:56:09 - INFO - __main__ - Step 33273: {'lr': 0.00044691262635101223, 'samples': 6388416, 'steps': 33272, 'loss/train': 1.933846354484558} -11/07/2021 01:56:09 - INFO - __main__ - Step 33274: {'lr': 0.0004469093567031479, 'samples': 6388608, 'steps': 33273, 'loss/train': 0.4682588577270508} -11/07/2021 01:56:09 - INFO - __main__ - Step 33275: {'lr': 0.00044690608696655923, 'samples': 6388800, 'steps': 33274, 'loss/train': 0.1448262631893158} -11/07/2021 01:56:10 - INFO - __main__ - Step 33276: {'lr': 0.0004469028171412478, 'samples': 6388992, 'steps': 33275, 'loss/train': 1.8468519449234009} -11/07/2021 01:56:11 - INFO - __main__ - Step 33277: {'lr': 0.00044689954722721494, 'samples': 6389184, 'steps': 33276, 'loss/train': 1.537747859954834} -11/07/2021 01:56:11 - INFO - __main__ - Step 33278: {'lr': 0.0004468962772244622, 'samples': 6389376, 'steps': 33277, 'loss/train': 1.2993748188018799} -11/07/2021 01:56:11 - INFO - __main__ - Step 33279: {'lr': 0.00044689300713299105, 'samples': 6389568, 'steps': 33278, 'loss/train': 2.205153465270996} -11/07/2021 01:56:12 - INFO - __main__ - Step 33280: {'lr': 0.0004468897369528029, 'samples': 6389760, 'steps': 33279, 'loss/train': 1.2932888269424438} -11/07/2021 01:56:12 - INFO - __main__ - Step 33281: {'lr': 0.00044688646668389933, 'samples': 6389952, 'steps': 33280, 'loss/train': 1.5683271884918213} -11/07/2021 01:56:13 - INFO - __main__ - Step 33282: {'lr': 0.0004468831963262817, 'samples': 6390144, 'steps': 33281, 'loss/train': 1.5767319202423096} -11/07/2021 01:56:14 - INFO - __main__ - Step 33283: {'lr': 0.00044687992587995155, 'samples': 6390336, 'steps': 33282, 'loss/train': 1.4285104274749756} -11/07/2021 01:56:14 - INFO - __main__ - Step 33284: {'lr': 0.0004468766553449104, 'samples': 6390528, 'steps': 33283, 'loss/train': 1.5589231252670288} -11/07/2021 01:56:14 - INFO - __main__ - Step 33285: {'lr': 0.00044687338472115964, 'samples': 6390720, 'steps': 33284, 'loss/train': 1.4872294664382935} -11/07/2021 01:56:15 - INFO - __main__ - Step 33286: {'lr': 0.00044687011400870074, 'samples': 6390912, 'steps': 33285, 'loss/train': 0.994925856590271} -11/07/2021 01:56:16 - INFO - __main__ - Step 33287: {'lr': 0.00044686684320753524, 'samples': 6391104, 'steps': 33286, 'loss/train': 1.6664528846740723} -11/07/2021 01:56:16 - INFO - __main__ - Step 33288: {'lr': 0.00044686357231766454, 'samples': 6391296, 'steps': 33287, 'loss/train': 1.7071375846862793} -11/07/2021 01:56:16 - INFO - __main__ - Step 33289: {'lr': 0.00044686030133909017, 'samples': 6391488, 'steps': 33288, 'loss/train': 1.7450517416000366} -11/07/2021 01:56:17 - INFO - __main__ - Step 33290: {'lr': 0.00044685703027181364, 'samples': 6391680, 'steps': 33289, 'loss/train': 1.8223915100097656} -11/07/2021 01:56:17 - INFO - __main__ - Step 33291: {'lr': 0.0004468537591158363, 'samples': 6391872, 'steps': 33290, 'loss/train': 1.4068268537521362} -11/07/2021 01:56:18 - INFO - __main__ - Step 33292: {'lr': 0.0004468504878711597, 'samples': 6392064, 'steps': 33291, 'loss/train': 1.7510511875152588} -11/07/2021 01:56:18 - INFO - __main__ - Step 33293: {'lr': 0.00044684721653778537, 'samples': 6392256, 'steps': 33292, 'loss/train': 1.8125139474868774} -11/07/2021 01:56:19 - INFO - __main__ - Step 33294: {'lr': 0.00044684394511571463, 'samples': 6392448, 'steps': 33293, 'loss/train': 1.2472978830337524} -11/07/2021 01:56:19 - INFO - __main__ - Step 33295: {'lr': 0.00044684067360494905, 'samples': 6392640, 'steps': 33294, 'loss/train': 1.848178744316101} -11/07/2021 01:56:19 - INFO - __main__ - Step 33296: {'lr': 0.00044683740200549015, 'samples': 6392832, 'steps': 33295, 'loss/train': 1.204787254333496} -11/07/2021 01:56:20 - INFO - __main__ - Step 33297: {'lr': 0.00044683413031733945, 'samples': 6393024, 'steps': 33296, 'loss/train': 0.9038345813751221} -11/07/2021 01:56:21 - INFO - __main__ - Step 33298: {'lr': 0.00044683085854049814, 'samples': 6393216, 'steps': 33297, 'loss/train': 1.6067466735839844} -11/07/2021 01:56:21 - INFO - __main__ - Step 33299: {'lr': 0.00044682758667496806, 'samples': 6393408, 'steps': 33298, 'loss/train': 1.0957818031311035} -11/07/2021 01:56:22 - INFO - __main__ - Step 33300: {'lr': 0.00044682431472075035, 'samples': 6393600, 'steps': 33299, 'loss/train': 1.1766695976257324} -11/07/2021 01:56:22 - INFO - __main__ - Step 33301: {'lr': 0.00044682104267784674, 'samples': 6393792, 'steps': 33300, 'loss/train': 1.4583467245101929} -11/07/2021 01:56:23 - INFO - __main__ - Step 33302: {'lr': 0.0004468177705462585, 'samples': 6393984, 'steps': 33301, 'loss/train': 1.3737915754318237} -11/07/2021 01:56:23 - INFO - __main__ - Step 33303: {'lr': 0.0004468144983259873, 'samples': 6394176, 'steps': 33302, 'loss/train': 1.6026164293289185} -11/07/2021 01:56:24 - INFO - __main__ - Step 33304: {'lr': 0.0004468112260170345, 'samples': 6394368, 'steps': 33303, 'loss/train': 1.5704874992370605} -11/07/2021 01:56:24 - INFO - __main__ - Step 33305: {'lr': 0.0004468079536194016, 'samples': 6394560, 'steps': 33304, 'loss/train': 1.5559061765670776} -11/07/2021 01:56:24 - INFO - __main__ - Step 33306: {'lr': 0.00044680468113309006, 'samples': 6394752, 'steps': 33305, 'loss/train': 1.0961544513702393} -11/07/2021 01:56:25 - INFO - __main__ - Step 33307: {'lr': 0.0004468014085581014, 'samples': 6394944, 'steps': 33306, 'loss/train': 2.8458991050720215} -11/07/2021 01:56:26 - INFO - __main__ - Step 33308: {'lr': 0.0004467981358944371, 'samples': 6395136, 'steps': 33307, 'loss/train': 1.6939728260040283} -11/07/2021 01:56:26 - INFO - __main__ - Step 33309: {'lr': 0.0004467948631420985, 'samples': 6395328, 'steps': 33308, 'loss/train': 1.5496588945388794} -11/07/2021 01:56:26 - INFO - __main__ - Step 33310: {'lr': 0.0004467915903010872, 'samples': 6395520, 'steps': 33309, 'loss/train': 1.1974292993545532} -11/07/2021 01:56:27 - INFO - __main__ - Step 33311: {'lr': 0.0004467883173714047, 'samples': 6395712, 'steps': 33310, 'loss/train': 1.6529051065444946} -11/07/2021 01:56:27 - INFO - __main__ - Step 33312: {'lr': 0.0004467850443530523, 'samples': 6395904, 'steps': 33311, 'loss/train': 1.399214267730713} -11/07/2021 01:56:28 - INFO - __main__ - Step 33313: {'lr': 0.0004467817712460317, 'samples': 6396096, 'steps': 33312, 'loss/train': 1.6385629177093506} -11/07/2021 01:56:28 - INFO - __main__ - Step 33314: {'lr': 0.00044677849805034424, 'samples': 6396288, 'steps': 33313, 'loss/train': 1.6142476797103882} -11/07/2021 01:56:29 - INFO - __main__ - Step 33315: {'lr': 0.0004467752247659914, 'samples': 6396480, 'steps': 33314, 'loss/train': 1.3866982460021973} -11/07/2021 01:56:29 - INFO - __main__ - Step 33316: {'lr': 0.00044677195139297476, 'samples': 6396672, 'steps': 33315, 'loss/train': 1.5994012355804443} -11/07/2021 01:56:29 - INFO - __main__ - Step 33317: {'lr': 0.00044676867793129574, 'samples': 6396864, 'steps': 33316, 'loss/train': 1.6208961009979248} -11/07/2021 01:56:30 - INFO - __main__ - Step 33318: {'lr': 0.00044676540438095565, 'samples': 6397056, 'steps': 33317, 'loss/train': 1.0598540306091309} -11/07/2021 01:56:31 - INFO - __main__ - Step 33319: {'lr': 0.0004467621307419562, 'samples': 6397248, 'steps': 33318, 'loss/train': 1.4713943004608154} -11/07/2021 01:56:31 - INFO - __main__ - Step 33320: {'lr': 0.00044675885701429873, 'samples': 6397440, 'steps': 33319, 'loss/train': 1.3172155618667603} -11/07/2021 01:56:32 - INFO - __main__ - Step 33321: {'lr': 0.00044675558319798477, 'samples': 6397632, 'steps': 33320, 'loss/train': 1.5222651958465576} -11/07/2021 01:56:32 - INFO - __main__ - Step 33322: {'lr': 0.00044675230929301575, 'samples': 6397824, 'steps': 33321, 'loss/train': 1.2951338291168213} -11/07/2021 01:56:33 - INFO - __main__ - Step 33323: {'lr': 0.0004467490352993932, 'samples': 6398016, 'steps': 33322, 'loss/train': 1.2071497440338135} -11/07/2021 01:56:33 - INFO - __main__ - Step 33324: {'lr': 0.00044674576121711855, 'samples': 6398208, 'steps': 33323, 'loss/train': 1.645951509475708} -11/07/2021 01:56:34 - INFO - __main__ - Step 33325: {'lr': 0.00044674248704619333, 'samples': 6398400, 'steps': 33324, 'loss/train': 1.4131158590316772} -11/07/2021 01:56:34 - INFO - __main__ - Step 33326: {'lr': 0.000446739212786619, 'samples': 6398592, 'steps': 33325, 'loss/train': 1.915831208229065} -11/07/2021 01:56:34 - INFO - __main__ - Step 33327: {'lr': 0.000446735938438397, 'samples': 6398784, 'steps': 33326, 'loss/train': 0.787378191947937} -11/07/2021 01:56:36 - INFO - __main__ - Step 33328: {'lr': 0.0004467326640015288, 'samples': 6398976, 'steps': 33327, 'loss/train': 1.6845728158950806} -11/07/2021 01:56:36 - INFO - __main__ - Step 33329: {'lr': 0.00044672938947601593, 'samples': 6399168, 'steps': 33328, 'loss/train': 1.1684160232543945} -11/07/2021 01:56:36 - INFO - __main__ - Step 33330: {'lr': 0.00044672611486185976, 'samples': 6399360, 'steps': 33329, 'loss/train': 0.7616485953330994} -11/07/2021 01:56:37 - INFO - __main__ - Step 33331: {'lr': 0.0004467228401590619, 'samples': 6399552, 'steps': 33330, 'loss/train': 1.2289947271347046} -11/07/2021 01:56:37 - INFO - __main__ - Step 33332: {'lr': 0.00044671956536762375, 'samples': 6399744, 'steps': 33331, 'loss/train': 0.993565022945404} -11/07/2021 01:56:38 - INFO - __main__ - Step 33333: {'lr': 0.00044671629048754683, 'samples': 6399936, 'steps': 33332, 'loss/train': 1.4252376556396484} -11/07/2021 01:56:38 - INFO - __main__ - Step 33334: {'lr': 0.00044671301551883253, 'samples': 6400128, 'steps': 33333, 'loss/train': 1.616149663925171} -11/07/2021 01:56:39 - INFO - __main__ - Step 33335: {'lr': 0.0004467097404614824, 'samples': 6400320, 'steps': 33334, 'loss/train': 1.5558617115020752} -11/07/2021 01:56:39 - INFO - __main__ - Step 33336: {'lr': 0.0004467064653154979, 'samples': 6400512, 'steps': 33335, 'loss/train': 1.4129722118377686} -11/07/2021 01:56:40 - INFO - __main__ - Step 33337: {'lr': 0.0004467031900808805, 'samples': 6400704, 'steps': 33336, 'loss/train': 1.6587660312652588} -11/07/2021 01:56:41 - INFO - __main__ - Step 33338: {'lr': 0.00044669991475763173, 'samples': 6400896, 'steps': 33337, 'loss/train': 1.0887442827224731} -11/07/2021 01:56:41 - INFO - __main__ - Step 33339: {'lr': 0.00044669663934575294, 'samples': 6401088, 'steps': 33338, 'loss/train': 1.6212620735168457} -11/07/2021 01:56:41 - INFO - __main__ - Step 33340: {'lr': 0.0004466933638452457, 'samples': 6401280, 'steps': 33339, 'loss/train': 1.008997917175293} -11/07/2021 01:56:42 - INFO - __main__ - Step 33341: {'lr': 0.0004466900882561115, 'samples': 6401472, 'steps': 33340, 'loss/train': 1.5845059156417847} -11/07/2021 01:56:42 - INFO - __main__ - Step 33342: {'lr': 0.00044668681257835173, 'samples': 6401664, 'steps': 33341, 'loss/train': 1.473926305770874} -11/07/2021 01:56:43 - INFO - __main__ - Step 33343: {'lr': 0.00044668353681196794, 'samples': 6401856, 'steps': 33342, 'loss/train': 1.2813016176223755} -11/07/2021 01:56:43 - INFO - __main__ - Step 33344: {'lr': 0.0004466802609569616, 'samples': 6402048, 'steps': 33343, 'loss/train': 1.5135631561279297} -11/07/2021 01:56:44 - INFO - __main__ - Step 33345: {'lr': 0.00044667698501333415, 'samples': 6402240, 'steps': 33344, 'loss/train': 1.1744544506072998} -11/07/2021 01:56:44 - INFO - __main__ - Step 33346: {'lr': 0.0004466737089810871, 'samples': 6402432, 'steps': 33345, 'loss/train': 1.721977710723877} -11/07/2021 01:56:44 - INFO - __main__ - Step 33347: {'lr': 0.00044667043286022193, 'samples': 6402624, 'steps': 33346, 'loss/train': 1.3514186143875122} -11/07/2021 01:56:45 - INFO - __main__ - Step 33348: {'lr': 0.00044666715665074, 'samples': 6402816, 'steps': 33347, 'loss/train': 0.6177819967269897} -11/07/2021 01:56:46 - INFO - __main__ - Step 33349: {'lr': 0.0004466638803526429, 'samples': 6403008, 'steps': 33348, 'loss/train': 1.8638166189193726} -11/07/2021 01:56:46 - INFO - __main__ - Step 33350: {'lr': 0.0004466606039659322, 'samples': 6403200, 'steps': 33349, 'loss/train': 1.4739454984664917} -11/07/2021 01:56:47 - INFO - __main__ - Step 33351: {'lr': 0.0004466573274906092, 'samples': 6403392, 'steps': 33350, 'loss/train': 1.2804734706878662} -11/07/2021 01:56:47 - INFO - __main__ - Step 33352: {'lr': 0.0004466540509266754, 'samples': 6403584, 'steps': 33351, 'loss/train': 1.2557836771011353} -11/07/2021 01:56:48 - INFO - __main__ - Step 33353: {'lr': 0.0004466507742741325, 'samples': 6403776, 'steps': 33352, 'loss/train': 1.5667165517807007} -11/07/2021 01:56:48 - INFO - __main__ - Step 33354: {'lr': 0.0004466474975329816, 'samples': 6403968, 'steps': 33353, 'loss/train': 1.852150797843933} -11/07/2021 01:56:48 - INFO - __main__ - Step 33355: {'lr': 0.0004466442207032244, 'samples': 6404160, 'steps': 33354, 'loss/train': 1.2369035482406616} -11/07/2021 01:56:49 - INFO - __main__ - Step 33356: {'lr': 0.00044664094378486243, 'samples': 6404352, 'steps': 33355, 'loss/train': 1.349674940109253} -11/07/2021 01:56:49 - INFO - __main__ - Step 33357: {'lr': 0.00044663766677789706, 'samples': 6404544, 'steps': 33356, 'loss/train': 2.1358084678649902} -11/07/2021 01:56:50 - INFO - __main__ - Step 33358: {'lr': 0.0004466343896823297, 'samples': 6404736, 'steps': 33357, 'loss/train': 1.5977809429168701} -11/07/2021 01:56:50 - INFO - __main__ - Step 33359: {'lr': 0.000446631112498162, 'samples': 6404928, 'steps': 33358, 'loss/train': 1.3789011240005493} -11/07/2021 01:56:51 - INFO - __main__ - Step 33360: {'lr': 0.0004466278352253954, 'samples': 6405120, 'steps': 33359, 'loss/train': 1.5842740535736084} -11/07/2021 01:56:51 - INFO - __main__ - Step 33361: {'lr': 0.00044662455786403124, 'samples': 6405312, 'steps': 33360, 'loss/train': 1.3825491666793823} -11/07/2021 01:56:52 - INFO - __main__ - Step 33362: {'lr': 0.0004466212804140711, 'samples': 6405504, 'steps': 33361, 'loss/train': 1.7108070850372314} -11/07/2021 01:56:52 - INFO - __main__ - Step 33363: {'lr': 0.00044661800287551653, 'samples': 6405696, 'steps': 33362, 'loss/train': 1.69106924533844} -11/07/2021 01:56:53 - INFO - __main__ - Step 33364: {'lr': 0.00044661472524836886, 'samples': 6405888, 'steps': 33363, 'loss/train': 1.4570802450180054} -11/07/2021 01:56:53 - INFO - __main__ - Step 33365: {'lr': 0.00044661144753262963, 'samples': 6406080, 'steps': 33364, 'loss/train': 1.4948817491531372} -11/07/2021 01:56:54 - INFO - __main__ - Step 33366: {'lr': 0.0004466081697283003, 'samples': 6406272, 'steps': 33365, 'loss/train': 0.9278396368026733} -11/07/2021 01:56:54 - INFO - __main__ - Step 33367: {'lr': 0.00044660489183538237, 'samples': 6406464, 'steps': 33366, 'loss/train': 1.8919562101364136} -11/07/2021 01:56:54 - INFO - __main__ - Step 33368: {'lr': 0.0004466016138538773, 'samples': 6406656, 'steps': 33367, 'loss/train': 1.572937250137329} -11/07/2021 01:56:56 - INFO - __main__ - Step 33369: {'lr': 0.0004465983357837866, 'samples': 6406848, 'steps': 33368, 'loss/train': 2.0625107288360596} -11/07/2021 01:56:56 - INFO - __main__ - Step 33370: {'lr': 0.00044659505762511176, 'samples': 6407040, 'steps': 33369, 'loss/train': 1.6907017230987549} -11/07/2021 01:56:56 - INFO - __main__ - Step 33371: {'lr': 0.00044659177937785417, 'samples': 6407232, 'steps': 33370, 'loss/train': 1.1050999164581299} -11/07/2021 01:56:57 - INFO - __main__ - Step 33372: {'lr': 0.0004465885010420154, 'samples': 6407424, 'steps': 33371, 'loss/train': 1.249595046043396} -11/07/2021 01:56:57 - INFO - __main__ - Step 33373: {'lr': 0.0004465852226175968, 'samples': 6407616, 'steps': 33372, 'loss/train': 0.7163944840431213} -11/07/2021 01:56:59 - INFO - __main__ - Step 33374: {'lr': 0.00044658194410460004, 'samples': 6407808, 'steps': 33373, 'loss/train': 1.4177186489105225} -11/07/2021 01:56:59 - INFO - __main__ - Step 33375: {'lr': 0.0004465786655030264, 'samples': 6408000, 'steps': 33374, 'loss/train': 5.1912384033203125} -11/07/2021 01:56:59 - INFO - __main__ - Step 33376: {'lr': 0.00044657538681287746, 'samples': 6408192, 'steps': 33375, 'loss/train': 4.983016014099121} -11/07/2021 01:57:00 - INFO - __main__ - Step 33377: {'lr': 0.0004465721080341547, 'samples': 6408384, 'steps': 33376, 'loss/train': 4.876257419586182} -11/07/2021 01:57:00 - INFO - __main__ - Step 33378: {'lr': 0.0004465688291668596, 'samples': 6408576, 'steps': 33377, 'loss/train': 1.365555763244629} -11/07/2021 01:57:00 - INFO - __main__ - Step 33379: {'lr': 0.00044656555021099363, 'samples': 6408768, 'steps': 33378, 'loss/train': 1.2451014518737793} -11/07/2021 01:57:01 - INFO - __main__ - Step 33380: {'lr': 0.00044656227116655824, 'samples': 6408960, 'steps': 33379, 'loss/train': 1.671711802482605} -11/07/2021 01:57:02 - INFO - __main__ - Step 33381: {'lr': 0.00044655899203355486, 'samples': 6409152, 'steps': 33380, 'loss/train': 1.3759804964065552} -11/07/2021 01:57:02 - INFO - __main__ - Step 33382: {'lr': 0.0004465557128119852, 'samples': 6409344, 'steps': 33381, 'loss/train': 1.7203022241592407} -11/07/2021 01:57:03 - INFO - __main__ - Step 33383: {'lr': 0.00044655243350185037, 'samples': 6409536, 'steps': 33382, 'loss/train': 1.7072322368621826} -11/07/2021 01:57:03 - INFO - __main__ - Step 33384: {'lr': 0.0004465491541031522, 'samples': 6409728, 'steps': 33383, 'loss/train': 1.633778691291809} -11/07/2021 01:57:03 - INFO - __main__ - Step 33385: {'lr': 0.00044654587461589193, 'samples': 6409920, 'steps': 33384, 'loss/train': 1.545433521270752} -11/07/2021 01:57:04 - INFO - __main__ - Step 33386: {'lr': 0.0004465425950400711, 'samples': 6410112, 'steps': 33385, 'loss/train': 1.7061132192611694} -11/07/2021 01:57:05 - INFO - __main__ - Step 33387: {'lr': 0.00044653931537569125, 'samples': 6410304, 'steps': 33386, 'loss/train': 7.1502532958984375} -11/07/2021 01:57:05 - INFO - __main__ - Step 33388: {'lr': 0.0004465360356227538, 'samples': 6410496, 'steps': 33387, 'loss/train': 1.4677163362503052} -11/07/2021 01:57:05 - INFO - __main__ - Step 33389: {'lr': 0.0004465327557812603, 'samples': 6410688, 'steps': 33388, 'loss/train': 1.8780077695846558} -11/07/2021 01:57:06 - INFO - __main__ - Step 33390: {'lr': 0.0004465294758512121, 'samples': 6410880, 'steps': 33389, 'loss/train': 1.5223056077957153} -11/07/2021 01:57:06 - INFO - __main__ - Step 33391: {'lr': 0.0004465261958326108, 'samples': 6411072, 'steps': 33390, 'loss/train': 2.0901994705200195} -11/07/2021 01:57:07 - INFO - __main__ - Step 33392: {'lr': 0.0004465229157254578, 'samples': 6411264, 'steps': 33391, 'loss/train': 1.741840124130249} -11/07/2021 01:57:07 - INFO - __main__ - Step 33393: {'lr': 0.0004465196355297546, 'samples': 6411456, 'steps': 33392, 'loss/train': 0.1811494380235672} -11/07/2021 01:57:08 - INFO - __main__ - Step 33394: {'lr': 0.0004465163552455027, 'samples': 6411648, 'steps': 33393, 'loss/train': 1.7289592027664185} -11/07/2021 01:57:08 - INFO - __main__ - Step 33395: {'lr': 0.0004465130748727036, 'samples': 6411840, 'steps': 33394, 'loss/train': 1.4100768566131592} -11/07/2021 01:57:09 - INFO - __main__ - Step 33396: {'lr': 0.0004465097944113587, 'samples': 6412032, 'steps': 33395, 'loss/train': 0.8781396746635437} -11/07/2021 01:57:10 - INFO - __main__ - Step 33397: {'lr': 0.00044650651386146954, 'samples': 6412224, 'steps': 33396, 'loss/train': 1.5576465129852295} -11/07/2021 01:57:10 - INFO - __main__ - Step 33398: {'lr': 0.00044650323322303757, 'samples': 6412416, 'steps': 33397, 'loss/train': 1.6613613367080688} -11/07/2021 01:57:11 - INFO - __main__ - Step 33399: {'lr': 0.0004464999524960642, 'samples': 6412608, 'steps': 33398, 'loss/train': 1.6993510723114014} -11/07/2021 01:57:11 - INFO - __main__ - Step 33400: {'lr': 0.0004464966716805511, 'samples': 6412800, 'steps': 33399, 'loss/train': 1.7051008939743042} -11/07/2021 01:57:11 - INFO - __main__ - Step 33401: {'lr': 0.0004464933907764996, 'samples': 6412992, 'steps': 33400, 'loss/train': 1.900296926498413} -11/07/2021 01:57:12 - INFO - __main__ - Step 33402: {'lr': 0.0004464901097839112, 'samples': 6413184, 'steps': 33401, 'loss/train': 0.3372882008552551} -11/07/2021 01:57:13 - INFO - __main__ - Step 33403: {'lr': 0.00044648682870278733, 'samples': 6413376, 'steps': 33402, 'loss/train': 1.684402346611023} -11/07/2021 01:57:13 - INFO - __main__ - Step 33404: {'lr': 0.0004464835475331296, 'samples': 6413568, 'steps': 33403, 'loss/train': 1.8330544233322144} -11/07/2021 01:57:13 - INFO - __main__ - Step 33405: {'lr': 0.0004464802662749394, 'samples': 6413760, 'steps': 33404, 'loss/train': 1.9801530838012695} -11/07/2021 01:57:14 - INFO - __main__ - Step 33406: {'lr': 0.00044647698492821826, 'samples': 6413952, 'steps': 33405, 'loss/train': 1.53224778175354} -11/07/2021 01:57:15 - INFO - __main__ - Step 33407: {'lr': 0.00044647370349296757, 'samples': 6414144, 'steps': 33406, 'loss/train': 1.296061396598816} -11/07/2021 01:57:15 - INFO - __main__ - Step 33408: {'lr': 0.00044647042196918884, 'samples': 6414336, 'steps': 33407, 'loss/train': 1.4821537733078003} -11/07/2021 01:57:16 - INFO - __main__ - Step 33409: {'lr': 0.00044646714035688365, 'samples': 6414528, 'steps': 33408, 'loss/train': 1.12440824508667} -11/07/2021 01:57:16 - INFO - __main__ - Step 33410: {'lr': 0.00044646385865605335, 'samples': 6414720, 'steps': 33409, 'loss/train': 1.8271406888961792} -11/07/2021 01:57:16 - INFO - __main__ - Step 33411: {'lr': 0.0004464605768666995, 'samples': 6414912, 'steps': 33410, 'loss/train': 1.5178637504577637} -11/07/2021 01:57:17 - INFO - __main__ - Step 33412: {'lr': 0.0004464572949888235, 'samples': 6415104, 'steps': 33411, 'loss/train': 1.2276266813278198} -11/07/2021 01:57:18 - INFO - __main__ - Step 33413: {'lr': 0.0004464540130224268, 'samples': 6415296, 'steps': 33412, 'loss/train': 1.6815807819366455} -11/07/2021 01:57:18 - INFO - __main__ - Step 33414: {'lr': 0.0004464507309675111, 'samples': 6415488, 'steps': 33413, 'loss/train': 1.7691391706466675} -11/07/2021 01:57:18 - INFO - __main__ - Step 33415: {'lr': 0.00044644744882407767, 'samples': 6415680, 'steps': 33414, 'loss/train': 2.3698713779449463} -11/07/2021 01:57:19 - INFO - __main__ - Step 33416: {'lr': 0.00044644416659212806, 'samples': 6415872, 'steps': 33415, 'loss/train': 1.6313021183013916} -11/07/2021 01:57:19 - INFO - __main__ - Step 33417: {'lr': 0.00044644088427166375, 'samples': 6416064, 'steps': 33416, 'loss/train': 1.6351815462112427} -11/07/2021 01:57:20 - INFO - __main__ - Step 33418: {'lr': 0.00044643760186268615, 'samples': 6416256, 'steps': 33417, 'loss/train': 1.43039071559906} -11/07/2021 01:57:20 - INFO - __main__ - Step 33419: {'lr': 0.00044643431936519683, 'samples': 6416448, 'steps': 33418, 'loss/train': 1.6958608627319336} -11/07/2021 01:57:21 - INFO - __main__ - Step 33420: {'lr': 0.00044643103677919726, 'samples': 6416640, 'steps': 33419, 'loss/train': 1.557178020477295} -11/07/2021 01:57:21 - INFO - __main__ - Step 33421: {'lr': 0.00044642775410468896, 'samples': 6416832, 'steps': 33420, 'loss/train': 1.6278393268585205} -11/07/2021 01:57:22 - INFO - __main__ - Step 33422: {'lr': 0.00044642447134167316, 'samples': 6417024, 'steps': 33421, 'loss/train': 1.4954309463500977} -11/07/2021 01:57:22 - INFO - __main__ - Step 33423: {'lr': 0.00044642118849015167, 'samples': 6417216, 'steps': 33422, 'loss/train': 1.7011927366256714} -11/07/2021 01:57:23 - INFO - __main__ - Step 33424: {'lr': 0.0004464179055501258, 'samples': 6417408, 'steps': 33423, 'loss/train': 1.4190086126327515} -11/07/2021 01:57:23 - INFO - __main__ - Step 33425: {'lr': 0.00044641462252159705, 'samples': 6417600, 'steps': 33424, 'loss/train': 1.3510175943374634} -11/07/2021 01:57:24 - INFO - __main__ - Step 33426: {'lr': 0.0004464113394045669, 'samples': 6417792, 'steps': 33425, 'loss/train': 2.233720064163208} -11/07/2021 01:57:24 - INFO - __main__ - Step 33427: {'lr': 0.00044640805619903677, 'samples': 6417984, 'steps': 33426, 'loss/train': 1.6520930528640747} -11/07/2021 01:57:25 - INFO - __main__ - Step 33428: {'lr': 0.00044640477290500824, 'samples': 6418176, 'steps': 33427, 'loss/train': 1.526247501373291} -11/07/2021 01:57:25 - INFO - __main__ - Step 33429: {'lr': 0.00044640148952248285, 'samples': 6418368, 'steps': 33428, 'loss/train': 1.2569032907485962} -11/07/2021 01:57:26 - INFO - __main__ - Step 33430: {'lr': 0.00044639820605146184, 'samples': 6418560, 'steps': 33429, 'loss/train': 0.49115127325057983} -11/07/2021 01:57:26 - INFO - __main__ - Step 33431: {'lr': 0.0004463949224919469, 'samples': 6418752, 'steps': 33430, 'loss/train': 1.3409916162490845} -11/07/2021 01:57:26 - INFO - __main__ - Step 33432: {'lr': 0.0004463916388439394, 'samples': 6418944, 'steps': 33431, 'loss/train': 1.5159145593643188} -11/07/2021 01:57:27 - INFO - __main__ - Step 33433: {'lr': 0.00044638835510744094, 'samples': 6419136, 'steps': 33432, 'loss/train': 1.2072536945343018} -11/07/2021 01:57:28 - INFO - __main__ - Step 33434: {'lr': 0.0004463850712824528, 'samples': 6419328, 'steps': 33433, 'loss/train': 1.160642385482788} -11/07/2021 01:57:28 - INFO - __main__ - Step 33435: {'lr': 0.0004463817873689766, 'samples': 6419520, 'steps': 33434, 'loss/train': 1.7231621742248535} -11/07/2021 01:57:28 - INFO - __main__ - Step 33436: {'lr': 0.00044637850336701386, 'samples': 6419712, 'steps': 33435, 'loss/train': 1.5787726640701294} -11/07/2021 01:57:29 - INFO - __main__ - Step 33437: {'lr': 0.000446375219276566, 'samples': 6419904, 'steps': 33436, 'loss/train': 1.4341305494308472} -11/07/2021 01:57:29 - INFO - __main__ - Step 33438: {'lr': 0.0004463719350976344, 'samples': 6420096, 'steps': 33437, 'loss/train': 1.730055570602417} -11/07/2021 01:57:30 - INFO - __main__ - Step 33439: {'lr': 0.0004463686508302207, 'samples': 6420288, 'steps': 33438, 'loss/train': 1.4806171655654907} -11/07/2021 01:57:30 - INFO - __main__ - Step 33440: {'lr': 0.00044636536647432636, 'samples': 6420480, 'steps': 33439, 'loss/train': 1.4073017835617065} -11/07/2021 01:57:31 - INFO - __main__ - Step 33441: {'lr': 0.00044636208202995277, 'samples': 6420672, 'steps': 33440, 'loss/train': 1.4302234649658203} -11/07/2021 01:57:31 - INFO - __main__ - Step 33442: {'lr': 0.0004463587974971014, 'samples': 6420864, 'steps': 33441, 'loss/train': 1.2936042547225952} -11/07/2021 01:57:32 - INFO - __main__ - Step 33443: {'lr': 0.0004463555128757739, 'samples': 6421056, 'steps': 33442, 'loss/train': 1.3029223680496216} -11/07/2021 01:57:33 - INFO - __main__ - Step 33444: {'lr': 0.00044635222816597153, 'samples': 6421248, 'steps': 33443, 'loss/train': 1.8932257890701294} -11/07/2021 01:57:33 - INFO - __main__ - Step 33445: {'lr': 0.0004463489433676959, 'samples': 6421440, 'steps': 33444, 'loss/train': 2.250821352005005} -11/07/2021 01:57:33 - INFO - __main__ - Step 33446: {'lr': 0.00044634565848094854, 'samples': 6421632, 'steps': 33445, 'loss/train': 1.5037392377853394} -11/07/2021 01:57:34 - INFO - __main__ - Step 33447: {'lr': 0.0004463423735057308, 'samples': 6421824, 'steps': 33446, 'loss/train': 1.1936708688735962} -11/07/2021 01:57:34 - INFO - __main__ - Step 33448: {'lr': 0.00044633908844204424, 'samples': 6422016, 'steps': 33447, 'loss/train': 1.7531934976577759} -11/07/2021 01:57:35 - INFO - __main__ - Step 33449: {'lr': 0.0004463358032898903, 'samples': 6422208, 'steps': 33448, 'loss/train': 2.1877307891845703} -11/07/2021 01:57:35 - INFO - __main__ - Step 33450: {'lr': 0.00044633251804927044, 'samples': 6422400, 'steps': 33449, 'loss/train': 1.2530103921890259} -11/07/2021 01:57:36 - INFO - __main__ - Step 33451: {'lr': 0.0004463292327201862, 'samples': 6422592, 'steps': 33450, 'loss/train': 1.3324371576309204} -11/07/2021 01:57:36 - INFO - __main__ - Step 33452: {'lr': 0.0004463259473026391, 'samples': 6422784, 'steps': 33451, 'loss/train': 1.1305065155029297} -11/07/2021 01:57:36 - INFO - __main__ - Step 33453: {'lr': 0.0004463226617966305, 'samples': 6422976, 'steps': 33452, 'loss/train': 1.6182461977005005} -11/07/2021 01:57:37 - INFO - __main__ - Step 33454: {'lr': 0.00044631937620216196, 'samples': 6423168, 'steps': 33453, 'loss/train': 1.6138521432876587} -11/07/2021 01:57:38 - INFO - __main__ - Step 33455: {'lr': 0.00044631609051923494, 'samples': 6423360, 'steps': 33454, 'loss/train': 1.4291763305664062} -11/07/2021 01:57:38 - INFO - __main__ - Step 33456: {'lr': 0.00044631280474785086, 'samples': 6423552, 'steps': 33455, 'loss/train': 1.4215017557144165} -11/07/2021 01:57:38 - INFO - __main__ - Step 33457: {'lr': 0.0004463095188880113, 'samples': 6423744, 'steps': 33456, 'loss/train': 1.511284589767456} -11/07/2021 01:57:39 - INFO - __main__ - Step 33458: {'lr': 0.00044630623293971775, 'samples': 6423936, 'steps': 33457, 'loss/train': 1.4104000329971313} -11/07/2021 01:57:40 - INFO - __main__ - Step 33459: {'lr': 0.0004463029469029716, 'samples': 6424128, 'steps': 33458, 'loss/train': 1.7511613368988037} -11/07/2021 01:57:40 - INFO - __main__ - Step 33460: {'lr': 0.0004462996607777743, 'samples': 6424320, 'steps': 33459, 'loss/train': 1.7468429803848267} -11/07/2021 01:57:41 - INFO - __main__ - Step 33461: {'lr': 0.00044629637456412754, 'samples': 6424512, 'steps': 33460, 'loss/train': 1.6965515613555908} -11/07/2021 01:57:41 - INFO - __main__ - Step 33462: {'lr': 0.0004462930882620325, 'samples': 6424704, 'steps': 33461, 'loss/train': 1.2532994747161865} -11/07/2021 01:57:41 - INFO - __main__ - Step 33463: {'lr': 0.0004462898018714909, 'samples': 6424896, 'steps': 33462, 'loss/train': 1.335274338722229} -11/07/2021 01:57:42 - INFO - __main__ - Step 33464: {'lr': 0.0004462865153925042, 'samples': 6425088, 'steps': 33463, 'loss/train': 1.3503310680389404} -11/07/2021 01:57:43 - INFO - __main__ - Step 33465: {'lr': 0.00044628322882507375, 'samples': 6425280, 'steps': 33464, 'loss/train': 1.1921557188034058} -11/07/2021 01:57:43 - INFO - __main__ - Step 33466: {'lr': 0.0004462799421692012, 'samples': 6425472, 'steps': 33465, 'loss/train': 1.49006986618042} -11/07/2021 01:57:43 - INFO - __main__ - Step 33467: {'lr': 0.0004462766554248878, 'samples': 6425664, 'steps': 33466, 'loss/train': 0.9925422072410583} -11/07/2021 01:57:44 - INFO - __main__ - Step 33468: {'lr': 0.0004462733685921353, 'samples': 6425856, 'steps': 33467, 'loss/train': 0.9103108048439026} -11/07/2021 01:57:44 - INFO - __main__ - Step 33469: {'lr': 0.000446270081670945, 'samples': 6426048, 'steps': 33468, 'loss/train': 0.8118385076522827} -11/07/2021 01:57:45 - INFO - __main__ - Step 33470: {'lr': 0.0004462667946613184, 'samples': 6426240, 'steps': 33469, 'loss/train': 1.6399989128112793} -11/07/2021 01:57:46 - INFO - __main__ - Step 33471: {'lr': 0.00044626350756325707, 'samples': 6426432, 'steps': 33470, 'loss/train': 1.365263819694519} -11/07/2021 01:57:46 - INFO - __main__ - Step 33472: {'lr': 0.0004462602203767624, 'samples': 6426624, 'steps': 33471, 'loss/train': 1.7585831880569458} -11/07/2021 01:57:46 - INFO - __main__ - Step 33473: {'lr': 0.0004462569331018359, 'samples': 6426816, 'steps': 33472, 'loss/train': 1.4998859167099} -11/07/2021 01:57:47 - INFO - __main__ - Step 33474: {'lr': 0.00044625364573847904, 'samples': 6427008, 'steps': 33473, 'loss/train': 0.8817580342292786} -11/07/2021 01:57:48 - INFO - __main__ - Step 33475: {'lr': 0.0004462503582866933, 'samples': 6427200, 'steps': 33474, 'loss/train': 0.19651857018470764} -11/07/2021 01:57:48 - INFO - __main__ - Step 33476: {'lr': 0.00044624707074648017, 'samples': 6427392, 'steps': 33475, 'loss/train': 1.4824800491333008} -11/07/2021 01:57:49 - INFO - __main__ - Step 33477: {'lr': 0.0004462437831178412, 'samples': 6427584, 'steps': 33476, 'loss/train': 0.8712844252586365} -11/07/2021 01:57:49 - INFO - __main__ - Step 33478: {'lr': 0.00044624049540077784, 'samples': 6427776, 'steps': 33477, 'loss/train': 1.6491341590881348} -11/07/2021 01:57:49 - INFO - __main__ - Step 33479: {'lr': 0.0004462372075952914, 'samples': 6427968, 'steps': 33478, 'loss/train': 1.6323633193969727} -11/07/2021 01:57:50 - INFO - __main__ - Step 33480: {'lr': 0.0004462339197013836, 'samples': 6428160, 'steps': 33479, 'loss/train': 1.5793582201004028} -11/07/2021 01:57:51 - INFO - __main__ - Step 33481: {'lr': 0.00044623063171905585, 'samples': 6428352, 'steps': 33480, 'loss/train': 1.7055293321609497} -11/07/2021 01:57:51 - INFO - __main__ - Step 33482: {'lr': 0.0004462273436483095, 'samples': 6428544, 'steps': 33481, 'loss/train': 2.0158817768096924} -11/07/2021 01:57:51 - INFO - __main__ - Step 33483: {'lr': 0.00044622405548914627, 'samples': 6428736, 'steps': 33482, 'loss/train': 1.3248236179351807} -11/07/2021 01:57:52 - INFO - __main__ - Step 33484: {'lr': 0.00044622076724156747, 'samples': 6428928, 'steps': 33483, 'loss/train': 1.8139656782150269} -11/07/2021 01:57:53 - INFO - __main__ - Step 33485: {'lr': 0.00044621747890557454, 'samples': 6429120, 'steps': 33484, 'loss/train': 1.4172933101654053} -11/07/2021 01:57:53 - INFO - __main__ - Step 33486: {'lr': 0.0004462141904811691, 'samples': 6429312, 'steps': 33485, 'loss/train': 1.271095633506775} -11/07/2021 01:57:53 - INFO - __main__ - Step 33487: {'lr': 0.00044621090196835254, 'samples': 6429504, 'steps': 33486, 'loss/train': 1.781255841255188} -11/07/2021 01:57:54 - INFO - __main__ - Step 33488: {'lr': 0.00044620761336712646, 'samples': 6429696, 'steps': 33487, 'loss/train': 1.747527837753296} -11/07/2021 01:57:54 - INFO - __main__ - Step 33489: {'lr': 0.00044620432467749215, 'samples': 6429888, 'steps': 33488, 'loss/train': 2.0125067234039307} -11/07/2021 01:57:55 - INFO - __main__ - Step 33490: {'lr': 0.0004462010358994513, 'samples': 6430080, 'steps': 33489, 'loss/train': 1.6507304906845093} -11/07/2021 01:57:56 - INFO - __main__ - Step 33491: {'lr': 0.0004461977470330052, 'samples': 6430272, 'steps': 33490, 'loss/train': 1.1020450592041016} -11/07/2021 01:57:56 - INFO - __main__ - Step 33492: {'lr': 0.00044619445807815545, 'samples': 6430464, 'steps': 33491, 'loss/train': 1.0469087362289429} -11/07/2021 01:57:56 - INFO - __main__ - Step 33493: {'lr': 0.00044619116903490356, 'samples': 6430656, 'steps': 33492, 'loss/train': 1.407516598701477} -11/07/2021 01:57:57 - INFO - __main__ - Step 33494: {'lr': 0.00044618787990325086, 'samples': 6430848, 'steps': 33493, 'loss/train': 1.9450844526290894} -11/07/2021 01:57:58 - INFO - __main__ - Step 33495: {'lr': 0.000446184590683199, 'samples': 6431040, 'steps': 33494, 'loss/train': 1.4101066589355469} -11/07/2021 01:57:58 - INFO - __main__ - Step 33496: {'lr': 0.00044618130137474935, 'samples': 6431232, 'steps': 33495, 'loss/train': 1.4940515756607056} -11/07/2021 01:57:58 - INFO - __main__ - Step 33497: {'lr': 0.0004461780119779034, 'samples': 6431424, 'steps': 33496, 'loss/train': 1.3933483362197876} -11/07/2021 01:57:59 - INFO - __main__ - Step 33498: {'lr': 0.0004461747224926628, 'samples': 6431616, 'steps': 33497, 'loss/train': 1.6501895189285278} -11/07/2021 01:57:59 - INFO - __main__ - Step 33499: {'lr': 0.0004461714329190288, 'samples': 6431808, 'steps': 33498, 'loss/train': 1.6280629634857178} -11/07/2021 01:58:00 - INFO - __main__ - Step 33500: {'lr': 0.00044616814325700293, 'samples': 6432000, 'steps': 33499, 'loss/train': 1.6826666593551636} -11/07/2021 01:58:00 - INFO - __main__ - Step 33501: {'lr': 0.0004461648535065869, 'samples': 6432192, 'steps': 33500, 'loss/train': 1.7501734495162964} -11/07/2021 01:58:01 - INFO - __main__ - Step 33502: {'lr': 0.0004461615636677818, 'samples': 6432384, 'steps': 33501, 'loss/train': 1.3026123046875} -11/07/2021 01:58:01 - INFO - __main__ - Step 33503: {'lr': 0.0004461582737405895, 'samples': 6432576, 'steps': 33502, 'loss/train': 1.302112340927124} -11/07/2021 01:58:02 - INFO - __main__ - Step 33504: {'lr': 0.00044615498372501116, 'samples': 6432768, 'steps': 33503, 'loss/train': 1.6485215425491333} -11/07/2021 01:58:02 - INFO - __main__ - Step 33505: {'lr': 0.00044615169362104856, 'samples': 6432960, 'steps': 33504, 'loss/train': 0.8213014602661133} -11/07/2021 01:58:03 - INFO - __main__ - Step 33506: {'lr': 0.00044614840342870293, 'samples': 6433152, 'steps': 33505, 'loss/train': 1.8052080869674683} -11/07/2021 01:58:03 - INFO - __main__ - Step 33507: {'lr': 0.0004461451131479759, 'samples': 6433344, 'steps': 33506, 'loss/train': 1.5932680368423462} -11/07/2021 01:58:04 - INFO - __main__ - Step 33508: {'lr': 0.0004461418227788689, 'samples': 6433536, 'steps': 33507, 'loss/train': 1.8350179195404053} -11/07/2021 01:58:04 - INFO - __main__ - Step 33509: {'lr': 0.00044613853232138343, 'samples': 6433728, 'steps': 33508, 'loss/train': 1.463523268699646} -11/07/2021 01:58:04 - INFO - __main__ - Step 33510: {'lr': 0.0004461352417755209, 'samples': 6433920, 'steps': 33509, 'loss/train': 1.4737497568130493} -11/07/2021 01:58:05 - INFO - __main__ - Step 33511: {'lr': 0.0004461319511412829, 'samples': 6434112, 'steps': 33510, 'loss/train': 1.8179429769515991} -11/07/2021 01:58:06 - INFO - __main__ - Step 33512: {'lr': 0.00044612866041867093, 'samples': 6434304, 'steps': 33511, 'loss/train': 1.6133488416671753} -11/07/2021 01:58:06 - INFO - __main__ - Step 33513: {'lr': 0.0004461253696076863, 'samples': 6434496, 'steps': 33512, 'loss/train': 1.5488224029541016} -11/07/2021 01:58:06 - INFO - __main__ - Step 33514: {'lr': 0.00044612207870833073, 'samples': 6434688, 'steps': 33513, 'loss/train': 1.478121042251587} -11/07/2021 01:58:07 - INFO - __main__ - Step 33515: {'lr': 0.0004461187877206055, 'samples': 6434880, 'steps': 33514, 'loss/train': 1.1957716941833496} -11/07/2021 01:58:08 - INFO - __main__ - Step 33516: {'lr': 0.00044611549664451216, 'samples': 6435072, 'steps': 33515, 'loss/train': 1.937234878540039} -11/07/2021 01:58:08 - INFO - __main__ - Step 33517: {'lr': 0.0004461122054800522, 'samples': 6435264, 'steps': 33516, 'loss/train': 1.4780783653259277} -11/07/2021 01:58:09 - INFO - __main__ - Step 33518: {'lr': 0.00044610891422722714, 'samples': 6435456, 'steps': 33517, 'loss/train': 1.3189829587936401} -11/07/2021 01:58:09 - INFO - __main__ - Step 33519: {'lr': 0.00044610562288603846, 'samples': 6435648, 'steps': 33518, 'loss/train': 1.0899434089660645} -11/07/2021 01:58:09 - INFO - __main__ - Step 33520: {'lr': 0.00044610233145648756, 'samples': 6435840, 'steps': 33519, 'loss/train': 1.1641112565994263} -11/07/2021 01:58:10 - INFO - __main__ - Step 33521: {'lr': 0.00044609903993857603, 'samples': 6436032, 'steps': 33520, 'loss/train': 1.6565847396850586} -11/07/2021 01:58:11 - INFO - __main__ - Step 33522: {'lr': 0.0004460957483323052, 'samples': 6436224, 'steps': 33521, 'loss/train': 1.5398041009902954} -11/07/2021 01:58:11 - INFO - __main__ - Step 33523: {'lr': 0.0004460924566376767, 'samples': 6436416, 'steps': 33522, 'loss/train': 1.4112274646759033} -11/07/2021 01:58:11 - INFO - __main__ - Step 33524: {'lr': 0.00044608916485469195, 'samples': 6436608, 'steps': 33523, 'loss/train': 1.9318363666534424} -11/07/2021 01:58:12 - INFO - __main__ - Step 33525: {'lr': 0.0004460858729833525, 'samples': 6436800, 'steps': 33524, 'loss/train': 1.6608656644821167} -11/07/2021 01:58:13 - INFO - __main__ - Step 33526: {'lr': 0.0004460825810236598, 'samples': 6436992, 'steps': 33525, 'loss/train': 1.7003602981567383} -11/07/2021 01:58:13 - INFO - __main__ - Step 33527: {'lr': 0.00044607928897561524, 'samples': 6437184, 'steps': 33526, 'loss/train': 1.3078749179840088} -11/07/2021 01:58:13 - INFO - __main__ - Step 33528: {'lr': 0.0004460759968392204, 'samples': 6437376, 'steps': 33527, 'loss/train': 1.5011610984802246} -11/07/2021 01:58:14 - INFO - __main__ - Step 33529: {'lr': 0.0004460727046144768, 'samples': 6437568, 'steps': 33528, 'loss/train': 0.829114556312561} -11/07/2021 01:58:14 - INFO - __main__ - Step 33530: {'lr': 0.00044606941230138574, 'samples': 6437760, 'steps': 33529, 'loss/train': 1.5233813524246216} -11/07/2021 01:58:15 - INFO - __main__ - Step 33531: {'lr': 0.0004460661198999489, 'samples': 6437952, 'steps': 33530, 'loss/train': 1.2734391689300537} -11/07/2021 01:58:15 - INFO - __main__ - Step 33532: {'lr': 0.0004460628274101677, 'samples': 6438144, 'steps': 33531, 'loss/train': 1.682828664779663} -11/07/2021 01:58:16 - INFO - __main__ - Step 33533: {'lr': 0.0004460595348320436, 'samples': 6438336, 'steps': 33532, 'loss/train': 1.3908790349960327} -11/07/2021 01:58:16 - INFO - __main__ - Step 33534: {'lr': 0.0004460562421655782, 'samples': 6438528, 'steps': 33533, 'loss/train': 1.3196871280670166} -11/07/2021 01:58:16 - INFO - __main__ - Step 33535: {'lr': 0.0004460529494107727, 'samples': 6438720, 'steps': 33534, 'loss/train': 1.2997703552246094} -11/07/2021 01:58:17 - INFO - __main__ - Step 33536: {'lr': 0.00044604965656762884, 'samples': 6438912, 'steps': 33535, 'loss/train': 1.7080373764038086} -11/07/2021 01:58:18 - INFO - __main__ - Step 33537: {'lr': 0.0004460463636361481, 'samples': 6439104, 'steps': 33536, 'loss/train': 1.4093761444091797} -11/07/2021 01:58:18 - INFO - __main__ - Step 33538: {'lr': 0.00044604307061633187, 'samples': 6439296, 'steps': 33537, 'loss/train': 2.498072624206543} -11/07/2021 01:58:18 - INFO - __main__ - Step 33539: {'lr': 0.0004460397775081816, 'samples': 6439488, 'steps': 33538, 'loss/train': 1.409963846206665} -11/07/2021 01:58:19 - INFO - __main__ - Step 33540: {'lr': 0.00044603648431169884, 'samples': 6439680, 'steps': 33539, 'loss/train': 1.581534504890442} -11/07/2021 01:58:19 - INFO - __main__ - Step 33541: {'lr': 0.0004460331910268851, 'samples': 6439872, 'steps': 33540, 'loss/train': 1.930228590965271} -11/07/2021 01:58:20 - INFO - __main__ - Step 33542: {'lr': 0.0004460298976537418, 'samples': 6440064, 'steps': 33541, 'loss/train': 1.6128143072128296} -11/07/2021 01:58:21 - INFO - __main__ - Step 33543: {'lr': 0.00044602660419227046, 'samples': 6440256, 'steps': 33542, 'loss/train': 1.5586212873458862} -11/07/2021 01:58:21 - INFO - __main__ - Step 33544: {'lr': 0.0004460233106424726, 'samples': 6440448, 'steps': 33543, 'loss/train': 1.1883673667907715} -11/07/2021 01:58:21 - INFO - __main__ - Step 33545: {'lr': 0.00044602001700434963, 'samples': 6440640, 'steps': 33544, 'loss/train': 0.7786942720413208} -11/07/2021 01:58:22 - INFO - __main__ - Step 33546: {'lr': 0.00044601672327790304, 'samples': 6440832, 'steps': 33545, 'loss/train': 1.3047401905059814} -11/07/2021 01:58:23 - INFO - __main__ - Step 33547: {'lr': 0.00044601342946313437, 'samples': 6441024, 'steps': 33546, 'loss/train': 1.2048883438110352} -11/07/2021 01:58:23 - INFO - __main__ - Step 33548: {'lr': 0.0004460101355600451, 'samples': 6441216, 'steps': 33547, 'loss/train': 1.9878222942352295} -11/07/2021 01:58:23 - INFO - __main__ - Step 33549: {'lr': 0.0004460068415686366, 'samples': 6441408, 'steps': 33548, 'loss/train': 1.798831582069397} -11/07/2021 01:58:24 - INFO - __main__ - Step 33550: {'lr': 0.0004460035474889105, 'samples': 6441600, 'steps': 33549, 'loss/train': 1.7199984788894653} -11/07/2021 01:58:24 - INFO - __main__ - Step 33551: {'lr': 0.00044600025332086824, 'samples': 6441792, 'steps': 33550, 'loss/train': 1.4604843854904175} -11/07/2021 01:58:25 - INFO - __main__ - Step 33552: {'lr': 0.0004459969590645113, 'samples': 6441984, 'steps': 33551, 'loss/train': 1.351448893547058} -11/07/2021 01:58:25 - INFO - __main__ - Step 33553: {'lr': 0.000445993664719841, 'samples': 6442176, 'steps': 33552, 'loss/train': 1.5944808721542358} -11/07/2021 01:58:26 - INFO - __main__ - Step 33554: {'lr': 0.0004459903702868592, 'samples': 6442368, 'steps': 33553, 'loss/train': 1.6904922723770142} -11/07/2021 01:58:26 - INFO - __main__ - Step 33555: {'lr': 0.00044598707576556706, 'samples': 6442560, 'steps': 33554, 'loss/train': 2.0922768115997314} -11/07/2021 01:58:26 - INFO - __main__ - Step 33556: {'lr': 0.00044598378115596614, 'samples': 6442752, 'steps': 33555, 'loss/train': 1.494410753250122} -11/07/2021 01:58:27 - INFO - __main__ - Step 33557: {'lr': 0.000445980486458058, 'samples': 6442944, 'steps': 33556, 'loss/train': 1.659221887588501} -11/07/2021 01:58:28 - INFO - __main__ - Step 33558: {'lr': 0.0004459771916718441, 'samples': 6443136, 'steps': 33557, 'loss/train': 1.557417392730713} -11/07/2021 01:58:28 - INFO - __main__ - Step 33559: {'lr': 0.0004459738967973258, 'samples': 6443328, 'steps': 33558, 'loss/train': 1.2724696397781372} -11/07/2021 01:58:29 - INFO - __main__ - Step 33560: {'lr': 0.00044597060183450477, 'samples': 6443520, 'steps': 33559, 'loss/train': 1.2706172466278076} -11/07/2021 01:58:29 - INFO - __main__ - Step 33561: {'lr': 0.00044596730678338236, 'samples': 6443712, 'steps': 33560, 'loss/train': 1.454308032989502} -11/07/2021 01:58:30 - INFO - __main__ - Step 33562: {'lr': 0.0004459640116439602, 'samples': 6443904, 'steps': 33561, 'loss/train': 1.3097172975540161} -11/07/2021 01:58:30 - INFO - __main__ - Step 33563: {'lr': 0.0004459607164162396, 'samples': 6444096, 'steps': 33562, 'loss/train': 1.4599028825759888} -11/07/2021 01:58:31 - INFO - __main__ - Step 33564: {'lr': 0.00044595742110022216, 'samples': 6444288, 'steps': 33563, 'loss/train': 1.3603464365005493} -11/07/2021 01:58:31 - INFO - __main__ - Step 33565: {'lr': 0.00044595412569590934, 'samples': 6444480, 'steps': 33564, 'loss/train': 1.0743993520736694} -11/07/2021 01:58:31 - INFO - __main__ - Step 33566: {'lr': 0.0004459508302033025, 'samples': 6444672, 'steps': 33565, 'loss/train': 1.602871060371399} -11/07/2021 01:58:32 - INFO - __main__ - Step 33567: {'lr': 0.00044594753462240335, 'samples': 6444864, 'steps': 33566, 'loss/train': 1.5943396091461182} -11/07/2021 01:58:33 - INFO - __main__ - Step 33568: {'lr': 0.0004459442389532132, 'samples': 6445056, 'steps': 33567, 'loss/train': 1.4100042581558228} -11/07/2021 01:58:33 - INFO - __main__ - Step 33569: {'lr': 0.0004459409431957337, 'samples': 6445248, 'steps': 33568, 'loss/train': 1.6690175533294678} -11/07/2021 01:58:33 - INFO - __main__ - Step 33570: {'lr': 0.00044593764734996615, 'samples': 6445440, 'steps': 33569, 'loss/train': 1.4638475179672241} -11/07/2021 01:58:34 - INFO - __main__ - Step 33571: {'lr': 0.00044593435141591215, 'samples': 6445632, 'steps': 33570, 'loss/train': 1.7800277471542358} -11/07/2021 01:58:35 - INFO - __main__ - Step 33572: {'lr': 0.00044593105539357313, 'samples': 6445824, 'steps': 33571, 'loss/train': 1.390863299369812} -11/07/2021 01:58:35 - INFO - __main__ - Step 33573: {'lr': 0.00044592775928295063, 'samples': 6446016, 'steps': 33572, 'loss/train': 1.5232267379760742} -11/07/2021 01:58:35 - INFO - __main__ - Step 33574: {'lr': 0.0004459244630840461, 'samples': 6446208, 'steps': 33573, 'loss/train': 0.9683477878570557} -11/07/2021 01:58:36 - INFO - __main__ - Step 33575: {'lr': 0.000445921166796861, 'samples': 6446400, 'steps': 33574, 'loss/train': 1.6692181825637817} -11/07/2021 01:58:36 - INFO - __main__ - Step 33576: {'lr': 0.00044591787042139684, 'samples': 6446592, 'steps': 33575, 'loss/train': 1.3814464807510376} -11/07/2021 01:58:37 - INFO - __main__ - Step 33577: {'lr': 0.0004459145739576552, 'samples': 6446784, 'steps': 33576, 'loss/train': 1.4177926778793335} -11/07/2021 01:58:38 - INFO - __main__ - Step 33578: {'lr': 0.0004459112774056374, 'samples': 6446976, 'steps': 33577, 'loss/train': 1.8841018676757812} -11/07/2021 01:58:38 - INFO - __main__ - Step 33579: {'lr': 0.000445907980765345, 'samples': 6447168, 'steps': 33578, 'loss/train': 1.088173508644104} -11/07/2021 01:58:38 - INFO - __main__ - Step 33580: {'lr': 0.00044590468403677954, 'samples': 6447360, 'steps': 33579, 'loss/train': 1.6133272647857666} -11/07/2021 01:58:39 - INFO - __main__ - Step 33581: {'lr': 0.00044590138721994243, 'samples': 6447552, 'steps': 33580, 'loss/train': 1.7381786108016968} -11/07/2021 01:58:40 - INFO - __main__ - Step 33582: {'lr': 0.00044589809031483517, 'samples': 6447744, 'steps': 33581, 'loss/train': 1.8601634502410889} -11/07/2021 01:58:40 - INFO - __main__ - Step 33583: {'lr': 0.0004458947933214592, 'samples': 6447936, 'steps': 33582, 'loss/train': 1.626869559288025} -11/07/2021 01:58:40 - INFO - __main__ - Step 33584: {'lr': 0.0004458914962398162, 'samples': 6448128, 'steps': 33583, 'loss/train': 1.0731712579727173} -11/07/2021 01:58:41 - INFO - __main__ - Step 33585: {'lr': 0.0004458881990699074, 'samples': 6448320, 'steps': 33584, 'loss/train': 1.6439554691314697} -11/07/2021 01:58:41 - INFO - __main__ - Step 33586: {'lr': 0.00044588490181173435, 'samples': 6448512, 'steps': 33585, 'loss/train': 1.6263537406921387} -11/07/2021 01:58:41 - INFO - __main__ - Step 33587: {'lr': 0.0004458816044652987, 'samples': 6448704, 'steps': 33586, 'loss/train': 1.4457780122756958} -11/07/2021 01:58:42 - INFO - __main__ - Step 33588: {'lr': 0.00044587830703060176, 'samples': 6448896, 'steps': 33587, 'loss/train': 1.634812831878662} -11/07/2021 01:58:43 - INFO - __main__ - Step 33589: {'lr': 0.00044587500950764514, 'samples': 6449088, 'steps': 33588, 'loss/train': 1.8523485660552979} -11/07/2021 01:58:43 - INFO - __main__ - Step 33590: {'lr': 0.0004458717118964302, 'samples': 6449280, 'steps': 33589, 'loss/train': 1.581408977508545} -11/07/2021 01:58:43 - INFO - __main__ - Step 33591: {'lr': 0.0004458684141969585, 'samples': 6449472, 'steps': 33590, 'loss/train': 1.5999499559402466} -11/07/2021 01:58:44 - INFO - __main__ - Step 33592: {'lr': 0.0004458651164092315, 'samples': 6449664, 'steps': 33591, 'loss/train': 1.786829948425293} -11/07/2021 01:58:45 - INFO - __main__ - Step 33593: {'lr': 0.00044586181853325076, 'samples': 6449856, 'steps': 33592, 'loss/train': 1.5149943828582764} -11/07/2021 01:58:45 - INFO - __main__ - Step 33594: {'lr': 0.0004458585205690177, 'samples': 6450048, 'steps': 33593, 'loss/train': 1.1522443294525146} -11/07/2021 01:58:46 - INFO - __main__ - Step 33595: {'lr': 0.0004458552225165338, 'samples': 6450240, 'steps': 33594, 'loss/train': 1.3876985311508179} -11/07/2021 01:58:46 - INFO - __main__ - Step 33596: {'lr': 0.00044585192437580044, 'samples': 6450432, 'steps': 33595, 'loss/train': 1.510378360748291} -11/07/2021 01:58:46 - INFO - __main__ - Step 33597: {'lr': 0.0004458486261468194, 'samples': 6450624, 'steps': 33596, 'loss/train': 1.6011792421340942} -11/07/2021 01:58:47 - INFO - __main__ - Step 33598: {'lr': 0.0004458453278295919, 'samples': 6450816, 'steps': 33597, 'loss/train': 1.1178830862045288} -11/07/2021 01:58:48 - INFO - __main__ - Step 33599: {'lr': 0.00044584202942411956, 'samples': 6451008, 'steps': 33598, 'loss/train': 1.7060731649398804} -11/07/2021 01:58:48 - INFO - __main__ - Step 33600: {'lr': 0.00044583873093040376, 'samples': 6451200, 'steps': 33599, 'loss/train': 1.4395594596862793} -11/07/2021 01:58:48 - INFO - __main__ - Step 33601: {'lr': 0.00044583543234844616, 'samples': 6451392, 'steps': 33600, 'loss/train': 1.3613064289093018} -11/07/2021 01:58:49 - INFO - __main__ - Step 33602: {'lr': 0.00044583213367824806, 'samples': 6451584, 'steps': 33601, 'loss/train': 1.7319318056106567} -11/07/2021 01:58:50 - INFO - __main__ - Step 33603: {'lr': 0.00044582883491981097, 'samples': 6451776, 'steps': 33602, 'loss/train': 1.7198821306228638} -11/07/2021 01:58:50 - INFO - __main__ - Step 33604: {'lr': 0.0004458255360731365, 'samples': 6451968, 'steps': 33603, 'loss/train': 1.7537992000579834} -11/07/2021 01:58:51 - INFO - __main__ - Step 33605: {'lr': 0.00044582223713822606, 'samples': 6452160, 'steps': 33604, 'loss/train': 1.4399713277816772} -11/07/2021 01:58:51 - INFO - __main__ - Step 33606: {'lr': 0.0004458189381150811, 'samples': 6452352, 'steps': 33605, 'loss/train': 1.2576117515563965} -11/07/2021 01:58:51 - INFO - __main__ - Step 33607: {'lr': 0.00044581563900370326, 'samples': 6452544, 'steps': 33606, 'loss/train': 1.5778969526290894} -11/07/2021 01:58:52 - INFO - __main__ - Step 33608: {'lr': 0.0004458123398040938, 'samples': 6452736, 'steps': 33607, 'loss/train': 1.6962167024612427} -11/07/2021 01:58:53 - INFO - __main__ - Step 33609: {'lr': 0.0004458090405162544, 'samples': 6452928, 'steps': 33608, 'loss/train': 1.5823737382888794} -11/07/2021 01:58:53 - INFO - __main__ - Step 33610: {'lr': 0.0004458057411401864, 'samples': 6453120, 'steps': 33609, 'loss/train': 1.258210301399231} -11/07/2021 01:58:53 - INFO - __main__ - Step 33611: {'lr': 0.00044580244167589136, 'samples': 6453312, 'steps': 33610, 'loss/train': 1.672492265701294} -11/07/2021 01:58:54 - INFO - __main__ - Step 33612: {'lr': 0.00044579914212337083, 'samples': 6453504, 'steps': 33611, 'loss/train': 1.6796356439590454} -11/07/2021 01:58:54 - INFO - __main__ - Step 33613: {'lr': 0.00044579584248262617, 'samples': 6453696, 'steps': 33612, 'loss/train': 1.7429602146148682} -11/07/2021 01:58:55 - INFO - __main__ - Step 33614: {'lr': 0.0004457925427536589, 'samples': 6453888, 'steps': 33613, 'loss/train': 1.4019567966461182} -11/07/2021 01:58:55 - INFO - __main__ - Step 33615: {'lr': 0.0004457892429364706, 'samples': 6454080, 'steps': 33614, 'loss/train': 1.949160099029541} -11/07/2021 01:58:56 - INFO - __main__ - Step 33616: {'lr': 0.00044578594303106266, 'samples': 6454272, 'steps': 33615, 'loss/train': 1.8838460445404053} -11/07/2021 01:58:56 - INFO - __main__ - Step 33617: {'lr': 0.00044578264303743654, 'samples': 6454464, 'steps': 33616, 'loss/train': 1.7442598342895508} -11/07/2021 01:58:56 - INFO - __main__ - Step 33618: {'lr': 0.00044577934295559387, 'samples': 6454656, 'steps': 33617, 'loss/train': 1.8235018253326416} -11/07/2021 01:58:58 - INFO - __main__ - Step 33619: {'lr': 0.000445776042785536, 'samples': 6454848, 'steps': 33618, 'loss/train': 1.3736298084259033} -11/07/2021 01:58:58 - INFO - __main__ - Step 33620: {'lr': 0.00044577274252726454, 'samples': 6455040, 'steps': 33619, 'loss/train': 1.5522053241729736} -11/07/2021 01:58:58 - INFO - __main__ - Step 33621: {'lr': 0.00044576944218078075, 'samples': 6455232, 'steps': 33620, 'loss/train': 2.243539571762085} -11/07/2021 01:58:59 - INFO - __main__ - Step 33622: {'lr': 0.00044576614174608644, 'samples': 6455424, 'steps': 33621, 'loss/train': 1.4455134868621826} -11/07/2021 01:58:59 - INFO - __main__ - Step 33623: {'lr': 0.0004457628412231828, 'samples': 6455616, 'steps': 33622, 'loss/train': 1.6696631908416748} -11/07/2021 01:59:00 - INFO - __main__ - Step 33624: {'lr': 0.0004457595406120715, 'samples': 6455808, 'steps': 33623, 'loss/train': 0.5843969583511353} -11/07/2021 01:59:00 - INFO - __main__ - Step 33625: {'lr': 0.000445756239912754, 'samples': 6456000, 'steps': 33624, 'loss/train': 1.5091285705566406} -11/07/2021 01:59:01 - INFO - __main__ - Step 33626: {'lr': 0.00044575293912523173, 'samples': 6456192, 'steps': 33625, 'loss/train': 1.6436296701431274} -11/07/2021 01:59:01 - INFO - __main__ - Step 33627: {'lr': 0.0004457496382495062, 'samples': 6456384, 'steps': 33626, 'loss/train': 1.0140951871871948} -11/07/2021 01:59:01 - INFO - __main__ - Step 33628: {'lr': 0.00044574633728557887, 'samples': 6456576, 'steps': 33627, 'loss/train': 1.8059523105621338} -11/07/2021 01:59:02 - INFO - __main__ - Step 33629: {'lr': 0.0004457430362334513, 'samples': 6456768, 'steps': 33628, 'loss/train': 1.9687384366989136} -11/07/2021 01:59:03 - INFO - __main__ - Step 33630: {'lr': 0.00044573973509312494, 'samples': 6456960, 'steps': 33629, 'loss/train': 1.120401382446289} -11/07/2021 01:59:03 - INFO - __main__ - Step 33631: {'lr': 0.00044573643386460127, 'samples': 6457152, 'steps': 33630, 'loss/train': 1.464900255203247} -11/07/2021 01:59:03 - INFO - __main__ - Step 33632: {'lr': 0.00044573313254788176, 'samples': 6457344, 'steps': 33631, 'loss/train': 1.1901419162750244} -11/07/2021 01:59:04 - INFO - __main__ - Step 33633: {'lr': 0.00044572983114296794, 'samples': 6457536, 'steps': 33632, 'loss/train': 2.5087969303131104} -11/07/2021 01:59:04 - INFO - __main__ - Step 33634: {'lr': 0.00044572652964986126, 'samples': 6457728, 'steps': 33633, 'loss/train': 1.0945255756378174} -11/07/2021 01:59:05 - INFO - __main__ - Step 33635: {'lr': 0.0004457232280685633, 'samples': 6457920, 'steps': 33634, 'loss/train': 1.6997337341308594} -11/07/2021 01:59:06 - INFO - __main__ - Step 33636: {'lr': 0.0004457199263990754, 'samples': 6458112, 'steps': 33635, 'loss/train': 1.3791000843048096} -11/07/2021 01:59:06 - INFO - __main__ - Step 33637: {'lr': 0.0004457166246413992, 'samples': 6458304, 'steps': 33636, 'loss/train': 1.040553092956543} -11/07/2021 01:59:06 - INFO - __main__ - Step 33638: {'lr': 0.000445713322795536, 'samples': 6458496, 'steps': 33637, 'loss/train': 1.3512609004974365} -11/07/2021 01:59:07 - INFO - __main__ - Step 33639: {'lr': 0.0004457100208614875, 'samples': 6458688, 'steps': 33638, 'loss/train': 1.6804062128067017} -11/07/2021 01:59:08 - INFO - __main__ - Step 33640: {'lr': 0.00044570671883925497, 'samples': 6458880, 'steps': 33639, 'loss/train': 1.4761654138565063} -11/07/2021 01:59:08 - INFO - __main__ - Step 33641: {'lr': 0.00044570341672884006, 'samples': 6459072, 'steps': 33640, 'loss/train': 1.2570524215698242} -11/07/2021 01:59:08 - INFO - __main__ - Step 33642: {'lr': 0.0004457001145302443, 'samples': 6459264, 'steps': 33641, 'loss/train': 1.4354379177093506} -11/07/2021 01:59:09 - INFO - __main__ - Step 33643: {'lr': 0.00044569681224346897, 'samples': 6459456, 'steps': 33642, 'loss/train': 1.6788442134857178} -11/07/2021 01:59:09 - INFO - __main__ - Step 33644: {'lr': 0.0004456935098685158, 'samples': 6459648, 'steps': 33643, 'loss/train': 1.1437855958938599} -11/07/2021 01:59:10 - INFO - __main__ - Step 33645: {'lr': 0.000445690207405386, 'samples': 6459840, 'steps': 33644, 'loss/train': 1.4899927377700806} -11/07/2021 01:59:10 - INFO - __main__ - Step 33646: {'lr': 0.00044568690485408125, 'samples': 6460032, 'steps': 33645, 'loss/train': 1.0562697649002075} -11/07/2021 01:59:11 - INFO - __main__ - Step 33647: {'lr': 0.0004456836022146031, 'samples': 6460224, 'steps': 33646, 'loss/train': 1.6380075216293335} -11/07/2021 01:59:11 - INFO - __main__ - Step 33648: {'lr': 0.00044568029948695287, 'samples': 6460416, 'steps': 33647, 'loss/train': 1.5932193994522095} -11/07/2021 01:59:12 - INFO - __main__ - Step 33649: {'lr': 0.0004456769966711321, 'samples': 6460608, 'steps': 33648, 'loss/train': 1.6578596830368042} -11/07/2021 01:59:12 - INFO - __main__ - Step 33650: {'lr': 0.00044567369376714226, 'samples': 6460800, 'steps': 33649, 'loss/train': 1.3997435569763184} -11/07/2021 01:59:13 - INFO - __main__ - Step 33651: {'lr': 0.00044567039077498497, 'samples': 6460992, 'steps': 33650, 'loss/train': 1.5730409622192383} -11/07/2021 01:59:13 - INFO - __main__ - Step 33652: {'lr': 0.00044566708769466155, 'samples': 6461184, 'steps': 33651, 'loss/train': 0.9869714379310608} -11/07/2021 01:59:14 - INFO - __main__ - Step 33653: {'lr': 0.00044566378452617363, 'samples': 6461376, 'steps': 33652, 'loss/train': 1.5953766107559204} -11/07/2021 01:59:14 - INFO - __main__ - Step 33654: {'lr': 0.0004456604812695226, 'samples': 6461568, 'steps': 33653, 'loss/train': 1.6929657459259033} -11/07/2021 01:59:15 - INFO - __main__ - Step 33655: {'lr': 0.0004456571779247099, 'samples': 6461760, 'steps': 33654, 'loss/train': 1.1120388507843018} -11/07/2021 01:59:15 - INFO - __main__ - Step 33656: {'lr': 0.0004456538744917372, 'samples': 6461952, 'steps': 33655, 'loss/train': 1.0251704454421997} -11/07/2021 01:59:16 - INFO - __main__ - Step 33657: {'lr': 0.0004456505709706059, 'samples': 6462144, 'steps': 33656, 'loss/train': 1.697401523590088} -11/07/2021 01:59:16 - INFO - __main__ - Step 33658: {'lr': 0.0004456472673613174, 'samples': 6462336, 'steps': 33657, 'loss/train': 1.685717225074768} -11/07/2021 01:59:16 - INFO - __main__ - Step 33659: {'lr': 0.00044564396366387327, 'samples': 6462528, 'steps': 33658, 'loss/train': 1.6014701128005981} -11/07/2021 01:59:17 - INFO - __main__ - Step 33660: {'lr': 0.000445640659878275, 'samples': 6462720, 'steps': 33659, 'loss/train': 1.3411377668380737} -11/07/2021 01:59:18 - INFO - __main__ - Step 33661: {'lr': 0.00044563735600452407, 'samples': 6462912, 'steps': 33660, 'loss/train': 1.6042089462280273} -11/07/2021 01:59:18 - INFO - __main__ - Step 33662: {'lr': 0.000445634052042622, 'samples': 6463104, 'steps': 33661, 'loss/train': 1.6241892576217651} -11/07/2021 01:59:18 - INFO - __main__ - Step 33663: {'lr': 0.00044563074799257015, 'samples': 6463296, 'steps': 33662, 'loss/train': 0.9637057781219482} -11/07/2021 01:59:19 - INFO - __main__ - Step 33664: {'lr': 0.0004456274438543702, 'samples': 6463488, 'steps': 33663, 'loss/train': 1.9259538650512695} -11/07/2021 01:59:20 - INFO - __main__ - Step 33665: {'lr': 0.0004456241396280234, 'samples': 6463680, 'steps': 33664, 'loss/train': 1.3537373542785645} -11/07/2021 01:59:20 - INFO - __main__ - Step 33666: {'lr': 0.00044562083531353154, 'samples': 6463872, 'steps': 33665, 'loss/train': 1.466401219367981} -11/07/2021 01:59:21 - INFO - __main__ - Step 33667: {'lr': 0.00044561753091089585, 'samples': 6464064, 'steps': 33666, 'loss/train': 1.6249371767044067} -11/07/2021 01:59:21 - INFO - __main__ - Step 33668: {'lr': 0.00044561422642011794, 'samples': 6464256, 'steps': 33667, 'loss/train': 1.7363765239715576} -11/07/2021 01:59:21 - INFO - __main__ - Step 33669: {'lr': 0.00044561092184119933, 'samples': 6464448, 'steps': 33668, 'loss/train': 1.6479049921035767} -11/07/2021 01:59:22 - INFO - __main__ - Step 33670: {'lr': 0.00044560761717414143, 'samples': 6464640, 'steps': 33669, 'loss/train': 0.8955526947975159} -11/07/2021 01:59:23 - INFO - __main__ - Step 33671: {'lr': 0.0004456043124189458, 'samples': 6464832, 'steps': 33670, 'loss/train': 1.129746913909912} -11/07/2021 01:59:23 - INFO - __main__ - Step 33672: {'lr': 0.00044560100757561386, 'samples': 6465024, 'steps': 33671, 'loss/train': 1.6933951377868652} -11/07/2021 01:59:23 - INFO - __main__ - Step 33673: {'lr': 0.000445597702644147, 'samples': 6465216, 'steps': 33672, 'loss/train': 1.821217656135559} -11/07/2021 01:59:24 - INFO - __main__ - Step 33674: {'lr': 0.000445594397624547, 'samples': 6465408, 'steps': 33673, 'loss/train': 1.5372188091278076} -11/07/2021 01:59:25 - INFO - __main__ - Step 33675: {'lr': 0.0004455910925168151, 'samples': 6465600, 'steps': 33674, 'loss/train': 1.3831593990325928} -11/07/2021 01:59:25 - INFO - __main__ - Step 33676: {'lr': 0.0004455877873209529, 'samples': 6465792, 'steps': 33675, 'loss/train': 1.8606778383255005} -11/07/2021 01:59:25 - INFO - __main__ - Step 33677: {'lr': 0.00044558448203696184, 'samples': 6465984, 'steps': 33676, 'loss/train': 1.8869925737380981} -11/07/2021 01:59:26 - INFO - __main__ - Step 33678: {'lr': 0.0004455811766648434, 'samples': 6466176, 'steps': 33677, 'loss/train': 1.6165025234222412} -11/07/2021 01:59:26 - INFO - __main__ - Step 33679: {'lr': 0.0004455778712045992, 'samples': 6466368, 'steps': 33678, 'loss/train': 1.620165228843689} -11/07/2021 01:59:27 - INFO - __main__ - Step 33680: {'lr': 0.0004455745656562306, 'samples': 6466560, 'steps': 33679, 'loss/train': 1.4367172718048096} -11/07/2021 01:59:28 - INFO - __main__ - Step 33681: {'lr': 0.000445571260019739, 'samples': 6466752, 'steps': 33680, 'loss/train': 1.590633511543274} -11/07/2021 01:59:28 - INFO - __main__ - Step 33682: {'lr': 0.00044556795429512617, 'samples': 6466944, 'steps': 33681, 'loss/train': 1.524424433708191} -11/07/2021 01:59:28 - INFO - __main__ - Step 33683: {'lr': 0.0004455646484823933, 'samples': 6467136, 'steps': 33682, 'loss/train': 2.1249895095825195} -11/07/2021 01:59:29 - INFO - __main__ - Step 33684: {'lr': 0.00044556134258154215, 'samples': 6467328, 'steps': 33683, 'loss/train': 1.1808171272277832} -11/07/2021 01:59:29 - INFO - __main__ - Step 33685: {'lr': 0.000445558036592574, 'samples': 6467520, 'steps': 33684, 'loss/train': 2.523301362991333} -11/07/2021 01:59:30 - INFO - __main__ - Step 33686: {'lr': 0.0004455547305154904, 'samples': 6467712, 'steps': 33685, 'loss/train': 1.156882643699646} -11/07/2021 01:59:30 - INFO - __main__ - Step 33687: {'lr': 0.00044555142435029284, 'samples': 6467904, 'steps': 33686, 'loss/train': 1.8231897354125977} -11/07/2021 01:59:31 - INFO - __main__ - Step 33688: {'lr': 0.0004455481180969829, 'samples': 6468096, 'steps': 33687, 'loss/train': 1.935068130493164} -11/07/2021 01:59:31 - INFO - __main__ - Step 33689: {'lr': 0.00044554481175556194, 'samples': 6468288, 'steps': 33688, 'loss/train': 1.3995652198791504} -11/07/2021 01:59:31 - INFO - __main__ - Step 33690: {'lr': 0.00044554150532603154, 'samples': 6468480, 'steps': 33689, 'loss/train': 1.949639081954956} -11/07/2021 01:59:32 - INFO - __main__ - Step 33691: {'lr': 0.00044553819880839313, 'samples': 6468672, 'steps': 33690, 'loss/train': 2.097712516784668} -11/07/2021 01:59:33 - INFO - __main__ - Step 33692: {'lr': 0.0004455348922026483, 'samples': 6468864, 'steps': 33691, 'loss/train': 1.9351541996002197} -11/07/2021 01:59:33 - INFO - __main__ - Step 33693: {'lr': 0.00044553158550879833, 'samples': 6469056, 'steps': 33692, 'loss/train': 1.3654865026474} -11/07/2021 01:59:34 - INFO - __main__ - Step 33694: {'lr': 0.00044552827872684493, 'samples': 6469248, 'steps': 33693, 'loss/train': 1.9272459745407104} -11/07/2021 01:59:34 - INFO - __main__ - Step 33695: {'lr': 0.00044552497185678953, 'samples': 6469440, 'steps': 33694, 'loss/train': 1.2972309589385986} -11/07/2021 01:59:35 - INFO - __main__ - Step 33696: {'lr': 0.00044552166489863354, 'samples': 6469632, 'steps': 33695, 'loss/train': 1.9361430406570435} -11/07/2021 01:59:35 - INFO - __main__ - Step 33697: {'lr': 0.0004455183578523785, 'samples': 6469824, 'steps': 33696, 'loss/train': 0.749098002910614} -11/07/2021 01:59:36 - INFO - __main__ - Step 33698: {'lr': 0.00044551505071802587, 'samples': 6470016, 'steps': 33697, 'loss/train': 1.533054232597351} -11/07/2021 01:59:36 - INFO - __main__ - Step 33699: {'lr': 0.00044551174349557733, 'samples': 6470208, 'steps': 33698, 'loss/train': 1.4626320600509644} -11/07/2021 01:59:36 - INFO - __main__ - Step 33700: {'lr': 0.0004455084361850341, 'samples': 6470400, 'steps': 33699, 'loss/train': 1.5492607355117798} -11/07/2021 01:59:37 - INFO - __main__ - Step 33701: {'lr': 0.00044550512878639784, 'samples': 6470592, 'steps': 33700, 'loss/train': 1.0996320247650146} -11/07/2021 01:59:38 - INFO - __main__ - Step 33702: {'lr': 0.0004455018212996699, 'samples': 6470784, 'steps': 33701, 'loss/train': 1.604270577430725} -11/07/2021 01:59:38 - INFO - __main__ - Step 33703: {'lr': 0.0004454985137248519, 'samples': 6470976, 'steps': 33702, 'loss/train': 1.4556504487991333} -11/07/2021 01:59:38 - INFO - __main__ - Step 33704: {'lr': 0.00044549520606194525, 'samples': 6471168, 'steps': 33703, 'loss/train': 1.2125494480133057} -11/07/2021 01:59:39 - INFO - __main__ - Step 33705: {'lr': 0.00044549189831095157, 'samples': 6471360, 'steps': 33704, 'loss/train': 1.5545730590820312} -11/07/2021 01:59:39 - INFO - __main__ - Step 33706: {'lr': 0.0004454885904718722, 'samples': 6471552, 'steps': 33705, 'loss/train': 1.6618608236312866} -11/07/2021 01:59:40 - INFO - __main__ - Step 33707: {'lr': 0.0004454852825447087, 'samples': 6471744, 'steps': 33706, 'loss/train': 1.672659158706665} -11/07/2021 01:59:40 - INFO - __main__ - Step 33708: {'lr': 0.0004454819745294625, 'samples': 6471936, 'steps': 33707, 'loss/train': 1.5245839357376099} -11/07/2021 01:59:41 - INFO - __main__ - Step 33709: {'lr': 0.0004454786664261352, 'samples': 6472128, 'steps': 33708, 'loss/train': 1.432139277458191} -11/07/2021 01:59:41 - INFO - __main__ - Step 33710: {'lr': 0.0004454753582347282, 'samples': 6472320, 'steps': 33709, 'loss/train': 1.639000415802002} -11/07/2021 01:59:42 - INFO - __main__ - Step 33711: {'lr': 0.00044547204995524305, 'samples': 6472512, 'steps': 33710, 'loss/train': 1.8348017930984497} -11/07/2021 01:59:43 - INFO - __main__ - Step 33712: {'lr': 0.00044546874158768115, 'samples': 6472704, 'steps': 33711, 'loss/train': 1.8240238428115845} -11/07/2021 01:59:43 - INFO - __main__ - Step 33713: {'lr': 0.00044546543313204415, 'samples': 6472896, 'steps': 33712, 'loss/train': 1.4014474153518677} -11/07/2021 01:59:43 - INFO - __main__ - Step 33714: {'lr': 0.00044546212458833334, 'samples': 6473088, 'steps': 33713, 'loss/train': 1.8096492290496826} -11/07/2021 01:59:44 - INFO - __main__ - Step 33715: {'lr': 0.00044545881595655035, 'samples': 6473280, 'steps': 33714, 'loss/train': 1.4596387147903442} -11/07/2021 01:59:44 - INFO - __main__ - Step 33716: {'lr': 0.00044545550723669664, 'samples': 6473472, 'steps': 33715, 'loss/train': 0.7976817488670349} -11/07/2021 01:59:45 - INFO - __main__ - Step 33717: {'lr': 0.00044545219842877373, 'samples': 6473664, 'steps': 33716, 'loss/train': 1.4980156421661377} -11/07/2021 01:59:45 - INFO - __main__ - Step 33718: {'lr': 0.000445448889532783, 'samples': 6473856, 'steps': 33717, 'loss/train': 1.0201311111450195} -11/07/2021 01:59:46 - INFO - __main__ - Step 33719: {'lr': 0.0004454455805487261, 'samples': 6474048, 'steps': 33718, 'loss/train': 1.7880730628967285} -11/07/2021 01:59:46 - INFO - __main__ - Step 33720: {'lr': 0.0004454422714766043, 'samples': 6474240, 'steps': 33719, 'loss/train': 1.2125518321990967} -11/07/2021 01:59:46 - INFO - __main__ - Step 33721: {'lr': 0.00044543896231641935, 'samples': 6474432, 'steps': 33720, 'loss/train': 1.5912449359893799} -11/07/2021 01:59:47 - INFO - __main__ - Step 33722: {'lr': 0.00044543565306817256, 'samples': 6474624, 'steps': 33721, 'loss/train': 1.6939294338226318} -11/07/2021 01:59:48 - INFO - __main__ - Step 33723: {'lr': 0.00044543234373186556, 'samples': 6474816, 'steps': 33722, 'loss/train': 1.5587968826293945} -11/07/2021 01:59:48 - INFO - __main__ - Step 33724: {'lr': 0.0004454290343074997, 'samples': 6475008, 'steps': 33723, 'loss/train': 1.2607208490371704} -11/07/2021 01:59:48 - INFO - __main__ - Step 33725: {'lr': 0.00044542572479507655, 'samples': 6475200, 'steps': 33724, 'loss/train': 1.7119576930999756} -11/07/2021 01:59:49 - INFO - __main__ - Step 33726: {'lr': 0.00044542241519459757, 'samples': 6475392, 'steps': 33725, 'loss/train': 1.4209587574005127} -11/07/2021 01:59:50 - INFO - __main__ - Step 33727: {'lr': 0.0004454191055060643, 'samples': 6475584, 'steps': 33726, 'loss/train': 1.4337310791015625} -11/07/2021 01:59:51 - INFO - __main__ - Step 33728: {'lr': 0.00044541579572947814, 'samples': 6475776, 'steps': 33727, 'loss/train': 1.5337797403335571} -11/07/2021 01:59:51 - INFO - __main__ - Step 33729: {'lr': 0.0004454124858648407, 'samples': 6475968, 'steps': 33728, 'loss/train': 0.11811182647943497} -11/07/2021 01:59:51 - INFO - __main__ - Step 33730: {'lr': 0.00044540917591215335, 'samples': 6476160, 'steps': 33729, 'loss/train': 1.6598936319351196} -11/07/2021 01:59:52 - INFO - __main__ - Step 33731: {'lr': 0.0004454058658714177, 'samples': 6476352, 'steps': 33730, 'loss/train': 1.5373272895812988} -11/07/2021 01:59:52 - INFO - __main__ - Step 33732: {'lr': 0.0004454025557426351, 'samples': 6476544, 'steps': 33731, 'loss/train': 0.6578313708305359} -11/07/2021 01:59:53 - INFO - __main__ - Step 33733: {'lr': 0.00044539924552580723, 'samples': 6476736, 'steps': 33732, 'loss/train': 1.5535787343978882} -11/07/2021 01:59:53 - INFO - __main__ - Step 33734: {'lr': 0.0004453959352209354, 'samples': 6476928, 'steps': 33733, 'loss/train': 1.8786280155181885} -11/07/2021 01:59:54 - INFO - __main__ - Step 33735: {'lr': 0.0004453926248280212, 'samples': 6477120, 'steps': 33734, 'loss/train': 1.306776762008667} -11/07/2021 01:59:54 - INFO - __main__ - Step 33736: {'lr': 0.0004453893143470661, 'samples': 6477312, 'steps': 33735, 'loss/train': 1.5552427768707275} -11/07/2021 01:59:54 - INFO - __main__ - Step 33737: {'lr': 0.0004453860037780716, 'samples': 6477504, 'steps': 33736, 'loss/train': 1.4108299016952515} -11/07/2021 01:59:55 - INFO - __main__ - Step 33738: {'lr': 0.00044538269312103916, 'samples': 6477696, 'steps': 33737, 'loss/train': 1.8733634948730469} -11/07/2021 01:59:56 - INFO - __main__ - Step 33739: {'lr': 0.00044537938237597033, 'samples': 6477888, 'steps': 33738, 'loss/train': 0.788608193397522} -11/07/2021 01:59:56 - INFO - __main__ - Step 33740: {'lr': 0.00044537607154286645, 'samples': 6478080, 'steps': 33739, 'loss/train': 1.1113461256027222} -11/07/2021 01:59:57 - INFO - __main__ - Step 33741: {'lr': 0.00044537276062172926, 'samples': 6478272, 'steps': 33740, 'loss/train': 1.4108548164367676} -11/07/2021 01:59:57 - INFO - __main__ - Step 33742: {'lr': 0.0004453694496125601, 'samples': 6478464, 'steps': 33741, 'loss/train': 1.6025670766830444} -11/07/2021 01:59:58 - INFO - __main__ - Step 33743: {'lr': 0.0004453661385153604, 'samples': 6478656, 'steps': 33742, 'loss/train': 1.8474880456924438} -11/07/2021 01:59:58 - INFO - __main__ - Step 33744: {'lr': 0.0004453628273301318, 'samples': 6478848, 'steps': 33743, 'loss/train': 1.5394790172576904} -11/07/2021 01:59:59 - INFO - __main__ - Step 33745: {'lr': 0.0004453595160568757, 'samples': 6479040, 'steps': 33744, 'loss/train': 1.138857126235962} -11/07/2021 01:59:59 - INFO - __main__ - Step 33746: {'lr': 0.0004453562046955937, 'samples': 6479232, 'steps': 33745, 'loss/train': 1.4568958282470703} -11/07/2021 01:59:59 - INFO - __main__ - Step 33747: {'lr': 0.00044535289324628704, 'samples': 6479424, 'steps': 33746, 'loss/train': 1.3100298643112183} -11/07/2021 02:00:00 - INFO - __main__ - Step 33748: {'lr': 0.00044534958170895753, 'samples': 6479616, 'steps': 33747, 'loss/train': 1.7168136835098267} -11/07/2021 02:00:01 - INFO - __main__ - Step 33749: {'lr': 0.0004453462700836064, 'samples': 6479808, 'steps': 33748, 'loss/train': 1.7134358882904053} -11/07/2021 02:00:01 - INFO - __main__ - Step 33750: {'lr': 0.0004453429583702353, 'samples': 6480000, 'steps': 33749, 'loss/train': 1.1795400381088257} -11/07/2021 02:00:01 - INFO - __main__ - Step 33751: {'lr': 0.0004453396465688457, 'samples': 6480192, 'steps': 33750, 'loss/train': 1.4245951175689697} -11/07/2021 02:00:02 - INFO - __main__ - Step 33752: {'lr': 0.00044533633467943906, 'samples': 6480384, 'steps': 33751, 'loss/train': 1.7902945280075073} -11/07/2021 02:00:03 - INFO - __main__ - Step 33753: {'lr': 0.00044533302270201693, 'samples': 6480576, 'steps': 33752, 'loss/train': 1.0339568853378296} -11/07/2021 02:00:03 - INFO - __main__ - Step 33754: {'lr': 0.00044532971063658067, 'samples': 6480768, 'steps': 33753, 'loss/train': 1.6112436056137085} -11/07/2021 02:00:04 - INFO - __main__ - Step 33755: {'lr': 0.00044532639848313187, 'samples': 6480960, 'steps': 33754, 'loss/train': 1.2984110116958618} -11/07/2021 02:00:04 - INFO - __main__ - Step 33756: {'lr': 0.0004453230862416721, 'samples': 6481152, 'steps': 33755, 'loss/train': 1.6372071504592896} -11/07/2021 02:00:04 - INFO - __main__ - Step 33757: {'lr': 0.00044531977391220267, 'samples': 6481344, 'steps': 33756, 'loss/train': 1.6506997346878052} -11/07/2021 02:00:05 - INFO - __main__ - Step 33758: {'lr': 0.00044531646149472516, 'samples': 6481536, 'steps': 33757, 'loss/train': 1.0395686626434326} -11/07/2021 02:00:06 - INFO - __main__ - Step 33759: {'lr': 0.00044531314898924116, 'samples': 6481728, 'steps': 33758, 'loss/train': 1.5042260885238647} -11/07/2021 02:00:06 - INFO - __main__ - Step 33760: {'lr': 0.00044530983639575193, 'samples': 6481920, 'steps': 33759, 'loss/train': 1.6232199668884277} -11/07/2021 02:00:06 - INFO - __main__ - Step 33761: {'lr': 0.00044530652371425916, 'samples': 6482112, 'steps': 33760, 'loss/train': 1.5966721773147583} -11/07/2021 02:00:07 - INFO - __main__ - Step 33762: {'lr': 0.00044530321094476434, 'samples': 6482304, 'steps': 33761, 'loss/train': 1.578473448753357} -11/07/2021 02:00:07 - INFO - __main__ - Step 33763: {'lr': 0.0004452998980872689, 'samples': 6482496, 'steps': 33762, 'loss/train': 1.1778452396392822} -11/07/2021 02:00:08 - INFO - __main__ - Step 33764: {'lr': 0.0004452965851417743, 'samples': 6482688, 'steps': 33763, 'loss/train': 1.709043025970459} -11/07/2021 02:00:09 - INFO - __main__ - Step 33765: {'lr': 0.000445293272108282, 'samples': 6482880, 'steps': 33764, 'loss/train': 1.7417343854904175} -11/07/2021 02:00:09 - INFO - __main__ - Step 33766: {'lr': 0.0004452899589867937, 'samples': 6483072, 'steps': 33765, 'loss/train': 0.9052668213844299} -11/07/2021 02:00:09 - INFO - __main__ - Step 33767: {'lr': 0.00044528664577731073, 'samples': 6483264, 'steps': 33766, 'loss/train': 1.6804091930389404} -11/07/2021 02:00:10 - INFO - __main__ - Step 33768: {'lr': 0.00044528333247983456, 'samples': 6483456, 'steps': 33767, 'loss/train': 2.097458600997925} -11/07/2021 02:00:10 - INFO - __main__ - Step 33769: {'lr': 0.0004452800190943667, 'samples': 6483648, 'steps': 33768, 'loss/train': 2.2681474685668945} -11/07/2021 02:00:11 - INFO - __main__ - Step 33770: {'lr': 0.0004452767056209087, 'samples': 6483840, 'steps': 33769, 'loss/train': 1.4090787172317505} -11/07/2021 02:00:11 - INFO - __main__ - Step 33771: {'lr': 0.0004452733920594621, 'samples': 6484032, 'steps': 33770, 'loss/train': 1.3013017177581787} -11/07/2021 02:00:12 - INFO - __main__ - Step 33772: {'lr': 0.0004452700784100283, 'samples': 6484224, 'steps': 33771, 'loss/train': 1.6307063102722168} -11/07/2021 02:00:12 - INFO - __main__ - Step 33773: {'lr': 0.0004452667646726088, 'samples': 6484416, 'steps': 33772, 'loss/train': 1.6249957084655762} -11/07/2021 02:00:13 - INFO - __main__ - Step 33774: {'lr': 0.0004452634508472051, 'samples': 6484608, 'steps': 33773, 'loss/train': 1.4302394390106201} -11/07/2021 02:00:14 - INFO - __main__ - Step 33775: {'lr': 0.0004452601369338187, 'samples': 6484800, 'steps': 33774, 'loss/train': 1.3013135194778442} -11/07/2021 02:00:14 - INFO - __main__ - Step 33776: {'lr': 0.00044525682293245107, 'samples': 6484992, 'steps': 33775, 'loss/train': 1.478948712348938} -11/07/2021 02:00:14 - INFO - __main__ - Step 33777: {'lr': 0.0004452535088431038, 'samples': 6485184, 'steps': 33776, 'loss/train': 1.4473791122436523} -11/07/2021 02:00:15 - INFO - __main__ - Step 33778: {'lr': 0.00044525019466577824, 'samples': 6485376, 'steps': 33777, 'loss/train': 1.9431716203689575} -11/07/2021 02:00:15 - INFO - __main__ - Step 33779: {'lr': 0.000445246880400476, 'samples': 6485568, 'steps': 33778, 'loss/train': 1.5126373767852783} -11/07/2021 02:00:15 - INFO - __main__ - Step 33780: {'lr': 0.0004452435660471985, 'samples': 6485760, 'steps': 33779, 'loss/train': 1.7080620527267456} -11/07/2021 02:00:16 - INFO - __main__ - Step 33781: {'lr': 0.00044524025160594735, 'samples': 6485952, 'steps': 33780, 'loss/train': 0.19829830527305603} -11/07/2021 02:00:17 - INFO - __main__ - Step 33782: {'lr': 0.00044523693707672384, 'samples': 6486144, 'steps': 33781, 'loss/train': 1.7072633504867554} -11/07/2021 02:00:17 - INFO - __main__ - Step 33783: {'lr': 0.0004452336224595296, 'samples': 6486336, 'steps': 33782, 'loss/train': 1.5358293056488037} -11/07/2021 02:00:17 - INFO - __main__ - Step 33784: {'lr': 0.00044523030775436617, 'samples': 6486528, 'steps': 33783, 'loss/train': 1.2860418558120728} -11/07/2021 02:00:18 - INFO - __main__ - Step 33785: {'lr': 0.00044522699296123495, 'samples': 6486720, 'steps': 33784, 'loss/train': 0.9292582273483276} -11/07/2021 02:00:19 - INFO - __main__ - Step 33786: {'lr': 0.0004452236780801374, 'samples': 6486912, 'steps': 33785, 'loss/train': 1.1000765562057495} -11/07/2021 02:00:19 - INFO - __main__ - Step 33787: {'lr': 0.00044522036311107514, 'samples': 6487104, 'steps': 33786, 'loss/train': 1.5459463596343994} -11/07/2021 02:00:20 - INFO - __main__ - Step 33788: {'lr': 0.0004452170480540496, 'samples': 6487296, 'steps': 33787, 'loss/train': 1.036749243736267} -11/07/2021 02:00:20 - INFO - __main__ - Step 33789: {'lr': 0.0004452137329090622, 'samples': 6487488, 'steps': 33788, 'loss/train': 1.3245213031768799} -11/07/2021 02:00:20 - INFO - __main__ - Step 33790: {'lr': 0.0004452104176761146, 'samples': 6487680, 'steps': 33789, 'loss/train': 1.3617459535598755} -11/07/2021 02:00:21 - INFO - __main__ - Step 33791: {'lr': 0.0004452071023552081, 'samples': 6487872, 'steps': 33790, 'loss/train': 1.1394017934799194} -11/07/2021 02:00:22 - INFO - __main__ - Step 33792: {'lr': 0.0004452037869463443, 'samples': 6488064, 'steps': 33791, 'loss/train': 2.0320191383361816} -11/07/2021 02:00:22 - INFO - __main__ - Step 33793: {'lr': 0.0004452004714495248, 'samples': 6488256, 'steps': 33792, 'loss/train': 1.3852721452713013} -11/07/2021 02:00:22 - INFO - __main__ - Step 33794: {'lr': 0.00044519715586475083, 'samples': 6488448, 'steps': 33793, 'loss/train': 1.6966907978057861} -11/07/2021 02:00:23 - INFO - __main__ - Step 33795: {'lr': 0.0004451938401920241, 'samples': 6488640, 'steps': 33794, 'loss/train': 1.5629920959472656} -11/07/2021 02:00:24 - INFO - __main__ - Step 33796: {'lr': 0.0004451905244313461, 'samples': 6488832, 'steps': 33795, 'loss/train': 1.5933583974838257} -11/07/2021 02:00:24 - INFO - __main__ - Step 33797: {'lr': 0.0004451872085827182, 'samples': 6489024, 'steps': 33796, 'loss/train': 1.5892422199249268} -11/07/2021 02:00:24 - INFO - __main__ - Step 33798: {'lr': 0.000445183892646142, 'samples': 6489216, 'steps': 33797, 'loss/train': 1.499814748764038} -11/07/2021 02:00:25 - INFO - __main__ - Step 33799: {'lr': 0.0004451805766216189, 'samples': 6489408, 'steps': 33798, 'loss/train': 1.4643924236297607} -11/07/2021 02:00:25 - INFO - __main__ - Step 33800: {'lr': 0.00044517726050915044, 'samples': 6489600, 'steps': 33799, 'loss/train': 1.5761510133743286} -11/07/2021 02:00:26 - INFO - __main__ - Step 33801: {'lr': 0.0004451739443087381, 'samples': 6489792, 'steps': 33800, 'loss/train': 1.3621511459350586} -11/07/2021 02:00:26 - INFO - __main__ - Step 33802: {'lr': 0.0004451706280203834, 'samples': 6489984, 'steps': 33801, 'loss/train': 1.673937439918518} -11/07/2021 02:00:27 - INFO - __main__ - Step 33803: {'lr': 0.0004451673116440879, 'samples': 6490176, 'steps': 33802, 'loss/train': 1.839440107345581} -11/07/2021 02:00:27 - INFO - __main__ - Step 33804: {'lr': 0.00044516399517985296, 'samples': 6490368, 'steps': 33803, 'loss/train': 1.7208832502365112} -11/07/2021 02:00:28 - INFO - __main__ - Step 33805: {'lr': 0.00044516067862768015, 'samples': 6490560, 'steps': 33804, 'loss/train': 1.5042489767074585} -11/07/2021 02:00:29 - INFO - __main__ - Step 33806: {'lr': 0.00044515736198757095, 'samples': 6490752, 'steps': 33805, 'loss/train': 2.0620195865631104} -11/07/2021 02:00:29 - INFO - __main__ - Step 33807: {'lr': 0.0004451540452595268, 'samples': 6490944, 'steps': 33806, 'loss/train': 1.3464220762252808} -11/07/2021 02:00:29 - INFO - __main__ - Step 33808: {'lr': 0.0004451507284435494, 'samples': 6491136, 'steps': 33807, 'loss/train': 1.5946115255355835} -11/07/2021 02:00:30 - INFO - __main__ - Step 33809: {'lr': 0.00044514741153964, 'samples': 6491328, 'steps': 33808, 'loss/train': 1.6844371557235718} -11/07/2021 02:00:30 - INFO - __main__ - Step 33810: {'lr': 0.00044514409454780016, 'samples': 6491520, 'steps': 33809, 'loss/train': 1.2887932062149048} -11/07/2021 02:00:30 - INFO - __main__ - Step 33811: {'lr': 0.0004451407774680314, 'samples': 6491712, 'steps': 33810, 'loss/train': 1.2394468784332275} -11/07/2021 02:00:31 - INFO - __main__ - Step 33812: {'lr': 0.0004451374603003353, 'samples': 6491904, 'steps': 33811, 'loss/train': 1.0655345916748047} -11/07/2021 02:00:32 - INFO - __main__ - Step 33813: {'lr': 0.0004451341430447132, 'samples': 6492096, 'steps': 33812, 'loss/train': 1.8083118200302124} -11/07/2021 02:00:32 - INFO - __main__ - Step 33814: {'lr': 0.0004451308257011667, 'samples': 6492288, 'steps': 33813, 'loss/train': 1.1663693189620972} -11/07/2021 02:00:32 - INFO - __main__ - Step 33815: {'lr': 0.00044512750826969724, 'samples': 6492480, 'steps': 33814, 'loss/train': 1.7158915996551514} -11/07/2021 02:00:33 - INFO - __main__ - Step 33816: {'lr': 0.0004451241907503063, 'samples': 6492672, 'steps': 33815, 'loss/train': 1.364975094795227} -11/07/2021 02:00:34 - INFO - __main__ - Step 33817: {'lr': 0.0004451208731429954, 'samples': 6492864, 'steps': 33816, 'loss/train': 1.61083984375} -11/07/2021 02:00:34 - INFO - __main__ - Step 33818: {'lr': 0.00044511755544776615, 'samples': 6493056, 'steps': 33817, 'loss/train': 1.5559664964675903} -11/07/2021 02:00:34 - INFO - __main__ - Step 33819: {'lr': 0.0004451142376646199, 'samples': 6493248, 'steps': 33818, 'loss/train': 1.484433889389038} -11/07/2021 02:00:35 - INFO - __main__ - Step 33820: {'lr': 0.0004451109197935582, 'samples': 6493440, 'steps': 33819, 'loss/train': 1.8341032266616821} -11/07/2021 02:00:35 - INFO - __main__ - Step 33821: {'lr': 0.0004451076018345824, 'samples': 6493632, 'steps': 33820, 'loss/train': 1.5442001819610596} -11/07/2021 02:00:36 - INFO - __main__ - Step 33822: {'lr': 0.0004451042837876943, 'samples': 6493824, 'steps': 33821, 'loss/train': 1.7790117263793945} -11/07/2021 02:00:37 - INFO - __main__ - Step 33823: {'lr': 0.00044510096565289513, 'samples': 6494016, 'steps': 33822, 'loss/train': 1.7140729427337646} -11/07/2021 02:00:37 - INFO - __main__ - Step 33824: {'lr': 0.0004450976474301865, 'samples': 6494208, 'steps': 33823, 'loss/train': 1.504670262336731} -11/07/2021 02:00:37 - INFO - __main__ - Step 33825: {'lr': 0.0004450943291195698, 'samples': 6494400, 'steps': 33824, 'loss/train': 1.624586820602417} -11/07/2021 02:00:38 - INFO - __main__ - Step 33826: {'lr': 0.0004450910107210467, 'samples': 6494592, 'steps': 33825, 'loss/train': 1.1198339462280273} -11/07/2021 02:00:39 - INFO - __main__ - Step 33827: {'lr': 0.00044508769223461863, 'samples': 6494784, 'steps': 33826, 'loss/train': 2.0186984539031982} -11/07/2021 02:00:39 - INFO - __main__ - Step 33828: {'lr': 0.00044508437366028695, 'samples': 6494976, 'steps': 33827, 'loss/train': 1.7827537059783936} -11/07/2021 02:00:39 - INFO - __main__ - Step 33829: {'lr': 0.00044508105499805337, 'samples': 6495168, 'steps': 33828, 'loss/train': 1.2118760347366333} -11/07/2021 02:00:40 - INFO - __main__ - Step 33830: {'lr': 0.0004450777362479192, 'samples': 6495360, 'steps': 33829, 'loss/train': 1.4964271783828735} -11/07/2021 02:00:40 - INFO - __main__ - Step 33831: {'lr': 0.000445074417409886, 'samples': 6495552, 'steps': 33830, 'loss/train': 1.4948548078536987} -11/07/2021 02:00:40 - INFO - __main__ - Step 33832: {'lr': 0.0004450710984839553, 'samples': 6495744, 'steps': 33831, 'loss/train': 1.772908329963684} -11/07/2021 02:00:41 - INFO - __main__ - Step 33833: {'lr': 0.00044506777947012863, 'samples': 6495936, 'steps': 33832, 'loss/train': 2.1931819915771484} -11/07/2021 02:00:42 - INFO - __main__ - Step 33834: {'lr': 0.0004450644603684074, 'samples': 6496128, 'steps': 33833, 'loss/train': 1.6842870712280273} -11/07/2021 02:00:42 - INFO - __main__ - Step 33835: {'lr': 0.0004450611411787931, 'samples': 6496320, 'steps': 33834, 'loss/train': 1.9571033716201782} -11/07/2021 02:00:42 - INFO - __main__ - Step 33836: {'lr': 0.0004450578219012873, 'samples': 6496512, 'steps': 33835, 'loss/train': 1.7628679275512695} -11/07/2021 02:00:43 - INFO - __main__ - Step 33837: {'lr': 0.00044505450253589144, 'samples': 6496704, 'steps': 33836, 'loss/train': 1.7430778741836548} -11/07/2021 02:00:44 - INFO - __main__ - Step 33838: {'lr': 0.00044505118308260693, 'samples': 6496896, 'steps': 33837, 'loss/train': 1.683057427406311} -11/07/2021 02:00:44 - INFO - __main__ - Step 33839: {'lr': 0.0004450478635414355, 'samples': 6497088, 'steps': 33838, 'loss/train': 1.1430109739303589} -11/07/2021 02:00:45 - INFO - __main__ - Step 33840: {'lr': 0.0004450445439123785, 'samples': 6497280, 'steps': 33839, 'loss/train': 1.5153329372406006} -11/07/2021 02:00:45 - INFO - __main__ - Step 33841: {'lr': 0.0004450412241954374, 'samples': 6497472, 'steps': 33840, 'loss/train': 1.6892775297164917} -11/07/2021 02:00:45 - INFO - __main__ - Step 33842: {'lr': 0.00044503790439061374, 'samples': 6497664, 'steps': 33841, 'loss/train': 1.6585344076156616} -11/07/2021 02:00:46 - INFO - __main__ - Step 33843: {'lr': 0.000445034584497909, 'samples': 6497856, 'steps': 33842, 'loss/train': 1.845517635345459} -11/07/2021 02:00:47 - INFO - __main__ - Step 33844: {'lr': 0.00044503126451732474, 'samples': 6498048, 'steps': 33843, 'loss/train': 1.7846750020980835} -11/07/2021 02:00:47 - INFO - __main__ - Step 33845: {'lr': 0.00044502794444886234, 'samples': 6498240, 'steps': 33844, 'loss/train': 1.4909343719482422} -11/07/2021 02:00:47 - INFO - __main__ - Step 33846: {'lr': 0.00044502462429252336, 'samples': 6498432, 'steps': 33845, 'loss/train': 1.6039619445800781} -11/07/2021 02:00:48 - INFO - __main__ - Step 33847: {'lr': 0.0004450213040483093, 'samples': 6498624, 'steps': 33846, 'loss/train': 1.3290834426879883} -11/07/2021 02:00:49 - INFO - __main__ - Step 33848: {'lr': 0.00044501798371622173, 'samples': 6498816, 'steps': 33847, 'loss/train': 1.3662832975387573} -11/07/2021 02:00:49 - INFO - __main__ - Step 33849: {'lr': 0.00044501466329626197, 'samples': 6499008, 'steps': 33848, 'loss/train': 1.15182363986969} -11/07/2021 02:00:49 - INFO - __main__ - Step 33850: {'lr': 0.0004450113427884317, 'samples': 6499200, 'steps': 33849, 'loss/train': 2.1332545280456543} -11/07/2021 02:00:50 - INFO - __main__ - Step 33851: {'lr': 0.00044500802219273224, 'samples': 6499392, 'steps': 33850, 'loss/train': 1.3523143529891968} -11/07/2021 02:00:50 - INFO - __main__ - Step 33852: {'lr': 0.00044500470150916514, 'samples': 6499584, 'steps': 33851, 'loss/train': 1.659804344177246} -11/07/2021 02:00:51 - INFO - __main__ - Step 33853: {'lr': 0.000445001380737732, 'samples': 6499776, 'steps': 33852, 'loss/train': 1.4241199493408203} -11/07/2021 02:00:52 - INFO - __main__ - Step 33854: {'lr': 0.0004449980598784343, 'samples': 6499968, 'steps': 33853, 'loss/train': 1.4666374921798706} -11/07/2021 02:00:52 - INFO - __main__ - Step 33855: {'lr': 0.0004449947389312734, 'samples': 6500160, 'steps': 33854, 'loss/train': 1.3092784881591797} -11/07/2021 02:00:53 - INFO - __main__ - Step 33856: {'lr': 0.00044499141789625086, 'samples': 6500352, 'steps': 33855, 'loss/train': 1.5748056173324585} -11/07/2021 02:00:53 - INFO - __main__ - Step 33857: {'lr': 0.0004449880967733683, 'samples': 6500544, 'steps': 33856, 'loss/train': 0.20113760232925415} -11/07/2021 02:00:54 - INFO - __main__ - Step 33858: {'lr': 0.0004449847755626271, 'samples': 6500736, 'steps': 33857, 'loss/train': 1.6535253524780273} -11/07/2021 02:00:55 - INFO - __main__ - Step 33859: {'lr': 0.0004449814542640287, 'samples': 6500928, 'steps': 33858, 'loss/train': 1.9745224714279175} -11/07/2021 02:00:55 - INFO - __main__ - Step 33860: {'lr': 0.0004449781328775746, 'samples': 6501120, 'steps': 33859, 'loss/train': 1.4337353706359863} -11/07/2021 02:00:55 - INFO - __main__ - Step 33861: {'lr': 0.0004449748114032665, 'samples': 6501312, 'steps': 33860, 'loss/train': 1.499574899673462} -11/07/2021 02:00:56 - INFO - __main__ - Step 33862: {'lr': 0.00044497148984110567, 'samples': 6501504, 'steps': 33861, 'loss/train': 1.399930715560913} -11/07/2021 02:00:56 - INFO - __main__ - Step 33863: {'lr': 0.00044496816819109377, 'samples': 6501696, 'steps': 33862, 'loss/train': 1.5060970783233643} -11/07/2021 02:00:56 - INFO - __main__ - Step 33864: {'lr': 0.0004449648464532322, 'samples': 6501888, 'steps': 33863, 'loss/train': 1.3464213609695435} -11/07/2021 02:00:57 - INFO - __main__ - Step 33865: {'lr': 0.0004449615246275225, 'samples': 6502080, 'steps': 33864, 'loss/train': 1.3262618780136108} -11/07/2021 02:00:58 - INFO - __main__ - Step 33866: {'lr': 0.000444958202713966, 'samples': 6502272, 'steps': 33865, 'loss/train': 1.3003273010253906} -11/07/2021 02:00:58 - INFO - __main__ - Step 33867: {'lr': 0.0004449548807125645, 'samples': 6502464, 'steps': 33866, 'loss/train': 1.1961196660995483} -11/07/2021 02:00:59 - INFO - __main__ - Step 33868: {'lr': 0.0004449515586233193, 'samples': 6502656, 'steps': 33867, 'loss/train': 0.7612836956977844} -11/07/2021 02:00:59 - INFO - __main__ - Step 33869: {'lr': 0.0004449482364462319, 'samples': 6502848, 'steps': 33868, 'loss/train': 1.5784677267074585} -11/07/2021 02:01:00 - INFO - __main__ - Step 33870: {'lr': 0.0004449449141813039, 'samples': 6503040, 'steps': 33869, 'loss/train': 1.3834257125854492} -11/07/2021 02:01:00 - INFO - __main__ - Step 33871: {'lr': 0.00044494159182853667, 'samples': 6503232, 'steps': 33870, 'loss/train': 1.4731563329696655} -11/07/2021 02:01:01 - INFO - __main__ - Step 33872: {'lr': 0.0004449382693879318, 'samples': 6503424, 'steps': 33871, 'loss/train': 1.233699083328247} -11/07/2021 02:01:01 - INFO - __main__ - Step 33873: {'lr': 0.0004449349468594908, 'samples': 6503616, 'steps': 33872, 'loss/train': 1.6775755882263184} -11/07/2021 02:01:01 - INFO - __main__ - Step 33874: {'lr': 0.000444931624243215, 'samples': 6503808, 'steps': 33873, 'loss/train': 1.4026579856872559} -11/07/2021 02:01:02 - INFO - __main__ - Step 33875: {'lr': 0.0004449283015391061, 'samples': 6504000, 'steps': 33874, 'loss/train': 1.7538774013519287} -11/07/2021 02:01:03 - INFO - __main__ - Step 33876: {'lr': 0.0004449249787471655, 'samples': 6504192, 'steps': 33875, 'loss/train': 1.0890296697616577} -11/07/2021 02:01:03 - INFO - __main__ - Step 33877: {'lr': 0.0004449216558673947, 'samples': 6504384, 'steps': 33876, 'loss/train': 1.704645037651062} -11/07/2021 02:01:03 - INFO - __main__ - Step 33878: {'lr': 0.0004449183328997952, 'samples': 6504576, 'steps': 33877, 'loss/train': 1.4584956169128418} -11/07/2021 02:01:04 - INFO - __main__ - Step 33879: {'lr': 0.0004449150098443685, 'samples': 6504768, 'steps': 33878, 'loss/train': 1.571358323097229} -11/07/2021 02:01:05 - INFO - __main__ - Step 33880: {'lr': 0.00044491168670111615, 'samples': 6504960, 'steps': 33879, 'loss/train': 1.1301995515823364} -11/07/2021 02:01:05 - INFO - __main__ - Step 33881: {'lr': 0.0004449083634700396, 'samples': 6505152, 'steps': 33880, 'loss/train': 1.473876714706421} -11/07/2021 02:01:05 - INFO - __main__ - Step 33882: {'lr': 0.00044490504015114033, 'samples': 6505344, 'steps': 33881, 'loss/train': 1.712478518486023} -11/07/2021 02:01:06 - INFO - __main__ - Step 33883: {'lr': 0.0004449017167444198, 'samples': 6505536, 'steps': 33882, 'loss/train': 1.813271164894104} -11/07/2021 02:01:06 - INFO - __main__ - Step 33884: {'lr': 0.0004448983932498797, 'samples': 6505728, 'steps': 33883, 'loss/train': 1.7393323183059692} -11/07/2021 02:01:06 - INFO - __main__ - Step 33885: {'lr': 0.00044489506966752127, 'samples': 6505920, 'steps': 33884, 'loss/train': 1.731095552444458} -11/07/2021 02:01:08 - INFO - __main__ - Step 33886: {'lr': 0.00044489174599734614, 'samples': 6506112, 'steps': 33885, 'loss/train': 1.4670522212982178} -11/07/2021 02:01:08 - INFO - __main__ - Step 33887: {'lr': 0.0004448884222393559, 'samples': 6506304, 'steps': 33886, 'loss/train': 1.4478570222854614} -11/07/2021 02:01:08 - INFO - __main__ - Step 33888: {'lr': 0.00044488509839355183, 'samples': 6506496, 'steps': 33887, 'loss/train': 1.1947063207626343} -11/07/2021 02:01:09 - INFO - __main__ - Step 33889: {'lr': 0.00044488177445993563, 'samples': 6506688, 'steps': 33888, 'loss/train': 1.2288641929626465} -11/07/2021 02:01:09 - INFO - __main__ - Step 33890: {'lr': 0.0004448784504385086, 'samples': 6506880, 'steps': 33889, 'loss/train': 1.3459579944610596} -11/07/2021 02:01:10 - INFO - __main__ - Step 33891: {'lr': 0.0004448751263292724, 'samples': 6507072, 'steps': 33890, 'loss/train': 1.4274922609329224} -11/07/2021 02:01:11 - INFO - __main__ - Step 33892: {'lr': 0.0004448718021322285, 'samples': 6507264, 'steps': 33891, 'loss/train': 1.4666961431503296} -11/07/2021 02:01:11 - INFO - __main__ - Step 33893: {'lr': 0.0004448684778473784, 'samples': 6507456, 'steps': 33892, 'loss/train': 1.6061058044433594} -11/07/2021 02:01:11 - INFO - __main__ - Step 33894: {'lr': 0.0004448651534747235, 'samples': 6507648, 'steps': 33893, 'loss/train': 1.383569359779358} -11/07/2021 02:01:12 - INFO - __main__ - Step 33895: {'lr': 0.0004448618290142654, 'samples': 6507840, 'steps': 33894, 'loss/train': 1.421039342880249} -11/07/2021 02:01:13 - INFO - __main__ - Step 33896: {'lr': 0.0004448585044660055, 'samples': 6508032, 'steps': 33895, 'loss/train': 0.20409615337848663} -11/07/2021 02:01:13 - INFO - __main__ - Step 33897: {'lr': 0.0004448551798299455, 'samples': 6508224, 'steps': 33896, 'loss/train': 1.7236816883087158} -11/07/2021 02:01:13 - INFO - __main__ - Step 33898: {'lr': 0.00044485185510608665, 'samples': 6508416, 'steps': 33897, 'loss/train': 1.4264075756072998} -11/07/2021 02:01:14 - INFO - __main__ - Step 33899: {'lr': 0.0004448485302944306, 'samples': 6508608, 'steps': 33898, 'loss/train': 1.5501539707183838} -11/07/2021 02:01:14 - INFO - __main__ - Step 33900: {'lr': 0.0004448452053949789, 'samples': 6508800, 'steps': 33899, 'loss/train': 1.3028892278671265} -11/07/2021 02:01:14 - INFO - __main__ - Step 33901: {'lr': 0.0004448418804077328, 'samples': 6508992, 'steps': 33900, 'loss/train': 1.5605762004852295} -11/07/2021 02:01:16 - INFO - __main__ - Step 33902: {'lr': 0.000444838555332694, 'samples': 6509184, 'steps': 33901, 'loss/train': 1.3784602880477905} -11/07/2021 02:01:16 - INFO - __main__ - Step 33903: {'lr': 0.000444835230169864, 'samples': 6509376, 'steps': 33902, 'loss/train': 2.122793674468994} -11/07/2021 02:01:16 - INFO - __main__ - Step 33904: {'lr': 0.00044483190491924427, 'samples': 6509568, 'steps': 33903, 'loss/train': 1.8116071224212646} -11/07/2021 02:01:17 - INFO - __main__ - Step 33905: {'lr': 0.0004448285795808362, 'samples': 6509760, 'steps': 33904, 'loss/train': 1.4722168445587158} -11/07/2021 02:01:17 - INFO - __main__ - Step 33906: {'lr': 0.00044482525415464144, 'samples': 6509952, 'steps': 33905, 'loss/train': 1.5740023851394653} -11/07/2021 02:01:18 - INFO - __main__ - Step 33907: {'lr': 0.0004448219286406614, 'samples': 6510144, 'steps': 33906, 'loss/train': 1.7123525142669678} -11/07/2021 02:01:18 - INFO - __main__ - Step 33908: {'lr': 0.00044481860303889766, 'samples': 6510336, 'steps': 33907, 'loss/train': 1.1449620723724365} -11/07/2021 02:01:19 - INFO - __main__ - Step 33909: {'lr': 0.0004448152773493516, 'samples': 6510528, 'steps': 33908, 'loss/train': 1.907379150390625} -11/07/2021 02:01:19 - INFO - __main__ - Step 33910: {'lr': 0.0004448119515720248, 'samples': 6510720, 'steps': 33909, 'loss/train': 1.6828466653823853} -11/07/2021 02:01:19 - INFO - __main__ - Step 33911: {'lr': 0.0004448086257069187, 'samples': 6510912, 'steps': 33910, 'loss/train': 1.4255051612854004} -11/07/2021 02:01:20 - INFO - __main__ - Step 33912: {'lr': 0.00044480529975403496, 'samples': 6511104, 'steps': 33911, 'loss/train': 1.3303273916244507} -11/07/2021 02:01:21 - INFO - __main__ - Step 33913: {'lr': 0.00044480197371337484, 'samples': 6511296, 'steps': 33912, 'loss/train': 0.7251231670379639} -11/07/2021 02:01:21 - INFO - __main__ - Step 33914: {'lr': 0.00044479864758494004, 'samples': 6511488, 'steps': 33913, 'loss/train': 1.377323865890503} -11/07/2021 02:01:22 - INFO - __main__ - Step 33915: {'lr': 0.0004447953213687319, 'samples': 6511680, 'steps': 33914, 'loss/train': 1.4334322214126587} -11/07/2021 02:01:22 - INFO - __main__ - Step 33916: {'lr': 0.00044479199506475205, 'samples': 6511872, 'steps': 33915, 'loss/train': 1.859991192817688} -11/07/2021 02:01:23 - INFO - __main__ - Step 33917: {'lr': 0.0004447886686730019, 'samples': 6512064, 'steps': 33916, 'loss/train': 1.1730103492736816} -11/07/2021 02:01:23 - INFO - __main__ - Step 33918: {'lr': 0.00044478534219348297, 'samples': 6512256, 'steps': 33917, 'loss/train': 1.6439616680145264} -11/07/2021 02:01:24 - INFO - __main__ - Step 33919: {'lr': 0.0004447820156261968, 'samples': 6512448, 'steps': 33918, 'loss/train': 1.3017641305923462} -11/07/2021 02:01:24 - INFO - __main__ - Step 33920: {'lr': 0.0004447786889711449, 'samples': 6512640, 'steps': 33919, 'loss/train': 1.3927388191223145} -11/07/2021 02:01:24 - INFO - __main__ - Step 33921: {'lr': 0.00044477536222832867, 'samples': 6512832, 'steps': 33920, 'loss/train': 1.7710654735565186} -11/07/2021 02:01:25 - INFO - __main__ - Step 33922: {'lr': 0.0004447720353977497, 'samples': 6513024, 'steps': 33921, 'loss/train': 1.3544845581054688} -11/07/2021 02:01:26 - INFO - __main__ - Step 33923: {'lr': 0.0004447687084794094, 'samples': 6513216, 'steps': 33922, 'loss/train': 1.0227186679840088} -11/07/2021 02:01:26 - INFO - __main__ - Step 33924: {'lr': 0.00044476538147330934, 'samples': 6513408, 'steps': 33923, 'loss/train': 7.762441635131836} -11/07/2021 02:01:27 - INFO - __main__ - Step 33925: {'lr': 0.00044476205437945105, 'samples': 6513600, 'steps': 33924, 'loss/train': 1.4574618339538574} -11/07/2021 02:01:27 - INFO - __main__ - Step 33926: {'lr': 0.0004447587271978359, 'samples': 6513792, 'steps': 33925, 'loss/train': 3.2924323081970215} -11/07/2021 02:01:27 - INFO - __main__ - Step 33927: {'lr': 0.0004447553999284656, 'samples': 6513984, 'steps': 33926, 'loss/train': 5.801220417022705} -11/07/2021 02:01:28 - INFO - __main__ - Step 33928: {'lr': 0.00044475207257134143, 'samples': 6514176, 'steps': 33927, 'loss/train': 1.7115229368209839} -11/07/2021 02:01:29 - INFO - __main__ - Step 33929: {'lr': 0.000444748745126465, 'samples': 6514368, 'steps': 33928, 'loss/train': 1.2595962285995483} -11/07/2021 02:01:29 - INFO - __main__ - Step 33930: {'lr': 0.0004447454175938378, 'samples': 6514560, 'steps': 33929, 'loss/train': 1.2194738388061523} -11/07/2021 02:01:29 - INFO - __main__ - Step 33931: {'lr': 0.00044474208997346133, 'samples': 6514752, 'steps': 33930, 'loss/train': 1.2058517932891846} -11/07/2021 02:01:30 - INFO - __main__ - Step 33932: {'lr': 0.00044473876226533703, 'samples': 6514944, 'steps': 33931, 'loss/train': 1.2794572114944458} -11/07/2021 02:01:30 - INFO - __main__ - Step 33933: {'lr': 0.0004447354344694665, 'samples': 6515136, 'steps': 33932, 'loss/train': 1.6853723526000977} -11/07/2021 02:01:31 - INFO - __main__ - Step 33934: {'lr': 0.0004447321065858512, 'samples': 6515328, 'steps': 33933, 'loss/train': 1.336300253868103} -11/07/2021 02:01:31 - INFO - __main__ - Step 33935: {'lr': 0.00044472877861449257, 'samples': 6515520, 'steps': 33934, 'loss/train': 1.6641114950180054} -11/07/2021 02:01:32 - INFO - __main__ - Step 33936: {'lr': 0.00044472545055539213, 'samples': 6515712, 'steps': 33935, 'loss/train': 1.3842114210128784} -11/07/2021 02:01:32 - INFO - __main__ - Step 33937: {'lr': 0.00044472212240855155, 'samples': 6515904, 'steps': 33936, 'loss/train': 1.6173049211502075} -11/07/2021 02:01:33 - INFO - __main__ - Step 33938: {'lr': 0.0004447187941739721, 'samples': 6516096, 'steps': 33937, 'loss/train': 1.6227734088897705} -11/07/2021 02:01:34 - INFO - __main__ - Step 33939: {'lr': 0.00044471546585165536, 'samples': 6516288, 'steps': 33938, 'loss/train': 1.2357654571533203} -11/07/2021 02:01:34 - INFO - __main__ - Step 33940: {'lr': 0.0004447121374416028, 'samples': 6516480, 'steps': 33939, 'loss/train': 1.5931684970855713} -11/07/2021 02:01:34 - INFO - __main__ - Step 33941: {'lr': 0.000444708808943816, 'samples': 6516672, 'steps': 33940, 'loss/train': 1.5928783416748047} -11/07/2021 02:01:35 - INFO - __main__ - Step 33942: {'lr': 0.00044470548035829637, 'samples': 6516864, 'steps': 33941, 'loss/train': 1.4349801540374756} -11/07/2021 02:01:35 - INFO - __main__ - Step 33943: {'lr': 0.00044470215168504554, 'samples': 6517056, 'steps': 33942, 'loss/train': 1.7674825191497803} -11/07/2021 02:01:36 - INFO - __main__ - Step 33944: {'lr': 0.0004446988229240648, 'samples': 6517248, 'steps': 33943, 'loss/train': 1.7986441850662231} -11/07/2021 02:01:36 - INFO - __main__ - Step 33945: {'lr': 0.00044469549407535593, 'samples': 6517440, 'steps': 33944, 'loss/train': 1.3439016342163086} -11/07/2021 02:01:37 - INFO - __main__ - Step 33946: {'lr': 0.0004446921651389202, 'samples': 6517632, 'steps': 33945, 'loss/train': 1.4017547369003296} -11/07/2021 02:01:37 - INFO - __main__ - Step 33947: {'lr': 0.00044468883611475913, 'samples': 6517824, 'steps': 33946, 'loss/train': 1.85745370388031} -11/07/2021 02:01:37 - INFO - __main__ - Step 33948: {'lr': 0.00044468550700287436, 'samples': 6518016, 'steps': 33947, 'loss/train': 0.9758426547050476} -11/07/2021 02:01:38 - INFO - __main__ - Step 33949: {'lr': 0.00044468217780326724, 'samples': 6518208, 'steps': 33948, 'loss/train': 1.5032635927200317} -11/07/2021 02:01:39 - INFO - __main__ - Step 33950: {'lr': 0.0004446788485159393, 'samples': 6518400, 'steps': 33949, 'loss/train': 1.3904517889022827} -11/07/2021 02:01:39 - INFO - __main__ - Step 33951: {'lr': 0.00044467551914089223, 'samples': 6518592, 'steps': 33950, 'loss/train': 2.2070465087890625} -11/07/2021 02:01:39 - INFO - __main__ - Step 33952: {'lr': 0.0004446721896781273, 'samples': 6518784, 'steps': 33951, 'loss/train': 1.8837158679962158} -11/07/2021 02:01:40 - INFO - __main__ - Step 33953: {'lr': 0.00044466886012764603, 'samples': 6518976, 'steps': 33952, 'loss/train': 1.2247635126113892} -11/07/2021 02:01:41 - INFO - __main__ - Step 33954: {'lr': 0.00044466553048944996, 'samples': 6519168, 'steps': 33953, 'loss/train': 1.437774419784546} -11/07/2021 02:01:41 - INFO - __main__ - Step 33955: {'lr': 0.0004446622007635407, 'samples': 6519360, 'steps': 33954, 'loss/train': 1.6104636192321777} -11/07/2021 02:01:42 - INFO - __main__ - Step 33956: {'lr': 0.0004446588709499196, 'samples': 6519552, 'steps': 33955, 'loss/train': 1.6318778991699219} -11/07/2021 02:01:42 - INFO - __main__ - Step 33957: {'lr': 0.00044465554104858817, 'samples': 6519744, 'steps': 33956, 'loss/train': 1.220327377319336} -11/07/2021 02:01:42 - INFO - __main__ - Step 33958: {'lr': 0.0004446522110595481, 'samples': 6519936, 'steps': 33957, 'loss/train': 1.54439377784729} -11/07/2021 02:01:43 - INFO - __main__ - Step 33959: {'lr': 0.00044464888098280067, 'samples': 6520128, 'steps': 33958, 'loss/train': 1.7272281646728516} -11/07/2021 02:01:44 - INFO - __main__ - Step 33960: {'lr': 0.00044464555081834745, 'samples': 6520320, 'steps': 33959, 'loss/train': 1.3974066972732544} -11/07/2021 02:01:44 - INFO - __main__ - Step 33961: {'lr': 0.00044464222056618996, 'samples': 6520512, 'steps': 33960, 'loss/train': 1.8621840476989746} -11/07/2021 02:01:44 - INFO - __main__ - Step 33962: {'lr': 0.00044463889022632963, 'samples': 6520704, 'steps': 33961, 'loss/train': 1.528019666671753} -11/07/2021 02:01:45 - INFO - __main__ - Step 33963: {'lr': 0.0004446355597987681, 'samples': 6520896, 'steps': 33962, 'loss/train': 1.360838770866394} -11/07/2021 02:01:46 - INFO - __main__ - Step 33964: {'lr': 0.00044463222928350677, 'samples': 6521088, 'steps': 33963, 'loss/train': 1.8312397003173828} -11/07/2021 02:01:46 - INFO - __main__ - Step 33965: {'lr': 0.0004446288986805471, 'samples': 6521280, 'steps': 33964, 'loss/train': 1.583130955696106} -11/07/2021 02:01:46 - INFO - __main__ - Step 33966: {'lr': 0.0004446255679898907, 'samples': 6521472, 'steps': 33965, 'loss/train': 1.6411830186843872} -11/07/2021 02:01:47 - INFO - __main__ - Step 33967: {'lr': 0.000444622237211539, 'samples': 6521664, 'steps': 33966, 'loss/train': 1.4181243181228638} -11/07/2021 02:01:47 - INFO - __main__ - Step 33968: {'lr': 0.00044461890634549364, 'samples': 6521856, 'steps': 33967, 'loss/train': 1.8298888206481934} -11/07/2021 02:01:49 - INFO - __main__ - Step 33969: {'lr': 0.00044461557539175587, 'samples': 6522048, 'steps': 33968, 'loss/train': 1.7349551916122437} -11/07/2021 02:01:49 - INFO - __main__ - Step 33970: {'lr': 0.0004446122443503274, 'samples': 6522240, 'steps': 33969, 'loss/train': 1.7679076194763184} -11/07/2021 02:01:49 - INFO - __main__ - Step 33971: {'lr': 0.00044460891322120963, 'samples': 6522432, 'steps': 33970, 'loss/train': 1.5789631605148315} -11/07/2021 02:01:50 - INFO - __main__ - Step 33972: {'lr': 0.000444605582004404, 'samples': 6522624, 'steps': 33971, 'loss/train': 0.24429169297218323} -11/07/2021 02:01:50 - INFO - __main__ - Step 33973: {'lr': 0.0004446022506999122, 'samples': 6522816, 'steps': 33972, 'loss/train': 1.216179370880127} -11/07/2021 02:01:51 - INFO - __main__ - Step 33974: {'lr': 0.0004445989193077356, 'samples': 6523008, 'steps': 33973, 'loss/train': 1.6011016368865967} -11/07/2021 02:01:51 - INFO - __main__ - Step 33975: {'lr': 0.0004445955878278758, 'samples': 6523200, 'steps': 33974, 'loss/train': 2.066823720932007} -11/07/2021 02:01:52 - INFO - __main__ - Step 33976: {'lr': 0.00044459225626033413, 'samples': 6523392, 'steps': 33975, 'loss/train': 1.8326551914215088} -11/07/2021 02:01:52 - INFO - __main__ - Step 33977: {'lr': 0.00044458892460511225, 'samples': 6523584, 'steps': 33976, 'loss/train': 1.4237685203552246} -11/07/2021 02:01:52 - INFO - __main__ - Step 33978: {'lr': 0.0004445855928622116, 'samples': 6523776, 'steps': 33977, 'loss/train': 1.754783272743225} -11/07/2021 02:01:53 - INFO - __main__ - Step 33979: {'lr': 0.00044458226103163365, 'samples': 6523968, 'steps': 33978, 'loss/train': 1.2844159603118896} -11/07/2021 02:01:54 - INFO - __main__ - Step 33980: {'lr': 0.0004445789291133799, 'samples': 6524160, 'steps': 33979, 'loss/train': 1.2192468643188477} -11/07/2021 02:01:54 - INFO - __main__ - Step 33981: {'lr': 0.0004445755971074519, 'samples': 6524352, 'steps': 33980, 'loss/train': 1.436919093132019} -11/07/2021 02:01:54 - INFO - __main__ - Step 33982: {'lr': 0.0004445722650138512, 'samples': 6524544, 'steps': 33981, 'loss/train': 1.6285544633865356} -11/07/2021 02:01:55 - INFO - __main__ - Step 33983: {'lr': 0.00044456893283257925, 'samples': 6524736, 'steps': 33982, 'loss/train': 1.518558144569397} -11/07/2021 02:01:55 - INFO - __main__ - Step 33984: {'lr': 0.00044456560056363746, 'samples': 6524928, 'steps': 33983, 'loss/train': 1.6287636756896973} -11/07/2021 02:01:56 - INFO - __main__ - Step 33985: {'lr': 0.0004445622682070275, 'samples': 6525120, 'steps': 33984, 'loss/train': 1.4861018657684326} -11/07/2021 02:01:56 - INFO - __main__ - Step 33986: {'lr': 0.00044455893576275077, 'samples': 6525312, 'steps': 33985, 'loss/train': 1.591300129890442} -11/07/2021 02:01:57 - INFO - __main__ - Step 33987: {'lr': 0.00044455560323080874, 'samples': 6525504, 'steps': 33986, 'loss/train': 1.9785436391830444} -11/07/2021 02:01:57 - INFO - __main__ - Step 33988: {'lr': 0.00044455227061120296, 'samples': 6525696, 'steps': 33987, 'loss/train': 1.6648945808410645} -11/07/2021 02:01:57 - INFO - __main__ - Step 33989: {'lr': 0.000444548937903935, 'samples': 6525888, 'steps': 33988, 'loss/train': 1.4953155517578125} -11/07/2021 02:01:58 - INFO - __main__ - Step 33990: {'lr': 0.0004445456051090062, 'samples': 6526080, 'steps': 33989, 'loss/train': 1.3475840091705322} -11/07/2021 02:01:59 - INFO - __main__ - Step 33991: {'lr': 0.0004445422722264182, 'samples': 6526272, 'steps': 33990, 'loss/train': 1.6253974437713623} -11/07/2021 02:01:59 - INFO - __main__ - Step 33992: {'lr': 0.0004445389392561724, 'samples': 6526464, 'steps': 33991, 'loss/train': 1.6526176929473877} -11/07/2021 02:01:59 - INFO - __main__ - Step 33993: {'lr': 0.0004445356061982704, 'samples': 6526656, 'steps': 33992, 'loss/train': 1.5785486698150635} -11/07/2021 02:02:00 - INFO - __main__ - Step 33994: {'lr': 0.0004445322730527137, 'samples': 6526848, 'steps': 33993, 'loss/train': 1.6258047819137573} -11/07/2021 02:02:01 - INFO - __main__ - Step 33995: {'lr': 0.0004445289398195037, 'samples': 6527040, 'steps': 33994, 'loss/train': 1.8948335647583008} -11/07/2021 02:02:01 - INFO - __main__ - Step 33996: {'lr': 0.000444525606498642, 'samples': 6527232, 'steps': 33995, 'loss/train': 1.3909330368041992} -11/07/2021 02:02:02 - INFO - __main__ - Step 33997: {'lr': 0.00044452227309013003, 'samples': 6527424, 'steps': 33996, 'loss/train': 1.4994609355926514} -11/07/2021 02:02:02 - INFO - __main__ - Step 33998: {'lr': 0.0004445189395939694, 'samples': 6527616, 'steps': 33997, 'loss/train': 1.4667303562164307} -11/07/2021 02:02:02 - INFO - __main__ - Step 33999: {'lr': 0.0004445156060101614, 'samples': 6527808, 'steps': 33998, 'loss/train': 1.8702677488327026} -11/07/2021 02:02:03 - INFO - __main__ - Step 34000: {'lr': 0.0004445122723387077, 'samples': 6528000, 'steps': 33999, 'loss/train': 1.4197800159454346} -11/07/2021 02:02:04 - INFO - __main__ - Step 34001: {'lr': 0.0004445089385796099, 'samples': 6528192, 'steps': 34000, 'loss/train': 1.6524118185043335} -11/07/2021 02:02:04 - INFO - __main__ - Step 34002: {'lr': 0.0004445056047328693, 'samples': 6528384, 'steps': 34001, 'loss/train': 1.7949652671813965} -11/07/2021 02:02:05 - INFO - __main__ - Step 34003: {'lr': 0.0004445022707984874, 'samples': 6528576, 'steps': 34002, 'loss/train': 0.221288800239563} -11/07/2021 02:02:05 - INFO - __main__ - Step 34004: {'lr': 0.0004444989367764659, 'samples': 6528768, 'steps': 34003, 'loss/train': 1.1219404935836792} -11/07/2021 02:02:06 - INFO - __main__ - Step 34005: {'lr': 0.0004444956026668061, 'samples': 6528960, 'steps': 34004, 'loss/train': 1.2909691333770752} -11/07/2021 02:02:07 - INFO - __main__ - Step 34006: {'lr': 0.00044449226846950964, 'samples': 6529152, 'steps': 34005, 'loss/train': 0.9231574535369873} -11/07/2021 02:02:07 - INFO - __main__ - Step 34007: {'lr': 0.00044448893418457794, 'samples': 6529344, 'steps': 34006, 'loss/train': 2.1114120483398438} -11/07/2021 02:02:07 - INFO - __main__ - Step 34008: {'lr': 0.00044448559981201256, 'samples': 6529536, 'steps': 34007, 'loss/train': 1.8139729499816895} -11/07/2021 02:02:08 - INFO - __main__ - Step 34009: {'lr': 0.00044448226535181485, 'samples': 6529728, 'steps': 34008, 'loss/train': 1.598117470741272} -11/07/2021 02:02:08 - INFO - __main__ - Step 34010: {'lr': 0.0004444789308039865, 'samples': 6529920, 'steps': 34009, 'loss/train': 2.2077717781066895} -11/07/2021 02:02:09 - INFO - __main__ - Step 34011: {'lr': 0.00044447559616852893, 'samples': 6530112, 'steps': 34010, 'loss/train': 1.6955511569976807} -11/07/2021 02:02:09 - INFO - __main__ - Step 34012: {'lr': 0.0004444722614454437, 'samples': 6530304, 'steps': 34011, 'loss/train': 1.916416049003601} -11/07/2021 02:02:10 - INFO - __main__ - Step 34013: {'lr': 0.00044446892663473227, 'samples': 6530496, 'steps': 34012, 'loss/train': 1.7840545177459717} -11/07/2021 02:02:10 - INFO - __main__ - Step 34014: {'lr': 0.0004444655917363961, 'samples': 6530688, 'steps': 34013, 'loss/train': 1.3438079357147217} -11/07/2021 02:02:10 - INFO - __main__ - Step 34015: {'lr': 0.00044446225675043684, 'samples': 6530880, 'steps': 34014, 'loss/train': 2.495532751083374} -11/07/2021 02:02:11 - INFO - __main__ - Step 34016: {'lr': 0.0004444589216768558, 'samples': 6531072, 'steps': 34015, 'loss/train': 1.3623573780059814} -11/07/2021 02:02:12 - INFO - __main__ - Step 34017: {'lr': 0.0004444555865156545, 'samples': 6531264, 'steps': 34016, 'loss/train': 1.2433745861053467} -11/07/2021 02:02:12 - INFO - __main__ - Step 34018: {'lr': 0.0004444522512668346, 'samples': 6531456, 'steps': 34017, 'loss/train': 1.8973829746246338} -11/07/2021 02:02:13 - INFO - __main__ - Step 34019: {'lr': 0.0004444489159303976, 'samples': 6531648, 'steps': 34018, 'loss/train': 1.5133620500564575} -11/07/2021 02:02:13 - INFO - __main__ - Step 34020: {'lr': 0.0004444455805063448, 'samples': 6531840, 'steps': 34019, 'loss/train': 1.4161401987075806} -11/07/2021 02:02:14 - INFO - __main__ - Step 34021: {'lr': 0.00044444224499467784, 'samples': 6532032, 'steps': 34020, 'loss/train': 1.7862776517868042} -11/07/2021 02:02:14 - INFO - __main__ - Step 34022: {'lr': 0.0004444389093953982, 'samples': 6532224, 'steps': 34021, 'loss/train': 1.5086743831634521} -11/07/2021 02:02:15 - INFO - __main__ - Step 34023: {'lr': 0.00044443557370850743, 'samples': 6532416, 'steps': 34022, 'loss/train': 1.3057926893234253} -11/07/2021 02:02:15 - INFO - __main__ - Step 34024: {'lr': 0.00044443223793400695, 'samples': 6532608, 'steps': 34023, 'loss/train': 1.6543852090835571} -11/07/2021 02:02:16 - INFO - __main__ - Step 34025: {'lr': 0.0004444289020718983, 'samples': 6532800, 'steps': 34024, 'loss/train': 1.9857542514801025} -11/07/2021 02:02:17 - INFO - __main__ - Step 34026: {'lr': 0.000444425566122183, 'samples': 6532992, 'steps': 34025, 'loss/train': 0.9507812261581421} -11/07/2021 02:02:17 - INFO - __main__ - Step 34027: {'lr': 0.0004444222300848626, 'samples': 6533184, 'steps': 34026, 'loss/train': 1.056647777557373} -11/07/2021 02:02:17 - INFO - __main__ - Step 34028: {'lr': 0.00044441889395993844, 'samples': 6533376, 'steps': 34027, 'loss/train': 1.6833502054214478} -11/07/2021 02:02:18 - INFO - __main__ - Step 34029: {'lr': 0.00044441555774741215, 'samples': 6533568, 'steps': 34028, 'loss/train': 1.3435801267623901} -11/07/2021 02:02:18 - INFO - __main__ - Step 34030: {'lr': 0.00044441222144728525, 'samples': 6533760, 'steps': 34029, 'loss/train': 1.3523625135421753} -11/07/2021 02:02:19 - INFO - __main__ - Step 34031: {'lr': 0.00044440888505955926, 'samples': 6533952, 'steps': 34030, 'loss/train': 2.1320152282714844} -11/07/2021 02:02:19 - INFO - __main__ - Step 34032: {'lr': 0.00044440554858423553, 'samples': 6534144, 'steps': 34031, 'loss/train': 1.4462076425552368} -11/07/2021 02:02:20 - INFO - __main__ - Step 34033: {'lr': 0.0004444022120213157, 'samples': 6534336, 'steps': 34032, 'loss/train': 1.2795424461364746} -11/07/2021 02:02:20 - INFO - __main__ - Step 34034: {'lr': 0.00044439887537080116, 'samples': 6534528, 'steps': 34033, 'loss/train': 1.4343459606170654} -11/07/2021 02:02:20 - INFO - __main__ - Step 34035: {'lr': 0.00044439553863269356, 'samples': 6534720, 'steps': 34034, 'loss/train': 1.7785248756408691} -11/07/2021 02:02:21 - INFO - __main__ - Step 34036: {'lr': 0.00044439220180699434, 'samples': 6534912, 'steps': 34035, 'loss/train': 1.6420665979385376} -11/07/2021 02:02:22 - INFO - __main__ - Step 34037: {'lr': 0.00044438886489370493, 'samples': 6535104, 'steps': 34036, 'loss/train': 1.4897013902664185} -11/07/2021 02:02:22 - INFO - __main__ - Step 34038: {'lr': 0.00044438552789282694, 'samples': 6535296, 'steps': 34037, 'loss/train': 1.4812804460525513} -11/07/2021 02:02:22 - INFO - __main__ - Step 34039: {'lr': 0.00044438219080436184, 'samples': 6535488, 'steps': 34038, 'loss/train': 1.7232627868652344} -11/07/2021 02:02:23 - INFO - __main__ - Step 34040: {'lr': 0.0004443788536283111, 'samples': 6535680, 'steps': 34039, 'loss/train': 1.4123303890228271} -11/07/2021 02:02:23 - INFO - __main__ - Step 34041: {'lr': 0.0004443755163646762, 'samples': 6535872, 'steps': 34040, 'loss/train': 1.4441375732421875} -11/07/2021 02:02:24 - INFO - __main__ - Step 34042: {'lr': 0.00044437217901345885, 'samples': 6536064, 'steps': 34041, 'loss/train': 1.9585773944854736} -11/07/2021 02:02:24 - INFO - __main__ - Step 34043: {'lr': 0.0004443688415746602, 'samples': 6536256, 'steps': 34042, 'loss/train': 0.7225326895713806} -11/07/2021 02:02:25 - INFO - __main__ - Step 34044: {'lr': 0.00044436550404828207, 'samples': 6536448, 'steps': 34043, 'loss/train': 1.2998487949371338} -11/07/2021 02:02:25 - INFO - __main__ - Step 34045: {'lr': 0.0004443621664343258, 'samples': 6536640, 'steps': 34044, 'loss/train': 1.6461623907089233} -11/07/2021 02:02:25 - INFO - __main__ - Step 34046: {'lr': 0.000444358828732793, 'samples': 6536832, 'steps': 34045, 'loss/train': 1.1608872413635254} -11/07/2021 02:02:27 - INFO - __main__ - Step 34047: {'lr': 0.000444355490943685, 'samples': 6537024, 'steps': 34046, 'loss/train': 1.3167895078659058} -11/07/2021 02:02:27 - INFO - __main__ - Step 34048: {'lr': 0.0004443521530670035, 'samples': 6537216, 'steps': 34047, 'loss/train': 1.7646113634109497} -11/07/2021 02:02:27 - INFO - __main__ - Step 34049: {'lr': 0.00044434881510274995, 'samples': 6537408, 'steps': 34048, 'loss/train': 1.6775469779968262} -11/07/2021 02:02:28 - INFO - __main__ - Step 34050: {'lr': 0.00044434547705092574, 'samples': 6537600, 'steps': 34049, 'loss/train': 1.299673318862915} -11/07/2021 02:02:28 - INFO - __main__ - Step 34051: {'lr': 0.0004443421389115325, 'samples': 6537792, 'steps': 34050, 'loss/train': 1.6322948932647705} -11/07/2021 02:02:29 - INFO - __main__ - Step 34052: {'lr': 0.00044433880068457166, 'samples': 6537984, 'steps': 34051, 'loss/train': 1.6336530447006226} -11/07/2021 02:02:29 - INFO - __main__ - Step 34053: {'lr': 0.0004443354623700447, 'samples': 6538176, 'steps': 34052, 'loss/train': 1.146722435951233} -11/07/2021 02:02:30 - INFO - __main__ - Step 34054: {'lr': 0.0004443321239679533, 'samples': 6538368, 'steps': 34053, 'loss/train': 1.7375221252441406} -11/07/2021 02:02:30 - INFO - __main__ - Step 34055: {'lr': 0.0004443287854782988, 'samples': 6538560, 'steps': 34054, 'loss/train': 1.0673551559448242} -11/07/2021 02:02:30 - INFO - __main__ - Step 34056: {'lr': 0.0004443254469010828, 'samples': 6538752, 'steps': 34055, 'loss/train': 1.014756441116333} -11/07/2021 02:02:31 - INFO - __main__ - Step 34057: {'lr': 0.0004443221082363067, 'samples': 6538944, 'steps': 34056, 'loss/train': 1.288285255432129} -11/07/2021 02:02:32 - INFO - __main__ - Step 34058: {'lr': 0.000444318769483972, 'samples': 6539136, 'steps': 34057, 'loss/train': 1.7834769487380981} -11/07/2021 02:02:32 - INFO - __main__ - Step 34059: {'lr': 0.0004443154306440803, 'samples': 6539328, 'steps': 34058, 'loss/train': 1.7867774963378906} -11/07/2021 02:02:32 - INFO - __main__ - Step 34060: {'lr': 0.00044431209171663313, 'samples': 6539520, 'steps': 34059, 'loss/train': 0.7567717432975769} -11/07/2021 02:02:33 - INFO - __main__ - Step 34061: {'lr': 0.00044430875270163185, 'samples': 6539712, 'steps': 34060, 'loss/train': 1.6711994409561157} -11/07/2021 02:02:33 - INFO - __main__ - Step 34062: {'lr': 0.00044430541359907804, 'samples': 6539904, 'steps': 34061, 'loss/train': 1.6374399662017822} -11/07/2021 02:02:34 - INFO - __main__ - Step 34063: {'lr': 0.0004443020744089733, 'samples': 6540096, 'steps': 34062, 'loss/train': 1.5656423568725586} -11/07/2021 02:02:35 - INFO - __main__ - Step 34064: {'lr': 0.00044429873513131897, 'samples': 6540288, 'steps': 34063, 'loss/train': 3.7890005111694336} -11/07/2021 02:02:35 - INFO - __main__ - Step 34065: {'lr': 0.00044429539576611664, 'samples': 6540480, 'steps': 34064, 'loss/train': 1.0325992107391357} -11/07/2021 02:02:35 - INFO - __main__ - Step 34066: {'lr': 0.0004442920563133678, 'samples': 6540672, 'steps': 34065, 'loss/train': 0.26503893733024597} -11/07/2021 02:02:36 - INFO - __main__ - Step 34067: {'lr': 0.000444288716773074, 'samples': 6540864, 'steps': 34066, 'loss/train': 1.4189012050628662} -11/07/2021 02:02:37 - INFO - __main__ - Step 34068: {'lr': 0.00044428537714523664, 'samples': 6541056, 'steps': 34067, 'loss/train': 1.4169859886169434} -11/07/2021 02:02:37 - INFO - __main__ - Step 34069: {'lr': 0.00044428203742985734, 'samples': 6541248, 'steps': 34068, 'loss/train': 1.668953776359558} -11/07/2021 02:02:37 - INFO - __main__ - Step 34070: {'lr': 0.0004442786976269375, 'samples': 6541440, 'steps': 34069, 'loss/train': 1.685661792755127} -11/07/2021 02:02:38 - INFO - __main__ - Step 34071: {'lr': 0.0004442753577364788, 'samples': 6541632, 'steps': 34070, 'loss/train': 2.0190627574920654} -11/07/2021 02:02:38 - INFO - __main__ - Step 34072: {'lr': 0.00044427201775848246, 'samples': 6541824, 'steps': 34071, 'loss/train': 1.4158926010131836} -11/07/2021 02:02:39 - INFO - __main__ - Step 34073: {'lr': 0.0004442686776929502, 'samples': 6542016, 'steps': 34072, 'loss/train': 1.2631921768188477} -11/07/2021 02:02:39 - INFO - __main__ - Step 34074: {'lr': 0.0004442653375398835, 'samples': 6542208, 'steps': 34073, 'loss/train': 1.4398088455200195} -11/07/2021 02:02:40 - INFO - __main__ - Step 34075: {'lr': 0.0004442619972992838, 'samples': 6542400, 'steps': 34074, 'loss/train': 1.88358473777771} -11/07/2021 02:02:40 - INFO - __main__ - Step 34076: {'lr': 0.00044425865697115266, 'samples': 6542592, 'steps': 34075, 'loss/train': 0.38768935203552246} -11/07/2021 02:02:40 - INFO - __main__ - Step 34077: {'lr': 0.00044425531655549157, 'samples': 6542784, 'steps': 34076, 'loss/train': 0.8294751048088074} -11/07/2021 02:02:42 - INFO - __main__ - Step 34078: {'lr': 0.0004442519760523021, 'samples': 6542976, 'steps': 34077, 'loss/train': 1.6006672382354736} -11/07/2021 02:02:42 - INFO - __main__ - Step 34079: {'lr': 0.00044424863546158554, 'samples': 6543168, 'steps': 34078, 'loss/train': 1.5854127407073975} -11/07/2021 02:02:42 - INFO - __main__ - Step 34080: {'lr': 0.00044424529478334364, 'samples': 6543360, 'steps': 34079, 'loss/train': 1.4523556232452393} -11/07/2021 02:02:43 - INFO - __main__ - Step 34081: {'lr': 0.0004442419540175778, 'samples': 6543552, 'steps': 34080, 'loss/train': 1.5299001932144165} -11/07/2021 02:02:43 - INFO - __main__ - Step 34082: {'lr': 0.0004442386131642895, 'samples': 6543744, 'steps': 34081, 'loss/train': 1.4755926132202148} -11/07/2021 02:02:43 - INFO - __main__ - Step 34083: {'lr': 0.0004442352722234803, 'samples': 6543936, 'steps': 34082, 'loss/train': 1.3150346279144287} -11/07/2021 02:02:44 - INFO - __main__ - Step 34084: {'lr': 0.0004442319311951517, 'samples': 6544128, 'steps': 34083, 'loss/train': 2.093810558319092} -11/07/2021 02:02:45 - INFO - __main__ - Step 34085: {'lr': 0.00044422859007930515, 'samples': 6544320, 'steps': 34084, 'loss/train': 0.9736217260360718} -11/07/2021 02:02:45 - INFO - __main__ - Step 34086: {'lr': 0.00044422524887594223, 'samples': 6544512, 'steps': 34085, 'loss/train': 1.3088901042938232} -11/07/2021 02:02:45 - INFO - __main__ - Step 34087: {'lr': 0.0004442219075850644, 'samples': 6544704, 'steps': 34086, 'loss/train': 2.357985734939575} -11/07/2021 02:02:46 - INFO - __main__ - Step 34088: {'lr': 0.0004442185662066731, 'samples': 6544896, 'steps': 34087, 'loss/train': 1.6649442911148071} -11/07/2021 02:02:47 - INFO - __main__ - Step 34089: {'lr': 0.00044421522474077, 'samples': 6545088, 'steps': 34088, 'loss/train': 1.016621708869934} -11/07/2021 02:02:47 - INFO - __main__ - Step 34090: {'lr': 0.0004442118831873565, 'samples': 6545280, 'steps': 34089, 'loss/train': 2.521681547164917} -11/07/2021 02:02:48 - INFO - __main__ - Step 34091: {'lr': 0.00044420854154643413, 'samples': 6545472, 'steps': 34090, 'loss/train': 1.7413277626037598} -11/07/2021 02:02:48 - INFO - __main__ - Step 34092: {'lr': 0.00044420519981800446, 'samples': 6545664, 'steps': 34091, 'loss/train': 1.9090162515640259} -11/07/2021 02:02:48 - INFO - __main__ - Step 34093: {'lr': 0.0004442018580020688, 'samples': 6545856, 'steps': 34092, 'loss/train': 1.6657209396362305} -11/07/2021 02:02:50 - INFO - __main__ - Step 34094: {'lr': 0.0004441985160986288, 'samples': 6546048, 'steps': 34093, 'loss/train': 1.4866628646850586} -11/07/2021 02:02:50 - INFO - __main__ - Step 34095: {'lr': 0.00044419517410768594, 'samples': 6546240, 'steps': 34094, 'loss/train': 1.7155829668045044} -11/07/2021 02:02:50 - INFO - __main__ - Step 34096: {'lr': 0.0004441918320292418, 'samples': 6546432, 'steps': 34095, 'loss/train': 2.6343283653259277} -11/07/2021 02:02:51 - INFO - __main__ - Step 34097: {'lr': 0.00044418848986329775, 'samples': 6546624, 'steps': 34096, 'loss/train': 1.75544273853302} -11/07/2021 02:02:51 - INFO - __main__ - Step 34098: {'lr': 0.0004441851476098554, 'samples': 6546816, 'steps': 34097, 'loss/train': 1.4818480014801025} -11/07/2021 02:02:52 - INFO - __main__ - Step 34099: {'lr': 0.0004441818052689162, 'samples': 6547008, 'steps': 34098, 'loss/train': 1.7657145261764526} -11/07/2021 02:02:52 - INFO - __main__ - Step 34100: {'lr': 0.0004441784628404817, 'samples': 6547200, 'steps': 34099, 'loss/train': 1.303661823272705} -11/07/2021 02:02:53 - INFO - __main__ - Step 34101: {'lr': 0.0004441751203245533, 'samples': 6547392, 'steps': 34100, 'loss/train': 1.3592103719711304} -11/07/2021 02:02:53 - INFO - __main__ - Step 34102: {'lr': 0.0004441717777211327, 'samples': 6547584, 'steps': 34101, 'loss/train': 1.1900908946990967} -11/07/2021 02:02:53 - INFO - __main__ - Step 34103: {'lr': 0.00044416843503022126, 'samples': 6547776, 'steps': 34102, 'loss/train': 1.4008874893188477} -11/07/2021 02:02:55 - INFO - __main__ - Step 34104: {'lr': 0.00044416509225182044, 'samples': 6547968, 'steps': 34103, 'loss/train': 1.9034819602966309} -11/07/2021 02:02:55 - INFO - __main__ - Step 34105: {'lr': 0.0004441617493859319, 'samples': 6548160, 'steps': 34104, 'loss/train': 1.9238120317459106} -11/07/2021 02:02:55 - INFO - __main__ - Step 34106: {'lr': 0.0004441584064325571, 'samples': 6548352, 'steps': 34105, 'loss/train': 1.6103079319000244} -11/07/2021 02:02:56 - INFO - __main__ - Step 34107: {'lr': 0.0004441550633916975, 'samples': 6548544, 'steps': 34106, 'loss/train': 1.407387375831604} -11/07/2021 02:02:56 - INFO - __main__ - Step 34108: {'lr': 0.0004441517202633546, 'samples': 6548736, 'steps': 34107, 'loss/train': 1.857909083366394} -11/07/2021 02:02:56 - INFO - __main__ - Step 34109: {'lr': 0.0004441483770475299, 'samples': 6548928, 'steps': 34108, 'loss/train': 1.783825397491455} -11/07/2021 02:02:58 - INFO - __main__ - Step 34110: {'lr': 0.000444145033744225, 'samples': 6549120, 'steps': 34109, 'loss/train': 1.9305288791656494} -11/07/2021 02:02:58 - INFO - __main__ - Step 34111: {'lr': 0.0004441416903534413, 'samples': 6549312, 'steps': 34110, 'loss/train': 1.528344988822937} -11/07/2021 02:02:59 - INFO - __main__ - Step 34112: {'lr': 0.00044413834687518034, 'samples': 6549504, 'steps': 34111, 'loss/train': 1.9612399339675903} -11/07/2021 02:02:59 - INFO - __main__ - Step 34113: {'lr': 0.00044413500330944366, 'samples': 6549696, 'steps': 34112, 'loss/train': 1.5819721221923828} -11/07/2021 02:02:59 - INFO - __main__ - Step 34114: {'lr': 0.00044413165965623275, 'samples': 6549888, 'steps': 34113, 'loss/train': 1.7284300327301025} -11/07/2021 02:03:01 - INFO - __main__ - Step 34115: {'lr': 0.00044412831591554916, 'samples': 6550080, 'steps': 34114, 'loss/train': 1.3581510782241821} -11/07/2021 02:03:01 - INFO - __main__ - Step 34116: {'lr': 0.0004441249720873942, 'samples': 6550272, 'steps': 34115, 'loss/train': 1.1771085262298584} -11/07/2021 02:03:01 - INFO - __main__ - Step 34117: {'lr': 0.00044412162817176966, 'samples': 6550464, 'steps': 34116, 'loss/train': 1.4967354536056519} -11/07/2021 02:03:02 - INFO - __main__ - Step 34118: {'lr': 0.00044411828416867684, 'samples': 6550656, 'steps': 34117, 'loss/train': 1.4765671491622925} -11/07/2021 02:03:02 - INFO - __main__ - Step 34119: {'lr': 0.00044411494007811736, 'samples': 6550848, 'steps': 34118, 'loss/train': 3.327427864074707} -11/07/2021 02:03:03 - INFO - __main__ - Step 34120: {'lr': 0.00044411159590009263, 'samples': 6551040, 'steps': 34119, 'loss/train': 5.610230445861816} -11/07/2021 02:03:03 - INFO - __main__ - Step 34121: {'lr': 0.0004441082516346043, 'samples': 6551232, 'steps': 34120, 'loss/train': 5.60709285736084} -11/07/2021 02:03:04 - INFO - __main__ - Step 34122: {'lr': 0.0004441049072816537, 'samples': 6551424, 'steps': 34121, 'loss/train': 1.4392449855804443} -11/07/2021 02:03:04 - INFO - __main__ - Step 34123: {'lr': 0.0004441015628412425, 'samples': 6551616, 'steps': 34122, 'loss/train': 1.6424055099487305} -11/07/2021 02:03:05 - INFO - __main__ - Step 34124: {'lr': 0.0004440982183133721, 'samples': 6551808, 'steps': 34123, 'loss/train': 1.508685827255249} -11/07/2021 02:03:05 - INFO - __main__ - Step 34125: {'lr': 0.00044409487369804395, 'samples': 6552000, 'steps': 34124, 'loss/train': 1.6763535737991333} -11/07/2021 02:03:05 - INFO - __main__ - Step 34126: {'lr': 0.00044409152899525973, 'samples': 6552192, 'steps': 34125, 'loss/train': 1.591783046722412} -11/07/2021 02:03:06 - INFO - __main__ - Step 34127: {'lr': 0.00044408818420502085, 'samples': 6552384, 'steps': 34126, 'loss/train': 1.2297704219818115} -11/07/2021 02:03:07 - INFO - __main__ - Step 34128: {'lr': 0.00044408483932732886, 'samples': 6552576, 'steps': 34127, 'loss/train': 1.5073697566986084} -11/07/2021 02:03:07 - INFO - __main__ - Step 34129: {'lr': 0.00044408149436218523, 'samples': 6552768, 'steps': 34128, 'loss/train': 1.2436527013778687} -11/07/2021 02:03:07 - INFO - __main__ - Step 34130: {'lr': 0.00044407814930959137, 'samples': 6552960, 'steps': 34129, 'loss/train': 1.310021162033081} -11/07/2021 02:03:08 - INFO - __main__ - Step 34131: {'lr': 0.000444074804169549, 'samples': 6553152, 'steps': 34130, 'loss/train': 1.5414221286773682} -11/07/2021 02:03:09 - INFO - __main__ - Step 34132: {'lr': 0.00044407145894205947, 'samples': 6553344, 'steps': 34131, 'loss/train': 1.5979948043823242} -11/07/2021 02:03:09 - INFO - __main__ - Step 34133: {'lr': 0.0004440681136271244, 'samples': 6553536, 'steps': 34132, 'loss/train': 1.8100224733352661} -11/07/2021 02:03:10 - INFO - __main__ - Step 34134: {'lr': 0.0004440647682247452, 'samples': 6553728, 'steps': 34133, 'loss/train': 1.0398575067520142} -11/07/2021 02:03:10 - INFO - __main__ - Step 34135: {'lr': 0.00044406142273492334, 'samples': 6553920, 'steps': 34134, 'loss/train': 1.5329359769821167} -11/07/2021 02:03:11 - INFO - __main__ - Step 34136: {'lr': 0.00044405807715766047, 'samples': 6554112, 'steps': 34135, 'loss/train': 1.1437962055206299} -11/07/2021 02:03:12 - INFO - __main__ - Step 34137: {'lr': 0.00044405473149295804, 'samples': 6554304, 'steps': 34136, 'loss/train': 1.5289555788040161} -11/07/2021 02:03:12 - INFO - __main__ - Step 34138: {'lr': 0.0004440513857408175, 'samples': 6554496, 'steps': 34137, 'loss/train': 1.8025574684143066} -11/07/2021 02:03:12 - INFO - __main__ - Step 34139: {'lr': 0.0004440480399012404, 'samples': 6554688, 'steps': 34138, 'loss/train': 1.7068231105804443} -11/07/2021 02:03:13 - INFO - __main__ - Step 34140: {'lr': 0.00044404469397422823, 'samples': 6554880, 'steps': 34139, 'loss/train': 0.6725926399230957} -11/07/2021 02:03:13 - INFO - __main__ - Step 34141: {'lr': 0.00044404134795978257, 'samples': 6555072, 'steps': 34140, 'loss/train': 1.5433404445648193} -11/07/2021 02:03:14 - INFO - __main__ - Step 34142: {'lr': 0.0004440380018579049, 'samples': 6555264, 'steps': 34141, 'loss/train': 1.7330764532089233} -11/07/2021 02:03:14 - INFO - __main__ - Step 34143: {'lr': 0.00044403465566859656, 'samples': 6555456, 'steps': 34142, 'loss/train': 1.6334328651428223} -11/07/2021 02:03:15 - INFO - __main__ - Step 34144: {'lr': 0.0004440313093918593, 'samples': 6555648, 'steps': 34143, 'loss/train': 1.4875729084014893} -11/07/2021 02:03:15 - INFO - __main__ - Step 34145: {'lr': 0.00044402796302769453, 'samples': 6555840, 'steps': 34144, 'loss/train': 0.7958040833473206} -11/07/2021 02:03:15 - INFO - __main__ - Step 34146: {'lr': 0.0004440246165761037, 'samples': 6556032, 'steps': 34145, 'loss/train': 1.0676820278167725} -11/07/2021 02:03:16 - INFO - __main__ - Step 34147: {'lr': 0.00044402127003708846, 'samples': 6556224, 'steps': 34146, 'loss/train': 1.3615130186080933} -11/07/2021 02:03:17 - INFO - __main__ - Step 34148: {'lr': 0.0004440179234106502, 'samples': 6556416, 'steps': 34147, 'loss/train': 1.5049426555633545} -11/07/2021 02:03:17 - INFO - __main__ - Step 34149: {'lr': 0.00044401457669679043, 'samples': 6556608, 'steps': 34148, 'loss/train': 1.7335518598556519} -11/07/2021 02:03:18 - INFO - __main__ - Step 34150: {'lr': 0.0004440112298955107, 'samples': 6556800, 'steps': 34149, 'loss/train': 2.2905702590942383} -11/07/2021 02:03:18 - INFO - __main__ - Step 34151: {'lr': 0.0004440078830068125, 'samples': 6556992, 'steps': 34150, 'loss/train': 1.9597066640853882} -11/07/2021 02:03:18 - INFO - __main__ - Step 34152: {'lr': 0.00044400453603069727, 'samples': 6557184, 'steps': 34151, 'loss/train': 1.5736281871795654} -11/07/2021 02:03:20 - INFO - __main__ - Step 34153: {'lr': 0.0004440011889671667, 'samples': 6557376, 'steps': 34152, 'loss/train': 1.454236626625061} -11/07/2021 02:03:20 - INFO - __main__ - Step 34154: {'lr': 0.00044399784181622216, 'samples': 6557568, 'steps': 34153, 'loss/train': 1.4838290214538574} -11/07/2021 02:03:20 - INFO - __main__ - Step 34155: {'lr': 0.0004439944945778651, 'samples': 6557760, 'steps': 34154, 'loss/train': 1.7440612316131592} -11/07/2021 02:03:21 - INFO - __main__ - Step 34156: {'lr': 0.0004439911472520972, 'samples': 6557952, 'steps': 34155, 'loss/train': 1.247413992881775} -11/07/2021 02:03:21 - INFO - __main__ - Step 34157: {'lr': 0.0004439877998389199, 'samples': 6558144, 'steps': 34156, 'loss/train': 1.444315791130066} -11/07/2021 02:03:22 - INFO - __main__ - Step 34158: {'lr': 0.0004439844523383346, 'samples': 6558336, 'steps': 34157, 'loss/train': 1.4981380701065063} -11/07/2021 02:03:22 - INFO - __main__ - Step 34159: {'lr': 0.000443981104750343, 'samples': 6558528, 'steps': 34158, 'loss/train': 1.642318606376648} -11/07/2021 02:03:23 - INFO - __main__ - Step 34160: {'lr': 0.0004439777570749465, 'samples': 6558720, 'steps': 34159, 'loss/train': 1.1470081806182861} -11/07/2021 02:03:23 - INFO - __main__ - Step 34161: {'lr': 0.0004439744093121465, 'samples': 6558912, 'steps': 34160, 'loss/train': 1.8299084901809692} -11/07/2021 02:03:23 - INFO - __main__ - Step 34162: {'lr': 0.00044397106146194473, 'samples': 6559104, 'steps': 34161, 'loss/train': 1.927542805671692} -11/07/2021 02:03:24 - INFO - __main__ - Step 34163: {'lr': 0.00044396771352434256, 'samples': 6559296, 'steps': 34162, 'loss/train': 1.4433425664901733} -11/07/2021 02:03:25 - INFO - __main__ - Step 34164: {'lr': 0.00044396436549934155, 'samples': 6559488, 'steps': 34163, 'loss/train': 1.2462340593338013} -11/07/2021 02:03:25 - INFO - __main__ - Step 34165: {'lr': 0.00044396101738694316, 'samples': 6559680, 'steps': 34164, 'loss/train': 1.1547960042953491} -11/07/2021 02:03:25 - INFO - __main__ - Step 34166: {'lr': 0.000443957669187149, 'samples': 6559872, 'steps': 34165, 'loss/train': 0.9203764200210571} -11/07/2021 02:03:26 - INFO - __main__ - Step 34167: {'lr': 0.0004439543208999604, 'samples': 6560064, 'steps': 34166, 'loss/train': 1.015457034111023} -11/07/2021 02:03:26 - INFO - __main__ - Step 34168: {'lr': 0.00044395097252537905, 'samples': 6560256, 'steps': 34167, 'loss/train': 1.355995535850525} -11/07/2021 02:03:27 - INFO - __main__ - Step 34169: {'lr': 0.0004439476240634064, 'samples': 6560448, 'steps': 34168, 'loss/train': 1.298944115638733} -11/07/2021 02:03:28 - INFO - __main__ - Step 34170: {'lr': 0.00044394427551404386, 'samples': 6560640, 'steps': 34169, 'loss/train': 5.923316478729248} -11/07/2021 02:03:28 - INFO - __main__ - Step 34171: {'lr': 0.00044394092687729305, 'samples': 6560832, 'steps': 34170, 'loss/train': 1.089755654335022} -11/07/2021 02:03:28 - INFO - __main__ - Step 34172: {'lr': 0.0004439375781531555, 'samples': 6561024, 'steps': 34171, 'loss/train': 1.5006424188613892} -11/07/2021 02:03:29 - INFO - __main__ - Step 34173: {'lr': 0.00044393422934163265, 'samples': 6561216, 'steps': 34172, 'loss/train': 1.8292887210845947} -11/07/2021 02:03:30 - INFO - __main__ - Step 34174: {'lr': 0.000443930880442726, 'samples': 6561408, 'steps': 34173, 'loss/train': 1.6458317041397095} -11/07/2021 02:03:30 - INFO - __main__ - Step 34175: {'lr': 0.0004439275314564371, 'samples': 6561600, 'steps': 34174, 'loss/train': 1.5969767570495605} -11/07/2021 02:03:30 - INFO - __main__ - Step 34176: {'lr': 0.0004439241823827674, 'samples': 6561792, 'steps': 34175, 'loss/train': 0.9351884722709656} -11/07/2021 02:03:31 - INFO - __main__ - Step 34177: {'lr': 0.0004439208332217186, 'samples': 6561984, 'steps': 34176, 'loss/train': 1.02590012550354} -11/07/2021 02:03:31 - INFO - __main__ - Step 34178: {'lr': 0.00044391748397329194, 'samples': 6562176, 'steps': 34177, 'loss/train': 1.222740888595581} -11/07/2021 02:03:32 - INFO - __main__ - Step 34179: {'lr': 0.0004439141346374891, 'samples': 6562368, 'steps': 34178, 'loss/train': 1.8320636749267578} -11/07/2021 02:03:32 - INFO - __main__ - Step 34180: {'lr': 0.0004439107852143115, 'samples': 6562560, 'steps': 34179, 'loss/train': 1.2978649139404297} -11/07/2021 02:03:33 - INFO - __main__ - Step 34181: {'lr': 0.0004439074357037607, 'samples': 6562752, 'steps': 34180, 'loss/train': 2.211667060852051} -11/07/2021 02:03:33 - INFO - __main__ - Step 34182: {'lr': 0.0004439040861058383, 'samples': 6562944, 'steps': 34181, 'loss/train': 1.599212408065796} -11/07/2021 02:03:33 - INFO - __main__ - Step 34183: {'lr': 0.00044390073642054564, 'samples': 6563136, 'steps': 34182, 'loss/train': 1.436307668685913} -11/07/2021 02:03:35 - INFO - __main__ - Step 34184: {'lr': 0.00044389738664788424, 'samples': 6563328, 'steps': 34183, 'loss/train': 0.9093039631843567} -11/07/2021 02:03:35 - INFO - __main__ - Step 34185: {'lr': 0.00044389403678785576, 'samples': 6563520, 'steps': 34184, 'loss/train': 1.4228278398513794} -11/07/2021 02:03:35 - INFO - __main__ - Step 34186: {'lr': 0.0004438906868404616, 'samples': 6563712, 'steps': 34185, 'loss/train': 1.4958488941192627} -11/07/2021 02:03:36 - INFO - __main__ - Step 34187: {'lr': 0.00044388733680570324, 'samples': 6563904, 'steps': 34186, 'loss/train': 1.353678584098816} -11/07/2021 02:03:36 - INFO - __main__ - Step 34188: {'lr': 0.00044388398668358234, 'samples': 6564096, 'steps': 34187, 'loss/train': 1.4119741916656494} -11/07/2021 02:03:36 - INFO - __main__ - Step 34189: {'lr': 0.00044388063647410016, 'samples': 6564288, 'steps': 34188, 'loss/train': 1.8877049684524536} -11/07/2021 02:03:37 - INFO - __main__ - Step 34190: {'lr': 0.00044387728617725845, 'samples': 6564480, 'steps': 34189, 'loss/train': 1.3518003225326538} -11/07/2021 02:03:38 - INFO - __main__ - Step 34191: {'lr': 0.0004438739357930586, 'samples': 6564672, 'steps': 34190, 'loss/train': 1.495152473449707} -11/07/2021 02:03:38 - INFO - __main__ - Step 34192: {'lr': 0.00044387058532150217, 'samples': 6564864, 'steps': 34191, 'loss/train': 1.3404079675674438} -11/07/2021 02:03:38 - INFO - __main__ - Step 34193: {'lr': 0.0004438672347625907, 'samples': 6565056, 'steps': 34192, 'loss/train': 1.344968557357788} -11/07/2021 02:03:39 - INFO - __main__ - Step 34194: {'lr': 0.0004438638841163255, 'samples': 6565248, 'steps': 34193, 'loss/train': 1.5332821607589722} -11/07/2021 02:03:40 - INFO - __main__ - Step 34195: {'lr': 0.0004438605333827083, 'samples': 6565440, 'steps': 34194, 'loss/train': 1.675861120223999} -11/07/2021 02:03:40 - INFO - __main__ - Step 34196: {'lr': 0.00044385718256174055, 'samples': 6565632, 'steps': 34195, 'loss/train': 1.3681551218032837} -11/07/2021 02:03:40 - INFO - __main__ - Step 34197: {'lr': 0.0004438538316534237, 'samples': 6565824, 'steps': 34196, 'loss/train': 1.3978954553604126} -11/07/2021 02:03:41 - INFO - __main__ - Step 34198: {'lr': 0.0004438504806577594, 'samples': 6566016, 'steps': 34197, 'loss/train': 1.6417779922485352} -11/07/2021 02:03:41 - INFO - __main__ - Step 34199: {'lr': 0.000443847129574749, 'samples': 6566208, 'steps': 34198, 'loss/train': 1.458509922027588} -11/07/2021 02:03:42 - INFO - __main__ - Step 34200: {'lr': 0.0004438437784043941, 'samples': 6566400, 'steps': 34199, 'loss/train': 1.0733407735824585} -11/07/2021 02:03:42 - INFO - __main__ - Step 34201: {'lr': 0.00044384042714669614, 'samples': 6566592, 'steps': 34200, 'loss/train': 1.784488320350647} -11/07/2021 02:03:43 - INFO - __main__ - Step 34202: {'lr': 0.0004438370758016567, 'samples': 6566784, 'steps': 34201, 'loss/train': 1.4622405767440796} -11/07/2021 02:03:43 - INFO - __main__ - Step 34203: {'lr': 0.00044383372436927727, 'samples': 6566976, 'steps': 34202, 'loss/train': 1.6074336767196655} -11/07/2021 02:03:44 - INFO - __main__ - Step 34204: {'lr': 0.00044383037284955937, 'samples': 6567168, 'steps': 34203, 'loss/train': 1.4448004961013794} -11/07/2021 02:03:45 - INFO - __main__ - Step 34205: {'lr': 0.00044382702124250444, 'samples': 6567360, 'steps': 34204, 'loss/train': 1.7972103357315063} -11/07/2021 02:03:45 - INFO - __main__ - Step 34206: {'lr': 0.0004438236695481141, 'samples': 6567552, 'steps': 34205, 'loss/train': 1.9503910541534424} -11/07/2021 02:03:45 - INFO - __main__ - Step 34207: {'lr': 0.00044382031776638974, 'samples': 6567744, 'steps': 34206, 'loss/train': 1.1128954887390137} -11/07/2021 02:03:46 - INFO - __main__ - Step 34208: {'lr': 0.000443816965897333, 'samples': 6567936, 'steps': 34207, 'loss/train': 1.2528254985809326} -11/07/2021 02:03:46 - INFO - __main__ - Step 34209: {'lr': 0.0004438136139409453, 'samples': 6568128, 'steps': 34208, 'loss/train': 1.4778404235839844} -11/07/2021 02:03:47 - INFO - __main__ - Step 34210: {'lr': 0.00044381026189722824, 'samples': 6568320, 'steps': 34209, 'loss/train': 1.6742136478424072} -11/07/2021 02:03:47 - INFO - __main__ - Step 34211: {'lr': 0.0004438069097661832, 'samples': 6568512, 'steps': 34210, 'loss/train': 1.3790103197097778} -11/07/2021 02:03:48 - INFO - __main__ - Step 34212: {'lr': 0.0004438035575478118, 'samples': 6568704, 'steps': 34211, 'loss/train': 0.9726940393447876} -11/07/2021 02:03:48 - INFO - __main__ - Step 34213: {'lr': 0.0004438002052421154, 'samples': 6568896, 'steps': 34212, 'loss/train': 1.7135347127914429} -11/07/2021 02:03:49 - INFO - __main__ - Step 34214: {'lr': 0.00044379685284909575, 'samples': 6569088, 'steps': 34213, 'loss/train': 1.9888619184494019} -11/07/2021 02:03:49 - INFO - __main__ - Step 34215: {'lr': 0.00044379350036875413, 'samples': 6569280, 'steps': 34214, 'loss/train': 1.7909215688705444} -11/07/2021 02:03:50 - INFO - __main__ - Step 34216: {'lr': 0.00044379014780109217, 'samples': 6569472, 'steps': 34215, 'loss/train': 1.947856068611145} -11/07/2021 02:03:50 - INFO - __main__ - Step 34217: {'lr': 0.00044378679514611144, 'samples': 6569664, 'steps': 34216, 'loss/train': 1.699139952659607} -11/07/2021 02:03:51 - INFO - __main__ - Step 34218: {'lr': 0.0004437834424038133, 'samples': 6569856, 'steps': 34217, 'loss/train': 0.8595290780067444} -11/07/2021 02:03:51 - INFO - __main__ - Step 34219: {'lr': 0.00044378008957419936, 'samples': 6570048, 'steps': 34218, 'loss/train': 1.4129565954208374} -11/07/2021 02:03:51 - INFO - __main__ - Step 34220: {'lr': 0.00044377673665727105, 'samples': 6570240, 'steps': 34219, 'loss/train': 1.8418340682983398} -11/07/2021 02:03:52 - INFO - __main__ - Step 34221: {'lr': 0.00044377338365303, 'samples': 6570432, 'steps': 34220, 'loss/train': 1.3927035331726074} -11/07/2021 02:03:53 - INFO - __main__ - Step 34222: {'lr': 0.00044377003056147757, 'samples': 6570624, 'steps': 34221, 'loss/train': 1.8908228874206543} -11/07/2021 02:03:53 - INFO - __main__ - Step 34223: {'lr': 0.00044376667738261545, 'samples': 6570816, 'steps': 34222, 'loss/train': 1.8357990980148315} -11/07/2021 02:03:53 - INFO - __main__ - Step 34224: {'lr': 0.000443763324116445, 'samples': 6571008, 'steps': 34223, 'loss/train': 1.339423418045044} -11/07/2021 02:03:54 - INFO - __main__ - Step 34225: {'lr': 0.00044375997076296774, 'samples': 6571200, 'steps': 34224, 'loss/train': 1.7065150737762451} -11/07/2021 02:03:55 - INFO - __main__ - Step 34226: {'lr': 0.0004437566173221853, 'samples': 6571392, 'steps': 34225, 'loss/train': 1.329896330833435} -11/07/2021 02:03:55 - INFO - __main__ - Step 34227: {'lr': 0.0004437532637940991, 'samples': 6571584, 'steps': 34226, 'loss/train': 1.8014112710952759} -11/07/2021 02:03:55 - INFO - __main__ - Step 34228: {'lr': 0.0004437499101787107, 'samples': 6571776, 'steps': 34227, 'loss/train': 1.0249602794647217} -11/07/2021 02:03:56 - INFO - __main__ - Step 34229: {'lr': 0.00044374655647602153, 'samples': 6571968, 'steps': 34228, 'loss/train': 1.4240094423294067} -11/07/2021 02:03:56 - INFO - __main__ - Step 34230: {'lr': 0.0004437432026860332, 'samples': 6572160, 'steps': 34229, 'loss/train': 1.3589770793914795} -11/07/2021 02:03:57 - INFO - __main__ - Step 34231: {'lr': 0.00044373984880874705, 'samples': 6572352, 'steps': 34230, 'loss/train': 1.9758151769638062} -11/07/2021 02:03:57 - INFO - __main__ - Step 34232: {'lr': 0.0004437364948441649, 'samples': 6572544, 'steps': 34231, 'loss/train': 1.4315061569213867} -11/07/2021 02:03:58 - INFO - __main__ - Step 34233: {'lr': 0.00044373314079228796, 'samples': 6572736, 'steps': 34232, 'loss/train': 1.163349986076355} -11/07/2021 02:03:58 - INFO - __main__ - Step 34234: {'lr': 0.0004437297866531179, 'samples': 6572928, 'steps': 34233, 'loss/train': 1.6355782747268677} -11/07/2021 02:03:59 - INFO - __main__ - Step 34235: {'lr': 0.0004437264324266561, 'samples': 6573120, 'steps': 34234, 'loss/train': 1.6662013530731201} -11/07/2021 02:03:59 - INFO - __main__ - Step 34236: {'lr': 0.00044372307811290425, 'samples': 6573312, 'steps': 34235, 'loss/train': 0.80659419298172} -11/07/2021 02:04:00 - INFO - __main__ - Step 34237: {'lr': 0.00044371972371186374, 'samples': 6573504, 'steps': 34236, 'loss/train': 1.1076829433441162} -11/07/2021 02:04:00 - INFO - __main__ - Step 34238: {'lr': 0.0004437163692235361, 'samples': 6573696, 'steps': 34237, 'loss/train': 1.6724625825881958} -11/07/2021 02:04:00 - INFO - __main__ - Step 34239: {'lr': 0.0004437130146479229, 'samples': 6573888, 'steps': 34238, 'loss/train': 1.646666169166565} -11/07/2021 02:04:01 - INFO - __main__ - Step 34240: {'lr': 0.00044370965998502554, 'samples': 6574080, 'steps': 34239, 'loss/train': 2.2665205001831055} -11/07/2021 02:04:01 - INFO - __main__ - Step 34241: {'lr': 0.0004437063052348457, 'samples': 6574272, 'steps': 34240, 'loss/train': 1.2336525917053223} -11/07/2021 02:04:02 - INFO - __main__ - Step 34242: {'lr': 0.0004437029503973847, 'samples': 6574464, 'steps': 34241, 'loss/train': 1.5797135829925537} -11/07/2021 02:04:03 - INFO - __main__ - Step 34243: {'lr': 0.00044369959547264416, 'samples': 6574656, 'steps': 34242, 'loss/train': 1.3858048915863037} -11/07/2021 02:04:03 - INFO - __main__ - Step 34244: {'lr': 0.0004436962404606255, 'samples': 6574848, 'steps': 34243, 'loss/train': 1.3134781122207642} -11/07/2021 02:04:03 - INFO - __main__ - Step 34245: {'lr': 0.0004436928853613304, 'samples': 6575040, 'steps': 34244, 'loss/train': 1.6575181484222412} -11/07/2021 02:04:04 - INFO - __main__ - Step 34246: {'lr': 0.0004436895301747602, 'samples': 6575232, 'steps': 34245, 'loss/train': 1.971530795097351} -11/07/2021 02:04:05 - INFO - __main__ - Step 34247: {'lr': 0.00044368617490091655, 'samples': 6575424, 'steps': 34246, 'loss/train': 1.436553955078125} -11/07/2021 02:04:05 - INFO - __main__ - Step 34248: {'lr': 0.0004436828195398009, 'samples': 6575616, 'steps': 34247, 'loss/train': 1.2922219038009644} -11/07/2021 02:04:05 - INFO - __main__ - Step 34249: {'lr': 0.0004436794640914148, 'samples': 6575808, 'steps': 34248, 'loss/train': 1.1830744743347168} -11/07/2021 02:04:06 - INFO - __main__ - Step 34250: {'lr': 0.00044367610855575965, 'samples': 6576000, 'steps': 34249, 'loss/train': 1.7076432704925537} -11/07/2021 02:04:06 - INFO - __main__ - Step 34251: {'lr': 0.00044367275293283705, 'samples': 6576192, 'steps': 34250, 'loss/train': 1.1485662460327148} -11/07/2021 02:04:07 - INFO - __main__ - Step 34252: {'lr': 0.00044366939722264843, 'samples': 6576384, 'steps': 34251, 'loss/train': 1.5567431449890137} -11/07/2021 02:04:07 - INFO - __main__ - Step 34253: {'lr': 0.00044366604142519547, 'samples': 6576576, 'steps': 34252, 'loss/train': 1.6270051002502441} -11/07/2021 02:04:08 - INFO - __main__ - Step 34254: {'lr': 0.0004436626855404796, 'samples': 6576768, 'steps': 34253, 'loss/train': 1.0859005451202393} -11/07/2021 02:04:08 - INFO - __main__ - Step 34255: {'lr': 0.0004436593295685022, 'samples': 6576960, 'steps': 34254, 'loss/train': 1.3940390348434448} -11/07/2021 02:04:09 - INFO - __main__ - Step 34256: {'lr': 0.00044365597350926495, 'samples': 6577152, 'steps': 34255, 'loss/train': 1.350616455078125} -11/07/2021 02:04:10 - INFO - __main__ - Step 34257: {'lr': 0.0004436526173627693, 'samples': 6577344, 'steps': 34256, 'loss/train': 1.7524422407150269} -11/07/2021 02:04:10 - INFO - __main__ - Step 34258: {'lr': 0.00044364926112901675, 'samples': 6577536, 'steps': 34257, 'loss/train': 1.117216944694519} -11/07/2021 02:04:10 - INFO - __main__ - Step 34259: {'lr': 0.0004436459048080089, 'samples': 6577728, 'steps': 34258, 'loss/train': 0.9890215992927551} -11/07/2021 02:04:11 - INFO - __main__ - Step 34260: {'lr': 0.00044364254839974717, 'samples': 6577920, 'steps': 34259, 'loss/train': 1.560340404510498} -11/07/2021 02:04:11 - INFO - __main__ - Step 34261: {'lr': 0.0004436391919042331, 'samples': 6578112, 'steps': 34260, 'loss/train': 1.3585392236709595} -11/07/2021 02:04:12 - INFO - __main__ - Step 34262: {'lr': 0.00044363583532146814, 'samples': 6578304, 'steps': 34261, 'loss/train': 1.6851139068603516} -11/07/2021 02:04:12 - INFO - __main__ - Step 34263: {'lr': 0.0004436324786514538, 'samples': 6578496, 'steps': 34262, 'loss/train': 1.8596597909927368} -11/07/2021 02:04:13 - INFO - __main__ - Step 34264: {'lr': 0.0004436291218941918, 'samples': 6578688, 'steps': 34263, 'loss/train': 1.6587039232254028} -11/07/2021 02:04:13 - INFO - __main__ - Step 34265: {'lr': 0.00044362576504968344, 'samples': 6578880, 'steps': 34264, 'loss/train': 0.7693606019020081} -11/07/2021 02:04:13 - INFO - __main__ - Step 34266: {'lr': 0.0004436224081179303, 'samples': 6579072, 'steps': 34265, 'loss/train': 1.7554024457931519} -11/07/2021 02:04:15 - INFO - __main__ - Step 34267: {'lr': 0.00044361905109893397, 'samples': 6579264, 'steps': 34266, 'loss/train': 1.649536371231079} -11/07/2021 02:04:15 - INFO - __main__ - Step 34268: {'lr': 0.00044361569399269574, 'samples': 6579456, 'steps': 34267, 'loss/train': 1.2417728900909424} -11/07/2021 02:04:15 - INFO - __main__ - Step 34269: {'lr': 0.0004436123367992174, 'samples': 6579648, 'steps': 34268, 'loss/train': 1.3689631223678589} -11/07/2021 02:04:16 - INFO - __main__ - Step 34270: {'lr': 0.0004436089795185003, 'samples': 6579840, 'steps': 34269, 'loss/train': 1.7414630651474} -11/07/2021 02:04:16 - INFO - __main__ - Step 34271: {'lr': 0.0004436056221505459, 'samples': 6580032, 'steps': 34270, 'loss/train': 1.6733810901641846} -11/07/2021 02:04:17 - INFO - __main__ - Step 34272: {'lr': 0.00044360226469535583, 'samples': 6580224, 'steps': 34271, 'loss/train': 1.5781022310256958} -11/07/2021 02:04:17 - INFO - __main__ - Step 34273: {'lr': 0.0004435989071529316, 'samples': 6580416, 'steps': 34272, 'loss/train': 1.8803343772888184} -11/07/2021 02:04:18 - INFO - __main__ - Step 34274: {'lr': 0.0004435955495232746, 'samples': 6580608, 'steps': 34273, 'loss/train': 1.4304903745651245} -11/07/2021 02:04:18 - INFO - __main__ - Step 34275: {'lr': 0.00044359219180638656, 'samples': 6580800, 'steps': 34274, 'loss/train': 1.7356127500534058} -11/07/2021 02:04:18 - INFO - __main__ - Step 34276: {'lr': 0.0004435888340022688, 'samples': 6580992, 'steps': 34275, 'loss/train': 1.8282495737075806} -11/07/2021 02:04:19 - INFO - __main__ - Step 34277: {'lr': 0.0004435854761109229, 'samples': 6581184, 'steps': 34276, 'loss/train': 1.6848821640014648} -11/07/2021 02:04:20 - INFO - __main__ - Step 34278: {'lr': 0.00044358211813235046, 'samples': 6581376, 'steps': 34277, 'loss/train': 1.6042040586471558} -11/07/2021 02:04:20 - INFO - __main__ - Step 34279: {'lr': 0.0004435787600665528, 'samples': 6581568, 'steps': 34278, 'loss/train': 2.087636947631836} -11/07/2021 02:04:21 - INFO - __main__ - Step 34280: {'lr': 0.0004435754019135315, 'samples': 6581760, 'steps': 34279, 'loss/train': 1.4953944683074951} -11/07/2021 02:04:21 - INFO - __main__ - Step 34281: {'lr': 0.0004435720436732882, 'samples': 6581952, 'steps': 34280, 'loss/train': 1.3213019371032715} -11/07/2021 02:04:21 - INFO - __main__ - Step 34282: {'lr': 0.0004435686853458243, 'samples': 6582144, 'steps': 34281, 'loss/train': 1.548249363899231} -11/07/2021 02:04:22 - INFO - __main__ - Step 34283: {'lr': 0.0004435653269311414, 'samples': 6582336, 'steps': 34282, 'loss/train': 1.2772735357284546} -11/07/2021 02:04:23 - INFO - __main__ - Step 34284: {'lr': 0.00044356196842924086, 'samples': 6582528, 'steps': 34283, 'loss/train': 0.16299578547477722} -11/07/2021 02:04:23 - INFO - __main__ - Step 34285: {'lr': 0.0004435586098401243, 'samples': 6582720, 'steps': 34284, 'loss/train': 1.3020122051239014} -11/07/2021 02:04:24 - INFO - __main__ - Step 34286: {'lr': 0.00044355525116379326, 'samples': 6582912, 'steps': 34285, 'loss/train': 1.6647453308105469} -11/07/2021 02:04:24 - INFO - __main__ - Step 34287: {'lr': 0.00044355189240024917, 'samples': 6583104, 'steps': 34286, 'loss/train': 1.517380952835083} -11/07/2021 02:04:24 - INFO - __main__ - Step 34288: {'lr': 0.00044354853354949353, 'samples': 6583296, 'steps': 34287, 'loss/train': 1.3190693855285645} -11/07/2021 02:04:25 - INFO - __main__ - Step 34289: {'lr': 0.000443545174611528, 'samples': 6583488, 'steps': 34288, 'loss/train': 1.1464428901672363} -11/07/2021 02:04:25 - INFO - __main__ - Step 34290: {'lr': 0.000443541815586354, 'samples': 6583680, 'steps': 34289, 'loss/train': 1.4929620027542114} -11/07/2021 02:04:26 - INFO - __main__ - Step 34291: {'lr': 0.0004435384564739729, 'samples': 6583872, 'steps': 34290, 'loss/train': 1.5682131052017212} -11/07/2021 02:04:26 - INFO - __main__ - Step 34292: {'lr': 0.00044353509727438657, 'samples': 6584064, 'steps': 34291, 'loss/train': 1.5812877416610718} -11/07/2021 02:04:27 - INFO - __main__ - Step 34293: {'lr': 0.00044353173798759616, 'samples': 6584256, 'steps': 34292, 'loss/train': 1.7356139421463013} -11/07/2021 02:04:28 - INFO - __main__ - Step 34294: {'lr': 0.0004435283786136034, 'samples': 6584448, 'steps': 34293, 'loss/train': 1.6473431587219238} -11/07/2021 02:04:28 - INFO - __main__ - Step 34295: {'lr': 0.0004435250191524097, 'samples': 6584640, 'steps': 34294, 'loss/train': 1.5632716417312622} -11/07/2021 02:04:28 - INFO - __main__ - Step 34296: {'lr': 0.0004435216596040167, 'samples': 6584832, 'steps': 34295, 'loss/train': 1.4862587451934814} -11/07/2021 02:04:29 - INFO - __main__ - Step 34297: {'lr': 0.00044351829996842575, 'samples': 6585024, 'steps': 34296, 'loss/train': 0.8310204148292542} -11/07/2021 02:04:29 - INFO - __main__ - Step 34298: {'lr': 0.00044351494024563845, 'samples': 6585216, 'steps': 34297, 'loss/train': 1.7653529644012451} -11/07/2021 02:04:30 - INFO - __main__ - Step 34299: {'lr': 0.0004435115804356563, 'samples': 6585408, 'steps': 34298, 'loss/train': 0.5662867426872253} -11/07/2021 02:04:30 - INFO - __main__ - Step 34300: {'lr': 0.0004435082205384808, 'samples': 6585600, 'steps': 34299, 'loss/train': 1.818901777267456} -11/07/2021 02:04:31 - INFO - __main__ - Step 34301: {'lr': 0.00044350486055411354, 'samples': 6585792, 'steps': 34300, 'loss/train': 1.3899507522583008} -11/07/2021 02:04:31 - INFO - __main__ - Step 34302: {'lr': 0.000443501500482556, 'samples': 6585984, 'steps': 34301, 'loss/train': 0.19430121779441833} -11/07/2021 02:04:31 - INFO - __main__ - Step 34303: {'lr': 0.0004434981403238096, 'samples': 6586176, 'steps': 34302, 'loss/train': 1.502541184425354} -11/07/2021 02:04:32 - INFO - __main__ - Step 34304: {'lr': 0.0004434947800778759, 'samples': 6586368, 'steps': 34303, 'loss/train': 0.8370174765586853} -11/07/2021 02:04:33 - INFO - __main__ - Step 34305: {'lr': 0.0004434914197447565, 'samples': 6586560, 'steps': 34304, 'loss/train': 1.4450031518936157} -11/07/2021 02:04:33 - INFO - __main__ - Step 34306: {'lr': 0.0004434880593244528, 'samples': 6586752, 'steps': 34305, 'loss/train': 1.5231199264526367} -11/07/2021 02:04:33 - INFO - __main__ - Step 34307: {'lr': 0.0004434846988169664, 'samples': 6586944, 'steps': 34306, 'loss/train': 0.9623751640319824} -11/07/2021 02:04:34 - INFO - __main__ - Step 34308: {'lr': 0.0004434813382222989, 'samples': 6587136, 'steps': 34307, 'loss/train': 1.5782952308654785} -11/07/2021 02:04:34 - INFO - __main__ - Step 34309: {'lr': 0.0004434779775404515, 'samples': 6587328, 'steps': 34308, 'loss/train': 1.2805538177490234} -11/07/2021 02:04:35 - INFO - __main__ - Step 34310: {'lr': 0.000443474616771426, 'samples': 6587520, 'steps': 34309, 'loss/train': 1.5393397808074951} -11/07/2021 02:04:36 - INFO - __main__ - Step 34311: {'lr': 0.00044347125591522377, 'samples': 6587712, 'steps': 34310, 'loss/train': 1.085399866104126} -11/07/2021 02:04:36 - INFO - __main__ - Step 34312: {'lr': 0.00044346789497184643, 'samples': 6587904, 'steps': 34311, 'loss/train': 1.8326754570007324} -11/07/2021 02:04:36 - INFO - __main__ - Step 34313: {'lr': 0.0004434645339412954, 'samples': 6588096, 'steps': 34312, 'loss/train': 1.1530722379684448} -11/07/2021 02:04:37 - INFO - __main__ - Step 34314: {'lr': 0.0004434611728235722, 'samples': 6588288, 'steps': 34313, 'loss/train': 1.2123658657073975} -11/07/2021 02:04:38 - INFO - __main__ - Step 34315: {'lr': 0.0004434578116186785, 'samples': 6588480, 'steps': 34314, 'loss/train': 1.23298978805542} -11/07/2021 02:04:38 - INFO - __main__ - Step 34316: {'lr': 0.00044345445032661565, 'samples': 6588672, 'steps': 34315, 'loss/train': 1.730208158493042} -11/07/2021 02:04:38 - INFO - __main__ - Step 34317: {'lr': 0.0004434510889473852, 'samples': 6588864, 'steps': 34316, 'loss/train': 1.5077552795410156} -11/07/2021 02:04:39 - INFO - __main__ - Step 34318: {'lr': 0.00044344772748098867, 'samples': 6589056, 'steps': 34317, 'loss/train': 1.4679759740829468} -11/07/2021 02:04:39 - INFO - __main__ - Step 34319: {'lr': 0.00044344436592742755, 'samples': 6589248, 'steps': 34318, 'loss/train': 1.4131392240524292} -11/07/2021 02:04:41 - INFO - __main__ - Step 34320: {'lr': 0.0004434410042867034, 'samples': 6589440, 'steps': 34319, 'loss/train': 1.2468388080596924} -11/07/2021 02:04:41 - INFO - __main__ - Step 34321: {'lr': 0.0004434376425588178, 'samples': 6589632, 'steps': 34320, 'loss/train': 1.5157110691070557} -11/07/2021 02:04:41 - INFO - __main__ - Step 34322: {'lr': 0.00044343428074377207, 'samples': 6589824, 'steps': 34321, 'loss/train': 1.6445945501327515} -11/07/2021 02:04:42 - INFO - __main__ - Step 34323: {'lr': 0.0004434309188415679, 'samples': 6590016, 'steps': 34322, 'loss/train': 1.7932441234588623} -11/07/2021 02:04:42 - INFO - __main__ - Step 34324: {'lr': 0.0004434275568522067, 'samples': 6590208, 'steps': 34323, 'loss/train': 1.385819673538208} -11/07/2021 02:04:42 - INFO - __main__ - Step 34325: {'lr': 0.0004434241947756901, 'samples': 6590400, 'steps': 34324, 'loss/train': 1.7647372484207153} -11/07/2021 02:04:43 - INFO - __main__ - Step 34326: {'lr': 0.0004434208326120195, 'samples': 6590592, 'steps': 34325, 'loss/train': 1.27634596824646} -11/07/2021 02:04:44 - INFO - __main__ - Step 34327: {'lr': 0.0004434174703611964, 'samples': 6590784, 'steps': 34326, 'loss/train': 1.4668068885803223} -11/07/2021 02:04:44 - INFO - __main__ - Step 34328: {'lr': 0.00044341410802322247, 'samples': 6590976, 'steps': 34327, 'loss/train': 1.522247076034546} -11/07/2021 02:04:45 - INFO - __main__ - Step 34329: {'lr': 0.00044341074559809903, 'samples': 6591168, 'steps': 34328, 'loss/train': 1.5705645084381104} -11/07/2021 02:04:45 - INFO - __main__ - Step 34330: {'lr': 0.00044340738308582775, 'samples': 6591360, 'steps': 34329, 'loss/train': 1.3702070713043213} -11/07/2021 02:04:46 - INFO - __main__ - Step 34331: {'lr': 0.0004434040204864101, 'samples': 6591552, 'steps': 34330, 'loss/train': 1.5339696407318115} -11/07/2021 02:04:46 - INFO - __main__ - Step 34332: {'lr': 0.00044340065779984757, 'samples': 6591744, 'steps': 34331, 'loss/train': 1.4517829418182373} -11/07/2021 02:04:47 - INFO - __main__ - Step 34333: {'lr': 0.0004433972950261417, 'samples': 6591936, 'steps': 34332, 'loss/train': 1.3155765533447266} -11/07/2021 02:04:47 - INFO - __main__ - Step 34334: {'lr': 0.00044339393216529394, 'samples': 6592128, 'steps': 34333, 'loss/train': 1.4728405475616455} -11/07/2021 02:04:47 - INFO - __main__ - Step 34335: {'lr': 0.00044339056921730593, 'samples': 6592320, 'steps': 34334, 'loss/train': 1.1240208148956299} -11/07/2021 02:04:48 - INFO - __main__ - Step 34336: {'lr': 0.000443387206182179, 'samples': 6592512, 'steps': 34335, 'loss/train': 1.7121858596801758} -11/07/2021 02:04:49 - INFO - __main__ - Step 34337: {'lr': 0.0004433838430599149, 'samples': 6592704, 'steps': 34336, 'loss/train': 1.7511014938354492} -11/07/2021 02:04:49 - INFO - __main__ - Step 34338: {'lr': 0.000443380479850515, 'samples': 6592896, 'steps': 34337, 'loss/train': 1.3754760026931763} -11/07/2021 02:04:49 - INFO - __main__ - Step 34339: {'lr': 0.00044337711655398083, 'samples': 6593088, 'steps': 34338, 'loss/train': 1.6327975988388062} -11/07/2021 02:04:50 - INFO - __main__ - Step 34340: {'lr': 0.00044337375317031393, 'samples': 6593280, 'steps': 34339, 'loss/train': 1.2993462085723877} -11/07/2021 02:04:50 - INFO - __main__ - Step 34341: {'lr': 0.0004433703896995157, 'samples': 6593472, 'steps': 34340, 'loss/train': 1.703192114830017} -11/07/2021 02:04:51 - INFO - __main__ - Step 34342: {'lr': 0.0004433670261415879, 'samples': 6593664, 'steps': 34341, 'loss/train': 1.6066464185714722} -11/07/2021 02:04:51 - INFO - __main__ - Step 34343: {'lr': 0.0004433636624965318, 'samples': 6593856, 'steps': 34342, 'loss/train': 2.237250328063965} -11/07/2021 02:04:52 - INFO - __main__ - Step 34344: {'lr': 0.0004433602987643491, 'samples': 6594048, 'steps': 34343, 'loss/train': 1.402521014213562} -11/07/2021 02:04:52 - INFO - __main__ - Step 34345: {'lr': 0.00044335693494504115, 'samples': 6594240, 'steps': 34344, 'loss/train': 1.711129903793335} -11/07/2021 02:04:52 - INFO - __main__ - Step 34346: {'lr': 0.00044335357103860964, 'samples': 6594432, 'steps': 34345, 'loss/train': 1.3711202144622803} -11/07/2021 02:04:53 - INFO - __main__ - Step 34347: {'lr': 0.0004433502070450559, 'samples': 6594624, 'steps': 34346, 'loss/train': 1.3290324211120605} -11/07/2021 02:04:54 - INFO - __main__ - Step 34348: {'lr': 0.0004433468429643816, 'samples': 6594816, 'steps': 34347, 'loss/train': 1.5208077430725098} -11/07/2021 02:04:54 - INFO - __main__ - Step 34349: {'lr': 0.00044334347879658817, 'samples': 6595008, 'steps': 34348, 'loss/train': 1.363816261291504} -11/07/2021 02:04:55 - INFO - __main__ - Step 34350: {'lr': 0.0004433401145416771, 'samples': 6595200, 'steps': 34349, 'loss/train': 1.1282519102096558} -11/07/2021 02:04:55 - INFO - __main__ - Step 34351: {'lr': 0.00044333675019965, 'samples': 6595392, 'steps': 34350, 'loss/train': 1.5368919372558594} -11/07/2021 02:04:56 - INFO - __main__ - Step 34352: {'lr': 0.00044333338577050844, 'samples': 6595584, 'steps': 34351, 'loss/train': 1.2156026363372803} -11/07/2021 02:04:56 - INFO - __main__ - Step 34353: {'lr': 0.0004433300212542537, 'samples': 6595776, 'steps': 34352, 'loss/train': 1.3872274160385132} -11/07/2021 02:04:57 - INFO - __main__ - Step 34354: {'lr': 0.00044332665665088755, 'samples': 6595968, 'steps': 34353, 'loss/train': 1.441105604171753} -11/07/2021 02:04:57 - INFO - __main__ - Step 34355: {'lr': 0.00044332329196041133, 'samples': 6596160, 'steps': 34354, 'loss/train': 1.3930827379226685} -11/07/2021 02:04:57 - INFO - __main__ - Step 34356: {'lr': 0.0004433199271828267, 'samples': 6596352, 'steps': 34355, 'loss/train': 1.6682108640670776} -11/07/2021 02:04:58 - INFO - __main__ - Step 34357: {'lr': 0.0004433165623181349, 'samples': 6596544, 'steps': 34356, 'loss/train': 1.5918173789978027} -11/07/2021 02:04:59 - INFO - __main__ - Step 34358: {'lr': 0.0004433131973663378, 'samples': 6596736, 'steps': 34357, 'loss/train': 1.7932053804397583} -11/07/2021 02:04:59 - INFO - __main__ - Step 34359: {'lr': 0.0004433098323274367, 'samples': 6596928, 'steps': 34358, 'loss/train': 1.6864224672317505} -11/07/2021 02:04:59 - INFO - __main__ - Step 34360: {'lr': 0.00044330646720143317, 'samples': 6597120, 'steps': 34359, 'loss/train': 1.3417962789535522} -11/07/2021 02:05:00 - INFO - __main__ - Step 34361: {'lr': 0.0004433031019883288, 'samples': 6597312, 'steps': 34360, 'loss/train': 1.8701308965682983} -11/07/2021 02:05:00 - INFO - __main__ - Step 34362: {'lr': 0.00044329973668812497, 'samples': 6597504, 'steps': 34361, 'loss/train': 1.982292652130127} -11/07/2021 02:05:01 - INFO - __main__ - Step 34363: {'lr': 0.00044329637130082324, 'samples': 6597696, 'steps': 34362, 'loss/train': 1.4699153900146484} -11/07/2021 02:05:02 - INFO - __main__ - Step 34364: {'lr': 0.00044329300582642516, 'samples': 6597888, 'steps': 34363, 'loss/train': 1.9153653383255005} -11/07/2021 02:05:02 - INFO - __main__ - Step 34365: {'lr': 0.0004432896402649323, 'samples': 6598080, 'steps': 34364, 'loss/train': 0.23294086754322052} -11/07/2021 02:05:02 - INFO - __main__ - Step 34366: {'lr': 0.0004432862746163461, 'samples': 6598272, 'steps': 34365, 'loss/train': 0.15816542506217957} -11/07/2021 02:05:03 - INFO - __main__ - Step 34367: {'lr': 0.000443282908880668, 'samples': 6598464, 'steps': 34366, 'loss/train': 1.5377881526947021} -11/07/2021 02:05:04 - INFO - __main__ - Step 34368: {'lr': 0.00044327954305789963, 'samples': 6598656, 'steps': 34367, 'loss/train': 1.5757653713226318} -11/07/2021 02:05:04 - INFO - __main__ - Step 34369: {'lr': 0.0004432761771480426, 'samples': 6598848, 'steps': 34368, 'loss/train': 1.7795270681381226} -11/07/2021 02:05:05 - INFO - __main__ - Step 34370: {'lr': 0.0004432728111510982, 'samples': 6599040, 'steps': 34369, 'loss/train': 1.7433745861053467} -11/07/2021 02:05:05 - INFO - __main__ - Step 34371: {'lr': 0.000443269445067068, 'samples': 6599232, 'steps': 34370, 'loss/train': 1.4963665008544922} -11/07/2021 02:05:05 - INFO - __main__ - Step 34372: {'lr': 0.0004432660788959537, 'samples': 6599424, 'steps': 34371, 'loss/train': 1.4771994352340698} -11/07/2021 02:05:06 - INFO - __main__ - Step 34373: {'lr': 0.00044326271263775657, 'samples': 6599616, 'steps': 34372, 'loss/train': 1.2979824542999268} -11/07/2021 02:05:07 - INFO - __main__ - Step 34374: {'lr': 0.0004432593462924783, 'samples': 6599808, 'steps': 34373, 'loss/train': 1.4521307945251465} -11/07/2021 02:05:07 - INFO - __main__ - Step 34375: {'lr': 0.0004432559798601203, 'samples': 6600000, 'steps': 34374, 'loss/train': 2.020451307296753} -11/07/2021 02:05:08 - INFO - __main__ - Step 34376: {'lr': 0.0004432526133406842, 'samples': 6600192, 'steps': 34375, 'loss/train': 1.3123501539230347} -11/07/2021 02:05:08 - INFO - __main__ - Step 34377: {'lr': 0.0004432492467341715, 'samples': 6600384, 'steps': 34376, 'loss/train': 1.956892967224121} -11/07/2021 02:05:09 - INFO - __main__ - Step 34378: {'lr': 0.00044324588004058364, 'samples': 6600576, 'steps': 34377, 'loss/train': 1.793972373008728} -11/07/2021 02:05:09 - INFO - __main__ - Step 34379: {'lr': 0.00044324251325992214, 'samples': 6600768, 'steps': 34378, 'loss/train': 1.768172264099121} -11/07/2021 02:05:10 - INFO - __main__ - Step 34380: {'lr': 0.0004432391463921885, 'samples': 6600960, 'steps': 34379, 'loss/train': 1.3202482461929321} -11/07/2021 02:05:10 - INFO - __main__ - Step 34381: {'lr': 0.00044323577943738437, 'samples': 6601152, 'steps': 34380, 'loss/train': 1.0357273817062378} -11/07/2021 02:05:10 - INFO - __main__ - Step 34382: {'lr': 0.00044323241239551113, 'samples': 6601344, 'steps': 34381, 'loss/train': 1.7776743173599243} -11/07/2021 02:05:11 - INFO - __main__ - Step 34383: {'lr': 0.0004432290452665704, 'samples': 6601536, 'steps': 34382, 'loss/train': 1.7808390855789185} -11/07/2021 02:05:12 - INFO - __main__ - Step 34384: {'lr': 0.00044322567805056356, 'samples': 6601728, 'steps': 34383, 'loss/train': 0.9358270764350891} -11/07/2021 02:05:12 - INFO - __main__ - Step 34385: {'lr': 0.00044322231074749225, 'samples': 6601920, 'steps': 34384, 'loss/train': 1.4120177030563354} -11/07/2021 02:05:12 - INFO - __main__ - Step 34386: {'lr': 0.0004432189433573579, 'samples': 6602112, 'steps': 34385, 'loss/train': 1.6435332298278809} -11/07/2021 02:05:13 - INFO - __main__ - Step 34387: {'lr': 0.00044321557588016214, 'samples': 6602304, 'steps': 34386, 'loss/train': 1.2353405952453613} -11/07/2021 02:05:14 - INFO - __main__ - Step 34388: {'lr': 0.0004432122083159065, 'samples': 6602496, 'steps': 34387, 'loss/train': 1.4600342512130737} -11/07/2021 02:05:14 - INFO - __main__ - Step 34389: {'lr': 0.0004432088406645922, 'samples': 6602688, 'steps': 34388, 'loss/train': 1.603829264640808} -11/07/2021 02:05:15 - INFO - __main__ - Step 34390: {'lr': 0.00044320547292622114, 'samples': 6602880, 'steps': 34389, 'loss/train': 1.6319403648376465} -11/07/2021 02:05:15 - INFO - __main__ - Step 34391: {'lr': 0.0004432021051007946, 'samples': 6603072, 'steps': 34390, 'loss/train': 5.095420837402344} -11/07/2021 02:05:15 - INFO - __main__ - Step 34392: {'lr': 0.00044319873718831425, 'samples': 6603264, 'steps': 34391, 'loss/train': 4.394473552703857} -11/07/2021 02:05:16 - INFO - __main__ - Step 34393: {'lr': 0.00044319536918878156, 'samples': 6603456, 'steps': 34392, 'loss/train': 0.47028297185897827} -11/07/2021 02:05:17 - INFO - __main__ - Step 34394: {'lr': 0.00044319200110219794, 'samples': 6603648, 'steps': 34393, 'loss/train': 1.8763916492462158} -11/07/2021 02:05:17 - INFO - __main__ - Step 34395: {'lr': 0.000443188632928565, 'samples': 6603840, 'steps': 34394, 'loss/train': 0.4508192241191864} -11/07/2021 02:05:17 - INFO - __main__ - Step 34396: {'lr': 0.0004431852646678842, 'samples': 6604032, 'steps': 34395, 'loss/train': 1.4153156280517578} -11/07/2021 02:05:18 - INFO - __main__ - Step 34397: {'lr': 0.00044318189632015716, 'samples': 6604224, 'steps': 34396, 'loss/train': 1.6592044830322266} -11/07/2021 02:05:18 - INFO - __main__ - Step 34398: {'lr': 0.0004431785278853853, 'samples': 6604416, 'steps': 34397, 'loss/train': 0.4165332317352295} -11/07/2021 02:05:19 - INFO - __main__ - Step 34399: {'lr': 0.0004431751593635702, 'samples': 6604608, 'steps': 34398, 'loss/train': 1.0399876832962036} -11/07/2021 02:05:20 - INFO - __main__ - Step 34400: {'lr': 0.00044317179075471335, 'samples': 6604800, 'steps': 34399, 'loss/train': 0.6964524388313293} -11/07/2021 02:05:20 - INFO - __main__ - Step 34401: {'lr': 0.00044316842205881625, 'samples': 6604992, 'steps': 34400, 'loss/train': 1.3911337852478027} -11/07/2021 02:05:20 - INFO - __main__ - Step 34402: {'lr': 0.00044316505327588054, 'samples': 6605184, 'steps': 34401, 'loss/train': 1.3631318807601929} -11/07/2021 02:05:21 - INFO - __main__ - Step 34403: {'lr': 0.00044316168440590757, 'samples': 6605376, 'steps': 34402, 'loss/train': 1.8850730657577515} -11/07/2021 02:05:22 - INFO - __main__ - Step 34404: {'lr': 0.00044315831544889886, 'samples': 6605568, 'steps': 34403, 'loss/train': 1.9254916906356812} -11/07/2021 02:05:22 - INFO - __main__ - Step 34405: {'lr': 0.0004431549464048561, 'samples': 6605760, 'steps': 34404, 'loss/train': 1.6083252429962158} -11/07/2021 02:05:22 - INFO - __main__ - Step 34406: {'lr': 0.0004431515772737806, 'samples': 6605952, 'steps': 34405, 'loss/train': 1.5108321905136108} -11/07/2021 02:05:23 - INFO - __main__ - Step 34407: {'lr': 0.000443148208055674, 'samples': 6606144, 'steps': 34406, 'loss/train': 1.199692726135254} -11/07/2021 02:05:23 - INFO - __main__ - Step 34408: {'lr': 0.0004431448387505379, 'samples': 6606336, 'steps': 34407, 'loss/train': 1.8412938117980957} -11/07/2021 02:05:23 - INFO - __main__ - Step 34409: {'lr': 0.00044314146935837365, 'samples': 6606528, 'steps': 34408, 'loss/train': 1.6678533554077148} -11/07/2021 02:05:24 - INFO - __main__ - Step 34410: {'lr': 0.0004431380998791828, 'samples': 6606720, 'steps': 34409, 'loss/train': 1.5640023946762085} -11/07/2021 02:05:25 - INFO - __main__ - Step 34411: {'lr': 0.0004431347303129669, 'samples': 6606912, 'steps': 34410, 'loss/train': 1.5821495056152344} -11/07/2021 02:05:25 - INFO - __main__ - Step 34412: {'lr': 0.00044313136065972754, 'samples': 6607104, 'steps': 34411, 'loss/train': 2.051985502243042} -11/07/2021 02:05:25 - INFO - __main__ - Step 34413: {'lr': 0.0004431279909194661, 'samples': 6607296, 'steps': 34412, 'loss/train': 2.042417526245117} -11/07/2021 02:05:26 - INFO - __main__ - Step 34414: {'lr': 0.00044312462109218423, 'samples': 6607488, 'steps': 34413, 'loss/train': 0.17461176216602325} -11/07/2021 02:05:27 - INFO - __main__ - Step 34415: {'lr': 0.0004431212511778834, 'samples': 6607680, 'steps': 34414, 'loss/train': 1.5423073768615723} -11/07/2021 02:05:27 - INFO - __main__ - Step 34416: {'lr': 0.000443117881176565, 'samples': 6607872, 'steps': 34415, 'loss/train': 2.077214002609253} -11/07/2021 02:05:28 - INFO - __main__ - Step 34417: {'lr': 0.00044311451108823075, 'samples': 6608064, 'steps': 34416, 'loss/train': 1.7995798587799072} -11/07/2021 02:05:28 - INFO - __main__ - Step 34418: {'lr': 0.00044311114091288205, 'samples': 6608256, 'steps': 34417, 'loss/train': 1.594545841217041} -11/07/2021 02:05:29 - INFO - __main__ - Step 34419: {'lr': 0.0004431077706505205, 'samples': 6608448, 'steps': 34418, 'loss/train': 1.0214651823043823} -11/07/2021 02:05:30 - INFO - __main__ - Step 34420: {'lr': 0.0004431044003011475, 'samples': 6608640, 'steps': 34419, 'loss/train': 1.7008183002471924} -11/07/2021 02:05:30 - INFO - __main__ - Step 34421: {'lr': 0.00044310102986476463, 'samples': 6608832, 'steps': 34420, 'loss/train': 1.6831791400909424} -11/07/2021 02:05:30 - INFO - __main__ - Step 34422: {'lr': 0.0004430976593413735, 'samples': 6609024, 'steps': 34421, 'loss/train': 1.9238362312316895} -11/07/2021 02:05:31 - INFO - __main__ - Step 34423: {'lr': 0.0004430942887309755, 'samples': 6609216, 'steps': 34422, 'loss/train': 1.5944414138793945} -11/07/2021 02:05:31 - INFO - __main__ - Step 34424: {'lr': 0.00044309091803357216, 'samples': 6609408, 'steps': 34423, 'loss/train': 2.4328577518463135} -11/07/2021 02:05:32 - INFO - __main__ - Step 34425: {'lr': 0.0004430875472491651, 'samples': 6609600, 'steps': 34424, 'loss/train': 1.4454017877578735} -11/07/2021 02:05:33 - INFO - __main__ - Step 34426: {'lr': 0.0004430841763777557, 'samples': 6609792, 'steps': 34425, 'loss/train': 0.7977309823036194} -11/07/2021 02:05:33 - INFO - __main__ - Step 34427: {'lr': 0.0004430808054193456, 'samples': 6609984, 'steps': 34426, 'loss/train': 1.1987460851669312} -11/07/2021 02:05:33 - INFO - __main__ - Step 34428: {'lr': 0.00044307743437393623, 'samples': 6610176, 'steps': 34427, 'loss/train': 0.5758892893791199} -11/07/2021 02:05:34 - INFO - __main__ - Step 34429: {'lr': 0.0004430740632415292, 'samples': 6610368, 'steps': 34428, 'loss/train': 1.741318702697754} -11/07/2021 02:05:34 - INFO - __main__ - Step 34430: {'lr': 0.0004430706920221259, 'samples': 6610560, 'steps': 34429, 'loss/train': 1.1640336513519287} -11/07/2021 02:05:35 - INFO - __main__ - Step 34431: {'lr': 0.00044306732071572796, 'samples': 6610752, 'steps': 34430, 'loss/train': 1.7533520460128784} -11/07/2021 02:05:35 - INFO - __main__ - Step 34432: {'lr': 0.00044306394932233694, 'samples': 6610944, 'steps': 34431, 'loss/train': 1.181859016418457} -11/07/2021 02:05:36 - INFO - __main__ - Step 34433: {'lr': 0.0004430605778419542, 'samples': 6611136, 'steps': 34432, 'loss/train': 0.981018602848053} -11/07/2021 02:05:36 - INFO - __main__ - Step 34434: {'lr': 0.00044305720627458136, 'samples': 6611328, 'steps': 34433, 'loss/train': 1.5004545450210571} -11/07/2021 02:05:36 - INFO - __main__ - Step 34435: {'lr': 0.00044305383462022, 'samples': 6611520, 'steps': 34434, 'loss/train': 1.9751158952713013} -11/07/2021 02:05:37 - INFO - __main__ - Step 34436: {'lr': 0.0004430504628788714, 'samples': 6611712, 'steps': 34435, 'loss/train': 1.7379834651947021} -11/07/2021 02:05:38 - INFO - __main__ - Step 34437: {'lr': 0.0004430470910505373, 'samples': 6611904, 'steps': 34436, 'loss/train': 1.6008168458938599} -11/07/2021 02:05:38 - INFO - __main__ - Step 34438: {'lr': 0.00044304371913521926, 'samples': 6612096, 'steps': 34437, 'loss/train': 1.5827112197875977} -11/07/2021 02:05:38 - INFO - __main__ - Step 34439: {'lr': 0.0004430403471329186, 'samples': 6612288, 'steps': 34438, 'loss/train': 1.6009305715560913} -11/07/2021 02:05:39 - INFO - __main__ - Step 34440: {'lr': 0.0004430369750436369, 'samples': 6612480, 'steps': 34439, 'loss/train': 1.3736330270767212} -11/07/2021 02:05:40 - INFO - __main__ - Step 34441: {'lr': 0.0004430336028673758, 'samples': 6612672, 'steps': 34440, 'loss/train': 1.412989854812622} -11/07/2021 02:05:40 - INFO - __main__ - Step 34442: {'lr': 0.00044303023060413677, 'samples': 6612864, 'steps': 34441, 'loss/train': 1.7590703964233398} -11/07/2021 02:05:41 - INFO - __main__ - Step 34443: {'lr': 0.0004430268582539212, 'samples': 6613056, 'steps': 34442, 'loss/train': 0.712694525718689} -11/07/2021 02:05:41 - INFO - __main__ - Step 34444: {'lr': 0.0004430234858167308, 'samples': 6613248, 'steps': 34443, 'loss/train': 1.2908469438552856} -11/07/2021 02:05:41 - INFO - __main__ - Step 34445: {'lr': 0.000443020113292567, 'samples': 6613440, 'steps': 34444, 'loss/train': 1.832324743270874} -11/07/2021 02:05:42 - INFO - __main__ - Step 34446: {'lr': 0.0004430167406814312, 'samples': 6613632, 'steps': 34445, 'loss/train': 1.7984143495559692} -11/07/2021 02:05:43 - INFO - __main__ - Step 34447: {'lr': 0.0004430133679833251, 'samples': 6613824, 'steps': 34446, 'loss/train': 1.3497729301452637} -11/07/2021 02:05:43 - INFO - __main__ - Step 34448: {'lr': 0.00044300999519825016, 'samples': 6614016, 'steps': 34447, 'loss/train': 1.2625563144683838} -11/07/2021 02:05:43 - INFO - __main__ - Step 34449: {'lr': 0.00044300662232620784, 'samples': 6614208, 'steps': 34448, 'loss/train': 1.7782011032104492} -11/07/2021 02:05:44 - INFO - __main__ - Step 34450: {'lr': 0.0004430032493671998, 'samples': 6614400, 'steps': 34449, 'loss/train': 1.4495292901992798} -11/07/2021 02:05:45 - INFO - __main__ - Step 34451: {'lr': 0.0004429998763212274, 'samples': 6614592, 'steps': 34450, 'loss/train': 1.4055038690567017} -11/07/2021 02:05:45 - INFO - __main__ - Step 34452: {'lr': 0.00044299650318829233, 'samples': 6614784, 'steps': 34451, 'loss/train': 1.5259429216384888} -11/07/2021 02:05:45 - INFO - __main__ - Step 34453: {'lr': 0.0004429931299683959, 'samples': 6614976, 'steps': 34452, 'loss/train': 1.4391940832138062} -11/07/2021 02:05:46 - INFO - __main__ - Step 34454: {'lr': 0.0004429897566615398, 'samples': 6615168, 'steps': 34453, 'loss/train': 1.6740025281906128} -11/07/2021 02:05:46 - INFO - __main__ - Step 34455: {'lr': 0.0004429863832677255, 'samples': 6615360, 'steps': 34454, 'loss/train': 1.5832898616790771} -11/07/2021 02:05:47 - INFO - __main__ - Step 34456: {'lr': 0.0004429830097869545, 'samples': 6615552, 'steps': 34455, 'loss/train': 2.2626101970672607} -11/07/2021 02:05:48 - INFO - __main__ - Step 34457: {'lr': 0.0004429796362192283, 'samples': 6615744, 'steps': 34456, 'loss/train': 1.631561279296875} -11/07/2021 02:05:48 - INFO - __main__ - Step 34458: {'lr': 0.0004429762625645485, 'samples': 6615936, 'steps': 34457, 'loss/train': 1.811454176902771} -11/07/2021 02:05:48 - INFO - __main__ - Step 34459: {'lr': 0.0004429728888229166, 'samples': 6616128, 'steps': 34458, 'loss/train': 0.7323458194732666} -11/07/2021 02:05:49 - INFO - __main__ - Step 34460: {'lr': 0.000442969514994334, 'samples': 6616320, 'steps': 34459, 'loss/train': 2.325310707092285} -11/07/2021 02:05:49 - INFO - __main__ - Step 34461: {'lr': 0.0004429661410788024, 'samples': 6616512, 'steps': 34460, 'loss/train': 1.6277323961257935} -11/07/2021 02:05:50 - INFO - __main__ - Step 34462: {'lr': 0.00044296276707632323, 'samples': 6616704, 'steps': 34461, 'loss/train': 1.4860053062438965} -11/07/2021 02:05:50 - INFO - __main__ - Step 34463: {'lr': 0.000442959392986898, 'samples': 6616896, 'steps': 34462, 'loss/train': 1.9971235990524292} -11/07/2021 02:05:51 - INFO - __main__ - Step 34464: {'lr': 0.0004429560188105282, 'samples': 6617088, 'steps': 34463, 'loss/train': 1.9872291088104248} -11/07/2021 02:05:51 - INFO - __main__ - Step 34465: {'lr': 0.00044295264454721544, 'samples': 6617280, 'steps': 34464, 'loss/train': 1.2352428436279297} -11/07/2021 02:05:51 - INFO - __main__ - Step 34466: {'lr': 0.0004429492701969612, 'samples': 6617472, 'steps': 34465, 'loss/train': 1.6460707187652588} -11/07/2021 02:05:52 - INFO - __main__ - Step 34467: {'lr': 0.00044294589575976696, 'samples': 6617664, 'steps': 34466, 'loss/train': 1.4971388578414917} -11/07/2021 02:05:53 - INFO - __main__ - Step 34468: {'lr': 0.00044294252123563434, 'samples': 6617856, 'steps': 34467, 'loss/train': 1.170795202255249} -11/07/2021 02:05:53 - INFO - __main__ - Step 34469: {'lr': 0.00044293914662456475, 'samples': 6618048, 'steps': 34468, 'loss/train': 1.8215768337249756} -11/07/2021 02:05:53 - INFO - __main__ - Step 34470: {'lr': 0.00044293577192655977, 'samples': 6618240, 'steps': 34469, 'loss/train': 1.0702993869781494} -11/07/2021 02:05:54 - INFO - __main__ - Step 34471: {'lr': 0.0004429323971416209, 'samples': 6618432, 'steps': 34470, 'loss/train': 1.573993444442749} -11/07/2021 02:05:55 - INFO - __main__ - Step 34472: {'lr': 0.0004429290222697497, 'samples': 6618624, 'steps': 34471, 'loss/train': 1.3658677339553833} -11/07/2021 02:05:55 - INFO - __main__ - Step 34473: {'lr': 0.0004429256473109476, 'samples': 6618816, 'steps': 34472, 'loss/train': 2.1451096534729004} -11/07/2021 02:05:56 - INFO - __main__ - Step 34474: {'lr': 0.0004429222722652162, 'samples': 6619008, 'steps': 34473, 'loss/train': 1.6938809156417847} -11/07/2021 02:05:56 - INFO - __main__ - Step 34475: {'lr': 0.0004429188971325571, 'samples': 6619200, 'steps': 34474, 'loss/train': 1.140890121459961} -11/07/2021 02:05:56 - INFO - __main__ - Step 34476: {'lr': 0.00044291552191297155, 'samples': 6619392, 'steps': 34475, 'loss/train': 1.288952350616455} -11/07/2021 02:05:57 - INFO - __main__ - Step 34477: {'lr': 0.0004429121466064614, 'samples': 6619584, 'steps': 34476, 'loss/train': 1.6861153841018677} -11/07/2021 02:05:58 - INFO - __main__ - Step 34478: {'lr': 0.0004429087712130279, 'samples': 6619776, 'steps': 34477, 'loss/train': 1.5473966598510742} -11/07/2021 02:05:58 - INFO - __main__ - Step 34479: {'lr': 0.00044290539573267276, 'samples': 6619968, 'steps': 34478, 'loss/train': 1.5820155143737793} -11/07/2021 02:05:58 - INFO - __main__ - Step 34480: {'lr': 0.00044290202016539736, 'samples': 6620160, 'steps': 34479, 'loss/train': 1.4073911905288696} -11/07/2021 02:05:59 - INFO - __main__ - Step 34481: {'lr': 0.0004428986445112033, 'samples': 6620352, 'steps': 34480, 'loss/train': 1.5794472694396973} -11/07/2021 02:06:00 - INFO - __main__ - Step 34482: {'lr': 0.00044289526877009213, 'samples': 6620544, 'steps': 34481, 'loss/train': 0.8621578216552734} -11/07/2021 02:06:00 - INFO - __main__ - Step 34483: {'lr': 0.00044289189294206534, 'samples': 6620736, 'steps': 34482, 'loss/train': 1.5604722499847412} -11/07/2021 02:06:01 - INFO - __main__ - Step 34484: {'lr': 0.0004428885170271244, 'samples': 6620928, 'steps': 34483, 'loss/train': 1.750520944595337} -11/07/2021 02:06:01 - INFO - __main__ - Step 34485: {'lr': 0.0004428851410252709, 'samples': 6621120, 'steps': 34484, 'loss/train': 1.702553629875183} -11/07/2021 02:06:01 - INFO - __main__ - Step 34486: {'lr': 0.0004428817649365063, 'samples': 6621312, 'steps': 34485, 'loss/train': 1.4129055738449097} -11/07/2021 02:06:02 - INFO - __main__ - Step 34487: {'lr': 0.0004428783887608321, 'samples': 6621504, 'steps': 34486, 'loss/train': 1.323349118232727} -11/07/2021 02:06:03 - INFO - __main__ - Step 34488: {'lr': 0.00044287501249824996, 'samples': 6621696, 'steps': 34487, 'loss/train': 1.4780468940734863} -11/07/2021 02:06:03 - INFO - __main__ - Step 34489: {'lr': 0.0004428716361487613, 'samples': 6621888, 'steps': 34488, 'loss/train': 1.4240431785583496} -11/07/2021 02:06:03 - INFO - __main__ - Step 34490: {'lr': 0.0004428682597123677, 'samples': 6622080, 'steps': 34489, 'loss/train': 1.1206878423690796} -11/07/2021 02:06:04 - INFO - __main__ - Step 34491: {'lr': 0.0004428648831890705, 'samples': 6622272, 'steps': 34490, 'loss/train': 1.1265442371368408} -11/07/2021 02:06:04 - INFO - __main__ - Step 34492: {'lr': 0.0004428615065788715, 'samples': 6622464, 'steps': 34491, 'loss/train': 1.5670143365859985} -11/07/2021 02:06:05 - INFO - __main__ - Step 34493: {'lr': 0.00044285812988177197, 'samples': 6622656, 'steps': 34492, 'loss/train': 1.810963749885559} -11/07/2021 02:06:05 - INFO - __main__ - Step 34494: {'lr': 0.0004428547530977736, 'samples': 6622848, 'steps': 34493, 'loss/train': 2.4662539958953857} -11/07/2021 02:06:06 - INFO - __main__ - Step 34495: {'lr': 0.0004428513762268779, 'samples': 6623040, 'steps': 34494, 'loss/train': 1.601396918296814} -11/07/2021 02:06:06 - INFO - __main__ - Step 34496: {'lr': 0.00044284799926908627, 'samples': 6623232, 'steps': 34495, 'loss/train': 1.6252416372299194} -11/07/2021 02:06:06 - INFO - __main__ - Step 34497: {'lr': 0.0004428446222244004, 'samples': 6623424, 'steps': 34496, 'loss/train': 1.8902145624160767} -11/07/2021 02:06:07 - INFO - __main__ - Step 34498: {'lr': 0.0004428412450928216, 'samples': 6623616, 'steps': 34497, 'loss/train': 2.3211231231689453} -11/07/2021 02:06:08 - INFO - __main__ - Step 34499: {'lr': 0.00044283786787435156, 'samples': 6623808, 'steps': 34498, 'loss/train': 1.5495243072509766} -11/07/2021 02:06:08 - INFO - __main__ - Step 34500: {'lr': 0.0004428344905689917, 'samples': 6624000, 'steps': 34499, 'loss/train': 1.4227359294891357} -11/07/2021 02:06:09 - INFO - __main__ - Step 34501: {'lr': 0.0004428311131767437, 'samples': 6624192, 'steps': 34500, 'loss/train': 1.3194031715393066} -11/07/2021 02:06:09 - INFO - __main__ - Step 34502: {'lr': 0.0004428277356976089, 'samples': 6624384, 'steps': 34501, 'loss/train': 1.5118417739868164} -11/07/2021 02:06:10 - INFO - __main__ - Step 34503: {'lr': 0.0004428243581315889, 'samples': 6624576, 'steps': 34502, 'loss/train': 1.6565394401550293} -11/07/2021 02:06:10 - INFO - __main__ - Step 34504: {'lr': 0.0004428209804786853, 'samples': 6624768, 'steps': 34503, 'loss/train': 2.0643577575683594} -11/07/2021 02:06:11 - INFO - __main__ - Step 34505: {'lr': 0.0004428176027388995, 'samples': 6624960, 'steps': 34504, 'loss/train': 1.7344928979873657} -11/07/2021 02:06:11 - INFO - __main__ - Step 34506: {'lr': 0.0004428142249122331, 'samples': 6625152, 'steps': 34505, 'loss/train': 1.3635393381118774} -11/07/2021 02:06:11 - INFO - __main__ - Step 34507: {'lr': 0.00044281084699868747, 'samples': 6625344, 'steps': 34506, 'loss/train': 2.03305983543396} -11/07/2021 02:06:12 - INFO - __main__ - Step 34508: {'lr': 0.0004428074689982643, 'samples': 6625536, 'steps': 34507, 'loss/train': 1.5268868207931519} -11/07/2021 02:06:13 - INFO - __main__ - Step 34509: {'lr': 0.0004428040909109651, 'samples': 6625728, 'steps': 34508, 'loss/train': 1.0226173400878906} -11/07/2021 02:06:13 - INFO - __main__ - Step 34510: {'lr': 0.00044280071273679133, 'samples': 6625920, 'steps': 34509, 'loss/train': 2.0236382484436035} -11/07/2021 02:06:13 - INFO - __main__ - Step 34511: {'lr': 0.00044279733447574456, 'samples': 6626112, 'steps': 34510, 'loss/train': 1.3775317668914795} -11/07/2021 02:06:14 - INFO - __main__ - Step 34512: {'lr': 0.00044279395612782625, 'samples': 6626304, 'steps': 34511, 'loss/train': 1.2630903720855713} -11/07/2021 02:06:14 - INFO - __main__ - Step 34513: {'lr': 0.0004427905776930379, 'samples': 6626496, 'steps': 34512, 'loss/train': 1.267950415611267} -11/07/2021 02:06:15 - INFO - __main__ - Step 34514: {'lr': 0.0004427871991713812, 'samples': 6626688, 'steps': 34513, 'loss/train': 1.7912590503692627} -11/07/2021 02:06:15 - INFO - __main__ - Step 34515: {'lr': 0.0004427838205628575, 'samples': 6626880, 'steps': 34514, 'loss/train': 1.34334397315979} -11/07/2021 02:06:16 - INFO - __main__ - Step 34516: {'lr': 0.0004427804418674684, 'samples': 6627072, 'steps': 34515, 'loss/train': 1.7392035722732544} -11/07/2021 02:06:16 - INFO - __main__ - Step 34517: {'lr': 0.00044277706308521543, 'samples': 6627264, 'steps': 34516, 'loss/train': 1.7281630039215088} -11/07/2021 02:06:16 - INFO - __main__ - Step 34518: {'lr': 0.0004427736842161001, 'samples': 6627456, 'steps': 34517, 'loss/train': 1.7590572834014893} -11/07/2021 02:06:18 - INFO - __main__ - Step 34519: {'lr': 0.00044277030526012386, 'samples': 6627648, 'steps': 34518, 'loss/train': 1.390249252319336} -11/07/2021 02:06:18 - INFO - __main__ - Step 34520: {'lr': 0.0004427669262172883, 'samples': 6627840, 'steps': 34519, 'loss/train': 1.3163725137710571} -11/07/2021 02:06:18 - INFO - __main__ - Step 34521: {'lr': 0.000442763547087595, 'samples': 6628032, 'steps': 34520, 'loss/train': 1.7077306509017944} -11/07/2021 02:06:19 - INFO - __main__ - Step 34522: {'lr': 0.00044276016787104535, 'samples': 6628224, 'steps': 34521, 'loss/train': 1.5454742908477783} -11/07/2021 02:06:19 - INFO - __main__ - Step 34523: {'lr': 0.000442756788567641, 'samples': 6628416, 'steps': 34522, 'loss/train': 1.7005842924118042} -11/07/2021 02:06:20 - INFO - __main__ - Step 34524: {'lr': 0.0004427534091773834, 'samples': 6628608, 'steps': 34523, 'loss/train': 1.4194958209991455} -11/07/2021 02:06:20 - INFO - __main__ - Step 34525: {'lr': 0.00044275002970027403, 'samples': 6628800, 'steps': 34524, 'loss/train': 1.3518060445785522} -11/07/2021 02:06:21 - INFO - __main__ - Step 34526: {'lr': 0.00044274665013631457, 'samples': 6628992, 'steps': 34525, 'loss/train': 1.4356197118759155} -11/07/2021 02:06:21 - INFO - __main__ - Step 34527: {'lr': 0.0004427432704855064, 'samples': 6629184, 'steps': 34526, 'loss/train': 2.385096311569214} -11/07/2021 02:06:21 - INFO - __main__ - Step 34528: {'lr': 0.000442739890747851, 'samples': 6629376, 'steps': 34527, 'loss/train': 1.1072453260421753} -11/07/2021 02:06:22 - INFO - __main__ - Step 34529: {'lr': 0.0004427365109233502, 'samples': 6629568, 'steps': 34528, 'loss/train': 1.5673176050186157} -11/07/2021 02:06:23 - INFO - __main__ - Step 34530: {'lr': 0.00044273313101200507, 'samples': 6629760, 'steps': 34529, 'loss/train': 1.4148625135421753} -11/07/2021 02:06:23 - INFO - __main__ - Step 34531: {'lr': 0.00044272975101381754, 'samples': 6629952, 'steps': 34530, 'loss/train': 1.4686460494995117} -11/07/2021 02:06:23 - INFO - __main__ - Step 34532: {'lr': 0.0004427263709287889, 'samples': 6630144, 'steps': 34531, 'loss/train': 1.4572937488555908} -11/07/2021 02:06:24 - INFO - __main__ - Step 34533: {'lr': 0.00044272299075692067, 'samples': 6630336, 'steps': 34532, 'loss/train': 1.7855355739593506} -11/07/2021 02:06:24 - INFO - __main__ - Step 34534: {'lr': 0.0004427196104982145, 'samples': 6630528, 'steps': 34533, 'loss/train': 1.7922431230545044} -11/07/2021 02:06:25 - INFO - __main__ - Step 34535: {'lr': 0.0004427162301526718, 'samples': 6630720, 'steps': 34534, 'loss/train': 1.4673815965652466} -11/07/2021 02:06:26 - INFO - __main__ - Step 34536: {'lr': 0.0004427128497202941, 'samples': 6630912, 'steps': 34535, 'loss/train': 1.608618974685669} -11/07/2021 02:06:26 - INFO - __main__ - Step 34537: {'lr': 0.00044270946920108305, 'samples': 6631104, 'steps': 34536, 'loss/train': 1.6207798719406128} -11/07/2021 02:06:26 - INFO - __main__ - Step 34538: {'lr': 0.00044270608859504006, 'samples': 6631296, 'steps': 34537, 'loss/train': 0.22153504192829132} -11/07/2021 02:06:27 - INFO - __main__ - Step 34539: {'lr': 0.0004427027079021667, 'samples': 6631488, 'steps': 34538, 'loss/train': 1.4280678033828735} -11/07/2021 02:06:28 - INFO - __main__ - Step 34540: {'lr': 0.0004426993271224645, 'samples': 6631680, 'steps': 34539, 'loss/train': 1.7425754070281982} -11/07/2021 02:06:28 - INFO - __main__ - Step 34541: {'lr': 0.0004426959462559349, 'samples': 6631872, 'steps': 34540, 'loss/train': 1.6339389085769653} -11/07/2021 02:06:28 - INFO - __main__ - Step 34542: {'lr': 0.0004426925653025795, 'samples': 6632064, 'steps': 34541, 'loss/train': 0.9596696496009827} -11/07/2021 02:06:29 - INFO - __main__ - Step 34543: {'lr': 0.0004426891842623998, 'samples': 6632256, 'steps': 34542, 'loss/train': 1.1412307024002075} -11/07/2021 02:06:29 - INFO - __main__ - Step 34544: {'lr': 0.0004426858031353973, 'samples': 6632448, 'steps': 34543, 'loss/train': 1.977781891822815} -11/07/2021 02:06:30 - INFO - __main__ - Step 34545: {'lr': 0.0004426824219215736, 'samples': 6632640, 'steps': 34544, 'loss/train': 1.415607213973999} -11/07/2021 02:06:31 - INFO - __main__ - Step 34546: {'lr': 0.00044267904062093014, 'samples': 6632832, 'steps': 34545, 'loss/train': 1.7016005516052246} -11/07/2021 02:06:31 - INFO - __main__ - Step 34547: {'lr': 0.0004426756592334685, 'samples': 6633024, 'steps': 34546, 'loss/train': 1.861208438873291} -11/07/2021 02:06:31 - INFO - __main__ - Step 34548: {'lr': 0.0004426722777591902, 'samples': 6633216, 'steps': 34547, 'loss/train': 1.6598010063171387} -11/07/2021 02:06:32 - INFO - __main__ - Step 34549: {'lr': 0.00044266889619809665, 'samples': 6633408, 'steps': 34548, 'loss/train': 0.9987548589706421} -11/07/2021 02:06:33 - INFO - __main__ - Step 34550: {'lr': 0.00044266551455018953, 'samples': 6633600, 'steps': 34549, 'loss/train': 1.3395533561706543} -11/07/2021 02:06:33 - INFO - __main__ - Step 34551: {'lr': 0.0004426621328154703, 'samples': 6633792, 'steps': 34550, 'loss/train': 1.5238016843795776} -11/07/2021 02:06:33 - INFO - __main__ - Step 34552: {'lr': 0.0004426587509939405, 'samples': 6633984, 'steps': 34551, 'loss/train': 1.5283972024917603} -11/07/2021 02:06:34 - INFO - __main__ - Step 34553: {'lr': 0.0004426553690856016, 'samples': 6634176, 'steps': 34552, 'loss/train': 0.9244617223739624} -11/07/2021 02:06:34 - INFO - __main__ - Step 34554: {'lr': 0.0004426519870904552, 'samples': 6634368, 'steps': 34553, 'loss/train': 1.0109336376190186} -11/07/2021 02:06:35 - INFO - __main__ - Step 34555: {'lr': 0.0004426486050085028, 'samples': 6634560, 'steps': 34554, 'loss/train': 1.4150766134262085} -11/07/2021 02:06:35 - INFO - __main__ - Step 34556: {'lr': 0.0004426452228397458, 'samples': 6634752, 'steps': 34555, 'loss/train': 1.6579521894454956} -11/07/2021 02:06:36 - INFO - __main__ - Step 34557: {'lr': 0.000442641840584186, 'samples': 6634944, 'steps': 34556, 'loss/train': 1.2919400930404663} -11/07/2021 02:06:36 - INFO - __main__ - Step 34558: {'lr': 0.00044263845824182467, 'samples': 6635136, 'steps': 34557, 'loss/train': 1.589131474494934} -11/07/2021 02:06:37 - INFO - __main__ - Step 34559: {'lr': 0.0004426350758126634, 'samples': 6635328, 'steps': 34558, 'loss/train': 1.3349565267562866} -11/07/2021 02:06:37 - INFO - __main__ - Step 34560: {'lr': 0.0004426316932967038, 'samples': 6635520, 'steps': 34559, 'loss/train': 1.3592138290405273} -11/07/2021 02:06:38 - INFO - __main__ - Step 34561: {'lr': 0.0004426283106939473, 'samples': 6635712, 'steps': 34560, 'loss/train': 0.11542725563049316} -11/07/2021 02:06:38 - INFO - __main__ - Step 34562: {'lr': 0.00044262492800439547, 'samples': 6635904, 'steps': 34561, 'loss/train': 1.0397703647613525} -11/07/2021 02:06:39 - INFO - __main__ - Step 34563: {'lr': 0.00044262154522804986, 'samples': 6636096, 'steps': 34562, 'loss/train': 1.0929821729660034} -11/07/2021 02:06:39 - INFO - __main__ - Step 34564: {'lr': 0.00044261816236491186, 'samples': 6636288, 'steps': 34563, 'loss/train': 1.6028127670288086} -11/07/2021 02:06:39 - INFO - __main__ - Step 34565: {'lr': 0.00044261477941498316, 'samples': 6636480, 'steps': 34564, 'loss/train': 1.8307973146438599} -11/07/2021 02:06:41 - INFO - __main__ - Step 34566: {'lr': 0.0004426113963782652, 'samples': 6636672, 'steps': 34565, 'loss/train': 1.577295184135437} -11/07/2021 02:06:41 - INFO - __main__ - Step 34567: {'lr': 0.00044260801325475953, 'samples': 6636864, 'steps': 34566, 'loss/train': 1.518283724784851} -11/07/2021 02:06:41 - INFO - __main__ - Step 34568: {'lr': 0.0004426046300444676, 'samples': 6637056, 'steps': 34567, 'loss/train': 1.3665200471878052} -11/07/2021 02:06:42 - INFO - __main__ - Step 34569: {'lr': 0.000442601246747391, 'samples': 6637248, 'steps': 34568, 'loss/train': 0.9717766046524048} -11/07/2021 02:06:42 - INFO - __main__ - Step 34570: {'lr': 0.0004425978633635313, 'samples': 6637440, 'steps': 34569, 'loss/train': 1.7114320993423462} -11/07/2021 02:06:43 - INFO - __main__ - Step 34571: {'lr': 0.0004425944798928899, 'samples': 6637632, 'steps': 34570, 'loss/train': 1.2611310482025146} -11/07/2021 02:06:43 - INFO - __main__ - Step 34572: {'lr': 0.0004425910963354685, 'samples': 6637824, 'steps': 34571, 'loss/train': 1.8750895261764526} -11/07/2021 02:06:44 - INFO - __main__ - Step 34573: {'lr': 0.0004425877126912685, 'samples': 6638016, 'steps': 34572, 'loss/train': 1.4090310335159302} -11/07/2021 02:06:44 - INFO - __main__ - Step 34574: {'lr': 0.00044258432896029145, 'samples': 6638208, 'steps': 34573, 'loss/train': 1.5623373985290527} -11/07/2021 02:06:44 - INFO - __main__ - Step 34575: {'lr': 0.00044258094514253876, 'samples': 6638400, 'steps': 34574, 'loss/train': 1.7206676006317139} -11/07/2021 02:06:46 - INFO - __main__ - Step 34576: {'lr': 0.00044257756123801216, 'samples': 6638592, 'steps': 34575, 'loss/train': 1.7571005821228027} -11/07/2021 02:06:46 - INFO - __main__ - Step 34577: {'lr': 0.0004425741772467131, 'samples': 6638784, 'steps': 34576, 'loss/train': 1.5985610485076904} -11/07/2021 02:06:46 - INFO - __main__ - Step 34578: {'lr': 0.0004425707931686431, 'samples': 6638976, 'steps': 34577, 'loss/train': 1.5311017036437988} -11/07/2021 02:06:47 - INFO - __main__ - Step 34579: {'lr': 0.00044256740900380364, 'samples': 6639168, 'steps': 34578, 'loss/train': 1.5247910022735596} -11/07/2021 02:06:47 - INFO - __main__ - Step 34580: {'lr': 0.0004425640247521963, 'samples': 6639360, 'steps': 34579, 'loss/train': 1.1286942958831787} -11/07/2021 02:06:48 - INFO - __main__ - Step 34581: {'lr': 0.00044256064041382255, 'samples': 6639552, 'steps': 34580, 'loss/train': 1.1327813863754272} -11/07/2021 02:06:48 - INFO - __main__ - Step 34582: {'lr': 0.0004425572559886839, 'samples': 6639744, 'steps': 34581, 'loss/train': 1.8219044208526611} -11/07/2021 02:06:49 - INFO - __main__ - Step 34583: {'lr': 0.00044255387147678206, 'samples': 6639936, 'steps': 34582, 'loss/train': 1.4360731840133667} -11/07/2021 02:06:49 - INFO - __main__ - Step 34584: {'lr': 0.0004425504868781183, 'samples': 6640128, 'steps': 34583, 'loss/train': 1.4580005407333374} -11/07/2021 02:06:49 - INFO - __main__ - Step 34585: {'lr': 0.0004425471021926943, 'samples': 6640320, 'steps': 34584, 'loss/train': 1.171671986579895} -11/07/2021 02:06:51 - INFO - __main__ - Step 34586: {'lr': 0.0004425437174205115, 'samples': 6640512, 'steps': 34585, 'loss/train': 1.599912166595459} -11/07/2021 02:06:51 - INFO - __main__ - Step 34587: {'lr': 0.00044254033256157154, 'samples': 6640704, 'steps': 34586, 'loss/train': 1.182337760925293} -11/07/2021 02:06:51 - INFO - __main__ - Step 34588: {'lr': 0.0004425369476158759, 'samples': 6640896, 'steps': 34587, 'loss/train': 1.4919441938400269} -11/07/2021 02:06:52 - INFO - __main__ - Step 34589: {'lr': 0.000442533562583426, 'samples': 6641088, 'steps': 34588, 'loss/train': 1.6986876726150513} -11/07/2021 02:06:52 - INFO - __main__ - Step 34590: {'lr': 0.00044253017746422355, 'samples': 6641280, 'steps': 34589, 'loss/train': 1.2049636840820312} -11/07/2021 02:06:53 - INFO - __main__ - Step 34591: {'lr': 0.00044252679225826984, 'samples': 6641472, 'steps': 34590, 'loss/train': 1.3515605926513672} -11/07/2021 02:06:53 - INFO - __main__ - Step 34592: {'lr': 0.0004425234069655666, 'samples': 6641664, 'steps': 34591, 'loss/train': 1.5792065858840942} -11/07/2021 02:06:54 - INFO - __main__ - Step 34593: {'lr': 0.0004425200215861153, 'samples': 6641856, 'steps': 34592, 'loss/train': 1.6354613304138184} -11/07/2021 02:06:54 - INFO - __main__ - Step 34594: {'lr': 0.00044251663611991743, 'samples': 6642048, 'steps': 34593, 'loss/train': 0.740597128868103} -11/07/2021 02:06:54 - INFO - __main__ - Step 34595: {'lr': 0.0004425132505669745, 'samples': 6642240, 'steps': 34594, 'loss/train': 0.7850571274757385} -11/07/2021 02:06:56 - INFO - __main__ - Step 34596: {'lr': 0.00044250986492728805, 'samples': 6642432, 'steps': 34595, 'loss/train': 1.890939712524414} -11/07/2021 02:06:56 - INFO - __main__ - Step 34597: {'lr': 0.0004425064792008597, 'samples': 6642624, 'steps': 34596, 'loss/train': 2.3666765689849854} -11/07/2021 02:06:56 - INFO - __main__ - Step 34598: {'lr': 0.0004425030933876909, 'samples': 6642816, 'steps': 34597, 'loss/train': 1.675109624862671} -11/07/2021 02:06:57 - INFO - __main__ - Step 34599: {'lr': 0.0004424997074877831, 'samples': 6643008, 'steps': 34598, 'loss/train': 1.7059627771377563} -11/07/2021 02:06:57 - INFO - __main__ - Step 34600: {'lr': 0.00044249632150113806, 'samples': 6643200, 'steps': 34599, 'loss/train': 1.568487286567688} -11/07/2021 02:06:57 - INFO - __main__ - Step 34601: {'lr': 0.000442492935427757, 'samples': 6643392, 'steps': 34600, 'loss/train': 1.5505502223968506} -11/07/2021 02:06:58 - INFO - __main__ - Step 34602: {'lr': 0.00044248954926764164, 'samples': 6643584, 'steps': 34601, 'loss/train': 1.3338634967803955} -11/07/2021 02:06:59 - INFO - __main__ - Step 34603: {'lr': 0.0004424861630207935, 'samples': 6643776, 'steps': 34602, 'loss/train': 1.2154052257537842} -11/07/2021 02:06:59 - INFO - __main__ - Step 34604: {'lr': 0.00044248277668721396, 'samples': 6643968, 'steps': 34603, 'loss/train': 1.4059666395187378} -11/07/2021 02:06:59 - INFO - __main__ - Step 34605: {'lr': 0.00044247939026690475, 'samples': 6644160, 'steps': 34604, 'loss/train': 1.9255297183990479} -11/07/2021 02:07:00 - INFO - __main__ - Step 34606: {'lr': 0.0004424760037598673, 'samples': 6644352, 'steps': 34605, 'loss/train': 1.4503154754638672} -11/07/2021 02:07:01 - INFO - __main__ - Step 34607: {'lr': 0.00044247261716610307, 'samples': 6644544, 'steps': 34606, 'loss/train': 2.0782949924468994} -11/07/2021 02:07:01 - INFO - __main__ - Step 34608: {'lr': 0.0004424692304856136, 'samples': 6644736, 'steps': 34607, 'loss/train': 1.8896739482879639} -11/07/2021 02:07:02 - INFO - __main__ - Step 34609: {'lr': 0.0004424658437184006, 'samples': 6644928, 'steps': 34608, 'loss/train': 1.4949098825454712} -11/07/2021 02:07:02 - INFO - __main__ - Step 34610: {'lr': 0.0004424624568644654, 'samples': 6645120, 'steps': 34609, 'loss/train': 1.5061067342758179} -11/07/2021 02:07:02 - INFO - __main__ - Step 34611: {'lr': 0.00044245906992380955, 'samples': 6645312, 'steps': 34610, 'loss/train': 1.4784544706344604} -11/07/2021 02:07:03 - INFO - __main__ - Step 34612: {'lr': 0.0004424556828964347, 'samples': 6645504, 'steps': 34611, 'loss/train': 1.0631170272827148} -11/07/2021 02:07:04 - INFO - __main__ - Step 34613: {'lr': 0.0004424522957823422, 'samples': 6645696, 'steps': 34612, 'loss/train': 1.161199927330017} -11/07/2021 02:07:04 - INFO - __main__ - Step 34614: {'lr': 0.00044244890858153376, 'samples': 6645888, 'steps': 34613, 'loss/train': 1.1820472478866577} -11/07/2021 02:07:04 - INFO - __main__ - Step 34615: {'lr': 0.00044244552129401075, 'samples': 6646080, 'steps': 34614, 'loss/train': 1.2303963899612427} -11/07/2021 02:07:05 - INFO - __main__ - Step 34616: {'lr': 0.0004424421339197747, 'samples': 6646272, 'steps': 34615, 'loss/train': 1.4271446466445923} -11/07/2021 02:07:06 - INFO - __main__ - Step 34617: {'lr': 0.00044243874645882733, 'samples': 6646464, 'steps': 34616, 'loss/train': 1.3017340898513794} -11/07/2021 02:07:06 - INFO - __main__ - Step 34618: {'lr': 0.0004424353589111699, 'samples': 6646656, 'steps': 34617, 'loss/train': 1.511954426765442} -11/07/2021 02:07:06 - INFO - __main__ - Step 34619: {'lr': 0.0004424319712768041, 'samples': 6646848, 'steps': 34618, 'loss/train': 1.4079127311706543} -11/07/2021 02:07:07 - INFO - __main__ - Step 34620: {'lr': 0.00044242858355573143, 'samples': 6647040, 'steps': 34619, 'loss/train': 1.2601699829101562} -11/07/2021 02:07:07 - INFO - __main__ - Step 34621: {'lr': 0.00044242519574795347, 'samples': 6647232, 'steps': 34620, 'loss/train': 1.5387800931930542} -11/07/2021 02:07:08 - INFO - __main__ - Step 34622: {'lr': 0.00044242180785347164, 'samples': 6647424, 'steps': 34621, 'loss/train': 1.591779112815857} -11/07/2021 02:07:09 - INFO - __main__ - Step 34623: {'lr': 0.00044241841987228747, 'samples': 6647616, 'steps': 34622, 'loss/train': 1.5455999374389648} -11/07/2021 02:07:09 - INFO - __main__ - Step 34624: {'lr': 0.00044241503180440263, 'samples': 6647808, 'steps': 34623, 'loss/train': 1.5934284925460815} -11/07/2021 02:07:09 - INFO - __main__ - Step 34625: {'lr': 0.0004424116436498185, 'samples': 6648000, 'steps': 34624, 'loss/train': 1.0495797395706177} -11/07/2021 02:07:10 - INFO - __main__ - Step 34626: {'lr': 0.0004424082554085366, 'samples': 6648192, 'steps': 34625, 'loss/train': 1.6510077714920044} -11/07/2021 02:07:11 - INFO - __main__ - Step 34627: {'lr': 0.0004424048670805586, 'samples': 6648384, 'steps': 34626, 'loss/train': 1.0533374547958374} -11/07/2021 02:07:11 - INFO - __main__ - Step 34628: {'lr': 0.0004424014786658859, 'samples': 6648576, 'steps': 34627, 'loss/train': 1.5134165287017822} -11/07/2021 02:07:11 - INFO - __main__ - Step 34629: {'lr': 0.00044239809016452, 'samples': 6648768, 'steps': 34628, 'loss/train': 1.4800750017166138} -11/07/2021 02:07:12 - INFO - __main__ - Step 34630: {'lr': 0.00044239470157646254, 'samples': 6648960, 'steps': 34629, 'loss/train': 1.61317777633667} -11/07/2021 02:07:12 - INFO - __main__ - Step 34631: {'lr': 0.000442391312901715, 'samples': 6649152, 'steps': 34630, 'loss/train': 1.6633764505386353} -11/07/2021 02:07:12 - INFO - __main__ - Step 34632: {'lr': 0.0004423879241402788, 'samples': 6649344, 'steps': 34631, 'loss/train': 1.8914424180984497} -11/07/2021 02:07:13 - INFO - __main__ - Step 34633: {'lr': 0.00044238453529215575, 'samples': 6649536, 'steps': 34632, 'loss/train': 1.3253827095031738} -11/07/2021 02:07:14 - INFO - __main__ - Step 34634: {'lr': 0.00044238114635734713, 'samples': 6649728, 'steps': 34633, 'loss/train': 1.6357054710388184} -11/07/2021 02:07:14 - INFO - __main__ - Step 34635: {'lr': 0.0004423777573358545, 'samples': 6649920, 'steps': 34634, 'loss/train': 1.5532491207122803} -11/07/2021 02:07:15 - INFO - __main__ - Step 34636: {'lr': 0.0004423743682276794, 'samples': 6650112, 'steps': 34635, 'loss/train': 1.3229199647903442} -11/07/2021 02:07:15 - INFO - __main__ - Step 34637: {'lr': 0.0004423709790328235, 'samples': 6650304, 'steps': 34636, 'loss/train': 1.3128234148025513} -11/07/2021 02:07:16 - INFO - __main__ - Step 34638: {'lr': 0.0004423675897512881, 'samples': 6650496, 'steps': 34637, 'loss/train': 1.764772653579712} -11/07/2021 02:07:16 - INFO - __main__ - Step 34639: {'lr': 0.0004423642003830748, 'samples': 6650688, 'steps': 34638, 'loss/train': 1.3187963962554932} -11/07/2021 02:07:17 - INFO - __main__ - Step 34640: {'lr': 0.00044236081092818527, 'samples': 6650880, 'steps': 34639, 'loss/train': 1.4747387170791626} -11/07/2021 02:07:17 - INFO - __main__ - Step 34641: {'lr': 0.00044235742138662085, 'samples': 6651072, 'steps': 34640, 'loss/train': 1.697799563407898} -11/07/2021 02:07:17 - INFO - __main__ - Step 34642: {'lr': 0.0004423540317583832, 'samples': 6651264, 'steps': 34641, 'loss/train': 1.5078938007354736} -11/07/2021 02:07:18 - INFO - __main__ - Step 34643: {'lr': 0.00044235064204347377, 'samples': 6651456, 'steps': 34642, 'loss/train': 1.9758487939834595} -11/07/2021 02:07:19 - INFO - __main__ - Step 34644: {'lr': 0.0004423472522418941, 'samples': 6651648, 'steps': 34643, 'loss/train': 1.5313408374786377} -11/07/2021 02:07:19 - INFO - __main__ - Step 34645: {'lr': 0.0004423438623536457, 'samples': 6651840, 'steps': 34644, 'loss/train': 1.3848991394042969} -11/07/2021 02:07:19 - INFO - __main__ - Step 34646: {'lr': 0.0004423404723787301, 'samples': 6652032, 'steps': 34645, 'loss/train': 0.7880754470825195} -11/07/2021 02:07:20 - INFO - __main__ - Step 34647: {'lr': 0.000442337082317149, 'samples': 6652224, 'steps': 34646, 'loss/train': 1.656903624534607} -11/07/2021 02:07:21 - INFO - __main__ - Step 34648: {'lr': 0.0004423336921689036, 'samples': 6652416, 'steps': 34647, 'loss/train': 1.0038855075836182} -11/07/2021 02:07:21 - INFO - __main__ - Step 34649: {'lr': 0.0004423303019339957, 'samples': 6652608, 'steps': 34648, 'loss/train': 1.808814525604248} -11/07/2021 02:07:21 - INFO - __main__ - Step 34650: {'lr': 0.0004423269116124267, 'samples': 6652800, 'steps': 34649, 'loss/train': 1.7514744997024536} -11/07/2021 02:07:22 - INFO - __main__ - Step 34651: {'lr': 0.0004423235212041982, 'samples': 6652992, 'steps': 34650, 'loss/train': 1.5523748397827148} -11/07/2021 02:07:22 - INFO - __main__ - Step 34652: {'lr': 0.00044232013070931165, 'samples': 6653184, 'steps': 34651, 'loss/train': 0.8525782823562622} -11/07/2021 02:07:23 - INFO - __main__ - Step 34653: {'lr': 0.00044231674012776864, 'samples': 6653376, 'steps': 34652, 'loss/train': 1.537770390510559} -11/07/2021 02:07:24 - INFO - __main__ - Step 34654: {'lr': 0.0004423133494595707, 'samples': 6653568, 'steps': 34653, 'loss/train': 1.724595546722412} -11/07/2021 02:07:24 - INFO - __main__ - Step 34655: {'lr': 0.00044230995870471923, 'samples': 6653760, 'steps': 34654, 'loss/train': 2.3284170627593994} -11/07/2021 02:07:24 - INFO - __main__ - Step 34656: {'lr': 0.000442306567863216, 'samples': 6653952, 'steps': 34655, 'loss/train': 1.2631199359893799} -11/07/2021 02:07:25 - INFO - __main__ - Step 34657: {'lr': 0.00044230317693506226, 'samples': 6654144, 'steps': 34656, 'loss/train': 1.8032299280166626} -11/07/2021 02:07:25 - INFO - __main__ - Step 34658: {'lr': 0.00044229978592025975, 'samples': 6654336, 'steps': 34657, 'loss/train': 1.4368984699249268} -11/07/2021 02:07:26 - INFO - __main__ - Step 34659: {'lr': 0.00044229639481881, 'samples': 6654528, 'steps': 34658, 'loss/train': 1.7114256620407104} -11/07/2021 02:07:26 - INFO - __main__ - Step 34660: {'lr': 0.00044229300363071434, 'samples': 6654720, 'steps': 34659, 'loss/train': 1.4131542444229126} -11/07/2021 02:07:27 - INFO - __main__ - Step 34661: {'lr': 0.0004422896123559744, 'samples': 6654912, 'steps': 34660, 'loss/train': 1.4714182615280151} -11/07/2021 02:07:27 - INFO - __main__ - Step 34662: {'lr': 0.00044228622099459183, 'samples': 6655104, 'steps': 34661, 'loss/train': 1.4233191013336182} -11/07/2021 02:07:27 - INFO - __main__ - Step 34663: {'lr': 0.000442282829546568, 'samples': 6655296, 'steps': 34662, 'loss/train': 1.2954325675964355} -11/07/2021 02:07:28 - INFO - __main__ - Step 34664: {'lr': 0.00044227943801190454, 'samples': 6655488, 'steps': 34663, 'loss/train': 1.5540417432785034} -11/07/2021 02:07:29 - INFO - __main__ - Step 34665: {'lr': 0.0004422760463906029, 'samples': 6655680, 'steps': 34664, 'loss/train': 1.7930601835250854} -11/07/2021 02:07:29 - INFO - __main__ - Step 34666: {'lr': 0.00044227265468266464, 'samples': 6655872, 'steps': 34665, 'loss/train': 1.5526427030563354} -11/07/2021 02:07:30 - INFO - __main__ - Step 34667: {'lr': 0.0004422692628880913, 'samples': 6656064, 'steps': 34666, 'loss/train': 1.0020115375518799} -11/07/2021 02:07:30 - INFO - __main__ - Step 34668: {'lr': 0.00044226587100688436, 'samples': 6656256, 'steps': 34667, 'loss/train': 0.9848887324333191} -11/07/2021 02:07:31 - INFO - __main__ - Step 34669: {'lr': 0.0004422624790390454, 'samples': 6656448, 'steps': 34668, 'loss/train': 1.892004370689392} -11/07/2021 02:07:31 - INFO - __main__ - Step 34670: {'lr': 0.000442259086984576, 'samples': 6656640, 'steps': 34669, 'loss/train': 0.9863758683204651} -11/07/2021 02:07:32 - INFO - __main__ - Step 34671: {'lr': 0.00044225569484347753, 'samples': 6656832, 'steps': 34670, 'loss/train': 1.4947410821914673} -11/07/2021 02:07:32 - INFO - __main__ - Step 34672: {'lr': 0.00044225230261575165, 'samples': 6657024, 'steps': 34671, 'loss/train': 1.550666332244873} -11/07/2021 02:07:32 - INFO - __main__ - Step 34673: {'lr': 0.00044224891030139986, 'samples': 6657216, 'steps': 34672, 'loss/train': 1.230271577835083} -11/07/2021 02:07:33 - INFO - __main__ - Step 34674: {'lr': 0.0004422455179004237, 'samples': 6657408, 'steps': 34673, 'loss/train': 1.6041208505630493} -11/07/2021 02:07:34 - INFO - __main__ - Step 34675: {'lr': 0.00044224212541282463, 'samples': 6657600, 'steps': 34674, 'loss/train': 1.1184190511703491} -11/07/2021 02:07:34 - INFO - __main__ - Step 34676: {'lr': 0.0004422387328386042, 'samples': 6657792, 'steps': 34675, 'loss/train': 1.2925069332122803} -11/07/2021 02:07:34 - INFO - __main__ - Step 34677: {'lr': 0.000442235340177764, 'samples': 6657984, 'steps': 34676, 'loss/train': 1.5358885526657104} -11/07/2021 02:07:35 - INFO - __main__ - Step 34678: {'lr': 0.00044223194743030556, 'samples': 6658176, 'steps': 34677, 'loss/train': 1.7155054807662964} -11/07/2021 02:07:36 - INFO - __main__ - Step 34679: {'lr': 0.00044222855459623034, 'samples': 6658368, 'steps': 34678, 'loss/train': 1.3513246774673462} -11/07/2021 02:07:37 - INFO - __main__ - Step 34680: {'lr': 0.00044222516167553985, 'samples': 6658560, 'steps': 34679, 'loss/train': 1.089221715927124} -11/07/2021 02:07:37 - INFO - __main__ - Step 34681: {'lr': 0.0004422217686682357, 'samples': 6658752, 'steps': 34680, 'loss/train': 0.9267388582229614} -11/07/2021 02:07:37 - INFO - __main__ - Step 34682: {'lr': 0.00044221837557431945, 'samples': 6658944, 'steps': 34681, 'loss/train': 1.5414425134658813} -11/07/2021 02:07:38 - INFO - __main__ - Step 34683: {'lr': 0.00044221498239379247, 'samples': 6659136, 'steps': 34682, 'loss/train': 1.783010482788086} -11/07/2021 02:07:38 - INFO - __main__ - Step 34684: {'lr': 0.0004422115891266565, 'samples': 6659328, 'steps': 34683, 'loss/train': 1.790891408920288} -11/07/2021 02:07:38 - INFO - __main__ - Step 34685: {'lr': 0.00044220819577291283, 'samples': 6659520, 'steps': 34684, 'loss/train': 1.6551603078842163} -11/07/2021 02:07:39 - INFO - __main__ - Step 34686: {'lr': 0.00044220480233256315, 'samples': 6659712, 'steps': 34685, 'loss/train': 1.8620059490203857} -11/07/2021 02:07:40 - INFO - __main__ - Step 34687: {'lr': 0.00044220140880560897, 'samples': 6659904, 'steps': 34686, 'loss/train': 1.5913258790969849} -11/07/2021 02:07:40 - INFO - __main__ - Step 34688: {'lr': 0.0004421980151920518, 'samples': 6660096, 'steps': 34687, 'loss/train': 1.3367774486541748} -11/07/2021 02:07:40 - INFO - __main__ - Step 34689: {'lr': 0.00044219462149189313, 'samples': 6660288, 'steps': 34688, 'loss/train': 1.2430310249328613} -11/07/2021 02:07:41 - INFO - __main__ - Step 34690: {'lr': 0.0004421912277051346, 'samples': 6660480, 'steps': 34689, 'loss/train': 1.542733907699585} -11/07/2021 02:07:42 - INFO - __main__ - Step 34691: {'lr': 0.00044218783383177763, 'samples': 6660672, 'steps': 34690, 'loss/train': 2.0949127674102783} -11/07/2021 02:07:42 - INFO - __main__ - Step 34692: {'lr': 0.00044218443987182384, 'samples': 6660864, 'steps': 34691, 'loss/train': 1.4428645372390747} -11/07/2021 02:07:42 - INFO - __main__ - Step 34693: {'lr': 0.0004421810458252746, 'samples': 6661056, 'steps': 34692, 'loss/train': 1.51067054271698} -11/07/2021 02:07:43 - INFO - __main__ - Step 34694: {'lr': 0.00044217765169213166, 'samples': 6661248, 'steps': 34693, 'loss/train': 2.990875244140625} -11/07/2021 02:07:43 - INFO - __main__ - Step 34695: {'lr': 0.00044217425747239636, 'samples': 6661440, 'steps': 34694, 'loss/train': 1.3043237924575806} -11/07/2021 02:07:44 - INFO - __main__ - Step 34696: {'lr': 0.00044217086316607033, 'samples': 6661632, 'steps': 34695, 'loss/train': 0.15015660226345062} -11/07/2021 02:07:45 - INFO - __main__ - Step 34697: {'lr': 0.00044216746877315504, 'samples': 6661824, 'steps': 34696, 'loss/train': 1.921492338180542} -11/07/2021 02:07:45 - INFO - __main__ - Step 34698: {'lr': 0.0004421640742936521, 'samples': 6662016, 'steps': 34697, 'loss/train': 1.4255037307739258} -11/07/2021 02:07:45 - INFO - __main__ - Step 34699: {'lr': 0.000442160679727563, 'samples': 6662208, 'steps': 34698, 'loss/train': 0.9124966859817505} -11/07/2021 02:07:46 - INFO - __main__ - Step 34700: {'lr': 0.0004421572850748893, 'samples': 6662400, 'steps': 34699, 'loss/train': 1.3457306623458862} -11/07/2021 02:07:47 - INFO - __main__ - Step 34701: {'lr': 0.00044215389033563235, 'samples': 6662592, 'steps': 34700, 'loss/train': 0.5043824911117554} -11/07/2021 02:07:47 - INFO - __main__ - Step 34702: {'lr': 0.00044215049550979394, 'samples': 6662784, 'steps': 34701, 'loss/train': 1.148721694946289} -11/07/2021 02:07:47 - INFO - __main__ - Step 34703: {'lr': 0.0004421471005973755, 'samples': 6662976, 'steps': 34702, 'loss/train': 3.545989990234375} -11/07/2021 02:07:48 - INFO - __main__ - Step 34704: {'lr': 0.0004421437055983785, 'samples': 6663168, 'steps': 34703, 'loss/train': 1.1789891719818115} -11/07/2021 02:07:48 - INFO - __main__ - Step 34705: {'lr': 0.0004421403105128045, 'samples': 6663360, 'steps': 34704, 'loss/train': 1.4928643703460693} -11/07/2021 02:07:49 - INFO - __main__ - Step 34706: {'lr': 0.00044213691534065503, 'samples': 6663552, 'steps': 34705, 'loss/train': 1.7695435285568237} -11/07/2021 02:07:49 - INFO - __main__ - Step 34707: {'lr': 0.0004421335200819316, 'samples': 6663744, 'steps': 34706, 'loss/train': 1.4045119285583496} -11/07/2021 02:07:50 - INFO - __main__ - Step 34708: {'lr': 0.00044213012473663584, 'samples': 6663936, 'steps': 34707, 'loss/train': 1.6348592042922974} -11/07/2021 02:07:50 - INFO - __main__ - Step 34709: {'lr': 0.0004421267293047692, 'samples': 6664128, 'steps': 34708, 'loss/train': 1.248964786529541} -11/07/2021 02:07:51 - INFO - __main__ - Step 34710: {'lr': 0.0004421233337863332, 'samples': 6664320, 'steps': 34709, 'loss/train': 1.435050368309021} -11/07/2021 02:07:52 - INFO - __main__ - Step 34711: {'lr': 0.0004421199381813293, 'samples': 6664512, 'steps': 34710, 'loss/train': 0.36825597286224365} -11/07/2021 02:07:52 - INFO - __main__ - Step 34712: {'lr': 0.0004421165424897593, 'samples': 6664704, 'steps': 34711, 'loss/train': 1.7275134325027466} -11/07/2021 02:07:52 - INFO - __main__ - Step 34713: {'lr': 0.00044211314671162446, 'samples': 6664896, 'steps': 34712, 'loss/train': 1.3651692867279053} -11/07/2021 02:07:53 - INFO - __main__ - Step 34714: {'lr': 0.0004421097508469264, 'samples': 6665088, 'steps': 34713, 'loss/train': 1.607322096824646} -11/07/2021 02:07:53 - INFO - __main__ - Step 34715: {'lr': 0.0004421063548956666, 'samples': 6665280, 'steps': 34714, 'loss/train': 1.7779440879821777} -11/07/2021 02:07:53 - INFO - __main__ - Step 34716: {'lr': 0.0004421029588578468, 'samples': 6665472, 'steps': 34715, 'loss/train': 1.2604187726974487} -11/07/2021 02:07:54 - INFO - __main__ - Step 34717: {'lr': 0.00044209956273346816, 'samples': 6665664, 'steps': 34716, 'loss/train': 1.660188913345337} -11/07/2021 02:07:55 - INFO - __main__ - Step 34718: {'lr': 0.0004420961665225326, 'samples': 6665856, 'steps': 34717, 'loss/train': 1.611341118812561} -11/07/2021 02:07:55 - INFO - __main__ - Step 34719: {'lr': 0.0004420927702250414, 'samples': 6666048, 'steps': 34718, 'loss/train': 1.270687222480774} -11/07/2021 02:07:56 - INFO - __main__ - Step 34720: {'lr': 0.00044208937384099614, 'samples': 6666240, 'steps': 34719, 'loss/train': 1.3792513608932495} -11/07/2021 02:07:56 - INFO - __main__ - Step 34721: {'lr': 0.0004420859773703985, 'samples': 6666432, 'steps': 34720, 'loss/train': 1.6422091722488403} -11/07/2021 02:07:57 - INFO - __main__ - Step 34722: {'lr': 0.0004420825808132497, 'samples': 6666624, 'steps': 34721, 'loss/train': 1.6275794506072998} -11/07/2021 02:07:57 - INFO - __main__ - Step 34723: {'lr': 0.0004420791841695515, 'samples': 6666816, 'steps': 34722, 'loss/train': 1.3561608791351318} -11/07/2021 02:07:58 - INFO - __main__ - Step 34724: {'lr': 0.00044207578743930544, 'samples': 6667008, 'steps': 34723, 'loss/train': 1.690434455871582} -11/07/2021 02:07:58 - INFO - __main__ - Step 34725: {'lr': 0.00044207239062251297, 'samples': 6667200, 'steps': 34724, 'loss/train': 1.4305295944213867} -11/07/2021 02:07:58 - INFO - __main__ - Step 34726: {'lr': 0.00044206899371917563, 'samples': 6667392, 'steps': 34725, 'loss/train': 1.0719469785690308} -11/07/2021 02:07:59 - INFO - __main__ - Step 34727: {'lr': 0.00044206559672929505, 'samples': 6667584, 'steps': 34726, 'loss/train': 1.5531504154205322} -11/07/2021 02:08:00 - INFO - __main__ - Step 34728: {'lr': 0.00044206219965287253, 'samples': 6667776, 'steps': 34727, 'loss/train': 1.0178858041763306} -11/07/2021 02:08:00 - INFO - __main__ - Step 34729: {'lr': 0.0004420588024899098, 'samples': 6667968, 'steps': 34728, 'loss/train': 1.555402159690857} -11/07/2021 02:08:00 - INFO - __main__ - Step 34730: {'lr': 0.00044205540524040846, 'samples': 6668160, 'steps': 34729, 'loss/train': 1.5309548377990723} -11/07/2021 02:08:01 - INFO - __main__ - Step 34731: {'lr': 0.0004420520079043698, 'samples': 6668352, 'steps': 34730, 'loss/train': 1.6775578260421753} -11/07/2021 02:08:01 - INFO - __main__ - Step 34732: {'lr': 0.00044204861048179544, 'samples': 6668544, 'steps': 34731, 'loss/train': 1.8591980934143066} -11/07/2021 02:08:02 - INFO - __main__ - Step 34733: {'lr': 0.000442045212972687, 'samples': 6668736, 'steps': 34732, 'loss/train': 1.4219645261764526} -11/07/2021 02:08:02 - INFO - __main__ - Step 34734: {'lr': 0.00044204181537704594, 'samples': 6668928, 'steps': 34733, 'loss/train': 3.3481669425964355} -11/07/2021 02:08:03 - INFO - __main__ - Step 34735: {'lr': 0.0004420384176948738, 'samples': 6669120, 'steps': 34734, 'loss/train': 1.136333703994751} -11/07/2021 02:08:03 - INFO - __main__ - Step 34736: {'lr': 0.0004420350199261721, 'samples': 6669312, 'steps': 34735, 'loss/train': 1.2063430547714233} -11/07/2021 02:08:03 - INFO - __main__ - Step 34737: {'lr': 0.0004420316220709424, 'samples': 6669504, 'steps': 34736, 'loss/train': 1.3695883750915527} -11/07/2021 02:08:05 - INFO - __main__ - Step 34738: {'lr': 0.0004420282241291862, 'samples': 6669696, 'steps': 34737, 'loss/train': 1.309014916419983} -11/07/2021 02:08:05 - INFO - __main__ - Step 34739: {'lr': 0.0004420248261009051, 'samples': 6669888, 'steps': 34738, 'loss/train': 1.4217370748519897} -11/07/2021 02:08:05 - INFO - __main__ - Step 34740: {'lr': 0.0004420214279861005, 'samples': 6670080, 'steps': 34739, 'loss/train': 1.6708537340164185} -11/07/2021 02:08:06 - INFO - __main__ - Step 34741: {'lr': 0.000442018029784774, 'samples': 6670272, 'steps': 34740, 'loss/train': 1.6417057514190674} -11/07/2021 02:08:06 - INFO - __main__ - Step 34742: {'lr': 0.00044201463149692725, 'samples': 6670464, 'steps': 34741, 'loss/train': 0.7682157754898071} -11/07/2021 02:08:07 - INFO - __main__ - Step 34743: {'lr': 0.0004420112331225616, 'samples': 6670656, 'steps': 34742, 'loss/train': 1.6508562564849854} -11/07/2021 02:08:07 - INFO - __main__ - Step 34744: {'lr': 0.0004420078346616786, 'samples': 6670848, 'steps': 34743, 'loss/train': 1.143585205078125} -11/07/2021 02:08:08 - INFO - __main__ - Step 34745: {'lr': 0.00044200443611427985, 'samples': 6671040, 'steps': 34744, 'loss/train': 1.240492343902588} -11/07/2021 02:08:08 - INFO - __main__ - Step 34746: {'lr': 0.000442001037480367, 'samples': 6671232, 'steps': 34745, 'loss/train': 1.3379449844360352} -11/07/2021 02:08:08 - INFO - __main__ - Step 34747: {'lr': 0.0004419976387599413, 'samples': 6671424, 'steps': 34746, 'loss/train': 1.318930983543396} -11/07/2021 02:08:09 - INFO - __main__ - Step 34748: {'lr': 0.0004419942399530045, 'samples': 6671616, 'steps': 34747, 'loss/train': 1.1978917121887207} -11/07/2021 02:08:10 - INFO - __main__ - Step 34749: {'lr': 0.000441990841059558, 'samples': 6671808, 'steps': 34748, 'loss/train': 1.252805471420288} -11/07/2021 02:08:10 - INFO - __main__ - Step 34750: {'lr': 0.0004419874420796034, 'samples': 6672000, 'steps': 34749, 'loss/train': 1.8787426948547363} -11/07/2021 02:08:10 - INFO - __main__ - Step 34751: {'lr': 0.00044198404301314223, 'samples': 6672192, 'steps': 34750, 'loss/train': 1.2014528512954712} -11/07/2021 02:08:11 - INFO - __main__ - Step 34752: {'lr': 0.000441980643860176, 'samples': 6672384, 'steps': 34751, 'loss/train': 1.153993844985962} -11/07/2021 02:08:12 - INFO - __main__ - Step 34753: {'lr': 0.0004419772446207063, 'samples': 6672576, 'steps': 34752, 'loss/train': 1.0246278047561646} -11/07/2021 02:08:12 - INFO - __main__ - Step 34754: {'lr': 0.0004419738452947346, 'samples': 6672768, 'steps': 34753, 'loss/train': 1.601043462753296} -11/07/2021 02:08:13 - INFO - __main__ - Step 34755: {'lr': 0.00044197044588226245, 'samples': 6672960, 'steps': 34754, 'loss/train': 1.3129998445510864} -11/07/2021 02:08:13 - INFO - __main__ - Step 34756: {'lr': 0.00044196704638329134, 'samples': 6673152, 'steps': 34755, 'loss/train': 1.5781275033950806} -11/07/2021 02:08:13 - INFO - __main__ - Step 34757: {'lr': 0.00044196364679782284, 'samples': 6673344, 'steps': 34756, 'loss/train': 1.534688115119934} -11/07/2021 02:08:14 - INFO - __main__ - Step 34758: {'lr': 0.00044196024712585854, 'samples': 6673536, 'steps': 34757, 'loss/train': 1.2186495065689087} -11/07/2021 02:08:15 - INFO - __main__ - Step 34759: {'lr': 0.0004419568473673999, 'samples': 6673728, 'steps': 34758, 'loss/train': 1.7138926982879639} -11/07/2021 02:08:15 - INFO - __main__ - Step 34760: {'lr': 0.00044195344752244844, 'samples': 6673920, 'steps': 34759, 'loss/train': 1.3245975971221924} -11/07/2021 02:08:15 - INFO - __main__ - Step 34761: {'lr': 0.0004419500475910057, 'samples': 6674112, 'steps': 34760, 'loss/train': 2.0108070373535156} -11/07/2021 02:08:16 - INFO - __main__ - Step 34762: {'lr': 0.0004419466475730732, 'samples': 6674304, 'steps': 34761, 'loss/train': 2.0209977626800537} -11/07/2021 02:08:17 - INFO - __main__ - Step 34763: {'lr': 0.00044194324746865265, 'samples': 6674496, 'steps': 34762, 'loss/train': 0.17314231395721436} -11/07/2021 02:08:17 - INFO - __main__ - Step 34764: {'lr': 0.00044193984727774533, 'samples': 6674688, 'steps': 34763, 'loss/train': 1.089399814605713} -11/07/2021 02:08:17 - INFO - __main__ - Step 34765: {'lr': 0.0004419364470003529, 'samples': 6674880, 'steps': 34764, 'loss/train': 1.7820653915405273} -11/07/2021 02:08:18 - INFO - __main__ - Step 34766: {'lr': 0.00044193304663647684, 'samples': 6675072, 'steps': 34765, 'loss/train': 0.5651389360427856} -11/07/2021 02:08:18 - INFO - __main__ - Step 34767: {'lr': 0.00044192964618611875, 'samples': 6675264, 'steps': 34766, 'loss/train': 1.915136694908142} -11/07/2021 02:08:19 - INFO - __main__ - Step 34768: {'lr': 0.0004419262456492801, 'samples': 6675456, 'steps': 34767, 'loss/train': 1.3549784421920776} -11/07/2021 02:08:19 - INFO - __main__ - Step 34769: {'lr': 0.0004419228450259625, 'samples': 6675648, 'steps': 34768, 'loss/train': 0.9835052490234375} -11/07/2021 02:08:20 - INFO - __main__ - Step 34770: {'lr': 0.00044191944431616734, 'samples': 6675840, 'steps': 34769, 'loss/train': 1.5672987699508667} -11/07/2021 02:08:20 - INFO - __main__ - Step 34771: {'lr': 0.0004419160435198963, 'samples': 6676032, 'steps': 34770, 'loss/train': 1.1811498403549194} -11/07/2021 02:08:21 - INFO - __main__ - Step 34772: {'lr': 0.00044191264263715083, 'samples': 6676224, 'steps': 34771, 'loss/train': 1.283642053604126} -11/07/2021 02:08:21 - INFO - __main__ - Step 34773: {'lr': 0.00044190924166793245, 'samples': 6676416, 'steps': 34772, 'loss/train': 1.3295031785964966} -11/07/2021 02:08:22 - INFO - __main__ - Step 34774: {'lr': 0.00044190584061224277, 'samples': 6676608, 'steps': 34773, 'loss/train': 1.20137357711792} -11/07/2021 02:08:22 - INFO - __main__ - Step 34775: {'lr': 0.0004419024394700833, 'samples': 6676800, 'steps': 34774, 'loss/train': 0.9757902026176453} -11/07/2021 02:08:23 - INFO - __main__ - Step 34776: {'lr': 0.0004418990382414555, 'samples': 6676992, 'steps': 34775, 'loss/train': 1.6098065376281738} -11/07/2021 02:08:23 - INFO - __main__ - Step 34777: {'lr': 0.000441895636926361, 'samples': 6677184, 'steps': 34776, 'loss/train': 1.4362106323242188} -11/07/2021 02:08:23 - INFO - __main__ - Step 34778: {'lr': 0.0004418922355248013, 'samples': 6677376, 'steps': 34777, 'loss/train': 1.3258627653121948} -11/07/2021 02:08:24 - INFO - __main__ - Step 34779: {'lr': 0.00044188883403677783, 'samples': 6677568, 'steps': 34778, 'loss/train': 1.1535234451293945} -11/07/2021 02:08:25 - INFO - __main__ - Step 34780: {'lr': 0.0004418854324622923, 'samples': 6677760, 'steps': 34779, 'loss/train': 1.4015830755233765} -11/07/2021 02:08:25 - INFO - __main__ - Step 34781: {'lr': 0.0004418820308013461, 'samples': 6677952, 'steps': 34780, 'loss/train': 1.5423986911773682} -11/07/2021 02:08:25 - INFO - __main__ - Step 34782: {'lr': 0.0004418786290539408, 'samples': 6678144, 'steps': 34781, 'loss/train': 2.191751718521118} -11/07/2021 02:08:26 - INFO - __main__ - Step 34783: {'lr': 0.000441875227220078, 'samples': 6678336, 'steps': 34782, 'loss/train': 1.3227585554122925} -11/07/2021 02:08:27 - INFO - __main__ - Step 34784: {'lr': 0.00044187182529975924, 'samples': 6678528, 'steps': 34783, 'loss/train': 1.5984337329864502} -11/07/2021 02:08:27 - INFO - __main__ - Step 34785: {'lr': 0.00044186842329298594, 'samples': 6678720, 'steps': 34784, 'loss/train': 1.293143391609192} -11/07/2021 02:08:27 - INFO - __main__ - Step 34786: {'lr': 0.0004418650211997596, 'samples': 6678912, 'steps': 34785, 'loss/train': 1.5011814832687378} -11/07/2021 02:08:28 - INFO - __main__ - Step 34787: {'lr': 0.00044186161902008193, 'samples': 6679104, 'steps': 34786, 'loss/train': 0.9370352625846863} -11/07/2021 02:08:28 - INFO - __main__ - Step 34788: {'lr': 0.0004418582167539544, 'samples': 6679296, 'steps': 34787, 'loss/train': 1.3798874616622925} -11/07/2021 02:08:29 - INFO - __main__ - Step 34789: {'lr': 0.00044185481440137846, 'samples': 6679488, 'steps': 34788, 'loss/train': 1.240277886390686} -11/07/2021 02:08:30 - INFO - __main__ - Step 34790: {'lr': 0.0004418514119623557, 'samples': 6679680, 'steps': 34789, 'loss/train': 1.4599852561950684} -11/07/2021 02:08:30 - INFO - __main__ - Step 34791: {'lr': 0.00044184800943688774, 'samples': 6679872, 'steps': 34790, 'loss/train': 1.3775103092193604} -11/07/2021 02:08:30 - INFO - __main__ - Step 34792: {'lr': 0.00044184460682497595, 'samples': 6680064, 'steps': 34791, 'loss/train': 1.8663573265075684} -11/07/2021 02:08:31 - INFO - __main__ - Step 34793: {'lr': 0.00044184120412662196, 'samples': 6680256, 'steps': 34792, 'loss/train': 0.7620434761047363} -11/07/2021 02:08:31 - INFO - __main__ - Step 34794: {'lr': 0.00044183780134182725, 'samples': 6680448, 'steps': 34793, 'loss/train': 1.5115052461624146} -11/07/2021 02:08:32 - INFO - __main__ - Step 34795: {'lr': 0.0004418343984705935, 'samples': 6680640, 'steps': 34794, 'loss/train': 1.2904330492019653} -11/07/2021 02:08:33 - INFO - __main__ - Step 34796: {'lr': 0.000441830995512922, 'samples': 6680832, 'steps': 34795, 'loss/train': 1.414196491241455} -11/07/2021 02:08:33 - INFO - __main__ - Step 34797: {'lr': 0.00044182759246881446, 'samples': 6681024, 'steps': 34796, 'loss/train': 1.9183604717254639} -11/07/2021 02:08:33 - INFO - __main__ - Step 34798: {'lr': 0.0004418241893382724, 'samples': 6681216, 'steps': 34797, 'loss/train': 1.7295217514038086} -11/07/2021 02:08:34 - INFO - __main__ - Step 34799: {'lr': 0.0004418207861212973, 'samples': 6681408, 'steps': 34798, 'loss/train': 1.2074306011199951} -11/07/2021 02:08:35 - INFO - __main__ - Step 34800: {'lr': 0.0004418173828178906, 'samples': 6681600, 'steps': 34799, 'loss/train': 1.9541829824447632} -11/07/2021 02:08:35 - INFO - __main__ - Step 34801: {'lr': 0.0004418139794280541, 'samples': 6681792, 'steps': 34800, 'loss/train': 1.5093656778335571} -11/07/2021 02:08:35 - INFO - __main__ - Step 34802: {'lr': 0.0004418105759517892, 'samples': 6681984, 'steps': 34801, 'loss/train': 0.3188191056251526} -11/07/2021 02:08:36 - INFO - __main__ - Step 34803: {'lr': 0.0004418071723890973, 'samples': 6682176, 'steps': 34802, 'loss/train': 1.9970906972885132} -11/07/2021 02:08:36 - INFO - __main__ - Step 34804: {'lr': 0.0004418037687399801, 'samples': 6682368, 'steps': 34803, 'loss/train': 1.8315550088882446} -11/07/2021 02:08:37 - INFO - __main__ - Step 34805: {'lr': 0.0004418003650044391, 'samples': 6682560, 'steps': 34804, 'loss/train': 1.305469274520874} -11/07/2021 02:08:37 - INFO - __main__ - Step 34806: {'lr': 0.0004417969611824758, 'samples': 6682752, 'steps': 34805, 'loss/train': 1.107684850692749} -11/07/2021 02:08:38 - INFO - __main__ - Step 34807: {'lr': 0.00044179355727409173, 'samples': 6682944, 'steps': 34806, 'loss/train': 1.085576057434082} -11/07/2021 02:08:38 - INFO - __main__ - Step 34808: {'lr': 0.00044179015327928847, 'samples': 6683136, 'steps': 34807, 'loss/train': 1.496474266052246} -11/07/2021 02:08:38 - INFO - __main__ - Step 34809: {'lr': 0.0004417867491980675, 'samples': 6683328, 'steps': 34808, 'loss/train': 1.8663268089294434} -11/07/2021 02:08:40 - INFO - __main__ - Step 34810: {'lr': 0.0004417833450304304, 'samples': 6683520, 'steps': 34809, 'loss/train': 1.9572205543518066} -11/07/2021 02:08:40 - INFO - __main__ - Step 34811: {'lr': 0.0004417799407763786, 'samples': 6683712, 'steps': 34810, 'loss/train': 1.5946073532104492} -11/07/2021 02:08:40 - INFO - __main__ - Step 34812: {'lr': 0.00044177653643591387, 'samples': 6683904, 'steps': 34811, 'loss/train': 1.580494999885559} -11/07/2021 02:08:41 - INFO - __main__ - Step 34813: {'lr': 0.00044177313200903745, 'samples': 6684096, 'steps': 34812, 'loss/train': 0.7876717448234558} -11/07/2021 02:08:41 - INFO - __main__ - Step 34814: {'lr': 0.0004417697274957511, 'samples': 6684288, 'steps': 34813, 'loss/train': 1.619801640510559} -11/07/2021 02:08:42 - INFO - __main__ - Step 34815: {'lr': 0.0004417663228960562, 'samples': 6684480, 'steps': 34814, 'loss/train': 1.3058736324310303} -11/07/2021 02:08:42 - INFO - __main__ - Step 34816: {'lr': 0.0004417629182099545, 'samples': 6684672, 'steps': 34815, 'loss/train': 1.5034188032150269} -11/07/2021 02:08:43 - INFO - __main__ - Step 34817: {'lr': 0.00044175951343744725, 'samples': 6684864, 'steps': 34816, 'loss/train': 1.7466281652450562} -11/07/2021 02:08:43 - INFO - __main__ - Step 34818: {'lr': 0.0004417561085785362, 'samples': 6685056, 'steps': 34817, 'loss/train': 1.3654601573944092} -11/07/2021 02:08:43 - INFO - __main__ - Step 34819: {'lr': 0.0004417527036332227, 'samples': 6685248, 'steps': 34818, 'loss/train': 1.158371090888977} -11/07/2021 02:08:44 - INFO - __main__ - Step 34820: {'lr': 0.0004417492986015085, 'samples': 6685440, 'steps': 34819, 'loss/train': 1.3802626132965088} -11/07/2021 02:08:45 - INFO - __main__ - Step 34821: {'lr': 0.000441745893483395, 'samples': 6685632, 'steps': 34820, 'loss/train': 1.6779146194458008} -11/07/2021 02:08:45 - INFO - __main__ - Step 34822: {'lr': 0.00044174248827888376, 'samples': 6685824, 'steps': 34821, 'loss/train': 1.3448272943496704} -11/07/2021 02:08:45 - INFO - __main__ - Step 34823: {'lr': 0.00044173908298797627, 'samples': 6686016, 'steps': 34822, 'loss/train': 1.4924274682998657} -11/07/2021 02:08:46 - INFO - __main__ - Step 34824: {'lr': 0.0004417356776106741, 'samples': 6686208, 'steps': 34823, 'loss/train': 2.0932040214538574} -11/07/2021 02:08:47 - INFO - __main__ - Step 34825: {'lr': 0.00044173227214697885, 'samples': 6686400, 'steps': 34824, 'loss/train': 1.7518690824508667} -11/07/2021 02:08:47 - INFO - __main__ - Step 34826: {'lr': 0.000441728866596892, 'samples': 6686592, 'steps': 34825, 'loss/train': 1.52781343460083} -11/07/2021 02:08:48 - INFO - __main__ - Step 34827: {'lr': 0.00044172546096041504, 'samples': 6686784, 'steps': 34826, 'loss/train': 0.2420790195465088} -11/07/2021 02:08:48 - INFO - __main__ - Step 34828: {'lr': 0.0004417220552375496, 'samples': 6686976, 'steps': 34827, 'loss/train': 1.4486048221588135} -11/07/2021 02:08:48 - INFO - __main__ - Step 34829: {'lr': 0.00044171864942829707, 'samples': 6687168, 'steps': 34828, 'loss/train': 1.6413379907608032} -11/07/2021 02:08:49 - INFO - __main__ - Step 34830: {'lr': 0.0004417152435326591, 'samples': 6687360, 'steps': 34829, 'loss/train': 1.489789366722107} -11/07/2021 02:08:50 - INFO - __main__ - Step 34831: {'lr': 0.00044171183755063726, 'samples': 6687552, 'steps': 34830, 'loss/train': 1.3714736700057983} -11/07/2021 02:08:50 - INFO - __main__ - Step 34832: {'lr': 0.00044170843148223305, 'samples': 6687744, 'steps': 34831, 'loss/train': 1.9806476831436157} -11/07/2021 02:08:51 - INFO - __main__ - Step 34833: {'lr': 0.0004417050253274479, 'samples': 6687936, 'steps': 34832, 'loss/train': 1.3821278810501099} -11/07/2021 02:08:51 - INFO - __main__ - Step 34834: {'lr': 0.00044170161908628345, 'samples': 6688128, 'steps': 34833, 'loss/train': 1.7906062602996826} -11/07/2021 02:08:51 - INFO - __main__ - Step 34835: {'lr': 0.0004416982127587412, 'samples': 6688320, 'steps': 34834, 'loss/train': 1.3996402025222778} -11/07/2021 02:08:52 - INFO - __main__ - Step 34836: {'lr': 0.00044169480634482274, 'samples': 6688512, 'steps': 34835, 'loss/train': 1.677834391593933} -11/07/2021 02:08:53 - INFO - __main__ - Step 34837: {'lr': 0.0004416913998445294, 'samples': 6688704, 'steps': 34836, 'loss/train': 1.5204591751098633} -11/07/2021 02:08:53 - INFO - __main__ - Step 34838: {'lr': 0.000441687993257863, 'samples': 6688896, 'steps': 34837, 'loss/train': 1.1863371133804321} -11/07/2021 02:08:53 - INFO - __main__ - Step 34839: {'lr': 0.000441684586584825, 'samples': 6689088, 'steps': 34838, 'loss/train': 1.1081938743591309} -11/07/2021 02:08:54 - INFO - __main__ - Step 34840: {'lr': 0.0004416811798254168, 'samples': 6689280, 'steps': 34839, 'loss/train': 1.6745431423187256} -11/07/2021 02:08:55 - INFO - __main__ - Step 34841: {'lr': 0.00044167777297964006, 'samples': 6689472, 'steps': 34840, 'loss/train': 1.4791312217712402} -11/07/2021 02:08:55 - INFO - __main__ - Step 34842: {'lr': 0.0004416743660474962, 'samples': 6689664, 'steps': 34841, 'loss/train': 1.4962350130081177} -11/07/2021 02:08:55 - INFO - __main__ - Step 34843: {'lr': 0.0004416709590289869, 'samples': 6689856, 'steps': 34842, 'loss/train': 1.2518876791000366} -11/07/2021 02:08:56 - INFO - __main__ - Step 34844: {'lr': 0.00044166755192411364, 'samples': 6690048, 'steps': 34843, 'loss/train': 2.0981333255767822} -11/07/2021 02:08:56 - INFO - __main__ - Step 34845: {'lr': 0.00044166414473287784, 'samples': 6690240, 'steps': 34844, 'loss/train': 1.6097639799118042} -11/07/2021 02:08:57 - INFO - __main__ - Step 34846: {'lr': 0.0004416607374552812, 'samples': 6690432, 'steps': 34845, 'loss/train': 1.0811222791671753} -11/07/2021 02:08:58 - INFO - __main__ - Step 34847: {'lr': 0.00044165733009132524, 'samples': 6690624, 'steps': 34846, 'loss/train': 1.3376858234405518} -11/07/2021 02:08:58 - INFO - __main__ - Step 34848: {'lr': 0.00044165392264101136, 'samples': 6690816, 'steps': 34847, 'loss/train': 1.521743655204773} -11/07/2021 02:08:58 - INFO - __main__ - Step 34849: {'lr': 0.0004416505151043412, 'samples': 6691008, 'steps': 34848, 'loss/train': 1.796020269393921} -11/07/2021 02:08:59 - INFO - __main__ - Step 34850: {'lr': 0.0004416471074813163, 'samples': 6691200, 'steps': 34849, 'loss/train': 1.783268690109253} -11/07/2021 02:09:00 - INFO - __main__ - Step 34851: {'lr': 0.0004416436997719382, 'samples': 6691392, 'steps': 34850, 'loss/train': 1.8800702095031738} -11/07/2021 02:09:00 - INFO - __main__ - Step 34852: {'lr': 0.0004416402919762084, 'samples': 6691584, 'steps': 34851, 'loss/train': 1.96084463596344} -11/07/2021 02:09:00 - INFO - __main__ - Step 34853: {'lr': 0.00044163688409412833, 'samples': 6691776, 'steps': 34852, 'loss/train': 1.48081636428833} -11/07/2021 02:09:01 - INFO - __main__ - Step 34854: {'lr': 0.0004416334761256997, 'samples': 6691968, 'steps': 34853, 'loss/train': 1.1761119365692139} -11/07/2021 02:09:01 - INFO - __main__ - Step 34855: {'lr': 0.000441630068070924, 'samples': 6692160, 'steps': 34854, 'loss/train': 1.4678617715835571} -11/07/2021 02:09:01 - INFO - __main__ - Step 34856: {'lr': 0.0004416266599298028, 'samples': 6692352, 'steps': 34855, 'loss/train': 1.2836898565292358} -11/07/2021 02:09:03 - INFO - __main__ - Step 34857: {'lr': 0.00044162325170233745, 'samples': 6692544, 'steps': 34856, 'loss/train': 0.8834148645401001} -11/07/2021 02:09:03 - INFO - __main__ - Step 34858: {'lr': 0.00044161984338852967, 'samples': 6692736, 'steps': 34857, 'loss/train': 1.5354430675506592} -11/07/2021 02:09:03 - INFO - __main__ - Step 34859: {'lr': 0.000441616434988381, 'samples': 6692928, 'steps': 34858, 'loss/train': 1.648168921470642} -11/07/2021 02:09:04 - INFO - __main__ - Step 34860: {'lr': 0.00044161302650189295, 'samples': 6693120, 'steps': 34859, 'loss/train': 1.5468337535858154} -11/07/2021 02:09:04 - INFO - __main__ - Step 34861: {'lr': 0.00044160961792906694, 'samples': 6693312, 'steps': 34860, 'loss/train': 1.5955241918563843} -11/07/2021 02:09:05 - INFO - __main__ - Step 34862: {'lr': 0.00044160620926990456, 'samples': 6693504, 'steps': 34861, 'loss/train': 1.1796307563781738} -11/07/2021 02:09:05 - INFO - __main__ - Step 34863: {'lr': 0.0004416028005244075, 'samples': 6693696, 'steps': 34862, 'loss/train': 1.7557843923568726} -11/07/2021 02:09:06 - INFO - __main__ - Step 34864: {'lr': 0.0004415993916925771, 'samples': 6693888, 'steps': 34863, 'loss/train': 1.9630286693572998} -11/07/2021 02:09:06 - INFO - __main__ - Step 34865: {'lr': 0.000441595982774415, 'samples': 6694080, 'steps': 34864, 'loss/train': 1.3882853984832764} -11/07/2021 02:09:06 - INFO - __main__ - Step 34866: {'lr': 0.00044159257376992267, 'samples': 6694272, 'steps': 34865, 'loss/train': 1.6050423383712769} -11/07/2021 02:09:07 - INFO - __main__ - Step 34867: {'lr': 0.0004415891646791017, 'samples': 6694464, 'steps': 34866, 'loss/train': 1.2810680866241455} -11/07/2021 02:09:08 - INFO - __main__ - Step 34868: {'lr': 0.0004415857555019536, 'samples': 6694656, 'steps': 34867, 'loss/train': 1.513373851776123} -11/07/2021 02:09:08 - INFO - __main__ - Step 34869: {'lr': 0.00044158234623847993, 'samples': 6694848, 'steps': 34868, 'loss/train': 1.4827241897583008} -11/07/2021 02:09:08 - INFO - __main__ - Step 34870: {'lr': 0.00044157893688868223, 'samples': 6695040, 'steps': 34869, 'loss/train': 1.635990023612976} -11/07/2021 02:09:09 - INFO - __main__ - Step 34871: {'lr': 0.00044157552745256203, 'samples': 6695232, 'steps': 34870, 'loss/train': 0.9106978178024292} -11/07/2021 02:09:09 - INFO - __main__ - Step 34872: {'lr': 0.0004415721179301208, 'samples': 6695424, 'steps': 34871, 'loss/train': 1.7310855388641357} -11/07/2021 02:09:10 - INFO - __main__ - Step 34873: {'lr': 0.00044156870832136015, 'samples': 6695616, 'steps': 34872, 'loss/train': 1.2648017406463623} -11/07/2021 02:09:11 - INFO - __main__ - Step 34874: {'lr': 0.00044156529862628157, 'samples': 6695808, 'steps': 34873, 'loss/train': 1.3931591510772705} -11/07/2021 02:09:11 - INFO - __main__ - Step 34875: {'lr': 0.00044156188884488667, 'samples': 6696000, 'steps': 34874, 'loss/train': 1.921125054359436} -11/07/2021 02:09:11 - INFO - __main__ - Step 34876: {'lr': 0.0004415584789771769, 'samples': 6696192, 'steps': 34875, 'loss/train': 1.4276232719421387} -11/07/2021 02:09:12 - INFO - __main__ - Step 34877: {'lr': 0.0004415550690231539, 'samples': 6696384, 'steps': 34876, 'loss/train': 1.5939267873764038} -11/07/2021 02:09:13 - INFO - __main__ - Step 34878: {'lr': 0.0004415516589828191, 'samples': 6696576, 'steps': 34877, 'loss/train': 1.5690876245498657} -11/07/2021 02:09:13 - INFO - __main__ - Step 34879: {'lr': 0.00044154824885617405, 'samples': 6696768, 'steps': 34878, 'loss/train': 1.8448790311813354} -11/07/2021 02:09:13 - INFO - __main__ - Step 34880: {'lr': 0.0004415448386432204, 'samples': 6696960, 'steps': 34879, 'loss/train': 1.4996871948242188} -11/07/2021 02:09:14 - INFO - __main__ - Step 34881: {'lr': 0.00044154142834395947, 'samples': 6697152, 'steps': 34880, 'loss/train': 1.8461229801177979} -11/07/2021 02:09:14 - INFO - __main__ - Step 34882: {'lr': 0.00044153801795839296, 'samples': 6697344, 'steps': 34881, 'loss/train': 1.3578943014144897} -11/07/2021 02:09:15 - INFO - __main__ - Step 34883: {'lr': 0.00044153460748652245, 'samples': 6697536, 'steps': 34882, 'loss/train': 0.4732913076877594} -11/07/2021 02:09:15 - INFO - __main__ - Step 34884: {'lr': 0.00044153119692834944, 'samples': 6697728, 'steps': 34883, 'loss/train': 1.1813597679138184} -11/07/2021 02:09:16 - INFO - __main__ - Step 34885: {'lr': 0.0004415277862838753, 'samples': 6697920, 'steps': 34884, 'loss/train': 1.055881142616272} -11/07/2021 02:09:16 - INFO - __main__ - Step 34886: {'lr': 0.00044152437555310174, 'samples': 6698112, 'steps': 34885, 'loss/train': 1.097977638244629} -11/07/2021 02:09:17 - INFO - __main__ - Step 34887: {'lr': 0.00044152096473603025, 'samples': 6698304, 'steps': 34886, 'loss/train': 1.558925986289978} -11/07/2021 02:09:18 - INFO - __main__ - Step 34888: {'lr': 0.00044151755383266234, 'samples': 6698496, 'steps': 34887, 'loss/train': 1.0544556379318237} -11/07/2021 02:09:18 - INFO - __main__ - Step 34889: {'lr': 0.0004415141428429997, 'samples': 6698688, 'steps': 34888, 'loss/train': 1.5570998191833496} -11/07/2021 02:09:18 - INFO - __main__ - Step 34890: {'lr': 0.0004415107317670436, 'samples': 6698880, 'steps': 34889, 'loss/train': 1.7016712427139282} -11/07/2021 02:09:19 - INFO - __main__ - Step 34891: {'lr': 0.0004415073206047958, 'samples': 6699072, 'steps': 34890, 'loss/train': 1.6461631059646606} -11/07/2021 02:09:19 - INFO - __main__ - Step 34892: {'lr': 0.0004415039093562577, 'samples': 6699264, 'steps': 34891, 'loss/train': 1.7420457601547241} -11/07/2021 02:09:20 - INFO - __main__ - Step 34893: {'lr': 0.00044150049802143095, 'samples': 6699456, 'steps': 34892, 'loss/train': 1.101386547088623} -11/07/2021 02:09:20 - INFO - __main__ - Step 34894: {'lr': 0.00044149708660031704, 'samples': 6699648, 'steps': 34893, 'loss/train': 1.4222402572631836} -11/07/2021 02:09:21 - INFO - __main__ - Step 34895: {'lr': 0.0004414936750929174, 'samples': 6699840, 'steps': 34894, 'loss/train': 1.5587239265441895} -11/07/2021 02:09:21 - INFO - __main__ - Step 34896: {'lr': 0.0004414902634992338, 'samples': 6700032, 'steps': 34895, 'loss/train': 1.662794589996338} -11/07/2021 02:09:21 - INFO - __main__ - Step 34897: {'lr': 0.0004414868518192675, 'samples': 6700224, 'steps': 34896, 'loss/train': 1.5693986415863037} -11/07/2021 02:09:22 - INFO - __main__ - Step 34898: {'lr': 0.0004414834400530203, 'samples': 6700416, 'steps': 34897, 'loss/train': 1.4663927555084229} -11/07/2021 02:09:23 - INFO - __main__ - Step 34899: {'lr': 0.00044148002820049354, 'samples': 6700608, 'steps': 34898, 'loss/train': 1.5058009624481201} -11/07/2021 02:09:23 - INFO - __main__ - Step 34900: {'lr': 0.00044147661626168887, 'samples': 6700800, 'steps': 34899, 'loss/train': 1.8423506021499634} -11/07/2021 02:09:24 - INFO - __main__ - Step 34901: {'lr': 0.0004414732042366078, 'samples': 6700992, 'steps': 34900, 'loss/train': 1.5679491758346558} -11/07/2021 02:09:24 - INFO - __main__ - Step 34902: {'lr': 0.00044146979212525184, 'samples': 6701184, 'steps': 34901, 'loss/train': 1.720201015472412} -11/07/2021 02:09:25 - INFO - __main__ - Step 34903: {'lr': 0.0004414663799276225, 'samples': 6701376, 'steps': 34902, 'loss/train': 1.7476109266281128} -11/07/2021 02:09:25 - INFO - __main__ - Step 34904: {'lr': 0.0004414629676437214, 'samples': 6701568, 'steps': 34903, 'loss/train': 1.56584632396698} -11/07/2021 02:09:26 - INFO - __main__ - Step 34905: {'lr': 0.00044145955527355007, 'samples': 6701760, 'steps': 34904, 'loss/train': 1.7871931791305542} -11/07/2021 02:09:26 - INFO - __main__ - Step 34906: {'lr': 0.00044145614281711, 'samples': 6701952, 'steps': 34905, 'loss/train': 1.3921641111373901} -11/07/2021 02:09:26 - INFO - __main__ - Step 34907: {'lr': 0.00044145273027440275, 'samples': 6702144, 'steps': 34906, 'loss/train': 0.9424101710319519} -11/07/2021 02:09:27 - INFO - __main__ - Step 34908: {'lr': 0.0004414493176454298, 'samples': 6702336, 'steps': 34907, 'loss/train': 1.542037844657898} -11/07/2021 02:09:28 - INFO - __main__ - Step 34909: {'lr': 0.0004414459049301929, 'samples': 6702528, 'steps': 34908, 'loss/train': 2.1305997371673584} -11/07/2021 02:09:28 - INFO - __main__ - Step 34910: {'lr': 0.00044144249212869327, 'samples': 6702720, 'steps': 34909, 'loss/train': 1.6564462184906006} -11/07/2021 02:09:28 - INFO - __main__ - Step 34911: {'lr': 0.0004414390792409326, 'samples': 6702912, 'steps': 34910, 'loss/train': 1.1971884965896606} -11/07/2021 02:09:29 - INFO - __main__ - Step 34912: {'lr': 0.0004414356662669126, 'samples': 6703104, 'steps': 34911, 'loss/train': 1.6676355600357056} -11/07/2021 02:09:29 - INFO - __main__ - Step 34913: {'lr': 0.0004414322532066345, 'samples': 6703296, 'steps': 34912, 'loss/train': 1.4663547277450562} -11/07/2021 02:09:30 - INFO - __main__ - Step 34914: {'lr': 0.0004414288400601, 'samples': 6703488, 'steps': 34913, 'loss/train': 1.660070538520813} -11/07/2021 02:09:30 - INFO - __main__ - Step 34915: {'lr': 0.0004414254268273107, 'samples': 6703680, 'steps': 34914, 'loss/train': 1.2348486185073853} -11/07/2021 02:09:31 - INFO - __main__ - Step 34916: {'lr': 0.0004414220135082679, 'samples': 6703872, 'steps': 34915, 'loss/train': 1.82661771774292} -11/07/2021 02:09:31 - INFO - __main__ - Step 34917: {'lr': 0.0004414186001029734, 'samples': 6704064, 'steps': 34916, 'loss/train': 0.8421643376350403} -11/07/2021 02:09:32 - INFO - __main__ - Step 34918: {'lr': 0.00044141518661142864, 'samples': 6704256, 'steps': 34917, 'loss/train': 1.6239686012268066} -11/07/2021 02:09:32 - INFO - __main__ - Step 34919: {'lr': 0.0004414117730336351, 'samples': 6704448, 'steps': 34918, 'loss/train': 1.4219346046447754} -11/07/2021 02:09:33 - INFO - __main__ - Step 34920: {'lr': 0.0004414083593695944, 'samples': 6704640, 'steps': 34919, 'loss/train': 1.5815865993499756} -11/07/2021 02:09:33 - INFO - __main__ - Step 34921: {'lr': 0.0004414049456193081, 'samples': 6704832, 'steps': 34920, 'loss/train': 1.4162994623184204} -11/07/2021 02:09:34 - INFO - __main__ - Step 34922: {'lr': 0.00044140153178277765, 'samples': 6705024, 'steps': 34921, 'loss/train': 1.4170336723327637} -11/07/2021 02:09:34 - INFO - __main__ - Step 34923: {'lr': 0.0004413981178600046, 'samples': 6705216, 'steps': 34922, 'loss/train': 1.5527942180633545} -11/07/2021 02:09:34 - INFO - __main__ - Step 34924: {'lr': 0.00044139470385099047, 'samples': 6705408, 'steps': 34923, 'loss/train': 1.1438456773757935} -11/07/2021 02:09:35 - INFO - __main__ - Step 34925: {'lr': 0.0004413912897557369, 'samples': 6705600, 'steps': 34924, 'loss/train': 1.6169018745422363} -11/07/2021 02:09:36 - INFO - __main__ - Step 34926: {'lr': 0.0004413878755742454, 'samples': 6705792, 'steps': 34925, 'loss/train': 1.356520414352417} -11/07/2021 02:09:36 - INFO - __main__ - Step 34927: {'lr': 0.00044138446130651736, 'samples': 6705984, 'steps': 34926, 'loss/train': 1.3168401718139648} -11/07/2021 02:09:36 - INFO - __main__ - Step 34928: {'lr': 0.00044138104695255455, 'samples': 6706176, 'steps': 34927, 'loss/train': 1.990412712097168} -11/07/2021 02:09:37 - INFO - __main__ - Step 34929: {'lr': 0.00044137763251235837, 'samples': 6706368, 'steps': 34928, 'loss/train': 1.5698679685592651} -11/07/2021 02:09:38 - INFO - __main__ - Step 34930: {'lr': 0.0004413742179859304, 'samples': 6706560, 'steps': 34929, 'loss/train': 1.8614038228988647} -11/07/2021 02:09:38 - INFO - __main__ - Step 34931: {'lr': 0.00044137080337327205, 'samples': 6706752, 'steps': 34930, 'loss/train': 1.3010913133621216} -11/07/2021 02:09:39 - INFO - __main__ - Step 34932: {'lr': 0.000441367388674385, 'samples': 6706944, 'steps': 34931, 'loss/train': 1.3092995882034302} -11/07/2021 02:09:39 - INFO - __main__ - Step 34933: {'lr': 0.00044136397388927083, 'samples': 6707136, 'steps': 34932, 'loss/train': 2.328650951385498} -11/07/2021 02:09:39 - INFO - __main__ - Step 34934: {'lr': 0.000441360559017931, 'samples': 6707328, 'steps': 34933, 'loss/train': 1.8487857580184937} -11/07/2021 02:09:40 - INFO - __main__ - Step 34935: {'lr': 0.00044135714406036696, 'samples': 6707520, 'steps': 34934, 'loss/train': 1.416915774345398} -11/07/2021 02:09:41 - INFO - __main__ - Step 34936: {'lr': 0.00044135372901658046, 'samples': 6707712, 'steps': 34935, 'loss/train': 1.6198914051055908} -11/07/2021 02:09:41 - INFO - __main__ - Step 34937: {'lr': 0.0004413503138865729, 'samples': 6707904, 'steps': 34936, 'loss/train': 1.4788812398910522} -11/07/2021 02:09:41 - INFO - __main__ - Step 34938: {'lr': 0.00044134689867034583, 'samples': 6708096, 'steps': 34937, 'loss/train': 1.63387131690979} -11/07/2021 02:09:42 - INFO - __main__ - Step 34939: {'lr': 0.00044134348336790074, 'samples': 6708288, 'steps': 34938, 'loss/train': 1.6570875644683838} -11/07/2021 02:09:43 - INFO - __main__ - Step 34940: {'lr': 0.0004413400679792393, 'samples': 6708480, 'steps': 34939, 'loss/train': 1.1660223007202148} -11/07/2021 02:09:43 - INFO - __main__ - Step 34941: {'lr': 0.00044133665250436295, 'samples': 6708672, 'steps': 34940, 'loss/train': 1.474959135055542} -11/07/2021 02:09:44 - INFO - __main__ - Step 34942: {'lr': 0.00044133323694327324, 'samples': 6708864, 'steps': 34941, 'loss/train': 1.4280176162719727} -11/07/2021 02:09:44 - INFO - __main__ - Step 34943: {'lr': 0.0004413298212959718, 'samples': 6709056, 'steps': 34942, 'loss/train': 1.8201326131820679} -11/07/2021 02:09:44 - INFO - __main__ - Step 34944: {'lr': 0.00044132640556246, 'samples': 6709248, 'steps': 34943, 'loss/train': 1.5002176761627197} -11/07/2021 02:09:45 - INFO - __main__ - Step 34945: {'lr': 0.00044132298974273955, 'samples': 6709440, 'steps': 34944, 'loss/train': 1.5995829105377197} -11/07/2021 02:09:46 - INFO - __main__ - Step 34946: {'lr': 0.00044131957383681186, 'samples': 6709632, 'steps': 34945, 'loss/train': 1.2983976602554321} -11/07/2021 02:09:46 - INFO - __main__ - Step 34947: {'lr': 0.0004413161578446785, 'samples': 6709824, 'steps': 34946, 'loss/train': 1.9769909381866455} -11/07/2021 02:09:46 - INFO - __main__ - Step 34948: {'lr': 0.00044131274176634113, 'samples': 6710016, 'steps': 34947, 'loss/train': 1.4638006687164307} -11/07/2021 02:09:47 - INFO - __main__ - Step 34949: {'lr': 0.00044130932560180114, 'samples': 6710208, 'steps': 34948, 'loss/train': 1.0998560190200806} -11/07/2021 02:09:48 - INFO - __main__ - Step 34950: {'lr': 0.0004413059093510601, 'samples': 6710400, 'steps': 34949, 'loss/train': 1.550802230834961} -11/07/2021 02:09:48 - INFO - __main__ - Step 34951: {'lr': 0.00044130249301411957, 'samples': 6710592, 'steps': 34950, 'loss/train': 1.3702425956726074} -11/07/2021 02:09:48 - INFO - __main__ - Step 34952: {'lr': 0.0004412990765909811, 'samples': 6710784, 'steps': 34951, 'loss/train': 1.2934271097183228} -11/07/2021 02:09:49 - INFO - __main__ - Step 34953: {'lr': 0.0004412956600816462, 'samples': 6710976, 'steps': 34952, 'loss/train': 1.6466397047042847} -11/07/2021 02:09:49 - INFO - __main__ - Step 34954: {'lr': 0.00044129224348611644, 'samples': 6711168, 'steps': 34953, 'loss/train': 1.0837256908416748} -11/07/2021 02:09:49 - INFO - __main__ - Step 34955: {'lr': 0.0004412888268043934, 'samples': 6711360, 'steps': 34954, 'loss/train': 1.3979381322860718} -11/07/2021 02:09:50 - INFO - __main__ - Step 34956: {'lr': 0.0004412854100364785, 'samples': 6711552, 'steps': 34955, 'loss/train': 1.2368285655975342} -11/07/2021 02:09:51 - INFO - __main__ - Step 34957: {'lr': 0.0004412819931823734, 'samples': 6711744, 'steps': 34956, 'loss/train': 1.5563851594924927} -11/07/2021 02:09:51 - INFO - __main__ - Step 34958: {'lr': 0.0004412785762420795, 'samples': 6711936, 'steps': 34957, 'loss/train': 1.4423242807388306} -11/07/2021 02:09:51 - INFO - __main__ - Step 34959: {'lr': 0.0004412751592155985, 'samples': 6712128, 'steps': 34958, 'loss/train': 1.4660046100616455} -11/07/2021 02:09:52 - INFO - __main__ - Step 34960: {'lr': 0.00044127174210293186, 'samples': 6712320, 'steps': 34959, 'loss/train': 1.6709436178207397} -11/07/2021 02:09:53 - INFO - __main__ - Step 34961: {'lr': 0.0004412683249040811, 'samples': 6712512, 'steps': 34960, 'loss/train': 5.549959182739258} -11/07/2021 02:09:53 - INFO - __main__ - Step 34962: {'lr': 0.0004412649076190478, 'samples': 6712704, 'steps': 34961, 'loss/train': 1.7965469360351562} -11/07/2021 02:09:54 - INFO - __main__ - Step 34963: {'lr': 0.00044126149024783346, 'samples': 6712896, 'steps': 34962, 'loss/train': 1.778951644897461} -11/07/2021 02:09:54 - INFO - __main__ - Step 34964: {'lr': 0.0004412580727904396, 'samples': 6713088, 'steps': 34963, 'loss/train': 1.7027897834777832} -11/07/2021 02:09:54 - INFO - __main__ - Step 34965: {'lr': 0.0004412546552468679, 'samples': 6713280, 'steps': 34964, 'loss/train': 1.5230058431625366} -11/07/2021 02:09:55 - INFO - __main__ - Step 34966: {'lr': 0.00044125123761711975, 'samples': 6713472, 'steps': 34965, 'loss/train': 1.532887578010559} -11/07/2021 02:09:56 - INFO - __main__ - Step 34967: {'lr': 0.00044124781990119677, 'samples': 6713664, 'steps': 34966, 'loss/train': 1.342242956161499} -11/07/2021 02:09:56 - INFO - __main__ - Step 34968: {'lr': 0.0004412444020991004, 'samples': 6713856, 'steps': 34967, 'loss/train': 1.6180024147033691} -11/07/2021 02:09:56 - INFO - __main__ - Step 34969: {'lr': 0.0004412409842108324, 'samples': 6714048, 'steps': 34968, 'loss/train': 1.4326096773147583} -11/07/2021 02:09:57 - INFO - __main__ - Step 34970: {'lr': 0.0004412375662363941, 'samples': 6714240, 'steps': 34969, 'loss/train': 1.4714924097061157} -11/07/2021 02:09:57 - INFO - __main__ - Step 34971: {'lr': 0.00044123414817578705, 'samples': 6714432, 'steps': 34970, 'loss/train': 1.4865937232971191} -11/07/2021 02:09:58 - INFO - __main__ - Step 34972: {'lr': 0.00044123073002901286, 'samples': 6714624, 'steps': 34971, 'loss/train': 0.8073616027832031} -11/07/2021 02:09:58 - INFO - __main__ - Step 34973: {'lr': 0.0004412273117960731, 'samples': 6714816, 'steps': 34972, 'loss/train': 1.7737014293670654} -11/07/2021 02:09:59 - INFO - __main__ - Step 34974: {'lr': 0.00044122389347696925, 'samples': 6715008, 'steps': 34973, 'loss/train': 2.0137529373168945} -11/07/2021 02:09:59 - INFO - __main__ - Step 34975: {'lr': 0.0004412204750717028, 'samples': 6715200, 'steps': 34974, 'loss/train': 0.3884543478488922} -11/07/2021 02:10:00 - INFO - __main__ - Step 34976: {'lr': 0.00044121705658027545, 'samples': 6715392, 'steps': 34975, 'loss/train': 1.497333288192749} -11/07/2021 02:10:01 - INFO - __main__ - Step 34977: {'lr': 0.00044121363800268853, 'samples': 6715584, 'steps': 34976, 'loss/train': 1.0845884084701538} -11/07/2021 02:10:01 - INFO - __main__ - Step 34978: {'lr': 0.0004412102193389438, 'samples': 6715776, 'steps': 34977, 'loss/train': 1.5789704322814941} -11/07/2021 02:10:01 - INFO - __main__ - Step 34979: {'lr': 0.0004412068005890427, 'samples': 6715968, 'steps': 34978, 'loss/train': 1.7439966201782227} -11/07/2021 02:10:02 - INFO - __main__ - Step 34980: {'lr': 0.0004412033817529867, 'samples': 6716160, 'steps': 34979, 'loss/train': 1.5079094171524048} -11/07/2021 02:10:02 - INFO - __main__ - Step 34981: {'lr': 0.0004411999628307775, 'samples': 6716352, 'steps': 34980, 'loss/train': 1.6859904527664185} -11/07/2021 02:10:03 - INFO - __main__ - Step 34982: {'lr': 0.0004411965438224164, 'samples': 6716544, 'steps': 34981, 'loss/train': 1.6609724760055542} -11/07/2021 02:10:03 - INFO - __main__ - Step 34983: {'lr': 0.0004411931247279052, 'samples': 6716736, 'steps': 34982, 'loss/train': 1.7958378791809082} -11/07/2021 02:10:04 - INFO - __main__ - Step 34984: {'lr': 0.00044118970554724523, 'samples': 6716928, 'steps': 34983, 'loss/train': 1.3812191486358643} -11/07/2021 02:10:04 - INFO - __main__ - Step 34985: {'lr': 0.0004411862862804382, 'samples': 6717120, 'steps': 34984, 'loss/train': 1.4085384607315063} -11/07/2021 02:10:04 - INFO - __main__ - Step 34986: {'lr': 0.0004411828669274856, 'samples': 6717312, 'steps': 34985, 'loss/train': 1.5094749927520752} -11/07/2021 02:10:05 - INFO - __main__ - Step 34987: {'lr': 0.0004411794474883889, 'samples': 6717504, 'steps': 34986, 'loss/train': 1.621686577796936} -11/07/2021 02:10:06 - INFO - __main__ - Step 34988: {'lr': 0.0004411760279631497, 'samples': 6717696, 'steps': 34987, 'loss/train': 1.5280160903930664} -11/07/2021 02:10:06 - INFO - __main__ - Step 34989: {'lr': 0.0004411726083517696, 'samples': 6717888, 'steps': 34988, 'loss/train': 1.2565999031066895} -11/07/2021 02:10:06 - INFO - __main__ - Step 34990: {'lr': 0.00044116918865425004, 'samples': 6718080, 'steps': 34989, 'loss/train': 1.393542766571045} -11/07/2021 02:10:07 - INFO - __main__ - Step 34991: {'lr': 0.00044116576887059255, 'samples': 6718272, 'steps': 34990, 'loss/train': 1.5766887664794922} -11/07/2021 02:10:07 - INFO - __main__ - Step 34992: {'lr': 0.0004411623490007988, 'samples': 6718464, 'steps': 34991, 'loss/train': 1.8799902200698853} -11/07/2021 02:10:08 - INFO - __main__ - Step 34993: {'lr': 0.0004411589290448701, 'samples': 6718656, 'steps': 34992, 'loss/train': 1.3170068264007568} -11/07/2021 02:10:09 - INFO - __main__ - Step 34994: {'lr': 0.0004411555090028082, 'samples': 6718848, 'steps': 34993, 'loss/train': 1.787194848060608} -11/07/2021 02:10:09 - INFO - __main__ - Step 34995: {'lr': 0.00044115208887461464, 'samples': 6719040, 'steps': 34994, 'loss/train': 1.9786200523376465} -11/07/2021 02:10:09 - INFO - __main__ - Step 34996: {'lr': 0.00044114866866029086, 'samples': 6719232, 'steps': 34995, 'loss/train': 1.6246813535690308} -11/07/2021 02:10:10 - INFO - __main__ - Step 34997: {'lr': 0.00044114524835983844, 'samples': 6719424, 'steps': 34996, 'loss/train': 1.6504180431365967} -11/07/2021 02:10:11 - INFO - __main__ - Step 34998: {'lr': 0.00044114182797325884, 'samples': 6719616, 'steps': 34997, 'loss/train': 1.5485693216323853} -11/07/2021 02:10:11 - INFO - __main__ - Step 34999: {'lr': 0.0004411384075005538, 'samples': 6719808, 'steps': 34998, 'loss/train': 1.5711191892623901} -11/07/2021 02:10:11 - INFO - __main__ - Step 35000: {'lr': 0.0004411349869417247, 'samples': 6720000, 'steps': 34999, 'loss/train': 1.5556280612945557} -11/07/2021 02:10:12 - INFO - __main__ - Step 35001: {'lr': 0.00044113156629677313, 'samples': 6720192, 'steps': 35000, 'loss/train': 1.2026489973068237} -11/07/2021 02:10:12 - INFO - __main__ - Step 35002: {'lr': 0.00044112814556570066, 'samples': 6720384, 'steps': 35001, 'loss/train': 1.5875060558319092} -11/07/2021 02:10:13 - INFO - __main__ - Step 35003: {'lr': 0.00044112472474850875, 'samples': 6720576, 'steps': 35002, 'loss/train': 1.0374408960342407} -11/07/2021 02:10:14 - INFO - __main__ - Step 35004: {'lr': 0.000441121303845199, 'samples': 6720768, 'steps': 35003, 'loss/train': 1.64098060131073} -11/07/2021 02:10:14 - INFO - __main__ - Step 35005: {'lr': 0.0004411178828557729, 'samples': 6720960, 'steps': 35004, 'loss/train': 1.4752988815307617} -11/07/2021 02:10:14 - INFO - __main__ - Step 35006: {'lr': 0.00044111446178023205, 'samples': 6721152, 'steps': 35005, 'loss/train': 1.3469408750534058} -11/07/2021 02:10:15 - INFO - __main__ - Step 35007: {'lr': 0.000441111040618578, 'samples': 6721344, 'steps': 35006, 'loss/train': 1.4651458263397217} -11/07/2021 02:10:16 - INFO - __main__ - Step 35008: {'lr': 0.0004411076193708122, 'samples': 6721536, 'steps': 35007, 'loss/train': 1.4971396923065186} -11/07/2021 02:10:16 - INFO - __main__ - Step 35009: {'lr': 0.00044110419803693635, 'samples': 6721728, 'steps': 35008, 'loss/train': 0.8315962553024292} -11/07/2021 02:10:16 - INFO - __main__ - Step 35010: {'lr': 0.00044110077661695194, 'samples': 6721920, 'steps': 35009, 'loss/train': 1.402260661125183} -11/07/2021 02:10:17 - INFO - __main__ - Step 35011: {'lr': 0.00044109735511086036, 'samples': 6722112, 'steps': 35010, 'loss/train': 1.282967448234558} -11/07/2021 02:10:17 - INFO - __main__ - Step 35012: {'lr': 0.00044109393351866324, 'samples': 6722304, 'steps': 35011, 'loss/train': 1.2022982835769653} -11/07/2021 02:10:18 - INFO - __main__ - Step 35013: {'lr': 0.0004410905118403622, 'samples': 6722496, 'steps': 35012, 'loss/train': 1.6865010261535645} -11/07/2021 02:10:18 - INFO - __main__ - Step 35014: {'lr': 0.0004410870900759587, 'samples': 6722688, 'steps': 35013, 'loss/train': 1.4623432159423828} -11/07/2021 02:10:19 - INFO - __main__ - Step 35015: {'lr': 0.0004410836682254543, 'samples': 6722880, 'steps': 35014, 'loss/train': 0.9109211564064026} -11/07/2021 02:10:19 - INFO - __main__ - Step 35016: {'lr': 0.0004410802462888506, 'samples': 6723072, 'steps': 35015, 'loss/train': 0.7895492911338806} -11/07/2021 02:10:19 - INFO - __main__ - Step 35017: {'lr': 0.00044107682426614903, 'samples': 6723264, 'steps': 35016, 'loss/train': 1.300127387046814} -11/07/2021 02:10:20 - INFO - __main__ - Step 35018: {'lr': 0.00044107340215735125, 'samples': 6723456, 'steps': 35017, 'loss/train': 1.3238352537155151} -11/07/2021 02:10:21 - INFO - __main__ - Step 35019: {'lr': 0.00044106997996245866, 'samples': 6723648, 'steps': 35018, 'loss/train': 2.105529546737671} -11/07/2021 02:10:21 - INFO - __main__ - Step 35020: {'lr': 0.000441066557681473, 'samples': 6723840, 'steps': 35019, 'loss/train': 1.2819880247116089} -11/07/2021 02:10:22 - INFO - __main__ - Step 35021: {'lr': 0.00044106313531439565, 'samples': 6724032, 'steps': 35020, 'loss/train': 1.5403814315795898} -11/07/2021 02:10:22 - INFO - __main__ - Step 35022: {'lr': 0.00044105971286122816, 'samples': 6724224, 'steps': 35021, 'loss/train': 1.7440218925476074} -11/07/2021 02:10:22 - INFO - __main__ - Step 35023: {'lr': 0.00044105629032197214, 'samples': 6724416, 'steps': 35022, 'loss/train': 1.8121604919433594} -11/07/2021 02:10:23 - INFO - __main__ - Step 35024: {'lr': 0.0004410528676966291, 'samples': 6724608, 'steps': 35023, 'loss/train': 1.0739877223968506} -11/07/2021 02:10:24 - INFO - __main__ - Step 35025: {'lr': 0.00044104944498520054, 'samples': 6724800, 'steps': 35024, 'loss/train': 1.7789803743362427} -11/07/2021 02:10:24 - INFO - __main__ - Step 35026: {'lr': 0.00044104602218768805, 'samples': 6724992, 'steps': 35025, 'loss/train': 1.231187105178833} -11/07/2021 02:10:24 - INFO - __main__ - Step 35027: {'lr': 0.0004410425993040933, 'samples': 6725184, 'steps': 35026, 'loss/train': 1.0795031785964966} -11/07/2021 02:10:25 - INFO - __main__ - Step 35028: {'lr': 0.0004410391763344176, 'samples': 6725376, 'steps': 35027, 'loss/train': 1.4300146102905273} -11/07/2021 02:10:26 - INFO - __main__ - Step 35029: {'lr': 0.00044103575327866264, 'samples': 6725568, 'steps': 35028, 'loss/train': 1.447784185409546} -11/07/2021 02:10:26 - INFO - __main__ - Step 35030: {'lr': 0.0004410323301368299, 'samples': 6725760, 'steps': 35029, 'loss/train': 1.640128254890442} -11/07/2021 02:10:26 - INFO - __main__ - Step 35031: {'lr': 0.0004410289069089209, 'samples': 6725952, 'steps': 35030, 'loss/train': 1.679473638534546} -11/07/2021 02:10:27 - INFO - __main__ - Step 35032: {'lr': 0.0004410254835949372, 'samples': 6726144, 'steps': 35031, 'loss/train': 2.850522041320801} -11/07/2021 02:10:27 - INFO - __main__ - Step 35033: {'lr': 0.00044102206019488045, 'samples': 6726336, 'steps': 35032, 'loss/train': 1.5364875793457031} -11/07/2021 02:10:28 - INFO - __main__ - Step 35034: {'lr': 0.00044101863670875207, 'samples': 6726528, 'steps': 35033, 'loss/train': 1.8543156385421753} -11/07/2021 02:10:28 - INFO - __main__ - Step 35035: {'lr': 0.0004410152131365536, 'samples': 6726720, 'steps': 35034, 'loss/train': 1.3566513061523438} -11/07/2021 02:10:29 - INFO - __main__ - Step 35036: {'lr': 0.00044101178947828667, 'samples': 6726912, 'steps': 35035, 'loss/train': 1.6695739030838013} -11/07/2021 02:10:29 - INFO - __main__ - Step 35037: {'lr': 0.0004410083657339528, 'samples': 6727104, 'steps': 35036, 'loss/train': 1.3210400342941284} -11/07/2021 02:10:30 - INFO - __main__ - Step 35038: {'lr': 0.00044100494190355347, 'samples': 6727296, 'steps': 35037, 'loss/train': 1.3826854228973389} -11/07/2021 02:10:30 - INFO - __main__ - Step 35039: {'lr': 0.0004410015179870903, 'samples': 6727488, 'steps': 35038, 'loss/train': 1.1722732782363892} -11/07/2021 02:10:31 - INFO - __main__ - Step 35040: {'lr': 0.0004409980939845647, 'samples': 6727680, 'steps': 35039, 'loss/train': 1.5157371759414673} -11/07/2021 02:10:31 - INFO - __main__ - Step 35041: {'lr': 0.00044099466989597837, 'samples': 6727872, 'steps': 35040, 'loss/train': 0.8572977781295776} -11/07/2021 02:10:32 - INFO - __main__ - Step 35042: {'lr': 0.00044099124572133283, 'samples': 6728064, 'steps': 35041, 'loss/train': 1.6489825248718262} -11/07/2021 02:10:32 - INFO - __main__ - Step 35043: {'lr': 0.00044098782146062955, 'samples': 6728256, 'steps': 35042, 'loss/train': 1.5331951379776} -11/07/2021 02:10:33 - INFO - __main__ - Step 35044: {'lr': 0.00044098439711387006, 'samples': 6728448, 'steps': 35043, 'loss/train': 2.036832332611084} -11/07/2021 02:10:33 - INFO - __main__ - Step 35045: {'lr': 0.000440980972681056, 'samples': 6728640, 'steps': 35044, 'loss/train': 1.3515995740890503} -11/07/2021 02:10:34 - INFO - __main__ - Step 35046: {'lr': 0.0004409775481621888, 'samples': 6728832, 'steps': 35045, 'loss/train': 1.6868525743484497} -11/07/2021 02:10:34 - INFO - __main__ - Step 35047: {'lr': 0.0004409741235572701, 'samples': 6729024, 'steps': 35046, 'loss/train': 1.4944453239440918} -11/07/2021 02:10:34 - INFO - __main__ - Step 35048: {'lr': 0.0004409706988663015, 'samples': 6729216, 'steps': 35047, 'loss/train': 1.173051357269287} -11/07/2021 02:10:35 - INFO - __main__ - Step 35049: {'lr': 0.00044096727408928426, 'samples': 6729408, 'steps': 35048, 'loss/train': 0.7876967787742615} -11/07/2021 02:10:36 - INFO - __main__ - Step 35050: {'lr': 0.0004409638492262202, 'samples': 6729600, 'steps': 35049, 'loss/train': 1.5770975351333618} -11/07/2021 02:10:36 - INFO - __main__ - Step 35051: {'lr': 0.0004409604242771108, 'samples': 6729792, 'steps': 35050, 'loss/train': 1.332051157951355} -11/07/2021 02:10:36 - INFO - __main__ - Step 35052: {'lr': 0.0004409569992419576, 'samples': 6729984, 'steps': 35051, 'loss/train': 1.4920984506607056} -11/07/2021 02:10:37 - INFO - __main__ - Step 35053: {'lr': 0.0004409535741207621, 'samples': 6730176, 'steps': 35052, 'loss/train': 1.529261589050293} -11/07/2021 02:10:37 - INFO - __main__ - Step 35054: {'lr': 0.00044095014891352584, 'samples': 6730368, 'steps': 35053, 'loss/train': 1.5102005004882812} -11/07/2021 02:10:38 - INFO - __main__ - Step 35055: {'lr': 0.0004409467236202505, 'samples': 6730560, 'steps': 35054, 'loss/train': 1.2564643621444702} -11/07/2021 02:10:38 - INFO - __main__ - Step 35056: {'lr': 0.0004409432982409374, 'samples': 6730752, 'steps': 35055, 'loss/train': 1.3979930877685547} -11/07/2021 02:10:39 - INFO - __main__ - Step 35057: {'lr': 0.0004409398727755882, 'samples': 6730944, 'steps': 35056, 'loss/train': 1.7569228410720825} -11/07/2021 02:10:39 - INFO - __main__ - Step 35058: {'lr': 0.00044093644722420445, 'samples': 6731136, 'steps': 35057, 'loss/train': 1.5639421939849854} -11/07/2021 02:10:40 - INFO - __main__ - Step 35059: {'lr': 0.00044093302158678766, 'samples': 6731328, 'steps': 35058, 'loss/train': 1.4638268947601318} -11/07/2021 02:10:41 - INFO - __main__ - Step 35060: {'lr': 0.0004409295958633394, 'samples': 6731520, 'steps': 35059, 'loss/train': 1.401228427886963} -11/07/2021 02:10:41 - INFO - __main__ - Step 35061: {'lr': 0.00044092617005386125, 'samples': 6731712, 'steps': 35060, 'loss/train': 1.2886829376220703} -11/07/2021 02:10:41 - INFO - __main__ - Step 35062: {'lr': 0.00044092274415835473, 'samples': 6731904, 'steps': 35061, 'loss/train': 1.3746353387832642} -11/07/2021 02:10:42 - INFO - __main__ - Step 35063: {'lr': 0.0004409193181768213, 'samples': 6732096, 'steps': 35062, 'loss/train': 1.3529815673828125} -11/07/2021 02:10:42 - INFO - __main__ - Step 35064: {'lr': 0.00044091589210926266, 'samples': 6732288, 'steps': 35063, 'loss/train': 1.3183367252349854} -11/07/2021 02:10:43 - INFO - __main__ - Step 35065: {'lr': 0.00044091246595568025, 'samples': 6732480, 'steps': 35064, 'loss/train': 1.1994445323944092} -11/07/2021 02:10:43 - INFO - __main__ - Step 35066: {'lr': 0.00044090903971607555, 'samples': 6732672, 'steps': 35065, 'loss/train': 1.7616498470306396} -11/07/2021 02:10:44 - INFO - __main__ - Step 35067: {'lr': 0.0004409056133904502, 'samples': 6732864, 'steps': 35066, 'loss/train': 1.6132047176361084} -11/07/2021 02:10:44 - INFO - __main__ - Step 35068: {'lr': 0.00044090218697880577, 'samples': 6733056, 'steps': 35067, 'loss/train': 1.7040773630142212} -11/07/2021 02:10:44 - INFO - __main__ - Step 35069: {'lr': 0.0004408987604811437, 'samples': 6733248, 'steps': 35068, 'loss/train': 1.5884809494018555} -11/07/2021 02:10:46 - INFO - __main__ - Step 35070: {'lr': 0.00044089533389746573, 'samples': 6733440, 'steps': 35069, 'loss/train': 1.5156008005142212} -11/07/2021 02:10:46 - INFO - __main__ - Step 35071: {'lr': 0.00044089190722777316, 'samples': 6733632, 'steps': 35070, 'loss/train': 0.1750890463590622} -11/07/2021 02:10:47 - INFO - __main__ - Step 35072: {'lr': 0.00044088848047206763, 'samples': 6733824, 'steps': 35071, 'loss/train': 1.5426185131072998} -11/07/2021 02:10:47 - INFO - __main__ - Step 35073: {'lr': 0.0004408850536303507, 'samples': 6734016, 'steps': 35072, 'loss/train': 1.6482864618301392} -11/07/2021 02:10:47 - INFO - __main__ - Step 35074: {'lr': 0.000440881626702624, 'samples': 6734208, 'steps': 35073, 'loss/train': 1.0828303098678589} -11/07/2021 02:10:48 - INFO - __main__ - Step 35075: {'lr': 0.00044087819968888887, 'samples': 6734400, 'steps': 35074, 'loss/train': 1.6241428852081299} -11/07/2021 02:10:49 - INFO - __main__ - Step 35076: {'lr': 0.00044087477258914696, 'samples': 6734592, 'steps': 35075, 'loss/train': 1.5479053258895874} -11/07/2021 02:10:49 - INFO - __main__ - Step 35077: {'lr': 0.00044087134540339996, 'samples': 6734784, 'steps': 35076, 'loss/train': 1.4886677265167236} -11/07/2021 02:10:50 - INFO - __main__ - Step 35078: {'lr': 0.00044086791813164916, 'samples': 6734976, 'steps': 35077, 'loss/train': 1.4844224452972412} -11/07/2021 02:10:50 - INFO - __main__ - Step 35079: {'lr': 0.00044086449077389636, 'samples': 6735168, 'steps': 35078, 'loss/train': 0.624704897403717} -11/07/2021 02:10:50 - INFO - __main__ - Step 35080: {'lr': 0.0004408610633301428, 'samples': 6735360, 'steps': 35079, 'loss/train': 1.6156529188156128} -11/07/2021 02:10:51 - INFO - __main__ - Step 35081: {'lr': 0.00044085763580039027, 'samples': 6735552, 'steps': 35080, 'loss/train': 2.0500946044921875} -11/07/2021 02:10:52 - INFO - __main__ - Step 35082: {'lr': 0.0004408542081846402, 'samples': 6735744, 'steps': 35081, 'loss/train': 1.3576505184173584} -11/07/2021 02:10:52 - INFO - __main__ - Step 35083: {'lr': 0.0004408507804828942, 'samples': 6735936, 'steps': 35082, 'loss/train': 1.5053588151931763} -11/07/2021 02:10:52 - INFO - __main__ - Step 35084: {'lr': 0.00044084735269515375, 'samples': 6736128, 'steps': 35083, 'loss/train': 1.6152665615081787} -11/07/2021 02:10:53 - INFO - __main__ - Step 35085: {'lr': 0.0004408439248214205, 'samples': 6736320, 'steps': 35084, 'loss/train': 1.7226558923721313} -11/07/2021 02:10:54 - INFO - __main__ - Step 35086: {'lr': 0.00044084049686169584, 'samples': 6736512, 'steps': 35085, 'loss/train': 0.5707530379295349} -11/07/2021 02:10:54 - INFO - __main__ - Step 35087: {'lr': 0.00044083706881598147, 'samples': 6736704, 'steps': 35086, 'loss/train': 1.0183169841766357} -11/07/2021 02:10:54 - INFO - __main__ - Step 35088: {'lr': 0.00044083364068427875, 'samples': 6736896, 'steps': 35087, 'loss/train': 1.3448383808135986} -11/07/2021 02:10:55 - INFO - __main__ - Step 35089: {'lr': 0.0004408302124665894, 'samples': 6737088, 'steps': 35088, 'loss/train': 1.307666540145874} -11/07/2021 02:10:55 - INFO - __main__ - Step 35090: {'lr': 0.00044082678416291495, 'samples': 6737280, 'steps': 35089, 'loss/train': 1.2448477745056152} -11/07/2021 02:10:56 - INFO - __main__ - Step 35091: {'lr': 0.00044082335577325685, 'samples': 6737472, 'steps': 35090, 'loss/train': 1.7214866876602173} -11/07/2021 02:10:56 - INFO - __main__ - Step 35092: {'lr': 0.0004408199272976167, 'samples': 6737664, 'steps': 35091, 'loss/train': 1.1318559646606445} -11/07/2021 02:10:57 - INFO - __main__ - Step 35093: {'lr': 0.00044081649873599604, 'samples': 6737856, 'steps': 35092, 'loss/train': 1.1720187664031982} -11/07/2021 02:10:57 - INFO - __main__ - Step 35094: {'lr': 0.0004408130700883964, 'samples': 6738048, 'steps': 35093, 'loss/train': 1.5962964296340942} -11/07/2021 02:10:57 - INFO - __main__ - Step 35095: {'lr': 0.0004408096413548193, 'samples': 6738240, 'steps': 35094, 'loss/train': 1.6870752573013306} -11/07/2021 02:10:59 - INFO - __main__ - Step 35096: {'lr': 0.00044080621253526637, 'samples': 6738432, 'steps': 35095, 'loss/train': 1.6659575700759888} -11/07/2021 02:10:59 - INFO - __main__ - Step 35097: {'lr': 0.00044080278362973913, 'samples': 6738624, 'steps': 35096, 'loss/train': 0.179875910282135} -11/07/2021 02:10:59 - INFO - __main__ - Step 35098: {'lr': 0.00044079935463823904, 'samples': 6738816, 'steps': 35097, 'loss/train': 1.3444435596466064} -11/07/2021 02:11:00 - INFO - __main__ - Step 35099: {'lr': 0.00044079592556076774, 'samples': 6739008, 'steps': 35098, 'loss/train': 1.744091510772705} -11/07/2021 02:11:00 - INFO - __main__ - Step 35100: {'lr': 0.00044079249639732664, 'samples': 6739200, 'steps': 35099, 'loss/train': 1.3593708276748657} -11/07/2021 02:11:00 - INFO - __main__ - Step 35101: {'lr': 0.00044078906714791757, 'samples': 6739392, 'steps': 35100, 'loss/train': 1.0961785316467285} -11/07/2021 02:11:01 - INFO - __main__ - Step 35102: {'lr': 0.0004407856378125418, 'samples': 6739584, 'steps': 35101, 'loss/train': 0.9805355668067932} -11/07/2021 02:11:02 - INFO - __main__ - Step 35103: {'lr': 0.00044078220839120086, 'samples': 6739776, 'steps': 35102, 'loss/train': 1.060352087020874} -11/07/2021 02:11:02 - INFO - __main__ - Step 35104: {'lr': 0.0004407787788838966, 'samples': 6739968, 'steps': 35103, 'loss/train': 1.8644888401031494} -11/07/2021 02:11:02 - INFO - __main__ - Step 35105: {'lr': 0.00044077534929063024, 'samples': 6740160, 'steps': 35104, 'loss/train': 0.9975321292877197} -11/07/2021 02:11:03 - INFO - __main__ - Step 35106: {'lr': 0.00044077191961140337, 'samples': 6740352, 'steps': 35105, 'loss/train': 1.116125226020813} -11/07/2021 02:11:04 - INFO - __main__ - Step 35107: {'lr': 0.00044076848984621775, 'samples': 6740544, 'steps': 35106, 'loss/train': 1.8047592639923096} -11/07/2021 02:11:04 - INFO - __main__ - Step 35108: {'lr': 0.00044076505999507474, 'samples': 6740736, 'steps': 35107, 'loss/train': 1.368557333946228} -11/07/2021 02:11:04 - INFO - __main__ - Step 35109: {'lr': 0.00044076163005797597, 'samples': 6740928, 'steps': 35108, 'loss/train': 1.1860182285308838} -11/07/2021 02:11:05 - INFO - __main__ - Step 35110: {'lr': 0.00044075820003492295, 'samples': 6741120, 'steps': 35109, 'loss/train': 1.5062674283981323} -11/07/2021 02:11:05 - INFO - __main__ - Step 35111: {'lr': 0.0004407547699259173, 'samples': 6741312, 'steps': 35110, 'loss/train': 0.8496090769767761} -11/07/2021 02:11:07 - INFO - __main__ - Step 35112: {'lr': 0.0004407513397309604, 'samples': 6741504, 'steps': 35111, 'loss/train': 1.6295762062072754} -11/07/2021 02:11:08 - INFO - __main__ - Step 35113: {'lr': 0.0004407479094500539, 'samples': 6741696, 'steps': 35112, 'loss/train': 1.8969480991363525} -11/07/2021 02:11:08 - INFO - __main__ - Step 35114: {'lr': 0.00044074447908319935, 'samples': 6741888, 'steps': 35113, 'loss/train': 1.7611387968063354} -11/07/2021 02:11:08 - INFO - __main__ - Step 35115: {'lr': 0.0004407410486303983, 'samples': 6742080, 'steps': 35114, 'loss/train': 1.7748589515686035} -11/07/2021 02:11:09 - INFO - __main__ - Step 35116: {'lr': 0.0004407376180916522, 'samples': 6742272, 'steps': 35115, 'loss/train': 1.7863101959228516} -11/07/2021 02:11:09 - INFO - __main__ - Step 35117: {'lr': 0.0004407341874669627, 'samples': 6742464, 'steps': 35116, 'loss/train': 1.1374247074127197} -11/07/2021 02:11:09 - INFO - __main__ - Step 35118: {'lr': 0.00044073075675633134, 'samples': 6742656, 'steps': 35117, 'loss/train': 1.0929744243621826} -11/07/2021 02:11:10 - INFO - __main__ - Step 35119: {'lr': 0.0004407273259597597, 'samples': 6742848, 'steps': 35118, 'loss/train': 1.2872812747955322} -11/07/2021 02:11:11 - INFO - __main__ - Step 35120: {'lr': 0.0004407238950772492, 'samples': 6743040, 'steps': 35119, 'loss/train': 1.0824187994003296} -11/07/2021 02:11:11 - INFO - __main__ - Step 35121: {'lr': 0.00044072046410880143, 'samples': 6743232, 'steps': 35120, 'loss/train': 1.271795392036438} -11/07/2021 02:11:12 - INFO - __main__ - Step 35122: {'lr': 0.000440717033054418, 'samples': 6743424, 'steps': 35121, 'loss/train': 1.3499759435653687} -11/07/2021 02:11:12 - INFO - __main__ - Step 35123: {'lr': 0.0004407136019141005, 'samples': 6743616, 'steps': 35122, 'loss/train': 2.010877847671509} -11/07/2021 02:11:12 - INFO - __main__ - Step 35124: {'lr': 0.0004407101706878502, 'samples': 6743808, 'steps': 35123, 'loss/train': 1.6080549955368042} -11/07/2021 02:11:13 - INFO - __main__ - Step 35125: {'lr': 0.000440706739375669, 'samples': 6744000, 'steps': 35124, 'loss/train': 1.2922800779342651} -11/07/2021 02:11:14 - INFO - __main__ - Step 35126: {'lr': 0.00044070330797755825, 'samples': 6744192, 'steps': 35125, 'loss/train': 1.4698541164398193} -11/07/2021 02:11:14 - INFO - __main__ - Step 35127: {'lr': 0.0004406998764935195, 'samples': 6744384, 'steps': 35126, 'loss/train': 1.8241018056869507} -11/07/2021 02:11:14 - INFO - __main__ - Step 35128: {'lr': 0.0004406964449235544, 'samples': 6744576, 'steps': 35127, 'loss/train': 1.5889697074890137} -11/07/2021 02:11:15 - INFO - __main__ - Step 35129: {'lr': 0.00044069301326766434, 'samples': 6744768, 'steps': 35128, 'loss/train': 1.4178204536437988} -11/07/2021 02:11:16 - INFO - __main__ - Step 35130: {'lr': 0.00044068958152585104, 'samples': 6744960, 'steps': 35129, 'loss/train': 1.3953704833984375} -11/07/2021 02:11:16 - INFO - __main__ - Step 35131: {'lr': 0.00044068614969811586, 'samples': 6745152, 'steps': 35130, 'loss/train': 1.991770625114441} -11/07/2021 02:11:16 - INFO - __main__ - Step 35132: {'lr': 0.0004406827177844605, 'samples': 6745344, 'steps': 35131, 'loss/train': 1.2228375673294067} -11/07/2021 02:11:17 - INFO - __main__ - Step 35133: {'lr': 0.00044067928578488645, 'samples': 6745536, 'steps': 35132, 'loss/train': 1.795264720916748} -11/07/2021 02:11:17 - INFO - __main__ - Step 35134: {'lr': 0.0004406758536993952, 'samples': 6745728, 'steps': 35133, 'loss/train': 1.8044919967651367} -11/07/2021 02:11:19 - INFO - __main__ - Step 35135: {'lr': 0.00044067242152798843, 'samples': 6745920, 'steps': 35134, 'loss/train': 1.4043021202087402} -11/07/2021 02:11:19 - INFO - __main__ - Step 35136: {'lr': 0.00044066898927066757, 'samples': 6746112, 'steps': 35135, 'loss/train': 1.4440217018127441} -11/07/2021 02:11:19 - INFO - __main__ - Step 35137: {'lr': 0.0004406655569274342, 'samples': 6746304, 'steps': 35136, 'loss/train': 0.3199705183506012} -11/07/2021 02:11:20 - INFO - __main__ - Step 35138: {'lr': 0.0004406621244982899, 'samples': 6746496, 'steps': 35137, 'loss/train': 1.5187562704086304} -11/07/2021 02:11:20 - INFO - __main__ - Step 35139: {'lr': 0.00044065869198323614, 'samples': 6746688, 'steps': 35138, 'loss/train': 1.7210921049118042} -11/07/2021 02:11:20 - INFO - __main__ - Step 35140: {'lr': 0.0004406552593822746, 'samples': 6746880, 'steps': 35139, 'loss/train': 1.8576350212097168} -11/07/2021 02:11:21 - INFO - __main__ - Step 35141: {'lr': 0.00044065182669540665, 'samples': 6747072, 'steps': 35140, 'loss/train': 1.4928169250488281} -11/07/2021 02:11:22 - INFO - __main__ - Step 35142: {'lr': 0.000440648393922634, 'samples': 6747264, 'steps': 35141, 'loss/train': 0.8861057162284851} -11/07/2021 02:11:22 - INFO - __main__ - Step 35143: {'lr': 0.0004406449610639581, 'samples': 6747456, 'steps': 35142, 'loss/train': 1.1979506015777588} -11/07/2021 02:11:22 - INFO - __main__ - Step 35144: {'lr': 0.0004406415281193805, 'samples': 6747648, 'steps': 35143, 'loss/train': 2.018486738204956} -11/07/2021 02:11:23 - INFO - __main__ - Step 35145: {'lr': 0.0004406380950889027, 'samples': 6747840, 'steps': 35144, 'loss/train': 1.4049015045166016} -11/07/2021 02:11:24 - INFO - __main__ - Step 35146: {'lr': 0.0004406346619725265, 'samples': 6748032, 'steps': 35145, 'loss/train': 1.5860729217529297} -11/07/2021 02:11:24 - INFO - __main__ - Step 35147: {'lr': 0.00044063122877025315, 'samples': 6748224, 'steps': 35146, 'loss/train': 1.0698484182357788} -11/07/2021 02:11:24 - INFO - __main__ - Step 35148: {'lr': 0.0004406277954820843, 'samples': 6748416, 'steps': 35147, 'loss/train': 1.1080349683761597} -11/07/2021 02:11:25 - INFO - __main__ - Step 35149: {'lr': 0.0004406243621080216, 'samples': 6748608, 'steps': 35148, 'loss/train': 1.8648744821548462} -11/07/2021 02:11:25 - INFO - __main__ - Step 35150: {'lr': 0.00044062092864806634, 'samples': 6748800, 'steps': 35149, 'loss/train': 1.0627784729003906} -11/07/2021 02:11:26 - INFO - __main__ - Step 35151: {'lr': 0.00044061749510222037, 'samples': 6748992, 'steps': 35150, 'loss/train': 1.6568477153778076} -11/07/2021 02:11:27 - INFO - __main__ - Step 35152: {'lr': 0.00044061406147048504, 'samples': 6749184, 'steps': 35151, 'loss/train': 1.7818259000778198} -11/07/2021 02:11:27 - INFO - __main__ - Step 35153: {'lr': 0.000440610627752862, 'samples': 6749376, 'steps': 35152, 'loss/train': 1.7012907266616821} -11/07/2021 02:11:27 - INFO - __main__ - Step 35154: {'lr': 0.00044060719394935265, 'samples': 6749568, 'steps': 35153, 'loss/train': 1.8704605102539062} -11/07/2021 02:11:28 - INFO - __main__ - Step 35155: {'lr': 0.0004406037600599588, 'samples': 6749760, 'steps': 35154, 'loss/train': 1.3309500217437744} -11/07/2021 02:11:29 - INFO - __main__ - Step 35156: {'lr': 0.0004406003260846817, 'samples': 6749952, 'steps': 35155, 'loss/train': 1.7605141401290894} -11/07/2021 02:11:29 - INFO - __main__ - Step 35157: {'lr': 0.0004405968920235231, 'samples': 6750144, 'steps': 35156, 'loss/train': 1.6250115633010864} -11/07/2021 02:11:29 - INFO - __main__ - Step 35158: {'lr': 0.0004405934578764845, 'samples': 6750336, 'steps': 35157, 'loss/train': 1.0034600496292114} -11/07/2021 02:11:30 - INFO - __main__ - Step 35159: {'lr': 0.0004405900236435674, 'samples': 6750528, 'steps': 35158, 'loss/train': 0.8062552809715271} -11/07/2021 02:11:30 - INFO - __main__ - Step 35160: {'lr': 0.00044058658932477336, 'samples': 6750720, 'steps': 35159, 'loss/train': 2.0084025859832764} -11/07/2021 02:11:31 - INFO - __main__ - Step 35161: {'lr': 0.0004405831549201039, 'samples': 6750912, 'steps': 35160, 'loss/train': 1.330609917640686} -11/07/2021 02:11:31 - INFO - __main__ - Step 35162: {'lr': 0.0004405797204295607, 'samples': 6751104, 'steps': 35161, 'loss/train': 1.5582258701324463} -11/07/2021 02:11:32 - INFO - __main__ - Step 35163: {'lr': 0.0004405762858531451, 'samples': 6751296, 'steps': 35162, 'loss/train': 1.6793432235717773} -11/07/2021 02:11:32 - INFO - __main__ - Step 35164: {'lr': 0.00044057285119085887, 'samples': 6751488, 'steps': 35163, 'loss/train': 1.3808073997497559} -11/07/2021 02:11:32 - INFO - __main__ - Step 35165: {'lr': 0.0004405694164427035, 'samples': 6751680, 'steps': 35164, 'loss/train': 2.0149216651916504} -11/07/2021 02:11:34 - INFO - __main__ - Step 35166: {'lr': 0.0004405659816086804, 'samples': 6751872, 'steps': 35165, 'loss/train': 0.9017762541770935} -11/07/2021 02:11:34 - INFO - __main__ - Step 35167: {'lr': 0.00044056254668879127, 'samples': 6752064, 'steps': 35166, 'loss/train': 1.2902568578720093} -11/07/2021 02:11:34 - INFO - __main__ - Step 35168: {'lr': 0.00044055911168303753, 'samples': 6752256, 'steps': 35167, 'loss/train': 1.8604564666748047} -11/07/2021 02:11:35 - INFO - __main__ - Step 35169: {'lr': 0.00044055567659142083, 'samples': 6752448, 'steps': 35168, 'loss/train': 0.897270679473877} -11/07/2021 02:11:35 - INFO - __main__ - Step 35170: {'lr': 0.0004405522414139427, 'samples': 6752640, 'steps': 35169, 'loss/train': 1.6258909702301025} -11/07/2021 02:11:36 - INFO - __main__ - Step 35171: {'lr': 0.0004405488061506047, 'samples': 6752832, 'steps': 35170, 'loss/train': 1.4886150360107422} -11/07/2021 02:11:36 - INFO - __main__ - Step 35172: {'lr': 0.0004405453708014082, 'samples': 6753024, 'steps': 35171, 'loss/train': 1.5348491668701172} -11/07/2021 02:11:37 - INFO - __main__ - Step 35173: {'lr': 0.00044054193536635503, 'samples': 6753216, 'steps': 35172, 'loss/train': 1.6122689247131348} -11/07/2021 02:11:37 - INFO - __main__ - Step 35174: {'lr': 0.00044053849984544653, 'samples': 6753408, 'steps': 35173, 'loss/train': 1.3885899782180786} -11/07/2021 02:11:37 - INFO - __main__ - Step 35175: {'lr': 0.0004405350642386844, 'samples': 6753600, 'steps': 35174, 'loss/train': 1.5848331451416016} -11/07/2021 02:11:38 - INFO - __main__ - Step 35176: {'lr': 0.00044053162854607004, 'samples': 6753792, 'steps': 35175, 'loss/train': 1.2173967361450195} -11/07/2021 02:11:39 - INFO - __main__ - Step 35177: {'lr': 0.0004405281927676051, 'samples': 6753984, 'steps': 35176, 'loss/train': 1.600562572479248} -11/07/2021 02:11:39 - INFO - __main__ - Step 35178: {'lr': 0.0004405247569032911, 'samples': 6754176, 'steps': 35177, 'loss/train': 1.6044585704803467} -11/07/2021 02:11:39 - INFO - __main__ - Step 35179: {'lr': 0.00044052132095312956, 'samples': 6754368, 'steps': 35178, 'loss/train': 1.7462291717529297} -11/07/2021 02:11:40 - INFO - __main__ - Step 35180: {'lr': 0.0004405178849171221, 'samples': 6754560, 'steps': 35179, 'loss/train': 1.35542631149292} -11/07/2021 02:11:40 - INFO - __main__ - Step 35181: {'lr': 0.00044051444879527013, 'samples': 6754752, 'steps': 35180, 'loss/train': 1.525868535041809} -11/07/2021 02:11:41 - INFO - __main__ - Step 35182: {'lr': 0.00044051101258757544, 'samples': 6754944, 'steps': 35181, 'loss/train': 1.3119614124298096} -11/07/2021 02:11:42 - INFO - __main__ - Step 35183: {'lr': 0.0004405075762940393, 'samples': 6755136, 'steps': 35182, 'loss/train': 1.6410095691680908} -11/07/2021 02:11:42 - INFO - __main__ - Step 35184: {'lr': 0.00044050413991466344, 'samples': 6755328, 'steps': 35183, 'loss/train': 2.1109349727630615} -11/07/2021 02:11:42 - INFO - __main__ - Step 35185: {'lr': 0.0004405007034494494, 'samples': 6755520, 'steps': 35184, 'loss/train': 1.5869981050491333} -11/07/2021 02:11:43 - INFO - __main__ - Step 35186: {'lr': 0.00044049726689839854, 'samples': 6755712, 'steps': 35185, 'loss/train': 1.2204842567443848} -11/07/2021 02:11:44 - INFO - __main__ - Step 35187: {'lr': 0.0004404938302615126, 'samples': 6755904, 'steps': 35186, 'loss/train': 2.1978719234466553} -11/07/2021 02:11:44 - INFO - __main__ - Step 35188: {'lr': 0.00044049039353879317, 'samples': 6756096, 'steps': 35187, 'loss/train': 1.2825113534927368} -11/07/2021 02:11:44 - INFO - __main__ - Step 35189: {'lr': 0.00044048695673024166, 'samples': 6756288, 'steps': 35188, 'loss/train': 1.7250984907150269} -11/07/2021 02:11:45 - INFO - __main__ - Step 35190: {'lr': 0.00044048351983585966, 'samples': 6756480, 'steps': 35189, 'loss/train': 1.7315864562988281} -11/07/2021 02:11:45 - INFO - __main__ - Step 35191: {'lr': 0.00044048008285564865, 'samples': 6756672, 'steps': 35190, 'loss/train': 1.1441526412963867} -11/07/2021 02:11:46 - INFO - __main__ - Step 35192: {'lr': 0.0004404766457896104, 'samples': 6756864, 'steps': 35191, 'loss/train': 1.5588198900222778} -11/07/2021 02:11:47 - INFO - __main__ - Step 35193: {'lr': 0.0004404732086377462, 'samples': 6757056, 'steps': 35192, 'loss/train': 1.1891738176345825} -11/07/2021 02:11:47 - INFO - __main__ - Step 35194: {'lr': 0.00044046977140005774, 'samples': 6757248, 'steps': 35193, 'loss/train': 1.190617561340332} -11/07/2021 02:11:47 - INFO - __main__ - Step 35195: {'lr': 0.00044046633407654657, 'samples': 6757440, 'steps': 35194, 'loss/train': 1.2330223321914673} -11/07/2021 02:11:48 - INFO - __main__ - Step 35196: {'lr': 0.0004404628966672142, 'samples': 6757632, 'steps': 35195, 'loss/train': 1.1752219200134277} -11/07/2021 02:11:49 - INFO - __main__ - Step 35197: {'lr': 0.0004404594591720622, 'samples': 6757824, 'steps': 35196, 'loss/train': 1.444063663482666} -11/07/2021 02:11:49 - INFO - __main__ - Step 35198: {'lr': 0.00044045602159109207, 'samples': 6758016, 'steps': 35197, 'loss/train': 1.4819884300231934} -11/07/2021 02:11:49 - INFO - __main__ - Step 35199: {'lr': 0.0004404525839243054, 'samples': 6758208, 'steps': 35198, 'loss/train': 1.7841776609420776} -11/07/2021 02:11:50 - INFO - __main__ - Step 35200: {'lr': 0.00044044914617170374, 'samples': 6758400, 'steps': 35199, 'loss/train': 1.6430798768997192} -11/07/2021 02:11:50 - INFO - __main__ - Step 35201: {'lr': 0.00044044570833328865, 'samples': 6758592, 'steps': 35200, 'loss/train': 1.6653860807418823} -11/07/2021 02:11:51 - INFO - __main__ - Step 35202: {'lr': 0.00044044227040906166, 'samples': 6758784, 'steps': 35201, 'loss/train': 1.5937496423721313} -11/07/2021 02:11:51 - INFO - __main__ - Step 35203: {'lr': 0.00044043883239902425, 'samples': 6758976, 'steps': 35202, 'loss/train': 0.7953693270683289} -11/07/2021 02:11:52 - INFO - __main__ - Step 35204: {'lr': 0.00044043539430317814, 'samples': 6759168, 'steps': 35203, 'loss/train': 1.1854610443115234} -11/07/2021 02:11:52 - INFO - __main__ - Step 35205: {'lr': 0.00044043195612152475, 'samples': 6759360, 'steps': 35204, 'loss/train': 1.4423195123672485} -11/07/2021 02:11:52 - INFO - __main__ - Step 35206: {'lr': 0.0004404285178540657, 'samples': 6759552, 'steps': 35205, 'loss/train': 1.2376537322998047} -11/07/2021 02:11:53 - INFO - __main__ - Step 35207: {'lr': 0.0004404250795008024, 'samples': 6759744, 'steps': 35206, 'loss/train': 1.9665284156799316} -11/07/2021 02:11:54 - INFO - __main__ - Step 35208: {'lr': 0.00044042164106173655, 'samples': 6759936, 'steps': 35207, 'loss/train': 1.6511269807815552} -11/07/2021 02:11:54 - INFO - __main__ - Step 35209: {'lr': 0.00044041820253686964, 'samples': 6760128, 'steps': 35208, 'loss/train': 1.4399462938308716} -11/07/2021 02:11:55 - INFO - __main__ - Step 35210: {'lr': 0.0004404147639262032, 'samples': 6760320, 'steps': 35209, 'loss/train': 2.1247313022613525} -11/07/2021 02:11:55 - INFO - __main__ - Step 35211: {'lr': 0.00044041132522973885, 'samples': 6760512, 'steps': 35210, 'loss/train': 1.3795652389526367} -11/07/2021 02:11:55 - INFO - __main__ - Step 35212: {'lr': 0.0004404078864474781, 'samples': 6760704, 'steps': 35211, 'loss/train': 1.4530143737792969} -11/07/2021 02:11:56 - INFO - __main__ - Step 35213: {'lr': 0.00044040444757942245, 'samples': 6760896, 'steps': 35212, 'loss/train': 0.6121195554733276} -11/07/2021 02:11:57 - INFO - __main__ - Step 35214: {'lr': 0.00044040100862557355, 'samples': 6761088, 'steps': 35213, 'loss/train': 1.6529427766799927} -11/07/2021 02:11:57 - INFO - __main__ - Step 35215: {'lr': 0.00044039756958593287, 'samples': 6761280, 'steps': 35214, 'loss/train': 1.8432458639144897} -11/07/2021 02:11:57 - INFO - __main__ - Step 35216: {'lr': 0.000440394130460502, 'samples': 6761472, 'steps': 35215, 'loss/train': 1.6579116582870483} -11/07/2021 02:11:58 - INFO - __main__ - Step 35217: {'lr': 0.00044039069124928245, 'samples': 6761664, 'steps': 35216, 'loss/train': 1.7480180263519287} -11/07/2021 02:11:59 - INFO - __main__ - Step 35218: {'lr': 0.0004403872519522758, 'samples': 6761856, 'steps': 35217, 'loss/train': 1.7644002437591553} -11/07/2021 02:11:59 - INFO - __main__ - Step 35219: {'lr': 0.00044038381256948357, 'samples': 6762048, 'steps': 35218, 'loss/train': 1.3994035720825195} -11/07/2021 02:11:59 - INFO - __main__ - Step 35220: {'lr': 0.00044038037310090736, 'samples': 6762240, 'steps': 35219, 'loss/train': 1.061874270439148} -11/07/2021 02:12:00 - INFO - __main__ - Step 35221: {'lr': 0.00044037693354654863, 'samples': 6762432, 'steps': 35220, 'loss/train': 1.141141653060913} -11/07/2021 02:12:00 - INFO - __main__ - Step 35222: {'lr': 0.0004403734939064091, 'samples': 6762624, 'steps': 35221, 'loss/train': 1.7482527494430542} -11/07/2021 02:12:01 - INFO - __main__ - Step 35223: {'lr': 0.00044037005418049016, 'samples': 6762816, 'steps': 35222, 'loss/train': 2.018164873123169} -11/07/2021 02:12:02 - INFO - __main__ - Step 35224: {'lr': 0.00044036661436879334, 'samples': 6763008, 'steps': 35223, 'loss/train': 1.7777644395828247} -11/07/2021 02:12:02 - INFO - __main__ - Step 35225: {'lr': 0.00044036317447132035, 'samples': 6763200, 'steps': 35224, 'loss/train': 1.500864863395691} -11/07/2021 02:12:02 - INFO - __main__ - Step 35226: {'lr': 0.00044035973448807266, 'samples': 6763392, 'steps': 35225, 'loss/train': 1.6354080438613892} -11/07/2021 02:12:03 - INFO - __main__ - Step 35227: {'lr': 0.00044035629441905173, 'samples': 6763584, 'steps': 35226, 'loss/train': 1.693660020828247} -11/07/2021 02:12:04 - INFO - __main__ - Step 35228: {'lr': 0.0004403528542642592, 'samples': 6763776, 'steps': 35227, 'loss/train': 1.55222487449646} -11/07/2021 02:12:04 - INFO - __main__ - Step 35229: {'lr': 0.00044034941402369666, 'samples': 6763968, 'steps': 35228, 'loss/train': 1.2032617330551147} -11/07/2021 02:12:04 - INFO - __main__ - Step 35230: {'lr': 0.0004403459736973656, 'samples': 6764160, 'steps': 35229, 'loss/train': 1.302371859550476} -11/07/2021 02:12:05 - INFO - __main__ - Step 35231: {'lr': 0.00044034253328526765, 'samples': 6764352, 'steps': 35230, 'loss/train': 1.5945069789886475} -11/07/2021 02:12:05 - INFO - __main__ - Step 35232: {'lr': 0.00044033909278740416, 'samples': 6764544, 'steps': 35231, 'loss/train': 1.67051362991333} -11/07/2021 02:12:06 - INFO - __main__ - Step 35233: {'lr': 0.0004403356522037769, 'samples': 6764736, 'steps': 35232, 'loss/train': 0.9942646622657776} -11/07/2021 02:12:06 - INFO - __main__ - Step 35234: {'lr': 0.00044033221153438727, 'samples': 6764928, 'steps': 35233, 'loss/train': 1.897809386253357} -11/07/2021 02:12:07 - INFO - __main__ - Step 35235: {'lr': 0.00044032877077923696, 'samples': 6765120, 'steps': 35234, 'loss/train': 1.6269075870513916} -11/07/2021 02:12:07 - INFO - __main__ - Step 35236: {'lr': 0.0004403253299383274, 'samples': 6765312, 'steps': 35235, 'loss/train': 1.3000872135162354} -11/07/2021 02:12:07 - INFO - __main__ - Step 35237: {'lr': 0.00044032188901166016, 'samples': 6765504, 'steps': 35236, 'loss/train': 1.3950632810592651} -11/07/2021 02:12:08 - INFO - __main__ - Step 35238: {'lr': 0.0004403184479992368, 'samples': 6765696, 'steps': 35237, 'loss/train': 1.5457737445831299} -11/07/2021 02:12:09 - INFO - __main__ - Step 35239: {'lr': 0.000440315006901059, 'samples': 6765888, 'steps': 35238, 'loss/train': 1.7797479629516602} -11/07/2021 02:12:09 - INFO - __main__ - Step 35240: {'lr': 0.00044031156571712807, 'samples': 6766080, 'steps': 35239, 'loss/train': 1.6283468008041382} -11/07/2021 02:12:10 - INFO - __main__ - Step 35241: {'lr': 0.0004403081244474457, 'samples': 6766272, 'steps': 35240, 'loss/train': 0.35879331827163696} -11/07/2021 02:12:10 - INFO - __main__ - Step 35242: {'lr': 0.00044030468309201354, 'samples': 6766464, 'steps': 35241, 'loss/train': 1.5128042697906494} -11/07/2021 02:12:10 - INFO - __main__ - Step 35243: {'lr': 0.0004403012416508329, 'samples': 6766656, 'steps': 35242, 'loss/train': 1.65208899974823} -11/07/2021 02:12:11 - INFO - __main__ - Step 35244: {'lr': 0.00044029780012390553, 'samples': 6766848, 'steps': 35243, 'loss/train': 1.3009748458862305} -11/07/2021 02:12:12 - INFO - __main__ - Step 35245: {'lr': 0.0004402943585112329, 'samples': 6767040, 'steps': 35244, 'loss/train': 1.2903783321380615} -11/07/2021 02:12:12 - INFO - __main__ - Step 35246: {'lr': 0.0004402909168128165, 'samples': 6767232, 'steps': 35245, 'loss/train': 0.9609237909317017} -11/07/2021 02:12:12 - INFO - __main__ - Step 35247: {'lr': 0.00044028747502865794, 'samples': 6767424, 'steps': 35246, 'loss/train': 1.4407219886779785} -11/07/2021 02:12:13 - INFO - __main__ - Step 35248: {'lr': 0.0004402840331587589, 'samples': 6767616, 'steps': 35247, 'loss/train': 1.1330758333206177} -11/07/2021 02:12:14 - INFO - __main__ - Step 35249: {'lr': 0.0004402805912031207, 'samples': 6767808, 'steps': 35248, 'loss/train': 1.5032768249511719} -11/07/2021 02:12:15 - INFO - __main__ - Step 35250: {'lr': 0.0004402771491617451, 'samples': 6768000, 'steps': 35249, 'loss/train': 1.1299022436141968} -11/07/2021 02:12:15 - INFO - __main__ - Step 35251: {'lr': 0.0004402737070346335, 'samples': 6768192, 'steps': 35250, 'loss/train': 1.785966396331787} -11/07/2021 02:12:15 - INFO - __main__ - Step 35252: {'lr': 0.0004402702648217875, 'samples': 6768384, 'steps': 35251, 'loss/train': 1.8759437799453735} -11/07/2021 02:12:16 - INFO - __main__ - Step 35253: {'lr': 0.00044026682252320864, 'samples': 6768576, 'steps': 35252, 'loss/train': 1.5136964321136475} -11/07/2021 02:12:16 - INFO - __main__ - Step 35254: {'lr': 0.00044026338013889853, 'samples': 6768768, 'steps': 35253, 'loss/train': 1.7734421491622925} -11/07/2021 02:12:17 - INFO - __main__ - Step 35255: {'lr': 0.00044025993766885866, 'samples': 6768960, 'steps': 35254, 'loss/train': 1.382339358329773} -11/07/2021 02:12:17 - INFO - __main__ - Step 35256: {'lr': 0.00044025649511309064, 'samples': 6769152, 'steps': 35255, 'loss/train': 1.1511459350585938} -11/07/2021 02:12:18 - INFO - __main__ - Step 35257: {'lr': 0.00044025305247159585, 'samples': 6769344, 'steps': 35256, 'loss/train': 1.6177397966384888} -11/07/2021 02:12:18 - INFO - __main__ - Step 35258: {'lr': 0.00044024960974437606, 'samples': 6769536, 'steps': 35257, 'loss/train': 1.3453264236450195} -11/07/2021 02:12:18 - INFO - __main__ - Step 35259: {'lr': 0.0004402461669314327, 'samples': 6769728, 'steps': 35258, 'loss/train': 1.6906169652938843} -11/07/2021 02:12:21 - INFO - __main__ - Step 35260: {'lr': 0.0004402427240327674, 'samples': 6769920, 'steps': 35259, 'loss/train': 1.5880019664764404} -11/07/2021 02:12:21 - INFO - __main__ - Step 35261: {'lr': 0.0004402392810483816, 'samples': 6770112, 'steps': 35260, 'loss/train': 1.5076464414596558} -11/07/2021 02:12:21 - INFO - __main__ - Step 35262: {'lr': 0.000440235837978277, 'samples': 6770304, 'steps': 35261, 'loss/train': 1.831540584564209} -11/07/2021 02:12:22 - INFO - __main__ - Step 35263: {'lr': 0.00044023239482245504, 'samples': 6770496, 'steps': 35262, 'loss/train': 2.123952865600586} -11/07/2021 02:12:22 - INFO - __main__ - Step 35264: {'lr': 0.0004402289515809172, 'samples': 6770688, 'steps': 35263, 'loss/train': 1.891985297203064} -11/07/2021 02:12:22 - INFO - __main__ - Step 35265: {'lr': 0.00044022550825366526, 'samples': 6770880, 'steps': 35264, 'loss/train': 1.8454724550247192} -11/07/2021 02:12:23 - INFO - __main__ - Step 35266: {'lr': 0.0004402220648407006, 'samples': 6771072, 'steps': 35265, 'loss/train': 1.8766562938690186} -11/07/2021 02:12:23 - INFO - __main__ - Step 35267: {'lr': 0.00044021862134202485, 'samples': 6771264, 'steps': 35266, 'loss/train': 1.5124690532684326} -11/07/2021 02:12:24 - INFO - __main__ - Step 35268: {'lr': 0.00044021517775763943, 'samples': 6771456, 'steps': 35267, 'loss/train': 1.4166333675384521} -11/07/2021 02:12:25 - INFO - __main__ - Step 35269: {'lr': 0.00044021173408754604, 'samples': 6771648, 'steps': 35268, 'loss/train': 1.3877267837524414} -11/07/2021 02:12:25 - INFO - __main__ - Step 35270: {'lr': 0.00044020829033174615, 'samples': 6771840, 'steps': 35269, 'loss/train': 1.5778212547302246} -11/07/2021 02:12:25 - INFO - __main__ - Step 35271: {'lr': 0.0004402048464902414, 'samples': 6772032, 'steps': 35270, 'loss/train': 1.4013853073120117} -11/07/2021 02:12:26 - INFO - __main__ - Step 35272: {'lr': 0.0004402014025630332, 'samples': 6772224, 'steps': 35271, 'loss/train': 2.010936737060547} -11/07/2021 02:12:27 - INFO - __main__ - Step 35273: {'lr': 0.00044019795855012325, 'samples': 6772416, 'steps': 35272, 'loss/train': 1.4244587421417236} -11/07/2021 02:12:27 - INFO - __main__ - Step 35274: {'lr': 0.00044019451445151305, 'samples': 6772608, 'steps': 35273, 'loss/train': 1.4892654418945312} -11/07/2021 02:12:27 - INFO - __main__ - Step 35275: {'lr': 0.00044019107026720404, 'samples': 6772800, 'steps': 35274, 'loss/train': 1.6502214670181274} -11/07/2021 02:12:28 - INFO - __main__ - Step 35276: {'lr': 0.00044018762599719796, 'samples': 6772992, 'steps': 35275, 'loss/train': 1.509718656539917} -11/07/2021 02:12:28 - INFO - __main__ - Step 35277: {'lr': 0.0004401841816414962, 'samples': 6773184, 'steps': 35276, 'loss/train': 0.5344533920288086} -11/07/2021 02:12:29 - INFO - __main__ - Step 35278: {'lr': 0.0004401807372001004, 'samples': 6773376, 'steps': 35277, 'loss/train': 1.63253915309906} -11/07/2021 02:12:29 - INFO - __main__ - Step 35279: {'lr': 0.0004401772926730122, 'samples': 6773568, 'steps': 35278, 'loss/train': 1.8484654426574707} -11/07/2021 02:12:30 - INFO - __main__ - Step 35280: {'lr': 0.0004401738480602329, 'samples': 6773760, 'steps': 35279, 'loss/train': 1.147681713104248} -11/07/2021 02:12:30 - INFO - __main__ - Step 35281: {'lr': 0.0004401704033617643, 'samples': 6773952, 'steps': 35280, 'loss/train': 1.761243462562561} -11/07/2021 02:12:30 - INFO - __main__ - Step 35282: {'lr': 0.0004401669585776078, 'samples': 6774144, 'steps': 35281, 'loss/train': 1.5396783351898193} -11/07/2021 02:12:31 - INFO - __main__ - Step 35283: {'lr': 0.000440163513707765, 'samples': 6774336, 'steps': 35282, 'loss/train': 1.0905910730361938} -11/07/2021 02:12:32 - INFO - __main__ - Step 35284: {'lr': 0.00044016006875223745, 'samples': 6774528, 'steps': 35283, 'loss/train': 1.369025468826294} -11/07/2021 02:12:32 - INFO - __main__ - Step 35285: {'lr': 0.00044015662371102676, 'samples': 6774720, 'steps': 35284, 'loss/train': 1.5036505460739136} -11/07/2021 02:12:32 - INFO - __main__ - Step 35286: {'lr': 0.0004401531785841344, 'samples': 6774912, 'steps': 35285, 'loss/train': 1.7355401515960693} -11/07/2021 02:12:33 - INFO - __main__ - Step 35287: {'lr': 0.00044014973337156197, 'samples': 6775104, 'steps': 35286, 'loss/train': 1.3399806022644043} -11/07/2021 02:12:34 - INFO - __main__ - Step 35288: {'lr': 0.0004401462880733109, 'samples': 6775296, 'steps': 35287, 'loss/train': 1.9543825387954712} -11/07/2021 02:12:34 - INFO - __main__ - Step 35289: {'lr': 0.000440142842689383, 'samples': 6775488, 'steps': 35288, 'loss/train': 1.6181656122207642} -11/07/2021 02:12:34 - INFO - __main__ - Step 35290: {'lr': 0.00044013939721977957, 'samples': 6775680, 'steps': 35289, 'loss/train': 2.1377604007720947} -11/07/2021 02:12:35 - INFO - __main__ - Step 35291: {'lr': 0.0004401359516645023, 'samples': 6775872, 'steps': 35290, 'loss/train': 1.8301565647125244} -11/07/2021 02:12:35 - INFO - __main__ - Step 35292: {'lr': 0.0004401325060235527, 'samples': 6776064, 'steps': 35291, 'loss/train': 1.776128888130188} -11/07/2021 02:12:36 - INFO - __main__ - Step 35293: {'lr': 0.00044012906029693236, 'samples': 6776256, 'steps': 35292, 'loss/train': 1.6864397525787354} -11/07/2021 02:12:37 - INFO - __main__ - Step 35294: {'lr': 0.0004401256144846427, 'samples': 6776448, 'steps': 35293, 'loss/train': 0.7780770659446716} -11/07/2021 02:12:37 - INFO - __main__ - Step 35295: {'lr': 0.0004401221685866854, 'samples': 6776640, 'steps': 35294, 'loss/train': 1.1424438953399658} -11/07/2021 02:12:37 - INFO - __main__ - Step 35296: {'lr': 0.00044011872260306205, 'samples': 6776832, 'steps': 35295, 'loss/train': 1.2669594287872314} -11/07/2021 02:12:38 - INFO - __main__ - Step 35297: {'lr': 0.00044011527653377416, 'samples': 6777024, 'steps': 35296, 'loss/train': 1.7180006504058838} -11/07/2021 02:12:38 - INFO - __main__ - Step 35298: {'lr': 0.0004401118303788232, 'samples': 6777216, 'steps': 35297, 'loss/train': 1.8391923904418945} -11/07/2021 02:12:39 - INFO - __main__ - Step 35299: {'lr': 0.00044010838413821075, 'samples': 6777408, 'steps': 35298, 'loss/train': 1.658327341079712} -11/07/2021 02:12:39 - INFO - __main__ - Step 35300: {'lr': 0.0004401049378119384, 'samples': 6777600, 'steps': 35299, 'loss/train': 1.3578120470046997} -11/07/2021 02:12:40 - INFO - __main__ - Step 35301: {'lr': 0.0004401014914000078, 'samples': 6777792, 'steps': 35300, 'loss/train': 1.9098882675170898} -11/07/2021 02:12:40 - INFO - __main__ - Step 35302: {'lr': 0.00044009804490242026, 'samples': 6777984, 'steps': 35301, 'loss/train': 0.855135977268219} -11/07/2021 02:12:40 - INFO - __main__ - Step 35303: {'lr': 0.00044009459831917755, 'samples': 6778176, 'steps': 35302, 'loss/train': 1.5483982563018799} -11/07/2021 02:12:42 - INFO - __main__ - Step 35304: {'lr': 0.00044009115165028113, 'samples': 6778368, 'steps': 35303, 'loss/train': 1.7052702903747559} -11/07/2021 02:12:42 - INFO - __main__ - Step 35305: {'lr': 0.0004400877048957326, 'samples': 6778560, 'steps': 35304, 'loss/train': 1.751997470855713} -11/07/2021 02:12:42 - INFO - __main__ - Step 35306: {'lr': 0.00044008425805553347, 'samples': 6778752, 'steps': 35305, 'loss/train': 2.147096872329712} -11/07/2021 02:12:43 - INFO - __main__ - Step 35307: {'lr': 0.00044008081112968537, 'samples': 6778944, 'steps': 35306, 'loss/train': 1.7320812940597534} -11/07/2021 02:12:43 - INFO - __main__ - Step 35308: {'lr': 0.0004400773641181897, 'samples': 6779136, 'steps': 35307, 'loss/train': 1.7000387907028198} -11/07/2021 02:12:44 - INFO - __main__ - Step 35309: {'lr': 0.0004400739170210481, 'samples': 6779328, 'steps': 35308, 'loss/train': 1.2110624313354492} -11/07/2021 02:12:44 - INFO - __main__ - Step 35310: {'lr': 0.00044007046983826213, 'samples': 6779520, 'steps': 35309, 'loss/train': 0.6447055339813232} -11/07/2021 02:12:45 - INFO - __main__ - Step 35311: {'lr': 0.0004400670225698333, 'samples': 6779712, 'steps': 35310, 'loss/train': 0.7492512464523315} -11/07/2021 02:12:45 - INFO - __main__ - Step 35312: {'lr': 0.00044006357521576334, 'samples': 6779904, 'steps': 35311, 'loss/train': 0.9323607087135315} -11/07/2021 02:12:45 - INFO - __main__ - Step 35313: {'lr': 0.0004400601277760536, 'samples': 6780096, 'steps': 35312, 'loss/train': 1.7272684574127197} -11/07/2021 02:12:46 - INFO - __main__ - Step 35314: {'lr': 0.0004400566802507057, 'samples': 6780288, 'steps': 35313, 'loss/train': 1.1753439903259277} -11/07/2021 02:12:47 - INFO - __main__ - Step 35315: {'lr': 0.0004400532326397211, 'samples': 6780480, 'steps': 35314, 'loss/train': 1.8355354070663452} -11/07/2021 02:12:47 - INFO - __main__ - Step 35316: {'lr': 0.00044004978494310154, 'samples': 6780672, 'steps': 35315, 'loss/train': 0.8124325275421143} -11/07/2021 02:12:47 - INFO - __main__ - Step 35317: {'lr': 0.00044004633716084854, 'samples': 6780864, 'steps': 35316, 'loss/train': 1.5831191539764404} -11/07/2021 02:12:48 - INFO - __main__ - Step 35318: {'lr': 0.0004400428892929635, 'samples': 6781056, 'steps': 35317, 'loss/train': 1.7521748542785645} -11/07/2021 02:12:48 - INFO - __main__ - Step 35319: {'lr': 0.00044003944133944804, 'samples': 6781248, 'steps': 35318, 'loss/train': 1.0224285125732422} -11/07/2021 02:12:49 - INFO - __main__ - Step 35320: {'lr': 0.00044003599330030385, 'samples': 6781440, 'steps': 35319, 'loss/train': 1.5260698795318604} -11/07/2021 02:12:50 - INFO - __main__ - Step 35321: {'lr': 0.00044003254517553225, 'samples': 6781632, 'steps': 35320, 'loss/train': 1.7216631174087524} -11/07/2021 02:12:50 - INFO - __main__ - Step 35322: {'lr': 0.000440029096965135, 'samples': 6781824, 'steps': 35321, 'loss/train': 1.5419079065322876} -11/07/2021 02:12:50 - INFO - __main__ - Step 35323: {'lr': 0.0004400256486691135, 'samples': 6782016, 'steps': 35322, 'loss/train': 1.5323067903518677} -11/07/2021 02:12:51 - INFO - __main__ - Step 35324: {'lr': 0.0004400222002874695, 'samples': 6782208, 'steps': 35323, 'loss/train': 1.541028380393982} -11/07/2021 02:12:52 - INFO - __main__ - Step 35325: {'lr': 0.0004400187518202043, 'samples': 6782400, 'steps': 35324, 'loss/train': 1.1801986694335938} -11/07/2021 02:12:53 - INFO - __main__ - Step 35326: {'lr': 0.00044001530326731966, 'samples': 6782592, 'steps': 35325, 'loss/train': 0.6416899561882019} -11/07/2021 02:12:53 - INFO - __main__ - Step 35327: {'lr': 0.00044001185462881707, 'samples': 6782784, 'steps': 35326, 'loss/train': 1.5198839902877808} -11/07/2021 02:12:53 - INFO - __main__ - Step 35328: {'lr': 0.000440008405904698, 'samples': 6782976, 'steps': 35327, 'loss/train': 1.5916683673858643} -11/07/2021 02:12:54 - INFO - __main__ - Step 35329: {'lr': 0.0004400049570949641, 'samples': 6783168, 'steps': 35328, 'loss/train': 1.5998841524124146} -11/07/2021 02:12:55 - INFO - __main__ - Step 35330: {'lr': 0.0004400015081996169, 'samples': 6783360, 'steps': 35329, 'loss/train': 1.3884435892105103} -11/07/2021 02:12:55 - INFO - __main__ - Step 35331: {'lr': 0.000439998059218658, 'samples': 6783552, 'steps': 35330, 'loss/train': 1.563869833946228} -11/07/2021 02:12:55 - INFO - __main__ - Step 35332: {'lr': 0.0004399946101520889, 'samples': 6783744, 'steps': 35331, 'loss/train': 1.4010270833969116} -11/07/2021 02:12:56 - INFO - __main__ - Step 35333: {'lr': 0.0004399911609999111, 'samples': 6783936, 'steps': 35332, 'loss/train': 1.2245500087738037} -11/07/2021 02:12:56 - INFO - __main__ - Step 35334: {'lr': 0.0004399877117621262, 'samples': 6784128, 'steps': 35333, 'loss/train': 0.999417781829834} -11/07/2021 02:12:57 - INFO - __main__ - Step 35335: {'lr': 0.0004399842624387358, 'samples': 6784320, 'steps': 35334, 'loss/train': 2.229874610900879} -11/07/2021 02:12:57 - INFO - __main__ - Step 35336: {'lr': 0.0004399808130297415, 'samples': 6784512, 'steps': 35335, 'loss/train': 1.3630006313323975} -11/07/2021 02:12:58 - INFO - __main__ - Step 35337: {'lr': 0.0004399773635351446, 'samples': 6784704, 'steps': 35336, 'loss/train': 1.609230637550354} -11/07/2021 02:12:58 - INFO - __main__ - Step 35338: {'lr': 0.000439973913954947, 'samples': 6784896, 'steps': 35337, 'loss/train': 1.4650626182556152} -11/07/2021 02:12:58 - INFO - __main__ - Step 35339: {'lr': 0.00043997046428915, 'samples': 6785088, 'steps': 35338, 'loss/train': 1.5246323347091675} -11/07/2021 02:12:59 - INFO - __main__ - Step 35340: {'lr': 0.00043996701453775526, 'samples': 6785280, 'steps': 35339, 'loss/train': 1.4155287742614746} -11/07/2021 02:13:00 - INFO - __main__ - Step 35341: {'lr': 0.0004399635647007643, 'samples': 6785472, 'steps': 35340, 'loss/train': 1.72676420211792} -11/07/2021 02:13:00 - INFO - __main__ - Step 35342: {'lr': 0.00043996011477817875, 'samples': 6785664, 'steps': 35341, 'loss/train': 2.053565740585327} -11/07/2021 02:13:00 - INFO - __main__ - Step 35343: {'lr': 0.0004399566647700001, 'samples': 6785856, 'steps': 35342, 'loss/train': 1.2722868919372559} -11/07/2021 02:13:01 - INFO - __main__ - Step 35344: {'lr': 0.00043995321467622984, 'samples': 6786048, 'steps': 35343, 'loss/train': 1.4926680326461792} -11/07/2021 02:13:02 - INFO - __main__ - Step 35345: {'lr': 0.00043994976449686964, 'samples': 6786240, 'steps': 35344, 'loss/train': 1.2482376098632812} -11/07/2021 02:13:02 - INFO - __main__ - Step 35346: {'lr': 0.000439946314231921, 'samples': 6786432, 'steps': 35345, 'loss/train': 1.3723719120025635} -11/07/2021 02:13:03 - INFO - __main__ - Step 35347: {'lr': 0.00043994286388138545, 'samples': 6786624, 'steps': 35346, 'loss/train': 1.4757342338562012} -11/07/2021 02:13:03 - INFO - __main__ - Step 35348: {'lr': 0.00043993941344526455, 'samples': 6786816, 'steps': 35347, 'loss/train': 1.232430100440979} -11/07/2021 02:13:03 - INFO - __main__ - Step 35349: {'lr': 0.00043993596292356, 'samples': 6787008, 'steps': 35348, 'loss/train': 1.8471217155456543} -11/07/2021 02:13:04 - INFO - __main__ - Step 35350: {'lr': 0.00043993251231627315, 'samples': 6787200, 'steps': 35349, 'loss/train': 1.4239959716796875} -11/07/2021 02:13:05 - INFO - __main__ - Step 35351: {'lr': 0.00043992906162340563, 'samples': 6787392, 'steps': 35350, 'loss/train': 1.6814604997634888} -11/07/2021 02:13:05 - INFO - __main__ - Step 35352: {'lr': 0.00043992561084495906, 'samples': 6787584, 'steps': 35351, 'loss/train': 0.9884973168373108} -11/07/2021 02:13:05 - INFO - __main__ - Step 35353: {'lr': 0.0004399221599809349, 'samples': 6787776, 'steps': 35352, 'loss/train': 1.569356918334961} -11/07/2021 02:13:06 - INFO - __main__ - Step 35354: {'lr': 0.0004399187090313348, 'samples': 6787968, 'steps': 35353, 'loss/train': 1.5267250537872314} -11/07/2021 02:13:06 - INFO - __main__ - Step 35355: {'lr': 0.00043991525799616017, 'samples': 6788160, 'steps': 35354, 'loss/train': 1.7280054092407227} -11/07/2021 02:13:07 - INFO - __main__ - Step 35356: {'lr': 0.0004399118068754127, 'samples': 6788352, 'steps': 35355, 'loss/train': 1.4081023931503296} -11/07/2021 02:13:08 - INFO - __main__ - Step 35357: {'lr': 0.0004399083556690939, 'samples': 6788544, 'steps': 35356, 'loss/train': 1.168870449066162} -11/07/2021 02:13:08 - INFO - __main__ - Step 35358: {'lr': 0.0004399049043772053, 'samples': 6788736, 'steps': 35357, 'loss/train': 1.4735119342803955} -11/07/2021 02:13:08 - INFO - __main__ - Step 35359: {'lr': 0.00043990145299974853, 'samples': 6788928, 'steps': 35358, 'loss/train': 1.1163095235824585} -11/07/2021 02:13:09 - INFO - __main__ - Step 35360: {'lr': 0.0004398980015367251, 'samples': 6789120, 'steps': 35359, 'loss/train': 5.794185638427734} -11/07/2021 02:13:10 - INFO - __main__ - Step 35361: {'lr': 0.00043989454998813655, 'samples': 6789312, 'steps': 35360, 'loss/train': 1.7031978368759155} -11/07/2021 02:13:10 - INFO - __main__ - Step 35362: {'lr': 0.00043989109835398444, 'samples': 6789504, 'steps': 35361, 'loss/train': 1.6699821949005127} -11/07/2021 02:13:10 - INFO - __main__ - Step 35363: {'lr': 0.0004398876466342703, 'samples': 6789696, 'steps': 35362, 'loss/train': 1.4967632293701172} -11/07/2021 02:13:11 - INFO - __main__ - Step 35364: {'lr': 0.0004398841948289958, 'samples': 6789888, 'steps': 35363, 'loss/train': 0.6771053075790405} -11/07/2021 02:13:11 - INFO - __main__ - Step 35365: {'lr': 0.0004398807429381623, 'samples': 6790080, 'steps': 35364, 'loss/train': 1.4188239574432373} -11/07/2021 02:13:11 - INFO - __main__ - Step 35366: {'lr': 0.0004398772909617715, 'samples': 6790272, 'steps': 35365, 'loss/train': 1.3704005479812622} -11/07/2021 02:13:12 - INFO - __main__ - Step 35367: {'lr': 0.00043987383889982495, 'samples': 6790464, 'steps': 35366, 'loss/train': 1.699660301208496} -11/07/2021 02:13:13 - INFO - __main__ - Step 35368: {'lr': 0.00043987038675232415, 'samples': 6790656, 'steps': 35367, 'loss/train': 1.3130336999893188} -11/07/2021 02:13:13 - INFO - __main__ - Step 35369: {'lr': 0.00043986693451927074, 'samples': 6790848, 'steps': 35368, 'loss/train': 0.9575570225715637} -11/07/2021 02:13:13 - INFO - __main__ - Step 35370: {'lr': 0.0004398634822006662, 'samples': 6791040, 'steps': 35369, 'loss/train': 0.9162417650222778} -11/07/2021 02:13:14 - INFO - __main__ - Step 35371: {'lr': 0.0004398600297965121, 'samples': 6791232, 'steps': 35370, 'loss/train': 1.3104331493377686} -11/07/2021 02:13:15 - INFO - __main__ - Step 35372: {'lr': 0.00043985657730680997, 'samples': 6791424, 'steps': 35371, 'loss/train': 1.8338526487350464} -11/07/2021 02:13:15 - INFO - __main__ - Step 35373: {'lr': 0.00043985312473156143, 'samples': 6791616, 'steps': 35372, 'loss/train': 1.758212924003601} -11/07/2021 02:13:16 - INFO - __main__ - Step 35374: {'lr': 0.000439849672070768, 'samples': 6791808, 'steps': 35373, 'loss/train': 1.1626574993133545} -11/07/2021 02:13:16 - INFO - __main__ - Step 35375: {'lr': 0.00043984621932443115, 'samples': 6792000, 'steps': 35374, 'loss/train': 1.2128241062164307} -11/07/2021 02:13:16 - INFO - __main__ - Step 35376: {'lr': 0.0004398427664925526, 'samples': 6792192, 'steps': 35375, 'loss/train': 1.3160113096237183} -11/07/2021 02:13:17 - INFO - __main__ - Step 35377: {'lr': 0.0004398393135751338, 'samples': 6792384, 'steps': 35376, 'loss/train': 0.8111445903778076} -11/07/2021 02:13:18 - INFO - __main__ - Step 35378: {'lr': 0.0004398358605721764, 'samples': 6792576, 'steps': 35377, 'loss/train': 1.995750904083252} -11/07/2021 02:13:18 - INFO - __main__ - Step 35379: {'lr': 0.00043983240748368186, 'samples': 6792768, 'steps': 35378, 'loss/train': 1.58150315284729} -11/07/2021 02:13:18 - INFO - __main__ - Step 35380: {'lr': 0.0004398289543096518, 'samples': 6792960, 'steps': 35379, 'loss/train': 1.2393131256103516} -11/07/2021 02:13:19 - INFO - __main__ - Step 35381: {'lr': 0.0004398255010500877, 'samples': 6793152, 'steps': 35380, 'loss/train': 1.5714269876480103} -11/07/2021 02:13:20 - INFO - __main__ - Step 35382: {'lr': 0.00043982204770499114, 'samples': 6793344, 'steps': 35381, 'loss/train': 1.323848843574524} -11/07/2021 02:13:20 - INFO - __main__ - Step 35383: {'lr': 0.0004398185942743637, 'samples': 6793536, 'steps': 35382, 'loss/train': 1.5941745042800903} -11/07/2021 02:13:21 - INFO - __main__ - Step 35384: {'lr': 0.00043981514075820693, 'samples': 6793728, 'steps': 35383, 'loss/train': 1.4334259033203125} -11/07/2021 02:13:21 - INFO - __main__ - Step 35385: {'lr': 0.0004398116871565224, 'samples': 6793920, 'steps': 35384, 'loss/train': 1.3924572467803955} -11/07/2021 02:13:21 - INFO - __main__ - Step 35386: {'lr': 0.0004398082334693116, 'samples': 6794112, 'steps': 35385, 'loss/train': 2.0170538425445557} -11/07/2021 02:13:23 - INFO - __main__ - Step 35387: {'lr': 0.0004398047796965762, 'samples': 6794304, 'steps': 35386, 'loss/train': 0.7017478942871094} -11/07/2021 02:13:23 - INFO - __main__ - Step 35388: {'lr': 0.0004398013258383177, 'samples': 6794496, 'steps': 35387, 'loss/train': 1.5313912630081177} -11/07/2021 02:13:23 - INFO - __main__ - Step 35389: {'lr': 0.0004397978718945377, 'samples': 6794688, 'steps': 35388, 'loss/train': 1.1975125074386597} -11/07/2021 02:13:24 - INFO - __main__ - Step 35390: {'lr': 0.0004397944178652376, 'samples': 6794880, 'steps': 35389, 'loss/train': 1.7182281017303467} -11/07/2021 02:13:24 - INFO - __main__ - Step 35391: {'lr': 0.0004397909637504191, 'samples': 6795072, 'steps': 35390, 'loss/train': 1.3362889289855957} -11/07/2021 02:13:24 - INFO - __main__ - Step 35392: {'lr': 0.00043978750955008374, 'samples': 6795264, 'steps': 35391, 'loss/train': 1.5932806730270386} -11/07/2021 02:13:26 - INFO - __main__ - Step 35393: {'lr': 0.00043978405526423305, 'samples': 6795456, 'steps': 35392, 'loss/train': 3.2164599895477295} -11/07/2021 02:13:26 - INFO - __main__ - Step 35394: {'lr': 0.0004397806008928686, 'samples': 6795648, 'steps': 35393, 'loss/train': 1.7339038848876953} -11/07/2021 02:13:26 - INFO - __main__ - Step 35395: {'lr': 0.00043977714643599194, 'samples': 6795840, 'steps': 35394, 'loss/train': 1.467126488685608} -11/07/2021 02:13:27 - INFO - __main__ - Step 35396: {'lr': 0.0004397736918936046, 'samples': 6796032, 'steps': 35395, 'loss/train': 1.4847302436828613} -11/07/2021 02:13:27 - INFO - __main__ - Step 35397: {'lr': 0.0004397702372657082, 'samples': 6796224, 'steps': 35396, 'loss/train': 1.2340567111968994} -11/07/2021 02:13:28 - INFO - __main__ - Step 35398: {'lr': 0.00043976678255230417, 'samples': 6796416, 'steps': 35397, 'loss/train': 1.5708730220794678} -11/07/2021 02:13:28 - INFO - __main__ - Step 35399: {'lr': 0.0004397633277533942, 'samples': 6796608, 'steps': 35398, 'loss/train': 1.2345236539840698} -11/07/2021 02:13:29 - INFO - __main__ - Step 35400: {'lr': 0.0004397598728689799, 'samples': 6796800, 'steps': 35399, 'loss/train': 1.1859363317489624} -11/07/2021 02:13:29 - INFO - __main__ - Step 35401: {'lr': 0.0004397564178990626, 'samples': 6796992, 'steps': 35400, 'loss/train': 1.856229305267334} -11/07/2021 02:13:30 - INFO - __main__ - Step 35402: {'lr': 0.0004397529628436441, 'samples': 6797184, 'steps': 35401, 'loss/train': 1.287499189376831} -11/07/2021 02:13:30 - INFO - __main__ - Step 35403: {'lr': 0.0004397495077027258, 'samples': 6797376, 'steps': 35402, 'loss/train': 1.4517358541488647} -11/07/2021 02:13:31 - INFO - __main__ - Step 35404: {'lr': 0.0004397460524763093, 'samples': 6797568, 'steps': 35403, 'loss/train': 0.9907420873641968} -11/07/2021 02:13:31 - INFO - __main__ - Step 35405: {'lr': 0.00043974259716439613, 'samples': 6797760, 'steps': 35404, 'loss/train': 1.5516440868377686} -11/07/2021 02:13:32 - INFO - __main__ - Step 35406: {'lr': 0.0004397391417669878, 'samples': 6797952, 'steps': 35405, 'loss/train': 1.601456880569458} -11/07/2021 02:13:32 - INFO - __main__ - Step 35407: {'lr': 0.0004397356862840861, 'samples': 6798144, 'steps': 35406, 'loss/train': 1.5725170373916626} -11/07/2021 02:13:33 - INFO - __main__ - Step 35408: {'lr': 0.00043973223071569234, 'samples': 6798336, 'steps': 35407, 'loss/train': 1.9015896320343018} -11/07/2021 02:13:33 - INFO - __main__ - Step 35409: {'lr': 0.0004397287750618082, 'samples': 6798528, 'steps': 35408, 'loss/train': 2.284215211868286} -11/07/2021 02:13:34 - INFO - __main__ - Step 35410: {'lr': 0.00043972531932243516, 'samples': 6798720, 'steps': 35409, 'loss/train': 1.706610918045044} -11/07/2021 02:13:34 - INFO - __main__ - Step 35411: {'lr': 0.00043972186349757484, 'samples': 6798912, 'steps': 35410, 'loss/train': 1.4776911735534668} -11/07/2021 02:13:34 - INFO - __main__ - Step 35412: {'lr': 0.0004397184075872288, 'samples': 6799104, 'steps': 35411, 'loss/train': 1.2144941091537476} -11/07/2021 02:13:35 - INFO - __main__ - Step 35413: {'lr': 0.0004397149515913985, 'samples': 6799296, 'steps': 35412, 'loss/train': 5.854411602020264} -11/07/2021 02:13:36 - INFO - __main__ - Step 35414: {'lr': 0.0004397114955100856, 'samples': 6799488, 'steps': 35413, 'loss/train': 1.5621206760406494} -11/07/2021 02:13:36 - INFO - __main__ - Step 35415: {'lr': 0.00043970803934329167, 'samples': 6799680, 'steps': 35414, 'loss/train': 1.4797799587249756} -11/07/2021 02:13:37 - INFO - __main__ - Step 35416: {'lr': 0.00043970458309101825, 'samples': 6799872, 'steps': 35415, 'loss/train': 1.556593656539917} -11/07/2021 02:13:37 - INFO - __main__ - Step 35417: {'lr': 0.0004397011267532668, 'samples': 6800064, 'steps': 35416, 'loss/train': 1.8843176364898682} -11/07/2021 02:13:37 - INFO - __main__ - Step 35418: {'lr': 0.00043969767033003894, 'samples': 6800256, 'steps': 35417, 'loss/train': 1.3072028160095215} -11/07/2021 02:13:38 - INFO - __main__ - Step 35419: {'lr': 0.0004396942138213363, 'samples': 6800448, 'steps': 35418, 'loss/train': 1.5829036235809326} -11/07/2021 02:13:38 - INFO - __main__ - Step 35420: {'lr': 0.00043969075722716033, 'samples': 6800640, 'steps': 35419, 'loss/train': 1.3367642164230347} -11/07/2021 02:13:39 - INFO - __main__ - Step 35421: {'lr': 0.0004396873005475127, 'samples': 6800832, 'steps': 35420, 'loss/train': 1.5796177387237549} -11/07/2021 02:13:39 - INFO - __main__ - Step 35422: {'lr': 0.00043968384378239477, 'samples': 6801024, 'steps': 35421, 'loss/train': 1.3193522691726685} -11/07/2021 02:13:40 - INFO - __main__ - Step 35423: {'lr': 0.00043968038693180834, 'samples': 6801216, 'steps': 35422, 'loss/train': 1.4077221155166626} -11/07/2021 02:13:40 - INFO - __main__ - Step 35424: {'lr': 0.00043967692999575484, 'samples': 6801408, 'steps': 35423, 'loss/train': 1.858082890510559} -11/07/2021 02:13:41 - INFO - __main__ - Step 35425: {'lr': 0.00043967347297423575, 'samples': 6801600, 'steps': 35424, 'loss/train': 1.2148572206497192} -11/07/2021 02:13:41 - INFO - __main__ - Step 35426: {'lr': 0.0004396700158672528, 'samples': 6801792, 'steps': 35425, 'loss/train': 0.840027928352356} -11/07/2021 02:13:42 - INFO - __main__ - Step 35427: {'lr': 0.0004396665586748075, 'samples': 6801984, 'steps': 35426, 'loss/train': 1.7397141456604004} -11/07/2021 02:13:42 - INFO - __main__ - Step 35428: {'lr': 0.0004396631013969013, 'samples': 6802176, 'steps': 35427, 'loss/train': 1.712583065032959} -11/07/2021 02:13:43 - INFO - __main__ - Step 35429: {'lr': 0.0004396596440335359, 'samples': 6802368, 'steps': 35428, 'loss/train': 0.4670521020889282} -11/07/2021 02:13:43 - INFO - __main__ - Step 35430: {'lr': 0.00043965618658471276, 'samples': 6802560, 'steps': 35429, 'loss/train': 1.2149841785430908} -11/07/2021 02:13:44 - INFO - __main__ - Step 35431: {'lr': 0.0004396527290504334, 'samples': 6802752, 'steps': 35430, 'loss/train': 3.315039873123169} -11/07/2021 02:13:44 - INFO - __main__ - Step 35432: {'lr': 0.00043964927143069955, 'samples': 6802944, 'steps': 35431, 'loss/train': 1.2933154106140137} -11/07/2021 02:13:44 - INFO - __main__ - Step 35433: {'lr': 0.0004396458137255126, 'samples': 6803136, 'steps': 35432, 'loss/train': 1.6630334854125977} -11/07/2021 02:13:45 - INFO - __main__ - Step 35434: {'lr': 0.0004396423559348742, 'samples': 6803328, 'steps': 35433, 'loss/train': 1.2026915550231934} -11/07/2021 02:13:46 - INFO - __main__ - Step 35435: {'lr': 0.0004396388980587859, 'samples': 6803520, 'steps': 35434, 'loss/train': 1.7204598188400269} -11/07/2021 02:13:46 - INFO - __main__ - Step 35436: {'lr': 0.0004396354400972492, 'samples': 6803712, 'steps': 35435, 'loss/train': 1.4436103105545044} -11/07/2021 02:13:46 - INFO - __main__ - Step 35437: {'lr': 0.0004396319820502657, 'samples': 6803904, 'steps': 35436, 'loss/train': 1.448534607887268} -11/07/2021 02:13:47 - INFO - __main__ - Step 35438: {'lr': 0.000439628523917837, 'samples': 6804096, 'steps': 35437, 'loss/train': 1.177272915840149} -11/07/2021 02:13:47 - INFO - __main__ - Step 35439: {'lr': 0.0004396250656999646, 'samples': 6804288, 'steps': 35438, 'loss/train': 1.060101866722107} -11/07/2021 02:13:48 - INFO - __main__ - Step 35440: {'lr': 0.00043962160739665, 'samples': 6804480, 'steps': 35439, 'loss/train': 1.3558481931686401} -11/07/2021 02:13:49 - INFO - __main__ - Step 35441: {'lr': 0.0004396181490078949, 'samples': 6804672, 'steps': 35440, 'loss/train': 1.5725367069244385} -11/07/2021 02:13:49 - INFO - __main__ - Step 35442: {'lr': 0.0004396146905337008, 'samples': 6804864, 'steps': 35441, 'loss/train': 1.5690183639526367} -11/07/2021 02:13:49 - INFO - __main__ - Step 35443: {'lr': 0.0004396112319740692, 'samples': 6805056, 'steps': 35442, 'loss/train': 1.7257599830627441} -11/07/2021 02:13:50 - INFO - __main__ - Step 35444: {'lr': 0.0004396077733290017, 'samples': 6805248, 'steps': 35443, 'loss/train': 1.7161669731140137} -11/07/2021 02:13:50 - INFO - __main__ - Step 35445: {'lr': 0.00043960431459849993, 'samples': 6805440, 'steps': 35444, 'loss/train': 2.2584564685821533} -11/07/2021 02:13:51 - INFO - __main__ - Step 35446: {'lr': 0.00043960085578256537, 'samples': 6805632, 'steps': 35445, 'loss/train': 1.974791407585144} -11/07/2021 02:13:51 - INFO - __main__ - Step 35447: {'lr': 0.0004395973968811995, 'samples': 6805824, 'steps': 35446, 'loss/train': 1.463413119316101} -11/07/2021 02:13:52 - INFO - __main__ - Step 35448: {'lr': 0.00043959393789440407, 'samples': 6806016, 'steps': 35447, 'loss/train': 2.0213165283203125} -11/07/2021 02:13:52 - INFO - __main__ - Step 35449: {'lr': 0.0004395904788221805, 'samples': 6806208, 'steps': 35448, 'loss/train': 1.3373453617095947} -11/07/2021 02:13:52 - INFO - __main__ - Step 35450: {'lr': 0.00043958701966453033, 'samples': 6806400, 'steps': 35449, 'loss/train': 1.6128551959991455} -11/07/2021 02:13:53 - INFO - __main__ - Step 35451: {'lr': 0.00043958356042145524, 'samples': 6806592, 'steps': 35450, 'loss/train': 1.284608244895935} -11/07/2021 02:13:54 - INFO - __main__ - Step 35452: {'lr': 0.0004395801010929567, 'samples': 6806784, 'steps': 35451, 'loss/train': 0.7865902185440063} -11/07/2021 02:13:54 - INFO - __main__ - Step 35453: {'lr': 0.0004395766416790363, 'samples': 6806976, 'steps': 35452, 'loss/train': 0.9731584787368774} -11/07/2021 02:13:54 - INFO - __main__ - Step 35454: {'lr': 0.0004395731821796956, 'samples': 6807168, 'steps': 35453, 'loss/train': 1.5661472082138062} -11/07/2021 02:13:55 - INFO - __main__ - Step 35455: {'lr': 0.00043956972259493615, 'samples': 6807360, 'steps': 35454, 'loss/train': 1.5036189556121826} -11/07/2021 02:13:56 - INFO - __main__ - Step 35456: {'lr': 0.0004395662629247595, 'samples': 6807552, 'steps': 35455, 'loss/train': 1.6254386901855469} -11/07/2021 02:13:56 - INFO - __main__ - Step 35457: {'lr': 0.0004395628031691672, 'samples': 6807744, 'steps': 35456, 'loss/train': 1.3540188074111938} -11/07/2021 02:13:57 - INFO - __main__ - Step 35458: {'lr': 0.00043955934332816083, 'samples': 6807936, 'steps': 35457, 'loss/train': 0.7331323623657227} -11/07/2021 02:13:57 - INFO - __main__ - Step 35459: {'lr': 0.00043955588340174195, 'samples': 6808128, 'steps': 35458, 'loss/train': 2.366567373275757} -11/07/2021 02:13:57 - INFO - __main__ - Step 35460: {'lr': 0.00043955242338991217, 'samples': 6808320, 'steps': 35459, 'loss/train': 0.8286648988723755} -11/07/2021 02:13:58 - INFO - __main__ - Step 35461: {'lr': 0.0004395489632926729, 'samples': 6808512, 'steps': 35460, 'loss/train': 1.2756918668746948} -11/07/2021 02:13:59 - INFO - __main__ - Step 35462: {'lr': 0.0004395455031100258, 'samples': 6808704, 'steps': 35461, 'loss/train': 0.8456819653511047} -11/07/2021 02:13:59 - INFO - __main__ - Step 35463: {'lr': 0.0004395420428419725, 'samples': 6808896, 'steps': 35462, 'loss/train': 1.4862419366836548} -11/07/2021 02:14:00 - INFO - __main__ - Step 35464: {'lr': 0.0004395385824885144, 'samples': 6809088, 'steps': 35463, 'loss/train': 1.42411208152771} -11/07/2021 02:14:00 - INFO - __main__ - Step 35465: {'lr': 0.0004395351220496532, 'samples': 6809280, 'steps': 35464, 'loss/train': 1.655928611755371} -11/07/2021 02:14:00 - INFO - __main__ - Step 35466: {'lr': 0.00043953166152539035, 'samples': 6809472, 'steps': 35465, 'loss/train': 1.353151559829712} -11/07/2021 02:14:01 - INFO - __main__ - Step 35467: {'lr': 0.00043952820091572753, 'samples': 6809664, 'steps': 35466, 'loss/train': 1.1998428106307983} -11/07/2021 02:14:02 - INFO - __main__ - Step 35468: {'lr': 0.0004395247402206662, 'samples': 6809856, 'steps': 35467, 'loss/train': 1.4462324380874634} -11/07/2021 02:14:02 - INFO - __main__ - Step 35469: {'lr': 0.0004395212794402079, 'samples': 6810048, 'steps': 35468, 'loss/train': 1.8410362005233765} -11/07/2021 02:14:02 - INFO - __main__ - Step 35470: {'lr': 0.00043951781857435424, 'samples': 6810240, 'steps': 35469, 'loss/train': 1.621268391609192} -11/07/2021 02:14:03 - INFO - __main__ - Step 35471: {'lr': 0.00043951435762310686, 'samples': 6810432, 'steps': 35470, 'loss/train': 1.4175527095794678} -11/07/2021 02:14:04 - INFO - __main__ - Step 35472: {'lr': 0.0004395108965864671, 'samples': 6810624, 'steps': 35471, 'loss/train': 1.7941079139709473} -11/07/2021 02:14:04 - INFO - __main__ - Step 35473: {'lr': 0.00043950743546443676, 'samples': 6810816, 'steps': 35472, 'loss/train': 1.252071738243103} -11/07/2021 02:14:04 - INFO - __main__ - Step 35474: {'lr': 0.0004395039742570173, 'samples': 6811008, 'steps': 35473, 'loss/train': 1.4083306789398193} -11/07/2021 02:14:05 - INFO - __main__ - Step 35475: {'lr': 0.00043950051296421023, 'samples': 6811200, 'steps': 35474, 'loss/train': 1.6213352680206299} -11/07/2021 02:14:05 - INFO - __main__ - Step 35476: {'lr': 0.00043949705158601715, 'samples': 6811392, 'steps': 35475, 'loss/train': 1.4592680931091309} -11/07/2021 02:14:06 - INFO - __main__ - Step 35477: {'lr': 0.00043949359012243963, 'samples': 6811584, 'steps': 35476, 'loss/train': 2.0029690265655518} -11/07/2021 02:14:06 - INFO - __main__ - Step 35478: {'lr': 0.00043949012857347924, 'samples': 6811776, 'steps': 35477, 'loss/train': 1.3724820613861084} -11/07/2021 02:14:07 - INFO - __main__ - Step 35479: {'lr': 0.0004394866669391375, 'samples': 6811968, 'steps': 35478, 'loss/train': 1.372178077697754} -11/07/2021 02:14:07 - INFO - __main__ - Step 35480: {'lr': 0.00043948320521941596, 'samples': 6812160, 'steps': 35479, 'loss/train': 1.7159295082092285} -11/07/2021 02:14:08 - INFO - __main__ - Step 35481: {'lr': 0.00043947974341431627, 'samples': 6812352, 'steps': 35480, 'loss/train': 1.0123029947280884} -11/07/2021 02:14:08 - INFO - __main__ - Step 35482: {'lr': 0.0004394762815238399, 'samples': 6812544, 'steps': 35481, 'loss/train': 1.3081108331680298} -11/07/2021 02:14:09 - INFO - __main__ - Step 35483: {'lr': 0.00043947281954798844, 'samples': 6812736, 'steps': 35482, 'loss/train': 1.5746831893920898} -11/07/2021 02:14:09 - INFO - __main__ - Step 35484: {'lr': 0.0004394693574867635, 'samples': 6812928, 'steps': 35483, 'loss/train': 1.6583791971206665} -11/07/2021 02:14:10 - INFO - __main__ - Step 35485: {'lr': 0.0004394658953401666, 'samples': 6813120, 'steps': 35484, 'loss/train': 1.2911481857299805} -11/07/2021 02:14:10 - INFO - __main__ - Step 35486: {'lr': 0.0004394624331081992, 'samples': 6813312, 'steps': 35485, 'loss/train': 1.4848313331604004} -11/07/2021 02:14:10 - INFO - __main__ - Step 35487: {'lr': 0.00043945897079086295, 'samples': 6813504, 'steps': 35486, 'loss/train': 1.6941444873809814} -11/07/2021 02:14:12 - INFO - __main__ - Step 35488: {'lr': 0.00043945550838815953, 'samples': 6813696, 'steps': 35487, 'loss/train': 1.4050376415252686} -11/07/2021 02:14:12 - INFO - __main__ - Step 35489: {'lr': 0.00043945204590009027, 'samples': 6813888, 'steps': 35488, 'loss/train': 1.667410969734192} -11/07/2021 02:14:12 - INFO - __main__ - Step 35490: {'lr': 0.0004394485833266569, 'samples': 6814080, 'steps': 35489, 'loss/train': 5.882075309753418} -11/07/2021 02:14:13 - INFO - __main__ - Step 35491: {'lr': 0.0004394451206678609, 'samples': 6814272, 'steps': 35490, 'loss/train': 1.7875516414642334} -11/07/2021 02:14:13 - INFO - __main__ - Step 35492: {'lr': 0.00043944165792370385, 'samples': 6814464, 'steps': 35491, 'loss/train': 1.8067296743392944} -11/07/2021 02:14:14 - INFO - __main__ - Step 35493: {'lr': 0.00043943819509418723, 'samples': 6814656, 'steps': 35492, 'loss/train': 0.9062034487724304} -11/07/2021 02:14:14 - INFO - __main__ - Step 35494: {'lr': 0.00043943473217931283, 'samples': 6814848, 'steps': 35493, 'loss/train': 1.8187721967697144} -11/07/2021 02:14:15 - INFO - __main__ - Step 35495: {'lr': 0.0004394312691790821, 'samples': 6815040, 'steps': 35494, 'loss/train': 1.4220510721206665} -11/07/2021 02:14:15 - INFO - __main__ - Step 35496: {'lr': 0.00043942780609349636, 'samples': 6815232, 'steps': 35495, 'loss/train': 1.5365619659423828} -11/07/2021 02:14:16 - INFO - __main__ - Step 35497: {'lr': 0.0004394243429225575, 'samples': 6815424, 'steps': 35496, 'loss/train': 1.6511274576187134} -11/07/2021 02:14:16 - INFO - __main__ - Step 35498: {'lr': 0.0004394208796662669, 'samples': 6815616, 'steps': 35497, 'loss/train': 0.9219018816947937} -11/07/2021 02:14:17 - INFO - __main__ - Step 35499: {'lr': 0.00043941741632462625, 'samples': 6815808, 'steps': 35498, 'loss/train': 1.7441105842590332} -11/07/2021 02:14:17 - INFO - __main__ - Step 35500: {'lr': 0.000439413952897637, 'samples': 6816000, 'steps': 35499, 'loss/train': 1.183741569519043} -11/07/2021 02:14:18 - INFO - __main__ - Step 35501: {'lr': 0.0004394104893853007, 'samples': 6816192, 'steps': 35500, 'loss/train': 0.7865248918533325} -11/07/2021 02:14:18 - INFO - __main__ - Step 35502: {'lr': 0.00043940702578761906, 'samples': 6816384, 'steps': 35501, 'loss/train': 1.31686532497406} -11/07/2021 02:14:19 - INFO - __main__ - Step 35503: {'lr': 0.00043940356210459344, 'samples': 6816576, 'steps': 35502, 'loss/train': 1.5352532863616943} -11/07/2021 02:14:19 - INFO - __main__ - Step 35504: {'lr': 0.0004394000983362255, 'samples': 6816768, 'steps': 35503, 'loss/train': 1.7768218517303467} -11/07/2021 02:14:20 - INFO - __main__ - Step 35505: {'lr': 0.0004393966344825168, 'samples': 6816960, 'steps': 35504, 'loss/train': 2.8831872940063477} -11/07/2021 02:14:20 - INFO - __main__ - Step 35506: {'lr': 0.00043939317054346894, 'samples': 6817152, 'steps': 35505, 'loss/train': 1.364589810371399} -11/07/2021 02:14:20 - INFO - __main__ - Step 35507: {'lr': 0.00043938970651908346, 'samples': 6817344, 'steps': 35506, 'loss/train': 1.6305081844329834} -11/07/2021 02:14:21 - INFO - __main__ - Step 35508: {'lr': 0.0004393862424093619, 'samples': 6817536, 'steps': 35507, 'loss/train': 1.354570746421814} -11/07/2021 02:14:22 - INFO - __main__ - Step 35509: {'lr': 0.0004393827782143057, 'samples': 6817728, 'steps': 35508, 'loss/train': 1.7895361185073853} -11/07/2021 02:14:22 - INFO - __main__ - Step 35510: {'lr': 0.00043937931393391667, 'samples': 6817920, 'steps': 35509, 'loss/train': 2.0235912799835205} -11/07/2021 02:14:22 - INFO - __main__ - Step 35511: {'lr': 0.0004393758495681962, 'samples': 6818112, 'steps': 35510, 'loss/train': 1.6815040111541748} -11/07/2021 02:14:23 - INFO - __main__ - Step 35512: {'lr': 0.0004393723851171459, 'samples': 6818304, 'steps': 35511, 'loss/train': 2.5056517124176025} -11/07/2021 02:14:23 - INFO - __main__ - Step 35513: {'lr': 0.0004393689205807673, 'samples': 6818496, 'steps': 35512, 'loss/train': 0.8651651740074158} -11/07/2021 02:14:24 - INFO - __main__ - Step 35514: {'lr': 0.00043936545595906206, 'samples': 6818688, 'steps': 35513, 'loss/train': 1.3810594081878662} -11/07/2021 02:14:25 - INFO - __main__ - Step 35515: {'lr': 0.00043936199125203156, 'samples': 6818880, 'steps': 35514, 'loss/train': 1.0598888397216797} -11/07/2021 02:14:25 - INFO - __main__ - Step 35516: {'lr': 0.00043935852645967755, 'samples': 6819072, 'steps': 35515, 'loss/train': 1.621749997138977} -11/07/2021 02:14:25 - INFO - __main__ - Step 35517: {'lr': 0.00043935506158200143, 'samples': 6819264, 'steps': 35516, 'loss/train': 1.2624260187149048} -11/07/2021 02:14:26 - INFO - __main__ - Step 35518: {'lr': 0.000439351596619005, 'samples': 6819456, 'steps': 35517, 'loss/train': 1.732316493988037} -11/07/2021 02:14:27 - INFO - __main__ - Step 35519: {'lr': 0.00043934813157068956, 'samples': 6819648, 'steps': 35518, 'loss/train': 0.9514675736427307} -11/07/2021 02:14:27 - INFO - __main__ - Step 35520: {'lr': 0.00043934466643705673, 'samples': 6819840, 'steps': 35519, 'loss/train': 2.08212947845459} -11/07/2021 02:14:27 - INFO - __main__ - Step 35521: {'lr': 0.00043934120121810814, 'samples': 6820032, 'steps': 35520, 'loss/train': 1.5012516975402832} -11/07/2021 02:14:28 - INFO - __main__ - Step 35522: {'lr': 0.0004393377359138454, 'samples': 6820224, 'steps': 35521, 'loss/train': 1.1675945520401} -11/07/2021 02:14:28 - INFO - __main__ - Step 35523: {'lr': 0.00043933427052426986, 'samples': 6820416, 'steps': 35522, 'loss/train': 1.2477281093597412} -11/07/2021 02:14:29 - INFO - __main__ - Step 35524: {'lr': 0.00043933080504938337, 'samples': 6820608, 'steps': 35523, 'loss/train': 1.6102840900421143} -11/07/2021 02:14:29 - INFO - __main__ - Step 35525: {'lr': 0.00043932733948918724, 'samples': 6820800, 'steps': 35524, 'loss/train': 0.9736477136611938} -11/07/2021 02:14:30 - INFO - __main__ - Step 35526: {'lr': 0.0004393238738436832, 'samples': 6820992, 'steps': 35525, 'loss/train': 1.7441880702972412} -11/07/2021 02:14:30 - INFO - __main__ - Step 35527: {'lr': 0.00043932040811287264, 'samples': 6821184, 'steps': 35526, 'loss/train': 1.398417353630066} -11/07/2021 02:14:30 - INFO - __main__ - Step 35528: {'lr': 0.0004393169422967573, 'samples': 6821376, 'steps': 35527, 'loss/train': 1.6070457696914673} -11/07/2021 02:14:31 - INFO - __main__ - Step 35529: {'lr': 0.0004393134763953387, 'samples': 6821568, 'steps': 35528, 'loss/train': 1.5105087757110596} -11/07/2021 02:14:32 - INFO - __main__ - Step 35530: {'lr': 0.00043931001040861835, 'samples': 6821760, 'steps': 35529, 'loss/train': 1.590580701828003} -11/07/2021 02:14:32 - INFO - __main__ - Step 35531: {'lr': 0.00043930654433659775, 'samples': 6821952, 'steps': 35530, 'loss/train': 1.6376655101776123} -11/07/2021 02:14:33 - INFO - __main__ - Step 35532: {'lr': 0.0004393030781792787, 'samples': 6822144, 'steps': 35531, 'loss/train': 1.5782145261764526} -11/07/2021 02:14:33 - INFO - __main__ - Step 35533: {'lr': 0.00043929961193666246, 'samples': 6822336, 'steps': 35532, 'loss/train': 1.3283123970031738} -11/07/2021 02:14:34 - INFO - __main__ - Step 35534: {'lr': 0.0004392961456087508, 'samples': 6822528, 'steps': 35533, 'loss/train': 1.3335016965866089} -11/07/2021 02:14:34 - INFO - __main__ - Step 35535: {'lr': 0.00043929267919554516, 'samples': 6822720, 'steps': 35534, 'loss/train': 0.9739982485771179} -11/07/2021 02:14:35 - INFO - __main__ - Step 35536: {'lr': 0.00043928921269704725, 'samples': 6822912, 'steps': 35535, 'loss/train': 1.3560470342636108} -11/07/2021 02:14:35 - INFO - __main__ - Step 35537: {'lr': 0.00043928574611325845, 'samples': 6823104, 'steps': 35536, 'loss/train': 2.5706093311309814} -11/07/2021 02:14:35 - INFO - __main__ - Step 35538: {'lr': 0.00043928227944418046, 'samples': 6823296, 'steps': 35537, 'loss/train': 0.8618325591087341} -11/07/2021 02:14:36 - INFO - __main__ - Step 35539: {'lr': 0.00043927881268981484, 'samples': 6823488, 'steps': 35538, 'loss/train': 1.1628984212875366} -11/07/2021 02:14:37 - INFO - __main__ - Step 35540: {'lr': 0.00043927534585016305, 'samples': 6823680, 'steps': 35539, 'loss/train': 1.6144016981124878} -11/07/2021 02:14:37 - INFO - __main__ - Step 35541: {'lr': 0.0004392718789252267, 'samples': 6823872, 'steps': 35540, 'loss/train': 1.7553297281265259} -11/07/2021 02:14:37 - INFO - __main__ - Step 35542: {'lr': 0.0004392684119150074, 'samples': 6824064, 'steps': 35541, 'loss/train': 1.8475892543792725} -11/07/2021 02:14:38 - INFO - __main__ - Step 35543: {'lr': 0.0004392649448195066, 'samples': 6824256, 'steps': 35542, 'loss/train': 1.538231372833252} -11/07/2021 02:14:38 - INFO - __main__ - Step 35544: {'lr': 0.000439261477638726, 'samples': 6824448, 'steps': 35543, 'loss/train': 1.5907025337219238} -11/07/2021 02:14:39 - INFO - __main__ - Step 35545: {'lr': 0.0004392580103726671, 'samples': 6824640, 'steps': 35544, 'loss/train': 1.6743935346603394} -11/07/2021 02:14:39 - INFO - __main__ - Step 35546: {'lr': 0.0004392545430213315, 'samples': 6824832, 'steps': 35545, 'loss/train': 1.476622462272644} -11/07/2021 02:14:40 - INFO - __main__ - Step 35547: {'lr': 0.00043925107558472065, 'samples': 6825024, 'steps': 35546, 'loss/train': 1.8071759939193726} -11/07/2021 02:14:40 - INFO - __main__ - Step 35548: {'lr': 0.0004392476080628363, 'samples': 6825216, 'steps': 35547, 'loss/train': 1.7994885444641113} -11/07/2021 02:14:40 - INFO - __main__ - Step 35549: {'lr': 0.00043924414045567973, 'samples': 6825408, 'steps': 35548, 'loss/train': 1.926434874534607} -11/07/2021 02:14:41 - INFO - __main__ - Step 35550: {'lr': 0.00043924067276325274, 'samples': 6825600, 'steps': 35549, 'loss/train': 1.4588193893432617} -11/07/2021 02:14:42 - INFO - __main__ - Step 35551: {'lr': 0.0004392372049855569, 'samples': 6825792, 'steps': 35550, 'loss/train': 1.6992769241333008} -11/07/2021 02:14:42 - INFO - __main__ - Step 35552: {'lr': 0.0004392337371225936, 'samples': 6825984, 'steps': 35551, 'loss/train': 1.381164312362671} -11/07/2021 02:14:43 - INFO - __main__ - Step 35553: {'lr': 0.0004392302691743645, 'samples': 6826176, 'steps': 35552, 'loss/train': 1.5796421766281128} -11/07/2021 02:14:43 - INFO - __main__ - Step 35554: {'lr': 0.0004392268011408712, 'samples': 6826368, 'steps': 35553, 'loss/train': 1.6246516704559326} -11/07/2021 02:14:44 - INFO - __main__ - Step 35555: {'lr': 0.0004392233330221152, 'samples': 6826560, 'steps': 35554, 'loss/train': 0.7908975481987} -11/07/2021 02:14:44 - INFO - __main__ - Step 35556: {'lr': 0.0004392198648180981, 'samples': 6826752, 'steps': 35555, 'loss/train': 1.2291918992996216} -11/07/2021 02:14:45 - INFO - __main__ - Step 35557: {'lr': 0.0004392163965288215, 'samples': 6826944, 'steps': 35556, 'loss/train': 1.5592041015625} -11/07/2021 02:14:45 - INFO - __main__ - Step 35558: {'lr': 0.0004392129281542868, 'samples': 6827136, 'steps': 35557, 'loss/train': 1.6843079328536987} -11/07/2021 02:14:45 - INFO - __main__ - Step 35559: {'lr': 0.00043920945969449577, 'samples': 6827328, 'steps': 35558, 'loss/train': 1.2580102682113647} -11/07/2021 02:14:46 - INFO - __main__ - Step 35560: {'lr': 0.0004392059911494498, 'samples': 6827520, 'steps': 35559, 'loss/train': 1.5198917388916016} -11/07/2021 02:14:47 - INFO - __main__ - Step 35561: {'lr': 0.0004392025225191506, 'samples': 6827712, 'steps': 35560, 'loss/train': 1.4956892728805542} -11/07/2021 02:14:47 - INFO - __main__ - Step 35562: {'lr': 0.0004391990538035996, 'samples': 6827904, 'steps': 35561, 'loss/train': 1.6502302885055542} -11/07/2021 02:14:48 - INFO - __main__ - Step 35563: {'lr': 0.00043919558500279845, 'samples': 6828096, 'steps': 35562, 'loss/train': 1.2379157543182373} -11/07/2021 02:14:48 - INFO - __main__ - Step 35564: {'lr': 0.0004391921161167487, 'samples': 6828288, 'steps': 35563, 'loss/train': 1.503430962562561} -11/07/2021 02:14:49 - INFO - __main__ - Step 35565: {'lr': 0.00043918864714545194, 'samples': 6828480, 'steps': 35564, 'loss/train': 1.0588741302490234} -11/07/2021 02:14:49 - INFO - __main__ - Step 35566: {'lr': 0.00043918517808890964, 'samples': 6828672, 'steps': 35565, 'loss/train': 2.0430285930633545} -11/07/2021 02:14:50 - INFO - __main__ - Step 35567: {'lr': 0.0004391817089471234, 'samples': 6828864, 'steps': 35566, 'loss/train': 0.12924258410930634} -11/07/2021 02:14:50 - INFO - __main__ - Step 35568: {'lr': 0.0004391782397200949, 'samples': 6829056, 'steps': 35567, 'loss/train': 0.8577550053596497} -11/07/2021 02:14:50 - INFO - __main__ - Step 35569: {'lr': 0.0004391747704078255, 'samples': 6829248, 'steps': 35568, 'loss/train': 2.1193783283233643} -11/07/2021 02:14:51 - INFO - __main__ - Step 35570: {'lr': 0.0004391713010103169, 'samples': 6829440, 'steps': 35569, 'loss/train': 1.119254469871521} -11/07/2021 02:14:52 - INFO - __main__ - Step 35571: {'lr': 0.0004391678315275706, 'samples': 6829632, 'steps': 35570, 'loss/train': 1.577763557434082} -11/07/2021 02:14:52 - INFO - __main__ - Step 35572: {'lr': 0.00043916436195958825, 'samples': 6829824, 'steps': 35571, 'loss/train': 1.3878240585327148} -11/07/2021 02:14:52 - INFO - __main__ - Step 35573: {'lr': 0.00043916089230637133, 'samples': 6830016, 'steps': 35572, 'loss/train': 1.3805381059646606} -11/07/2021 02:14:53 - INFO - __main__ - Step 35574: {'lr': 0.0004391574225679215, 'samples': 6830208, 'steps': 35573, 'loss/train': 1.2656093835830688} -11/07/2021 02:14:53 - INFO - __main__ - Step 35575: {'lr': 0.0004391539527442401, 'samples': 6830400, 'steps': 35574, 'loss/train': 1.359189510345459} -11/07/2021 02:14:55 - INFO - __main__ - Step 35576: {'lr': 0.000439150482835329, 'samples': 6830592, 'steps': 35575, 'loss/train': 1.4779083728790283} -11/07/2021 02:14:55 - INFO - __main__ - Step 35577: {'lr': 0.0004391470128411895, 'samples': 6830784, 'steps': 35576, 'loss/train': 1.0927032232284546} -11/07/2021 02:14:55 - INFO - __main__ - Step 35578: {'lr': 0.00043914354276182335, 'samples': 6830976, 'steps': 35577, 'loss/train': 1.5809870958328247} -11/07/2021 02:14:56 - INFO - __main__ - Step 35579: {'lr': 0.00043914007259723196, 'samples': 6831168, 'steps': 35578, 'loss/train': 0.13724112510681152} -11/07/2021 02:14:56 - INFO - __main__ - Step 35580: {'lr': 0.000439136602347417, 'samples': 6831360, 'steps': 35579, 'loss/train': 0.6508349180221558} -11/07/2021 02:14:57 - INFO - __main__ - Step 35581: {'lr': 0.00043913313201238017, 'samples': 6831552, 'steps': 35580, 'loss/train': 1.9046825170516968} -11/07/2021 02:14:57 - INFO - __main__ - Step 35582: {'lr': 0.00043912966159212263, 'samples': 6831744, 'steps': 35581, 'loss/train': 1.856600284576416} -11/07/2021 02:14:58 - INFO - __main__ - Step 35583: {'lr': 0.0004391261910866463, 'samples': 6831936, 'steps': 35582, 'loss/train': 1.4237700700759888} -11/07/2021 02:14:58 - INFO - __main__ - Step 35584: {'lr': 0.0004391227204959526, 'samples': 6832128, 'steps': 35583, 'loss/train': 1.4016250371932983} -11/07/2021 02:14:59 - INFO - __main__ - Step 35585: {'lr': 0.00043911924982004315, 'samples': 6832320, 'steps': 35584, 'loss/train': 1.6603078842163086} -11/07/2021 02:15:00 - INFO - __main__ - Step 35586: {'lr': 0.0004391157790589195, 'samples': 6832512, 'steps': 35585, 'loss/train': 1.489089012145996} -11/07/2021 02:15:00 - INFO - __main__ - Step 35587: {'lr': 0.00043911230821258313, 'samples': 6832704, 'steps': 35586, 'loss/train': 1.623017430305481} -11/07/2021 02:15:00 - INFO - __main__ - Step 35588: {'lr': 0.00043910883728103575, 'samples': 6832896, 'steps': 35587, 'loss/train': 1.4644653797149658} -11/07/2021 02:15:01 - INFO - __main__ - Step 35589: {'lr': 0.0004391053662642788, 'samples': 6833088, 'steps': 35588, 'loss/train': 0.9706271290779114} -11/07/2021 02:15:01 - INFO - __main__ - Step 35590: {'lr': 0.00043910189516231386, 'samples': 6833280, 'steps': 35589, 'loss/train': 1.742411732673645} -11/07/2021 02:15:02 - INFO - __main__ - Step 35591: {'lr': 0.00043909842397514255, 'samples': 6833472, 'steps': 35590, 'loss/train': 1.5278904438018799} -11/07/2021 02:15:02 - INFO - __main__ - Step 35592: {'lr': 0.00043909495270276646, 'samples': 6833664, 'steps': 35591, 'loss/train': 1.4585014581680298} -11/07/2021 02:15:03 - INFO - __main__ - Step 35593: {'lr': 0.00043909148134518703, 'samples': 6833856, 'steps': 35592, 'loss/train': 1.5156004428863525} -11/07/2021 02:15:03 - INFO - __main__ - Step 35594: {'lr': 0.0004390880099024059, 'samples': 6834048, 'steps': 35593, 'loss/train': 0.9020565748214722} -11/07/2021 02:15:03 - INFO - __main__ - Step 35595: {'lr': 0.00043908453837442464, 'samples': 6834240, 'steps': 35594, 'loss/train': 1.130458950996399} -11/07/2021 02:15:04 - INFO - __main__ - Step 35596: {'lr': 0.0004390810667612448, 'samples': 6834432, 'steps': 35595, 'loss/train': 0.2694261968135834} -11/07/2021 02:15:05 - INFO - __main__ - Step 35597: {'lr': 0.00043907759506286797, 'samples': 6834624, 'steps': 35596, 'loss/train': 0.9140653610229492} -11/07/2021 02:15:05 - INFO - __main__ - Step 35598: {'lr': 0.00043907412327929575, 'samples': 6834816, 'steps': 35597, 'loss/train': 1.7793086767196655} -11/07/2021 02:15:06 - INFO - __main__ - Step 35599: {'lr': 0.00043907065141052953, 'samples': 6835008, 'steps': 35598, 'loss/train': 0.11254219710826874} -11/07/2021 02:15:06 - INFO - __main__ - Step 35600: {'lr': 0.00043906717945657104, 'samples': 6835200, 'steps': 35599, 'loss/train': 1.2892582416534424} -11/07/2021 02:15:07 - INFO - __main__ - Step 35601: {'lr': 0.00043906370741742185, 'samples': 6835392, 'steps': 35600, 'loss/train': 1.770271897315979} -11/07/2021 02:15:07 - INFO - __main__ - Step 35602: {'lr': 0.0004390602352930834, 'samples': 6835584, 'steps': 35601, 'loss/train': 6.062001705169678} -11/07/2021 02:15:08 - INFO - __main__ - Step 35603: {'lr': 0.00043905676308355734, 'samples': 6835776, 'steps': 35602, 'loss/train': 1.4519600868225098} -11/07/2021 02:15:08 - INFO - __main__ - Step 35604: {'lr': 0.00043905329078884527, 'samples': 6835968, 'steps': 35603, 'loss/train': 0.758042573928833} -11/07/2021 02:15:08 - INFO - __main__ - Step 35605: {'lr': 0.00043904981840894863, 'samples': 6836160, 'steps': 35604, 'loss/train': 1.488784670829773} -11/07/2021 02:15:09 - INFO - __main__ - Step 35606: {'lr': 0.0004390463459438691, 'samples': 6836352, 'steps': 35605, 'loss/train': 1.6607863903045654} -11/07/2021 02:15:10 - INFO - __main__ - Step 35607: {'lr': 0.0004390428733936082, 'samples': 6836544, 'steps': 35606, 'loss/train': 0.6637961268424988} -11/07/2021 02:15:10 - INFO - __main__ - Step 35608: {'lr': 0.0004390394007581675, 'samples': 6836736, 'steps': 35607, 'loss/train': 1.5490474700927734} -11/07/2021 02:15:10 - INFO - __main__ - Step 35609: {'lr': 0.00043903592803754856, 'samples': 6836928, 'steps': 35608, 'loss/train': 1.330698013305664} -11/07/2021 02:15:11 - INFO - __main__ - Step 35610: {'lr': 0.00043903245523175296, 'samples': 6837120, 'steps': 35609, 'loss/train': 1.4494189023971558} -11/07/2021 02:15:11 - INFO - __main__ - Step 35611: {'lr': 0.00043902898234078223, 'samples': 6837312, 'steps': 35610, 'loss/train': 1.6454213857650757} -11/07/2021 02:15:13 - INFO - __main__ - Step 35612: {'lr': 0.000439025509364638, 'samples': 6837504, 'steps': 35611, 'loss/train': 1.4363117218017578} -11/07/2021 02:15:13 - INFO - __main__ - Step 35613: {'lr': 0.0004390220363033217, 'samples': 6837696, 'steps': 35612, 'loss/train': 1.6490654945373535} -11/07/2021 02:15:13 - INFO - __main__ - Step 35614: {'lr': 0.0004390185631568351, 'samples': 6837888, 'steps': 35613, 'loss/train': 1.2435897588729858} -11/07/2021 02:15:14 - INFO - __main__ - Step 35615: {'lr': 0.00043901508992517956, 'samples': 6838080, 'steps': 35614, 'loss/train': 0.969472348690033} -11/07/2021 02:15:14 - INFO - __main__ - Step 35616: {'lr': 0.0004390116166083568, 'samples': 6838272, 'steps': 35615, 'loss/train': 0.3451453149318695} -11/07/2021 02:15:14 - INFO - __main__ - Step 35617: {'lr': 0.00043900814320636827, 'samples': 6838464, 'steps': 35616, 'loss/train': 1.7469807863235474} -11/07/2021 02:15:15 - INFO - __main__ - Step 35618: {'lr': 0.00043900466971921563, 'samples': 6838656, 'steps': 35617, 'loss/train': 0.8231580853462219} -11/07/2021 02:15:16 - INFO - __main__ - Step 35619: {'lr': 0.00043900119614690043, 'samples': 6838848, 'steps': 35618, 'loss/train': 1.0175918340682983} -11/07/2021 02:15:16 - INFO - __main__ - Step 35620: {'lr': 0.00043899772248942413, 'samples': 6839040, 'steps': 35619, 'loss/train': 1.2768357992172241} -11/07/2021 02:15:16 - INFO - __main__ - Step 35621: {'lr': 0.0004389942487467884, 'samples': 6839232, 'steps': 35620, 'loss/train': 1.4337198734283447} -11/07/2021 02:15:17 - INFO - __main__ - Step 35622: {'lr': 0.00043899077491899485, 'samples': 6839424, 'steps': 35621, 'loss/train': 1.788061261177063} -11/07/2021 02:15:18 - INFO - __main__ - Step 35623: {'lr': 0.0004389873010060449, 'samples': 6839616, 'steps': 35622, 'loss/train': 0.8303018808364868} -11/07/2021 02:15:18 - INFO - __main__ - Step 35624: {'lr': 0.00043898382700794015, 'samples': 6839808, 'steps': 35623, 'loss/train': 1.1721681356430054} -11/07/2021 02:15:18 - INFO - __main__ - Step 35625: {'lr': 0.0004389803529246823, 'samples': 6840000, 'steps': 35624, 'loss/train': 1.319284439086914} -11/07/2021 02:15:19 - INFO - __main__ - Step 35626: {'lr': 0.00043897687875627277, 'samples': 6840192, 'steps': 35625, 'loss/train': 1.1438817977905273} -11/07/2021 02:15:19 - INFO - __main__ - Step 35627: {'lr': 0.00043897340450271317, 'samples': 6840384, 'steps': 35626, 'loss/train': 1.2990198135375977} -11/07/2021 02:15:20 - INFO - __main__ - Step 35628: {'lr': 0.0004389699301640051, 'samples': 6840576, 'steps': 35627, 'loss/train': 1.5525676012039185} -11/07/2021 02:15:21 - INFO - __main__ - Step 35629: {'lr': 0.00043896645574015004, 'samples': 6840768, 'steps': 35628, 'loss/train': 2.9011871814727783} -11/07/2021 02:15:21 - INFO - __main__ - Step 35630: {'lr': 0.00043896298123114965, 'samples': 6840960, 'steps': 35629, 'loss/train': 1.5629982948303223} -11/07/2021 02:15:21 - INFO - __main__ - Step 35631: {'lr': 0.00043895950663700546, 'samples': 6841152, 'steps': 35630, 'loss/train': 1.5904690027236938} -11/07/2021 02:15:22 - INFO - __main__ - Step 35632: {'lr': 0.000438956031957719, 'samples': 6841344, 'steps': 35631, 'loss/train': 1.8988369703292847} -11/07/2021 02:15:23 - INFO - __main__ - Step 35633: {'lr': 0.0004389525571932919, 'samples': 6841536, 'steps': 35632, 'loss/train': 1.0826889276504517} -11/07/2021 02:15:23 - INFO - __main__ - Step 35634: {'lr': 0.00043894908234372564, 'samples': 6841728, 'steps': 35633, 'loss/train': 0.31450581550598145} -11/07/2021 02:15:23 - INFO - __main__ - Step 35635: {'lr': 0.0004389456074090219, 'samples': 6841920, 'steps': 35634, 'loss/train': 1.471784234046936} -11/07/2021 02:15:24 - INFO - __main__ - Step 35636: {'lr': 0.0004389421323891822, 'samples': 6842112, 'steps': 35635, 'loss/train': 1.6761291027069092} -11/07/2021 02:15:24 - INFO - __main__ - Step 35637: {'lr': 0.000438938657284208, 'samples': 6842304, 'steps': 35636, 'loss/train': 1.598026990890503} -11/07/2021 02:15:25 - INFO - __main__ - Step 35638: {'lr': 0.000438935182094101, 'samples': 6842496, 'steps': 35637, 'loss/train': 1.366559386253357} -11/07/2021 02:15:25 - INFO - __main__ - Step 35639: {'lr': 0.0004389317068188628, 'samples': 6842688, 'steps': 35638, 'loss/train': 1.5255507230758667} -11/07/2021 02:15:26 - INFO - __main__ - Step 35640: {'lr': 0.0004389282314584948, 'samples': 6842880, 'steps': 35639, 'loss/train': 1.4930880069732666} -11/07/2021 02:15:26 - INFO - __main__ - Step 35641: {'lr': 0.0004389247560129987, 'samples': 6843072, 'steps': 35640, 'loss/train': 1.627358078956604} -11/07/2021 02:15:26 - INFO - __main__ - Step 35642: {'lr': 0.000438921280482376, 'samples': 6843264, 'steps': 35641, 'loss/train': 1.5437060594558716} -11/07/2021 02:15:28 - INFO - __main__ - Step 35643: {'lr': 0.00043891780486662825, 'samples': 6843456, 'steps': 35642, 'loss/train': 1.588767170906067} -11/07/2021 02:15:28 - INFO - __main__ - Step 35644: {'lr': 0.00043891432916575714, 'samples': 6843648, 'steps': 35643, 'loss/train': 1.012986183166504} -11/07/2021 02:15:28 - INFO - __main__ - Step 35645: {'lr': 0.0004389108533797641, 'samples': 6843840, 'steps': 35644, 'loss/train': 1.3460534811019897} -11/07/2021 02:15:29 - INFO - __main__ - Step 35646: {'lr': 0.00043890737750865074, 'samples': 6844032, 'steps': 35645, 'loss/train': 1.658281683921814} -11/07/2021 02:15:29 - INFO - __main__ - Step 35647: {'lr': 0.0004389039015524186, 'samples': 6844224, 'steps': 35646, 'loss/train': 0.9040864109992981} -11/07/2021 02:15:29 - INFO - __main__ - Step 35648: {'lr': 0.0004389004255110693, 'samples': 6844416, 'steps': 35647, 'loss/train': 1.8229610919952393} -11/07/2021 02:15:30 - INFO - __main__ - Step 35649: {'lr': 0.0004388969493846044, 'samples': 6844608, 'steps': 35648, 'loss/train': 5.77647590637207} -11/07/2021 02:15:31 - INFO - __main__ - Step 35650: {'lr': 0.00043889347317302543, 'samples': 6844800, 'steps': 35649, 'loss/train': 1.7431615591049194} -11/07/2021 02:15:31 - INFO - __main__ - Step 35651: {'lr': 0.000438889996876334, 'samples': 6844992, 'steps': 35650, 'loss/train': 0.9316908717155457} -11/07/2021 02:15:31 - INFO - __main__ - Step 35652: {'lr': 0.00043888652049453163, 'samples': 6845184, 'steps': 35651, 'loss/train': 1.656050443649292} -11/07/2021 02:15:32 - INFO - __main__ - Step 35653: {'lr': 0.0004388830440276199, 'samples': 6845376, 'steps': 35652, 'loss/train': 1.6132490634918213} -11/07/2021 02:15:33 - INFO - __main__ - Step 35654: {'lr': 0.0004388795674756004, 'samples': 6845568, 'steps': 35653, 'loss/train': 1.0542579889297485} -11/07/2021 02:15:33 - INFO - __main__ - Step 35655: {'lr': 0.0004388760908384747, 'samples': 6845760, 'steps': 35654, 'loss/train': 1.361189603805542} -11/07/2021 02:15:33 - INFO - __main__ - Step 35656: {'lr': 0.00043887261411624433, 'samples': 6845952, 'steps': 35655, 'loss/train': 1.5127336978912354} -11/07/2021 02:15:34 - INFO - __main__ - Step 35657: {'lr': 0.00043886913730891087, 'samples': 6846144, 'steps': 35656, 'loss/train': 1.7226002216339111} -11/07/2021 02:15:34 - INFO - __main__ - Step 35658: {'lr': 0.00043886566041647593, 'samples': 6846336, 'steps': 35657, 'loss/train': 1.3042670488357544} -11/07/2021 02:15:35 - INFO - __main__ - Step 35659: {'lr': 0.000438862183438941, 'samples': 6846528, 'steps': 35658, 'loss/train': 1.8118523359298706} -11/07/2021 02:15:36 - INFO - __main__ - Step 35660: {'lr': 0.00043885870637630763, 'samples': 6846720, 'steps': 35659, 'loss/train': 1.3242474794387817} -11/07/2021 02:15:36 - INFO - __main__ - Step 35661: {'lr': 0.00043885522922857757, 'samples': 6846912, 'steps': 35660, 'loss/train': 1.9415103197097778} -11/07/2021 02:15:36 - INFO - __main__ - Step 35662: {'lr': 0.00043885175199575216, 'samples': 6847104, 'steps': 35661, 'loss/train': 1.6594187021255493} -11/07/2021 02:15:37 - INFO - __main__ - Step 35663: {'lr': 0.00043884827467783303, 'samples': 6847296, 'steps': 35662, 'loss/train': 1.6623964309692383} -11/07/2021 02:15:37 - INFO - __main__ - Step 35664: {'lr': 0.00043884479727482193, 'samples': 6847488, 'steps': 35663, 'loss/train': 1.5567348003387451} -11/07/2021 02:15:38 - INFO - __main__ - Step 35665: {'lr': 0.00043884131978672014, 'samples': 6847680, 'steps': 35664, 'loss/train': 1.7647892236709595} -11/07/2021 02:15:38 - INFO - __main__ - Step 35666: {'lr': 0.00043883784221352947, 'samples': 6847872, 'steps': 35665, 'loss/train': 1.313801884651184} -11/07/2021 02:15:39 - INFO - __main__ - Step 35667: {'lr': 0.00043883436455525125, 'samples': 6848064, 'steps': 35666, 'loss/train': 1.6134251356124878} -11/07/2021 02:15:39 - INFO - __main__ - Step 35668: {'lr': 0.0004388308868118873, 'samples': 6848256, 'steps': 35667, 'loss/train': 0.6823694109916687} -11/07/2021 02:15:39 - INFO - __main__ - Step 35669: {'lr': 0.00043882740898343905, 'samples': 6848448, 'steps': 35668, 'loss/train': 1.1683130264282227} -11/07/2021 02:15:41 - INFO - __main__ - Step 35670: {'lr': 0.00043882393106990804, 'samples': 6848640, 'steps': 35669, 'loss/train': 1.3475676774978638} -11/07/2021 02:15:41 - INFO - __main__ - Step 35671: {'lr': 0.0004388204530712959, 'samples': 6848832, 'steps': 35670, 'loss/train': 1.5418709516525269} -11/07/2021 02:15:41 - INFO - __main__ - Step 35672: {'lr': 0.0004388169749876042, 'samples': 6849024, 'steps': 35671, 'loss/train': 1.551112174987793} -11/07/2021 02:15:42 - INFO - __main__ - Step 35673: {'lr': 0.0004388134968188344, 'samples': 6849216, 'steps': 35672, 'loss/train': 1.7342904806137085} -11/07/2021 02:15:42 - INFO - __main__ - Step 35674: {'lr': 0.00043881001856498823, 'samples': 6849408, 'steps': 35673, 'loss/train': 1.8497107028961182} -11/07/2021 02:15:43 - INFO - __main__ - Step 35675: {'lr': 0.0004388065402260672, 'samples': 6849600, 'steps': 35674, 'loss/train': 1.751163363456726} -11/07/2021 02:15:43 - INFO - __main__ - Step 35676: {'lr': 0.0004388030618020729, 'samples': 6849792, 'steps': 35675, 'loss/train': 0.6405913233757019} -11/07/2021 02:15:44 - INFO - __main__ - Step 35677: {'lr': 0.0004387995832930067, 'samples': 6849984, 'steps': 35676, 'loss/train': 1.7262928485870361} -11/07/2021 02:15:44 - INFO - __main__ - Step 35678: {'lr': 0.00043879610469887043, 'samples': 6850176, 'steps': 35677, 'loss/train': 1.0168603658676147} -11/07/2021 02:15:44 - INFO - __main__ - Step 35679: {'lr': 0.00043879262601966544, 'samples': 6850368, 'steps': 35678, 'loss/train': 1.1950746774673462} -11/07/2021 02:15:45 - INFO - __main__ - Step 35680: {'lr': 0.00043878914725539356, 'samples': 6850560, 'steps': 35679, 'loss/train': 1.5614596605300903} -11/07/2021 02:15:46 - INFO - __main__ - Step 35681: {'lr': 0.00043878566840605606, 'samples': 6850752, 'steps': 35680, 'loss/train': 0.8708986639976501} -11/07/2021 02:15:46 - INFO - __main__ - Step 35682: {'lr': 0.0004387821894716547, 'samples': 6850944, 'steps': 35681, 'loss/train': 1.5628100633621216} -11/07/2021 02:15:46 - INFO - __main__ - Step 35683: {'lr': 0.000438778710452191, 'samples': 6851136, 'steps': 35682, 'loss/train': 1.6288344860076904} -11/07/2021 02:15:47 - INFO - __main__ - Step 35684: {'lr': 0.00043877523134766664, 'samples': 6851328, 'steps': 35683, 'loss/train': 1.3384032249450684} -11/07/2021 02:15:48 - INFO - __main__ - Step 35685: {'lr': 0.0004387717521580829, 'samples': 6851520, 'steps': 35684, 'loss/train': 1.6574108600616455} -11/07/2021 02:15:48 - INFO - __main__ - Step 35686: {'lr': 0.00043876827288344156, 'samples': 6851712, 'steps': 35685, 'loss/train': 1.457568645477295} -11/07/2021 02:15:49 - INFO - __main__ - Step 35687: {'lr': 0.00043876479352374423, 'samples': 6851904, 'steps': 35686, 'loss/train': 1.7087618112564087} -11/07/2021 02:15:49 - INFO - __main__ - Step 35688: {'lr': 0.00043876131407899233, 'samples': 6852096, 'steps': 35687, 'loss/train': 0.9426607489585876} -11/07/2021 02:15:49 - INFO - __main__ - Step 35689: {'lr': 0.00043875783454918753, 'samples': 6852288, 'steps': 35688, 'loss/train': 1.389722228050232} -11/07/2021 02:15:50 - INFO - __main__ - Step 35690: {'lr': 0.00043875435493433135, 'samples': 6852480, 'steps': 35689, 'loss/train': 1.626808524131775} -11/07/2021 02:15:51 - INFO - __main__ - Step 35691: {'lr': 0.00043875087523442537, 'samples': 6852672, 'steps': 35690, 'loss/train': 1.179518699645996} -11/07/2021 02:15:51 - INFO - __main__ - Step 35692: {'lr': 0.0004387473954494712, 'samples': 6852864, 'steps': 35691, 'loss/train': 1.2149150371551514} -11/07/2021 02:15:51 - INFO - __main__ - Step 35693: {'lr': 0.00043874391557947027, 'samples': 6853056, 'steps': 35692, 'loss/train': 1.4332332611083984} -11/07/2021 02:15:52 - INFO - __main__ - Step 35694: {'lr': 0.0004387404356244243, 'samples': 6853248, 'steps': 35693, 'loss/train': 1.674772024154663} -11/07/2021 02:15:52 - INFO - __main__ - Step 35695: {'lr': 0.0004387369555843348, 'samples': 6853440, 'steps': 35694, 'loss/train': 1.6376999616622925} -11/07/2021 02:15:53 - INFO - __main__ - Step 35696: {'lr': 0.00043873347545920333, 'samples': 6853632, 'steps': 35695, 'loss/train': 1.5448943376541138} -11/07/2021 02:15:54 - INFO - __main__ - Step 35697: {'lr': 0.00043872999524903147, 'samples': 6853824, 'steps': 35696, 'loss/train': 1.4090485572814941} -11/07/2021 02:15:54 - INFO - __main__ - Step 35698: {'lr': 0.00043872651495382076, 'samples': 6854016, 'steps': 35697, 'loss/train': 1.7205495834350586} -11/07/2021 02:15:54 - INFO - __main__ - Step 35699: {'lr': 0.00043872303457357287, 'samples': 6854208, 'steps': 35698, 'loss/train': 1.7329543828964233} -11/07/2021 02:15:55 - INFO - __main__ - Step 35700: {'lr': 0.0004387195541082892, 'samples': 6854400, 'steps': 35699, 'loss/train': 1.2321515083312988} -11/07/2021 02:15:56 - INFO - __main__ - Step 35701: {'lr': 0.0004387160735579715, 'samples': 6854592, 'steps': 35700, 'loss/train': 1.6390836238861084} -11/07/2021 02:15:56 - INFO - __main__ - Step 35702: {'lr': 0.0004387125929226212, 'samples': 6854784, 'steps': 35701, 'loss/train': 1.5886253118515015} -11/07/2021 02:15:56 - INFO - __main__ - Step 35703: {'lr': 0.00043870911220224, 'samples': 6854976, 'steps': 35702, 'loss/train': 1.6304876804351807} -11/07/2021 02:15:57 - INFO - __main__ - Step 35704: {'lr': 0.0004387056313968293, 'samples': 6855168, 'steps': 35703, 'loss/train': 1.816699743270874} -11/07/2021 02:15:57 - INFO - __main__ - Step 35705: {'lr': 0.00043870215050639073, 'samples': 6855360, 'steps': 35704, 'loss/train': 5.773858070373535} -11/07/2021 02:15:57 - INFO - __main__ - Step 35706: {'lr': 0.00043869866953092593, 'samples': 6855552, 'steps': 35705, 'loss/train': 1.3915510177612305} -11/07/2021 02:15:58 - INFO - __main__ - Step 35707: {'lr': 0.00043869518847043643, 'samples': 6855744, 'steps': 35706, 'loss/train': 1.6798690557479858} -11/07/2021 02:15:59 - INFO - __main__ - Step 35708: {'lr': 0.0004386917073249237, 'samples': 6855936, 'steps': 35707, 'loss/train': 1.8041768074035645} -11/07/2021 02:15:59 - INFO - __main__ - Step 35709: {'lr': 0.00043868822609438953, 'samples': 6856128, 'steps': 35708, 'loss/train': 1.6509307622909546} -11/07/2021 02:15:59 - INFO - __main__ - Step 35710: {'lr': 0.00043868474477883523, 'samples': 6856320, 'steps': 35709, 'loss/train': 1.6956952810287476} -11/07/2021 02:16:00 - INFO - __main__ - Step 35711: {'lr': 0.0004386812633782626, 'samples': 6856512, 'steps': 35710, 'loss/train': 1.3712821006774902} -11/07/2021 02:16:01 - INFO - __main__ - Step 35712: {'lr': 0.00043867778189267306, 'samples': 6856704, 'steps': 35711, 'loss/train': 1.5459964275360107} -11/07/2021 02:16:02 - INFO - __main__ - Step 35713: {'lr': 0.0004386743003220682, 'samples': 6856896, 'steps': 35712, 'loss/train': 2.210019588470459} -11/07/2021 02:16:02 - INFO - __main__ - Step 35714: {'lr': 0.0004386708186664496, 'samples': 6857088, 'steps': 35713, 'loss/train': 2.363863945007324} -11/07/2021 02:16:02 - INFO - __main__ - Step 35715: {'lr': 0.00043866733692581896, 'samples': 6857280, 'steps': 35714, 'loss/train': 1.3447531461715698} -11/07/2021 02:16:03 - INFO - __main__ - Step 35716: {'lr': 0.0004386638551001777, 'samples': 6857472, 'steps': 35715, 'loss/train': 1.3204762935638428} -11/07/2021 02:16:04 - INFO - __main__ - Step 35717: {'lr': 0.00043866037318952735, 'samples': 6857664, 'steps': 35716, 'loss/train': 2.144253730773926} -11/07/2021 02:16:04 - INFO - __main__ - Step 35718: {'lr': 0.0004386568911938695, 'samples': 6857856, 'steps': 35717, 'loss/train': 1.7581815719604492} -11/07/2021 02:16:04 - INFO - __main__ - Step 35719: {'lr': 0.0004386534091132059, 'samples': 6858048, 'steps': 35718, 'loss/train': 1.5662397146224976} -11/07/2021 02:16:05 - INFO - __main__ - Step 35720: {'lr': 0.0004386499269475379, 'samples': 6858240, 'steps': 35719, 'loss/train': 1.9442492723464966} -11/07/2021 02:16:05 - INFO - __main__ - Step 35721: {'lr': 0.00043864644469686717, 'samples': 6858432, 'steps': 35720, 'loss/train': 0.9276940226554871} -11/07/2021 02:16:06 - INFO - __main__ - Step 35722: {'lr': 0.0004386429623611953, 'samples': 6858624, 'steps': 35721, 'loss/train': 1.2161866426467896} -11/07/2021 02:16:07 - INFO - __main__ - Step 35723: {'lr': 0.0004386394799405238, 'samples': 6858816, 'steps': 35722, 'loss/train': 1.693832516670227} -11/07/2021 02:16:07 - INFO - __main__ - Step 35724: {'lr': 0.00043863599743485416, 'samples': 6859008, 'steps': 35723, 'loss/train': 1.8028156757354736} -11/07/2021 02:16:08 - INFO - __main__ - Step 35725: {'lr': 0.0004386325148441882, 'samples': 6859200, 'steps': 35724, 'loss/train': 1.640588402748108} -11/07/2021 02:16:08 - INFO - __main__ - Step 35726: {'lr': 0.00043862903216852723, 'samples': 6859392, 'steps': 35725, 'loss/train': 1.5772079229354858} -11/07/2021 02:16:08 - INFO - __main__ - Step 35727: {'lr': 0.00043862554940787303, 'samples': 6859584, 'steps': 35726, 'loss/train': 2.072113037109375} -11/07/2021 02:16:09 - INFO - __main__ - Step 35728: {'lr': 0.000438622066562227, 'samples': 6859776, 'steps': 35727, 'loss/train': 1.4786450862884521} -11/07/2021 02:16:10 - INFO - __main__ - Step 35729: {'lr': 0.0004386185836315908, 'samples': 6859968, 'steps': 35728, 'loss/train': 1.6002217531204224} -11/07/2021 02:16:10 - INFO - __main__ - Step 35730: {'lr': 0.0004386151006159659, 'samples': 6860160, 'steps': 35729, 'loss/train': 1.2281548976898193} -11/07/2021 02:16:10 - INFO - __main__ - Step 35731: {'lr': 0.00043861161751535406, 'samples': 6860352, 'steps': 35730, 'loss/train': 0.9255541563034058} -11/07/2021 02:16:11 - INFO - __main__ - Step 35732: {'lr': 0.0004386081343297567, 'samples': 6860544, 'steps': 35731, 'loss/train': 1.7340439558029175} -11/07/2021 02:16:11 - INFO - __main__ - Step 35733: {'lr': 0.0004386046510591754, 'samples': 6860736, 'steps': 35732, 'loss/train': 1.8112010955810547} -11/07/2021 02:16:12 - INFO - __main__ - Step 35734: {'lr': 0.0004386011677036118, 'samples': 6860928, 'steps': 35733, 'loss/train': 1.756344199180603} -11/07/2021 02:16:12 - INFO - __main__ - Step 35735: {'lr': 0.00043859768426306737, 'samples': 6861120, 'steps': 35734, 'loss/train': 1.2330529689788818} -11/07/2021 02:16:13 - INFO - __main__ - Step 35736: {'lr': 0.00043859420073754377, 'samples': 6861312, 'steps': 35735, 'loss/train': 1.1958736181259155} -11/07/2021 02:16:13 - INFO - __main__ - Step 35737: {'lr': 0.0004385907171270425, 'samples': 6861504, 'steps': 35736, 'loss/train': 2.0505869388580322} -11/07/2021 02:16:13 - INFO - __main__ - Step 35738: {'lr': 0.00043858723343156514, 'samples': 6861696, 'steps': 35737, 'loss/train': 1.6566646099090576} -11/07/2021 02:16:15 - INFO - __main__ - Step 35739: {'lr': 0.00043858374965111336, 'samples': 6861888, 'steps': 35738, 'loss/train': 1.0120819807052612} -11/07/2021 02:16:15 - INFO - __main__ - Step 35740: {'lr': 0.00043858026578568864, 'samples': 6862080, 'steps': 35739, 'loss/train': 1.7157846689224243} -11/07/2021 02:16:15 - INFO - __main__ - Step 35741: {'lr': 0.00043857678183529256, 'samples': 6862272, 'steps': 35740, 'loss/train': 1.0181148052215576} -11/07/2021 02:16:16 - INFO - __main__ - Step 35742: {'lr': 0.0004385732977999266, 'samples': 6862464, 'steps': 35741, 'loss/train': 1.0279544591903687} -11/07/2021 02:16:16 - INFO - __main__ - Step 35743: {'lr': 0.0004385698136795926, 'samples': 6862656, 'steps': 35742, 'loss/train': 1.773728609085083} -11/07/2021 02:16:17 - INFO - __main__ - Step 35744: {'lr': 0.00043856632947429175, 'samples': 6862848, 'steps': 35743, 'loss/train': 0.8074324727058411} -11/07/2021 02:16:17 - INFO - __main__ - Step 35745: {'lr': 0.00043856284518402594, 'samples': 6863040, 'steps': 35744, 'loss/train': 1.3862853050231934} -11/07/2021 02:16:18 - INFO - __main__ - Step 35746: {'lr': 0.00043855936080879667, 'samples': 6863232, 'steps': 35745, 'loss/train': 1.3445626497268677} -11/07/2021 02:16:18 - INFO - __main__ - Step 35747: {'lr': 0.0004385558763486053, 'samples': 6863424, 'steps': 35746, 'loss/train': 1.5872620344161987} -11/07/2021 02:16:18 - INFO - __main__ - Step 35748: {'lr': 0.00043855239180345376, 'samples': 6863616, 'steps': 35747, 'loss/train': 1.3158793449401855} -11/07/2021 02:16:19 - INFO - __main__ - Step 35749: {'lr': 0.00043854890717334326, 'samples': 6863808, 'steps': 35748, 'loss/train': 1.9186967611312866} -11/07/2021 02:16:20 - INFO - __main__ - Step 35750: {'lr': 0.00043854542245827554, 'samples': 6864000, 'steps': 35749, 'loss/train': 1.4672558307647705} -11/07/2021 02:16:20 - INFO - __main__ - Step 35751: {'lr': 0.00043854193765825223, 'samples': 6864192, 'steps': 35750, 'loss/train': 1.7083171606063843} -11/07/2021 02:16:20 - INFO - __main__ - Step 35752: {'lr': 0.00043853845277327485, 'samples': 6864384, 'steps': 35751, 'loss/train': 1.9616976976394653} -11/07/2021 02:16:21 - INFO - __main__ - Step 35753: {'lr': 0.0004385349678033449, 'samples': 6864576, 'steps': 35752, 'loss/train': 1.361376166343689} -11/07/2021 02:16:21 - INFO - __main__ - Step 35754: {'lr': 0.000438531482748464, 'samples': 6864768, 'steps': 35753, 'loss/train': 1.4319709539413452} -11/07/2021 02:16:22 - INFO - __main__ - Step 35755: {'lr': 0.00043852799760863375, 'samples': 6864960, 'steps': 35754, 'loss/train': 1.3204424381256104} -11/07/2021 02:16:23 - INFO - __main__ - Step 35756: {'lr': 0.0004385245123838557, 'samples': 6865152, 'steps': 35755, 'loss/train': 1.7563824653625488} -11/07/2021 02:16:23 - INFO - __main__ - Step 35757: {'lr': 0.00043852102707413144, 'samples': 6865344, 'steps': 35756, 'loss/train': 1.5977060794830322} -11/07/2021 02:16:23 - INFO - __main__ - Step 35758: {'lr': 0.00043851754167946244, 'samples': 6865536, 'steps': 35757, 'loss/train': 1.4238637685775757} -11/07/2021 02:16:24 - INFO - __main__ - Step 35759: {'lr': 0.00043851405619985037, 'samples': 6865728, 'steps': 35758, 'loss/train': 1.9423731565475464} -11/07/2021 02:16:25 - INFO - __main__ - Step 35760: {'lr': 0.00043851057063529675, 'samples': 6865920, 'steps': 35759, 'loss/train': 1.5438404083251953} -11/07/2021 02:16:25 - INFO - __main__ - Step 35761: {'lr': 0.00043850708498580326, 'samples': 6866112, 'steps': 35760, 'loss/train': 1.65753173828125} -11/07/2021 02:16:25 - INFO - __main__ - Step 35762: {'lr': 0.00043850359925137126, 'samples': 6866304, 'steps': 35761, 'loss/train': 1.8983148336410522} -11/07/2021 02:16:26 - INFO - __main__ - Step 35763: {'lr': 0.0004385001134320026, 'samples': 6866496, 'steps': 35762, 'loss/train': 1.5388737916946411} -11/07/2021 02:16:26 - INFO - __main__ - Step 35764: {'lr': 0.0004384966275276986, 'samples': 6866688, 'steps': 35763, 'loss/train': 1.6825393438339233} -11/07/2021 02:16:27 - INFO - __main__ - Step 35765: {'lr': 0.00043849314153846094, 'samples': 6866880, 'steps': 35764, 'loss/train': 1.8381291627883911} -11/07/2021 02:16:28 - INFO - __main__ - Step 35766: {'lr': 0.0004384896554642912, 'samples': 6867072, 'steps': 35765, 'loss/train': 1.4535595178604126} -11/07/2021 02:16:28 - INFO - __main__ - Step 35767: {'lr': 0.00043848616930519094, 'samples': 6867264, 'steps': 35766, 'loss/train': 1.5976481437683105} -11/07/2021 02:16:28 - INFO - __main__ - Step 35768: {'lr': 0.0004384826830611617, 'samples': 6867456, 'steps': 35767, 'loss/train': 1.8629978895187378} -11/07/2021 02:16:29 - INFO - __main__ - Step 35769: {'lr': 0.00043847919673220504, 'samples': 6867648, 'steps': 35768, 'loss/train': 1.934322714805603} -11/07/2021 02:16:30 - INFO - __main__ - Step 35770: {'lr': 0.00043847571031832257, 'samples': 6867840, 'steps': 35769, 'loss/train': 1.3385542631149292} -11/07/2021 02:16:30 - INFO - __main__ - Step 35771: {'lr': 0.0004384722238195159, 'samples': 6868032, 'steps': 35770, 'loss/train': 0.987594723701477} -11/07/2021 02:16:30 - INFO - __main__ - Step 35772: {'lr': 0.0004384687372357865, 'samples': 6868224, 'steps': 35771, 'loss/train': 1.5806580781936646} -11/07/2021 02:16:31 - INFO - __main__ - Step 35773: {'lr': 0.000438465250567136, 'samples': 6868416, 'steps': 35772, 'loss/train': 1.2526181936264038} -11/07/2021 02:16:31 - INFO - __main__ - Step 35774: {'lr': 0.00043846176381356607, 'samples': 6868608, 'steps': 35773, 'loss/train': 1.3293781280517578} -11/07/2021 02:16:32 - INFO - __main__ - Step 35775: {'lr': 0.000438458276975078, 'samples': 6868800, 'steps': 35774, 'loss/train': 1.3052928447723389} -11/07/2021 02:16:32 - INFO - __main__ - Step 35776: {'lr': 0.0004384547900516737, 'samples': 6868992, 'steps': 35775, 'loss/train': 1.5681229829788208} -11/07/2021 02:16:33 - INFO - __main__ - Step 35777: {'lr': 0.00043845130304335454, 'samples': 6869184, 'steps': 35776, 'loss/train': 1.1610848903656006} -11/07/2021 02:16:33 - INFO - __main__ - Step 35778: {'lr': 0.00043844781595012204, 'samples': 6869376, 'steps': 35777, 'loss/train': 1.4218180179595947} -11/07/2021 02:16:33 - INFO - __main__ - Step 35779: {'lr': 0.0004384443287719779, 'samples': 6869568, 'steps': 35778, 'loss/train': 1.264674186706543} -11/07/2021 02:16:35 - INFO - __main__ - Step 35780: {'lr': 0.0004384408415089237, 'samples': 6869760, 'steps': 35779, 'loss/train': 1.3298534154891968} -11/07/2021 02:16:35 - INFO - __main__ - Step 35781: {'lr': 0.000438437354160961, 'samples': 6869952, 'steps': 35780, 'loss/train': 1.25020170211792} -11/07/2021 02:16:35 - INFO - __main__ - Step 35782: {'lr': 0.00043843386672809127, 'samples': 6870144, 'steps': 35781, 'loss/train': 1.6183899641036987} -11/07/2021 02:16:36 - INFO - __main__ - Step 35783: {'lr': 0.00043843037921031616, 'samples': 6870336, 'steps': 35782, 'loss/train': 1.6619880199432373} -11/07/2021 02:16:36 - INFO - __main__ - Step 35784: {'lr': 0.00043842689160763723, 'samples': 6870528, 'steps': 35783, 'loss/train': 1.8179965019226074} -11/07/2021 02:16:37 - INFO - __main__ - Step 35785: {'lr': 0.00043842340392005605, 'samples': 6870720, 'steps': 35784, 'loss/train': 1.1560782194137573} -11/07/2021 02:16:37 - INFO - __main__ - Step 35786: {'lr': 0.00043841991614757415, 'samples': 6870912, 'steps': 35785, 'loss/train': 1.5421417951583862} -11/07/2021 02:16:38 - INFO - __main__ - Step 35787: {'lr': 0.00043841642829019325, 'samples': 6871104, 'steps': 35786, 'loss/train': 1.424499750137329} -11/07/2021 02:16:38 - INFO - __main__ - Step 35788: {'lr': 0.00043841294034791466, 'samples': 6871296, 'steps': 35787, 'loss/train': 1.5242619514465332} -11/07/2021 02:16:38 - INFO - __main__ - Step 35789: {'lr': 0.0004384094523207403, 'samples': 6871488, 'steps': 35788, 'loss/train': 1.5820269584655762} -11/07/2021 02:16:39 - INFO - __main__ - Step 35790: {'lr': 0.0004384059642086714, 'samples': 6871680, 'steps': 35789, 'loss/train': 1.568547010421753} -11/07/2021 02:16:40 - INFO - __main__ - Step 35791: {'lr': 0.00043840247601170966, 'samples': 6871872, 'steps': 35790, 'loss/train': 1.5818415880203247} -11/07/2021 02:16:40 - INFO - __main__ - Step 35792: {'lr': 0.0004383989877298568, 'samples': 6872064, 'steps': 35791, 'loss/train': 1.6161761283874512} -11/07/2021 02:16:40 - INFO - __main__ - Step 35793: {'lr': 0.0004383954993631142, 'samples': 6872256, 'steps': 35792, 'loss/train': 1.337131381034851} -11/07/2021 02:16:41 - INFO - __main__ - Step 35794: {'lr': 0.0004383920109114835, 'samples': 6872448, 'steps': 35793, 'loss/train': 1.4632744789123535} -11/07/2021 02:16:41 - INFO - __main__ - Step 35795: {'lr': 0.00043838852237496626, 'samples': 6872640, 'steps': 35794, 'loss/train': 1.4462274312973022} -11/07/2021 02:16:42 - INFO - __main__ - Step 35796: {'lr': 0.000438385033753564, 'samples': 6872832, 'steps': 35795, 'loss/train': 1.5358773469924927} -11/07/2021 02:16:42 - INFO - __main__ - Step 35797: {'lr': 0.00043838154504727847, 'samples': 6873024, 'steps': 35796, 'loss/train': 1.5611079931259155} -11/07/2021 02:16:43 - INFO - __main__ - Step 35798: {'lr': 0.00043837805625611105, 'samples': 6873216, 'steps': 35797, 'loss/train': 1.5787655115127563} -11/07/2021 02:16:43 - INFO - __main__ - Step 35799: {'lr': 0.0004383745673800634, 'samples': 6873408, 'steps': 35798, 'loss/train': 2.0828986167907715} -11/07/2021 02:16:43 - INFO - __main__ - Step 35800: {'lr': 0.000438371078419137, 'samples': 6873600, 'steps': 35799, 'loss/train': 1.3921492099761963} -11/07/2021 02:16:44 - INFO - __main__ - Step 35801: {'lr': 0.00043836758937333366, 'samples': 6873792, 'steps': 35800, 'loss/train': 1.8202711343765259} -11/07/2021 02:16:45 - INFO - __main__ - Step 35802: {'lr': 0.0004383641002426547, 'samples': 6873984, 'steps': 35801, 'loss/train': 1.5541462898254395} -11/07/2021 02:16:45 - INFO - __main__ - Step 35803: {'lr': 0.0004383606110271018, 'samples': 6874176, 'steps': 35802, 'loss/train': 1.2755517959594727} -11/07/2021 02:16:45 - INFO - __main__ - Step 35804: {'lr': 0.00043835712172667643, 'samples': 6874368, 'steps': 35803, 'loss/train': 1.0208276510238647} -11/07/2021 02:16:46 - INFO - __main__ - Step 35805: {'lr': 0.00043835363234138037, 'samples': 6874560, 'steps': 35804, 'loss/train': 1.4622864723205566} -11/07/2021 02:16:47 - INFO - __main__ - Step 35806: {'lr': 0.00043835014287121497, 'samples': 6874752, 'steps': 35805, 'loss/train': 0.9984145760536194} -11/07/2021 02:16:47 - INFO - __main__ - Step 35807: {'lr': 0.00043834665331618196, 'samples': 6874944, 'steps': 35806, 'loss/train': 1.4266750812530518} -11/07/2021 02:16:48 - INFO - __main__ - Step 35808: {'lr': 0.00043834316367628287, 'samples': 6875136, 'steps': 35807, 'loss/train': 1.6676244735717773} -11/07/2021 02:16:48 - INFO - __main__ - Step 35809: {'lr': 0.0004383396739515192, 'samples': 6875328, 'steps': 35808, 'loss/train': 1.5520555973052979} -11/07/2021 02:16:48 - INFO - __main__ - Step 35810: {'lr': 0.00043833618414189265, 'samples': 6875520, 'steps': 35809, 'loss/train': 1.4976266622543335} -11/07/2021 02:16:49 - INFO - __main__ - Step 35811: {'lr': 0.0004383326942474046, 'samples': 6875712, 'steps': 35810, 'loss/train': 1.654467225074768} -11/07/2021 02:16:50 - INFO - __main__ - Step 35812: {'lr': 0.0004383292042680569, 'samples': 6875904, 'steps': 35811, 'loss/train': 1.66763436794281} -11/07/2021 02:16:50 - INFO - __main__ - Step 35813: {'lr': 0.0004383257142038509, 'samples': 6876096, 'steps': 35812, 'loss/train': 2.1094698905944824} -11/07/2021 02:16:50 - INFO - __main__ - Step 35814: {'lr': 0.0004383222240547882, 'samples': 6876288, 'steps': 35813, 'loss/train': 0.9822989702224731} -11/07/2021 02:16:51 - INFO - __main__ - Step 35815: {'lr': 0.00043831873382087043, 'samples': 6876480, 'steps': 35814, 'loss/train': 1.5135447978973389} -11/07/2021 02:16:52 - INFO - __main__ - Step 35816: {'lr': 0.0004383152435020992, 'samples': 6876672, 'steps': 35815, 'loss/train': 0.8099708557128906} -11/07/2021 02:16:52 - INFO - __main__ - Step 35817: {'lr': 0.0004383117530984759, 'samples': 6876864, 'steps': 35816, 'loss/train': 1.5529484748840332} -11/07/2021 02:16:52 - INFO - __main__ - Step 35818: {'lr': 0.0004383082626100024, 'samples': 6877056, 'steps': 35817, 'loss/train': 0.5928159356117249} -11/07/2021 02:16:53 - INFO - __main__ - Step 35819: {'lr': 0.00043830477203668, 'samples': 6877248, 'steps': 35818, 'loss/train': 1.6680653095245361} -11/07/2021 02:16:53 - INFO - __main__ - Step 35820: {'lr': 0.0004383012813785104, 'samples': 6877440, 'steps': 35819, 'loss/train': 1.5121403932571411} -11/07/2021 02:16:54 - INFO - __main__ - Step 35821: {'lr': 0.00043829779063549515, 'samples': 6877632, 'steps': 35820, 'loss/train': 1.6605607271194458} -11/07/2021 02:16:54 - INFO - __main__ - Step 35822: {'lr': 0.0004382942998076358, 'samples': 6877824, 'steps': 35821, 'loss/train': 1.255125641822815} -11/07/2021 02:16:55 - INFO - __main__ - Step 35823: {'lr': 0.000438290808894934, 'samples': 6878016, 'steps': 35822, 'loss/train': 1.2337799072265625} -11/07/2021 02:16:55 - INFO - __main__ - Step 35824: {'lr': 0.0004382873178973912, 'samples': 6878208, 'steps': 35823, 'loss/train': 1.0595225095748901} -11/07/2021 02:16:56 - INFO - __main__ - Step 35825: {'lr': 0.00043828382681500907, 'samples': 6878400, 'steps': 35824, 'loss/train': 1.4158706665039062} -11/07/2021 02:16:57 - INFO - __main__ - Step 35826: {'lr': 0.0004382803356477891, 'samples': 6878592, 'steps': 35825, 'loss/train': 0.6019604206085205} -11/07/2021 02:16:57 - INFO - __main__ - Step 35827: {'lr': 0.000438276844395733, 'samples': 6878784, 'steps': 35826, 'loss/train': 1.0249121189117432} -11/07/2021 02:16:57 - INFO - __main__ - Step 35828: {'lr': 0.0004382733530588422, 'samples': 6878976, 'steps': 35827, 'loss/train': 1.403064489364624} -11/07/2021 02:16:58 - INFO - __main__ - Step 35829: {'lr': 0.00043826986163711835, 'samples': 6879168, 'steps': 35828, 'loss/train': 1.2509788274765015} -11/07/2021 02:16:58 - INFO - __main__ - Step 35830: {'lr': 0.000438266370130563, 'samples': 6879360, 'steps': 35829, 'loss/train': 1.7037445306777954} -11/07/2021 02:16:59 - INFO - __main__ - Step 35831: {'lr': 0.0004382628785391778, 'samples': 6879552, 'steps': 35830, 'loss/train': 2.075359582901001} -11/07/2021 02:16:59 - INFO - __main__ - Step 35832: {'lr': 0.00043825938686296417, 'samples': 6879744, 'steps': 35831, 'loss/train': 1.9884377717971802} -11/07/2021 02:17:00 - INFO - __main__ - Step 35833: {'lr': 0.00043825589510192376, 'samples': 6879936, 'steps': 35832, 'loss/train': 1.0667155981063843} -11/07/2021 02:17:00 - INFO - __main__ - Step 35834: {'lr': 0.0004382524032560582, 'samples': 6880128, 'steps': 35833, 'loss/train': 1.533860683441162} -11/07/2021 02:17:00 - INFO - __main__ - Step 35835: {'lr': 0.000438248911325369, 'samples': 6880320, 'steps': 35834, 'loss/train': 1.6826927661895752} -11/07/2021 02:17:01 - INFO - __main__ - Step 35836: {'lr': 0.00043824541930985775, 'samples': 6880512, 'steps': 35835, 'loss/train': 1.4012782573699951} -11/07/2021 02:17:02 - INFO - __main__ - Step 35837: {'lr': 0.0004382419272095259, 'samples': 6880704, 'steps': 35836, 'loss/train': 1.4396758079528809} -11/07/2021 02:17:02 - INFO - __main__ - Step 35838: {'lr': 0.00043823843502437533, 'samples': 6880896, 'steps': 35837, 'loss/train': 1.3039255142211914} -11/07/2021 02:17:02 - INFO - __main__ - Step 35839: {'lr': 0.00043823494275440733, 'samples': 6881088, 'steps': 35838, 'loss/train': 1.4565870761871338} -11/07/2021 02:17:03 - INFO - __main__ - Step 35840: {'lr': 0.0004382314503996236, 'samples': 6881280, 'steps': 35839, 'loss/train': 1.4898042678833008} -11/07/2021 02:17:03 - INFO - __main__ - Step 35841: {'lr': 0.0004382279579600256, 'samples': 6881472, 'steps': 35840, 'loss/train': 1.6548384428024292} -11/07/2021 02:17:04 - INFO - __main__ - Step 35842: {'lr': 0.0004382244654356151, 'samples': 6881664, 'steps': 35841, 'loss/train': 1.4465525150299072} -11/07/2021 02:17:04 - INFO - __main__ - Step 35843: {'lr': 0.0004382209728263935, 'samples': 6881856, 'steps': 35842, 'loss/train': 1.3423986434936523} -11/07/2021 02:17:05 - INFO - __main__ - Step 35844: {'lr': 0.0004382174801323624, 'samples': 6882048, 'steps': 35843, 'loss/train': 0.9695390462875366} -11/07/2021 02:17:05 - INFO - __main__ - Step 35845: {'lr': 0.00043821398735352344, 'samples': 6882240, 'steps': 35844, 'loss/train': 1.79738450050354} -11/07/2021 02:17:05 - INFO - __main__ - Step 35846: {'lr': 0.0004382104944898782, 'samples': 6882432, 'steps': 35845, 'loss/train': 1.3911375999450684} -11/07/2021 02:17:07 - INFO - __main__ - Step 35847: {'lr': 0.00043820700154142825, 'samples': 6882624, 'steps': 35846, 'loss/train': 1.7680792808532715} -11/07/2021 02:17:07 - INFO - __main__ - Step 35848: {'lr': 0.00043820350850817504, 'samples': 6882816, 'steps': 35847, 'loss/train': 1.1441446542739868} -11/07/2021 02:17:07 - INFO - __main__ - Step 35849: {'lr': 0.00043820001539012025, 'samples': 6883008, 'steps': 35848, 'loss/train': 1.174292802810669} -11/07/2021 02:17:08 - INFO - __main__ - Step 35850: {'lr': 0.00043819652218726545, 'samples': 6883200, 'steps': 35849, 'loss/train': 1.4147001504898071} -11/07/2021 02:17:08 - INFO - __main__ - Step 35851: {'lr': 0.0004381930288996122, 'samples': 6883392, 'steps': 35850, 'loss/train': 1.5950745344161987} -11/07/2021 02:17:09 - INFO - __main__ - Step 35852: {'lr': 0.0004381895355271621, 'samples': 6883584, 'steps': 35851, 'loss/train': 1.5812777280807495} -11/07/2021 02:17:09 - INFO - __main__ - Step 35853: {'lr': 0.00043818604206991664, 'samples': 6883776, 'steps': 35852, 'loss/train': 1.6486752033233643} -11/07/2021 02:17:10 - INFO - __main__ - Step 35854: {'lr': 0.0004381825485278775, 'samples': 6883968, 'steps': 35853, 'loss/train': 1.576576828956604} -11/07/2021 02:17:10 - INFO - __main__ - Step 35855: {'lr': 0.00043817905490104613, 'samples': 6884160, 'steps': 35854, 'loss/train': 1.4157003164291382} -11/07/2021 02:17:10 - INFO - __main__ - Step 35856: {'lr': 0.00043817556118942426, 'samples': 6884352, 'steps': 35855, 'loss/train': 1.8426508903503418} -11/07/2021 02:17:11 - INFO - __main__ - Step 35857: {'lr': 0.0004381720673930134, 'samples': 6884544, 'steps': 35856, 'loss/train': 1.4605894088745117} -11/07/2021 02:17:12 - INFO - __main__ - Step 35858: {'lr': 0.00043816857351181503, 'samples': 6884736, 'steps': 35857, 'loss/train': 1.3808422088623047} -11/07/2021 02:17:12 - INFO - __main__ - Step 35859: {'lr': 0.0004381650795458309, 'samples': 6884928, 'steps': 35858, 'loss/train': 1.7283581495285034} -11/07/2021 02:17:12 - INFO - __main__ - Step 35860: {'lr': 0.0004381615854950625, 'samples': 6885120, 'steps': 35859, 'loss/train': 1.409956455230713} -11/07/2021 02:17:13 - INFO - __main__ - Step 35861: {'lr': 0.0004381580913595113, 'samples': 6885312, 'steps': 35860, 'loss/train': 1.3731625080108643} -11/07/2021 02:17:14 - INFO - __main__ - Step 35862: {'lr': 0.000438154597139179, 'samples': 6885504, 'steps': 35861, 'loss/train': 1.197447657585144} -11/07/2021 02:17:14 - INFO - __main__ - Step 35863: {'lr': 0.0004381511028340671, 'samples': 6885696, 'steps': 35862, 'loss/train': 1.5057181119918823} -11/07/2021 02:17:14 - INFO - __main__ - Step 35864: {'lr': 0.0004381476084441773, 'samples': 6885888, 'steps': 35863, 'loss/train': 1.9163185358047485} -11/07/2021 02:17:15 - INFO - __main__ - Step 35865: {'lr': 0.00043814411396951103, 'samples': 6886080, 'steps': 35864, 'loss/train': 1.081902027130127} -11/07/2021 02:17:15 - INFO - __main__ - Step 35866: {'lr': 0.00043814061941007, 'samples': 6886272, 'steps': 35865, 'loss/train': 1.0974922180175781} -11/07/2021 02:17:16 - INFO - __main__ - Step 35867: {'lr': 0.00043813712476585564, 'samples': 6886464, 'steps': 35866, 'loss/train': 1.9265427589416504} -11/07/2021 02:17:16 - INFO - __main__ - Step 35868: {'lr': 0.00043813363003686963, 'samples': 6886656, 'steps': 35867, 'loss/train': 1.4821633100509644} -11/07/2021 02:17:17 - INFO - __main__ - Step 35869: {'lr': 0.00043813013522311353, 'samples': 6886848, 'steps': 35868, 'loss/train': 1.6978538036346436} -11/07/2021 02:17:17 - INFO - __main__ - Step 35870: {'lr': 0.0004381266403245888, 'samples': 6887040, 'steps': 35869, 'loss/train': 1.4966309070587158} -11/07/2021 02:17:17 - INFO - __main__ - Step 35871: {'lr': 0.00043812314534129716, 'samples': 6887232, 'steps': 35870, 'loss/train': 1.0092236995697021} -11/07/2021 02:17:19 - INFO - __main__ - Step 35872: {'lr': 0.0004381196502732402, 'samples': 6887424, 'steps': 35871, 'loss/train': 1.904168963432312} -11/07/2021 02:17:19 - INFO - __main__ - Step 35873: {'lr': 0.00043811615512041934, 'samples': 6887616, 'steps': 35872, 'loss/train': 1.436159610748291} -11/07/2021 02:17:19 - INFO - __main__ - Step 35874: {'lr': 0.00043811265988283625, 'samples': 6887808, 'steps': 35873, 'loss/train': 1.665523648262024} -11/07/2021 02:17:20 - INFO - __main__ - Step 35875: {'lr': 0.00043810916456049257, 'samples': 6888000, 'steps': 35874, 'loss/train': 0.8110805153846741} -11/07/2021 02:17:20 - INFO - __main__ - Step 35876: {'lr': 0.00043810566915338965, 'samples': 6888192, 'steps': 35875, 'loss/train': 1.5055104494094849} -11/07/2021 02:17:21 - INFO - __main__ - Step 35877: {'lr': 0.0004381021736615294, 'samples': 6888384, 'steps': 35876, 'loss/train': 1.3504819869995117} -11/07/2021 02:17:21 - INFO - __main__ - Step 35878: {'lr': 0.0004380986780849131, 'samples': 6888576, 'steps': 35877, 'loss/train': 1.6569801568984985} -11/07/2021 02:17:22 - INFO - __main__ - Step 35879: {'lr': 0.0004380951824235425, 'samples': 6888768, 'steps': 35878, 'loss/train': 1.4905952215194702} -11/07/2021 02:17:22 - INFO - __main__ - Step 35880: {'lr': 0.00043809168667741907, 'samples': 6888960, 'steps': 35879, 'loss/train': 1.5604488849639893} -11/07/2021 02:17:22 - INFO - __main__ - Step 35881: {'lr': 0.0004380881908465445, 'samples': 6889152, 'steps': 35880, 'loss/train': 0.3603174090385437} -11/07/2021 02:17:23 - INFO - __main__ - Step 35882: {'lr': 0.0004380846949309202, 'samples': 6889344, 'steps': 35881, 'loss/train': 1.644689679145813} -11/07/2021 02:17:24 - INFO - __main__ - Step 35883: {'lr': 0.00043808119893054787, 'samples': 6889536, 'steps': 35882, 'loss/train': 1.728338599205017} -11/07/2021 02:17:24 - INFO - __main__ - Step 35884: {'lr': 0.0004380777028454291, 'samples': 6889728, 'steps': 35883, 'loss/train': 1.7343021631240845} -11/07/2021 02:17:25 - INFO - __main__ - Step 35885: {'lr': 0.0004380742066755654, 'samples': 6889920, 'steps': 35884, 'loss/train': 1.5336843729019165} -11/07/2021 02:17:25 - INFO - __main__ - Step 35886: {'lr': 0.0004380707104209583, 'samples': 6890112, 'steps': 35885, 'loss/train': 1.9161925315856934} -11/07/2021 02:17:25 - INFO - __main__ - Step 35887: {'lr': 0.0004380672140816095, 'samples': 6890304, 'steps': 35886, 'loss/train': 1.350689172744751} -11/07/2021 02:17:26 - INFO - __main__ - Step 35888: {'lr': 0.0004380637176575205, 'samples': 6890496, 'steps': 35887, 'loss/train': 1.5569615364074707} -11/07/2021 02:17:27 - INFO - __main__ - Step 35889: {'lr': 0.00043806022114869294, 'samples': 6890688, 'steps': 35888, 'loss/train': 1.4751020669937134} -11/07/2021 02:17:27 - INFO - __main__ - Step 35890: {'lr': 0.0004380567245551282, 'samples': 6890880, 'steps': 35889, 'loss/train': 1.6205087900161743} -11/07/2021 02:17:27 - INFO - __main__ - Step 35891: {'lr': 0.0004380532278768282, 'samples': 6891072, 'steps': 35890, 'loss/train': 1.6306557655334473} -11/07/2021 02:17:28 - INFO - __main__ - Step 35892: {'lr': 0.0004380497311137942, 'samples': 6891264, 'steps': 35891, 'loss/train': 1.3647589683532715} -11/07/2021 02:17:28 - INFO - __main__ - Step 35893: {'lr': 0.00043804623426602784, 'samples': 6891456, 'steps': 35892, 'loss/train': 1.743046760559082} -11/07/2021 02:17:29 - INFO - __main__ - Step 35894: {'lr': 0.00043804273733353085, 'samples': 6891648, 'steps': 35893, 'loss/train': 1.4048981666564941} -11/07/2021 02:17:30 - INFO - __main__ - Step 35895: {'lr': 0.0004380392403163047, 'samples': 6891840, 'steps': 35894, 'loss/train': 1.4988237619400024} -11/07/2021 02:17:30 - INFO - __main__ - Step 35896: {'lr': 0.00043803574321435093, 'samples': 6892032, 'steps': 35895, 'loss/train': 1.2499364614486694} -11/07/2021 02:17:31 - INFO - __main__ - Step 35897: {'lr': 0.00043803224602767115, 'samples': 6892224, 'steps': 35896, 'loss/train': 1.531029224395752} -11/07/2021 02:17:31 - INFO - __main__ - Step 35898: {'lr': 0.000438028748756267, 'samples': 6892416, 'steps': 35897, 'loss/train': 0.14744128286838531} -11/07/2021 02:17:32 - INFO - __main__ - Step 35899: {'lr': 0.00043802525140013994, 'samples': 6892608, 'steps': 35898, 'loss/train': 1.589914083480835} -11/07/2021 02:17:32 - INFO - __main__ - Step 35900: {'lr': 0.00043802175395929156, 'samples': 6892800, 'steps': 35899, 'loss/train': 1.3293200731277466} -11/07/2021 02:17:33 - INFO - __main__ - Step 35901: {'lr': 0.00043801825643372363, 'samples': 6892992, 'steps': 35900, 'loss/train': 1.0679981708526611} -11/07/2021 02:17:33 - INFO - __main__ - Step 35902: {'lr': 0.00043801475882343743, 'samples': 6893184, 'steps': 35901, 'loss/train': 1.5215486288070679} -11/07/2021 02:17:33 - INFO - __main__ - Step 35903: {'lr': 0.0004380112611284347, 'samples': 6893376, 'steps': 35902, 'loss/train': 1.6985673904418945} -11/07/2021 02:17:34 - INFO - __main__ - Step 35904: {'lr': 0.00043800776334871705, 'samples': 6893568, 'steps': 35903, 'loss/train': 1.8185510635375977} -11/07/2021 02:17:35 - INFO - __main__ - Step 35905: {'lr': 0.000438004265484286, 'samples': 6893760, 'steps': 35904, 'loss/train': 1.454746127128601} -11/07/2021 02:17:35 - INFO - __main__ - Step 35906: {'lr': 0.0004380007675351431, 'samples': 6893952, 'steps': 35905, 'loss/train': 0.9168397784233093} -11/07/2021 02:17:35 - INFO - __main__ - Step 35907: {'lr': 0.00043799726950128997, 'samples': 6894144, 'steps': 35906, 'loss/train': 1.206464171409607} -11/07/2021 02:17:36 - INFO - __main__ - Step 35908: {'lr': 0.0004379937713827282, 'samples': 6894336, 'steps': 35907, 'loss/train': 1.4056463241577148} -11/07/2021 02:17:37 - INFO - __main__ - Step 35909: {'lr': 0.0004379902731794593, 'samples': 6894528, 'steps': 35908, 'loss/train': 1.3022297620773315} -11/07/2021 02:17:37 - INFO - __main__ - Step 35910: {'lr': 0.00043798677489148487, 'samples': 6894720, 'steps': 35909, 'loss/train': 1.1841340065002441} -11/07/2021 02:17:37 - INFO - __main__ - Step 35911: {'lr': 0.0004379832765188065, 'samples': 6894912, 'steps': 35910, 'loss/train': 1.4022372961044312} -11/07/2021 02:17:38 - INFO - __main__ - Step 35912: {'lr': 0.00043797977806142585, 'samples': 6895104, 'steps': 35911, 'loss/train': 1.616759181022644} -11/07/2021 02:17:38 - INFO - __main__ - Step 35913: {'lr': 0.0004379762795193443, 'samples': 6895296, 'steps': 35912, 'loss/train': 1.444366216659546} -11/07/2021 02:17:39 - INFO - __main__ - Step 35914: {'lr': 0.0004379727808925636, 'samples': 6895488, 'steps': 35913, 'loss/train': 0.9257416129112244} -11/07/2021 02:17:40 - INFO - __main__ - Step 35915: {'lr': 0.00043796928218108527, 'samples': 6895680, 'steps': 35914, 'loss/train': 1.7744345664978027} -11/07/2021 02:17:40 - INFO - __main__ - Step 35916: {'lr': 0.0004379657833849109, 'samples': 6895872, 'steps': 35915, 'loss/train': 1.4082496166229248} -11/07/2021 02:17:40 - INFO - __main__ - Step 35917: {'lr': 0.000437962284504042, 'samples': 6896064, 'steps': 35916, 'loss/train': 1.4445488452911377} -11/07/2021 02:17:41 - INFO - __main__ - Step 35918: {'lr': 0.00043795878553848025, 'samples': 6896256, 'steps': 35917, 'loss/train': 3.3619754314422607} -11/07/2021 02:17:41 - INFO - __main__ - Step 35919: {'lr': 0.0004379552864882271, 'samples': 6896448, 'steps': 35918, 'loss/train': 1.4456998109817505} -11/07/2021 02:17:42 - INFO - __main__ - Step 35920: {'lr': 0.00043795178735328425, 'samples': 6896640, 'steps': 35919, 'loss/train': 1.248893141746521} -11/07/2021 02:17:42 - INFO - __main__ - Step 35921: {'lr': 0.0004379482881336532, 'samples': 6896832, 'steps': 35920, 'loss/train': 1.5730149745941162} -11/07/2021 02:17:43 - INFO - __main__ - Step 35922: {'lr': 0.0004379447888293355, 'samples': 6897024, 'steps': 35921, 'loss/train': 1.6229360103607178} -11/07/2021 02:17:43 - INFO - __main__ - Step 35923: {'lr': 0.0004379412894403328, 'samples': 6897216, 'steps': 35922, 'loss/train': 1.5293281078338623} -11/07/2021 02:17:43 - INFO - __main__ - Step 35924: {'lr': 0.0004379377899666468, 'samples': 6897408, 'steps': 35923, 'loss/train': 1.3089522123336792} -11/07/2021 02:17:44 - INFO - __main__ - Step 35925: {'lr': 0.0004379342904082788, 'samples': 6897600, 'steps': 35924, 'loss/train': 1.3258305788040161} -11/07/2021 02:17:45 - INFO - __main__ - Step 35926: {'lr': 0.00043793079076523053, 'samples': 6897792, 'steps': 35925, 'loss/train': 0.957828164100647} -11/07/2021 02:17:45 - INFO - __main__ - Step 35927: {'lr': 0.0004379272910375035, 'samples': 6897984, 'steps': 35926, 'loss/train': 1.5545063018798828} -11/07/2021 02:17:45 - INFO - __main__ - Step 35928: {'lr': 0.0004379237912250994, 'samples': 6898176, 'steps': 35927, 'loss/train': 1.6177557706832886} -11/07/2021 02:17:46 - INFO - __main__ - Step 35929: {'lr': 0.0004379202913280197, 'samples': 6898368, 'steps': 35928, 'loss/train': 1.0915831327438354} -11/07/2021 02:17:47 - INFO - __main__ - Step 35930: {'lr': 0.0004379167913462661, 'samples': 6898560, 'steps': 35929, 'loss/train': 1.5333443880081177} -11/07/2021 02:17:47 - INFO - __main__ - Step 35931: {'lr': 0.00043791329127984004, 'samples': 6898752, 'steps': 35930, 'loss/train': 1.651257872581482} -11/07/2021 02:17:48 - INFO - __main__ - Step 35932: {'lr': 0.0004379097911287431, 'samples': 6898944, 'steps': 35931, 'loss/train': 1.124588966369629} -11/07/2021 02:17:48 - INFO - __main__ - Step 35933: {'lr': 0.000437906290892977, 'samples': 6899136, 'steps': 35932, 'loss/train': 1.3447669744491577} -11/07/2021 02:17:48 - INFO - __main__ - Step 35934: {'lr': 0.00043790279057254314, 'samples': 6899328, 'steps': 35933, 'loss/train': 2.0153403282165527} -11/07/2021 02:17:49 - INFO - __main__ - Step 35935: {'lr': 0.00043789929016744324, 'samples': 6899520, 'steps': 35934, 'loss/train': 1.6986846923828125} -11/07/2021 02:17:50 - INFO - __main__ - Step 35936: {'lr': 0.0004378957896776787, 'samples': 6899712, 'steps': 35935, 'loss/train': 1.446560025215149} -11/07/2021 02:17:50 - INFO - __main__ - Step 35937: {'lr': 0.0004378922891032514, 'samples': 6899904, 'steps': 35936, 'loss/train': 1.6637734174728394} -11/07/2021 02:17:50 - INFO - __main__ - Step 35938: {'lr': 0.0004378887884441626, 'samples': 6900096, 'steps': 35937, 'loss/train': 0.8005592823028564} -11/07/2021 02:17:51 - INFO - __main__ - Step 35939: {'lr': 0.000437885287700414, 'samples': 6900288, 'steps': 35938, 'loss/train': 1.0051047801971436} -11/07/2021 02:17:51 - INFO - __main__ - Step 35940: {'lr': 0.0004378817868720073, 'samples': 6900480, 'steps': 35939, 'loss/train': 2.8363940715789795} -11/07/2021 02:17:52 - INFO - __main__ - Step 35941: {'lr': 0.0004378782859589439, 'samples': 6900672, 'steps': 35940, 'loss/train': 1.4257400035858154} -11/07/2021 02:17:52 - INFO - __main__ - Step 35942: {'lr': 0.00043787478496122546, 'samples': 6900864, 'steps': 35941, 'loss/train': 1.3198901414871216} -11/07/2021 02:17:53 - INFO - __main__ - Step 35943: {'lr': 0.0004378712838788536, 'samples': 6901056, 'steps': 35942, 'loss/train': 1.3227993249893188} -11/07/2021 02:17:53 - INFO - __main__ - Step 35944: {'lr': 0.0004378677827118297, 'samples': 6901248, 'steps': 35943, 'loss/train': 1.7186728715896606} -11/07/2021 02:17:53 - INFO - __main__ - Step 35945: {'lr': 0.0004378642814601556, 'samples': 6901440, 'steps': 35944, 'loss/train': 1.5145400762557983} -11/07/2021 02:17:55 - INFO - __main__ - Step 35946: {'lr': 0.0004378607801238327, 'samples': 6901632, 'steps': 35945, 'loss/train': 1.6515378952026367} -11/07/2021 02:17:55 - INFO - __main__ - Step 35947: {'lr': 0.00043785727870286265, 'samples': 6901824, 'steps': 35946, 'loss/train': 2.2473514080047607} -11/07/2021 02:17:55 - INFO - __main__ - Step 35948: {'lr': 0.00043785377719724697, 'samples': 6902016, 'steps': 35947, 'loss/train': 1.0143795013427734} -11/07/2021 02:17:56 - INFO - __main__ - Step 35949: {'lr': 0.0004378502756069873, 'samples': 6902208, 'steps': 35948, 'loss/train': 0.6523028612136841} -11/07/2021 02:17:56 - INFO - __main__ - Step 35950: {'lr': 0.0004378467739320852, 'samples': 6902400, 'steps': 35949, 'loss/train': 1.716147780418396} -11/07/2021 02:17:57 - INFO - __main__ - Step 35951: {'lr': 0.0004378432721725422, 'samples': 6902592, 'steps': 35950, 'loss/train': 1.1859630346298218} -11/07/2021 02:17:57 - INFO - __main__ - Step 35952: {'lr': 0.00043783977032836, 'samples': 6902784, 'steps': 35951, 'loss/train': 1.202818751335144} -11/07/2021 02:17:58 - INFO - __main__ - Step 35953: {'lr': 0.00043783626839954005, 'samples': 6902976, 'steps': 35952, 'loss/train': 1.3891003131866455} -11/07/2021 02:17:58 - INFO - __main__ - Step 35954: {'lr': 0.0004378327663860839, 'samples': 6903168, 'steps': 35953, 'loss/train': 1.661206841468811} -11/07/2021 02:17:58 - INFO - __main__ - Step 35955: {'lr': 0.00043782926428799333, 'samples': 6903360, 'steps': 35954, 'loss/train': 1.4225733280181885} -11/07/2021 02:17:59 - INFO - __main__ - Step 35956: {'lr': 0.0004378257621052698, 'samples': 6903552, 'steps': 35955, 'loss/train': 1.5549224615097046} -11/07/2021 02:18:00 - INFO - __main__ - Step 35957: {'lr': 0.0004378222598379148, 'samples': 6903744, 'steps': 35956, 'loss/train': 1.6702907085418701} -11/07/2021 02:18:00 - INFO - __main__ - Step 35958: {'lr': 0.00043781875748593, 'samples': 6903936, 'steps': 35957, 'loss/train': 1.0661641359329224} -11/07/2021 02:18:00 - INFO - __main__ - Step 35959: {'lr': 0.000437815255049317, 'samples': 6904128, 'steps': 35958, 'loss/train': 1.3309332132339478} -11/07/2021 02:18:01 - INFO - __main__ - Step 35960: {'lr': 0.0004378117525280773, 'samples': 6904320, 'steps': 35959, 'loss/train': 1.4166483879089355} -11/07/2021 02:18:02 - INFO - __main__ - Step 35961: {'lr': 0.00043780824992221257, 'samples': 6904512, 'steps': 35960, 'loss/train': 1.2731068134307861} -11/07/2021 02:18:02 - INFO - __main__ - Step 35962: {'lr': 0.00043780474723172433, 'samples': 6904704, 'steps': 35961, 'loss/train': 1.650513768196106} -11/07/2021 02:18:02 - INFO - __main__ - Step 35963: {'lr': 0.00043780124445661416, 'samples': 6904896, 'steps': 35962, 'loss/train': 1.721779704093933} -11/07/2021 02:18:03 - INFO - __main__ - Step 35964: {'lr': 0.00043779774159688364, 'samples': 6905088, 'steps': 35963, 'loss/train': 1.142958402633667} -11/07/2021 02:18:03 - INFO - __main__ - Step 35965: {'lr': 0.00043779423865253434, 'samples': 6905280, 'steps': 35964, 'loss/train': 1.630504846572876} -11/07/2021 02:18:04 - INFO - __main__ - Step 35966: {'lr': 0.00043779073562356783, 'samples': 6905472, 'steps': 35965, 'loss/train': 1.7916053533554077} -11/07/2021 02:18:04 - INFO - __main__ - Step 35967: {'lr': 0.0004377872325099858, 'samples': 6905664, 'steps': 35966, 'loss/train': 1.4563828706741333} -11/07/2021 02:18:05 - INFO - __main__ - Step 35968: {'lr': 0.00043778372931178974, 'samples': 6905856, 'steps': 35967, 'loss/train': 1.1095385551452637} -11/07/2021 02:18:05 - INFO - __main__ - Step 35969: {'lr': 0.00043778022602898115, 'samples': 6906048, 'steps': 35968, 'loss/train': 1.3237872123718262} -11/07/2021 02:18:05 - INFO - __main__ - Step 35970: {'lr': 0.0004377767226615617, 'samples': 6906240, 'steps': 35969, 'loss/train': 1.250608205795288} -11/07/2021 02:18:07 - INFO - __main__ - Step 35971: {'lr': 0.000437773219209533, 'samples': 6906432, 'steps': 35970, 'loss/train': 1.6383625268936157} -11/07/2021 02:18:07 - INFO - __main__ - Step 35972: {'lr': 0.00043776971567289656, 'samples': 6906624, 'steps': 35971, 'loss/train': 1.3096139430999756} -11/07/2021 02:18:07 - INFO - __main__ - Step 35973: {'lr': 0.00043776621205165404, 'samples': 6906816, 'steps': 35972, 'loss/train': 1.204809546470642} -11/07/2021 02:18:08 - INFO - __main__ - Step 35974: {'lr': 0.0004377627083458069, 'samples': 6907008, 'steps': 35973, 'loss/train': 1.3687340021133423} -11/07/2021 02:18:08 - INFO - __main__ - Step 35975: {'lr': 0.0004377592045553568, 'samples': 6907200, 'steps': 35974, 'loss/train': 1.6243177652359009} -11/07/2021 02:18:09 - INFO - __main__ - Step 35976: {'lr': 0.00043775570068030524, 'samples': 6907392, 'steps': 35975, 'loss/train': 1.8994401693344116} -11/07/2021 02:18:09 - INFO - __main__ - Step 35977: {'lr': 0.0004377521967206539, 'samples': 6907584, 'steps': 35976, 'loss/train': 1.6218942403793335} -11/07/2021 02:18:10 - INFO - __main__ - Step 35978: {'lr': 0.00043774869267640436, 'samples': 6907776, 'steps': 35977, 'loss/train': 1.7045758962631226} -11/07/2021 02:18:10 - INFO - __main__ - Step 35979: {'lr': 0.0004377451885475581, 'samples': 6907968, 'steps': 35978, 'loss/train': 0.8041215538978577} -11/07/2021 02:18:10 - INFO - __main__ - Step 35980: {'lr': 0.0004377416843341168, 'samples': 6908160, 'steps': 35979, 'loss/train': 1.9746583700180054} -11/07/2021 02:18:12 - INFO - __main__ - Step 35981: {'lr': 0.00043773818003608203, 'samples': 6908352, 'steps': 35980, 'loss/train': 1.262722134590149} -11/07/2021 02:18:12 - INFO - __main__ - Step 35982: {'lr': 0.00043773467565345523, 'samples': 6908544, 'steps': 35981, 'loss/train': 1.465383768081665} -11/07/2021 02:18:12 - INFO - __main__ - Step 35983: {'lr': 0.0004377311711862381, 'samples': 6908736, 'steps': 35982, 'loss/train': 1.469982385635376} -11/07/2021 02:18:13 - INFO - __main__ - Step 35984: {'lr': 0.0004377276666344322, 'samples': 6908928, 'steps': 35983, 'loss/train': 1.7502566576004028} -11/07/2021 02:18:13 - INFO - __main__ - Step 35985: {'lr': 0.00043772416199803924, 'samples': 6909120, 'steps': 35984, 'loss/train': 1.5767804384231567} -11/07/2021 02:18:13 - INFO - __main__ - Step 35986: {'lr': 0.00043772065727706053, 'samples': 6909312, 'steps': 35985, 'loss/train': 1.3555277585983276} -11/07/2021 02:18:15 - INFO - __main__ - Step 35987: {'lr': 0.0004377171524714978, 'samples': 6909504, 'steps': 35986, 'loss/train': 1.3033314943313599} -11/07/2021 02:18:15 - INFO - __main__ - Step 35988: {'lr': 0.0004377136475813527, 'samples': 6909696, 'steps': 35987, 'loss/train': 1.681982159614563} -11/07/2021 02:18:16 - INFO - __main__ - Step 35989: {'lr': 0.0004377101426066266, 'samples': 6909888, 'steps': 35988, 'loss/train': 1.3505668640136719} -11/07/2021 02:18:16 - INFO - __main__ - Step 35990: {'lr': 0.0004377066375473213, 'samples': 6910080, 'steps': 35989, 'loss/train': 0.25427624583244324} -11/07/2021 02:18:16 - INFO - __main__ - Step 35991: {'lr': 0.00043770313240343826, 'samples': 6910272, 'steps': 35990, 'loss/train': 1.435550570487976} -11/07/2021 02:18:17 - INFO - __main__ - Step 35992: {'lr': 0.00043769962717497916, 'samples': 6910464, 'steps': 35991, 'loss/train': 0.8674271106719971} -11/07/2021 02:18:18 - INFO - __main__ - Step 35993: {'lr': 0.0004376961218619454, 'samples': 6910656, 'steps': 35992, 'loss/train': 1.3199352025985718} -11/07/2021 02:18:18 - INFO - __main__ - Step 35994: {'lr': 0.00043769261646433867, 'samples': 6910848, 'steps': 35993, 'loss/train': 0.7368350028991699} -11/07/2021 02:18:18 - INFO - __main__ - Step 35995: {'lr': 0.0004376891109821606, 'samples': 6911040, 'steps': 35994, 'loss/train': 1.4026904106140137} -11/07/2021 02:18:19 - INFO - __main__ - Step 35996: {'lr': 0.0004376856054154127, 'samples': 6911232, 'steps': 35995, 'loss/train': 1.77277672290802} -11/07/2021 02:18:20 - INFO - __main__ - Step 35997: {'lr': 0.00043768209976409645, 'samples': 6911424, 'steps': 35996, 'loss/train': 1.7561774253845215} -11/07/2021 02:18:20 - INFO - __main__ - Step 35998: {'lr': 0.0004376785940282137, 'samples': 6911616, 'steps': 35997, 'loss/train': 0.8580551147460938} -11/07/2021 02:18:20 - INFO - __main__ - Step 35999: {'lr': 0.0004376750882077658, 'samples': 6911808, 'steps': 35998, 'loss/train': 1.5717216730117798} -11/07/2021 02:18:21 - INFO - __main__ - Step 36000: {'lr': 0.0004376715823027544, 'samples': 6912000, 'steps': 35999, 'loss/train': 1.4603431224822998} -11/07/2021 02:18:21 - INFO - __main__ - Step 36001: {'lr': 0.0004376680763131811, 'samples': 6912192, 'steps': 36000, 'loss/train': 0.7720442414283752} -11/07/2021 02:18:21 - INFO - __main__ - Step 36002: {'lr': 0.0004376645702390475, 'samples': 6912384, 'steps': 36001, 'loss/train': 1.1306639909744263} -11/07/2021 02:18:23 - INFO - __main__ - Step 36003: {'lr': 0.00043766106408035506, 'samples': 6912576, 'steps': 36002, 'loss/train': 0.8562272787094116} -11/07/2021 02:18:23 - INFO - __main__ - Step 36004: {'lr': 0.0004376575578371055, 'samples': 6912768, 'steps': 36003, 'loss/train': 1.6573060750961304} -11/07/2021 02:18:23 - INFO - __main__ - Step 36005: {'lr': 0.0004376540515093003, 'samples': 6912960, 'steps': 36004, 'loss/train': 1.3827896118164062} -11/07/2021 02:18:24 - INFO - __main__ - Step 36006: {'lr': 0.0004376505450969411, 'samples': 6913152, 'steps': 36005, 'loss/train': 1.5291324853897095} -11/07/2021 02:18:24 - INFO - __main__ - Step 36007: {'lr': 0.0004376470386000294, 'samples': 6913344, 'steps': 36006, 'loss/train': 1.5615692138671875} -11/07/2021 02:18:25 - INFO - __main__ - Step 36008: {'lr': 0.0004376435320185669, 'samples': 6913536, 'steps': 36007, 'loss/train': 1.4178293943405151} -11/07/2021 02:18:26 - INFO - __main__ - Step 36009: {'lr': 0.0004376400253525551, 'samples': 6913728, 'steps': 36008, 'loss/train': 1.5691521167755127} -11/07/2021 02:18:26 - INFO - __main__ - Step 36010: {'lr': 0.0004376365186019956, 'samples': 6913920, 'steps': 36009, 'loss/train': 1.0562870502471924} -11/07/2021 02:18:26 - INFO - __main__ - Step 36011: {'lr': 0.00043763301176689, 'samples': 6914112, 'steps': 36010, 'loss/train': 2.8755180835723877} -11/07/2021 02:18:27 - INFO - __main__ - Step 36012: {'lr': 0.0004376295048472399, 'samples': 6914304, 'steps': 36011, 'loss/train': 1.0411345958709717} -11/07/2021 02:18:28 - INFO - __main__ - Step 36013: {'lr': 0.0004376259978430468, 'samples': 6914496, 'steps': 36012, 'loss/train': 1.9251238107681274} -11/07/2021 02:18:28 - INFO - __main__ - Step 36014: {'lr': 0.0004376224907543123, 'samples': 6914688, 'steps': 36013, 'loss/train': 1.528991937637329} -11/07/2021 02:18:28 - INFO - __main__ - Step 36015: {'lr': 0.00043761898358103804, 'samples': 6914880, 'steps': 36014, 'loss/train': 1.6339377164840698} -11/07/2021 02:18:29 - INFO - __main__ - Step 36016: {'lr': 0.0004376154763232255, 'samples': 6915072, 'steps': 36015, 'loss/train': 1.160670518875122} -11/07/2021 02:18:29 - INFO - __main__ - Step 36017: {'lr': 0.0004376119689808764, 'samples': 6915264, 'steps': 36016, 'loss/train': 1.3139722347259521} -11/07/2021 02:18:29 - INFO - __main__ - Step 36018: {'lr': 0.00043760846155399216, 'samples': 6915456, 'steps': 36017, 'loss/train': 1.5870747566223145} -11/07/2021 02:18:31 - INFO - __main__ - Step 36019: {'lr': 0.0004376049540425745, 'samples': 6915648, 'steps': 36018, 'loss/train': 1.3712278604507446} -11/07/2021 02:18:31 - INFO - __main__ - Step 36020: {'lr': 0.0004376014464466249, 'samples': 6915840, 'steps': 36019, 'loss/train': 1.959718942642212} -11/07/2021 02:18:31 - INFO - __main__ - Step 36021: {'lr': 0.0004375979387661451, 'samples': 6916032, 'steps': 36020, 'loss/train': 1.5496079921722412} -11/07/2021 02:18:32 - INFO - __main__ - Step 36022: {'lr': 0.0004375944310011364, 'samples': 6916224, 'steps': 36021, 'loss/train': 1.8799645900726318} -11/07/2021 02:18:32 - INFO - __main__ - Step 36023: {'lr': 0.00043759092315160064, 'samples': 6916416, 'steps': 36022, 'loss/train': 1.4155391454696655} -11/07/2021 02:18:33 - INFO - __main__ - Step 36024: {'lr': 0.00043758741521753925, 'samples': 6916608, 'steps': 36023, 'loss/train': 1.5093621015548706} -11/07/2021 02:18:33 - INFO - __main__ - Step 36025: {'lr': 0.0004375839071989539, 'samples': 6916800, 'steps': 36024, 'loss/train': 1.1388566493988037} -11/07/2021 02:18:34 - INFO - __main__ - Step 36026: {'lr': 0.00043758039909584613, 'samples': 6916992, 'steps': 36025, 'loss/train': 1.8856382369995117} -11/07/2021 02:18:34 - INFO - __main__ - Step 36027: {'lr': 0.0004375768909082175, 'samples': 6917184, 'steps': 36026, 'loss/train': 1.2582416534423828} -11/07/2021 02:18:35 - INFO - __main__ - Step 36028: {'lr': 0.0004375733826360697, 'samples': 6917376, 'steps': 36027, 'loss/train': 1.3716334104537964} -11/07/2021 02:18:35 - INFO - __main__ - Step 36029: {'lr': 0.0004375698742794042, 'samples': 6917568, 'steps': 36028, 'loss/train': 1.2687499523162842} -11/07/2021 02:18:36 - INFO - __main__ - Step 36030: {'lr': 0.0004375663658382225, 'samples': 6917760, 'steps': 36029, 'loss/train': 1.315381646156311} -11/07/2021 02:18:36 - INFO - __main__ - Step 36031: {'lr': 0.0004375628573125264, 'samples': 6917952, 'steps': 36030, 'loss/train': 1.1570274829864502} -11/07/2021 02:18:37 - INFO - __main__ - Step 36032: {'lr': 0.0004375593487023174, 'samples': 6918144, 'steps': 36031, 'loss/train': 1.5267812013626099} -11/07/2021 02:18:37 - INFO - __main__ - Step 36033: {'lr': 0.00043755584000759696, 'samples': 6918336, 'steps': 36032, 'loss/train': 1.284977912902832} -11/07/2021 02:18:38 - INFO - __main__ - Step 36034: {'lr': 0.0004375523312283668, 'samples': 6918528, 'steps': 36033, 'loss/train': 1.2571640014648438} -11/07/2021 02:18:38 - INFO - __main__ - Step 36035: {'lr': 0.00043754882236462844, 'samples': 6918720, 'steps': 36034, 'loss/train': 1.487125277519226} -11/07/2021 02:18:39 - INFO - __main__ - Step 36036: {'lr': 0.00043754531341638346, 'samples': 6918912, 'steps': 36035, 'loss/train': 2.0117814540863037} -11/07/2021 02:18:39 - INFO - __main__ - Step 36037: {'lr': 0.00043754180438363344, 'samples': 6919104, 'steps': 36036, 'loss/train': 0.9645311832427979} -11/07/2021 02:18:39 - INFO - __main__ - Step 36038: {'lr': 0.00043753829526638, 'samples': 6919296, 'steps': 36037, 'loss/train': 1.0889891386032104} -11/07/2021 02:18:40 - INFO - __main__ - Step 36039: {'lr': 0.0004375347860646247, 'samples': 6919488, 'steps': 36038, 'loss/train': 1.0317258834838867} -11/07/2021 02:18:41 - INFO - __main__ - Step 36040: {'lr': 0.00043753127677836917, 'samples': 6919680, 'steps': 36039, 'loss/train': 0.44519782066345215} -11/07/2021 02:18:41 - INFO - __main__ - Step 36041: {'lr': 0.0004375277674076149, 'samples': 6919872, 'steps': 36040, 'loss/train': 1.6520081758499146} -11/07/2021 02:18:41 - INFO - __main__ - Step 36042: {'lr': 0.0004375242579523635, 'samples': 6920064, 'steps': 36041, 'loss/train': 1.540985107421875} -11/07/2021 02:18:42 - INFO - __main__ - Step 36043: {'lr': 0.0004375207484126166, 'samples': 6920256, 'steps': 36042, 'loss/train': 1.9579271078109741} -11/07/2021 02:18:43 - INFO - __main__ - Step 36044: {'lr': 0.0004375172387883757, 'samples': 6920448, 'steps': 36043, 'loss/train': 1.5872255563735962} -11/07/2021 02:18:43 - INFO - __main__ - Step 36045: {'lr': 0.00043751372907964247, 'samples': 6920640, 'steps': 36044, 'loss/train': 1.1674432754516602} -11/07/2021 02:18:43 - INFO - __main__ - Step 36046: {'lr': 0.00043751021928641845, 'samples': 6920832, 'steps': 36045, 'loss/train': 1.4402272701263428} -11/07/2021 02:18:44 - INFO - __main__ - Step 36047: {'lr': 0.0004375067094087051, 'samples': 6921024, 'steps': 36046, 'loss/train': 1.7606974840164185} -11/07/2021 02:18:44 - INFO - __main__ - Step 36048: {'lr': 0.0004375031994465042, 'samples': 6921216, 'steps': 36047, 'loss/train': 1.1131813526153564} -11/07/2021 02:18:44 - INFO - __main__ - Step 36049: {'lr': 0.00043749968939981734, 'samples': 6921408, 'steps': 36048, 'loss/train': 1.9732738733291626} -11/07/2021 02:18:46 - INFO - __main__ - Step 36050: {'lr': 0.0004374961792686459, 'samples': 6921600, 'steps': 36049, 'loss/train': 1.4669445753097534} -11/07/2021 02:18:46 - INFO - __main__ - Step 36051: {'lr': 0.00043749266905299155, 'samples': 6921792, 'steps': 36050, 'loss/train': 0.8080386519432068} -11/07/2021 02:18:46 - INFO - __main__ - Step 36052: {'lr': 0.000437489158752856, 'samples': 6921984, 'steps': 36051, 'loss/train': 0.20430973172187805} -11/07/2021 02:18:47 - INFO - __main__ - Step 36053: {'lr': 0.00043748564836824065, 'samples': 6922176, 'steps': 36052, 'loss/train': 1.7568432092666626} -11/07/2021 02:18:47 - INFO - __main__ - Step 36054: {'lr': 0.0004374821378991473, 'samples': 6922368, 'steps': 36053, 'loss/train': 1.6545710563659668} -11/07/2021 02:18:48 - INFO - __main__ - Step 36055: {'lr': 0.0004374786273455772, 'samples': 6922560, 'steps': 36054, 'loss/train': 1.3741494417190552} -11/07/2021 02:18:49 - INFO - __main__ - Step 36056: {'lr': 0.0004374751167075322, 'samples': 6922752, 'steps': 36055, 'loss/train': 1.911236047744751} -11/07/2021 02:18:49 - INFO - __main__ - Step 36057: {'lr': 0.0004374716059850138, 'samples': 6922944, 'steps': 36056, 'loss/train': 1.8412857055664062} -11/07/2021 02:18:49 - INFO - __main__ - Step 36058: {'lr': 0.0004374680951780236, 'samples': 6923136, 'steps': 36057, 'loss/train': 1.6093480587005615} -11/07/2021 02:18:50 - INFO - __main__ - Step 36059: {'lr': 0.00043746458428656324, 'samples': 6923328, 'steps': 36058, 'loss/train': 1.5204285383224487} -11/07/2021 02:18:51 - INFO - __main__ - Step 36060: {'lr': 0.00043746107331063414, 'samples': 6923520, 'steps': 36059, 'loss/train': 1.6594641208648682} -11/07/2021 02:18:51 - INFO - __main__ - Step 36061: {'lr': 0.000437457562250238, 'samples': 6923712, 'steps': 36060, 'loss/train': 1.6589689254760742} -11/07/2021 02:18:51 - INFO - __main__ - Step 36062: {'lr': 0.0004374540511053763, 'samples': 6923904, 'steps': 36061, 'loss/train': 1.4177128076553345} -11/07/2021 02:18:52 - INFO - __main__ - Step 36063: {'lr': 0.00043745053987605075, 'samples': 6924096, 'steps': 36062, 'loss/train': 1.710706353187561} -11/07/2021 02:18:52 - INFO - __main__ - Step 36064: {'lr': 0.00043744702856226295, 'samples': 6924288, 'steps': 36063, 'loss/train': 1.4724761247634888} -11/07/2021 02:18:53 - INFO - __main__ - Step 36065: {'lr': 0.0004374435171640144, 'samples': 6924480, 'steps': 36064, 'loss/train': 1.2224045991897583} -11/07/2021 02:18:53 - INFO - __main__ - Step 36066: {'lr': 0.0004374400056813066, 'samples': 6924672, 'steps': 36065, 'loss/train': 1.6701277494430542} -11/07/2021 02:18:54 - INFO - __main__ - Step 36067: {'lr': 0.0004374364941141413, 'samples': 6924864, 'steps': 36066, 'loss/train': 0.6505734920501709} -11/07/2021 02:18:54 - INFO - __main__ - Step 36068: {'lr': 0.00043743298246251994, 'samples': 6925056, 'steps': 36067, 'loss/train': 1.7695902585983276} -11/07/2021 02:18:54 - INFO - __main__ - Step 36069: {'lr': 0.00043742947072644424, 'samples': 6925248, 'steps': 36068, 'loss/train': 1.2349269390106201} -11/07/2021 02:18:55 - INFO - __main__ - Step 36070: {'lr': 0.0004374259589059157, 'samples': 6925440, 'steps': 36069, 'loss/train': 0.949213981628418} -11/07/2021 02:18:56 - INFO - __main__ - Step 36071: {'lr': 0.0004374224470009359, 'samples': 6925632, 'steps': 36070, 'loss/train': 0.6275143027305603} -11/07/2021 02:18:56 - INFO - __main__ - Step 36072: {'lr': 0.00043741893501150644, 'samples': 6925824, 'steps': 36071, 'loss/train': 1.3203625679016113} -11/07/2021 02:18:57 - INFO - __main__ - Step 36073: {'lr': 0.0004374154229376289, 'samples': 6926016, 'steps': 36072, 'loss/train': 1.954107642173767} -11/07/2021 02:18:57 - INFO - __main__ - Step 36074: {'lr': 0.00043741191077930486, 'samples': 6926208, 'steps': 36073, 'loss/train': 1.9093469381332397} -11/07/2021 02:18:58 - INFO - __main__ - Step 36075: {'lr': 0.00043740839853653594, 'samples': 6926400, 'steps': 36074, 'loss/train': 1.2463798522949219} -11/07/2021 02:18:58 - INFO - __main__ - Step 36076: {'lr': 0.0004374048862093236, 'samples': 6926592, 'steps': 36075, 'loss/train': 1.6173049211502075} -11/07/2021 02:18:59 - INFO - __main__ - Step 36077: {'lr': 0.00043740137379766954, 'samples': 6926784, 'steps': 36076, 'loss/train': 1.380768895149231} -11/07/2021 02:18:59 - INFO - __main__ - Step 36078: {'lr': 0.0004373978613015753, 'samples': 6926976, 'steps': 36077, 'loss/train': 1.100445032119751} -11/07/2021 02:18:59 - INFO - __main__ - Step 36079: {'lr': 0.00043739434872104257, 'samples': 6927168, 'steps': 36078, 'loss/train': 1.6051472425460815} -11/07/2021 02:19:00 - INFO - __main__ - Step 36080: {'lr': 0.00043739083605607275, 'samples': 6927360, 'steps': 36079, 'loss/train': 1.165663242340088} -11/07/2021 02:19:01 - INFO - __main__ - Step 36081: {'lr': 0.0004373873233066676, 'samples': 6927552, 'steps': 36080, 'loss/train': 1.3163766860961914} -11/07/2021 02:19:01 - INFO - __main__ - Step 36082: {'lr': 0.00043738381047282856, 'samples': 6927744, 'steps': 36081, 'loss/train': 1.433258056640625} -11/07/2021 02:19:01 - INFO - __main__ - Step 36083: {'lr': 0.00043738029755455724, 'samples': 6927936, 'steps': 36082, 'loss/train': 0.9717826247215271} -11/07/2021 02:19:02 - INFO - __main__ - Step 36084: {'lr': 0.00043737678455185524, 'samples': 6928128, 'steps': 36083, 'loss/train': 1.3838664293289185} -11/07/2021 02:19:02 - INFO - __main__ - Step 36085: {'lr': 0.0004373732714647242, 'samples': 6928320, 'steps': 36084, 'loss/train': 1.2434223890304565} -11/07/2021 02:19:03 - INFO - __main__ - Step 36086: {'lr': 0.0004373697582931657, 'samples': 6928512, 'steps': 36085, 'loss/train': 1.0288443565368652} -11/07/2021 02:19:04 - INFO - __main__ - Step 36087: {'lr': 0.0004373662450371812, 'samples': 6928704, 'steps': 36086, 'loss/train': 1.307567834854126} -11/07/2021 02:19:04 - INFO - __main__ - Step 36088: {'lr': 0.0004373627316967723, 'samples': 6928896, 'steps': 36087, 'loss/train': 1.4782875776290894} -11/07/2021 02:19:04 - INFO - __main__ - Step 36089: {'lr': 0.0004373592182719408, 'samples': 6929088, 'steps': 36088, 'loss/train': 1.0795824527740479} -11/07/2021 02:19:05 - INFO - __main__ - Step 36090: {'lr': 0.00043735570476268804, 'samples': 6929280, 'steps': 36089, 'loss/train': 1.4311720132827759} -11/07/2021 02:19:06 - INFO - __main__ - Step 36091: {'lr': 0.0004373521911690157, 'samples': 6929472, 'steps': 36090, 'loss/train': 1.5301270484924316} -11/07/2021 02:19:06 - INFO - __main__ - Step 36092: {'lr': 0.00043734867749092534, 'samples': 6929664, 'steps': 36091, 'loss/train': 0.7610101103782654} -11/07/2021 02:19:06 - INFO - __main__ - Step 36093: {'lr': 0.0004373451637284186, 'samples': 6929856, 'steps': 36092, 'loss/train': 2.1793367862701416} -11/07/2021 02:19:07 - INFO - __main__ - Step 36094: {'lr': 0.0004373416498814969, 'samples': 6930048, 'steps': 36093, 'loss/train': 1.5620012283325195} -11/07/2021 02:19:07 - INFO - __main__ - Step 36095: {'lr': 0.0004373381359501621, 'samples': 6930240, 'steps': 36094, 'loss/train': 1.59977388381958} -11/07/2021 02:19:08 - INFO - __main__ - Step 36096: {'lr': 0.00043733462193441553, 'samples': 6930432, 'steps': 36095, 'loss/train': 1.613214373588562} -11/07/2021 02:19:08 - INFO - __main__ - Step 36097: {'lr': 0.00043733110783425894, 'samples': 6930624, 'steps': 36096, 'loss/train': 1.4539893865585327} -11/07/2021 02:19:09 - INFO - __main__ - Step 36098: {'lr': 0.00043732759364969374, 'samples': 6930816, 'steps': 36097, 'loss/train': 1.4978737831115723} -11/07/2021 02:19:09 - INFO - __main__ - Step 36099: {'lr': 0.0004373240793807217, 'samples': 6931008, 'steps': 36098, 'loss/train': 2.053466320037842} -11/07/2021 02:19:09 - INFO - __main__ - Step 36100: {'lr': 0.00043732056502734435, 'samples': 6931200, 'steps': 36099, 'loss/train': 1.4732714891433716} -11/07/2021 02:19:11 - INFO - __main__ - Step 36101: {'lr': 0.0004373170505895632, 'samples': 6931392, 'steps': 36100, 'loss/train': 1.4807472229003906} -11/07/2021 02:19:11 - INFO - __main__ - Step 36102: {'lr': 0.0004373135360673799, 'samples': 6931584, 'steps': 36101, 'loss/train': 1.4360374212265015} -11/07/2021 02:19:11 - INFO - __main__ - Step 36103: {'lr': 0.000437310021460796, 'samples': 6931776, 'steps': 36102, 'loss/train': 1.6048221588134766} -11/07/2021 02:19:12 - INFO - __main__ - Step 36104: {'lr': 0.000437306506769813, 'samples': 6931968, 'steps': 36103, 'loss/train': 0.9805557727813721} -11/07/2021 02:19:12 - INFO - __main__ - Step 36105: {'lr': 0.0004373029919944327, 'samples': 6932160, 'steps': 36104, 'loss/train': 0.14362464845180511} -11/07/2021 02:19:13 - INFO - __main__ - Step 36106: {'lr': 0.00043729947713465653, 'samples': 6932352, 'steps': 36105, 'loss/train': 1.5470880270004272} -11/07/2021 02:19:13 - INFO - __main__ - Step 36107: {'lr': 0.00043729596219048607, 'samples': 6932544, 'steps': 36106, 'loss/train': 1.026743769645691} -11/07/2021 02:19:14 - INFO - __main__ - Step 36108: {'lr': 0.000437292447161923, 'samples': 6932736, 'steps': 36107, 'loss/train': 1.5140167474746704} -11/07/2021 02:19:14 - INFO - __main__ - Step 36109: {'lr': 0.0004372889320489688, 'samples': 6932928, 'steps': 36108, 'loss/train': 1.5239927768707275} -11/07/2021 02:19:14 - INFO - __main__ - Step 36110: {'lr': 0.00043728541685162503, 'samples': 6933120, 'steps': 36109, 'loss/train': 1.677078366279602} -11/07/2021 02:19:15 - INFO - __main__ - Step 36111: {'lr': 0.0004372819015698934, 'samples': 6933312, 'steps': 36110, 'loss/train': 1.5815430879592896} -11/07/2021 02:19:16 - INFO - __main__ - Step 36112: {'lr': 0.0004372783862037755, 'samples': 6933504, 'steps': 36111, 'loss/train': 1.2556015253067017} -11/07/2021 02:19:16 - INFO - __main__ - Step 36113: {'lr': 0.00043727487075327285, 'samples': 6933696, 'steps': 36112, 'loss/train': 0.9244870543479919} -11/07/2021 02:19:16 - INFO - __main__ - Step 36114: {'lr': 0.00043727135521838697, 'samples': 6933888, 'steps': 36113, 'loss/train': 1.4923559427261353} -11/07/2021 02:19:17 - INFO - __main__ - Step 36115: {'lr': 0.00043726783959911953, 'samples': 6934080, 'steps': 36114, 'loss/train': 1.527382254600525} -11/07/2021 02:19:18 - INFO - __main__ - Step 36116: {'lr': 0.00043726432389547205, 'samples': 6934272, 'steps': 36115, 'loss/train': 1.7110966444015503} -11/07/2021 02:19:18 - INFO - __main__ - Step 36117: {'lr': 0.00043726080810744616, 'samples': 6934464, 'steps': 36116, 'loss/train': 1.2762972116470337} -11/07/2021 02:19:19 - INFO - __main__ - Step 36118: {'lr': 0.0004372572922350435, 'samples': 6934656, 'steps': 36117, 'loss/train': 1.5502105951309204} -11/07/2021 02:19:19 - INFO - __main__ - Step 36119: {'lr': 0.0004372537762782656, 'samples': 6934848, 'steps': 36118, 'loss/train': 1.138943076133728} -11/07/2021 02:19:19 - INFO - __main__ - Step 36120: {'lr': 0.00043725026023711395, 'samples': 6935040, 'steps': 36119, 'loss/train': 1.5728424787521362} -11/07/2021 02:19:20 - INFO - __main__ - Step 36121: {'lr': 0.0004372467441115903, 'samples': 6935232, 'steps': 36120, 'loss/train': 1.1723154783248901} -11/07/2021 02:19:21 - INFO - __main__ - Step 36122: {'lr': 0.00043724322790169613, 'samples': 6935424, 'steps': 36121, 'loss/train': 1.4476337432861328} -11/07/2021 02:19:21 - INFO - __main__ - Step 36123: {'lr': 0.00043723971160743305, 'samples': 6935616, 'steps': 36122, 'loss/train': 1.4831031560897827} -11/07/2021 02:19:21 - INFO - __main__ - Step 36124: {'lr': 0.00043723619522880266, 'samples': 6935808, 'steps': 36123, 'loss/train': 1.0746320486068726} -11/07/2021 02:19:22 - INFO - __main__ - Step 36125: {'lr': 0.0004372326787658065, 'samples': 6936000, 'steps': 36124, 'loss/train': 0.9541419148445129} -11/07/2021 02:19:22 - INFO - __main__ - Step 36126: {'lr': 0.00043722916221844617, 'samples': 6936192, 'steps': 36125, 'loss/train': 0.38092461228370667} -11/07/2021 02:19:23 - INFO - __main__ - Step 36127: {'lr': 0.0004372256455867233, 'samples': 6936384, 'steps': 36126, 'loss/train': 1.2290235757827759} -11/07/2021 02:19:23 - INFO - __main__ - Step 36128: {'lr': 0.0004372221288706394, 'samples': 6936576, 'steps': 36127, 'loss/train': 1.2454577684402466} -11/07/2021 02:19:24 - INFO - __main__ - Step 36129: {'lr': 0.0004372186120701962, 'samples': 6936768, 'steps': 36128, 'loss/train': 1.9584871530532837} -11/07/2021 02:19:24 - INFO - __main__ - Step 36130: {'lr': 0.00043721509518539507, 'samples': 6936960, 'steps': 36129, 'loss/train': 1.2257826328277588} -11/07/2021 02:19:24 - INFO - __main__ - Step 36131: {'lr': 0.0004372115782162378, 'samples': 6937152, 'steps': 36130, 'loss/train': 1.4203920364379883} -11/07/2021 02:19:25 - INFO - __main__ - Step 36132: {'lr': 0.00043720806116272584, 'samples': 6937344, 'steps': 36131, 'loss/train': 1.0633304119110107} -11/07/2021 02:19:26 - INFO - __main__ - Step 36133: {'lr': 0.00043720454402486076, 'samples': 6937536, 'steps': 36132, 'loss/train': 0.8455348014831543} -11/07/2021 02:19:26 - INFO - __main__ - Step 36134: {'lr': 0.00043720102680264427, 'samples': 6937728, 'steps': 36133, 'loss/train': 1.6558862924575806} -11/07/2021 02:19:27 - INFO - __main__ - Step 36135: {'lr': 0.0004371975094960778, 'samples': 6937920, 'steps': 36134, 'loss/train': 1.6989877223968506} -11/07/2021 02:19:27 - INFO - __main__ - Step 36136: {'lr': 0.0004371939921051632, 'samples': 6938112, 'steps': 36135, 'loss/train': 1.5624903440475464} -11/07/2021 02:19:28 - INFO - __main__ - Step 36137: {'lr': 0.00043719047462990174, 'samples': 6938304, 'steps': 36136, 'loss/train': 1.592354416847229} -11/07/2021 02:19:28 - INFO - __main__ - Step 36138: {'lr': 0.0004371869570702952, 'samples': 6938496, 'steps': 36137, 'loss/train': 1.591860055923462} -11/07/2021 02:19:29 - INFO - __main__ - Step 36139: {'lr': 0.0004371834394263451, 'samples': 6938688, 'steps': 36138, 'loss/train': 1.3959500789642334} -11/07/2021 02:19:29 - INFO - __main__ - Step 36140: {'lr': 0.000437179921698053, 'samples': 6938880, 'steps': 36139, 'loss/train': 1.7648470401763916} -11/07/2021 02:19:29 - INFO - __main__ - Step 36141: {'lr': 0.00043717640388542045, 'samples': 6939072, 'steps': 36140, 'loss/train': 1.1295483112335205} -11/07/2021 02:19:30 - INFO - __main__ - Step 36142: {'lr': 0.00043717288598844916, 'samples': 6939264, 'steps': 36141, 'loss/train': 1.166265606880188} -11/07/2021 02:19:31 - INFO - __main__ - Step 36143: {'lr': 0.0004371693680071407, 'samples': 6939456, 'steps': 36142, 'loss/train': 1.6560958623886108} -11/07/2021 02:19:31 - INFO - __main__ - Step 36144: {'lr': 0.00043716584994149657, 'samples': 6939648, 'steps': 36143, 'loss/train': 1.515106201171875} -11/07/2021 02:19:31 - INFO - __main__ - Step 36145: {'lr': 0.0004371623317915184, 'samples': 6939840, 'steps': 36144, 'loss/train': 1.1427377462387085} -11/07/2021 02:19:32 - INFO - __main__ - Step 36146: {'lr': 0.00043715881355720776, 'samples': 6940032, 'steps': 36145, 'loss/train': 1.328829288482666} -11/07/2021 02:19:33 - INFO - __main__ - Step 36147: {'lr': 0.0004371552952385663, 'samples': 6940224, 'steps': 36146, 'loss/train': 1.6909960508346558} -11/07/2021 02:19:33 - INFO - __main__ - Step 36148: {'lr': 0.00043715177683559546, 'samples': 6940416, 'steps': 36147, 'loss/train': 1.5440813302993774} -11/07/2021 02:19:33 - INFO - __main__ - Step 36149: {'lr': 0.000437148258348297, 'samples': 6940608, 'steps': 36148, 'loss/train': 1.8825254440307617} -11/07/2021 02:19:34 - INFO - __main__ - Step 36150: {'lr': 0.0004371447397766724, 'samples': 6940800, 'steps': 36149, 'loss/train': 1.4469424486160278} -11/07/2021 02:19:34 - INFO - __main__ - Step 36151: {'lr': 0.0004371412211207233, 'samples': 6940992, 'steps': 36150, 'loss/train': 1.580246090888977} -11/07/2021 02:19:35 - INFO - __main__ - Step 36152: {'lr': 0.0004371377023804512, 'samples': 6941184, 'steps': 36151, 'loss/train': 1.47393000125885} -11/07/2021 02:19:35 - INFO - __main__ - Step 36153: {'lr': 0.0004371341835558578, 'samples': 6941376, 'steps': 36152, 'loss/train': 1.0574392080307007} -11/07/2021 02:19:36 - INFO - __main__ - Step 36154: {'lr': 0.0004371306646469445, 'samples': 6941568, 'steps': 36153, 'loss/train': 2.2134885787963867} -11/07/2021 02:19:36 - INFO - __main__ - Step 36155: {'lr': 0.00043712714565371315, 'samples': 6941760, 'steps': 36154, 'loss/train': 1.4620238542556763} -11/07/2021 02:19:37 - INFO - __main__ - Step 36156: {'lr': 0.0004371236265761651, 'samples': 6941952, 'steps': 36155, 'loss/train': 1.5506919622421265} -11/07/2021 02:19:37 - INFO - __main__ - Step 36157: {'lr': 0.0004371201074143021, 'samples': 6942144, 'steps': 36156, 'loss/train': 1.710616946220398} -11/07/2021 02:19:38 - INFO - __main__ - Step 36158: {'lr': 0.0004371165881681256, 'samples': 6942336, 'steps': 36157, 'loss/train': 1.4615522623062134} -11/07/2021 02:19:38 - INFO - __main__ - Step 36159: {'lr': 0.0004371130688376373, 'samples': 6942528, 'steps': 36158, 'loss/train': 1.606250524520874} -11/07/2021 02:19:39 - INFO - __main__ - Step 36160: {'lr': 0.00043710954942283875, 'samples': 6942720, 'steps': 36159, 'loss/train': 1.5076546669006348} -11/07/2021 02:19:39 - INFO - __main__ - Step 36161: {'lr': 0.0004371060299237315, 'samples': 6942912, 'steps': 36160, 'loss/train': 1.523021936416626} -11/07/2021 02:19:39 - INFO - __main__ - Step 36162: {'lr': 0.00043710251034031713, 'samples': 6943104, 'steps': 36161, 'loss/train': 1.4017515182495117} -11/07/2021 02:19:41 - INFO - __main__ - Step 36163: {'lr': 0.0004370989906725973, 'samples': 6943296, 'steps': 36162, 'loss/train': 1.7055500745773315} -11/07/2021 02:19:41 - INFO - __main__ - Step 36164: {'lr': 0.00043709547092057356, 'samples': 6943488, 'steps': 36163, 'loss/train': 1.627466082572937} -11/07/2021 02:19:41 - INFO - __main__ - Step 36165: {'lr': 0.00043709195108424746, 'samples': 6943680, 'steps': 36164, 'loss/train': 1.0193427801132202} -11/07/2021 02:19:42 - INFO - __main__ - Step 36166: {'lr': 0.0004370884311636206, 'samples': 6943872, 'steps': 36165, 'loss/train': 0.8380038142204285} -11/07/2021 02:19:42 - INFO - __main__ - Step 36167: {'lr': 0.0004370849111586946, 'samples': 6944064, 'steps': 36166, 'loss/train': 1.7870904207229614} -11/07/2021 02:19:43 - INFO - __main__ - Step 36168: {'lr': 0.000437081391069471, 'samples': 6944256, 'steps': 36167, 'loss/train': 1.1971633434295654} -11/07/2021 02:19:43 - INFO - __main__ - Step 36169: {'lr': 0.0004370778708959514, 'samples': 6944448, 'steps': 36168, 'loss/train': 1.4381688833236694} -11/07/2021 02:19:44 - INFO - __main__ - Step 36170: {'lr': 0.00043707435063813747, 'samples': 6944640, 'steps': 36169, 'loss/train': 1.353993535041809} -11/07/2021 02:19:44 - INFO - __main__ - Step 36171: {'lr': 0.0004370708302960307, 'samples': 6944832, 'steps': 36170, 'loss/train': 1.1478573083877563} -11/07/2021 02:19:44 - INFO - __main__ - Step 36172: {'lr': 0.00043706730986963274, 'samples': 6945024, 'steps': 36171, 'loss/train': 1.386587142944336} -11/07/2021 02:19:46 - INFO - __main__ - Step 36173: {'lr': 0.0004370637893589451, 'samples': 6945216, 'steps': 36172, 'loss/train': 1.4752625226974487} -11/07/2021 02:19:46 - INFO - __main__ - Step 36174: {'lr': 0.0004370602687639693, 'samples': 6945408, 'steps': 36173, 'loss/train': 1.3060412406921387} -11/07/2021 02:19:46 - INFO - __main__ - Step 36175: {'lr': 0.00043705674808470715, 'samples': 6945600, 'steps': 36174, 'loss/train': 1.583465337753296} -11/07/2021 02:19:47 - INFO - __main__ - Step 36176: {'lr': 0.00043705322732116007, 'samples': 6945792, 'steps': 36175, 'loss/train': 1.362337350845337} -11/07/2021 02:19:47 - INFO - __main__ - Step 36177: {'lr': 0.00043704970647332977, 'samples': 6945984, 'steps': 36176, 'loss/train': 1.276375651359558} -11/07/2021 02:19:48 - INFO - __main__ - Step 36178: {'lr': 0.00043704618554121766, 'samples': 6946176, 'steps': 36177, 'loss/train': 1.6004598140716553} -11/07/2021 02:19:48 - INFO - __main__ - Step 36179: {'lr': 0.0004370426645248254, 'samples': 6946368, 'steps': 36178, 'loss/train': 1.3531804084777832} -11/07/2021 02:19:49 - INFO - __main__ - Step 36180: {'lr': 0.00043703914342415473, 'samples': 6946560, 'steps': 36179, 'loss/train': 1.6111247539520264} -11/07/2021 02:19:49 - INFO - __main__ - Step 36181: {'lr': 0.000437035622239207, 'samples': 6946752, 'steps': 36180, 'loss/train': 0.882485568523407} -11/07/2021 02:19:49 - INFO - __main__ - Step 36182: {'lr': 0.00043703210096998396, 'samples': 6946944, 'steps': 36181, 'loss/train': 1.731668472290039} -11/07/2021 02:19:50 - INFO - __main__ - Step 36183: {'lr': 0.00043702857961648713, 'samples': 6947136, 'steps': 36182, 'loss/train': 1.1887149810791016} -11/07/2021 02:19:51 - INFO - __main__ - Step 36184: {'lr': 0.0004370250581787181, 'samples': 6947328, 'steps': 36183, 'loss/train': 0.8045414686203003} -11/07/2021 02:19:51 - INFO - __main__ - Step 36185: {'lr': 0.00043702153665667846, 'samples': 6947520, 'steps': 36184, 'loss/train': 1.8129420280456543} -11/07/2021 02:19:51 - INFO - __main__ - Step 36186: {'lr': 0.0004370180150503698, 'samples': 6947712, 'steps': 36185, 'loss/train': 1.8427050113677979} -11/07/2021 02:19:52 - INFO - __main__ - Step 36187: {'lr': 0.0004370144933597938, 'samples': 6947904, 'steps': 36186, 'loss/train': 1.2437989711761475} -11/07/2021 02:19:53 - INFO - __main__ - Step 36188: {'lr': 0.00043701097158495186, 'samples': 6948096, 'steps': 36187, 'loss/train': 1.0144716501235962} -11/07/2021 02:19:53 - INFO - __main__ - Step 36189: {'lr': 0.0004370074497258456, 'samples': 6948288, 'steps': 36188, 'loss/train': 1.7620385885238647} -11/07/2021 02:19:53 - INFO - __main__ - Step 36190: {'lr': 0.00043700392778247676, 'samples': 6948480, 'steps': 36189, 'loss/train': 1.395757794380188} -11/07/2021 02:19:54 - INFO - __main__ - Step 36191: {'lr': 0.0004370004057548468, 'samples': 6948672, 'steps': 36190, 'loss/train': 1.7740306854248047} -11/07/2021 02:19:54 - INFO - __main__ - Step 36192: {'lr': 0.0004369968836429574, 'samples': 6948864, 'steps': 36191, 'loss/train': 1.3015068769454956} -11/07/2021 02:19:55 - INFO - __main__ - Step 36193: {'lr': 0.0004369933614468101, 'samples': 6949056, 'steps': 36192, 'loss/train': 1.3714641332626343} -11/07/2021 02:19:55 - INFO - __main__ - Step 36194: {'lr': 0.0004369898391664064, 'samples': 6949248, 'steps': 36193, 'loss/train': 1.4054350852966309} -11/07/2021 02:19:56 - INFO - __main__ - Step 36195: {'lr': 0.000436986316801748, 'samples': 6949440, 'steps': 36194, 'loss/train': 1.5505949258804321} -11/07/2021 02:19:56 - INFO - __main__ - Step 36196: {'lr': 0.00043698279435283637, 'samples': 6949632, 'steps': 36195, 'loss/train': 1.662702202796936} -11/07/2021 02:19:56 - INFO - __main__ - Step 36197: {'lr': 0.0004369792718196733, 'samples': 6949824, 'steps': 36196, 'loss/train': 0.9160897135734558} -11/07/2021 02:19:58 - INFO - __main__ - Step 36198: {'lr': 0.0004369757492022602, 'samples': 6950016, 'steps': 36197, 'loss/train': 1.199594259262085} -11/07/2021 02:19:58 - INFO - __main__ - Step 36199: {'lr': 0.00043697222650059876, 'samples': 6950208, 'steps': 36198, 'loss/train': 1.3858470916748047} -11/07/2021 02:19:58 - INFO - __main__ - Step 36200: {'lr': 0.00043696870371469045, 'samples': 6950400, 'steps': 36199, 'loss/train': 1.6673192977905273} -11/07/2021 02:19:59 - INFO - __main__ - Step 36201: {'lr': 0.000436965180844537, 'samples': 6950592, 'steps': 36200, 'loss/train': 1.7721482515335083} -11/07/2021 02:19:59 - INFO - __main__ - Step 36202: {'lr': 0.00043696165789013986, 'samples': 6950784, 'steps': 36201, 'loss/train': 1.8136097192764282} -11/07/2021 02:20:00 - INFO - __main__ - Step 36203: {'lr': 0.0004369581348515007, 'samples': 6950976, 'steps': 36202, 'loss/train': 1.477937936782837} -11/07/2021 02:20:00 - INFO - __main__ - Step 36204: {'lr': 0.00043695461172862113, 'samples': 6951168, 'steps': 36203, 'loss/train': 1.594497799873352} -11/07/2021 02:20:01 - INFO - __main__ - Step 36205: {'lr': 0.0004369510885215026, 'samples': 6951360, 'steps': 36204, 'loss/train': 1.2825634479522705} -11/07/2021 02:20:01 - INFO - __main__ - Step 36206: {'lr': 0.0004369475652301469, 'samples': 6951552, 'steps': 36205, 'loss/train': 1.2375483512878418} -11/07/2021 02:20:01 - INFO - __main__ - Step 36207: {'lr': 0.0004369440418545555, 'samples': 6951744, 'steps': 36206, 'loss/train': 1.5646448135375977} -11/07/2021 02:20:02 - INFO - __main__ - Step 36208: {'lr': 0.00043694051839472995, 'samples': 6951936, 'steps': 36207, 'loss/train': 1.567756175994873} -11/07/2021 02:20:03 - INFO - __main__ - Step 36209: {'lr': 0.00043693699485067186, 'samples': 6952128, 'steps': 36208, 'loss/train': 1.2388901710510254} -11/07/2021 02:20:03 - INFO - __main__ - Step 36210: {'lr': 0.0004369334712223829, 'samples': 6952320, 'steps': 36209, 'loss/train': 1.9396334886550903} -11/07/2021 02:20:03 - INFO - __main__ - Step 36211: {'lr': 0.0004369299475098646, 'samples': 6952512, 'steps': 36210, 'loss/train': 0.9735457301139832} -11/07/2021 02:20:04 - INFO - __main__ - Step 36212: {'lr': 0.00043692642371311854, 'samples': 6952704, 'steps': 36211, 'loss/train': 1.311751127243042} -11/07/2021 02:20:04 - INFO - __main__ - Step 36213: {'lr': 0.00043692289983214626, 'samples': 6952896, 'steps': 36212, 'loss/train': 1.5022273063659668} -11/07/2021 02:20:05 - INFO - __main__ - Step 36214: {'lr': 0.0004369193758669495, 'samples': 6953088, 'steps': 36213, 'loss/train': 1.4548381567001343} -11/07/2021 02:20:05 - INFO - __main__ - Step 36215: {'lr': 0.0004369158518175297, 'samples': 6953280, 'steps': 36214, 'loss/train': 1.3823559284210205} -11/07/2021 02:20:06 - INFO - __main__ - Step 36216: {'lr': 0.00043691232768388856, 'samples': 6953472, 'steps': 36215, 'loss/train': 1.1766122579574585} -11/07/2021 02:20:06 - INFO - __main__ - Step 36217: {'lr': 0.00043690880346602755, 'samples': 6953664, 'steps': 36216, 'loss/train': 1.4669190645217896} -11/07/2021 02:20:07 - INFO - __main__ - Step 36218: {'lr': 0.0004369052791639483, 'samples': 6953856, 'steps': 36217, 'loss/train': 1.1427199840545654} -11/07/2021 02:20:07 - INFO - __main__ - Step 36219: {'lr': 0.0004369017547776525, 'samples': 6954048, 'steps': 36218, 'loss/train': 1.8163267374038696} -11/07/2021 02:20:08 - INFO - __main__ - Step 36220: {'lr': 0.0004368982303071416, 'samples': 6954240, 'steps': 36219, 'loss/train': 1.1658703088760376} -11/07/2021 02:20:08 - INFO - __main__ - Step 36221: {'lr': 0.0004368947057524173, 'samples': 6954432, 'steps': 36220, 'loss/train': 1.4470137357711792} -11/07/2021 02:20:09 - INFO - __main__ - Step 36222: {'lr': 0.00043689118111348105, 'samples': 6954624, 'steps': 36221, 'loss/train': 1.7597016096115112} -11/07/2021 02:20:09 - INFO - __main__ - Step 36223: {'lr': 0.00043688765639033456, 'samples': 6954816, 'steps': 36222, 'loss/train': 1.475920557975769} -11/07/2021 02:20:10 - INFO - __main__ - Step 36224: {'lr': 0.00043688413158297934, 'samples': 6955008, 'steps': 36223, 'loss/train': 0.4032767713069916} -11/07/2021 02:20:10 - INFO - __main__ - Step 36225: {'lr': 0.00043688060669141705, 'samples': 6955200, 'steps': 36224, 'loss/train': 1.700075387954712} -11/07/2021 02:20:11 - INFO - __main__ - Step 36226: {'lr': 0.00043687708171564923, 'samples': 6955392, 'steps': 36225, 'loss/train': 1.6373037099838257} -11/07/2021 02:20:11 - INFO - __main__ - Step 36227: {'lr': 0.00043687355665567745, 'samples': 6955584, 'steps': 36226, 'loss/train': 1.5465506315231323} -11/07/2021 02:20:11 - INFO - __main__ - Step 36228: {'lr': 0.0004368700315115034, 'samples': 6955776, 'steps': 36227, 'loss/train': 1.9873836040496826} -11/07/2021 02:20:12 - INFO - __main__ - Step 36229: {'lr': 0.00043686650628312854, 'samples': 6955968, 'steps': 36228, 'loss/train': 1.3647935390472412} -11/07/2021 02:20:13 - INFO - __main__ - Step 36230: {'lr': 0.00043686298097055456, 'samples': 6956160, 'steps': 36229, 'loss/train': 1.7766621112823486} -11/07/2021 02:20:13 - INFO - __main__ - Step 36231: {'lr': 0.0004368594555737829, 'samples': 6956352, 'steps': 36230, 'loss/train': 1.8264625072479248} -11/07/2021 02:20:13 - INFO - __main__ - Step 36232: {'lr': 0.0004368559300928153, 'samples': 6956544, 'steps': 36231, 'loss/train': 1.3406790494918823} -11/07/2021 02:20:14 - INFO - __main__ - Step 36233: {'lr': 0.0004368524045276534, 'samples': 6956736, 'steps': 36232, 'loss/train': 0.7710010409355164} -11/07/2021 02:20:15 - INFO - __main__ - Step 36234: {'lr': 0.00043684887887829863, 'samples': 6956928, 'steps': 36233, 'loss/train': 1.5048789978027344} -11/07/2021 02:20:15 - INFO - __main__ - Step 36235: {'lr': 0.0004368453531447526, 'samples': 6957120, 'steps': 36234, 'loss/train': 0.9283801913261414} -11/07/2021 02:20:15 - INFO - __main__ - Step 36236: {'lr': 0.00043684182732701694, 'samples': 6957312, 'steps': 36235, 'loss/train': 1.9875965118408203} -11/07/2021 02:20:16 - INFO - __main__ - Step 36237: {'lr': 0.00043683830142509327, 'samples': 6957504, 'steps': 36236, 'loss/train': 1.540000081062317} -11/07/2021 02:20:16 - INFO - __main__ - Step 36238: {'lr': 0.00043683477543898314, 'samples': 6957696, 'steps': 36237, 'loss/train': 0.8398938775062561} -11/07/2021 02:20:17 - INFO - __main__ - Step 36239: {'lr': 0.0004368312493686881, 'samples': 6957888, 'steps': 36238, 'loss/train': 1.4075531959533691} -11/07/2021 02:20:18 - INFO - __main__ - Step 36240: {'lr': 0.0004368277232142098, 'samples': 6958080, 'steps': 36239, 'loss/train': 1.2510409355163574} -11/07/2021 02:20:18 - INFO - __main__ - Step 36241: {'lr': 0.00043682419697554985, 'samples': 6958272, 'steps': 36240, 'loss/train': 1.9596631526947021} -11/07/2021 02:20:18 - INFO - __main__ - Step 36242: {'lr': 0.0004368206706527098, 'samples': 6958464, 'steps': 36241, 'loss/train': 1.5783356428146362} -11/07/2021 02:20:19 - INFO - __main__ - Step 36243: {'lr': 0.00043681714424569117, 'samples': 6958656, 'steps': 36242, 'loss/train': 0.5691535472869873} -11/07/2021 02:20:19 - INFO - __main__ - Step 36244: {'lr': 0.0004368136177544957, 'samples': 6958848, 'steps': 36243, 'loss/train': 1.6415650844573975} -11/07/2021 02:20:20 - INFO - __main__ - Step 36245: {'lr': 0.00043681009117912484, 'samples': 6959040, 'steps': 36244, 'loss/train': 1.0533183813095093} -11/07/2021 02:20:20 - INFO - __main__ - Step 36246: {'lr': 0.0004368065645195803, 'samples': 6959232, 'steps': 36245, 'loss/train': 0.1379714012145996} -11/07/2021 02:20:21 - INFO - __main__ - Step 36247: {'lr': 0.0004368030377758636, 'samples': 6959424, 'steps': 36246, 'loss/train': 1.1800734996795654} -11/07/2021 02:20:21 - INFO - __main__ - Step 36248: {'lr': 0.0004367995109479763, 'samples': 6959616, 'steps': 36247, 'loss/train': 1.4469062089920044} -11/07/2021 02:20:21 - INFO - __main__ - Step 36249: {'lr': 0.00043679598403592, 'samples': 6959808, 'steps': 36248, 'loss/train': 1.611397385597229} -11/07/2021 02:20:22 - INFO - __main__ - Step 36250: {'lr': 0.00043679245703969627, 'samples': 6960000, 'steps': 36249, 'loss/train': 1.2449549436569214} -11/07/2021 02:20:23 - INFO - __main__ - Step 36251: {'lr': 0.00043678892995930685, 'samples': 6960192, 'steps': 36250, 'loss/train': 1.9472393989562988} -11/07/2021 02:20:23 - INFO - __main__ - Step 36252: {'lr': 0.00043678540279475314, 'samples': 6960384, 'steps': 36251, 'loss/train': 1.4475023746490479} -11/07/2021 02:20:23 - INFO - __main__ - Step 36253: {'lr': 0.0004367818755460369, 'samples': 6960576, 'steps': 36252, 'loss/train': 1.3991891145706177} -11/07/2021 02:20:24 - INFO - __main__ - Step 36254: {'lr': 0.00043677834821315956, 'samples': 6960768, 'steps': 36253, 'loss/train': 0.6604613661766052} -11/07/2021 02:20:25 - INFO - __main__ - Step 36255: {'lr': 0.00043677482079612276, 'samples': 6960960, 'steps': 36254, 'loss/train': 1.4953562021255493} -11/07/2021 02:20:25 - INFO - __main__ - Step 36256: {'lr': 0.00043677129329492814, 'samples': 6961152, 'steps': 36255, 'loss/train': 1.5402852296829224} -11/07/2021 02:20:26 - INFO - __main__ - Step 36257: {'lr': 0.00043676776570957725, 'samples': 6961344, 'steps': 36256, 'loss/train': 1.8290815353393555} -11/07/2021 02:20:26 - INFO - __main__ - Step 36258: {'lr': 0.0004367642380400717, 'samples': 6961536, 'steps': 36257, 'loss/train': 1.542945146560669} -11/07/2021 02:20:26 - INFO - __main__ - Step 36259: {'lr': 0.0004367607102864131, 'samples': 6961728, 'steps': 36258, 'loss/train': 1.9337825775146484} -11/07/2021 02:20:27 - INFO - __main__ - Step 36260: {'lr': 0.00043675718244860296, 'samples': 6961920, 'steps': 36259, 'loss/train': 1.3398491144180298} -11/07/2021 02:20:28 - INFO - __main__ - Step 36261: {'lr': 0.00043675365452664286, 'samples': 6962112, 'steps': 36260, 'loss/train': 1.286232352256775} -11/07/2021 02:20:28 - INFO - __main__ - Step 36262: {'lr': 0.0004367501265205345, 'samples': 6962304, 'steps': 36261, 'loss/train': 1.5498446226119995} -11/07/2021 02:20:28 - INFO - __main__ - Step 36263: {'lr': 0.0004367465984302794, 'samples': 6962496, 'steps': 36262, 'loss/train': 1.3904285430908203} -11/07/2021 02:20:29 - INFO - __main__ - Step 36264: {'lr': 0.0004367430702558792, 'samples': 6962688, 'steps': 36263, 'loss/train': 1.4619240760803223} -11/07/2021 02:20:30 - INFO - __main__ - Step 36265: {'lr': 0.0004367395419973355, 'samples': 6962880, 'steps': 36264, 'loss/train': 1.400206208229065} -11/07/2021 02:20:30 - INFO - __main__ - Step 36266: {'lr': 0.00043673601365464975, 'samples': 6963072, 'steps': 36265, 'loss/train': 1.4053270816802979} -11/07/2021 02:20:31 - INFO - __main__ - Step 36267: {'lr': 0.00043673248522782364, 'samples': 6963264, 'steps': 36266, 'loss/train': 1.2345603704452515} -11/07/2021 02:20:31 - INFO - __main__ - Step 36268: {'lr': 0.0004367289567168588, 'samples': 6963456, 'steps': 36267, 'loss/train': 1.3548353910446167} -11/07/2021 02:20:31 - INFO - __main__ - Step 36269: {'lr': 0.00043672542812175675, 'samples': 6963648, 'steps': 36268, 'loss/train': 1.8345106840133667} -11/07/2021 02:20:32 - INFO - __main__ - Step 36270: {'lr': 0.00043672189944251905, 'samples': 6963840, 'steps': 36269, 'loss/train': 1.6689475774765015} -11/07/2021 02:20:33 - INFO - __main__ - Step 36271: {'lr': 0.0004367183706791474, 'samples': 6964032, 'steps': 36270, 'loss/train': 1.5568740367889404} -11/07/2021 02:20:33 - INFO - __main__ - Step 36272: {'lr': 0.0004367148418316434, 'samples': 6964224, 'steps': 36271, 'loss/train': 1.1501420736312866} -11/07/2021 02:20:33 - INFO - __main__ - Step 36273: {'lr': 0.0004367113129000085, 'samples': 6964416, 'steps': 36272, 'loss/train': 1.8946768045425415} -11/07/2021 02:20:34 - INFO - __main__ - Step 36274: {'lr': 0.00043670778388424434, 'samples': 6964608, 'steps': 36273, 'loss/train': 1.0662518739700317} -11/07/2021 02:20:35 - INFO - __main__ - Step 36275: {'lr': 0.00043670425478435263, 'samples': 6964800, 'steps': 36274, 'loss/train': 1.4347180128097534} -11/07/2021 02:20:35 - INFO - __main__ - Step 36276: {'lr': 0.00043670072560033474, 'samples': 6964992, 'steps': 36275, 'loss/train': 1.8485217094421387} -11/07/2021 02:20:35 - INFO - __main__ - Step 36277: {'lr': 0.00043669719633219247, 'samples': 6965184, 'steps': 36276, 'loss/train': 1.1847352981567383} -11/07/2021 02:20:36 - INFO - __main__ - Step 36278: {'lr': 0.0004366936669799273, 'samples': 6965376, 'steps': 36277, 'loss/train': 1.7239091396331787} -11/07/2021 02:20:36 - INFO - __main__ - Step 36279: {'lr': 0.0004366901375435408, 'samples': 6965568, 'steps': 36278, 'loss/train': 1.6254451274871826} -11/07/2021 02:20:37 - INFO - __main__ - Step 36280: {'lr': 0.0004366866080230347, 'samples': 6965760, 'steps': 36279, 'loss/train': 0.7942847609519958} -11/07/2021 02:20:37 - INFO - __main__ - Step 36281: {'lr': 0.0004366830784184104, 'samples': 6965952, 'steps': 36280, 'loss/train': 1.7162615060806274} -11/07/2021 02:20:38 - INFO - __main__ - Step 36282: {'lr': 0.00043667954872966965, 'samples': 6966144, 'steps': 36281, 'loss/train': 1.5471854209899902} -11/07/2021 02:20:38 - INFO - __main__ - Step 36283: {'lr': 0.000436676018956814, 'samples': 6966336, 'steps': 36282, 'loss/train': 1.441980004310608} -11/07/2021 02:20:38 - INFO - __main__ - Step 36284: {'lr': 0.0004366724890998449, 'samples': 6966528, 'steps': 36283, 'loss/train': 1.545427918434143} -11/07/2021 02:20:40 - INFO - __main__ - Step 36285: {'lr': 0.00043666895915876416, 'samples': 6966720, 'steps': 36284, 'loss/train': 1.0880110263824463} -11/07/2021 02:20:40 - INFO - __main__ - Step 36286: {'lr': 0.0004366654291335732, 'samples': 6966912, 'steps': 36285, 'loss/train': 1.8009814023971558} -11/07/2021 02:20:40 - INFO - __main__ - Step 36287: {'lr': 0.00043666189902427367, 'samples': 6967104, 'steps': 36286, 'loss/train': 1.3985798358917236} -11/07/2021 02:20:41 - INFO - __main__ - Step 36288: {'lr': 0.00043665836883086725, 'samples': 6967296, 'steps': 36287, 'loss/train': 1.3476370573043823} -11/07/2021 02:20:41 - INFO - __main__ - Step 36289: {'lr': 0.0004366548385533554, 'samples': 6967488, 'steps': 36288, 'loss/train': 0.9500797390937805} -11/07/2021 02:20:42 - INFO - __main__ - Step 36290: {'lr': 0.0004366513081917398, 'samples': 6967680, 'steps': 36289, 'loss/train': 1.5582741498947144} -11/07/2021 02:20:42 - INFO - __main__ - Step 36291: {'lr': 0.00043664777774602196, 'samples': 6967872, 'steps': 36290, 'loss/train': 1.4448840618133545} -11/07/2021 02:20:43 - INFO - __main__ - Step 36292: {'lr': 0.00043664424721620354, 'samples': 6968064, 'steps': 36291, 'loss/train': 1.062769889831543} -11/07/2021 02:20:43 - INFO - __main__ - Step 36293: {'lr': 0.00043664071660228605, 'samples': 6968256, 'steps': 36292, 'loss/train': 1.2941185235977173} -11/07/2021 02:20:43 - INFO - __main__ - Step 36294: {'lr': 0.00043663718590427117, 'samples': 6968448, 'steps': 36293, 'loss/train': 1.5335264205932617} -11/07/2021 02:20:44 - INFO - __main__ - Step 36295: {'lr': 0.0004366336551221605, 'samples': 6968640, 'steps': 36294, 'loss/train': 1.4312095642089844} -11/07/2021 02:20:45 - INFO - __main__ - Step 36296: {'lr': 0.0004366301242559555, 'samples': 6968832, 'steps': 36295, 'loss/train': 1.7201085090637207} -11/07/2021 02:20:45 - INFO - __main__ - Step 36297: {'lr': 0.00043662659330565793, 'samples': 6969024, 'steps': 36296, 'loss/train': 1.400758147239685} -11/07/2021 02:20:45 - INFO - __main__ - Step 36298: {'lr': 0.00043662306227126917, 'samples': 6969216, 'steps': 36297, 'loss/train': 1.5006085634231567} -11/07/2021 02:20:46 - INFO - __main__ - Step 36299: {'lr': 0.00043661953115279104, 'samples': 6969408, 'steps': 36298, 'loss/train': 0.569497287273407} -11/07/2021 02:20:46 - INFO - __main__ - Step 36300: {'lr': 0.000436615999950225, 'samples': 6969600, 'steps': 36299, 'loss/train': 0.7550137639045715} -11/07/2021 02:20:47 - INFO - __main__ - Step 36301: {'lr': 0.0004366124686635727, 'samples': 6969792, 'steps': 36300, 'loss/train': 1.804154396057129} -11/07/2021 02:20:47 - INFO - __main__ - Step 36302: {'lr': 0.00043660893729283564, 'samples': 6969984, 'steps': 36301, 'loss/train': 1.6032986640930176} -11/07/2021 02:20:48 - INFO - __main__ - Step 36303: {'lr': 0.0004366054058380155, 'samples': 6970176, 'steps': 36302, 'loss/train': 1.344807505607605} -11/07/2021 02:20:48 - INFO - __main__ - Step 36304: {'lr': 0.0004366018742991139, 'samples': 6970368, 'steps': 36303, 'loss/train': 1.6097887754440308} -11/07/2021 02:20:49 - INFO - __main__ - Step 36305: {'lr': 0.00043659834267613227, 'samples': 6970560, 'steps': 36304, 'loss/train': 1.4944956302642822} -11/07/2021 02:20:50 - INFO - __main__ - Step 36306: {'lr': 0.0004365948109690724, 'samples': 6970752, 'steps': 36305, 'loss/train': 1.6863945722579956} -11/07/2021 02:20:50 - INFO - __main__ - Step 36307: {'lr': 0.0004365912791779357, 'samples': 6970944, 'steps': 36306, 'loss/train': 1.2818877696990967} -11/07/2021 02:20:50 - INFO - __main__ - Step 36308: {'lr': 0.00043658774730272393, 'samples': 6971136, 'steps': 36307, 'loss/train': 1.4839028120040894} -11/07/2021 02:20:51 - INFO - __main__ - Step 36309: {'lr': 0.00043658421534343856, 'samples': 6971328, 'steps': 36308, 'loss/train': 1.585021734237671} -11/07/2021 02:20:51 - INFO - __main__ - Step 36310: {'lr': 0.0004365806833000813, 'samples': 6971520, 'steps': 36309, 'loss/train': 1.2770180702209473} -11/07/2021 02:20:52 - INFO - __main__ - Step 36311: {'lr': 0.0004365771511726535, 'samples': 6971712, 'steps': 36310, 'loss/train': 1.1752785444259644} -11/07/2021 02:20:53 - INFO - __main__ - Step 36312: {'lr': 0.00043657361896115706, 'samples': 6971904, 'steps': 36311, 'loss/train': 1.58674156665802} -11/07/2021 02:20:53 - INFO - __main__ - Step 36313: {'lr': 0.0004365700866655934, 'samples': 6972096, 'steps': 36312, 'loss/train': 1.2428057193756104} -11/07/2021 02:20:53 - INFO - __main__ - Step 36314: {'lr': 0.00043656655428596407, 'samples': 6972288, 'steps': 36313, 'loss/train': 1.4094693660736084} -11/07/2021 02:20:54 - INFO - __main__ - Step 36315: {'lr': 0.0004365630218222708, 'samples': 6972480, 'steps': 36314, 'loss/train': 1.0743906497955322} -11/07/2021 02:20:54 - INFO - __main__ - Step 36316: {'lr': 0.00043655948927451505, 'samples': 6972672, 'steps': 36315, 'loss/train': 0.8647530674934387} -11/07/2021 02:20:55 - INFO - __main__ - Step 36317: {'lr': 0.0004365559566426985, 'samples': 6972864, 'steps': 36316, 'loss/train': 1.3983964920043945} -11/07/2021 02:20:55 - INFO - __main__ - Step 36318: {'lr': 0.0004365524239268227, 'samples': 6973056, 'steps': 36317, 'loss/train': 1.3517965078353882} -11/07/2021 02:20:56 - INFO - __main__ - Step 36319: {'lr': 0.00043654889112688933, 'samples': 6973248, 'steps': 36318, 'loss/train': 1.9730541706085205} -11/07/2021 02:20:56 - INFO - __main__ - Step 36320: {'lr': 0.00043654535824289985, 'samples': 6973440, 'steps': 36319, 'loss/train': 1.7234567403793335} -11/07/2021 02:20:56 - INFO - __main__ - Step 36321: {'lr': 0.0004365418252748559, 'samples': 6973632, 'steps': 36320, 'loss/train': 1.5906174182891846} -11/07/2021 02:20:57 - INFO - __main__ - Step 36322: {'lr': 0.0004365382922227591, 'samples': 6973824, 'steps': 36321, 'loss/train': 1.6755872964859009} -11/07/2021 02:20:58 - INFO - __main__ - Step 36323: {'lr': 0.000436534759086611, 'samples': 6974016, 'steps': 36322, 'loss/train': 1.397365689277649} -11/07/2021 02:20:58 - INFO - __main__ - Step 36324: {'lr': 0.00043653122586641323, 'samples': 6974208, 'steps': 36323, 'loss/train': 1.6728856563568115} -11/07/2021 02:20:58 - INFO - __main__ - Step 36325: {'lr': 0.0004365276925621674, 'samples': 6974400, 'steps': 36324, 'loss/train': 1.2448979616165161} -11/07/2021 02:20:59 - INFO - __main__ - Step 36326: {'lr': 0.0004365241591738751, 'samples': 6974592, 'steps': 36325, 'loss/train': 1.7174886465072632} -11/07/2021 02:20:59 - INFO - __main__ - Step 36327: {'lr': 0.0004365206257015378, 'samples': 6974784, 'steps': 36326, 'loss/train': 1.560450792312622} -11/07/2021 02:21:00 - INFO - __main__ - Step 36328: {'lr': 0.0004365170921451572, 'samples': 6974976, 'steps': 36327, 'loss/train': 1.1287360191345215} -11/07/2021 02:21:01 - INFO - __main__ - Step 36329: {'lr': 0.00043651355850473495, 'samples': 6975168, 'steps': 36328, 'loss/train': 1.4507524967193604} -11/07/2021 02:21:01 - INFO - __main__ - Step 36330: {'lr': 0.0004365100247802725, 'samples': 6975360, 'steps': 36329, 'loss/train': 1.696042776107788} -11/07/2021 02:21:01 - INFO - __main__ - Step 36331: {'lr': 0.0004365064909717715, 'samples': 6975552, 'steps': 36330, 'loss/train': 1.5696899890899658} -11/07/2021 02:21:03 - INFO - __main__ - Step 36332: {'lr': 0.0004365029570792336, 'samples': 6975744, 'steps': 36331, 'loss/train': 1.5845402479171753} -11/07/2021 02:21:03 - INFO - __main__ - Step 36333: {'lr': 0.00043649942310266035, 'samples': 6975936, 'steps': 36332, 'loss/train': 0.9859981536865234} -11/07/2021 02:21:04 - INFO - __main__ - Step 36334: {'lr': 0.00043649588904205326, 'samples': 6976128, 'steps': 36333, 'loss/train': 1.5097932815551758} -11/07/2021 02:21:04 - INFO - __main__ - Step 36335: {'lr': 0.0004364923548974141, 'samples': 6976320, 'steps': 36334, 'loss/train': 2.3358113765716553} -11/07/2021 02:21:04 - INFO - __main__ - Step 36336: {'lr': 0.0004364888206687443, 'samples': 6976512, 'steps': 36335, 'loss/train': 2.372626304626465} -11/07/2021 02:21:05 - INFO - __main__ - Step 36337: {'lr': 0.00043648528635604556, 'samples': 6976704, 'steps': 36336, 'loss/train': 0.7707897424697876} -11/07/2021 02:21:06 - INFO - __main__ - Step 36338: {'lr': 0.00043648175195931937, 'samples': 6976896, 'steps': 36337, 'loss/train': 1.2917875051498413} -11/07/2021 02:21:06 - INFO - __main__ - Step 36339: {'lr': 0.0004364782174785674, 'samples': 6977088, 'steps': 36338, 'loss/train': 1.872575283050537} -11/07/2021 02:21:06 - INFO - __main__ - Step 36340: {'lr': 0.0004364746829137912, 'samples': 6977280, 'steps': 36339, 'loss/train': 1.193190336227417} -11/07/2021 02:21:07 - INFO - __main__ - Step 36341: {'lr': 0.0004364711482649925, 'samples': 6977472, 'steps': 36340, 'loss/train': 1.3252372741699219} -11/07/2021 02:21:07 - INFO - __main__ - Step 36342: {'lr': 0.00043646761353217266, 'samples': 6977664, 'steps': 36341, 'loss/train': 1.2717697620391846} -11/07/2021 02:21:08 - INFO - __main__ - Step 36343: {'lr': 0.0004364640787153334, 'samples': 6977856, 'steps': 36342, 'loss/train': 1.3853132724761963} -11/07/2021 02:21:08 - INFO - __main__ - Step 36344: {'lr': 0.0004364605438144764, 'samples': 6978048, 'steps': 36343, 'loss/train': 1.5299681425094604} -11/07/2021 02:21:09 - INFO - __main__ - Step 36345: {'lr': 0.000436457008829603, 'samples': 6978240, 'steps': 36344, 'loss/train': 1.5941821336746216} -11/07/2021 02:21:09 - INFO - __main__ - Step 36346: {'lr': 0.00043645347376071507, 'samples': 6978432, 'steps': 36345, 'loss/train': 1.7303555011749268} -11/07/2021 02:21:09 - INFO - __main__ - Step 36347: {'lr': 0.0004364499386078141, 'samples': 6978624, 'steps': 36346, 'loss/train': 1.1477150917053223} -11/07/2021 02:21:11 - INFO - __main__ - Step 36348: {'lr': 0.00043644640337090157, 'samples': 6978816, 'steps': 36347, 'loss/train': 1.7781087160110474} -11/07/2021 02:21:11 - INFO - __main__ - Step 36349: {'lr': 0.0004364428680499792, 'samples': 6979008, 'steps': 36348, 'loss/train': 1.4340267181396484} -11/07/2021 02:21:11 - INFO - __main__ - Step 36350: {'lr': 0.0004364393326450486, 'samples': 6979200, 'steps': 36349, 'loss/train': 1.4936268329620361} -11/07/2021 02:21:12 - INFO - __main__ - Step 36351: {'lr': 0.00043643579715611124, 'samples': 6979392, 'steps': 36350, 'loss/train': 1.516542673110962} -11/07/2021 02:21:12 - INFO - __main__ - Step 36352: {'lr': 0.00043643226158316886, 'samples': 6979584, 'steps': 36351, 'loss/train': 3.1933603286743164} -11/07/2021 02:21:12 - INFO - __main__ - Step 36353: {'lr': 0.00043642872592622293, 'samples': 6979776, 'steps': 36352, 'loss/train': 1.3439143896102905} -11/07/2021 02:21:13 - INFO - __main__ - Step 36354: {'lr': 0.0004364251901852751, 'samples': 6979968, 'steps': 36353, 'loss/train': 1.352319359779358} -11/07/2021 02:21:14 - INFO - __main__ - Step 36355: {'lr': 0.000436421654360327, 'samples': 6980160, 'steps': 36354, 'loss/train': 1.4244893789291382} -11/07/2021 02:21:14 - INFO - __main__ - Step 36356: {'lr': 0.00043641811845138016, 'samples': 6980352, 'steps': 36355, 'loss/train': 1.4638200998306274} -11/07/2021 02:21:14 - INFO - __main__ - Step 36357: {'lr': 0.0004364145824584361, 'samples': 6980544, 'steps': 36356, 'loss/train': 1.4082454442977905} -11/07/2021 02:21:15 - INFO - __main__ - Step 36358: {'lr': 0.00043641104638149656, 'samples': 6980736, 'steps': 36357, 'loss/train': 1.9423258304595947} -11/07/2021 02:21:16 - INFO - __main__ - Step 36359: {'lr': 0.00043640751022056316, 'samples': 6980928, 'steps': 36358, 'loss/train': 1.1190898418426514} -11/07/2021 02:21:16 - INFO - __main__ - Step 36360: {'lr': 0.00043640397397563737, 'samples': 6981120, 'steps': 36359, 'loss/train': 1.2740697860717773} -11/07/2021 02:21:16 - INFO - __main__ - Step 36361: {'lr': 0.00043640043764672077, 'samples': 6981312, 'steps': 36360, 'loss/train': 1.6111739873886108} -11/07/2021 02:21:17 - INFO - __main__ - Step 36362: {'lr': 0.00043639690123381503, 'samples': 6981504, 'steps': 36361, 'loss/train': 0.9121442437171936} -11/07/2021 02:21:17 - INFO - __main__ - Step 36363: {'lr': 0.00043639336473692174, 'samples': 6981696, 'steps': 36362, 'loss/train': 1.8936302661895752} -11/07/2021 02:21:18 - INFO - __main__ - Step 36364: {'lr': 0.00043638982815604247, 'samples': 6981888, 'steps': 36363, 'loss/train': 1.2038345336914062} -11/07/2021 02:21:19 - INFO - __main__ - Step 36365: {'lr': 0.00043638629149117883, 'samples': 6982080, 'steps': 36364, 'loss/train': 1.5564985275268555} -11/07/2021 02:21:19 - INFO - __main__ - Step 36366: {'lr': 0.0004363827547423324, 'samples': 6982272, 'steps': 36365, 'loss/train': 4.262648582458496} -11/07/2021 02:21:19 - INFO - __main__ - Step 36367: {'lr': 0.00043637921790950476, 'samples': 6982464, 'steps': 36366, 'loss/train': 1.6036688089370728} -11/07/2021 02:21:20 - INFO - __main__ - Step 36368: {'lr': 0.00043637568099269753, 'samples': 6982656, 'steps': 36367, 'loss/train': 1.0962079763412476} -11/07/2021 02:21:21 - INFO - __main__ - Step 36369: {'lr': 0.00043637214399191234, 'samples': 6982848, 'steps': 36368, 'loss/train': 1.3688468933105469} -11/07/2021 02:21:21 - INFO - __main__ - Step 36370: {'lr': 0.00043636860690715064, 'samples': 6983040, 'steps': 36369, 'loss/train': 1.4799058437347412} -11/07/2021 02:21:21 - INFO - __main__ - Step 36371: {'lr': 0.00043636506973841424, 'samples': 6983232, 'steps': 36370, 'loss/train': 1.8318012952804565} -11/07/2021 02:21:22 - INFO - __main__ - Step 36372: {'lr': 0.00043636153248570453, 'samples': 6983424, 'steps': 36371, 'loss/train': 1.3730608224868774} -11/07/2021 02:21:22 - INFO - __main__ - Step 36373: {'lr': 0.0004363579951490232, 'samples': 6983616, 'steps': 36372, 'loss/train': 1.7554099559783936} -11/07/2021 02:21:22 - INFO - __main__ - Step 36374: {'lr': 0.0004363544577283718, 'samples': 6983808, 'steps': 36373, 'loss/train': 1.4895075559616089} -11/07/2021 02:21:24 - INFO - __main__ - Step 36375: {'lr': 0.0004363509202237521, 'samples': 6984000, 'steps': 36374, 'loss/train': 1.4852935075759888} -11/07/2021 02:21:24 - INFO - __main__ - Step 36376: {'lr': 0.0004363473826351654, 'samples': 6984192, 'steps': 36375, 'loss/train': 1.0466312170028687} -11/07/2021 02:21:24 - INFO - __main__ - Step 36377: {'lr': 0.0004363438449626135, 'samples': 6984384, 'steps': 36376, 'loss/train': 1.2807888984680176} -11/07/2021 02:21:25 - INFO - __main__ - Step 36378: {'lr': 0.000436340307206098, 'samples': 6984576, 'steps': 36377, 'loss/train': 1.4843051433563232} -11/07/2021 02:21:25 - INFO - __main__ - Step 36379: {'lr': 0.00043633676936562026, 'samples': 6984768, 'steps': 36378, 'loss/train': 1.423012375831604} -11/07/2021 02:21:26 - INFO - __main__ - Step 36380: {'lr': 0.0004363332314411822, 'samples': 6984960, 'steps': 36379, 'loss/train': 1.7427172660827637} -11/07/2021 02:21:26 - INFO - __main__ - Step 36381: {'lr': 0.0004363296934327852, 'samples': 6985152, 'steps': 36380, 'loss/train': 1.600832223892212} -11/07/2021 02:21:27 - INFO - __main__ - Step 36382: {'lr': 0.00043632615534043096, 'samples': 6985344, 'steps': 36381, 'loss/train': 2.1246707439422607} -11/07/2021 02:21:27 - INFO - __main__ - Step 36383: {'lr': 0.00043632261716412097, 'samples': 6985536, 'steps': 36382, 'loss/train': 0.906044065952301} -11/07/2021 02:21:27 - INFO - __main__ - Step 36384: {'lr': 0.0004363190789038569, 'samples': 6985728, 'steps': 36383, 'loss/train': 1.3539206981658936} -11/07/2021 02:21:28 - INFO - __main__ - Step 36385: {'lr': 0.0004363155405596404, 'samples': 6985920, 'steps': 36384, 'loss/train': 1.7368046045303345} -11/07/2021 02:21:29 - INFO - __main__ - Step 36386: {'lr': 0.00043631200213147296, 'samples': 6986112, 'steps': 36385, 'loss/train': 1.5509334802627563} -11/07/2021 02:21:29 - INFO - __main__ - Step 36387: {'lr': 0.0004363084636193561, 'samples': 6986304, 'steps': 36386, 'loss/train': 1.6322015523910522} -11/07/2021 02:21:29 - INFO - __main__ - Step 36388: {'lr': 0.0004363049250232917, 'samples': 6986496, 'steps': 36387, 'loss/train': 0.9802109003067017} -11/07/2021 02:21:30 - INFO - __main__ - Step 36389: {'lr': 0.000436301386343281, 'samples': 6986688, 'steps': 36388, 'loss/train': 1.4826627969741821} -11/07/2021 02:21:31 - INFO - __main__ - Step 36390: {'lr': 0.0004362978475793259, 'samples': 6986880, 'steps': 36389, 'loss/train': 1.9039173126220703} -11/07/2021 02:21:31 - INFO - __main__ - Step 36391: {'lr': 0.00043629430873142773, 'samples': 6987072, 'steps': 36390, 'loss/train': 0.39275264739990234} -11/07/2021 02:21:31 - INFO - __main__ - Step 36392: {'lr': 0.00043629076979958837, 'samples': 6987264, 'steps': 36391, 'loss/train': 1.394723653793335} -11/07/2021 02:21:32 - INFO - __main__ - Step 36393: {'lr': 0.00043628723078380916, 'samples': 6987456, 'steps': 36392, 'loss/train': 1.5663731098175049} -11/07/2021 02:21:32 - INFO - __main__ - Step 36394: {'lr': 0.0004362836916840919, 'samples': 6987648, 'steps': 36393, 'loss/train': 1.3121269941329956} -11/07/2021 02:21:33 - INFO - __main__ - Step 36395: {'lr': 0.00043628015250043794, 'samples': 6987840, 'steps': 36394, 'loss/train': 1.107160210609436} -11/07/2021 02:21:33 - INFO - __main__ - Step 36396: {'lr': 0.00043627661323284914, 'samples': 6988032, 'steps': 36395, 'loss/train': 1.2629873752593994} -11/07/2021 02:21:34 - INFO - __main__ - Step 36397: {'lr': 0.00043627307388132693, 'samples': 6988224, 'steps': 36396, 'loss/train': 2.3927032947540283} -11/07/2021 02:21:34 - INFO - __main__ - Step 36398: {'lr': 0.0004362695344458729, 'samples': 6988416, 'steps': 36397, 'loss/train': 1.5395231246948242} -11/07/2021 02:21:35 - INFO - __main__ - Step 36399: {'lr': 0.00043626599492648877, 'samples': 6988608, 'steps': 36398, 'loss/train': 1.4821674823760986} -11/07/2021 02:21:36 - INFO - __main__ - Step 36400: {'lr': 0.000436262455323176, 'samples': 6988800, 'steps': 36399, 'loss/train': 1.1854488849639893} -11/07/2021 02:21:36 - INFO - __main__ - Step 36401: {'lr': 0.0004362589156359363, 'samples': 6988992, 'steps': 36400, 'loss/train': 1.455713152885437} -11/07/2021 02:21:36 - INFO - __main__ - Step 36402: {'lr': 0.00043625537586477114, 'samples': 6989184, 'steps': 36401, 'loss/train': 1.39728581905365} -11/07/2021 02:21:37 - INFO - __main__ - Step 36403: {'lr': 0.00043625183600968224, 'samples': 6989376, 'steps': 36402, 'loss/train': 1.764100193977356} -11/07/2021 02:21:37 - INFO - __main__ - Step 36404: {'lr': 0.00043624829607067105, 'samples': 6989568, 'steps': 36403, 'loss/train': 1.5400242805480957} -11/07/2021 02:21:37 - INFO - __main__ - Step 36405: {'lr': 0.0004362447560477394, 'samples': 6989760, 'steps': 36404, 'loss/train': 1.6310828924179077} -11/07/2021 02:21:38 - INFO - __main__ - Step 36406: {'lr': 0.0004362412159408886, 'samples': 6989952, 'steps': 36405, 'loss/train': 1.5401593446731567} -11/07/2021 02:21:39 - INFO - __main__ - Step 36407: {'lr': 0.0004362376757501205, 'samples': 6990144, 'steps': 36406, 'loss/train': 0.9658600091934204} -11/07/2021 02:21:39 - INFO - __main__ - Step 36408: {'lr': 0.00043623413547543645, 'samples': 6990336, 'steps': 36407, 'loss/train': 1.0938903093338013} -11/07/2021 02:21:39 - INFO - __main__ - Step 36409: {'lr': 0.00043623059511683826, 'samples': 6990528, 'steps': 36408, 'loss/train': 1.7532463073730469} -11/07/2021 02:21:40 - INFO - __main__ - Step 36410: {'lr': 0.0004362270546743274, 'samples': 6990720, 'steps': 36409, 'loss/train': 1.4016672372817993} -11/07/2021 02:21:41 - INFO - __main__ - Step 36411: {'lr': 0.0004362235141479055, 'samples': 6990912, 'steps': 36410, 'loss/train': 1.5435714721679688} -11/07/2021 02:21:41 - INFO - __main__ - Step 36412: {'lr': 0.0004362199735375742, 'samples': 6991104, 'steps': 36411, 'loss/train': 1.1211869716644287} -11/07/2021 02:21:42 - INFO - __main__ - Step 36413: {'lr': 0.000436216432843335, 'samples': 6991296, 'steps': 36412, 'loss/train': 0.736153244972229} -11/07/2021 02:21:42 - INFO - __main__ - Step 36414: {'lr': 0.00043621289206518957, 'samples': 6991488, 'steps': 36413, 'loss/train': 1.6953119039535522} -11/07/2021 02:21:42 - INFO - __main__ - Step 36415: {'lr': 0.00043620935120313955, 'samples': 6991680, 'steps': 36414, 'loss/train': 1.5244629383087158} -11/07/2021 02:21:44 - INFO - __main__ - Step 36416: {'lr': 0.0004362058102571864, 'samples': 6991872, 'steps': 36415, 'loss/train': 1.6046603918075562} -11/07/2021 02:21:44 - INFO - __main__ - Step 36417: {'lr': 0.00043620226922733174, 'samples': 6992064, 'steps': 36416, 'loss/train': 1.2570933103561401} -11/07/2021 02:21:44 - INFO - __main__ - Step 36418: {'lr': 0.0004361987281135773, 'samples': 6992256, 'steps': 36417, 'loss/train': 1.9624028205871582} -11/07/2021 02:21:45 - INFO - __main__ - Step 36419: {'lr': 0.00043619518691592453, 'samples': 6992448, 'steps': 36418, 'loss/train': 0.7464272975921631} -11/07/2021 02:21:45 - INFO - __main__ - Step 36420: {'lr': 0.00043619164563437506, 'samples': 6992640, 'steps': 36419, 'loss/train': 2.0012402534484863} -11/07/2021 02:21:46 - INFO - __main__ - Step 36421: {'lr': 0.0004361881042689306, 'samples': 6992832, 'steps': 36420, 'loss/train': 0.9991865754127502} -11/07/2021 02:21:46 - INFO - __main__ - Step 36422: {'lr': 0.00043618456281959263, 'samples': 6993024, 'steps': 36421, 'loss/train': 1.4010941982269287} -11/07/2021 02:21:47 - INFO - __main__ - Step 36423: {'lr': 0.0004361810212863627, 'samples': 6993216, 'steps': 36422, 'loss/train': 1.5331019163131714} -11/07/2021 02:21:47 - INFO - __main__ - Step 36424: {'lr': 0.0004361774796692425, 'samples': 6993408, 'steps': 36423, 'loss/train': 1.7541043758392334} -11/07/2021 02:21:47 - INFO - __main__ - Step 36425: {'lr': 0.00043617393796823367, 'samples': 6993600, 'steps': 36424, 'loss/train': 1.4145983457565308} -11/07/2021 02:21:48 - INFO - __main__ - Step 36426: {'lr': 0.00043617039618333765, 'samples': 6993792, 'steps': 36425, 'loss/train': 1.6360641717910767} -11/07/2021 02:21:49 - INFO - __main__ - Step 36427: {'lr': 0.00043616685431455615, 'samples': 6993984, 'steps': 36426, 'loss/train': 1.2648183107376099} -11/07/2021 02:21:49 - INFO - __main__ - Step 36428: {'lr': 0.0004361633123618908, 'samples': 6994176, 'steps': 36427, 'loss/train': 1.10480797290802} -11/07/2021 02:21:49 - INFO - __main__ - Step 36429: {'lr': 0.00043615977032534305, 'samples': 6994368, 'steps': 36428, 'loss/train': 1.7303485870361328} -11/07/2021 02:21:50 - INFO - __main__ - Step 36430: {'lr': 0.00043615622820491464, 'samples': 6994560, 'steps': 36429, 'loss/train': 1.4921950101852417} -11/07/2021 02:21:50 - INFO - __main__ - Step 36431: {'lr': 0.00043615268600060705, 'samples': 6994752, 'steps': 36430, 'loss/train': 1.4308103322982788} -11/07/2021 02:21:52 - INFO - __main__ - Step 36432: {'lr': 0.000436149143712422, 'samples': 6994944, 'steps': 36431, 'loss/train': 1.1433682441711426} -11/07/2021 02:21:52 - INFO - __main__ - Step 36433: {'lr': 0.0004361456013403609, 'samples': 6995136, 'steps': 36432, 'loss/train': 1.522065281867981} -11/07/2021 02:21:53 - INFO - __main__ - Step 36434: {'lr': 0.00043614205888442553, 'samples': 6995328, 'steps': 36433, 'loss/train': 1.2452378273010254} -11/07/2021 02:21:53 - INFO - __main__ - Step 36435: {'lr': 0.00043613851634461743, 'samples': 6995520, 'steps': 36434, 'loss/train': 1.5099252462387085} -11/07/2021 02:21:53 - INFO - __main__ - Step 36436: {'lr': 0.00043613497372093827, 'samples': 6995712, 'steps': 36435, 'loss/train': 1.4279507398605347} -11/07/2021 02:21:54 - INFO - __main__ - Step 36437: {'lr': 0.0004361314310133894, 'samples': 6995904, 'steps': 36436, 'loss/train': 1.2324637174606323} -11/07/2021 02:21:54 - INFO - __main__ - Step 36438: {'lr': 0.00043612788822197266, 'samples': 6996096, 'steps': 36437, 'loss/train': 1.9096089601516724} -11/07/2021 02:21:54 - INFO - __main__ - Step 36439: {'lr': 0.0004361243453466896, 'samples': 6996288, 'steps': 36438, 'loss/train': 1.8450305461883545} -11/07/2021 02:21:55 - INFO - __main__ - Step 36440: {'lr': 0.0004361208023875417, 'samples': 6996480, 'steps': 36439, 'loss/train': 1.8311712741851807} -11/07/2021 02:21:56 - INFO - __main__ - Step 36441: {'lr': 0.00043611725934453074, 'samples': 6996672, 'steps': 36440, 'loss/train': 1.368140459060669} -11/07/2021 02:21:56 - INFO - __main__ - Step 36442: {'lr': 0.00043611371621765817, 'samples': 6996864, 'steps': 36441, 'loss/train': 1.5333380699157715} -11/07/2021 02:21:57 - INFO - __main__ - Step 36443: {'lr': 0.0004361101730069256, 'samples': 6997056, 'steps': 36442, 'loss/train': 0.9707183837890625} -11/07/2021 02:21:57 - INFO - __main__ - Step 36444: {'lr': 0.00043610662971233465, 'samples': 6997248, 'steps': 36443, 'loss/train': 1.5515861511230469} -11/07/2021 02:21:58 - INFO - __main__ - Step 36445: {'lr': 0.00043610308633388695, 'samples': 6997440, 'steps': 36444, 'loss/train': 1.4722208976745605} -11/07/2021 02:21:58 - INFO - __main__ - Step 36446: {'lr': 0.0004360995428715841, 'samples': 6997632, 'steps': 36445, 'loss/train': 1.4910660982131958} -11/07/2021 02:21:59 - INFO - __main__ - Step 36447: {'lr': 0.00043609599932542764, 'samples': 6997824, 'steps': 36446, 'loss/train': 1.9633461236953735} -11/07/2021 02:21:59 - INFO - __main__ - Step 36448: {'lr': 0.00043609245569541924, 'samples': 6998016, 'steps': 36447, 'loss/train': 1.5884859561920166} -11/07/2021 02:21:59 - INFO - __main__ - Step 36449: {'lr': 0.00043608891198156037, 'samples': 6998208, 'steps': 36448, 'loss/train': 1.4491236209869385} -11/07/2021 02:22:00 - INFO - __main__ - Step 36450: {'lr': 0.0004360853681838528, 'samples': 6998400, 'steps': 36449, 'loss/train': 1.4041427373886108} -11/07/2021 02:22:01 - INFO - __main__ - Step 36451: {'lr': 0.0004360818243022979, 'samples': 6998592, 'steps': 36450, 'loss/train': 1.247759222984314} -11/07/2021 02:22:01 - INFO - __main__ - Step 36452: {'lr': 0.00043607828033689753, 'samples': 6998784, 'steps': 36451, 'loss/train': 1.145880937576294} -11/07/2021 02:22:01 - INFO - __main__ - Step 36453: {'lr': 0.000436074736287653, 'samples': 6998976, 'steps': 36452, 'loss/train': 1.6394306421279907} -11/07/2021 02:22:02 - INFO - __main__ - Step 36454: {'lr': 0.00043607119215456625, 'samples': 6999168, 'steps': 36453, 'loss/train': 1.3804353475570679} -11/07/2021 02:22:03 - INFO - __main__ - Step 36455: {'lr': 0.00043606764793763865, 'samples': 6999360, 'steps': 36454, 'loss/train': 1.7423021793365479} -11/07/2021 02:22:03 - INFO - __main__ - Step 36456: {'lr': 0.00043606410363687177, 'samples': 6999552, 'steps': 36455, 'loss/train': 1.3185689449310303} -11/07/2021 02:22:04 - INFO - __main__ - Step 36457: {'lr': 0.00043606055925226727, 'samples': 6999744, 'steps': 36456, 'loss/train': 1.5543650388717651} -11/07/2021 02:22:04 - INFO - __main__ - Step 36458: {'lr': 0.0004360570147838269, 'samples': 6999936, 'steps': 36457, 'loss/train': 1.7427715063095093} -11/07/2021 02:22:04 - INFO - __main__ - Step 36459: {'lr': 0.00043605347023155193, 'samples': 7000128, 'steps': 36458, 'loss/train': 1.5395492315292358} -11/07/2021 02:22:05 - INFO - __main__ - Step 36460: {'lr': 0.0004360499255954442, 'samples': 7000320, 'steps': 36459, 'loss/train': 1.176275372505188} -11/07/2021 02:22:06 - INFO - __main__ - Step 36461: {'lr': 0.0004360463808755053, 'samples': 7000512, 'steps': 36460, 'loss/train': 1.3563385009765625} -11/07/2021 02:22:06 - INFO - __main__ - Step 36462: {'lr': 0.00043604283607173673, 'samples': 7000704, 'steps': 36461, 'loss/train': 1.5283113718032837} -11/07/2021 02:22:06 - INFO - __main__ - Step 36463: {'lr': 0.0004360392911841401, 'samples': 7000896, 'steps': 36462, 'loss/train': 1.3267556428909302} -11/07/2021 02:22:07 - INFO - __main__ - Step 36464: {'lr': 0.0004360357462127171, 'samples': 7001088, 'steps': 36463, 'loss/train': 1.5522664785385132} -11/07/2021 02:22:07 - INFO - __main__ - Step 36465: {'lr': 0.0004360322011574692, 'samples': 7001280, 'steps': 36464, 'loss/train': 1.4915170669555664} -11/07/2021 02:22:08 - INFO - __main__ - Step 36466: {'lr': 0.00043602865601839817, 'samples': 7001472, 'steps': 36465, 'loss/train': 1.3296517133712769} -11/07/2021 02:22:08 - INFO - __main__ - Step 36467: {'lr': 0.00043602511079550535, 'samples': 7001664, 'steps': 36466, 'loss/train': 1.2712076902389526} -11/07/2021 02:22:09 - INFO - __main__ - Step 36468: {'lr': 0.0004360215654887926, 'samples': 7001856, 'steps': 36467, 'loss/train': 1.1578062772750854} -11/07/2021 02:22:09 - INFO - __main__ - Step 36469: {'lr': 0.0004360180200982613, 'samples': 7002048, 'steps': 36468, 'loss/train': 1.7998279333114624} -11/07/2021 02:22:09 - INFO - __main__ - Step 36470: {'lr': 0.00043601447462391317, 'samples': 7002240, 'steps': 36469, 'loss/train': 1.8373972177505493} -11/07/2021 02:22:10 - INFO - __main__ - Step 36471: {'lr': 0.00043601092906574986, 'samples': 7002432, 'steps': 36470, 'loss/train': 1.81533944606781} -11/07/2021 02:22:11 - INFO - __main__ - Step 36472: {'lr': 0.0004360073834237729, 'samples': 7002624, 'steps': 36471, 'loss/train': 1.2724525928497314} -11/07/2021 02:22:11 - INFO - __main__ - Step 36473: {'lr': 0.0004360038376979838, 'samples': 7002816, 'steps': 36472, 'loss/train': 1.720353364944458} -11/07/2021 02:22:12 - INFO - __main__ - Step 36474: {'lr': 0.0004360002918883843, 'samples': 7003008, 'steps': 36473, 'loss/train': 1.4903210401535034} -11/07/2021 02:22:12 - INFO - __main__ - Step 36475: {'lr': 0.00043599674599497593, 'samples': 7003200, 'steps': 36474, 'loss/train': 1.5465788841247559} -11/07/2021 02:22:13 - INFO - __main__ - Step 36476: {'lr': 0.00043599320001776025, 'samples': 7003392, 'steps': 36475, 'loss/train': 1.2533528804779053} -11/07/2021 02:22:13 - INFO - __main__ - Step 36477: {'lr': 0.00043598965395673893, 'samples': 7003584, 'steps': 36476, 'loss/train': 1.5747464895248413} -11/07/2021 02:22:14 - INFO - __main__ - Step 36478: {'lr': 0.0004359861078119136, 'samples': 7003776, 'steps': 36477, 'loss/train': 1.5156866312026978} -11/07/2021 02:22:14 - INFO - __main__ - Step 36479: {'lr': 0.00043598256158328575, 'samples': 7003968, 'steps': 36478, 'loss/train': 1.7108465433120728} -11/07/2021 02:22:14 - INFO - __main__ - Step 36480: {'lr': 0.00043597901527085703, 'samples': 7004160, 'steps': 36479, 'loss/train': 0.9954426884651184} -11/07/2021 02:22:15 - INFO - __main__ - Step 36481: {'lr': 0.000435975468874629, 'samples': 7004352, 'steps': 36480, 'loss/train': 1.4760842323303223} -11/07/2021 02:22:16 - INFO - __main__ - Step 36482: {'lr': 0.00043597192239460336, 'samples': 7004544, 'steps': 36481, 'loss/train': 1.4253824949264526} -11/07/2021 02:22:16 - INFO - __main__ - Step 36483: {'lr': 0.00043596837583078165, 'samples': 7004736, 'steps': 36482, 'loss/train': 1.7219206094741821} -11/07/2021 02:22:16 - INFO - __main__ - Step 36484: {'lr': 0.0004359648291831654, 'samples': 7004928, 'steps': 36483, 'loss/train': 1.0681475400924683} -11/07/2021 02:22:17 - INFO - __main__ - Step 36485: {'lr': 0.0004359612824517563, 'samples': 7005120, 'steps': 36484, 'loss/train': 1.6380879878997803} -11/07/2021 02:22:18 - INFO - __main__ - Step 36486: {'lr': 0.0004359577356365559, 'samples': 7005312, 'steps': 36485, 'loss/train': 1.3437206745147705} -11/07/2021 02:22:18 - INFO - __main__ - Step 36487: {'lr': 0.00043595418873756584, 'samples': 7005504, 'steps': 36486, 'loss/train': 1.4168643951416016} -11/07/2021 02:22:18 - INFO - __main__ - Step 36488: {'lr': 0.0004359506417547876, 'samples': 7005696, 'steps': 36487, 'loss/train': 1.3627259731292725} -11/07/2021 02:22:19 - INFO - __main__ - Step 36489: {'lr': 0.000435947094688223, 'samples': 7005888, 'steps': 36488, 'loss/train': 1.4367139339447021} -11/07/2021 02:22:19 - INFO - __main__ - Step 36490: {'lr': 0.0004359435475378735, 'samples': 7006080, 'steps': 36489, 'loss/train': 1.403445839881897} -11/07/2021 02:22:20 - INFO - __main__ - Step 36491: {'lr': 0.0004359400003037406, 'samples': 7006272, 'steps': 36490, 'loss/train': 1.608238697052002} -11/07/2021 02:22:20 - INFO - __main__ - Step 36492: {'lr': 0.0004359364529858261, 'samples': 7006464, 'steps': 36491, 'loss/train': 2.306702136993408} -11/07/2021 02:22:21 - INFO - __main__ - Step 36493: {'lr': 0.00043593290558413143, 'samples': 7006656, 'steps': 36492, 'loss/train': 1.7007659673690796} -11/07/2021 02:22:21 - INFO - __main__ - Step 36494: {'lr': 0.0004359293580986583, 'samples': 7006848, 'steps': 36493, 'loss/train': 1.8951630592346191} -11/07/2021 02:22:21 - INFO - __main__ - Step 36495: {'lr': 0.0004359258105294083, 'samples': 7007040, 'steps': 36494, 'loss/train': 1.4092471599578857} -11/07/2021 02:22:23 - INFO - __main__ - Step 36496: {'lr': 0.0004359222628763829, 'samples': 7007232, 'steps': 36495, 'loss/train': 1.3110671043395996} -11/07/2021 02:22:23 - INFO - __main__ - Step 36497: {'lr': 0.0004359187151395839, 'samples': 7007424, 'steps': 36496, 'loss/train': 1.6679835319519043} -11/07/2021 02:22:24 - INFO - __main__ - Step 36498: {'lr': 0.0004359151673190127, 'samples': 7007616, 'steps': 36497, 'loss/train': 1.349755883216858} -11/07/2021 02:22:24 - INFO - __main__ - Step 36499: {'lr': 0.0004359116194146711, 'samples': 7007808, 'steps': 36498, 'loss/train': 1.5411666631698608} -11/07/2021 02:22:24 - INFO - __main__ - Step 36500: {'lr': 0.0004359080714265605, 'samples': 7008000, 'steps': 36499, 'loss/train': 1.6351027488708496} -11/07/2021 02:22:25 - INFO - __main__ - Step 36501: {'lr': 0.00043590452335468265, 'samples': 7008192, 'steps': 36500, 'loss/train': 0.6577228307723999} -11/07/2021 02:22:26 - INFO - __main__ - Step 36502: {'lr': 0.00043590097519903917, 'samples': 7008384, 'steps': 36501, 'loss/train': 0.4223167896270752} -11/07/2021 02:22:26 - INFO - __main__ - Step 36503: {'lr': 0.0004358974269596314, 'samples': 7008576, 'steps': 36502, 'loss/train': 1.6163660287857056} -11/07/2021 02:22:26 - INFO - __main__ - Step 36504: {'lr': 0.00043589387863646125, 'samples': 7008768, 'steps': 36503, 'loss/train': 1.5610636472702026} -11/07/2021 02:22:27 - INFO - __main__ - Step 36505: {'lr': 0.0004358903302295301, 'samples': 7008960, 'steps': 36504, 'loss/train': 1.8605214357376099} -11/07/2021 02:22:27 - INFO - __main__ - Step 36506: {'lr': 0.0004358867817388397, 'samples': 7009152, 'steps': 36505, 'loss/train': 1.8321130275726318} -11/07/2021 02:22:28 - INFO - __main__ - Step 36507: {'lr': 0.0004358832331643916, 'samples': 7009344, 'steps': 36506, 'loss/train': 1.1233673095703125} -11/07/2021 02:22:29 - INFO - __main__ - Step 36508: {'lr': 0.0004358796845061873, 'samples': 7009536, 'steps': 36507, 'loss/train': 1.2812395095825195} -11/07/2021 02:22:29 - INFO - __main__ - Step 36509: {'lr': 0.00043587613576422855, 'samples': 7009728, 'steps': 36508, 'loss/train': 1.5616999864578247} -11/07/2021 02:22:29 - INFO - __main__ - Step 36510: {'lr': 0.00043587258693851685, 'samples': 7009920, 'steps': 36509, 'loss/train': 1.5353094339370728} -11/07/2021 02:22:30 - INFO - __main__ - Step 36511: {'lr': 0.0004358690380290539, 'samples': 7010112, 'steps': 36510, 'loss/train': 1.4021555185317993} -11/07/2021 02:22:31 - INFO - __main__ - Step 36512: {'lr': 0.00043586548903584113, 'samples': 7010304, 'steps': 36511, 'loss/train': 1.5102307796478271} -11/07/2021 02:22:31 - INFO - __main__ - Step 36513: {'lr': 0.0004358619399588802, 'samples': 7010496, 'steps': 36512, 'loss/train': 1.0852004289627075} -11/07/2021 02:22:31 - INFO - __main__ - Step 36514: {'lr': 0.0004358583907981729, 'samples': 7010688, 'steps': 36513, 'loss/train': 1.7945281267166138} -11/07/2021 02:22:32 - INFO - __main__ - Step 36515: {'lr': 0.0004358548415537206, 'samples': 7010880, 'steps': 36514, 'loss/train': 0.9975671768188477} -11/07/2021 02:22:32 - INFO - __main__ - Step 36516: {'lr': 0.000435851292225525, 'samples': 7011072, 'steps': 36515, 'loss/train': 1.5559824705123901} -11/07/2021 02:22:32 - INFO - __main__ - Step 36517: {'lr': 0.0004358477428135876, 'samples': 7011264, 'steps': 36516, 'loss/train': 1.3623974323272705} -11/07/2021 02:22:34 - INFO - __main__ - Step 36518: {'lr': 0.00043584419331791014, 'samples': 7011456, 'steps': 36517, 'loss/train': 1.2668063640594482} -11/07/2021 02:22:34 - INFO - __main__ - Step 36519: {'lr': 0.0004358406437384942, 'samples': 7011648, 'steps': 36518, 'loss/train': 1.5969531536102295} -11/07/2021 02:22:34 - INFO - __main__ - Step 36520: {'lr': 0.0004358370940753412, 'samples': 7011840, 'steps': 36519, 'loss/train': 0.9871808886528015} -11/07/2021 02:22:35 - INFO - __main__ - Step 36521: {'lr': 0.000435833544328453, 'samples': 7012032, 'steps': 36520, 'loss/train': 1.0032232999801636} -11/07/2021 02:22:35 - INFO - __main__ - Step 36522: {'lr': 0.00043582999449783103, 'samples': 7012224, 'steps': 36521, 'loss/train': 1.8288178443908691} -11/07/2021 02:22:36 - INFO - __main__ - Step 36523: {'lr': 0.0004358264445834769, 'samples': 7012416, 'steps': 36522, 'loss/train': 1.3894726037979126} -11/07/2021 02:22:37 - INFO - __main__ - Step 36524: {'lr': 0.00043582289458539224, 'samples': 7012608, 'steps': 36523, 'loss/train': 1.4437963962554932} -11/07/2021 02:22:37 - INFO - __main__ - Step 36525: {'lr': 0.00043581934450357876, 'samples': 7012800, 'steps': 36524, 'loss/train': 1.240963339805603} -11/07/2021 02:22:37 - INFO - __main__ - Step 36526: {'lr': 0.0004358157943380379, 'samples': 7012992, 'steps': 36525, 'loss/train': 1.2418889999389648} -11/07/2021 02:22:38 - INFO - __main__ - Step 36527: {'lr': 0.00043581224408877116, 'samples': 7013184, 'steps': 36526, 'loss/train': 1.6116684675216675} -11/07/2021 02:22:38 - INFO - __main__ - Step 36528: {'lr': 0.00043580869375578046, 'samples': 7013376, 'steps': 36527, 'loss/train': 1.7534099817276} -11/07/2021 02:22:39 - INFO - __main__ - Step 36529: {'lr': 0.00043580514333906717, 'samples': 7013568, 'steps': 36528, 'loss/train': 1.2966219186782837} -11/07/2021 02:22:39 - INFO - __main__ - Step 36530: {'lr': 0.000435801592838633, 'samples': 7013760, 'steps': 36529, 'loss/train': 1.220832347869873} -11/07/2021 02:22:40 - INFO - __main__ - Step 36531: {'lr': 0.0004357980422544794, 'samples': 7013952, 'steps': 36530, 'loss/train': 1.5813374519348145} -11/07/2021 02:22:40 - INFO - __main__ - Step 36532: {'lr': 0.00043579449158660815, 'samples': 7014144, 'steps': 36531, 'loss/train': 1.3674315214157104} -11/07/2021 02:22:40 - INFO - __main__ - Step 36533: {'lr': 0.0004357909408350208, 'samples': 7014336, 'steps': 36532, 'loss/train': 1.3425029516220093} -11/07/2021 02:22:42 - INFO - __main__ - Step 36534: {'lr': 0.00043578738999971886, 'samples': 7014528, 'steps': 36533, 'loss/train': 1.2998322248458862} -11/07/2021 02:22:42 - INFO - __main__ - Step 36535: {'lr': 0.000435783839080704, 'samples': 7014720, 'steps': 36534, 'loss/train': 1.6563870906829834} -11/07/2021 02:22:42 - INFO - __main__ - Step 36536: {'lr': 0.00043578028807797774, 'samples': 7014912, 'steps': 36535, 'loss/train': 1.437389850616455} -11/07/2021 02:22:43 - INFO - __main__ - Step 36537: {'lr': 0.0004357767369915419, 'samples': 7015104, 'steps': 36536, 'loss/train': 1.6424156427383423} -11/07/2021 02:22:43 - INFO - __main__ - Step 36538: {'lr': 0.0004357731858213978, 'samples': 7015296, 'steps': 36537, 'loss/train': 1.26777982711792} -11/07/2021 02:22:44 - INFO - __main__ - Step 36539: {'lr': 0.0004357696345675472, 'samples': 7015488, 'steps': 36538, 'loss/train': 1.8215261697769165} -11/07/2021 02:22:44 - INFO - __main__ - Step 36540: {'lr': 0.00043576608322999167, 'samples': 7015680, 'steps': 36539, 'loss/train': 1.4973750114440918} -11/07/2021 02:22:45 - INFO - __main__ - Step 36541: {'lr': 0.0004357625318087328, 'samples': 7015872, 'steps': 36540, 'loss/train': 1.465362787246704} -11/07/2021 02:22:45 - INFO - __main__ - Step 36542: {'lr': 0.00043575898030377225, 'samples': 7016064, 'steps': 36541, 'loss/train': 1.8516111373901367} -11/07/2021 02:22:45 - INFO - __main__ - Step 36543: {'lr': 0.00043575542871511155, 'samples': 7016256, 'steps': 36542, 'loss/train': 1.786741852760315} -11/07/2021 02:22:46 - INFO - __main__ - Step 36544: {'lr': 0.00043575187704275234, 'samples': 7016448, 'steps': 36543, 'loss/train': 1.696166753768921} -11/07/2021 02:22:47 - INFO - __main__ - Step 36545: {'lr': 0.0004357483252866961, 'samples': 7016640, 'steps': 36544, 'loss/train': 1.6869455575942993} -11/07/2021 02:22:47 - INFO - __main__ - Step 36546: {'lr': 0.00043574477344694463, 'samples': 7016832, 'steps': 36545, 'loss/train': 1.7611186504364014} -11/07/2021 02:22:47 - INFO - __main__ - Step 36547: {'lr': 0.0004357412215234994, 'samples': 7017024, 'steps': 36546, 'loss/train': 1.2742689847946167} -11/07/2021 02:22:48 - INFO - __main__ - Step 36548: {'lr': 0.00043573766951636206, 'samples': 7017216, 'steps': 36547, 'loss/train': 0.5363247990608215} -11/07/2021 02:22:49 - INFO - __main__ - Step 36549: {'lr': 0.00043573411742553415, 'samples': 7017408, 'steps': 36548, 'loss/train': 1.056071162223816} -11/07/2021 02:22:49 - INFO - __main__ - Step 36550: {'lr': 0.0004357305652510174, 'samples': 7017600, 'steps': 36549, 'loss/train': 1.721631646156311} -11/07/2021 02:22:50 - INFO - __main__ - Step 36551: {'lr': 0.00043572701299281327, 'samples': 7017792, 'steps': 36550, 'loss/train': 1.5491282939910889} -11/07/2021 02:22:50 - INFO - __main__ - Step 36552: {'lr': 0.0004357234606509234, 'samples': 7017984, 'steps': 36551, 'loss/train': 1.3987603187561035} -11/07/2021 02:22:50 - INFO - __main__ - Step 36553: {'lr': 0.00043571990822534936, 'samples': 7018176, 'steps': 36552, 'loss/train': 0.201223224401474} -11/07/2021 02:22:51 - INFO - __main__ - Step 36554: {'lr': 0.00043571635571609287, 'samples': 7018368, 'steps': 36553, 'loss/train': 1.3155345916748047} -11/07/2021 02:22:51 - INFO - __main__ - Step 36555: {'lr': 0.00043571280312315543, 'samples': 7018560, 'steps': 36554, 'loss/train': 0.42579716444015503} -11/07/2021 02:22:52 - INFO - __main__ - Step 36556: {'lr': 0.0004357092504465386, 'samples': 7018752, 'steps': 36555, 'loss/train': 1.812836766242981} -11/07/2021 02:22:52 - INFO - __main__ - Step 36557: {'lr': 0.00043570569768624416, 'samples': 7018944, 'steps': 36556, 'loss/train': 1.2242940664291382} -11/07/2021 02:22:53 - INFO - __main__ - Step 36558: {'lr': 0.00043570214484227353, 'samples': 7019136, 'steps': 36557, 'loss/train': 1.6130986213684082} -11/07/2021 02:22:54 - INFO - __main__ - Step 36559: {'lr': 0.00043569859191462847, 'samples': 7019328, 'steps': 36558, 'loss/train': 1.3331043720245361} -11/07/2021 02:22:54 - INFO - __main__ - Step 36560: {'lr': 0.0004356950389033104, 'samples': 7019520, 'steps': 36559, 'loss/train': 1.8335299491882324} -11/07/2021 02:22:54 - INFO - __main__ - Step 36561: {'lr': 0.0004356914858083211, 'samples': 7019712, 'steps': 36560, 'loss/train': 1.64692223072052} -11/07/2021 02:22:55 - INFO - __main__ - Step 36562: {'lr': 0.00043568793262966195, 'samples': 7019904, 'steps': 36561, 'loss/train': 1.4393301010131836} -11/07/2021 02:22:55 - INFO - __main__ - Step 36563: {'lr': 0.00043568437936733473, 'samples': 7020096, 'steps': 36562, 'loss/train': 1.5390021800994873} -11/07/2021 02:22:56 - INFO - __main__ - Step 36564: {'lr': 0.0004356808260213411, 'samples': 7020288, 'steps': 36563, 'loss/train': 1.780922293663025} -11/07/2021 02:22:57 - INFO - __main__ - Step 36565: {'lr': 0.00043567727259168244, 'samples': 7020480, 'steps': 36564, 'loss/train': 1.7212803363800049} -11/07/2021 02:22:57 - INFO - __main__ - Step 36566: {'lr': 0.0004356737190783605, 'samples': 7020672, 'steps': 36565, 'loss/train': 2.4525327682495117} -11/07/2021 02:22:57 - INFO - __main__ - Step 36567: {'lr': 0.00043567016548137685, 'samples': 7020864, 'steps': 36566, 'loss/train': 1.0905752182006836} -11/07/2021 02:22:58 - INFO - __main__ - Step 36568: {'lr': 0.00043566661180073304, 'samples': 7021056, 'steps': 36567, 'loss/train': 0.7993988394737244} -11/07/2021 02:22:59 - INFO - __main__ - Step 36569: {'lr': 0.00043566305803643073, 'samples': 7021248, 'steps': 36568, 'loss/train': 1.5785763263702393} -11/07/2021 02:22:59 - INFO - __main__ - Step 36570: {'lr': 0.00043565950418847154, 'samples': 7021440, 'steps': 36569, 'loss/train': 1.1388972997665405} -11/07/2021 02:23:00 - INFO - __main__ - Step 36571: {'lr': 0.00043565595025685705, 'samples': 7021632, 'steps': 36570, 'loss/train': 1.6771471500396729} -11/07/2021 02:23:00 - INFO - __main__ - Step 36572: {'lr': 0.0004356523962415889, 'samples': 7021824, 'steps': 36571, 'loss/train': 1.3315123319625854} -11/07/2021 02:23:00 - INFO - __main__ - Step 36573: {'lr': 0.00043564884214266855, 'samples': 7022016, 'steps': 36572, 'loss/train': 1.4760372638702393} -11/07/2021 02:23:01 - INFO - __main__ - Step 36574: {'lr': 0.00043564528796009774, 'samples': 7022208, 'steps': 36573, 'loss/train': 1.5408062934875488} -11/07/2021 02:23:02 - INFO - __main__ - Step 36575: {'lr': 0.00043564173369387807, 'samples': 7022400, 'steps': 36574, 'loss/train': 1.4901825189590454} -11/07/2021 02:23:02 - INFO - __main__ - Step 36576: {'lr': 0.00043563817934401107, 'samples': 7022592, 'steps': 36575, 'loss/train': 1.4674835205078125} -11/07/2021 02:23:03 - INFO - __main__ - Step 36577: {'lr': 0.0004356346249104983, 'samples': 7022784, 'steps': 36576, 'loss/train': 1.30613112449646} -11/07/2021 02:23:03 - INFO - __main__ - Step 36578: {'lr': 0.0004356310703933415, 'samples': 7022976, 'steps': 36577, 'loss/train': 0.35052648186683655} -11/07/2021 02:23:03 - INFO - __main__ - Step 36579: {'lr': 0.00043562751579254215, 'samples': 7023168, 'steps': 36578, 'loss/train': 1.4443248510360718} -11/07/2021 02:23:04 - INFO - __main__ - Step 36580: {'lr': 0.00043562396110810196, 'samples': 7023360, 'steps': 36579, 'loss/train': 2.2824246883392334} -11/07/2021 02:23:05 - INFO - __main__ - Step 36581: {'lr': 0.00043562040634002245, 'samples': 7023552, 'steps': 36580, 'loss/train': 1.9743016958236694} -11/07/2021 02:23:05 - INFO - __main__ - Step 36582: {'lr': 0.0004356168514883053, 'samples': 7023744, 'steps': 36581, 'loss/train': 1.9472196102142334} -11/07/2021 02:23:06 - INFO - __main__ - Step 36583: {'lr': 0.000435613296552952, 'samples': 7023936, 'steps': 36582, 'loss/train': 1.6587493419647217} -11/07/2021 02:23:06 - INFO - __main__ - Step 36584: {'lr': 0.0004356097415339643, 'samples': 7024128, 'steps': 36583, 'loss/train': 1.0660061836242676} -11/07/2021 02:23:07 - INFO - __main__ - Step 36585: {'lr': 0.0004356061864313436, 'samples': 7024320, 'steps': 36584, 'loss/train': 1.33091402053833} -11/07/2021 02:23:07 - INFO - __main__ - Step 36586: {'lr': 0.0004356026312450917, 'samples': 7024512, 'steps': 36585, 'loss/train': 1.5652490854263306} -11/07/2021 02:23:08 - INFO - __main__ - Step 36587: {'lr': 0.00043559907597521007, 'samples': 7024704, 'steps': 36586, 'loss/train': 1.6647975444793701} -11/07/2021 02:23:08 - INFO - __main__ - Step 36588: {'lr': 0.00043559552062170037, 'samples': 7024896, 'steps': 36587, 'loss/train': 1.09634268283844} -11/07/2021 02:23:08 - INFO - __main__ - Step 36589: {'lr': 0.00043559196518456425, 'samples': 7025088, 'steps': 36588, 'loss/train': 0.9539096355438232} -11/07/2021 02:23:10 - INFO - __main__ - Step 36590: {'lr': 0.0004355884096638032, 'samples': 7025280, 'steps': 36589, 'loss/train': 0.8309692740440369} -11/07/2021 02:23:10 - INFO - __main__ - Step 36591: {'lr': 0.0004355848540594188, 'samples': 7025472, 'steps': 36590, 'loss/train': 0.5594035387039185} -11/07/2021 02:23:10 - INFO - __main__ - Step 36592: {'lr': 0.00043558129837141285, 'samples': 7025664, 'steps': 36591, 'loss/train': 1.1925039291381836} -11/07/2021 02:23:11 - INFO - __main__ - Step 36593: {'lr': 0.0004355777425997868, 'samples': 7025856, 'steps': 36592, 'loss/train': 1.5464204549789429} -11/07/2021 02:23:11 - INFO - __main__ - Step 36594: {'lr': 0.0004355741867445423, 'samples': 7026048, 'steps': 36593, 'loss/train': 1.5897024869918823} -11/07/2021 02:23:12 - INFO - __main__ - Step 36595: {'lr': 0.00043557063080568094, 'samples': 7026240, 'steps': 36594, 'loss/train': 0.15254853665828705} -11/07/2021 02:23:12 - INFO - __main__ - Step 36596: {'lr': 0.00043556707478320425, 'samples': 7026432, 'steps': 36595, 'loss/train': 1.6399388313293457} -11/07/2021 02:23:13 - INFO - __main__ - Step 36597: {'lr': 0.000435563518677114, 'samples': 7026624, 'steps': 36596, 'loss/train': 1.5131480693817139} -11/07/2021 02:23:13 - INFO - __main__ - Step 36598: {'lr': 0.00043555996248741157, 'samples': 7026816, 'steps': 36597, 'loss/train': 1.5443997383117676} -11/07/2021 02:23:13 - INFO - __main__ - Step 36599: {'lr': 0.00043555640621409874, 'samples': 7027008, 'steps': 36598, 'loss/train': 1.3245813846588135} -11/07/2021 02:23:14 - INFO - __main__ - Step 36600: {'lr': 0.000435552849857177, 'samples': 7027200, 'steps': 36599, 'loss/train': 1.3773012161254883} -11/07/2021 02:23:15 - INFO - __main__ - Step 36601: {'lr': 0.0004355492934166481, 'samples': 7027392, 'steps': 36600, 'loss/train': 1.1193139553070068} -11/07/2021 02:23:15 - INFO - __main__ - Step 36602: {'lr': 0.00043554573689251355, 'samples': 7027584, 'steps': 36601, 'loss/train': 1.734878420829773} -11/07/2021 02:23:16 - INFO - __main__ - Step 36603: {'lr': 0.00043554218028477493, 'samples': 7027776, 'steps': 36602, 'loss/train': 1.6818993091583252} -11/07/2021 02:23:16 - INFO - __main__ - Step 36604: {'lr': 0.0004355386235934339, 'samples': 7027968, 'steps': 36603, 'loss/train': 1.6259936094284058} -11/07/2021 02:23:16 - INFO - __main__ - Step 36605: {'lr': 0.0004355350668184919, 'samples': 7028160, 'steps': 36604, 'loss/train': 1.6531397104263306} -11/07/2021 02:23:17 - INFO - __main__ - Step 36606: {'lr': 0.0004355315099599508, 'samples': 7028352, 'steps': 36605, 'loss/train': 1.665704369544983} -11/07/2021 02:23:18 - INFO - __main__ - Step 36607: {'lr': 0.000435527953017812, 'samples': 7028544, 'steps': 36606, 'loss/train': 2.162864923477173} -11/07/2021 02:23:18 - INFO - __main__ - Step 36608: {'lr': 0.00043552439599207714, 'samples': 7028736, 'steps': 36607, 'loss/train': 1.3255237340927124} -11/07/2021 02:23:18 - INFO - __main__ - Step 36609: {'lr': 0.00043552083888274794, 'samples': 7028928, 'steps': 36608, 'loss/train': 2.0128681659698486} -11/07/2021 02:23:19 - INFO - __main__ - Step 36610: {'lr': 0.00043551728168982583, 'samples': 7029120, 'steps': 36609, 'loss/train': 1.391836404800415} -11/07/2021 02:23:20 - INFO - __main__ - Step 36611: {'lr': 0.0004355137244133126, 'samples': 7029312, 'steps': 36610, 'loss/train': 0.7241917252540588} -11/07/2021 02:23:20 - INFO - __main__ - Step 36612: {'lr': 0.00043551016705320965, 'samples': 7029504, 'steps': 36611, 'loss/train': 1.4233378171920776} -11/07/2021 02:23:21 - INFO - __main__ - Step 36613: {'lr': 0.00043550660960951874, 'samples': 7029696, 'steps': 36612, 'loss/train': 1.660108208656311} -11/07/2021 02:23:21 - INFO - __main__ - Step 36614: {'lr': 0.0004355030520822414, 'samples': 7029888, 'steps': 36613, 'loss/train': 1.3485804796218872} -11/07/2021 02:23:21 - INFO - __main__ - Step 36615: {'lr': 0.00043549949447137915, 'samples': 7030080, 'steps': 36614, 'loss/train': 1.6928882598876953} -11/07/2021 02:23:22 - INFO - __main__ - Step 36616: {'lr': 0.00043549593677693385, 'samples': 7030272, 'steps': 36615, 'loss/train': 0.6086564064025879} -11/07/2021 02:23:23 - INFO - __main__ - Step 36617: {'lr': 0.0004354923789989068, 'samples': 7030464, 'steps': 36616, 'loss/train': 1.5144529342651367} -11/07/2021 02:23:23 - INFO - __main__ - Step 36618: {'lr': 0.0004354888211372998, 'samples': 7030656, 'steps': 36617, 'loss/train': 1.6198910474777222} -11/07/2021 02:23:24 - INFO - __main__ - Step 36619: {'lr': 0.0004354852631921145, 'samples': 7030848, 'steps': 36618, 'loss/train': 1.5385793447494507} -11/07/2021 02:23:24 - INFO - __main__ - Step 36620: {'lr': 0.0004354817051633523, 'samples': 7031040, 'steps': 36619, 'loss/train': 1.7353585958480835} -11/07/2021 02:23:24 - INFO - __main__ - Step 36621: {'lr': 0.00043547814705101486, 'samples': 7031232, 'steps': 36620, 'loss/train': 1.6816554069519043} -11/07/2021 02:23:25 - INFO - __main__ - Step 36622: {'lr': 0.00043547458885510393, 'samples': 7031424, 'steps': 36621, 'loss/train': 1.4382396936416626} -11/07/2021 02:23:26 - INFO - __main__ - Step 36623: {'lr': 0.00043547103057562097, 'samples': 7031616, 'steps': 36622, 'loss/train': 1.4511727094650269} -11/07/2021 02:23:26 - INFO - __main__ - Step 36624: {'lr': 0.00043546747221256764, 'samples': 7031808, 'steps': 36623, 'loss/train': 1.165474772453308} -11/07/2021 02:23:26 - INFO - __main__ - Step 36625: {'lr': 0.00043546391376594553, 'samples': 7032000, 'steps': 36624, 'loss/train': 0.9305865168571472} -11/07/2021 02:23:27 - INFO - __main__ - Step 36626: {'lr': 0.0004354603552357562, 'samples': 7032192, 'steps': 36625, 'loss/train': 1.2832889556884766} -11/07/2021 02:23:28 - INFO - __main__ - Step 36627: {'lr': 0.0004354567966220013, 'samples': 7032384, 'steps': 36626, 'loss/train': 0.542655348777771} -11/07/2021 02:23:28 - INFO - __main__ - Step 36628: {'lr': 0.0004354532379246825, 'samples': 7032576, 'steps': 36627, 'loss/train': 0.9858495593070984} -11/07/2021 02:23:28 - INFO - __main__ - Step 36629: {'lr': 0.0004354496791438013, 'samples': 7032768, 'steps': 36628, 'loss/train': 1.6054434776306152} -11/07/2021 02:23:29 - INFO - __main__ - Step 36630: {'lr': 0.0004354461202793593, 'samples': 7032960, 'steps': 36629, 'loss/train': 1.5780274868011475} -11/07/2021 02:23:29 - INFO - __main__ - Step 36631: {'lr': 0.00043544256133135815, 'samples': 7033152, 'steps': 36630, 'loss/train': 1.2616537809371948} -11/07/2021 02:23:30 - INFO - __main__ - Step 36632: {'lr': 0.0004354390022997995, 'samples': 7033344, 'steps': 36631, 'loss/train': 1.5695288181304932} -11/07/2021 02:23:31 - INFO - __main__ - Step 36633: {'lr': 0.0004354354431846848, 'samples': 7033536, 'steps': 36632, 'loss/train': 0.17641419172286987} -11/07/2021 02:23:31 - INFO - __main__ - Step 36634: {'lr': 0.00043543188398601586, 'samples': 7033728, 'steps': 36633, 'loss/train': 1.5314275026321411} -11/07/2021 02:23:31 - INFO - __main__ - Step 36635: {'lr': 0.00043542832470379415, 'samples': 7033920, 'steps': 36634, 'loss/train': 0.9428682923316956} -11/07/2021 02:23:32 - INFO - __main__ - Step 36636: {'lr': 0.0004354247653380212, 'samples': 7034112, 'steps': 36635, 'loss/train': 1.2503483295440674} -11/07/2021 02:23:33 - INFO - __main__ - Step 36637: {'lr': 0.00043542120588869885, 'samples': 7034304, 'steps': 36636, 'loss/train': 1.3206701278686523} -11/07/2021 02:23:33 - INFO - __main__ - Step 36638: {'lr': 0.0004354176463558284, 'samples': 7034496, 'steps': 36637, 'loss/train': 1.1053410768508911} -11/07/2021 02:23:33 - INFO - __main__ - Step 36639: {'lr': 0.00043541408673941173, 'samples': 7034688, 'steps': 36638, 'loss/train': 1.5448483228683472} -11/07/2021 02:23:34 - INFO - __main__ - Step 36640: {'lr': 0.00043541052703945034, 'samples': 7034880, 'steps': 36639, 'loss/train': 1.4707204103469849} -11/07/2021 02:23:34 - INFO - __main__ - Step 36641: {'lr': 0.0004354069672559458, 'samples': 7035072, 'steps': 36640, 'loss/train': 0.9098020195960999} -11/07/2021 02:23:35 - INFO - __main__ - Step 36642: {'lr': 0.0004354034073888997, 'samples': 7035264, 'steps': 36641, 'loss/train': 1.4666318893432617} -11/07/2021 02:23:35 - INFO - __main__ - Step 36643: {'lr': 0.00043539984743831375, 'samples': 7035456, 'steps': 36642, 'loss/train': 0.9557470083236694} -11/07/2021 02:23:36 - INFO - __main__ - Step 36644: {'lr': 0.0004353962874041895, 'samples': 7035648, 'steps': 36643, 'loss/train': 1.6082971096038818} -11/07/2021 02:23:36 - INFO - __main__ - Step 36645: {'lr': 0.0004353927272865285, 'samples': 7035840, 'steps': 36644, 'loss/train': 1.5697284936904907} -11/07/2021 02:23:36 - INFO - __main__ - Step 36646: {'lr': 0.0004353891670853324, 'samples': 7036032, 'steps': 36645, 'loss/train': 1.5849113464355469} -11/07/2021 02:23:37 - INFO - __main__ - Step 36647: {'lr': 0.00043538560680060287, 'samples': 7036224, 'steps': 36646, 'loss/train': 1.685613751411438} -11/07/2021 02:23:38 - INFO - __main__ - Step 36648: {'lr': 0.00043538204643234137, 'samples': 7036416, 'steps': 36647, 'loss/train': 2.1813371181488037} -11/07/2021 02:23:38 - INFO - __main__ - Step 36649: {'lr': 0.0004353784859805496, 'samples': 7036608, 'steps': 36648, 'loss/train': 1.4566642045974731} -11/07/2021 02:23:38 - INFO - __main__ - Step 36650: {'lr': 0.00043537492544522917, 'samples': 7036800, 'steps': 36649, 'loss/train': 1.6880543231964111} -11/07/2021 02:23:39 - INFO - __main__ - Step 36651: {'lr': 0.0004353713648263816, 'samples': 7036992, 'steps': 36650, 'loss/train': 1.4583431482315063} -11/07/2021 02:23:40 - INFO - __main__ - Step 36652: {'lr': 0.00043536780412400857, 'samples': 7037184, 'steps': 36651, 'loss/train': 1.5300203561782837} -11/07/2021 02:23:40 - INFO - __main__ - Step 36653: {'lr': 0.0004353642433381117, 'samples': 7037376, 'steps': 36652, 'loss/train': 1.5487596988677979} -11/07/2021 02:23:41 - INFO - __main__ - Step 36654: {'lr': 0.00043536068246869254, 'samples': 7037568, 'steps': 36653, 'loss/train': 5.736063480377197} -11/07/2021 02:23:41 - INFO - __main__ - Step 36655: {'lr': 0.00043535712151575274, 'samples': 7037760, 'steps': 36654, 'loss/train': 1.9262999296188354} -11/07/2021 02:23:41 - INFO - __main__ - Step 36656: {'lr': 0.00043535356047929387, 'samples': 7037952, 'steps': 36655, 'loss/train': 1.262406826019287} -11/07/2021 02:23:42 - INFO - __main__ - Step 36657: {'lr': 0.0004353499993593176, 'samples': 7038144, 'steps': 36656, 'loss/train': 1.1855562925338745} -11/07/2021 02:23:43 - INFO - __main__ - Step 36658: {'lr': 0.0004353464381558254, 'samples': 7038336, 'steps': 36657, 'loss/train': 1.3844404220581055} -11/07/2021 02:23:43 - INFO - __main__ - Step 36659: {'lr': 0.00043534287686881895, 'samples': 7038528, 'steps': 36658, 'loss/train': 1.4972984790802002} -11/07/2021 02:23:43 - INFO - __main__ - Step 36660: {'lr': 0.00043533931549829993, 'samples': 7038720, 'steps': 36659, 'loss/train': 1.7652618885040283} -11/07/2021 02:23:44 - INFO - __main__ - Step 36661: {'lr': 0.00043533575404426986, 'samples': 7038912, 'steps': 36660, 'loss/train': 1.4423415660858154} -11/07/2021 02:23:44 - INFO - __main__ - Step 36662: {'lr': 0.0004353321925067303, 'samples': 7039104, 'steps': 36661, 'loss/train': 1.2279847860336304} -11/07/2021 02:23:45 - INFO - __main__ - Step 36663: {'lr': 0.0004353286308856829, 'samples': 7039296, 'steps': 36662, 'loss/train': 1.6344609260559082} -11/07/2021 02:23:45 - INFO - __main__ - Step 36664: {'lr': 0.00043532506918112933, 'samples': 7039488, 'steps': 36663, 'loss/train': 1.8688920736312866} -11/07/2021 02:23:46 - INFO - __main__ - Step 36665: {'lr': 0.0004353215073930712, 'samples': 7039680, 'steps': 36664, 'loss/train': 1.543150544166565} -11/07/2021 02:23:46 - INFO - __main__ - Step 36666: {'lr': 0.00043531794552150994, 'samples': 7039872, 'steps': 36665, 'loss/train': 1.6412619352340698} -11/07/2021 02:23:47 - INFO - __main__ - Step 36667: {'lr': 0.0004353143835664474, 'samples': 7040064, 'steps': 36666, 'loss/train': 1.6174161434173584} -11/07/2021 02:23:48 - INFO - __main__ - Step 36668: {'lr': 0.00043531082152788495, 'samples': 7040256, 'steps': 36667, 'loss/train': 0.18082042038440704} -11/07/2021 02:23:48 - INFO - __main__ - Step 36669: {'lr': 0.0004353072594058243, 'samples': 7040448, 'steps': 36668, 'loss/train': 1.6925253868103027} -11/07/2021 02:23:48 - INFO - __main__ - Step 36670: {'lr': 0.0004353036972002671, 'samples': 7040640, 'steps': 36669, 'loss/train': 2.6391284465789795} -11/07/2021 02:23:49 - INFO - __main__ - Step 36671: {'lr': 0.00043530013491121497, 'samples': 7040832, 'steps': 36670, 'loss/train': 1.4973509311676025} -11/07/2021 02:23:49 - INFO - __main__ - Step 36672: {'lr': 0.00043529657253866936, 'samples': 7041024, 'steps': 36671, 'loss/train': 1.5227664709091187} -11/07/2021 02:23:50 - INFO - __main__ - Step 36673: {'lr': 0.000435293010082632, 'samples': 7041216, 'steps': 36672, 'loss/train': 1.4857127666473389} -11/07/2021 02:23:50 - INFO - __main__ - Step 36674: {'lr': 0.0004352894475431045, 'samples': 7041408, 'steps': 36673, 'loss/train': 1.3619614839553833} -11/07/2021 02:23:51 - INFO - __main__ - Step 36675: {'lr': 0.0004352858849200885, 'samples': 7041600, 'steps': 36674, 'loss/train': 1.106205940246582} -11/07/2021 02:23:51 - INFO - __main__ - Step 36676: {'lr': 0.0004352823222135854, 'samples': 7041792, 'steps': 36675, 'loss/train': 0.8346518278121948} -11/07/2021 02:23:51 - INFO - __main__ - Step 36677: {'lr': 0.00043527875942359697, 'samples': 7041984, 'steps': 36676, 'loss/train': 1.895818829536438} -11/07/2021 02:23:52 - INFO - __main__ - Step 36678: {'lr': 0.0004352751965501248, 'samples': 7042176, 'steps': 36677, 'loss/train': 1.3899580240249634} -11/07/2021 02:23:53 - INFO - __main__ - Step 36679: {'lr': 0.0004352716335931706, 'samples': 7042368, 'steps': 36678, 'loss/train': 1.309022307395935} -11/07/2021 02:23:53 - INFO - __main__ - Step 36680: {'lr': 0.0004352680705527357, 'samples': 7042560, 'steps': 36679, 'loss/train': 1.7067924737930298} -11/07/2021 02:23:53 - INFO - __main__ - Step 36681: {'lr': 0.00043526450742882193, 'samples': 7042752, 'steps': 36680, 'loss/train': 1.3617024421691895} -11/07/2021 02:23:54 - INFO - __main__ - Step 36682: {'lr': 0.0004352609442214309, 'samples': 7042944, 'steps': 36681, 'loss/train': 1.5160088539123535} -11/07/2021 02:23:54 - INFO - __main__ - Step 36683: {'lr': 0.00043525738093056404, 'samples': 7043136, 'steps': 36682, 'loss/train': 1.2032099962234497} -11/07/2021 02:23:55 - INFO - __main__ - Step 36684: {'lr': 0.0004352538175562231, 'samples': 7043328, 'steps': 36683, 'loss/train': 1.4337596893310547} -11/07/2021 02:23:56 - INFO - __main__ - Step 36685: {'lr': 0.00043525025409840967, 'samples': 7043520, 'steps': 36684, 'loss/train': 1.725263237953186} -11/07/2021 02:23:56 - INFO - __main__ - Step 36686: {'lr': 0.00043524669055712534, 'samples': 7043712, 'steps': 36685, 'loss/train': 1.6312520503997803} -11/07/2021 02:23:56 - INFO - __main__ - Step 36687: {'lr': 0.00043524312693237166, 'samples': 7043904, 'steps': 36686, 'loss/train': 1.4041990041732788} -11/07/2021 02:23:57 - INFO - __main__ - Step 36688: {'lr': 0.0004352395632241504, 'samples': 7044096, 'steps': 36687, 'loss/train': 1.4240286350250244} -11/07/2021 02:23:58 - INFO - __main__ - Step 36689: {'lr': 0.00043523599943246297, 'samples': 7044288, 'steps': 36688, 'loss/train': 1.589342474937439} -11/07/2021 02:23:58 - INFO - __main__ - Step 36690: {'lr': 0.00043523243555731094, 'samples': 7044480, 'steps': 36689, 'loss/train': 1.670009732246399} -11/07/2021 02:23:58 - INFO - __main__ - Step 36691: {'lr': 0.00043522887159869617, 'samples': 7044672, 'steps': 36690, 'loss/train': 1.1319444179534912} -11/07/2021 02:23:59 - INFO - __main__ - Step 36692: {'lr': 0.00043522530755662017, 'samples': 7044864, 'steps': 36691, 'loss/train': 1.1176179647445679} -11/07/2021 02:23:59 - INFO - __main__ - Step 36693: {'lr': 0.00043522174343108445, 'samples': 7045056, 'steps': 36692, 'loss/train': 1.937666416168213} -11/07/2021 02:24:00 - INFO - __main__ - Step 36694: {'lr': 0.00043521817922209064, 'samples': 7045248, 'steps': 36693, 'loss/train': 1.047343134880066} -11/07/2021 02:24:00 - INFO - __main__ - Step 36695: {'lr': 0.00043521461492964037, 'samples': 7045440, 'steps': 36694, 'loss/train': 1.0359920263290405} -11/07/2021 02:24:01 - INFO - __main__ - Step 36696: {'lr': 0.00043521105055373526, 'samples': 7045632, 'steps': 36695, 'loss/train': 1.6470108032226562} -11/07/2021 02:24:01 - INFO - __main__ - Step 36697: {'lr': 0.000435207486094377, 'samples': 7045824, 'steps': 36696, 'loss/train': 1.8380084037780762} -11/07/2021 02:24:02 - INFO - __main__ - Step 36698: {'lr': 0.00043520392155156694, 'samples': 7046016, 'steps': 36697, 'loss/train': 1.2285186052322388} -11/07/2021 02:24:02 - INFO - __main__ - Step 36699: {'lr': 0.000435200356925307, 'samples': 7046208, 'steps': 36698, 'loss/train': 1.6174869537353516} -11/07/2021 02:24:04 - INFO - __main__ - Step 36700: {'lr': 0.0004351967922155986, 'samples': 7046400, 'steps': 36699, 'loss/train': 1.3436497449874878} -11/07/2021 02:24:04 - INFO - __main__ - Step 36701: {'lr': 0.0004351932274224434, 'samples': 7046592, 'steps': 36700, 'loss/train': 1.2693761587142944} -11/07/2021 02:24:04 - INFO - __main__ - Step 36702: {'lr': 0.0004351896625458429, 'samples': 7046784, 'steps': 36701, 'loss/train': 1.9657156467437744} -11/07/2021 02:24:05 - INFO - __main__ - Step 36703: {'lr': 0.0004351860975857989, 'samples': 7046976, 'steps': 36702, 'loss/train': 1.970827579498291} -11/07/2021 02:24:05 - INFO - __main__ - Step 36704: {'lr': 0.00043518253254231276, 'samples': 7047168, 'steps': 36703, 'loss/train': 2.3808977603912354} -11/07/2021 02:24:06 - INFO - __main__ - Step 36705: {'lr': 0.00043517896741538634, 'samples': 7047360, 'steps': 36704, 'loss/train': 1.3965660333633423} -11/07/2021 02:24:07 - INFO - __main__ - Step 36706: {'lr': 0.0004351754022050212, 'samples': 7047552, 'steps': 36705, 'loss/train': 1.7651844024658203} -11/07/2021 02:24:07 - INFO - __main__ - Step 36707: {'lr': 0.00043517183691121875, 'samples': 7047744, 'steps': 36706, 'loss/train': 1.3832669258117676} -11/07/2021 02:24:07 - INFO - __main__ - Step 36708: {'lr': 0.00043516827153398073, 'samples': 7047936, 'steps': 36707, 'loss/train': 1.2296851873397827} -11/07/2021 02:24:08 - INFO - __main__ - Step 36709: {'lr': 0.0004351647060733088, 'samples': 7048128, 'steps': 36708, 'loss/train': 1.5138906240463257} -11/07/2021 02:24:08 - INFO - __main__ - Step 36710: {'lr': 0.00043516114052920453, 'samples': 7048320, 'steps': 36709, 'loss/train': 1.4793736934661865} -11/07/2021 02:24:09 - INFO - __main__ - Step 36711: {'lr': 0.00043515757490166944, 'samples': 7048512, 'steps': 36710, 'loss/train': 1.8552041053771973} -11/07/2021 02:24:09 - INFO - __main__ - Step 36712: {'lr': 0.00043515400919070526, 'samples': 7048704, 'steps': 36711, 'loss/train': 1.8112801313400269} -11/07/2021 02:24:10 - INFO - __main__ - Step 36713: {'lr': 0.0004351504433963135, 'samples': 7048896, 'steps': 36712, 'loss/train': 1.026114583015442} -11/07/2021 02:24:10 - INFO - __main__ - Step 36714: {'lr': 0.0004351468775184959, 'samples': 7049088, 'steps': 36713, 'loss/train': 1.2794389724731445} -11/07/2021 02:24:11 - INFO - __main__ - Step 36715: {'lr': 0.0004351433115572538, 'samples': 7049280, 'steps': 36714, 'loss/train': 1.2215988636016846} -11/07/2021 02:24:11 - INFO - __main__ - Step 36716: {'lr': 0.00043513974551258913, 'samples': 7049472, 'steps': 36715, 'loss/train': 1.294337511062622} -11/07/2021 02:24:12 - INFO - __main__ - Step 36717: {'lr': 0.00043513617938450327, 'samples': 7049664, 'steps': 36716, 'loss/train': 0.6976569294929504} -11/07/2021 02:24:12 - INFO - __main__ - Step 36718: {'lr': 0.00043513261317299797, 'samples': 7049856, 'steps': 36717, 'loss/train': 1.472899317741394} -11/07/2021 02:24:13 - INFO - __main__ - Step 36719: {'lr': 0.00043512904687807475, 'samples': 7050048, 'steps': 36718, 'loss/train': 1.4063820838928223} -11/07/2021 02:24:13 - INFO - __main__ - Step 36720: {'lr': 0.00043512548049973523, 'samples': 7050240, 'steps': 36719, 'loss/train': 1.2921974658966064} -11/07/2021 02:24:13 - INFO - __main__ - Step 36721: {'lr': 0.00043512191403798095, 'samples': 7050432, 'steps': 36720, 'loss/train': 1.3332635164260864} -11/07/2021 02:24:14 - INFO - __main__ - Step 36722: {'lr': 0.0004351183474928137, 'samples': 7050624, 'steps': 36721, 'loss/train': 0.9220923185348511} -11/07/2021 02:24:15 - INFO - __main__ - Step 36723: {'lr': 0.00043511478086423493, 'samples': 7050816, 'steps': 36722, 'loss/train': 1.4664701223373413} -11/07/2021 02:24:15 - INFO - __main__ - Step 36724: {'lr': 0.0004351112141522463, 'samples': 7051008, 'steps': 36723, 'loss/train': 1.647239327430725} -11/07/2021 02:24:15 - INFO - __main__ - Step 36725: {'lr': 0.00043510764735684945, 'samples': 7051200, 'steps': 36724, 'loss/train': 1.5401238203048706} -11/07/2021 02:24:16 - INFO - __main__ - Step 36726: {'lr': 0.0004351040804780459, 'samples': 7051392, 'steps': 36725, 'loss/train': 1.699589490890503} -11/07/2021 02:24:17 - INFO - __main__ - Step 36727: {'lr': 0.00043510051351583733, 'samples': 7051584, 'steps': 36726, 'loss/train': 1.6409080028533936} -11/07/2021 02:24:17 - INFO - __main__ - Step 36728: {'lr': 0.0004350969464702254, 'samples': 7051776, 'steps': 36727, 'loss/train': 1.6988903284072876} -11/07/2021 02:24:17 - INFO - __main__ - Step 36729: {'lr': 0.0004350933793412115, 'samples': 7051968, 'steps': 36728, 'loss/train': 1.8149951696395874} -11/07/2021 02:24:18 - INFO - __main__ - Step 36730: {'lr': 0.00043508981212879737, 'samples': 7052160, 'steps': 36729, 'loss/train': 1.5463894605636597} -11/07/2021 02:24:18 - INFO - __main__ - Step 36731: {'lr': 0.0004350862448329848, 'samples': 7052352, 'steps': 36730, 'loss/train': 1.5224485397338867} -11/07/2021 02:24:19 - INFO - __main__ - Step 36732: {'lr': 0.00043508267745377504, 'samples': 7052544, 'steps': 36731, 'loss/train': 1.1639156341552734} -11/07/2021 02:24:19 - INFO - __main__ - Step 36733: {'lr': 0.00043507910999117003, 'samples': 7052736, 'steps': 36732, 'loss/train': 1.5083235502243042} -11/07/2021 02:24:20 - INFO - __main__ - Step 36734: {'lr': 0.00043507554244517113, 'samples': 7052928, 'steps': 36733, 'loss/train': 1.9087817668914795} -11/07/2021 02:24:20 - INFO - __main__ - Step 36735: {'lr': 0.0004350719748157801, 'samples': 7053120, 'steps': 36734, 'loss/train': 1.727805733680725} -11/07/2021 02:24:21 - INFO - __main__ - Step 36736: {'lr': 0.00043506840710299844, 'samples': 7053312, 'steps': 36735, 'loss/train': 1.4072787761688232} -11/07/2021 02:24:21 - INFO - __main__ - Step 36737: {'lr': 0.00043506483930682785, 'samples': 7053504, 'steps': 36736, 'loss/train': 1.6502940654754639} -11/07/2021 02:24:22 - INFO - __main__ - Step 36738: {'lr': 0.0004350612714272699, 'samples': 7053696, 'steps': 36737, 'loss/train': 1.123324990272522} -11/07/2021 02:24:22 - INFO - __main__ - Step 36739: {'lr': 0.0004350577034643262, 'samples': 7053888, 'steps': 36738, 'loss/train': 1.5874708890914917} -11/07/2021 02:24:23 - INFO - __main__ - Step 36740: {'lr': 0.0004350541354179983, 'samples': 7054080, 'steps': 36739, 'loss/train': 1.4291845560073853} -11/07/2021 02:24:23 - INFO - __main__ - Step 36741: {'lr': 0.00043505056728828794, 'samples': 7054272, 'steps': 36740, 'loss/train': 1.6307123899459839} -11/07/2021 02:24:23 - INFO - __main__ - Step 36742: {'lr': 0.0004350469990751966, 'samples': 7054464, 'steps': 36741, 'loss/train': 1.233171820640564} -11/07/2021 02:24:24 - INFO - __main__ - Step 36743: {'lr': 0.000435043430778726, 'samples': 7054656, 'steps': 36742, 'loss/train': 1.7694103717803955} -11/07/2021 02:24:25 - INFO - __main__ - Step 36744: {'lr': 0.00043503986239887765, 'samples': 7054848, 'steps': 36743, 'loss/train': 1.4569706916809082} -11/07/2021 02:24:25 - INFO - __main__ - Step 36745: {'lr': 0.0004350362939356532, 'samples': 7055040, 'steps': 36744, 'loss/train': 1.8365846872329712} -11/07/2021 02:24:25 - INFO - __main__ - Step 36746: {'lr': 0.00043503272538905423, 'samples': 7055232, 'steps': 36745, 'loss/train': 1.5790698528289795} -11/07/2021 02:24:26 - INFO - __main__ - Step 36747: {'lr': 0.0004350291567590824, 'samples': 7055424, 'steps': 36746, 'loss/train': 1.2959239482879639} -11/07/2021 02:24:27 - INFO - __main__ - Step 36748: {'lr': 0.00043502558804573924, 'samples': 7055616, 'steps': 36747, 'loss/train': 1.3608461618423462} -11/07/2021 02:24:27 - INFO - __main__ - Step 36749: {'lr': 0.0004350220192490264, 'samples': 7055808, 'steps': 36748, 'loss/train': 1.5675292015075684} -11/07/2021 02:24:28 - INFO - __main__ - Step 36750: {'lr': 0.00043501845036894555, 'samples': 7056000, 'steps': 36749, 'loss/train': 1.1520994901657104} -11/07/2021 02:24:28 - INFO - __main__ - Step 36751: {'lr': 0.00043501488140549824, 'samples': 7056192, 'steps': 36750, 'loss/train': 1.3899540901184082} -11/07/2021 02:24:28 - INFO - __main__ - Step 36752: {'lr': 0.000435011312358686, 'samples': 7056384, 'steps': 36751, 'loss/train': 1.8039408922195435} -11/07/2021 02:24:29 - INFO - __main__ - Step 36753: {'lr': 0.0004350077432285106, 'samples': 7056576, 'steps': 36752, 'loss/train': 1.3066352605819702} -11/07/2021 02:24:30 - INFO - __main__ - Step 36754: {'lr': 0.0004350041740149735, 'samples': 7056768, 'steps': 36753, 'loss/train': 1.5671954154968262} -11/07/2021 02:24:30 - INFO - __main__ - Step 36755: {'lr': 0.00043500060471807645, 'samples': 7056960, 'steps': 36754, 'loss/train': 1.3846319913864136} -11/07/2021 02:24:30 - INFO - __main__ - Step 36756: {'lr': 0.000434997035337821, 'samples': 7057152, 'steps': 36755, 'loss/train': 1.269380807876587} -11/07/2021 02:24:31 - INFO - __main__ - Step 36757: {'lr': 0.0004349934658742086, 'samples': 7057344, 'steps': 36756, 'loss/train': 1.081022024154663} -11/07/2021 02:24:31 - INFO - __main__ - Step 36758: {'lr': 0.00043498989632724105, 'samples': 7057536, 'steps': 36757, 'loss/train': 1.3352800607681274} -11/07/2021 02:24:32 - INFO - __main__ - Step 36759: {'lr': 0.00043498632669692, 'samples': 7057728, 'steps': 36758, 'loss/train': 1.6395902633666992} -11/07/2021 02:24:32 - INFO - __main__ - Step 36760: {'lr': 0.0004349827569832469, 'samples': 7057920, 'steps': 36759, 'loss/train': 1.2451893091201782} -11/07/2021 02:24:33 - INFO - __main__ - Step 36761: {'lr': 0.00043497918718622344, 'samples': 7058112, 'steps': 36760, 'loss/train': 1.2479592561721802} -11/07/2021 02:24:33 - INFO - __main__ - Step 36762: {'lr': 0.0004349756173058512, 'samples': 7058304, 'steps': 36761, 'loss/train': 1.8825902938842773} -11/07/2021 02:24:33 - INFO - __main__ - Step 36763: {'lr': 0.0004349720473421318, 'samples': 7058496, 'steps': 36762, 'loss/train': 1.6168584823608398} -11/07/2021 02:24:35 - INFO - __main__ - Step 36764: {'lr': 0.00043496847729506685, 'samples': 7058688, 'steps': 36763, 'loss/train': 0.8299821019172668} -11/07/2021 02:24:35 - INFO - __main__ - Step 36765: {'lr': 0.000434964907164658, 'samples': 7058880, 'steps': 36764, 'loss/train': 1.609496831893921} -11/07/2021 02:24:35 - INFO - __main__ - Step 36766: {'lr': 0.0004349613369509067, 'samples': 7059072, 'steps': 36765, 'loss/train': 1.9354546070098877} -11/07/2021 02:24:36 - INFO - __main__ - Step 36767: {'lr': 0.0004349577666538148, 'samples': 7059264, 'steps': 36766, 'loss/train': 1.339677333831787} -11/07/2021 02:24:36 - INFO - __main__ - Step 36768: {'lr': 0.0004349541962733837, 'samples': 7059456, 'steps': 36767, 'loss/train': 1.247060775756836} -11/07/2021 02:24:37 - INFO - __main__ - Step 36769: {'lr': 0.0004349506258096152, 'samples': 7059648, 'steps': 36768, 'loss/train': 1.4814777374267578} -11/07/2021 02:24:37 - INFO - __main__ - Step 36770: {'lr': 0.00043494705526251064, 'samples': 7059840, 'steps': 36769, 'loss/train': 1.7929636240005493} -11/07/2021 02:24:38 - INFO - __main__ - Step 36771: {'lr': 0.00043494348463207197, 'samples': 7060032, 'steps': 36770, 'loss/train': 1.7439746856689453} -11/07/2021 02:24:38 - INFO - __main__ - Step 36772: {'lr': 0.0004349399139183005, 'samples': 7060224, 'steps': 36771, 'loss/train': 1.70767080783844} -11/07/2021 02:24:38 - INFO - __main__ - Step 36773: {'lr': 0.000434936343121198, 'samples': 7060416, 'steps': 36772, 'loss/train': 1.3965067863464355} -11/07/2021 02:24:40 - INFO - __main__ - Step 36774: {'lr': 0.000434932772240766, 'samples': 7060608, 'steps': 36773, 'loss/train': 1.1901990175247192} -11/07/2021 02:24:40 - INFO - __main__ - Step 36775: {'lr': 0.0004349292012770062, 'samples': 7060800, 'steps': 36774, 'loss/train': 1.4630550146102905} -11/07/2021 02:24:40 - INFO - __main__ - Step 36776: {'lr': 0.00043492563022992013, 'samples': 7060992, 'steps': 36775, 'loss/train': 1.6922273635864258} -11/07/2021 02:24:41 - INFO - __main__ - Step 36777: {'lr': 0.00043492205909950943, 'samples': 7061184, 'steps': 36776, 'loss/train': 1.1019692420959473} -11/07/2021 02:24:41 - INFO - __main__ - Step 36778: {'lr': 0.0004349184878857757, 'samples': 7061376, 'steps': 36777, 'loss/train': 1.772645354270935} -11/07/2021 02:24:41 - INFO - __main__ - Step 36779: {'lr': 0.0004349149165887205, 'samples': 7061568, 'steps': 36778, 'loss/train': 1.589666485786438} -11/07/2021 02:24:42 - INFO - __main__ - Step 36780: {'lr': 0.0004349113452083456, 'samples': 7061760, 'steps': 36779, 'loss/train': 0.10330658406019211} -11/07/2021 02:24:43 - INFO - __main__ - Step 36781: {'lr': 0.00043490777374465244, 'samples': 7061952, 'steps': 36780, 'loss/train': 1.489288091659546} -11/07/2021 02:24:43 - INFO - __main__ - Step 36782: {'lr': 0.0004349042021976427, 'samples': 7062144, 'steps': 36781, 'loss/train': 1.6141446828842163} -11/07/2021 02:24:43 - INFO - __main__ - Step 36783: {'lr': 0.000434900630567318, 'samples': 7062336, 'steps': 36782, 'loss/train': 1.4311100244522095} -11/07/2021 02:24:44 - INFO - __main__ - Step 36784: {'lr': 0.00043489705885367986, 'samples': 7062528, 'steps': 36783, 'loss/train': 1.6908950805664062} -11/07/2021 02:24:45 - INFO - __main__ - Step 36785: {'lr': 0.00043489348705673, 'samples': 7062720, 'steps': 36784, 'loss/train': 1.6144988536834717} -11/07/2021 02:24:46 - INFO - __main__ - Step 36786: {'lr': 0.00043488991517647, 'samples': 7062912, 'steps': 36785, 'loss/train': 1.3355114459991455} -11/07/2021 02:24:46 - INFO - __main__ - Step 36787: {'lr': 0.00043488634321290146, 'samples': 7063104, 'steps': 36786, 'loss/train': 0.8564496636390686} -11/07/2021 02:24:46 - INFO - __main__ - Step 36788: {'lr': 0.000434882771166026, 'samples': 7063296, 'steps': 36787, 'loss/train': 1.6882917881011963} -11/07/2021 02:24:47 - INFO - __main__ - Step 36789: {'lr': 0.00043487919903584515, 'samples': 7063488, 'steps': 36788, 'loss/train': 2.0521750450134277} -11/07/2021 02:24:47 - INFO - __main__ - Step 36790: {'lr': 0.00043487562682236066, 'samples': 7063680, 'steps': 36789, 'loss/train': 1.1685245037078857} -11/07/2021 02:24:48 - INFO - __main__ - Step 36791: {'lr': 0.000434872054525574, 'samples': 7063872, 'steps': 36790, 'loss/train': 0.06848043948411942} -11/07/2021 02:24:48 - INFO - __main__ - Step 36792: {'lr': 0.00043486848214548693, 'samples': 7064064, 'steps': 36791, 'loss/train': 1.5211457014083862} -11/07/2021 02:24:49 - INFO - __main__ - Step 36793: {'lr': 0.0004348649096821009, 'samples': 7064256, 'steps': 36792, 'loss/train': 1.2461212873458862} -11/07/2021 02:24:49 - INFO - __main__ - Step 36794: {'lr': 0.0004348613371354176, 'samples': 7064448, 'steps': 36793, 'loss/train': 1.6461915969848633} -11/07/2021 02:24:49 - INFO - __main__ - Step 36795: {'lr': 0.0004348577645054387, 'samples': 7064640, 'steps': 36794, 'loss/train': 0.5114266276359558} -11/07/2021 02:24:51 - INFO - __main__ - Step 36796: {'lr': 0.0004348541917921657, 'samples': 7064832, 'steps': 36795, 'loss/train': 1.4484294652938843} -11/07/2021 02:24:51 - INFO - __main__ - Step 36797: {'lr': 0.0004348506189956002, 'samples': 7065024, 'steps': 36796, 'loss/train': 0.8689265251159668} -11/07/2021 02:24:51 - INFO - __main__ - Step 36798: {'lr': 0.0004348470461157439, 'samples': 7065216, 'steps': 36797, 'loss/train': 1.5061328411102295} -11/07/2021 02:24:52 - INFO - __main__ - Step 36799: {'lr': 0.0004348434731525984, 'samples': 7065408, 'steps': 36798, 'loss/train': 1.167148232460022} -11/07/2021 02:24:52 - INFO - __main__ - Step 36800: {'lr': 0.00043483990010616524, 'samples': 7065600, 'steps': 36799, 'loss/train': 1.0397213697433472} -11/07/2021 02:24:53 - INFO - __main__ - Step 36801: {'lr': 0.00043483632697644616, 'samples': 7065792, 'steps': 36800, 'loss/train': 1.305525779724121} -11/07/2021 02:24:53 - INFO - __main__ - Step 36802: {'lr': 0.00043483275376344257, 'samples': 7065984, 'steps': 36801, 'loss/train': 1.4266273975372314} -11/07/2021 02:24:54 - INFO - __main__ - Step 36803: {'lr': 0.00043482918046715627, 'samples': 7066176, 'steps': 36802, 'loss/train': 1.41310453414917} -11/07/2021 02:24:54 - INFO - __main__ - Step 36804: {'lr': 0.00043482560708758876, 'samples': 7066368, 'steps': 36803, 'loss/train': 1.4844629764556885} -11/07/2021 02:24:55 - INFO - __main__ - Step 36805: {'lr': 0.0004348220336247417, 'samples': 7066560, 'steps': 36804, 'loss/train': 1.1278146505355835} -11/07/2021 02:24:56 - INFO - __main__ - Step 36806: {'lr': 0.0004348184600786167, 'samples': 7066752, 'steps': 36805, 'loss/train': 1.7667964696884155} -11/07/2021 02:24:56 - INFO - __main__ - Step 36807: {'lr': 0.0004348148864492153, 'samples': 7066944, 'steps': 36806, 'loss/train': 1.5919344425201416} -11/07/2021 02:24:56 - INFO - __main__ - Step 36808: {'lr': 0.00043481131273653926, 'samples': 7067136, 'steps': 36807, 'loss/train': 1.6064618825912476} -11/07/2021 02:24:57 - INFO - __main__ - Step 36809: {'lr': 0.00043480773894059, 'samples': 7067328, 'steps': 36808, 'loss/train': 1.606161117553711} -11/07/2021 02:24:57 - INFO - __main__ - Step 36810: {'lr': 0.0004348041650613692, 'samples': 7067520, 'steps': 36809, 'loss/train': 1.257421851158142} -11/07/2021 02:24:57 - INFO - __main__ - Step 36811: {'lr': 0.0004348005910988786, 'samples': 7067712, 'steps': 36810, 'loss/train': 0.9066978096961975} -11/07/2021 02:24:58 - INFO - __main__ - Step 36812: {'lr': 0.0004347970170531197, 'samples': 7067904, 'steps': 36811, 'loss/train': 0.178208589553833} -11/07/2021 02:24:59 - INFO - __main__ - Step 36813: {'lr': 0.000434793442924094, 'samples': 7068096, 'steps': 36812, 'loss/train': 0.929162859916687} -11/07/2021 02:24:59 - INFO - __main__ - Step 36814: {'lr': 0.0004347898687118033, 'samples': 7068288, 'steps': 36813, 'loss/train': 0.5680878162384033} -11/07/2021 02:25:00 - INFO - __main__ - Step 36815: {'lr': 0.0004347862944162492, 'samples': 7068480, 'steps': 36814, 'loss/train': 1.6141563653945923} -11/07/2021 02:25:00 - INFO - __main__ - Step 36816: {'lr': 0.00043478272003743315, 'samples': 7068672, 'steps': 36815, 'loss/train': 1.3449026346206665} -11/07/2021 02:25:01 - INFO - __main__ - Step 36817: {'lr': 0.0004347791455753569, 'samples': 7068864, 'steps': 36816, 'loss/train': 1.3908735513687134} -11/07/2021 02:25:01 - INFO - __main__ - Step 36818: {'lr': 0.00043477557103002197, 'samples': 7069056, 'steps': 36817, 'loss/train': 1.5589827299118042} -11/07/2021 02:25:02 - INFO - __main__ - Step 36819: {'lr': 0.00043477199640143004, 'samples': 7069248, 'steps': 36818, 'loss/train': 1.72110116481781} -11/07/2021 02:25:02 - INFO - __main__ - Step 36820: {'lr': 0.00043476842168958276, 'samples': 7069440, 'steps': 36819, 'loss/train': 1.308180332183838} -11/07/2021 02:25:02 - INFO - __main__ - Step 36821: {'lr': 0.0004347648468944816, 'samples': 7069632, 'steps': 36820, 'loss/train': 1.819994568824768} -11/07/2021 02:25:04 - INFO - __main__ - Step 36822: {'lr': 0.0004347612720161283, 'samples': 7069824, 'steps': 36821, 'loss/train': 1.3080558776855469} -11/07/2021 02:25:04 - INFO - __main__ - Step 36823: {'lr': 0.00043475769705452437, 'samples': 7070016, 'steps': 36822, 'loss/train': 1.2287598848342896} -11/07/2021 02:25:04 - INFO - __main__ - Step 36824: {'lr': 0.00043475412200967155, 'samples': 7070208, 'steps': 36823, 'loss/train': 1.4287643432617188} -11/07/2021 02:25:05 - INFO - __main__ - Step 36825: {'lr': 0.00043475054688157136, 'samples': 7070400, 'steps': 36824, 'loss/train': 1.386857509613037} -11/07/2021 02:25:05 - INFO - __main__ - Step 36826: {'lr': 0.00043474697167022536, 'samples': 7070592, 'steps': 36825, 'loss/train': 1.217334270477295} -11/07/2021 02:25:06 - INFO - __main__ - Step 36827: {'lr': 0.0004347433963756353, 'samples': 7070784, 'steps': 36826, 'loss/train': 1.668638825416565} -11/07/2021 02:25:06 - INFO - __main__ - Step 36828: {'lr': 0.0004347398209978027, 'samples': 7070976, 'steps': 36827, 'loss/train': 1.6760013103485107} -11/07/2021 02:25:07 - INFO - __main__ - Step 36829: {'lr': 0.0004347362455367292, 'samples': 7071168, 'steps': 36828, 'loss/train': 1.2976011037826538} -11/07/2021 02:25:07 - INFO - __main__ - Step 36830: {'lr': 0.0004347326699924163, 'samples': 7071360, 'steps': 36829, 'loss/train': 1.2785390615463257} -11/07/2021 02:25:07 - INFO - __main__ - Step 36831: {'lr': 0.0004347290943648658, 'samples': 7071552, 'steps': 36830, 'loss/train': 1.8591219186782837} -11/07/2021 02:25:09 - INFO - __main__ - Step 36832: {'lr': 0.00043472551865407917, 'samples': 7071744, 'steps': 36831, 'loss/train': 1.2369974851608276} -11/07/2021 02:25:09 - INFO - __main__ - Step 36833: {'lr': 0.0004347219428600581, 'samples': 7071936, 'steps': 36832, 'loss/train': 1.2083044052124023} -11/07/2021 02:25:09 - INFO - __main__ - Step 36834: {'lr': 0.0004347183669828042, 'samples': 7072128, 'steps': 36833, 'loss/train': 0.12292854487895966} -11/07/2021 02:25:10 - INFO - __main__ - Step 36835: {'lr': 0.00043471479102231904, 'samples': 7072320, 'steps': 36834, 'loss/train': 1.0675302743911743} -11/07/2021 02:25:10 - INFO - __main__ - Step 36836: {'lr': 0.0004347112149786042, 'samples': 7072512, 'steps': 36835, 'loss/train': 1.5071020126342773} -11/07/2021 02:25:11 - INFO - __main__ - Step 36837: {'lr': 0.0004347076388516614, 'samples': 7072704, 'steps': 36836, 'loss/train': 1.4102238416671753} -11/07/2021 02:25:11 - INFO - __main__ - Step 36838: {'lr': 0.00043470406264149215, 'samples': 7072896, 'steps': 36837, 'loss/train': 1.6307144165039062} -11/07/2021 02:25:12 - INFO - __main__ - Step 36839: {'lr': 0.00043470048634809813, 'samples': 7073088, 'steps': 36838, 'loss/train': 1.3599307537078857} -11/07/2021 02:25:12 - INFO - __main__ - Step 36840: {'lr': 0.00043469690997148086, 'samples': 7073280, 'steps': 36839, 'loss/train': 2.168046474456787} -11/07/2021 02:25:12 - INFO - __main__ - Step 36841: {'lr': 0.00043469333351164207, 'samples': 7073472, 'steps': 36840, 'loss/train': 1.3043498992919922} -11/07/2021 02:25:13 - INFO - __main__ - Step 36842: {'lr': 0.0004346897569685833, 'samples': 7073664, 'steps': 36841, 'loss/train': 1.4920456409454346} -11/07/2021 02:25:14 - INFO - __main__ - Step 36843: {'lr': 0.00043468618034230613, 'samples': 7073856, 'steps': 36842, 'loss/train': 1.8202351331710815} -11/07/2021 02:25:14 - INFO - __main__ - Step 36844: {'lr': 0.00043468260363281234, 'samples': 7074048, 'steps': 36843, 'loss/train': 1.4558583498001099} -11/07/2021 02:25:14 - INFO - __main__ - Step 36845: {'lr': 0.0004346790268401033, 'samples': 7074240, 'steps': 36844, 'loss/train': 2.1799943447113037} -11/07/2021 02:25:15 - INFO - __main__ - Step 36846: {'lr': 0.00043467544996418075, 'samples': 7074432, 'steps': 36845, 'loss/train': 1.497530221939087} -11/07/2021 02:25:16 - INFO - __main__ - Step 36847: {'lr': 0.0004346718730050463, 'samples': 7074624, 'steps': 36846, 'loss/train': 2.035320997238159} -11/07/2021 02:25:16 - INFO - __main__ - Step 36848: {'lr': 0.0004346682959627016, 'samples': 7074816, 'steps': 36847, 'loss/train': 1.273651361465454} -11/07/2021 02:25:17 - INFO - __main__ - Step 36849: {'lr': 0.0004346647188371482, 'samples': 7075008, 'steps': 36848, 'loss/train': 1.195306658744812} -11/07/2021 02:25:17 - INFO - __main__ - Step 36850: {'lr': 0.00043466114162838765, 'samples': 7075200, 'steps': 36849, 'loss/train': 1.5177725553512573} -11/07/2021 02:25:17 - INFO - __main__ - Step 36851: {'lr': 0.00043465756433642175, 'samples': 7075392, 'steps': 36850, 'loss/train': 1.799225091934204} -11/07/2021 02:25:18 - INFO - __main__ - Step 36852: {'lr': 0.0004346539869612519, 'samples': 7075584, 'steps': 36851, 'loss/train': 1.2354676723480225} -11/07/2021 02:25:19 - INFO - __main__ - Step 36853: {'lr': 0.0004346504095028799, 'samples': 7075776, 'steps': 36852, 'loss/train': 0.6996008157730103} -11/07/2021 02:25:19 - INFO - __main__ - Step 36854: {'lr': 0.00043464683196130726, 'samples': 7075968, 'steps': 36853, 'loss/train': 1.5860463380813599} -11/07/2021 02:25:19 - INFO - __main__ - Step 36855: {'lr': 0.00043464325433653563, 'samples': 7076160, 'steps': 36854, 'loss/train': 1.1152883768081665} -11/07/2021 02:25:20 - INFO - __main__ - Step 36856: {'lr': 0.0004346396766285665, 'samples': 7076352, 'steps': 36855, 'loss/train': 1.8893579244613647} -11/07/2021 02:25:20 - INFO - __main__ - Step 36857: {'lr': 0.0004346360988374016, 'samples': 7076544, 'steps': 36856, 'loss/train': 1.0569288730621338} -11/07/2021 02:25:21 - INFO - __main__ - Step 36858: {'lr': 0.0004346325209630426, 'samples': 7076736, 'steps': 36857, 'loss/train': 1.5878360271453857} -11/07/2021 02:25:22 - INFO - __main__ - Step 36859: {'lr': 0.00043462894300549097, 'samples': 7076928, 'steps': 36858, 'loss/train': 1.5616737604141235} -11/07/2021 02:25:22 - INFO - __main__ - Step 36860: {'lr': 0.0004346253649647485, 'samples': 7077120, 'steps': 36859, 'loss/train': 1.5420434474945068} -11/07/2021 02:25:22 - INFO - __main__ - Step 36861: {'lr': 0.00043462178684081657, 'samples': 7077312, 'steps': 36860, 'loss/train': 1.1887201070785522} -11/07/2021 02:25:23 - INFO - __main__ - Step 36862: {'lr': 0.00043461820863369697, 'samples': 7077504, 'steps': 36861, 'loss/train': 1.6546112298965454} -11/07/2021 02:25:24 - INFO - __main__ - Step 36863: {'lr': 0.0004346146303433912, 'samples': 7077696, 'steps': 36862, 'loss/train': 1.3106971979141235} -11/07/2021 02:25:24 - INFO - __main__ - Step 36864: {'lr': 0.00043461105196990093, 'samples': 7077888, 'steps': 36863, 'loss/train': 1.595474123954773} -11/07/2021 02:25:24 - INFO - __main__ - Step 36865: {'lr': 0.0004346074735132278, 'samples': 7078080, 'steps': 36864, 'loss/train': 0.924349844455719} -11/07/2021 02:25:25 - INFO - __main__ - Step 36866: {'lr': 0.0004346038949733734, 'samples': 7078272, 'steps': 36865, 'loss/train': 1.4717979431152344} -11/07/2021 02:25:25 - INFO - __main__ - Step 36867: {'lr': 0.0004346003163503393, 'samples': 7078464, 'steps': 36866, 'loss/train': 1.654711365699768} -11/07/2021 02:25:26 - INFO - __main__ - Step 36868: {'lr': 0.00043459673764412713, 'samples': 7078656, 'steps': 36867, 'loss/train': 1.5710206031799316} -11/07/2021 02:25:26 - INFO - __main__ - Step 36869: {'lr': 0.0004345931588547386, 'samples': 7078848, 'steps': 36868, 'loss/train': 1.3123658895492554} -11/07/2021 02:25:27 - INFO - __main__ - Step 36870: {'lr': 0.00043458957998217517, 'samples': 7079040, 'steps': 36869, 'loss/train': 0.5438855290412903} -11/07/2021 02:25:27 - INFO - __main__ - Step 36871: {'lr': 0.0004345860010264385, 'samples': 7079232, 'steps': 36870, 'loss/train': 1.6957143545150757} -11/07/2021 02:25:27 - INFO - __main__ - Step 36872: {'lr': 0.00043458242198753035, 'samples': 7079424, 'steps': 36871, 'loss/train': 1.5708094835281372} -11/07/2021 02:25:28 - INFO - __main__ - Step 36873: {'lr': 0.00043457884286545216, 'samples': 7079616, 'steps': 36872, 'loss/train': 1.5407085418701172} -11/07/2021 02:25:29 - INFO - __main__ - Step 36874: {'lr': 0.0004345752636602055, 'samples': 7079808, 'steps': 36873, 'loss/train': 0.5413639545440674} -11/07/2021 02:25:29 - INFO - __main__ - Step 36875: {'lr': 0.00043457168437179217, 'samples': 7080000, 'steps': 36874, 'loss/train': 1.3550437688827515} -11/07/2021 02:25:30 - INFO - __main__ - Step 36876: {'lr': 0.00043456810500021363, 'samples': 7080192, 'steps': 36875, 'loss/train': 1.5162456035614014} -11/07/2021 02:25:30 - INFO - __main__ - Step 36877: {'lr': 0.00043456452554547153, 'samples': 7080384, 'steps': 36876, 'loss/train': 1.5580357313156128} -11/07/2021 02:25:30 - INFO - __main__ - Step 36878: {'lr': 0.0004345609460075676, 'samples': 7080576, 'steps': 36877, 'loss/train': 1.3629759550094604} -11/07/2021 02:25:31 - INFO - __main__ - Step 36879: {'lr': 0.00043455736638650335, 'samples': 7080768, 'steps': 36878, 'loss/train': 1.707269310951233} -11/07/2021 02:25:32 - INFO - __main__ - Step 36880: {'lr': 0.0004345537866822803, 'samples': 7080960, 'steps': 36879, 'loss/train': 1.4857181310653687} -11/07/2021 02:25:32 - INFO - __main__ - Step 36881: {'lr': 0.0004345502068949002, 'samples': 7081152, 'steps': 36880, 'loss/train': 0.4709186255931854} -11/07/2021 02:25:32 - INFO - __main__ - Step 36882: {'lr': 0.0004345466270243646, 'samples': 7081344, 'steps': 36881, 'loss/train': 1.5124123096466064} -11/07/2021 02:25:33 - INFO - __main__ - Step 36883: {'lr': 0.0004345430470706753, 'samples': 7081536, 'steps': 36882, 'loss/train': 1.4317415952682495} -11/07/2021 02:25:34 - INFO - __main__ - Step 36884: {'lr': 0.00043453946703383354, 'samples': 7081728, 'steps': 36883, 'loss/train': 1.5005035400390625} -11/07/2021 02:25:34 - INFO - __main__ - Step 36885: {'lr': 0.00043453588691384125, 'samples': 7081920, 'steps': 36884, 'loss/train': 1.4188697338104248} -11/07/2021 02:25:34 - INFO - __main__ - Step 36886: {'lr': 0.0004345323067106999, 'samples': 7082112, 'steps': 36885, 'loss/train': 1.356079339981079} -11/07/2021 02:25:35 - INFO - __main__ - Step 36887: {'lr': 0.00043452872642441124, 'samples': 7082304, 'steps': 36886, 'loss/train': 1.3987716436386108} -11/07/2021 02:25:35 - INFO - __main__ - Step 36888: {'lr': 0.0004345251460549766, 'samples': 7082496, 'steps': 36887, 'loss/train': 1.269465684890747} -11/07/2021 02:25:36 - INFO - __main__ - Step 36889: {'lr': 0.0004345215656023979, 'samples': 7082688, 'steps': 36888, 'loss/train': 1.5068018436431885} -11/07/2021 02:25:36 - INFO - __main__ - Step 36890: {'lr': 0.0004345179850666766, 'samples': 7082880, 'steps': 36889, 'loss/train': 0.7879098057746887} -11/07/2021 02:25:37 - INFO - __main__ - Step 36891: {'lr': 0.0004345144044478144, 'samples': 7083072, 'steps': 36890, 'loss/train': 1.3742188215255737} -11/07/2021 02:25:37 - INFO - __main__ - Step 36892: {'lr': 0.0004345108237458128, 'samples': 7083264, 'steps': 36891, 'loss/train': 1.10400390625} -11/07/2021 02:25:38 - INFO - __main__ - Step 36893: {'lr': 0.00043450724296067344, 'samples': 7083456, 'steps': 36892, 'loss/train': 1.1535897254943848} -11/07/2021 02:25:39 - INFO - __main__ - Step 36894: {'lr': 0.00043450366209239803, 'samples': 7083648, 'steps': 36893, 'loss/train': 2.1971640586853027} -11/07/2021 02:25:39 - INFO - __main__ - Step 36895: {'lr': 0.0004345000811409881, 'samples': 7083840, 'steps': 36894, 'loss/train': 1.6039793491363525} -11/07/2021 02:25:39 - INFO - __main__ - Step 36896: {'lr': 0.0004344965001064453, 'samples': 7084032, 'steps': 36895, 'loss/train': 1.6271588802337646} -11/07/2021 02:25:40 - INFO - __main__ - Step 36897: {'lr': 0.0004344929189887712, 'samples': 7084224, 'steps': 36896, 'loss/train': 1.7677448987960815} -11/07/2021 02:25:40 - INFO - __main__ - Step 36898: {'lr': 0.0004344893377879674, 'samples': 7084416, 'steps': 36897, 'loss/train': 1.7011865377426147} -11/07/2021 02:25:40 - INFO - __main__ - Step 36899: {'lr': 0.00043448575650403555, 'samples': 7084608, 'steps': 36898, 'loss/train': 1.2332217693328857} -11/07/2021 02:25:41 - INFO - __main__ - Step 36900: {'lr': 0.00043448217513697727, 'samples': 7084800, 'steps': 36899, 'loss/train': 1.2743849754333496} -11/07/2021 02:25:42 - INFO - __main__ - Step 36901: {'lr': 0.0004344785936867942, 'samples': 7084992, 'steps': 36900, 'loss/train': 1.7653430700302124} -11/07/2021 02:25:42 - INFO - __main__ - Step 36902: {'lr': 0.00043447501215348794, 'samples': 7085184, 'steps': 36901, 'loss/train': 1.8011488914489746} -11/07/2021 02:25:43 - INFO - __main__ - Step 36903: {'lr': 0.00043447143053706007, 'samples': 7085376, 'steps': 36902, 'loss/train': 0.938480794429779} -11/07/2021 02:25:43 - INFO - __main__ - Step 36904: {'lr': 0.00043446784883751223, 'samples': 7085568, 'steps': 36903, 'loss/train': 1.3846172094345093} -11/07/2021 02:25:44 - INFO - __main__ - Step 36905: {'lr': 0.000434464267054846, 'samples': 7085760, 'steps': 36904, 'loss/train': 1.6487951278686523} -11/07/2021 02:25:44 - INFO - __main__ - Step 36906: {'lr': 0.000434460685189063, 'samples': 7085952, 'steps': 36905, 'loss/train': 1.008130431175232} -11/07/2021 02:25:45 - INFO - __main__ - Step 36907: {'lr': 0.0004344571032401649, 'samples': 7086144, 'steps': 36906, 'loss/train': 1.8134862184524536} -11/07/2021 02:25:45 - INFO - __main__ - Step 36908: {'lr': 0.0004344535212081533, 'samples': 7086336, 'steps': 36907, 'loss/train': 1.481315016746521} -11/07/2021 02:25:45 - INFO - __main__ - Step 36909: {'lr': 0.0004344499390930298, 'samples': 7086528, 'steps': 36908, 'loss/train': 1.0674848556518555} -11/07/2021 02:25:46 - INFO - __main__ - Step 36910: {'lr': 0.0004344463568947959, 'samples': 7086720, 'steps': 36909, 'loss/train': 1.404719591140747} -11/07/2021 02:25:47 - INFO - __main__ - Step 36911: {'lr': 0.0004344427746134534, 'samples': 7086912, 'steps': 36910, 'loss/train': 1.7163230180740356} -11/07/2021 02:25:47 - INFO - __main__ - Step 36912: {'lr': 0.0004344391922490037, 'samples': 7087104, 'steps': 36911, 'loss/train': 1.4719501733779907} -11/07/2021 02:25:47 - INFO - __main__ - Step 36913: {'lr': 0.0004344356098014487, 'samples': 7087296, 'steps': 36912, 'loss/train': 1.7014365196228027} -11/07/2021 02:25:48 - INFO - __main__ - Step 36914: {'lr': 0.0004344320272707898, 'samples': 7087488, 'steps': 36913, 'loss/train': 0.6131091713905334} -11/07/2021 02:25:49 - INFO - __main__ - Step 36915: {'lr': 0.0004344284446570287, 'samples': 7087680, 'steps': 36914, 'loss/train': 1.565171480178833} -11/07/2021 02:25:49 - INFO - __main__ - Step 36916: {'lr': 0.00043442486196016697, 'samples': 7087872, 'steps': 36915, 'loss/train': 1.4022310972213745} -11/07/2021 02:25:49 - INFO - __main__ - Step 36917: {'lr': 0.00043442127918020624, 'samples': 7088064, 'steps': 36916, 'loss/train': 1.5596140623092651} -11/07/2021 02:25:50 - INFO - __main__ - Step 36918: {'lr': 0.00043441769631714813, 'samples': 7088256, 'steps': 36917, 'loss/train': 1.1450285911560059} -11/07/2021 02:25:50 - INFO - __main__ - Step 36919: {'lr': 0.0004344141133709943, 'samples': 7088448, 'steps': 36918, 'loss/train': 1.3123325109481812} -11/07/2021 02:25:51 - INFO - __main__ - Step 36920: {'lr': 0.00043441053034174625, 'samples': 7088640, 'steps': 36919, 'loss/train': 1.5261822938919067} -11/07/2021 02:25:52 - INFO - __main__ - Step 36921: {'lr': 0.00043440694722940567, 'samples': 7088832, 'steps': 36920, 'loss/train': 1.166629672050476} -11/07/2021 02:25:52 - INFO - __main__ - Step 36922: {'lr': 0.00043440336403397417, 'samples': 7089024, 'steps': 36921, 'loss/train': 1.3760560750961304} -11/07/2021 02:25:52 - INFO - __main__ - Step 36923: {'lr': 0.00043439978075545337, 'samples': 7089216, 'steps': 36922, 'loss/train': 1.4996906518936157} -11/07/2021 02:25:53 - INFO - __main__ - Step 36924: {'lr': 0.0004343961973938449, 'samples': 7089408, 'steps': 36923, 'loss/train': 1.2339190244674683} -11/07/2021 02:25:54 - INFO - __main__ - Step 36925: {'lr': 0.00043439261394915033, 'samples': 7089600, 'steps': 36924, 'loss/train': 1.7183473110198975} -11/07/2021 02:25:54 - INFO - __main__ - Step 36926: {'lr': 0.0004343890304213713, 'samples': 7089792, 'steps': 36925, 'loss/train': 1.4664045572280884} -11/07/2021 02:25:54 - INFO - __main__ - Step 36927: {'lr': 0.0004343854468105094, 'samples': 7089984, 'steps': 36926, 'loss/train': 1.5949413776397705} -11/07/2021 02:25:55 - INFO - __main__ - Step 36928: {'lr': 0.00043438186311656624, 'samples': 7090176, 'steps': 36927, 'loss/train': 1.6770905256271362} -11/07/2021 02:25:55 - INFO - __main__ - Step 36929: {'lr': 0.0004343782793395435, 'samples': 7090368, 'steps': 36928, 'loss/train': 1.344126582145691} -11/07/2021 02:25:56 - INFO - __main__ - Step 36930: {'lr': 0.00043437469547944277, 'samples': 7090560, 'steps': 36929, 'loss/train': 1.7253801822662354} -11/07/2021 02:25:56 - INFO - __main__ - Step 36931: {'lr': 0.0004343711115362656, 'samples': 7090752, 'steps': 36930, 'loss/train': 1.561821460723877} -11/07/2021 02:25:57 - INFO - __main__ - Step 36932: {'lr': 0.00043436752751001365, 'samples': 7090944, 'steps': 36931, 'loss/train': 1.4372137784957886} -11/07/2021 02:25:57 - INFO - __main__ - Step 36933: {'lr': 0.0004343639434006885, 'samples': 7091136, 'steps': 36932, 'loss/train': 1.7856611013412476} -11/07/2021 02:25:57 - INFO - __main__ - Step 36934: {'lr': 0.00043436035920829186, 'samples': 7091328, 'steps': 36933, 'loss/train': 1.2089636325836182} -11/07/2021 02:25:58 - INFO - __main__ - Step 36935: {'lr': 0.0004343567749328253, 'samples': 7091520, 'steps': 36934, 'loss/train': 1.7776851654052734} -11/07/2021 02:25:59 - INFO - __main__ - Step 36936: {'lr': 0.00043435319057429046, 'samples': 7091712, 'steps': 36935, 'loss/train': 1.6643397808074951} -11/07/2021 02:25:59 - INFO - __main__ - Step 36937: {'lr': 0.0004343496061326888, 'samples': 7091904, 'steps': 36936, 'loss/train': 1.0694328546524048} -11/07/2021 02:26:00 - INFO - __main__ - Step 36938: {'lr': 0.0004343460216080221, 'samples': 7092096, 'steps': 36937, 'loss/train': 1.3263893127441406} -11/07/2021 02:26:00 - INFO - __main__ - Step 36939: {'lr': 0.00043434243700029196, 'samples': 7092288, 'steps': 36938, 'loss/train': 0.12158344686031342} -11/07/2021 02:26:00 - INFO - __main__ - Step 36940: {'lr': 0.0004343388523095, 'samples': 7092480, 'steps': 36939, 'loss/train': 0.7859086394309998} -11/07/2021 02:26:01 - INFO - __main__ - Step 36941: {'lr': 0.00043433526753564766, 'samples': 7092672, 'steps': 36940, 'loss/train': 1.9187930822372437} -11/07/2021 02:26:02 - INFO - __main__ - Step 36942: {'lr': 0.00043433168267873677, 'samples': 7092864, 'steps': 36941, 'loss/train': 1.7053115367889404} -11/07/2021 02:26:02 - INFO - __main__ - Step 36943: {'lr': 0.0004343280977387689, 'samples': 7093056, 'steps': 36942, 'loss/train': 1.142830729484558} -11/07/2021 02:26:02 - INFO - __main__ - Step 36944: {'lr': 0.0004343245127157456, 'samples': 7093248, 'steps': 36943, 'loss/train': 1.1533764600753784} -11/07/2021 02:26:03 - INFO - __main__ - Step 36945: {'lr': 0.0004343209276096686, 'samples': 7093440, 'steps': 36944, 'loss/train': 1.976108431816101} -11/07/2021 02:26:04 - INFO - __main__ - Step 36946: {'lr': 0.00043431734242053933, 'samples': 7093632, 'steps': 36945, 'loss/train': 1.3674890995025635} -11/07/2021 02:26:04 - INFO - __main__ - Step 36947: {'lr': 0.0004343137571483595, 'samples': 7093824, 'steps': 36946, 'loss/train': 1.2369861602783203} -11/07/2021 02:26:05 - INFO - __main__ - Step 36948: {'lr': 0.00043431017179313075, 'samples': 7094016, 'steps': 36947, 'loss/train': 1.1444861888885498} -11/07/2021 02:26:05 - INFO - __main__ - Step 36949: {'lr': 0.0004343065863548548, 'samples': 7094208, 'steps': 36948, 'loss/train': 1.6003363132476807} -11/07/2021 02:26:05 - INFO - __main__ - Step 36950: {'lr': 0.000434303000833533, 'samples': 7094400, 'steps': 36949, 'loss/train': 1.830175757408142} -11/07/2021 02:26:06 - INFO - __main__ - Step 36951: {'lr': 0.00043429941522916715, 'samples': 7094592, 'steps': 36950, 'loss/train': 1.4522465467453003} -11/07/2021 02:26:07 - INFO - __main__ - Step 36952: {'lr': 0.0004342958295417588, 'samples': 7094784, 'steps': 36951, 'loss/train': 1.5480337142944336} -11/07/2021 02:26:07 - INFO - __main__ - Step 36953: {'lr': 0.00043429224377130964, 'samples': 7094976, 'steps': 36952, 'loss/train': 1.239585041999817} -11/07/2021 02:26:07 - INFO - __main__ - Step 36954: {'lr': 0.00043428865791782126, 'samples': 7095168, 'steps': 36953, 'loss/train': 1.5699453353881836} -11/07/2021 02:26:08 - INFO - __main__ - Step 36955: {'lr': 0.0004342850719812952, 'samples': 7095360, 'steps': 36954, 'loss/train': 5.742282390594482} -11/07/2021 02:26:08 - INFO - __main__ - Step 36956: {'lr': 0.00043428148596173316, 'samples': 7095552, 'steps': 36955, 'loss/train': 1.2339860200881958} -11/07/2021 02:26:09 - INFO - __main__ - Step 36957: {'lr': 0.00043427789985913675, 'samples': 7095744, 'steps': 36956, 'loss/train': 1.3179750442504883} -11/07/2021 02:26:10 - INFO - __main__ - Step 36958: {'lr': 0.00043427431367350753, 'samples': 7095936, 'steps': 36957, 'loss/train': 3.1354281902313232} -11/07/2021 02:26:10 - INFO - __main__ - Step 36959: {'lr': 0.0004342707274048472, 'samples': 7096128, 'steps': 36958, 'loss/train': 1.6288416385650635} -11/07/2021 02:26:10 - INFO - __main__ - Step 36960: {'lr': 0.0004342671410531572, 'samples': 7096320, 'steps': 36959, 'loss/train': 1.7127184867858887} -11/07/2021 02:26:11 - INFO - __main__ - Step 36961: {'lr': 0.00043426355461843934, 'samples': 7096512, 'steps': 36960, 'loss/train': 1.260001540184021} -11/07/2021 02:26:12 - INFO - __main__ - Step 36962: {'lr': 0.00043425996810069525, 'samples': 7096704, 'steps': 36961, 'loss/train': 0.8840351104736328} -11/07/2021 02:26:12 - INFO - __main__ - Step 36963: {'lr': 0.0004342563814999264, 'samples': 7096896, 'steps': 36962, 'loss/train': 1.4114840030670166} -11/07/2021 02:26:12 - INFO - __main__ - Step 36964: {'lr': 0.0004342527948161344, 'samples': 7097088, 'steps': 36963, 'loss/train': 1.3243039846420288} -11/07/2021 02:26:13 - INFO - __main__ - Step 36965: {'lr': 0.000434249208049321, 'samples': 7097280, 'steps': 36964, 'loss/train': 1.5644744634628296} -11/07/2021 02:26:13 - INFO - __main__ - Step 36966: {'lr': 0.0004342456211994877, 'samples': 7097472, 'steps': 36965, 'loss/train': 1.495862603187561} -11/07/2021 02:26:14 - INFO - __main__ - Step 36967: {'lr': 0.00043424203426663623, 'samples': 7097664, 'steps': 36966, 'loss/train': 0.9820639491081238} -11/07/2021 02:26:14 - INFO - __main__ - Step 36968: {'lr': 0.0004342384472507681, 'samples': 7097856, 'steps': 36967, 'loss/train': 2.0179545879364014} -11/07/2021 02:26:15 - INFO - __main__ - Step 36969: {'lr': 0.00043423486015188497, 'samples': 7098048, 'steps': 36968, 'loss/train': 1.4496098756790161} -11/07/2021 02:26:15 - INFO - __main__ - Step 36970: {'lr': 0.00043423127296998845, 'samples': 7098240, 'steps': 36969, 'loss/train': 1.783840298652649} -11/07/2021 02:26:15 - INFO - __main__ - Step 36971: {'lr': 0.0004342276857050802, 'samples': 7098432, 'steps': 36970, 'loss/train': 1.8025826215744019} -11/07/2021 02:26:16 - INFO - __main__ - Step 36972: {'lr': 0.00043422409835716175, 'samples': 7098624, 'steps': 36971, 'loss/train': 1.6911512613296509} -11/07/2021 02:26:17 - INFO - __main__ - Step 36973: {'lr': 0.00043422051092623483, 'samples': 7098816, 'steps': 36972, 'loss/train': 1.4299386739730835} -11/07/2021 02:26:17 - INFO - __main__ - Step 36974: {'lr': 0.0004342169234123009, 'samples': 7099008, 'steps': 36973, 'loss/train': 1.6480128765106201} -11/07/2021 02:26:18 - INFO - __main__ - Step 36975: {'lr': 0.0004342133358153617, 'samples': 7099200, 'steps': 36974, 'loss/train': 1.752324104309082} -11/07/2021 02:26:18 - INFO - __main__ - Step 36976: {'lr': 0.0004342097481354189, 'samples': 7099392, 'steps': 36975, 'loss/train': 1.761583685874939} -11/07/2021 02:26:19 - INFO - __main__ - Step 36977: {'lr': 0.00043420616037247395, 'samples': 7099584, 'steps': 36976, 'loss/train': 1.5475198030471802} -11/07/2021 02:26:19 - INFO - __main__ - Step 36978: {'lr': 0.0004342025725265285, 'samples': 7099776, 'steps': 36977, 'loss/train': 1.5415979623794556} -11/07/2021 02:26:20 - INFO - __main__ - Step 36979: {'lr': 0.00043419898459758435, 'samples': 7099968, 'steps': 36978, 'loss/train': 1.387312889099121} -11/07/2021 02:26:20 - INFO - __main__ - Step 36980: {'lr': 0.00043419539658564286, 'samples': 7100160, 'steps': 36979, 'loss/train': 1.094067931175232} -11/07/2021 02:26:20 - INFO - __main__ - Step 36981: {'lr': 0.0004341918084907058, 'samples': 7100352, 'steps': 36980, 'loss/train': 2.066326379776001} -11/07/2021 02:26:21 - INFO - __main__ - Step 36982: {'lr': 0.0004341882203127747, 'samples': 7100544, 'steps': 36981, 'loss/train': 1.1311571598052979} -11/07/2021 02:26:22 - INFO - __main__ - Step 36983: {'lr': 0.00043418463205185134, 'samples': 7100736, 'steps': 36982, 'loss/train': 1.410170555114746} -11/07/2021 02:26:22 - INFO - __main__ - Step 36984: {'lr': 0.0004341810437079372, 'samples': 7100928, 'steps': 36983, 'loss/train': 1.2440638542175293} -11/07/2021 02:26:22 - INFO - __main__ - Step 36985: {'lr': 0.0004341774552810339, 'samples': 7101120, 'steps': 36984, 'loss/train': 0.09527873247861862} -11/07/2021 02:26:23 - INFO - __main__ - Step 36986: {'lr': 0.0004341738667711431, 'samples': 7101312, 'steps': 36985, 'loss/train': 1.8854491710662842} -11/07/2021 02:26:23 - INFO - __main__ - Step 36987: {'lr': 0.0004341702781782664, 'samples': 7101504, 'steps': 36986, 'loss/train': 1.4928325414657593} -11/07/2021 02:26:24 - INFO - __main__ - Step 36988: {'lr': 0.00043416668950240536, 'samples': 7101696, 'steps': 36987, 'loss/train': 1.3889577388763428} -11/07/2021 02:26:25 - INFO - __main__ - Step 36989: {'lr': 0.0004341631007435617, 'samples': 7101888, 'steps': 36988, 'loss/train': 1.1590068340301514} -11/07/2021 02:26:25 - INFO - __main__ - Step 36990: {'lr': 0.00043415951190173697, 'samples': 7102080, 'steps': 36989, 'loss/train': 1.2773730754852295} -11/07/2021 02:26:25 - INFO - __main__ - Step 36991: {'lr': 0.00043415592297693276, 'samples': 7102272, 'steps': 36990, 'loss/train': 1.5589598417282104} -11/07/2021 02:26:26 - INFO - __main__ - Step 36992: {'lr': 0.00043415233396915077, 'samples': 7102464, 'steps': 36991, 'loss/train': 1.318044662475586} -11/07/2021 02:26:27 - INFO - __main__ - Step 36993: {'lr': 0.0004341487448783926, 'samples': 7102656, 'steps': 36992, 'loss/train': 2.0069692134857178} -11/07/2021 02:26:27 - INFO - __main__ - Step 36994: {'lr': 0.00043414515570465987, 'samples': 7102848, 'steps': 36993, 'loss/train': 1.1666438579559326} -11/07/2021 02:26:27 - INFO - __main__ - Step 36995: {'lr': 0.0004341415664479541, 'samples': 7103040, 'steps': 36994, 'loss/train': 1.4736157655715942} -11/07/2021 02:26:28 - INFO - __main__ - Step 36996: {'lr': 0.00043413797710827707, 'samples': 7103232, 'steps': 36995, 'loss/train': 1.1507172584533691} -11/07/2021 02:26:28 - INFO - __main__ - Step 36997: {'lr': 0.00043413438768563026, 'samples': 7103424, 'steps': 36996, 'loss/train': 1.53364896774292} -11/07/2021 02:26:29 - INFO - __main__ - Step 36998: {'lr': 0.0004341307981800153, 'samples': 7103616, 'steps': 36997, 'loss/train': 1.4414423704147339} -11/07/2021 02:26:30 - INFO - __main__ - Step 36999: {'lr': 0.0004341272085914339, 'samples': 7103808, 'steps': 36998, 'loss/train': 1.2519278526306152} -11/07/2021 02:26:30 - INFO - __main__ - Step 37000: {'lr': 0.00043412361891988763, 'samples': 7104000, 'steps': 36999, 'loss/train': 1.7549240589141846} -11/07/2021 02:26:30 - INFO - __main__ - Step 37001: {'lr': 0.0004341200291653781, 'samples': 7104192, 'steps': 37000, 'loss/train': 1.153167486190796} -11/07/2021 02:26:31 - INFO - __main__ - Step 37002: {'lr': 0.00043411643932790686, 'samples': 7104384, 'steps': 37001, 'loss/train': 0.5130859613418579} -11/07/2021 02:26:32 - INFO - __main__ - Step 37003: {'lr': 0.0004341128494074756, 'samples': 7104576, 'steps': 37002, 'loss/train': 0.9205571413040161} -11/07/2021 02:26:32 - INFO - __main__ - Step 37004: {'lr': 0.00043410925940408595, 'samples': 7104768, 'steps': 37003, 'loss/train': 1.8095409870147705} -11/07/2021 02:26:32 - INFO - __main__ - Step 37005: {'lr': 0.00043410566931773953, 'samples': 7104960, 'steps': 37004, 'loss/train': 1.2690837383270264} -11/07/2021 02:26:33 - INFO - __main__ - Step 37006: {'lr': 0.000434102079148438, 'samples': 7105152, 'steps': 37005, 'loss/train': 1.5979087352752686} -11/07/2021 02:26:33 - INFO - __main__ - Step 37007: {'lr': 0.0004340984888961828, 'samples': 7105344, 'steps': 37006, 'loss/train': 1.3557651042938232} -11/07/2021 02:26:33 - INFO - __main__ - Step 37008: {'lr': 0.00043409489856097573, 'samples': 7105536, 'steps': 37007, 'loss/train': 1.4115225076675415} -11/07/2021 02:26:34 - INFO - __main__ - Step 37009: {'lr': 0.0004340913081428183, 'samples': 7105728, 'steps': 37008, 'loss/train': 1.5827487707138062} -11/07/2021 02:26:35 - INFO - __main__ - Step 37010: {'lr': 0.00043408771764171216, 'samples': 7105920, 'steps': 37009, 'loss/train': 1.5879969596862793} -11/07/2021 02:26:35 - INFO - __main__ - Step 37011: {'lr': 0.000434084127057659, 'samples': 7106112, 'steps': 37010, 'loss/train': 1.4903258085250854} -11/07/2021 02:26:35 - INFO - __main__ - Step 37012: {'lr': 0.0004340805363906603, 'samples': 7106304, 'steps': 37011, 'loss/train': 1.3931164741516113} -11/07/2021 02:26:36 - INFO - __main__ - Step 37013: {'lr': 0.00043407694564071773, 'samples': 7106496, 'steps': 37012, 'loss/train': 2.0241074562072754} -11/07/2021 02:26:37 - INFO - __main__ - Step 37014: {'lr': 0.00043407335480783306, 'samples': 7106688, 'steps': 37013, 'loss/train': 1.6712000370025635} -11/07/2021 02:26:37 - INFO - __main__ - Step 37015: {'lr': 0.0004340697638920077, 'samples': 7106880, 'steps': 37014, 'loss/train': 1.5157111883163452} -11/07/2021 02:26:38 - INFO - __main__ - Step 37016: {'lr': 0.0004340661728932433, 'samples': 7107072, 'steps': 37015, 'loss/train': 1.5959793329238892} -11/07/2021 02:26:38 - INFO - __main__ - Step 37017: {'lr': 0.0004340625818115416, 'samples': 7107264, 'steps': 37016, 'loss/train': 1.7012815475463867} -11/07/2021 02:26:38 - INFO - __main__ - Step 37018: {'lr': 0.00043405899064690405, 'samples': 7107456, 'steps': 37017, 'loss/train': 1.6925928592681885} -11/07/2021 02:26:39 - INFO - __main__ - Step 37019: {'lr': 0.0004340553993993325, 'samples': 7107648, 'steps': 37018, 'loss/train': 1.8460217714309692} -11/07/2021 02:26:40 - INFO - __main__ - Step 37020: {'lr': 0.0004340518080688283, 'samples': 7107840, 'steps': 37019, 'loss/train': 1.5365556478500366} -11/07/2021 02:26:40 - INFO - __main__ - Step 37021: {'lr': 0.0004340482166553932, 'samples': 7108032, 'steps': 37020, 'loss/train': 1.8368773460388184} -11/07/2021 02:26:40 - INFO - __main__ - Step 37022: {'lr': 0.0004340446251590289, 'samples': 7108224, 'steps': 37021, 'loss/train': 1.7531707286834717} -11/07/2021 02:26:41 - INFO - __main__ - Step 37023: {'lr': 0.00043404103357973684, 'samples': 7108416, 'steps': 37022, 'loss/train': 1.1846529245376587} -11/07/2021 02:26:42 - INFO - __main__ - Step 37024: {'lr': 0.0004340374419175188, 'samples': 7108608, 'steps': 37023, 'loss/train': 1.5365815162658691} -11/07/2021 02:26:42 - INFO - __main__ - Step 37025: {'lr': 0.0004340338501723763, 'samples': 7108800, 'steps': 37024, 'loss/train': 2.1280877590179443} -11/07/2021 02:26:42 - INFO - __main__ - Step 37026: {'lr': 0.00043403025834431097, 'samples': 7108992, 'steps': 37025, 'loss/train': 1.6921418905258179} -11/07/2021 02:26:43 - INFO - __main__ - Step 37027: {'lr': 0.00043402666643332444, 'samples': 7109184, 'steps': 37026, 'loss/train': 1.3075718879699707} -11/07/2021 02:26:43 - INFO - __main__ - Step 37028: {'lr': 0.00043402307443941835, 'samples': 7109376, 'steps': 37027, 'loss/train': 1.4104558229446411} -11/07/2021 02:26:44 - INFO - __main__ - Step 37029: {'lr': 0.00043401948236259437, 'samples': 7109568, 'steps': 37028, 'loss/train': 1.4770339727401733} -11/07/2021 02:26:45 - INFO - __main__ - Step 37030: {'lr': 0.000434015890202854, 'samples': 7109760, 'steps': 37029, 'loss/train': 1.0834112167358398} -11/07/2021 02:26:45 - INFO - __main__ - Step 37031: {'lr': 0.0004340122979601989, 'samples': 7109952, 'steps': 37030, 'loss/train': 1.4986871480941772} -11/07/2021 02:26:45 - INFO - __main__ - Step 37032: {'lr': 0.0004340087056346307, 'samples': 7110144, 'steps': 37031, 'loss/train': 1.2967861890792847} -11/07/2021 02:26:46 - INFO - __main__ - Step 37033: {'lr': 0.000434005113226151, 'samples': 7110336, 'steps': 37032, 'loss/train': 1.0271788835525513} -11/07/2021 02:26:47 - INFO - __main__ - Step 37034: {'lr': 0.0004340015207347614, 'samples': 7110528, 'steps': 37033, 'loss/train': 1.4559848308563232} -11/07/2021 02:26:47 - INFO - __main__ - Step 37035: {'lr': 0.0004339979281604636, 'samples': 7110720, 'steps': 37034, 'loss/train': 1.8344744443893433} -11/07/2021 02:26:48 - INFO - __main__ - Step 37036: {'lr': 0.00043399433550325917, 'samples': 7110912, 'steps': 37035, 'loss/train': 1.378834843635559} -11/07/2021 02:26:48 - INFO - __main__ - Step 37037: {'lr': 0.00043399074276314974, 'samples': 7111104, 'steps': 37036, 'loss/train': 1.4435096979141235} -11/07/2021 02:26:48 - INFO - __main__ - Step 37038: {'lr': 0.00043398714994013696, 'samples': 7111296, 'steps': 37037, 'loss/train': 1.315832257270813} -11/07/2021 02:26:49 - INFO - __main__ - Step 37039: {'lr': 0.00043398355703422233, 'samples': 7111488, 'steps': 37038, 'loss/train': 1.2000634670257568} -11/07/2021 02:26:50 - INFO - __main__ - Step 37040: {'lr': 0.0004339799640454076, 'samples': 7111680, 'steps': 37039, 'loss/train': 1.1245691776275635} -11/07/2021 02:26:50 - INFO - __main__ - Step 37041: {'lr': 0.00043397637097369434, 'samples': 7111872, 'steps': 37040, 'loss/train': 1.210996150970459} -11/07/2021 02:26:50 - INFO - __main__ - Step 37042: {'lr': 0.0004339727778190842, 'samples': 7112064, 'steps': 37041, 'loss/train': 1.5488569736480713} -11/07/2021 02:26:51 - INFO - __main__ - Step 37043: {'lr': 0.0004339691845815786, 'samples': 7112256, 'steps': 37042, 'loss/train': 1.4970704317092896} -11/07/2021 02:26:51 - INFO - __main__ - Step 37044: {'lr': 0.0004339655912611795, 'samples': 7112448, 'steps': 37043, 'loss/train': 1.3883769512176514} -11/07/2021 02:26:52 - INFO - __main__ - Step 37045: {'lr': 0.00043396199785788824, 'samples': 7112640, 'steps': 37044, 'loss/train': 1.9679926633834839} -11/07/2021 02:26:52 - INFO - __main__ - Step 37046: {'lr': 0.00043395840437170666, 'samples': 7112832, 'steps': 37045, 'loss/train': 1.365040898323059} -11/07/2021 02:26:53 - INFO - __main__ - Step 37047: {'lr': 0.00043395481080263614, 'samples': 7113024, 'steps': 37046, 'loss/train': 1.3028538227081299} -11/07/2021 02:26:53 - INFO - __main__ - Step 37048: {'lr': 0.0004339512171506785, 'samples': 7113216, 'steps': 37047, 'loss/train': 1.3216134309768677} -11/07/2021 02:26:53 - INFO - __main__ - Step 37049: {'lr': 0.0004339476234158352, 'samples': 7113408, 'steps': 37048, 'loss/train': 1.917819619178772} -11/07/2021 02:26:55 - INFO - __main__ - Step 37050: {'lr': 0.00043394402959810795, 'samples': 7113600, 'steps': 37049, 'loss/train': 1.5562846660614014} -11/07/2021 02:26:55 - INFO - __main__ - Step 37051: {'lr': 0.00043394043569749843, 'samples': 7113792, 'steps': 37050, 'loss/train': 1.555881381034851} -11/07/2021 02:26:55 - INFO - __main__ - Step 37052: {'lr': 0.00043393684171400817, 'samples': 7113984, 'steps': 37051, 'loss/train': 1.501509666442871} -11/07/2021 02:26:56 - INFO - __main__ - Step 37053: {'lr': 0.00043393324764763873, 'samples': 7114176, 'steps': 37052, 'loss/train': 1.3671139478683472} -11/07/2021 02:26:56 - INFO - __main__ - Step 37054: {'lr': 0.0004339296534983919, 'samples': 7114368, 'steps': 37053, 'loss/train': 1.194187045097351} -11/07/2021 02:26:58 - INFO - __main__ - Step 37055: {'lr': 0.00043392605926626914, 'samples': 7114560, 'steps': 37054, 'loss/train': 1.2914605140686035} -11/07/2021 02:26:58 - INFO - __main__ - Step 37056: {'lr': 0.0004339224649512722, 'samples': 7114752, 'steps': 37055, 'loss/train': 1.5854653120040894} -11/07/2021 02:26:58 - INFO - __main__ - Step 37057: {'lr': 0.00043391887055340263, 'samples': 7114944, 'steps': 37056, 'loss/train': 1.5734776258468628} -11/07/2021 02:26:59 - INFO - __main__ - Step 37058: {'lr': 0.000433915276072662, 'samples': 7115136, 'steps': 37057, 'loss/train': 1.7411218881607056} -11/07/2021 02:26:59 - INFO - __main__ - Step 37059: {'lr': 0.00043391168150905203, 'samples': 7115328, 'steps': 37058, 'loss/train': 1.6579246520996094} -11/07/2021 02:26:59 - INFO - __main__ - Step 37060: {'lr': 0.0004339080868625743, 'samples': 7115520, 'steps': 37059, 'loss/train': 0.5986313223838806} -11/07/2021 02:27:01 - INFO - __main__ - Step 37061: {'lr': 0.00043390449213323037, 'samples': 7115712, 'steps': 37060, 'loss/train': 0.4319573640823364} -11/07/2021 02:27:01 - INFO - __main__ - Step 37062: {'lr': 0.000433900897321022, 'samples': 7115904, 'steps': 37061, 'loss/train': 0.08170078694820404} -11/07/2021 02:27:01 - INFO - __main__ - Step 37063: {'lr': 0.0004338973024259506, 'samples': 7116096, 'steps': 37062, 'loss/train': 0.7094062566757202} -11/07/2021 02:27:02 - INFO - __main__ - Step 37064: {'lr': 0.00043389370744801806, 'samples': 7116288, 'steps': 37063, 'loss/train': 1.4509012699127197} -11/07/2021 02:27:02 - INFO - __main__ - Step 37065: {'lr': 0.00043389011238722575, 'samples': 7116480, 'steps': 37064, 'loss/train': 1.0019127130508423} -11/07/2021 02:27:03 - INFO - __main__ - Step 37066: {'lr': 0.0004338865172435754, 'samples': 7116672, 'steps': 37065, 'loss/train': 1.5191227197647095} -11/07/2021 02:27:03 - INFO - __main__ - Step 37067: {'lr': 0.00043388292201706867, 'samples': 7116864, 'steps': 37066, 'loss/train': 1.7019362449645996} -11/07/2021 02:27:04 - INFO - __main__ - Step 37068: {'lr': 0.0004338793267077071, 'samples': 7117056, 'steps': 37067, 'loss/train': 1.5938674211502075} -11/07/2021 02:27:04 - INFO - __main__ - Step 37069: {'lr': 0.0004338757313154923, 'samples': 7117248, 'steps': 37068, 'loss/train': 1.4200563430786133} -11/07/2021 02:27:04 - INFO - __main__ - Step 37070: {'lr': 0.000433872135840426, 'samples': 7117440, 'steps': 37069, 'loss/train': 0.9483161568641663} -11/07/2021 02:27:05 - INFO - __main__ - Step 37071: {'lr': 0.00043386854028250977, 'samples': 7117632, 'steps': 37070, 'loss/train': 1.6696423292160034} -11/07/2021 02:27:06 - INFO - __main__ - Step 37072: {'lr': 0.00043386494464174515, 'samples': 7117824, 'steps': 37071, 'loss/train': 2.824124336242676} -11/07/2021 02:27:06 - INFO - __main__ - Step 37073: {'lr': 0.0004338613489181338, 'samples': 7118016, 'steps': 37072, 'loss/train': 1.9422165155410767} -11/07/2021 02:27:06 - INFO - __main__ - Step 37074: {'lr': 0.00043385775311167746, 'samples': 7118208, 'steps': 37073, 'loss/train': 1.103857398033142} -11/07/2021 02:27:07 - INFO - __main__ - Step 37075: {'lr': 0.00043385415722237765, 'samples': 7118400, 'steps': 37074, 'loss/train': 1.910669207572937} -11/07/2021 02:27:08 - INFO - __main__ - Step 37076: {'lr': 0.0004338505612502359, 'samples': 7118592, 'steps': 37075, 'loss/train': 1.5614584684371948} -11/07/2021 02:27:08 - INFO - __main__ - Step 37077: {'lr': 0.000433846965195254, 'samples': 7118784, 'steps': 37076, 'loss/train': 1.5544991493225098} -11/07/2021 02:27:08 - INFO - __main__ - Step 37078: {'lr': 0.00043384336905743343, 'samples': 7118976, 'steps': 37077, 'loss/train': 1.7339357137680054} -11/07/2021 02:27:09 - INFO - __main__ - Step 37079: {'lr': 0.0004338397728367759, 'samples': 7119168, 'steps': 37078, 'loss/train': 1.6730190515518188} -11/07/2021 02:27:09 - INFO - __main__ - Step 37080: {'lr': 0.000433836176533283, 'samples': 7119360, 'steps': 37079, 'loss/train': 1.6230782270431519} -11/07/2021 02:27:10 - INFO - __main__ - Step 37081: {'lr': 0.0004338325801469564, 'samples': 7119552, 'steps': 37080, 'loss/train': 1.6183432340621948} -11/07/2021 02:27:11 - INFO - __main__ - Step 37082: {'lr': 0.00043382898367779767, 'samples': 7119744, 'steps': 37081, 'loss/train': 1.7554967403411865} -11/07/2021 02:27:11 - INFO - __main__ - Step 37083: {'lr': 0.00043382538712580845, 'samples': 7119936, 'steps': 37082, 'loss/train': 1.476054310798645} -11/07/2021 02:27:11 - INFO - __main__ - Step 37084: {'lr': 0.00043382179049099024, 'samples': 7120128, 'steps': 37083, 'loss/train': 1.7822281122207642} -11/07/2021 02:27:12 - INFO - __main__ - Step 37085: {'lr': 0.00043381819377334485, 'samples': 7120320, 'steps': 37084, 'loss/train': 1.2737452983856201} -11/07/2021 02:27:12 - INFO - __main__ - Step 37086: {'lr': 0.00043381459697287383, 'samples': 7120512, 'steps': 37085, 'loss/train': 1.7624574899673462} -11/07/2021 02:27:13 - INFO - __main__ - Step 37087: {'lr': 0.0004338110000895787, 'samples': 7120704, 'steps': 37086, 'loss/train': 1.9725539684295654} -11/07/2021 02:27:13 - INFO - __main__ - Step 37088: {'lr': 0.00043380740312346135, 'samples': 7120896, 'steps': 37087, 'loss/train': 1.3805655241012573} -11/07/2021 02:27:14 - INFO - __main__ - Step 37089: {'lr': 0.00043380380607452307, 'samples': 7121088, 'steps': 37088, 'loss/train': 2.1629951000213623} -11/07/2021 02:27:14 - INFO - __main__ - Step 37090: {'lr': 0.0004338002089427657, 'samples': 7121280, 'steps': 37089, 'loss/train': 1.704150676727295} -11/07/2021 02:27:14 - INFO - __main__ - Step 37091: {'lr': 0.00043379661172819075, 'samples': 7121472, 'steps': 37090, 'loss/train': 1.3050607442855835} -11/07/2021 02:27:15 - INFO - __main__ - Step 37092: {'lr': 0.0004337930144307999, 'samples': 7121664, 'steps': 37091, 'loss/train': 1.029489278793335} -11/07/2021 02:27:16 - INFO - __main__ - Step 37093: {'lr': 0.0004337894170505947, 'samples': 7121856, 'steps': 37092, 'loss/train': 1.5230679512023926} -11/07/2021 02:27:16 - INFO - __main__ - Step 37094: {'lr': 0.0004337858195875769, 'samples': 7122048, 'steps': 37093, 'loss/train': 1.5719635486602783} -11/07/2021 02:27:17 - INFO - __main__ - Step 37095: {'lr': 0.00043378222204174807, 'samples': 7122240, 'steps': 37094, 'loss/train': 1.6674373149871826} -11/07/2021 02:27:17 - INFO - __main__ - Step 37096: {'lr': 0.0004337786244131097, 'samples': 7122432, 'steps': 37095, 'loss/train': 1.4746836423873901} -11/07/2021 02:27:18 - INFO - __main__ - Step 37097: {'lr': 0.00043377502670166357, 'samples': 7122624, 'steps': 37096, 'loss/train': 2.1680285930633545} -11/07/2021 02:27:18 - INFO - __main__ - Step 37098: {'lr': 0.0004337714289074113, 'samples': 7122816, 'steps': 37097, 'loss/train': 1.1618105173110962} -11/07/2021 02:27:19 - INFO - __main__ - Step 37099: {'lr': 0.0004337678310303544, 'samples': 7123008, 'steps': 37098, 'loss/train': 1.6241350173950195} -11/07/2021 02:27:19 - INFO - __main__ - Step 37100: {'lr': 0.00043376423307049455, 'samples': 7123200, 'steps': 37099, 'loss/train': 0.8144013285636902} -11/07/2021 02:27:19 - INFO - __main__ - Step 37101: {'lr': 0.00043376063502783337, 'samples': 7123392, 'steps': 37100, 'loss/train': 1.6171725988388062} -11/07/2021 02:27:20 - INFO - __main__ - Step 37102: {'lr': 0.00043375703690237254, 'samples': 7123584, 'steps': 37101, 'loss/train': 1.6170181035995483} -11/07/2021 02:27:21 - INFO - __main__ - Step 37103: {'lr': 0.0004337534386941135, 'samples': 7123776, 'steps': 37102, 'loss/train': 1.580391764640808} -11/07/2021 02:27:21 - INFO - __main__ - Step 37104: {'lr': 0.00043374984040305816, 'samples': 7123968, 'steps': 37103, 'loss/train': 4.709044456481934} -11/07/2021 02:27:21 - INFO - __main__ - Step 37105: {'lr': 0.00043374624202920786, 'samples': 7124160, 'steps': 37104, 'loss/train': 1.4684909582138062} -11/07/2021 02:27:22 - INFO - __main__ - Step 37106: {'lr': 0.0004337426435725644, 'samples': 7124352, 'steps': 37105, 'loss/train': 1.618173599243164} -11/07/2021 02:27:23 - INFO - __main__ - Step 37107: {'lr': 0.00043373904503312934, 'samples': 7124544, 'steps': 37106, 'loss/train': 1.5031660795211792} -11/07/2021 02:27:23 - INFO - __main__ - Step 37108: {'lr': 0.0004337354464109042, 'samples': 7124736, 'steps': 37107, 'loss/train': 1.3616937398910522} -11/07/2021 02:27:23 - INFO - __main__ - Step 37109: {'lr': 0.0004337318477058908, 'samples': 7124928, 'steps': 37108, 'loss/train': 1.0435408353805542} -11/07/2021 02:27:24 - INFO - __main__ - Step 37110: {'lr': 0.0004337282489180907, 'samples': 7125120, 'steps': 37109, 'loss/train': 1.6722913980484009} -11/07/2021 02:27:24 - INFO - __main__ - Step 37111: {'lr': 0.0004337246500475054, 'samples': 7125312, 'steps': 37110, 'loss/train': 1.277995228767395} -11/07/2021 02:27:24 - INFO - __main__ - Step 37112: {'lr': 0.0004337210510941366, 'samples': 7125504, 'steps': 37111, 'loss/train': 1.1224045753479004} -11/07/2021 02:27:25 - INFO - __main__ - Step 37113: {'lr': 0.000433717452057986, 'samples': 7125696, 'steps': 37112, 'loss/train': 0.9895749092102051} -11/07/2021 02:27:26 - INFO - __main__ - Step 37114: {'lr': 0.00043371385293905517, 'samples': 7125888, 'steps': 37113, 'loss/train': 1.5234973430633545} -11/07/2021 02:27:26 - INFO - __main__ - Step 37115: {'lr': 0.0004337102537373456, 'samples': 7126080, 'steps': 37114, 'loss/train': 1.5487487316131592} -11/07/2021 02:27:27 - INFO - __main__ - Step 37116: {'lr': 0.0004337066544528591, 'samples': 7126272, 'steps': 37115, 'loss/train': 0.6512836217880249} -11/07/2021 02:27:27 - INFO - __main__ - Step 37117: {'lr': 0.00043370305508559723, 'samples': 7126464, 'steps': 37116, 'loss/train': 1.3662883043289185} -11/07/2021 02:27:28 - INFO - __main__ - Step 37118: {'lr': 0.00043369945563556157, 'samples': 7126656, 'steps': 37117, 'loss/train': 1.2095894813537598} -11/07/2021 02:27:28 - INFO - __main__ - Step 37119: {'lr': 0.00043369585610275374, 'samples': 7126848, 'steps': 37118, 'loss/train': 0.9861893057823181} -11/07/2021 02:27:29 - INFO - __main__ - Step 37120: {'lr': 0.0004336922564871755, 'samples': 7127040, 'steps': 37119, 'loss/train': 1.63252592086792} -11/07/2021 02:27:29 - INFO - __main__ - Step 37121: {'lr': 0.00043368865678882824, 'samples': 7127232, 'steps': 37120, 'loss/train': 1.4385783672332764} -11/07/2021 02:27:29 - INFO - __main__ - Step 37122: {'lr': 0.00043368505700771377, 'samples': 7127424, 'steps': 37121, 'loss/train': 1.6075456142425537} -11/07/2021 02:27:30 - INFO - __main__ - Step 37123: {'lr': 0.00043368145714383364, 'samples': 7127616, 'steps': 37122, 'loss/train': 1.1798597574234009} -11/07/2021 02:27:31 - INFO - __main__ - Step 37124: {'lr': 0.00043367785719718947, 'samples': 7127808, 'steps': 37123, 'loss/train': 1.5068614482879639} -11/07/2021 02:27:31 - INFO - __main__ - Step 37125: {'lr': 0.0004336742571677829, 'samples': 7128000, 'steps': 37124, 'loss/train': 1.5282413959503174} -11/07/2021 02:27:31 - INFO - __main__ - Step 37126: {'lr': 0.00043367065705561547, 'samples': 7128192, 'steps': 37125, 'loss/train': 1.5183273553848267} -11/07/2021 02:27:32 - INFO - __main__ - Step 37127: {'lr': 0.00043366705686068895, 'samples': 7128384, 'steps': 37126, 'loss/train': 1.2544848918914795} -11/07/2021 02:27:33 - INFO - __main__ - Step 37128: {'lr': 0.0004336634565830049, 'samples': 7128576, 'steps': 37127, 'loss/train': 1.8652119636535645} -11/07/2021 02:27:33 - INFO - __main__ - Step 37129: {'lr': 0.0004336598562225649, 'samples': 7128768, 'steps': 37128, 'loss/train': 1.3766703605651855} -11/07/2021 02:27:34 - INFO - __main__ - Step 37130: {'lr': 0.00043365625577937065, 'samples': 7128960, 'steps': 37129, 'loss/train': 1.6950541734695435} -11/07/2021 02:27:34 - INFO - __main__ - Step 37131: {'lr': 0.00043365265525342365, 'samples': 7129152, 'steps': 37130, 'loss/train': 1.2819048166275024} -11/07/2021 02:27:34 - INFO - __main__ - Step 37132: {'lr': 0.00043364905464472563, 'samples': 7129344, 'steps': 37131, 'loss/train': 1.628318428993225} -11/07/2021 02:27:35 - INFO - __main__ - Step 37133: {'lr': 0.0004336454539532782, 'samples': 7129536, 'steps': 37132, 'loss/train': 5.755924701690674} -11/07/2021 02:27:36 - INFO - __main__ - Step 37134: {'lr': 0.00043364185317908296, 'samples': 7129728, 'steps': 37133, 'loss/train': 1.2615383863449097} -11/07/2021 02:27:36 - INFO - __main__ - Step 37135: {'lr': 0.0004336382523221415, 'samples': 7129920, 'steps': 37134, 'loss/train': 1.1689530611038208} -11/07/2021 02:27:36 - INFO - __main__ - Step 37136: {'lr': 0.0004336346513824555, 'samples': 7130112, 'steps': 37135, 'loss/train': 1.9664125442504883} -11/07/2021 02:27:37 - INFO - __main__ - Step 37137: {'lr': 0.0004336310503600266, 'samples': 7130304, 'steps': 37136, 'loss/train': 1.0943663120269775} -11/07/2021 02:27:37 - INFO - __main__ - Step 37138: {'lr': 0.0004336274492548563, 'samples': 7130496, 'steps': 37137, 'loss/train': 1.752846598625183} -11/07/2021 02:27:38 - INFO - __main__ - Step 37139: {'lr': 0.0004336238480669463, 'samples': 7130688, 'steps': 37138, 'loss/train': 1.6972535848617554} -11/07/2021 02:27:39 - INFO - __main__ - Step 37140: {'lr': 0.0004336202467962983, 'samples': 7130880, 'steps': 37139, 'loss/train': 1.4095814228057861} -11/07/2021 02:27:39 - INFO - __main__ - Step 37141: {'lr': 0.0004336166454429139, 'samples': 7131072, 'steps': 37140, 'loss/train': 1.2461761236190796} -11/07/2021 02:27:39 - INFO - __main__ - Step 37142: {'lr': 0.0004336130440067946, 'samples': 7131264, 'steps': 37141, 'loss/train': 1.0689070224761963} -11/07/2021 02:27:40 - INFO - __main__ - Step 37143: {'lr': 0.000433609442487942, 'samples': 7131456, 'steps': 37142, 'loss/train': 1.5266462564468384} -11/07/2021 02:27:41 - INFO - __main__ - Step 37144: {'lr': 0.00043360584088635804, 'samples': 7131648, 'steps': 37143, 'loss/train': 1.4167495965957642} -11/07/2021 02:27:41 - INFO - __main__ - Step 37145: {'lr': 0.0004336022392020439, 'samples': 7131840, 'steps': 37144, 'loss/train': 1.4522278308868408} -11/07/2021 02:27:41 - INFO - __main__ - Step 37146: {'lr': 0.0004335986374350015, 'samples': 7132032, 'steps': 37145, 'loss/train': 1.5540838241577148} -11/07/2021 02:27:42 - INFO - __main__ - Step 37147: {'lr': 0.00043359503558523246, 'samples': 7132224, 'steps': 37146, 'loss/train': 1.2634097337722778} -11/07/2021 02:27:42 - INFO - __main__ - Step 37148: {'lr': 0.0004335914336527382, 'samples': 7132416, 'steps': 37147, 'loss/train': 1.746785044670105} -11/07/2021 02:27:43 - INFO - __main__ - Step 37149: {'lr': 0.0004335878316375206, 'samples': 7132608, 'steps': 37148, 'loss/train': 1.4561712741851807} -11/07/2021 02:27:43 - INFO - __main__ - Step 37150: {'lr': 0.0004335842295395811, 'samples': 7132800, 'steps': 37149, 'loss/train': 0.9840590953826904} -11/07/2021 02:27:44 - INFO - __main__ - Step 37151: {'lr': 0.0004335806273589214, 'samples': 7132992, 'steps': 37150, 'loss/train': 1.2678557634353638} -11/07/2021 02:27:44 - INFO - __main__ - Step 37152: {'lr': 0.0004335770250955431, 'samples': 7133184, 'steps': 37151, 'loss/train': 1.4049510955810547} -11/07/2021 02:27:45 - INFO - __main__ - Step 37153: {'lr': 0.0004335734227494478, 'samples': 7133376, 'steps': 37152, 'loss/train': 1.6425676345825195} -11/07/2021 02:27:46 - INFO - __main__ - Step 37154: {'lr': 0.0004335698203206372, 'samples': 7133568, 'steps': 37153, 'loss/train': 1.8100358247756958} -11/07/2021 02:27:46 - INFO - __main__ - Step 37155: {'lr': 0.00043356621780911273, 'samples': 7133760, 'steps': 37154, 'loss/train': 1.6426031589508057} -11/07/2021 02:27:46 - INFO - __main__ - Step 37156: {'lr': 0.0004335626152148763, 'samples': 7133952, 'steps': 37155, 'loss/train': 1.9970622062683105} -11/07/2021 02:27:47 - INFO - __main__ - Step 37157: {'lr': 0.0004335590125379293, 'samples': 7134144, 'steps': 37156, 'loss/train': 1.66996169090271} -11/07/2021 02:27:47 - INFO - __main__ - Step 37158: {'lr': 0.00043355540977827356, 'samples': 7134336, 'steps': 37157, 'loss/train': 1.1085461378097534} -11/07/2021 02:27:48 - INFO - __main__ - Step 37159: {'lr': 0.0004335518069359105, 'samples': 7134528, 'steps': 37158, 'loss/train': 0.21571595966815948} -11/07/2021 02:27:48 - INFO - __main__ - Step 37160: {'lr': 0.0004335482040108418, 'samples': 7134720, 'steps': 37159, 'loss/train': 1.7107292413711548} -11/07/2021 02:27:49 - INFO - __main__ - Step 37161: {'lr': 0.00043354460100306915, 'samples': 7134912, 'steps': 37160, 'loss/train': 1.9382342100143433} -11/07/2021 02:27:49 - INFO - __main__ - Step 37162: {'lr': 0.00043354099791259414, 'samples': 7135104, 'steps': 37161, 'loss/train': 0.9119004011154175} -11/07/2021 02:27:49 - INFO - __main__ - Step 37163: {'lr': 0.00043353739473941846, 'samples': 7135296, 'steps': 37162, 'loss/train': 1.6841670274734497} -11/07/2021 02:27:50 - INFO - __main__ - Step 37164: {'lr': 0.0004335337914835435, 'samples': 7135488, 'steps': 37163, 'loss/train': 1.644423484802246} -11/07/2021 02:27:51 - INFO - __main__ - Step 37165: {'lr': 0.0004335301881449711, 'samples': 7135680, 'steps': 37164, 'loss/train': 1.5664054155349731} -11/07/2021 02:27:51 - INFO - __main__ - Step 37166: {'lr': 0.00043352658472370294, 'samples': 7135872, 'steps': 37165, 'loss/train': 1.2007473707199097} -11/07/2021 02:27:51 - INFO - __main__ - Step 37167: {'lr': 0.00043352298121974043, 'samples': 7136064, 'steps': 37166, 'loss/train': 1.7131773233413696} -11/07/2021 02:27:52 - INFO - __main__ - Step 37168: {'lr': 0.00043351937763308533, 'samples': 7136256, 'steps': 37167, 'loss/train': 1.607792854309082} -11/07/2021 02:27:52 - INFO - __main__ - Step 37169: {'lr': 0.0004335157739637392, 'samples': 7136448, 'steps': 37168, 'loss/train': 1.5750174522399902} -11/07/2021 02:27:53 - INFO - __main__ - Step 37170: {'lr': 0.0004335121702117038, 'samples': 7136640, 'steps': 37169, 'loss/train': 1.431115746498108} -11/07/2021 02:27:54 - INFO - __main__ - Step 37171: {'lr': 0.0004335085663769805, 'samples': 7136832, 'steps': 37170, 'loss/train': 1.4753409624099731} -11/07/2021 02:27:54 - INFO - __main__ - Step 37172: {'lr': 0.00043350496245957116, 'samples': 7137024, 'steps': 37171, 'loss/train': 1.4689682722091675} -11/07/2021 02:27:54 - INFO - __main__ - Step 37173: {'lr': 0.00043350135845947725, 'samples': 7137216, 'steps': 37172, 'loss/train': 0.965884804725647} -11/07/2021 02:27:55 - INFO - __main__ - Step 37174: {'lr': 0.00043349775437670046, 'samples': 7137408, 'steps': 37173, 'loss/train': 0.5817450881004333} -11/07/2021 02:27:56 - INFO - __main__ - Step 37175: {'lr': 0.0004334941502112425, 'samples': 7137600, 'steps': 37174, 'loss/train': 1.1755576133728027} -11/07/2021 02:27:56 - INFO - __main__ - Step 37176: {'lr': 0.0004334905459631049, 'samples': 7137792, 'steps': 37175, 'loss/train': 1.4950543642044067} -11/07/2021 02:27:56 - INFO - __main__ - Step 37177: {'lr': 0.0004334869416322892, 'samples': 7137984, 'steps': 37176, 'loss/train': 1.5821439027786255} -11/07/2021 02:27:57 - INFO - __main__ - Step 37178: {'lr': 0.0004334833372187972, 'samples': 7138176, 'steps': 37177, 'loss/train': 1.3863235712051392} -11/07/2021 02:27:57 - INFO - __main__ - Step 37179: {'lr': 0.0004334797327226304, 'samples': 7138368, 'steps': 37178, 'loss/train': 1.3994529247283936} -11/07/2021 02:27:58 - INFO - __main__ - Step 37180: {'lr': 0.00043347612814379047, 'samples': 7138560, 'steps': 37179, 'loss/train': 1.3833494186401367} -11/07/2021 02:27:59 - INFO - __main__ - Step 37181: {'lr': 0.000433472523482279, 'samples': 7138752, 'steps': 37180, 'loss/train': 0.6981086134910583} -11/07/2021 02:27:59 - INFO - __main__ - Step 37182: {'lr': 0.0004334689187380977, 'samples': 7138944, 'steps': 37181, 'loss/train': 1.9053527116775513} -11/07/2021 02:27:59 - INFO - __main__ - Step 37183: {'lr': 0.0004334653139112481, 'samples': 7139136, 'steps': 37182, 'loss/train': 1.3545410633087158} -11/07/2021 02:28:00 - INFO - __main__ - Step 37184: {'lr': 0.0004334617090017319, 'samples': 7139328, 'steps': 37183, 'loss/train': 1.5792773962020874} -11/07/2021 02:28:00 - INFO - __main__ - Step 37185: {'lr': 0.0004334581040095506, 'samples': 7139520, 'steps': 37184, 'loss/train': 1.7746398448944092} -11/07/2021 02:28:01 - INFO - __main__ - Step 37186: {'lr': 0.00043345449893470594, 'samples': 7139712, 'steps': 37185, 'loss/train': 1.6468799114227295} -11/07/2021 02:28:02 - INFO - __main__ - Step 37187: {'lr': 0.00043345089377719954, 'samples': 7139904, 'steps': 37186, 'loss/train': 1.2727960348129272} -11/07/2021 02:28:02 - INFO - __main__ - Step 37188: {'lr': 0.00043344728853703297, 'samples': 7140096, 'steps': 37187, 'loss/train': 1.5978360176086426} -11/07/2021 02:28:02 - INFO - __main__ - Step 37189: {'lr': 0.0004334436832142079, 'samples': 7140288, 'steps': 37188, 'loss/train': 1.308510661125183} -11/07/2021 02:28:03 - INFO - __main__ - Step 37190: {'lr': 0.000433440077808726, 'samples': 7140480, 'steps': 37189, 'loss/train': 1.7172496318817139} -11/07/2021 02:28:03 - INFO - __main__ - Step 37191: {'lr': 0.00043343647232058877, 'samples': 7140672, 'steps': 37190, 'loss/train': 1.2515482902526855} -11/07/2021 02:28:04 - INFO - __main__ - Step 37192: {'lr': 0.0004334328667497979, 'samples': 7140864, 'steps': 37191, 'loss/train': 0.8863022923469543} -11/07/2021 02:28:04 - INFO - __main__ - Step 37193: {'lr': 0.00043342926109635497, 'samples': 7141056, 'steps': 37192, 'loss/train': 1.1954317092895508} -11/07/2021 02:28:05 - INFO - __main__ - Step 37194: {'lr': 0.0004334256553602617, 'samples': 7141248, 'steps': 37193, 'loss/train': 1.6151297092437744} -11/07/2021 02:28:05 - INFO - __main__ - Step 37195: {'lr': 0.00043342204954151963, 'samples': 7141440, 'steps': 37194, 'loss/train': 1.5363059043884277} -11/07/2021 02:28:05 - INFO - __main__ - Step 37196: {'lr': 0.00043341844364013047, 'samples': 7141632, 'steps': 37195, 'loss/train': 1.5967592000961304} -11/07/2021 02:28:07 - INFO - __main__ - Step 37197: {'lr': 0.00043341483765609566, 'samples': 7141824, 'steps': 37196, 'loss/train': 1.2228840589523315} -11/07/2021 02:28:07 - INFO - __main__ - Step 37198: {'lr': 0.0004334112315894171, 'samples': 7142016, 'steps': 37197, 'loss/train': 1.1674365997314453} -11/07/2021 02:28:07 - INFO - __main__ - Step 37199: {'lr': 0.00043340762544009627, 'samples': 7142208, 'steps': 37198, 'loss/train': 1.2941004037857056} -11/07/2021 02:28:08 - INFO - __main__ - Step 37200: {'lr': 0.0004334040192081347, 'samples': 7142400, 'steps': 37199, 'loss/train': 1.625350832939148} -11/07/2021 02:28:08 - INFO - __main__ - Step 37201: {'lr': 0.00043340041289353416, 'samples': 7142592, 'steps': 37200, 'loss/train': 1.4278935194015503} -11/07/2021 02:28:09 - INFO - __main__ - Step 37202: {'lr': 0.0004333968064962962, 'samples': 7142784, 'steps': 37201, 'loss/train': 1.6567054986953735} -11/07/2021 02:28:09 - INFO - __main__ - Step 37203: {'lr': 0.00043339320001642244, 'samples': 7142976, 'steps': 37202, 'loss/train': 1.620715618133545} -11/07/2021 02:28:10 - INFO - __main__ - Step 37204: {'lr': 0.0004333895934539146, 'samples': 7143168, 'steps': 37203, 'loss/train': 1.299027442932129} -11/07/2021 02:28:10 - INFO - __main__ - Step 37205: {'lr': 0.00043338598680877423, 'samples': 7143360, 'steps': 37204, 'loss/train': 1.6379092931747437} -11/07/2021 02:28:10 - INFO - __main__ - Step 37206: {'lr': 0.00043338238008100297, 'samples': 7143552, 'steps': 37205, 'loss/train': 1.3296124935150146} -11/07/2021 02:28:11 - INFO - __main__ - Step 37207: {'lr': 0.0004333787732706024, 'samples': 7143744, 'steps': 37206, 'loss/train': 1.4551992416381836} -11/07/2021 02:28:12 - INFO - __main__ - Step 37208: {'lr': 0.00043337516637757416, 'samples': 7143936, 'steps': 37207, 'loss/train': 1.1694921255111694} -11/07/2021 02:28:12 - INFO - __main__ - Step 37209: {'lr': 0.00043337155940191996, 'samples': 7144128, 'steps': 37208, 'loss/train': 1.6044751405715942} -11/07/2021 02:28:12 - INFO - __main__ - Step 37210: {'lr': 0.0004333679523436413, 'samples': 7144320, 'steps': 37209, 'loss/train': 1.1683112382888794} -11/07/2021 02:28:13 - INFO - __main__ - Step 37211: {'lr': 0.0004333643452027399, 'samples': 7144512, 'steps': 37210, 'loss/train': 0.2887013554573059} -11/07/2021 02:28:14 - INFO - __main__ - Step 37212: {'lr': 0.00043336073797921743, 'samples': 7144704, 'steps': 37211, 'loss/train': 1.025676965713501} -11/07/2021 02:28:14 - INFO - __main__ - Step 37213: {'lr': 0.0004333571306730754, 'samples': 7144896, 'steps': 37212, 'loss/train': 1.276005744934082} -11/07/2021 02:28:14 - INFO - __main__ - Step 37214: {'lr': 0.00043335352328431544, 'samples': 7145088, 'steps': 37213, 'loss/train': 1.3431577682495117} -11/07/2021 02:28:15 - INFO - __main__ - Step 37215: {'lr': 0.00043334991581293924, 'samples': 7145280, 'steps': 37214, 'loss/train': 1.2101293802261353} -11/07/2021 02:28:15 - INFO - __main__ - Step 37216: {'lr': 0.0004333463082589484, 'samples': 7145472, 'steps': 37215, 'loss/train': 1.5610136985778809} -11/07/2021 02:28:16 - INFO - __main__ - Step 37217: {'lr': 0.0004333427006223445, 'samples': 7145664, 'steps': 37216, 'loss/train': 1.2841063737869263} -11/07/2021 02:28:16 - INFO - __main__ - Step 37218: {'lr': 0.00043333909290312923, 'samples': 7145856, 'steps': 37217, 'loss/train': 1.0707043409347534} -11/07/2021 02:28:17 - INFO - __main__ - Step 37219: {'lr': 0.00043333548510130426, 'samples': 7146048, 'steps': 37218, 'loss/train': 1.5830148458480835} -11/07/2021 02:28:17 - INFO - __main__ - Step 37220: {'lr': 0.00043333187721687104, 'samples': 7146240, 'steps': 37219, 'loss/train': 1.8787128925323486} -11/07/2021 02:28:18 - INFO - __main__ - Step 37221: {'lr': 0.0004333282692498314, 'samples': 7146432, 'steps': 37220, 'loss/train': 2.0772974491119385} -11/07/2021 02:28:19 - INFO - __main__ - Step 37222: {'lr': 0.00043332466120018685, 'samples': 7146624, 'steps': 37221, 'loss/train': 1.8868778944015503} -11/07/2021 02:28:19 - INFO - __main__ - Step 37223: {'lr': 0.000433321053067939, 'samples': 7146816, 'steps': 37222, 'loss/train': 1.276110291481018} -11/07/2021 02:28:19 - INFO - __main__ - Step 37224: {'lr': 0.00043331744485308954, 'samples': 7147008, 'steps': 37223, 'loss/train': 1.0257227420806885} -11/07/2021 02:28:20 - INFO - __main__ - Step 37225: {'lr': 0.00043331383655564003, 'samples': 7147200, 'steps': 37224, 'loss/train': 1.7596057653427124} -11/07/2021 02:28:20 - INFO - __main__ - Step 37226: {'lr': 0.0004333102281755922, 'samples': 7147392, 'steps': 37225, 'loss/train': 1.1045256853103638} -11/07/2021 02:28:20 - INFO - __main__ - Step 37227: {'lr': 0.0004333066197129475, 'samples': 7147584, 'steps': 37226, 'loss/train': 1.3454959392547607} -11/07/2021 02:28:22 - INFO - __main__ - Step 37228: {'lr': 0.00043330301116770777, 'samples': 7147776, 'steps': 37227, 'loss/train': 1.0431512594223022} -11/07/2021 02:28:22 - INFO - __main__ - Step 37229: {'lr': 0.0004332994025398745, 'samples': 7147968, 'steps': 37228, 'loss/train': 1.4733880758285522} -11/07/2021 02:28:22 - INFO - __main__ - Step 37230: {'lr': 0.0004332957938294493, 'samples': 7148160, 'steps': 37229, 'loss/train': 1.5776143074035645} -11/07/2021 02:28:23 - INFO - __main__ - Step 37231: {'lr': 0.0004332921850364339, 'samples': 7148352, 'steps': 37230, 'loss/train': 0.6922283172607422} -11/07/2021 02:28:23 - INFO - __main__ - Step 37232: {'lr': 0.00043328857616082986, 'samples': 7148544, 'steps': 37231, 'loss/train': 1.354921579360962} -11/07/2021 02:28:24 - INFO - __main__ - Step 37233: {'lr': 0.0004332849672026388, 'samples': 7148736, 'steps': 37232, 'loss/train': 1.1492215394973755} -11/07/2021 02:28:24 - INFO - __main__ - Step 37234: {'lr': 0.0004332813581618624, 'samples': 7148928, 'steps': 37233, 'loss/train': 1.270585060119629} -11/07/2021 02:28:25 - INFO - __main__ - Step 37235: {'lr': 0.00043327774903850226, 'samples': 7149120, 'steps': 37234, 'loss/train': 1.6720829010009766} -11/07/2021 02:28:25 - INFO - __main__ - Step 37236: {'lr': 0.0004332741398325599, 'samples': 7149312, 'steps': 37235, 'loss/train': 1.7749427556991577} -11/07/2021 02:28:25 - INFO - __main__ - Step 37237: {'lr': 0.00043327053054403707, 'samples': 7149504, 'steps': 37236, 'loss/train': 1.336981177330017} -11/07/2021 02:28:26 - INFO - __main__ - Step 37238: {'lr': 0.0004332669211729354, 'samples': 7149696, 'steps': 37237, 'loss/train': 1.2597352266311646} -11/07/2021 02:28:27 - INFO - __main__ - Step 37239: {'lr': 0.00043326331171925656, 'samples': 7149888, 'steps': 37238, 'loss/train': 0.9623879194259644} -11/07/2021 02:28:27 - INFO - __main__ - Step 37240: {'lr': 0.000433259702183002, 'samples': 7150080, 'steps': 37239, 'loss/train': 1.4372882843017578} -11/07/2021 02:28:27 - INFO - __main__ - Step 37241: {'lr': 0.0004332560925641734, 'samples': 7150272, 'steps': 37240, 'loss/train': 1.8603291511535645} -11/07/2021 02:28:28 - INFO - __main__ - Step 37242: {'lr': 0.0004332524828627725, 'samples': 7150464, 'steps': 37241, 'loss/train': 1.3960036039352417} -11/07/2021 02:28:29 - INFO - __main__ - Step 37243: {'lr': 0.0004332488730788009, 'samples': 7150656, 'steps': 37242, 'loss/train': 1.51231050491333} -11/07/2021 02:28:29 - INFO - __main__ - Step 37244: {'lr': 0.0004332452632122601, 'samples': 7150848, 'steps': 37243, 'loss/train': 1.967123031616211} -11/07/2021 02:28:29 - INFO - __main__ - Step 37245: {'lr': 0.0004332416532631519, 'samples': 7151040, 'steps': 37244, 'loss/train': 1.2595200538635254} -11/07/2021 02:28:30 - INFO - __main__ - Step 37246: {'lr': 0.00043323804323147777, 'samples': 7151232, 'steps': 37245, 'loss/train': 0.15449711680412292} -11/07/2021 02:28:30 - INFO - __main__ - Step 37247: {'lr': 0.0004332344331172394, 'samples': 7151424, 'steps': 37246, 'loss/train': 1.4898953437805176} -11/07/2021 02:28:31 - INFO - __main__ - Step 37248: {'lr': 0.0004332308229204385, 'samples': 7151616, 'steps': 37247, 'loss/train': 1.775602102279663} -11/07/2021 02:28:32 - INFO - __main__ - Step 37249: {'lr': 0.00043322721264107657, 'samples': 7151808, 'steps': 37248, 'loss/train': 1.1206448078155518} -11/07/2021 02:28:32 - INFO - __main__ - Step 37250: {'lr': 0.00043322360227915526, 'samples': 7152000, 'steps': 37249, 'loss/train': 1.5136470794677734} -11/07/2021 02:28:32 - INFO - __main__ - Step 37251: {'lr': 0.0004332199918346763, 'samples': 7152192, 'steps': 37250, 'loss/train': 1.70261549949646} -11/07/2021 02:28:33 - INFO - __main__ - Step 37252: {'lr': 0.00043321638130764116, 'samples': 7152384, 'steps': 37251, 'loss/train': 1.5859137773513794} -11/07/2021 02:28:33 - INFO - __main__ - Step 37253: {'lr': 0.00043321277069805153, 'samples': 7152576, 'steps': 37252, 'loss/train': 1.2263541221618652} -11/07/2021 02:28:34 - INFO - __main__ - Step 37254: {'lr': 0.0004332091600059091, 'samples': 7152768, 'steps': 37253, 'loss/train': 0.814882755279541} -11/07/2021 02:28:35 - INFO - __main__ - Step 37255: {'lr': 0.00043320554923121545, 'samples': 7152960, 'steps': 37254, 'loss/train': 1.5587509870529175} -11/07/2021 02:28:35 - INFO - __main__ - Step 37256: {'lr': 0.0004332019383739722, 'samples': 7153152, 'steps': 37255, 'loss/train': 1.4879378080368042} -11/07/2021 02:28:35 - INFO - __main__ - Step 37257: {'lr': 0.000433198327434181, 'samples': 7153344, 'steps': 37256, 'loss/train': 1.7939229011535645} -11/07/2021 02:28:36 - INFO - __main__ - Step 37258: {'lr': 0.0004331947164118434, 'samples': 7153536, 'steps': 37257, 'loss/train': 1.3613734245300293} -11/07/2021 02:28:37 - INFO - __main__ - Step 37259: {'lr': 0.00043319110530696116, 'samples': 7153728, 'steps': 37258, 'loss/train': 1.498550534248352} -11/07/2021 02:28:37 - INFO - __main__ - Step 37260: {'lr': 0.00043318749411953584, 'samples': 7153920, 'steps': 37259, 'loss/train': 1.7559316158294678} -11/07/2021 02:28:37 - INFO - __main__ - Step 37261: {'lr': 0.000433183882849569, 'samples': 7154112, 'steps': 37260, 'loss/train': 1.7043496370315552} -11/07/2021 02:28:38 - INFO - __main__ - Step 37262: {'lr': 0.0004331802714970624, 'samples': 7154304, 'steps': 37261, 'loss/train': 1.487119197845459} -11/07/2021 02:28:38 - INFO - __main__ - Step 37263: {'lr': 0.0004331766600620175, 'samples': 7154496, 'steps': 37262, 'loss/train': 1.4115322828292847} -11/07/2021 02:28:39 - INFO - __main__ - Step 37264: {'lr': 0.00043317304854443607, 'samples': 7154688, 'steps': 37263, 'loss/train': 1.5334402322769165} -11/07/2021 02:28:40 - INFO - __main__ - Step 37265: {'lr': 0.0004331694369443197, 'samples': 7154880, 'steps': 37264, 'loss/train': 1.5968416929244995} -11/07/2021 02:28:40 - INFO - __main__ - Step 37266: {'lr': 0.00043316582526167004, 'samples': 7155072, 'steps': 37265, 'loss/train': 1.634678602218628} -11/07/2021 02:28:40 - INFO - __main__ - Step 37267: {'lr': 0.0004331622134964887, 'samples': 7155264, 'steps': 37266, 'loss/train': 1.4934666156768799} -11/07/2021 02:28:41 - INFO - __main__ - Step 37268: {'lr': 0.0004331586016487772, 'samples': 7155456, 'steps': 37267, 'loss/train': 1.3731762170791626} -11/07/2021 02:28:42 - INFO - __main__ - Step 37269: {'lr': 0.00043315498971853726, 'samples': 7155648, 'steps': 37268, 'loss/train': 1.780970573425293} -11/07/2021 02:28:42 - INFO - __main__ - Step 37270: {'lr': 0.0004331513777057706, 'samples': 7155840, 'steps': 37269, 'loss/train': 1.3365075588226318} -11/07/2021 02:28:42 - INFO - __main__ - Step 37271: {'lr': 0.00043314776561047865, 'samples': 7156032, 'steps': 37270, 'loss/train': 1.6340923309326172} -11/07/2021 02:28:43 - INFO - __main__ - Step 37272: {'lr': 0.0004331441534326632, 'samples': 7156224, 'steps': 37271, 'loss/train': 1.6194738149642944} -11/07/2021 02:28:43 - INFO - __main__ - Step 37273: {'lr': 0.0004331405411723258, 'samples': 7156416, 'steps': 37272, 'loss/train': 1.3026750087738037} -11/07/2021 02:28:44 - INFO - __main__ - Step 37274: {'lr': 0.0004331369288294681, 'samples': 7156608, 'steps': 37273, 'loss/train': 1.0709071159362793} -11/07/2021 02:28:44 - INFO - __main__ - Step 37275: {'lr': 0.0004331333164040918, 'samples': 7156800, 'steps': 37274, 'loss/train': 1.5334340333938599} -11/07/2021 02:28:45 - INFO - __main__ - Step 37276: {'lr': 0.0004331297038961984, 'samples': 7156992, 'steps': 37275, 'loss/train': 1.5693700313568115} -11/07/2021 02:28:45 - INFO - __main__ - Step 37277: {'lr': 0.00043312609130578963, 'samples': 7157184, 'steps': 37276, 'loss/train': 1.5914875268936157} -11/07/2021 02:28:45 - INFO - __main__ - Step 37278: {'lr': 0.000433122478632867, 'samples': 7157376, 'steps': 37277, 'loss/train': 0.8798840641975403} -11/07/2021 02:28:46 - INFO - __main__ - Step 37279: {'lr': 0.0004331188658774322, 'samples': 7157568, 'steps': 37278, 'loss/train': 1.3093528747558594} -11/07/2021 02:28:47 - INFO - __main__ - Step 37280: {'lr': 0.00043311525303948685, 'samples': 7157760, 'steps': 37279, 'loss/train': 1.349352478981018} -11/07/2021 02:28:47 - INFO - __main__ - Step 37281: {'lr': 0.0004331116401190327, 'samples': 7157952, 'steps': 37280, 'loss/train': 1.670189380645752} -11/07/2021 02:28:47 - INFO - __main__ - Step 37282: {'lr': 0.0004331080271160712, 'samples': 7158144, 'steps': 37281, 'loss/train': 1.5440136194229126} -11/07/2021 02:28:48 - INFO - __main__ - Step 37283: {'lr': 0.00043310441403060404, 'samples': 7158336, 'steps': 37282, 'loss/train': 1.0048491954803467} -11/07/2021 02:28:48 - INFO - __main__ - Step 37284: {'lr': 0.00043310080086263284, 'samples': 7158528, 'steps': 37283, 'loss/train': 0.912543535232544} -11/07/2021 02:28:49 - INFO - __main__ - Step 37285: {'lr': 0.0004330971876121593, 'samples': 7158720, 'steps': 37284, 'loss/train': 1.51612389087677} -11/07/2021 02:28:50 - INFO - __main__ - Step 37286: {'lr': 0.0004330935742791849, 'samples': 7158912, 'steps': 37285, 'loss/train': 1.4151886701583862} -11/07/2021 02:28:50 - INFO - __main__ - Step 37287: {'lr': 0.00043308996086371146, 'samples': 7159104, 'steps': 37286, 'loss/train': 0.7171698212623596} -11/07/2021 02:28:50 - INFO - __main__ - Step 37288: {'lr': 0.0004330863473657405, 'samples': 7159296, 'steps': 37287, 'loss/train': 1.3389252424240112} -11/07/2021 02:28:51 - INFO - __main__ - Step 37289: {'lr': 0.00043308273378527364, 'samples': 7159488, 'steps': 37288, 'loss/train': 1.61613929271698} -11/07/2021 02:28:52 - INFO - __main__ - Step 37290: {'lr': 0.00043307912012231255, 'samples': 7159680, 'steps': 37289, 'loss/train': 1.9408761262893677} -11/07/2021 02:28:52 - INFO - __main__ - Step 37291: {'lr': 0.0004330755063768588, 'samples': 7159872, 'steps': 37290, 'loss/train': 1.1934666633605957} -11/07/2021 02:28:52 - INFO - __main__ - Step 37292: {'lr': 0.000433071892548914, 'samples': 7160064, 'steps': 37291, 'loss/train': 1.5802807807922363} -11/07/2021 02:28:53 - INFO - __main__ - Step 37293: {'lr': 0.00043306827863847985, 'samples': 7160256, 'steps': 37292, 'loss/train': 1.3688923120498657} -11/07/2021 02:28:53 - INFO - __main__ - Step 37294: {'lr': 0.00043306466464555803, 'samples': 7160448, 'steps': 37293, 'loss/train': 1.7352780103683472} -11/07/2021 02:28:54 - INFO - __main__ - Step 37295: {'lr': 0.0004330610505701501, 'samples': 7160640, 'steps': 37294, 'loss/train': 1.8678953647613525} -11/07/2021 02:28:55 - INFO - __main__ - Step 37296: {'lr': 0.00043305743641225766, 'samples': 7160832, 'steps': 37295, 'loss/train': 1.132670283317566} -11/07/2021 02:28:55 - INFO - __main__ - Step 37297: {'lr': 0.00043305382217188225, 'samples': 7161024, 'steps': 37296, 'loss/train': 1.6592589616775513} -11/07/2021 02:28:55 - INFO - __main__ - Step 37298: {'lr': 0.0004330502078490258, 'samples': 7161216, 'steps': 37297, 'loss/train': 1.2880827188491821} -11/07/2021 02:28:56 - INFO - __main__ - Step 37299: {'lr': 0.0004330465934436896, 'samples': 7161408, 'steps': 37298, 'loss/train': 1.9087271690368652} -11/07/2021 02:28:56 - INFO - __main__ - Step 37300: {'lr': 0.00043304297895587553, 'samples': 7161600, 'steps': 37299, 'loss/train': 1.2395339012145996} -11/07/2021 02:28:57 - INFO - __main__ - Step 37301: {'lr': 0.0004330393643855851, 'samples': 7161792, 'steps': 37300, 'loss/train': 1.3079183101654053} -11/07/2021 02:28:57 - INFO - __main__ - Step 37302: {'lr': 0.0004330357497328199, 'samples': 7161984, 'steps': 37301, 'loss/train': 2.2721056938171387} -11/07/2021 02:28:58 - INFO - __main__ - Step 37303: {'lr': 0.00043303213499758166, 'samples': 7162176, 'steps': 37302, 'loss/train': 1.6880961656570435} -11/07/2021 02:28:58 - INFO - __main__ - Step 37304: {'lr': 0.00043302852017987196, 'samples': 7162368, 'steps': 37303, 'loss/train': 1.1895135641098022} -11/07/2021 02:28:58 - INFO - __main__ - Step 37305: {'lr': 0.0004330249052796924, 'samples': 7162560, 'steps': 37304, 'loss/train': 1.7214696407318115} -11/07/2021 02:28:59 - INFO - __main__ - Step 37306: {'lr': 0.0004330212902970447, 'samples': 7162752, 'steps': 37305, 'loss/train': 1.4084619283676147} -11/07/2021 02:29:00 - INFO - __main__ - Step 37307: {'lr': 0.0004330176752319304, 'samples': 7162944, 'steps': 37306, 'loss/train': 1.3558456897735596} -11/07/2021 02:29:00 - INFO - __main__ - Step 37308: {'lr': 0.0004330140600843512, 'samples': 7163136, 'steps': 37307, 'loss/train': 1.9286340475082397} -11/07/2021 02:29:00 - INFO - __main__ - Step 37309: {'lr': 0.0004330104448543086, 'samples': 7163328, 'steps': 37308, 'loss/train': 1.5556902885437012} -11/07/2021 02:29:01 - INFO - __main__ - Step 37310: {'lr': 0.0004330068295418044, 'samples': 7163520, 'steps': 37309, 'loss/train': 1.5030561685562134} -11/07/2021 02:29:02 - INFO - __main__ - Step 37311: {'lr': 0.0004330032141468401, 'samples': 7163712, 'steps': 37310, 'loss/train': 1.6441051959991455} -11/07/2021 02:29:02 - INFO - __main__ - Step 37312: {'lr': 0.0004329995986694174, 'samples': 7163904, 'steps': 37311, 'loss/train': 1.1074079275131226} -11/07/2021 02:29:02 - INFO - __main__ - Step 37313: {'lr': 0.00043299598310953793, 'samples': 7164096, 'steps': 37312, 'loss/train': 1.6179929971694946} -11/07/2021 02:29:03 - INFO - __main__ - Step 37314: {'lr': 0.0004329923674672032, 'samples': 7164288, 'steps': 37313, 'loss/train': 1.4974441528320312} -11/07/2021 02:29:03 - INFO - __main__ - Step 37315: {'lr': 0.00043298875174241504, 'samples': 7164480, 'steps': 37314, 'loss/train': 0.9005528092384338} -11/07/2021 02:29:04 - INFO - __main__ - Step 37316: {'lr': 0.00043298513593517483, 'samples': 7164672, 'steps': 37315, 'loss/train': 1.9145193099975586} -11/07/2021 02:29:04 - INFO - __main__ - Step 37317: {'lr': 0.0004329815200454845, 'samples': 7164864, 'steps': 37316, 'loss/train': 1.3091903924942017} -11/07/2021 02:29:05 - INFO - __main__ - Step 37318: {'lr': 0.00043297790407334545, 'samples': 7165056, 'steps': 37317, 'loss/train': 1.0597180128097534} -11/07/2021 02:29:05 - INFO - __main__ - Step 37319: {'lr': 0.0004329742880187594, 'samples': 7165248, 'steps': 37318, 'loss/train': 1.1523969173431396} -11/07/2021 02:29:06 - INFO - __main__ - Step 37320: {'lr': 0.0004329706718817279, 'samples': 7165440, 'steps': 37319, 'loss/train': 1.1664011478424072} -11/07/2021 02:29:07 - INFO - __main__ - Step 37321: {'lr': 0.00043296705566225267, 'samples': 7165632, 'steps': 37320, 'loss/train': 1.5477774143218994} -11/07/2021 02:29:07 - INFO - __main__ - Step 37322: {'lr': 0.00043296343936033535, 'samples': 7165824, 'steps': 37321, 'loss/train': 1.6472041606903076} -11/07/2021 02:29:07 - INFO - __main__ - Step 37323: {'lr': 0.0004329598229759775, 'samples': 7166016, 'steps': 37322, 'loss/train': 1.7595402002334595} -11/07/2021 02:29:08 - INFO - __main__ - Step 37324: {'lr': 0.00043295620650918076, 'samples': 7166208, 'steps': 37323, 'loss/train': 1.29658043384552} -11/07/2021 02:29:08 - INFO - __main__ - Step 37325: {'lr': 0.0004329525899599468, 'samples': 7166400, 'steps': 37324, 'loss/train': 1.2506625652313232} -11/07/2021 02:29:09 - INFO - __main__ - Step 37326: {'lr': 0.0004329489733282772, 'samples': 7166592, 'steps': 37325, 'loss/train': 1.4976551532745361} -11/07/2021 02:29:09 - INFO - __main__ - Step 37327: {'lr': 0.0004329453566141737, 'samples': 7166784, 'steps': 37326, 'loss/train': 1.637865424156189} -11/07/2021 02:29:10 - INFO - __main__ - Step 37328: {'lr': 0.00043294173981763776, 'samples': 7166976, 'steps': 37327, 'loss/train': 0.9973399639129639} -11/07/2021 02:29:10 - INFO - __main__ - Step 37329: {'lr': 0.00043293812293867113, 'samples': 7167168, 'steps': 37328, 'loss/train': 0.9981698393821716} -11/07/2021 02:29:10 - INFO - __main__ - Step 37330: {'lr': 0.0004329345059772754, 'samples': 7167360, 'steps': 37329, 'loss/train': 1.8823930025100708} -11/07/2021 02:29:11 - INFO - __main__ - Step 37331: {'lr': 0.0004329308889334522, 'samples': 7167552, 'steps': 37330, 'loss/train': 1.1413021087646484} -11/07/2021 02:29:12 - INFO - __main__ - Step 37332: {'lr': 0.00043292727180720315, 'samples': 7167744, 'steps': 37331, 'loss/train': 1.2384685277938843} -11/07/2021 02:29:12 - INFO - __main__ - Step 37333: {'lr': 0.0004329236545985299, 'samples': 7167936, 'steps': 37332, 'loss/train': 1.3601319789886475} -11/07/2021 02:29:12 - INFO - __main__ - Step 37334: {'lr': 0.000432920037307434, 'samples': 7168128, 'steps': 37333, 'loss/train': 1.5531187057495117} -11/07/2021 02:29:13 - INFO - __main__ - Step 37335: {'lr': 0.00043291641993391727, 'samples': 7168320, 'steps': 37334, 'loss/train': 1.5530239343643188} -11/07/2021 02:29:13 - INFO - __main__ - Step 37336: {'lr': 0.0004329128024779812, 'samples': 7168512, 'steps': 37335, 'loss/train': 1.7532144784927368} -11/07/2021 02:29:14 - INFO - __main__ - Step 37337: {'lr': 0.0004329091849396274, 'samples': 7168704, 'steps': 37336, 'loss/train': 1.3057897090911865} -11/07/2021 02:29:15 - INFO - __main__ - Step 37338: {'lr': 0.00043290556731885756, 'samples': 7168896, 'steps': 37337, 'loss/train': 2.0908994674682617} -11/07/2021 02:29:15 - INFO - __main__ - Step 37339: {'lr': 0.0004329019496156733, 'samples': 7169088, 'steps': 37338, 'loss/train': 1.0564286708831787} -11/07/2021 02:29:15 - INFO - __main__ - Step 37340: {'lr': 0.0004328983318300763, 'samples': 7169280, 'steps': 37339, 'loss/train': 1.6685435771942139} -11/07/2021 02:29:16 - INFO - __main__ - Step 37341: {'lr': 0.00043289471396206803, 'samples': 7169472, 'steps': 37340, 'loss/train': 1.920317530632019} -11/07/2021 02:29:17 - INFO - __main__ - Step 37342: {'lr': 0.0004328910960116503, 'samples': 7169664, 'steps': 37341, 'loss/train': 1.225765347480774} -11/07/2021 02:29:17 - INFO - __main__ - Step 37343: {'lr': 0.00043288747797882467, 'samples': 7169856, 'steps': 37342, 'loss/train': 1.519812822341919} -11/07/2021 02:29:17 - INFO - __main__ - Step 37344: {'lr': 0.00043288385986359266, 'samples': 7170048, 'steps': 37343, 'loss/train': 1.6947556734085083} -11/07/2021 02:29:18 - INFO - __main__ - Step 37345: {'lr': 0.00043288024166595614, 'samples': 7170240, 'steps': 37344, 'loss/train': 1.7099330425262451} -11/07/2021 02:29:18 - INFO - __main__ - Step 37346: {'lr': 0.00043287662338591657, 'samples': 7170432, 'steps': 37345, 'loss/train': 1.2091368436813354} -11/07/2021 02:29:19 - INFO - __main__ - Step 37347: {'lr': 0.0004328730050234756, 'samples': 7170624, 'steps': 37346, 'loss/train': 1.602807641029358} -11/07/2021 02:29:20 - INFO - __main__ - Step 37348: {'lr': 0.00043286938657863483, 'samples': 7170816, 'steps': 37347, 'loss/train': 1.6188071966171265} -11/07/2021 02:29:20 - INFO - __main__ - Step 37349: {'lr': 0.00043286576805139597, 'samples': 7171008, 'steps': 37348, 'loss/train': 1.606528639793396} -11/07/2021 02:29:20 - INFO - __main__ - Step 37350: {'lr': 0.0004328621494417606, 'samples': 7171200, 'steps': 37349, 'loss/train': 1.2447718381881714} -11/07/2021 02:29:21 - INFO - __main__ - Step 37351: {'lr': 0.0004328585307497304, 'samples': 7171392, 'steps': 37350, 'loss/train': 0.8961560726165771} -11/07/2021 02:29:21 - INFO - __main__ - Step 37352: {'lr': 0.00043285491197530694, 'samples': 7171584, 'steps': 37351, 'loss/train': 0.8640336394309998} -11/07/2021 02:29:22 - INFO - __main__ - Step 37353: {'lr': 0.00043285129311849193, 'samples': 7171776, 'steps': 37352, 'loss/train': 1.5787489414215088} -11/07/2021 02:29:22 - INFO - __main__ - Step 37354: {'lr': 0.0004328476741792869, 'samples': 7171968, 'steps': 37353, 'loss/train': 0.7472124695777893} -11/07/2021 02:29:23 - INFO - __main__ - Step 37355: {'lr': 0.00043284405515769356, 'samples': 7172160, 'steps': 37354, 'loss/train': 1.5969117879867554} -11/07/2021 02:29:23 - INFO - __main__ - Step 37356: {'lr': 0.00043284043605371346, 'samples': 7172352, 'steps': 37355, 'loss/train': 1.0829873085021973} -11/07/2021 02:29:23 - INFO - __main__ - Step 37357: {'lr': 0.0004328368168673483, 'samples': 7172544, 'steps': 37356, 'loss/train': 1.5583910942077637} -11/07/2021 02:29:24 - INFO - __main__ - Step 37358: {'lr': 0.00043283319759859974, 'samples': 7172736, 'steps': 37357, 'loss/train': 1.3432074785232544} -11/07/2021 02:29:25 - INFO - __main__ - Step 37359: {'lr': 0.0004328295782474693, 'samples': 7172928, 'steps': 37358, 'loss/train': 1.6358716487884521} -11/07/2021 02:29:25 - INFO - __main__ - Step 37360: {'lr': 0.0004328259588139587, 'samples': 7173120, 'steps': 37359, 'loss/train': 1.6624610424041748} -11/07/2021 02:29:25 - INFO - __main__ - Step 37361: {'lr': 0.0004328223392980696, 'samples': 7173312, 'steps': 37360, 'loss/train': 1.577709436416626} -11/07/2021 02:29:26 - INFO - __main__ - Step 37362: {'lr': 0.00043281871969980346, 'samples': 7173504, 'steps': 37361, 'loss/train': 1.5553466081619263} -11/07/2021 02:29:27 - INFO - __main__ - Step 37363: {'lr': 0.00043281510001916214, 'samples': 7173696, 'steps': 37362, 'loss/train': 1.6953697204589844} -11/07/2021 02:29:27 - INFO - __main__ - Step 37364: {'lr': 0.0004328114802561471, 'samples': 7173888, 'steps': 37363, 'loss/train': 1.4359856843948364} -11/07/2021 02:29:28 - INFO - __main__ - Step 37365: {'lr': 0.00043280786041076006, 'samples': 7174080, 'steps': 37364, 'loss/train': 0.9891050457954407} -11/07/2021 02:29:28 - INFO - __main__ - Step 37366: {'lr': 0.0004328042404830026, 'samples': 7174272, 'steps': 37365, 'loss/train': 1.09203040599823} -11/07/2021 02:29:28 - INFO - __main__ - Step 37367: {'lr': 0.0004328006204728763, 'samples': 7174464, 'steps': 37366, 'loss/train': 1.4810203313827515} -11/07/2021 02:29:29 - INFO - __main__ - Step 37368: {'lr': 0.00043279700038038296, 'samples': 7174656, 'steps': 37367, 'loss/train': 0.7582082748413086} -11/07/2021 02:29:30 - INFO - __main__ - Step 37369: {'lr': 0.0004327933802055241, 'samples': 7174848, 'steps': 37368, 'loss/train': 1.428175449371338} -11/07/2021 02:29:30 - INFO - __main__ - Step 37370: {'lr': 0.0004327897599483013, 'samples': 7175040, 'steps': 37369, 'loss/train': 1.807591438293457} -11/07/2021 02:29:30 - INFO - __main__ - Step 37371: {'lr': 0.00043278613960871624, 'samples': 7175232, 'steps': 37370, 'loss/train': 0.9312697649002075} -11/07/2021 02:29:31 - INFO - __main__ - Step 37372: {'lr': 0.00043278251918677066, 'samples': 7175424, 'steps': 37371, 'loss/train': 1.7605900764465332} -11/07/2021 02:29:32 - INFO - __main__ - Step 37373: {'lr': 0.00043277889868246605, 'samples': 7175616, 'steps': 37372, 'loss/train': 1.78399658203125} -11/07/2021 02:29:32 - INFO - __main__ - Step 37374: {'lr': 0.0004327752780958041, 'samples': 7175808, 'steps': 37373, 'loss/train': 1.1700432300567627} -11/07/2021 02:29:32 - INFO - __main__ - Step 37375: {'lr': 0.0004327716574267864, 'samples': 7176000, 'steps': 37374, 'loss/train': 1.495086908340454} -11/07/2021 02:29:33 - INFO - __main__ - Step 37376: {'lr': 0.00043276803667541465, 'samples': 7176192, 'steps': 37375, 'loss/train': 1.4538503885269165} -11/07/2021 02:29:33 - INFO - __main__ - Step 37377: {'lr': 0.0004327644158416905, 'samples': 7176384, 'steps': 37376, 'loss/train': 1.8409719467163086} -11/07/2021 02:29:34 - INFO - __main__ - Step 37378: {'lr': 0.0004327607949256154, 'samples': 7176576, 'steps': 37377, 'loss/train': 1.5816887617111206} -11/07/2021 02:29:35 - INFO - __main__ - Step 37379: {'lr': 0.00043275717392719115, 'samples': 7176768, 'steps': 37378, 'loss/train': 1.695273995399475} -11/07/2021 02:29:35 - INFO - __main__ - Step 37380: {'lr': 0.0004327535528464194, 'samples': 7176960, 'steps': 37379, 'loss/train': 1.7499052286148071} -11/07/2021 02:29:35 - INFO - __main__ - Step 37381: {'lr': 0.0004327499316833016, 'samples': 7177152, 'steps': 37380, 'loss/train': 1.8813824653625488} -11/07/2021 02:29:36 - INFO - __main__ - Step 37382: {'lr': 0.0004327463104378395, 'samples': 7177344, 'steps': 37381, 'loss/train': 1.160994291305542} -11/07/2021 02:29:36 - INFO - __main__ - Step 37383: {'lr': 0.0004327426891100349, 'samples': 7177536, 'steps': 37382, 'loss/train': 1.6030007600784302} -11/07/2021 02:29:37 - INFO - __main__ - Step 37384: {'lr': 0.0004327390676998891, 'samples': 7177728, 'steps': 37383, 'loss/train': 1.600156307220459} -11/07/2021 02:29:37 - INFO - __main__ - Step 37385: {'lr': 0.000432735446207404, 'samples': 7177920, 'steps': 37384, 'loss/train': 1.6125463247299194} -11/07/2021 02:29:38 - INFO - __main__ - Step 37386: {'lr': 0.0004327318246325811, 'samples': 7178112, 'steps': 37385, 'loss/train': 1.6646647453308105} -11/07/2021 02:29:38 - INFO - __main__ - Step 37387: {'lr': 0.000432728202975422, 'samples': 7178304, 'steps': 37386, 'loss/train': 1.385424256324768} -11/07/2021 02:29:38 - INFO - __main__ - Step 37388: {'lr': 0.0004327245812359285, 'samples': 7178496, 'steps': 37387, 'loss/train': 1.5408601760864258} -11/07/2021 02:29:39 - INFO - __main__ - Step 37389: {'lr': 0.000432720959414102, 'samples': 7178688, 'steps': 37388, 'loss/train': 1.6477293968200684} -11/07/2021 02:29:40 - INFO - __main__ - Step 37390: {'lr': 0.00043271733750994436, 'samples': 7178880, 'steps': 37389, 'loss/train': 1.4274452924728394} -11/07/2021 02:29:40 - INFO - __main__ - Step 37391: {'lr': 0.00043271371552345704, 'samples': 7179072, 'steps': 37390, 'loss/train': 1.5618799924850464} -11/07/2021 02:29:41 - INFO - __main__ - Step 37392: {'lr': 0.00043271009345464175, 'samples': 7179264, 'steps': 37391, 'loss/train': 1.3555269241333008} -11/07/2021 02:29:41 - INFO - __main__ - Step 37393: {'lr': 0.0004327064713035002, 'samples': 7179456, 'steps': 37392, 'loss/train': 1.3795374631881714} -11/07/2021 02:29:42 - INFO - __main__ - Step 37394: {'lr': 0.00043270284907003377, 'samples': 7179648, 'steps': 37393, 'loss/train': 0.3336257338523865} -11/07/2021 02:29:42 - INFO - __main__ - Step 37395: {'lr': 0.0004326992267542443, 'samples': 7179840, 'steps': 37394, 'loss/train': 1.483880639076233} -11/07/2021 02:29:43 - INFO - __main__ - Step 37396: {'lr': 0.0004326956043561335, 'samples': 7180032, 'steps': 37395, 'loss/train': 1.0873039960861206} -11/07/2021 02:29:43 - INFO - __main__ - Step 37397: {'lr': 0.0004326919818757028, 'samples': 7180224, 'steps': 37396, 'loss/train': 0.8401727676391602} -11/07/2021 02:29:43 - INFO - __main__ - Step 37398: {'lr': 0.00043268835931295393, 'samples': 7180416, 'steps': 37397, 'loss/train': 1.5042715072631836} -11/07/2021 02:29:44 - INFO - __main__ - Step 37399: {'lr': 0.00043268473666788844, 'samples': 7180608, 'steps': 37398, 'loss/train': 0.5492748618125916} -11/07/2021 02:29:45 - INFO - __main__ - Step 37400: {'lr': 0.0004326811139405081, 'samples': 7180800, 'steps': 37399, 'loss/train': 1.7564066648483276} -11/07/2021 02:29:45 - INFO - __main__ - Step 37401: {'lr': 0.0004326774911308145, 'samples': 7180992, 'steps': 37400, 'loss/train': 1.5959196090698242} -11/07/2021 02:29:45 - INFO - __main__ - Step 37402: {'lr': 0.00043267386823880904, 'samples': 7181184, 'steps': 37401, 'loss/train': 1.6912891864776611} -11/07/2021 02:29:46 - INFO - __main__ - Step 37403: {'lr': 0.00043267024526449374, 'samples': 7181376, 'steps': 37402, 'loss/train': 1.5138664245605469} -11/07/2021 02:29:46 - INFO - __main__ - Step 37404: {'lr': 0.00043266662220787003, 'samples': 7181568, 'steps': 37403, 'loss/train': 1.2460224628448486} -11/07/2021 02:29:47 - INFO - __main__ - Step 37405: {'lr': 0.0004326629990689395, 'samples': 7181760, 'steps': 37404, 'loss/train': 1.3983253240585327} -11/07/2021 02:29:48 - INFO - __main__ - Step 37406: {'lr': 0.0004326593758477039, 'samples': 7181952, 'steps': 37405, 'loss/train': 1.5294811725616455} -11/07/2021 02:29:48 - INFO - __main__ - Step 37407: {'lr': 0.0004326557525441648, 'samples': 7182144, 'steps': 37406, 'loss/train': 1.2356144189834595} -11/07/2021 02:29:48 - INFO - __main__ - Step 37408: {'lr': 0.00043265212915832374, 'samples': 7182336, 'steps': 37407, 'loss/train': 2.397145986557007} -11/07/2021 02:29:49 - INFO - __main__ - Step 37409: {'lr': 0.00043264850569018254, 'samples': 7182528, 'steps': 37408, 'loss/train': 1.4570412635803223} -11/07/2021 02:29:50 - INFO - __main__ - Step 37410: {'lr': 0.00043264488213974275, 'samples': 7182720, 'steps': 37409, 'loss/train': 1.3757929801940918} -11/07/2021 02:29:50 - INFO - __main__ - Step 37411: {'lr': 0.000432641258507006, 'samples': 7182912, 'steps': 37410, 'loss/train': 1.6848138570785522} -11/07/2021 02:29:51 - INFO - __main__ - Step 37412: {'lr': 0.0004326376347919738, 'samples': 7183104, 'steps': 37411, 'loss/train': 1.6494650840759277} -11/07/2021 02:29:51 - INFO - __main__ - Step 37413: {'lr': 0.00043263401099464805, 'samples': 7183296, 'steps': 37412, 'loss/train': 3.1627933979034424} -11/07/2021 02:29:52 - INFO - __main__ - Step 37414: {'lr': 0.00043263038711503017, 'samples': 7183488, 'steps': 37413, 'loss/train': 1.6756221055984497} -11/07/2021 02:29:52 - INFO - __main__ - Step 37415: {'lr': 0.00043262676315312183, 'samples': 7183680, 'steps': 37414, 'loss/train': 1.3630532026290894} -11/07/2021 02:29:53 - INFO - __main__ - Step 37416: {'lr': 0.0004326231391089247, 'samples': 7183872, 'steps': 37415, 'loss/train': 1.6684272289276123} -11/07/2021 02:29:53 - INFO - __main__ - Step 37417: {'lr': 0.00043261951498244045, 'samples': 7184064, 'steps': 37416, 'loss/train': 1.718359112739563} -11/07/2021 02:29:54 - INFO - __main__ - Step 37418: {'lr': 0.0004326158907736706, 'samples': 7184256, 'steps': 37417, 'loss/train': 1.6083804368972778} -11/07/2021 02:29:54 - INFO - __main__ - Step 37419: {'lr': 0.00043261226648261687, 'samples': 7184448, 'steps': 37418, 'loss/train': 1.5865517854690552} -11/07/2021 02:29:54 - INFO - __main__ - Step 37420: {'lr': 0.0004326086421092809, 'samples': 7184640, 'steps': 37419, 'loss/train': 1.3192373514175415} -11/07/2021 02:29:55 - INFO - __main__ - Step 37421: {'lr': 0.00043260501765366425, 'samples': 7184832, 'steps': 37420, 'loss/train': 1.606441617012024} -11/07/2021 02:29:56 - INFO - __main__ - Step 37422: {'lr': 0.00043260139311576863, 'samples': 7185024, 'steps': 37421, 'loss/train': 2.185137987136841} -11/07/2021 02:29:56 - INFO - __main__ - Step 37423: {'lr': 0.0004325977684955956, 'samples': 7185216, 'steps': 37422, 'loss/train': 1.5154505968093872} -11/07/2021 02:29:56 - INFO - __main__ - Step 37424: {'lr': 0.0004325941437931469, 'samples': 7185408, 'steps': 37423, 'loss/train': 1.1395184993743896} -11/07/2021 02:29:57 - INFO - __main__ - Step 37425: {'lr': 0.0004325905190084241, 'samples': 7185600, 'steps': 37424, 'loss/train': 1.191431999206543} -11/07/2021 02:29:58 - INFO - __main__ - Step 37426: {'lr': 0.00043258689414142875, 'samples': 7185792, 'steps': 37425, 'loss/train': 1.3336917161941528} -11/07/2021 02:29:58 - INFO - __main__ - Step 37427: {'lr': 0.0004325832691921626, 'samples': 7185984, 'steps': 37426, 'loss/train': 1.6650985479354858} -11/07/2021 02:29:59 - INFO - __main__ - Step 37428: {'lr': 0.00043257964416062723, 'samples': 7186176, 'steps': 37427, 'loss/train': 1.8389983177185059} -11/07/2021 02:29:59 - INFO - __main__ - Step 37429: {'lr': 0.0004325760190468243, 'samples': 7186368, 'steps': 37428, 'loss/train': 1.5231657028198242} -11/07/2021 02:29:59 - INFO - __main__ - Step 37430: {'lr': 0.0004325723938507555, 'samples': 7186560, 'steps': 37429, 'loss/train': 1.52488112449646} -11/07/2021 02:30:00 - INFO - __main__ - Step 37431: {'lr': 0.0004325687685724223, 'samples': 7186752, 'steps': 37430, 'loss/train': 1.412951946258545} -11/07/2021 02:30:01 - INFO - __main__ - Step 37432: {'lr': 0.0004325651432118265, 'samples': 7186944, 'steps': 37431, 'loss/train': 1.3657993078231812} -11/07/2021 02:30:01 - INFO - __main__ - Step 37433: {'lr': 0.00043256151776896955, 'samples': 7187136, 'steps': 37432, 'loss/train': 2.3355555534362793} -11/07/2021 02:30:01 - INFO - __main__ - Step 37434: {'lr': 0.0004325578922438533, 'samples': 7187328, 'steps': 37433, 'loss/train': 1.6410709619522095} -11/07/2021 02:30:02 - INFO - __main__ - Step 37435: {'lr': 0.0004325542666364793, 'samples': 7187520, 'steps': 37434, 'loss/train': 1.3707133531570435} -11/07/2021 02:30:02 - INFO - __main__ - Step 37436: {'lr': 0.00043255064094684917, 'samples': 7187712, 'steps': 37435, 'loss/train': 1.3452285528182983} -11/07/2021 02:30:03 - INFO - __main__ - Step 37437: {'lr': 0.0004325470151749644, 'samples': 7187904, 'steps': 37436, 'loss/train': 1.5764644145965576} -11/07/2021 02:30:03 - INFO - __main__ - Step 37438: {'lr': 0.00043254338932082696, 'samples': 7188096, 'steps': 37437, 'loss/train': 1.3807365894317627} -11/07/2021 02:30:04 - INFO - __main__ - Step 37439: {'lr': 0.00043253976338443814, 'samples': 7188288, 'steps': 37438, 'loss/train': 0.7496334314346313} -11/07/2021 02:30:04 - INFO - __main__ - Step 37440: {'lr': 0.00043253613736579975, 'samples': 7188480, 'steps': 37439, 'loss/train': 1.6858636140823364} -11/07/2021 02:30:05 - INFO - __main__ - Step 37441: {'lr': 0.0004325325112649134, 'samples': 7188672, 'steps': 37440, 'loss/train': 1.2810533046722412} -11/07/2021 02:30:06 - INFO - __main__ - Step 37442: {'lr': 0.00043252888508178066, 'samples': 7188864, 'steps': 37441, 'loss/train': 1.7188156843185425} -11/07/2021 02:30:06 - INFO - __main__ - Step 37443: {'lr': 0.0004325252588164033, 'samples': 7189056, 'steps': 37442, 'loss/train': 1.2332797050476074} -11/07/2021 02:30:06 - INFO - __main__ - Step 37444: {'lr': 0.00043252163246878286, 'samples': 7189248, 'steps': 37443, 'loss/train': 1.7089459896087646} -11/07/2021 02:30:07 - INFO - __main__ - Step 37445: {'lr': 0.000432518006038921, 'samples': 7189440, 'steps': 37444, 'loss/train': 1.2559268474578857} -11/07/2021 02:30:07 - INFO - __main__ - Step 37446: {'lr': 0.00043251437952681926, 'samples': 7189632, 'steps': 37445, 'loss/train': 1.6364524364471436} -11/07/2021 02:30:08 - INFO - __main__ - Step 37447: {'lr': 0.0004325107529324795, 'samples': 7189824, 'steps': 37446, 'loss/train': 1.7149345874786377} -11/07/2021 02:30:08 - INFO - __main__ - Step 37448: {'lr': 0.0004325071262559031, 'samples': 7190016, 'steps': 37447, 'loss/train': 1.6025023460388184} -11/07/2021 02:30:09 - INFO - __main__ - Step 37449: {'lr': 0.00043250349949709184, 'samples': 7190208, 'steps': 37448, 'loss/train': 1.4580620527267456} -11/07/2021 02:30:09 - INFO - __main__ - Step 37450: {'lr': 0.0004324998726560473, 'samples': 7190400, 'steps': 37449, 'loss/train': 1.1127818822860718} -11/07/2021 02:30:09 - INFO - __main__ - Step 37451: {'lr': 0.0004324962457327712, 'samples': 7190592, 'steps': 37450, 'loss/train': 1.3189001083374023} -11/07/2021 02:30:10 - INFO - __main__ - Step 37452: {'lr': 0.00043249261872726504, 'samples': 7190784, 'steps': 37451, 'loss/train': 1.1091448068618774} -11/07/2021 02:30:11 - INFO - __main__ - Step 37453: {'lr': 0.0004324889916395305, 'samples': 7190976, 'steps': 37452, 'loss/train': 1.6013160943984985} -11/07/2021 02:30:11 - INFO - __main__ - Step 37454: {'lr': 0.0004324853644695693, 'samples': 7191168, 'steps': 37453, 'loss/train': 1.1790231466293335} -11/07/2021 02:30:11 - INFO - __main__ - Step 37455: {'lr': 0.000432481737217383, 'samples': 7191360, 'steps': 37454, 'loss/train': 1.5752537250518799} -11/07/2021 02:30:12 - INFO - __main__ - Step 37456: {'lr': 0.0004324781098829732, 'samples': 7191552, 'steps': 37455, 'loss/train': 1.2282586097717285} -11/07/2021 02:30:12 - INFO - __main__ - Step 37457: {'lr': 0.0004324744824663417, 'samples': 7191744, 'steps': 37456, 'loss/train': 1.5415738821029663} -11/07/2021 02:30:13 - INFO - __main__ - Step 37458: {'lr': 0.00043247085496748983, 'samples': 7191936, 'steps': 37457, 'loss/train': 0.7288332581520081} -11/07/2021 02:30:14 - INFO - __main__ - Step 37459: {'lr': 0.0004324672273864195, 'samples': 7192128, 'steps': 37458, 'loss/train': 1.6295570135116577} -11/07/2021 02:30:14 - INFO - __main__ - Step 37460: {'lr': 0.00043246359972313233, 'samples': 7192320, 'steps': 37459, 'loss/train': 1.5285189151763916} -11/07/2021 02:30:14 - INFO - __main__ - Step 37461: {'lr': 0.0004324599719776298, 'samples': 7192512, 'steps': 37460, 'loss/train': 1.4358800649642944} -11/07/2021 02:30:15 - INFO - __main__ - Step 37462: {'lr': 0.00043245634414991365, 'samples': 7192704, 'steps': 37461, 'loss/train': 1.258275032043457} -11/07/2021 02:30:16 - INFO - __main__ - Step 37463: {'lr': 0.0004324527162399854, 'samples': 7192896, 'steps': 37462, 'loss/train': 1.5770810842514038} -11/07/2021 02:30:16 - INFO - __main__ - Step 37464: {'lr': 0.0004324490882478469, 'samples': 7193088, 'steps': 37463, 'loss/train': 1.6385400295257568} -11/07/2021 02:30:16 - INFO - __main__ - Step 37465: {'lr': 0.0004324454601734995, 'samples': 7193280, 'steps': 37464, 'loss/train': 1.7759833335876465} -11/07/2021 02:30:17 - INFO - __main__ - Step 37466: {'lr': 0.0004324418320169451, 'samples': 7193472, 'steps': 37465, 'loss/train': 1.5825846195220947} -11/07/2021 02:30:17 - INFO - __main__ - Step 37467: {'lr': 0.00043243820377818524, 'samples': 7193664, 'steps': 37466, 'loss/train': 1.4279179573059082} -11/07/2021 02:30:19 - INFO - __main__ - Step 37468: {'lr': 0.0004324345754572215, 'samples': 7193856, 'steps': 37467, 'loss/train': 0.7902894616127014} -11/07/2021 02:30:19 - INFO - __main__ - Step 37469: {'lr': 0.00043243094705405554, 'samples': 7194048, 'steps': 37468, 'loss/train': 1.3145751953125} -11/07/2021 02:30:19 - INFO - __main__ - Step 37470: {'lr': 0.0004324273185686891, 'samples': 7194240, 'steps': 37469, 'loss/train': 0.8086821436882019} -11/07/2021 02:30:20 - INFO - __main__ - Step 37471: {'lr': 0.00043242369000112365, 'samples': 7194432, 'steps': 37470, 'loss/train': 1.961127519607544} -11/07/2021 02:30:20 - INFO - __main__ - Step 37472: {'lr': 0.00043242006135136093, 'samples': 7194624, 'steps': 37471, 'loss/train': 2.164335250854492} -11/07/2021 02:30:21 - INFO - __main__ - Step 37473: {'lr': 0.00043241643261940246, 'samples': 7194816, 'steps': 37472, 'loss/train': 2.507589340209961} -11/07/2021 02:30:21 - INFO - __main__ - Step 37474: {'lr': 0.00043241280380525003, 'samples': 7195008, 'steps': 37473, 'loss/train': 1.6702580451965332} -11/07/2021 02:30:22 - INFO - __main__ - Step 37475: {'lr': 0.0004324091749089052, 'samples': 7195200, 'steps': 37474, 'loss/train': 1.4887938499450684} -11/07/2021 02:30:22 - INFO - __main__ - Step 37476: {'lr': 0.0004324055459303696, 'samples': 7195392, 'steps': 37475, 'loss/train': 2.0435266494750977} -11/07/2021 02:30:23 - INFO - __main__ - Step 37477: {'lr': 0.00043240191686964494, 'samples': 7195584, 'steps': 37476, 'loss/train': 1.1949541568756104} -11/07/2021 02:30:23 - INFO - __main__ - Step 37478: {'lr': 0.00043239828772673276, 'samples': 7195776, 'steps': 37477, 'loss/train': 1.53923499584198} -11/07/2021 02:30:23 - INFO - __main__ - Step 37479: {'lr': 0.0004323946585016347, 'samples': 7195968, 'steps': 37478, 'loss/train': 1.6027249097824097} -11/07/2021 02:30:24 - INFO - __main__ - Step 37480: {'lr': 0.00043239102919435235, 'samples': 7196160, 'steps': 37479, 'loss/train': 2.0103933811187744} -11/07/2021 02:30:25 - INFO - __main__ - Step 37481: {'lr': 0.0004323873998048875, 'samples': 7196352, 'steps': 37480, 'loss/train': 1.2224072217941284} -11/07/2021 02:30:25 - INFO - __main__ - Step 37482: {'lr': 0.00043238377033324175, 'samples': 7196544, 'steps': 37481, 'loss/train': 1.319748044013977} -11/07/2021 02:30:25 - INFO - __main__ - Step 37483: {'lr': 0.00043238014077941656, 'samples': 7196736, 'steps': 37482, 'loss/train': 1.6039621829986572} -11/07/2021 02:30:26 - INFO - __main__ - Step 37484: {'lr': 0.00043237651114341383, 'samples': 7196928, 'steps': 37483, 'loss/train': 1.4563041925430298} -11/07/2021 02:30:27 - INFO - __main__ - Step 37485: {'lr': 0.00043237288142523503, 'samples': 7197120, 'steps': 37484, 'loss/train': 2.3065671920776367} -11/07/2021 02:30:27 - INFO - __main__ - Step 37486: {'lr': 0.00043236925162488173, 'samples': 7197312, 'steps': 37485, 'loss/train': 1.2834789752960205} -11/07/2021 02:30:27 - INFO - __main__ - Step 37487: {'lr': 0.0004323656217423557, 'samples': 7197504, 'steps': 37486, 'loss/train': 1.5869083404541016} -11/07/2021 02:30:28 - INFO - __main__ - Step 37488: {'lr': 0.00043236199177765856, 'samples': 7197696, 'steps': 37487, 'loss/train': 1.7081737518310547} -11/07/2021 02:30:28 - INFO - __main__ - Step 37489: {'lr': 0.0004323583617307919, 'samples': 7197888, 'steps': 37488, 'loss/train': 1.4253218173980713} -11/07/2021 02:30:29 - INFO - __main__ - Step 37490: {'lr': 0.00043235473160175745, 'samples': 7198080, 'steps': 37489, 'loss/train': 1.9894713163375854} -11/07/2021 02:30:29 - INFO - __main__ - Step 37491: {'lr': 0.0004323511013905567, 'samples': 7198272, 'steps': 37490, 'loss/train': 1.5830626487731934} -11/07/2021 02:30:30 - INFO - __main__ - Step 37492: {'lr': 0.0004323474710971913, 'samples': 7198464, 'steps': 37491, 'loss/train': 1.5441548824310303} -11/07/2021 02:30:30 - INFO - __main__ - Step 37493: {'lr': 0.0004323438407216631, 'samples': 7198656, 'steps': 37492, 'loss/train': 1.6030843257904053} -11/07/2021 02:30:30 - INFO - __main__ - Step 37494: {'lr': 0.0004323402102639734, 'samples': 7198848, 'steps': 37493, 'loss/train': 1.7096853256225586} -11/07/2021 02:30:32 - INFO - __main__ - Step 37495: {'lr': 0.00043233657972412414, 'samples': 7199040, 'steps': 37494, 'loss/train': 1.8373485803604126} -11/07/2021 02:30:32 - INFO - __main__ - Step 37496: {'lr': 0.00043233294910211684, 'samples': 7199232, 'steps': 37495, 'loss/train': 1.551588535308838} -11/07/2021 02:30:32 - INFO - __main__ - Step 37497: {'lr': 0.0004323293183979531, 'samples': 7199424, 'steps': 37496, 'loss/train': 1.4369267225265503} -11/07/2021 02:30:33 - INFO - __main__ - Step 37498: {'lr': 0.0004323256876116345, 'samples': 7199616, 'steps': 37497, 'loss/train': 1.0210753679275513} -11/07/2021 02:30:33 - INFO - __main__ - Step 37499: {'lr': 0.0004323220567431628, 'samples': 7199808, 'steps': 37498, 'loss/train': 1.9081380367279053} -11/07/2021 02:30:34 - INFO - __main__ - Step 37500: {'lr': 0.0004323184257925397, 'samples': 7200000, 'steps': 37499, 'loss/train': 1.5604526996612549} -11/07/2021 02:30:34 - INFO - __main__ - Step 37501: {'lr': 0.0004323147947597667, 'samples': 7200192, 'steps': 37500, 'loss/train': 1.0608760118484497} -11/07/2021 02:30:35 - INFO - __main__ - Step 37502: {'lr': 0.00043231116364484534, 'samples': 7200384, 'steps': 37501, 'loss/train': 1.4155505895614624} -11/07/2021 02:30:35 - INFO - __main__ - Step 37503: {'lr': 0.00043230753244777743, 'samples': 7200576, 'steps': 37502, 'loss/train': 1.5481852293014526} -11/07/2021 02:30:35 - INFO - __main__ - Step 37504: {'lr': 0.00043230390116856467, 'samples': 7200768, 'steps': 37503, 'loss/train': 0.5808529257774353} -11/07/2021 02:30:36 - INFO - __main__ - Step 37505: {'lr': 0.00043230026980720847, 'samples': 7200960, 'steps': 37504, 'loss/train': 1.8550664186477661} -11/07/2021 02:30:37 - INFO - __main__ - Step 37506: {'lr': 0.00043229663836371056, 'samples': 7201152, 'steps': 37505, 'loss/train': 1.284300684928894} -11/07/2021 02:30:37 - INFO - __main__ - Step 37507: {'lr': 0.0004322930068380727, 'samples': 7201344, 'steps': 37506, 'loss/train': 1.435318112373352} -11/07/2021 02:30:37 - INFO - __main__ - Step 37508: {'lr': 0.00043228937523029636, 'samples': 7201536, 'steps': 37507, 'loss/train': 1.5970197916030884} -11/07/2021 02:30:38 - INFO - __main__ - Step 37509: {'lr': 0.00043228574354038326, 'samples': 7201728, 'steps': 37508, 'loss/train': 1.5501351356506348} -11/07/2021 02:30:38 - INFO - __main__ - Step 37510: {'lr': 0.00043228211176833496, 'samples': 7201920, 'steps': 37509, 'loss/train': 1.5573985576629639} -11/07/2021 02:30:39 - INFO - __main__ - Step 37511: {'lr': 0.00043227847991415326, 'samples': 7202112, 'steps': 37510, 'loss/train': 0.7737532258033752} -11/07/2021 02:30:40 - INFO - __main__ - Step 37512: {'lr': 0.00043227484797783965, 'samples': 7202304, 'steps': 37511, 'loss/train': 1.446190595626831} -11/07/2021 02:30:40 - INFO - __main__ - Step 37513: {'lr': 0.0004322712159593958, 'samples': 7202496, 'steps': 37512, 'loss/train': 2.2026243209838867} -11/07/2021 02:30:40 - INFO - __main__ - Step 37514: {'lr': 0.0004322675838588234, 'samples': 7202688, 'steps': 37513, 'loss/train': 1.200168490409851} -11/07/2021 02:30:41 - INFO - __main__ - Step 37515: {'lr': 0.0004322639516761239, 'samples': 7202880, 'steps': 37514, 'loss/train': 1.6389999389648438} -11/07/2021 02:30:42 - INFO - __main__ - Step 37516: {'lr': 0.0004322603194112992, 'samples': 7203072, 'steps': 37515, 'loss/train': 1.6824238300323486} -11/07/2021 02:30:42 - INFO - __main__ - Step 37517: {'lr': 0.00043225668706435073, 'samples': 7203264, 'steps': 37516, 'loss/train': 1.6325851678848267} -11/07/2021 02:30:42 - INFO - __main__ - Step 37518: {'lr': 0.0004322530546352803, 'samples': 7203456, 'steps': 37517, 'loss/train': 1.74091374874115} -11/07/2021 02:30:43 - INFO - __main__ - Step 37519: {'lr': 0.0004322494221240894, 'samples': 7203648, 'steps': 37518, 'loss/train': 1.3719381093978882} -11/07/2021 02:30:43 - INFO - __main__ - Step 37520: {'lr': 0.0004322457895307797, 'samples': 7203840, 'steps': 37519, 'loss/train': 2.352436065673828} -11/07/2021 02:30:44 - INFO - __main__ - Step 37521: {'lr': 0.00043224215685535287, 'samples': 7204032, 'steps': 37520, 'loss/train': 2.0461223125457764} -11/07/2021 02:30:44 - INFO - __main__ - Step 37522: {'lr': 0.0004322385240978106, 'samples': 7204224, 'steps': 37521, 'loss/train': 1.1710293292999268} -11/07/2021 02:30:45 - INFO - __main__ - Step 37523: {'lr': 0.0004322348912581544, 'samples': 7204416, 'steps': 37522, 'loss/train': 1.662919044494629} -11/07/2021 02:30:45 - INFO - __main__ - Step 37524: {'lr': 0.000432231258336386, 'samples': 7204608, 'steps': 37523, 'loss/train': 1.4173078536987305} -11/07/2021 02:30:46 - INFO - __main__ - Step 37525: {'lr': 0.000432227625332507, 'samples': 7204800, 'steps': 37524, 'loss/train': 0.7475195527076721} -11/07/2021 02:30:47 - INFO - __main__ - Step 37526: {'lr': 0.000432223992246519, 'samples': 7204992, 'steps': 37525, 'loss/train': 1.65089750289917} -11/07/2021 02:30:47 - INFO - __main__ - Step 37527: {'lr': 0.0004322203590784237, 'samples': 7205184, 'steps': 37526, 'loss/train': 1.536938190460205} -11/07/2021 02:30:47 - INFO - __main__ - Step 37528: {'lr': 0.0004322167258282228, 'samples': 7205376, 'steps': 37527, 'loss/train': 1.5707414150238037} -11/07/2021 02:30:48 - INFO - __main__ - Step 37529: {'lr': 0.0004322130924959178, 'samples': 7205568, 'steps': 37528, 'loss/train': 1.5095049142837524} -11/07/2021 02:30:48 - INFO - __main__ - Step 37530: {'lr': 0.0004322094590815104, 'samples': 7205760, 'steps': 37529, 'loss/train': 1.9747005701065063} -11/07/2021 02:30:50 - INFO - __main__ - Step 37531: {'lr': 0.00043220582558500223, 'samples': 7205952, 'steps': 37530, 'loss/train': 1.743624210357666} -11/07/2021 02:30:50 - INFO - __main__ - Step 37532: {'lr': 0.00043220219200639485, 'samples': 7206144, 'steps': 37531, 'loss/train': 1.7449406385421753} -11/07/2021 02:30:50 - INFO - __main__ - Step 37533: {'lr': 0.00043219855834569006, 'samples': 7206336, 'steps': 37532, 'loss/train': 2.2813148498535156} -11/07/2021 02:30:51 - INFO - __main__ - Step 37534: {'lr': 0.00043219492460288937, 'samples': 7206528, 'steps': 37533, 'loss/train': 1.6646699905395508} -11/07/2021 02:30:51 - INFO - __main__ - Step 37535: {'lr': 0.00043219129077799447, 'samples': 7206720, 'steps': 37534, 'loss/train': 1.7239679098129272} -11/07/2021 02:30:51 - INFO - __main__ - Step 37536: {'lr': 0.000432187656871007, 'samples': 7206912, 'steps': 37535, 'loss/train': 1.7892603874206543} -11/07/2021 02:30:52 - INFO - __main__ - Step 37537: {'lr': 0.0004321840228819286, 'samples': 7207104, 'steps': 37536, 'loss/train': 1.0783336162567139} -11/07/2021 02:30:53 - INFO - __main__ - Step 37538: {'lr': 0.0004321803888107608, 'samples': 7207296, 'steps': 37537, 'loss/train': 0.732699990272522} -11/07/2021 02:30:53 - INFO - __main__ - Step 37539: {'lr': 0.0004321767546575054, 'samples': 7207488, 'steps': 37538, 'loss/train': 1.7513829469680786} -11/07/2021 02:30:54 - INFO - __main__ - Step 37540: {'lr': 0.000432173120422164, 'samples': 7207680, 'steps': 37539, 'loss/train': 10.400634765625} -11/07/2021 02:30:54 - INFO - __main__ - Step 37541: {'lr': 0.00043216948610473816, 'samples': 7207872, 'steps': 37540, 'loss/train': 1.5212979316711426} -11/07/2021 02:30:54 - INFO - __main__ - Step 37542: {'lr': 0.0004321658517052296, 'samples': 7208064, 'steps': 37541, 'loss/train': 1.4999489784240723} -11/07/2021 02:30:55 - INFO - __main__ - Step 37543: {'lr': 0.00043216221722363983, 'samples': 7208256, 'steps': 37542, 'loss/train': 1.7804269790649414} -11/07/2021 02:30:56 - INFO - __main__ - Step 37544: {'lr': 0.00043215858265997065, 'samples': 7208448, 'steps': 37543, 'loss/train': 1.8416721820831299} -11/07/2021 02:30:56 - INFO - __main__ - Step 37545: {'lr': 0.0004321549480142236, 'samples': 7208640, 'steps': 37544, 'loss/train': 1.489058017730713} -11/07/2021 02:30:56 - INFO - __main__ - Step 37546: {'lr': 0.0004321513132864003, 'samples': 7208832, 'steps': 37545, 'loss/train': 1.4994314908981323} -11/07/2021 02:30:57 - INFO - __main__ - Step 37547: {'lr': 0.0004321476784765025, 'samples': 7209024, 'steps': 37546, 'loss/train': 1.3192144632339478} -11/07/2021 02:30:57 - INFO - __main__ - Step 37548: {'lr': 0.00043214404358453174, 'samples': 7209216, 'steps': 37547, 'loss/train': 1.5115631818771362} -11/07/2021 02:30:58 - INFO - __main__ - Step 37549: {'lr': 0.0004321404086104897, 'samples': 7209408, 'steps': 37548, 'loss/train': 0.9762508869171143} -11/07/2021 02:30:58 - INFO - __main__ - Step 37550: {'lr': 0.00043213677355437795, 'samples': 7209600, 'steps': 37549, 'loss/train': 1.087836742401123} -11/07/2021 02:30:59 - INFO - __main__ - Step 37551: {'lr': 0.0004321331384161983, 'samples': 7209792, 'steps': 37550, 'loss/train': 1.6014374494552612} -11/07/2021 02:30:59 - INFO - __main__ - Step 37552: {'lr': 0.00043212950319595215, 'samples': 7209984, 'steps': 37551, 'loss/train': 1.8291975259780884} -11/07/2021 02:30:59 - INFO - __main__ - Step 37553: {'lr': 0.0004321258678936413, 'samples': 7210176, 'steps': 37552, 'loss/train': 1.8783771991729736} -11/07/2021 02:31:01 - INFO - __main__ - Step 37554: {'lr': 0.00043212223250926727, 'samples': 7210368, 'steps': 37553, 'loss/train': 1.5376328229904175} -11/07/2021 02:31:01 - INFO - __main__ - Step 37555: {'lr': 0.00043211859704283184, 'samples': 7210560, 'steps': 37554, 'loss/train': 1.462335228919983} -11/07/2021 02:31:01 - INFO - __main__ - Step 37556: {'lr': 0.0004321149614943366, 'samples': 7210752, 'steps': 37555, 'loss/train': 1.7638007402420044} -11/07/2021 02:31:02 - INFO - __main__ - Step 37557: {'lr': 0.0004321113258637832, 'samples': 7210944, 'steps': 37556, 'loss/train': 1.3894625902175903} -11/07/2021 02:31:02 - INFO - __main__ - Step 37558: {'lr': 0.0004321076901511731, 'samples': 7211136, 'steps': 37557, 'loss/train': 1.167650818824768} -11/07/2021 02:31:03 - INFO - __main__ - Step 37559: {'lr': 0.0004321040543565082, 'samples': 7211328, 'steps': 37558, 'loss/train': 1.5407660007476807} -11/07/2021 02:31:03 - INFO - __main__ - Step 37560: {'lr': 0.00043210041847979003, 'samples': 7211520, 'steps': 37559, 'loss/train': 1.55744469165802} -11/07/2021 02:31:04 - INFO - __main__ - Step 37561: {'lr': 0.0004320967825210202, 'samples': 7211712, 'steps': 37560, 'loss/train': 1.7859392166137695} -11/07/2021 02:31:04 - INFO - __main__ - Step 37562: {'lr': 0.00043209314648020035, 'samples': 7211904, 'steps': 37561, 'loss/train': 1.5488879680633545} -11/07/2021 02:31:04 - INFO - __main__ - Step 37563: {'lr': 0.0004320895103573321, 'samples': 7212096, 'steps': 37562, 'loss/train': 2.0785441398620605} -11/07/2021 02:31:06 - INFO - __main__ - Step 37564: {'lr': 0.00043208587415241725, 'samples': 7212288, 'steps': 37563, 'loss/train': 2.692457675933838} -11/07/2021 02:31:06 - INFO - __main__ - Step 37565: {'lr': 0.00043208223786545723, 'samples': 7212480, 'steps': 37564, 'loss/train': 1.5505104064941406} -11/07/2021 02:31:06 - INFO - __main__ - Step 37566: {'lr': 0.0004320786014964538, 'samples': 7212672, 'steps': 37565, 'loss/train': 1.716882586479187} -11/07/2021 02:31:07 - INFO - __main__ - Step 37567: {'lr': 0.0004320749650454085, 'samples': 7212864, 'steps': 37566, 'loss/train': 1.477885127067566} -11/07/2021 02:31:07 - INFO - __main__ - Step 37568: {'lr': 0.0004320713285123231, 'samples': 7213056, 'steps': 37567, 'loss/train': 1.2575966119766235} -11/07/2021 02:31:07 - INFO - __main__ - Step 37569: {'lr': 0.0004320676918971991, 'samples': 7213248, 'steps': 37568, 'loss/train': 0.40955543518066406} -11/07/2021 02:31:08 - INFO - __main__ - Step 37570: {'lr': 0.00043206405520003824, 'samples': 7213440, 'steps': 37569, 'loss/train': 1.5961387157440186} -11/07/2021 02:31:09 - INFO - __main__ - Step 37571: {'lr': 0.00043206041842084214, 'samples': 7213632, 'steps': 37570, 'loss/train': 1.733590006828308} -11/07/2021 02:31:09 - INFO - __main__ - Step 37572: {'lr': 0.00043205678155961244, 'samples': 7213824, 'steps': 37571, 'loss/train': 1.8249460458755493} -11/07/2021 02:31:09 - INFO - __main__ - Step 37573: {'lr': 0.0004320531446163507, 'samples': 7214016, 'steps': 37572, 'loss/train': 1.5001862049102783} -11/07/2021 02:31:10 - INFO - __main__ - Step 37574: {'lr': 0.00043204950759105865, 'samples': 7214208, 'steps': 37573, 'loss/train': 0.9354721903800964} -11/07/2021 02:31:11 - INFO - __main__ - Step 37575: {'lr': 0.0004320458704837379, 'samples': 7214400, 'steps': 37574, 'loss/train': 1.4452364444732666} -11/07/2021 02:31:11 - INFO - __main__ - Step 37576: {'lr': 0.00043204223329439015, 'samples': 7214592, 'steps': 37575, 'loss/train': 1.3027896881103516} -11/07/2021 02:31:11 - INFO - __main__ - Step 37577: {'lr': 0.00043203859602301695, 'samples': 7214784, 'steps': 37576, 'loss/train': 1.559409499168396} -11/07/2021 02:31:12 - INFO - __main__ - Step 37578: {'lr': 0.00043203495866961996, 'samples': 7214976, 'steps': 37577, 'loss/train': 1.2092102766036987} -11/07/2021 02:31:12 - INFO - __main__ - Step 37579: {'lr': 0.00043203132123420074, 'samples': 7215168, 'steps': 37578, 'loss/train': 1.8662713766098022} -11/07/2021 02:31:13 - INFO - __main__ - Step 37580: {'lr': 0.00043202768371676113, 'samples': 7215360, 'steps': 37579, 'loss/train': 1.269534707069397} -11/07/2021 02:31:14 - INFO - __main__ - Step 37581: {'lr': 0.0004320240461173026, 'samples': 7215552, 'steps': 37580, 'loss/train': 0.5584875345230103} -11/07/2021 02:31:14 - INFO - __main__ - Step 37582: {'lr': 0.00043202040843582685, 'samples': 7215744, 'steps': 37581, 'loss/train': 1.0845144987106323} -11/07/2021 02:31:14 - INFO - __main__ - Step 37583: {'lr': 0.00043201677067233554, 'samples': 7215936, 'steps': 37582, 'loss/train': 2.1765105724334717} -11/07/2021 02:31:15 - INFO - __main__ - Step 37584: {'lr': 0.00043201313282683024, 'samples': 7216128, 'steps': 37583, 'loss/train': 1.4663903713226318} -11/07/2021 02:31:15 - INFO - __main__ - Step 37585: {'lr': 0.0004320094948993127, 'samples': 7216320, 'steps': 37584, 'loss/train': 1.7186776399612427} -11/07/2021 02:31:16 - INFO - __main__ - Step 37586: {'lr': 0.00043200585688978445, 'samples': 7216512, 'steps': 37585, 'loss/train': 1.0050069093704224} -11/07/2021 02:31:16 - INFO - __main__ - Step 37587: {'lr': 0.00043200221879824706, 'samples': 7216704, 'steps': 37586, 'loss/train': 1.7899430990219116} -11/07/2021 02:31:17 - INFO - __main__ - Step 37588: {'lr': 0.0004319985806247024, 'samples': 7216896, 'steps': 37587, 'loss/train': 1.0412225723266602} -11/07/2021 02:31:17 - INFO - __main__ - Step 37589: {'lr': 0.00043199494236915206, 'samples': 7217088, 'steps': 37588, 'loss/train': 2.0551319122314453} -11/07/2021 02:31:17 - INFO - __main__ - Step 37590: {'lr': 0.0004319913040315975, 'samples': 7217280, 'steps': 37589, 'loss/train': 1.3337748050689697} -11/07/2021 02:31:18 - INFO - __main__ - Step 37591: {'lr': 0.00043198766561204047, 'samples': 7217472, 'steps': 37590, 'loss/train': 1.7535258531570435} -11/07/2021 02:31:19 - INFO - __main__ - Step 37592: {'lr': 0.0004319840271104826, 'samples': 7217664, 'steps': 37591, 'loss/train': 1.6593502759933472} -11/07/2021 02:31:19 - INFO - __main__ - Step 37593: {'lr': 0.0004319803885269256, 'samples': 7217856, 'steps': 37592, 'loss/train': 1.2667961120605469} -11/07/2021 02:31:20 - INFO - __main__ - Step 37594: {'lr': 0.0004319767498613709, 'samples': 7218048, 'steps': 37593, 'loss/train': 1.6652697324752808} -11/07/2021 02:31:20 - INFO - __main__ - Step 37595: {'lr': 0.00043197311111382045, 'samples': 7218240, 'steps': 37594, 'loss/train': 1.6020832061767578} -11/07/2021 02:31:21 - INFO - __main__ - Step 37596: {'lr': 0.00043196947228427564, 'samples': 7218432, 'steps': 37595, 'loss/train': 1.2289795875549316} -11/07/2021 02:31:21 - INFO - __main__ - Step 37597: {'lr': 0.0004319658333727382, 'samples': 7218624, 'steps': 37596, 'loss/train': 2.1435749530792236} -11/07/2021 02:31:22 - INFO - __main__ - Step 37598: {'lr': 0.0004319621943792098, 'samples': 7218816, 'steps': 37597, 'loss/train': 0.6204817295074463} -11/07/2021 02:31:22 - INFO - __main__ - Step 37599: {'lr': 0.000431958555303692, 'samples': 7219008, 'steps': 37598, 'loss/train': 1.4375860691070557} -11/07/2021 02:31:22 - INFO - __main__ - Step 37600: {'lr': 0.00043195491614618655, 'samples': 7219200, 'steps': 37599, 'loss/train': 1.17434561252594} -11/07/2021 02:31:24 - INFO - __main__ - Step 37601: {'lr': 0.00043195127690669486, 'samples': 7219392, 'steps': 37600, 'loss/train': 1.445520281791687} -11/07/2021 02:31:24 - INFO - __main__ - Step 37602: {'lr': 0.00043194763758521896, 'samples': 7219584, 'steps': 37601, 'loss/train': 1.8835210800170898} -11/07/2021 02:31:24 - INFO - __main__ - Step 37603: {'lr': 0.00043194399818176013, 'samples': 7219776, 'steps': 37602, 'loss/train': 0.8516283631324768} -11/07/2021 02:31:25 - INFO - __main__ - Step 37604: {'lr': 0.00043194035869632017, 'samples': 7219968, 'steps': 37603, 'loss/train': 1.772552251815796} -11/07/2021 02:31:25 - INFO - __main__ - Step 37605: {'lr': 0.00043193671912890064, 'samples': 7220160, 'steps': 37604, 'loss/train': 1.627819299697876} -11/07/2021 02:31:25 - INFO - __main__ - Step 37606: {'lr': 0.0004319330794795033, 'samples': 7220352, 'steps': 37605, 'loss/train': 1.452150821685791} -11/07/2021 02:31:27 - INFO - __main__ - Step 37607: {'lr': 0.0004319294397481297, 'samples': 7220544, 'steps': 37606, 'loss/train': 1.6680288314819336} -11/07/2021 02:31:27 - INFO - __main__ - Step 37608: {'lr': 0.0004319257999347815, 'samples': 7220736, 'steps': 37607, 'loss/train': 1.2022203207015991} -11/07/2021 02:31:28 - INFO - __main__ - Step 37609: {'lr': 0.0004319221600394603, 'samples': 7220928, 'steps': 37608, 'loss/train': 1.7221713066101074} -11/07/2021 02:31:28 - INFO - __main__ - Step 37610: {'lr': 0.0004319185200621678, 'samples': 7221120, 'steps': 37609, 'loss/train': 0.6669997572898865} -11/07/2021 02:31:28 - INFO - __main__ - Step 37611: {'lr': 0.0004319148800029057, 'samples': 7221312, 'steps': 37610, 'loss/train': 1.5159608125686646} -11/07/2021 02:31:29 - INFO - __main__ - Step 37612: {'lr': 0.0004319112398616755, 'samples': 7221504, 'steps': 37611, 'loss/train': 1.4701101779937744} -11/07/2021 02:31:30 - INFO - __main__ - Step 37613: {'lr': 0.00043190759963847894, 'samples': 7221696, 'steps': 37612, 'loss/train': 0.991864025592804} -11/07/2021 02:31:30 - INFO - __main__ - Step 37614: {'lr': 0.00043190395933331757, 'samples': 7221888, 'steps': 37613, 'loss/train': 1.380480408668518} -11/07/2021 02:31:30 - INFO - __main__ - Step 37615: {'lr': 0.00043190031894619306, 'samples': 7222080, 'steps': 37614, 'loss/train': 1.7094345092773438} -11/07/2021 02:31:31 - INFO - __main__ - Step 37616: {'lr': 0.0004318966784771071, 'samples': 7222272, 'steps': 37615, 'loss/train': 1.7797966003417969} -11/07/2021 02:31:31 - INFO - __main__ - Step 37617: {'lr': 0.00043189303792606136, 'samples': 7222464, 'steps': 37616, 'loss/train': 1.494810938835144} -11/07/2021 02:31:32 - INFO - __main__ - Step 37618: {'lr': 0.0004318893972930574, 'samples': 7222656, 'steps': 37617, 'loss/train': 1.7728573083877563} -11/07/2021 02:31:33 - INFO - __main__ - Step 37619: {'lr': 0.00043188575657809685, 'samples': 7222848, 'steps': 37618, 'loss/train': 1.844686508178711} -11/07/2021 02:31:33 - INFO - __main__ - Step 37620: {'lr': 0.00043188211578118143, 'samples': 7223040, 'steps': 37619, 'loss/train': 1.6193997859954834} -11/07/2021 02:31:33 - INFO - __main__ - Step 37621: {'lr': 0.0004318784749023127, 'samples': 7223232, 'steps': 37620, 'loss/train': 1.4788497686386108} -11/07/2021 02:31:34 - INFO - __main__ - Step 37622: {'lr': 0.0004318748339414923, 'samples': 7223424, 'steps': 37621, 'loss/train': 1.5991002321243286} -11/07/2021 02:31:35 - INFO - __main__ - Step 37623: {'lr': 0.000431871192898722, 'samples': 7223616, 'steps': 37622, 'loss/train': 1.8423744440078735} -11/07/2021 02:31:35 - INFO - __main__ - Step 37624: {'lr': 0.0004318675517740033, 'samples': 7223808, 'steps': 37623, 'loss/train': 1.4404720067977905} -11/07/2021 02:31:35 - INFO - __main__ - Step 37625: {'lr': 0.0004318639105673379, 'samples': 7224000, 'steps': 37624, 'loss/train': 1.5224372148513794} -11/07/2021 02:31:36 - INFO - __main__ - Step 37626: {'lr': 0.00043186026927872736, 'samples': 7224192, 'steps': 37625, 'loss/train': 1.1585700511932373} -11/07/2021 02:31:36 - INFO - __main__ - Step 37627: {'lr': 0.0004318566279081735, 'samples': 7224384, 'steps': 37626, 'loss/train': 1.5932338237762451} -11/07/2021 02:31:36 - INFO - __main__ - Step 37628: {'lr': 0.0004318529864556777, 'samples': 7224576, 'steps': 37627, 'loss/train': 1.5945461988449097} -11/07/2021 02:31:37 - INFO - __main__ - Step 37629: {'lr': 0.0004318493449212419, 'samples': 7224768, 'steps': 37628, 'loss/train': 1.6314464807510376} -11/07/2021 02:31:38 - INFO - __main__ - Step 37630: {'lr': 0.00043184570330486756, 'samples': 7224960, 'steps': 37629, 'loss/train': 1.088186502456665} -11/07/2021 02:31:38 - INFO - __main__ - Step 37631: {'lr': 0.0004318420616065563, 'samples': 7225152, 'steps': 37630, 'loss/train': 1.3572551012039185} -11/07/2021 02:31:39 - INFO - __main__ - Step 37632: {'lr': 0.0004318384198263099, 'samples': 7225344, 'steps': 37631, 'loss/train': 1.4363213777542114} -11/07/2021 02:31:39 - INFO - __main__ - Step 37633: {'lr': 0.0004318347779641298, 'samples': 7225536, 'steps': 37632, 'loss/train': 1.7372273206710815} -11/07/2021 02:31:40 - INFO - __main__ - Step 37634: {'lr': 0.00043183113602001777, 'samples': 7225728, 'steps': 37633, 'loss/train': 0.5927386283874512} -11/07/2021 02:31:40 - INFO - __main__ - Step 37635: {'lr': 0.0004318274939939755, 'samples': 7225920, 'steps': 37634, 'loss/train': 1.5352866649627686} -11/07/2021 02:31:41 - INFO - __main__ - Step 37636: {'lr': 0.00043182385188600457, 'samples': 7226112, 'steps': 37635, 'loss/train': 1.1105045080184937} -11/07/2021 02:31:41 - INFO - __main__ - Step 37637: {'lr': 0.0004318202096961066, 'samples': 7226304, 'steps': 37636, 'loss/train': 0.7921403646469116} -11/07/2021 02:31:41 - INFO - __main__ - Step 37638: {'lr': 0.0004318165674242832, 'samples': 7226496, 'steps': 37637, 'loss/train': 0.8578131794929504} -11/07/2021 02:31:42 - INFO - __main__ - Step 37639: {'lr': 0.0004318129250705361, 'samples': 7226688, 'steps': 37638, 'loss/train': 1.8374136686325073} -11/07/2021 02:31:43 - INFO - __main__ - Step 37640: {'lr': 0.0004318092826348669, 'samples': 7226880, 'steps': 37639, 'loss/train': 1.7463501691818237} -11/07/2021 02:31:43 - INFO - __main__ - Step 37641: {'lr': 0.0004318056401172772, 'samples': 7227072, 'steps': 37640, 'loss/train': 1.500892996788025} -11/07/2021 02:31:44 - INFO - __main__ - Step 37642: {'lr': 0.0004318019975177688, 'samples': 7227264, 'steps': 37641, 'loss/train': 1.86619234085083} -11/07/2021 02:31:44 - INFO - __main__ - Step 37643: {'lr': 0.0004317983548363431, 'samples': 7227456, 'steps': 37642, 'loss/train': 1.6383424997329712} -11/07/2021 02:31:45 - INFO - __main__ - Step 37644: {'lr': 0.0004317947120730019, 'samples': 7227648, 'steps': 37643, 'loss/train': 1.8383617401123047} -11/07/2021 02:31:45 - INFO - __main__ - Step 37645: {'lr': 0.0004317910692277469, 'samples': 7227840, 'steps': 37644, 'loss/train': 1.0736067295074463} -11/07/2021 02:31:46 - INFO - __main__ - Step 37646: {'lr': 0.0004317874263005795, 'samples': 7228032, 'steps': 37645, 'loss/train': 0.9489991068840027} -11/07/2021 02:31:46 - INFO - __main__ - Step 37647: {'lr': 0.0004317837832915016, 'samples': 7228224, 'steps': 37646, 'loss/train': 1.8266150951385498} -11/07/2021 02:31:46 - INFO - __main__ - Step 37648: {'lr': 0.0004317801402005147, 'samples': 7228416, 'steps': 37647, 'loss/train': 1.5896239280700684} -11/07/2021 02:31:47 - INFO - __main__ - Step 37649: {'lr': 0.00043177649702762043, 'samples': 7228608, 'steps': 37648, 'loss/train': 1.2595068216323853} -11/07/2021 02:31:48 - INFO - __main__ - Step 37650: {'lr': 0.0004317728537728206, 'samples': 7228800, 'steps': 37649, 'loss/train': 1.6371251344680786} -11/07/2021 02:31:48 - INFO - __main__ - Step 37651: {'lr': 0.0004317692104361166, 'samples': 7228992, 'steps': 37650, 'loss/train': 1.5012624263763428} -11/07/2021 02:31:48 - INFO - __main__ - Step 37652: {'lr': 0.0004317655670175102, 'samples': 7229184, 'steps': 37651, 'loss/train': 1.1823043823242188} -11/07/2021 02:31:49 - INFO - __main__ - Step 37653: {'lr': 0.0004317619235170032, 'samples': 7229376, 'steps': 37652, 'loss/train': 1.0218074321746826} -11/07/2021 02:31:49 - INFO - __main__ - Step 37654: {'lr': 0.00043175827993459696, 'samples': 7229568, 'steps': 37653, 'loss/train': 1.5730572938919067} -11/07/2021 02:31:50 - INFO - __main__ - Step 37655: {'lr': 0.0004317546362702932, 'samples': 7229760, 'steps': 37654, 'loss/train': 1.5754374265670776} -11/07/2021 02:31:50 - INFO - __main__ - Step 37656: {'lr': 0.0004317509925240937, 'samples': 7229952, 'steps': 37655, 'loss/train': 1.760396122932434} -11/07/2021 02:31:51 - INFO - __main__ - Step 37657: {'lr': 0.00043174734869599993, 'samples': 7230144, 'steps': 37656, 'loss/train': 1.6367154121398926} -11/07/2021 02:31:51 - INFO - __main__ - Step 37658: {'lr': 0.0004317437047860137, 'samples': 7230336, 'steps': 37657, 'loss/train': 1.5266382694244385} -11/07/2021 02:31:51 - INFO - __main__ - Step 37659: {'lr': 0.0004317400607941364, 'samples': 7230528, 'steps': 37658, 'loss/train': 1.5288509130477905} -11/07/2021 02:31:53 - INFO - __main__ - Step 37660: {'lr': 0.00043173641672037, 'samples': 7230720, 'steps': 37659, 'loss/train': 1.6391620635986328} -11/07/2021 02:31:53 - INFO - __main__ - Step 37661: {'lr': 0.00043173277256471586, 'samples': 7230912, 'steps': 37660, 'loss/train': 1.4939783811569214} -11/07/2021 02:31:53 - INFO - __main__ - Step 37662: {'lr': 0.0004317291283271758, 'samples': 7231104, 'steps': 37661, 'loss/train': 1.5181828737258911} -11/07/2021 02:31:54 - INFO - __main__ - Step 37663: {'lr': 0.0004317254840077514, 'samples': 7231296, 'steps': 37662, 'loss/train': 1.6886277198791504} -11/07/2021 02:31:54 - INFO - __main__ - Step 37664: {'lr': 0.0004317218396064443, 'samples': 7231488, 'steps': 37663, 'loss/train': 1.5676177740097046} -11/07/2021 02:31:55 - INFO - __main__ - Step 37665: {'lr': 0.00043171819512325614, 'samples': 7231680, 'steps': 37664, 'loss/train': 1.3484420776367188} -11/07/2021 02:31:55 - INFO - __main__ - Step 37666: {'lr': 0.00043171455055818854, 'samples': 7231872, 'steps': 37665, 'loss/train': 1.4471410512924194} -11/07/2021 02:31:56 - INFO - __main__ - Step 37667: {'lr': 0.0004317109059112432, 'samples': 7232064, 'steps': 37666, 'loss/train': 1.7877618074417114} -11/07/2021 02:31:56 - INFO - __main__ - Step 37668: {'lr': 0.00043170726118242164, 'samples': 7232256, 'steps': 37667, 'loss/train': 2.937180280685425} -11/07/2021 02:31:56 - INFO - __main__ - Step 37669: {'lr': 0.0004317036163717257, 'samples': 7232448, 'steps': 37668, 'loss/train': 1.400524377822876} -11/07/2021 02:31:57 - INFO - __main__ - Step 37670: {'lr': 0.0004316999714791569, 'samples': 7232640, 'steps': 37669, 'loss/train': 1.571532964706421} -11/07/2021 02:31:58 - INFO - __main__ - Step 37671: {'lr': 0.0004316963265047169, 'samples': 7232832, 'steps': 37670, 'loss/train': 1.8768014907836914} -11/07/2021 02:31:58 - INFO - __main__ - Step 37672: {'lr': 0.00043169268144840726, 'samples': 7233024, 'steps': 37671, 'loss/train': 1.411942481994629} -11/07/2021 02:31:58 - INFO - __main__ - Step 37673: {'lr': 0.0004316890363102298, 'samples': 7233216, 'steps': 37672, 'loss/train': 1.3016736507415771} -11/07/2021 02:31:59 - INFO - __main__ - Step 37674: {'lr': 0.000431685391090186, 'samples': 7233408, 'steps': 37673, 'loss/train': 1.345513939857483} -11/07/2021 02:31:59 - INFO - __main__ - Step 37675: {'lr': 0.00043168174578827755, 'samples': 7233600, 'steps': 37674, 'loss/train': 1.5534780025482178} -11/07/2021 02:32:00 - INFO - __main__ - Step 37676: {'lr': 0.00043167810040450617, 'samples': 7233792, 'steps': 37675, 'loss/train': 1.6502912044525146} -11/07/2021 02:32:00 - INFO - __main__ - Step 37677: {'lr': 0.00043167445493887347, 'samples': 7233984, 'steps': 37676, 'loss/train': 1.8989665508270264} -11/07/2021 02:32:01 - INFO - __main__ - Step 37678: {'lr': 0.000431670809391381, 'samples': 7234176, 'steps': 37677, 'loss/train': 1.4615715742111206} -11/07/2021 02:32:01 - INFO - __main__ - Step 37679: {'lr': 0.00043166716376203047, 'samples': 7234368, 'steps': 37678, 'loss/train': 1.699442744255066} -11/07/2021 02:32:02 - INFO - __main__ - Step 37680: {'lr': 0.0004316635180508235, 'samples': 7234560, 'steps': 37679, 'loss/train': 1.6097488403320312} -11/07/2021 02:32:03 - INFO - __main__ - Step 37681: {'lr': 0.0004316598722577618, 'samples': 7234752, 'steps': 37680, 'loss/train': 1.2849406003952026} -11/07/2021 02:32:03 - INFO - __main__ - Step 37682: {'lr': 0.000431656226382847, 'samples': 7234944, 'steps': 37681, 'loss/train': 1.5217424631118774} -11/07/2021 02:32:03 - INFO - __main__ - Step 37683: {'lr': 0.00043165258042608055, 'samples': 7235136, 'steps': 37682, 'loss/train': 1.7335761785507202} -11/07/2021 02:32:04 - INFO - __main__ - Step 37684: {'lr': 0.0004316489343874644, 'samples': 7235328, 'steps': 37683, 'loss/train': 1.3470348119735718} -11/07/2021 02:32:04 - INFO - __main__ - Step 37685: {'lr': 0.000431645288267, 'samples': 7235520, 'steps': 37684, 'loss/train': 1.5445353984832764} -11/07/2021 02:32:05 - INFO - __main__ - Step 37686: {'lr': 0.00043164164206468904, 'samples': 7235712, 'steps': 37685, 'loss/train': 0.9622970819473267} -11/07/2021 02:32:05 - INFO - __main__ - Step 37687: {'lr': 0.00043163799578053313, 'samples': 7235904, 'steps': 37686, 'loss/train': 1.0782309770584106} -11/07/2021 02:32:06 - INFO - __main__ - Step 37688: {'lr': 0.00043163434941453395, 'samples': 7236096, 'steps': 37687, 'loss/train': 1.3358571529388428} -11/07/2021 02:32:06 - INFO - __main__ - Step 37689: {'lr': 0.00043163070296669317, 'samples': 7236288, 'steps': 37688, 'loss/train': 1.1718648672103882} -11/07/2021 02:32:06 - INFO - __main__ - Step 37690: {'lr': 0.00043162705643701236, 'samples': 7236480, 'steps': 37689, 'loss/train': 1.4089534282684326} -11/07/2021 02:32:07 - INFO - __main__ - Step 37691: {'lr': 0.00043162340982549327, 'samples': 7236672, 'steps': 37690, 'loss/train': 1.8753679990768433} -11/07/2021 02:32:08 - INFO - __main__ - Step 37692: {'lr': 0.00043161976313213735, 'samples': 7236864, 'steps': 37691, 'loss/train': 1.8158597946166992} -11/07/2021 02:32:08 - INFO - __main__ - Step 37693: {'lr': 0.0004316161163569465, 'samples': 7237056, 'steps': 37692, 'loss/train': 1.4391977787017822} -11/07/2021 02:32:08 - INFO - __main__ - Step 37694: {'lr': 0.0004316124694999222, 'samples': 7237248, 'steps': 37693, 'loss/train': 1.347544550895691} -11/07/2021 02:32:09 - INFO - __main__ - Step 37695: {'lr': 0.000431608822561066, 'samples': 7237440, 'steps': 37694, 'loss/train': 1.5738919973373413} -11/07/2021 02:32:10 - INFO - __main__ - Step 37696: {'lr': 0.0004316051755403798, 'samples': 7237632, 'steps': 37695, 'loss/train': 1.808718204498291} -11/07/2021 02:32:10 - INFO - __main__ - Step 37697: {'lr': 0.000431601528437865, 'samples': 7237824, 'steps': 37696, 'loss/train': 1.71670663356781} -11/07/2021 02:32:10 - INFO - __main__ - Step 37698: {'lr': 0.00043159788125352353, 'samples': 7238016, 'steps': 37697, 'loss/train': 1.798108458518982} -11/07/2021 02:32:11 - INFO - __main__ - Step 37699: {'lr': 0.0004315942339873567, 'samples': 7238208, 'steps': 37698, 'loss/train': 1.7028776407241821} -11/07/2021 02:32:11 - INFO - __main__ - Step 37700: {'lr': 0.00043159058663936635, 'samples': 7238400, 'steps': 37699, 'loss/train': 1.9503159523010254} -11/07/2021 02:32:12 - INFO - __main__ - Step 37701: {'lr': 0.0004315869392095542, 'samples': 7238592, 'steps': 37700, 'loss/train': 1.5541750192642212} -11/07/2021 02:32:13 - INFO - __main__ - Step 37702: {'lr': 0.0004315832916979216, 'samples': 7238784, 'steps': 37701, 'loss/train': 1.2538578510284424} -11/07/2021 02:32:13 - INFO - __main__ - Step 37703: {'lr': 0.00043157964410447047, 'samples': 7238976, 'steps': 37702, 'loss/train': 1.6704691648483276} -11/07/2021 02:32:13 - INFO - __main__ - Step 37704: {'lr': 0.0004315759964292023, 'samples': 7239168, 'steps': 37703, 'loss/train': 0.4037812352180481} -11/07/2021 02:32:14 - INFO - __main__ - Step 37705: {'lr': 0.0004315723486721188, 'samples': 7239360, 'steps': 37704, 'loss/train': 0.9939437508583069} -11/07/2021 02:32:14 - INFO - __main__ - Step 37706: {'lr': 0.00043156870083322166, 'samples': 7239552, 'steps': 37705, 'loss/train': 1.3555794954299927} -11/07/2021 02:32:15 - INFO - __main__ - Step 37707: {'lr': 0.00043156505291251234, 'samples': 7239744, 'steps': 37706, 'loss/train': 1.6051470041275024} -11/07/2021 02:32:16 - INFO - __main__ - Step 37708: {'lr': 0.00043156140490999275, 'samples': 7239936, 'steps': 37707, 'loss/train': 1.7810765504837036} -11/07/2021 02:32:16 - INFO - __main__ - Step 37709: {'lr': 0.0004315577568256643, 'samples': 7240128, 'steps': 37708, 'loss/train': 1.9991899728775024} -11/07/2021 02:32:16 - INFO - __main__ - Step 37710: {'lr': 0.0004315541086595288, 'samples': 7240320, 'steps': 37709, 'loss/train': 1.5813043117523193} -11/07/2021 02:32:17 - INFO - __main__ - Step 37711: {'lr': 0.00043155046041158776, 'samples': 7240512, 'steps': 37710, 'loss/train': 1.4850425720214844} -11/07/2021 02:32:18 - INFO - __main__ - Step 37712: {'lr': 0.0004315468120818429, 'samples': 7240704, 'steps': 37711, 'loss/train': 1.7535170316696167} -11/07/2021 02:32:18 - INFO - __main__ - Step 37713: {'lr': 0.0004315431636702959, 'samples': 7240896, 'steps': 37712, 'loss/train': 1.2823959589004517} -11/07/2021 02:32:18 - INFO - __main__ - Step 37714: {'lr': 0.00043153951517694824, 'samples': 7241088, 'steps': 37713, 'loss/train': 1.300570011138916} -11/07/2021 02:32:19 - INFO - __main__ - Step 37715: {'lr': 0.0004315358666018018, 'samples': 7241280, 'steps': 37714, 'loss/train': 1.6309016942977905} -11/07/2021 02:32:19 - INFO - __main__ - Step 37716: {'lr': 0.00043153221794485795, 'samples': 7241472, 'steps': 37715, 'loss/train': 0.8364524245262146} -11/07/2021 02:32:20 - INFO - __main__ - Step 37717: {'lr': 0.0004315285692061186, 'samples': 7241664, 'steps': 37716, 'loss/train': 1.4671432971954346} -11/07/2021 02:32:20 - INFO - __main__ - Step 37718: {'lr': 0.00043152492038558526, 'samples': 7241856, 'steps': 37717, 'loss/train': 1.6024607419967651} -11/07/2021 02:32:21 - INFO - __main__ - Step 37719: {'lr': 0.00043152127148325957, 'samples': 7242048, 'steps': 37718, 'loss/train': 1.3017303943634033} -11/07/2021 02:32:21 - INFO - __main__ - Step 37720: {'lr': 0.00043151762249914324, 'samples': 7242240, 'steps': 37719, 'loss/train': 1.588016152381897} -11/07/2021 02:32:21 - INFO - __main__ - Step 37721: {'lr': 0.00043151397343323784, 'samples': 7242432, 'steps': 37720, 'loss/train': 1.9084659814834595} -11/07/2021 02:32:23 - INFO - __main__ - Step 37722: {'lr': 0.00043151032428554505, 'samples': 7242624, 'steps': 37721, 'loss/train': 1.6454074382781982} -11/07/2021 02:32:23 - INFO - __main__ - Step 37723: {'lr': 0.0004315066750560665, 'samples': 7242816, 'steps': 37722, 'loss/train': 0.9799754023551941} -11/07/2021 02:32:23 - INFO - __main__ - Step 37724: {'lr': 0.0004315030257448038, 'samples': 7243008, 'steps': 37723, 'loss/train': 1.5956308841705322} -11/07/2021 02:32:24 - INFO - __main__ - Step 37725: {'lr': 0.00043149937635175874, 'samples': 7243200, 'steps': 37724, 'loss/train': 1.3453290462493896} -11/07/2021 02:32:24 - INFO - __main__ - Step 37726: {'lr': 0.0004314957268769328, 'samples': 7243392, 'steps': 37725, 'loss/train': 1.399642825126648} -11/07/2021 02:32:24 - INFO - __main__ - Step 37727: {'lr': 0.00043149207732032767, 'samples': 7243584, 'steps': 37726, 'loss/train': 1.6732821464538574} -11/07/2021 02:32:25 - INFO - __main__ - Step 37728: {'lr': 0.00043148842768194503, 'samples': 7243776, 'steps': 37727, 'loss/train': 1.9138143062591553} -11/07/2021 02:32:26 - INFO - __main__ - Step 37729: {'lr': 0.0004314847779617865, 'samples': 7243968, 'steps': 37728, 'loss/train': 1.4180481433868408} -11/07/2021 02:32:26 - INFO - __main__ - Step 37730: {'lr': 0.00043148112815985377, 'samples': 7244160, 'steps': 37729, 'loss/train': 1.4895565509796143} -11/07/2021 02:32:27 - INFO - __main__ - Step 37731: {'lr': 0.0004314774782761484, 'samples': 7244352, 'steps': 37730, 'loss/train': 1.2930500507354736} -11/07/2021 02:32:27 - INFO - __main__ - Step 37732: {'lr': 0.00043147382831067204, 'samples': 7244544, 'steps': 37731, 'loss/train': 1.820050597190857} -11/07/2021 02:32:28 - INFO - __main__ - Step 37733: {'lr': 0.0004314701782634264, 'samples': 7244736, 'steps': 37732, 'loss/train': 1.4728184938430786} -11/07/2021 02:32:28 - INFO - __main__ - Step 37734: {'lr': 0.0004314665281344132, 'samples': 7244928, 'steps': 37733, 'loss/train': 1.8691281080245972} -11/07/2021 02:32:29 - INFO - __main__ - Step 37735: {'lr': 0.0004314628779236339, 'samples': 7245120, 'steps': 37734, 'loss/train': 1.8617697954177856} -11/07/2021 02:32:29 - INFO - __main__ - Step 37736: {'lr': 0.00043145922763109017, 'samples': 7245312, 'steps': 37735, 'loss/train': 0.6751835942268372} -11/07/2021 02:32:29 - INFO - __main__ - Step 37737: {'lr': 0.0004314555772567838, 'samples': 7245504, 'steps': 37736, 'loss/train': 1.458873987197876} -11/07/2021 02:32:30 - INFO - __main__ - Step 37738: {'lr': 0.0004314519268007163, 'samples': 7245696, 'steps': 37737, 'loss/train': 1.4394382238388062} -11/07/2021 02:32:31 - INFO - __main__ - Step 37739: {'lr': 0.00043144827626288943, 'samples': 7245888, 'steps': 37738, 'loss/train': 1.5663368701934814} -11/07/2021 02:32:31 - INFO - __main__ - Step 37740: {'lr': 0.00043144462564330464, 'samples': 7246080, 'steps': 37739, 'loss/train': 2.232424020767212} -11/07/2021 02:32:31 - INFO - __main__ - Step 37741: {'lr': 0.0004314409749419638, 'samples': 7246272, 'steps': 37740, 'loss/train': 1.4186749458312988} -11/07/2021 02:32:32 - INFO - __main__ - Step 37742: {'lr': 0.00043143732415886843, 'samples': 7246464, 'steps': 37741, 'loss/train': 1.548527717590332} -11/07/2021 02:32:32 - INFO - __main__ - Step 37743: {'lr': 0.0004314336732940202, 'samples': 7246656, 'steps': 37742, 'loss/train': 0.8476759195327759} -11/07/2021 02:32:33 - INFO - __main__ - Step 37744: {'lr': 0.0004314300223474208, 'samples': 7246848, 'steps': 37743, 'loss/train': 1.3937143087387085} -11/07/2021 02:32:33 - INFO - __main__ - Step 37745: {'lr': 0.0004314263713190718, 'samples': 7247040, 'steps': 37744, 'loss/train': 0.32582950592041016} -11/07/2021 02:32:34 - INFO - __main__ - Step 37746: {'lr': 0.00043142272020897486, 'samples': 7247232, 'steps': 37745, 'loss/train': 1.4074898958206177} -11/07/2021 02:32:34 - INFO - __main__ - Step 37747: {'lr': 0.0004314190690171317, 'samples': 7247424, 'steps': 37746, 'loss/train': 1.3477909564971924} -11/07/2021 02:32:35 - INFO - __main__ - Step 37748: {'lr': 0.0004314154177435438, 'samples': 7247616, 'steps': 37747, 'loss/train': 1.3964956998825073} -11/07/2021 02:32:36 - INFO - __main__ - Step 37749: {'lr': 0.000431411766388213, 'samples': 7247808, 'steps': 37748, 'loss/train': 1.625677466392517} -11/07/2021 02:32:36 - INFO - __main__ - Step 37750: {'lr': 0.0004314081149511409, 'samples': 7248000, 'steps': 37749, 'loss/train': 1.4735047817230225} -11/07/2021 02:32:36 - INFO - __main__ - Step 37751: {'lr': 0.00043140446343232895, 'samples': 7248192, 'steps': 37750, 'loss/train': 1.6033672094345093} -11/07/2021 02:32:37 - INFO - __main__ - Step 37752: {'lr': 0.000431400811831779, 'samples': 7248384, 'steps': 37751, 'loss/train': 1.698687195777893} -11/07/2021 02:32:37 - INFO - __main__ - Step 37753: {'lr': 0.0004313971601494927, 'samples': 7248576, 'steps': 37752, 'loss/train': 1.3801158666610718} -11/07/2021 02:32:38 - INFO - __main__ - Step 37754: {'lr': 0.0004313935083854716, 'samples': 7248768, 'steps': 37753, 'loss/train': 1.691262125968933} -11/07/2021 02:32:38 - INFO - __main__ - Step 37755: {'lr': 0.0004313898565397174, 'samples': 7248960, 'steps': 37754, 'loss/train': 1.657094955444336} -11/07/2021 02:32:39 - INFO - __main__ - Step 37756: {'lr': 0.00043138620461223175, 'samples': 7249152, 'steps': 37755, 'loss/train': 1.5319207906723022} -11/07/2021 02:32:39 - INFO - __main__ - Step 37757: {'lr': 0.00043138255260301625, 'samples': 7249344, 'steps': 37756, 'loss/train': 1.534110188484192} -11/07/2021 02:32:39 - INFO - __main__ - Step 37758: {'lr': 0.0004313789005120725, 'samples': 7249536, 'steps': 37757, 'loss/train': 1.7224847078323364} -11/07/2021 02:32:40 - INFO - __main__ - Step 37759: {'lr': 0.00043137524833940233, 'samples': 7249728, 'steps': 37758, 'loss/train': 1.6888084411621094} -11/07/2021 02:32:41 - INFO - __main__ - Step 37760: {'lr': 0.0004313715960850072, 'samples': 7249920, 'steps': 37759, 'loss/train': 1.3553645610809326} -11/07/2021 02:32:41 - INFO - __main__ - Step 37761: {'lr': 0.00043136794374888887, 'samples': 7250112, 'steps': 37760, 'loss/train': 1.6526095867156982} -11/07/2021 02:32:41 - INFO - __main__ - Step 37762: {'lr': 0.0004313642913310489, 'samples': 7250304, 'steps': 37761, 'loss/train': 1.6274479627609253} -11/07/2021 02:32:42 - INFO - __main__ - Step 37763: {'lr': 0.00043136063883148905, 'samples': 7250496, 'steps': 37762, 'loss/train': 1.5382124185562134} -11/07/2021 02:32:43 - INFO - __main__ - Step 37764: {'lr': 0.00043135698625021093, 'samples': 7250688, 'steps': 37763, 'loss/train': 1.6963647603988647} -11/07/2021 02:32:43 - INFO - __main__ - Step 37765: {'lr': 0.000431353333587216, 'samples': 7250880, 'steps': 37764, 'loss/train': 1.4143861532211304} -11/07/2021 02:32:44 - INFO - __main__ - Step 37766: {'lr': 0.00043134968084250616, 'samples': 7251072, 'steps': 37765, 'loss/train': 1.3447948694229126} -11/07/2021 02:32:44 - INFO - __main__ - Step 37767: {'lr': 0.00043134602801608293, 'samples': 7251264, 'steps': 37766, 'loss/train': 1.1817660331726074} -11/07/2021 02:32:44 - INFO - __main__ - Step 37768: {'lr': 0.00043134237510794794, 'samples': 7251456, 'steps': 37767, 'loss/train': 0.40962114930152893} -11/07/2021 02:32:45 - INFO - __main__ - Step 37769: {'lr': 0.0004313387221181029, 'samples': 7251648, 'steps': 37768, 'loss/train': 1.8461116552352905} -11/07/2021 02:32:46 - INFO - __main__ - Step 37770: {'lr': 0.0004313350690465495, 'samples': 7251840, 'steps': 37769, 'loss/train': 5.757008075714111} -11/07/2021 02:32:46 - INFO - __main__ - Step 37771: {'lr': 0.00043133141589328923, 'samples': 7252032, 'steps': 37770, 'loss/train': 1.4343360662460327} -11/07/2021 02:32:46 - INFO - __main__ - Step 37772: {'lr': 0.0004313277626583239, 'samples': 7252224, 'steps': 37771, 'loss/train': 1.7761224508285522} -11/07/2021 02:32:47 - INFO - __main__ - Step 37773: {'lr': 0.000431324109341655, 'samples': 7252416, 'steps': 37772, 'loss/train': 1.9840986728668213} -11/07/2021 02:32:47 - INFO - __main__ - Step 37774: {'lr': 0.0004313204559432842, 'samples': 7252608, 'steps': 37773, 'loss/train': 1.5764964818954468} -11/07/2021 02:32:48 - INFO - __main__ - Step 37775: {'lr': 0.0004313168024632133, 'samples': 7252800, 'steps': 37774, 'loss/train': 1.5473870038986206} -11/07/2021 02:32:48 - INFO - __main__ - Step 37776: {'lr': 0.00043131314890144386, 'samples': 7252992, 'steps': 37775, 'loss/train': 1.4710793495178223} -11/07/2021 02:32:49 - INFO - __main__ - Step 37777: {'lr': 0.0004313094952579775, 'samples': 7253184, 'steps': 37776, 'loss/train': 1.7181931734085083} -11/07/2021 02:32:49 - INFO - __main__ - Step 37778: {'lr': 0.0004313058415328158, 'samples': 7253376, 'steps': 37777, 'loss/train': 1.3149781227111816} -11/07/2021 02:32:49 - INFO - __main__ - Step 37779: {'lr': 0.00043130218772596053, 'samples': 7253568, 'steps': 37778, 'loss/train': 1.5012356042861938} -11/07/2021 02:32:50 - INFO - __main__ - Step 37780: {'lr': 0.00043129853383741334, 'samples': 7253760, 'steps': 37779, 'loss/train': 1.810323715209961} -11/07/2021 02:32:51 - INFO - __main__ - Step 37781: {'lr': 0.00043129487986717574, 'samples': 7253952, 'steps': 37780, 'loss/train': 1.4915090799331665} -11/07/2021 02:32:51 - INFO - __main__ - Step 37782: {'lr': 0.00043129122581524957, 'samples': 7254144, 'steps': 37781, 'loss/train': 0.9132309556007385} -11/07/2021 02:32:52 - INFO - __main__ - Step 37783: {'lr': 0.0004312875716816363, 'samples': 7254336, 'steps': 37782, 'loss/train': 1.672573447227478} -11/07/2021 02:32:52 - INFO - __main__ - Step 37784: {'lr': 0.0004312839174663377, 'samples': 7254528, 'steps': 37783, 'loss/train': 1.327996850013733} -11/07/2021 02:32:53 - INFO - __main__ - Step 37785: {'lr': 0.0004312802631693553, 'samples': 7254720, 'steps': 37784, 'loss/train': 1.4877172708511353} -11/07/2021 02:32:53 - INFO - __main__ - Step 37786: {'lr': 0.00043127660879069084, 'samples': 7254912, 'steps': 37785, 'loss/train': 1.5174921751022339} -11/07/2021 02:32:54 - INFO - __main__ - Step 37787: {'lr': 0.00043127295433034594, 'samples': 7255104, 'steps': 37786, 'loss/train': 1.538757562637329} -11/07/2021 02:32:54 - INFO - __main__ - Step 37788: {'lr': 0.00043126929978832217, 'samples': 7255296, 'steps': 37787, 'loss/train': 1.6394915580749512} -11/07/2021 02:32:54 - INFO - __main__ - Step 37789: {'lr': 0.00043126564516462134, 'samples': 7255488, 'steps': 37788, 'loss/train': 1.9435192346572876} -11/07/2021 02:32:55 - INFO - __main__ - Step 37790: {'lr': 0.000431261990459245, 'samples': 7255680, 'steps': 37789, 'loss/train': 2.3344905376434326} -11/07/2021 02:32:56 - INFO - __main__ - Step 37791: {'lr': 0.0004312583356721948, 'samples': 7255872, 'steps': 37790, 'loss/train': 1.6491162776947021} -11/07/2021 02:32:56 - INFO - __main__ - Step 37792: {'lr': 0.0004312546808034724, 'samples': 7256064, 'steps': 37791, 'loss/train': 1.3833657503128052} -11/07/2021 02:32:56 - INFO - __main__ - Step 37793: {'lr': 0.0004312510258530794, 'samples': 7256256, 'steps': 37792, 'loss/train': 1.8957017660140991} -11/07/2021 02:32:57 - INFO - __main__ - Step 37794: {'lr': 0.0004312473708210175, 'samples': 7256448, 'steps': 37793, 'loss/train': 1.3169971704483032} -11/07/2021 02:32:57 - INFO - __main__ - Step 37795: {'lr': 0.0004312437157072884, 'samples': 7256640, 'steps': 37794, 'loss/train': 0.8353274464607239} -11/07/2021 02:32:59 - INFO - __main__ - Step 37796: {'lr': 0.00043124006051189356, 'samples': 7256832, 'steps': 37795, 'loss/train': 1.1799557209014893} -11/07/2021 02:32:59 - INFO - __main__ - Step 37797: {'lr': 0.0004312364052348348, 'samples': 7257024, 'steps': 37796, 'loss/train': 1.508033037185669} -11/07/2021 02:32:59 - INFO - __main__ - Step 37798: {'lr': 0.0004312327498761137, 'samples': 7257216, 'steps': 37797, 'loss/train': 0.404900461435318} -11/07/2021 02:33:00 - INFO - __main__ - Step 37799: {'lr': 0.000431229094435732, 'samples': 7257408, 'steps': 37798, 'loss/train': 1.551729440689087} -11/07/2021 02:33:00 - INFO - __main__ - Step 37800: {'lr': 0.0004312254389136911, 'samples': 7257600, 'steps': 37799, 'loss/train': 1.2227293252944946} -11/07/2021 02:33:01 - INFO - __main__ - Step 37801: {'lr': 0.00043122178330999296, 'samples': 7257792, 'steps': 37800, 'loss/train': 1.5652748346328735} -11/07/2021 02:33:01 - INFO - __main__ - Step 37802: {'lr': 0.0004312181276246391, 'samples': 7257984, 'steps': 37801, 'loss/train': 1.7289127111434937} -11/07/2021 02:33:02 - INFO - __main__ - Step 37803: {'lr': 0.00043121447185763106, 'samples': 7258176, 'steps': 37802, 'loss/train': 1.5276554822921753} -11/07/2021 02:33:02 - INFO - __main__ - Step 37804: {'lr': 0.0004312108160089706, 'samples': 7258368, 'steps': 37803, 'loss/train': 1.2928982973098755} -11/07/2021 02:33:03 - INFO - __main__ - Step 37805: {'lr': 0.00043120716007865933, 'samples': 7258560, 'steps': 37804, 'loss/train': 1.6584603786468506} -11/07/2021 02:33:03 - INFO - __main__ - Step 37806: {'lr': 0.0004312035040666989, 'samples': 7258752, 'steps': 37805, 'loss/train': 0.6836652755737305} -11/07/2021 02:33:04 - INFO - __main__ - Step 37807: {'lr': 0.000431199847973091, 'samples': 7258944, 'steps': 37806, 'loss/train': 1.5036001205444336} -11/07/2021 02:33:04 - INFO - __main__ - Step 37808: {'lr': 0.0004311961917978372, 'samples': 7259136, 'steps': 37807, 'loss/train': 1.5429991483688354} -11/07/2021 02:33:05 - INFO - __main__ - Step 37809: {'lr': 0.0004311925355409393, 'samples': 7259328, 'steps': 37808, 'loss/train': 1.3604049682617188} -11/07/2021 02:33:05 - INFO - __main__ - Step 37810: {'lr': 0.00043118887920239876, 'samples': 7259520, 'steps': 37809, 'loss/train': 1.240416407585144} -11/07/2021 02:33:06 - INFO - __main__ - Step 37811: {'lr': 0.00043118522278221726, 'samples': 7259712, 'steps': 37810, 'loss/train': 1.3365050554275513} -11/07/2021 02:33:06 - INFO - __main__ - Step 37812: {'lr': 0.0004311815662803966, 'samples': 7259904, 'steps': 37811, 'loss/train': 1.4456079006195068} -11/07/2021 02:33:07 - INFO - __main__ - Step 37813: {'lr': 0.00043117790969693826, 'samples': 7260096, 'steps': 37812, 'loss/train': 1.4940829277038574} -11/07/2021 02:33:07 - INFO - __main__ - Step 37814: {'lr': 0.00043117425303184395, 'samples': 7260288, 'steps': 37813, 'loss/train': 1.4381945133209229} -11/07/2021 02:33:07 - INFO - __main__ - Step 37815: {'lr': 0.0004311705962851153, 'samples': 7260480, 'steps': 37814, 'loss/train': 1.5033267736434937} -11/07/2021 02:33:10 - INFO - __main__ - Step 37816: {'lr': 0.000431166939456754, 'samples': 7260672, 'steps': 37815, 'loss/train': 1.637882947921753} -11/07/2021 02:33:10 - INFO - __main__ - Step 37817: {'lr': 0.0004311632825467617, 'samples': 7260864, 'steps': 37816, 'loss/train': 1.7710007429122925} -11/07/2021 02:33:10 - INFO - __main__ - Step 37818: {'lr': 0.00043115962555514, 'samples': 7261056, 'steps': 37817, 'loss/train': 1.43278968334198} -11/07/2021 02:33:11 - INFO - __main__ - Step 37819: {'lr': 0.0004311559684818905, 'samples': 7261248, 'steps': 37818, 'loss/train': 1.7777564525604248} -11/07/2021 02:33:11 - INFO - __main__ - Step 37820: {'lr': 0.000431152311327015, 'samples': 7261440, 'steps': 37819, 'loss/train': 1.7829294204711914} -11/07/2021 02:33:12 - INFO - __main__ - Step 37821: {'lr': 0.00043114865409051505, 'samples': 7261632, 'steps': 37820, 'loss/train': 1.788772463798523} -11/07/2021 02:33:12 - INFO - __main__ - Step 37822: {'lr': 0.0004311449967723923, 'samples': 7261824, 'steps': 37821, 'loss/train': 1.7570000886917114} -11/07/2021 02:33:12 - INFO - __main__ - Step 37823: {'lr': 0.00043114133937264843, 'samples': 7262016, 'steps': 37822, 'loss/train': 1.4681305885314941} -11/07/2021 02:33:13 - INFO - __main__ - Step 37824: {'lr': 0.000431137681891285, 'samples': 7262208, 'steps': 37823, 'loss/train': 1.901205062866211} -11/07/2021 02:33:14 - INFO - __main__ - Step 37825: {'lr': 0.0004311340243283038, 'samples': 7262400, 'steps': 37824, 'loss/train': 2.0343801975250244} -11/07/2021 02:33:14 - INFO - __main__ - Step 37826: {'lr': 0.0004311303666837064, 'samples': 7262592, 'steps': 37825, 'loss/train': 1.4734593629837036} -11/07/2021 02:33:14 - INFO - __main__ - Step 37827: {'lr': 0.0004311267089574944, 'samples': 7262784, 'steps': 37826, 'loss/train': 1.7053385972976685} -11/07/2021 02:33:15 - INFO - __main__ - Step 37828: {'lr': 0.00043112305114966957, 'samples': 7262976, 'steps': 37827, 'loss/train': 0.6940966248512268} -11/07/2021 02:33:16 - INFO - __main__ - Step 37829: {'lr': 0.0004311193932602334, 'samples': 7263168, 'steps': 37828, 'loss/train': 1.3707382678985596} -11/07/2021 02:33:16 - INFO - __main__ - Step 37830: {'lr': 0.0004311157352891877, 'samples': 7263360, 'steps': 37829, 'loss/train': 1.5984339714050293} -11/07/2021 02:33:16 - INFO - __main__ - Step 37831: {'lr': 0.000431112077236534, 'samples': 7263552, 'steps': 37830, 'loss/train': 1.326088547706604} -11/07/2021 02:33:17 - INFO - __main__ - Step 37832: {'lr': 0.0004311084191022741, 'samples': 7263744, 'steps': 37831, 'loss/train': 1.5728517770767212} -11/07/2021 02:33:17 - INFO - __main__ - Step 37833: {'lr': 0.00043110476088640935, 'samples': 7263936, 'steps': 37832, 'loss/train': 1.3312963247299194} -11/07/2021 02:33:18 - INFO - __main__ - Step 37834: {'lr': 0.00043110110258894177, 'samples': 7264128, 'steps': 37833, 'loss/train': 1.6761177778244019} -11/07/2021 02:33:18 - INFO - __main__ - Step 37835: {'lr': 0.00043109744420987274, 'samples': 7264320, 'steps': 37834, 'loss/train': 1.7098302841186523} -11/07/2021 02:33:19 - INFO - __main__ - Step 37836: {'lr': 0.000431093785749204, 'samples': 7264512, 'steps': 37835, 'loss/train': 1.6409319639205933} -11/07/2021 02:33:19 - INFO - __main__ - Step 37837: {'lr': 0.00043109012720693717, 'samples': 7264704, 'steps': 37836, 'loss/train': 1.404793381690979} -11/07/2021 02:33:19 - INFO - __main__ - Step 37838: {'lr': 0.000431086468583074, 'samples': 7264896, 'steps': 37837, 'loss/train': 1.2502204179763794} -11/07/2021 02:33:20 - INFO - __main__ - Step 37839: {'lr': 0.00043108280987761593, 'samples': 7265088, 'steps': 37838, 'loss/train': 2.034834146499634} -11/07/2021 02:33:21 - INFO - __main__ - Step 37840: {'lr': 0.0004310791510905649, 'samples': 7265280, 'steps': 37839, 'loss/train': 1.233948826789856} -11/07/2021 02:33:22 - INFO - __main__ - Step 37841: {'lr': 0.00043107549222192235, 'samples': 7265472, 'steps': 37840, 'loss/train': 0.8641500473022461} -11/07/2021 02:33:22 - INFO - __main__ - Step 37842: {'lr': 0.0004310718332716899, 'samples': 7265664, 'steps': 37841, 'loss/train': 0.9060410261154175} -11/07/2021 02:33:22 - INFO - __main__ - Step 37843: {'lr': 0.00043106817423986933, 'samples': 7265856, 'steps': 37842, 'loss/train': 1.6606569290161133} -11/07/2021 02:33:23 - INFO - __main__ - Step 37844: {'lr': 0.00043106451512646226, 'samples': 7266048, 'steps': 37843, 'loss/train': 1.746648907661438} -11/07/2021 02:33:24 - INFO - __main__ - Step 37845: {'lr': 0.00043106085593147027, 'samples': 7266240, 'steps': 37844, 'loss/train': 2.3888840675354004} -11/07/2021 02:33:24 - INFO - __main__ - Step 37846: {'lr': 0.00043105719665489505, 'samples': 7266432, 'steps': 37845, 'loss/train': 2.0307137966156006} -11/07/2021 02:33:24 - INFO - __main__ - Step 37847: {'lr': 0.0004310535372967383, 'samples': 7266624, 'steps': 37846, 'loss/train': 1.5262460708618164} -11/07/2021 02:33:25 - INFO - __main__ - Step 37848: {'lr': 0.0004310498778570016, 'samples': 7266816, 'steps': 37847, 'loss/train': 1.5267208814620972} -11/07/2021 02:33:25 - INFO - __main__ - Step 37849: {'lr': 0.0004310462183356866, 'samples': 7267008, 'steps': 37848, 'loss/train': 1.6285754442214966} -11/07/2021 02:33:26 - INFO - __main__ - Step 37850: {'lr': 0.00043104255873279497, 'samples': 7267200, 'steps': 37849, 'loss/train': 1.5782309770584106} -11/07/2021 02:33:26 - INFO - __main__ - Step 37851: {'lr': 0.00043103889904832837, 'samples': 7267392, 'steps': 37850, 'loss/train': 1.5631217956542969} -11/07/2021 02:33:27 - INFO - __main__ - Step 37852: {'lr': 0.0004310352392822884, 'samples': 7267584, 'steps': 37851, 'loss/train': 1.2980358600616455} -11/07/2021 02:33:27 - INFO - __main__ - Step 37853: {'lr': 0.00043103157943467674, 'samples': 7267776, 'steps': 37852, 'loss/train': 1.319003939628601} -11/07/2021 02:33:27 - INFO - __main__ - Step 37854: {'lr': 0.00043102791950549513, 'samples': 7267968, 'steps': 37853, 'loss/train': 1.1419496536254883} -11/07/2021 02:33:28 - INFO - __main__ - Step 37855: {'lr': 0.00043102425949474504, 'samples': 7268160, 'steps': 37854, 'loss/train': 0.9001447558403015} -11/07/2021 02:33:29 - INFO - __main__ - Step 37856: {'lr': 0.00043102059940242825, 'samples': 7268352, 'steps': 37855, 'loss/train': 1.6300129890441895} -11/07/2021 02:33:29 - INFO - __main__ - Step 37857: {'lr': 0.0004310169392285464, 'samples': 7268544, 'steps': 37856, 'loss/train': 1.0531177520751953} -11/07/2021 02:33:30 - INFO - __main__ - Step 37858: {'lr': 0.0004310132789731011, 'samples': 7268736, 'steps': 37857, 'loss/train': 0.9698438048362732} -11/07/2021 02:33:30 - INFO - __main__ - Step 37859: {'lr': 0.000431009618636094, 'samples': 7268928, 'steps': 37858, 'loss/train': 2.036407232284546} -11/07/2021 02:33:31 - INFO - __main__ - Step 37860: {'lr': 0.00043100595821752674, 'samples': 7269120, 'steps': 37859, 'loss/train': 1.3307468891143799} -11/07/2021 02:33:31 - INFO - __main__ - Step 37861: {'lr': 0.00043100229771740096, 'samples': 7269312, 'steps': 37860, 'loss/train': 1.7175347805023193} -11/07/2021 02:33:32 - INFO - __main__ - Step 37862: {'lr': 0.0004309986371357184, 'samples': 7269504, 'steps': 37861, 'loss/train': 1.4010646343231201} -11/07/2021 02:33:32 - INFO - __main__ - Step 37863: {'lr': 0.00043099497647248065, 'samples': 7269696, 'steps': 37862, 'loss/train': 1.5942286252975464} -11/07/2021 02:33:32 - INFO - __main__ - Step 37864: {'lr': 0.00043099131572768936, 'samples': 7269888, 'steps': 37863, 'loss/train': 1.4234338998794556} -11/07/2021 02:33:33 - INFO - __main__ - Step 37865: {'lr': 0.00043098765490134607, 'samples': 7270080, 'steps': 37864, 'loss/train': 1.3859913349151611} -11/07/2021 02:33:34 - INFO - __main__ - Step 37866: {'lr': 0.00043098399399345267, 'samples': 7270272, 'steps': 37865, 'loss/train': 1.5256638526916504} -11/07/2021 02:33:34 - INFO - __main__ - Step 37867: {'lr': 0.0004309803330040106, 'samples': 7270464, 'steps': 37866, 'loss/train': 1.1439716815948486} -11/07/2021 02:33:34 - INFO - __main__ - Step 37868: {'lr': 0.0004309766719330216, 'samples': 7270656, 'steps': 37867, 'loss/train': 1.7910076379776} -11/07/2021 02:33:35 - INFO - __main__ - Step 37869: {'lr': 0.00043097301078048736, 'samples': 7270848, 'steps': 37868, 'loss/train': 2.2756893634796143} -11/07/2021 02:33:35 - INFO - __main__ - Step 37870: {'lr': 0.00043096934954640935, 'samples': 7271040, 'steps': 37869, 'loss/train': 0.8272931575775146} -11/07/2021 02:33:36 - INFO - __main__ - Step 37871: {'lr': 0.0004309656882307894, 'samples': 7271232, 'steps': 37870, 'loss/train': 1.467457890510559} -11/07/2021 02:33:36 - INFO - __main__ - Step 37872: {'lr': 0.0004309620268336292, 'samples': 7271424, 'steps': 37871, 'loss/train': 1.2793571949005127} -11/07/2021 02:33:37 - INFO - __main__ - Step 37873: {'lr': 0.0004309583653549302, 'samples': 7271616, 'steps': 37872, 'loss/train': 1.2705497741699219} -11/07/2021 02:33:37 - INFO - __main__ - Step 37874: {'lr': 0.0004309547037946941, 'samples': 7271808, 'steps': 37873, 'loss/train': 1.276893138885498} -11/07/2021 02:33:37 - INFO - __main__ - Step 37875: {'lr': 0.0004309510421529227, 'samples': 7272000, 'steps': 37874, 'loss/train': 1.6498548984527588} -11/07/2021 02:33:39 - INFO - __main__ - Step 37876: {'lr': 0.00043094738042961754, 'samples': 7272192, 'steps': 37875, 'loss/train': 1.8039900064468384} -11/07/2021 02:33:39 - INFO - __main__ - Step 37877: {'lr': 0.0004309437186247803, 'samples': 7272384, 'steps': 37876, 'loss/train': 1.3540936708450317} -11/07/2021 02:33:39 - INFO - __main__ - Step 37878: {'lr': 0.00043094005673841257, 'samples': 7272576, 'steps': 37877, 'loss/train': 1.3922836780548096} -11/07/2021 02:33:40 - INFO - __main__ - Step 37879: {'lr': 0.00043093639477051606, 'samples': 7272768, 'steps': 37878, 'loss/train': 1.6267963647842407} -11/07/2021 02:33:40 - INFO - __main__ - Step 37880: {'lr': 0.0004309327327210923, 'samples': 7272960, 'steps': 37879, 'loss/train': 1.459894061088562} -11/07/2021 02:33:41 - INFO - __main__ - Step 37881: {'lr': 0.00043092907059014325, 'samples': 7273152, 'steps': 37880, 'loss/train': 1.5659189224243164} -11/07/2021 02:33:41 - INFO - __main__ - Step 37882: {'lr': 0.00043092540837767025, 'samples': 7273344, 'steps': 37881, 'loss/train': 1.1091625690460205} -11/07/2021 02:33:42 - INFO - __main__ - Step 37883: {'lr': 0.000430921746083675, 'samples': 7273536, 'steps': 37882, 'loss/train': 1.4476122856140137} -11/07/2021 02:33:42 - INFO - __main__ - Step 37884: {'lr': 0.00043091808370815935, 'samples': 7273728, 'steps': 37883, 'loss/train': 5.744571685791016} -11/07/2021 02:33:42 - INFO - __main__ - Step 37885: {'lr': 0.0004309144212511246, 'samples': 7273920, 'steps': 37884, 'loss/train': 2.258639097213745} -11/07/2021 02:33:43 - INFO - __main__ - Step 37886: {'lr': 0.00043091075871257275, 'samples': 7274112, 'steps': 37885, 'loss/train': 1.553177833557129} -11/07/2021 02:33:44 - INFO - __main__ - Step 37887: {'lr': 0.0004309070960925052, 'samples': 7274304, 'steps': 37886, 'loss/train': 1.8596436977386475} -11/07/2021 02:33:44 - INFO - __main__ - Step 37888: {'lr': 0.0004309034333909238, 'samples': 7274496, 'steps': 37887, 'loss/train': 0.9980459809303284} -11/07/2021 02:33:45 - INFO - __main__ - Step 37889: {'lr': 0.0004308997706078301, 'samples': 7274688, 'steps': 37888, 'loss/train': 1.687778115272522} -11/07/2021 02:33:45 - INFO - __main__ - Step 37890: {'lr': 0.00043089610774322575, 'samples': 7274880, 'steps': 37889, 'loss/train': 1.6858359575271606} -11/07/2021 02:33:45 - INFO - __main__ - Step 37891: {'lr': 0.00043089244479711233, 'samples': 7275072, 'steps': 37890, 'loss/train': 1.6822612285614014} -11/07/2021 02:33:46 - INFO - __main__ - Step 37892: {'lr': 0.00043088878176949163, 'samples': 7275264, 'steps': 37891, 'loss/train': 1.539404273033142} -11/07/2021 02:33:47 - INFO - __main__ - Step 37893: {'lr': 0.0004308851186603652, 'samples': 7275456, 'steps': 37892, 'loss/train': 1.781607985496521} -11/07/2021 02:33:47 - INFO - __main__ - Step 37894: {'lr': 0.0004308814554697348, 'samples': 7275648, 'steps': 37893, 'loss/train': 1.5547536611557007} -11/07/2021 02:33:47 - INFO - __main__ - Step 37895: {'lr': 0.0004308777921976019, 'samples': 7275840, 'steps': 37894, 'loss/train': 1.359387993812561} -11/07/2021 02:33:48 - INFO - __main__ - Step 37896: {'lr': 0.00043087412884396835, 'samples': 7276032, 'steps': 37895, 'loss/train': 1.5210968255996704} -11/07/2021 02:33:49 - INFO - __main__ - Step 37897: {'lr': 0.0004308704654088357, 'samples': 7276224, 'steps': 37896, 'loss/train': 1.327373743057251} -11/07/2021 02:33:50 - INFO - __main__ - Step 37898: {'lr': 0.00043086680189220554, 'samples': 7276416, 'steps': 37897, 'loss/train': 1.487549901008606} -11/07/2021 02:33:50 - INFO - __main__ - Step 37899: {'lr': 0.00043086313829407966, 'samples': 7276608, 'steps': 37898, 'loss/train': 1.7413653135299683} -11/07/2021 02:33:50 - INFO - __main__ - Step 37900: {'lr': 0.0004308594746144596, 'samples': 7276800, 'steps': 37899, 'loss/train': 1.532272219657898} -11/07/2021 02:33:51 - INFO - __main__ - Step 37901: {'lr': 0.0004308558108533471, 'samples': 7276992, 'steps': 37900, 'loss/train': 0.5073288679122925} -11/07/2021 02:33:52 - INFO - __main__ - Step 37902: {'lr': 0.0004308521470107437, 'samples': 7277184, 'steps': 37901, 'loss/train': 0.9130961894989014} -11/07/2021 02:33:52 - INFO - __main__ - Step 37903: {'lr': 0.00043084848308665115, 'samples': 7277376, 'steps': 37902, 'loss/train': 1.5158967971801758} -11/07/2021 02:33:52 - INFO - __main__ - Step 37904: {'lr': 0.00043084481908107103, 'samples': 7277568, 'steps': 37903, 'loss/train': 1.6894845962524414} -11/07/2021 02:33:53 - INFO - __main__ - Step 37905: {'lr': 0.00043084115499400505, 'samples': 7277760, 'steps': 37904, 'loss/train': 1.2803417444229126} -11/07/2021 02:33:53 - INFO - __main__ - Step 37906: {'lr': 0.0004308374908254549, 'samples': 7277952, 'steps': 37905, 'loss/train': 1.5752876996994019} -11/07/2021 02:33:54 - INFO - __main__ - Step 37907: {'lr': 0.000430833826575422, 'samples': 7278144, 'steps': 37906, 'loss/train': 1.7972919940948486} -11/07/2021 02:33:55 - INFO - __main__ - Step 37908: {'lr': 0.0004308301622439083, 'samples': 7278336, 'steps': 37907, 'loss/train': 0.9065421223640442} -11/07/2021 02:33:55 - INFO - __main__ - Step 37909: {'lr': 0.0004308264978309153, 'samples': 7278528, 'steps': 37908, 'loss/train': 1.333460807800293} -11/07/2021 02:33:55 - INFO - __main__ - Step 37910: {'lr': 0.0004308228333364447, 'samples': 7278720, 'steps': 37909, 'loss/train': 1.5436149835586548} -11/07/2021 02:33:56 - INFO - __main__ - Step 37911: {'lr': 0.000430819168760498, 'samples': 7278912, 'steps': 37910, 'loss/train': 1.4273598194122314} -11/07/2021 02:33:56 - INFO - __main__ - Step 37912: {'lr': 0.0004308155041030771, 'samples': 7279104, 'steps': 37911, 'loss/train': 1.3679322004318237} -11/07/2021 02:33:57 - INFO - __main__ - Step 37913: {'lr': 0.00043081183936418343, 'samples': 7279296, 'steps': 37912, 'loss/train': 1.7382436990737915} -11/07/2021 02:33:57 - INFO - __main__ - Step 37914: {'lr': 0.0004308081745438188, 'samples': 7279488, 'steps': 37913, 'loss/train': 1.7539761066436768} -11/07/2021 02:33:58 - INFO - __main__ - Step 37915: {'lr': 0.00043080450964198483, 'samples': 7279680, 'steps': 37914, 'loss/train': 1.1099629402160645} -11/07/2021 02:33:58 - INFO - __main__ - Step 37916: {'lr': 0.00043080084465868307, 'samples': 7279872, 'steps': 37915, 'loss/train': 1.9730298519134521} -11/07/2021 02:33:58 - INFO - __main__ - Step 37917: {'lr': 0.0004307971795939152, 'samples': 7280064, 'steps': 37916, 'loss/train': 1.7470884323120117} -11/07/2021 02:33:59 - INFO - __main__ - Step 37918: {'lr': 0.000430793514447683, 'samples': 7280256, 'steps': 37917, 'loss/train': 1.3940391540527344} -11/07/2021 02:34:00 - INFO - __main__ - Step 37919: {'lr': 0.000430789849219988, 'samples': 7280448, 'steps': 37918, 'loss/train': 1.257074236869812} -11/07/2021 02:34:00 - INFO - __main__ - Step 37920: {'lr': 0.0004307861839108319, 'samples': 7280640, 'steps': 37919, 'loss/train': 1.2887773513793945} -11/07/2021 02:34:01 - INFO - __main__ - Step 37921: {'lr': 0.00043078251852021634, 'samples': 7280832, 'steps': 37920, 'loss/train': 1.6662101745605469} -11/07/2021 02:34:01 - INFO - __main__ - Step 37922: {'lr': 0.0004307788530481429, 'samples': 7281024, 'steps': 37921, 'loss/train': 1.563852071762085} -11/07/2021 02:34:02 - INFO - __main__ - Step 37923: {'lr': 0.00043077518749461336, 'samples': 7281216, 'steps': 37922, 'loss/train': 1.7499343156814575} -11/07/2021 02:34:02 - INFO - __main__ - Step 37924: {'lr': 0.00043077152185962933, 'samples': 7281408, 'steps': 37923, 'loss/train': 1.418026328086853} -11/07/2021 02:34:03 - INFO - __main__ - Step 37925: {'lr': 0.00043076785614319234, 'samples': 7281600, 'steps': 37924, 'loss/train': 1.733856201171875} -11/07/2021 02:34:03 - INFO - __main__ - Step 37926: {'lr': 0.0004307641903453042, 'samples': 7281792, 'steps': 37925, 'loss/train': 1.2359224557876587} -11/07/2021 02:34:03 - INFO - __main__ - Step 37927: {'lr': 0.00043076052446596656, 'samples': 7281984, 'steps': 37926, 'loss/train': 1.7876313924789429} -11/07/2021 02:34:04 - INFO - __main__ - Step 37928: {'lr': 0.000430756858505181, 'samples': 7282176, 'steps': 37927, 'loss/train': 1.8781075477600098} -11/07/2021 02:34:05 - INFO - __main__ - Step 37929: {'lr': 0.00043075319246294914, 'samples': 7282368, 'steps': 37928, 'loss/train': 1.6325830221176147} -11/07/2021 02:34:05 - INFO - __main__ - Step 37930: {'lr': 0.0004307495263392727, 'samples': 7282560, 'steps': 37929, 'loss/train': 1.660241961479187} -11/07/2021 02:34:05 - INFO - __main__ - Step 37931: {'lr': 0.00043074586013415337, 'samples': 7282752, 'steps': 37930, 'loss/train': 1.76328444480896} -11/07/2021 02:34:06 - INFO - __main__ - Step 37932: {'lr': 0.0004307421938475926, 'samples': 7282944, 'steps': 37931, 'loss/train': 1.3810811042785645} -11/07/2021 02:34:06 - INFO - __main__ - Step 37933: {'lr': 0.0004307385274795923, 'samples': 7283136, 'steps': 37932, 'loss/train': 1.5373013019561768} -11/07/2021 02:34:07 - INFO - __main__ - Step 37934: {'lr': 0.000430734861030154, 'samples': 7283328, 'steps': 37933, 'loss/train': 1.6717209815979004} -11/07/2021 02:34:07 - INFO - __main__ - Step 37935: {'lr': 0.0004307311944992793, 'samples': 7283520, 'steps': 37934, 'loss/train': 1.2602779865264893} -11/07/2021 02:34:08 - INFO - __main__ - Step 37936: {'lr': 0.00043072752788697003, 'samples': 7283712, 'steps': 37935, 'loss/train': 1.6329361200332642} -11/07/2021 02:34:08 - INFO - __main__ - Step 37937: {'lr': 0.0004307238611932276, 'samples': 7283904, 'steps': 37936, 'loss/train': 1.5360777378082275} -11/07/2021 02:34:08 - INFO - __main__ - Step 37938: {'lr': 0.00043072019441805386, 'samples': 7284096, 'steps': 37937, 'loss/train': 1.425024390220642} -11/07/2021 02:34:11 - INFO - __main__ - Step 37939: {'lr': 0.00043071652756145035, 'samples': 7284288, 'steps': 37938, 'loss/train': 1.440492033958435} -11/07/2021 02:34:11 - INFO - __main__ - Step 37940: {'lr': 0.0004307128606234188, 'samples': 7284480, 'steps': 37939, 'loss/train': 1.5482230186462402} -11/07/2021 02:34:11 - INFO - __main__ - Step 37941: {'lr': 0.00043070919360396076, 'samples': 7284672, 'steps': 37940, 'loss/train': 1.8059606552124023} -11/07/2021 02:34:12 - INFO - __main__ - Step 37942: {'lr': 0.00043070552650307804, 'samples': 7284864, 'steps': 37941, 'loss/train': 1.8094056844711304} -11/07/2021 02:34:12 - INFO - __main__ - Step 37943: {'lr': 0.0004307018593207721, 'samples': 7285056, 'steps': 37942, 'loss/train': 1.8075382709503174} -11/07/2021 02:34:12 - INFO - __main__ - Step 37944: {'lr': 0.0004306981920570447, 'samples': 7285248, 'steps': 37943, 'loss/train': 1.4249544143676758} -11/07/2021 02:34:13 - INFO - __main__ - Step 37945: {'lr': 0.00043069452471189765, 'samples': 7285440, 'steps': 37944, 'loss/train': 1.518310308456421} -11/07/2021 02:34:14 - INFO - __main__ - Step 37946: {'lr': 0.00043069085728533225, 'samples': 7285632, 'steps': 37945, 'loss/train': 1.5919995307922363} -11/07/2021 02:34:14 - INFO - __main__ - Step 37947: {'lr': 0.0004306871897773504, 'samples': 7285824, 'steps': 37946, 'loss/train': 1.625312328338623} -11/07/2021 02:34:15 - INFO - __main__ - Step 37948: {'lr': 0.0004306835221879537, 'samples': 7286016, 'steps': 37947, 'loss/train': 1.3613947629928589} -11/07/2021 02:34:15 - INFO - __main__ - Step 37949: {'lr': 0.00043067985451714373, 'samples': 7286208, 'steps': 37948, 'loss/train': 1.5056431293487549} -11/07/2021 02:34:15 - INFO - __main__ - Step 37950: {'lr': 0.0004306761867649223, 'samples': 7286400, 'steps': 37949, 'loss/train': 1.7206279039382935} -11/07/2021 02:34:16 - INFO - __main__ - Step 37951: {'lr': 0.0004306725189312909, 'samples': 7286592, 'steps': 37950, 'loss/train': 1.5456422567367554} -11/07/2021 02:34:17 - INFO - __main__ - Step 37952: {'lr': 0.00043066885101625133, 'samples': 7286784, 'steps': 37951, 'loss/train': 1.7271060943603516} -11/07/2021 02:34:17 - INFO - __main__ - Step 37953: {'lr': 0.00043066518301980504, 'samples': 7286976, 'steps': 37952, 'loss/train': 1.534792423248291} -11/07/2021 02:34:17 - INFO - __main__ - Step 37954: {'lr': 0.00043066151494195387, 'samples': 7287168, 'steps': 37953, 'loss/train': 1.1038849353790283} -11/07/2021 02:34:18 - INFO - __main__ - Step 37955: {'lr': 0.00043065784678269944, 'samples': 7287360, 'steps': 37954, 'loss/train': 1.5833653211593628} -11/07/2021 02:34:18 - INFO - __main__ - Step 37956: {'lr': 0.00043065417854204333, 'samples': 7287552, 'steps': 37955, 'loss/train': 1.7715234756469727} -11/07/2021 02:34:19 - INFO - __main__ - Step 37957: {'lr': 0.0004306505102199872, 'samples': 7287744, 'steps': 37956, 'loss/train': 1.5732712745666504} -11/07/2021 02:34:19 - INFO - __main__ - Step 37958: {'lr': 0.0004306468418165328, 'samples': 7287936, 'steps': 37957, 'loss/train': 1.638083815574646} -11/07/2021 02:34:20 - INFO - __main__ - Step 37959: {'lr': 0.0004306431733316817, 'samples': 7288128, 'steps': 37958, 'loss/train': 1.445956826210022} -11/07/2021 02:34:20 - INFO - __main__ - Step 37960: {'lr': 0.00043063950476543563, 'samples': 7288320, 'steps': 37959, 'loss/train': 2.0494678020477295} -11/07/2021 02:34:20 - INFO - __main__ - Step 37961: {'lr': 0.0004306358361177961, 'samples': 7288512, 'steps': 37960, 'loss/train': 1.6257449388504028} -11/07/2021 02:34:22 - INFO - __main__ - Step 37962: {'lr': 0.00043063216738876487, 'samples': 7288704, 'steps': 37961, 'loss/train': 1.5832840204238892} -11/07/2021 02:34:22 - INFO - __main__ - Step 37963: {'lr': 0.0004306284985783436, 'samples': 7288896, 'steps': 37962, 'loss/train': 1.6308826208114624} -11/07/2021 02:34:22 - INFO - __main__ - Step 37964: {'lr': 0.00043062482968653394, 'samples': 7289088, 'steps': 37963, 'loss/train': 1.5397615432739258} -11/07/2021 02:34:23 - INFO - __main__ - Step 37965: {'lr': 0.00043062116071333745, 'samples': 7289280, 'steps': 37964, 'loss/train': 1.1325451135635376} -11/07/2021 02:34:23 - INFO - __main__ - Step 37966: {'lr': 0.0004306174916587559, 'samples': 7289472, 'steps': 37965, 'loss/train': 1.169539451599121} -11/07/2021 02:34:24 - INFO - __main__ - Step 37967: {'lr': 0.0004306138225227909, 'samples': 7289664, 'steps': 37966, 'loss/train': 1.4744054079055786} -11/07/2021 02:34:25 - INFO - __main__ - Step 37968: {'lr': 0.0004306101533054441, 'samples': 7289856, 'steps': 37967, 'loss/train': 1.580784559249878} -11/07/2021 02:34:25 - INFO - __main__ - Step 37969: {'lr': 0.0004306064840067171, 'samples': 7290048, 'steps': 37968, 'loss/train': 1.974003553390503} -11/07/2021 02:34:25 - INFO - __main__ - Step 37970: {'lr': 0.00043060281462661165, 'samples': 7290240, 'steps': 37969, 'loss/train': 0.612262487411499} -11/07/2021 02:34:26 - INFO - __main__ - Step 37971: {'lr': 0.0004305991451651293, 'samples': 7290432, 'steps': 37970, 'loss/train': 1.509476661682129} -11/07/2021 02:34:27 - INFO - __main__ - Step 37972: {'lr': 0.00043059547562227185, 'samples': 7290624, 'steps': 37971, 'loss/train': 1.5636862516403198} -11/07/2021 02:34:27 - INFO - __main__ - Step 37973: {'lr': 0.0004305918059980408, 'samples': 7290816, 'steps': 37972, 'loss/train': 1.6018271446228027} -11/07/2021 02:34:28 - INFO - __main__ - Step 37974: {'lr': 0.00043058813629243787, 'samples': 7291008, 'steps': 37973, 'loss/train': 1.2701356410980225} -11/07/2021 02:34:28 - INFO - __main__ - Step 37975: {'lr': 0.0004305844665054648, 'samples': 7291200, 'steps': 37974, 'loss/train': 1.5594356060028076} -11/07/2021 02:34:28 - INFO - __main__ - Step 37976: {'lr': 0.00043058079663712304, 'samples': 7291392, 'steps': 37975, 'loss/train': 1.4831064939498901} -11/07/2021 02:34:30 - INFO - __main__ - Step 37977: {'lr': 0.00043057712668741443, 'samples': 7291584, 'steps': 37976, 'loss/train': 1.7999645471572876} -11/07/2021 02:34:30 - INFO - __main__ - Step 37978: {'lr': 0.0004305734566563405, 'samples': 7291776, 'steps': 37977, 'loss/train': 1.4681727886199951} -11/07/2021 02:34:31 - INFO - __main__ - Step 37979: {'lr': 0.000430569786543903, 'samples': 7291968, 'steps': 37978, 'loss/train': 1.2198891639709473} -11/07/2021 02:34:31 - INFO - __main__ - Step 37980: {'lr': 0.00043056611635010355, 'samples': 7292160, 'steps': 37979, 'loss/train': 1.8494244813919067} -11/07/2021 02:34:31 - INFO - __main__ - Step 37981: {'lr': 0.00043056244607494375, 'samples': 7292352, 'steps': 37980, 'loss/train': 1.7782717943191528} -11/07/2021 02:34:32 - INFO - __main__ - Step 37982: {'lr': 0.0004305587757184254, 'samples': 7292544, 'steps': 37981, 'loss/train': 1.644851565361023} -11/07/2021 02:34:32 - INFO - __main__ - Step 37983: {'lr': 0.0004305551052805499, 'samples': 7292736, 'steps': 37982, 'loss/train': 1.0468441247940063} -11/07/2021 02:34:34 - INFO - __main__ - Step 37984: {'lr': 0.0004305514347613191, 'samples': 7292928, 'steps': 37983, 'loss/train': 1.4788124561309814} -11/07/2021 02:34:34 - INFO - __main__ - Step 37985: {'lr': 0.0004305477641607347, 'samples': 7293120, 'steps': 37984, 'loss/train': 1.492355227470398} -11/07/2021 02:34:34 - INFO - __main__ - Step 37986: {'lr': 0.0004305440934787982, 'samples': 7293312, 'steps': 37985, 'loss/train': 1.895719289779663} -11/07/2021 02:34:35 - INFO - __main__ - Step 37987: {'lr': 0.0004305404227155113, 'samples': 7293504, 'steps': 37986, 'loss/train': 1.0172924995422363} -11/07/2021 02:34:35 - INFO - __main__ - Step 37988: {'lr': 0.0004305367518708757, 'samples': 7293696, 'steps': 37987, 'loss/train': 1.722000241279602} -11/07/2021 02:34:35 - INFO - __main__ - Step 37989: {'lr': 0.000430533080944893, 'samples': 7293888, 'steps': 37988, 'loss/train': 1.4645875692367554} -11/07/2021 02:34:37 - INFO - __main__ - Step 37990: {'lr': 0.00043052940993756493, 'samples': 7294080, 'steps': 37989, 'loss/train': 1.7487901449203491} -11/07/2021 02:34:37 - INFO - __main__ - Step 37991: {'lr': 0.00043052573884889305, 'samples': 7294272, 'steps': 37990, 'loss/train': 1.0233213901519775} -11/07/2021 02:34:37 - INFO - __main__ - Step 37992: {'lr': 0.00043052206767887907, 'samples': 7294464, 'steps': 37991, 'loss/train': 2.0673677921295166} -11/07/2021 02:34:38 - INFO - __main__ - Step 37993: {'lr': 0.00043051839642752466, 'samples': 7294656, 'steps': 37992, 'loss/train': 1.400230050086975} -11/07/2021 02:34:38 - INFO - __main__ - Step 37994: {'lr': 0.00043051472509483135, 'samples': 7294848, 'steps': 37993, 'loss/train': 1.6917005777359009} -11/07/2021 02:34:39 - INFO - __main__ - Step 37995: {'lr': 0.00043051105368080103, 'samples': 7295040, 'steps': 37994, 'loss/train': 1.5717216730117798} -11/07/2021 02:34:39 - INFO - __main__ - Step 37996: {'lr': 0.00043050738218543505, 'samples': 7295232, 'steps': 37995, 'loss/train': 1.281235694885254} -11/07/2021 02:34:40 - INFO - __main__ - Step 37997: {'lr': 0.00043050371060873537, 'samples': 7295424, 'steps': 37996, 'loss/train': 1.25249445438385} -11/07/2021 02:34:40 - INFO - __main__ - Step 37998: {'lr': 0.00043050003895070345, 'samples': 7295616, 'steps': 37997, 'loss/train': 1.582495927810669} -11/07/2021 02:34:40 - INFO - __main__ - Step 37999: {'lr': 0.000430496367211341, 'samples': 7295808, 'steps': 37998, 'loss/train': 1.7385200262069702} -11/07/2021 02:34:41 - INFO - __main__ - Step 38000: {'lr': 0.00043049269539064967, 'samples': 7296000, 'steps': 37999, 'loss/train': 1.301990270614624} -11/07/2021 02:34:42 - INFO - __main__ - Step 38001: {'lr': 0.0004304890234886311, 'samples': 7296192, 'steps': 38000, 'loss/train': 1.387725830078125} -11/07/2021 02:34:42 - INFO - __main__ - Step 38002: {'lr': 0.000430485351505287, 'samples': 7296384, 'steps': 38001, 'loss/train': 1.957288146018982} -11/07/2021 02:34:42 - INFO - __main__ - Step 38003: {'lr': 0.000430481679440619, 'samples': 7296576, 'steps': 38002, 'loss/train': 0.9746781587600708} -11/07/2021 02:34:43 - INFO - __main__ - Step 38004: {'lr': 0.0004304780072946287, 'samples': 7296768, 'steps': 38003, 'loss/train': 1.7512469291687012} -11/07/2021 02:34:44 - INFO - __main__ - Step 38005: {'lr': 0.00043047433506731783, 'samples': 7296960, 'steps': 38004, 'loss/train': 1.5505845546722412} -11/07/2021 02:34:44 - INFO - __main__ - Step 38006: {'lr': 0.00043047066275868795, 'samples': 7297152, 'steps': 38005, 'loss/train': 1.0482814311981201} -11/07/2021 02:34:45 - INFO - __main__ - Step 38007: {'lr': 0.0004304669903687408, 'samples': 7297344, 'steps': 38006, 'loss/train': 0.8675975799560547} -11/07/2021 02:34:45 - INFO - __main__ - Step 38008: {'lr': 0.000430463317897478, 'samples': 7297536, 'steps': 38007, 'loss/train': 2.2233479022979736} -11/07/2021 02:34:45 - INFO - __main__ - Step 38009: {'lr': 0.0004304596453449012, 'samples': 7297728, 'steps': 38008, 'loss/train': 1.630285382270813} -11/07/2021 02:34:46 - INFO - __main__ - Step 38010: {'lr': 0.0004304559727110121, 'samples': 7297920, 'steps': 38009, 'loss/train': 1.7070844173431396} -11/07/2021 02:34:47 - INFO - __main__ - Step 38011: {'lr': 0.0004304522999958124, 'samples': 7298112, 'steps': 38010, 'loss/train': 2.6189193725585938} -11/07/2021 02:34:47 - INFO - __main__ - Step 38012: {'lr': 0.00043044862719930356, 'samples': 7298304, 'steps': 38011, 'loss/train': 1.5570639371871948} -11/07/2021 02:34:47 - INFO - __main__ - Step 38013: {'lr': 0.0004304449543214874, 'samples': 7298496, 'steps': 38012, 'loss/train': 2.0051374435424805} -11/07/2021 02:34:48 - INFO - __main__ - Step 38014: {'lr': 0.0004304412813623655, 'samples': 7298688, 'steps': 38013, 'loss/train': 1.8789836168289185} -11/07/2021 02:34:48 - INFO - __main__ - Step 38015: {'lr': 0.0004304376083219396, 'samples': 7298880, 'steps': 38014, 'loss/train': 1.4761950969696045} -11/07/2021 02:34:49 - INFO - __main__ - Step 38016: {'lr': 0.00043043393520021125, 'samples': 7299072, 'steps': 38015, 'loss/train': 1.8535746335983276} -11/07/2021 02:34:50 - INFO - __main__ - Step 38017: {'lr': 0.0004304302619971822, 'samples': 7299264, 'steps': 38016, 'loss/train': 1.2162835597991943} -11/07/2021 02:34:50 - INFO - __main__ - Step 38018: {'lr': 0.000430426588712854, 'samples': 7299456, 'steps': 38017, 'loss/train': 1.473557710647583} -11/07/2021 02:34:50 - INFO - __main__ - Step 38019: {'lr': 0.0004304229153472283, 'samples': 7299648, 'steps': 38018, 'loss/train': 1.200123906135559} -11/07/2021 02:34:51 - INFO - __main__ - Step 38020: {'lr': 0.0004304192419003069, 'samples': 7299840, 'steps': 38019, 'loss/train': 1.2828359603881836} -11/07/2021 02:34:52 - INFO - __main__ - Step 38021: {'lr': 0.0004304155683720914, 'samples': 7300032, 'steps': 38020, 'loss/train': 1.4277637004852295} -11/07/2021 02:34:52 - INFO - __main__ - Step 38022: {'lr': 0.0004304118947625835, 'samples': 7300224, 'steps': 38021, 'loss/train': 1.602111577987671} -11/07/2021 02:34:52 - INFO - __main__ - Step 38023: {'lr': 0.00043040822107178465, 'samples': 7300416, 'steps': 38022, 'loss/train': 1.7993630170822144} -11/07/2021 02:34:53 - INFO - __main__ - Step 38024: {'lr': 0.0004304045472996966, 'samples': 7300608, 'steps': 38023, 'loss/train': 1.5964939594268799} -11/07/2021 02:34:53 - INFO - __main__ - Step 38025: {'lr': 0.0004304008734463212, 'samples': 7300800, 'steps': 38024, 'loss/train': 1.7076945304870605} -11/07/2021 02:34:53 - INFO - __main__ - Step 38026: {'lr': 0.00043039719951165986, 'samples': 7300992, 'steps': 38025, 'loss/train': 1.7546823024749756} -11/07/2021 02:34:54 - INFO - __main__ - Step 38027: {'lr': 0.0004303935254957143, 'samples': 7301184, 'steps': 38026, 'loss/train': 1.6069893836975098} -11/07/2021 02:34:55 - INFO - __main__ - Step 38028: {'lr': 0.0004303898513984863, 'samples': 7301376, 'steps': 38027, 'loss/train': 1.5962930917739868} -11/07/2021 02:34:55 - INFO - __main__ - Step 38029: {'lr': 0.0004303861772199773, 'samples': 7301568, 'steps': 38028, 'loss/train': 1.200292706489563} -11/07/2021 02:34:55 - INFO - __main__ - Step 38030: {'lr': 0.00043038250296018916, 'samples': 7301760, 'steps': 38029, 'loss/train': 0.9734283685684204} -11/07/2021 02:34:56 - INFO - __main__ - Step 38031: {'lr': 0.00043037882861912344, 'samples': 7301952, 'steps': 38030, 'loss/train': 1.5647027492523193} -11/07/2021 02:34:57 - INFO - __main__ - Step 38032: {'lr': 0.00043037515419678174, 'samples': 7302144, 'steps': 38031, 'loss/train': 1.3203153610229492} -11/07/2021 02:34:57 - INFO - __main__ - Step 38033: {'lr': 0.0004303714796931658, 'samples': 7302336, 'steps': 38032, 'loss/train': 1.8147969245910645} -11/07/2021 02:34:58 - INFO - __main__ - Step 38034: {'lr': 0.0004303678051082773, 'samples': 7302528, 'steps': 38033, 'loss/train': 2.1749398708343506} -11/07/2021 02:34:58 - INFO - __main__ - Step 38035: {'lr': 0.00043036413044211786, 'samples': 7302720, 'steps': 38034, 'loss/train': 1.9432387351989746} -11/07/2021 02:34:58 - INFO - __main__ - Step 38036: {'lr': 0.0004303604556946891, 'samples': 7302912, 'steps': 38035, 'loss/train': 1.8085533380508423} -11/07/2021 02:34:59 - INFO - __main__ - Step 38037: {'lr': 0.00043035678086599265, 'samples': 7303104, 'steps': 38036, 'loss/train': 1.323421597480774} -11/07/2021 02:35:00 - INFO - __main__ - Step 38038: {'lr': 0.00043035310595603026, 'samples': 7303296, 'steps': 38037, 'loss/train': 1.8228347301483154} -11/07/2021 02:35:00 - INFO - __main__ - Step 38039: {'lr': 0.00043034943096480357, 'samples': 7303488, 'steps': 38038, 'loss/train': 1.2788726091384888} -11/07/2021 02:35:00 - INFO - __main__ - Step 38040: {'lr': 0.0004303457558923142, 'samples': 7303680, 'steps': 38039, 'loss/train': 0.3434649407863617} -11/07/2021 02:35:01 - INFO - __main__ - Step 38041: {'lr': 0.00043034208073856374, 'samples': 7303872, 'steps': 38040, 'loss/train': 1.8999801874160767} -11/07/2021 02:35:02 - INFO - __main__ - Step 38042: {'lr': 0.000430338405503554, 'samples': 7304064, 'steps': 38041, 'loss/train': 0.8197647929191589} -11/07/2021 02:35:02 - INFO - __main__ - Step 38043: {'lr': 0.00043033473018728655, 'samples': 7304256, 'steps': 38042, 'loss/train': 1.171054482460022} -11/07/2021 02:35:02 - INFO - __main__ - Step 38044: {'lr': 0.00043033105478976306, 'samples': 7304448, 'steps': 38043, 'loss/train': 1.650887131690979} -11/07/2021 02:35:03 - INFO - __main__ - Step 38045: {'lr': 0.00043032737931098517, 'samples': 7304640, 'steps': 38044, 'loss/train': 1.5681344270706177} -11/07/2021 02:35:03 - INFO - __main__ - Step 38046: {'lr': 0.0004303237037509545, 'samples': 7304832, 'steps': 38045, 'loss/train': 1.498640537261963} -11/07/2021 02:35:04 - INFO - __main__ - Step 38047: {'lr': 0.0004303200281096727, 'samples': 7305024, 'steps': 38046, 'loss/train': 0.21930217742919922} -11/07/2021 02:35:05 - INFO - __main__ - Step 38048: {'lr': 0.00043031635238714163, 'samples': 7305216, 'steps': 38047, 'loss/train': 1.0719927549362183} -11/07/2021 02:35:05 - INFO - __main__ - Step 38049: {'lr': 0.00043031267658336276, 'samples': 7305408, 'steps': 38048, 'loss/train': 1.2124830484390259} -11/07/2021 02:35:05 - INFO - __main__ - Step 38050: {'lr': 0.00043030900069833774, 'samples': 7305600, 'steps': 38049, 'loss/train': 1.630570888519287} -11/07/2021 02:35:06 - INFO - __main__ - Step 38051: {'lr': 0.0004303053247320683, 'samples': 7305792, 'steps': 38050, 'loss/train': 1.6434534788131714} -11/07/2021 02:35:07 - INFO - __main__ - Step 38052: {'lr': 0.000430301648684556, 'samples': 7305984, 'steps': 38051, 'loss/train': 1.8277837038040161} -11/07/2021 02:35:07 - INFO - __main__ - Step 38053: {'lr': 0.0004302979725558026, 'samples': 7306176, 'steps': 38052, 'loss/train': 1.3193963766098022} -11/07/2021 02:35:07 - INFO - __main__ - Step 38054: {'lr': 0.0004302942963458097, 'samples': 7306368, 'steps': 38053, 'loss/train': 1.8110835552215576} -11/07/2021 02:35:08 - INFO - __main__ - Step 38055: {'lr': 0.00043029062005457897, 'samples': 7306560, 'steps': 38054, 'loss/train': 1.2935056686401367} -11/07/2021 02:35:08 - INFO - __main__ - Step 38056: {'lr': 0.00043028694368211216, 'samples': 7306752, 'steps': 38055, 'loss/train': 1.2038893699645996} -11/07/2021 02:35:08 - INFO - __main__ - Step 38057: {'lr': 0.00043028326722841073, 'samples': 7306944, 'steps': 38056, 'loss/train': 1.8193788528442383} -11/07/2021 02:35:09 - INFO - __main__ - Step 38058: {'lr': 0.00043027959069347644, 'samples': 7307136, 'steps': 38057, 'loss/train': 1.7588491439819336} -11/07/2021 02:35:10 - INFO - __main__ - Step 38059: {'lr': 0.00043027591407731106, 'samples': 7307328, 'steps': 38058, 'loss/train': 1.366492748260498} -11/07/2021 02:35:10 - INFO - __main__ - Step 38060: {'lr': 0.000430272237379916, 'samples': 7307520, 'steps': 38059, 'loss/train': 0.8111729621887207} -11/07/2021 02:35:10 - INFO - __main__ - Step 38061: {'lr': 0.00043026856060129307, 'samples': 7307712, 'steps': 38060, 'loss/train': 1.5397465229034424} -11/07/2021 02:35:11 - INFO - __main__ - Step 38062: {'lr': 0.00043026488374144404, 'samples': 7307904, 'steps': 38061, 'loss/train': 1.6733875274658203} -11/07/2021 02:35:12 - INFO - __main__ - Step 38063: {'lr': 0.00043026120680037026, 'samples': 7308096, 'steps': 38062, 'loss/train': 1.1368083953857422} -11/07/2021 02:35:12 - INFO - __main__ - Step 38064: {'lr': 0.00043025752977807365, 'samples': 7308288, 'steps': 38063, 'loss/train': 1.9798434972763062} -11/07/2021 02:35:12 - INFO - __main__ - Step 38065: {'lr': 0.00043025385267455576, 'samples': 7308480, 'steps': 38064, 'loss/train': 1.3891901969909668} -11/07/2021 02:35:13 - INFO - __main__ - Step 38066: {'lr': 0.0004302501754898183, 'samples': 7308672, 'steps': 38065, 'loss/train': 1.7628917694091797} -11/07/2021 02:35:13 - INFO - __main__ - Step 38067: {'lr': 0.00043024649822386284, 'samples': 7308864, 'steps': 38066, 'loss/train': 1.3898802995681763} -11/07/2021 02:35:14 - INFO - __main__ - Step 38068: {'lr': 0.00043024282087669106, 'samples': 7309056, 'steps': 38067, 'loss/train': 1.7788422107696533} -11/07/2021 02:35:14 - INFO - __main__ - Step 38069: {'lr': 0.0004302391434483048, 'samples': 7309248, 'steps': 38068, 'loss/train': 1.2079501152038574} -11/07/2021 02:35:15 - INFO - __main__ - Step 38070: {'lr': 0.00043023546593870543, 'samples': 7309440, 'steps': 38069, 'loss/train': 0.31639406085014343} -11/07/2021 02:35:15 - INFO - __main__ - Step 38071: {'lr': 0.00043023178834789477, 'samples': 7309632, 'steps': 38070, 'loss/train': 1.4251023530960083} -11/07/2021 02:35:16 - INFO - __main__ - Step 38072: {'lr': 0.0004302281106758745, 'samples': 7309824, 'steps': 38071, 'loss/train': 1.5218110084533691} -11/07/2021 02:35:17 - INFO - __main__ - Step 38073: {'lr': 0.00043022443292264613, 'samples': 7310016, 'steps': 38072, 'loss/train': 1.7101134061813354} -11/07/2021 02:35:17 - INFO - __main__ - Step 38074: {'lr': 0.00043022075508821145, 'samples': 7310208, 'steps': 38073, 'loss/train': 1.4294854402542114} -11/07/2021 02:35:17 - INFO - __main__ - Step 38075: {'lr': 0.0004302170771725721, 'samples': 7310400, 'steps': 38074, 'loss/train': 1.5847716331481934} -11/07/2021 02:35:18 - INFO - __main__ - Step 38076: {'lr': 0.0004302133991757297, 'samples': 7310592, 'steps': 38075, 'loss/train': 1.3922067880630493} -11/07/2021 02:35:18 - INFO - __main__ - Step 38077: {'lr': 0.000430209721097686, 'samples': 7310784, 'steps': 38076, 'loss/train': 1.6040767431259155} -11/07/2021 02:35:19 - INFO - __main__ - Step 38078: {'lr': 0.00043020604293844244, 'samples': 7310976, 'steps': 38077, 'loss/train': 1.1318144798278809} -11/07/2021 02:35:19 - INFO - __main__ - Step 38079: {'lr': 0.0004302023646980009, 'samples': 7311168, 'steps': 38078, 'loss/train': 1.669752597808838} -11/07/2021 02:35:20 - INFO - __main__ - Step 38080: {'lr': 0.00043019868637636294, 'samples': 7311360, 'steps': 38079, 'loss/train': 1.3321876525878906} -11/07/2021 02:35:20 - INFO - __main__ - Step 38081: {'lr': 0.0004301950079735302, 'samples': 7311552, 'steps': 38080, 'loss/train': 1.4218177795410156} -11/07/2021 02:35:20 - INFO - __main__ - Step 38082: {'lr': 0.00043019132948950443, 'samples': 7311744, 'steps': 38081, 'loss/train': 0.9103419780731201} -11/07/2021 02:35:21 - INFO - __main__ - Step 38083: {'lr': 0.0004301876509242872, 'samples': 7311936, 'steps': 38082, 'loss/train': 1.6363718509674072} -11/07/2021 02:35:22 - INFO - __main__ - Step 38084: {'lr': 0.0004301839722778802, 'samples': 7312128, 'steps': 38083, 'loss/train': 1.5699800252914429} -11/07/2021 02:35:22 - INFO - __main__ - Step 38085: {'lr': 0.0004301802935502851, 'samples': 7312320, 'steps': 38084, 'loss/train': 1.228023648262024} -11/07/2021 02:35:22 - INFO - __main__ - Step 38086: {'lr': 0.00043017661474150347, 'samples': 7312512, 'steps': 38085, 'loss/train': 1.5643198490142822} -11/07/2021 02:35:23 - INFO - __main__ - Step 38087: {'lr': 0.0004301729358515371, 'samples': 7312704, 'steps': 38086, 'loss/train': 1.0907460451126099} -11/07/2021 02:35:24 - INFO - __main__ - Step 38088: {'lr': 0.00043016925688038756, 'samples': 7312896, 'steps': 38087, 'loss/train': 1.7797681093215942} -11/07/2021 02:35:24 - INFO - __main__ - Step 38089: {'lr': 0.00043016557782805655, 'samples': 7313088, 'steps': 38088, 'loss/train': 1.50370192527771} -11/07/2021 02:35:25 - INFO - __main__ - Step 38090: {'lr': 0.0004301618986945457, 'samples': 7313280, 'steps': 38089, 'loss/train': 1.3989465236663818} -11/07/2021 02:35:25 - INFO - __main__ - Step 38091: {'lr': 0.0004301582194798567, 'samples': 7313472, 'steps': 38090, 'loss/train': 1.1627254486083984} -11/07/2021 02:35:25 - INFO - __main__ - Step 38092: {'lr': 0.00043015454018399115, 'samples': 7313664, 'steps': 38091, 'loss/train': 1.59376060962677} -11/07/2021 02:35:26 - INFO - __main__ - Step 38093: {'lr': 0.00043015086080695075, 'samples': 7313856, 'steps': 38092, 'loss/train': 1.5860843658447266} -11/07/2021 02:35:27 - INFO - __main__ - Step 38094: {'lr': 0.0004301471813487372, 'samples': 7314048, 'steps': 38093, 'loss/train': 1.6321327686309814} -11/07/2021 02:35:27 - INFO - __main__ - Step 38095: {'lr': 0.00043014350180935207, 'samples': 7314240, 'steps': 38094, 'loss/train': 1.2975819110870361} -11/07/2021 02:35:27 - INFO - __main__ - Step 38096: {'lr': 0.0004301398221887971, 'samples': 7314432, 'steps': 38095, 'loss/train': 2.0996835231781006} -11/07/2021 02:35:28 - INFO - __main__ - Step 38097: {'lr': 0.0004301361424870739, 'samples': 7314624, 'steps': 38096, 'loss/train': 1.677228331565857} -11/07/2021 02:35:29 - INFO - __main__ - Step 38098: {'lr': 0.00043013246270418406, 'samples': 7314816, 'steps': 38097, 'loss/train': 1.5101380348205566} -11/07/2021 02:35:29 - INFO - __main__ - Step 38099: {'lr': 0.00043012878284012936, 'samples': 7315008, 'steps': 38098, 'loss/train': 1.5078647136688232} -11/07/2021 02:35:29 - INFO - __main__ - Step 38100: {'lr': 0.0004301251028949114, 'samples': 7315200, 'steps': 38099, 'loss/train': 1.506402850151062} -11/07/2021 02:35:30 - INFO - __main__ - Step 38101: {'lr': 0.00043012142286853185, 'samples': 7315392, 'steps': 38100, 'loss/train': 1.571759819984436} -11/07/2021 02:35:30 - INFO - __main__ - Step 38102: {'lr': 0.00043011774276099235, 'samples': 7315584, 'steps': 38101, 'loss/train': 1.5209771394729614} -11/07/2021 02:35:31 - INFO - __main__ - Step 38103: {'lr': 0.0004301140625722946, 'samples': 7315776, 'steps': 38102, 'loss/train': 1.6852452754974365} -11/07/2021 02:35:32 - INFO - __main__ - Step 38104: {'lr': 0.0004301103823024403, 'samples': 7315968, 'steps': 38103, 'loss/train': 1.4258034229278564} -11/07/2021 02:35:32 - INFO - __main__ - Step 38105: {'lr': 0.0004301067019514309, 'samples': 7316160, 'steps': 38104, 'loss/train': 1.3200912475585938} -11/07/2021 02:35:32 - INFO - __main__ - Step 38106: {'lr': 0.0004301030215192683, 'samples': 7316352, 'steps': 38105, 'loss/train': 1.657687783241272} -11/07/2021 02:35:33 - INFO - __main__ - Step 38107: {'lr': 0.00043009934100595403, 'samples': 7316544, 'steps': 38106, 'loss/train': 1.5879276990890503} -11/07/2021 02:35:33 - INFO - __main__ - Step 38108: {'lr': 0.00043009566041148973, 'samples': 7316736, 'steps': 38107, 'loss/train': 1.4185930490493774} -11/07/2021 02:35:34 - INFO - __main__ - Step 38109: {'lr': 0.0004300919797358772, 'samples': 7316928, 'steps': 38108, 'loss/train': 1.3224161863327026} -11/07/2021 02:35:34 - INFO - __main__ - Step 38110: {'lr': 0.00043008829897911796, 'samples': 7317120, 'steps': 38109, 'loss/train': 1.5699503421783447} -11/07/2021 02:35:35 - INFO - __main__ - Step 38111: {'lr': 0.0004300846181412137, 'samples': 7317312, 'steps': 38110, 'loss/train': 1.2713605165481567} -11/07/2021 02:35:35 - INFO - __main__ - Step 38112: {'lr': 0.00043008093722216603, 'samples': 7317504, 'steps': 38111, 'loss/train': 1.3977137804031372} -11/07/2021 02:35:36 - INFO - __main__ - Step 38113: {'lr': 0.00043007725622197675, 'samples': 7317696, 'steps': 38112, 'loss/train': 1.6717946529388428} -11/07/2021 02:35:37 - INFO - __main__ - Step 38114: {'lr': 0.0004300735751406474, 'samples': 7317888, 'steps': 38113, 'loss/train': 1.5027621984481812} -11/07/2021 02:35:37 - INFO - __main__ - Step 38115: {'lr': 0.00043006989397817967, 'samples': 7318080, 'steps': 38114, 'loss/train': 1.4531986713409424} -11/07/2021 02:35:37 - INFO - __main__ - Step 38116: {'lr': 0.00043006621273457523, 'samples': 7318272, 'steps': 38115, 'loss/train': 1.7254838943481445} -11/07/2021 02:35:38 - INFO - __main__ - Step 38117: {'lr': 0.0004300625314098358, 'samples': 7318464, 'steps': 38116, 'loss/train': 1.239201307296753} -11/07/2021 02:35:38 - INFO - __main__ - Step 38118: {'lr': 0.0004300588500039629, 'samples': 7318656, 'steps': 38117, 'loss/train': 1.312067985534668} -11/07/2021 02:35:39 - INFO - __main__ - Step 38119: {'lr': 0.0004300551685169583, 'samples': 7318848, 'steps': 38118, 'loss/train': 1.3828651905059814} -11/07/2021 02:35:39 - INFO - __main__ - Step 38120: {'lr': 0.0004300514869488236, 'samples': 7319040, 'steps': 38119, 'loss/train': 1.5329667329788208} -11/07/2021 02:35:40 - INFO - __main__ - Step 38121: {'lr': 0.00043004780529956046, 'samples': 7319232, 'steps': 38120, 'loss/train': 1.3659088611602783} -11/07/2021 02:35:40 - INFO - __main__ - Step 38122: {'lr': 0.00043004412356917055, 'samples': 7319424, 'steps': 38121, 'loss/train': 1.5442653894424438} -11/07/2021 02:35:40 - INFO - __main__ - Step 38123: {'lr': 0.0004300404417576556, 'samples': 7319616, 'steps': 38122, 'loss/train': 1.3420342206954956} -11/07/2021 02:35:41 - INFO - __main__ - Step 38124: {'lr': 0.00043003675986501717, 'samples': 7319808, 'steps': 38123, 'loss/train': 1.5655076503753662} -11/07/2021 02:35:42 - INFO - __main__ - Step 38125: {'lr': 0.00043003307789125694, 'samples': 7320000, 'steps': 38124, 'loss/train': 1.7089120149612427} -11/07/2021 02:35:42 - INFO - __main__ - Step 38126: {'lr': 0.0004300293958363766, 'samples': 7320192, 'steps': 38125, 'loss/train': 0.8477843999862671} -11/07/2021 02:35:43 - INFO - __main__ - Step 38127: {'lr': 0.00043002571370037777, 'samples': 7320384, 'steps': 38126, 'loss/train': 1.3977762460708618} -11/07/2021 02:35:43 - INFO - __main__ - Step 38128: {'lr': 0.00043002203148326213, 'samples': 7320576, 'steps': 38127, 'loss/train': 1.8233729600906372} -11/07/2021 02:35:44 - INFO - __main__ - Step 38129: {'lr': 0.0004300183491850314, 'samples': 7320768, 'steps': 38128, 'loss/train': 1.4460153579711914} -11/07/2021 02:35:44 - INFO - __main__ - Step 38130: {'lr': 0.0004300146668056871, 'samples': 7320960, 'steps': 38129, 'loss/train': 1.8460206985473633} -11/07/2021 02:35:45 - INFO - __main__ - Step 38131: {'lr': 0.00043001098434523107, 'samples': 7321152, 'steps': 38130, 'loss/train': 1.248296856880188} -11/07/2021 02:35:45 - INFO - __main__ - Step 38132: {'lr': 0.0004300073018036648, 'samples': 7321344, 'steps': 38131, 'loss/train': 1.5343341827392578} -11/07/2021 02:35:46 - INFO - __main__ - Step 38133: {'lr': 0.00043000361918099, 'samples': 7321536, 'steps': 38132, 'loss/train': 1.7700618505477905} -11/07/2021 02:35:46 - INFO - __main__ - Step 38134: {'lr': 0.00042999993647720836, 'samples': 7321728, 'steps': 38133, 'loss/train': 2.182451009750366} -11/07/2021 02:35:47 - INFO - __main__ - Step 38135: {'lr': 0.0004299962536923215, 'samples': 7321920, 'steps': 38134, 'loss/train': 1.4863643646240234} -11/07/2021 02:35:47 - INFO - __main__ - Step 38136: {'lr': 0.0004299925708263312, 'samples': 7322112, 'steps': 38135, 'loss/train': 1.7947341203689575} -11/07/2021 02:35:48 - INFO - __main__ - Step 38137: {'lr': 0.00042998888787923895, 'samples': 7322304, 'steps': 38136, 'loss/train': 1.6867958307266235} -11/07/2021 02:35:48 - INFO - __main__ - Step 38138: {'lr': 0.0004299852048510465, 'samples': 7322496, 'steps': 38137, 'loss/train': 1.5821454524993896} -11/07/2021 02:35:48 - INFO - __main__ - Step 38139: {'lr': 0.00042998152174175555, 'samples': 7322688, 'steps': 38138, 'loss/train': 1.2109464406967163} -11/07/2021 02:35:49 - INFO - __main__ - Step 38140: {'lr': 0.0004299778385513676, 'samples': 7322880, 'steps': 38139, 'loss/train': 1.8368099927902222} -11/07/2021 02:35:50 - INFO - __main__ - Step 38141: {'lr': 0.0004299741552798845, 'samples': 7323072, 'steps': 38140, 'loss/train': 1.569381594657898} -11/07/2021 02:35:50 - INFO - __main__ - Step 38142: {'lr': 0.0004299704719273078, 'samples': 7323264, 'steps': 38141, 'loss/train': 1.2834303379058838} -11/07/2021 02:35:50 - INFO - __main__ - Step 38143: {'lr': 0.00042996678849363914, 'samples': 7323456, 'steps': 38142, 'loss/train': 1.2398931980133057} -11/07/2021 02:35:51 - INFO - __main__ - Step 38144: {'lr': 0.00042996310497888025, 'samples': 7323648, 'steps': 38143, 'loss/train': 1.9385180473327637} -11/07/2021 02:35:51 - INFO - __main__ - Step 38145: {'lr': 0.00042995942138303274, 'samples': 7323840, 'steps': 38144, 'loss/train': 0.6801995635032654} -11/07/2021 02:35:52 - INFO - __main__ - Step 38146: {'lr': 0.0004299557377060983, 'samples': 7324032, 'steps': 38145, 'loss/train': 1.591407060623169} -11/07/2021 02:35:52 - INFO - __main__ - Step 38147: {'lr': 0.00042995205394807864, 'samples': 7324224, 'steps': 38146, 'loss/train': 1.4548685550689697} -11/07/2021 02:35:53 - INFO - __main__ - Step 38148: {'lr': 0.00042994837010897524, 'samples': 7324416, 'steps': 38147, 'loss/train': 1.6742019653320312} -11/07/2021 02:35:53 - INFO - __main__ - Step 38149: {'lr': 0.00042994468618879, 'samples': 7324608, 'steps': 38148, 'loss/train': 1.6510372161865234} -11/07/2021 02:35:54 - INFO - __main__ - Step 38150: {'lr': 0.0004299410021875244, 'samples': 7324800, 'steps': 38149, 'loss/train': 1.6389765739440918} -11/07/2021 02:35:55 - INFO - __main__ - Step 38151: {'lr': 0.00042993731810518025, 'samples': 7324992, 'steps': 38150, 'loss/train': 1.482251524925232} -11/07/2021 02:35:55 - INFO - __main__ - Step 38152: {'lr': 0.00042993363394175897, 'samples': 7325184, 'steps': 38151, 'loss/train': 2.3803791999816895} -11/07/2021 02:35:55 - INFO - __main__ - Step 38153: {'lr': 0.0004299299496972625, 'samples': 7325376, 'steps': 38152, 'loss/train': 1.4593158960342407} -11/07/2021 02:35:56 - INFO - __main__ - Step 38154: {'lr': 0.0004299262653716923, 'samples': 7325568, 'steps': 38153, 'loss/train': 1.8404978513717651} -11/07/2021 02:35:56 - INFO - __main__ - Step 38155: {'lr': 0.0004299225809650501, 'samples': 7325760, 'steps': 38154, 'loss/train': 1.2424695491790771} -11/07/2021 02:35:57 - INFO - __main__ - Step 38156: {'lr': 0.0004299188964773376, 'samples': 7325952, 'steps': 38155, 'loss/train': 1.2804923057556152} -11/07/2021 02:35:57 - INFO - __main__ - Step 38157: {'lr': 0.0004299152119085564, 'samples': 7326144, 'steps': 38156, 'loss/train': 1.5574463605880737} -11/07/2021 02:35:58 - INFO - __main__ - Step 38158: {'lr': 0.0004299115272587082, 'samples': 7326336, 'steps': 38157, 'loss/train': 0.36680254340171814} -11/07/2021 02:35:58 - INFO - __main__ - Step 38159: {'lr': 0.0004299078425277947, 'samples': 7326528, 'steps': 38158, 'loss/train': 1.097966194152832} -11/07/2021 02:35:58 - INFO - __main__ - Step 38160: {'lr': 0.00042990415771581734, 'samples': 7326720, 'steps': 38159, 'loss/train': 1.2340035438537598} -11/07/2021 02:35:59 - INFO - __main__ - Step 38161: {'lr': 0.0004299004728227781, 'samples': 7326912, 'steps': 38160, 'loss/train': 1.3330954313278198} -11/07/2021 02:36:00 - INFO - __main__ - Step 38162: {'lr': 0.0004298967878486784, 'samples': 7327104, 'steps': 38161, 'loss/train': 0.4179893136024475} -11/07/2021 02:36:00 - INFO - __main__ - Step 38163: {'lr': 0.00042989310279352, 'samples': 7327296, 'steps': 38162, 'loss/train': 0.3285816013813019} -11/07/2021 02:36:00 - INFO - __main__ - Step 38164: {'lr': 0.0004298894176573046, 'samples': 7327488, 'steps': 38163, 'loss/train': 1.6918214559555054} -11/07/2021 02:36:01 - INFO - __main__ - Step 38165: {'lr': 0.0004298857324400337, 'samples': 7327680, 'steps': 38164, 'loss/train': 1.8268216848373413} -11/07/2021 02:36:02 - INFO - __main__ - Step 38166: {'lr': 0.0004298820471417091, 'samples': 7327872, 'steps': 38165, 'loss/train': 1.4902230501174927} -11/07/2021 02:36:02 - INFO - __main__ - Step 38167: {'lr': 0.00042987836176233246, 'samples': 7328064, 'steps': 38166, 'loss/train': 1.3428443670272827} -11/07/2021 02:36:03 - INFO - __main__ - Step 38168: {'lr': 0.0004298746763019054, 'samples': 7328256, 'steps': 38167, 'loss/train': 0.43336984515190125} -11/07/2021 02:36:03 - INFO - __main__ - Step 38169: {'lr': 0.0004298709907604296, 'samples': 7328448, 'steps': 38168, 'loss/train': 1.229674220085144} -11/07/2021 02:36:03 - INFO - __main__ - Step 38170: {'lr': 0.0004298673051379066, 'samples': 7328640, 'steps': 38169, 'loss/train': 2.1229805946350098} -11/07/2021 02:36:04 - INFO - __main__ - Step 38171: {'lr': 0.0004298636194343383, 'samples': 7328832, 'steps': 38170, 'loss/train': 0.895877480506897} -11/07/2021 02:36:05 - INFO - __main__ - Step 38172: {'lr': 0.0004298599336497262, 'samples': 7329024, 'steps': 38171, 'loss/train': 1.468153476715088} -11/07/2021 02:36:05 - INFO - __main__ - Step 38173: {'lr': 0.00042985624778407196, 'samples': 7329216, 'steps': 38172, 'loss/train': 1.3250070810317993} -11/07/2021 02:36:05 - INFO - __main__ - Step 38174: {'lr': 0.00042985256183737723, 'samples': 7329408, 'steps': 38173, 'loss/train': 0.975612998008728} -11/07/2021 02:36:06 - INFO - __main__ - Step 38175: {'lr': 0.00042984887580964376, 'samples': 7329600, 'steps': 38174, 'loss/train': 1.6117653846740723} -11/07/2021 02:36:06 - INFO - __main__ - Step 38176: {'lr': 0.00042984518970087316, 'samples': 7329792, 'steps': 38175, 'loss/train': 1.356275200843811} -11/07/2021 02:36:07 - INFO - __main__ - Step 38177: {'lr': 0.0004298415035110671, 'samples': 7329984, 'steps': 38176, 'loss/train': 1.7516674995422363} -11/07/2021 02:36:08 - INFO - __main__ - Step 38178: {'lr': 0.00042983781724022723, 'samples': 7330176, 'steps': 38177, 'loss/train': 1.744294285774231} -11/07/2021 02:36:08 - INFO - __main__ - Step 38179: {'lr': 0.0004298341308883552, 'samples': 7330368, 'steps': 38178, 'loss/train': 2.2094287872314453} -11/07/2021 02:36:08 - INFO - __main__ - Step 38180: {'lr': 0.0004298304444554527, 'samples': 7330560, 'steps': 38179, 'loss/train': 1.6997636556625366} -11/07/2021 02:36:09 - INFO - __main__ - Step 38181: {'lr': 0.00042982675794152135, 'samples': 7330752, 'steps': 38180, 'loss/train': 2.0016207695007324} -11/07/2021 02:36:10 - INFO - __main__ - Step 38182: {'lr': 0.0004298230713465629, 'samples': 7330944, 'steps': 38181, 'loss/train': 1.2829039096832275} -11/07/2021 02:36:10 - INFO - __main__ - Step 38183: {'lr': 0.00042981938467057893, 'samples': 7331136, 'steps': 38182, 'loss/train': 0.7408188581466675} -11/07/2021 02:36:11 - INFO - __main__ - Step 38184: {'lr': 0.0004298156979135711, 'samples': 7331328, 'steps': 38183, 'loss/train': 1.2323633432388306} -11/07/2021 02:36:11 - INFO - __main__ - Step 38185: {'lr': 0.000429812011075541, 'samples': 7331520, 'steps': 38184, 'loss/train': 1.148552417755127} -11/07/2021 02:36:11 - INFO - __main__ - Step 38186: {'lr': 0.0004298083241564905, 'samples': 7331712, 'steps': 38185, 'loss/train': 1.3870030641555786} -11/07/2021 02:36:12 - INFO - __main__ - Step 38187: {'lr': 0.00042980463715642115, 'samples': 7331904, 'steps': 38186, 'loss/train': 1.4995348453521729} -11/07/2021 02:36:13 - INFO - __main__ - Step 38188: {'lr': 0.0004298009500753346, 'samples': 7332096, 'steps': 38187, 'loss/train': 1.3584494590759277} -11/07/2021 02:36:13 - INFO - __main__ - Step 38189: {'lr': 0.00042979726291323246, 'samples': 7332288, 'steps': 38188, 'loss/train': 1.6575303077697754} -11/07/2021 02:36:13 - INFO - __main__ - Step 38190: {'lr': 0.00042979357567011643, 'samples': 7332480, 'steps': 38189, 'loss/train': 1.3136870861053467} -11/07/2021 02:36:14 - INFO - __main__ - Step 38191: {'lr': 0.0004297898883459883, 'samples': 7332672, 'steps': 38190, 'loss/train': 1.2578123807907104} -11/07/2021 02:36:15 - INFO - __main__ - Step 38192: {'lr': 0.00042978620094084955, 'samples': 7332864, 'steps': 38191, 'loss/train': 1.4794684648513794} -11/07/2021 02:36:15 - INFO - __main__ - Step 38193: {'lr': 0.00042978251345470185, 'samples': 7333056, 'steps': 38192, 'loss/train': 1.5394213199615479} -11/07/2021 02:36:15 - INFO - __main__ - Step 38194: {'lr': 0.000429778825887547, 'samples': 7333248, 'steps': 38193, 'loss/train': 1.0442190170288086} -11/07/2021 02:36:16 - INFO - __main__ - Step 38195: {'lr': 0.00042977513823938665, 'samples': 7333440, 'steps': 38194, 'loss/train': 1.488396167755127} -11/07/2021 02:36:16 - INFO - __main__ - Step 38196: {'lr': 0.00042977145051022224, 'samples': 7333632, 'steps': 38195, 'loss/train': 1.642302393913269} -11/07/2021 02:36:17 - INFO - __main__ - Step 38197: {'lr': 0.0004297677627000557, 'samples': 7333824, 'steps': 38196, 'loss/train': 1.7927191257476807} -11/07/2021 02:36:17 - INFO - __main__ - Step 38198: {'lr': 0.0004297640748088886, 'samples': 7334016, 'steps': 38197, 'loss/train': 1.6281474828720093} -11/07/2021 02:36:18 - INFO - __main__ - Step 38199: {'lr': 0.0004297603868367225, 'samples': 7334208, 'steps': 38198, 'loss/train': 1.7086904048919678} -11/07/2021 02:36:18 - INFO - __main__ - Step 38200: {'lr': 0.00042975669878355917, 'samples': 7334400, 'steps': 38199, 'loss/train': 2.989762783050537} -11/07/2021 02:36:18 - INFO - __main__ - Step 38201: {'lr': 0.00042975301064940026, 'samples': 7334592, 'steps': 38200, 'loss/train': 1.8463572263717651} -11/07/2021 02:36:19 - INFO - __main__ - Step 38202: {'lr': 0.00042974932243424743, 'samples': 7334784, 'steps': 38201, 'loss/train': 2.0515167713165283} -11/07/2021 02:36:20 - INFO - __main__ - Step 38203: {'lr': 0.0004297456341381023, 'samples': 7334976, 'steps': 38202, 'loss/train': 0.7293980717658997} -11/07/2021 02:36:20 - INFO - __main__ - Step 38204: {'lr': 0.0004297419457609666, 'samples': 7335168, 'steps': 38203, 'loss/train': 1.7791290283203125} -11/07/2021 02:36:21 - INFO - __main__ - Step 38205: {'lr': 0.0004297382573028419, 'samples': 7335360, 'steps': 38204, 'loss/train': 1.5674655437469482} -11/07/2021 02:36:21 - INFO - __main__ - Step 38206: {'lr': 0.0004297345687637299, 'samples': 7335552, 'steps': 38205, 'loss/train': 2.14150333404541} -11/07/2021 02:36:21 - INFO - __main__ - Step 38207: {'lr': 0.00042973088014363237, 'samples': 7335744, 'steps': 38206, 'loss/train': 1.6745388507843018} -11/07/2021 02:36:22 - INFO - __main__ - Step 38208: {'lr': 0.0004297271914425508, 'samples': 7335936, 'steps': 38207, 'loss/train': 1.391538381576538} -11/07/2021 02:36:23 - INFO - __main__ - Step 38209: {'lr': 0.00042972350266048693, 'samples': 7336128, 'steps': 38208, 'loss/train': 0.917203962802887} -11/07/2021 02:36:23 - INFO - __main__ - Step 38210: {'lr': 0.0004297198137974425, 'samples': 7336320, 'steps': 38209, 'loss/train': 1.749819278717041} -11/07/2021 02:36:23 - INFO - __main__ - Step 38211: {'lr': 0.00042971612485341896, 'samples': 7336512, 'steps': 38210, 'loss/train': 0.9586760997772217} -11/07/2021 02:36:24 - INFO - __main__ - Step 38212: {'lr': 0.00042971243582841823, 'samples': 7336704, 'steps': 38211, 'loss/train': 0.8148049116134644} -11/07/2021 02:36:25 - INFO - __main__ - Step 38213: {'lr': 0.0004297087467224418, 'samples': 7336896, 'steps': 38212, 'loss/train': 1.433459758758545} -11/07/2021 02:36:25 - INFO - __main__ - Step 38214: {'lr': 0.0004297050575354914, 'samples': 7337088, 'steps': 38213, 'loss/train': 1.6563775539398193} -11/07/2021 02:36:25 - INFO - __main__ - Step 38215: {'lr': 0.0004297013682675687, 'samples': 7337280, 'steps': 38214, 'loss/train': 1.0042729377746582} -11/07/2021 02:36:26 - INFO - __main__ - Step 38216: {'lr': 0.0004296976789186753, 'samples': 7337472, 'steps': 38215, 'loss/train': 1.534716010093689} -11/07/2021 02:36:26 - INFO - __main__ - Step 38217: {'lr': 0.00042969398948881286, 'samples': 7337664, 'steps': 38216, 'loss/train': 1.5462156534194946} -11/07/2021 02:36:27 - INFO - __main__ - Step 38218: {'lr': 0.00042969029997798314, 'samples': 7337856, 'steps': 38217, 'loss/train': 1.679050326347351} -11/07/2021 02:36:27 - INFO - __main__ - Step 38219: {'lr': 0.00042968661038618775, 'samples': 7338048, 'steps': 38218, 'loss/train': 1.924902319908142} -11/07/2021 02:36:28 - INFO - __main__ - Step 38220: {'lr': 0.0004296829207134283, 'samples': 7338240, 'steps': 38219, 'loss/train': 1.2776870727539062} -11/07/2021 02:36:28 - INFO - __main__ - Step 38221: {'lr': 0.0004296792309597065, 'samples': 7338432, 'steps': 38220, 'loss/train': 1.4061015844345093} -11/07/2021 02:36:28 - INFO - __main__ - Step 38222: {'lr': 0.00042967554112502404, 'samples': 7338624, 'steps': 38221, 'loss/train': 1.2293282747268677} -11/07/2021 02:36:29 - INFO - __main__ - Step 38223: {'lr': 0.00042967185120938256, 'samples': 7338816, 'steps': 38222, 'loss/train': 1.0383968353271484} -11/07/2021 02:36:30 - INFO - __main__ - Step 38224: {'lr': 0.00042966816121278365, 'samples': 7339008, 'steps': 38223, 'loss/train': 1.7293782234191895} -11/07/2021 02:36:30 - INFO - __main__ - Step 38225: {'lr': 0.0004296644711352291, 'samples': 7339200, 'steps': 38224, 'loss/train': 1.6785378456115723} -11/07/2021 02:36:31 - INFO - __main__ - Step 38226: {'lr': 0.0004296607809767205, 'samples': 7339392, 'steps': 38225, 'loss/train': 1.3909289836883545} -11/07/2021 02:36:31 - INFO - __main__ - Step 38227: {'lr': 0.00042965709073725957, 'samples': 7339584, 'steps': 38226, 'loss/train': 1.9048470258712769} -11/07/2021 02:36:31 - INFO - __main__ - Step 38228: {'lr': 0.00042965340041684785, 'samples': 7339776, 'steps': 38227, 'loss/train': 1.051666021347046} -11/07/2021 02:36:32 - INFO - __main__ - Step 38229: {'lr': 0.00042964971001548715, 'samples': 7339968, 'steps': 38228, 'loss/train': 1.3761814832687378} -11/07/2021 02:36:33 - INFO - __main__ - Step 38230: {'lr': 0.00042964601953317895, 'samples': 7340160, 'steps': 38229, 'loss/train': 1.4855128526687622} -11/07/2021 02:36:33 - INFO - __main__ - Step 38231: {'lr': 0.0004296423289699252, 'samples': 7340352, 'steps': 38230, 'loss/train': 0.9149501323699951} -11/07/2021 02:36:33 - INFO - __main__ - Step 38232: {'lr': 0.00042963863832572727, 'samples': 7340544, 'steps': 38231, 'loss/train': 1.554993748664856} -11/07/2021 02:36:34 - INFO - __main__ - Step 38233: {'lr': 0.0004296349476005869, 'samples': 7340736, 'steps': 38232, 'loss/train': 1.3690378665924072} -11/07/2021 02:36:35 - INFO - __main__ - Step 38234: {'lr': 0.0004296312567945059, 'samples': 7340928, 'steps': 38233, 'loss/train': 1.3793355226516724} -11/07/2021 02:36:35 - INFO - __main__ - Step 38235: {'lr': 0.0004296275659074858, 'samples': 7341120, 'steps': 38234, 'loss/train': 1.2817461490631104} -11/07/2021 02:36:36 - INFO - __main__ - Step 38236: {'lr': 0.00042962387493952823, 'samples': 7341312, 'steps': 38235, 'loss/train': 1.375528335571289} -11/07/2021 02:36:36 - INFO - __main__ - Step 38237: {'lr': 0.00042962018389063495, 'samples': 7341504, 'steps': 38236, 'loss/train': 1.0297311544418335} -11/07/2021 02:36:36 - INFO - __main__ - Step 38238: {'lr': 0.0004296164927608076, 'samples': 7341696, 'steps': 38237, 'loss/train': 1.5794353485107422} -11/07/2021 02:36:37 - INFO - __main__ - Step 38239: {'lr': 0.00042961280155004786, 'samples': 7341888, 'steps': 38238, 'loss/train': 0.6085673570632935} -11/07/2021 02:36:38 - INFO - __main__ - Step 38240: {'lr': 0.0004296091102583573, 'samples': 7342080, 'steps': 38239, 'loss/train': 1.249404788017273} -11/07/2021 02:36:38 - INFO - __main__ - Step 38241: {'lr': 0.0004296054188857377, 'samples': 7342272, 'steps': 38240, 'loss/train': 1.118761420249939} -11/07/2021 02:36:38 - INFO - __main__ - Step 38242: {'lr': 0.0004296017274321906, 'samples': 7342464, 'steps': 38241, 'loss/train': 1.4748969078063965} -11/07/2021 02:36:39 - INFO - __main__ - Step 38243: {'lr': 0.0004295980358977178, 'samples': 7342656, 'steps': 38242, 'loss/train': 1.4010951519012451} -11/07/2021 02:36:40 - INFO - __main__ - Step 38244: {'lr': 0.0004295943442823209, 'samples': 7342848, 'steps': 38243, 'loss/train': 1.797529697418213} -11/07/2021 02:36:40 - INFO - __main__ - Step 38245: {'lr': 0.0004295906525860015, 'samples': 7343040, 'steps': 38244, 'loss/train': 1.5135968923568726} -11/07/2021 02:36:40 - INFO - __main__ - Step 38246: {'lr': 0.00042958696080876136, 'samples': 7343232, 'steps': 38245, 'loss/train': 1.836068868637085} -11/07/2021 02:36:41 - INFO - __main__ - Step 38247: {'lr': 0.00042958326895060206, 'samples': 7343424, 'steps': 38246, 'loss/train': 1.1405773162841797} -11/07/2021 02:36:41 - INFO - __main__ - Step 38248: {'lr': 0.0004295795770115254, 'samples': 7343616, 'steps': 38247, 'loss/train': 1.3413417339324951} -11/07/2021 02:36:42 - INFO - __main__ - Step 38249: {'lr': 0.0004295758849915329, 'samples': 7343808, 'steps': 38248, 'loss/train': 1.624894618988037} -11/07/2021 02:36:43 - INFO - __main__ - Step 38250: {'lr': 0.00042957219289062635, 'samples': 7344000, 'steps': 38249, 'loss/train': 1.6614336967468262} -11/07/2021 02:36:43 - INFO - __main__ - Step 38251: {'lr': 0.0004295685007088072, 'samples': 7344192, 'steps': 38250, 'loss/train': 1.712052822113037} -11/07/2021 02:36:43 - INFO - __main__ - Step 38252: {'lr': 0.00042956480844607734, 'samples': 7344384, 'steps': 38251, 'loss/train': 0.6693893074989319} -11/07/2021 02:36:44 - INFO - __main__ - Step 38253: {'lr': 0.00042956111610243833, 'samples': 7344576, 'steps': 38252, 'loss/train': 0.6600829362869263} -11/07/2021 02:36:44 - INFO - __main__ - Step 38254: {'lr': 0.0004295574236778919, 'samples': 7344768, 'steps': 38253, 'loss/train': 1.4803495407104492} -11/07/2021 02:36:45 - INFO - __main__ - Step 38255: {'lr': 0.00042955373117243954, 'samples': 7344960, 'steps': 38254, 'loss/train': 1.4988573789596558} -11/07/2021 02:36:45 - INFO - __main__ - Step 38256: {'lr': 0.0004295500385860832, 'samples': 7345152, 'steps': 38255, 'loss/train': 2.0637753009796143} -11/07/2021 02:36:46 - INFO - __main__ - Step 38257: {'lr': 0.0004295463459188243, 'samples': 7345344, 'steps': 38256, 'loss/train': 0.21861299872398376} -11/07/2021 02:36:46 - INFO - __main__ - Step 38258: {'lr': 0.00042954265317066457, 'samples': 7345536, 'steps': 38257, 'loss/train': 0.9756987690925598} -11/07/2021 02:36:46 - INFO - __main__ - Step 38259: {'lr': 0.0004295389603416057, 'samples': 7345728, 'steps': 38258, 'loss/train': 1.52315092086792} -11/07/2021 02:36:48 - INFO - __main__ - Step 38260: {'lr': 0.0004295352674316494, 'samples': 7345920, 'steps': 38259, 'loss/train': 1.6356688737869263} -11/07/2021 02:36:48 - INFO - __main__ - Step 38261: {'lr': 0.0004295315744407972, 'samples': 7346112, 'steps': 38260, 'loss/train': 1.7461309432983398} -11/07/2021 02:36:48 - INFO - __main__ - Step 38262: {'lr': 0.0004295278813690509, 'samples': 7346304, 'steps': 38261, 'loss/train': 1.6206568479537964} -11/07/2021 02:36:49 - INFO - __main__ - Step 38263: {'lr': 0.0004295241882164121, 'samples': 7346496, 'steps': 38262, 'loss/train': 1.4554109573364258} -11/07/2021 02:36:49 - INFO - __main__ - Step 38264: {'lr': 0.0004295204949828825, 'samples': 7346688, 'steps': 38263, 'loss/train': 1.0673553943634033} -11/07/2021 02:36:50 - INFO - __main__ - Step 38265: {'lr': 0.0004295168016684636, 'samples': 7346880, 'steps': 38264, 'loss/train': 1.2171517610549927} -11/07/2021 02:36:50 - INFO - __main__ - Step 38266: {'lr': 0.0004295131082731574, 'samples': 7347072, 'steps': 38265, 'loss/train': 2.0179131031036377} -11/07/2021 02:36:51 - INFO - __main__ - Step 38267: {'lr': 0.0004295094147969652, 'samples': 7347264, 'steps': 38266, 'loss/train': 1.5524829626083374} -11/07/2021 02:36:51 - INFO - __main__ - Step 38268: {'lr': 0.0004295057212398889, 'samples': 7347456, 'steps': 38267, 'loss/train': 1.5185699462890625} -11/07/2021 02:36:51 - INFO - __main__ - Step 38269: {'lr': 0.00042950202760193003, 'samples': 7347648, 'steps': 38268, 'loss/train': 1.997591495513916} -11/07/2021 02:36:53 - INFO - __main__ - Step 38270: {'lr': 0.0004294983338830904, 'samples': 7347840, 'steps': 38269, 'loss/train': 1.6346243619918823} -11/07/2021 02:36:53 - INFO - __main__ - Step 38271: {'lr': 0.0004294946400833716, 'samples': 7348032, 'steps': 38270, 'loss/train': 1.7416479587554932} -11/07/2021 02:36:53 - INFO - __main__ - Step 38272: {'lr': 0.0004294909462027752, 'samples': 7348224, 'steps': 38271, 'loss/train': 1.3885921239852905} -11/07/2021 02:36:54 - INFO - __main__ - Step 38273: {'lr': 0.000429487252241303, 'samples': 7348416, 'steps': 38272, 'loss/train': 0.7423022985458374} -11/07/2021 02:36:54 - INFO - __main__ - Step 38274: {'lr': 0.00042948355819895655, 'samples': 7348608, 'steps': 38273, 'loss/train': 1.4728059768676758} -11/07/2021 02:36:54 - INFO - __main__ - Step 38275: {'lr': 0.0004294798640757377, 'samples': 7348800, 'steps': 38274, 'loss/train': 0.8224681615829468} -11/07/2021 02:36:55 - INFO - __main__ - Step 38276: {'lr': 0.00042947616987164787, 'samples': 7348992, 'steps': 38275, 'loss/train': 1.8463332653045654} -11/07/2021 02:36:56 - INFO - __main__ - Step 38277: {'lr': 0.00042947247558668887, 'samples': 7349184, 'steps': 38276, 'loss/train': 1.5869121551513672} -11/07/2021 02:36:56 - INFO - __main__ - Step 38278: {'lr': 0.00042946878122086243, 'samples': 7349376, 'steps': 38277, 'loss/train': 1.624953269958496} -11/07/2021 02:36:56 - INFO - __main__ - Step 38279: {'lr': 0.00042946508677417007, 'samples': 7349568, 'steps': 38278, 'loss/train': 1.7056394815444946} -11/07/2021 02:36:57 - INFO - __main__ - Step 38280: {'lr': 0.0004294613922466135, 'samples': 7349760, 'steps': 38279, 'loss/train': 1.591142177581787} -11/07/2021 02:36:58 - INFO - __main__ - Step 38281: {'lr': 0.0004294576976381944, 'samples': 7349952, 'steps': 38280, 'loss/train': 1.4061824083328247} -11/07/2021 02:36:58 - INFO - __main__ - Step 38282: {'lr': 0.00042945400294891445, 'samples': 7350144, 'steps': 38281, 'loss/train': 1.90840482711792} -11/07/2021 02:36:58 - INFO - __main__ - Step 38283: {'lr': 0.0004294503081787753, 'samples': 7350336, 'steps': 38282, 'loss/train': 0.9647262692451477} -11/07/2021 02:36:59 - INFO - __main__ - Step 38284: {'lr': 0.0004294466133277786, 'samples': 7350528, 'steps': 38283, 'loss/train': 1.229430079460144} -11/07/2021 02:36:59 - INFO - __main__ - Step 38285: {'lr': 0.00042944291839592597, 'samples': 7350720, 'steps': 38284, 'loss/train': 0.9978717565536499} -11/07/2021 02:37:01 - INFO - __main__ - Step 38286: {'lr': 0.0004294392233832192, 'samples': 7350912, 'steps': 38285, 'loss/train': 1.2743558883666992} -11/07/2021 02:37:01 - INFO - __main__ - Step 38287: {'lr': 0.0004294355282896599, 'samples': 7351104, 'steps': 38286, 'loss/train': 1.7710016965866089} -11/07/2021 02:37:01 - INFO - __main__ - Step 38288: {'lr': 0.00042943183311524967, 'samples': 7351296, 'steps': 38287, 'loss/train': 1.8275021314620972} -11/07/2021 02:37:02 - INFO - __main__ - Step 38289: {'lr': 0.0004294281378599902, 'samples': 7351488, 'steps': 38288, 'loss/train': 1.90546452999115} -11/07/2021 02:37:02 - INFO - __main__ - Step 38290: {'lr': 0.00042942444252388323, 'samples': 7351680, 'steps': 38289, 'loss/train': 1.8090331554412842} -11/07/2021 02:37:02 - INFO - __main__ - Step 38291: {'lr': 0.0004294207471069304, 'samples': 7351872, 'steps': 38290, 'loss/train': 1.1580256223678589} -11/07/2021 02:37:03 - INFO - __main__ - Step 38292: {'lr': 0.0004294170516091332, 'samples': 7352064, 'steps': 38291, 'loss/train': 1.6080865859985352} -11/07/2021 02:37:04 - INFO - __main__ - Step 38293: {'lr': 0.0004294133560304936, 'samples': 7352256, 'steps': 38292, 'loss/train': 1.8003463745117188} -11/07/2021 02:37:04 - INFO - __main__ - Step 38294: {'lr': 0.00042940966037101314, 'samples': 7352448, 'steps': 38293, 'loss/train': 1.6777453422546387} -11/07/2021 02:37:05 - INFO - __main__ - Step 38295: {'lr': 0.00042940596463069336, 'samples': 7352640, 'steps': 38294, 'loss/train': 0.3316746652126312} -11/07/2021 02:37:05 - INFO - __main__ - Step 38296: {'lr': 0.00042940226880953605, 'samples': 7352832, 'steps': 38295, 'loss/train': 1.732701301574707} -11/07/2021 02:37:05 - INFO - __main__ - Step 38297: {'lr': 0.0004293985729075428, 'samples': 7353024, 'steps': 38296, 'loss/train': 1.5013654232025146} -11/07/2021 02:37:06 - INFO - __main__ - Step 38298: {'lr': 0.00042939487692471534, 'samples': 7353216, 'steps': 38297, 'loss/train': 1.4927855730056763} -11/07/2021 02:37:07 - INFO - __main__ - Step 38299: {'lr': 0.0004293911808610554, 'samples': 7353408, 'steps': 38298, 'loss/train': 1.6887056827545166} -11/07/2021 02:37:07 - INFO - __main__ - Step 38300: {'lr': 0.0004293874847165645, 'samples': 7353600, 'steps': 38299, 'loss/train': 1.4818027019500732} -11/07/2021 02:37:07 - INFO - __main__ - Step 38301: {'lr': 0.0004293837884912444, 'samples': 7353792, 'steps': 38300, 'loss/train': 2.025219678878784} -11/07/2021 02:37:08 - INFO - __main__ - Step 38302: {'lr': 0.00042938009218509667, 'samples': 7353984, 'steps': 38301, 'loss/train': 1.3994265794754028} -11/07/2021 02:37:08 - INFO - __main__ - Step 38303: {'lr': 0.00042937639579812304, 'samples': 7354176, 'steps': 38302, 'loss/train': 1.506459355354309} -11/07/2021 02:37:09 - INFO - __main__ - Step 38304: {'lr': 0.0004293726993303252, 'samples': 7354368, 'steps': 38303, 'loss/train': 1.719734787940979} -11/07/2021 02:37:09 - INFO - __main__ - Step 38305: {'lr': 0.0004293690027817048, 'samples': 7354560, 'steps': 38304, 'loss/train': 1.195610761642456} -11/07/2021 02:37:10 - INFO - __main__ - Step 38306: {'lr': 0.00042936530615226355, 'samples': 7354752, 'steps': 38305, 'loss/train': 1.3250503540039062} -11/07/2021 02:37:10 - INFO - __main__ - Step 38307: {'lr': 0.00042936160944200295, 'samples': 7354944, 'steps': 38306, 'loss/train': 1.7600414752960205} -11/07/2021 02:37:10 - INFO - __main__ - Step 38308: {'lr': 0.00042935791265092483, 'samples': 7355136, 'steps': 38307, 'loss/train': 1.7057290077209473} -11/07/2021 02:37:11 - INFO - __main__ - Step 38309: {'lr': 0.0004293542157790308, 'samples': 7355328, 'steps': 38308, 'loss/train': 1.512961983680725} -11/07/2021 02:37:12 - INFO - __main__ - Step 38310: {'lr': 0.00042935051882632245, 'samples': 7355520, 'steps': 38309, 'loss/train': 1.4231493473052979} -11/07/2021 02:37:12 - INFO - __main__ - Step 38311: {'lr': 0.0004293468217928017, 'samples': 7355712, 'steps': 38310, 'loss/train': 1.3613260984420776} -11/07/2021 02:37:12 - INFO - __main__ - Step 38312: {'lr': 0.0004293431246784699, 'samples': 7355904, 'steps': 38311, 'loss/train': 1.8416643142700195} -11/07/2021 02:37:13 - INFO - __main__ - Step 38313: {'lr': 0.0004293394274833289, 'samples': 7356096, 'steps': 38312, 'loss/train': 1.530188798904419} -11/07/2021 02:37:14 - INFO - __main__ - Step 38314: {'lr': 0.0004293357302073804, 'samples': 7356288, 'steps': 38313, 'loss/train': 1.4533849954605103} -11/07/2021 02:37:14 - INFO - __main__ - Step 38315: {'lr': 0.00042933203285062585, 'samples': 7356480, 'steps': 38314, 'loss/train': 1.5147393941879272} -11/07/2021 02:37:15 - INFO - __main__ - Step 38316: {'lr': 0.00042932833541306704, 'samples': 7356672, 'steps': 38315, 'loss/train': 1.3559811115264893} -11/07/2021 02:37:15 - INFO - __main__ - Step 38317: {'lr': 0.0004293246378947058, 'samples': 7356864, 'steps': 38316, 'loss/train': 1.9374382495880127} -11/07/2021 02:37:15 - INFO - __main__ - Step 38318: {'lr': 0.00042932094029554354, 'samples': 7357056, 'steps': 38317, 'loss/train': 1.3933587074279785} -11/07/2021 02:37:16 - INFO - __main__ - Step 38319: {'lr': 0.00042931724261558205, 'samples': 7357248, 'steps': 38318, 'loss/train': 1.1619360446929932} -11/07/2021 02:37:17 - INFO - __main__ - Step 38320: {'lr': 0.000429313544854823, 'samples': 7357440, 'steps': 38319, 'loss/train': 1.4888416528701782} -11/07/2021 02:37:17 - INFO - __main__ - Step 38321: {'lr': 0.00042930984701326796, 'samples': 7357632, 'steps': 38320, 'loss/train': 1.7033252716064453} -11/07/2021 02:37:17 - INFO - __main__ - Step 38322: {'lr': 0.0004293061490909187, 'samples': 7357824, 'steps': 38321, 'loss/train': 1.3759467601776123} -11/07/2021 02:37:18 - INFO - __main__ - Step 38323: {'lr': 0.0004293024510877769, 'samples': 7358016, 'steps': 38322, 'loss/train': 0.9921587109565735} -11/07/2021 02:37:19 - INFO - __main__ - Step 38324: {'lr': 0.00042929875300384417, 'samples': 7358208, 'steps': 38323, 'loss/train': 1.6296452283859253} -11/07/2021 02:37:19 - INFO - __main__ - Step 38325: {'lr': 0.0004292950548391222, 'samples': 7358400, 'steps': 38324, 'loss/train': 1.064168095588684} -11/07/2021 02:37:19 - INFO - __main__ - Step 38326: {'lr': 0.00042929135659361265, 'samples': 7358592, 'steps': 38325, 'loss/train': 0.5363820791244507} -11/07/2021 02:37:20 - INFO - __main__ - Step 38327: {'lr': 0.0004292876582673171, 'samples': 7358784, 'steps': 38326, 'loss/train': 0.9394339323043823} -11/07/2021 02:37:20 - INFO - __main__ - Step 38328: {'lr': 0.0004292839598602374, 'samples': 7358976, 'steps': 38327, 'loss/train': 0.8856777548789978} -11/07/2021 02:37:21 - INFO - __main__ - Step 38329: {'lr': 0.000429280261372375, 'samples': 7359168, 'steps': 38328, 'loss/train': 1.5098530054092407} -11/07/2021 02:37:22 - INFO - __main__ - Step 38330: {'lr': 0.00042927656280373176, 'samples': 7359360, 'steps': 38329, 'loss/train': 1.4925379753112793} -11/07/2021 02:37:22 - INFO - __main__ - Step 38331: {'lr': 0.00042927286415430933, 'samples': 7359552, 'steps': 38330, 'loss/train': 1.8342890739440918} -11/07/2021 02:37:22 - INFO - __main__ - Step 38332: {'lr': 0.0004292691654241092, 'samples': 7359744, 'steps': 38331, 'loss/train': 1.2873988151550293} -11/07/2021 02:37:23 - INFO - __main__ - Step 38333: {'lr': 0.00042926546661313313, 'samples': 7359936, 'steps': 38332, 'loss/train': 1.7223068475723267} -11/07/2021 02:37:23 - INFO - __main__ - Step 38334: {'lr': 0.00042926176772138295, 'samples': 7360128, 'steps': 38333, 'loss/train': 1.29563307762146} -11/07/2021 02:37:24 - INFO - __main__ - Step 38335: {'lr': 0.0004292580687488601, 'samples': 7360320, 'steps': 38334, 'loss/train': 1.639797568321228} -11/07/2021 02:37:24 - INFO - __main__ - Step 38336: {'lr': 0.0004292543696955663, 'samples': 7360512, 'steps': 38335, 'loss/train': 1.5832456350326538} -11/07/2021 02:37:25 - INFO - __main__ - Step 38337: {'lr': 0.00042925067056150324, 'samples': 7360704, 'steps': 38336, 'loss/train': 1.8844374418258667} -11/07/2021 02:37:25 - INFO - __main__ - Step 38338: {'lr': 0.0004292469713466727, 'samples': 7360896, 'steps': 38337, 'loss/train': 1.8090503215789795} -11/07/2021 02:37:25 - INFO - __main__ - Step 38339: {'lr': 0.00042924327205107616, 'samples': 7361088, 'steps': 38338, 'loss/train': 1.2895766496658325} -11/07/2021 02:37:27 - INFO - __main__ - Step 38340: {'lr': 0.00042923957267471536, 'samples': 7361280, 'steps': 38339, 'loss/train': 1.9198942184448242} -11/07/2021 02:37:27 - INFO - __main__ - Step 38341: {'lr': 0.000429235873217592, 'samples': 7361472, 'steps': 38340, 'loss/train': 1.340233564376831} -11/07/2021 02:37:27 - INFO - __main__ - Step 38342: {'lr': 0.0004292321736797077, 'samples': 7361664, 'steps': 38341, 'loss/train': 1.4563068151474} -11/07/2021 02:37:28 - INFO - __main__ - Step 38343: {'lr': 0.0004292284740610642, 'samples': 7361856, 'steps': 38342, 'loss/train': 1.0337316989898682} -11/07/2021 02:37:28 - INFO - __main__ - Step 38344: {'lr': 0.0004292247743616631, 'samples': 7362048, 'steps': 38343, 'loss/train': 1.9487308263778687} -11/07/2021 02:37:29 - INFO - __main__ - Step 38345: {'lr': 0.00042922107458150604, 'samples': 7362240, 'steps': 38344, 'loss/train': 1.299109697341919} -11/07/2021 02:37:29 - INFO - __main__ - Step 38346: {'lr': 0.00042921737472059474, 'samples': 7362432, 'steps': 38345, 'loss/train': 1.619086742401123} -11/07/2021 02:37:30 - INFO - __main__ - Step 38347: {'lr': 0.0004292136747789309, 'samples': 7362624, 'steps': 38346, 'loss/train': 1.6750733852386475} -11/07/2021 02:37:30 - INFO - __main__ - Step 38348: {'lr': 0.00042920997475651607, 'samples': 7362816, 'steps': 38347, 'loss/train': 1.1470671892166138} -11/07/2021 02:37:30 - INFO - __main__ - Step 38349: {'lr': 0.00042920627465335205, 'samples': 7363008, 'steps': 38348, 'loss/train': 1.635786533355713} -11/07/2021 02:37:31 - INFO - __main__ - Step 38350: {'lr': 0.00042920257446944044, 'samples': 7363200, 'steps': 38349, 'loss/train': 1.5170003175735474} -11/07/2021 02:37:32 - INFO - __main__ - Step 38351: {'lr': 0.0004291988742047829, 'samples': 7363392, 'steps': 38350, 'loss/train': 1.636959433555603} -11/07/2021 02:37:32 - INFO - __main__ - Step 38352: {'lr': 0.0004291951738593811, 'samples': 7363584, 'steps': 38351, 'loss/train': 1.6563864946365356} -11/07/2021 02:37:32 - INFO - __main__ - Step 38353: {'lr': 0.0004291914734332367, 'samples': 7363776, 'steps': 38352, 'loss/train': 2.0324835777282715} -11/07/2021 02:37:33 - INFO - __main__ - Step 38354: {'lr': 0.0004291877729263515, 'samples': 7363968, 'steps': 38353, 'loss/train': 1.2263227701187134} -11/07/2021 02:37:33 - INFO - __main__ - Step 38355: {'lr': 0.0004291840723387269, 'samples': 7364160, 'steps': 38354, 'loss/train': 1.572365164756775} -11/07/2021 02:37:35 - INFO - __main__ - Step 38356: {'lr': 0.0004291803716703648, 'samples': 7364352, 'steps': 38355, 'loss/train': 1.4267158508300781} -11/07/2021 02:37:35 - INFO - __main__ - Step 38357: {'lr': 0.0004291766709212668, 'samples': 7364544, 'steps': 38356, 'loss/train': 1.7175195217132568} -11/07/2021 02:37:35 - INFO - __main__ - Step 38358: {'lr': 0.00042917297009143455, 'samples': 7364736, 'steps': 38357, 'loss/train': 1.390121579170227} -11/07/2021 02:37:36 - INFO - __main__ - Step 38359: {'lr': 0.00042916926918086973, 'samples': 7364928, 'steps': 38358, 'loss/train': 0.26775655150413513} -11/07/2021 02:37:36 - INFO - __main__ - Step 38360: {'lr': 0.000429165568189574, 'samples': 7365120, 'steps': 38359, 'loss/train': 1.4750648736953735} -11/07/2021 02:37:37 - INFO - __main__ - Step 38361: {'lr': 0.000429161867117549, 'samples': 7365312, 'steps': 38360, 'loss/train': 0.9110004305839539} -11/07/2021 02:37:37 - INFO - __main__ - Step 38362: {'lr': 0.0004291581659647965, 'samples': 7365504, 'steps': 38361, 'loss/train': 1.269174575805664} -11/07/2021 02:37:38 - INFO - __main__ - Step 38363: {'lr': 0.00042915446473131805, 'samples': 7365696, 'steps': 38362, 'loss/train': 1.0548052787780762} -11/07/2021 02:37:38 - INFO - __main__ - Step 38364: {'lr': 0.0004291507634171153, 'samples': 7365888, 'steps': 38363, 'loss/train': 1.7208577394485474} -11/07/2021 02:37:38 - INFO - __main__ - Step 38365: {'lr': 0.0004291470620221901, 'samples': 7366080, 'steps': 38364, 'loss/train': 1.6459720134735107} -11/07/2021 02:37:39 - INFO - __main__ - Step 38366: {'lr': 0.0004291433605465439, 'samples': 7366272, 'steps': 38365, 'loss/train': 1.5473575592041016} -11/07/2021 02:37:40 - INFO - __main__ - Step 38367: {'lr': 0.00042913965899017855, 'samples': 7366464, 'steps': 38366, 'loss/train': 1.445980191230774} -11/07/2021 02:37:40 - INFO - __main__ - Step 38368: {'lr': 0.0004291359573530956, 'samples': 7366656, 'steps': 38367, 'loss/train': 0.7899708151817322} -11/07/2021 02:37:40 - INFO - __main__ - Step 38369: {'lr': 0.0004291322556352967, 'samples': 7366848, 'steps': 38368, 'loss/train': 1.4125922918319702} -11/07/2021 02:37:41 - INFO - __main__ - Step 38370: {'lr': 0.00042912855383678365, 'samples': 7367040, 'steps': 38369, 'loss/train': 1.8855928182601929} -11/07/2021 02:37:41 - INFO - __main__ - Step 38371: {'lr': 0.000429124851957558, 'samples': 7367232, 'steps': 38370, 'loss/train': 1.5229068994522095} -11/07/2021 02:37:42 - INFO - __main__ - Step 38372: {'lr': 0.0004291211499976214, 'samples': 7367424, 'steps': 38371, 'loss/train': 1.5820503234863281} -11/07/2021 02:37:43 - INFO - __main__ - Step 38373: {'lr': 0.0004291174479569757, 'samples': 7367616, 'steps': 38372, 'loss/train': 1.3003944158554077} -11/07/2021 02:37:43 - INFO - __main__ - Step 38374: {'lr': 0.00042911374583562233, 'samples': 7367808, 'steps': 38373, 'loss/train': 1.4751864671707153} -11/07/2021 02:37:43 - INFO - __main__ - Step 38375: {'lr': 0.0004291100436335631, 'samples': 7368000, 'steps': 38374, 'loss/train': 1.2032063007354736} -11/07/2021 02:37:44 - INFO - __main__ - Step 38376: {'lr': 0.00042910634135079963, 'samples': 7368192, 'steps': 38375, 'loss/train': 1.6390328407287598} -11/07/2021 02:37:45 - INFO - __main__ - Step 38377: {'lr': 0.00042910263898733364, 'samples': 7368384, 'steps': 38376, 'loss/train': 2.2559876441955566} -11/07/2021 02:37:45 - INFO - __main__ - Step 38378: {'lr': 0.0004290989365431668, 'samples': 7368576, 'steps': 38377, 'loss/train': 0.7892315983772278} -11/07/2021 02:37:45 - INFO - __main__ - Step 38379: {'lr': 0.0004290952340183007, 'samples': 7368768, 'steps': 38378, 'loss/train': 2.178373098373413} -11/07/2021 02:37:46 - INFO - __main__ - Step 38380: {'lr': 0.00042909153141273705, 'samples': 7368960, 'steps': 38379, 'loss/train': 1.791010856628418} -11/07/2021 02:37:46 - INFO - __main__ - Step 38381: {'lr': 0.0004290878287264775, 'samples': 7369152, 'steps': 38380, 'loss/train': 1.7731704711914062} -11/07/2021 02:37:47 - INFO - __main__ - Step 38382: {'lr': 0.0004290841259595237, 'samples': 7369344, 'steps': 38381, 'loss/train': 0.74814772605896} -11/07/2021 02:37:48 - INFO - __main__ - Step 38383: {'lr': 0.00042908042311187744, 'samples': 7369536, 'steps': 38382, 'loss/train': 1.4945881366729736} -11/07/2021 02:37:48 - INFO - __main__ - Step 38384: {'lr': 0.00042907672018354027, 'samples': 7369728, 'steps': 38383, 'loss/train': 1.2648224830627441} -11/07/2021 02:37:48 - INFO - __main__ - Step 38385: {'lr': 0.00042907301717451396, 'samples': 7369920, 'steps': 38384, 'loss/train': 1.0060302019119263} -11/07/2021 02:37:49 - INFO - __main__ - Step 38386: {'lr': 0.0004290693140848, 'samples': 7370112, 'steps': 38385, 'loss/train': 1.5758689641952515} -11/07/2021 02:37:50 - INFO - __main__ - Step 38387: {'lr': 0.0004290656109144003, 'samples': 7370304, 'steps': 38386, 'loss/train': 1.7817904949188232} -11/07/2021 02:37:50 - INFO - __main__ - Step 38388: {'lr': 0.0004290619076633163, 'samples': 7370496, 'steps': 38387, 'loss/train': 1.7534565925598145} -11/07/2021 02:37:51 - INFO - __main__ - Step 38389: {'lr': 0.0004290582043315498, 'samples': 7370688, 'steps': 38388, 'loss/train': 1.8690040111541748} -11/07/2021 02:37:51 - INFO - __main__ - Step 38390: {'lr': 0.0004290545009191024, 'samples': 7370880, 'steps': 38389, 'loss/train': 0.6957410573959351} -11/07/2021 02:37:51 - INFO - __main__ - Step 38391: {'lr': 0.0004290507974259759, 'samples': 7371072, 'steps': 38390, 'loss/train': 1.5398764610290527} -11/07/2021 02:37:52 - INFO - __main__ - Step 38392: {'lr': 0.0004290470938521718, 'samples': 7371264, 'steps': 38391, 'loss/train': 0.7379046678543091} -11/07/2021 02:37:53 - INFO - __main__ - Step 38393: {'lr': 0.0004290433901976918, 'samples': 7371456, 'steps': 38392, 'loss/train': 5.813073635101318} -11/07/2021 02:37:53 - INFO - __main__ - Step 38394: {'lr': 0.0004290396864625377, 'samples': 7371648, 'steps': 38393, 'loss/train': 1.6722701787948608} -11/07/2021 02:37:53 - INFO - __main__ - Step 38395: {'lr': 0.000429035982646711, 'samples': 7371840, 'steps': 38394, 'loss/train': 1.5052942037582397} -11/07/2021 02:37:54 - INFO - __main__ - Step 38396: {'lr': 0.0004290322787502135, 'samples': 7372032, 'steps': 38395, 'loss/train': 1.1739457845687866} -11/07/2021 02:37:54 - INFO - __main__ - Step 38397: {'lr': 0.0004290285747730468, 'samples': 7372224, 'steps': 38396, 'loss/train': 1.9641786813735962} -11/07/2021 02:37:54 - INFO - __main__ - Step 38398: {'lr': 0.00042902487071521257, 'samples': 7372416, 'steps': 38397, 'loss/train': 1.9700204133987427} -11/07/2021 02:37:55 - INFO - __main__ - Step 38399: {'lr': 0.0004290211665767125, 'samples': 7372608, 'steps': 38398, 'loss/train': 1.8752416372299194} -11/07/2021 02:37:56 - INFO - __main__ - Step 38400: {'lr': 0.00042901746235754837, 'samples': 7372800, 'steps': 38399, 'loss/train': 1.5767382383346558} -11/07/2021 02:37:56 - INFO - __main__ - Step 38401: {'lr': 0.0004290137580577216, 'samples': 7372992, 'steps': 38400, 'loss/train': 1.6494174003601074} -11/07/2021 02:37:56 - INFO - __main__ - Step 38402: {'lr': 0.000429010053677234, 'samples': 7373184, 'steps': 38401, 'loss/train': 1.7537641525268555} -11/07/2021 02:37:57 - INFO - __main__ - Step 38403: {'lr': 0.00042900634921608726, 'samples': 7373376, 'steps': 38402, 'loss/train': 1.3137192726135254} -11/07/2021 02:37:58 - INFO - __main__ - Step 38404: {'lr': 0.0004290026446742831, 'samples': 7373568, 'steps': 38403, 'loss/train': 4.322111129760742} -11/07/2021 02:37:58 - INFO - __main__ - Step 38405: {'lr': 0.00042899894005182294, 'samples': 7373760, 'steps': 38404, 'loss/train': 1.4622212648391724} -11/07/2021 02:37:59 - INFO - __main__ - Step 38406: {'lr': 0.0004289952353487088, 'samples': 7373952, 'steps': 38405, 'loss/train': 0.7398356795310974} -11/07/2021 02:37:59 - INFO - __main__ - Step 38407: {'lr': 0.000428991530564942, 'samples': 7374144, 'steps': 38406, 'loss/train': 0.5963699817657471} -11/07/2021 02:37:59 - INFO - __main__ - Step 38408: {'lr': 0.00042898782570052453, 'samples': 7374336, 'steps': 38407, 'loss/train': 1.9118536710739136} -11/07/2021 02:38:00 - INFO - __main__ - Step 38409: {'lr': 0.0004289841207554578, 'samples': 7374528, 'steps': 38408, 'loss/train': 1.7349226474761963} -11/07/2021 02:38:01 - INFO - __main__ - Step 38410: {'lr': 0.00042898041572974363, 'samples': 7374720, 'steps': 38409, 'loss/train': 1.2647113800048828} -11/07/2021 02:38:01 - INFO - __main__ - Step 38411: {'lr': 0.0004289767106233836, 'samples': 7374912, 'steps': 38410, 'loss/train': 1.462265968322754} -11/07/2021 02:38:01 - INFO - __main__ - Step 38412: {'lr': 0.0004289730054363795, 'samples': 7375104, 'steps': 38411, 'loss/train': 1.6180638074874878} -11/07/2021 02:38:02 - INFO - __main__ - Step 38413: {'lr': 0.00042896930016873293, 'samples': 7375296, 'steps': 38412, 'loss/train': 1.8184987306594849} -11/07/2021 02:38:03 - INFO - __main__ - Step 38414: {'lr': 0.0004289655948204455, 'samples': 7375488, 'steps': 38413, 'loss/train': 1.8326774835586548} -11/07/2021 02:38:03 - INFO - __main__ - Step 38415: {'lr': 0.00042896188939151893, 'samples': 7375680, 'steps': 38414, 'loss/train': 0.982987105846405} -11/07/2021 02:38:04 - INFO - __main__ - Step 38416: {'lr': 0.00042895818388195497, 'samples': 7375872, 'steps': 38415, 'loss/train': 1.4191560745239258} -11/07/2021 02:38:04 - INFO - __main__ - Step 38417: {'lr': 0.00042895447829175516, 'samples': 7376064, 'steps': 38416, 'loss/train': 1.3981465101242065} -11/07/2021 02:38:04 - INFO - __main__ - Step 38418: {'lr': 0.00042895077262092117, 'samples': 7376256, 'steps': 38417, 'loss/train': 1.7016116380691528} -11/07/2021 02:38:05 - INFO - __main__ - Step 38419: {'lr': 0.00042894706686945485, 'samples': 7376448, 'steps': 38418, 'loss/train': 0.9155838489532471} -11/07/2021 02:38:06 - INFO - __main__ - Step 38420: {'lr': 0.00042894336103735766, 'samples': 7376640, 'steps': 38419, 'loss/train': 0.9882771372795105} -11/07/2021 02:38:06 - INFO - __main__ - Step 38421: {'lr': 0.0004289396551246313, 'samples': 7376832, 'steps': 38420, 'loss/train': 1.5289490222930908} -11/07/2021 02:38:06 - INFO - __main__ - Step 38422: {'lr': 0.0004289359491312776, 'samples': 7377024, 'steps': 38421, 'loss/train': 1.6016318798065186} -11/07/2021 02:38:07 - INFO - __main__ - Step 38423: {'lr': 0.00042893224305729806, 'samples': 7377216, 'steps': 38422, 'loss/train': 1.8466453552246094} -11/07/2021 02:38:08 - INFO - __main__ - Step 38424: {'lr': 0.0004289285369026944, 'samples': 7377408, 'steps': 38423, 'loss/train': 1.7110973596572876} -11/07/2021 02:38:08 - INFO - __main__ - Step 38425: {'lr': 0.00042892483066746836, 'samples': 7377600, 'steps': 38424, 'loss/train': 1.5883793830871582} -11/07/2021 02:38:09 - INFO - __main__ - Step 38426: {'lr': 0.0004289211243516216, 'samples': 7377792, 'steps': 38425, 'loss/train': 1.6158411502838135} -11/07/2021 02:38:09 - INFO - __main__ - Step 38427: {'lr': 0.0004289174179551556, 'samples': 7377984, 'steps': 38426, 'loss/train': 1.451820969581604} -11/07/2021 02:38:09 - INFO - __main__ - Step 38428: {'lr': 0.0004289137114780722, 'samples': 7378176, 'steps': 38427, 'loss/train': 1.9416730403900146} -11/07/2021 02:38:12 - INFO - __main__ - Step 38429: {'lr': 0.00042891000492037315, 'samples': 7378368, 'steps': 38428, 'loss/train': 1.641010046005249} -11/07/2021 02:38:12 - INFO - __main__ - Step 38430: {'lr': 0.00042890629828205997, 'samples': 7378560, 'steps': 38429, 'loss/train': 1.5851696729660034} -11/07/2021 02:38:12 - INFO - __main__ - Step 38431: {'lr': 0.0004289025915631343, 'samples': 7378752, 'steps': 38430, 'loss/train': 1.72231924533844} -11/07/2021 02:38:13 - INFO - __main__ - Step 38432: {'lr': 0.00042889888476359793, 'samples': 7378944, 'steps': 38431, 'loss/train': 1.4775114059448242} -11/07/2021 02:38:13 - INFO - __main__ - Step 38433: {'lr': 0.0004288951778834525, 'samples': 7379136, 'steps': 38432, 'loss/train': 1.3398957252502441} -11/07/2021 02:38:13 - INFO - __main__ - Step 38434: {'lr': 0.00042889147092269964, 'samples': 7379328, 'steps': 38433, 'loss/train': 2.4124293327331543} -11/07/2021 02:38:14 - INFO - __main__ - Step 38435: {'lr': 0.0004288877638813411, 'samples': 7379520, 'steps': 38434, 'loss/train': 1.8824303150177002} -11/07/2021 02:38:14 - INFO - __main__ - Step 38436: {'lr': 0.00042888405675937843, 'samples': 7379712, 'steps': 38435, 'loss/train': 1.839871883392334} -11/07/2021 02:38:15 - INFO - __main__ - Step 38437: {'lr': 0.00042888034955681337, 'samples': 7379904, 'steps': 38436, 'loss/train': 1.8125609159469604} -11/07/2021 02:38:16 - INFO - __main__ - Step 38438: {'lr': 0.0004288766422736476, 'samples': 7380096, 'steps': 38437, 'loss/train': 2.059551477432251} -11/07/2021 02:38:16 - INFO - __main__ - Step 38439: {'lr': 0.00042887293490988276, 'samples': 7380288, 'steps': 38438, 'loss/train': 1.4829810857772827} -11/07/2021 02:38:16 - INFO - __main__ - Step 38440: {'lr': 0.00042886922746552056, 'samples': 7380480, 'steps': 38439, 'loss/train': 1.6527646780014038} -11/07/2021 02:38:17 - INFO - __main__ - Step 38441: {'lr': 0.0004288655199405626, 'samples': 7380672, 'steps': 38440, 'loss/train': 1.5163254737854004} -11/07/2021 02:38:18 - INFO - __main__ - Step 38442: {'lr': 0.00042886181233501067, 'samples': 7380864, 'steps': 38441, 'loss/train': 1.5011135339736938} -11/07/2021 02:38:18 - INFO - __main__ - Step 38443: {'lr': 0.00042885810464886635, 'samples': 7381056, 'steps': 38442, 'loss/train': 1.5980879068374634} -11/07/2021 02:38:19 - INFO - __main__ - Step 38444: {'lr': 0.0004288543968821312, 'samples': 7381248, 'steps': 38443, 'loss/train': 0.7294881939888} -11/07/2021 02:38:19 - INFO - __main__ - Step 38445: {'lr': 0.00042885068903480717, 'samples': 7381440, 'steps': 38444, 'loss/train': 0.9094494581222534} -11/07/2021 02:38:19 - INFO - __main__ - Step 38446: {'lr': 0.00042884698110689574, 'samples': 7381632, 'steps': 38445, 'loss/train': 1.5150995254516602} -11/07/2021 02:38:20 - INFO - __main__ - Step 38447: {'lr': 0.00042884327309839865, 'samples': 7381824, 'steps': 38446, 'loss/train': 1.807474970817566} -11/07/2021 02:38:21 - INFO - __main__ - Step 38448: {'lr': 0.0004288395650093174, 'samples': 7382016, 'steps': 38447, 'loss/train': 1.0160998106002808} -11/07/2021 02:38:21 - INFO - __main__ - Step 38449: {'lr': 0.000428835856839654, 'samples': 7382208, 'steps': 38448, 'loss/train': 1.399091124534607} -11/07/2021 02:38:21 - INFO - __main__ - Step 38450: {'lr': 0.0004288321485894098, 'samples': 7382400, 'steps': 38449, 'loss/train': 1.4129213094711304} -11/07/2021 02:38:22 - INFO - __main__ - Step 38451: {'lr': 0.0004288284402585866, 'samples': 7382592, 'steps': 38450, 'loss/train': 1.5371888875961304} -11/07/2021 02:38:22 - INFO - __main__ - Step 38452: {'lr': 0.0004288247318471861, 'samples': 7382784, 'steps': 38451, 'loss/train': 1.8664556741714478} -11/07/2021 02:38:23 - INFO - __main__ - Step 38453: {'lr': 0.0004288210233552099, 'samples': 7382976, 'steps': 38452, 'loss/train': 1.9075709581375122} -11/07/2021 02:38:24 - INFO - __main__ - Step 38454: {'lr': 0.00042881731478265975, 'samples': 7383168, 'steps': 38453, 'loss/train': 1.6259357929229736} -11/07/2021 02:38:24 - INFO - __main__ - Step 38455: {'lr': 0.00042881360612953724, 'samples': 7383360, 'steps': 38454, 'loss/train': 1.8561694622039795} -11/07/2021 02:38:24 - INFO - __main__ - Step 38456: {'lr': 0.0004288098973958441, 'samples': 7383552, 'steps': 38455, 'loss/train': 1.4659887552261353} -11/07/2021 02:38:25 - INFO - __main__ - Step 38457: {'lr': 0.000428806188581582, 'samples': 7383744, 'steps': 38456, 'loss/train': 1.8136464357376099} -11/07/2021 02:38:26 - INFO - __main__ - Step 38458: {'lr': 0.00042880247968675255, 'samples': 7383936, 'steps': 38457, 'loss/train': 1.191347360610962} -11/07/2021 02:38:26 - INFO - __main__ - Step 38459: {'lr': 0.00042879877071135746, 'samples': 7384128, 'steps': 38458, 'loss/train': 1.7995673418045044} -11/07/2021 02:38:26 - INFO - __main__ - Step 38460: {'lr': 0.0004287950616553984, 'samples': 7384320, 'steps': 38459, 'loss/train': 2.0367720127105713} -11/07/2021 02:38:27 - INFO - __main__ - Step 38461: {'lr': 0.0004287913525188771, 'samples': 7384512, 'steps': 38460, 'loss/train': 1.733862042427063} -11/07/2021 02:38:27 - INFO - __main__ - Step 38462: {'lr': 0.0004287876433017951, 'samples': 7384704, 'steps': 38461, 'loss/train': 1.1448413133621216} -11/07/2021 02:38:28 - INFO - __main__ - Step 38463: {'lr': 0.0004287839340041542, 'samples': 7384896, 'steps': 38462, 'loss/train': 1.2920781373977661} -11/07/2021 02:38:28 - INFO - __main__ - Step 38464: {'lr': 0.000428780224625956, 'samples': 7385088, 'steps': 38463, 'loss/train': 1.2339569330215454} -11/07/2021 02:38:29 - INFO - __main__ - Step 38465: {'lr': 0.00042877651516720215, 'samples': 7385280, 'steps': 38464, 'loss/train': 2.114656925201416} -11/07/2021 02:38:29 - INFO - __main__ - Step 38466: {'lr': 0.0004287728056278944, 'samples': 7385472, 'steps': 38465, 'loss/train': 1.7644872665405273} -11/07/2021 02:38:29 - INFO - __main__ - Step 38467: {'lr': 0.00042876909600803444, 'samples': 7385664, 'steps': 38466, 'loss/train': 1.7050596475601196} -11/07/2021 02:38:31 - INFO - __main__ - Step 38468: {'lr': 0.00042876538630762386, 'samples': 7385856, 'steps': 38467, 'loss/train': 2.0102365016937256} -11/07/2021 02:38:31 - INFO - __main__ - Step 38469: {'lr': 0.00042876167652666433, 'samples': 7386048, 'steps': 38468, 'loss/train': 1.2179516553878784} -11/07/2021 02:38:31 - INFO - __main__ - Step 38470: {'lr': 0.0004287579666651575, 'samples': 7386240, 'steps': 38469, 'loss/train': 1.756458044052124} -11/07/2021 02:38:32 - INFO - __main__ - Step 38471: {'lr': 0.00042875425672310506, 'samples': 7386432, 'steps': 38470, 'loss/train': 1.6783102750778198} -11/07/2021 02:38:32 - INFO - __main__ - Step 38472: {'lr': 0.00042875054670050885, 'samples': 7386624, 'steps': 38471, 'loss/train': 0.9036006331443787} -11/07/2021 02:38:33 - INFO - __main__ - Step 38473: {'lr': 0.00042874683659737035, 'samples': 7386816, 'steps': 38472, 'loss/train': 0.5149843692779541} -11/07/2021 02:38:33 - INFO - __main__ - Step 38474: {'lr': 0.0004287431264136913, 'samples': 7387008, 'steps': 38473, 'loss/train': 1.8024157285690308} -11/07/2021 02:38:34 - INFO - __main__ - Step 38475: {'lr': 0.0004287394161494733, 'samples': 7387200, 'steps': 38474, 'loss/train': 1.8952447175979614} -11/07/2021 02:38:34 - INFO - __main__ - Step 38476: {'lr': 0.0004287357058047181, 'samples': 7387392, 'steps': 38475, 'loss/train': 1.8905134201049805} -11/07/2021 02:38:34 - INFO - __main__ - Step 38477: {'lr': 0.00042873199537942733, 'samples': 7387584, 'steps': 38476, 'loss/train': 1.6807677745819092} -11/07/2021 02:38:35 - INFO - __main__ - Step 38478: {'lr': 0.0004287282848736027, 'samples': 7387776, 'steps': 38477, 'loss/train': 1.6995487213134766} -11/07/2021 02:38:36 - INFO - __main__ - Step 38479: {'lr': 0.00042872457428724586, 'samples': 7387968, 'steps': 38478, 'loss/train': 1.7590001821517944} -11/07/2021 02:38:36 - INFO - __main__ - Step 38480: {'lr': 0.00042872086362035844, 'samples': 7388160, 'steps': 38479, 'loss/train': 1.6011989116668701} -11/07/2021 02:38:36 - INFO - __main__ - Step 38481: {'lr': 0.00042871715287294223, 'samples': 7388352, 'steps': 38480, 'loss/train': 1.413744330406189} -11/07/2021 02:38:37 - INFO - __main__ - Step 38482: {'lr': 0.00042871344204499886, 'samples': 7388544, 'steps': 38481, 'loss/train': 1.6196192502975464} -11/07/2021 02:38:37 - INFO - __main__ - Step 38483: {'lr': 0.0004287097311365299, 'samples': 7388736, 'steps': 38482, 'loss/train': 1.6136687994003296} -11/07/2021 02:38:38 - INFO - __main__ - Step 38484: {'lr': 0.00042870602014753707, 'samples': 7388928, 'steps': 38483, 'loss/train': 1.3907452821731567} -11/07/2021 02:38:39 - INFO - __main__ - Step 38485: {'lr': 0.0004287023090780221, 'samples': 7389120, 'steps': 38484, 'loss/train': 1.3356413841247559} -11/07/2021 02:38:39 - INFO - __main__ - Step 38486: {'lr': 0.0004286985979279866, 'samples': 7389312, 'steps': 38485, 'loss/train': 1.608561635017395} -11/07/2021 02:38:39 - INFO - __main__ - Step 38487: {'lr': 0.0004286948866974323, 'samples': 7389504, 'steps': 38486, 'loss/train': 1.2108365297317505} -11/07/2021 02:38:40 - INFO - __main__ - Step 38488: {'lr': 0.0004286911753863608, 'samples': 7389696, 'steps': 38487, 'loss/train': 1.6934078931808472} -11/07/2021 02:38:41 - INFO - __main__ - Step 38489: {'lr': 0.0004286874639947739, 'samples': 7389888, 'steps': 38488, 'loss/train': 1.500806212425232} -11/07/2021 02:38:41 - INFO - __main__ - Step 38490: {'lr': 0.0004286837525226731, 'samples': 7390080, 'steps': 38489, 'loss/train': 1.5360748767852783} -11/07/2021 02:38:41 - INFO - __main__ - Step 38491: {'lr': 0.0004286800409700602, 'samples': 7390272, 'steps': 38490, 'loss/train': 1.1713488101959229} -11/07/2021 02:38:42 - INFO - __main__ - Step 38492: {'lr': 0.0004286763293369369, 'samples': 7390464, 'steps': 38491, 'loss/train': 1.2377177476882935} -11/07/2021 02:38:42 - INFO - __main__ - Step 38493: {'lr': 0.00042867261762330466, 'samples': 7390656, 'steps': 38492, 'loss/train': 1.7022583484649658} -11/07/2021 02:38:43 - INFO - __main__ - Step 38494: {'lr': 0.0004286689058291654, 'samples': 7390848, 'steps': 38493, 'loss/train': 1.2819725275039673} -11/07/2021 02:38:43 - INFO - __main__ - Step 38495: {'lr': 0.00042866519395452063, 'samples': 7391040, 'steps': 38494, 'loss/train': 1.3884963989257812} -11/07/2021 02:38:44 - INFO - __main__ - Step 38496: {'lr': 0.00042866148199937216, 'samples': 7391232, 'steps': 38495, 'loss/train': 1.4726425409317017} -11/07/2021 02:38:44 - INFO - __main__ - Step 38497: {'lr': 0.00042865776996372146, 'samples': 7391424, 'steps': 38496, 'loss/train': 1.3454011678695679} -11/07/2021 02:38:44 - INFO - __main__ - Step 38498: {'lr': 0.00042865405784757037, 'samples': 7391616, 'steps': 38497, 'loss/train': 2.008884906768799} -11/07/2021 02:38:45 - INFO - __main__ - Step 38499: {'lr': 0.0004286503456509206, 'samples': 7391808, 'steps': 38498, 'loss/train': 1.5773800611495972} -11/07/2021 02:38:46 - INFO - __main__ - Step 38500: {'lr': 0.0004286466333737737, 'samples': 7392000, 'steps': 38499, 'loss/train': 1.757792353630066} -11/07/2021 02:38:46 - INFO - __main__ - Step 38501: {'lr': 0.00042864292101613133, 'samples': 7392192, 'steps': 38500, 'loss/train': 1.4850726127624512} -11/07/2021 02:38:46 - INFO - __main__ - Step 38502: {'lr': 0.0004286392085779953, 'samples': 7392384, 'steps': 38501, 'loss/train': 1.7341381311416626} -11/07/2021 02:38:47 - INFO - __main__ - Step 38503: {'lr': 0.00042863549605936716, 'samples': 7392576, 'steps': 38502, 'loss/train': 1.6198322772979736} -11/07/2021 02:38:47 - INFO - __main__ - Step 38504: {'lr': 0.00042863178346024856, 'samples': 7392768, 'steps': 38503, 'loss/train': 1.4690289497375488} -11/07/2021 02:38:48 - INFO - __main__ - Step 38505: {'lr': 0.00042862807078064124, 'samples': 7392960, 'steps': 38504, 'loss/train': 2.190840244293213} -11/07/2021 02:38:49 - INFO - __main__ - Step 38506: {'lr': 0.00042862435802054703, 'samples': 7393152, 'steps': 38505, 'loss/train': 0.8740153908729553} -11/07/2021 02:38:49 - INFO - __main__ - Step 38507: {'lr': 0.00042862064517996723, 'samples': 7393344, 'steps': 38506, 'loss/train': 1.7972629070281982} -11/07/2021 02:38:49 - INFO - __main__ - Step 38508: {'lr': 0.00042861693225890385, 'samples': 7393536, 'steps': 38507, 'loss/train': 1.6027082204818726} -11/07/2021 02:38:50 - INFO - __main__ - Step 38509: {'lr': 0.0004286132192573584, 'samples': 7393728, 'steps': 38508, 'loss/train': 1.0021463632583618} -11/07/2021 02:38:51 - INFO - __main__ - Step 38510: {'lr': 0.0004286095061753326, 'samples': 7393920, 'steps': 38509, 'loss/train': 1.9077627658843994} -11/07/2021 02:38:51 - INFO - __main__ - Step 38511: {'lr': 0.0004286057930128281, 'samples': 7394112, 'steps': 38510, 'loss/train': 1.4616092443466187} -11/07/2021 02:38:51 - INFO - __main__ - Step 38512: {'lr': 0.00042860207976984664, 'samples': 7394304, 'steps': 38511, 'loss/train': 1.640619158744812} -11/07/2021 02:38:52 - INFO - __main__ - Step 38513: {'lr': 0.00042859836644638976, 'samples': 7394496, 'steps': 38512, 'loss/train': 3.527266502380371} -11/07/2021 02:38:52 - INFO - __main__ - Step 38514: {'lr': 0.00042859465304245927, 'samples': 7394688, 'steps': 38513, 'loss/train': 1.371895670890808} -11/07/2021 02:38:53 - INFO - __main__ - Step 38515: {'lr': 0.00042859093955805675, 'samples': 7394880, 'steps': 38514, 'loss/train': 1.5881764888763428} -11/07/2021 02:38:53 - INFO - __main__ - Step 38516: {'lr': 0.0004285872259931839, 'samples': 7395072, 'steps': 38515, 'loss/train': 1.1682759523391724} -11/07/2021 02:38:54 - INFO - __main__ - Step 38517: {'lr': 0.00042858351234784244, 'samples': 7395264, 'steps': 38516, 'loss/train': 1.5074559450149536} -11/07/2021 02:38:54 - INFO - __main__ - Step 38518: {'lr': 0.000428579798622034, 'samples': 7395456, 'steps': 38517, 'loss/train': 1.5640182495117188} -11/07/2021 02:38:54 - INFO - __main__ - Step 38519: {'lr': 0.0004285760848157603, 'samples': 7395648, 'steps': 38518, 'loss/train': 2.235804557800293} -11/07/2021 02:38:56 - INFO - __main__ - Step 38520: {'lr': 0.00042857237092902285, 'samples': 7395840, 'steps': 38519, 'loss/train': 1.3733848333358765} -11/07/2021 02:38:56 - INFO - __main__ - Step 38521: {'lr': 0.0004285686569618235, 'samples': 7396032, 'steps': 38520, 'loss/train': 1.7476186752319336} -11/07/2021 02:38:56 - INFO - __main__ - Step 38522: {'lr': 0.0004285649429141639, 'samples': 7396224, 'steps': 38521, 'loss/train': 1.8905295133590698} -11/07/2021 02:38:57 - INFO - __main__ - Step 38523: {'lr': 0.00042856122878604566, 'samples': 7396416, 'steps': 38522, 'loss/train': 1.5531270503997803} -11/07/2021 02:38:57 - INFO - __main__ - Step 38524: {'lr': 0.0004285575145774705, 'samples': 7396608, 'steps': 38523, 'loss/train': 1.5270588397979736} -11/07/2021 02:38:57 - INFO - __main__ - Step 38525: {'lr': 0.00042855380028844004, 'samples': 7396800, 'steps': 38524, 'loss/train': 1.3176720142364502} -11/07/2021 02:38:58 - INFO - __main__ - Step 38526: {'lr': 0.00042855008591895607, 'samples': 7396992, 'steps': 38525, 'loss/train': 1.2649494409561157} -11/07/2021 02:38:59 - INFO - __main__ - Step 38527: {'lr': 0.00042854637146902007, 'samples': 7397184, 'steps': 38526, 'loss/train': 1.1893590688705444} -11/07/2021 02:38:59 - INFO - __main__ - Step 38528: {'lr': 0.00042854265693863394, 'samples': 7397376, 'steps': 38527, 'loss/train': 1.7693283557891846} -11/07/2021 02:38:59 - INFO - __main__ - Step 38529: {'lr': 0.00042853894232779924, 'samples': 7397568, 'steps': 38528, 'loss/train': 1.7133264541625977} -11/07/2021 02:39:00 - INFO - __main__ - Step 38530: {'lr': 0.00042853522763651767, 'samples': 7397760, 'steps': 38529, 'loss/train': 1.9178385734558105} -11/07/2021 02:39:01 - INFO - __main__ - Step 38531: {'lr': 0.00042853151286479074, 'samples': 7397952, 'steps': 38530, 'loss/train': 3.3915510177612305} -11/07/2021 02:39:01 - INFO - __main__ - Step 38532: {'lr': 0.0004285277980126204, 'samples': 7398144, 'steps': 38531, 'loss/train': 1.5660945177078247} -11/07/2021 02:39:01 - INFO - __main__ - Step 38533: {'lr': 0.0004285240830800081, 'samples': 7398336, 'steps': 38532, 'loss/train': 1.3985246419906616} -11/07/2021 02:39:02 - INFO - __main__ - Step 38534: {'lr': 0.00042852036806695565, 'samples': 7398528, 'steps': 38533, 'loss/train': 1.6784566640853882} -11/07/2021 02:39:02 - INFO - __main__ - Step 38535: {'lr': 0.0004285166529734647, 'samples': 7398720, 'steps': 38534, 'loss/train': 1.5484535694122314} -11/07/2021 02:39:03 - INFO - __main__ - Step 38536: {'lr': 0.0004285129377995369, 'samples': 7398912, 'steps': 38535, 'loss/train': 1.6828726530075073} -11/07/2021 02:39:04 - INFO - __main__ - Step 38537: {'lr': 0.0004285092225451739, 'samples': 7399104, 'steps': 38536, 'loss/train': 1.7928122282028198} -11/07/2021 02:39:04 - INFO - __main__ - Step 38538: {'lr': 0.0004285055072103774, 'samples': 7399296, 'steps': 38537, 'loss/train': 1.6644047498703003} -11/07/2021 02:39:04 - INFO - __main__ - Step 38539: {'lr': 0.00042850179179514906, 'samples': 7399488, 'steps': 38538, 'loss/train': 1.8039556741714478} -11/07/2021 02:39:05 - INFO - __main__ - Step 38540: {'lr': 0.00042849807629949057, 'samples': 7399680, 'steps': 38539, 'loss/train': 1.33259117603302} -11/07/2021 02:39:05 - INFO - __main__ - Step 38541: {'lr': 0.0004284943607234036, 'samples': 7399872, 'steps': 38540, 'loss/train': 1.7744859457015991} -11/07/2021 02:39:07 - INFO - __main__ - Step 38542: {'lr': 0.00042849064506688984, 'samples': 7400064, 'steps': 38541, 'loss/train': 1.8936946392059326} -11/07/2021 02:39:07 - INFO - __main__ - Step 38543: {'lr': 0.00042848692932995094, 'samples': 7400256, 'steps': 38542, 'loss/train': 1.3653404712677002} -11/07/2021 02:39:07 - INFO - __main__ - Step 38544: {'lr': 0.0004284832135125886, 'samples': 7400448, 'steps': 38543, 'loss/train': 1.289848804473877} -11/07/2021 02:39:08 - INFO - __main__ - Step 38545: {'lr': 0.0004284794976148044, 'samples': 7400640, 'steps': 38544, 'loss/train': 0.7191889882087708} -11/07/2021 02:39:08 - INFO - __main__ - Step 38546: {'lr': 0.00042847578163660016, 'samples': 7400832, 'steps': 38545, 'loss/train': 1.2714651823043823} -11/07/2021 02:39:09 - INFO - __main__ - Step 38547: {'lr': 0.0004284720655779775, 'samples': 7401024, 'steps': 38546, 'loss/train': 1.4489455223083496} -11/07/2021 02:39:10 - INFO - __main__ - Step 38548: {'lr': 0.00042846834943893806, 'samples': 7401216, 'steps': 38547, 'loss/train': 1.9417572021484375} -11/07/2021 02:39:10 - INFO - __main__ - Step 38549: {'lr': 0.0004284646332194836, 'samples': 7401408, 'steps': 38548, 'loss/train': 1.0289621353149414} -11/07/2021 02:39:10 - INFO - __main__ - Step 38550: {'lr': 0.0004284609169196156, 'samples': 7401600, 'steps': 38549, 'loss/train': 1.6011112928390503} -11/07/2021 02:39:11 - INFO - __main__ - Step 38551: {'lr': 0.000428457200539336, 'samples': 7401792, 'steps': 38550, 'loss/train': 1.1118967533111572} -11/07/2021 02:39:11 - INFO - __main__ - Step 38552: {'lr': 0.0004284534840786463, 'samples': 7401984, 'steps': 38551, 'loss/train': 1.5389808416366577} -11/07/2021 02:39:12 - INFO - __main__ - Step 38553: {'lr': 0.0004284497675375482, 'samples': 7402176, 'steps': 38552, 'loss/train': 1.730039358139038} -11/07/2021 02:39:12 - INFO - __main__ - Step 38554: {'lr': 0.0004284460509160433, 'samples': 7402368, 'steps': 38553, 'loss/train': 1.4535332918167114} -11/07/2021 02:39:13 - INFO - __main__ - Step 38555: {'lr': 0.0004284423342141335, 'samples': 7402560, 'steps': 38554, 'loss/train': 1.4308903217315674} -11/07/2021 02:39:13 - INFO - __main__ - Step 38556: {'lr': 0.0004284386174318202, 'samples': 7402752, 'steps': 38555, 'loss/train': 1.5834574699401855} -11/07/2021 02:39:13 - INFO - __main__ - Step 38557: {'lr': 0.00042843490056910534, 'samples': 7402944, 'steps': 38556, 'loss/train': 1.7708011865615845} -11/07/2021 02:39:14 - INFO - __main__ - Step 38558: {'lr': 0.00042843118362599045, 'samples': 7403136, 'steps': 38557, 'loss/train': 1.0050923824310303} -11/07/2021 02:39:15 - INFO - __main__ - Step 38559: {'lr': 0.0004284274666024772, 'samples': 7403328, 'steps': 38558, 'loss/train': 1.5794517993927002} -11/07/2021 02:39:15 - INFO - __main__ - Step 38560: {'lr': 0.0004284237494985672, 'samples': 7403520, 'steps': 38559, 'loss/train': 1.651281714439392} -11/07/2021 02:39:15 - INFO - __main__ - Step 38561: {'lr': 0.0004284200323142623, 'samples': 7403712, 'steps': 38560, 'loss/train': 2.0764431953430176} -11/07/2021 02:39:16 - INFO - __main__ - Step 38562: {'lr': 0.0004284163150495641, 'samples': 7403904, 'steps': 38561, 'loss/train': 1.2969495058059692} -11/07/2021 02:39:17 - INFO - __main__ - Step 38563: {'lr': 0.00042841259770447427, 'samples': 7404096, 'steps': 38562, 'loss/train': 1.4701931476593018} -11/07/2021 02:39:17 - INFO - __main__ - Step 38564: {'lr': 0.00042840888027899436, 'samples': 7404288, 'steps': 38563, 'loss/train': 1.3531675338745117} -11/07/2021 02:39:18 - INFO - __main__ - Step 38565: {'lr': 0.0004284051627731263, 'samples': 7404480, 'steps': 38564, 'loss/train': 1.5186748504638672} -11/07/2021 02:39:18 - INFO - __main__ - Step 38566: {'lr': 0.0004284014451868716, 'samples': 7404672, 'steps': 38565, 'loss/train': 1.763478398323059} -11/07/2021 02:39:18 - INFO - __main__ - Step 38567: {'lr': 0.0004283977275202319, 'samples': 7404864, 'steps': 38566, 'loss/train': 1.5161564350128174} -11/07/2021 02:39:19 - INFO - __main__ - Step 38568: {'lr': 0.00042839400977320895, 'samples': 7405056, 'steps': 38567, 'loss/train': 1.660630226135254} -11/07/2021 02:39:20 - INFO - __main__ - Step 38569: {'lr': 0.00042839029194580446, 'samples': 7405248, 'steps': 38568, 'loss/train': 1.5722196102142334} -11/07/2021 02:39:20 - INFO - __main__ - Step 38570: {'lr': 0.0004283865740380201, 'samples': 7405440, 'steps': 38569, 'loss/train': 1.3853479623794556} -11/07/2021 02:39:20 - INFO - __main__ - Step 38571: {'lr': 0.0004283828560498574, 'samples': 7405632, 'steps': 38570, 'loss/train': 0.9588892459869385} -11/07/2021 02:39:21 - INFO - __main__ - Step 38572: {'lr': 0.0004283791379813181, 'samples': 7405824, 'steps': 38571, 'loss/train': 1.5066494941711426} -11/07/2021 02:39:22 - INFO - __main__ - Step 38573: {'lr': 0.000428375419832404, 'samples': 7406016, 'steps': 38572, 'loss/train': 1.527634620666504} -11/07/2021 02:39:22 - INFO - __main__ - Step 38574: {'lr': 0.0004283717016031167, 'samples': 7406208, 'steps': 38573, 'loss/train': 1.3006707429885864} -11/07/2021 02:39:22 - INFO - __main__ - Step 38575: {'lr': 0.0004283679832934578, 'samples': 7406400, 'steps': 38574, 'loss/train': 1.6669787168502808} -11/07/2021 02:39:23 - INFO - __main__ - Step 38576: {'lr': 0.0004283642649034291, 'samples': 7406592, 'steps': 38575, 'loss/train': 1.7991132736206055} -11/07/2021 02:39:23 - INFO - __main__ - Step 38577: {'lr': 0.00042836054643303226, 'samples': 7406784, 'steps': 38576, 'loss/train': 2.0059776306152344} -11/07/2021 02:39:24 - INFO - __main__ - Step 38578: {'lr': 0.0004283568278822688, 'samples': 7406976, 'steps': 38577, 'loss/train': 0.8108773827552795} -11/07/2021 02:39:25 - INFO - __main__ - Step 38579: {'lr': 0.0004283531092511405, 'samples': 7407168, 'steps': 38578, 'loss/train': 1.2539422512054443} -11/07/2021 02:39:25 - INFO - __main__ - Step 38580: {'lr': 0.0004283493905396491, 'samples': 7407360, 'steps': 38579, 'loss/train': 0.8251067996025085} -11/07/2021 02:39:25 - INFO - __main__ - Step 38581: {'lr': 0.00042834567174779623, 'samples': 7407552, 'steps': 38580, 'loss/train': 1.5102128982543945} -11/07/2021 02:39:26 - INFO - __main__ - Step 38582: {'lr': 0.00042834195287558356, 'samples': 7407744, 'steps': 38581, 'loss/train': 1.4471834897994995} -11/07/2021 02:39:26 - INFO - __main__ - Step 38583: {'lr': 0.00042833823392301264, 'samples': 7407936, 'steps': 38582, 'loss/train': 0.9997994303703308} -11/07/2021 02:39:27 - INFO - __main__ - Step 38584: {'lr': 0.00042833451489008537, 'samples': 7408128, 'steps': 38583, 'loss/train': 0.7278831005096436} -11/07/2021 02:39:27 - INFO - __main__ - Step 38585: {'lr': 0.00042833079577680327, 'samples': 7408320, 'steps': 38584, 'loss/train': 1.4909403324127197} -11/07/2021 02:39:28 - INFO - __main__ - Step 38586: {'lr': 0.0004283270765831682, 'samples': 7408512, 'steps': 38585, 'loss/train': 1.8982082605361938} -11/07/2021 02:39:28 - INFO - __main__ - Step 38587: {'lr': 0.00042832335730918147, 'samples': 7408704, 'steps': 38586, 'loss/train': 1.4644055366516113} -11/07/2021 02:39:29 - INFO - __main__ - Step 38588: {'lr': 0.0004283196379548451, 'samples': 7408896, 'steps': 38587, 'loss/train': 1.6861553192138672} -11/07/2021 02:39:30 - INFO - __main__ - Step 38589: {'lr': 0.0004283159185201607, 'samples': 7409088, 'steps': 38588, 'loss/train': 1.7528589963912964} -11/07/2021 02:39:30 - INFO - __main__ - Step 38590: {'lr': 0.00042831219900512984, 'samples': 7409280, 'steps': 38589, 'loss/train': 1.5910186767578125} -11/07/2021 02:39:30 - INFO - __main__ - Step 38591: {'lr': 0.0004283084794097543, 'samples': 7409472, 'steps': 38590, 'loss/train': 1.6175768375396729} -11/07/2021 02:39:31 - INFO - __main__ - Step 38592: {'lr': 0.00042830475973403573, 'samples': 7409664, 'steps': 38591, 'loss/train': 0.31639763712882996} -11/07/2021 02:39:31 - INFO - __main__ - Step 38593: {'lr': 0.0004283010399779757, 'samples': 7409856, 'steps': 38592, 'loss/train': 1.6801315546035767} -11/07/2021 02:39:32 - INFO - __main__ - Step 38594: {'lr': 0.000428297320141576, 'samples': 7410048, 'steps': 38593, 'loss/train': 1.7525479793548584} -11/07/2021 02:39:32 - INFO - __main__ - Step 38595: {'lr': 0.0004282936002248383, 'samples': 7410240, 'steps': 38594, 'loss/train': 1.3758429288864136} -11/07/2021 02:39:33 - INFO - __main__ - Step 38596: {'lr': 0.00042828988022776426, 'samples': 7410432, 'steps': 38595, 'loss/train': 1.3587149381637573} -11/07/2021 02:39:33 - INFO - __main__ - Step 38597: {'lr': 0.00042828616015035554, 'samples': 7410624, 'steps': 38596, 'loss/train': 1.565584659576416} -11/07/2021 02:39:33 - INFO - __main__ - Step 38598: {'lr': 0.00042828243999261384, 'samples': 7410816, 'steps': 38597, 'loss/train': 1.705330491065979} -11/07/2021 02:39:34 - INFO - __main__ - Step 38599: {'lr': 0.0004282787197545408, 'samples': 7411008, 'steps': 38598, 'loss/train': 1.0509960651397705} -11/07/2021 02:39:35 - INFO - __main__ - Step 38600: {'lr': 0.00042827499943613815, 'samples': 7411200, 'steps': 38599, 'loss/train': 1.2314541339874268} -11/07/2021 02:39:35 - INFO - __main__ - Step 38601: {'lr': 0.00042827127903740747, 'samples': 7411392, 'steps': 38600, 'loss/train': 1.5458012819290161} -11/07/2021 02:39:36 - INFO - __main__ - Step 38602: {'lr': 0.00042826755855835053, 'samples': 7411584, 'steps': 38601, 'loss/train': 1.6242434978485107} -11/07/2021 02:39:36 - INFO - __main__ - Step 38603: {'lr': 0.00042826383799896906, 'samples': 7411776, 'steps': 38602, 'loss/train': 1.4507431983947754} -11/07/2021 02:39:36 - INFO - __main__ - Step 38604: {'lr': 0.0004282601173592646, 'samples': 7411968, 'steps': 38603, 'loss/train': 1.4450706243515015} -11/07/2021 02:39:37 - INFO - __main__ - Step 38605: {'lr': 0.0004282563966392389, 'samples': 7412160, 'steps': 38604, 'loss/train': 1.1748977899551392} -11/07/2021 02:39:38 - INFO - __main__ - Step 38606: {'lr': 0.00042825267583889354, 'samples': 7412352, 'steps': 38605, 'loss/train': 1.4789282083511353} -11/07/2021 02:39:38 - INFO - __main__ - Step 38607: {'lr': 0.00042824895495823033, 'samples': 7412544, 'steps': 38606, 'loss/train': 1.350877285003662} -11/07/2021 02:39:38 - INFO - __main__ - Step 38608: {'lr': 0.0004282452339972509, 'samples': 7412736, 'steps': 38607, 'loss/train': 0.5122175216674805} -11/07/2021 02:39:39 - INFO - __main__ - Step 38609: {'lr': 0.00042824151295595695, 'samples': 7412928, 'steps': 38608, 'loss/train': 1.9182634353637695} -11/07/2021 02:39:40 - INFO - __main__ - Step 38610: {'lr': 0.0004282377918343501, 'samples': 7413120, 'steps': 38609, 'loss/train': 1.5004831552505493} -11/07/2021 02:39:40 - INFO - __main__ - Step 38611: {'lr': 0.00042823407063243197, 'samples': 7413312, 'steps': 38610, 'loss/train': 1.1725540161132812} -11/07/2021 02:39:40 - INFO - __main__ - Step 38612: {'lr': 0.0004282303493502044, 'samples': 7413504, 'steps': 38611, 'loss/train': 0.6597931981086731} -11/07/2021 02:39:41 - INFO - __main__ - Step 38613: {'lr': 0.000428226627987669, 'samples': 7413696, 'steps': 38612, 'loss/train': 1.3209978342056274} -11/07/2021 02:39:41 - INFO - __main__ - Step 38614: {'lr': 0.0004282229065448273, 'samples': 7413888, 'steps': 38613, 'loss/train': 1.6144988536834717} -11/07/2021 02:39:42 - INFO - __main__ - Step 38615: {'lr': 0.0004282191850216812, 'samples': 7414080, 'steps': 38614, 'loss/train': 1.519603967666626} -11/07/2021 02:39:42 - INFO - __main__ - Step 38616: {'lr': 0.00042821546341823236, 'samples': 7414272, 'steps': 38615, 'loss/train': 1.4626085758209229} -11/07/2021 02:39:43 - INFO - __main__ - Step 38617: {'lr': 0.0004282117417344823, 'samples': 7414464, 'steps': 38616, 'loss/train': 1.5803148746490479} -11/07/2021 02:39:43 - INFO - __main__ - Step 38618: {'lr': 0.00042820801997043277, 'samples': 7414656, 'steps': 38617, 'loss/train': 1.4064488410949707} -11/07/2021 02:39:43 - INFO - __main__ - Step 38619: {'lr': 0.0004282042981260855, 'samples': 7414848, 'steps': 38618, 'loss/train': 1.533360481262207} -11/07/2021 02:39:44 - INFO - __main__ - Step 38620: {'lr': 0.00042820057620144214, 'samples': 7415040, 'steps': 38619, 'loss/train': 1.3826243877410889} -11/07/2021 02:39:45 - INFO - __main__ - Step 38621: {'lr': 0.00042819685419650427, 'samples': 7415232, 'steps': 38620, 'loss/train': 1.0208340883255005} -11/07/2021 02:39:45 - INFO - __main__ - Step 38622: {'lr': 0.0004281931321112737, 'samples': 7415424, 'steps': 38621, 'loss/train': 1.1382410526275635} -11/07/2021 02:39:45 - INFO - __main__ - Step 38623: {'lr': 0.0004281894099457521, 'samples': 7415616, 'steps': 38622, 'loss/train': 1.4776126146316528} -11/07/2021 02:39:46 - INFO - __main__ - Step 38624: {'lr': 0.00042818568769994103, 'samples': 7415808, 'steps': 38623, 'loss/train': 0.15500399470329285} -11/07/2021 02:39:47 - INFO - __main__ - Step 38625: {'lr': 0.00042818196537384225, 'samples': 7416000, 'steps': 38624, 'loss/train': 1.2261273860931396} -11/07/2021 02:39:47 - INFO - __main__ - Step 38626: {'lr': 0.0004281782429674574, 'samples': 7416192, 'steps': 38625, 'loss/train': 1.6735538244247437} -11/07/2021 02:39:48 - INFO - __main__ - Step 38627: {'lr': 0.0004281745204807882, 'samples': 7416384, 'steps': 38626, 'loss/train': 1.849352478981018} -11/07/2021 02:39:48 - INFO - __main__ - Step 38628: {'lr': 0.00042817079791383636, 'samples': 7416576, 'steps': 38627, 'loss/train': 1.77236807346344} -11/07/2021 02:39:48 - INFO - __main__ - Step 38629: {'lr': 0.00042816707526660346, 'samples': 7416768, 'steps': 38628, 'loss/train': 1.4409795999526978} -11/07/2021 02:39:49 - INFO - __main__ - Step 38630: {'lr': 0.00042816335253909125, 'samples': 7416960, 'steps': 38629, 'loss/train': 1.3015356063842773} -11/07/2021 02:39:50 - INFO - __main__ - Step 38631: {'lr': 0.00042815962973130134, 'samples': 7417152, 'steps': 38630, 'loss/train': 1.5178568363189697} -11/07/2021 02:39:50 - INFO - __main__ - Step 38632: {'lr': 0.00042815590684323554, 'samples': 7417344, 'steps': 38631, 'loss/train': 1.4378799200057983} -11/07/2021 02:39:50 - INFO - __main__ - Step 38633: {'lr': 0.00042815218387489535, 'samples': 7417536, 'steps': 38632, 'loss/train': 1.3826674222946167} -11/07/2021 02:39:51 - INFO - __main__ - Step 38634: {'lr': 0.00042814846082628256, 'samples': 7417728, 'steps': 38633, 'loss/train': 1.2611559629440308} -11/07/2021 02:39:51 - INFO - __main__ - Step 38635: {'lr': 0.0004281447376973988, 'samples': 7417920, 'steps': 38634, 'loss/train': 1.0202590227127075} -11/07/2021 02:39:52 - INFO - __main__ - Step 38636: {'lr': 0.00042814101448824583, 'samples': 7418112, 'steps': 38635, 'loss/train': 1.3930331468582153} -11/07/2021 02:39:52 - INFO - __main__ - Step 38637: {'lr': 0.0004281372911988253, 'samples': 7418304, 'steps': 38636, 'loss/train': 1.5592061281204224} -11/07/2021 02:39:53 - INFO - __main__ - Step 38638: {'lr': 0.0004281335678291387, 'samples': 7418496, 'steps': 38637, 'loss/train': 1.780315637588501} -11/07/2021 02:39:53 - INFO - __main__ - Step 38639: {'lr': 0.000428129844379188, 'samples': 7418688, 'steps': 38638, 'loss/train': 1.7167903184890747} -11/07/2021 02:39:53 - INFO - __main__ - Step 38640: {'lr': 0.0004281261208489747, 'samples': 7418880, 'steps': 38639, 'loss/train': 1.198464274406433} -11/07/2021 02:39:54 - INFO - __main__ - Step 38641: {'lr': 0.0004281223972385004, 'samples': 7419072, 'steps': 38640, 'loss/train': 1.5182913541793823} -11/07/2021 02:39:55 - INFO - __main__ - Step 38642: {'lr': 0.00042811867354776705, 'samples': 7419264, 'steps': 38641, 'loss/train': 1.1084949970245361} -11/07/2021 02:39:55 - INFO - __main__ - Step 38643: {'lr': 0.0004281149497767761, 'samples': 7419456, 'steps': 38642, 'loss/train': 1.3935750722885132} -11/07/2021 02:39:56 - INFO - __main__ - Step 38644: {'lr': 0.00042811122592552943, 'samples': 7419648, 'steps': 38643, 'loss/train': 1.4061126708984375} -11/07/2021 02:39:56 - INFO - __main__ - Step 38645: {'lr': 0.0004281075019940285, 'samples': 7419840, 'steps': 38644, 'loss/train': 1.5206317901611328} -11/07/2021 02:39:57 - INFO - __main__ - Step 38646: {'lr': 0.00042810377798227506, 'samples': 7420032, 'steps': 38645, 'loss/train': 1.5615888833999634} -11/07/2021 02:39:57 - INFO - __main__ - Step 38647: {'lr': 0.00042810005389027077, 'samples': 7420224, 'steps': 38646, 'loss/train': 1.8336944580078125} -11/07/2021 02:39:58 - INFO - __main__ - Step 38648: {'lr': 0.0004280963297180174, 'samples': 7420416, 'steps': 38647, 'loss/train': 1.5942424535751343} -11/07/2021 02:39:58 - INFO - __main__ - Step 38649: {'lr': 0.0004280926054655165, 'samples': 7420608, 'steps': 38648, 'loss/train': 1.7997180223464966} -11/07/2021 02:39:58 - INFO - __main__ - Step 38650: {'lr': 0.00042808888113277, 'samples': 7420800, 'steps': 38649, 'loss/train': 1.1809117794036865} -11/07/2021 02:40:00 - INFO - __main__ - Step 38651: {'lr': 0.0004280851567197792, 'samples': 7420992, 'steps': 38650, 'loss/train': 1.705949068069458} -11/07/2021 02:40:00 - INFO - __main__ - Step 38652: {'lr': 0.0004280814322265461, 'samples': 7421184, 'steps': 38651, 'loss/train': 2.073387384414673} -11/07/2021 02:40:00 - INFO - __main__ - Step 38653: {'lr': 0.00042807770765307217, 'samples': 7421376, 'steps': 38652, 'loss/train': 0.7365889549255371} -11/07/2021 02:40:01 - INFO - __main__ - Step 38654: {'lr': 0.00042807398299935927, 'samples': 7421568, 'steps': 38653, 'loss/train': 0.6344184875488281} -11/07/2021 02:40:01 - INFO - __main__ - Step 38655: {'lr': 0.0004280702582654089, 'samples': 7421760, 'steps': 38654, 'loss/train': 2.5534884929656982} -11/07/2021 02:40:01 - INFO - __main__ - Step 38656: {'lr': 0.00042806653345122287, 'samples': 7421952, 'steps': 38655, 'loss/train': 1.5213661193847656} -11/07/2021 02:40:02 - INFO - __main__ - Step 38657: {'lr': 0.0004280628085568028, 'samples': 7422144, 'steps': 38656, 'loss/train': 1.452724814414978} -11/07/2021 02:40:03 - INFO - __main__ - Step 38658: {'lr': 0.0004280590835821503, 'samples': 7422336, 'steps': 38657, 'loss/train': 2.2942631244659424} -11/07/2021 02:40:03 - INFO - __main__ - Step 38659: {'lr': 0.0004280553585272672, 'samples': 7422528, 'steps': 38658, 'loss/train': 1.8796608448028564} -11/07/2021 02:40:03 - INFO - __main__ - Step 38660: {'lr': 0.0004280516333921551, 'samples': 7422720, 'steps': 38659, 'loss/train': 2.2061965465545654} -11/07/2021 02:40:04 - INFO - __main__ - Step 38661: {'lr': 0.00042804790817681574, 'samples': 7422912, 'steps': 38660, 'loss/train': 1.398537039756775} -11/07/2021 02:40:06 - INFO - __main__ - Step 38662: {'lr': 0.0004280441828812506, 'samples': 7423104, 'steps': 38661, 'loss/train': 1.5821424722671509} -11/07/2021 02:40:06 - INFO - __main__ - Step 38663: {'lr': 0.0004280404575054616, 'samples': 7423296, 'steps': 38662, 'loss/train': 2.0686147212982178} -11/07/2021 02:40:06 - INFO - __main__ - Step 38664: {'lr': 0.00042803673204945027, 'samples': 7423488, 'steps': 38663, 'loss/train': 2.4432177543640137} -11/07/2021 02:40:07 - INFO - __main__ - Step 38665: {'lr': 0.0004280330065132184, 'samples': 7423680, 'steps': 38664, 'loss/train': 0.8475606441497803} -11/07/2021 02:40:07 - INFO - __main__ - Step 38666: {'lr': 0.0004280292808967675, 'samples': 7423872, 'steps': 38665, 'loss/train': 0.8151193857192993} -11/07/2021 02:40:07 - INFO - __main__ - Step 38667: {'lr': 0.00042802555520009945, 'samples': 7424064, 'steps': 38666, 'loss/train': 1.1058653593063354} -11/07/2021 02:40:08 - INFO - __main__ - Step 38668: {'lr': 0.00042802182942321576, 'samples': 7424256, 'steps': 38667, 'loss/train': 1.372496485710144} -11/07/2021 02:40:09 - INFO - __main__ - Step 38669: {'lr': 0.0004280181035661182, 'samples': 7424448, 'steps': 38668, 'loss/train': 1.6026809215545654} -11/07/2021 02:40:09 - INFO - __main__ - Step 38670: {'lr': 0.0004280143776288085, 'samples': 7424640, 'steps': 38669, 'loss/train': 1.6136150360107422} -11/07/2021 02:40:09 - INFO - __main__ - Step 38671: {'lr': 0.00042801065161128814, 'samples': 7424832, 'steps': 38670, 'loss/train': 1.3479188680648804} -11/07/2021 02:40:10 - INFO - __main__ - Step 38672: {'lr': 0.000428006925513559, 'samples': 7425024, 'steps': 38671, 'loss/train': 1.8654686212539673} -11/07/2021 02:40:11 - INFO - __main__ - Step 38673: {'lr': 0.0004280031993356227, 'samples': 7425216, 'steps': 38672, 'loss/train': 1.4852941036224365} -11/07/2021 02:40:11 - INFO - __main__ - Step 38674: {'lr': 0.00042799947307748087, 'samples': 7425408, 'steps': 38673, 'loss/train': 1.26423978805542} -11/07/2021 02:40:12 - INFO - __main__ - Step 38675: {'lr': 0.0004279957467391353, 'samples': 7425600, 'steps': 38674, 'loss/train': 1.5272585153579712} -11/07/2021 02:40:12 - INFO - __main__ - Step 38676: {'lr': 0.0004279920203205875, 'samples': 7425792, 'steps': 38675, 'loss/train': 1.5036089420318604} -11/07/2021 02:40:12 - INFO - __main__ - Step 38677: {'lr': 0.0004279882938218393, 'samples': 7425984, 'steps': 38676, 'loss/train': 1.2998476028442383} -11/07/2021 02:40:13 - INFO - __main__ - Step 38678: {'lr': 0.00042798456724289227, 'samples': 7426176, 'steps': 38677, 'loss/train': 1.3719924688339233} -11/07/2021 02:40:14 - INFO - __main__ - Step 38679: {'lr': 0.0004279808405837482, 'samples': 7426368, 'steps': 38678, 'loss/train': 1.4804455041885376} -11/07/2021 02:40:14 - INFO - __main__ - Step 38680: {'lr': 0.00042797711384440863, 'samples': 7426560, 'steps': 38679, 'loss/train': 1.239966630935669} -11/07/2021 02:40:14 - INFO - __main__ - Step 38681: {'lr': 0.0004279733870248754, 'samples': 7426752, 'steps': 38680, 'loss/train': 1.6720571517944336} -11/07/2021 02:40:15 - INFO - __main__ - Step 38682: {'lr': 0.00042796966012515007, 'samples': 7426944, 'steps': 38681, 'loss/train': 1.2801110744476318} -11/07/2021 02:40:15 - INFO - __main__ - Step 38683: {'lr': 0.00042796593314523435, 'samples': 7427136, 'steps': 38682, 'loss/train': 1.1848257780075073} -11/07/2021 02:40:16 - INFO - __main__ - Step 38684: {'lr': 0.0004279622060851299, 'samples': 7427328, 'steps': 38683, 'loss/train': 1.4435261487960815} -11/07/2021 02:40:16 - INFO - __main__ - Step 38685: {'lr': 0.0004279584789448385, 'samples': 7427520, 'steps': 38684, 'loss/train': 1.6397520303726196} -11/07/2021 02:40:17 - INFO - __main__ - Step 38686: {'lr': 0.0004279547517243617, 'samples': 7427712, 'steps': 38685, 'loss/train': 2.541539430618286} -11/07/2021 02:40:17 - INFO - __main__ - Step 38687: {'lr': 0.00042795102442370127, 'samples': 7427904, 'steps': 38686, 'loss/train': 1.6271125078201294} -11/07/2021 02:40:17 - INFO - __main__ - Step 38688: {'lr': 0.0004279472970428588, 'samples': 7428096, 'steps': 38687, 'loss/train': 0.9081865549087524} -11/07/2021 02:40:19 - INFO - __main__ - Step 38689: {'lr': 0.0004279435695818361, 'samples': 7428288, 'steps': 38688, 'loss/train': 1.785889983177185} -11/07/2021 02:40:19 - INFO - __main__ - Step 38690: {'lr': 0.00042793984204063477, 'samples': 7428480, 'steps': 38689, 'loss/train': 1.6187974214553833} -11/07/2021 02:40:19 - INFO - __main__ - Step 38691: {'lr': 0.0004279361144192565, 'samples': 7428672, 'steps': 38690, 'loss/train': 1.9208132028579712} -11/07/2021 02:40:20 - INFO - __main__ - Step 38692: {'lr': 0.00042793238671770285, 'samples': 7428864, 'steps': 38691, 'loss/train': 1.7893801927566528} -11/07/2021 02:40:20 - INFO - __main__ - Step 38693: {'lr': 0.0004279286589359757, 'samples': 7429056, 'steps': 38692, 'loss/train': 1.4303791522979736} -11/07/2021 02:40:21 - INFO - __main__ - Step 38694: {'lr': 0.00042792493107407666, 'samples': 7429248, 'steps': 38693, 'loss/train': 1.673890471458435} -11/07/2021 02:40:21 - INFO - __main__ - Step 38695: {'lr': 0.0004279212031320073, 'samples': 7429440, 'steps': 38694, 'loss/train': 1.5759137868881226} -11/07/2021 02:40:22 - INFO - __main__ - Step 38696: {'lr': 0.00042791747510976955, 'samples': 7429632, 'steps': 38695, 'loss/train': 1.9982209205627441} -11/07/2021 02:40:22 - INFO - __main__ - Step 38697: {'lr': 0.0004279137470073648, 'samples': 7429824, 'steps': 38696, 'loss/train': 1.5088738203048706} -11/07/2021 02:40:22 - INFO - __main__ - Step 38698: {'lr': 0.00042791001882479485, 'samples': 7430016, 'steps': 38697, 'loss/train': 1.8029636144638062} -11/07/2021 02:40:23 - INFO - __main__ - Step 38699: {'lr': 0.0004279062905620614, 'samples': 7430208, 'steps': 38698, 'loss/train': 1.0119118690490723} -11/07/2021 02:40:24 - INFO - __main__ - Step 38700: {'lr': 0.0004279025622191662, 'samples': 7430400, 'steps': 38699, 'loss/train': 1.4782328605651855} -11/07/2021 02:40:24 - INFO - __main__ - Step 38701: {'lr': 0.00042789883379611084, 'samples': 7430592, 'steps': 38700, 'loss/train': 1.4868354797363281} -11/07/2021 02:40:24 - INFO - __main__ - Step 38702: {'lr': 0.000427895105292897, 'samples': 7430784, 'steps': 38701, 'loss/train': 1.3261916637420654} -11/07/2021 02:40:25 - INFO - __main__ - Step 38703: {'lr': 0.00042789137670952627, 'samples': 7430976, 'steps': 38702, 'loss/train': 1.4865633249282837} -11/07/2021 02:40:25 - INFO - __main__ - Step 38704: {'lr': 0.00042788764804600055, 'samples': 7431168, 'steps': 38703, 'loss/train': 1.27956223487854} -11/07/2021 02:40:26 - INFO - __main__ - Step 38705: {'lr': 0.0004278839193023214, 'samples': 7431360, 'steps': 38704, 'loss/train': 1.390254259109497} -11/07/2021 02:40:27 - INFO - __main__ - Step 38706: {'lr': 0.0004278801904784904, 'samples': 7431552, 'steps': 38705, 'loss/train': 1.5037397146224976} -11/07/2021 02:40:27 - INFO - __main__ - Step 38707: {'lr': 0.00042787646157450946, 'samples': 7431744, 'steps': 38706, 'loss/train': 1.4711500406265259} -11/07/2021 02:40:27 - INFO - __main__ - Step 38708: {'lr': 0.00042787273259038, 'samples': 7431936, 'steps': 38707, 'loss/train': 1.1879253387451172} -11/07/2021 02:40:28 - INFO - __main__ - Step 38709: {'lr': 0.00042786900352610393, 'samples': 7432128, 'steps': 38708, 'loss/train': 1.1754286289215088} -11/07/2021 02:40:29 - INFO - __main__ - Step 38710: {'lr': 0.0004278652743816828, 'samples': 7432320, 'steps': 38709, 'loss/train': 1.3880391120910645} -11/07/2021 02:40:29 - INFO - __main__ - Step 38711: {'lr': 0.00042786154515711826, 'samples': 7432512, 'steps': 38710, 'loss/train': 0.7310174703598022} -11/07/2021 02:40:29 - INFO - __main__ - Step 38712: {'lr': 0.0004278578158524121, 'samples': 7432704, 'steps': 38711, 'loss/train': 2.104560136795044} -11/07/2021 02:40:30 - INFO - __main__ - Step 38713: {'lr': 0.00042785408646756594, 'samples': 7432896, 'steps': 38712, 'loss/train': 1.6006711721420288} -11/07/2021 02:40:30 - INFO - __main__ - Step 38714: {'lr': 0.0004278503570025816, 'samples': 7433088, 'steps': 38713, 'loss/train': 1.1154862642288208} -11/07/2021 02:40:31 - INFO - __main__ - Step 38715: {'lr': 0.0004278466274574605, 'samples': 7433280, 'steps': 38714, 'loss/train': 0.30776089429855347} -11/07/2021 02:40:32 - INFO - __main__ - Step 38716: {'lr': 0.0004278428978322044, 'samples': 7433472, 'steps': 38715, 'loss/train': 1.6656759977340698} -11/07/2021 02:40:32 - INFO - __main__ - Step 38717: {'lr': 0.00042783916812681516, 'samples': 7433664, 'steps': 38716, 'loss/train': 2.2830231189727783} -11/07/2021 02:40:32 - INFO - __main__ - Step 38718: {'lr': 0.0004278354383412943, 'samples': 7433856, 'steps': 38717, 'loss/train': 1.4579813480377197} -11/07/2021 02:40:33 - INFO - __main__ - Step 38719: {'lr': 0.0004278317084756435, 'samples': 7434048, 'steps': 38718, 'loss/train': 1.6667070388793945} -11/07/2021 02:40:33 - INFO - __main__ - Step 38720: {'lr': 0.00042782797852986454, 'samples': 7434240, 'steps': 38719, 'loss/train': 1.509294033050537} -11/07/2021 02:40:34 - INFO - __main__ - Step 38721: {'lr': 0.00042782424850395894, 'samples': 7434432, 'steps': 38720, 'loss/train': 1.7709182500839233} -11/07/2021 02:40:34 - INFO - __main__ - Step 38722: {'lr': 0.00042782051839792857, 'samples': 7434624, 'steps': 38721, 'loss/train': 0.7755714654922485} -11/07/2021 02:40:35 - INFO - __main__ - Step 38723: {'lr': 0.000427816788211775, 'samples': 7434816, 'steps': 38722, 'loss/train': 1.6787524223327637} -11/07/2021 02:40:35 - INFO - __main__ - Step 38724: {'lr': 0.00042781305794549994, 'samples': 7435008, 'steps': 38723, 'loss/train': 1.6378754377365112} -11/07/2021 02:40:35 - INFO - __main__ - Step 38725: {'lr': 0.00042780932759910504, 'samples': 7435200, 'steps': 38724, 'loss/train': 1.700057864189148} -11/07/2021 02:40:36 - INFO - __main__ - Step 38726: {'lr': 0.00042780559717259194, 'samples': 7435392, 'steps': 38725, 'loss/train': 1.517086148262024} -11/07/2021 02:40:37 - INFO - __main__ - Step 38727: {'lr': 0.0004278018666659624, 'samples': 7435584, 'steps': 38726, 'loss/train': 1.5830868482589722} -11/07/2021 02:40:37 - INFO - __main__ - Step 38728: {'lr': 0.0004277981360792182, 'samples': 7435776, 'steps': 38727, 'loss/train': 1.8037893772125244} -11/07/2021 02:40:38 - INFO - __main__ - Step 38729: {'lr': 0.0004277944054123608, 'samples': 7435968, 'steps': 38728, 'loss/train': 1.5496574640274048} -11/07/2021 02:40:38 - INFO - __main__ - Step 38730: {'lr': 0.000427790674665392, 'samples': 7436160, 'steps': 38729, 'loss/train': 1.3973135948181152} -11/07/2021 02:40:39 - INFO - __main__ - Step 38731: {'lr': 0.00042778694383831354, 'samples': 7436352, 'steps': 38730, 'loss/train': 1.558529257774353} -11/07/2021 02:40:39 - INFO - __main__ - Step 38732: {'lr': 0.0004277832129311269, 'samples': 7436544, 'steps': 38731, 'loss/train': 1.8024917840957642} -11/07/2021 02:40:40 - INFO - __main__ - Step 38733: {'lr': 0.000427779481943834, 'samples': 7436736, 'steps': 38732, 'loss/train': 1.8078402280807495} -11/07/2021 02:40:40 - INFO - __main__ - Step 38734: {'lr': 0.0004277757508764363, 'samples': 7436928, 'steps': 38733, 'loss/train': 1.2723112106323242} -11/07/2021 02:40:40 - INFO - __main__ - Step 38735: {'lr': 0.00042777201972893564, 'samples': 7437120, 'steps': 38734, 'loss/train': 1.5691598653793335} -11/07/2021 02:40:41 - INFO - __main__ - Step 38736: {'lr': 0.00042776828850133364, 'samples': 7437312, 'steps': 38735, 'loss/train': 1.4892206192016602} -11/07/2021 02:40:42 - INFO - __main__ - Step 38737: {'lr': 0.0004277645571936321, 'samples': 7437504, 'steps': 38736, 'loss/train': 1.7327055931091309} -11/07/2021 02:40:42 - INFO - __main__ - Step 38738: {'lr': 0.0004277608258058324, 'samples': 7437696, 'steps': 38737, 'loss/train': 1.7947583198547363} -11/07/2021 02:40:42 - INFO - __main__ - Step 38739: {'lr': 0.00042775709433793657, 'samples': 7437888, 'steps': 38738, 'loss/train': 1.4090418815612793} -11/07/2021 02:40:43 - INFO - __main__ - Step 38740: {'lr': 0.0004277533627899461, 'samples': 7438080, 'steps': 38739, 'loss/train': 1.3038268089294434} -11/07/2021 02:40:44 - INFO - __main__ - Step 38741: {'lr': 0.00042774963116186274, 'samples': 7438272, 'steps': 38740, 'loss/train': 1.4376336336135864} -11/07/2021 02:40:44 - INFO - __main__ - Step 38742: {'lr': 0.000427745899453688, 'samples': 7438464, 'steps': 38741, 'loss/train': 1.7706702947616577} -11/07/2021 02:40:44 - INFO - __main__ - Step 38743: {'lr': 0.00042774216766542386, 'samples': 7438656, 'steps': 38742, 'loss/train': 1.64524245262146} -11/07/2021 02:40:45 - INFO - __main__ - Step 38744: {'lr': 0.0004277384357970717, 'samples': 7438848, 'steps': 38743, 'loss/train': 1.289526104927063} -11/07/2021 02:40:45 - INFO - __main__ - Step 38745: {'lr': 0.00042773470384863344, 'samples': 7439040, 'steps': 38744, 'loss/train': 1.7782156467437744} -11/07/2021 02:40:45 - INFO - __main__ - Step 38746: {'lr': 0.0004277309718201107, 'samples': 7439232, 'steps': 38745, 'loss/train': 1.1813396215438843} -11/07/2021 02:40:46 - INFO - __main__ - Step 38747: {'lr': 0.000427727239711505, 'samples': 7439424, 'steps': 38746, 'loss/train': 1.3218621015548706} -11/07/2021 02:40:47 - INFO - __main__ - Step 38748: {'lr': 0.00042772350752281823, 'samples': 7439616, 'steps': 38747, 'loss/train': 1.8541260957717896} -11/07/2021 02:40:47 - INFO - __main__ - Step 38749: {'lr': 0.000427719775254052, 'samples': 7439808, 'steps': 38748, 'loss/train': 1.7880030870437622} -11/07/2021 02:40:47 - INFO - __main__ - Step 38750: {'lr': 0.00042771604290520795, 'samples': 7440000, 'steps': 38749, 'loss/train': 1.229604959487915} -11/07/2021 02:40:48 - INFO - __main__ - Step 38751: {'lr': 0.00042771231047628776, 'samples': 7440192, 'steps': 38750, 'loss/train': 1.1183679103851318} -11/07/2021 02:40:49 - INFO - __main__ - Step 38752: {'lr': 0.0004277085779672932, 'samples': 7440384, 'steps': 38751, 'loss/train': 1.9162299633026123} -11/07/2021 02:40:49 - INFO - __main__ - Step 38753: {'lr': 0.0004277048453782259, 'samples': 7440576, 'steps': 38752, 'loss/train': 1.6994130611419678} -11/07/2021 02:40:50 - INFO - __main__ - Step 38754: {'lr': 0.0004277011127090875, 'samples': 7440768, 'steps': 38753, 'loss/train': 2.003278970718384} -11/07/2021 02:40:50 - INFO - __main__ - Step 38755: {'lr': 0.0004276973799598798, 'samples': 7440960, 'steps': 38754, 'loss/train': 1.5014312267303467} -11/07/2021 02:40:50 - INFO - __main__ - Step 38756: {'lr': 0.0004276936471306043, 'samples': 7441152, 'steps': 38755, 'loss/train': 1.0279024839401245} -11/07/2021 02:40:51 - INFO - __main__ - Step 38757: {'lr': 0.00042768991422126285, 'samples': 7441344, 'steps': 38756, 'loss/train': 0.6809089183807373} -11/07/2021 02:40:52 - INFO - __main__ - Step 38758: {'lr': 0.00042768618123185703, 'samples': 7441536, 'steps': 38757, 'loss/train': 1.3736629486083984} -11/07/2021 02:40:52 - INFO - __main__ - Step 38759: {'lr': 0.00042768244816238863, 'samples': 7441728, 'steps': 38758, 'loss/train': 1.0637315511703491} -11/07/2021 02:40:52 - INFO - __main__ - Step 38760: {'lr': 0.00042767871501285916, 'samples': 7441920, 'steps': 38759, 'loss/train': 1.5829507112503052} -11/07/2021 02:40:53 - INFO - __main__ - Step 38761: {'lr': 0.00042767498178327047, 'samples': 7442112, 'steps': 38760, 'loss/train': 1.4992541074752808} -11/07/2021 02:40:54 - INFO - __main__ - Step 38762: {'lr': 0.00042767124847362413, 'samples': 7442304, 'steps': 38761, 'loss/train': 1.995751976966858} -11/07/2021 02:40:54 - INFO - __main__ - Step 38763: {'lr': 0.00042766751508392187, 'samples': 7442496, 'steps': 38762, 'loss/train': 1.8400249481201172} -11/07/2021 02:40:54 - INFO - __main__ - Step 38764: {'lr': 0.00042766378161416543, 'samples': 7442688, 'steps': 38763, 'loss/train': 1.5340784788131714} -11/07/2021 02:40:55 - INFO - __main__ - Step 38765: {'lr': 0.00042766004806435643, 'samples': 7442880, 'steps': 38764, 'loss/train': 1.5389777421951294} -11/07/2021 02:40:55 - INFO - __main__ - Step 38766: {'lr': 0.0004276563144344965, 'samples': 7443072, 'steps': 38765, 'loss/train': 1.4644994735717773} -11/07/2021 02:40:56 - INFO - __main__ - Step 38767: {'lr': 0.00042765258072458733, 'samples': 7443264, 'steps': 38766, 'loss/train': 1.8041868209838867} -11/07/2021 02:40:57 - INFO - __main__ - Step 38768: {'lr': 0.00042764884693463075, 'samples': 7443456, 'steps': 38767, 'loss/train': 1.6728705167770386} -11/07/2021 02:40:57 - INFO - __main__ - Step 38769: {'lr': 0.0004276451130646283, 'samples': 7443648, 'steps': 38768, 'loss/train': 1.5693845748901367} -11/07/2021 02:40:57 - INFO - __main__ - Step 38770: {'lr': 0.0004276413791145817, 'samples': 7443840, 'steps': 38769, 'loss/train': 1.5388051271438599} -11/07/2021 02:40:58 - INFO - __main__ - Step 38771: {'lr': 0.00042763764508449263, 'samples': 7444032, 'steps': 38770, 'loss/train': 1.5940831899642944} -11/07/2021 02:40:59 - INFO - __main__ - Step 38772: {'lr': 0.0004276339109743628, 'samples': 7444224, 'steps': 38771, 'loss/train': 1.9035909175872803} -11/07/2021 02:40:59 - INFO - __main__ - Step 38773: {'lr': 0.0004276301767841939, 'samples': 7444416, 'steps': 38772, 'loss/train': 1.301182746887207} -11/07/2021 02:40:59 - INFO - __main__ - Step 38774: {'lr': 0.00042762644251398755, 'samples': 7444608, 'steps': 38773, 'loss/train': 1.6869004964828491} -11/07/2021 02:41:00 - INFO - __main__ - Step 38775: {'lr': 0.0004276227081637454, 'samples': 7444800, 'steps': 38774, 'loss/train': 1.445910930633545} -11/07/2021 02:41:00 - INFO - __main__ - Step 38776: {'lr': 0.00042761897373346923, 'samples': 7444992, 'steps': 38775, 'loss/train': 1.0125514268875122} -11/07/2021 02:41:01 - INFO - __main__ - Step 38777: {'lr': 0.0004276152392231608, 'samples': 7445184, 'steps': 38776, 'loss/train': 1.3907091617584229} -11/07/2021 02:41:02 - INFO - __main__ - Step 38778: {'lr': 0.00042761150463282164, 'samples': 7445376, 'steps': 38777, 'loss/train': 1.4133721590042114} -11/07/2021 02:41:02 - INFO - __main__ - Step 38779: {'lr': 0.0004276077699624534, 'samples': 7445568, 'steps': 38778, 'loss/train': 1.6160264015197754} -11/07/2021 02:41:02 - INFO - __main__ - Step 38780: {'lr': 0.0004276040352120578, 'samples': 7445760, 'steps': 38779, 'loss/train': 1.2119277715682983} -11/07/2021 02:41:03 - INFO - __main__ - Step 38781: {'lr': 0.0004276003003816367, 'samples': 7445952, 'steps': 38780, 'loss/train': 0.9591224193572998} -11/07/2021 02:41:04 - INFO - __main__ - Step 38782: {'lr': 0.0004275965654711916, 'samples': 7446144, 'steps': 38781, 'loss/train': 1.4609408378601074} -11/07/2021 02:41:04 - INFO - __main__ - Step 38783: {'lr': 0.0004275928304807242, 'samples': 7446336, 'steps': 38782, 'loss/train': 1.4006892442703247} -11/07/2021 02:41:04 - INFO - __main__ - Step 38784: {'lr': 0.0004275890954102362, 'samples': 7446528, 'steps': 38783, 'loss/train': 1.4045475721359253} -11/07/2021 02:41:05 - INFO - __main__ - Step 38785: {'lr': 0.0004275853602597294, 'samples': 7446720, 'steps': 38784, 'loss/train': 0.8429235219955444} -11/07/2021 02:41:05 - INFO - __main__ - Step 38786: {'lr': 0.00042758162502920527, 'samples': 7446912, 'steps': 38785, 'loss/train': 1.095483422279358} -11/07/2021 02:41:05 - INFO - __main__ - Step 38787: {'lr': 0.0004275778897186656, 'samples': 7447104, 'steps': 38786, 'loss/train': 1.2157950401306152} -11/07/2021 02:41:06 - INFO - __main__ - Step 38788: {'lr': 0.0004275741543281121, 'samples': 7447296, 'steps': 38787, 'loss/train': 1.3693673610687256} -11/07/2021 02:41:07 - INFO - __main__ - Step 38789: {'lr': 0.0004275704188575464, 'samples': 7447488, 'steps': 38788, 'loss/train': 1.5449576377868652} -11/07/2021 02:41:07 - INFO - __main__ - Step 38790: {'lr': 0.00042756668330697024, 'samples': 7447680, 'steps': 38789, 'loss/train': 1.5498528480529785} -11/07/2021 02:41:07 - INFO - __main__ - Step 38791: {'lr': 0.00042756294767638527, 'samples': 7447872, 'steps': 38790, 'loss/train': 0.6934214234352112} -11/07/2021 02:41:08 - INFO - __main__ - Step 38792: {'lr': 0.00042755921196579316, 'samples': 7448064, 'steps': 38791, 'loss/train': 1.606022596359253} -11/07/2021 02:41:09 - INFO - __main__ - Step 38793: {'lr': 0.0004275554761751956, 'samples': 7448256, 'steps': 38792, 'loss/train': 1.848496437072754} -11/07/2021 02:41:09 - INFO - __main__ - Step 38794: {'lr': 0.0004275517403045943, 'samples': 7448448, 'steps': 38793, 'loss/train': 0.4533573389053345} -11/07/2021 02:41:10 - INFO - __main__ - Step 38795: {'lr': 0.000427548004353991, 'samples': 7448640, 'steps': 38794, 'loss/train': 1.8403584957122803} -11/07/2021 02:41:10 - INFO - __main__ - Step 38796: {'lr': 0.00042754426832338724, 'samples': 7448832, 'steps': 38795, 'loss/train': 1.3824883699417114} -11/07/2021 02:41:10 - INFO - __main__ - Step 38797: {'lr': 0.00042754053221278476, 'samples': 7449024, 'steps': 38796, 'loss/train': 1.9527474641799927} -11/07/2021 02:41:11 - INFO - __main__ - Step 38798: {'lr': 0.0004275367960221853, 'samples': 7449216, 'steps': 38797, 'loss/train': 1.161024808883667} -11/07/2021 02:41:12 - INFO - __main__ - Step 38799: {'lr': 0.0004275330597515904, 'samples': 7449408, 'steps': 38798, 'loss/train': 1.4690824747085571} -11/07/2021 02:41:12 - INFO - __main__ - Step 38800: {'lr': 0.00042752932340100195, 'samples': 7449600, 'steps': 38799, 'loss/train': 1.634828805923462} -11/07/2021 02:41:12 - INFO - __main__ - Step 38801: {'lr': 0.00042752558697042143, 'samples': 7449792, 'steps': 38800, 'loss/train': 1.6765644550323486} -11/07/2021 02:41:13 - INFO - __main__ - Step 38802: {'lr': 0.0004275218504598507, 'samples': 7449984, 'steps': 38801, 'loss/train': 1.7828283309936523} -11/07/2021 02:41:14 - INFO - __main__ - Step 38803: {'lr': 0.0004275181138692914, 'samples': 7450176, 'steps': 38802, 'loss/train': 1.677453875541687} -11/07/2021 02:41:14 - INFO - __main__ - Step 38804: {'lr': 0.0004275143771987451, 'samples': 7450368, 'steps': 38803, 'loss/train': 1.3535674810409546} -11/07/2021 02:41:14 - INFO - __main__ - Step 38805: {'lr': 0.00042751064044821354, 'samples': 7450560, 'steps': 38804, 'loss/train': 1.4613144397735596} -11/07/2021 02:41:15 - INFO - __main__ - Step 38806: {'lr': 0.0004275069036176985, 'samples': 7450752, 'steps': 38805, 'loss/train': 1.706905722618103} -11/07/2021 02:41:15 - INFO - __main__ - Step 38807: {'lr': 0.0004275031667072015, 'samples': 7450944, 'steps': 38806, 'loss/train': 1.6436902284622192} -11/07/2021 02:41:16 - INFO - __main__ - Step 38808: {'lr': 0.0004274994297167244, 'samples': 7451136, 'steps': 38807, 'loss/train': 1.309851884841919} -11/07/2021 02:41:17 - INFO - __main__ - Step 38809: {'lr': 0.00042749569264626875, 'samples': 7451328, 'steps': 38808, 'loss/train': 1.4383822679519653} -11/07/2021 02:41:17 - INFO - __main__ - Step 38810: {'lr': 0.0004274919554958363, 'samples': 7451520, 'steps': 38809, 'loss/train': 1.6340030431747437} -11/07/2021 02:41:17 - INFO - __main__ - Step 38811: {'lr': 0.00042748821826542875, 'samples': 7451712, 'steps': 38810, 'loss/train': 1.627172827720642} -11/07/2021 02:41:18 - INFO - __main__ - Step 38812: {'lr': 0.00042748448095504765, 'samples': 7451904, 'steps': 38811, 'loss/train': 1.35011625289917} -11/07/2021 02:41:18 - INFO - __main__ - Step 38813: {'lr': 0.0004274807435646948, 'samples': 7452096, 'steps': 38812, 'loss/train': 1.7396658658981323} -11/07/2021 02:41:19 - INFO - __main__ - Step 38814: {'lr': 0.0004274770060943719, 'samples': 7452288, 'steps': 38813, 'loss/train': 5.9485344886779785} -11/07/2021 02:41:19 - INFO - __main__ - Step 38815: {'lr': 0.00042747326854408063, 'samples': 7452480, 'steps': 38814, 'loss/train': 1.7223875522613525} -11/07/2021 02:41:20 - INFO - __main__ - Step 38816: {'lr': 0.00042746953091382254, 'samples': 7452672, 'steps': 38815, 'loss/train': 1.614368200302124} -11/07/2021 02:41:20 - INFO - __main__ - Step 38817: {'lr': 0.00042746579320359956, 'samples': 7452864, 'steps': 38816, 'loss/train': 1.5527185201644897} -11/07/2021 02:41:21 - INFO - __main__ - Step 38818: {'lr': 0.00042746205541341315, 'samples': 7453056, 'steps': 38817, 'loss/train': 1.6299482583999634} -11/07/2021 02:41:22 - INFO - __main__ - Step 38819: {'lr': 0.0004274583175432651, 'samples': 7453248, 'steps': 38818, 'loss/train': 1.170392632484436} -11/07/2021 02:41:22 - INFO - __main__ - Step 38820: {'lr': 0.000427454579593157, 'samples': 7453440, 'steps': 38819, 'loss/train': 1.6622440814971924} -11/07/2021 02:41:23 - INFO - __main__ - Step 38821: {'lr': 0.00042745084156309065, 'samples': 7453632, 'steps': 38820, 'loss/train': 1.4594944715499878} -11/07/2021 02:41:23 - INFO - __main__ - Step 38822: {'lr': 0.00042744710345306774, 'samples': 7453824, 'steps': 38821, 'loss/train': 1.780123233795166} -11/07/2021 02:41:23 - INFO - __main__ - Step 38823: {'lr': 0.00042744336526308986, 'samples': 7454016, 'steps': 38822, 'loss/train': 1.5132795572280884} -11/07/2021 02:41:24 - INFO - __main__ - Step 38824: {'lr': 0.0004274396269931587, 'samples': 7454208, 'steps': 38823, 'loss/train': 1.9288641214370728} -11/07/2021 02:41:25 - INFO - __main__ - Step 38825: {'lr': 0.0004274358886432761, 'samples': 7454400, 'steps': 38824, 'loss/train': 1.3878891468048096} -11/07/2021 02:41:25 - INFO - __main__ - Step 38826: {'lr': 0.0004274321502134435, 'samples': 7454592, 'steps': 38825, 'loss/train': 1.3130568265914917} -11/07/2021 02:41:25 - INFO - __main__ - Step 38827: {'lr': 0.00042742841170366274, 'samples': 7454784, 'steps': 38826, 'loss/train': 1.8139756917953491} -11/07/2021 02:41:26 - INFO - __main__ - Step 38828: {'lr': 0.0004274246731139355, 'samples': 7454976, 'steps': 38827, 'loss/train': 1.597933292388916} -11/07/2021 02:41:26 - INFO - __main__ - Step 38829: {'lr': 0.0004274209344442634, 'samples': 7455168, 'steps': 38828, 'loss/train': 1.1701526641845703} -11/07/2021 02:41:27 - INFO - __main__ - Step 38830: {'lr': 0.00042741719569464834, 'samples': 7455360, 'steps': 38829, 'loss/train': 1.382586121559143} -11/07/2021 02:41:27 - INFO - __main__ - Step 38831: {'lr': 0.0004274134568650916, 'samples': 7455552, 'steps': 38830, 'loss/train': 1.5133731365203857} -11/07/2021 02:41:28 - INFO - __main__ - Step 38832: {'lr': 0.00042740971795559527, 'samples': 7455744, 'steps': 38831, 'loss/train': 1.5364069938659668} -11/07/2021 02:41:28 - INFO - __main__ - Step 38833: {'lr': 0.00042740597896616075, 'samples': 7455936, 'steps': 38832, 'loss/train': 1.4677929878234863} -11/07/2021 02:41:29 - INFO - __main__ - Step 38834: {'lr': 0.00042740223989678984, 'samples': 7456128, 'steps': 38833, 'loss/train': 1.2758821249008179} -11/07/2021 02:41:29 - INFO - __main__ - Step 38835: {'lr': 0.0004273985007474842, 'samples': 7456320, 'steps': 38834, 'loss/train': 1.6179077625274658} -11/07/2021 02:41:30 - INFO - __main__ - Step 38836: {'lr': 0.00042739476151824565, 'samples': 7456512, 'steps': 38835, 'loss/train': 0.5692052245140076} -11/07/2021 02:41:30 - INFO - __main__ - Step 38837: {'lr': 0.00042739102220907567, 'samples': 7456704, 'steps': 38836, 'loss/train': 1.2258596420288086} -11/07/2021 02:41:31 - INFO - __main__ - Step 38838: {'lr': 0.000427387282819976, 'samples': 7456896, 'steps': 38837, 'loss/train': 1.7110847234725952} -11/07/2021 02:41:31 - INFO - __main__ - Step 38839: {'lr': 0.0004273835433509484, 'samples': 7457088, 'steps': 38838, 'loss/train': 1.5911930799484253} -11/07/2021 02:41:31 - INFO - __main__ - Step 38840: {'lr': 0.0004273798038019945, 'samples': 7457280, 'steps': 38839, 'loss/train': 1.5180996656417847} -11/07/2021 02:41:32 - INFO - __main__ - Step 38841: {'lr': 0.000427376064173116, 'samples': 7457472, 'steps': 38840, 'loss/train': 1.6930204629898071} -11/07/2021 02:41:33 - INFO - __main__ - Step 38842: {'lr': 0.0004273723244643146, 'samples': 7457664, 'steps': 38841, 'loss/train': 1.7402244806289673} -11/07/2021 02:41:33 - INFO - __main__ - Step 38843: {'lr': 0.000427368584675592, 'samples': 7457856, 'steps': 38842, 'loss/train': 1.8798352479934692} -11/07/2021 02:41:33 - INFO - __main__ - Step 38844: {'lr': 0.0004273648448069498, 'samples': 7458048, 'steps': 38843, 'loss/train': 1.5837422609329224} -11/07/2021 02:41:34 - INFO - __main__ - Step 38845: {'lr': 0.00042736110485838973, 'samples': 7458240, 'steps': 38844, 'loss/train': 1.194349765777588} -11/07/2021 02:41:35 - INFO - __main__ - Step 38846: {'lr': 0.0004273573648299135, 'samples': 7458432, 'steps': 38845, 'loss/train': 1.6953762769699097} -11/07/2021 02:41:35 - INFO - __main__ - Step 38847: {'lr': 0.0004273536247215227, 'samples': 7458624, 'steps': 38846, 'loss/train': 2.0758681297302246} -11/07/2021 02:41:36 - INFO - __main__ - Step 38848: {'lr': 0.00042734988453321923, 'samples': 7458816, 'steps': 38847, 'loss/train': 1.132045030593872} -11/07/2021 02:41:36 - INFO - __main__ - Step 38849: {'lr': 0.0004273461442650046, 'samples': 7459008, 'steps': 38848, 'loss/train': 1.5473262071609497} -11/07/2021 02:41:36 - INFO - __main__ - Step 38850: {'lr': 0.0004273424039168805, 'samples': 7459200, 'steps': 38849, 'loss/train': 1.733851671218872} -11/07/2021 02:41:37 - INFO - __main__ - Step 38851: {'lr': 0.00042733866348884864, 'samples': 7459392, 'steps': 38850, 'loss/train': 1.4504001140594482} -11/07/2021 02:41:38 - INFO - __main__ - Step 38852: {'lr': 0.0004273349229809108, 'samples': 7459584, 'steps': 38851, 'loss/train': 1.7992230653762817} -11/07/2021 02:41:38 - INFO - __main__ - Step 38853: {'lr': 0.00042733118239306845, 'samples': 7459776, 'steps': 38852, 'loss/train': 1.5601048469543457} -11/07/2021 02:41:38 - INFO - __main__ - Step 38854: {'lr': 0.0004273274417253235, 'samples': 7459968, 'steps': 38853, 'loss/train': 1.4414904117584229} -11/07/2021 02:41:39 - INFO - __main__ - Step 38855: {'lr': 0.00042732370097767756, 'samples': 7460160, 'steps': 38854, 'loss/train': 1.7437254190444946} -11/07/2021 02:41:39 - INFO - __main__ - Step 38856: {'lr': 0.0004273199601501322, 'samples': 7460352, 'steps': 38855, 'loss/train': 1.7385590076446533} -11/07/2021 02:41:40 - INFO - __main__ - Step 38857: {'lr': 0.0004273162192426893, 'samples': 7460544, 'steps': 38856, 'loss/train': 1.4456984996795654} -11/07/2021 02:41:41 - INFO - __main__ - Step 38858: {'lr': 0.00042731247825535037, 'samples': 7460736, 'steps': 38857, 'loss/train': 1.4588637351989746} -11/07/2021 02:41:41 - INFO - __main__ - Step 38859: {'lr': 0.00042730873718811724, 'samples': 7460928, 'steps': 38858, 'loss/train': 1.9591647386550903} -11/07/2021 02:41:41 - INFO - __main__ - Step 38860: {'lr': 0.0004273049960409915, 'samples': 7461120, 'steps': 38859, 'loss/train': 1.8021929264068604} -11/07/2021 02:41:42 - INFO - __main__ - Step 38861: {'lr': 0.00042730125481397487, 'samples': 7461312, 'steps': 38860, 'loss/train': 1.1760722398757935} -11/07/2021 02:41:43 - INFO - __main__ - Step 38862: {'lr': 0.00042729751350706905, 'samples': 7461504, 'steps': 38861, 'loss/train': 1.177544116973877} -11/07/2021 02:41:43 - INFO - __main__ - Step 38863: {'lr': 0.00042729377212027557, 'samples': 7461696, 'steps': 38862, 'loss/train': 1.1901837587356567} -11/07/2021 02:41:44 - INFO - __main__ - Step 38864: {'lr': 0.0004272900306535964, 'samples': 7461888, 'steps': 38863, 'loss/train': 1.6480708122253418} -11/07/2021 02:41:44 - INFO - __main__ - Step 38865: {'lr': 0.00042728628910703305, 'samples': 7462080, 'steps': 38864, 'loss/train': 2.429159164428711} -11/07/2021 02:41:44 - INFO - __main__ - Step 38866: {'lr': 0.0004272825474805872, 'samples': 7462272, 'steps': 38865, 'loss/train': 1.8162816762924194} -11/07/2021 02:41:45 - INFO - __main__ - Step 38867: {'lr': 0.0004272788057742606, 'samples': 7462464, 'steps': 38866, 'loss/train': 1.9516806602478027} -11/07/2021 02:41:46 - INFO - __main__ - Step 38868: {'lr': 0.0004272750639880549, 'samples': 7462656, 'steps': 38867, 'loss/train': 0.7387398481369019} -11/07/2021 02:41:46 - INFO - __main__ - Step 38869: {'lr': 0.0004272713221219718, 'samples': 7462848, 'steps': 38868, 'loss/train': 1.3881351947784424} -11/07/2021 02:41:46 - INFO - __main__ - Step 38870: {'lr': 0.00042726758017601297, 'samples': 7463040, 'steps': 38869, 'loss/train': 1.5700926780700684} -11/07/2021 02:41:47 - INFO - __main__ - Step 38871: {'lr': 0.00042726383815018006, 'samples': 7463232, 'steps': 38870, 'loss/train': 1.3037258386611938} -11/07/2021 02:41:48 - INFO - __main__ - Step 38872: {'lr': 0.00042726009604447484, 'samples': 7463424, 'steps': 38871, 'loss/train': 1.5725196599960327} -11/07/2021 02:41:49 - INFO - __main__ - Step 38873: {'lr': 0.00042725635385889893, 'samples': 7463616, 'steps': 38872, 'loss/train': 1.7052489519119263} -11/07/2021 02:41:49 - INFO - __main__ - Step 38874: {'lr': 0.0004272526115934541, 'samples': 7463808, 'steps': 38873, 'loss/train': 1.9589136838912964} -11/07/2021 02:41:49 - INFO - __main__ - Step 38875: {'lr': 0.0004272488692481419, 'samples': 7464000, 'steps': 38874, 'loss/train': 1.8079824447631836} -11/07/2021 02:41:50 - INFO - __main__ - Step 38876: {'lr': 0.00042724512682296416, 'samples': 7464192, 'steps': 38875, 'loss/train': 1.7487462759017944} -11/07/2021 02:41:50 - INFO - __main__ - Step 38877: {'lr': 0.00042724138431792245, 'samples': 7464384, 'steps': 38876, 'loss/train': 0.17262661457061768} -11/07/2021 02:41:50 - INFO - __main__ - Step 38878: {'lr': 0.0004272376417330186, 'samples': 7464576, 'steps': 38877, 'loss/train': 1.7479337453842163} -11/07/2021 02:41:51 - INFO - __main__ - Step 38879: {'lr': 0.00042723389906825415, 'samples': 7464768, 'steps': 38878, 'loss/train': 1.7263894081115723} -11/07/2021 02:41:52 - INFO - __main__ - Step 38880: {'lr': 0.0004272301563236308, 'samples': 7464960, 'steps': 38879, 'loss/train': 1.2034226655960083} -11/07/2021 02:41:52 - INFO - __main__ - Step 38881: {'lr': 0.0004272264134991503, 'samples': 7465152, 'steps': 38880, 'loss/train': 1.4417294263839722} -11/07/2021 02:41:52 - INFO - __main__ - Step 38882: {'lr': 0.0004272226705948143, 'samples': 7465344, 'steps': 38881, 'loss/train': 0.8323983550071716} -11/07/2021 02:41:53 - INFO - __main__ - Step 38883: {'lr': 0.00042721892761062453, 'samples': 7465536, 'steps': 38882, 'loss/train': 1.609955906867981} -11/07/2021 02:41:54 - INFO - __main__ - Step 38884: {'lr': 0.00042721518454658265, 'samples': 7465728, 'steps': 38883, 'loss/train': 1.783393383026123} -11/07/2021 02:41:54 - INFO - __main__ - Step 38885: {'lr': 0.0004272114414026903, 'samples': 7465920, 'steps': 38884, 'loss/train': 1.819656252861023} -11/07/2021 02:41:54 - INFO - __main__ - Step 38886: {'lr': 0.00042720769817894926, 'samples': 7466112, 'steps': 38885, 'loss/train': 1.1744916439056396} -11/07/2021 02:41:55 - INFO - __main__ - Step 38887: {'lr': 0.00042720395487536115, 'samples': 7466304, 'steps': 38886, 'loss/train': 2.7242424488067627} -11/07/2021 02:41:55 - INFO - __main__ - Step 38888: {'lr': 0.0004272002114919277, 'samples': 7466496, 'steps': 38887, 'loss/train': 0.7330546379089355} -11/07/2021 02:41:56 - INFO - __main__ - Step 38889: {'lr': 0.0004271964680286505, 'samples': 7466688, 'steps': 38888, 'loss/train': 0.8956628441810608} -11/07/2021 02:41:57 - INFO - __main__ - Step 38890: {'lr': 0.00042719272448553137, 'samples': 7466880, 'steps': 38889, 'loss/train': 1.526174783706665} -11/07/2021 02:41:57 - INFO - __main__ - Step 38891: {'lr': 0.00042718898086257183, 'samples': 7467072, 'steps': 38890, 'loss/train': 1.5497913360595703} -11/07/2021 02:41:57 - INFO - __main__ - Step 38892: {'lr': 0.0004271852371597738, 'samples': 7467264, 'steps': 38891, 'loss/train': 1.5525308847427368} -11/07/2021 02:41:58 - INFO - __main__ - Step 38893: {'lr': 0.00042718149337713873, 'samples': 7467456, 'steps': 38892, 'loss/train': 1.6520709991455078} -11/07/2021 02:41:59 - INFO - __main__ - Step 38894: {'lr': 0.0004271777495146685, 'samples': 7467648, 'steps': 38893, 'loss/train': 1.3811542987823486} -11/07/2021 02:41:59 - INFO - __main__ - Step 38895: {'lr': 0.00042717400557236467, 'samples': 7467840, 'steps': 38894, 'loss/train': 1.4010035991668701} -11/07/2021 02:41:59 - INFO - __main__ - Step 38896: {'lr': 0.000427170261550229, 'samples': 7468032, 'steps': 38895, 'loss/train': 1.5982306003570557} -11/07/2021 02:42:00 - INFO - __main__ - Step 38897: {'lr': 0.0004271665174482631, 'samples': 7468224, 'steps': 38896, 'loss/train': 1.3285613059997559} -11/07/2021 02:42:00 - INFO - __main__ - Step 38898: {'lr': 0.0004271627732664687, 'samples': 7468416, 'steps': 38897, 'loss/train': 0.915793776512146} -11/07/2021 02:42:01 - INFO - __main__ - Step 38899: {'lr': 0.0004271590290048475, 'samples': 7468608, 'steps': 38898, 'loss/train': 1.3674812316894531} -11/07/2021 02:42:01 - INFO - __main__ - Step 38900: {'lr': 0.00042715528466340117, 'samples': 7468800, 'steps': 38899, 'loss/train': 1.742058515548706} -11/07/2021 02:42:02 - INFO - __main__ - Step 38901: {'lr': 0.00042715154024213143, 'samples': 7468992, 'steps': 38900, 'loss/train': 1.2003147602081299} -11/07/2021 02:42:02 - INFO - __main__ - Step 38902: {'lr': 0.0004271477957410399, 'samples': 7469184, 'steps': 38901, 'loss/train': 1.4027563333511353} -11/07/2021 02:42:02 - INFO - __main__ - Step 38903: {'lr': 0.00042714405116012834, 'samples': 7469376, 'steps': 38902, 'loss/train': 1.6637219190597534} -11/07/2021 02:42:04 - INFO - __main__ - Step 38904: {'lr': 0.0004271403064993984, 'samples': 7469568, 'steps': 38903, 'loss/train': 1.1860729455947876} -11/07/2021 02:42:04 - INFO - __main__ - Step 38905: {'lr': 0.00042713656175885173, 'samples': 7469760, 'steps': 38904, 'loss/train': 1.5975831747055054} -11/07/2021 02:42:05 - INFO - __main__ - Step 38906: {'lr': 0.00042713281693849015, 'samples': 7469952, 'steps': 38905, 'loss/train': 0.8513796925544739} -11/07/2021 02:42:05 - INFO - __main__ - Step 38907: {'lr': 0.0004271290720383152, 'samples': 7470144, 'steps': 38906, 'loss/train': 1.9151580333709717} -11/07/2021 02:42:05 - INFO - __main__ - Step 38908: {'lr': 0.00042712532705832865, 'samples': 7470336, 'steps': 38907, 'loss/train': 1.497770071029663} -11/07/2021 02:42:06 - INFO - __main__ - Step 38909: {'lr': 0.0004271215819985321, 'samples': 7470528, 'steps': 38908, 'loss/train': 0.600193202495575} -11/07/2021 02:42:07 - INFO - __main__ - Step 38910: {'lr': 0.0004271178368589273, 'samples': 7470720, 'steps': 38909, 'loss/train': 1.7031151056289673} -11/07/2021 02:42:07 - INFO - __main__ - Step 38911: {'lr': 0.000427114091639516, 'samples': 7470912, 'steps': 38910, 'loss/train': 0.9450470209121704} -11/07/2021 02:42:08 - INFO - __main__ - Step 38912: {'lr': 0.0004271103463402998, 'samples': 7471104, 'steps': 38911, 'loss/train': 1.601342797279358} -11/07/2021 02:42:08 - INFO - __main__ - Step 38913: {'lr': 0.0004271066009612804, 'samples': 7471296, 'steps': 38912, 'loss/train': 1.6177656650543213} -11/07/2021 02:42:08 - INFO - __main__ - Step 38914: {'lr': 0.0004271028555024594, 'samples': 7471488, 'steps': 38913, 'loss/train': 1.7592273950576782} -11/07/2021 02:42:10 - INFO - __main__ - Step 38915: {'lr': 0.0004270991099638387, 'samples': 7471680, 'steps': 38914, 'loss/train': 0.23037822544574738} -11/07/2021 02:42:10 - INFO - __main__ - Step 38916: {'lr': 0.0004270953643454199, 'samples': 7471872, 'steps': 38915, 'loss/train': 1.353023886680603} -11/07/2021 02:42:10 - INFO - __main__ - Step 38917: {'lr': 0.0004270916186472046, 'samples': 7472064, 'steps': 38916, 'loss/train': 0.954717218875885} -11/07/2021 02:42:11 - INFO - __main__ - Step 38918: {'lr': 0.0004270878728691946, 'samples': 7472256, 'steps': 38917, 'loss/train': 1.196390151977539} -11/07/2021 02:42:11 - INFO - __main__ - Step 38919: {'lr': 0.00042708412701139147, 'samples': 7472448, 'steps': 38918, 'loss/train': 1.3688315153121948} -11/07/2021 02:42:13 - INFO - __main__ - Step 38920: {'lr': 0.000427080381073797, 'samples': 7472640, 'steps': 38919, 'loss/train': 1.7761547565460205} -11/07/2021 02:42:13 - INFO - __main__ - Step 38921: {'lr': 0.00042707663505641287, 'samples': 7472832, 'steps': 38920, 'loss/train': 1.8193520307540894} -11/07/2021 02:42:13 - INFO - __main__ - Step 38922: {'lr': 0.00042707288895924066, 'samples': 7473024, 'steps': 38921, 'loss/train': 1.3390640020370483} -11/07/2021 02:42:14 - INFO - __main__ - Step 38923: {'lr': 0.0004270691427822823, 'samples': 7473216, 'steps': 38922, 'loss/train': 1.3779325485229492} -11/07/2021 02:42:14 - INFO - __main__ - Step 38924: {'lr': 0.0004270653965255391, 'samples': 7473408, 'steps': 38923, 'loss/train': 1.0960659980773926} -11/07/2021 02:42:14 - INFO - __main__ - Step 38925: {'lr': 0.0004270616501890131, 'samples': 7473600, 'steps': 38924, 'loss/train': 1.1420000791549683} -11/07/2021 02:42:15 - INFO - __main__ - Step 38926: {'lr': 0.0004270579037727058, 'samples': 7473792, 'steps': 38925, 'loss/train': 0.8926109075546265} -11/07/2021 02:42:15 - INFO - __main__ - Step 38927: {'lr': 0.000427054157276619, 'samples': 7473984, 'steps': 38926, 'loss/train': 1.9323151111602783} -11/07/2021 02:42:16 - INFO - __main__ - Step 38928: {'lr': 0.00042705041070075433, 'samples': 7474176, 'steps': 38927, 'loss/train': 0.7841858863830566} -11/07/2021 02:42:17 - INFO - __main__ - Step 38929: {'lr': 0.00042704666404511343, 'samples': 7474368, 'steps': 38928, 'loss/train': 1.7835983037948608} -11/07/2021 02:42:17 - INFO - __main__ - Step 38930: {'lr': 0.000427042917309698, 'samples': 7474560, 'steps': 38929, 'loss/train': 1.7741930484771729} -11/07/2021 02:42:17 - INFO - __main__ - Step 38931: {'lr': 0.00042703917049450983, 'samples': 7474752, 'steps': 38930, 'loss/train': 1.5438940525054932} -11/07/2021 02:42:18 - INFO - __main__ - Step 38932: {'lr': 0.0004270354235995505, 'samples': 7474944, 'steps': 38931, 'loss/train': 1.4355179071426392} -11/07/2021 02:42:19 - INFO - __main__ - Step 38933: {'lr': 0.0004270316766248218, 'samples': 7475136, 'steps': 38932, 'loss/train': 1.6149401664733887} -11/07/2021 02:42:19 - INFO - __main__ - Step 38934: {'lr': 0.0004270279295703253, 'samples': 7475328, 'steps': 38933, 'loss/train': 1.5284372568130493} -11/07/2021 02:42:19 - INFO - __main__ - Step 38935: {'lr': 0.00042702418243606275, 'samples': 7475520, 'steps': 38934, 'loss/train': 1.5661935806274414} -11/07/2021 02:42:20 - INFO - __main__ - Step 38936: {'lr': 0.00042702043522203594, 'samples': 7475712, 'steps': 38935, 'loss/train': 1.6040937900543213} -11/07/2021 02:42:20 - INFO - __main__ - Step 38937: {'lr': 0.00042701668792824633, 'samples': 7475904, 'steps': 38936, 'loss/train': 1.6600172519683838} -11/07/2021 02:42:21 - INFO - __main__ - Step 38938: {'lr': 0.00042701294055469576, 'samples': 7476096, 'steps': 38937, 'loss/train': 1.6687569618225098} -11/07/2021 02:42:21 - INFO - __main__ - Step 38939: {'lr': 0.0004270091931013859, 'samples': 7476288, 'steps': 38938, 'loss/train': 1.7354636192321777} -11/07/2021 02:42:22 - INFO - __main__ - Step 38940: {'lr': 0.00042700544556831846, 'samples': 7476480, 'steps': 38939, 'loss/train': 1.436832308769226} -11/07/2021 02:42:22 - INFO - __main__ - Step 38941: {'lr': 0.00042700169795549504, 'samples': 7476672, 'steps': 38940, 'loss/train': 1.759921669960022} -11/07/2021 02:42:23 - INFO - __main__ - Step 38942: {'lr': 0.00042699795026291743, 'samples': 7476864, 'steps': 38941, 'loss/train': 2.0764222145080566} -11/07/2021 02:42:24 - INFO - __main__ - Step 38943: {'lr': 0.0004269942024905872, 'samples': 7477056, 'steps': 38942, 'loss/train': 1.6727497577667236} -11/07/2021 02:42:24 - INFO - __main__ - Step 38944: {'lr': 0.00042699045463850623, 'samples': 7477248, 'steps': 38943, 'loss/train': 1.5481544733047485} -11/07/2021 02:42:25 - INFO - __main__ - Step 38945: {'lr': 0.000426986706706676, 'samples': 7477440, 'steps': 38944, 'loss/train': 1.027152180671692} -11/07/2021 02:42:25 - INFO - __main__ - Step 38946: {'lr': 0.00042698295869509836, 'samples': 7477632, 'steps': 38945, 'loss/train': 1.5602725744247437} -11/07/2021 02:42:25 - INFO - __main__ - Step 38947: {'lr': 0.0004269792106037749, 'samples': 7477824, 'steps': 38946, 'loss/train': 0.6573772430419922} -11/07/2021 02:42:26 - INFO - __main__ - Step 38948: {'lr': 0.0004269754624327073, 'samples': 7478016, 'steps': 38947, 'loss/train': 2.1020119190216064} -11/07/2021 02:42:27 - INFO - __main__ - Step 38949: {'lr': 0.0004269717141818973, 'samples': 7478208, 'steps': 38948, 'loss/train': 1.3972387313842773} -11/07/2021 02:42:27 - INFO - __main__ - Step 38950: {'lr': 0.0004269679658513466, 'samples': 7478400, 'steps': 38949, 'loss/train': 1.495678186416626} -11/07/2021 02:42:27 - INFO - __main__ - Step 38951: {'lr': 0.00042696421744105686, 'samples': 7478592, 'steps': 38950, 'loss/train': 1.2925618886947632} -11/07/2021 02:42:28 - INFO - __main__ - Step 38952: {'lr': 0.0004269604689510298, 'samples': 7478784, 'steps': 38951, 'loss/train': 2.0521535873413086} -11/07/2021 02:42:28 - INFO - __main__ - Step 38953: {'lr': 0.0004269567203812671, 'samples': 7478976, 'steps': 38952, 'loss/train': 1.5479966402053833} -11/07/2021 02:42:29 - INFO - __main__ - Step 38954: {'lr': 0.00042695297173177033, 'samples': 7479168, 'steps': 38953, 'loss/train': 0.9544076919555664} -11/07/2021 02:42:30 - INFO - __main__ - Step 38955: {'lr': 0.0004269492230025413, 'samples': 7479360, 'steps': 38954, 'loss/train': 1.1891474723815918} -11/07/2021 02:42:30 - INFO - __main__ - Step 38956: {'lr': 0.0004269454741935818, 'samples': 7479552, 'steps': 38955, 'loss/train': 1.60728919506073} -11/07/2021 02:42:30 - INFO - __main__ - Step 38957: {'lr': 0.00042694172530489326, 'samples': 7479744, 'steps': 38956, 'loss/train': 1.171259880065918} -11/07/2021 02:42:31 - INFO - __main__ - Step 38958: {'lr': 0.00042693797633647755, 'samples': 7479936, 'steps': 38957, 'loss/train': 1.6915109157562256} -11/07/2021 02:42:32 - INFO - __main__ - Step 38959: {'lr': 0.00042693422728833644, 'samples': 7480128, 'steps': 38958, 'loss/train': 1.4069545269012451} -11/07/2021 02:42:32 - INFO - __main__ - Step 38960: {'lr': 0.00042693047816047135, 'samples': 7480320, 'steps': 38959, 'loss/train': 1.5176678895950317} -11/07/2021 02:42:32 - INFO - __main__ - Step 38961: {'lr': 0.0004269267289528842, 'samples': 7480512, 'steps': 38960, 'loss/train': 2.151459217071533} -11/07/2021 02:42:33 - INFO - __main__ - Step 38962: {'lr': 0.00042692297966557657, 'samples': 7480704, 'steps': 38961, 'loss/train': 1.3303264379501343} -11/07/2021 02:42:33 - INFO - __main__ - Step 38963: {'lr': 0.0004269192302985502, 'samples': 7480896, 'steps': 38962, 'loss/train': 1.3381013870239258} -11/07/2021 02:42:34 - INFO - __main__ - Step 38964: {'lr': 0.00042691548085180666, 'samples': 7481088, 'steps': 38963, 'loss/train': 1.6442064046859741} -11/07/2021 02:42:34 - INFO - __main__ - Step 38965: {'lr': 0.00042691173132534775, 'samples': 7481280, 'steps': 38964, 'loss/train': 1.4329073429107666} -11/07/2021 02:42:35 - INFO - __main__ - Step 38966: {'lr': 0.0004269079817191752, 'samples': 7481472, 'steps': 38965, 'loss/train': 1.486147403717041} -11/07/2021 02:42:35 - INFO - __main__ - Step 38967: {'lr': 0.00042690423203329067, 'samples': 7481664, 'steps': 38966, 'loss/train': 1.5373287200927734} -11/07/2021 02:42:35 - INFO - __main__ - Step 38968: {'lr': 0.0004269004822676958, 'samples': 7481856, 'steps': 38967, 'loss/train': 1.4226380586624146} -11/07/2021 02:42:37 - INFO - __main__ - Step 38969: {'lr': 0.0004268967324223922, 'samples': 7482048, 'steps': 38968, 'loss/train': 1.3333868980407715} -11/07/2021 02:42:37 - INFO - __main__ - Step 38970: {'lr': 0.00042689298249738185, 'samples': 7482240, 'steps': 38969, 'loss/train': 0.6204865574836731} -11/07/2021 02:42:37 - INFO - __main__ - Step 38971: {'lr': 0.00042688923249266614, 'samples': 7482432, 'steps': 38970, 'loss/train': 1.3735517263412476} -11/07/2021 02:42:38 - INFO - __main__ - Step 38972: {'lr': 0.00042688548240824687, 'samples': 7482624, 'steps': 38971, 'loss/train': 1.390674114227295} -11/07/2021 02:42:38 - INFO - __main__ - Step 38973: {'lr': 0.00042688173224412573, 'samples': 7482816, 'steps': 38972, 'loss/train': 1.1444605588912964} -11/07/2021 02:42:39 - INFO - __main__ - Step 38974: {'lr': 0.00042687798200030446, 'samples': 7483008, 'steps': 38973, 'loss/train': 1.1193890571594238} -11/07/2021 02:42:39 - INFO - __main__ - Step 38975: {'lr': 0.00042687423167678463, 'samples': 7483200, 'steps': 38974, 'loss/train': 1.9068354368209839} -11/07/2021 02:42:40 - INFO - __main__ - Step 38976: {'lr': 0.0004268704812735681, 'samples': 7483392, 'steps': 38975, 'loss/train': 1.6004170179367065} -11/07/2021 02:42:40 - INFO - __main__ - Step 38977: {'lr': 0.00042686673079065637, 'samples': 7483584, 'steps': 38976, 'loss/train': 1.358608603477478} -11/07/2021 02:42:40 - INFO - __main__ - Step 38978: {'lr': 0.00042686298022805126, 'samples': 7483776, 'steps': 38977, 'loss/train': 1.4833357334136963} -11/07/2021 02:42:41 - INFO - __main__ - Step 38979: {'lr': 0.0004268592295857544, 'samples': 7483968, 'steps': 38978, 'loss/train': 1.4220755100250244} -11/07/2021 02:42:42 - INFO - __main__ - Step 38980: {'lr': 0.0004268554788637675, 'samples': 7484160, 'steps': 38979, 'loss/train': 1.1065647602081299} -11/07/2021 02:42:42 - INFO - __main__ - Step 38981: {'lr': 0.0004268517280620923, 'samples': 7484352, 'steps': 38980, 'loss/train': 1.544353723526001} -11/07/2021 02:42:42 - INFO - __main__ - Step 38982: {'lr': 0.0004268479771807303, 'samples': 7484544, 'steps': 38981, 'loss/train': 1.8099292516708374} -11/07/2021 02:42:43 - INFO - __main__ - Step 38983: {'lr': 0.00042684422621968346, 'samples': 7484736, 'steps': 38982, 'loss/train': 2.324009418487549} -11/07/2021 02:42:43 - INFO - __main__ - Step 38984: {'lr': 0.0004268404751789533, 'samples': 7484928, 'steps': 38983, 'loss/train': 1.7545044422149658} -11/07/2021 02:42:44 - INFO - __main__ - Step 38985: {'lr': 0.0004268367240585416, 'samples': 7485120, 'steps': 38984, 'loss/train': 1.7155299186706543} -11/07/2021 02:42:44 - INFO - __main__ - Step 38986: {'lr': 0.0004268329728584499, 'samples': 7485312, 'steps': 38985, 'loss/train': 1.4670684337615967} -11/07/2021 02:42:45 - INFO - __main__ - Step 38987: {'lr': 0.0004268292215786801, 'samples': 7485504, 'steps': 38986, 'loss/train': 1.6708879470825195} -11/07/2021 02:42:45 - INFO - __main__ - Step 38988: {'lr': 0.0004268254702192337, 'samples': 7485696, 'steps': 38987, 'loss/train': 1.7074424028396606} -11/07/2021 02:42:45 - INFO - __main__ - Step 38989: {'lr': 0.00042682171878011255, 'samples': 7485888, 'steps': 38988, 'loss/train': 1.547581672668457} -11/07/2021 02:42:47 - INFO - __main__ - Step 38990: {'lr': 0.00042681796726131815, 'samples': 7486080, 'steps': 38989, 'loss/train': 0.6456459760665894} -11/07/2021 02:42:47 - INFO - __main__ - Step 38991: {'lr': 0.0004268142156628524, 'samples': 7486272, 'steps': 38990, 'loss/train': 1.5809472799301147} -11/07/2021 02:42:47 - INFO - __main__ - Step 38992: {'lr': 0.00042681046398471693, 'samples': 7486464, 'steps': 38991, 'loss/train': 1.6774481534957886} -11/07/2021 02:42:48 - INFO - __main__ - Step 38993: {'lr': 0.00042680671222691325, 'samples': 7486656, 'steps': 38992, 'loss/train': 1.2868596315383911} -11/07/2021 02:42:48 - INFO - __main__ - Step 38994: {'lr': 0.0004268029603894433, 'samples': 7486848, 'steps': 38993, 'loss/train': 1.7931604385375977} -11/07/2021 02:42:49 - INFO - __main__ - Step 38995: {'lr': 0.00042679920847230865, 'samples': 7487040, 'steps': 38994, 'loss/train': 1.3785682916641235} -11/07/2021 02:42:49 - INFO - __main__ - Step 38996: {'lr': 0.000426795456475511, 'samples': 7487232, 'steps': 38995, 'loss/train': 1.4442554712295532} -11/07/2021 02:42:50 - INFO - __main__ - Step 38997: {'lr': 0.00042679170439905204, 'samples': 7487424, 'steps': 38996, 'loss/train': 1.5359501838684082} -11/07/2021 02:42:50 - INFO - __main__ - Step 38998: {'lr': 0.0004267879522429334, 'samples': 7487616, 'steps': 38997, 'loss/train': 1.2817848920822144} -11/07/2021 02:42:50 - INFO - __main__ - Step 38999: {'lr': 0.00042678420000715687, 'samples': 7487808, 'steps': 38998, 'loss/train': 1.5414429903030396} -11/07/2021 02:42:52 - INFO - __main__ - Step 39000: {'lr': 0.0004267804476917242, 'samples': 7488000, 'steps': 38999, 'loss/train': 1.793521761894226} -11/07/2021 02:42:52 - INFO - __main__ - Step 39001: {'lr': 0.00042677669529663686, 'samples': 7488192, 'steps': 39000, 'loss/train': 1.7577154636383057} -11/07/2021 02:42:52 - INFO - __main__ - Step 39002: {'lr': 0.0004267729428218968, 'samples': 7488384, 'steps': 39001, 'loss/train': 1.4497911930084229} -11/07/2021 02:42:53 - INFO - __main__ - Step 39003: {'lr': 0.0004267691902675055, 'samples': 7488576, 'steps': 39002, 'loss/train': 1.7540159225463867} -11/07/2021 02:42:53 - INFO - __main__ - Step 39004: {'lr': 0.0004267654376334647, 'samples': 7488768, 'steps': 39003, 'loss/train': 1.9711253643035889} -11/07/2021 02:42:53 - INFO - __main__ - Step 39005: {'lr': 0.00042676168491977617, 'samples': 7488960, 'steps': 39004, 'loss/train': 1.3152886629104614} -11/07/2021 02:42:55 - INFO - __main__ - Step 39006: {'lr': 0.00042675793212644156, 'samples': 7489152, 'steps': 39005, 'loss/train': 1.3990839719772339} -11/07/2021 02:42:55 - INFO - __main__ - Step 39007: {'lr': 0.00042675417925346255, 'samples': 7489344, 'steps': 39006, 'loss/train': 1.7867127656936646} -11/07/2021 02:42:55 - INFO - __main__ - Step 39008: {'lr': 0.0004267504263008408, 'samples': 7489536, 'steps': 39007, 'loss/train': 1.0118520259857178} -11/07/2021 02:42:56 - INFO - __main__ - Step 39009: {'lr': 0.0004267466732685781, 'samples': 7489728, 'steps': 39008, 'loss/train': 1.6900672912597656} -11/07/2021 02:42:56 - INFO - __main__ - Step 39010: {'lr': 0.000426742920156676, 'samples': 7489920, 'steps': 39009, 'loss/train': 1.5228233337402344} -11/07/2021 02:42:57 - INFO - __main__ - Step 39011: {'lr': 0.00042673916696513625, 'samples': 7490112, 'steps': 39010, 'loss/train': 1.2955700159072876} -11/07/2021 02:42:58 - INFO - __main__ - Step 39012: {'lr': 0.0004267354136939607, 'samples': 7490304, 'steps': 39011, 'loss/train': 1.5123738050460815} -11/07/2021 02:42:58 - INFO - __main__ - Step 39013: {'lr': 0.0004267316603431508, 'samples': 7490496, 'steps': 39012, 'loss/train': 0.2923266589641571} -11/07/2021 02:42:58 - INFO - __main__ - Step 39014: {'lr': 0.00042672790691270835, 'samples': 7490688, 'steps': 39013, 'loss/train': 0.26859769225120544} -11/07/2021 02:42:59 - INFO - __main__ - Step 39015: {'lr': 0.00042672415340263507, 'samples': 7490880, 'steps': 39014, 'loss/train': 1.77121102809906} -11/07/2021 02:42:59 - INFO - __main__ - Step 39016: {'lr': 0.00042672039981293255, 'samples': 7491072, 'steps': 39015, 'loss/train': 1.6089158058166504} -11/07/2021 02:43:00 - INFO - __main__ - Step 39017: {'lr': 0.0004267166461436025, 'samples': 7491264, 'steps': 39016, 'loss/train': 1.4633493423461914} -11/07/2021 02:43:00 - INFO - __main__ - Step 39018: {'lr': 0.0004267128923946468, 'samples': 7491456, 'steps': 39017, 'loss/train': 1.7290396690368652} -11/07/2021 02:43:01 - INFO - __main__ - Step 39019: {'lr': 0.00042670913856606693, 'samples': 7491648, 'steps': 39018, 'loss/train': 1.2950791120529175} -11/07/2021 02:43:01 - INFO - __main__ - Step 39020: {'lr': 0.0004267053846578646, 'samples': 7491840, 'steps': 39019, 'loss/train': 1.799487590789795} -11/07/2021 02:43:01 - INFO - __main__ - Step 39021: {'lr': 0.00042670163067004156, 'samples': 7492032, 'steps': 39020, 'loss/train': 1.414844036102295} -11/07/2021 02:43:02 - INFO - __main__ - Step 39022: {'lr': 0.00042669787660259956, 'samples': 7492224, 'steps': 39021, 'loss/train': 1.309682846069336} -11/07/2021 02:43:03 - INFO - __main__ - Step 39023: {'lr': 0.0004266941224555402, 'samples': 7492416, 'steps': 39022, 'loss/train': 1.3504818677902222} -11/07/2021 02:43:03 - INFO - __main__ - Step 39024: {'lr': 0.0004266903682288652, 'samples': 7492608, 'steps': 39023, 'loss/train': 1.6617196798324585} -11/07/2021 02:43:04 - INFO - __main__ - Step 39025: {'lr': 0.00042668661392257626, 'samples': 7492800, 'steps': 39024, 'loss/train': 0.6336386203765869} -11/07/2021 02:43:04 - INFO - __main__ - Step 39026: {'lr': 0.00042668285953667497, 'samples': 7492992, 'steps': 39025, 'loss/train': 2.098825693130493} -11/07/2021 02:43:05 - INFO - __main__ - Step 39027: {'lr': 0.0004266791050711632, 'samples': 7493184, 'steps': 39026, 'loss/train': 1.292114019393921} -11/07/2021 02:43:05 - INFO - __main__ - Step 39028: {'lr': 0.0004266753505260425, 'samples': 7493376, 'steps': 39027, 'loss/train': 0.9015293717384338} -11/07/2021 02:43:06 - INFO - __main__ - Step 39029: {'lr': 0.00042667159590131467, 'samples': 7493568, 'steps': 39028, 'loss/train': 1.6260732412338257} -11/07/2021 02:43:06 - INFO - __main__ - Step 39030: {'lr': 0.0004266678411969813, 'samples': 7493760, 'steps': 39029, 'loss/train': 1.626287579536438} -11/07/2021 02:43:06 - INFO - __main__ - Step 39031: {'lr': 0.0004266640864130441, 'samples': 7493952, 'steps': 39030, 'loss/train': 2.1639013290405273} -11/07/2021 02:43:07 - INFO - __main__ - Step 39032: {'lr': 0.00042666033154950485, 'samples': 7494144, 'steps': 39031, 'loss/train': 1.570765733718872} -11/07/2021 02:43:08 - INFO - __main__ - Step 39033: {'lr': 0.00042665657660636517, 'samples': 7494336, 'steps': 39032, 'loss/train': 1.9968924522399902} -11/07/2021 02:43:08 - INFO - __main__ - Step 39034: {'lr': 0.0004266528215836267, 'samples': 7494528, 'steps': 39033, 'loss/train': 2.419520854949951} -11/07/2021 02:43:08 - INFO - __main__ - Step 39035: {'lr': 0.0004266490664812913, 'samples': 7494720, 'steps': 39034, 'loss/train': 1.085390567779541} -11/07/2021 02:43:09 - INFO - __main__ - Step 39036: {'lr': 0.00042664531129936044, 'samples': 7494912, 'steps': 39035, 'loss/train': 1.7049858570098877} -11/07/2021 02:43:10 - INFO - __main__ - Step 39037: {'lr': 0.00042664155603783606, 'samples': 7495104, 'steps': 39036, 'loss/train': 1.748128056526184} -11/07/2021 02:43:10 - INFO - __main__ - Step 39038: {'lr': 0.00042663780069671965, 'samples': 7495296, 'steps': 39037, 'loss/train': 1.3688992261886597} -11/07/2021 02:43:11 - INFO - __main__ - Step 39039: {'lr': 0.00042663404527601293, 'samples': 7495488, 'steps': 39038, 'loss/train': 1.2607609033584595} -11/07/2021 02:43:11 - INFO - __main__ - Step 39040: {'lr': 0.00042663028977571774, 'samples': 7495680, 'steps': 39039, 'loss/train': 1.2940502166748047} -11/07/2021 02:43:11 - INFO - __main__ - Step 39041: {'lr': 0.0004266265341958355, 'samples': 7495872, 'steps': 39040, 'loss/train': 1.4089736938476562} -11/07/2021 02:43:12 - INFO - __main__ - Step 39042: {'lr': 0.0004266227785363682, 'samples': 7496064, 'steps': 39041, 'loss/train': 1.0120713710784912} -11/07/2021 02:43:13 - INFO - __main__ - Step 39043: {'lr': 0.0004266190227973174, 'samples': 7496256, 'steps': 39042, 'loss/train': 1.0299112796783447} -11/07/2021 02:43:13 - INFO - __main__ - Step 39044: {'lr': 0.00042661526697868475, 'samples': 7496448, 'steps': 39043, 'loss/train': 1.5314782857894897} -11/07/2021 02:43:13 - INFO - __main__ - Step 39045: {'lr': 0.000426611511080472, 'samples': 7496640, 'steps': 39044, 'loss/train': 1.5129510164260864} -11/07/2021 02:43:14 - INFO - __main__ - Step 39046: {'lr': 0.0004266077551026809, 'samples': 7496832, 'steps': 39045, 'loss/train': 1.6129285097122192} -11/07/2021 02:43:14 - INFO - __main__ - Step 39047: {'lr': 0.000426603999045313, 'samples': 7497024, 'steps': 39046, 'loss/train': 1.57774019241333} -11/07/2021 02:43:15 - INFO - __main__ - Step 39048: {'lr': 0.00042660024290837003, 'samples': 7497216, 'steps': 39047, 'loss/train': 1.5723294019699097} -11/07/2021 02:43:15 - INFO - __main__ - Step 39049: {'lr': 0.00042659648669185376, 'samples': 7497408, 'steps': 39048, 'loss/train': 1.8148497343063354} -11/07/2021 02:43:16 - INFO - __main__ - Step 39050: {'lr': 0.0004265927303957658, 'samples': 7497600, 'steps': 39049, 'loss/train': 1.5007797479629517} -11/07/2021 02:43:16 - INFO - __main__ - Step 39051: {'lr': 0.0004265889740201079, 'samples': 7497792, 'steps': 39050, 'loss/train': 0.9909560680389404} -11/07/2021 02:43:17 - INFO - __main__ - Step 39052: {'lr': 0.0004265852175648818, 'samples': 7497984, 'steps': 39051, 'loss/train': 1.711198091506958} -11/07/2021 02:43:17 - INFO - __main__ - Step 39053: {'lr': 0.00042658146103008904, 'samples': 7498176, 'steps': 39052, 'loss/train': 1.286407470703125} -11/07/2021 02:43:18 - INFO - __main__ - Step 39054: {'lr': 0.0004265777044157314, 'samples': 7498368, 'steps': 39053, 'loss/train': 1.2508012056350708} -11/07/2021 02:43:18 - INFO - __main__ - Step 39055: {'lr': 0.0004265739477218106, 'samples': 7498560, 'steps': 39054, 'loss/train': 1.1808032989501953} -11/07/2021 02:43:19 - INFO - __main__ - Step 39056: {'lr': 0.0004265701909483283, 'samples': 7498752, 'steps': 39055, 'loss/train': 1.7937642335891724} -11/07/2021 02:43:19 - INFO - __main__ - Step 39057: {'lr': 0.0004265664340952862, 'samples': 7498944, 'steps': 39056, 'loss/train': 1.225213646888733} -11/07/2021 02:43:20 - INFO - __main__ - Step 39058: {'lr': 0.00042656267716268596, 'samples': 7499136, 'steps': 39057, 'loss/train': 1.51992928981781} -11/07/2021 02:43:20 - INFO - __main__ - Step 39059: {'lr': 0.00042655892015052945, 'samples': 7499328, 'steps': 39058, 'loss/train': 1.9359447956085205} -11/07/2021 02:43:21 - INFO - __main__ - Step 39060: {'lr': 0.00042655516305881803, 'samples': 7499520, 'steps': 39059, 'loss/train': 1.600701093673706} -11/07/2021 02:43:21 - INFO - __main__ - Step 39061: {'lr': 0.00042655140588755366, 'samples': 7499712, 'steps': 39060, 'loss/train': 1.3078956604003906} -11/07/2021 02:43:21 - INFO - __main__ - Step 39062: {'lr': 0.0004265476486367379, 'samples': 7499904, 'steps': 39061, 'loss/train': 1.5851510763168335} -11/07/2021 02:43:22 - INFO - __main__ - Step 39063: {'lr': 0.00042654389130637255, 'samples': 7500096, 'steps': 39062, 'loss/train': 2.0155324935913086} -11/07/2021 02:43:23 - INFO - __main__ - Step 39064: {'lr': 0.0004265401338964592, 'samples': 7500288, 'steps': 39063, 'loss/train': 1.5076969861984253} -11/07/2021 02:43:23 - INFO - __main__ - Step 39065: {'lr': 0.0004265363764069997, 'samples': 7500480, 'steps': 39064, 'loss/train': 1.4725383520126343} -11/07/2021 02:43:24 - INFO - __main__ - Step 39066: {'lr': 0.0004265326188379955, 'samples': 7500672, 'steps': 39065, 'loss/train': 1.3737947940826416} -11/07/2021 02:43:24 - INFO - __main__ - Step 39067: {'lr': 0.00042652886118944844, 'samples': 7500864, 'steps': 39066, 'loss/train': 1.9032598733901978} -11/07/2021 02:43:25 - INFO - __main__ - Step 39068: {'lr': 0.0004265251034613603, 'samples': 7501056, 'steps': 39067, 'loss/train': 1.7712714672088623} -11/07/2021 02:43:25 - INFO - __main__ - Step 39069: {'lr': 0.0004265213456537326, 'samples': 7501248, 'steps': 39068, 'loss/train': 1.6109968423843384} -11/07/2021 02:43:26 - INFO - __main__ - Step 39070: {'lr': 0.0004265175877665671, 'samples': 7501440, 'steps': 39069, 'loss/train': 1.583343505859375} -11/07/2021 02:43:26 - INFO - __main__ - Step 39071: {'lr': 0.0004265138297998655, 'samples': 7501632, 'steps': 39070, 'loss/train': 1.392993688583374} -11/07/2021 02:43:26 - INFO - __main__ - Step 39072: {'lr': 0.0004265100717536295, 'samples': 7501824, 'steps': 39071, 'loss/train': 1.5252935886383057} -11/07/2021 02:43:27 - INFO - __main__ - Step 39073: {'lr': 0.0004265063136278608, 'samples': 7502016, 'steps': 39072, 'loss/train': 1.0011496543884277} -11/07/2021 02:43:28 - INFO - __main__ - Step 39074: {'lr': 0.00042650255542256107, 'samples': 7502208, 'steps': 39073, 'loss/train': 0.8705465793609619} -11/07/2021 02:43:28 - INFO - __main__ - Step 39075: {'lr': 0.000426498797137732, 'samples': 7502400, 'steps': 39074, 'loss/train': 1.4799444675445557} -11/07/2021 02:43:28 - INFO - __main__ - Step 39076: {'lr': 0.00042649503877337523, 'samples': 7502592, 'steps': 39075, 'loss/train': 1.2689144611358643} -11/07/2021 02:43:29 - INFO - __main__ - Step 39077: {'lr': 0.0004264912803294926, 'samples': 7502784, 'steps': 39076, 'loss/train': 1.2915695905685425} -11/07/2021 02:43:29 - INFO - __main__ - Step 39078: {'lr': 0.0004264875218060857, 'samples': 7502976, 'steps': 39077, 'loss/train': 1.4235657453536987} -11/07/2021 02:43:30 - INFO - __main__ - Step 39079: {'lr': 0.00042648376320315634, 'samples': 7503168, 'steps': 39078, 'loss/train': 1.135210633277893} -11/07/2021 02:43:30 - INFO - __main__ - Step 39080: {'lr': 0.000426480004520706, 'samples': 7503360, 'steps': 39079, 'loss/train': 1.3262708187103271} -11/07/2021 02:43:31 - INFO - __main__ - Step 39081: {'lr': 0.00042647624575873656, 'samples': 7503552, 'steps': 39080, 'loss/train': 1.3059016466140747} -11/07/2021 02:43:31 - INFO - __main__ - Step 39082: {'lr': 0.0004264724869172496, 'samples': 7503744, 'steps': 39081, 'loss/train': 1.7730166912078857} -11/07/2021 02:43:31 - INFO - __main__ - Step 39083: {'lr': 0.00042646872799624694, 'samples': 7503936, 'steps': 39082, 'loss/train': 1.3689271211624146} -11/07/2021 02:43:33 - INFO - __main__ - Step 39084: {'lr': 0.00042646496899573005, 'samples': 7504128, 'steps': 39083, 'loss/train': 1.578107476234436} -11/07/2021 02:43:33 - INFO - __main__ - Step 39085: {'lr': 0.0004264612099157009, 'samples': 7504320, 'steps': 39084, 'loss/train': 1.7110601663589478} -11/07/2021 02:43:33 - INFO - __main__ - Step 39086: {'lr': 0.00042645745075616106, 'samples': 7504512, 'steps': 39085, 'loss/train': 0.18499447405338287} -11/07/2021 02:43:34 - INFO - __main__ - Step 39087: {'lr': 0.0004264536915171121, 'samples': 7504704, 'steps': 39086, 'loss/train': 1.8357080221176147} -11/07/2021 02:43:34 - INFO - __main__ - Step 39088: {'lr': 0.0004264499321985559, 'samples': 7504896, 'steps': 39087, 'loss/train': 1.2061140537261963} -11/07/2021 02:43:35 - INFO - __main__ - Step 39089: {'lr': 0.0004264461728004941, 'samples': 7505088, 'steps': 39088, 'loss/train': 1.141921877861023} -11/07/2021 02:43:35 - INFO - __main__ - Step 39090: {'lr': 0.0004264424133229283, 'samples': 7505280, 'steps': 39089, 'loss/train': 0.20083756744861603} -11/07/2021 02:43:36 - INFO - __main__ - Step 39091: {'lr': 0.0004264386537658603, 'samples': 7505472, 'steps': 39090, 'loss/train': 6.336944103240967} -11/07/2021 02:43:36 - INFO - __main__ - Step 39092: {'lr': 0.0004264348941292919, 'samples': 7505664, 'steps': 39091, 'loss/train': 1.4087821245193481} -11/07/2021 02:43:37 - INFO - __main__ - Step 39093: {'lr': 0.0004264311344132245, 'samples': 7505856, 'steps': 39092, 'loss/train': 1.8912596702575684} -11/07/2021 02:43:38 - INFO - __main__ - Step 39094: {'lr': 0.00042642737461766003, 'samples': 7506048, 'steps': 39093, 'loss/train': 1.4628355503082275} -11/07/2021 02:43:38 - INFO - __main__ - Step 39095: {'lr': 0.0004264236147426, 'samples': 7506240, 'steps': 39094, 'loss/train': 1.4418323040008545} -11/07/2021 02:43:38 - INFO - __main__ - Step 39096: {'lr': 0.0004264198547880464, 'samples': 7506432, 'steps': 39095, 'loss/train': 1.587921380996704} -11/07/2021 02:43:39 - INFO - __main__ - Step 39097: {'lr': 0.00042641609475400054, 'samples': 7506624, 'steps': 39096, 'loss/train': 2.056940793991089} -11/07/2021 02:43:39 - INFO - __main__ - Step 39098: {'lr': 0.0004264123346404644, 'samples': 7506816, 'steps': 39097, 'loss/train': 1.7755131721496582} -11/07/2021 02:43:39 - INFO - __main__ - Step 39099: {'lr': 0.0004264085744474396, 'samples': 7507008, 'steps': 39098, 'loss/train': 1.3965548276901245} -11/07/2021 02:43:40 - INFO - __main__ - Step 39100: {'lr': 0.0004264048141749278, 'samples': 7507200, 'steps': 39099, 'loss/train': 1.769647240638733} -11/07/2021 02:43:41 - INFO - __main__ - Step 39101: {'lr': 0.00042640105382293073, 'samples': 7507392, 'steps': 39100, 'loss/train': 1.4096415042877197} -11/07/2021 02:43:41 - INFO - __main__ - Step 39102: {'lr': 0.00042639729339145004, 'samples': 7507584, 'steps': 39101, 'loss/train': 0.1855313628911972} -11/07/2021 02:43:42 - INFO - __main__ - Step 39103: {'lr': 0.0004263935328804874, 'samples': 7507776, 'steps': 39102, 'loss/train': 1.5442306995391846} -11/07/2021 02:43:42 - INFO - __main__ - Step 39104: {'lr': 0.0004263897722900447, 'samples': 7507968, 'steps': 39103, 'loss/train': 0.9975839853286743} -11/07/2021 02:43:43 - INFO - __main__ - Step 39105: {'lr': 0.0004263860116201234, 'samples': 7508160, 'steps': 39104, 'loss/train': 1.142077088356018} -11/07/2021 02:43:43 - INFO - __main__ - Step 39106: {'lr': 0.00042638225087072523, 'samples': 7508352, 'steps': 39105, 'loss/train': 1.9047843217849731} -11/07/2021 02:43:44 - INFO - __main__ - Step 39107: {'lr': 0.00042637849004185203, 'samples': 7508544, 'steps': 39106, 'loss/train': 2.055018663406372} -11/07/2021 02:43:44 - INFO - __main__ - Step 39108: {'lr': 0.0004263747291335054, 'samples': 7508736, 'steps': 39107, 'loss/train': 1.40550696849823} -11/07/2021 02:43:44 - INFO - __main__ - Step 39109: {'lr': 0.00042637096814568696, 'samples': 7508928, 'steps': 39108, 'loss/train': 1.4031354188919067} -11/07/2021 02:43:45 - INFO - __main__ - Step 39110: {'lr': 0.0004263672070783986, 'samples': 7509120, 'steps': 39109, 'loss/train': 2.0347707271575928} -11/07/2021 02:43:46 - INFO - __main__ - Step 39111: {'lr': 0.0004263634459316418, 'samples': 7509312, 'steps': 39110, 'loss/train': 1.3580670356750488} -11/07/2021 02:43:46 - INFO - __main__ - Step 39112: {'lr': 0.0004263596847054184, 'samples': 7509504, 'steps': 39111, 'loss/train': 1.6178772449493408} -11/07/2021 02:43:46 - INFO - __main__ - Step 39113: {'lr': 0.00042635592339973006, 'samples': 7509696, 'steps': 39112, 'loss/train': 1.6451839208602905} -11/07/2021 02:43:47 - INFO - __main__ - Step 39114: {'lr': 0.00042635216201457836, 'samples': 7509888, 'steps': 39113, 'loss/train': 1.5635451078414917} -11/07/2021 02:43:48 - INFO - __main__ - Step 39115: {'lr': 0.00042634840054996527, 'samples': 7510080, 'steps': 39114, 'loss/train': 1.6748383045196533} -11/07/2021 02:43:48 - INFO - __main__ - Step 39116: {'lr': 0.00042634463900589214, 'samples': 7510272, 'steps': 39115, 'loss/train': 1.7744406461715698} -11/07/2021 02:43:49 - INFO - __main__ - Step 39117: {'lr': 0.0004263408773823609, 'samples': 7510464, 'steps': 39116, 'loss/train': 1.3158316612243652} -11/07/2021 02:43:49 - INFO - __main__ - Step 39118: {'lr': 0.00042633711567937325, 'samples': 7510656, 'steps': 39117, 'loss/train': 1.6775025129318237} -11/07/2021 02:43:49 - INFO - __main__ - Step 39119: {'lr': 0.00042633335389693073, 'samples': 7510848, 'steps': 39118, 'loss/train': 0.40122219920158386} -11/07/2021 02:43:51 - INFO - __main__ - Step 39120: {'lr': 0.0004263295920350352, 'samples': 7511040, 'steps': 39119, 'loss/train': 1.5833914279937744} -11/07/2021 02:43:51 - INFO - __main__ - Step 39121: {'lr': 0.0004263258300936882, 'samples': 7511232, 'steps': 39120, 'loss/train': 1.6524046659469604} -11/07/2021 02:43:51 - INFO - __main__ - Step 39122: {'lr': 0.00042632206807289154, 'samples': 7511424, 'steps': 39121, 'loss/train': 1.775888442993164} -11/07/2021 02:43:52 - INFO - __main__ - Step 39123: {'lr': 0.00042631830597264687, 'samples': 7511616, 'steps': 39122, 'loss/train': 0.7915307879447937} -11/07/2021 02:43:52 - INFO - __main__ - Step 39124: {'lr': 0.0004263145437929559, 'samples': 7511808, 'steps': 39123, 'loss/train': 1.0251669883728027} -11/07/2021 02:43:52 - INFO - __main__ - Step 39125: {'lr': 0.0004263107815338203, 'samples': 7512000, 'steps': 39124, 'loss/train': 1.103756308555603} -11/07/2021 02:43:54 - INFO - __main__ - Step 39126: {'lr': 0.00042630701919524176, 'samples': 7512192, 'steps': 39125, 'loss/train': 1.082054853439331} -11/07/2021 02:43:55 - INFO - __main__ - Step 39127: {'lr': 0.00042630325677722204, 'samples': 7512384, 'steps': 39126, 'loss/train': 1.9423552751541138} -11/07/2021 02:43:55 - INFO - __main__ - Step 39128: {'lr': 0.0004262994942797628, 'samples': 7512576, 'steps': 39127, 'loss/train': 1.4827128648757935} -11/07/2021 02:43:55 - INFO - __main__ - Step 39129: {'lr': 0.0004262957317028657, 'samples': 7512768, 'steps': 39128, 'loss/train': 1.9064688682556152} -11/07/2021 02:43:56 - INFO - __main__ - Step 39130: {'lr': 0.00042629196904653245, 'samples': 7512960, 'steps': 39129, 'loss/train': 1.6398931741714478} -11/07/2021 02:43:56 - INFO - __main__ - Step 39131: {'lr': 0.00042628820631076484, 'samples': 7513152, 'steps': 39130, 'loss/train': 1.8073322772979736} -11/07/2021 02:43:56 - INFO - __main__ - Step 39132: {'lr': 0.0004262844434955644, 'samples': 7513344, 'steps': 39131, 'loss/train': 1.827433705329895} -11/07/2021 02:43:57 - INFO - __main__ - Step 39133: {'lr': 0.00042628068060093294, 'samples': 7513536, 'steps': 39132, 'loss/train': 1.417256474494934} -11/07/2021 02:43:58 - INFO - __main__ - Step 39134: {'lr': 0.0004262769176268722, 'samples': 7513728, 'steps': 39133, 'loss/train': 1.0433682203292847} -11/07/2021 02:43:58 - INFO - __main__ - Step 39135: {'lr': 0.0004262731545733837, 'samples': 7513920, 'steps': 39134, 'loss/train': 0.5978344082832336} -11/07/2021 02:43:59 - INFO - __main__ - Step 39136: {'lr': 0.0004262693914404692, 'samples': 7514112, 'steps': 39135, 'loss/train': 2.1662096977233887} -11/07/2021 02:43:59 - INFO - __main__ - Step 39137: {'lr': 0.0004262656282281305, 'samples': 7514304, 'steps': 39136, 'loss/train': 1.5228852033615112} -11/07/2021 02:43:59 - INFO - __main__ - Step 39138: {'lr': 0.0004262618649363692, 'samples': 7514496, 'steps': 39137, 'loss/train': 1.7849223613739014} -11/07/2021 02:44:00 - INFO - __main__ - Step 39139: {'lr': 0.0004262581015651871, 'samples': 7514688, 'steps': 39138, 'loss/train': 1.654083251953125} -11/07/2021 02:44:01 - INFO - __main__ - Step 39140: {'lr': 0.0004262543381145857, 'samples': 7514880, 'steps': 39139, 'loss/train': 1.332046627998352} -11/07/2021 02:44:01 - INFO - __main__ - Step 39141: {'lr': 0.0004262505745845669, 'samples': 7515072, 'steps': 39140, 'loss/train': 1.7173765897750854} -11/07/2021 02:44:01 - INFO - __main__ - Step 39142: {'lr': 0.0004262468109751323, 'samples': 7515264, 'steps': 39141, 'loss/train': 0.9578734636306763} -11/07/2021 02:44:02 - INFO - __main__ - Step 39143: {'lr': 0.0004262430472862836, 'samples': 7515456, 'steps': 39142, 'loss/train': 1.4384714365005493} -11/07/2021 02:44:03 - INFO - __main__ - Step 39144: {'lr': 0.00042623928351802245, 'samples': 7515648, 'steps': 39143, 'loss/train': 1.6106135845184326} -11/07/2021 02:44:03 - INFO - __main__ - Step 39145: {'lr': 0.00042623551967035066, 'samples': 7515840, 'steps': 39144, 'loss/train': 1.6195812225341797} -11/07/2021 02:44:03 - INFO - __main__ - Step 39146: {'lr': 0.0004262317557432699, 'samples': 7516032, 'steps': 39145, 'loss/train': 1.3861796855926514} -11/07/2021 02:44:04 - INFO - __main__ - Step 39147: {'lr': 0.0004262279917367817, 'samples': 7516224, 'steps': 39146, 'loss/train': 2.5530037879943848} -11/07/2021 02:44:04 - INFO - __main__ - Step 39148: {'lr': 0.00042622422765088805, 'samples': 7516416, 'steps': 39147, 'loss/train': 1.7445322275161743} -11/07/2021 02:44:05 - INFO - __main__ - Step 39149: {'lr': 0.00042622046348559034, 'samples': 7516608, 'steps': 39148, 'loss/train': 1.8676589727401733} -11/07/2021 02:44:06 - INFO - __main__ - Step 39150: {'lr': 0.00042621669924089044, 'samples': 7516800, 'steps': 39149, 'loss/train': 1.1236180067062378} -11/07/2021 02:44:06 - INFO - __main__ - Step 39151: {'lr': 0.00042621293491679007, 'samples': 7516992, 'steps': 39150, 'loss/train': 1.6182490587234497} -11/07/2021 02:44:06 - INFO - __main__ - Step 39152: {'lr': 0.00042620917051329086, 'samples': 7517184, 'steps': 39151, 'loss/train': 1.8522018194198608} -11/07/2021 02:44:07 - INFO - __main__ - Step 39153: {'lr': 0.0004262054060303945, 'samples': 7517376, 'steps': 39152, 'loss/train': 1.569541335105896} -11/07/2021 02:44:08 - INFO - __main__ - Step 39154: {'lr': 0.00042620164146810267, 'samples': 7517568, 'steps': 39153, 'loss/train': 1.5665749311447144} -11/07/2021 02:44:08 - INFO - __main__ - Step 39155: {'lr': 0.0004261978768264172, 'samples': 7517760, 'steps': 39154, 'loss/train': 1.3959105014801025} -11/07/2021 02:44:08 - INFO - __main__ - Step 39156: {'lr': 0.00042619411210533957, 'samples': 7517952, 'steps': 39155, 'loss/train': 1.1868535280227661} -11/07/2021 02:44:09 - INFO - __main__ - Step 39157: {'lr': 0.00042619034730487167, 'samples': 7518144, 'steps': 39156, 'loss/train': 1.2965528964996338} -11/07/2021 02:44:09 - INFO - __main__ - Step 39158: {'lr': 0.00042618658242501507, 'samples': 7518336, 'steps': 39157, 'loss/train': 1.6020418405532837} -11/07/2021 02:44:09 - INFO - __main__ - Step 39159: {'lr': 0.0004261828174657716, 'samples': 7518528, 'steps': 39158, 'loss/train': 1.598738431930542} -11/07/2021 02:44:11 - INFO - __main__ - Step 39160: {'lr': 0.0004261790524271427, 'samples': 7518720, 'steps': 39159, 'loss/train': 0.7763488292694092} -11/07/2021 02:44:11 - INFO - __main__ - Step 39161: {'lr': 0.00042617528730913036, 'samples': 7518912, 'steps': 39160, 'loss/train': 1.378023386001587} -11/07/2021 02:44:11 - INFO - __main__ - Step 39162: {'lr': 0.00042617152211173615, 'samples': 7519104, 'steps': 39161, 'loss/train': 1.0492256879806519} -11/07/2021 02:44:12 - INFO - __main__ - Step 39163: {'lr': 0.0004261677568349618, 'samples': 7519296, 'steps': 39162, 'loss/train': 1.1615722179412842} -11/07/2021 02:44:12 - INFO - __main__ - Step 39164: {'lr': 0.0004261639914788089, 'samples': 7519488, 'steps': 39163, 'loss/train': 1.13607919216156} -11/07/2021 02:44:13 - INFO - __main__ - Step 39165: {'lr': 0.0004261602260432792, 'samples': 7519680, 'steps': 39164, 'loss/train': 1.5264469385147095} -11/07/2021 02:44:13 - INFO - __main__ - Step 39166: {'lr': 0.0004261564605283745, 'samples': 7519872, 'steps': 39165, 'loss/train': 1.8770747184753418} -11/07/2021 02:44:14 - INFO - __main__ - Step 39167: {'lr': 0.0004261526949340965, 'samples': 7520064, 'steps': 39166, 'loss/train': 1.918188452720642} -11/07/2021 02:44:14 - INFO - __main__ - Step 39168: {'lr': 0.0004261489292604467, 'samples': 7520256, 'steps': 39167, 'loss/train': 1.4785051345825195} -11/07/2021 02:44:14 - INFO - __main__ - Step 39169: {'lr': 0.0004261451635074269, 'samples': 7520448, 'steps': 39168, 'loss/train': 1.4458575248718262} -11/07/2021 02:44:15 - INFO - __main__ - Step 39170: {'lr': 0.0004261413976750388, 'samples': 7520640, 'steps': 39169, 'loss/train': 1.223093032836914} -11/07/2021 02:44:16 - INFO - __main__ - Step 39171: {'lr': 0.00042613763176328415, 'samples': 7520832, 'steps': 39170, 'loss/train': 1.6749415397644043} -11/07/2021 02:44:16 - INFO - __main__ - Step 39172: {'lr': 0.00042613386577216455, 'samples': 7521024, 'steps': 39171, 'loss/train': 1.0120102167129517} -11/07/2021 02:44:16 - INFO - __main__ - Step 39173: {'lr': 0.0004261300997016818, 'samples': 7521216, 'steps': 39172, 'loss/train': 1.5103209018707275} -11/07/2021 02:44:17 - INFO - __main__ - Step 39174: {'lr': 0.0004261263335518375, 'samples': 7521408, 'steps': 39173, 'loss/train': 1.765062689781189} -11/07/2021 02:44:18 - INFO - __main__ - Step 39175: {'lr': 0.00042612256732263345, 'samples': 7521600, 'steps': 39174, 'loss/train': 1.3832707405090332} -11/07/2021 02:44:18 - INFO - __main__ - Step 39176: {'lr': 0.0004261188010140712, 'samples': 7521792, 'steps': 39175, 'loss/train': 1.7844562530517578} -11/07/2021 02:44:19 - INFO - __main__ - Step 39177: {'lr': 0.00042611503462615266, 'samples': 7521984, 'steps': 39176, 'loss/train': 1.3058295249938965} -11/07/2021 02:44:19 - INFO - __main__ - Step 39178: {'lr': 0.0004261112681588793, 'samples': 7522176, 'steps': 39177, 'loss/train': 1.85269033908844} -11/07/2021 02:44:19 - INFO - __main__ - Step 39179: {'lr': 0.000426107501612253, 'samples': 7522368, 'steps': 39178, 'loss/train': 0.9109247922897339} -11/07/2021 02:44:20 - INFO - __main__ - Step 39180: {'lr': 0.0004261037349862753, 'samples': 7522560, 'steps': 39179, 'loss/train': 1.7155182361602783} -11/07/2021 02:44:21 - INFO - __main__ - Step 39181: {'lr': 0.000426099968280948, 'samples': 7522752, 'steps': 39180, 'loss/train': 1.9949593544006348} -11/07/2021 02:44:21 - INFO - __main__ - Step 39182: {'lr': 0.00042609620149627284, 'samples': 7522944, 'steps': 39181, 'loss/train': 1.5575292110443115} -11/07/2021 02:44:21 - INFO - __main__ - Step 39183: {'lr': 0.00042609243463225134, 'samples': 7523136, 'steps': 39182, 'loss/train': 1.2065694332122803} -11/07/2021 02:44:22 - INFO - __main__ - Step 39184: {'lr': 0.00042608866768888533, 'samples': 7523328, 'steps': 39183, 'loss/train': 1.510762333869934} -11/07/2021 02:44:22 - INFO - __main__ - Step 39185: {'lr': 0.0004260849006661765, 'samples': 7523520, 'steps': 39184, 'loss/train': 0.8770667314529419} -11/07/2021 02:44:23 - INFO - __main__ - Step 39186: {'lr': 0.0004260811335641266, 'samples': 7523712, 'steps': 39185, 'loss/train': 1.672101616859436} -11/07/2021 02:44:24 - INFO - __main__ - Step 39187: {'lr': 0.0004260773663827372, 'samples': 7523904, 'steps': 39186, 'loss/train': 1.276141881942749} -11/07/2021 02:44:24 - INFO - __main__ - Step 39188: {'lr': 0.00042607359912201004, 'samples': 7524096, 'steps': 39187, 'loss/train': 0.5991111397743225} -11/07/2021 02:44:24 - INFO - __main__ - Step 39189: {'lr': 0.0004260698317819468, 'samples': 7524288, 'steps': 39188, 'loss/train': 1.2625077962875366} -11/07/2021 02:44:25 - INFO - __main__ - Step 39190: {'lr': 0.00042606606436254926, 'samples': 7524480, 'steps': 39189, 'loss/train': 1.1217215061187744} -11/07/2021 02:44:26 - INFO - __main__ - Step 39191: {'lr': 0.000426062296863819, 'samples': 7524672, 'steps': 39190, 'loss/train': 1.4759544134140015} -11/07/2021 02:44:26 - INFO - __main__ - Step 39192: {'lr': 0.00042605852928575796, 'samples': 7524864, 'steps': 39191, 'loss/train': 1.1649805307388306} -11/07/2021 02:44:26 - INFO - __main__ - Step 39193: {'lr': 0.00042605476162836756, 'samples': 7525056, 'steps': 39192, 'loss/train': 0.11307892203330994} -11/07/2021 02:44:27 - INFO - __main__ - Step 39194: {'lr': 0.00042605099389164957, 'samples': 7525248, 'steps': 39193, 'loss/train': 1.0232011079788208} -11/07/2021 02:44:27 - INFO - __main__ - Step 39195: {'lr': 0.00042604722607560575, 'samples': 7525440, 'steps': 39194, 'loss/train': 1.8840378522872925} -11/07/2021 02:44:28 - INFO - __main__ - Step 39196: {'lr': 0.0004260434581802377, 'samples': 7525632, 'steps': 39195, 'loss/train': 1.325415015220642} -11/07/2021 02:44:29 - INFO - __main__ - Step 39197: {'lr': 0.0004260396902055473, 'samples': 7525824, 'steps': 39196, 'loss/train': 1.6330317258834839} -11/07/2021 02:44:29 - INFO - __main__ - Step 39198: {'lr': 0.0004260359221515361, 'samples': 7526016, 'steps': 39197, 'loss/train': 2.978104829788208} -11/07/2021 02:44:29 - INFO - __main__ - Step 39199: {'lr': 0.0004260321540182057, 'samples': 7526208, 'steps': 39198, 'loss/train': 1.3887532949447632} -11/07/2021 02:44:30 - INFO - __main__ - Step 39200: {'lr': 0.00042602838580555814, 'samples': 7526400, 'steps': 39199, 'loss/train': 1.367277979850769} -11/07/2021 02:44:31 - INFO - __main__ - Step 39201: {'lr': 0.0004260246175135948, 'samples': 7526592, 'steps': 39200, 'loss/train': 1.5049934387207031} -11/07/2021 02:44:31 - INFO - __main__ - Step 39202: {'lr': 0.00042602084914231743, 'samples': 7526784, 'steps': 39201, 'loss/train': 2.2483091354370117} -11/07/2021 02:44:31 - INFO - __main__ - Step 39203: {'lr': 0.0004260170806917278, 'samples': 7526976, 'steps': 39202, 'loss/train': 1.7197997570037842} -11/07/2021 02:44:32 - INFO - __main__ - Step 39204: {'lr': 0.0004260133121618276, 'samples': 7527168, 'steps': 39203, 'loss/train': 1.5005837678909302} -11/07/2021 02:44:32 - INFO - __main__ - Step 39205: {'lr': 0.0004260095435526186, 'samples': 7527360, 'steps': 39204, 'loss/train': 1.5221214294433594} -11/07/2021 02:44:32 - INFO - __main__ - Step 39206: {'lr': 0.0004260057748641024, 'samples': 7527552, 'steps': 39205, 'loss/train': 1.5341522693634033} -11/07/2021 02:44:33 - INFO - __main__ - Step 39207: {'lr': 0.00042600200609628063, 'samples': 7527744, 'steps': 39206, 'loss/train': 1.2754578590393066} -11/07/2021 02:44:34 - INFO - __main__ - Step 39208: {'lr': 0.0004259982372491551, 'samples': 7527936, 'steps': 39207, 'loss/train': 1.186719536781311} -11/07/2021 02:44:34 - INFO - __main__ - Step 39209: {'lr': 0.00042599446832272746, 'samples': 7528128, 'steps': 39208, 'loss/train': 1.3470895290374756} -11/07/2021 02:44:34 - INFO - __main__ - Step 39210: {'lr': 0.0004259906993169995, 'samples': 7528320, 'steps': 39209, 'loss/train': 1.8728010654449463} -11/07/2021 02:44:35 - INFO - __main__ - Step 39211: {'lr': 0.00042598693023197283, 'samples': 7528512, 'steps': 39210, 'loss/train': 1.5531646013259888} -11/07/2021 02:44:36 - INFO - __main__ - Step 39212: {'lr': 0.00042598316106764913, 'samples': 7528704, 'steps': 39211, 'loss/train': 1.987898588180542} -11/07/2021 02:44:36 - INFO - __main__ - Step 39213: {'lr': 0.0004259793918240302, 'samples': 7528896, 'steps': 39212, 'loss/train': 1.207327127456665} -11/07/2021 02:44:37 - INFO - __main__ - Step 39214: {'lr': 0.00042597562250111753, 'samples': 7529088, 'steps': 39213, 'loss/train': 1.4415658712387085} -11/07/2021 02:44:37 - INFO - __main__ - Step 39215: {'lr': 0.00042597185309891305, 'samples': 7529280, 'steps': 39214, 'loss/train': 1.9070416688919067} -11/07/2021 02:44:37 - INFO - __main__ - Step 39216: {'lr': 0.0004259680836174184, 'samples': 7529472, 'steps': 39215, 'loss/train': 1.5507830381393433} -11/07/2021 02:44:39 - INFO - __main__ - Step 39217: {'lr': 0.0004259643140566352, 'samples': 7529664, 'steps': 39216, 'loss/train': 0.5437787175178528} -11/07/2021 02:44:40 - INFO - __main__ - Step 39218: {'lr': 0.0004259605444165652, 'samples': 7529856, 'steps': 39217, 'loss/train': 1.7301392555236816} -11/07/2021 02:44:40 - INFO - __main__ - Step 39219: {'lr': 0.0004259567746972101, 'samples': 7530048, 'steps': 39218, 'loss/train': 1.3682011365890503} -11/07/2021 02:44:40 - INFO - __main__ - Step 39220: {'lr': 0.00042595300489857164, 'samples': 7530240, 'steps': 39219, 'loss/train': 0.709819495677948} -11/07/2021 02:44:41 - INFO - __main__ - Step 39221: {'lr': 0.0004259492350206514, 'samples': 7530432, 'steps': 39220, 'loss/train': 0.7055956721305847} -11/07/2021 02:44:41 - INFO - __main__ - Step 39222: {'lr': 0.00042594546506345124, 'samples': 7530624, 'steps': 39221, 'loss/train': 0.7826408743858337} -11/07/2021 02:44:41 - INFO - __main__ - Step 39223: {'lr': 0.00042594169502697265, 'samples': 7530816, 'steps': 39222, 'loss/train': 1.359542727470398} -11/07/2021 02:44:42 - INFO - __main__ - Step 39224: {'lr': 0.00042593792491121753, 'samples': 7531008, 'steps': 39223, 'loss/train': 1.3976107835769653} -11/07/2021 02:44:43 - INFO - __main__ - Step 39225: {'lr': 0.00042593415471618744, 'samples': 7531200, 'steps': 39224, 'loss/train': 1.443656086921692} -11/07/2021 02:44:43 - INFO - __main__ - Step 39226: {'lr': 0.0004259303844418841, 'samples': 7531392, 'steps': 39225, 'loss/train': 1.6289358139038086} -11/07/2021 02:44:43 - INFO - __main__ - Step 39227: {'lr': 0.00042592661408830937, 'samples': 7531584, 'steps': 39226, 'loss/train': 1.7915257215499878} -11/07/2021 02:44:44 - INFO - __main__ - Step 39228: {'lr': 0.00042592284365546474, 'samples': 7531776, 'steps': 39227, 'loss/train': 1.7885856628417969} -11/07/2021 02:44:45 - INFO - __main__ - Step 39229: {'lr': 0.00042591907314335197, 'samples': 7531968, 'steps': 39228, 'loss/train': 1.8358139991760254} -11/07/2021 02:44:45 - INFO - __main__ - Step 39230: {'lr': 0.00042591530255197286, 'samples': 7532160, 'steps': 39229, 'loss/train': 1.45115327835083} -11/07/2021 02:44:45 - INFO - __main__ - Step 39231: {'lr': 0.00042591153188132903, 'samples': 7532352, 'steps': 39230, 'loss/train': 1.6204403638839722} -11/07/2021 02:44:46 - INFO - __main__ - Step 39232: {'lr': 0.00042590776113142216, 'samples': 7532544, 'steps': 39231, 'loss/train': 1.5731817483901978} -11/07/2021 02:44:46 - INFO - __main__ - Step 39233: {'lr': 0.00042590399030225393, 'samples': 7532736, 'steps': 39232, 'loss/train': 1.7579594850540161} -11/07/2021 02:44:48 - INFO - __main__ - Step 39234: {'lr': 0.0004259002193938261, 'samples': 7532928, 'steps': 39233, 'loss/train': 2.0346720218658447} -11/07/2021 02:44:48 - INFO - __main__ - Step 39235: {'lr': 0.0004258964484061403, 'samples': 7533120, 'steps': 39234, 'loss/train': 1.7093135118484497} -11/07/2021 02:44:49 - INFO - __main__ - Step 39236: {'lr': 0.00042589267733919833, 'samples': 7533312, 'steps': 39235, 'loss/train': 1.5987120866775513} -11/07/2021 02:44:49 - INFO - __main__ - Step 39237: {'lr': 0.0004258889061930018, 'samples': 7533504, 'steps': 39236, 'loss/train': 1.6044750213623047} -11/07/2021 02:44:50 - INFO - __main__ - Step 39238: {'lr': 0.0004258851349675524, 'samples': 7533696, 'steps': 39237, 'loss/train': 1.6669312715530396} -11/07/2021 02:44:50 - INFO - __main__ - Step 39239: {'lr': 0.00042588136366285197, 'samples': 7533888, 'steps': 39238, 'loss/train': 1.5280288457870483} -11/07/2021 02:44:50 - INFO - __main__ - Step 39240: {'lr': 0.0004258775922789021, 'samples': 7534080, 'steps': 39239, 'loss/train': 1.1162550449371338} -11/07/2021 02:44:51 - INFO - __main__ - Step 39241: {'lr': 0.0004258738208157045, 'samples': 7534272, 'steps': 39240, 'loss/train': 1.8857530355453491} -11/07/2021 02:44:52 - INFO - __main__ - Step 39242: {'lr': 0.0004258700492732608, 'samples': 7534464, 'steps': 39241, 'loss/train': 1.784043312072754} -11/07/2021 02:44:52 - INFO - __main__ - Step 39243: {'lr': 0.0004258662776515728, 'samples': 7534656, 'steps': 39242, 'loss/train': 1.8259460926055908} -11/07/2021 02:44:52 - INFO - __main__ - Step 39244: {'lr': 0.00042586250595064216, 'samples': 7534848, 'steps': 39243, 'loss/train': 1.4832545518875122} -11/07/2021 02:44:53 - INFO - __main__ - Step 39245: {'lr': 0.0004258587341704706, 'samples': 7535040, 'steps': 39244, 'loss/train': 1.3301485776901245} -11/07/2021 02:44:53 - INFO - __main__ - Step 39246: {'lr': 0.00042585496231105986, 'samples': 7535232, 'steps': 39245, 'loss/train': 0.8189593553543091} -11/07/2021 02:44:54 - INFO - __main__ - Step 39247: {'lr': 0.00042585119037241156, 'samples': 7535424, 'steps': 39246, 'loss/train': 1.3747432231903076} -11/07/2021 02:44:54 - INFO - __main__ - Step 39248: {'lr': 0.00042584741835452743, 'samples': 7535616, 'steps': 39247, 'loss/train': 1.4216407537460327} -11/07/2021 02:44:55 - INFO - __main__ - Step 39249: {'lr': 0.0004258436462574091, 'samples': 7535808, 'steps': 39248, 'loss/train': 1.5498663187026978} -11/07/2021 02:44:55 - INFO - __main__ - Step 39250: {'lr': 0.0004258398740810584, 'samples': 7536000, 'steps': 39249, 'loss/train': 1.7944103479385376} -11/07/2021 02:44:55 - INFO - __main__ - Step 39251: {'lr': 0.00042583610182547694, 'samples': 7536192, 'steps': 39250, 'loss/train': 1.286428451538086} -11/07/2021 02:44:56 - INFO - __main__ - Step 39252: {'lr': 0.0004258323294906665, 'samples': 7536384, 'steps': 39251, 'loss/train': 1.1772104501724243} -11/07/2021 02:44:57 - INFO - __main__ - Step 39253: {'lr': 0.00042582855707662864, 'samples': 7536576, 'steps': 39252, 'loss/train': 1.6651321649551392} -11/07/2021 02:44:57 - INFO - __main__ - Step 39254: {'lr': 0.00042582478458336523, 'samples': 7536768, 'steps': 39253, 'loss/train': 1.6486400365829468} -11/07/2021 02:44:57 - INFO - __main__ - Step 39255: {'lr': 0.00042582101201087786, 'samples': 7536960, 'steps': 39254, 'loss/train': 1.1267701387405396} -11/07/2021 02:44:58 - INFO - __main__ - Step 39256: {'lr': 0.00042581723935916817, 'samples': 7537152, 'steps': 39255, 'loss/train': 1.9030141830444336} -11/07/2021 02:44:59 - INFO - __main__ - Step 39257: {'lr': 0.00042581346662823804, 'samples': 7537344, 'steps': 39256, 'loss/train': 1.0102065801620483} -11/07/2021 02:44:59 - INFO - __main__ - Step 39258: {'lr': 0.00042580969381808906, 'samples': 7537536, 'steps': 39257, 'loss/train': 1.8677732944488525} -11/07/2021 02:45:00 - INFO - __main__ - Step 39259: {'lr': 0.00042580592092872295, 'samples': 7537728, 'steps': 39258, 'loss/train': 1.4082847833633423} -11/07/2021 02:45:00 - INFO - __main__ - Step 39260: {'lr': 0.0004258021479601414, 'samples': 7537920, 'steps': 39259, 'loss/train': 1.3875758647918701} -11/07/2021 02:45:00 - INFO - __main__ - Step 39261: {'lr': 0.0004257983749123461, 'samples': 7538112, 'steps': 39260, 'loss/train': 1.4950883388519287} -11/07/2021 02:45:01 - INFO - __main__ - Step 39262: {'lr': 0.00042579460178533875, 'samples': 7538304, 'steps': 39261, 'loss/train': 1.6318151950836182} -11/07/2021 02:45:02 - INFO - __main__ - Step 39263: {'lr': 0.0004257908285791211, 'samples': 7538496, 'steps': 39262, 'loss/train': 1.4447813034057617} -11/07/2021 02:45:02 - INFO - __main__ - Step 39264: {'lr': 0.00042578705529369476, 'samples': 7538688, 'steps': 39263, 'loss/train': 0.8829726576805115} -11/07/2021 02:45:03 - INFO - __main__ - Step 39265: {'lr': 0.00042578328192906153, 'samples': 7538880, 'steps': 39264, 'loss/train': 1.7114918231964111} -11/07/2021 02:45:03 - INFO - __main__ - Step 39266: {'lr': 0.00042577950848522305, 'samples': 7539072, 'steps': 39265, 'loss/train': 0.7462561130523682} -11/07/2021 02:45:03 - INFO - __main__ - Step 39267: {'lr': 0.0004257757349621811, 'samples': 7539264, 'steps': 39266, 'loss/train': 1.6467303037643433} -11/07/2021 02:45:04 - INFO - __main__ - Step 39268: {'lr': 0.0004257719613599372, 'samples': 7539456, 'steps': 39267, 'loss/train': 1.3126444816589355} -11/07/2021 02:45:05 - INFO - __main__ - Step 39269: {'lr': 0.0004257681876784932, 'samples': 7539648, 'steps': 39268, 'loss/train': 1.579737663269043} -11/07/2021 02:45:05 - INFO - __main__ - Step 39270: {'lr': 0.0004257644139178508, 'samples': 7539840, 'steps': 39269, 'loss/train': 1.1076663732528687} -11/07/2021 02:45:05 - INFO - __main__ - Step 39271: {'lr': 0.0004257606400780117, 'samples': 7540032, 'steps': 39270, 'loss/train': 1.5877642631530762} -11/07/2021 02:45:06 - INFO - __main__ - Step 39272: {'lr': 0.0004257568661589775, 'samples': 7540224, 'steps': 39271, 'loss/train': 1.1899365186691284} -11/07/2021 02:45:07 - INFO - __main__ - Step 39273: {'lr': 0.00042575309216074997, 'samples': 7540416, 'steps': 39272, 'loss/train': 1.7019377946853638} -11/07/2021 02:45:07 - INFO - __main__ - Step 39274: {'lr': 0.00042574931808333095, 'samples': 7540608, 'steps': 39273, 'loss/train': 1.2056797742843628} -11/07/2021 02:45:07 - INFO - __main__ - Step 39275: {'lr': 0.0004257455439267218, 'samples': 7540800, 'steps': 39274, 'loss/train': 1.438101053237915} -11/07/2021 02:45:08 - INFO - __main__ - Step 39276: {'lr': 0.00042574176969092454, 'samples': 7540992, 'steps': 39275, 'loss/train': 1.626620888710022} -11/07/2021 02:45:08 - INFO - __main__ - Step 39277: {'lr': 0.0004257379953759407, 'samples': 7541184, 'steps': 39276, 'loss/train': 1.5642321109771729} -11/07/2021 02:45:09 - INFO - __main__ - Step 39278: {'lr': 0.00042573422098177204, 'samples': 7541376, 'steps': 39277, 'loss/train': 1.5449275970458984} -11/07/2021 02:45:09 - INFO - __main__ - Step 39279: {'lr': 0.0004257304465084203, 'samples': 7541568, 'steps': 39278, 'loss/train': 1.7904508113861084} -11/07/2021 02:45:10 - INFO - __main__ - Step 39280: {'lr': 0.0004257266719558871, 'samples': 7541760, 'steps': 39279, 'loss/train': 1.0784425735473633} -11/07/2021 02:45:10 - INFO - __main__ - Step 39281: {'lr': 0.0004257228973241741, 'samples': 7541952, 'steps': 39280, 'loss/train': 1.1655843257904053} -11/07/2021 02:45:10 - INFO - __main__ - Step 39282: {'lr': 0.00042571912261328315, 'samples': 7542144, 'steps': 39281, 'loss/train': 1.0028207302093506} -11/07/2021 02:45:11 - INFO - __main__ - Step 39283: {'lr': 0.00042571534782321593, 'samples': 7542336, 'steps': 39282, 'loss/train': 1.4070467948913574} -11/07/2021 02:45:12 - INFO - __main__ - Step 39284: {'lr': 0.000425711572953974, 'samples': 7542528, 'steps': 39283, 'loss/train': 1.9504486322402954} -11/07/2021 02:45:12 - INFO - __main__ - Step 39285: {'lr': 0.00042570779800555914, 'samples': 7542720, 'steps': 39284, 'loss/train': 1.4157495498657227} -11/07/2021 02:45:13 - INFO - __main__ - Step 39286: {'lr': 0.00042570402297797304, 'samples': 7542912, 'steps': 39285, 'loss/train': 1.3681554794311523} -11/07/2021 02:45:13 - INFO - __main__ - Step 39287: {'lr': 0.0004257002478712175, 'samples': 7543104, 'steps': 39286, 'loss/train': 1.1086269617080688} -11/07/2021 02:45:13 - INFO - __main__ - Step 39288: {'lr': 0.0004256964726852941, 'samples': 7543296, 'steps': 39287, 'loss/train': 0.5984827280044556} -11/07/2021 02:45:14 - INFO - __main__ - Step 39289: {'lr': 0.0004256926974202046, 'samples': 7543488, 'steps': 39288, 'loss/train': 1.4696334600448608} -11/07/2021 02:45:15 - INFO - __main__ - Step 39290: {'lr': 0.00042568892207595066, 'samples': 7543680, 'steps': 39289, 'loss/train': 1.3621699810028076} -11/07/2021 02:45:15 - INFO - __main__ - Step 39291: {'lr': 0.000425685146652534, 'samples': 7543872, 'steps': 39290, 'loss/train': 1.0785452127456665} -11/07/2021 02:45:16 - INFO - __main__ - Step 39292: {'lr': 0.00042568137114995633, 'samples': 7544064, 'steps': 39291, 'loss/train': 1.7251018285751343} -11/07/2021 02:45:16 - INFO - __main__ - Step 39293: {'lr': 0.00042567759556821937, 'samples': 7544256, 'steps': 39292, 'loss/train': 1.6907563209533691} -11/07/2021 02:45:17 - INFO - __main__ - Step 39294: {'lr': 0.00042567381990732476, 'samples': 7544448, 'steps': 39293, 'loss/train': 1.4064091444015503} -11/07/2021 02:45:17 - INFO - __main__ - Step 39295: {'lr': 0.0004256700441672743, 'samples': 7544640, 'steps': 39294, 'loss/train': 1.557332992553711} -11/07/2021 02:45:18 - INFO - __main__ - Step 39296: {'lr': 0.0004256662683480695, 'samples': 7544832, 'steps': 39295, 'loss/train': 1.9215407371520996} -11/07/2021 02:45:18 - INFO - __main__ - Step 39297: {'lr': 0.00042566249244971235, 'samples': 7545024, 'steps': 39296, 'loss/train': 1.4755570888519287} -11/07/2021 02:45:18 - INFO - __main__ - Step 39298: {'lr': 0.0004256587164722043, 'samples': 7545216, 'steps': 39297, 'loss/train': 0.8738113045692444} -11/07/2021 02:45:19 - INFO - __main__ - Step 39299: {'lr': 0.0004256549404155471, 'samples': 7545408, 'steps': 39298, 'loss/train': 1.4364068508148193} -11/07/2021 02:45:20 - INFO - __main__ - Step 39300: {'lr': 0.0004256511642797426, 'samples': 7545600, 'steps': 39299, 'loss/train': 1.5300726890563965} -11/07/2021 02:45:20 - INFO - __main__ - Step 39301: {'lr': 0.0004256473880647923, 'samples': 7545792, 'steps': 39300, 'loss/train': 0.16604219377040863} -11/07/2021 02:45:20 - INFO - __main__ - Step 39302: {'lr': 0.0004256436117706981, 'samples': 7545984, 'steps': 39301, 'loss/train': 0.8302720189094543} -11/07/2021 02:45:21 - INFO - __main__ - Step 39303: {'lr': 0.0004256398353974615, 'samples': 7546176, 'steps': 39302, 'loss/train': 0.9688646197319031} -11/07/2021 02:45:22 - INFO - __main__ - Step 39304: {'lr': 0.00042563605894508434, 'samples': 7546368, 'steps': 39303, 'loss/train': 1.3211116790771484} -11/07/2021 02:45:22 - INFO - __main__ - Step 39305: {'lr': 0.00042563228241356834, 'samples': 7546560, 'steps': 39304, 'loss/train': 2.016324520111084} -11/07/2021 02:45:22 - INFO - __main__ - Step 39306: {'lr': 0.000425628505802915, 'samples': 7546752, 'steps': 39305, 'loss/train': 0.9035109877586365} -11/07/2021 02:45:23 - INFO - __main__ - Step 39307: {'lr': 0.0004256247291131263, 'samples': 7546944, 'steps': 39306, 'loss/train': 1.6596336364746094} -11/07/2021 02:45:23 - INFO - __main__ - Step 39308: {'lr': 0.00042562095234420375, 'samples': 7547136, 'steps': 39307, 'loss/train': 1.361107349395752} -11/07/2021 02:45:24 - INFO - __main__ - Step 39309: {'lr': 0.00042561717549614907, 'samples': 7547328, 'steps': 39308, 'loss/train': 1.4581472873687744} -11/07/2021 02:45:24 - INFO - __main__ - Step 39310: {'lr': 0.0004256133985689641, 'samples': 7547520, 'steps': 39309, 'loss/train': 1.205946445465088} -11/07/2021 02:45:25 - INFO - __main__ - Step 39311: {'lr': 0.0004256096215626504, 'samples': 7547712, 'steps': 39310, 'loss/train': 1.3667376041412354} -11/07/2021 02:45:25 - INFO - __main__ - Step 39312: {'lr': 0.0004256058444772097, 'samples': 7547904, 'steps': 39311, 'loss/train': 1.536171317100525} -11/07/2021 02:45:25 - INFO - __main__ - Step 39313: {'lr': 0.0004256020673126437, 'samples': 7548096, 'steps': 39312, 'loss/train': 1.3614702224731445} -11/07/2021 02:45:27 - INFO - __main__ - Step 39314: {'lr': 0.0004255982900689541, 'samples': 7548288, 'steps': 39313, 'loss/train': 1.150659441947937} -11/07/2021 02:45:27 - INFO - __main__ - Step 39315: {'lr': 0.0004255945127461427, 'samples': 7548480, 'steps': 39314, 'loss/train': 1.6493338346481323} -11/07/2021 02:45:27 - INFO - __main__ - Step 39316: {'lr': 0.00042559073534421114, 'samples': 7548672, 'steps': 39315, 'loss/train': 1.3953452110290527} -11/07/2021 02:45:28 - INFO - __main__ - Step 39317: {'lr': 0.00042558695786316106, 'samples': 7548864, 'steps': 39316, 'loss/train': 1.6797736883163452} -11/07/2021 02:45:28 - INFO - __main__ - Step 39318: {'lr': 0.00042558318030299415, 'samples': 7549056, 'steps': 39317, 'loss/train': 1.3615410327911377} -11/07/2021 02:45:28 - INFO - __main__ - Step 39319: {'lr': 0.0004255794026637122, 'samples': 7549248, 'steps': 39318, 'loss/train': 3.0827596187591553} -11/07/2021 02:45:29 - INFO - __main__ - Step 39320: {'lr': 0.0004255756249453169, 'samples': 7549440, 'steps': 39319, 'loss/train': 1.328766107559204} -11/07/2021 02:45:30 - INFO - __main__ - Step 39321: {'lr': 0.00042557184714780993, 'samples': 7549632, 'steps': 39320, 'loss/train': 1.630851149559021} -11/07/2021 02:45:30 - INFO - __main__ - Step 39322: {'lr': 0.000425568069271193, 'samples': 7549824, 'steps': 39321, 'loss/train': 1.5530668497085571} -11/07/2021 02:45:30 - INFO - __main__ - Step 39323: {'lr': 0.00042556429131546775, 'samples': 7550016, 'steps': 39322, 'loss/train': 1.649032711982727} -11/07/2021 02:45:31 - INFO - __main__ - Step 39324: {'lr': 0.000425560513280636, 'samples': 7550208, 'steps': 39323, 'loss/train': 1.1001230478286743} -11/07/2021 02:45:32 - INFO - __main__ - Step 39325: {'lr': 0.00042555673516669933, 'samples': 7550400, 'steps': 39324, 'loss/train': 1.2240439653396606} -11/07/2021 02:45:32 - INFO - __main__ - Step 39326: {'lr': 0.0004255529569736596, 'samples': 7550592, 'steps': 39325, 'loss/train': 1.6975648403167725} -11/07/2021 02:45:33 - INFO - __main__ - Step 39327: {'lr': 0.0004255491787015183, 'samples': 7550784, 'steps': 39326, 'loss/train': 1.6072126626968384} -11/07/2021 02:45:33 - INFO - __main__ - Step 39328: {'lr': 0.0004255454003502774, 'samples': 7550976, 'steps': 39327, 'loss/train': 1.4416260719299316} -11/07/2021 02:45:33 - INFO - __main__ - Step 39329: {'lr': 0.0004255416219199384, 'samples': 7551168, 'steps': 39328, 'loss/train': 1.4229910373687744} -11/07/2021 02:45:34 - INFO - __main__ - Step 39330: {'lr': 0.0004255378434105029, 'samples': 7551360, 'steps': 39329, 'loss/train': 0.758528470993042} -11/07/2021 02:45:35 - INFO - __main__ - Step 39331: {'lr': 0.00042553406482197297, 'samples': 7551552, 'steps': 39330, 'loss/train': 2.1144182682037354} -11/07/2021 02:45:35 - INFO - __main__ - Step 39332: {'lr': 0.00042553028615434997, 'samples': 7551744, 'steps': 39331, 'loss/train': 1.465710997581482} -11/07/2021 02:45:35 - INFO - __main__ - Step 39333: {'lr': 0.0004255265074076358, 'samples': 7551936, 'steps': 39332, 'loss/train': 0.8778195381164551} -11/07/2021 02:45:36 - INFO - __main__ - Step 39334: {'lr': 0.00042552272858183203, 'samples': 7552128, 'steps': 39333, 'loss/train': 1.2574025392532349} -11/07/2021 02:45:37 - INFO - __main__ - Step 39335: {'lr': 0.0004255189496769405, 'samples': 7552320, 'steps': 39334, 'loss/train': 1.6069217920303345} -11/07/2021 02:45:38 - INFO - __main__ - Step 39336: {'lr': 0.00042551517069296276, 'samples': 7552512, 'steps': 39335, 'loss/train': 1.5512158870697021} -11/07/2021 02:45:38 - INFO - __main__ - Step 39337: {'lr': 0.00042551139162990065, 'samples': 7552704, 'steps': 39336, 'loss/train': 1.6924312114715576} -11/07/2021 02:45:38 - INFO - __main__ - Step 39338: {'lr': 0.0004255076124877558, 'samples': 7552896, 'steps': 39337, 'loss/train': 1.810476541519165} -11/07/2021 02:45:39 - INFO - __main__ - Step 39339: {'lr': 0.0004255038332665299, 'samples': 7553088, 'steps': 39338, 'loss/train': 1.5786186456680298} -11/07/2021 02:45:39 - INFO - __main__ - Step 39340: {'lr': 0.0004255000539662247, 'samples': 7553280, 'steps': 39339, 'loss/train': 1.684509038925171} -11/07/2021 02:45:40 - INFO - __main__ - Step 39341: {'lr': 0.0004254962745868419, 'samples': 7553472, 'steps': 39340, 'loss/train': 0.9445256590843201} -11/07/2021 02:45:40 - INFO - __main__ - Step 39342: {'lr': 0.00042549249512838325, 'samples': 7553664, 'steps': 39341, 'loss/train': 1.8878004550933838} -11/07/2021 02:45:41 - INFO - __main__ - Step 39343: {'lr': 0.00042548871559085026, 'samples': 7553856, 'steps': 39342, 'loss/train': 1.388020634651184} -11/07/2021 02:45:41 - INFO - __main__ - Step 39344: {'lr': 0.0004254849359742449, 'samples': 7554048, 'steps': 39343, 'loss/train': 1.0768413543701172} -11/07/2021 02:45:41 - INFO - __main__ - Step 39345: {'lr': 0.0004254811562785686, 'samples': 7554240, 'steps': 39344, 'loss/train': 1.4457755088806152} -11/07/2021 02:45:42 - INFO - __main__ - Step 39346: {'lr': 0.00042547737650382324, 'samples': 7554432, 'steps': 39345, 'loss/train': 1.4694263935089111} -11/07/2021 02:45:43 - INFO - __main__ - Step 39347: {'lr': 0.0004254735966500105, 'samples': 7554624, 'steps': 39346, 'loss/train': 1.3930296897888184} -11/07/2021 02:45:43 - INFO - __main__ - Step 39348: {'lr': 0.00042546981671713206, 'samples': 7554816, 'steps': 39347, 'loss/train': 0.8317453265190125} -11/07/2021 02:45:44 - INFO - __main__ - Step 39349: {'lr': 0.0004254660367051896, 'samples': 7555008, 'steps': 39348, 'loss/train': 1.5087776184082031} -11/07/2021 02:45:44 - INFO - __main__ - Step 39350: {'lr': 0.0004254622566141849, 'samples': 7555200, 'steps': 39349, 'loss/train': 1.4444903135299683} -11/07/2021 02:45:44 - INFO - __main__ - Step 39351: {'lr': 0.0004254584764441196, 'samples': 7555392, 'steps': 39350, 'loss/train': 1.4392361640930176} -11/07/2021 02:45:45 - INFO - __main__ - Step 39352: {'lr': 0.00042545469619499545, 'samples': 7555584, 'steps': 39351, 'loss/train': 1.4138058423995972} -11/07/2021 02:45:46 - INFO - __main__ - Step 39353: {'lr': 0.00042545091586681404, 'samples': 7555776, 'steps': 39352, 'loss/train': 1.6890608072280884} -11/07/2021 02:45:46 - INFO - __main__ - Step 39354: {'lr': 0.0004254471354595772, 'samples': 7555968, 'steps': 39353, 'loss/train': 1.4956886768341064} -11/07/2021 02:45:46 - INFO - __main__ - Step 39355: {'lr': 0.0004254433549732866, 'samples': 7556160, 'steps': 39354, 'loss/train': 1.7300609350204468} -11/07/2021 02:45:47 - INFO - __main__ - Step 39356: {'lr': 0.0004254395744079439, 'samples': 7556352, 'steps': 39355, 'loss/train': 1.515649676322937} -11/07/2021 02:45:48 - INFO - __main__ - Step 39357: {'lr': 0.0004254357937635509, 'samples': 7556544, 'steps': 39356, 'loss/train': 1.8868955373764038} -11/07/2021 02:45:48 - INFO - __main__ - Step 39358: {'lr': 0.00042543201304010914, 'samples': 7556736, 'steps': 39357, 'loss/train': 0.9736785292625427} -11/07/2021 02:45:48 - INFO - __main__ - Step 39359: {'lr': 0.0004254282322376205, 'samples': 7556928, 'steps': 39358, 'loss/train': 0.7911121845245361} -11/07/2021 02:45:49 - INFO - __main__ - Step 39360: {'lr': 0.0004254244513560866, 'samples': 7557120, 'steps': 39359, 'loss/train': 1.9326436519622803} -11/07/2021 02:45:49 - INFO - __main__ - Step 39361: {'lr': 0.00042542067039550916, 'samples': 7557312, 'steps': 39360, 'loss/train': 1.9013553857803345} -11/07/2021 02:45:50 - INFO - __main__ - Step 39362: {'lr': 0.00042541688935588984, 'samples': 7557504, 'steps': 39361, 'loss/train': 0.8181159496307373} -11/07/2021 02:45:50 - INFO - __main__ - Step 39363: {'lr': 0.00042541310823723035, 'samples': 7557696, 'steps': 39362, 'loss/train': 1.1350655555725098} -11/07/2021 02:45:51 - INFO - __main__ - Step 39364: {'lr': 0.00042540932703953246, 'samples': 7557888, 'steps': 39363, 'loss/train': 1.395199179649353} -11/07/2021 02:45:51 - INFO - __main__ - Step 39365: {'lr': 0.00042540554576279776, 'samples': 7558080, 'steps': 39364, 'loss/train': 1.6894145011901855} -11/07/2021 02:45:51 - INFO - __main__ - Step 39366: {'lr': 0.0004254017644070282, 'samples': 7558272, 'steps': 39365, 'loss/train': 1.7289868593215942} -11/07/2021 02:45:53 - INFO - __main__ - Step 39367: {'lr': 0.0004253979829722251, 'samples': 7558464, 'steps': 39366, 'loss/train': 1.5356981754302979} -11/07/2021 02:45:53 - INFO - __main__ - Step 39368: {'lr': 0.00042539420145839055, 'samples': 7558656, 'steps': 39367, 'loss/train': 0.863486111164093} -11/07/2021 02:45:53 - INFO - __main__ - Step 39369: {'lr': 0.00042539041986552596, 'samples': 7558848, 'steps': 39368, 'loss/train': 1.0760917663574219} -11/07/2021 02:45:54 - INFO - __main__ - Step 39370: {'lr': 0.00042538663819363323, 'samples': 7559040, 'steps': 39369, 'loss/train': 1.4790570735931396} -11/07/2021 02:45:54 - INFO - __main__ - Step 39371: {'lr': 0.000425382856442714, 'samples': 7559232, 'steps': 39370, 'loss/train': 1.5317871570587158} -11/07/2021 02:45:54 - INFO - __main__ - Step 39372: {'lr': 0.0004253790746127699, 'samples': 7559424, 'steps': 39371, 'loss/train': 1.7790511846542358} -11/07/2021 02:45:55 - INFO - __main__ - Step 39373: {'lr': 0.0004253752927038027, 'samples': 7559616, 'steps': 39372, 'loss/train': 1.676537036895752} -11/07/2021 02:45:56 - INFO - __main__ - Step 39374: {'lr': 0.0004253715107158141, 'samples': 7559808, 'steps': 39373, 'loss/train': 1.566117286682129} -11/07/2021 02:45:56 - INFO - __main__ - Step 39375: {'lr': 0.0004253677286488058, 'samples': 7560000, 'steps': 39374, 'loss/train': 1.004982352256775} -11/07/2021 02:45:56 - INFO - __main__ - Step 39376: {'lr': 0.00042536394650277953, 'samples': 7560192, 'steps': 39375, 'loss/train': 1.3873460292816162} -11/07/2021 02:45:57 - INFO - __main__ - Step 39377: {'lr': 0.000425360164277737, 'samples': 7560384, 'steps': 39376, 'loss/train': 1.6033751964569092} -11/07/2021 02:45:58 - INFO - __main__ - Step 39378: {'lr': 0.00042535638197367984, 'samples': 7560576, 'steps': 39377, 'loss/train': 1.3536235094070435} -11/07/2021 02:45:58 - INFO - __main__ - Step 39379: {'lr': 0.0004253525995906098, 'samples': 7560768, 'steps': 39378, 'loss/train': 1.5641216039657593} -11/07/2021 02:45:58 - INFO - __main__ - Step 39380: {'lr': 0.00042534881712852856, 'samples': 7560960, 'steps': 39379, 'loss/train': 1.5420782566070557} -11/07/2021 02:45:59 - INFO - __main__ - Step 39381: {'lr': 0.0004253450345874379, 'samples': 7561152, 'steps': 39380, 'loss/train': 1.4883129596710205} -11/07/2021 02:45:59 - INFO - __main__ - Step 39382: {'lr': 0.00042534125196733955, 'samples': 7561344, 'steps': 39381, 'loss/train': 1.754917860031128} -11/07/2021 02:46:00 - INFO - __main__ - Step 39383: {'lr': 0.000425337469268235, 'samples': 7561536, 'steps': 39382, 'loss/train': 1.8359870910644531} -11/07/2021 02:46:01 - INFO - __main__ - Step 39384: {'lr': 0.00042533368649012615, 'samples': 7561728, 'steps': 39383, 'loss/train': 1.5123169422149658} -11/07/2021 02:46:01 - INFO - __main__ - Step 39385: {'lr': 0.0004253299036330146, 'samples': 7561920, 'steps': 39384, 'loss/train': 1.6789470911026} -11/07/2021 02:46:01 - INFO - __main__ - Step 39386: {'lr': 0.00042532612069690214, 'samples': 7562112, 'steps': 39385, 'loss/train': 1.331007719039917} -11/07/2021 02:46:02 - INFO - __main__ - Step 39387: {'lr': 0.0004253223376817904, 'samples': 7562304, 'steps': 39386, 'loss/train': 1.7500447034835815} -11/07/2021 02:46:03 - INFO - __main__ - Step 39388: {'lr': 0.0004253185545876812, 'samples': 7562496, 'steps': 39387, 'loss/train': 1.3423337936401367} -11/07/2021 02:46:03 - INFO - __main__ - Step 39389: {'lr': 0.0004253147714145761, 'samples': 7562688, 'steps': 39388, 'loss/train': 1.7974839210510254} -11/07/2021 02:46:03 - INFO - __main__ - Step 39390: {'lr': 0.00042531098816247695, 'samples': 7562880, 'steps': 39389, 'loss/train': 1.8890057802200317} -11/07/2021 02:46:04 - INFO - __main__ - Step 39391: {'lr': 0.00042530720483138524, 'samples': 7563072, 'steps': 39390, 'loss/train': 0.7283228635787964} -11/07/2021 02:46:04 - INFO - __main__ - Step 39392: {'lr': 0.00042530342142130283, 'samples': 7563264, 'steps': 39391, 'loss/train': 1.046333909034729} -11/07/2021 02:46:05 - INFO - __main__ - Step 39393: {'lr': 0.0004252996379322315, 'samples': 7563456, 'steps': 39392, 'loss/train': 1.3759727478027344} -11/07/2021 02:46:06 - INFO - __main__ - Step 39394: {'lr': 0.0004252958543641728, 'samples': 7563648, 'steps': 39393, 'loss/train': 1.343981146812439} -11/07/2021 02:46:06 - INFO - __main__ - Step 39395: {'lr': 0.0004252920707171285, 'samples': 7563840, 'steps': 39394, 'loss/train': 1.5883010625839233} -11/07/2021 02:46:06 - INFO - __main__ - Step 39396: {'lr': 0.00042528828699110033, 'samples': 7564032, 'steps': 39395, 'loss/train': 1.370940089225769} -11/07/2021 02:46:07 - INFO - __main__ - Step 39397: {'lr': 0.0004252845031860899, 'samples': 7564224, 'steps': 39396, 'loss/train': 1.7147272825241089} -11/07/2021 02:46:07 - INFO - __main__ - Step 39398: {'lr': 0.000425280719302099, 'samples': 7564416, 'steps': 39397, 'loss/train': 1.6413315534591675} -11/07/2021 02:46:08 - INFO - __main__ - Step 39399: {'lr': 0.0004252769353391294, 'samples': 7564608, 'steps': 39398, 'loss/train': 0.9206255078315735} -11/07/2021 02:46:08 - INFO - __main__ - Step 39400: {'lr': 0.00042527315129718257, 'samples': 7564800, 'steps': 39399, 'loss/train': 1.7017139196395874} -11/07/2021 02:46:09 - INFO - __main__ - Step 39401: {'lr': 0.00042526936717626046, 'samples': 7564992, 'steps': 39400, 'loss/train': 1.9394193887710571} -11/07/2021 02:46:09 - INFO - __main__ - Step 39402: {'lr': 0.00042526558297636464, 'samples': 7565184, 'steps': 39401, 'loss/train': 1.4708151817321777} -11/07/2021 02:46:09 - INFO - __main__ - Step 39403: {'lr': 0.0004252617986974969, 'samples': 7565376, 'steps': 39402, 'loss/train': 0.9733449816703796} -11/07/2021 02:46:10 - INFO - __main__ - Step 39404: {'lr': 0.00042525801433965883, 'samples': 7565568, 'steps': 39403, 'loss/train': 1.8433624505996704} -11/07/2021 02:46:11 - INFO - __main__ - Step 39405: {'lr': 0.00042525422990285225, 'samples': 7565760, 'steps': 39404, 'loss/train': 1.5334631204605103} -11/07/2021 02:46:11 - INFO - __main__ - Step 39406: {'lr': 0.0004252504453870788, 'samples': 7565952, 'steps': 39405, 'loss/train': 1.3392281532287598} -11/07/2021 02:46:11 - INFO - __main__ - Step 39407: {'lr': 0.0004252466607923402, 'samples': 7566144, 'steps': 39406, 'loss/train': 1.5809663534164429} -11/07/2021 02:46:12 - INFO - __main__ - Step 39408: {'lr': 0.0004252428761186382, 'samples': 7566336, 'steps': 39407, 'loss/train': 2.1655049324035645} -11/07/2021 02:46:13 - INFO - __main__ - Step 39409: {'lr': 0.0004252390913659744, 'samples': 7566528, 'steps': 39408, 'loss/train': 1.7455583810806274} -11/07/2021 02:46:13 - INFO - __main__ - Step 39410: {'lr': 0.0004252353065343506, 'samples': 7566720, 'steps': 39409, 'loss/train': 0.2890855371952057} -11/07/2021 02:46:14 - INFO - __main__ - Step 39411: {'lr': 0.0004252315216237684, 'samples': 7566912, 'steps': 39410, 'loss/train': 1.478803277015686} -11/07/2021 02:46:14 - INFO - __main__ - Step 39412: {'lr': 0.00042522773663422977, 'samples': 7567104, 'steps': 39411, 'loss/train': 1.7798511981964111} -11/07/2021 02:46:14 - INFO - __main__ - Step 39413: {'lr': 0.000425223951565736, 'samples': 7567296, 'steps': 39412, 'loss/train': 1.5644084215164185} -11/07/2021 02:46:16 - INFO - __main__ - Step 39414: {'lr': 0.0004252201664182892, 'samples': 7567488, 'steps': 39413, 'loss/train': 1.9910378456115723} -11/07/2021 02:46:16 - INFO - __main__ - Step 39415: {'lr': 0.0004252163811918909, 'samples': 7567680, 'steps': 39414, 'loss/train': 1.361193060874939} -11/07/2021 02:46:16 - INFO - __main__ - Step 39416: {'lr': 0.00042521259588654264, 'samples': 7567872, 'steps': 39415, 'loss/train': 1.2348101139068604} -11/07/2021 02:46:17 - INFO - __main__ - Step 39417: {'lr': 0.00042520881050224637, 'samples': 7568064, 'steps': 39416, 'loss/train': 1.742704153060913} -11/07/2021 02:46:17 - INFO - __main__ - Step 39418: {'lr': 0.0004252050250390037, 'samples': 7568256, 'steps': 39417, 'loss/train': 1.4445207118988037} -11/07/2021 02:46:17 - INFO - __main__ - Step 39419: {'lr': 0.0004252012394968164, 'samples': 7568448, 'steps': 39418, 'loss/train': 1.140768051147461} -11/07/2021 02:46:18 - INFO - __main__ - Step 39420: {'lr': 0.0004251974538756861, 'samples': 7568640, 'steps': 39419, 'loss/train': 1.236556887626648} -11/07/2021 02:46:19 - INFO - __main__ - Step 39421: {'lr': 0.00042519366817561453, 'samples': 7568832, 'steps': 39420, 'loss/train': 1.6497478485107422} -11/07/2021 02:46:19 - INFO - __main__ - Step 39422: {'lr': 0.0004251898823966034, 'samples': 7569024, 'steps': 39421, 'loss/train': 1.5852000713348389} -11/07/2021 02:46:19 - INFO - __main__ - Step 39423: {'lr': 0.00042518609653865444, 'samples': 7569216, 'steps': 39422, 'loss/train': 1.822353720664978} -11/07/2021 02:46:20 - INFO - __main__ - Step 39424: {'lr': 0.00042518231060176926, 'samples': 7569408, 'steps': 39423, 'loss/train': 1.4493063688278198} -11/07/2021 02:46:21 - INFO - __main__ - Step 39425: {'lr': 0.00042517852458594967, 'samples': 7569600, 'steps': 39424, 'loss/train': 1.5626758337020874} -11/07/2021 02:46:21 - INFO - __main__ - Step 39426: {'lr': 0.00042517473849119734, 'samples': 7569792, 'steps': 39425, 'loss/train': 1.4561035633087158} -11/07/2021 02:46:21 - INFO - __main__ - Step 39427: {'lr': 0.000425170952317514, 'samples': 7569984, 'steps': 39426, 'loss/train': 1.5167341232299805} -11/07/2021 02:46:22 - INFO - __main__ - Step 39428: {'lr': 0.0004251671660649013, 'samples': 7570176, 'steps': 39427, 'loss/train': 1.613086223602295} -11/07/2021 02:46:22 - INFO - __main__ - Step 39429: {'lr': 0.000425163379733361, 'samples': 7570368, 'steps': 39428, 'loss/train': 1.4827110767364502} -11/07/2021 02:46:23 - INFO - __main__ - Step 39430: {'lr': 0.00042515959332289476, 'samples': 7570560, 'steps': 39429, 'loss/train': 1.8132240772247314} -11/07/2021 02:46:24 - INFO - __main__ - Step 39431: {'lr': 0.0004251558068335043, 'samples': 7570752, 'steps': 39430, 'loss/train': 1.5489274263381958} -11/07/2021 02:46:24 - INFO - __main__ - Step 39432: {'lr': 0.00042515202026519136, 'samples': 7570944, 'steps': 39431, 'loss/train': 1.3465017080307007} -11/07/2021 02:46:24 - INFO - __main__ - Step 39433: {'lr': 0.00042514823361795764, 'samples': 7571136, 'steps': 39432, 'loss/train': 0.7617422938346863} -11/07/2021 02:46:25 - INFO - __main__ - Step 39434: {'lr': 0.0004251444468918048, 'samples': 7571328, 'steps': 39433, 'loss/train': 1.3461247682571411} -11/07/2021 02:46:26 - INFO - __main__ - Step 39435: {'lr': 0.0004251406600867346, 'samples': 7571520, 'steps': 39434, 'loss/train': 0.49319687485694885} -11/07/2021 02:46:26 - INFO - __main__ - Step 39436: {'lr': 0.00042513687320274866, 'samples': 7571712, 'steps': 39435, 'loss/train': 1.7188775539398193} -11/07/2021 02:46:26 - INFO - __main__ - Step 39437: {'lr': 0.0004251330862398488, 'samples': 7571904, 'steps': 39436, 'loss/train': 1.560532569885254} -11/07/2021 02:46:27 - INFO - __main__ - Step 39438: {'lr': 0.0004251292991980367, 'samples': 7572096, 'steps': 39437, 'loss/train': 1.5440956354141235} -11/07/2021 02:46:27 - INFO - __main__ - Step 39439: {'lr': 0.000425125512077314, 'samples': 7572288, 'steps': 39438, 'loss/train': 1.5055773258209229} -11/07/2021 02:46:28 - INFO - __main__ - Step 39440: {'lr': 0.00042512172487768244, 'samples': 7572480, 'steps': 39439, 'loss/train': 1.3813639879226685} -11/07/2021 02:46:29 - INFO - __main__ - Step 39441: {'lr': 0.00042511793759914375, 'samples': 7572672, 'steps': 39440, 'loss/train': 1.7512849569320679} -11/07/2021 02:46:29 - INFO - __main__ - Step 39442: {'lr': 0.0004251141502416996, 'samples': 7572864, 'steps': 39441, 'loss/train': 1.831099510192871} -11/07/2021 02:46:29 - INFO - __main__ - Step 39443: {'lr': 0.0004251103628053517, 'samples': 7573056, 'steps': 39442, 'loss/train': 1.3687280416488647} -11/07/2021 02:46:30 - INFO - __main__ - Step 39444: {'lr': 0.0004251065752901018, 'samples': 7573248, 'steps': 39443, 'loss/train': 1.537869930267334} -11/07/2021 02:46:30 - INFO - __main__ - Step 39445: {'lr': 0.0004251027876959516, 'samples': 7573440, 'steps': 39444, 'loss/train': 1.254869818687439} -11/07/2021 02:46:31 - INFO - __main__ - Step 39446: {'lr': 0.0004250990000229028, 'samples': 7573632, 'steps': 39445, 'loss/train': 0.9443804025650024} -11/07/2021 02:46:31 - INFO - __main__ - Step 39447: {'lr': 0.00042509521227095706, 'samples': 7573824, 'steps': 39446, 'loss/train': 2.0799334049224854} -11/07/2021 02:46:32 - INFO - __main__ - Step 39448: {'lr': 0.0004250914244401161, 'samples': 7574016, 'steps': 39447, 'loss/train': 1.4163551330566406} -11/07/2021 02:46:32 - INFO - __main__ - Step 39449: {'lr': 0.00042508763653038167, 'samples': 7574208, 'steps': 39448, 'loss/train': 1.785377025604248} -11/07/2021 02:46:32 - INFO - __main__ - Step 39450: {'lr': 0.0004250838485417554, 'samples': 7574400, 'steps': 39449, 'loss/train': 1.613315463066101} -11/07/2021 02:46:34 - INFO - __main__ - Step 39451: {'lr': 0.00042508006047423916, 'samples': 7574592, 'steps': 39450, 'loss/train': 0.802128255367279} -11/07/2021 02:46:34 - INFO - __main__ - Step 39452: {'lr': 0.0004250762723278344, 'samples': 7574784, 'steps': 39451, 'loss/train': 0.8597303628921509} -11/07/2021 02:46:34 - INFO - __main__ - Step 39453: {'lr': 0.00042507248410254307, 'samples': 7574976, 'steps': 39452, 'loss/train': 1.2439583539962769} -11/07/2021 02:46:35 - INFO - __main__ - Step 39454: {'lr': 0.0004250686957983668, 'samples': 7575168, 'steps': 39453, 'loss/train': 1.4560964107513428} -11/07/2021 02:46:35 - INFO - __main__ - Step 39455: {'lr': 0.00042506490741530724, 'samples': 7575360, 'steps': 39454, 'loss/train': 1.489845633506775} -11/07/2021 02:46:36 - INFO - __main__ - Step 39456: {'lr': 0.00042506111895336616, 'samples': 7575552, 'steps': 39455, 'loss/train': 1.9019747972488403} -11/07/2021 02:46:36 - INFO - __main__ - Step 39457: {'lr': 0.00042505733041254526, 'samples': 7575744, 'steps': 39456, 'loss/train': 1.4447280168533325} -11/07/2021 02:46:37 - INFO - __main__ - Step 39458: {'lr': 0.00042505354179284615, 'samples': 7575936, 'steps': 39457, 'loss/train': 1.6310251951217651} -11/07/2021 02:46:37 - INFO - __main__ - Step 39459: {'lr': 0.00042504975309427064, 'samples': 7576128, 'steps': 39458, 'loss/train': 1.4011722803115845} -11/07/2021 02:46:37 - INFO - __main__ - Step 39460: {'lr': 0.0004250459643168204, 'samples': 7576320, 'steps': 39459, 'loss/train': 1.6884933710098267} -11/07/2021 02:46:38 - INFO - __main__ - Step 39461: {'lr': 0.0004250421754604972, 'samples': 7576512, 'steps': 39460, 'loss/train': 1.4346963167190552} -11/07/2021 02:46:39 - INFO - __main__ - Step 39462: {'lr': 0.0004250383865253027, 'samples': 7576704, 'steps': 39461, 'loss/train': 1.5717755556106567} -11/07/2021 02:46:39 - INFO - __main__ - Step 39463: {'lr': 0.00042503459751123854, 'samples': 7576896, 'steps': 39462, 'loss/train': 1.5766115188598633} -11/07/2021 02:46:39 - INFO - __main__ - Step 39464: {'lr': 0.00042503080841830654, 'samples': 7577088, 'steps': 39463, 'loss/train': 1.5276356935501099} -11/07/2021 02:46:40 - INFO - __main__ - Step 39465: {'lr': 0.0004250270192465083, 'samples': 7577280, 'steps': 39464, 'loss/train': 1.3183841705322266} -11/07/2021 02:46:41 - INFO - __main__ - Step 39466: {'lr': 0.0004250232299958456, 'samples': 7577472, 'steps': 39465, 'loss/train': 1.2871264219284058} -11/07/2021 02:46:41 - INFO - __main__ - Step 39467: {'lr': 0.0004250194406663203, 'samples': 7577664, 'steps': 39466, 'loss/train': 1.6174371242523193} -11/07/2021 02:46:42 - INFO - __main__ - Step 39468: {'lr': 0.00042501565125793375, 'samples': 7577856, 'steps': 39467, 'loss/train': 1.5066871643066406} -11/07/2021 02:46:42 - INFO - __main__ - Step 39469: {'lr': 0.0004250118617706879, 'samples': 7578048, 'steps': 39468, 'loss/train': 1.4779454469680786} -11/07/2021 02:46:42 - INFO - __main__ - Step 39470: {'lr': 0.0004250080722045844, 'samples': 7578240, 'steps': 39469, 'loss/train': 1.5967754125595093} -11/07/2021 02:46:43 - INFO - __main__ - Step 39471: {'lr': 0.000425004282559625, 'samples': 7578432, 'steps': 39470, 'loss/train': 2.041210889816284} -11/07/2021 02:46:44 - INFO - __main__ - Step 39472: {'lr': 0.0004250004928358113, 'samples': 7578624, 'steps': 39471, 'loss/train': 1.4292852878570557} -11/07/2021 02:46:44 - INFO - __main__ - Step 39473: {'lr': 0.0004249967030331451, 'samples': 7578816, 'steps': 39472, 'loss/train': 1.746503472328186} -11/07/2021 02:46:44 - INFO - __main__ - Step 39474: {'lr': 0.0004249929131516281, 'samples': 7579008, 'steps': 39473, 'loss/train': 1.8705283403396606} -11/07/2021 02:46:45 - INFO - __main__ - Step 39475: {'lr': 0.00042498912319126206, 'samples': 7579200, 'steps': 39474, 'loss/train': 1.8053672313690186} -11/07/2021 02:46:45 - INFO - __main__ - Step 39476: {'lr': 0.00042498533315204855, 'samples': 7579392, 'steps': 39475, 'loss/train': 2.0949859619140625} -11/07/2021 02:46:46 - INFO - __main__ - Step 39477: {'lr': 0.0004249815430339894, 'samples': 7579584, 'steps': 39476, 'loss/train': 0.690558135509491} -11/07/2021 02:46:46 - INFO - __main__ - Step 39478: {'lr': 0.0004249777528370862, 'samples': 7579776, 'steps': 39477, 'loss/train': 0.9026269316673279} -11/07/2021 02:46:47 - INFO - __main__ - Step 39479: {'lr': 0.00042497396256134073, 'samples': 7579968, 'steps': 39478, 'loss/train': 1.6150840520858765} -11/07/2021 02:46:47 - INFO - __main__ - Step 39480: {'lr': 0.0004249701722067547, 'samples': 7580160, 'steps': 39479, 'loss/train': 1.5659527778625488} -11/07/2021 02:46:47 - INFO - __main__ - Step 39481: {'lr': 0.0004249663817733298, 'samples': 7580352, 'steps': 39480, 'loss/train': 1.2330738306045532} -11/07/2021 02:46:48 - INFO - __main__ - Step 39482: {'lr': 0.00042496259126106786, 'samples': 7580544, 'steps': 39481, 'loss/train': 1.7414649724960327} -11/07/2021 02:46:49 - INFO - __main__ - Step 39483: {'lr': 0.0004249588006699704, 'samples': 7580736, 'steps': 39482, 'loss/train': 1.373297929763794} -11/07/2021 02:46:49 - INFO - __main__ - Step 39484: {'lr': 0.0004249550100000392, 'samples': 7580928, 'steps': 39483, 'loss/train': 1.433725357055664} -11/07/2021 02:46:50 - INFO - __main__ - Step 39485: {'lr': 0.0004249512192512759, 'samples': 7581120, 'steps': 39484, 'loss/train': 1.6692142486572266} -11/07/2021 02:46:50 - INFO - __main__ - Step 39486: {'lr': 0.0004249474284236824, 'samples': 7581312, 'steps': 39485, 'loss/train': 1.6300110816955566} -11/07/2021 02:46:51 - INFO - __main__ - Step 39487: {'lr': 0.0004249436375172602, 'samples': 7581504, 'steps': 39486, 'loss/train': 1.0745890140533447} -11/07/2021 02:46:51 - INFO - __main__ - Step 39488: {'lr': 0.0004249398465320111, 'samples': 7581696, 'steps': 39487, 'loss/train': 1.595900535583496} -11/07/2021 02:46:52 - INFO - __main__ - Step 39489: {'lr': 0.0004249360554679369, 'samples': 7581888, 'steps': 39488, 'loss/train': 1.4993693828582764} -11/07/2021 02:46:52 - INFO - __main__ - Step 39490: {'lr': 0.00042493226432503917, 'samples': 7582080, 'steps': 39489, 'loss/train': 1.0378392934799194} -11/07/2021 02:46:52 - INFO - __main__ - Step 39491: {'lr': 0.00042492847310331963, 'samples': 7582272, 'steps': 39490, 'loss/train': 1.5508944988250732} -11/07/2021 02:46:53 - INFO - __main__ - Step 39492: {'lr': 0.00042492468180278, 'samples': 7582464, 'steps': 39491, 'loss/train': 1.510115385055542} -11/07/2021 02:46:54 - INFO - __main__ - Step 39493: {'lr': 0.000424920890423422, 'samples': 7582656, 'steps': 39492, 'loss/train': 1.385694980621338} -11/07/2021 02:46:54 - INFO - __main__ - Step 39494: {'lr': 0.0004249170989652474, 'samples': 7582848, 'steps': 39493, 'loss/train': 1.5371301174163818} -11/07/2021 02:46:54 - INFO - __main__ - Step 39495: {'lr': 0.00042491330742825783, 'samples': 7583040, 'steps': 39494, 'loss/train': 1.4411581754684448} -11/07/2021 02:46:55 - INFO - __main__ - Step 39496: {'lr': 0.0004249095158124551, 'samples': 7583232, 'steps': 39495, 'loss/train': 1.6034796237945557} -11/07/2021 02:46:57 - INFO - __main__ - Step 39497: {'lr': 0.0004249057241178407, 'samples': 7583424, 'steps': 39496, 'loss/train': 1.4687601327896118} -11/07/2021 02:46:58 - INFO - __main__ - Step 39498: {'lr': 0.00042490193234441656, 'samples': 7583616, 'steps': 39497, 'loss/train': 1.361867904663086} -11/07/2021 02:46:58 - INFO - __main__ - Step 39499: {'lr': 0.00042489814049218434, 'samples': 7583808, 'steps': 39498, 'loss/train': 1.3539139032363892} -11/07/2021 02:46:58 - INFO - __main__ - Step 39500: {'lr': 0.00042489434856114565, 'samples': 7584000, 'steps': 39499, 'loss/train': 1.4942436218261719} -11/07/2021 02:46:59 - INFO - __main__ - Step 39501: {'lr': 0.00042489055655130226, 'samples': 7584192, 'steps': 39500, 'loss/train': 1.5138282775878906} -11/07/2021 02:46:59 - INFO - __main__ - Step 39502: {'lr': 0.00042488676446265596, 'samples': 7584384, 'steps': 39501, 'loss/train': 1.1894440650939941} -11/07/2021 02:46:59 - INFO - __main__ - Step 39503: {'lr': 0.00042488297229520834, 'samples': 7584576, 'steps': 39502, 'loss/train': 1.7873018980026245} -11/07/2021 02:47:00 - INFO - __main__ - Step 39504: {'lr': 0.00042487918004896117, 'samples': 7584768, 'steps': 39503, 'loss/train': 1.7786004543304443} -11/07/2021 02:47:01 - INFO - __main__ - Step 39505: {'lr': 0.0004248753877239161, 'samples': 7584960, 'steps': 39504, 'loss/train': 1.7644140720367432} -11/07/2021 02:47:01 - INFO - __main__ - Step 39506: {'lr': 0.0004248715953200749, 'samples': 7585152, 'steps': 39505, 'loss/train': 1.6513596773147583} -11/07/2021 02:47:01 - INFO - __main__ - Step 39507: {'lr': 0.00042486780283743927, 'samples': 7585344, 'steps': 39506, 'loss/train': 2.035029172897339} -11/07/2021 02:47:02 - INFO - __main__ - Step 39508: {'lr': 0.00042486401027601084, 'samples': 7585536, 'steps': 39507, 'loss/train': 1.7957890033721924} -11/07/2021 02:47:02 - INFO - __main__ - Step 39509: {'lr': 0.0004248602176357915, 'samples': 7585728, 'steps': 39508, 'loss/train': 1.3580241203308105} -11/07/2021 02:47:03 - INFO - __main__ - Step 39510: {'lr': 0.0004248564249167828, 'samples': 7585920, 'steps': 39509, 'loss/train': 1.7206439971923828} -11/07/2021 02:47:03 - INFO - __main__ - Step 39511: {'lr': 0.00042485263211898647, 'samples': 7586112, 'steps': 39510, 'loss/train': 0.794846773147583} -11/07/2021 02:47:04 - INFO - __main__ - Step 39512: {'lr': 0.00042484883924240427, 'samples': 7586304, 'steps': 39511, 'loss/train': 1.5746791362762451} -11/07/2021 02:47:04 - INFO - __main__ - Step 39513: {'lr': 0.0004248450462870378, 'samples': 7586496, 'steps': 39512, 'loss/train': 1.3140740394592285} -11/07/2021 02:47:04 - INFO - __main__ - Step 39514: {'lr': 0.0004248412532528889, 'samples': 7586688, 'steps': 39513, 'loss/train': 1.3792023658752441} -11/07/2021 02:47:05 - INFO - __main__ - Step 39515: {'lr': 0.00042483746013995924, 'samples': 7586880, 'steps': 39514, 'loss/train': 1.413406491279602} -11/07/2021 02:47:06 - INFO - __main__ - Step 39516: {'lr': 0.00042483366694825054, 'samples': 7587072, 'steps': 39515, 'loss/train': 1.7062214612960815} -11/07/2021 02:47:06 - INFO - __main__ - Step 39517: {'lr': 0.0004248298736777645, 'samples': 7587264, 'steps': 39516, 'loss/train': 1.7617663145065308} -11/07/2021 02:47:06 - INFO - __main__ - Step 39518: {'lr': 0.00042482608032850275, 'samples': 7587456, 'steps': 39517, 'loss/train': 1.4334967136383057} -11/07/2021 02:47:07 - INFO - __main__ - Step 39519: {'lr': 0.0004248222869004671, 'samples': 7587648, 'steps': 39518, 'loss/train': 1.6987298727035522} -11/07/2021 02:47:08 - INFO - __main__ - Step 39520: {'lr': 0.0004248184933936592, 'samples': 7587840, 'steps': 39519, 'loss/train': 1.8820641040802002} -11/07/2021 02:47:08 - INFO - __main__ - Step 39521: {'lr': 0.0004248146998080808, 'samples': 7588032, 'steps': 39520, 'loss/train': 1.3323283195495605} -11/07/2021 02:47:09 - INFO - __main__ - Step 39522: {'lr': 0.00042481090614373364, 'samples': 7588224, 'steps': 39521, 'loss/train': 1.578730583190918} -11/07/2021 02:47:09 - INFO - __main__ - Step 39523: {'lr': 0.00042480711240061933, 'samples': 7588416, 'steps': 39522, 'loss/train': 1.1655219793319702} -11/07/2021 02:47:09 - INFO - __main__ - Step 39524: {'lr': 0.0004248033185787397, 'samples': 7588608, 'steps': 39523, 'loss/train': 0.2873501479625702} -11/07/2021 02:47:10 - INFO - __main__ - Step 39525: {'lr': 0.00042479952467809623, 'samples': 7588800, 'steps': 39524, 'loss/train': 1.5925241708755493} -11/07/2021 02:47:11 - INFO - __main__ - Step 39526: {'lr': 0.00042479573069869095, 'samples': 7588992, 'steps': 39525, 'loss/train': 1.9888464212417603} -11/07/2021 02:47:11 - INFO - __main__ - Step 39527: {'lr': 0.0004247919366405253, 'samples': 7589184, 'steps': 39526, 'loss/train': 1.2977604866027832} -11/07/2021 02:47:11 - INFO - __main__ - Step 39528: {'lr': 0.0004247881425036012, 'samples': 7589376, 'steps': 39527, 'loss/train': 1.3489466905593872} -11/07/2021 02:47:12 - INFO - __main__ - Step 39529: {'lr': 0.00042478434828792025, 'samples': 7589568, 'steps': 39528, 'loss/train': 1.9120523929595947} -11/07/2021 02:47:12 - INFO - __main__ - Step 39530: {'lr': 0.00042478055399348415, 'samples': 7589760, 'steps': 39529, 'loss/train': 1.7055436372756958} -11/07/2021 02:47:13 - INFO - __main__ - Step 39531: {'lr': 0.0004247767596202946, 'samples': 7589952, 'steps': 39530, 'loss/train': 1.397582769393921} -11/07/2021 02:47:14 - INFO - __main__ - Step 39532: {'lr': 0.00042477296516835335, 'samples': 7590144, 'steps': 39531, 'loss/train': 1.6137359142303467} -11/07/2021 02:47:14 - INFO - __main__ - Step 39533: {'lr': 0.00042476917063766207, 'samples': 7590336, 'steps': 39532, 'loss/train': 1.2835636138916016} -11/07/2021 02:47:14 - INFO - __main__ - Step 39534: {'lr': 0.0004247653760282225, 'samples': 7590528, 'steps': 39533, 'loss/train': 1.2379640340805054} -11/07/2021 02:47:15 - INFO - __main__ - Step 39535: {'lr': 0.0004247615813400364, 'samples': 7590720, 'steps': 39534, 'loss/train': 1.3855849504470825} -11/07/2021 02:47:16 - INFO - __main__ - Step 39536: {'lr': 0.0004247577865731055, 'samples': 7590912, 'steps': 39535, 'loss/train': 1.8534126281738281} -11/07/2021 02:47:16 - INFO - __main__ - Step 39537: {'lr': 0.00042475399172743134, 'samples': 7591104, 'steps': 39536, 'loss/train': 1.2669944763183594} -11/07/2021 02:47:16 - INFO - __main__ - Step 39538: {'lr': 0.0004247501968030157, 'samples': 7591296, 'steps': 39537, 'loss/train': 1.1878610849380493} -11/07/2021 02:47:17 - INFO - __main__ - Step 39539: {'lr': 0.00042474640179986035, 'samples': 7591488, 'steps': 39538, 'loss/train': 1.5407204627990723} -11/07/2021 02:47:17 - INFO - __main__ - Step 39540: {'lr': 0.00042474260671796697, 'samples': 7591680, 'steps': 39539, 'loss/train': 1.8082916736602783} -11/07/2021 02:47:18 - INFO - __main__ - Step 39541: {'lr': 0.0004247388115573373, 'samples': 7591872, 'steps': 39540, 'loss/train': 1.6505813598632812} -11/07/2021 02:47:18 - INFO - __main__ - Step 39542: {'lr': 0.00042473501631797294, 'samples': 7592064, 'steps': 39541, 'loss/train': 1.686454176902771} -11/07/2021 02:47:19 - INFO - __main__ - Step 39543: {'lr': 0.0004247312209998758, 'samples': 7592256, 'steps': 39542, 'loss/train': 1.6812511682510376} -11/07/2021 02:47:19 - INFO - __main__ - Step 39544: {'lr': 0.00042472742560304734, 'samples': 7592448, 'steps': 39543, 'loss/train': 1.4964607954025269} -11/07/2021 02:47:19 - INFO - __main__ - Step 39545: {'lr': 0.00042472363012748947, 'samples': 7592640, 'steps': 39544, 'loss/train': 1.4741764068603516} -11/07/2021 02:47:21 - INFO - __main__ - Step 39546: {'lr': 0.00042471983457320384, 'samples': 7592832, 'steps': 39545, 'loss/train': 0.9633825421333313} -11/07/2021 02:47:21 - INFO - __main__ - Step 39547: {'lr': 0.00042471603894019206, 'samples': 7593024, 'steps': 39546, 'loss/train': 1.115648865699768} -11/07/2021 02:47:21 - INFO - __main__ - Step 39548: {'lr': 0.00042471224322845603, 'samples': 7593216, 'steps': 39547, 'loss/train': 1.6646112203598022} -11/07/2021 02:47:22 - INFO - __main__ - Step 39549: {'lr': 0.00042470844743799734, 'samples': 7593408, 'steps': 39548, 'loss/train': 1.172352910041809} -11/07/2021 02:47:22 - INFO - __main__ - Step 39550: {'lr': 0.00042470465156881765, 'samples': 7593600, 'steps': 39549, 'loss/train': 1.7505109310150146} -11/07/2021 02:47:23 - INFO - __main__ - Step 39551: {'lr': 0.00042470085562091887, 'samples': 7593792, 'steps': 39550, 'loss/train': 0.6108179092407227} -11/07/2021 02:47:23 - INFO - __main__ - Step 39552: {'lr': 0.0004246970595943025, 'samples': 7593984, 'steps': 39551, 'loss/train': 1.7491813898086548} -11/07/2021 02:47:24 - INFO - __main__ - Step 39553: {'lr': 0.0004246932634889703, 'samples': 7594176, 'steps': 39552, 'loss/train': 1.6450272798538208} -11/07/2021 02:47:24 - INFO - __main__ - Step 39554: {'lr': 0.00042468946730492404, 'samples': 7594368, 'steps': 39553, 'loss/train': 1.6657792329788208} -11/07/2021 02:47:24 - INFO - __main__ - Step 39555: {'lr': 0.00042468567104216536, 'samples': 7594560, 'steps': 39554, 'loss/train': 1.3390445709228516} -11/07/2021 02:47:25 - INFO - __main__ - Step 39556: {'lr': 0.0004246818747006961, 'samples': 7594752, 'steps': 39555, 'loss/train': 0.4458675682544708} -11/07/2021 02:47:26 - INFO - __main__ - Step 39557: {'lr': 0.00042467807828051787, 'samples': 7594944, 'steps': 39556, 'loss/train': 0.5895477533340454} -11/07/2021 02:47:26 - INFO - __main__ - Step 39558: {'lr': 0.0004246742817816323, 'samples': 7595136, 'steps': 39557, 'loss/train': 1.8787654638290405} -11/07/2021 02:47:27 - INFO - __main__ - Step 39559: {'lr': 0.00042467048520404126, 'samples': 7595328, 'steps': 39558, 'loss/train': 1.1775028705596924} -11/07/2021 02:47:27 - INFO - __main__ - Step 39560: {'lr': 0.00042466668854774636, 'samples': 7595520, 'steps': 39559, 'loss/train': 1.6932798624038696} -11/07/2021 02:47:27 - INFO - __main__ - Step 39561: {'lr': 0.00042466289181274943, 'samples': 7595712, 'steps': 39560, 'loss/train': 2.1152291297912598} -11/07/2021 02:47:28 - INFO - __main__ - Step 39562: {'lr': 0.00042465909499905206, 'samples': 7595904, 'steps': 39561, 'loss/train': 1.601305603981018} -11/07/2021 02:47:29 - INFO - __main__ - Step 39563: {'lr': 0.0004246552981066559, 'samples': 7596096, 'steps': 39562, 'loss/train': 1.5690134763717651} -11/07/2021 02:47:29 - INFO - __main__ - Step 39564: {'lr': 0.0004246515011355629, 'samples': 7596288, 'steps': 39563, 'loss/train': 1.7379307746887207} -11/07/2021 02:47:29 - INFO - __main__ - Step 39565: {'lr': 0.0004246477040857746, 'samples': 7596480, 'steps': 39564, 'loss/train': 1.4712262153625488} -11/07/2021 02:47:30 - INFO - __main__ - Step 39566: {'lr': 0.0004246439069572926, 'samples': 7596672, 'steps': 39565, 'loss/train': 0.4988980293273926} -11/07/2021 02:47:31 - INFO - __main__ - Step 39567: {'lr': 0.00042464010975011893, 'samples': 7596864, 'steps': 39566, 'loss/train': 2.626159429550171} -11/07/2021 02:47:31 - INFO - __main__ - Step 39568: {'lr': 0.00042463631246425504, 'samples': 7597056, 'steps': 39567, 'loss/train': 1.4757068157196045} -11/07/2021 02:47:32 - INFO - __main__ - Step 39569: {'lr': 0.0004246325150997027, 'samples': 7597248, 'steps': 39568, 'loss/train': 1.5218952894210815} -11/07/2021 02:47:32 - INFO - __main__ - Step 39570: {'lr': 0.0004246287176564637, 'samples': 7597440, 'steps': 39569, 'loss/train': 1.8463135957717896} -11/07/2021 02:47:32 - INFO - __main__ - Step 39571: {'lr': 0.0004246249201345397, 'samples': 7597632, 'steps': 39570, 'loss/train': 1.5711888074874878} -11/07/2021 02:47:33 - INFO - __main__ - Step 39572: {'lr': 0.0004246211225339323, 'samples': 7597824, 'steps': 39571, 'loss/train': 1.0583667755126953} -11/07/2021 02:47:34 - INFO - __main__ - Step 39573: {'lr': 0.0004246173248546434, 'samples': 7598016, 'steps': 39572, 'loss/train': 0.8221028447151184} -11/07/2021 02:47:34 - INFO - __main__ - Step 39574: {'lr': 0.0004246135270966747, 'samples': 7598208, 'steps': 39573, 'loss/train': 1.1225409507751465} -11/07/2021 02:47:34 - INFO - __main__ - Step 39575: {'lr': 0.00042460972926002774, 'samples': 7598400, 'steps': 39574, 'loss/train': 1.4795197248458862} -11/07/2021 02:47:35 - INFO - __main__ - Step 39576: {'lr': 0.00042460593134470426, 'samples': 7598592, 'steps': 39575, 'loss/train': 1.1359695196151733} -11/07/2021 02:47:35 - INFO - __main__ - Step 39577: {'lr': 0.0004246021333507062, 'samples': 7598784, 'steps': 39576, 'loss/train': 1.8443375825881958} -11/07/2021 02:47:36 - INFO - __main__ - Step 39578: {'lr': 0.00042459833527803503, 'samples': 7598976, 'steps': 39577, 'loss/train': 1.4954917430877686} -11/07/2021 02:47:36 - INFO - __main__ - Step 39579: {'lr': 0.00042459453712669255, 'samples': 7599168, 'steps': 39578, 'loss/train': 1.6938172578811646} -11/07/2021 02:47:37 - INFO - __main__ - Step 39580: {'lr': 0.0004245907388966804, 'samples': 7599360, 'steps': 39579, 'loss/train': 1.2286467552185059} -11/07/2021 02:47:37 - INFO - __main__ - Step 39581: {'lr': 0.0004245869405880005, 'samples': 7599552, 'steps': 39580, 'loss/train': 1.6558587551116943} -11/07/2021 02:47:37 - INFO - __main__ - Step 39582: {'lr': 0.0004245831422006543, 'samples': 7599744, 'steps': 39581, 'loss/train': 1.961647868156433} -11/07/2021 02:47:39 - INFO - __main__ - Step 39583: {'lr': 0.0004245793437346437, 'samples': 7599936, 'steps': 39582, 'loss/train': 1.524979829788208} -11/07/2021 02:47:39 - INFO - __main__ - Step 39584: {'lr': 0.0004245755451899703, 'samples': 7600128, 'steps': 39583, 'loss/train': 2.1289525032043457} -11/07/2021 02:47:39 - INFO - __main__ - Step 39585: {'lr': 0.0004245717465666359, 'samples': 7600320, 'steps': 39584, 'loss/train': 1.25424063205719} -11/07/2021 02:47:40 - INFO - __main__ - Step 39586: {'lr': 0.0004245679478646421, 'samples': 7600512, 'steps': 39585, 'loss/train': 1.688192367553711} -11/07/2021 02:47:40 - INFO - __main__ - Step 39587: {'lr': 0.00042456414908399075, 'samples': 7600704, 'steps': 39586, 'loss/train': 1.6947143077850342} -11/07/2021 02:47:41 - INFO - __main__ - Step 39588: {'lr': 0.00042456035022468344, 'samples': 7600896, 'steps': 39587, 'loss/train': 1.5494352579116821} -11/07/2021 02:47:41 - INFO - __main__ - Step 39589: {'lr': 0.0004245565512867219, 'samples': 7601088, 'steps': 39588, 'loss/train': 1.519472360610962} -11/07/2021 02:47:42 - INFO - __main__ - Step 39590: {'lr': 0.000424552752270108, 'samples': 7601280, 'steps': 39589, 'loss/train': 1.1904324293136597} -11/07/2021 02:47:42 - INFO - __main__ - Step 39591: {'lr': 0.0004245489531748432, 'samples': 7601472, 'steps': 39590, 'loss/train': 1.3604559898376465} -11/07/2021 02:47:42 - INFO - __main__ - Step 39592: {'lr': 0.00042454515400092944, 'samples': 7601664, 'steps': 39591, 'loss/train': 1.5542364120483398} -11/07/2021 02:47:43 - INFO - __main__ - Step 39593: {'lr': 0.00042454135474836817, 'samples': 7601856, 'steps': 39592, 'loss/train': 1.7233147621154785} -11/07/2021 02:47:44 - INFO - __main__ - Step 39594: {'lr': 0.0004245375554171613, 'samples': 7602048, 'steps': 39593, 'loss/train': 1.5351544618606567} -11/07/2021 02:47:44 - INFO - __main__ - Step 39595: {'lr': 0.00042453375600731057, 'samples': 7602240, 'steps': 39594, 'loss/train': 1.5188515186309814} -11/07/2021 02:47:45 - INFO - __main__ - Step 39596: {'lr': 0.00042452995651881764, 'samples': 7602432, 'steps': 39595, 'loss/train': 1.5693578720092773} -11/07/2021 02:47:45 - INFO - __main__ - Step 39597: {'lr': 0.0004245261569516842, 'samples': 7602624, 'steps': 39596, 'loss/train': 1.073722004890442} -11/07/2021 02:47:46 - INFO - __main__ - Step 39598: {'lr': 0.00042452235730591195, 'samples': 7602816, 'steps': 39597, 'loss/train': 1.8061981201171875} -11/07/2021 02:47:46 - INFO - __main__ - Step 39599: {'lr': 0.00042451855758150254, 'samples': 7603008, 'steps': 39598, 'loss/train': 1.7523164749145508} -11/07/2021 02:47:47 - INFO - __main__ - Step 39600: {'lr': 0.00042451475777845784, 'samples': 7603200, 'steps': 39599, 'loss/train': 1.640657901763916} -11/07/2021 02:47:47 - INFO - __main__ - Step 39601: {'lr': 0.00042451095789677943, 'samples': 7603392, 'steps': 39600, 'loss/train': 0.8249521255493164} -11/07/2021 02:47:47 - INFO - __main__ - Step 39602: {'lr': 0.0004245071579364691, 'samples': 7603584, 'steps': 39601, 'loss/train': 1.4024829864501953} -11/07/2021 02:47:48 - INFO - __main__ - Step 39603: {'lr': 0.0004245033578975286, 'samples': 7603776, 'steps': 39602, 'loss/train': 1.5897529125213623} -11/07/2021 02:47:49 - INFO - __main__ - Step 39604: {'lr': 0.00042449955777995954, 'samples': 7603968, 'steps': 39603, 'loss/train': 1.592136025428772} -11/07/2021 02:47:49 - INFO - __main__ - Step 39605: {'lr': 0.0004244957575837636, 'samples': 7604160, 'steps': 39604, 'loss/train': 1.688389539718628} -11/07/2021 02:47:49 - INFO - __main__ - Step 39606: {'lr': 0.00042449195730894266, 'samples': 7604352, 'steps': 39605, 'loss/train': 1.7507917881011963} -11/07/2021 02:47:50 - INFO - __main__ - Step 39607: {'lr': 0.00042448815695549823, 'samples': 7604544, 'steps': 39606, 'loss/train': 1.3852903842926025} -11/07/2021 02:47:50 - INFO - __main__ - Step 39608: {'lr': 0.00042448435652343223, 'samples': 7604736, 'steps': 39607, 'loss/train': 1.5574475526809692} -11/07/2021 02:47:51 - INFO - __main__ - Step 39609: {'lr': 0.0004244805560127463, 'samples': 7604928, 'steps': 39608, 'loss/train': 1.4441529512405396} -11/07/2021 02:47:51 - INFO - __main__ - Step 39610: {'lr': 0.00042447675542344203, 'samples': 7605120, 'steps': 39609, 'loss/train': 1.3182731866836548} -11/07/2021 02:47:52 - INFO - __main__ - Step 39611: {'lr': 0.0004244729547555213, 'samples': 7605312, 'steps': 39610, 'loss/train': 1.9568254947662354} -11/07/2021 02:47:52 - INFO - __main__ - Step 39612: {'lr': 0.00042446915400898565, 'samples': 7605504, 'steps': 39611, 'loss/train': 1.1934031248092651} -11/07/2021 02:47:52 - INFO - __main__ - Step 39613: {'lr': 0.00042446535318383695, 'samples': 7605696, 'steps': 39612, 'loss/train': 1.4212074279785156} -11/07/2021 02:47:54 - INFO - __main__ - Step 39614: {'lr': 0.00042446155228007687, 'samples': 7605888, 'steps': 39613, 'loss/train': 1.625552773475647} -11/07/2021 02:47:54 - INFO - __main__ - Step 39615: {'lr': 0.0004244577512977071, 'samples': 7606080, 'steps': 39614, 'loss/train': 1.0876522064208984} -11/07/2021 02:47:54 - INFO - __main__ - Step 39616: {'lr': 0.00042445395023672935, 'samples': 7606272, 'steps': 39615, 'loss/train': 1.587868332862854} -11/07/2021 02:47:55 - INFO - __main__ - Step 39617: {'lr': 0.0004244501490971454, 'samples': 7606464, 'steps': 39616, 'loss/train': 0.39124223589897156} -11/07/2021 02:47:55 - INFO - __main__ - Step 39618: {'lr': 0.0004244463478789568, 'samples': 7606656, 'steps': 39617, 'loss/train': 0.7393484711647034} -11/07/2021 02:47:56 - INFO - __main__ - Step 39619: {'lr': 0.0004244425465821654, 'samples': 7606848, 'steps': 39618, 'loss/train': 1.4141795635223389} -11/07/2021 02:47:56 - INFO - __main__ - Step 39620: {'lr': 0.0004244387452067729, 'samples': 7607040, 'steps': 39619, 'loss/train': 1.529541254043579} -11/07/2021 02:47:57 - INFO - __main__ - Step 39621: {'lr': 0.000424434943752781, 'samples': 7607232, 'steps': 39620, 'loss/train': 0.9253093004226685} -11/07/2021 02:47:57 - INFO - __main__ - Step 39622: {'lr': 0.0004244311422201914, 'samples': 7607424, 'steps': 39621, 'loss/train': 0.8912478089332581} -11/07/2021 02:47:57 - INFO - __main__ - Step 39623: {'lr': 0.0004244273406090058, 'samples': 7607616, 'steps': 39622, 'loss/train': 1.4458396434783936} -11/07/2021 02:47:58 - INFO - __main__ - Step 39624: {'lr': 0.000424423538919226, 'samples': 7607808, 'steps': 39623, 'loss/train': 1.4262381792068481} -11/07/2021 02:47:59 - INFO - __main__ - Step 39625: {'lr': 0.0004244197371508536, 'samples': 7608000, 'steps': 39624, 'loss/train': 1.5457366704940796} -11/07/2021 02:47:59 - INFO - __main__ - Step 39626: {'lr': 0.00042441593530389025, 'samples': 7608192, 'steps': 39625, 'loss/train': 1.671734094619751} -11/07/2021 02:48:00 - INFO - __main__ - Step 39627: {'lr': 0.0004244121333783379, 'samples': 7608384, 'steps': 39626, 'loss/train': 1.4473621845245361} -11/07/2021 02:48:00 - INFO - __main__ - Step 39628: {'lr': 0.0004244083313741981, 'samples': 7608576, 'steps': 39627, 'loss/train': 1.5875861644744873} -11/07/2021 02:48:01 - INFO - __main__ - Step 39629: {'lr': 0.0004244045292914726, 'samples': 7608768, 'steps': 39628, 'loss/train': 1.6657663583755493} -11/07/2021 02:48:01 - INFO - __main__ - Step 39630: {'lr': 0.00042440072713016317, 'samples': 7608960, 'steps': 39629, 'loss/train': 2.132669687271118} -11/07/2021 02:48:02 - INFO - __main__ - Step 39631: {'lr': 0.00042439692489027136, 'samples': 7609152, 'steps': 39630, 'loss/train': 1.6087201833724976} -11/07/2021 02:48:02 - INFO - __main__ - Step 39632: {'lr': 0.000424393122571799, 'samples': 7609344, 'steps': 39631, 'loss/train': 1.6041347980499268} -11/07/2021 02:48:02 - INFO - __main__ - Step 39633: {'lr': 0.00042438932017474783, 'samples': 7609536, 'steps': 39632, 'loss/train': 1.414711594581604} -11/07/2021 02:48:03 - INFO - __main__ - Step 39634: {'lr': 0.0004243855176991195, 'samples': 7609728, 'steps': 39633, 'loss/train': 1.6235281229019165} -11/07/2021 02:48:04 - INFO - __main__ - Step 39635: {'lr': 0.0004243817151449158, 'samples': 7609920, 'steps': 39634, 'loss/train': 1.363830327987671} -11/07/2021 02:48:04 - INFO - __main__ - Step 39636: {'lr': 0.0004243779125121383, 'samples': 7610112, 'steps': 39635, 'loss/train': 1.6997758150100708} -11/07/2021 02:48:04 - INFO - __main__ - Step 39637: {'lr': 0.00042437410980078894, 'samples': 7610304, 'steps': 39636, 'loss/train': 1.1887015104293823} -11/07/2021 02:48:05 - INFO - __main__ - Step 39638: {'lr': 0.0004243703070108692, 'samples': 7610496, 'steps': 39637, 'loss/train': 1.7544221878051758} -11/07/2021 02:48:05 - INFO - __main__ - Step 39639: {'lr': 0.00042436650414238086, 'samples': 7610688, 'steps': 39638, 'loss/train': 2.068868398666382} -11/07/2021 02:48:06 - INFO - __main__ - Step 39640: {'lr': 0.0004243627011953257, 'samples': 7610880, 'steps': 39639, 'loss/train': 1.4439142942428589} -11/07/2021 02:48:06 - INFO - __main__ - Step 39641: {'lr': 0.0004243588981697054, 'samples': 7611072, 'steps': 39640, 'loss/train': 1.7286045551300049} -11/07/2021 02:48:07 - INFO - __main__ - Step 39642: {'lr': 0.0004243550950655217, 'samples': 7611264, 'steps': 39641, 'loss/train': 0.8495831489562988} -11/07/2021 02:48:07 - INFO - __main__ - Step 39643: {'lr': 0.00042435129188277625, 'samples': 7611456, 'steps': 39642, 'loss/train': 1.5878719091415405} -11/07/2021 02:48:07 - INFO - __main__ - Step 39644: {'lr': 0.0004243474886214708, 'samples': 7611648, 'steps': 39643, 'loss/train': 1.6149377822875977} -11/07/2021 02:48:09 - INFO - __main__ - Step 39645: {'lr': 0.0004243436852816071, 'samples': 7611840, 'steps': 39644, 'loss/train': 1.3852001428604126} -11/07/2021 02:48:09 - INFO - __main__ - Step 39646: {'lr': 0.0004243398818631868, 'samples': 7612032, 'steps': 39645, 'loss/train': 1.6688364744186401} -11/07/2021 02:48:09 - INFO - __main__ - Step 39647: {'lr': 0.0004243360783662116, 'samples': 7612224, 'steps': 39646, 'loss/train': 2.061065673828125} -11/07/2021 02:48:10 - INFO - __main__ - Step 39648: {'lr': 0.0004243322747906833, 'samples': 7612416, 'steps': 39647, 'loss/train': 0.6897776126861572} -11/07/2021 02:48:10 - INFO - __main__ - Step 39649: {'lr': 0.00042432847113660355, 'samples': 7612608, 'steps': 39648, 'loss/train': 1.325101375579834} -11/07/2021 02:48:11 - INFO - __main__ - Step 39650: {'lr': 0.0004243246674039741, 'samples': 7612800, 'steps': 39649, 'loss/train': 1.4035671949386597} -11/07/2021 02:48:12 - INFO - __main__ - Step 39651: {'lr': 0.00042432086359279667, 'samples': 7612992, 'steps': 39650, 'loss/train': 1.6981890201568604} -11/07/2021 02:48:12 - INFO - __main__ - Step 39652: {'lr': 0.0004243170597030729, 'samples': 7613184, 'steps': 39651, 'loss/train': 1.5480200052261353} -11/07/2021 02:48:12 - INFO - __main__ - Step 39653: {'lr': 0.0004243132557348045, 'samples': 7613376, 'steps': 39652, 'loss/train': 0.45958590507507324} -11/07/2021 02:48:13 - INFO - __main__ - Step 39654: {'lr': 0.00042430945168799326, 'samples': 7613568, 'steps': 39653, 'loss/train': 1.4481576681137085} -11/07/2021 02:48:14 - INFO - __main__ - Step 39655: {'lr': 0.000424305647562641, 'samples': 7613760, 'steps': 39654, 'loss/train': 1.632983684539795} -11/07/2021 02:48:14 - INFO - __main__ - Step 39656: {'lr': 0.00042430184335874924, 'samples': 7613952, 'steps': 39655, 'loss/train': 1.5062471628189087} -11/07/2021 02:48:15 - INFO - __main__ - Step 39657: {'lr': 0.0004242980390763197, 'samples': 7614144, 'steps': 39656, 'loss/train': 1.5032585859298706} -11/07/2021 02:48:15 - INFO - __main__ - Step 39658: {'lr': 0.0004242942347153542, 'samples': 7614336, 'steps': 39657, 'loss/train': 1.1589655876159668} -11/07/2021 02:48:15 - INFO - __main__ - Step 39659: {'lr': 0.00042429043027585435, 'samples': 7614528, 'steps': 39658, 'loss/train': 0.9075229167938232} -11/07/2021 02:48:16 - INFO - __main__ - Step 39660: {'lr': 0.000424286625757822, 'samples': 7614720, 'steps': 39659, 'loss/train': 1.7922099828720093} -11/07/2021 02:48:17 - INFO - __main__ - Step 39661: {'lr': 0.00042428282116125873, 'samples': 7614912, 'steps': 39660, 'loss/train': 1.5930705070495605} -11/07/2021 02:48:17 - INFO - __main__ - Step 39662: {'lr': 0.0004242790164861663, 'samples': 7615104, 'steps': 39661, 'loss/train': 1.6237225532531738} -11/07/2021 02:48:18 - INFO - __main__ - Step 39663: {'lr': 0.0004242752117325465, 'samples': 7615296, 'steps': 39662, 'loss/train': 1.5321625471115112} -11/07/2021 02:48:18 - INFO - __main__ - Step 39664: {'lr': 0.000424271406900401, 'samples': 7615488, 'steps': 39663, 'loss/train': 1.7925151586532593} -11/07/2021 02:48:18 - INFO - __main__ - Step 39665: {'lr': 0.0004242676019897314, 'samples': 7615680, 'steps': 39664, 'loss/train': 1.6339011192321777} -11/07/2021 02:48:19 - INFO - __main__ - Step 39666: {'lr': 0.00042426379700053954, 'samples': 7615872, 'steps': 39665, 'loss/train': 1.840277910232544} -11/07/2021 02:48:20 - INFO - __main__ - Step 39667: {'lr': 0.00042425999193282713, 'samples': 7616064, 'steps': 39666, 'loss/train': 1.262918472290039} -11/07/2021 02:48:20 - INFO - __main__ - Step 39668: {'lr': 0.0004242561867865958, 'samples': 7616256, 'steps': 39667, 'loss/train': 2.535017967224121} -11/07/2021 02:48:20 - INFO - __main__ - Step 39669: {'lr': 0.0004242523815618473, 'samples': 7616448, 'steps': 39668, 'loss/train': 1.4685289859771729} -11/07/2021 02:48:21 - INFO - __main__ - Step 39670: {'lr': 0.0004242485762585835, 'samples': 7616640, 'steps': 39669, 'loss/train': 1.8454334735870361} -11/07/2021 02:48:22 - INFO - __main__ - Step 39671: {'lr': 0.0004242447708768059, 'samples': 7616832, 'steps': 39670, 'loss/train': 0.6174976825714111} -11/07/2021 02:48:22 - INFO - __main__ - Step 39672: {'lr': 0.0004242409654165163, 'samples': 7617024, 'steps': 39671, 'loss/train': 1.0872056484222412} -11/07/2021 02:48:22 - INFO - __main__ - Step 39673: {'lr': 0.00042423715987771637, 'samples': 7617216, 'steps': 39672, 'loss/train': 1.2014278173446655} -11/07/2021 02:48:23 - INFO - __main__ - Step 39674: {'lr': 0.0004242333542604079, 'samples': 7617408, 'steps': 39673, 'loss/train': 1.5013810396194458} -11/07/2021 02:48:23 - INFO - __main__ - Step 39675: {'lr': 0.0004242295485645926, 'samples': 7617600, 'steps': 39674, 'loss/train': 1.7303569316864014} -11/07/2021 02:48:24 - INFO - __main__ - Step 39676: {'lr': 0.0004242257427902721, 'samples': 7617792, 'steps': 39675, 'loss/train': 2.2309410572052} -11/07/2021 02:48:25 - INFO - __main__ - Step 39677: {'lr': 0.00042422193693744827, 'samples': 7617984, 'steps': 39676, 'loss/train': 1.37846040725708} -11/07/2021 02:48:25 - INFO - __main__ - Step 39678: {'lr': 0.0004242181310061226, 'samples': 7618176, 'steps': 39677, 'loss/train': 0.8689545392990112} -11/07/2021 02:48:25 - INFO - __main__ - Step 39679: {'lr': 0.000424214324996297, 'samples': 7618368, 'steps': 39678, 'loss/train': 1.9211291074752808} -11/07/2021 02:48:26 - INFO - __main__ - Step 39680: {'lr': 0.000424210518907973, 'samples': 7618560, 'steps': 39679, 'loss/train': 1.9578702449798584} -11/07/2021 02:48:27 - INFO - __main__ - Step 39681: {'lr': 0.0004242067127411525, 'samples': 7618752, 'steps': 39680, 'loss/train': 1.311366319656372} -11/07/2021 02:48:27 - INFO - __main__ - Step 39682: {'lr': 0.0004242029064958372, 'samples': 7618944, 'steps': 39681, 'loss/train': 1.0614537000656128} -11/07/2021 02:48:27 - INFO - __main__ - Step 39683: {'lr': 0.0004241991001720287, 'samples': 7619136, 'steps': 39682, 'loss/train': 1.565509557723999} -11/07/2021 02:48:28 - INFO - __main__ - Step 39684: {'lr': 0.00042419529376972885, 'samples': 7619328, 'steps': 39683, 'loss/train': 1.3136285543441772} -11/07/2021 02:48:28 - INFO - __main__ - Step 39685: {'lr': 0.0004241914872889392, 'samples': 7619520, 'steps': 39684, 'loss/train': 1.6138375997543335} -11/07/2021 02:48:29 - INFO - __main__ - Step 39686: {'lr': 0.00042418768072966163, 'samples': 7619712, 'steps': 39685, 'loss/train': 1.621649980545044} -11/07/2021 02:48:29 - INFO - __main__ - Step 39687: {'lr': 0.0004241838740918977, 'samples': 7619904, 'steps': 39686, 'loss/train': 1.4917651414871216} -11/07/2021 02:48:30 - INFO - __main__ - Step 39688: {'lr': 0.00042418006737564924, 'samples': 7620096, 'steps': 39687, 'loss/train': 1.7346736192703247} -11/07/2021 02:48:30 - INFO - __main__ - Step 39689: {'lr': 0.0004241762605809179, 'samples': 7620288, 'steps': 39688, 'loss/train': 1.132972240447998} -11/07/2021 02:48:30 - INFO - __main__ - Step 39690: {'lr': 0.00042417245370770547, 'samples': 7620480, 'steps': 39689, 'loss/train': 1.6081323623657227} -11/07/2021 02:48:31 - INFO - __main__ - Step 39691: {'lr': 0.00042416864675601365, 'samples': 7620672, 'steps': 39690, 'loss/train': 1.4430608749389648} -11/07/2021 02:48:32 - INFO - __main__ - Step 39692: {'lr': 0.0004241648397258441, 'samples': 7620864, 'steps': 39691, 'loss/train': 1.5008991956710815} -11/07/2021 02:48:32 - INFO - __main__ - Step 39693: {'lr': 0.0004241610326171985, 'samples': 7621056, 'steps': 39692, 'loss/train': 1.5701279640197754} -11/07/2021 02:48:32 - INFO - __main__ - Step 39694: {'lr': 0.0004241572254300786, 'samples': 7621248, 'steps': 39693, 'loss/train': 0.6049160957336426} -11/07/2021 02:48:33 - INFO - __main__ - Step 39695: {'lr': 0.00042415341816448625, 'samples': 7621440, 'steps': 39694, 'loss/train': 1.5551038980484009} -11/07/2021 02:48:33 - INFO - __main__ - Step 39696: {'lr': 0.000424149610820423, 'samples': 7621632, 'steps': 39695, 'loss/train': 1.4827028512954712} -11/07/2021 02:48:34 - INFO - __main__ - Step 39697: {'lr': 0.00042414580339789065, 'samples': 7621824, 'steps': 39696, 'loss/train': 1.496288537979126} -11/07/2021 02:48:34 - INFO - __main__ - Step 39698: {'lr': 0.00042414199589689084, 'samples': 7622016, 'steps': 39697, 'loss/train': 1.3225457668304443} -11/07/2021 02:48:35 - INFO - __main__ - Step 39699: {'lr': 0.0004241381883174254, 'samples': 7622208, 'steps': 39698, 'loss/train': 1.345666527748108} -11/07/2021 02:48:35 - INFO - __main__ - Step 39700: {'lr': 0.00042413438065949595, 'samples': 7622400, 'steps': 39699, 'loss/train': 1.0294551849365234} -11/07/2021 02:48:35 - INFO - __main__ - Step 39701: {'lr': 0.0004241305729231042, 'samples': 7622592, 'steps': 39700, 'loss/train': 1.5337921380996704} -11/07/2021 02:48:37 - INFO - __main__ - Step 39702: {'lr': 0.00042412676510825197, 'samples': 7622784, 'steps': 39701, 'loss/train': 1.2330243587493896} -11/07/2021 02:48:37 - INFO - __main__ - Step 39703: {'lr': 0.00042412295721494086, 'samples': 7622976, 'steps': 39702, 'loss/train': 1.093245267868042} -11/07/2021 02:48:37 - INFO - __main__ - Step 39704: {'lr': 0.00042411914924317265, 'samples': 7623168, 'steps': 39703, 'loss/train': 1.3550559282302856} -11/07/2021 02:48:38 - INFO - __main__ - Step 39705: {'lr': 0.00042411534119294903, 'samples': 7623360, 'steps': 39704, 'loss/train': 1.4321473836898804} -11/07/2021 02:48:38 - INFO - __main__ - Step 39706: {'lr': 0.0004241115330642717, 'samples': 7623552, 'steps': 39705, 'loss/train': 1.345481514930725} -11/07/2021 02:48:39 - INFO - __main__ - Step 39707: {'lr': 0.0004241077248571424, 'samples': 7623744, 'steps': 39706, 'loss/train': 1.318536639213562} -11/07/2021 02:48:39 - INFO - __main__ - Step 39708: {'lr': 0.0004241039165715629, 'samples': 7623936, 'steps': 39707, 'loss/train': 1.6019287109375} -11/07/2021 02:48:40 - INFO - __main__ - Step 39709: {'lr': 0.00042410010820753485, 'samples': 7624128, 'steps': 39708, 'loss/train': 1.2462016344070435} -11/07/2021 02:48:40 - INFO - __main__ - Step 39710: {'lr': 0.00042409629976505994, 'samples': 7624320, 'steps': 39709, 'loss/train': 1.191588044166565} -11/07/2021 02:48:41 - INFO - __main__ - Step 39711: {'lr': 0.00042409249124414, 'samples': 7624512, 'steps': 39710, 'loss/train': 1.242682933807373} -11/07/2021 02:48:41 - INFO - __main__ - Step 39712: {'lr': 0.00042408868264477657, 'samples': 7624704, 'steps': 39711, 'loss/train': 1.5885920524597168} -11/07/2021 02:48:42 - INFO - __main__ - Step 39713: {'lr': 0.00042408487396697147, 'samples': 7624896, 'steps': 39712, 'loss/train': 1.158028483390808} -11/07/2021 02:48:42 - INFO - __main__ - Step 39714: {'lr': 0.0004240810652107265, 'samples': 7625088, 'steps': 39713, 'loss/train': 0.7398699522018433} -11/07/2021 02:48:43 - INFO - __main__ - Step 39715: {'lr': 0.0004240772563760432, 'samples': 7625280, 'steps': 39714, 'loss/train': 1.3761696815490723} -11/07/2021 02:48:43 - INFO - __main__ - Step 39716: {'lr': 0.00042407344746292345, 'samples': 7625472, 'steps': 39715, 'loss/train': 1.2336206436157227} -11/07/2021 02:48:44 - INFO - __main__ - Step 39717: {'lr': 0.00042406963847136883, 'samples': 7625664, 'steps': 39716, 'loss/train': 1.5653035640716553} -11/07/2021 02:48:44 - INFO - __main__ - Step 39718: {'lr': 0.0004240658294013812, 'samples': 7625856, 'steps': 39717, 'loss/train': 1.227238416671753} -11/07/2021 02:48:45 - INFO - __main__ - Step 39719: {'lr': 0.00042406202025296213, 'samples': 7626048, 'steps': 39718, 'loss/train': 1.6440476179122925} -11/07/2021 02:48:45 - INFO - __main__ - Step 39720: {'lr': 0.00042405821102611336, 'samples': 7626240, 'steps': 39719, 'loss/train': 1.7578482627868652} -11/07/2021 02:48:45 - INFO - __main__ - Step 39721: {'lr': 0.0004240544017208367, 'samples': 7626432, 'steps': 39720, 'loss/train': 1.5157376527786255} -11/07/2021 02:48:46 - INFO - __main__ - Step 39722: {'lr': 0.0004240505923371338, 'samples': 7626624, 'steps': 39721, 'loss/train': 1.4250826835632324} -11/07/2021 02:48:47 - INFO - __main__ - Step 39723: {'lr': 0.0004240467828750064, 'samples': 7626816, 'steps': 39722, 'loss/train': 1.5825248956680298} -11/07/2021 02:48:47 - INFO - __main__ - Step 39724: {'lr': 0.0004240429733344562, 'samples': 7627008, 'steps': 39723, 'loss/train': 2.1459078788757324} -11/07/2021 02:48:47 - INFO - __main__ - Step 39725: {'lr': 0.0004240391637154849, 'samples': 7627200, 'steps': 39724, 'loss/train': 1.8433314561843872} -11/07/2021 02:48:48 - INFO - __main__ - Step 39726: {'lr': 0.0004240353540180942, 'samples': 7627392, 'steps': 39725, 'loss/train': 2.6465625762939453} -11/07/2021 02:48:48 - INFO - __main__ - Step 39727: {'lr': 0.00042403154424228596, 'samples': 7627584, 'steps': 39726, 'loss/train': 0.6849703192710876} -11/07/2021 02:48:49 - INFO - __main__ - Step 39728: {'lr': 0.00042402773438806175, 'samples': 7627776, 'steps': 39727, 'loss/train': 1.4673601388931274} -11/07/2021 02:48:50 - INFO - __main__ - Step 39729: {'lr': 0.00042402392445542333, 'samples': 7627968, 'steps': 39728, 'loss/train': 1.9610875844955444} -11/07/2021 02:48:50 - INFO - __main__ - Step 39730: {'lr': 0.0004240201144443724, 'samples': 7628160, 'steps': 39729, 'loss/train': 1.4347823858261108} -11/07/2021 02:48:50 - INFO - __main__ - Step 39731: {'lr': 0.00042401630435491073, 'samples': 7628352, 'steps': 39730, 'loss/train': 1.7260664701461792} -11/07/2021 02:48:51 - INFO - __main__ - Step 39732: {'lr': 0.00042401249418703996, 'samples': 7628544, 'steps': 39731, 'loss/train': 1.3634346723556519} -11/07/2021 02:48:52 - INFO - __main__ - Step 39733: {'lr': 0.00042400868394076185, 'samples': 7628736, 'steps': 39732, 'loss/train': 1.4103978872299194} -11/07/2021 02:48:52 - INFO - __main__ - Step 39734: {'lr': 0.0004240048736160781, 'samples': 7628928, 'steps': 39733, 'loss/train': 1.412202000617981} -11/07/2021 02:48:52 - INFO - __main__ - Step 39735: {'lr': 0.0004240010632129905, 'samples': 7629120, 'steps': 39734, 'loss/train': 1.230157494544983} -11/07/2021 02:48:53 - INFO - __main__ - Step 39736: {'lr': 0.00042399725273150056, 'samples': 7629312, 'steps': 39735, 'loss/train': 1.8496798276901245} -11/07/2021 02:48:53 - INFO - __main__ - Step 39737: {'lr': 0.0004239934421716103, 'samples': 7629504, 'steps': 39736, 'loss/train': 1.4702967405319214} -11/07/2021 02:48:54 - INFO - __main__ - Step 39738: {'lr': 0.00042398963153332124, 'samples': 7629696, 'steps': 39737, 'loss/train': 2.123060464859009} -11/07/2021 02:48:55 - INFO - __main__ - Step 39739: {'lr': 0.00042398582081663513, 'samples': 7629888, 'steps': 39738, 'loss/train': 1.6703587770462036} -11/07/2021 02:48:55 - INFO - __main__ - Step 39740: {'lr': 0.0004239820100215537, 'samples': 7630080, 'steps': 39739, 'loss/train': 1.3782191276550293} -11/07/2021 02:48:55 - INFO - __main__ - Step 39741: {'lr': 0.00042397819914807855, 'samples': 7630272, 'steps': 39740, 'loss/train': 1.7067298889160156} -11/07/2021 02:48:56 - INFO - __main__ - Step 39742: {'lr': 0.00042397438819621164, 'samples': 7630464, 'steps': 39741, 'loss/train': 1.5283854007720947} -11/07/2021 02:48:56 - INFO - __main__ - Step 39743: {'lr': 0.0004239705771659545, 'samples': 7630656, 'steps': 39742, 'loss/train': 1.3885010480880737} -11/07/2021 02:48:57 - INFO - __main__ - Step 39744: {'lr': 0.000423966766057309, 'samples': 7630848, 'steps': 39743, 'loss/train': 1.6397227048873901} -11/07/2021 02:48:57 - INFO - __main__ - Step 39745: {'lr': 0.00042396295487027666, 'samples': 7631040, 'steps': 39744, 'loss/train': 2.084167003631592} -11/07/2021 02:48:58 - INFO - __main__ - Step 39746: {'lr': 0.0004239591436048593, 'samples': 7631232, 'steps': 39745, 'loss/train': 1.6590286493301392} -11/07/2021 02:48:58 - INFO - __main__ - Step 39747: {'lr': 0.0004239553322610586, 'samples': 7631424, 'steps': 39746, 'loss/train': 1.4515533447265625} -11/07/2021 02:48:58 - INFO - __main__ - Step 39748: {'lr': 0.0004239515208388764, 'samples': 7631616, 'steps': 39747, 'loss/train': 1.706516981124878} -11/07/2021 02:49:00 - INFO - __main__ - Step 39749: {'lr': 0.00042394770933831425, 'samples': 7631808, 'steps': 39748, 'loss/train': 1.4649534225463867} -11/07/2021 02:49:00 - INFO - __main__ - Step 39750: {'lr': 0.00042394389775937403, 'samples': 7632000, 'steps': 39749, 'loss/train': 1.754453182220459} -11/07/2021 02:49:00 - INFO - __main__ - Step 39751: {'lr': 0.0004239400861020574, 'samples': 7632192, 'steps': 39750, 'loss/train': 1.0220494270324707} -11/07/2021 02:49:01 - INFO - __main__ - Step 39752: {'lr': 0.00042393627436636597, 'samples': 7632384, 'steps': 39751, 'loss/train': 1.8266533613204956} -11/07/2021 02:49:01 - INFO - __main__ - Step 39753: {'lr': 0.0004239324625523015, 'samples': 7632576, 'steps': 39752, 'loss/train': 1.4264540672302246} -11/07/2021 02:49:01 - INFO - __main__ - Step 39754: {'lr': 0.00042392865065986573, 'samples': 7632768, 'steps': 39753, 'loss/train': 1.504227638244629} -11/07/2021 02:49:02 - INFO - __main__ - Step 39755: {'lr': 0.00042392483868906053, 'samples': 7632960, 'steps': 39754, 'loss/train': 1.9210301637649536} -11/07/2021 02:49:03 - INFO - __main__ - Step 39756: {'lr': 0.0004239210266398874, 'samples': 7633152, 'steps': 39755, 'loss/train': 1.643656849861145} -11/07/2021 02:49:03 - INFO - __main__ - Step 39757: {'lr': 0.0004239172145123481, 'samples': 7633344, 'steps': 39756, 'loss/train': 1.6792773008346558} -11/07/2021 02:49:03 - INFO - __main__ - Step 39758: {'lr': 0.0004239134023064445, 'samples': 7633536, 'steps': 39757, 'loss/train': 1.3707860708236694} -11/07/2021 02:49:04 - INFO - __main__ - Step 39759: {'lr': 0.0004239095900221781, 'samples': 7633728, 'steps': 39758, 'loss/train': 1.836814284324646} -11/07/2021 02:49:05 - INFO - __main__ - Step 39760: {'lr': 0.00042390577765955077, 'samples': 7633920, 'steps': 39759, 'loss/train': 1.3591474294662476} -11/07/2021 02:49:05 - INFO - __main__ - Step 39761: {'lr': 0.00042390196521856417, 'samples': 7634112, 'steps': 39760, 'loss/train': 1.8055552244186401} -11/07/2021 02:49:06 - INFO - __main__ - Step 39762: {'lr': 0.00042389815269922005, 'samples': 7634304, 'steps': 39761, 'loss/train': 1.6083821058273315} -11/07/2021 02:49:06 - INFO - __main__ - Step 39763: {'lr': 0.0004238943401015201, 'samples': 7634496, 'steps': 39762, 'loss/train': 1.406672716140747} -11/07/2021 02:49:06 - INFO - __main__ - Step 39764: {'lr': 0.0004238905274254661, 'samples': 7634688, 'steps': 39763, 'loss/train': 1.3256386518478394} -11/07/2021 02:49:07 - INFO - __main__ - Step 39765: {'lr': 0.0004238867146710596, 'samples': 7634880, 'steps': 39764, 'loss/train': 1.0616670846939087} -11/07/2021 02:49:08 - INFO - __main__ - Step 39766: {'lr': 0.0004238829018383025, 'samples': 7635072, 'steps': 39765, 'loss/train': 1.067506194114685} -11/07/2021 02:49:08 - INFO - __main__ - Step 39767: {'lr': 0.0004238790889271964, 'samples': 7635264, 'steps': 39766, 'loss/train': 1.3006850481033325} -11/07/2021 02:49:08 - INFO - __main__ - Step 39768: {'lr': 0.0004238752759377431, 'samples': 7635456, 'steps': 39767, 'loss/train': 1.544019103050232} -11/07/2021 02:49:09 - INFO - __main__ - Step 39769: {'lr': 0.0004238714628699443, 'samples': 7635648, 'steps': 39768, 'loss/train': 1.4632283449172974} -11/07/2021 02:49:10 - INFO - __main__ - Step 39770: {'lr': 0.00042386764972380164, 'samples': 7635840, 'steps': 39769, 'loss/train': 1.483447790145874} -11/07/2021 02:49:10 - INFO - __main__ - Step 39771: {'lr': 0.00042386383649931693, 'samples': 7636032, 'steps': 39770, 'loss/train': 1.311075210571289} -11/07/2021 02:49:10 - INFO - __main__ - Step 39772: {'lr': 0.00042386002319649184, 'samples': 7636224, 'steps': 39771, 'loss/train': 1.4680263996124268} -11/07/2021 02:49:11 - INFO - __main__ - Step 39773: {'lr': 0.0004238562098153281, 'samples': 7636416, 'steps': 39772, 'loss/train': 1.5938646793365479} -11/07/2021 02:49:11 - INFO - __main__ - Step 39774: {'lr': 0.0004238523963558275, 'samples': 7636608, 'steps': 39773, 'loss/train': 1.0459965467453003} -11/07/2021 02:49:12 - INFO - __main__ - Step 39775: {'lr': 0.0004238485828179917, 'samples': 7636800, 'steps': 39774, 'loss/train': 1.9813939332962036} -11/07/2021 02:49:12 - INFO - __main__ - Step 39776: {'lr': 0.00042384476920182234, 'samples': 7636992, 'steps': 39775, 'loss/train': 1.984336018562317} -11/07/2021 02:49:13 - INFO - __main__ - Step 39777: {'lr': 0.0004238409555073212, 'samples': 7637184, 'steps': 39776, 'loss/train': 1.0975687503814697} -11/07/2021 02:49:13 - INFO - __main__ - Step 39778: {'lr': 0.00042383714173449007, 'samples': 7637376, 'steps': 39777, 'loss/train': 1.3706766366958618} -11/07/2021 02:49:13 - INFO - __main__ - Step 39779: {'lr': 0.00042383332788333055, 'samples': 7637568, 'steps': 39778, 'loss/train': 1.4491437673568726} -11/07/2021 02:49:14 - INFO - __main__ - Step 39780: {'lr': 0.0004238295139538445, 'samples': 7637760, 'steps': 39779, 'loss/train': 1.1163655519485474} -11/07/2021 02:49:15 - INFO - __main__ - Step 39781: {'lr': 0.0004238256999460335, 'samples': 7637952, 'steps': 39780, 'loss/train': 1.6790413856506348} -11/07/2021 02:49:15 - INFO - __main__ - Step 39782: {'lr': 0.00042382188585989933, 'samples': 7638144, 'steps': 39781, 'loss/train': 1.1418988704681396} -11/07/2021 02:49:16 - INFO - __main__ - Step 39783: {'lr': 0.0004238180716954436, 'samples': 7638336, 'steps': 39782, 'loss/train': 1.5400171279907227} -11/07/2021 02:49:16 - INFO - __main__ - Step 39784: {'lr': 0.0004238142574526683, 'samples': 7638528, 'steps': 39783, 'loss/train': 1.503924012184143} -11/07/2021 02:49:16 - INFO - __main__ - Step 39785: {'lr': 0.0004238104431315749, 'samples': 7638720, 'steps': 39784, 'loss/train': 1.6826781034469604} -11/07/2021 02:49:18 - INFO - __main__ - Step 39786: {'lr': 0.00042380662873216517, 'samples': 7638912, 'steps': 39785, 'loss/train': 1.4812978506088257} -11/07/2021 02:49:18 - INFO - __main__ - Step 39787: {'lr': 0.00042380281425444087, 'samples': 7639104, 'steps': 39786, 'loss/train': 1.9437432289123535} -11/07/2021 02:49:18 - INFO - __main__ - Step 39788: {'lr': 0.0004237989996984037, 'samples': 7639296, 'steps': 39787, 'loss/train': 1.8986597061157227} -11/07/2021 02:49:19 - INFO - __main__ - Step 39789: {'lr': 0.0004237951850640555, 'samples': 7639488, 'steps': 39788, 'loss/train': 1.75411057472229} -11/07/2021 02:49:19 - INFO - __main__ - Step 39790: {'lr': 0.0004237913703513977, 'samples': 7639680, 'steps': 39789, 'loss/train': 2.432239532470703} -11/07/2021 02:49:20 - INFO - __main__ - Step 39791: {'lr': 0.00042378755556043225, 'samples': 7639872, 'steps': 39790, 'loss/train': 2.40262508392334} -11/07/2021 02:49:20 - INFO - __main__ - Step 39792: {'lr': 0.0004237837406911608, 'samples': 7640064, 'steps': 39791, 'loss/train': 1.3880094289779663} -11/07/2021 02:49:21 - INFO - __main__ - Step 39793: {'lr': 0.00042377992574358514, 'samples': 7640256, 'steps': 39792, 'loss/train': 1.0807527303695679} -11/07/2021 02:49:21 - INFO - __main__ - Step 39794: {'lr': 0.0004237761107177068, 'samples': 7640448, 'steps': 39793, 'loss/train': 1.2133203744888306} -11/07/2021 02:49:21 - INFO - __main__ - Step 39795: {'lr': 0.00042377229561352774, 'samples': 7640640, 'steps': 39794, 'loss/train': 0.7437110543251038} -11/07/2021 02:49:22 - INFO - __main__ - Step 39796: {'lr': 0.00042376848043104953, 'samples': 7640832, 'steps': 39795, 'loss/train': 1.7172738313674927} -11/07/2021 02:49:23 - INFO - __main__ - Step 39797: {'lr': 0.00042376466517027387, 'samples': 7641024, 'steps': 39796, 'loss/train': 1.2570029497146606} -11/07/2021 02:49:23 - INFO - __main__ - Step 39798: {'lr': 0.00042376084983120266, 'samples': 7641216, 'steps': 39797, 'loss/train': 1.6518914699554443} -11/07/2021 02:49:24 - INFO - __main__ - Step 39799: {'lr': 0.0004237570344138374, 'samples': 7641408, 'steps': 39798, 'loss/train': 1.1588325500488281} -11/07/2021 02:49:24 - INFO - __main__ - Step 39800: {'lr': 0.00042375321891818, 'samples': 7641600, 'steps': 39799, 'loss/train': 1.3438451290130615} -11/07/2021 02:49:24 - INFO - __main__ - Step 39801: {'lr': 0.00042374940334423194, 'samples': 7641792, 'steps': 39800, 'loss/train': 1.038809895515442} -11/07/2021 02:49:25 - INFO - __main__ - Step 39802: {'lr': 0.00042374558769199517, 'samples': 7641984, 'steps': 39801, 'loss/train': 1.4980303049087524} -11/07/2021 02:49:26 - INFO - __main__ - Step 39803: {'lr': 0.0004237417719614713, 'samples': 7642176, 'steps': 39802, 'loss/train': 1.2092492580413818} -11/07/2021 02:49:26 - INFO - __main__ - Step 39804: {'lr': 0.000423737956152662, 'samples': 7642368, 'steps': 39803, 'loss/train': 1.3670045137405396} -11/07/2021 02:49:26 - INFO - __main__ - Step 39805: {'lr': 0.0004237341402655692, 'samples': 7642560, 'steps': 39804, 'loss/train': 1.4463545083999634} -11/07/2021 02:49:27 - INFO - __main__ - Step 39806: {'lr': 0.00042373032430019443, 'samples': 7642752, 'steps': 39805, 'loss/train': 1.3591455221176147} -11/07/2021 02:49:28 - INFO - __main__ - Step 39807: {'lr': 0.00042372650825653937, 'samples': 7642944, 'steps': 39806, 'loss/train': 1.7041791677474976} -11/07/2021 02:49:28 - INFO - __main__ - Step 39808: {'lr': 0.0004237226921346059, 'samples': 7643136, 'steps': 39807, 'loss/train': 1.2431955337524414} -11/07/2021 02:49:28 - INFO - __main__ - Step 39809: {'lr': 0.0004237188759343956, 'samples': 7643328, 'steps': 39808, 'loss/train': 0.7306289076805115} -11/07/2021 02:49:29 - INFO - __main__ - Step 39810: {'lr': 0.0004237150596559103, 'samples': 7643520, 'steps': 39809, 'loss/train': 1.6761316061019897} -11/07/2021 02:49:29 - INFO - __main__ - Step 39811: {'lr': 0.00042371124329915167, 'samples': 7643712, 'steps': 39810, 'loss/train': 0.20795224606990814} -11/07/2021 02:49:30 - INFO - __main__ - Step 39812: {'lr': 0.0004237074268641215, 'samples': 7643904, 'steps': 39811, 'loss/train': 1.5500051975250244} -11/07/2021 02:49:31 - INFO - __main__ - Step 39813: {'lr': 0.00042370361035082136, 'samples': 7644096, 'steps': 39812, 'loss/train': 1.7766578197479248} -11/07/2021 02:49:31 - INFO - __main__ - Step 39814: {'lr': 0.000423699793759253, 'samples': 7644288, 'steps': 39813, 'loss/train': 1.3118033409118652} -11/07/2021 02:49:31 - INFO - __main__ - Step 39815: {'lr': 0.0004236959770894183, 'samples': 7644480, 'steps': 39814, 'loss/train': 1.6286885738372803} -11/07/2021 02:49:32 - INFO - __main__ - Step 39816: {'lr': 0.00042369216034131887, 'samples': 7644672, 'steps': 39815, 'loss/train': 1.7368838787078857} -11/07/2021 02:49:33 - INFO - __main__ - Step 39817: {'lr': 0.0004236883435149564, 'samples': 7644864, 'steps': 39816, 'loss/train': 1.5768975019454956} -11/07/2021 02:49:33 - INFO - __main__ - Step 39818: {'lr': 0.0004236845266103327, 'samples': 7645056, 'steps': 39817, 'loss/train': 1.579480528831482} -11/07/2021 02:49:33 - INFO - __main__ - Step 39819: {'lr': 0.00042368070962744937, 'samples': 7645248, 'steps': 39818, 'loss/train': 0.9204245805740356} -11/07/2021 02:49:34 - INFO - __main__ - Step 39820: {'lr': 0.0004236768925663082, 'samples': 7645440, 'steps': 39819, 'loss/train': 1.6000114679336548} -11/07/2021 02:49:34 - INFO - __main__ - Step 39821: {'lr': 0.0004236730754269109, 'samples': 7645632, 'steps': 39820, 'loss/train': 1.3265875577926636} -11/07/2021 02:49:35 - INFO - __main__ - Step 39822: {'lr': 0.00042366925820925915, 'samples': 7645824, 'steps': 39821, 'loss/train': 1.3526073694229126} -11/07/2021 02:49:36 - INFO - __main__ - Step 39823: {'lr': 0.0004236654409133548, 'samples': 7646016, 'steps': 39822, 'loss/train': 1.3544975519180298} -11/07/2021 02:49:36 - INFO - __main__ - Step 39824: {'lr': 0.0004236616235391995, 'samples': 7646208, 'steps': 39823, 'loss/train': 1.2097423076629639} -11/07/2021 02:49:36 - INFO - __main__ - Step 39825: {'lr': 0.0004236578060867949, 'samples': 7646400, 'steps': 39824, 'loss/train': 1.4299346208572388} -11/07/2021 02:49:37 - INFO - __main__ - Step 39826: {'lr': 0.0004236539885561427, 'samples': 7646592, 'steps': 39825, 'loss/train': 1.4713175296783447} -11/07/2021 02:49:38 - INFO - __main__ - Step 39827: {'lr': 0.0004236501709472448, 'samples': 7646784, 'steps': 39826, 'loss/train': 0.9976240396499634} -11/07/2021 02:49:38 - INFO - __main__ - Step 39828: {'lr': 0.00042364635326010277, 'samples': 7646976, 'steps': 39827, 'loss/train': 1.8949692249298096} -11/07/2021 02:49:38 - INFO - __main__ - Step 39829: {'lr': 0.0004236425354947183, 'samples': 7647168, 'steps': 39828, 'loss/train': 1.5358874797821045} -11/07/2021 02:49:39 - INFO - __main__ - Step 39830: {'lr': 0.0004236387176510933, 'samples': 7647360, 'steps': 39829, 'loss/train': 1.5187652111053467} -11/07/2021 02:49:39 - INFO - __main__ - Step 39831: {'lr': 0.00042363489972922937, 'samples': 7647552, 'steps': 39830, 'loss/train': 1.2138946056365967} -11/07/2021 02:49:40 - INFO - __main__ - Step 39832: {'lr': 0.00042363108172912824, 'samples': 7647744, 'steps': 39831, 'loss/train': 1.8676568269729614} -11/07/2021 02:49:40 - INFO - __main__ - Step 39833: {'lr': 0.0004236272636507915, 'samples': 7647936, 'steps': 39832, 'loss/train': 1.081512689590454} -11/07/2021 02:49:41 - INFO - __main__ - Step 39834: {'lr': 0.0004236234454942211, 'samples': 7648128, 'steps': 39833, 'loss/train': 1.7128548622131348} -11/07/2021 02:49:41 - INFO - __main__ - Step 39835: {'lr': 0.0004236196272594186, 'samples': 7648320, 'steps': 39834, 'loss/train': 1.5928826332092285} -11/07/2021 02:49:41 - INFO - __main__ - Step 39836: {'lr': 0.00042361580894638586, 'samples': 7648512, 'steps': 39835, 'loss/train': 1.5246357917785645} -11/07/2021 02:49:42 - INFO - __main__ - Step 39837: {'lr': 0.0004236119905551244, 'samples': 7648704, 'steps': 39836, 'loss/train': 1.721874713897705} -11/07/2021 02:49:43 - INFO - __main__ - Step 39838: {'lr': 0.0004236081720856362, 'samples': 7648896, 'steps': 39837, 'loss/train': 1.6592479944229126} -11/07/2021 02:49:43 - INFO - __main__ - Step 39839: {'lr': 0.0004236043535379227, 'samples': 7649088, 'steps': 39838, 'loss/train': 1.5822508335113525} -11/07/2021 02:49:43 - INFO - __main__ - Step 39840: {'lr': 0.0004236005349119858, 'samples': 7649280, 'steps': 39839, 'loss/train': 1.6861557960510254} -11/07/2021 02:49:44 - INFO - __main__ - Step 39841: {'lr': 0.0004235967162078272, 'samples': 7649472, 'steps': 39840, 'loss/train': 0.9433187246322632} -11/07/2021 02:49:44 - INFO - __main__ - Step 39842: {'lr': 0.0004235928974254486, 'samples': 7649664, 'steps': 39841, 'loss/train': 1.473461627960205} -11/07/2021 02:49:45 - INFO - __main__ - Step 39843: {'lr': 0.00042358907856485166, 'samples': 7649856, 'steps': 39842, 'loss/train': 1.4653620719909668} -11/07/2021 02:49:45 - INFO - __main__ - Step 39844: {'lr': 0.0004235852596260382, 'samples': 7650048, 'steps': 39843, 'loss/train': 1.425424575805664} -11/07/2021 02:49:46 - INFO - __main__ - Step 39845: {'lr': 0.0004235814406090099, 'samples': 7650240, 'steps': 39844, 'loss/train': 1.3061177730560303} -11/07/2021 02:49:46 - INFO - __main__ - Step 39846: {'lr': 0.0004235776215137686, 'samples': 7650432, 'steps': 39845, 'loss/train': 0.9308658242225647} -11/07/2021 02:49:47 - INFO - __main__ - Step 39847: {'lr': 0.0004235738023403157, 'samples': 7650624, 'steps': 39846, 'loss/train': 1.448547124862671} -11/07/2021 02:49:47 - INFO - __main__ - Step 39848: {'lr': 0.00042356998308865323, 'samples': 7650816, 'steps': 39847, 'loss/train': 2.0486652851104736} -11/07/2021 02:49:48 - INFO - __main__ - Step 39849: {'lr': 0.00042356616375878274, 'samples': 7651008, 'steps': 39848, 'loss/train': 1.8110203742980957} -11/07/2021 02:49:48 - INFO - __main__ - Step 39850: {'lr': 0.00042356234435070604, 'samples': 7651200, 'steps': 39849, 'loss/train': 1.2810955047607422} -11/07/2021 02:49:49 - INFO - __main__ - Step 39851: {'lr': 0.0004235585248644249, 'samples': 7651392, 'steps': 39850, 'loss/train': 1.4850274324417114} -11/07/2021 02:49:49 - INFO - __main__ - Step 39852: {'lr': 0.0004235547052999409, 'samples': 7651584, 'steps': 39851, 'loss/train': 1.3674862384796143} -11/07/2021 02:49:50 - INFO - __main__ - Step 39853: {'lr': 0.00042355088565725584, 'samples': 7651776, 'steps': 39852, 'loss/train': 1.4045926332473755} -11/07/2021 02:49:50 - INFO - __main__ - Step 39854: {'lr': 0.0004235470659363714, 'samples': 7651968, 'steps': 39853, 'loss/train': 1.8996695280075073} -11/07/2021 02:49:51 - INFO - __main__ - Step 39855: {'lr': 0.0004235432461372894, 'samples': 7652160, 'steps': 39854, 'loss/train': 1.3678069114685059} -11/07/2021 02:49:51 - INFO - __main__ - Step 39856: {'lr': 0.0004235394262600114, 'samples': 7652352, 'steps': 39855, 'loss/train': 1.801565170288086} -11/07/2021 02:49:51 - INFO - __main__ - Step 39857: {'lr': 0.0004235356063045393, 'samples': 7652544, 'steps': 39856, 'loss/train': 0.8615394234657288} -11/07/2021 02:49:52 - INFO - __main__ - Step 39858: {'lr': 0.0004235317862708747, 'samples': 7652736, 'steps': 39857, 'loss/train': 1.7578961849212646} -11/07/2021 02:49:53 - INFO - __main__ - Step 39859: {'lr': 0.00042352796615901937, 'samples': 7652928, 'steps': 39858, 'loss/train': 1.4292079210281372} -11/07/2021 02:49:53 - INFO - __main__ - Step 39860: {'lr': 0.000423524145968975, 'samples': 7653120, 'steps': 39859, 'loss/train': 1.4792885780334473} -11/07/2021 02:49:53 - INFO - __main__ - Step 39861: {'lr': 0.00042352032570074327, 'samples': 7653312, 'steps': 39860, 'loss/train': 1.4000568389892578} -11/07/2021 02:49:54 - INFO - __main__ - Step 39862: {'lr': 0.00042351650535432607, 'samples': 7653504, 'steps': 39861, 'loss/train': 1.2337876558303833} -11/07/2021 02:49:55 - INFO - __main__ - Step 39863: {'lr': 0.00042351268492972494, 'samples': 7653696, 'steps': 39862, 'loss/train': 1.6213442087173462} -11/07/2021 02:49:55 - INFO - __main__ - Step 39864: {'lr': 0.0004235088644269417, 'samples': 7653888, 'steps': 39863, 'loss/train': 1.136330246925354} -11/07/2021 02:49:56 - INFO - __main__ - Step 39865: {'lr': 0.00042350504384597803, 'samples': 7654080, 'steps': 39864, 'loss/train': 1.6284946203231812} -11/07/2021 02:49:56 - INFO - __main__ - Step 39866: {'lr': 0.0004235012231868357, 'samples': 7654272, 'steps': 39865, 'loss/train': 1.7181075811386108} -11/07/2021 02:49:56 - INFO - __main__ - Step 39867: {'lr': 0.0004234974024495163, 'samples': 7654464, 'steps': 39866, 'loss/train': 0.9383137822151184} -11/07/2021 02:49:57 - INFO - __main__ - Step 39868: {'lr': 0.00042349358163402175, 'samples': 7654656, 'steps': 39867, 'loss/train': 2.038564920425415} -11/07/2021 02:49:58 - INFO - __main__ - Step 39869: {'lr': 0.0004234897607403536, 'samples': 7654848, 'steps': 39868, 'loss/train': 1.292812705039978} -11/07/2021 02:49:58 - INFO - __main__ - Step 39870: {'lr': 0.0004234859397685137, 'samples': 7655040, 'steps': 39869, 'loss/train': 1.2042925357818604} -11/07/2021 02:49:58 - INFO - __main__ - Step 39871: {'lr': 0.0004234821187185036, 'samples': 7655232, 'steps': 39870, 'loss/train': 1.6875336170196533} -11/07/2021 02:49:59 - INFO - __main__ - Step 39872: {'lr': 0.0004234782975903253, 'samples': 7655424, 'steps': 39871, 'loss/train': 1.6400891542434692} -11/07/2021 02:49:59 - INFO - __main__ - Step 39873: {'lr': 0.00042347447638398024, 'samples': 7655616, 'steps': 39872, 'loss/train': 1.468469500541687} -11/07/2021 02:50:00 - INFO - __main__ - Step 39874: {'lr': 0.00042347065509947023, 'samples': 7655808, 'steps': 39873, 'loss/train': 1.1016398668289185} -11/07/2021 02:50:00 - INFO - __main__ - Step 39875: {'lr': 0.0004234668337367971, 'samples': 7656000, 'steps': 39874, 'loss/train': 1.3569303750991821} -11/07/2021 02:50:01 - INFO - __main__ - Step 39876: {'lr': 0.0004234630122959625, 'samples': 7656192, 'steps': 39875, 'loss/train': 1.2579153776168823} -11/07/2021 02:50:01 - INFO - __main__ - Step 39877: {'lr': 0.0004234591907769681, 'samples': 7656384, 'steps': 39876, 'loss/train': 1.3981540203094482} -11/07/2021 02:50:01 - INFO - __main__ - Step 39878: {'lr': 0.0004234553691798156, 'samples': 7656576, 'steps': 39877, 'loss/train': 1.766584873199463} -11/07/2021 02:50:03 - INFO - __main__ - Step 39879: {'lr': 0.000423451547504507, 'samples': 7656768, 'steps': 39878, 'loss/train': 1.8074575662612915} -11/07/2021 02:50:03 - INFO - __main__ - Step 39880: {'lr': 0.0004234477257510436, 'samples': 7656960, 'steps': 39879, 'loss/train': 1.5272505283355713} -11/07/2021 02:50:03 - INFO - __main__ - Step 39881: {'lr': 0.00042344390391942745, 'samples': 7657152, 'steps': 39880, 'loss/train': 1.7444243431091309} -11/07/2021 02:50:04 - INFO - __main__ - Step 39882: {'lr': 0.0004234400820096601, 'samples': 7657344, 'steps': 39881, 'loss/train': 1.6279277801513672} -11/07/2021 02:50:04 - INFO - __main__ - Step 39883: {'lr': 0.0004234362600217433, 'samples': 7657536, 'steps': 39882, 'loss/train': 1.5940405130386353} -11/07/2021 02:50:05 - INFO - __main__ - Step 39884: {'lr': 0.0004234324379556789, 'samples': 7657728, 'steps': 39883, 'loss/train': 1.443777322769165} -11/07/2021 02:50:05 - INFO - __main__ - Step 39885: {'lr': 0.0004234286158114684, 'samples': 7657920, 'steps': 39884, 'loss/train': 1.5703567266464233} -11/07/2021 02:50:06 - INFO - __main__ - Step 39886: {'lr': 0.0004234247935891137, 'samples': 7658112, 'steps': 39885, 'loss/train': 1.7871206998825073} -11/07/2021 02:50:06 - INFO - __main__ - Step 39887: {'lr': 0.00042342097128861647, 'samples': 7658304, 'steps': 39886, 'loss/train': 1.869883418083191} -11/07/2021 02:50:06 - INFO - __main__ - Step 39888: {'lr': 0.0004234171489099784, 'samples': 7658496, 'steps': 39887, 'loss/train': 1.3405208587646484} -11/07/2021 02:50:07 - INFO - __main__ - Step 39889: {'lr': 0.00042341332645320126, 'samples': 7658688, 'steps': 39888, 'loss/train': 1.503919243812561} -11/07/2021 02:50:08 - INFO - __main__ - Step 39890: {'lr': 0.0004234095039182867, 'samples': 7658880, 'steps': 39889, 'loss/train': 0.8980141282081604} -11/07/2021 02:50:08 - INFO - __main__ - Step 39891: {'lr': 0.00042340568130523653, 'samples': 7659072, 'steps': 39890, 'loss/train': 1.4018449783325195} -11/07/2021 02:50:08 - INFO - __main__ - Step 39892: {'lr': 0.0004234018586140525, 'samples': 7659264, 'steps': 39891, 'loss/train': 1.499969482421875} -11/07/2021 02:50:09 - INFO - __main__ - Step 39893: {'lr': 0.00042339803584473626, 'samples': 7659456, 'steps': 39892, 'loss/train': 1.4663480520248413} -11/07/2021 02:50:09 - INFO - __main__ - Step 39894: {'lr': 0.0004233942129972894, 'samples': 7659648, 'steps': 39893, 'loss/train': 1.5299068689346313} -11/07/2021 02:50:10 - INFO - __main__ - Step 39895: {'lr': 0.00042339039007171386, 'samples': 7659840, 'steps': 39894, 'loss/train': 2.0362446308135986} -11/07/2021 02:50:11 - INFO - __main__ - Step 39896: {'lr': 0.00042338656706801135, 'samples': 7660032, 'steps': 39895, 'loss/train': 1.2440659999847412} -11/07/2021 02:50:11 - INFO - __main__ - Step 39897: {'lr': 0.00042338274398618346, 'samples': 7660224, 'steps': 39896, 'loss/train': 1.6488834619522095} -11/07/2021 02:50:11 - INFO - __main__ - Step 39898: {'lr': 0.000423378920826232, 'samples': 7660416, 'steps': 39897, 'loss/train': 3.15498423576355} -11/07/2021 02:50:12 - INFO - __main__ - Step 39899: {'lr': 0.0004233750975881587, 'samples': 7660608, 'steps': 39898, 'loss/train': 1.5884058475494385} -11/07/2021 02:50:13 - INFO - __main__ - Step 39900: {'lr': 0.0004233712742719652, 'samples': 7660800, 'steps': 39899, 'loss/train': 1.2452188730239868} -11/07/2021 02:50:13 - INFO - __main__ - Step 39901: {'lr': 0.0004233674508776533, 'samples': 7660992, 'steps': 39900, 'loss/train': 1.4315701723098755} -11/07/2021 02:50:13 - INFO - __main__ - Step 39902: {'lr': 0.00042336362740522473, 'samples': 7661184, 'steps': 39901, 'loss/train': 1.4178969860076904} -11/07/2021 02:50:14 - INFO - __main__ - Step 39903: {'lr': 0.0004233598038546812, 'samples': 7661376, 'steps': 39902, 'loss/train': 1.5171977281570435} -11/07/2021 02:50:14 - INFO - __main__ - Step 39904: {'lr': 0.0004233559802260244, 'samples': 7661568, 'steps': 39903, 'loss/train': 1.2969151735305786} -11/07/2021 02:50:15 - INFO - __main__ - Step 39905: {'lr': 0.000423352156519256, 'samples': 7661760, 'steps': 39904, 'loss/train': 0.9684048891067505} -11/07/2021 02:50:16 - INFO - __main__ - Step 39906: {'lr': 0.0004233483327343779, 'samples': 7661952, 'steps': 39905, 'loss/train': 1.567678451538086} -11/07/2021 02:50:16 - INFO - __main__ - Step 39907: {'lr': 0.0004233445088713916, 'samples': 7662144, 'steps': 39906, 'loss/train': 0.30363214015960693} -11/07/2021 02:50:16 - INFO - __main__ - Step 39908: {'lr': 0.000423340684930299, 'samples': 7662336, 'steps': 39907, 'loss/train': 1.196516752243042} -11/07/2021 02:50:17 - INFO - __main__ - Step 39909: {'lr': 0.0004233368609111018, 'samples': 7662528, 'steps': 39908, 'loss/train': 1.5008447170257568} -11/07/2021 02:50:18 - INFO - __main__ - Step 39910: {'lr': 0.00042333303681380165, 'samples': 7662720, 'steps': 39909, 'loss/train': 1.294662594795227} -11/07/2021 02:50:18 - INFO - __main__ - Step 39911: {'lr': 0.0004233292126384003, 'samples': 7662912, 'steps': 39910, 'loss/train': 1.9347686767578125} -11/07/2021 02:50:18 - INFO - __main__ - Step 39912: {'lr': 0.00042332538838489955, 'samples': 7663104, 'steps': 39911, 'loss/train': 1.5069063901901245} -11/07/2021 02:50:19 - INFO - __main__ - Step 39913: {'lr': 0.0004233215640533009, 'samples': 7663296, 'steps': 39912, 'loss/train': 1.3123886585235596} -11/07/2021 02:50:19 - INFO - __main__ - Step 39914: {'lr': 0.0004233177396436064, 'samples': 7663488, 'steps': 39913, 'loss/train': 1.651315689086914} -11/07/2021 02:50:19 - INFO - __main__ - Step 39915: {'lr': 0.00042331391515581753, 'samples': 7663680, 'steps': 39914, 'loss/train': 1.380843997001648} -11/07/2021 02:50:20 - INFO - __main__ - Step 39916: {'lr': 0.00042331009058993604, 'samples': 7663872, 'steps': 39915, 'loss/train': 0.7182490825653076} -11/07/2021 02:50:21 - INFO - __main__ - Step 39917: {'lr': 0.00042330626594596374, 'samples': 7664064, 'steps': 39916, 'loss/train': 1.447251319885254} -11/07/2021 02:50:21 - INFO - __main__ - Step 39918: {'lr': 0.00042330244122390227, 'samples': 7664256, 'steps': 39917, 'loss/train': 1.3649463653564453} -11/07/2021 02:50:21 - INFO - __main__ - Step 39919: {'lr': 0.00042329861642375347, 'samples': 7664448, 'steps': 39918, 'loss/train': 1.5415047407150269} -11/07/2021 02:50:22 - INFO - __main__ - Step 39920: {'lr': 0.00042329479154551897, 'samples': 7664640, 'steps': 39919, 'loss/train': 1.8297853469848633} -11/07/2021 02:50:23 - INFO - __main__ - Step 39921: {'lr': 0.0004232909665892005, 'samples': 7664832, 'steps': 39920, 'loss/train': 0.19549989700317383} -11/07/2021 02:50:23 - INFO - __main__ - Step 39922: {'lr': 0.00042328714155479973, 'samples': 7665024, 'steps': 39921, 'loss/train': 2.007741689682007} -11/07/2021 02:50:23 - INFO - __main__ - Step 39923: {'lr': 0.0004232833164423185, 'samples': 7665216, 'steps': 39922, 'loss/train': 0.6382672786712646} -11/07/2021 02:50:24 - INFO - __main__ - Step 39924: {'lr': 0.00042327949125175844, 'samples': 7665408, 'steps': 39923, 'loss/train': 1.445731282234192} -11/07/2021 02:50:24 - INFO - __main__ - Step 39925: {'lr': 0.0004232756659831214, 'samples': 7665600, 'steps': 39924, 'loss/train': 2.180142641067505} -11/07/2021 02:50:25 - INFO - __main__ - Step 39926: {'lr': 0.000423271840636409, 'samples': 7665792, 'steps': 39925, 'loss/train': 1.5678489208221436} -11/07/2021 02:50:25 - INFO - __main__ - Step 39927: {'lr': 0.00042326801521162295, 'samples': 7665984, 'steps': 39926, 'loss/train': 1.4961837530136108} -11/07/2021 02:50:26 - INFO - __main__ - Step 39928: {'lr': 0.000423264189708765, 'samples': 7666176, 'steps': 39927, 'loss/train': 1.2989650964736938} -11/07/2021 02:50:26 - INFO - __main__ - Step 39929: {'lr': 0.0004232603641278369, 'samples': 7666368, 'steps': 39928, 'loss/train': 0.9029120802879333} -11/07/2021 02:50:26 - INFO - __main__ - Step 39930: {'lr': 0.00042325653846884037, 'samples': 7666560, 'steps': 39929, 'loss/train': 1.4112350940704346} -11/07/2021 02:50:28 - INFO - __main__ - Step 39931: {'lr': 0.00042325271273177707, 'samples': 7666752, 'steps': 39930, 'loss/train': 1.0451306104660034} -11/07/2021 02:50:28 - INFO - __main__ - Step 39932: {'lr': 0.0004232488869166488, 'samples': 7666944, 'steps': 39931, 'loss/train': 1.7143346071243286} -11/07/2021 02:50:28 - INFO - __main__ - Step 39933: {'lr': 0.0004232450610234573, 'samples': 7667136, 'steps': 39932, 'loss/train': 1.4348359107971191} -11/07/2021 02:50:29 - INFO - __main__ - Step 39934: {'lr': 0.00042324123505220414, 'samples': 7667328, 'steps': 39933, 'loss/train': 1.8266007900238037} -11/07/2021 02:50:29 - INFO - __main__ - Step 39935: {'lr': 0.0004232374090028912, 'samples': 7667520, 'steps': 39934, 'loss/train': 1.6461167335510254} -11/07/2021 02:50:30 - INFO - __main__ - Step 39936: {'lr': 0.00042323358287552017, 'samples': 7667712, 'steps': 39935, 'loss/train': 1.599936842918396} -11/07/2021 02:50:30 - INFO - __main__ - Step 39937: {'lr': 0.0004232297566700928, 'samples': 7667904, 'steps': 39936, 'loss/train': 1.6643856763839722} -11/07/2021 02:50:31 - INFO - __main__ - Step 39938: {'lr': 0.00042322593038661074, 'samples': 7668096, 'steps': 39937, 'loss/train': 1.547898769378662} -11/07/2021 02:50:31 - INFO - __main__ - Step 39939: {'lr': 0.0004232221040250758, 'samples': 7668288, 'steps': 39938, 'loss/train': 1.211232304573059} -11/07/2021 02:50:31 - INFO - __main__ - Step 39940: {'lr': 0.00042321827758548953, 'samples': 7668480, 'steps': 39939, 'loss/train': 1.2328039407730103} -11/07/2021 02:50:32 - INFO - __main__ - Step 39941: {'lr': 0.00042321445106785385, 'samples': 7668672, 'steps': 39940, 'loss/train': 1.5373095273971558} -11/07/2021 02:50:33 - INFO - __main__ - Step 39942: {'lr': 0.0004232106244721704, 'samples': 7668864, 'steps': 39941, 'loss/train': 1.4850554466247559} -11/07/2021 02:50:33 - INFO - __main__ - Step 39943: {'lr': 0.0004232067977984409, 'samples': 7669056, 'steps': 39942, 'loss/train': 1.7178964614868164} -11/07/2021 02:50:33 - INFO - __main__ - Step 39944: {'lr': 0.0004232029710466671, 'samples': 7669248, 'steps': 39943, 'loss/train': 1.740206003189087} -11/07/2021 02:50:34 - INFO - __main__ - Step 39945: {'lr': 0.00042319914421685067, 'samples': 7669440, 'steps': 39944, 'loss/train': 1.894906997680664} -11/07/2021 02:50:35 - INFO - __main__ - Step 39946: {'lr': 0.0004231953173089935, 'samples': 7669632, 'steps': 39945, 'loss/train': 0.6198977828025818} -11/07/2021 02:50:35 - INFO - __main__ - Step 39947: {'lr': 0.00042319149032309713, 'samples': 7669824, 'steps': 39946, 'loss/train': 1.033416986465454} -11/07/2021 02:50:36 - INFO - __main__ - Step 39948: {'lr': 0.00042318766325916336, 'samples': 7670016, 'steps': 39947, 'loss/train': 1.8405121564865112} -11/07/2021 02:50:36 - INFO - __main__ - Step 39949: {'lr': 0.00042318383611719386, 'samples': 7670208, 'steps': 39948, 'loss/train': 0.4601535201072693} -11/07/2021 02:50:36 - INFO - __main__ - Step 39950: {'lr': 0.00042318000889719044, 'samples': 7670400, 'steps': 39949, 'loss/train': 1.8714054822921753} -11/07/2021 02:50:37 - INFO - __main__ - Step 39951: {'lr': 0.0004231761815991547, 'samples': 7670592, 'steps': 39950, 'loss/train': 0.18940521776676178} -11/07/2021 02:50:38 - INFO - __main__ - Step 39952: {'lr': 0.0004231723542230885, 'samples': 7670784, 'steps': 39951, 'loss/train': 1.4010276794433594} -11/07/2021 02:50:38 - INFO - __main__ - Step 39953: {'lr': 0.0004231685267689935, 'samples': 7670976, 'steps': 39952, 'loss/train': 1.1936516761779785} -11/07/2021 02:50:38 - INFO - __main__ - Step 39954: {'lr': 0.0004231646992368715, 'samples': 7671168, 'steps': 39953, 'loss/train': 1.1189135313034058} -11/07/2021 02:50:39 - INFO - __main__ - Step 39955: {'lr': 0.00042316087162672415, 'samples': 7671360, 'steps': 39954, 'loss/train': 1.3866944313049316} -11/07/2021 02:50:40 - INFO - __main__ - Step 39956: {'lr': 0.0004231570439385531, 'samples': 7671552, 'steps': 39955, 'loss/train': 2.2703516483306885} -11/07/2021 02:50:40 - INFO - __main__ - Step 39957: {'lr': 0.0004231532161723602, 'samples': 7671744, 'steps': 39956, 'loss/train': 1.7356328964233398} -11/07/2021 02:50:41 - INFO - __main__ - Step 39958: {'lr': 0.0004231493883281471, 'samples': 7671936, 'steps': 39957, 'loss/train': 1.8447068929672241} -11/07/2021 02:50:41 - INFO - __main__ - Step 39959: {'lr': 0.00042314556040591567, 'samples': 7672128, 'steps': 39958, 'loss/train': 1.6826385259628296} -11/07/2021 02:50:41 - INFO - __main__ - Step 39960: {'lr': 0.0004231417324056674, 'samples': 7672320, 'steps': 39959, 'loss/train': 1.5038126707077026} -11/07/2021 02:50:42 - INFO - __main__ - Step 39961: {'lr': 0.00042313790432740416, 'samples': 7672512, 'steps': 39960, 'loss/train': 1.671659231185913} -11/07/2021 02:50:43 - INFO - __main__ - Step 39962: {'lr': 0.00042313407617112765, 'samples': 7672704, 'steps': 39961, 'loss/train': 1.5262469053268433} -11/07/2021 02:50:43 - INFO - __main__ - Step 39963: {'lr': 0.00042313024793683965, 'samples': 7672896, 'steps': 39962, 'loss/train': 1.3900421857833862} -11/07/2021 02:50:43 - INFO - __main__ - Step 39964: {'lr': 0.0004231264196245418, 'samples': 7673088, 'steps': 39963, 'loss/train': 0.8114240765571594} -11/07/2021 02:50:44 - INFO - __main__ - Step 39965: {'lr': 0.00042312259123423584, 'samples': 7673280, 'steps': 39964, 'loss/train': 1.3081835508346558} -11/07/2021 02:50:44 - INFO - __main__ - Step 39966: {'lr': 0.00042311876276592355, 'samples': 7673472, 'steps': 39965, 'loss/train': 1.5169175863265991} -11/07/2021 02:50:45 - INFO - __main__ - Step 39967: {'lr': 0.00042311493421960656, 'samples': 7673664, 'steps': 39966, 'loss/train': 1.569330096244812} -11/07/2021 02:50:45 - INFO - __main__ - Step 39968: {'lr': 0.0004231111055952867, 'samples': 7673856, 'steps': 39967, 'loss/train': 1.5341840982437134} -11/07/2021 02:50:46 - INFO - __main__ - Step 39969: {'lr': 0.00042310727689296563, 'samples': 7674048, 'steps': 39968, 'loss/train': 0.4142704904079437} -11/07/2021 02:50:46 - INFO - __main__ - Step 39970: {'lr': 0.0004231034481126451, 'samples': 7674240, 'steps': 39969, 'loss/train': 1.8657910823822021} -11/07/2021 02:50:46 - INFO - __main__ - Step 39971: {'lr': 0.0004230996192543268, 'samples': 7674432, 'steps': 39970, 'loss/train': 1.4104971885681152} -11/07/2021 02:50:48 - INFO - __main__ - Step 39972: {'lr': 0.0004230957903180125, 'samples': 7674624, 'steps': 39971, 'loss/train': 0.7122201919555664} -11/07/2021 02:50:48 - INFO - __main__ - Step 39973: {'lr': 0.00042309196130370396, 'samples': 7674816, 'steps': 39972, 'loss/train': 1.4492918252944946} -11/07/2021 02:50:48 - INFO - __main__ - Step 39974: {'lr': 0.00042308813221140275, 'samples': 7675008, 'steps': 39973, 'loss/train': 1.5777790546417236} -11/07/2021 02:50:49 - INFO - __main__ - Step 39975: {'lr': 0.00042308430304111076, 'samples': 7675200, 'steps': 39974, 'loss/train': 1.6017565727233887} -11/07/2021 02:50:49 - INFO - __main__ - Step 39976: {'lr': 0.00042308047379282967, 'samples': 7675392, 'steps': 39975, 'loss/train': 2.0214884281158447} -11/07/2021 02:50:50 - INFO - __main__ - Step 39977: {'lr': 0.00042307664446656116, 'samples': 7675584, 'steps': 39976, 'loss/train': 1.8707165718078613} -11/07/2021 02:50:50 - INFO - __main__ - Step 39978: {'lr': 0.000423072815062307, 'samples': 7675776, 'steps': 39977, 'loss/train': 1.5159759521484375} -11/07/2021 02:50:51 - INFO - __main__ - Step 39979: {'lr': 0.0004230689855800689, 'samples': 7675968, 'steps': 39978, 'loss/train': 1.1753299236297607} -11/07/2021 02:50:51 - INFO - __main__ - Step 39980: {'lr': 0.0004230651560198486, 'samples': 7676160, 'steps': 39979, 'loss/train': 1.4214001893997192} -11/07/2021 02:50:51 - INFO - __main__ - Step 39981: {'lr': 0.0004230613263816478, 'samples': 7676352, 'steps': 39980, 'loss/train': 1.6573978662490845} -11/07/2021 02:50:52 - INFO - __main__ - Step 39982: {'lr': 0.0004230574966654682, 'samples': 7676544, 'steps': 39981, 'loss/train': 1.2650606632232666} -11/07/2021 02:50:53 - INFO - __main__ - Step 39983: {'lr': 0.0004230536668713116, 'samples': 7676736, 'steps': 39982, 'loss/train': 1.456331491470337} -11/07/2021 02:50:53 - INFO - __main__ - Step 39984: {'lr': 0.00042304983699917965, 'samples': 7676928, 'steps': 39983, 'loss/train': 1.0845017433166504} -11/07/2021 02:50:53 - INFO - __main__ - Step 39985: {'lr': 0.00042304600704907416, 'samples': 7677120, 'steps': 39984, 'loss/train': 1.2177273035049438} -11/07/2021 02:50:54 - INFO - __main__ - Step 39986: {'lr': 0.0004230421770209968, 'samples': 7677312, 'steps': 39985, 'loss/train': 1.704351782798767} -11/07/2021 02:50:55 - INFO - __main__ - Step 39987: {'lr': 0.0004230383469149493, 'samples': 7677504, 'steps': 39986, 'loss/train': 1.204689860343933} -11/07/2021 02:50:55 - INFO - __main__ - Step 39988: {'lr': 0.0004230345167309334, 'samples': 7677696, 'steps': 39987, 'loss/train': 1.5267856121063232} -11/07/2021 02:50:55 - INFO - __main__ - Step 39989: {'lr': 0.00042303068646895077, 'samples': 7677888, 'steps': 39988, 'loss/train': 1.614537000656128} -11/07/2021 02:50:56 - INFO - __main__ - Step 39990: {'lr': 0.0004230268561290032, 'samples': 7678080, 'steps': 39989, 'loss/train': 1.267861247062683} -11/07/2021 02:50:56 - INFO - __main__ - Step 39991: {'lr': 0.0004230230257110924, 'samples': 7678272, 'steps': 39990, 'loss/train': 0.7846195101737976} -11/07/2021 02:50:57 - INFO - __main__ - Step 39992: {'lr': 0.00042301919521522014, 'samples': 7678464, 'steps': 39991, 'loss/train': 2.2181107997894287} -11/07/2021 02:50:57 - INFO - __main__ - Step 39993: {'lr': 0.0004230153646413881, 'samples': 7678656, 'steps': 39992, 'loss/train': 1.6313539743423462} -11/07/2021 02:50:58 - INFO - __main__ - Step 39994: {'lr': 0.000423011533989598, 'samples': 7678848, 'steps': 39993, 'loss/train': 1.669006586074829} -11/07/2021 02:50:58 - INFO - __main__ - Step 39995: {'lr': 0.0004230077032598515, 'samples': 7679040, 'steps': 39994, 'loss/train': 2.0103037357330322} -11/07/2021 02:50:59 - INFO - __main__ - Step 39996: {'lr': 0.00042300387245215043, 'samples': 7679232, 'steps': 39995, 'loss/train': 1.4996882677078247} -11/07/2021 02:50:59 - INFO - __main__ - Step 39997: {'lr': 0.00042300004156649654, 'samples': 7679424, 'steps': 39996, 'loss/train': 1.631992220878601} -11/07/2021 02:51:00 - INFO - __main__ - Step 39998: {'lr': 0.0004229962106028914, 'samples': 7679616, 'steps': 39997, 'loss/train': 5.746405601501465} -11/07/2021 02:51:00 - INFO - __main__ - Step 39999: {'lr': 0.0004229923795613369, 'samples': 7679808, 'steps': 39998, 'loss/train': 1.672818899154663} -11/07/2021 02:51:01 - INFO - __main__ - Step 40000: {'lr': 0.00042298854844183476, 'samples': 7680000, 'steps': 39999, 'loss/train': 0.5506977438926697} -11/07/2021 02:51:01 - INFO - __main__ - Step 40001: {'lr': 0.0004229847172443866, 'samples': 7680192, 'steps': 40000, 'loss/train': 1.474384069442749} -11/07/2021 02:51:01 - INFO - __main__ - Step 40002: {'lr': 0.0004229808859689941, 'samples': 7680384, 'steps': 40001, 'loss/train': 0.9800273776054382} -11/07/2021 02:51:02 - INFO - __main__ - Step 40003: {'lr': 0.0004229770546156592, 'samples': 7680576, 'steps': 40002, 'loss/train': 1.1151974201202393} -11/07/2021 02:51:03 - INFO - __main__ - Step 40004: {'lr': 0.00042297322318438345, 'samples': 7680768, 'steps': 40003, 'loss/train': 1.5029839277267456} -11/07/2021 02:51:03 - INFO - __main__ - Step 40005: {'lr': 0.0004229693916751687, 'samples': 7680960, 'steps': 40004, 'loss/train': 1.0324509143829346} -11/07/2021 02:51:04 - INFO - __main__ - Step 40006: {'lr': 0.00042296556008801663, 'samples': 7681152, 'steps': 40005, 'loss/train': 1.5770862102508545} -11/07/2021 02:51:04 - INFO - __main__ - Step 40007: {'lr': 0.0004229617284229289, 'samples': 7681344, 'steps': 40006, 'loss/train': 1.2624397277832031} -11/07/2021 02:51:04 - INFO - __main__ - Step 40008: {'lr': 0.00042295789667990726, 'samples': 7681536, 'steps': 40007, 'loss/train': 1.0099983215332031} -11/07/2021 02:51:05 - INFO - __main__ - Step 40009: {'lr': 0.00042295406485895346, 'samples': 7681728, 'steps': 40008, 'loss/train': 0.8953605890274048} -11/07/2021 02:51:06 - INFO - __main__ - Step 40010: {'lr': 0.0004229502329600692, 'samples': 7681920, 'steps': 40009, 'loss/train': 1.3491777181625366} -11/07/2021 02:51:06 - INFO - __main__ - Step 40011: {'lr': 0.0004229464009832563, 'samples': 7682112, 'steps': 40010, 'loss/train': 1.033262014389038} -11/07/2021 02:51:06 - INFO - __main__ - Step 40012: {'lr': 0.0004229425689285163, 'samples': 7682304, 'steps': 40011, 'loss/train': 1.3582239151000977} -11/07/2021 02:51:07 - INFO - __main__ - Step 40013: {'lr': 0.00042293873679585125, 'samples': 7682496, 'steps': 40012, 'loss/train': 1.4142736196517944} -11/07/2021 02:51:08 - INFO - __main__ - Step 40014: {'lr': 0.00042293490458526257, 'samples': 7682688, 'steps': 40013, 'loss/train': 1.2864668369293213} -11/07/2021 02:51:08 - INFO - __main__ - Step 40015: {'lr': 0.0004229310722967521, 'samples': 7682880, 'steps': 40014, 'loss/train': 1.7777926921844482} -11/07/2021 02:51:09 - INFO - __main__ - Step 40016: {'lr': 0.00042292723993032157, 'samples': 7683072, 'steps': 40015, 'loss/train': 0.7587130069732666} -11/07/2021 02:51:09 - INFO - __main__ - Step 40017: {'lr': 0.0004229234074859726, 'samples': 7683264, 'steps': 40016, 'loss/train': 1.6694526672363281} -11/07/2021 02:51:09 - INFO - __main__ - Step 40018: {'lr': 0.00042291957496370713, 'samples': 7683456, 'steps': 40017, 'loss/train': 1.007763385772705} -11/07/2021 02:51:10 - INFO - __main__ - Step 40019: {'lr': 0.0004229157423635267, 'samples': 7683648, 'steps': 40018, 'loss/train': 1.8507840633392334} -11/07/2021 02:51:11 - INFO - __main__ - Step 40020: {'lr': 0.00042291190968543315, 'samples': 7683840, 'steps': 40019, 'loss/train': 1.412222981452942} -11/07/2021 02:51:11 - INFO - __main__ - Step 40021: {'lr': 0.0004229080769294281, 'samples': 7684032, 'steps': 40020, 'loss/train': 1.9351446628570557} -11/07/2021 02:51:11 - INFO - __main__ - Step 40022: {'lr': 0.00042290424409551343, 'samples': 7684224, 'steps': 40021, 'loss/train': 1.4295390844345093} -11/07/2021 02:51:12 - INFO - __main__ - Step 40023: {'lr': 0.0004229004111836907, 'samples': 7684416, 'steps': 40022, 'loss/train': 1.340185523033142} -11/07/2021 02:51:12 - INFO - __main__ - Step 40024: {'lr': 0.0004228965781939617, 'samples': 7684608, 'steps': 40023, 'loss/train': 1.2513066530227661} -11/07/2021 02:51:13 - INFO - __main__ - Step 40025: {'lr': 0.00042289274512632817, 'samples': 7684800, 'steps': 40024, 'loss/train': 1.5568289756774902} -11/07/2021 02:51:13 - INFO - __main__ - Step 40026: {'lr': 0.00042288891198079194, 'samples': 7684992, 'steps': 40025, 'loss/train': 1.7078965902328491} -11/07/2021 02:51:14 - INFO - __main__ - Step 40027: {'lr': 0.00042288507875735455, 'samples': 7685184, 'steps': 40026, 'loss/train': 1.5051108598709106} -11/07/2021 02:51:14 - INFO - __main__ - Step 40028: {'lr': 0.0004228812454560178, 'samples': 7685376, 'steps': 40027, 'loss/train': 1.5787116289138794} -11/07/2021 02:51:14 - INFO - __main__ - Step 40029: {'lr': 0.0004228774120767835, 'samples': 7685568, 'steps': 40028, 'loss/train': 1.5780994892120361} -11/07/2021 02:51:16 - INFO - __main__ - Step 40030: {'lr': 0.00042287357861965326, 'samples': 7685760, 'steps': 40029, 'loss/train': 1.6224216222763062} -11/07/2021 02:51:17 - INFO - __main__ - Step 40031: {'lr': 0.00042286974508462885, 'samples': 7685952, 'steps': 40030, 'loss/train': 1.374077320098877} -11/07/2021 02:51:17 - INFO - __main__ - Step 40032: {'lr': 0.000422865911471712, 'samples': 7686144, 'steps': 40031, 'loss/train': 1.3748855590820312} -11/07/2021 02:51:17 - INFO - __main__ - Step 40033: {'lr': 0.00042286207778090447, 'samples': 7686336, 'steps': 40032, 'loss/train': 1.6635338068008423} -11/07/2021 02:51:18 - INFO - __main__ - Step 40034: {'lr': 0.00042285824401220787, 'samples': 7686528, 'steps': 40033, 'loss/train': 1.7877252101898193} -11/07/2021 02:51:18 - INFO - __main__ - Step 40035: {'lr': 0.0004228544101656241, 'samples': 7686720, 'steps': 40034, 'loss/train': 2.0744729042053223} -11/07/2021 02:51:18 - INFO - __main__ - Step 40036: {'lr': 0.00042285057624115473, 'samples': 7686912, 'steps': 40035, 'loss/train': 1.5142874717712402} -11/07/2021 02:51:19 - INFO - __main__ - Step 40037: {'lr': 0.0004228467422388016, 'samples': 7687104, 'steps': 40036, 'loss/train': 1.9819977283477783} -11/07/2021 02:51:20 - INFO - __main__ - Step 40038: {'lr': 0.0004228429081585664, 'samples': 7687296, 'steps': 40037, 'loss/train': 1.2760931253433228} -11/07/2021 02:51:20 - INFO - __main__ - Step 40039: {'lr': 0.00042283907400045084, 'samples': 7687488, 'steps': 40038, 'loss/train': 1.119479775428772} -11/07/2021 02:51:20 - INFO - __main__ - Step 40040: {'lr': 0.0004228352397644567, 'samples': 7687680, 'steps': 40039, 'loss/train': 1.8740752935409546} -11/07/2021 02:51:21 - INFO - __main__ - Step 40041: {'lr': 0.0004228314054505856, 'samples': 7687872, 'steps': 40040, 'loss/train': 2.0900299549102783} -11/07/2021 02:51:22 - INFO - __main__ - Step 40042: {'lr': 0.0004228275710588394, 'samples': 7688064, 'steps': 40041, 'loss/train': 1.1090223789215088} -11/07/2021 02:51:22 - INFO - __main__ - Step 40043: {'lr': 0.0004228237365892197, 'samples': 7688256, 'steps': 40042, 'loss/train': 1.7269837856292725} -11/07/2021 02:51:22 - INFO - __main__ - Step 40044: {'lr': 0.00042281990204172837, 'samples': 7688448, 'steps': 40043, 'loss/train': 1.4572423696517944} -11/07/2021 02:51:23 - INFO - __main__ - Step 40045: {'lr': 0.000422816067416367, 'samples': 7688640, 'steps': 40044, 'loss/train': 1.5706082582473755} -11/07/2021 02:51:23 - INFO - __main__ - Step 40046: {'lr': 0.00042281223271313734, 'samples': 7688832, 'steps': 40045, 'loss/train': 1.2158195972442627} -11/07/2021 02:51:24 - INFO - __main__ - Step 40047: {'lr': 0.0004228083979320412, 'samples': 7689024, 'steps': 40046, 'loss/train': 1.4072970151901245} -11/07/2021 02:51:25 - INFO - __main__ - Step 40048: {'lr': 0.00042280456307308034, 'samples': 7689216, 'steps': 40047, 'loss/train': 1.435637354850769} -11/07/2021 02:51:25 - INFO - __main__ - Step 40049: {'lr': 0.0004228007281362563, 'samples': 7689408, 'steps': 40048, 'loss/train': 1.7101787328720093} -11/07/2021 02:51:25 - INFO - __main__ - Step 40050: {'lr': 0.0004227968931215709, 'samples': 7689600, 'steps': 40049, 'loss/train': 1.7233060598373413} -11/07/2021 02:51:26 - INFO - __main__ - Step 40051: {'lr': 0.000422793058029026, 'samples': 7689792, 'steps': 40050, 'loss/train': 1.6261519193649292} -11/07/2021 02:51:26 - INFO - __main__ - Step 40052: {'lr': 0.0004227892228586231, 'samples': 7689984, 'steps': 40051, 'loss/train': 1.8170970678329468} -11/07/2021 02:51:27 - INFO - __main__ - Step 40053: {'lr': 0.0004227853876103641, 'samples': 7690176, 'steps': 40052, 'loss/train': 1.5851227045059204} -11/07/2021 02:51:27 - INFO - __main__ - Step 40054: {'lr': 0.0004227815522842507, 'samples': 7690368, 'steps': 40053, 'loss/train': 1.2808752059936523} -11/07/2021 02:51:28 - INFO - __main__ - Step 40055: {'lr': 0.00042277771688028457, 'samples': 7690560, 'steps': 40054, 'loss/train': 0.8093523979187012} -11/07/2021 02:51:28 - INFO - __main__ - Step 40056: {'lr': 0.0004227738813984675, 'samples': 7690752, 'steps': 40055, 'loss/train': 1.4373022317886353} -11/07/2021 02:51:28 - INFO - __main__ - Step 40057: {'lr': 0.00042277004583880106, 'samples': 7690944, 'steps': 40056, 'loss/train': 1.190751075744629} -11/07/2021 02:51:29 - INFO - __main__ - Step 40058: {'lr': 0.00042276621020128724, 'samples': 7691136, 'steps': 40057, 'loss/train': 1.1999469995498657} -11/07/2021 02:51:30 - INFO - __main__ - Step 40059: {'lr': 0.0004227623744859276, 'samples': 7691328, 'steps': 40058, 'loss/train': 1.6112170219421387} -11/07/2021 02:51:30 - INFO - __main__ - Step 40060: {'lr': 0.0004227585386927239, 'samples': 7691520, 'steps': 40059, 'loss/train': 1.305436372756958} -11/07/2021 02:51:30 - INFO - __main__ - Step 40061: {'lr': 0.0004227547028216778, 'samples': 7691712, 'steps': 40060, 'loss/train': 1.8070495128631592} -11/07/2021 02:51:31 - INFO - __main__ - Step 40062: {'lr': 0.00042275086687279116, 'samples': 7691904, 'steps': 40061, 'loss/train': 1.6936426162719727} -11/07/2021 02:51:32 - INFO - __main__ - Step 40063: {'lr': 0.0004227470308460657, 'samples': 7692096, 'steps': 40062, 'loss/train': 1.5447250604629517} -11/07/2021 02:51:32 - INFO - __main__ - Step 40064: {'lr': 0.000422743194741503, 'samples': 7692288, 'steps': 40063, 'loss/train': 1.3440648317337036} -11/07/2021 02:51:33 - INFO - __main__ - Step 40065: {'lr': 0.00042273935855910487, 'samples': 7692480, 'steps': 40064, 'loss/train': 1.8710362911224365} -11/07/2021 02:51:33 - INFO - __main__ - Step 40066: {'lr': 0.00042273552229887313, 'samples': 7692672, 'steps': 40065, 'loss/train': 1.440974473953247} -11/07/2021 02:51:33 - INFO - __main__ - Step 40067: {'lr': 0.00042273168596080934, 'samples': 7692864, 'steps': 40066, 'loss/train': 1.5752909183502197} -11/07/2021 02:51:34 - INFO - __main__ - Step 40068: {'lr': 0.0004227278495449154, 'samples': 7693056, 'steps': 40067, 'loss/train': 1.2198938131332397} -11/07/2021 02:51:35 - INFO - __main__ - Step 40069: {'lr': 0.0004227240130511929, 'samples': 7693248, 'steps': 40068, 'loss/train': 0.8190735578536987} -11/07/2021 02:51:35 - INFO - __main__ - Step 40070: {'lr': 0.0004227201764796437, 'samples': 7693440, 'steps': 40069, 'loss/train': 1.6285350322723389} -11/07/2021 02:51:35 - INFO - __main__ - Step 40071: {'lr': 0.00042271633983026935, 'samples': 7693632, 'steps': 40070, 'loss/train': 1.406765341758728} -11/07/2021 02:51:36 - INFO - __main__ - Step 40072: {'lr': 0.00042271250310307174, 'samples': 7693824, 'steps': 40071, 'loss/train': 1.2084912061691284} -11/07/2021 02:51:37 - INFO - __main__ - Step 40073: {'lr': 0.0004227086662980525, 'samples': 7694016, 'steps': 40072, 'loss/train': 1.4927854537963867} -11/07/2021 02:51:37 - INFO - __main__ - Step 40074: {'lr': 0.00042270482941521347, 'samples': 7694208, 'steps': 40073, 'loss/train': 1.2841883897781372} -11/07/2021 02:51:37 - INFO - __main__ - Step 40075: {'lr': 0.0004227009924545563, 'samples': 7694400, 'steps': 40074, 'loss/train': 1.3613510131835938} -11/07/2021 02:51:38 - INFO - __main__ - Step 40076: {'lr': 0.00042269715541608265, 'samples': 7694592, 'steps': 40075, 'loss/train': 0.6684977412223816} -11/07/2021 02:51:38 - INFO - __main__ - Step 40077: {'lr': 0.0004226933182997944, 'samples': 7694784, 'steps': 40076, 'loss/train': 1.1968653202056885} -11/07/2021 02:51:39 - INFO - __main__ - Step 40078: {'lr': 0.00042268948110569317, 'samples': 7694976, 'steps': 40077, 'loss/train': 1.1509777307510376} -11/07/2021 02:51:40 - INFO - __main__ - Step 40079: {'lr': 0.00042268564383378073, 'samples': 7695168, 'steps': 40078, 'loss/train': 1.282145380973816} -11/07/2021 02:51:40 - INFO - __main__ - Step 40080: {'lr': 0.00042268180648405884, 'samples': 7695360, 'steps': 40079, 'loss/train': 1.6849303245544434} -11/07/2021 02:51:40 - INFO - __main__ - Step 40081: {'lr': 0.00042267796905652924, 'samples': 7695552, 'steps': 40080, 'loss/train': 1.3607251644134521} -11/07/2021 02:51:41 - INFO - __main__ - Step 40082: {'lr': 0.0004226741315511935, 'samples': 7695744, 'steps': 40081, 'loss/train': 1.2177730798721313} -11/07/2021 02:51:42 - INFO - __main__ - Step 40083: {'lr': 0.00042267029396805345, 'samples': 7695936, 'steps': 40082, 'loss/train': 1.407575011253357} -11/07/2021 02:51:42 - INFO - __main__ - Step 40084: {'lr': 0.0004226664563071109, 'samples': 7696128, 'steps': 40083, 'loss/train': 0.9506791234016418} -11/07/2021 02:51:42 - INFO - __main__ - Step 40085: {'lr': 0.0004226626185683675, 'samples': 7696320, 'steps': 40084, 'loss/train': 1.4657553434371948} -11/07/2021 02:51:43 - INFO - __main__ - Step 40086: {'lr': 0.00042265878075182497, 'samples': 7696512, 'steps': 40085, 'loss/train': 1.5130643844604492} -11/07/2021 02:51:43 - INFO - __main__ - Step 40087: {'lr': 0.0004226549428574851, 'samples': 7696704, 'steps': 40086, 'loss/train': 1.7923390865325928} -11/07/2021 02:51:44 - INFO - __main__ - Step 40088: {'lr': 0.0004226511048853495, 'samples': 7696896, 'steps': 40087, 'loss/train': 1.7920674085617065} -11/07/2021 02:51:44 - INFO - __main__ - Step 40089: {'lr': 0.00042264726683542, 'samples': 7697088, 'steps': 40088, 'loss/train': 1.546301007270813} -11/07/2021 02:51:45 - INFO - __main__ - Step 40090: {'lr': 0.00042264342870769835, 'samples': 7697280, 'steps': 40089, 'loss/train': 1.045566439628601} -11/07/2021 02:51:45 - INFO - __main__ - Step 40091: {'lr': 0.0004226395905021862, 'samples': 7697472, 'steps': 40090, 'loss/train': 1.8828248977661133} -11/07/2021 02:51:45 - INFO - __main__ - Step 40092: {'lr': 0.0004226357522188853, 'samples': 7697664, 'steps': 40091, 'loss/train': 1.5058112144470215} -11/07/2021 02:51:46 - INFO - __main__ - Step 40093: {'lr': 0.0004226319138577974, 'samples': 7697856, 'steps': 40092, 'loss/train': 1.7309236526489258} -11/07/2021 02:51:47 - INFO - __main__ - Step 40094: {'lr': 0.0004226280754189243, 'samples': 7698048, 'steps': 40093, 'loss/train': 1.5191304683685303} -11/07/2021 02:51:47 - INFO - __main__ - Step 40095: {'lr': 0.0004226242369022676, 'samples': 7698240, 'steps': 40094, 'loss/train': 1.419395089149475} -11/07/2021 02:51:48 - INFO - __main__ - Step 40096: {'lr': 0.00042262039830782906, 'samples': 7698432, 'steps': 40095, 'loss/train': 0.8884421586990356} -11/07/2021 02:51:48 - INFO - __main__ - Step 40097: {'lr': 0.00042261655963561043, 'samples': 7698624, 'steps': 40096, 'loss/train': 1.6845612525939941} -11/07/2021 02:51:48 - INFO - __main__ - Step 40098: {'lr': 0.0004226127208856134, 'samples': 7698816, 'steps': 40097, 'loss/train': 1.6713262796401978} -11/07/2021 02:51:49 - INFO - __main__ - Step 40099: {'lr': 0.0004226088820578399, 'samples': 7699008, 'steps': 40098, 'loss/train': 1.7476264238357544} -11/07/2021 02:51:49 - INFO - __main__ - Step 40100: {'lr': 0.00042260504315229136, 'samples': 7699200, 'steps': 40099, 'loss/train': 1.2733943462371826} -11/07/2021 02:51:50 - INFO - __main__ - Step 40101: {'lr': 0.00042260120416896975, 'samples': 7699392, 'steps': 40100, 'loss/train': 1.2876131534576416} -11/07/2021 02:51:50 - INFO - __main__ - Step 40102: {'lr': 0.0004225973651078766, 'samples': 7699584, 'steps': 40101, 'loss/train': 1.56428861618042} -11/07/2021 02:51:51 - INFO - __main__ - Step 40103: {'lr': 0.0004225935259690138, 'samples': 7699776, 'steps': 40102, 'loss/train': 1.4476832151412964} -11/07/2021 02:51:52 - INFO - __main__ - Step 40104: {'lr': 0.00042258968675238295, 'samples': 7699968, 'steps': 40103, 'loss/train': 1.598578929901123} -11/07/2021 02:51:52 - INFO - __main__ - Step 40105: {'lr': 0.00042258584745798595, 'samples': 7700160, 'steps': 40104, 'loss/train': 1.4063727855682373} -11/07/2021 02:51:52 - INFO - __main__ - Step 40106: {'lr': 0.00042258200808582434, 'samples': 7700352, 'steps': 40105, 'loss/train': 1.5410844087600708} -11/07/2021 02:51:53 - INFO - __main__ - Step 40107: {'lr': 0.00042257816863590006, 'samples': 7700544, 'steps': 40106, 'loss/train': 1.3327895402908325} -11/07/2021 02:51:53 - INFO - __main__ - Step 40108: {'lr': 0.0004225743291082146, 'samples': 7700736, 'steps': 40107, 'loss/train': 1.3556232452392578} -11/07/2021 02:51:54 - INFO - __main__ - Step 40109: {'lr': 0.0004225704895027699, 'samples': 7700928, 'steps': 40108, 'loss/train': 1.637282133102417} -11/07/2021 02:51:54 - INFO - __main__ - Step 40110: {'lr': 0.0004225666498195675, 'samples': 7701120, 'steps': 40109, 'loss/train': 1.1232974529266357} -11/07/2021 02:51:55 - INFO - __main__ - Step 40111: {'lr': 0.0004225628100586093, 'samples': 7701312, 'steps': 40110, 'loss/train': 1.66632080078125} -11/07/2021 02:51:55 - INFO - __main__ - Step 40112: {'lr': 0.00042255897021989695, 'samples': 7701504, 'steps': 40111, 'loss/train': 1.9927699565887451} -11/07/2021 02:51:55 - INFO - __main__ - Step 40113: {'lr': 0.0004225551303034322, 'samples': 7701696, 'steps': 40112, 'loss/train': 1.6477985382080078} -11/07/2021 02:51:56 - INFO - __main__ - Step 40114: {'lr': 0.00042255129030921673, 'samples': 7701888, 'steps': 40113, 'loss/train': 1.6133326292037964} -11/07/2021 02:51:57 - INFO - __main__ - Step 40115: {'lr': 0.0004225474502372524, 'samples': 7702080, 'steps': 40114, 'loss/train': 1.1240192651748657} -11/07/2021 02:51:57 - INFO - __main__ - Step 40116: {'lr': 0.00042254361008754076, 'samples': 7702272, 'steps': 40115, 'loss/train': 0.5389991998672485} -11/07/2021 02:51:57 - INFO - __main__ - Step 40117: {'lr': 0.0004225397698600837, 'samples': 7702464, 'steps': 40116, 'loss/train': 1.5630342960357666} -11/07/2021 02:51:58 - INFO - __main__ - Step 40118: {'lr': 0.0004225359295548828, 'samples': 7702656, 'steps': 40117, 'loss/train': 2.005375623703003} -11/07/2021 02:51:58 - INFO - __main__ - Step 40119: {'lr': 0.0004225320891719399, 'samples': 7702848, 'steps': 40118, 'loss/train': 1.270519733428955} -11/07/2021 02:51:59 - INFO - __main__ - Step 40120: {'lr': 0.0004225282487112567, 'samples': 7703040, 'steps': 40119, 'loss/train': 1.010699987411499} -11/07/2021 02:52:00 - INFO - __main__ - Step 40121: {'lr': 0.000422524408172835, 'samples': 7703232, 'steps': 40120, 'loss/train': 1.0963070392608643} -11/07/2021 02:52:00 - INFO - __main__ - Step 40122: {'lr': 0.0004225205675566765, 'samples': 7703424, 'steps': 40121, 'loss/train': 1.7472093105316162} -11/07/2021 02:52:00 - INFO - __main__ - Step 40123: {'lr': 0.00042251672686278275, 'samples': 7703616, 'steps': 40122, 'loss/train': 1.510049819946289} -11/07/2021 02:52:01 - INFO - __main__ - Step 40124: {'lr': 0.0004225128860911557, 'samples': 7703808, 'steps': 40123, 'loss/train': 1.5101922750473022} -11/07/2021 02:52:02 - INFO - __main__ - Step 40125: {'lr': 0.00042250904524179697, 'samples': 7704000, 'steps': 40124, 'loss/train': 1.3982422351837158} -11/07/2021 02:52:02 - INFO - __main__ - Step 40126: {'lr': 0.00042250520431470827, 'samples': 7704192, 'steps': 40125, 'loss/train': 0.7441375851631165} -11/07/2021 02:52:02 - INFO - __main__ - Step 40127: {'lr': 0.00042250136330989154, 'samples': 7704384, 'steps': 40126, 'loss/train': 1.6617443561553955} -11/07/2021 02:52:03 - INFO - __main__ - Step 40128: {'lr': 0.00042249752222734826, 'samples': 7704576, 'steps': 40127, 'loss/train': 2.0717756748199463} -11/07/2021 02:52:03 - INFO - __main__ - Step 40129: {'lr': 0.0004224936810670803, 'samples': 7704768, 'steps': 40128, 'loss/train': 1.5525445938110352} -11/07/2021 02:52:04 - INFO - __main__ - Step 40130: {'lr': 0.0004224898398290893, 'samples': 7704960, 'steps': 40129, 'loss/train': 1.2647972106933594} -11/07/2021 02:52:05 - INFO - __main__ - Step 40131: {'lr': 0.0004224859985133771, 'samples': 7705152, 'steps': 40130, 'loss/train': 1.3948974609375} -11/07/2021 02:52:05 - INFO - __main__ - Step 40132: {'lr': 0.0004224821571199453, 'samples': 7705344, 'steps': 40131, 'loss/train': 1.5660887956619263} -11/07/2021 02:52:05 - INFO - __main__ - Step 40133: {'lr': 0.0004224783156487958, 'samples': 7705536, 'steps': 40132, 'loss/train': 1.4071072340011597} -11/07/2021 02:52:06 - INFO - __main__ - Step 40134: {'lr': 0.0004224744740999302, 'samples': 7705728, 'steps': 40133, 'loss/train': 1.0452232360839844} -11/07/2021 02:52:07 - INFO - __main__ - Step 40135: {'lr': 0.0004224706324733502, 'samples': 7705920, 'steps': 40134, 'loss/train': 1.9273301362991333} -11/07/2021 02:52:07 - INFO - __main__ - Step 40136: {'lr': 0.00042246679076905763, 'samples': 7706112, 'steps': 40135, 'loss/train': 1.8715548515319824} -11/07/2021 02:52:07 - INFO - __main__ - Step 40137: {'lr': 0.00042246294898705416, 'samples': 7706304, 'steps': 40136, 'loss/train': 1.7802073955535889} -11/07/2021 02:52:08 - INFO - __main__ - Step 40138: {'lr': 0.0004224591071273416, 'samples': 7706496, 'steps': 40137, 'loss/train': 1.529614806175232} -11/07/2021 02:52:08 - INFO - __main__ - Step 40139: {'lr': 0.00042245526518992164, 'samples': 7706688, 'steps': 40138, 'loss/train': 1.316225528717041} -11/07/2021 02:52:09 - INFO - __main__ - Step 40140: {'lr': 0.0004224514231747959, 'samples': 7706880, 'steps': 40139, 'loss/train': 1.9425132274627686} -11/07/2021 02:52:09 - INFO - __main__ - Step 40141: {'lr': 0.00042244758108196635, 'samples': 7707072, 'steps': 40140, 'loss/train': 1.6781806945800781} -11/07/2021 02:52:10 - INFO - __main__ - Step 40142: {'lr': 0.00042244373891143453, 'samples': 7707264, 'steps': 40141, 'loss/train': 3.466099739074707} -11/07/2021 02:52:10 - INFO - __main__ - Step 40143: {'lr': 0.00042243989666320217, 'samples': 7707456, 'steps': 40142, 'loss/train': 1.2785730361938477} -11/07/2021 02:52:10 - INFO - __main__ - Step 40144: {'lr': 0.00042243605433727106, 'samples': 7707648, 'steps': 40143, 'loss/train': 1.637807011604309} -11/07/2021 02:52:11 - INFO - __main__ - Step 40145: {'lr': 0.0004224322119336429, 'samples': 7707840, 'steps': 40144, 'loss/train': 1.394010305404663} -11/07/2021 02:52:12 - INFO - __main__ - Step 40146: {'lr': 0.0004224283694523195, 'samples': 7708032, 'steps': 40145, 'loss/train': 1.388095498085022} -11/07/2021 02:52:13 - INFO - __main__ - Step 40147: {'lr': 0.0004224245268933025, 'samples': 7708224, 'steps': 40146, 'loss/train': 1.3383760452270508} -11/07/2021 02:52:13 - INFO - __main__ - Step 40148: {'lr': 0.0004224206842565937, 'samples': 7708416, 'steps': 40147, 'loss/train': 1.5303736925125122} -11/07/2021 02:52:13 - INFO - __main__ - Step 40149: {'lr': 0.0004224168415421948, 'samples': 7708608, 'steps': 40148, 'loss/train': 1.2203428745269775} -11/07/2021 02:52:14 - INFO - __main__ - Step 40150: {'lr': 0.0004224129987501075, 'samples': 7708800, 'steps': 40149, 'loss/train': 1.2419692277908325} -11/07/2021 02:52:15 - INFO - __main__ - Step 40151: {'lr': 0.0004224091558803337, 'samples': 7708992, 'steps': 40150, 'loss/train': 0.2047809660434723} -11/07/2021 02:52:15 - INFO - __main__ - Step 40152: {'lr': 0.0004224053129328748, 'samples': 7709184, 'steps': 40151, 'loss/train': 1.0908914804458618} -11/07/2021 02:52:15 - INFO - __main__ - Step 40153: {'lr': 0.0004224014699077329, 'samples': 7709376, 'steps': 40152, 'loss/train': 2.108187675476074} -11/07/2021 02:52:16 - INFO - __main__ - Step 40154: {'lr': 0.00042239762680490944, 'samples': 7709568, 'steps': 40153, 'loss/train': 1.6479051113128662} -11/07/2021 02:52:16 - INFO - __main__ - Step 40155: {'lr': 0.00042239378362440627, 'samples': 7709760, 'steps': 40154, 'loss/train': 1.5548971891403198} -11/07/2021 02:52:17 - INFO - __main__ - Step 40156: {'lr': 0.0004223899403662251, 'samples': 7709952, 'steps': 40155, 'loss/train': 0.6885210275650024} -11/07/2021 02:52:18 - INFO - __main__ - Step 40157: {'lr': 0.0004223860970303678, 'samples': 7710144, 'steps': 40156, 'loss/train': 1.4032775163650513} -11/07/2021 02:52:18 - INFO - __main__ - Step 40158: {'lr': 0.00042238225361683593, 'samples': 7710336, 'steps': 40157, 'loss/train': 1.1780622005462646} -11/07/2021 02:52:18 - INFO - __main__ - Step 40159: {'lr': 0.00042237841012563126, 'samples': 7710528, 'steps': 40158, 'loss/train': 1.3725476264953613} -11/07/2021 02:52:19 - INFO - __main__ - Step 40160: {'lr': 0.00042237456655675555, 'samples': 7710720, 'steps': 40159, 'loss/train': 1.0629607439041138} -11/07/2021 02:52:20 - INFO - __main__ - Step 40161: {'lr': 0.0004223707229102105, 'samples': 7710912, 'steps': 40160, 'loss/train': 0.9321591258049011} -11/07/2021 02:52:20 - INFO - __main__ - Step 40162: {'lr': 0.0004223668791859979, 'samples': 7711104, 'steps': 40161, 'loss/train': 1.98379385471344} -11/07/2021 02:52:20 - INFO - __main__ - Step 40163: {'lr': 0.00042236303538411934, 'samples': 7711296, 'steps': 40162, 'loss/train': 1.5861923694610596} -11/07/2021 02:52:21 - INFO - __main__ - Step 40164: {'lr': 0.0004223591915045768, 'samples': 7711488, 'steps': 40163, 'loss/train': 1.249192237854004} -11/07/2021 02:52:21 - INFO - __main__ - Step 40165: {'lr': 0.0004223553475473718, 'samples': 7711680, 'steps': 40164, 'loss/train': 1.4634073972702026} -11/07/2021 02:52:21 - INFO - __main__ - Step 40166: {'lr': 0.00042235150351250617, 'samples': 7711872, 'steps': 40165, 'loss/train': 1.8517236709594727} -11/07/2021 02:52:22 - INFO - __main__ - Step 40167: {'lr': 0.00042234765939998156, 'samples': 7712064, 'steps': 40166, 'loss/train': 1.651535153388977} -11/07/2021 02:52:23 - INFO - __main__ - Step 40168: {'lr': 0.00042234381520979983, 'samples': 7712256, 'steps': 40167, 'loss/train': 1.5286800861358643} -11/07/2021 02:52:23 - INFO - __main__ - Step 40169: {'lr': 0.0004223399709419625, 'samples': 7712448, 'steps': 40168, 'loss/train': 2.0702335834503174} -11/07/2021 02:52:23 - INFO - __main__ - Step 40170: {'lr': 0.0004223361265964716, 'samples': 7712640, 'steps': 40169, 'loss/train': 1.5532838106155396} -11/07/2021 02:52:24 - INFO - __main__ - Step 40171: {'lr': 0.0004223322821733286, 'samples': 7712832, 'steps': 40170, 'loss/train': 1.1976006031036377} -11/07/2021 02:52:25 - INFO - __main__ - Step 40172: {'lr': 0.0004223284376725354, 'samples': 7713024, 'steps': 40171, 'loss/train': 1.5690964460372925} -11/07/2021 02:52:25 - INFO - __main__ - Step 40173: {'lr': 0.00042232459309409355, 'samples': 7713216, 'steps': 40172, 'loss/train': 1.2744946479797363} -11/07/2021 02:52:25 - INFO - __main__ - Step 40174: {'lr': 0.00042232074843800494, 'samples': 7713408, 'steps': 40173, 'loss/train': 1.3678518533706665} -11/07/2021 02:52:26 - INFO - __main__ - Step 40175: {'lr': 0.00042231690370427135, 'samples': 7713600, 'steps': 40174, 'loss/train': 1.6584599018096924} -11/07/2021 02:52:26 - INFO - __main__ - Step 40176: {'lr': 0.00042231305889289437, 'samples': 7713792, 'steps': 40175, 'loss/train': 1.1790246963500977} -11/07/2021 02:52:27 - INFO - __main__ - Step 40177: {'lr': 0.00042230921400387576, 'samples': 7713984, 'steps': 40176, 'loss/train': 1.514189600944519} -11/07/2021 02:52:27 - INFO - __main__ - Step 40178: {'lr': 0.0004223053690372173, 'samples': 7714176, 'steps': 40177, 'loss/train': 2.0193939208984375} -11/07/2021 02:52:28 - INFO - __main__ - Step 40179: {'lr': 0.00042230152399292065, 'samples': 7714368, 'steps': 40178, 'loss/train': 1.0819612741470337} -11/07/2021 02:52:28 - INFO - __main__ - Step 40180: {'lr': 0.00042229767887098766, 'samples': 7714560, 'steps': 40179, 'loss/train': 0.5604084730148315} -11/07/2021 02:52:28 - INFO - __main__ - Step 40181: {'lr': 0.00042229383367142, 'samples': 7714752, 'steps': 40180, 'loss/train': 1.6694213151931763} -11/07/2021 02:52:30 - INFO - __main__ - Step 40182: {'lr': 0.0004222899883942194, 'samples': 7714944, 'steps': 40181, 'loss/train': 1.8260314464569092} -11/07/2021 02:52:30 - INFO - __main__ - Step 40183: {'lr': 0.0004222861430393875, 'samples': 7715136, 'steps': 40182, 'loss/train': 1.5716710090637207} -11/07/2021 02:52:30 - INFO - __main__ - Step 40184: {'lr': 0.0004222822976069262, 'samples': 7715328, 'steps': 40183, 'loss/train': 1.618808627128601} -11/07/2021 02:52:31 - INFO - __main__ - Step 40185: {'lr': 0.0004222784520968371, 'samples': 7715520, 'steps': 40184, 'loss/train': 1.6012680530548096} -11/07/2021 02:52:31 - INFO - __main__ - Step 40186: {'lr': 0.0004222746065091221, 'samples': 7715712, 'steps': 40185, 'loss/train': 1.499024510383606} -11/07/2021 02:52:31 - INFO - __main__ - Step 40187: {'lr': 0.0004222707608437827, 'samples': 7715904, 'steps': 40186, 'loss/train': 1.881104826927185} -11/07/2021 02:52:32 - INFO - __main__ - Step 40188: {'lr': 0.00042226691510082083, 'samples': 7716096, 'steps': 40187, 'loss/train': 0.5944708585739136} -11/07/2021 02:52:33 - INFO - __main__ - Step 40189: {'lr': 0.0004222630692802381, 'samples': 7716288, 'steps': 40188, 'loss/train': 1.5961015224456787} -11/07/2021 02:52:33 - INFO - __main__ - Step 40190: {'lr': 0.00042225922338203625, 'samples': 7716480, 'steps': 40189, 'loss/train': 1.6296290159225464} -11/07/2021 02:52:33 - INFO - __main__ - Step 40191: {'lr': 0.00042225537740621713, 'samples': 7716672, 'steps': 40190, 'loss/train': 1.8040450811386108} -11/07/2021 02:52:34 - INFO - __main__ - Step 40192: {'lr': 0.00042225153135278236, 'samples': 7716864, 'steps': 40191, 'loss/train': 0.49315086007118225} -11/07/2021 02:52:35 - INFO - __main__ - Step 40193: {'lr': 0.00042224768522173374, 'samples': 7717056, 'steps': 40192, 'loss/train': 1.218572974205017} -11/07/2021 02:52:35 - INFO - __main__ - Step 40194: {'lr': 0.00042224383901307293, 'samples': 7717248, 'steps': 40193, 'loss/train': 1.7356516122817993} -11/07/2021 02:52:35 - INFO - __main__ - Step 40195: {'lr': 0.0004222399927268018, 'samples': 7717440, 'steps': 40194, 'loss/train': 1.3899880647659302} -11/07/2021 02:52:36 - INFO - __main__ - Step 40196: {'lr': 0.0004222361463629218, 'samples': 7717632, 'steps': 40195, 'loss/train': 1.5748728513717651} -11/07/2021 02:52:36 - INFO - __main__ - Step 40197: {'lr': 0.00042223229992143505, 'samples': 7717824, 'steps': 40196, 'loss/train': 1.9716410636901855} -11/07/2021 02:52:37 - INFO - __main__ - Step 40198: {'lr': 0.00042222845340234293, 'samples': 7718016, 'steps': 40197, 'loss/train': 1.2805557250976562} -11/07/2021 02:52:38 - INFO - __main__ - Step 40199: {'lr': 0.00042222460680564747, 'samples': 7718208, 'steps': 40198, 'loss/train': 1.248995304107666} -11/07/2021 02:52:38 - INFO - __main__ - Step 40200: {'lr': 0.0004222207601313501, 'samples': 7718400, 'steps': 40199, 'loss/train': 1.1626522541046143} -11/07/2021 02:52:39 - INFO - __main__ - Step 40201: {'lr': 0.00042221691337945285, 'samples': 7718592, 'steps': 40200, 'loss/train': 1.5353505611419678} -11/07/2021 02:52:39 - INFO - __main__ - Step 40202: {'lr': 0.0004222130665499573, 'samples': 7718784, 'steps': 40201, 'loss/train': 0.5865015983581543} -11/07/2021 02:52:40 - INFO - __main__ - Step 40203: {'lr': 0.0004222092196428651, 'samples': 7718976, 'steps': 40202, 'loss/train': 1.5902080535888672} -11/07/2021 02:52:40 - INFO - __main__ - Step 40204: {'lr': 0.0004222053726581782, 'samples': 7719168, 'steps': 40203, 'loss/train': 1.7543646097183228} -11/07/2021 02:52:41 - INFO - __main__ - Step 40205: {'lr': 0.0004222015255958981, 'samples': 7719360, 'steps': 40204, 'loss/train': 1.538298487663269} -11/07/2021 02:52:41 - INFO - __main__ - Step 40206: {'lr': 0.0004221976784560267, 'samples': 7719552, 'steps': 40205, 'loss/train': 1.2510653734207153} -11/07/2021 02:52:41 - INFO - __main__ - Step 40207: {'lr': 0.0004221938312385657, 'samples': 7719744, 'steps': 40206, 'loss/train': 1.6789195537567139} -11/07/2021 02:52:42 - INFO - __main__ - Step 40208: {'lr': 0.00042218998394351684, 'samples': 7719936, 'steps': 40207, 'loss/train': 1.4205678701400757} -11/07/2021 02:52:43 - INFO - __main__ - Step 40209: {'lr': 0.0004221861365708818, 'samples': 7720128, 'steps': 40208, 'loss/train': 1.5723936557769775} -11/07/2021 02:52:43 - INFO - __main__ - Step 40210: {'lr': 0.0004221822891206623, 'samples': 7720320, 'steps': 40209, 'loss/train': 1.513080358505249} -11/07/2021 02:52:43 - INFO - __main__ - Step 40211: {'lr': 0.00042217844159286015, 'samples': 7720512, 'steps': 40210, 'loss/train': 1.6374874114990234} -11/07/2021 02:52:44 - INFO - __main__ - Step 40212: {'lr': 0.00042217459398747703, 'samples': 7720704, 'steps': 40211, 'loss/train': 1.9883413314819336} -11/07/2021 02:52:45 - INFO - __main__ - Step 40213: {'lr': 0.0004221707463045148, 'samples': 7720896, 'steps': 40212, 'loss/train': 1.5096373558044434} -11/07/2021 02:52:45 - INFO - __main__ - Step 40214: {'lr': 0.0004221668985439749, 'samples': 7721088, 'steps': 40213, 'loss/train': 0.14097359776496887} -11/07/2021 02:52:46 - INFO - __main__ - Step 40215: {'lr': 0.00042216305070585946, 'samples': 7721280, 'steps': 40214, 'loss/train': 1.5622889995574951} -11/07/2021 02:52:46 - INFO - __main__ - Step 40216: {'lr': 0.00042215920279016993, 'samples': 7721472, 'steps': 40215, 'loss/train': 1.5851691961288452} -11/07/2021 02:52:46 - INFO - __main__ - Step 40217: {'lr': 0.00042215535479690807, 'samples': 7721664, 'steps': 40216, 'loss/train': 1.330405592918396} -11/07/2021 02:52:47 - INFO - __main__ - Step 40218: {'lr': 0.0004221515067260757, 'samples': 7721856, 'steps': 40217, 'loss/train': 1.0161442756652832} -11/07/2021 02:52:48 - INFO - __main__ - Step 40219: {'lr': 0.0004221476585776745, 'samples': 7722048, 'steps': 40218, 'loss/train': 1.7406327724456787} -11/07/2021 02:52:48 - INFO - __main__ - Step 40220: {'lr': 0.00042214381035170624, 'samples': 7722240, 'steps': 40219, 'loss/train': 1.4465067386627197} -11/07/2021 02:52:48 - INFO - __main__ - Step 40221: {'lr': 0.0004221399620481726, 'samples': 7722432, 'steps': 40220, 'loss/train': 0.31174546480178833} -11/07/2021 02:52:49 - INFO - __main__ - Step 40222: {'lr': 0.00042213611366707547, 'samples': 7722624, 'steps': 40221, 'loss/train': 1.4638572931289673} -11/07/2021 02:52:50 - INFO - __main__ - Step 40223: {'lr': 0.0004221322652084163, 'samples': 7722816, 'steps': 40222, 'loss/train': 1.0964359045028687} -11/07/2021 02:52:50 - INFO - __main__ - Step 40224: {'lr': 0.0004221284166721971, 'samples': 7723008, 'steps': 40223, 'loss/train': 1.2773767709732056} -11/07/2021 02:52:51 - INFO - __main__ - Step 40225: {'lr': 0.00042212456805841944, 'samples': 7723200, 'steps': 40224, 'loss/train': 1.7557947635650635} -11/07/2021 02:52:51 - INFO - __main__ - Step 40226: {'lr': 0.00042212071936708506, 'samples': 7723392, 'steps': 40225, 'loss/train': 1.4272174835205078} -11/07/2021 02:52:51 - INFO - __main__ - Step 40227: {'lr': 0.0004221168705981958, 'samples': 7723584, 'steps': 40226, 'loss/train': 1.4838918447494507} -11/07/2021 02:52:52 - INFO - __main__ - Step 40228: {'lr': 0.00042211302175175334, 'samples': 7723776, 'steps': 40227, 'loss/train': 1.2917256355285645} -11/07/2021 02:52:53 - INFO - __main__ - Step 40229: {'lr': 0.0004221091728277595, 'samples': 7723968, 'steps': 40228, 'loss/train': 1.401443600654602} -11/07/2021 02:52:53 - INFO - __main__ - Step 40230: {'lr': 0.0004221053238262158, 'samples': 7724160, 'steps': 40229, 'loss/train': 1.6499395370483398} -11/07/2021 02:52:53 - INFO - __main__ - Step 40231: {'lr': 0.0004221014747471241, 'samples': 7724352, 'steps': 40230, 'loss/train': 1.2536239624023438} -11/07/2021 02:52:54 - INFO - __main__ - Step 40232: {'lr': 0.0004220976255904861, 'samples': 7724544, 'steps': 40231, 'loss/train': 1.606628656387329} -11/07/2021 02:52:55 - INFO - __main__ - Step 40233: {'lr': 0.00042209377635630364, 'samples': 7724736, 'steps': 40232, 'loss/train': 1.4865119457244873} -11/07/2021 02:52:55 - INFO - __main__ - Step 40234: {'lr': 0.00042208992704457837, 'samples': 7724928, 'steps': 40233, 'loss/train': 0.8506203889846802} -11/07/2021 02:52:55 - INFO - __main__ - Step 40235: {'lr': 0.00042208607765531204, 'samples': 7725120, 'steps': 40234, 'loss/train': 1.1438913345336914} -11/07/2021 02:52:56 - INFO - __main__ - Step 40236: {'lr': 0.00042208222818850634, 'samples': 7725312, 'steps': 40235, 'loss/train': 1.2168179750442505} -11/07/2021 02:52:56 - INFO - __main__ - Step 40237: {'lr': 0.0004220783786441631, 'samples': 7725504, 'steps': 40236, 'loss/train': 1.3755687475204468} -11/07/2021 02:52:56 - INFO - __main__ - Step 40238: {'lr': 0.0004220745290222839, 'samples': 7725696, 'steps': 40237, 'loss/train': 1.1750071048736572} -11/07/2021 02:52:57 - INFO - __main__ - Step 40239: {'lr': 0.00042207067932287066, 'samples': 7725888, 'steps': 40238, 'loss/train': 1.6734548807144165} -11/07/2021 02:52:58 - INFO - __main__ - Step 40240: {'lr': 0.00042206682954592503, 'samples': 7726080, 'steps': 40239, 'loss/train': 1.5095839500427246} -11/07/2021 02:52:58 - INFO - __main__ - Step 40241: {'lr': 0.0004220629796914487, 'samples': 7726272, 'steps': 40240, 'loss/train': 1.7802373170852661} -11/07/2021 02:52:58 - INFO - __main__ - Step 40242: {'lr': 0.00042205912975944344, 'samples': 7726464, 'steps': 40241, 'loss/train': 1.1329573392868042} -11/07/2021 02:52:59 - INFO - __main__ - Step 40243: {'lr': 0.00042205527974991096, 'samples': 7726656, 'steps': 40242, 'loss/train': 1.934626817703247} -11/07/2021 02:53:00 - INFO - __main__ - Step 40244: {'lr': 0.00042205142966285315, 'samples': 7726848, 'steps': 40243, 'loss/train': 1.7891731262207031} -11/07/2021 02:53:01 - INFO - __main__ - Step 40245: {'lr': 0.0004220475794982716, 'samples': 7727040, 'steps': 40244, 'loss/train': 1.6130657196044922} -11/07/2021 02:53:01 - INFO - __main__ - Step 40246: {'lr': 0.00042204372925616797, 'samples': 7727232, 'steps': 40245, 'loss/train': 1.7765222787857056} -11/07/2021 02:53:01 - INFO - __main__ - Step 40247: {'lr': 0.0004220398789365441, 'samples': 7727424, 'steps': 40246, 'loss/train': 1.2992706298828125} -11/07/2021 02:53:02 - INFO - __main__ - Step 40248: {'lr': 0.0004220360285394017, 'samples': 7727616, 'steps': 40247, 'loss/train': 1.0947076082229614} -11/07/2021 02:53:02 - INFO - __main__ - Step 40249: {'lr': 0.0004220321780647426, 'samples': 7727808, 'steps': 40248, 'loss/train': 1.3187216520309448} -11/07/2021 02:53:03 - INFO - __main__ - Step 40250: {'lr': 0.00042202832751256846, 'samples': 7728000, 'steps': 40249, 'loss/train': 1.7385437488555908} -11/07/2021 02:53:03 - INFO - __main__ - Step 40251: {'lr': 0.0004220244768828809, 'samples': 7728192, 'steps': 40250, 'loss/train': 1.3357092142105103} -11/07/2021 02:53:04 - INFO - __main__ - Step 40252: {'lr': 0.0004220206261756819, 'samples': 7728384, 'steps': 40251, 'loss/train': 0.9959414005279541} -11/07/2021 02:53:04 - INFO - __main__ - Step 40253: {'lr': 0.00042201677539097294, 'samples': 7728576, 'steps': 40252, 'loss/train': 1.3090541362762451} -11/07/2021 02:53:04 - INFO - __main__ - Step 40254: {'lr': 0.00042201292452875595, 'samples': 7728768, 'steps': 40253, 'loss/train': 1.762420654296875} -11/07/2021 02:53:06 - INFO - __main__ - Step 40255: {'lr': 0.00042200907358903264, 'samples': 7728960, 'steps': 40254, 'loss/train': 1.5239912271499634} -11/07/2021 02:53:06 - INFO - __main__ - Step 40256: {'lr': 0.0004220052225718046, 'samples': 7729152, 'steps': 40255, 'loss/train': 1.4988716840744019} -11/07/2021 02:53:06 - INFO - __main__ - Step 40257: {'lr': 0.0004220013714770737, 'samples': 7729344, 'steps': 40256, 'loss/train': 1.5974842309951782} -11/07/2021 02:53:07 - INFO - __main__ - Step 40258: {'lr': 0.0004219975203048416, 'samples': 7729536, 'steps': 40257, 'loss/train': 1.612775206565857} -11/07/2021 02:53:07 - INFO - __main__ - Step 40259: {'lr': 0.0004219936690551101, 'samples': 7729728, 'steps': 40258, 'loss/train': 1.3531855344772339} -11/07/2021 02:53:07 - INFO - __main__ - Step 40260: {'lr': 0.0004219898177278809, 'samples': 7729920, 'steps': 40259, 'loss/train': 1.6398286819458008} -11/07/2021 02:53:08 - INFO - __main__ - Step 40261: {'lr': 0.00042198596632315576, 'samples': 7730112, 'steps': 40260, 'loss/train': 5.88883113861084} -11/07/2021 02:53:09 - INFO - __main__ - Step 40262: {'lr': 0.0004219821148409364, 'samples': 7730304, 'steps': 40261, 'loss/train': 1.5091698169708252} -11/07/2021 02:53:09 - INFO - __main__ - Step 40263: {'lr': 0.00042197826328122456, 'samples': 7730496, 'steps': 40262, 'loss/train': 1.4398863315582275} -11/07/2021 02:53:09 - INFO - __main__ - Step 40264: {'lr': 0.00042197441164402197, 'samples': 7730688, 'steps': 40263, 'loss/train': 1.578916311264038} -11/07/2021 02:53:10 - INFO - __main__ - Step 40265: {'lr': 0.0004219705599293303, 'samples': 7730880, 'steps': 40264, 'loss/train': 1.0776889324188232} -11/07/2021 02:53:11 - INFO - __main__ - Step 40266: {'lr': 0.00042196670813715137, 'samples': 7731072, 'steps': 40265, 'loss/train': 1.384979248046875} -11/07/2021 02:53:11 - INFO - __main__ - Step 40267: {'lr': 0.0004219628562674869, 'samples': 7731264, 'steps': 40266, 'loss/train': 1.5530970096588135} -11/07/2021 02:53:12 - INFO - __main__ - Step 40268: {'lr': 0.00042195900432033865, 'samples': 7731456, 'steps': 40267, 'loss/train': 2.001399278640747} -11/07/2021 02:53:12 - INFO - __main__ - Step 40269: {'lr': 0.00042195515229570833, 'samples': 7731648, 'steps': 40268, 'loss/train': 1.5870234966278076} -11/07/2021 02:53:12 - INFO - __main__ - Step 40270: {'lr': 0.0004219513001935976, 'samples': 7731840, 'steps': 40269, 'loss/train': 1.714131236076355} -11/07/2021 02:53:13 - INFO - __main__ - Step 40271: {'lr': 0.00042194744801400837, 'samples': 7732032, 'steps': 40270, 'loss/train': 1.4420199394226074} -11/07/2021 02:53:14 - INFO - __main__ - Step 40272: {'lr': 0.0004219435957569422, 'samples': 7732224, 'steps': 40271, 'loss/train': 1.428703784942627} -11/07/2021 02:53:14 - INFO - __main__ - Step 40273: {'lr': 0.0004219397434224009, 'samples': 7732416, 'steps': 40272, 'loss/train': 1.6456485986709595} -11/07/2021 02:53:14 - INFO - __main__ - Step 40274: {'lr': 0.0004219358910103862, 'samples': 7732608, 'steps': 40273, 'loss/train': 1.3778915405273438} -11/07/2021 02:53:15 - INFO - __main__ - Step 40275: {'lr': 0.00042193203852089993, 'samples': 7732800, 'steps': 40274, 'loss/train': 1.2710283994674683} -11/07/2021 02:53:15 - INFO - __main__ - Step 40276: {'lr': 0.00042192818595394367, 'samples': 7732992, 'steps': 40275, 'loss/train': 1.1744085550308228} -11/07/2021 02:53:16 - INFO - __main__ - Step 40277: {'lr': 0.00042192433330951926, 'samples': 7733184, 'steps': 40276, 'loss/train': 1.3941353559494019} -11/07/2021 02:53:16 - INFO - __main__ - Step 40278: {'lr': 0.00042192048058762834, 'samples': 7733376, 'steps': 40277, 'loss/train': 1.1758747100830078} -11/07/2021 02:53:17 - INFO - __main__ - Step 40279: {'lr': 0.00042191662778827275, 'samples': 7733568, 'steps': 40278, 'loss/train': 1.396023154258728} -11/07/2021 02:53:17 - INFO - __main__ - Step 40280: {'lr': 0.0004219127749114541, 'samples': 7733760, 'steps': 40279, 'loss/train': 1.4444804191589355} -11/07/2021 02:53:17 - INFO - __main__ - Step 40281: {'lr': 0.00042190892195717426, 'samples': 7733952, 'steps': 40280, 'loss/train': 1.2106468677520752} -11/07/2021 02:53:19 - INFO - __main__ - Step 40282: {'lr': 0.000421905068925435, 'samples': 7734144, 'steps': 40281, 'loss/train': 1.269433856010437} -11/07/2021 02:53:19 - INFO - __main__ - Step 40283: {'lr': 0.00042190121581623784, 'samples': 7734336, 'steps': 40282, 'loss/train': 1.8498080968856812} -11/07/2021 02:53:19 - INFO - __main__ - Step 40284: {'lr': 0.0004218973626295847, 'samples': 7734528, 'steps': 40283, 'loss/train': 1.6520702838897705} -11/07/2021 02:53:20 - INFO - __main__ - Step 40285: {'lr': 0.0004218935093654772, 'samples': 7734720, 'steps': 40284, 'loss/train': 1.5929603576660156} -11/07/2021 02:53:20 - INFO - __main__ - Step 40286: {'lr': 0.00042188965602391726, 'samples': 7734912, 'steps': 40285, 'loss/train': 1.637909173965454} -11/07/2021 02:53:21 - INFO - __main__ - Step 40287: {'lr': 0.0004218858026049064, 'samples': 7735104, 'steps': 40286, 'loss/train': 1.2915066480636597} -11/07/2021 02:53:21 - INFO - __main__ - Step 40288: {'lr': 0.00042188194910844644, 'samples': 7735296, 'steps': 40287, 'loss/train': 2.1509063243865967} -11/07/2021 02:53:22 - INFO - __main__ - Step 40289: {'lr': 0.0004218780955345392, 'samples': 7735488, 'steps': 40288, 'loss/train': 1.2132989168167114} -11/07/2021 02:53:22 - INFO - __main__ - Step 40290: {'lr': 0.0004218742418831863, 'samples': 7735680, 'steps': 40289, 'loss/train': 1.6381466388702393} -11/07/2021 02:53:22 - INFO - __main__ - Step 40291: {'lr': 0.0004218703881543895, 'samples': 7735872, 'steps': 40290, 'loss/train': 1.260995864868164} -11/07/2021 02:53:23 - INFO - __main__ - Step 40292: {'lr': 0.0004218665343481506, 'samples': 7736064, 'steps': 40291, 'loss/train': 1.5558457374572754} -11/07/2021 02:53:24 - INFO - __main__ - Step 40293: {'lr': 0.00042186268046447124, 'samples': 7736256, 'steps': 40292, 'loss/train': 1.7037135362625122} -11/07/2021 02:53:24 - INFO - __main__ - Step 40294: {'lr': 0.0004218588265033533, 'samples': 7736448, 'steps': 40293, 'loss/train': 0.8515810966491699} -11/07/2021 02:53:25 - INFO - __main__ - Step 40295: {'lr': 0.0004218549724647983, 'samples': 7736640, 'steps': 40294, 'loss/train': 1.9279394149780273} -11/07/2021 02:53:25 - INFO - __main__ - Step 40296: {'lr': 0.0004218511183488082, 'samples': 7736832, 'steps': 40295, 'loss/train': 1.844152569770813} -11/07/2021 02:53:25 - INFO - __main__ - Step 40297: {'lr': 0.00042184726415538457, 'samples': 7737024, 'steps': 40296, 'loss/train': 1.586840271949768} -11/07/2021 02:53:26 - INFO - __main__ - Step 40298: {'lr': 0.00042184340988452924, 'samples': 7737216, 'steps': 40297, 'loss/train': 1.3267289400100708} -11/07/2021 02:53:27 - INFO - __main__ - Step 40299: {'lr': 0.00042183955553624393, 'samples': 7737408, 'steps': 40298, 'loss/train': 1.6323528289794922} -11/07/2021 02:53:27 - INFO - __main__ - Step 40300: {'lr': 0.0004218357011105304, 'samples': 7737600, 'steps': 40299, 'loss/train': 1.4126336574554443} -11/07/2021 02:53:27 - INFO - __main__ - Step 40301: {'lr': 0.00042183184660739027, 'samples': 7737792, 'steps': 40300, 'loss/train': 1.3471697568893433} -11/07/2021 02:53:28 - INFO - __main__ - Step 40302: {'lr': 0.00042182799202682543, 'samples': 7737984, 'steps': 40301, 'loss/train': 1.7396727800369263} -11/07/2021 02:53:29 - INFO - __main__ - Step 40303: {'lr': 0.0004218241373688375, 'samples': 7738176, 'steps': 40302, 'loss/train': 2.6259586811065674} -11/07/2021 02:53:30 - INFO - __main__ - Step 40304: {'lr': 0.0004218202826334283, 'samples': 7738368, 'steps': 40303, 'loss/train': 1.8593873977661133} -11/07/2021 02:53:30 - INFO - __main__ - Step 40305: {'lr': 0.0004218164278205995, 'samples': 7738560, 'steps': 40304, 'loss/train': 1.0830633640289307} -11/07/2021 02:53:30 - INFO - __main__ - Step 40306: {'lr': 0.00042181257293035293, 'samples': 7738752, 'steps': 40305, 'loss/train': 0.8169730305671692} -11/07/2021 02:53:31 - INFO - __main__ - Step 40307: {'lr': 0.00042180871796269025, 'samples': 7738944, 'steps': 40306, 'loss/train': 1.5396815538406372} -11/07/2021 02:53:31 - INFO - __main__ - Step 40308: {'lr': 0.00042180486291761314, 'samples': 7739136, 'steps': 40307, 'loss/train': 1.6105730533599854} -11/07/2021 02:53:31 - INFO - __main__ - Step 40309: {'lr': 0.0004218010077951235, 'samples': 7739328, 'steps': 40308, 'loss/train': 1.5214552879333496} -11/07/2021 02:53:32 - INFO - __main__ - Step 40310: {'lr': 0.00042179715259522293, 'samples': 7739520, 'steps': 40309, 'loss/train': 1.711687445640564} -11/07/2021 02:53:33 - INFO - __main__ - Step 40311: {'lr': 0.00042179329731791324, 'samples': 7739712, 'steps': 40310, 'loss/train': 1.418582558631897} -11/07/2021 02:53:33 - INFO - __main__ - Step 40312: {'lr': 0.0004217894419631961, 'samples': 7739904, 'steps': 40311, 'loss/train': 1.4990530014038086} -11/07/2021 02:53:33 - INFO - __main__ - Step 40313: {'lr': 0.00042178558653107337, 'samples': 7740096, 'steps': 40312, 'loss/train': 1.4654122591018677} -11/07/2021 02:53:34 - INFO - __main__ - Step 40314: {'lr': 0.0004217817310215466, 'samples': 7740288, 'steps': 40313, 'loss/train': 1.5557605028152466} -11/07/2021 02:53:35 - INFO - __main__ - Step 40315: {'lr': 0.00042177787543461767, 'samples': 7740480, 'steps': 40314, 'loss/train': 1.8264100551605225} -11/07/2021 02:53:35 - INFO - __main__ - Step 40316: {'lr': 0.0004217740197702883, 'samples': 7740672, 'steps': 40315, 'loss/train': 1.7862824201583862} -11/07/2021 02:53:35 - INFO - __main__ - Step 40317: {'lr': 0.00042177016402856023, 'samples': 7740864, 'steps': 40316, 'loss/train': 1.6017388105392456} -11/07/2021 02:53:36 - INFO - __main__ - Step 40318: {'lr': 0.00042176630820943515, 'samples': 7741056, 'steps': 40317, 'loss/train': 1.3726780414581299} -11/07/2021 02:53:36 - INFO - __main__ - Step 40319: {'lr': 0.0004217624523129148, 'samples': 7741248, 'steps': 40318, 'loss/train': 1.5588961839675903} -11/07/2021 02:53:37 - INFO - __main__ - Step 40320: {'lr': 0.0004217585963390009, 'samples': 7741440, 'steps': 40319, 'loss/train': 1.0949862003326416} -11/07/2021 02:53:38 - INFO - __main__ - Step 40321: {'lr': 0.00042175474028769534, 'samples': 7741632, 'steps': 40320, 'loss/train': 1.5856151580810547} -11/07/2021 02:53:38 - INFO - __main__ - Step 40322: {'lr': 0.00042175088415899963, 'samples': 7741824, 'steps': 40321, 'loss/train': 1.3406957387924194} -11/07/2021 02:53:38 - INFO - __main__ - Step 40323: {'lr': 0.00042174702795291574, 'samples': 7742016, 'steps': 40322, 'loss/train': 1.3882884979248047} -11/07/2021 02:53:39 - INFO - __main__ - Step 40324: {'lr': 0.0004217431716694452, 'samples': 7742208, 'steps': 40323, 'loss/train': 1.621527910232544} -11/07/2021 02:53:40 - INFO - __main__ - Step 40325: {'lr': 0.00042173931530858986, 'samples': 7742400, 'steps': 40324, 'loss/train': 1.1860873699188232} -11/07/2021 02:53:40 - INFO - __main__ - Step 40326: {'lr': 0.00042173545887035145, 'samples': 7742592, 'steps': 40325, 'loss/train': 1.6575325727462769} -11/07/2021 02:53:40 - INFO - __main__ - Step 40327: {'lr': 0.0004217316023547317, 'samples': 7742784, 'steps': 40326, 'loss/train': 1.705884337425232} -11/07/2021 02:53:41 - INFO - __main__ - Step 40328: {'lr': 0.00042172774576173226, 'samples': 7742976, 'steps': 40327, 'loss/train': 2.0860137939453125} -11/07/2021 02:53:41 - INFO - __main__ - Step 40329: {'lr': 0.00042172388909135505, 'samples': 7743168, 'steps': 40328, 'loss/train': 1.2067232131958008} -11/07/2021 02:53:42 - INFO - __main__ - Step 40330: {'lr': 0.0004217200323436017, 'samples': 7743360, 'steps': 40329, 'loss/train': 1.7795089483261108} -11/07/2021 02:53:42 - INFO - __main__ - Step 40331: {'lr': 0.00042171617551847387, 'samples': 7743552, 'steps': 40330, 'loss/train': 1.6506901979446411} -11/07/2021 02:53:43 - INFO - __main__ - Step 40332: {'lr': 0.0004217123186159735, 'samples': 7743744, 'steps': 40331, 'loss/train': 1.5076559782028198} -11/07/2021 02:53:43 - INFO - __main__ - Step 40333: {'lr': 0.0004217084616361021, 'samples': 7743936, 'steps': 40332, 'loss/train': 1.3635174036026} -11/07/2021 02:53:43 - INFO - __main__ - Step 40334: {'lr': 0.0004217046045788615, 'samples': 7744128, 'steps': 40333, 'loss/train': 1.613263726234436} -11/07/2021 02:53:44 - INFO - __main__ - Step 40335: {'lr': 0.0004217007474442535, 'samples': 7744320, 'steps': 40334, 'loss/train': 1.0538244247436523} -11/07/2021 02:53:45 - INFO - __main__ - Step 40336: {'lr': 0.00042169689023227987, 'samples': 7744512, 'steps': 40335, 'loss/train': 1.7182577848434448} -11/07/2021 02:53:45 - INFO - __main__ - Step 40337: {'lr': 0.00042169303294294216, 'samples': 7744704, 'steps': 40336, 'loss/train': 1.5433964729309082} -11/07/2021 02:53:46 - INFO - __main__ - Step 40338: {'lr': 0.0004216891755762423, 'samples': 7744896, 'steps': 40337, 'loss/train': 1.5233230590820312} -11/07/2021 02:53:46 - INFO - __main__ - Step 40339: {'lr': 0.00042168531813218193, 'samples': 7745088, 'steps': 40338, 'loss/train': 2.014331102371216} -11/07/2021 02:53:46 - INFO - __main__ - Step 40340: {'lr': 0.0004216814606107627, 'samples': 7745280, 'steps': 40339, 'loss/train': 1.6288928985595703} -11/07/2021 02:53:47 - INFO - __main__ - Step 40341: {'lr': 0.00042167760301198656, 'samples': 7745472, 'steps': 40340, 'loss/train': 1.9901844263076782} -11/07/2021 02:53:48 - INFO - __main__ - Step 40342: {'lr': 0.0004216737453358551, 'samples': 7745664, 'steps': 40341, 'loss/train': 1.5221227407455444} -11/07/2021 02:53:48 - INFO - __main__ - Step 40343: {'lr': 0.00042166988758237013, 'samples': 7745856, 'steps': 40342, 'loss/train': 1.735198974609375} -11/07/2021 02:53:48 - INFO - __main__ - Step 40344: {'lr': 0.00042166602975153333, 'samples': 7746048, 'steps': 40343, 'loss/train': 1.4574334621429443} -11/07/2021 02:53:49 - INFO - __main__ - Step 40345: {'lr': 0.0004216621718433465, 'samples': 7746240, 'steps': 40344, 'loss/train': 1.4490758180618286} -11/07/2021 02:53:50 - INFO - __main__ - Step 40346: {'lr': 0.0004216583138578113, 'samples': 7746432, 'steps': 40345, 'loss/train': 1.3788456916809082} -11/07/2021 02:53:50 - INFO - __main__ - Step 40347: {'lr': 0.00042165445579492956, 'samples': 7746624, 'steps': 40346, 'loss/train': 1.7768930196762085} -11/07/2021 02:53:50 - INFO - __main__ - Step 40348: {'lr': 0.00042165059765470294, 'samples': 7746816, 'steps': 40347, 'loss/train': 1.6489914655685425} -11/07/2021 02:53:51 - INFO - __main__ - Step 40349: {'lr': 0.0004216467394371333, 'samples': 7747008, 'steps': 40348, 'loss/train': 1.6425361633300781} -11/07/2021 02:53:51 - INFO - __main__ - Step 40350: {'lr': 0.00042164288114222213, 'samples': 7747200, 'steps': 40349, 'loss/train': 1.606465220451355} -11/07/2021 02:53:52 - INFO - __main__ - Step 40351: {'lr': 0.0004216390227699714, 'samples': 7747392, 'steps': 40350, 'loss/train': 1.3147684335708618} -11/07/2021 02:53:52 - INFO - __main__ - Step 40352: {'lr': 0.0004216351643203828, 'samples': 7747584, 'steps': 40351, 'loss/train': 1.381427526473999} -11/07/2021 02:53:53 - INFO - __main__ - Step 40353: {'lr': 0.000421631305793458, 'samples': 7747776, 'steps': 40352, 'loss/train': 1.214415192604065} -11/07/2021 02:53:53 - INFO - __main__ - Step 40354: {'lr': 0.00042162744718919875, 'samples': 7747968, 'steps': 40353, 'loss/train': 1.4954808950424194} -11/07/2021 02:53:53 - INFO - __main__ - Step 40355: {'lr': 0.0004216235885076069, 'samples': 7748160, 'steps': 40354, 'loss/train': 1.5964220762252808} -11/07/2021 02:53:55 - INFO - __main__ - Step 40356: {'lr': 0.00042161972974868415, 'samples': 7748352, 'steps': 40355, 'loss/train': 1.5978648662567139} -11/07/2021 02:53:55 - INFO - __main__ - Step 40357: {'lr': 0.00042161587091243215, 'samples': 7748544, 'steps': 40356, 'loss/train': 1.434416651725769} -11/07/2021 02:53:55 - INFO - __main__ - Step 40358: {'lr': 0.00042161201199885257, 'samples': 7748736, 'steps': 40357, 'loss/train': 1.6181108951568604} -11/07/2021 02:53:56 - INFO - __main__ - Step 40359: {'lr': 0.0004216081530079474, 'samples': 7748928, 'steps': 40358, 'loss/train': 1.367638111114502} -11/07/2021 02:53:56 - INFO - __main__ - Step 40360: {'lr': 0.0004216042939397182, 'samples': 7749120, 'steps': 40359, 'loss/train': 1.4361519813537598} -11/07/2021 02:53:56 - INFO - __main__ - Step 40361: {'lr': 0.00042160043479416676, 'samples': 7749312, 'steps': 40360, 'loss/train': 5.871668338775635} -11/07/2021 02:53:57 - INFO - __main__ - Step 40362: {'lr': 0.00042159657557129483, 'samples': 7749504, 'steps': 40361, 'loss/train': 1.7653417587280273} -11/07/2021 02:53:58 - INFO - __main__ - Step 40363: {'lr': 0.0004215927162711041, 'samples': 7749696, 'steps': 40362, 'loss/train': 1.5643774271011353} -11/07/2021 02:53:58 - INFO - __main__ - Step 40364: {'lr': 0.00042158885689359637, 'samples': 7749888, 'steps': 40363, 'loss/train': 1.458735704421997} -11/07/2021 02:53:59 - INFO - __main__ - Step 40365: {'lr': 0.0004215849974387733, 'samples': 7750080, 'steps': 40364, 'loss/train': 1.1762034893035889} -11/07/2021 02:53:59 - INFO - __main__ - Step 40366: {'lr': 0.0004215811379066367, 'samples': 7750272, 'steps': 40365, 'loss/train': 1.7351243495941162} -11/07/2021 02:54:00 - INFO - __main__ - Step 40367: {'lr': 0.00042157727829718827, 'samples': 7750464, 'steps': 40366, 'loss/train': 0.9102671146392822} -11/07/2021 02:54:00 - INFO - __main__ - Step 40368: {'lr': 0.00042157341861042986, 'samples': 7750656, 'steps': 40367, 'loss/train': 1.847285270690918} -11/07/2021 02:54:01 - INFO - __main__ - Step 40369: {'lr': 0.00042156955884636307, 'samples': 7750848, 'steps': 40368, 'loss/train': 1.3229519128799438} -11/07/2021 02:54:01 - INFO - __main__ - Step 40370: {'lr': 0.0004215656990049896, 'samples': 7751040, 'steps': 40369, 'loss/train': 1.2186511754989624} -11/07/2021 02:54:01 - INFO - __main__ - Step 40371: {'lr': 0.0004215618390863114, 'samples': 7751232, 'steps': 40370, 'loss/train': 1.1559193134307861} -11/07/2021 02:54:02 - INFO - __main__ - Step 40372: {'lr': 0.00042155797909033, 'samples': 7751424, 'steps': 40371, 'loss/train': 1.7392240762710571} -11/07/2021 02:54:03 - INFO - __main__ - Step 40373: {'lr': 0.00042155411901704723, 'samples': 7751616, 'steps': 40372, 'loss/train': 1.645806074142456} -11/07/2021 02:54:03 - INFO - __main__ - Step 40374: {'lr': 0.0004215502588664648, 'samples': 7751808, 'steps': 40373, 'loss/train': 1.5513337850570679} -11/07/2021 02:54:03 - INFO - __main__ - Step 40375: {'lr': 0.0004215463986385845, 'samples': 7752000, 'steps': 40374, 'loss/train': 1.8371727466583252} -11/07/2021 02:54:04 - INFO - __main__ - Step 40376: {'lr': 0.0004215425383334081, 'samples': 7752192, 'steps': 40375, 'loss/train': 1.8390657901763916} -11/07/2021 02:54:05 - INFO - __main__ - Step 40377: {'lr': 0.00042153867795093714, 'samples': 7752384, 'steps': 40376, 'loss/train': 1.8111679553985596} -11/07/2021 02:54:05 - INFO - __main__ - Step 40378: {'lr': 0.0004215348174911736, 'samples': 7752576, 'steps': 40377, 'loss/train': 1.1135926246643066} -11/07/2021 02:54:05 - INFO - __main__ - Step 40379: {'lr': 0.0004215309569541191, 'samples': 7752768, 'steps': 40378, 'loss/train': 1.1120686531066895} -11/07/2021 02:54:06 - INFO - __main__ - Step 40380: {'lr': 0.00042152709633977545, 'samples': 7752960, 'steps': 40379, 'loss/train': 1.7353676557540894} -11/07/2021 02:54:06 - INFO - __main__ - Step 40381: {'lr': 0.0004215232356481442, 'samples': 7753152, 'steps': 40380, 'loss/train': 1.472200632095337} -11/07/2021 02:54:06 - INFO - __main__ - Step 40382: {'lr': 0.0004215193748792273, 'samples': 7753344, 'steps': 40381, 'loss/train': 1.3253713846206665} -11/07/2021 02:54:08 - INFO - __main__ - Step 40383: {'lr': 0.00042151551403302645, 'samples': 7753536, 'steps': 40382, 'loss/train': 1.6094202995300293} -11/07/2021 02:54:08 - INFO - __main__ - Step 40384: {'lr': 0.00042151165310954335, 'samples': 7753728, 'steps': 40383, 'loss/train': 1.6044669151306152} -11/07/2021 02:54:08 - INFO - __main__ - Step 40385: {'lr': 0.0004215077921087798, 'samples': 7753920, 'steps': 40384, 'loss/train': 0.5478833317756653} -11/07/2021 02:54:09 - INFO - __main__ - Step 40386: {'lr': 0.00042150393103073736, 'samples': 7754112, 'steps': 40385, 'loss/train': 1.0497719049453735} -11/07/2021 02:54:09 - INFO - __main__ - Step 40387: {'lr': 0.00042150006987541795, 'samples': 7754304, 'steps': 40386, 'loss/train': 1.6169170141220093} -11/07/2021 02:54:10 - INFO - __main__ - Step 40388: {'lr': 0.0004214962086428232, 'samples': 7754496, 'steps': 40387, 'loss/train': 1.7807025909423828} -11/07/2021 02:54:10 - INFO - __main__ - Step 40389: {'lr': 0.00042149234733295497, 'samples': 7754688, 'steps': 40388, 'loss/train': 1.7034701108932495} -11/07/2021 02:54:11 - INFO - __main__ - Step 40390: {'lr': 0.00042148848594581503, 'samples': 7754880, 'steps': 40389, 'loss/train': 0.9810364842414856} -11/07/2021 02:54:11 - INFO - __main__ - Step 40391: {'lr': 0.00042148462448140487, 'samples': 7755072, 'steps': 40390, 'loss/train': 1.7027150392532349} -11/07/2021 02:54:11 - INFO - __main__ - Step 40392: {'lr': 0.0004214807629397264, 'samples': 7755264, 'steps': 40391, 'loss/train': 1.563767671585083} -11/07/2021 02:54:12 - INFO - __main__ - Step 40393: {'lr': 0.00042147690132078136, 'samples': 7755456, 'steps': 40392, 'loss/train': 1.670060396194458} -11/07/2021 02:54:13 - INFO - __main__ - Step 40394: {'lr': 0.0004214730396245715, 'samples': 7755648, 'steps': 40393, 'loss/train': 0.9150652289390564} -11/07/2021 02:54:13 - INFO - __main__ - Step 40395: {'lr': 0.0004214691778510985, 'samples': 7755840, 'steps': 40394, 'loss/train': 1.806809425354004} -11/07/2021 02:54:13 - INFO - __main__ - Step 40396: {'lr': 0.0004214653160003642, 'samples': 7756032, 'steps': 40395, 'loss/train': 1.3819338083267212} -11/07/2021 02:54:14 - INFO - __main__ - Step 40397: {'lr': 0.00042146145407237023, 'samples': 7756224, 'steps': 40396, 'loss/train': 1.266759991645813} -11/07/2021 02:54:15 - INFO - __main__ - Step 40398: {'lr': 0.00042145759206711834, 'samples': 7756416, 'steps': 40397, 'loss/train': 1.3659684658050537} -11/07/2021 02:54:15 - INFO - __main__ - Step 40399: {'lr': 0.0004214537299846104, 'samples': 7756608, 'steps': 40398, 'loss/train': 1.5729107856750488} -11/07/2021 02:54:16 - INFO - __main__ - Step 40400: {'lr': 0.00042144986782484796, 'samples': 7756800, 'steps': 40399, 'loss/train': 1.468271255493164} -11/07/2021 02:54:16 - INFO - __main__ - Step 40401: {'lr': 0.00042144600558783284, 'samples': 7756992, 'steps': 40400, 'loss/train': 1.6899981498718262} -11/07/2021 02:54:16 - INFO - __main__ - Step 40402: {'lr': 0.0004214421432735669, 'samples': 7757184, 'steps': 40401, 'loss/train': 1.9053840637207031} -11/07/2021 02:54:17 - INFO - __main__ - Step 40403: {'lr': 0.0004214382808820517, 'samples': 7757376, 'steps': 40402, 'loss/train': 1.874024510383606} -11/07/2021 02:54:18 - INFO - __main__ - Step 40404: {'lr': 0.0004214344184132891, 'samples': 7757568, 'steps': 40403, 'loss/train': 1.5011881589889526} -11/07/2021 02:54:18 - INFO - __main__ - Step 40405: {'lr': 0.0004214305558672808, 'samples': 7757760, 'steps': 40404, 'loss/train': 2.215088367462158} -11/07/2021 02:54:19 - INFO - __main__ - Step 40406: {'lr': 0.0004214266932440285, 'samples': 7757952, 'steps': 40405, 'loss/train': 0.11188347637653351} -11/07/2021 02:54:19 - INFO - __main__ - Step 40407: {'lr': 0.000421422830543534, 'samples': 7758144, 'steps': 40406, 'loss/train': 2.0618247985839844} -11/07/2021 02:54:20 - INFO - __main__ - Step 40408: {'lr': 0.00042141896776579904, 'samples': 7758336, 'steps': 40407, 'loss/train': 1.0536060333251953} -11/07/2021 02:54:20 - INFO - __main__ - Step 40409: {'lr': 0.0004214151049108252, 'samples': 7758528, 'steps': 40408, 'loss/train': 1.743821144104004} -11/07/2021 02:54:21 - INFO - __main__ - Step 40410: {'lr': 0.00042141124197861456, 'samples': 7758720, 'steps': 40409, 'loss/train': 0.9953275322914124} -11/07/2021 02:54:21 - INFO - __main__ - Step 40411: {'lr': 0.0004214073789691686, 'samples': 7758912, 'steps': 40410, 'loss/train': 1.4814211130142212} -11/07/2021 02:54:22 - INFO - __main__ - Step 40412: {'lr': 0.00042140351588248906, 'samples': 7759104, 'steps': 40411, 'loss/train': 1.3941441774368286} -11/07/2021 02:54:22 - INFO - __main__ - Step 40413: {'lr': 0.00042139965271857774, 'samples': 7759296, 'steps': 40412, 'loss/train': 1.7358777523040771} -11/07/2021 02:54:22 - INFO - __main__ - Step 40414: {'lr': 0.0004213957894774364, 'samples': 7759488, 'steps': 40413, 'loss/train': 1.5109068155288696} -11/07/2021 02:54:23 - INFO - __main__ - Step 40415: {'lr': 0.0004213919261590667, 'samples': 7759680, 'steps': 40414, 'loss/train': 0.9453153014183044} -11/07/2021 02:54:24 - INFO - __main__ - Step 40416: {'lr': 0.0004213880627634705, 'samples': 7759872, 'steps': 40415, 'loss/train': 2.697310209274292} -11/07/2021 02:54:24 - INFO - __main__ - Step 40417: {'lr': 0.0004213841992906496, 'samples': 7760064, 'steps': 40416, 'loss/train': 1.6190316677093506} -11/07/2021 02:54:24 - INFO - __main__ - Step 40418: {'lr': 0.0004213803357406055, 'samples': 7760256, 'steps': 40417, 'loss/train': 1.7742410898208618} -11/07/2021 02:54:25 - INFO - __main__ - Step 40419: {'lr': 0.00042137647211334007, 'samples': 7760448, 'steps': 40418, 'loss/train': 1.904790997505188} -11/07/2021 02:54:26 - INFO - __main__ - Step 40420: {'lr': 0.000421372608408855, 'samples': 7760640, 'steps': 40419, 'loss/train': 1.5416607856750488} -11/07/2021 02:54:26 - INFO - __main__ - Step 40421: {'lr': 0.0004213687446271522, 'samples': 7760832, 'steps': 40420, 'loss/train': 0.8516736030578613} -11/07/2021 02:54:27 - INFO - __main__ - Step 40422: {'lr': 0.0004213648807682332, 'samples': 7761024, 'steps': 40421, 'loss/train': 1.5297152996063232} -11/07/2021 02:54:27 - INFO - __main__ - Step 40423: {'lr': 0.00042136101683209993, 'samples': 7761216, 'steps': 40422, 'loss/train': 1.6230645179748535} -11/07/2021 02:54:27 - INFO - __main__ - Step 40424: {'lr': 0.00042135715281875393, 'samples': 7761408, 'steps': 40423, 'loss/train': 1.3259097337722778} -11/07/2021 02:54:28 - INFO - __main__ - Step 40425: {'lr': 0.000421353288728197, 'samples': 7761600, 'steps': 40424, 'loss/train': 1.081849455833435} -11/07/2021 02:54:29 - INFO - __main__ - Step 40426: {'lr': 0.00042134942456043104, 'samples': 7761792, 'steps': 40425, 'loss/train': 1.590003490447998} -11/07/2021 02:54:29 - INFO - __main__ - Step 40427: {'lr': 0.00042134556031545755, 'samples': 7761984, 'steps': 40426, 'loss/train': 1.2831095457077026} -11/07/2021 02:54:29 - INFO - __main__ - Step 40428: {'lr': 0.0004213416959932785, 'samples': 7762176, 'steps': 40427, 'loss/train': 1.867786169052124} -11/07/2021 02:54:30 - INFO - __main__ - Step 40429: {'lr': 0.0004213378315938955, 'samples': 7762368, 'steps': 40428, 'loss/train': 1.2048214673995972} -11/07/2021 02:54:30 - INFO - __main__ - Step 40430: {'lr': 0.0004213339671173103, 'samples': 7762560, 'steps': 40429, 'loss/train': 1.6742734909057617} -11/07/2021 02:54:31 - INFO - __main__ - Step 40431: {'lr': 0.00042133010256352466, 'samples': 7762752, 'steps': 40430, 'loss/train': 1.6833750009536743} -11/07/2021 02:54:32 - INFO - __main__ - Step 40432: {'lr': 0.00042132623793254034, 'samples': 7762944, 'steps': 40431, 'loss/train': 0.7925304770469666} -11/07/2021 02:54:32 - INFO - __main__ - Step 40433: {'lr': 0.0004213223732243591, 'samples': 7763136, 'steps': 40432, 'loss/train': 1.357794165611267} -11/07/2021 02:54:32 - INFO - __main__ - Step 40434: {'lr': 0.00042131850843898255, 'samples': 7763328, 'steps': 40433, 'loss/train': 1.5195480585098267} -11/07/2021 02:54:33 - INFO - __main__ - Step 40435: {'lr': 0.0004213146435764126, 'samples': 7763520, 'steps': 40434, 'loss/train': 0.5984975099563599} -11/07/2021 02:54:33 - INFO - __main__ - Step 40436: {'lr': 0.00042131077863665086, 'samples': 7763712, 'steps': 40435, 'loss/train': 1.5049656629562378} -11/07/2021 02:54:35 - INFO - __main__ - Step 40437: {'lr': 0.00042130691361969914, 'samples': 7763904, 'steps': 40436, 'loss/train': 0.2353384792804718} -11/07/2021 02:54:35 - INFO - __main__ - Step 40438: {'lr': 0.00042130304852555916, 'samples': 7764096, 'steps': 40437, 'loss/train': 1.421054482460022} -11/07/2021 02:54:35 - INFO - __main__ - Step 40439: {'lr': 0.00042129918335423265, 'samples': 7764288, 'steps': 40438, 'loss/train': 1.5775226354599} -11/07/2021 02:54:36 - INFO - __main__ - Step 40440: {'lr': 0.0004212953181057214, 'samples': 7764480, 'steps': 40439, 'loss/train': 1.0920753479003906} -11/07/2021 02:54:36 - INFO - __main__ - Step 40441: {'lr': 0.0004212914527800272, 'samples': 7764672, 'steps': 40440, 'loss/train': 0.48488837480545044} -11/07/2021 02:54:37 - INFO - __main__ - Step 40442: {'lr': 0.0004212875873771516, 'samples': 7764864, 'steps': 40441, 'loss/train': 0.532578706741333} -11/07/2021 02:54:37 - INFO - __main__ - Step 40443: {'lr': 0.0004212837218970965, 'samples': 7765056, 'steps': 40442, 'loss/train': 0.6872163414955139} -11/07/2021 02:54:38 - INFO - __main__ - Step 40444: {'lr': 0.00042127985633986365, 'samples': 7765248, 'steps': 40443, 'loss/train': 1.7978664636611938} -11/07/2021 02:54:38 - INFO - __main__ - Step 40445: {'lr': 0.0004212759907054546, 'samples': 7765440, 'steps': 40444, 'loss/train': 1.7988765239715576} -11/07/2021 02:54:39 - INFO - __main__ - Step 40446: {'lr': 0.00042127212499387136, 'samples': 7765632, 'steps': 40445, 'loss/train': 1.7115402221679688} -11/07/2021 02:54:40 - INFO - __main__ - Step 40447: {'lr': 0.0004212682592051155, 'samples': 7765824, 'steps': 40446, 'loss/train': 1.5423678159713745} -11/07/2021 02:54:40 - INFO - __main__ - Step 40448: {'lr': 0.0004212643933391888, 'samples': 7766016, 'steps': 40447, 'loss/train': 1.4345892667770386} -11/07/2021 02:54:40 - INFO - __main__ - Step 40449: {'lr': 0.000421260527396093, 'samples': 7766208, 'steps': 40448, 'loss/train': 1.547603726387024} -11/07/2021 02:54:41 - INFO - __main__ - Step 40450: {'lr': 0.0004212566613758299, 'samples': 7766400, 'steps': 40449, 'loss/train': 1.6221541166305542} -11/07/2021 02:54:41 - INFO - __main__ - Step 40451: {'lr': 0.00042125279527840124, 'samples': 7766592, 'steps': 40450, 'loss/train': 1.768631100654602} -11/07/2021 02:54:42 - INFO - __main__ - Step 40452: {'lr': 0.0004212489291038085, 'samples': 7766784, 'steps': 40451, 'loss/train': 1.3406453132629395} -11/07/2021 02:54:42 - INFO - __main__ - Step 40453: {'lr': 0.0004212450628520538, 'samples': 7766976, 'steps': 40452, 'loss/train': 1.6043791770935059} -11/07/2021 02:54:43 - INFO - __main__ - Step 40454: {'lr': 0.0004212411965231387, 'samples': 7767168, 'steps': 40453, 'loss/train': 1.3485994338989258} -11/07/2021 02:54:43 - INFO - __main__ - Step 40455: {'lr': 0.0004212373301170649, 'samples': 7767360, 'steps': 40454, 'loss/train': 1.7538222074508667} -11/07/2021 02:54:43 - INFO - __main__ - Step 40456: {'lr': 0.00042123346363383426, 'samples': 7767552, 'steps': 40455, 'loss/train': 2.2991220951080322} -11/07/2021 02:54:44 - INFO - __main__ - Step 40457: {'lr': 0.0004212295970734484, 'samples': 7767744, 'steps': 40456, 'loss/train': 1.1079826354980469} -11/07/2021 02:54:45 - INFO - __main__ - Step 40458: {'lr': 0.00042122573043590925, 'samples': 7767936, 'steps': 40457, 'loss/train': 1.0960724353790283} -11/07/2021 02:54:45 - INFO - __main__ - Step 40459: {'lr': 0.0004212218637212183, 'samples': 7768128, 'steps': 40458, 'loss/train': 1.659537672996521} -11/07/2021 02:54:45 - INFO - __main__ - Step 40460: {'lr': 0.00042121799692937747, 'samples': 7768320, 'steps': 40459, 'loss/train': 1.698103666305542} -11/07/2021 02:54:46 - INFO - __main__ - Step 40461: {'lr': 0.00042121413006038845, 'samples': 7768512, 'steps': 40460, 'loss/train': 1.0684001445770264} -11/07/2021 02:54:47 - INFO - __main__ - Step 40462: {'lr': 0.000421210263114253, 'samples': 7768704, 'steps': 40461, 'loss/train': 1.7173820734024048} -11/07/2021 02:54:47 - INFO - __main__ - Step 40463: {'lr': 0.00042120639609097277, 'samples': 7768896, 'steps': 40462, 'loss/train': 1.9047561883926392} -11/07/2021 02:54:47 - INFO - __main__ - Step 40464: {'lr': 0.0004212025289905497, 'samples': 7769088, 'steps': 40463, 'loss/train': 1.4366101026535034} -11/07/2021 02:54:48 - INFO - __main__ - Step 40465: {'lr': 0.0004211986618129854, 'samples': 7769280, 'steps': 40464, 'loss/train': 1.5336722135543823} -11/07/2021 02:54:48 - INFO - __main__ - Step 40466: {'lr': 0.00042119479455828153, 'samples': 7769472, 'steps': 40465, 'loss/train': 1.2135385274887085} -11/07/2021 02:54:48 - INFO - __main__ - Step 40467: {'lr': 0.00042119092722644, 'samples': 7769664, 'steps': 40466, 'loss/train': 1.1936951875686646} -11/07/2021 02:54:50 - INFO - __main__ - Step 40468: {'lr': 0.0004211870598174624, 'samples': 7769856, 'steps': 40467, 'loss/train': 1.0657728910446167} -11/07/2021 02:54:50 - INFO - __main__ - Step 40469: {'lr': 0.0004211831923313506, 'samples': 7770048, 'steps': 40468, 'loss/train': 1.6648720502853394} -11/07/2021 02:54:51 - INFO - __main__ - Step 40470: {'lr': 0.0004211793247681064, 'samples': 7770240, 'steps': 40469, 'loss/train': 1.7868831157684326} -11/07/2021 02:54:51 - INFO - __main__ - Step 40471: {'lr': 0.0004211754571277313, 'samples': 7770432, 'steps': 40470, 'loss/train': 1.7979527711868286} -11/07/2021 02:54:51 - INFO - __main__ - Step 40472: {'lr': 0.0004211715894102272, 'samples': 7770624, 'steps': 40471, 'loss/train': 1.8728834390640259} -11/07/2021 02:54:52 - INFO - __main__ - Step 40473: {'lr': 0.00042116772161559585, 'samples': 7770816, 'steps': 40472, 'loss/train': 1.4813945293426514} -11/07/2021 02:54:53 - INFO - __main__ - Step 40474: {'lr': 0.0004211638537438389, 'samples': 7771008, 'steps': 40473, 'loss/train': 1.855363368988037} -11/07/2021 02:54:53 - INFO - __main__ - Step 40475: {'lr': 0.0004211599857949583, 'samples': 7771200, 'steps': 40474, 'loss/train': 1.609128713607788} -11/07/2021 02:54:53 - INFO - __main__ - Step 40476: {'lr': 0.00042115611776895556, 'samples': 7771392, 'steps': 40475, 'loss/train': 0.9565662741661072} -11/07/2021 02:54:54 - INFO - __main__ - Step 40477: {'lr': 0.00042115224966583255, 'samples': 7771584, 'steps': 40476, 'loss/train': 1.084002137184143} -11/07/2021 02:54:55 - INFO - __main__ - Step 40478: {'lr': 0.00042114838148559093, 'samples': 7771776, 'steps': 40477, 'loss/train': 1.3256856203079224} -11/07/2021 02:54:55 - INFO - __main__ - Step 40479: {'lr': 0.0004211445132282325, 'samples': 7771968, 'steps': 40478, 'loss/train': 1.4972087144851685} -11/07/2021 02:54:55 - INFO - __main__ - Step 40480: {'lr': 0.000421140644893759, 'samples': 7772160, 'steps': 40479, 'loss/train': 0.7012211680412292} -11/07/2021 02:54:56 - INFO - __main__ - Step 40481: {'lr': 0.0004211367764821722, 'samples': 7772352, 'steps': 40480, 'loss/train': 1.6657418012619019} -11/07/2021 02:54:56 - INFO - __main__ - Step 40482: {'lr': 0.00042113290799347376, 'samples': 7772544, 'steps': 40481, 'loss/train': 1.779977560043335} -11/07/2021 02:54:57 - INFO - __main__ - Step 40483: {'lr': 0.00042112903942766546, 'samples': 7772736, 'steps': 40482, 'loss/train': 2.0749664306640625} -11/07/2021 02:54:58 - INFO - __main__ - Step 40484: {'lr': 0.00042112517078474914, 'samples': 7772928, 'steps': 40483, 'loss/train': 1.6234458684921265} -11/07/2021 02:54:58 - INFO - __main__ - Step 40485: {'lr': 0.0004211213020647264, 'samples': 7773120, 'steps': 40484, 'loss/train': 1.8211755752563477} -11/07/2021 02:54:58 - INFO - __main__ - Step 40486: {'lr': 0.00042111743326759903, 'samples': 7773312, 'steps': 40485, 'loss/train': 1.5641697645187378} -11/07/2021 02:54:59 - INFO - __main__ - Step 40487: {'lr': 0.00042111356439336877, 'samples': 7773504, 'steps': 40486, 'loss/train': 1.8205519914627075} -11/07/2021 02:54:59 - INFO - __main__ - Step 40488: {'lr': 0.0004211096954420375, 'samples': 7773696, 'steps': 40487, 'loss/train': 1.2478127479553223} -11/07/2021 02:55:00 - INFO - __main__ - Step 40489: {'lr': 0.0004211058264136067, 'samples': 7773888, 'steps': 40488, 'loss/train': 1.0244457721710205} -11/07/2021 02:55:00 - INFO - __main__ - Step 40490: {'lr': 0.0004211019573080783, 'samples': 7774080, 'steps': 40489, 'loss/train': 1.2829538583755493} -11/07/2021 02:55:01 - INFO - __main__ - Step 40491: {'lr': 0.00042109808812545405, 'samples': 7774272, 'steps': 40490, 'loss/train': 1.4776816368103027} -11/07/2021 02:55:01 - INFO - __main__ - Step 40492: {'lr': 0.0004210942188657356, 'samples': 7774464, 'steps': 40491, 'loss/train': 1.0204192399978638} -11/07/2021 02:55:01 - INFO - __main__ - Step 40493: {'lr': 0.00042109034952892473, 'samples': 7774656, 'steps': 40492, 'loss/train': 1.4715652465820312} -11/07/2021 02:55:03 - INFO - __main__ - Step 40494: {'lr': 0.00042108648011502314, 'samples': 7774848, 'steps': 40493, 'loss/train': 1.7918028831481934} -11/07/2021 02:55:03 - INFO - __main__ - Step 40495: {'lr': 0.00042108261062403276, 'samples': 7775040, 'steps': 40494, 'loss/train': 1.0174304246902466} -11/07/2021 02:55:03 - INFO - __main__ - Step 40496: {'lr': 0.00042107874105595507, 'samples': 7775232, 'steps': 40495, 'loss/train': 0.7235434055328369} -11/07/2021 02:55:04 - INFO - __main__ - Step 40497: {'lr': 0.00042107487141079206, 'samples': 7775424, 'steps': 40496, 'loss/train': 1.3755961656570435} -11/07/2021 02:55:04 - INFO - __main__ - Step 40498: {'lr': 0.00042107100168854516, 'samples': 7775616, 'steps': 40497, 'loss/train': 1.5656465291976929} -11/07/2021 02:55:04 - INFO - __main__ - Step 40499: {'lr': 0.00042106713188921647, 'samples': 7775808, 'steps': 40498, 'loss/train': 1.7913703918457031} -11/07/2021 02:55:06 - INFO - __main__ - Step 40500: {'lr': 0.00042106326201280756, 'samples': 7776000, 'steps': 40499, 'loss/train': 0.22071810066699982} -11/07/2021 02:55:06 - INFO - __main__ - Step 40501: {'lr': 0.0004210593920593201, 'samples': 7776192, 'steps': 40500, 'loss/train': 0.8095206618309021} -11/07/2021 02:55:07 - INFO - __main__ - Step 40502: {'lr': 0.000421055522028756, 'samples': 7776384, 'steps': 40501, 'loss/train': 0.4188019335269928} -11/07/2021 02:55:07 - INFO - __main__ - Step 40503: {'lr': 0.00042105165192111684, 'samples': 7776576, 'steps': 40502, 'loss/train': 1.5947679281234741} -11/07/2021 02:55:07 - INFO - __main__ - Step 40504: {'lr': 0.00042104778173640453, 'samples': 7776768, 'steps': 40503, 'loss/train': 1.7064250707626343} -11/07/2021 02:55:08 - INFO - __main__ - Step 40505: {'lr': 0.0004210439114746206, 'samples': 7776960, 'steps': 40504, 'loss/train': 1.4955432415008545} -11/07/2021 02:55:09 - INFO - __main__ - Step 40506: {'lr': 0.00042104004113576707, 'samples': 7777152, 'steps': 40505, 'loss/train': 1.7106342315673828} -11/07/2021 02:55:09 - INFO - __main__ - Step 40507: {'lr': 0.00042103617071984544, 'samples': 7777344, 'steps': 40506, 'loss/train': 1.195376992225647} -11/07/2021 02:55:09 - INFO - __main__ - Step 40508: {'lr': 0.00042103230022685765, 'samples': 7777536, 'steps': 40507, 'loss/train': 1.639768123626709} -11/07/2021 02:55:10 - INFO - __main__ - Step 40509: {'lr': 0.0004210284296568052, 'samples': 7777728, 'steps': 40508, 'loss/train': 1.5711511373519897} -11/07/2021 02:55:11 - INFO - __main__ - Step 40510: {'lr': 0.0004210245590096901, 'samples': 7777920, 'steps': 40509, 'loss/train': 1.082285761833191} -11/07/2021 02:55:11 - INFO - __main__ - Step 40511: {'lr': 0.000421020688285514, 'samples': 7778112, 'steps': 40510, 'loss/train': 1.4846168756484985} -11/07/2021 02:55:11 - INFO - __main__ - Step 40512: {'lr': 0.0004210168174842785, 'samples': 7778304, 'steps': 40511, 'loss/train': 1.407073974609375} -11/07/2021 02:55:12 - INFO - __main__ - Step 40513: {'lr': 0.00042101294660598556, 'samples': 7778496, 'steps': 40512, 'loss/train': 1.8460878133773804} -11/07/2021 02:55:12 - INFO - __main__ - Step 40514: {'lr': 0.0004210090756506367, 'samples': 7778688, 'steps': 40513, 'loss/train': 1.498748779296875} -11/07/2021 02:55:13 - INFO - __main__ - Step 40515: {'lr': 0.0004210052046182339, 'samples': 7778880, 'steps': 40514, 'loss/train': 1.8797236680984497} -11/07/2021 02:55:14 - INFO - __main__ - Step 40516: {'lr': 0.0004210013335087787, 'samples': 7779072, 'steps': 40515, 'loss/train': 1.5167568922042847} -11/07/2021 02:55:14 - INFO - __main__ - Step 40517: {'lr': 0.000420997462322273, 'samples': 7779264, 'steps': 40516, 'loss/train': 1.554261326789856} -11/07/2021 02:55:14 - INFO - __main__ - Step 40518: {'lr': 0.00042099359105871856, 'samples': 7779456, 'steps': 40517, 'loss/train': 0.995050311088562} -11/07/2021 02:55:15 - INFO - __main__ - Step 40519: {'lr': 0.00042098971971811695, 'samples': 7779648, 'steps': 40518, 'loss/train': 1.330376148223877} -11/07/2021 02:55:16 - INFO - __main__ - Step 40520: {'lr': 0.00042098584830047004, 'samples': 7779840, 'steps': 40519, 'loss/train': 1.555248498916626} -11/07/2021 02:55:16 - INFO - __main__ - Step 40521: {'lr': 0.00042098197680577956, 'samples': 7780032, 'steps': 40520, 'loss/train': 1.7325122356414795} -11/07/2021 02:55:16 - INFO - __main__ - Step 40522: {'lr': 0.00042097810523404714, 'samples': 7780224, 'steps': 40521, 'loss/train': 1.4902366399765015} -11/07/2021 02:55:17 - INFO - __main__ - Step 40523: {'lr': 0.0004209742335852747, 'samples': 7780416, 'steps': 40522, 'loss/train': 1.586439609527588} -11/07/2021 02:55:17 - INFO - __main__ - Step 40524: {'lr': 0.0004209703618594639, 'samples': 7780608, 'steps': 40523, 'loss/train': 1.4793297052383423} -11/07/2021 02:55:17 - INFO - __main__ - Step 40525: {'lr': 0.00042096649005661654, 'samples': 7780800, 'steps': 40524, 'loss/train': 1.5533337593078613} -11/07/2021 02:55:18 - INFO - __main__ - Step 40526: {'lr': 0.00042096261817673423, 'samples': 7780992, 'steps': 40525, 'loss/train': 1.506975769996643} -11/07/2021 02:55:19 - INFO - __main__ - Step 40527: {'lr': 0.0004209587462198189, 'samples': 7781184, 'steps': 40526, 'loss/train': 1.802403450012207} -11/07/2021 02:55:19 - INFO - __main__ - Step 40528: {'lr': 0.0004209548741858721, 'samples': 7781376, 'steps': 40527, 'loss/train': 1.5555566549301147} -11/07/2021 02:55:19 - INFO - __main__ - Step 40529: {'lr': 0.00042095100207489573, 'samples': 7781568, 'steps': 40528, 'loss/train': 1.3441355228424072} -11/07/2021 02:55:20 - INFO - __main__ - Step 40530: {'lr': 0.0004209471298868914, 'samples': 7781760, 'steps': 40529, 'loss/train': 1.8669350147247314} -11/07/2021 02:55:21 - INFO - __main__ - Step 40531: {'lr': 0.00042094325762186103, 'samples': 7781952, 'steps': 40530, 'loss/train': 1.5020253658294678} -11/07/2021 02:55:21 - INFO - __main__ - Step 40532: {'lr': 0.0004209393852798062, 'samples': 7782144, 'steps': 40531, 'loss/train': 1.7007616758346558} -11/07/2021 02:55:21 - INFO - __main__ - Step 40533: {'lr': 0.00042093551286072887, 'samples': 7782336, 'steps': 40532, 'loss/train': 1.5439091920852661} -11/07/2021 02:55:22 - INFO - __main__ - Step 40534: {'lr': 0.00042093164036463045, 'samples': 7782528, 'steps': 40533, 'loss/train': 1.5337989330291748} -11/07/2021 02:55:22 - INFO - __main__ - Step 40535: {'lr': 0.0004209277677915129, 'samples': 7782720, 'steps': 40534, 'loss/train': 1.3965024948120117} -11/07/2021 02:55:24 - INFO - __main__ - Step 40536: {'lr': 0.000420923895141378, 'samples': 7782912, 'steps': 40535, 'loss/train': 1.4856348037719727} -11/07/2021 02:55:24 - INFO - __main__ - Step 40537: {'lr': 0.0004209200224142274, 'samples': 7783104, 'steps': 40536, 'loss/train': 1.4512770175933838} -11/07/2021 02:55:24 - INFO - __main__ - Step 40538: {'lr': 0.0004209161496100629, 'samples': 7783296, 'steps': 40537, 'loss/train': 0.8187178373336792} -11/07/2021 02:55:25 - INFO - __main__ - Step 40539: {'lr': 0.00042091227672888624, 'samples': 7783488, 'steps': 40538, 'loss/train': 1.7245628833770752} -11/07/2021 02:55:25 - INFO - __main__ - Step 40540: {'lr': 0.00042090840377069906, 'samples': 7783680, 'steps': 40539, 'loss/train': 1.4943673610687256} -11/07/2021 02:55:25 - INFO - __main__ - Step 40541: {'lr': 0.00042090453073550323, 'samples': 7783872, 'steps': 40540, 'loss/train': 1.4821431636810303} -11/07/2021 02:55:26 - INFO - __main__ - Step 40542: {'lr': 0.0004209006576233004, 'samples': 7784064, 'steps': 40541, 'loss/train': 1.2041219472885132} -11/07/2021 02:55:27 - INFO - __main__ - Step 40543: {'lr': 0.0004208967844340925, 'samples': 7784256, 'steps': 40542, 'loss/train': 1.1263279914855957} -11/07/2021 02:55:27 - INFO - __main__ - Step 40544: {'lr': 0.0004208929111678811, 'samples': 7784448, 'steps': 40543, 'loss/train': 1.6190506219863892} -11/07/2021 02:55:28 - INFO - __main__ - Step 40545: {'lr': 0.0004208890378246679, 'samples': 7784640, 'steps': 40544, 'loss/train': 1.5942102670669556} -11/07/2021 02:55:28 - INFO - __main__ - Step 40546: {'lr': 0.00042088516440445486, 'samples': 7784832, 'steps': 40545, 'loss/train': 0.7566236853599548} -11/07/2021 02:55:29 - INFO - __main__ - Step 40547: {'lr': 0.0004208812909072435, 'samples': 7785024, 'steps': 40546, 'loss/train': 1.7903724908828735} -11/07/2021 02:55:29 - INFO - __main__ - Step 40548: {'lr': 0.00042087741733303575, 'samples': 7785216, 'steps': 40547, 'loss/train': 1.1815096139907837} -11/07/2021 02:55:30 - INFO - __main__ - Step 40549: {'lr': 0.00042087354368183316, 'samples': 7785408, 'steps': 40548, 'loss/train': 1.5147377252578735} -11/07/2021 02:55:30 - INFO - __main__ - Step 40550: {'lr': 0.00042086966995363774, 'samples': 7785600, 'steps': 40549, 'loss/train': 1.6385198831558228} -11/07/2021 02:55:30 - INFO - __main__ - Step 40551: {'lr': 0.000420865796148451, 'samples': 7785792, 'steps': 40550, 'loss/train': 1.3999335765838623} -11/07/2021 02:55:31 - INFO - __main__ - Step 40552: {'lr': 0.00042086192226627476, 'samples': 7785984, 'steps': 40551, 'loss/train': 0.5500167608261108} -11/07/2021 02:55:32 - INFO - __main__ - Step 40553: {'lr': 0.00042085804830711084, 'samples': 7786176, 'steps': 40552, 'loss/train': 1.6004263162612915} -11/07/2021 02:55:32 - INFO - __main__ - Step 40554: {'lr': 0.00042085417427096085, 'samples': 7786368, 'steps': 40553, 'loss/train': 1.3719244003295898} -11/07/2021 02:55:32 - INFO - __main__ - Step 40555: {'lr': 0.0004208503001578266, 'samples': 7786560, 'steps': 40554, 'loss/train': 1.30928373336792} -11/07/2021 02:55:33 - INFO - __main__ - Step 40556: {'lr': 0.00042084642596770984, 'samples': 7786752, 'steps': 40555, 'loss/train': 1.6300101280212402} -11/07/2021 02:55:34 - INFO - __main__ - Step 40557: {'lr': 0.0004208425517006124, 'samples': 7786944, 'steps': 40556, 'loss/train': 1.650418758392334} -11/07/2021 02:55:34 - INFO - __main__ - Step 40558: {'lr': 0.0004208386773565359, 'samples': 7787136, 'steps': 40557, 'loss/train': 1.234565258026123} -11/07/2021 02:55:34 - INFO - __main__ - Step 40559: {'lr': 0.0004208348029354821, 'samples': 7787328, 'steps': 40558, 'loss/train': 1.5747935771942139} -11/07/2021 02:55:35 - INFO - __main__ - Step 40560: {'lr': 0.00042083092843745275, 'samples': 7787520, 'steps': 40559, 'loss/train': 1.7562403678894043} -11/07/2021 02:55:35 - INFO - __main__ - Step 40561: {'lr': 0.0004208270538624497, 'samples': 7787712, 'steps': 40560, 'loss/train': 1.1333563327789307} -11/07/2021 02:55:36 - INFO - __main__ - Step 40562: {'lr': 0.00042082317921047455, 'samples': 7787904, 'steps': 40561, 'loss/train': 1.908737063407898} -11/07/2021 02:55:37 - INFO - __main__ - Step 40563: {'lr': 0.0004208193044815291, 'samples': 7788096, 'steps': 40562, 'loss/train': 1.2895712852478027} -11/07/2021 02:55:37 - INFO - __main__ - Step 40564: {'lr': 0.0004208154296756152, 'samples': 7788288, 'steps': 40563, 'loss/train': 1.5736141204833984} -11/07/2021 02:55:37 - INFO - __main__ - Step 40565: {'lr': 0.0004208115547927345, 'samples': 7788480, 'steps': 40564, 'loss/train': 1.2707369327545166} -11/07/2021 02:55:38 - INFO - __main__ - Step 40566: {'lr': 0.0004208076798328886, 'samples': 7788672, 'steps': 40565, 'loss/train': 2.010261058807373} -11/07/2021 02:55:38 - INFO - __main__ - Step 40567: {'lr': 0.00042080380479607947, 'samples': 7788864, 'steps': 40566, 'loss/train': 1.1383821964263916} -11/07/2021 02:55:39 - INFO - __main__ - Step 40568: {'lr': 0.00042079992968230886, 'samples': 7789056, 'steps': 40567, 'loss/train': 1.415386438369751} -11/07/2021 02:55:39 - INFO - __main__ - Step 40569: {'lr': 0.0004207960544915784, 'samples': 7789248, 'steps': 40568, 'loss/train': 1.236395239830017} -11/07/2021 02:55:40 - INFO - __main__ - Step 40570: {'lr': 0.0004207921792238898, 'samples': 7789440, 'steps': 40569, 'loss/train': 1.6369279623031616} -11/07/2021 02:55:40 - INFO - __main__ - Step 40571: {'lr': 0.0004207883038792449, 'samples': 7789632, 'steps': 40570, 'loss/train': 1.3528670072555542} -11/07/2021 02:55:41 - INFO - __main__ - Step 40572: {'lr': 0.0004207844284576455, 'samples': 7789824, 'steps': 40571, 'loss/train': 1.7188644409179688} -11/07/2021 02:55:42 - INFO - __main__ - Step 40573: {'lr': 0.0004207805529590932, 'samples': 7790016, 'steps': 40572, 'loss/train': 1.762956976890564} -11/07/2021 02:55:42 - INFO - __main__ - Step 40574: {'lr': 0.0004207766773835899, 'samples': 7790208, 'steps': 40573, 'loss/train': 1.1353379487991333} -11/07/2021 02:55:43 - INFO - __main__ - Step 40575: {'lr': 0.0004207728017311372, 'samples': 7790400, 'steps': 40574, 'loss/train': 0.41304847598075867} -11/07/2021 02:55:43 - INFO - __main__ - Step 40576: {'lr': 0.0004207689260017369, 'samples': 7790592, 'steps': 40575, 'loss/train': 1.788718581199646} -11/07/2021 02:55:43 - INFO - __main__ - Step 40577: {'lr': 0.0004207650501953908, 'samples': 7790784, 'steps': 40576, 'loss/train': 1.785046100616455} -11/07/2021 02:55:44 - INFO - __main__ - Step 40578: {'lr': 0.0004207611743121006, 'samples': 7790976, 'steps': 40577, 'loss/train': 1.5799282789230347} -11/07/2021 02:55:45 - INFO - __main__ - Step 40579: {'lr': 0.00042075729835186807, 'samples': 7791168, 'steps': 40578, 'loss/train': 1.4899252653121948} -11/07/2021 02:55:45 - INFO - __main__ - Step 40580: {'lr': 0.0004207534223146948, 'samples': 7791360, 'steps': 40579, 'loss/train': 1.3295331001281738} -11/07/2021 02:55:45 - INFO - __main__ - Step 40581: {'lr': 0.0004207495462005828, 'samples': 7791552, 'steps': 40580, 'loss/train': 1.9620747566223145} -11/07/2021 02:55:46 - INFO - __main__ - Step 40582: {'lr': 0.0004207456700095337, 'samples': 7791744, 'steps': 40581, 'loss/train': 1.3816947937011719} -11/07/2021 02:55:47 - INFO - __main__ - Step 40583: {'lr': 0.0004207417937415492, 'samples': 7791936, 'steps': 40582, 'loss/train': 1.445510745048523} -11/07/2021 02:55:47 - INFO - __main__ - Step 40584: {'lr': 0.000420737917396631, 'samples': 7792128, 'steps': 40583, 'loss/train': 1.6489579677581787} -11/07/2021 02:55:48 - INFO - __main__ - Step 40585: {'lr': 0.00042073404097478105, 'samples': 7792320, 'steps': 40584, 'loss/train': 1.4975324869155884} -11/07/2021 02:55:48 - INFO - __main__ - Step 40586: {'lr': 0.000420730164476001, 'samples': 7792512, 'steps': 40585, 'loss/train': 2.274691104888916} -11/07/2021 02:55:48 - INFO - __main__ - Step 40587: {'lr': 0.00042072628790029243, 'samples': 7792704, 'steps': 40586, 'loss/train': 1.5260604619979858} -11/07/2021 02:55:49 - INFO - __main__ - Step 40588: {'lr': 0.0004207224112476573, 'samples': 7792896, 'steps': 40587, 'loss/train': 1.7950011491775513} -11/07/2021 02:55:50 - INFO - __main__ - Step 40589: {'lr': 0.0004207185345180973, 'samples': 7793088, 'steps': 40588, 'loss/train': 1.7205456495285034} -11/07/2021 02:55:50 - INFO - __main__ - Step 40590: {'lr': 0.00042071465771161416, 'samples': 7793280, 'steps': 40589, 'loss/train': 1.4447256326675415} -11/07/2021 02:55:50 - INFO - __main__ - Step 40591: {'lr': 0.0004207107808282097, 'samples': 7793472, 'steps': 40590, 'loss/train': 1.3997273445129395} -11/07/2021 02:55:51 - INFO - __main__ - Step 40592: {'lr': 0.00042070690386788545, 'samples': 7793664, 'steps': 40591, 'loss/train': 1.5835875272750854} -11/07/2021 02:55:52 - INFO - __main__ - Step 40593: {'lr': 0.0004207030268306434, 'samples': 7793856, 'steps': 40592, 'loss/train': 1.679340124130249} -11/07/2021 02:55:52 - INFO - __main__ - Step 40594: {'lr': 0.00042069914971648516, 'samples': 7794048, 'steps': 40593, 'loss/train': 1.6571979522705078} -11/07/2021 02:55:53 - INFO - __main__ - Step 40595: {'lr': 0.0004206952725254125, 'samples': 7794240, 'steps': 40594, 'loss/train': 1.4698810577392578} -11/07/2021 02:55:53 - INFO - __main__ - Step 40596: {'lr': 0.00042069139525742727, 'samples': 7794432, 'steps': 40595, 'loss/train': 1.6492644548416138} -11/07/2021 02:55:53 - INFO - __main__ - Step 40597: {'lr': 0.000420687517912531, 'samples': 7794624, 'steps': 40596, 'loss/train': 1.3679529428482056} -11/07/2021 02:55:54 - INFO - __main__ - Step 40598: {'lr': 0.0004206836404907257, 'samples': 7794816, 'steps': 40597, 'loss/train': 1.3563146591186523} -11/07/2021 02:55:55 - INFO - __main__ - Step 40599: {'lr': 0.0004206797629920129, 'samples': 7795008, 'steps': 40598, 'loss/train': 1.6323126554489136} -11/07/2021 02:55:55 - INFO - __main__ - Step 40600: {'lr': 0.0004206758854163945, 'samples': 7795200, 'steps': 40599, 'loss/train': 1.3663840293884277} -11/07/2021 02:55:55 - INFO - __main__ - Step 40601: {'lr': 0.00042067200776387215, 'samples': 7795392, 'steps': 40600, 'loss/train': 1.5179119110107422} -11/07/2021 02:55:56 - INFO - __main__ - Step 40602: {'lr': 0.0004206681300344476, 'samples': 7795584, 'steps': 40601, 'loss/train': 1.5285123586654663} -11/07/2021 02:55:56 - INFO - __main__ - Step 40603: {'lr': 0.0004206642522281227, 'samples': 7795776, 'steps': 40602, 'loss/train': 1.7061302661895752} -11/07/2021 02:55:57 - INFO - __main__ - Step 40604: {'lr': 0.000420660374344899, 'samples': 7795968, 'steps': 40603, 'loss/train': 1.711515188217163} -11/07/2021 02:55:57 - INFO - __main__ - Step 40605: {'lr': 0.00042065649638477843, 'samples': 7796160, 'steps': 40604, 'loss/train': 1.5275837182998657} -11/07/2021 02:55:58 - INFO - __main__ - Step 40606: {'lr': 0.0004206526183477627, 'samples': 7796352, 'steps': 40605, 'loss/train': 1.5344431400299072} -11/07/2021 02:55:58 - INFO - __main__ - Step 40607: {'lr': 0.0004206487402338535, 'samples': 7796544, 'steps': 40606, 'loss/train': 1.5935360193252563} -11/07/2021 02:55:59 - INFO - __main__ - Step 40608: {'lr': 0.00042064486204305263, 'samples': 7796736, 'steps': 40607, 'loss/train': 1.5178614854812622} -11/07/2021 02:56:00 - INFO - __main__ - Step 40609: {'lr': 0.0004206409837753618, 'samples': 7796928, 'steps': 40608, 'loss/train': 1.832965612411499} -11/07/2021 02:56:00 - INFO - __main__ - Step 40610: {'lr': 0.00042063710543078283, 'samples': 7797120, 'steps': 40609, 'loss/train': 1.4966989755630493} -11/07/2021 02:56:00 - INFO - __main__ - Step 40611: {'lr': 0.00042063322700931733, 'samples': 7797312, 'steps': 40610, 'loss/train': 1.3636682033538818} -11/07/2021 02:56:01 - INFO - __main__ - Step 40612: {'lr': 0.0004206293485109672, 'samples': 7797504, 'steps': 40611, 'loss/train': 2.53975248336792} -11/07/2021 02:56:01 - INFO - __main__ - Step 40613: {'lr': 0.0004206254699357341, 'samples': 7797696, 'steps': 40612, 'loss/train': 1.1263415813446045} -11/07/2021 02:56:02 - INFO - __main__ - Step 40614: {'lr': 0.00042062159128361976, 'samples': 7797888, 'steps': 40613, 'loss/train': 2.1661019325256348} -11/07/2021 02:56:02 - INFO - __main__ - Step 40615: {'lr': 0.000420617712554626, 'samples': 7798080, 'steps': 40614, 'loss/train': 1.3241528272628784} -11/07/2021 02:56:03 - INFO - __main__ - Step 40616: {'lr': 0.0004206138337487545, 'samples': 7798272, 'steps': 40615, 'loss/train': 0.6974542140960693} -11/07/2021 02:56:03 - INFO - __main__ - Step 40617: {'lr': 0.0004206099548660071, 'samples': 7798464, 'steps': 40616, 'loss/train': 1.47562575340271} -11/07/2021 02:56:03 - INFO - __main__ - Step 40618: {'lr': 0.00042060607590638547, 'samples': 7798656, 'steps': 40617, 'loss/train': 1.7578154802322388} -11/07/2021 02:56:04 - INFO - __main__ - Step 40619: {'lr': 0.00042060219686989133, 'samples': 7798848, 'steps': 40618, 'loss/train': 1.2786564826965332} -11/07/2021 02:56:05 - INFO - __main__ - Step 40620: {'lr': 0.00042059831775652644, 'samples': 7799040, 'steps': 40619, 'loss/train': 1.3147251605987549} -11/07/2021 02:56:05 - INFO - __main__ - Step 40621: {'lr': 0.00042059443856629265, 'samples': 7799232, 'steps': 40620, 'loss/train': 1.4205396175384521} -11/07/2021 02:56:06 - INFO - __main__ - Step 40622: {'lr': 0.00042059055929919163, 'samples': 7799424, 'steps': 40621, 'loss/train': 1.4647282361984253} -11/07/2021 02:56:06 - INFO - __main__ - Step 40623: {'lr': 0.00042058667995522513, 'samples': 7799616, 'steps': 40622, 'loss/train': 0.836337149143219} -11/07/2021 02:56:07 - INFO - __main__ - Step 40624: {'lr': 0.0004205828005343949, 'samples': 7799808, 'steps': 40623, 'loss/train': 1.6595656871795654} -11/07/2021 02:56:07 - INFO - __main__ - Step 40625: {'lr': 0.00042057892103670275, 'samples': 7800000, 'steps': 40624, 'loss/train': 1.6615570783615112} -11/07/2021 02:56:08 - INFO - __main__ - Step 40626: {'lr': 0.0004205750414621503, 'samples': 7800192, 'steps': 40625, 'loss/train': 1.3805701732635498} -11/07/2021 02:56:08 - INFO - __main__ - Step 40627: {'lr': 0.0004205711618107394, 'samples': 7800384, 'steps': 40626, 'loss/train': 2.026540517807007} -11/07/2021 02:56:08 - INFO - __main__ - Step 40628: {'lr': 0.00042056728208247175, 'samples': 7800576, 'steps': 40627, 'loss/train': 1.489866852760315} -11/07/2021 02:56:09 - INFO - __main__ - Step 40629: {'lr': 0.0004205634022773491, 'samples': 7800768, 'steps': 40628, 'loss/train': 1.2569215297698975} -11/07/2021 02:56:10 - INFO - __main__ - Step 40630: {'lr': 0.0004205595223953732, 'samples': 7800960, 'steps': 40629, 'loss/train': 1.34797203540802} -11/07/2021 02:56:10 - INFO - __main__ - Step 40631: {'lr': 0.0004205556424365459, 'samples': 7801152, 'steps': 40630, 'loss/train': 1.273876428604126} -11/07/2021 02:56:10 - INFO - __main__ - Step 40632: {'lr': 0.0004205517624008688, 'samples': 7801344, 'steps': 40631, 'loss/train': 1.5526227951049805} -11/07/2021 02:56:11 - INFO - __main__ - Step 40633: {'lr': 0.00042054788228834374, 'samples': 7801536, 'steps': 40632, 'loss/train': 1.3163074254989624} -11/07/2021 02:56:11 - INFO - __main__ - Step 40634: {'lr': 0.0004205440020989724, 'samples': 7801728, 'steps': 40633, 'loss/train': 1.474863886833191} -11/07/2021 02:56:12 - INFO - __main__ - Step 40635: {'lr': 0.0004205401218327565, 'samples': 7801920, 'steps': 40634, 'loss/train': 1.6535274982452393} -11/07/2021 02:56:13 - INFO - __main__ - Step 40636: {'lr': 0.0004205362414896979, 'samples': 7802112, 'steps': 40635, 'loss/train': 1.746715784072876} -11/07/2021 02:56:13 - INFO - __main__ - Step 40637: {'lr': 0.0004205323610697984, 'samples': 7802304, 'steps': 40636, 'loss/train': 1.7244786024093628} -11/07/2021 02:56:13 - INFO - __main__ - Step 40638: {'lr': 0.0004205284805730596, 'samples': 7802496, 'steps': 40637, 'loss/train': 1.8182399272918701} -11/07/2021 02:56:14 - INFO - __main__ - Step 40639: {'lr': 0.00042052459999948323, 'samples': 7802688, 'steps': 40638, 'loss/train': 1.222219467163086} -11/07/2021 02:56:14 - INFO - __main__ - Step 40640: {'lr': 0.00042052071934907116, 'samples': 7802880, 'steps': 40639, 'loss/train': 1.7510050535202026} -11/07/2021 02:56:15 - INFO - __main__ - Step 40641: {'lr': 0.00042051683862182504, 'samples': 7803072, 'steps': 40640, 'loss/train': 1.3503400087356567} -11/07/2021 02:56:15 - INFO - __main__ - Step 40642: {'lr': 0.0004205129578177467, 'samples': 7803264, 'steps': 40641, 'loss/train': 1.3796998262405396} -11/07/2021 02:56:16 - INFO - __main__ - Step 40643: {'lr': 0.0004205090769368379, 'samples': 7803456, 'steps': 40642, 'loss/train': 1.7264069318771362} -11/07/2021 02:56:16 - INFO - __main__ - Step 40644: {'lr': 0.00042050519597910024, 'samples': 7803648, 'steps': 40643, 'loss/train': 1.688590168952942} -11/07/2021 02:56:16 - INFO - __main__ - Step 40645: {'lr': 0.00042050131494453567, 'samples': 7803840, 'steps': 40644, 'loss/train': 1.254162311553955} -11/07/2021 02:56:18 - INFO - __main__ - Step 40646: {'lr': 0.00042049743383314577, 'samples': 7804032, 'steps': 40645, 'loss/train': 1.396903395652771} -11/07/2021 02:56:18 - INFO - __main__ - Step 40647: {'lr': 0.0004204935526449324, 'samples': 7804224, 'steps': 40646, 'loss/train': 1.4807292222976685} -11/07/2021 02:56:18 - INFO - __main__ - Step 40648: {'lr': 0.0004204896713798972, 'samples': 7804416, 'steps': 40647, 'loss/train': 1.357002854347229} -11/07/2021 02:56:19 - INFO - __main__ - Step 40649: {'lr': 0.00042048579003804205, 'samples': 7804608, 'steps': 40648, 'loss/train': 1.4147695302963257} -11/07/2021 02:56:19 - INFO - __main__ - Step 40650: {'lr': 0.00042048190861936866, 'samples': 7804800, 'steps': 40649, 'loss/train': 1.5080392360687256} -11/07/2021 02:56:20 - INFO - __main__ - Step 40651: {'lr': 0.0004204780271238786, 'samples': 7804992, 'steps': 40650, 'loss/train': 1.3220431804656982} -11/07/2021 02:56:20 - INFO - __main__ - Step 40652: {'lr': 0.00042047414555157394, 'samples': 7805184, 'steps': 40651, 'loss/train': 1.7669703960418701} -11/07/2021 02:56:21 - INFO - __main__ - Step 40653: {'lr': 0.0004204702639024562, 'samples': 7805376, 'steps': 40652, 'loss/train': 1.8579809665679932} -11/07/2021 02:56:21 - INFO - __main__ - Step 40654: {'lr': 0.00042046638217652717, 'samples': 7805568, 'steps': 40653, 'loss/train': 1.3786760568618774} -11/07/2021 02:56:21 - INFO - __main__ - Step 40655: {'lr': 0.00042046250037378865, 'samples': 7805760, 'steps': 40654, 'loss/train': 1.4152415990829468} -11/07/2021 02:56:22 - INFO - __main__ - Step 40656: {'lr': 0.0004204586184942423, 'samples': 7805952, 'steps': 40655, 'loss/train': 1.5150220394134521} -11/07/2021 02:56:23 - INFO - __main__ - Step 40657: {'lr': 0.00042045473653789004, 'samples': 7806144, 'steps': 40656, 'loss/train': 1.9052633047103882} -11/07/2021 02:56:23 - INFO - __main__ - Step 40658: {'lr': 0.00042045085450473336, 'samples': 7806336, 'steps': 40657, 'loss/train': 1.6889491081237793} -11/07/2021 02:56:23 - INFO - __main__ - Step 40659: {'lr': 0.00042044697239477423, 'samples': 7806528, 'steps': 40658, 'loss/train': 1.0255661010742188} -11/07/2021 02:56:24 - INFO - __main__ - Step 40660: {'lr': 0.00042044309020801434, 'samples': 7806720, 'steps': 40659, 'loss/train': 1.272469162940979} -11/07/2021 02:56:24 - INFO - __main__ - Step 40661: {'lr': 0.00042043920794445543, 'samples': 7806912, 'steps': 40660, 'loss/train': 1.1650625467300415} -11/07/2021 02:56:25 - INFO - __main__ - Step 40662: {'lr': 0.0004204353256040992, 'samples': 7807104, 'steps': 40661, 'loss/train': 1.1032905578613281} -11/07/2021 02:56:26 - INFO - __main__ - Step 40663: {'lr': 0.0004204314431869475, 'samples': 7807296, 'steps': 40662, 'loss/train': 1.5344452857971191} -11/07/2021 02:56:26 - INFO - __main__ - Step 40664: {'lr': 0.0004204275606930019, 'samples': 7807488, 'steps': 40663, 'loss/train': 1.6054086685180664} -11/07/2021 02:56:26 - INFO - __main__ - Step 40665: {'lr': 0.00042042367812226446, 'samples': 7807680, 'steps': 40664, 'loss/train': 1.3232537508010864} -11/07/2021 02:56:27 - INFO - __main__ - Step 40666: {'lr': 0.00042041979547473665, 'samples': 7807872, 'steps': 40665, 'loss/train': 1.46358060836792} -11/07/2021 02:56:28 - INFO - __main__ - Step 40667: {'lr': 0.0004204159127504202, 'samples': 7808064, 'steps': 40666, 'loss/train': 1.802840232849121} -11/07/2021 02:56:28 - INFO - __main__ - Step 40668: {'lr': 0.0004204120299493171, 'samples': 7808256, 'steps': 40667, 'loss/train': 0.9984766244888306} -11/07/2021 02:56:28 - INFO - __main__ - Step 40669: {'lr': 0.0004204081470714289, 'samples': 7808448, 'steps': 40668, 'loss/train': 1.5101535320281982} -11/07/2021 02:56:29 - INFO - __main__ - Step 40670: {'lr': 0.00042040426411675747, 'samples': 7808640, 'steps': 40669, 'loss/train': 1.0501954555511475} -11/07/2021 02:56:29 - INFO - __main__ - Step 40671: {'lr': 0.0004204003810853045, 'samples': 7808832, 'steps': 40670, 'loss/train': 1.3344838619232178} -11/07/2021 02:56:30 - INFO - __main__ - Step 40672: {'lr': 0.00042039649797707176, 'samples': 7809024, 'steps': 40671, 'loss/train': 1.6589035987854004} -11/07/2021 02:56:31 - INFO - __main__ - Step 40673: {'lr': 0.0004203926147920609, 'samples': 7809216, 'steps': 40672, 'loss/train': 0.6955644488334656} -11/07/2021 02:56:31 - INFO - __main__ - Step 40674: {'lr': 0.0004203887315302739, 'samples': 7809408, 'steps': 40673, 'loss/train': 1.543953776359558} -11/07/2021 02:56:31 - INFO - __main__ - Step 40675: {'lr': 0.0004203848481917122, 'samples': 7809600, 'steps': 40674, 'loss/train': 1.5235605239868164} -11/07/2021 02:56:32 - INFO - __main__ - Step 40676: {'lr': 0.00042038096477637786, 'samples': 7809792, 'steps': 40675, 'loss/train': 1.1400928497314453} -11/07/2021 02:56:33 - INFO - __main__ - Step 40677: {'lr': 0.00042037708128427243, 'samples': 7809984, 'steps': 40676, 'loss/train': 1.9184764623641968} -11/07/2021 02:56:33 - INFO - __main__ - Step 40678: {'lr': 0.00042037319771539775, 'samples': 7810176, 'steps': 40677, 'loss/train': 1.3890955448150635} -11/07/2021 02:56:33 - INFO - __main__ - Step 40679: {'lr': 0.00042036931406975547, 'samples': 7810368, 'steps': 40678, 'loss/train': 0.9071448445320129} -11/07/2021 02:56:34 - INFO - __main__ - Step 40680: {'lr': 0.0004203654303473474, 'samples': 7810560, 'steps': 40679, 'loss/train': 1.413865327835083} -11/07/2021 02:56:34 - INFO - __main__ - Step 40681: {'lr': 0.0004203615465481754, 'samples': 7810752, 'steps': 40680, 'loss/train': 1.401404857635498} -11/07/2021 02:56:35 - INFO - __main__ - Step 40682: {'lr': 0.0004203576626722411, 'samples': 7810944, 'steps': 40681, 'loss/train': 1.5267057418823242} -11/07/2021 02:56:35 - INFO - __main__ - Step 40683: {'lr': 0.00042035377871954614, 'samples': 7811136, 'steps': 40682, 'loss/train': 0.5235815048217773} -11/07/2021 02:56:36 - INFO - __main__ - Step 40684: {'lr': 0.00042034989469009245, 'samples': 7811328, 'steps': 40683, 'loss/train': 1.418968915939331} -11/07/2021 02:56:36 - INFO - __main__ - Step 40685: {'lr': 0.0004203460105838818, 'samples': 7811520, 'steps': 40684, 'loss/train': 1.3702691793441772} -11/07/2021 02:56:36 - INFO - __main__ - Step 40686: {'lr': 0.00042034212640091587, 'samples': 7811712, 'steps': 40685, 'loss/train': 1.2421624660491943} -11/07/2021 02:56:37 - INFO - __main__ - Step 40687: {'lr': 0.00042033824214119633, 'samples': 7811904, 'steps': 40686, 'loss/train': 1.2181388139724731} -11/07/2021 02:56:38 - INFO - __main__ - Step 40688: {'lr': 0.00042033435780472494, 'samples': 7812096, 'steps': 40687, 'loss/train': 1.5045456886291504} -11/07/2021 02:56:38 - INFO - __main__ - Step 40689: {'lr': 0.00042033047339150363, 'samples': 7812288, 'steps': 40688, 'loss/train': 1.4343459606170654} -11/07/2021 02:56:39 - INFO - __main__ - Step 40690: {'lr': 0.00042032658890153404, 'samples': 7812480, 'steps': 40689, 'loss/train': 1.233680009841919} -11/07/2021 02:56:39 - INFO - __main__ - Step 40691: {'lr': 0.0004203227043348179, 'samples': 7812672, 'steps': 40690, 'loss/train': 1.5752936601638794} -11/07/2021 02:56:39 - INFO - __main__ - Step 40692: {'lr': 0.000420318819691357, 'samples': 7812864, 'steps': 40691, 'loss/train': 1.6695582866668701} -11/07/2021 02:56:40 - INFO - __main__ - Step 40693: {'lr': 0.00042031493497115304, 'samples': 7813056, 'steps': 40692, 'loss/train': 1.7513031959533691} -11/07/2021 02:56:41 - INFO - __main__ - Step 40694: {'lr': 0.0004203110501742078, 'samples': 7813248, 'steps': 40693, 'loss/train': 0.9645717740058899} -11/07/2021 02:56:41 - INFO - __main__ - Step 40695: {'lr': 0.00042030716530052297, 'samples': 7813440, 'steps': 40694, 'loss/train': 1.6265499591827393} -11/07/2021 02:56:41 - INFO - __main__ - Step 40696: {'lr': 0.00042030328035010047, 'samples': 7813632, 'steps': 40695, 'loss/train': 1.2691519260406494} -11/07/2021 02:56:42 - INFO - __main__ - Step 40697: {'lr': 0.0004202993953229418, 'samples': 7813824, 'steps': 40696, 'loss/train': 1.6467305421829224} -11/07/2021 02:56:43 - INFO - __main__ - Step 40698: {'lr': 0.000420295510219049, 'samples': 7814016, 'steps': 40697, 'loss/train': 1.8103171586990356} -11/07/2021 02:56:43 - INFO - __main__ - Step 40699: {'lr': 0.00042029162503842357, 'samples': 7814208, 'steps': 40698, 'loss/train': 1.101730465888977} -11/07/2021 02:56:43 - INFO - __main__ - Step 40700: {'lr': 0.0004202877397810674, 'samples': 7814400, 'steps': 40699, 'loss/train': 1.522147536277771} -11/07/2021 02:56:44 - INFO - __main__ - Step 40701: {'lr': 0.0004202838544469822, 'samples': 7814592, 'steps': 40700, 'loss/train': 1.5229068994522095} -11/07/2021 02:56:44 - INFO - __main__ - Step 40702: {'lr': 0.00042027996903616974, 'samples': 7814784, 'steps': 40701, 'loss/train': 1.5482386350631714} -11/07/2021 02:56:45 - INFO - __main__ - Step 40703: {'lr': 0.0004202760835486317, 'samples': 7814976, 'steps': 40702, 'loss/train': 1.3894777297973633} -11/07/2021 02:56:46 - INFO - __main__ - Step 40704: {'lr': 0.00042027219798436996, 'samples': 7815168, 'steps': 40703, 'loss/train': 1.6228009462356567} -11/07/2021 02:56:46 - INFO - __main__ - Step 40705: {'lr': 0.00042026831234338614, 'samples': 7815360, 'steps': 40704, 'loss/train': 1.6805357933044434} -11/07/2021 02:56:46 - INFO - __main__ - Step 40706: {'lr': 0.0004202644266256821, 'samples': 7815552, 'steps': 40705, 'loss/train': 1.679015874862671} -11/07/2021 02:56:47 - INFO - __main__ - Step 40707: {'lr': 0.00042026054083125943, 'samples': 7815744, 'steps': 40706, 'loss/train': 1.0983397960662842} -11/07/2021 02:56:48 - INFO - __main__ - Step 40708: {'lr': 0.0004202566549601201, 'samples': 7815936, 'steps': 40707, 'loss/train': 1.7401659488677979} -11/07/2021 02:56:48 - INFO - __main__ - Step 40709: {'lr': 0.00042025276901226573, 'samples': 7816128, 'steps': 40708, 'loss/train': 1.924376368522644} -11/07/2021 02:56:49 - INFO - __main__ - Step 40710: {'lr': 0.00042024888298769806, 'samples': 7816320, 'steps': 40709, 'loss/train': 1.6605688333511353} -11/07/2021 02:56:49 - INFO - __main__ - Step 40711: {'lr': 0.0004202449968864188, 'samples': 7816512, 'steps': 40710, 'loss/train': 2.121345043182373} -11/07/2021 02:56:49 - INFO - __main__ - Step 40712: {'lr': 0.00042024111070842985, 'samples': 7816704, 'steps': 40711, 'loss/train': 2.026416778564453} -11/07/2021 02:56:51 - INFO - __main__ - Step 40713: {'lr': 0.0004202372244537329, 'samples': 7816896, 'steps': 40712, 'loss/train': 0.983768105506897} -11/07/2021 02:56:51 - INFO - __main__ - Step 40714: {'lr': 0.00042023333812232967, 'samples': 7817088, 'steps': 40713, 'loss/train': 1.6620196104049683} -11/07/2021 02:56:51 - INFO - __main__ - Step 40715: {'lr': 0.0004202294517142219, 'samples': 7817280, 'steps': 40714, 'loss/train': 1.6445621252059937} -11/07/2021 02:56:52 - INFO - __main__ - Step 40716: {'lr': 0.0004202255652294114, 'samples': 7817472, 'steps': 40715, 'loss/train': 1.2422605752944946} -11/07/2021 02:56:52 - INFO - __main__ - Step 40717: {'lr': 0.00042022167866789985, 'samples': 7817664, 'steps': 40716, 'loss/train': 1.9124672412872314} -11/07/2021 02:56:52 - INFO - __main__ - Step 40718: {'lr': 0.00042021779202968903, 'samples': 7817856, 'steps': 40717, 'loss/train': 1.974969744682312} -11/07/2021 02:56:53 - INFO - __main__ - Step 40719: {'lr': 0.0004202139053147808, 'samples': 7818048, 'steps': 40718, 'loss/train': 1.6937755346298218} -11/07/2021 02:56:54 - INFO - __main__ - Step 40720: {'lr': 0.0004202100185231767, 'samples': 7818240, 'steps': 40719, 'loss/train': 1.5049687623977661} -11/07/2021 02:56:54 - INFO - __main__ - Step 40721: {'lr': 0.00042020613165487863, 'samples': 7818432, 'steps': 40720, 'loss/train': 1.3050556182861328} -11/07/2021 02:56:54 - INFO - __main__ - Step 40722: {'lr': 0.0004202022447098883, 'samples': 7818624, 'steps': 40721, 'loss/train': 1.4542369842529297} -11/07/2021 02:56:55 - INFO - __main__ - Step 40723: {'lr': 0.00042019835768820744, 'samples': 7818816, 'steps': 40722, 'loss/train': 1.6474261283874512} -11/07/2021 02:56:56 - INFO - __main__ - Step 40724: {'lr': 0.00042019447058983786, 'samples': 7819008, 'steps': 40723, 'loss/train': 1.053047776222229} -11/07/2021 02:56:56 - INFO - __main__ - Step 40725: {'lr': 0.0004201905834147813, 'samples': 7819200, 'steps': 40724, 'loss/train': 1.6326931715011597} -11/07/2021 02:56:56 - INFO - __main__ - Step 40726: {'lr': 0.0004201866961630395, 'samples': 7819392, 'steps': 40725, 'loss/train': 1.4784409999847412} -11/07/2021 02:56:57 - INFO - __main__ - Step 40727: {'lr': 0.00042018280883461415, 'samples': 7819584, 'steps': 40726, 'loss/train': 1.242191195487976} -11/07/2021 02:56:57 - INFO - __main__ - Step 40728: {'lr': 0.000420178921429507, 'samples': 7819776, 'steps': 40727, 'loss/train': 1.5088322162628174} -11/07/2021 02:56:58 - INFO - __main__ - Step 40729: {'lr': 0.00042017503394771997, 'samples': 7819968, 'steps': 40728, 'loss/train': 1.5620919466018677} -11/07/2021 02:56:59 - INFO - __main__ - Step 40730: {'lr': 0.00042017114638925456, 'samples': 7820160, 'steps': 40729, 'loss/train': 1.665900707244873} -11/07/2021 02:56:59 - INFO - __main__ - Step 40731: {'lr': 0.00042016725875411274, 'samples': 7820352, 'steps': 40730, 'loss/train': 2.2982349395751953} -11/07/2021 02:56:59 - INFO - __main__ - Step 40732: {'lr': 0.0004201633710422962, 'samples': 7820544, 'steps': 40731, 'loss/train': 1.4807544946670532} -11/07/2021 02:57:00 - INFO - __main__ - Step 40733: {'lr': 0.0004201594832538067, 'samples': 7820736, 'steps': 40732, 'loss/train': 1.611283540725708} -11/07/2021 02:57:01 - INFO - __main__ - Step 40734: {'lr': 0.0004201555953886459, 'samples': 7820928, 'steps': 40733, 'loss/train': 1.288476586341858} -11/07/2021 02:57:01 - INFO - __main__ - Step 40735: {'lr': 0.00042015170744681566, 'samples': 7821120, 'steps': 40734, 'loss/train': 1.8149077892303467} -11/07/2021 02:57:01 - INFO - __main__ - Step 40736: {'lr': 0.00042014781942831757, 'samples': 7821312, 'steps': 40735, 'loss/train': 1.7490525245666504} -11/07/2021 02:57:02 - INFO - __main__ - Step 40737: {'lr': 0.00042014393133315366, 'samples': 7821504, 'steps': 40736, 'loss/train': 1.5821160078048706} -11/07/2021 02:57:02 - INFO - __main__ - Step 40738: {'lr': 0.00042014004316132537, 'samples': 7821696, 'steps': 40737, 'loss/train': 1.7117501497268677} -11/07/2021 02:57:03 - INFO - __main__ - Step 40739: {'lr': 0.0004201361549128347, 'samples': 7821888, 'steps': 40738, 'loss/train': 1.4417829513549805} -11/07/2021 02:57:03 - INFO - __main__ - Step 40740: {'lr': 0.00042013226658768333, 'samples': 7822080, 'steps': 40739, 'loss/train': 2.1850247383117676} -11/07/2021 02:57:04 - INFO - __main__ - Step 40741: {'lr': 0.0004201283781858729, 'samples': 7822272, 'steps': 40740, 'loss/train': 1.318172574043274} -11/07/2021 02:57:04 - INFO - __main__ - Step 40742: {'lr': 0.00042012448970740523, 'samples': 7822464, 'steps': 40741, 'loss/train': 1.9657243490219116} -11/07/2021 02:57:04 - INFO - __main__ - Step 40743: {'lr': 0.00042012060115228215, 'samples': 7822656, 'steps': 40742, 'loss/train': 1.322919487953186} -11/07/2021 02:57:05 - INFO - __main__ - Step 40744: {'lr': 0.0004201167125205054, 'samples': 7822848, 'steps': 40743, 'loss/train': 0.939601719379425} -11/07/2021 02:57:06 - INFO - __main__ - Step 40745: {'lr': 0.0004201128238120766, 'samples': 7823040, 'steps': 40744, 'loss/train': 1.352439045906067} -11/07/2021 02:57:06 - INFO - __main__ - Step 40746: {'lr': 0.00042010893502699765, 'samples': 7823232, 'steps': 40745, 'loss/train': 1.2596780061721802} -11/07/2021 02:57:07 - INFO - __main__ - Step 40747: {'lr': 0.0004201050461652702, 'samples': 7823424, 'steps': 40746, 'loss/train': 1.5559792518615723} -11/07/2021 02:57:07 - INFO - __main__ - Step 40748: {'lr': 0.00042010115722689603, 'samples': 7823616, 'steps': 40747, 'loss/train': 1.4758732318878174} -11/07/2021 02:57:08 - INFO - __main__ - Step 40749: {'lr': 0.0004200972682118769, 'samples': 7823808, 'steps': 40748, 'loss/train': 1.8409411907196045} -11/07/2021 02:57:08 - INFO - __main__ - Step 40750: {'lr': 0.0004200933791202146, 'samples': 7824000, 'steps': 40749, 'loss/train': 1.5887305736541748} -11/07/2021 02:57:09 - INFO - __main__ - Step 40751: {'lr': 0.0004200894899519108, 'samples': 7824192, 'steps': 40750, 'loss/train': 1.5835992097854614} -11/07/2021 02:57:09 - INFO - __main__ - Step 40752: {'lr': 0.00042008560070696735, 'samples': 7824384, 'steps': 40751, 'loss/train': 0.8489807844161987} -11/07/2021 02:57:09 - INFO - __main__ - Step 40753: {'lr': 0.000420081711385386, 'samples': 7824576, 'steps': 40752, 'loss/train': 1.7906991243362427} -11/07/2021 02:57:10 - INFO - __main__ - Step 40754: {'lr': 0.00042007782198716836, 'samples': 7824768, 'steps': 40753, 'loss/train': 2.3305821418762207} -11/07/2021 02:57:11 - INFO - __main__ - Step 40755: {'lr': 0.0004200739325123163, 'samples': 7824960, 'steps': 40754, 'loss/train': 1.161139965057373} -11/07/2021 02:57:11 - INFO - __main__ - Step 40756: {'lr': 0.0004200700429608315, 'samples': 7825152, 'steps': 40755, 'loss/train': 1.5971800088882446} -11/07/2021 02:57:11 - INFO - __main__ - Step 40757: {'lr': 0.00042006615333271585, 'samples': 7825344, 'steps': 40756, 'loss/train': 1.609025478363037} -11/07/2021 02:57:12 - INFO - __main__ - Step 40758: {'lr': 0.000420062263627971, 'samples': 7825536, 'steps': 40757, 'loss/train': 1.4358506202697754} -11/07/2021 02:57:12 - INFO - __main__ - Step 40759: {'lr': 0.0004200583738465987, 'samples': 7825728, 'steps': 40758, 'loss/train': 1.945847511291504} -11/07/2021 02:57:13 - INFO - __main__ - Step 40760: {'lr': 0.00042005448398860077, 'samples': 7825920, 'steps': 40759, 'loss/train': 1.662986159324646} -11/07/2021 02:57:13 - INFO - __main__ - Step 40761: {'lr': 0.00042005059405397885, 'samples': 7826112, 'steps': 40760, 'loss/train': 1.3383136987686157} -11/07/2021 02:57:14 - INFO - __main__ - Step 40762: {'lr': 0.00042004670404273474, 'samples': 7826304, 'steps': 40761, 'loss/train': 1.7181071043014526} -11/07/2021 02:57:14 - INFO - __main__ - Step 40763: {'lr': 0.0004200428139548703, 'samples': 7826496, 'steps': 40762, 'loss/train': 0.7669545412063599} -11/07/2021 02:57:14 - INFO - __main__ - Step 40764: {'lr': 0.0004200389237903871, 'samples': 7826688, 'steps': 40763, 'loss/train': 1.6772427558898926} -11/07/2021 02:57:16 - INFO - __main__ - Step 40765: {'lr': 0.000420035033549287, 'samples': 7826880, 'steps': 40764, 'loss/train': 1.4819986820220947} -11/07/2021 02:57:16 - INFO - __main__ - Step 40766: {'lr': 0.0004200311432315718, 'samples': 7827072, 'steps': 40765, 'loss/train': 1.9922943115234375} -11/07/2021 02:57:16 - INFO - __main__ - Step 40767: {'lr': 0.0004200272528372432, 'samples': 7827264, 'steps': 40766, 'loss/train': 1.4818094968795776} -11/07/2021 02:57:17 - INFO - __main__ - Step 40768: {'lr': 0.0004200233623663028, 'samples': 7827456, 'steps': 40767, 'loss/train': 1.082582712173462} -11/07/2021 02:57:17 - INFO - __main__ - Step 40769: {'lr': 0.0004200194718187527, 'samples': 7827648, 'steps': 40768, 'loss/train': 1.1773542165756226} -11/07/2021 02:57:18 - INFO - __main__ - Step 40770: {'lr': 0.0004200155811945943, 'samples': 7827840, 'steps': 40769, 'loss/train': 1.2706178426742554} -11/07/2021 02:57:18 - INFO - __main__ - Step 40771: {'lr': 0.0004200116904938295, 'samples': 7828032, 'steps': 40770, 'loss/train': 1.697472095489502} -11/07/2021 02:57:19 - INFO - __main__ - Step 40772: {'lr': 0.00042000779971646007, 'samples': 7828224, 'steps': 40771, 'loss/train': 1.7203675508499146} -11/07/2021 02:57:19 - INFO - __main__ - Step 40773: {'lr': 0.00042000390886248783, 'samples': 7828416, 'steps': 40772, 'loss/train': 5.857418537139893} -11/07/2021 02:57:19 - INFO - __main__ - Step 40774: {'lr': 0.0004200000179319144, 'samples': 7828608, 'steps': 40773, 'loss/train': 1.426015019416809} -11/07/2021 02:57:20 - INFO - __main__ - Step 40775: {'lr': 0.0004199961269247416, 'samples': 7828800, 'steps': 40774, 'loss/train': 1.3574186563491821} -11/07/2021 02:57:21 - INFO - __main__ - Step 40776: {'lr': 0.0004199922358409711, 'samples': 7828992, 'steps': 40775, 'loss/train': 1.6170494556427002} -11/07/2021 02:57:21 - INFO - __main__ - Step 40777: {'lr': 0.0004199883446806048, 'samples': 7829184, 'steps': 40776, 'loss/train': 1.7628307342529297} -11/07/2021 02:57:21 - INFO - __main__ - Step 40778: {'lr': 0.0004199844534436443, 'samples': 7829376, 'steps': 40777, 'loss/train': 2.341153621673584} -11/07/2021 02:57:22 - INFO - __main__ - Step 40779: {'lr': 0.0004199805621300915, 'samples': 7829568, 'steps': 40778, 'loss/train': 1.5946757793426514} -11/07/2021 02:57:23 - INFO - __main__ - Step 40780: {'lr': 0.0004199766707399481, 'samples': 7829760, 'steps': 40779, 'loss/train': 1.1053686141967773} -11/07/2021 02:57:23 - INFO - __main__ - Step 40781: {'lr': 0.0004199727792732158, 'samples': 7829952, 'steps': 40780, 'loss/train': 0.9021766185760498} -11/07/2021 02:57:23 - INFO - __main__ - Step 40782: {'lr': 0.0004199688877298964, 'samples': 7830144, 'steps': 40781, 'loss/train': 1.256246566772461} -11/07/2021 02:57:24 - INFO - __main__ - Step 40783: {'lr': 0.00041996499610999163, 'samples': 7830336, 'steps': 40782, 'loss/train': 1.5676124095916748} -11/07/2021 02:57:24 - INFO - __main__ - Step 40784: {'lr': 0.00041996110441350323, 'samples': 7830528, 'steps': 40783, 'loss/train': 1.7661354541778564} -11/07/2021 02:57:25 - INFO - __main__ - Step 40785: {'lr': 0.000419957212640433, 'samples': 7830720, 'steps': 40784, 'loss/train': 1.8322479724884033} -11/07/2021 02:57:25 - INFO - __main__ - Step 40786: {'lr': 0.0004199533207907827, 'samples': 7830912, 'steps': 40785, 'loss/train': 1.3264210224151611} -11/07/2021 02:57:26 - INFO - __main__ - Step 40787: {'lr': 0.00041994942886455403, 'samples': 7831104, 'steps': 40786, 'loss/train': 1.4569522142410278} -11/07/2021 02:57:26 - INFO - __main__ - Step 40788: {'lr': 0.00041994553686174876, 'samples': 7831296, 'steps': 40787, 'loss/train': 1.7506399154663086} -11/07/2021 02:57:27 - INFO - __main__ - Step 40789: {'lr': 0.0004199416447823686, 'samples': 7831488, 'steps': 40788, 'loss/train': 1.4973564147949219} -11/07/2021 02:57:28 - INFO - __main__ - Step 40790: {'lr': 0.0004199377526264154, 'samples': 7831680, 'steps': 40789, 'loss/train': 1.3136669397354126} -11/07/2021 02:57:28 - INFO - __main__ - Step 40791: {'lr': 0.00041993386039389095, 'samples': 7831872, 'steps': 40790, 'loss/train': 2.1212332248687744} -11/07/2021 02:57:28 - INFO - __main__ - Step 40792: {'lr': 0.0004199299680847969, 'samples': 7832064, 'steps': 40791, 'loss/train': 0.9397590756416321} -11/07/2021 02:57:29 - INFO - __main__ - Step 40793: {'lr': 0.000419926075699135, 'samples': 7832256, 'steps': 40792, 'loss/train': 1.2800946235656738} -11/07/2021 02:57:29 - INFO - __main__ - Step 40794: {'lr': 0.000419922183236907, 'samples': 7832448, 'steps': 40793, 'loss/train': 1.0686975717544556} -11/07/2021 02:57:30 - INFO - __main__ - Step 40795: {'lr': 0.0004199182906981147, 'samples': 7832640, 'steps': 40794, 'loss/train': 1.7454752922058105} -11/07/2021 02:57:31 - INFO - __main__ - Step 40796: {'lr': 0.00041991439808275986, 'samples': 7832832, 'steps': 40795, 'loss/train': 0.7209337949752808} -11/07/2021 02:57:31 - INFO - __main__ - Step 40797: {'lr': 0.0004199105053908442, 'samples': 7833024, 'steps': 40796, 'loss/train': 1.42599618434906} -11/07/2021 02:57:31 - INFO - __main__ - Step 40798: {'lr': 0.0004199066126223695, 'samples': 7833216, 'steps': 40797, 'loss/train': 1.8595082759857178} -11/07/2021 02:57:32 - INFO - __main__ - Step 40799: {'lr': 0.0004199027197773375, 'samples': 7833408, 'steps': 40798, 'loss/train': 2.1304287910461426} -11/07/2021 02:57:32 - INFO - __main__ - Step 40800: {'lr': 0.00041989882685575, 'samples': 7833600, 'steps': 40799, 'loss/train': 1.2476295232772827} -11/07/2021 02:57:33 - INFO - __main__ - Step 40801: {'lr': 0.0004198949338576086, 'samples': 7833792, 'steps': 40800, 'loss/train': 1.1822339296340942} -11/07/2021 02:57:34 - INFO - __main__ - Step 40802: {'lr': 0.0004198910407829152, 'samples': 7833984, 'steps': 40801, 'loss/train': 1.404305100440979} -11/07/2021 02:57:34 - INFO - __main__ - Step 40803: {'lr': 0.00041988714763167156, 'samples': 7834176, 'steps': 40802, 'loss/train': 1.536059021949768} -11/07/2021 02:57:34 - INFO - __main__ - Step 40804: {'lr': 0.00041988325440387944, 'samples': 7834368, 'steps': 40803, 'loss/train': 1.5439774990081787} -11/07/2021 02:57:35 - INFO - __main__ - Step 40805: {'lr': 0.00041987936109954047, 'samples': 7834560, 'steps': 40804, 'loss/train': 1.814212441444397} -11/07/2021 02:57:36 - INFO - __main__ - Step 40806: {'lr': 0.0004198754677186565, 'samples': 7834752, 'steps': 40805, 'loss/train': 1.5161305665969849} -11/07/2021 02:57:36 - INFO - __main__ - Step 40807: {'lr': 0.0004198715742612292, 'samples': 7834944, 'steps': 40806, 'loss/train': 1.632473111152649} -11/07/2021 02:57:36 - INFO - __main__ - Step 40808: {'lr': 0.0004198676807272605, 'samples': 7835136, 'steps': 40807, 'loss/train': 1.0738561153411865} -11/07/2021 02:57:37 - INFO - __main__ - Step 40809: {'lr': 0.000419863787116752, 'samples': 7835328, 'steps': 40808, 'loss/train': 1.2711148262023926} -11/07/2021 02:57:37 - INFO - __main__ - Step 40810: {'lr': 0.0004198598934297055, 'samples': 7835520, 'steps': 40809, 'loss/train': 1.3566529750823975} -11/07/2021 02:57:37 - INFO - __main__ - Step 40811: {'lr': 0.00041985599966612273, 'samples': 7835712, 'steps': 40810, 'loss/train': 1.2638170719146729} -11/07/2021 02:57:39 - INFO - __main__ - Step 40812: {'lr': 0.0004198521058260055, 'samples': 7835904, 'steps': 40811, 'loss/train': 0.5754212141036987} -11/07/2021 02:57:39 - INFO - __main__ - Step 40813: {'lr': 0.0004198482119093555, 'samples': 7836096, 'steps': 40812, 'loss/train': 1.6761367321014404} -11/07/2021 02:57:40 - INFO - __main__ - Step 40814: {'lr': 0.00041984431791617456, 'samples': 7836288, 'steps': 40813, 'loss/train': 2.0934343338012695} -11/07/2021 02:57:40 - INFO - __main__ - Step 40815: {'lr': 0.0004198404238464644, 'samples': 7836480, 'steps': 40814, 'loss/train': 2.344271183013916} -11/07/2021 02:57:40 - INFO - __main__ - Step 40816: {'lr': 0.0004198365297002267, 'samples': 7836672, 'steps': 40815, 'loss/train': 1.3367879390716553} -11/07/2021 02:57:41 - INFO - __main__ - Step 40817: {'lr': 0.0004198326354774633, 'samples': 7836864, 'steps': 40816, 'loss/train': 2.2786648273468018} -11/07/2021 02:57:42 - INFO - __main__ - Step 40818: {'lr': 0.00041982874117817593, 'samples': 7837056, 'steps': 40817, 'loss/train': 1.5131193399429321} -11/07/2021 02:57:42 - INFO - __main__ - Step 40819: {'lr': 0.00041982484680236636, 'samples': 7837248, 'steps': 40818, 'loss/train': 1.1675461530685425} -11/07/2021 02:57:42 - INFO - __main__ - Step 40820: {'lr': 0.00041982095235003634, 'samples': 7837440, 'steps': 40819, 'loss/train': 1.5366125106811523} -11/07/2021 02:57:43 - INFO - __main__ - Step 40821: {'lr': 0.0004198170578211877, 'samples': 7837632, 'steps': 40820, 'loss/train': 1.6404383182525635} -11/07/2021 02:57:43 - INFO - __main__ - Step 40822: {'lr': 0.000419813163215822, 'samples': 7837824, 'steps': 40821, 'loss/train': 1.3809610605239868} -11/07/2021 02:57:44 - INFO - __main__ - Step 40823: {'lr': 0.0004198092685339411, 'samples': 7838016, 'steps': 40822, 'loss/train': 1.6485894918441772} -11/07/2021 02:57:45 - INFO - __main__ - Step 40824: {'lr': 0.00041980537377554685, 'samples': 7838208, 'steps': 40823, 'loss/train': 1.9748244285583496} -11/07/2021 02:57:45 - INFO - __main__ - Step 40825: {'lr': 0.00041980147894064086, 'samples': 7838400, 'steps': 40824, 'loss/train': 1.0561368465423584} -11/07/2021 02:57:45 - INFO - __main__ - Step 40826: {'lr': 0.00041979758402922496, 'samples': 7838592, 'steps': 40825, 'loss/train': 1.2652628421783447} -11/07/2021 02:57:46 - INFO - __main__ - Step 40827: {'lr': 0.00041979368904130086, 'samples': 7838784, 'steps': 40826, 'loss/train': 1.6909739971160889} -11/07/2021 02:57:47 - INFO - __main__ - Step 40828: {'lr': 0.00041978979397687047, 'samples': 7838976, 'steps': 40827, 'loss/train': 1.191987156867981} -11/07/2021 02:57:47 - INFO - __main__ - Step 40829: {'lr': 0.00041978589883593525, 'samples': 7839168, 'steps': 40828, 'loss/train': 1.1689318418502808} -11/07/2021 02:57:47 - INFO - __main__ - Step 40830: {'lr': 0.0004197820036184972, 'samples': 7839360, 'steps': 40829, 'loss/train': 1.3950546979904175} -11/07/2021 02:57:48 - INFO - __main__ - Step 40831: {'lr': 0.000419778108324558, 'samples': 7839552, 'steps': 40830, 'loss/train': 1.4193148612976074} -11/07/2021 02:57:48 - INFO - __main__ - Step 40832: {'lr': 0.00041977421295411944, 'samples': 7839744, 'steps': 40831, 'loss/train': 1.3167130947113037} -11/07/2021 02:57:49 - INFO - __main__ - Step 40833: {'lr': 0.00041977031750718317, 'samples': 7839936, 'steps': 40832, 'loss/train': 1.5753673315048218} -11/07/2021 02:57:50 - INFO - __main__ - Step 40834: {'lr': 0.000419766421983751, 'samples': 7840128, 'steps': 40833, 'loss/train': 1.5279433727264404} -11/07/2021 02:57:50 - INFO - __main__ - Step 40835: {'lr': 0.00041976252638382483, 'samples': 7840320, 'steps': 40834, 'loss/train': 0.5898969173431396} -11/07/2021 02:57:50 - INFO - __main__ - Step 40836: {'lr': 0.00041975863070740617, 'samples': 7840512, 'steps': 40835, 'loss/train': 1.344542145729065} -11/07/2021 02:57:51 - INFO - __main__ - Step 40837: {'lr': 0.0004197547349544969, 'samples': 7840704, 'steps': 40836, 'loss/train': 0.8119551539421082} -11/07/2021 02:57:52 - INFO - __main__ - Step 40838: {'lr': 0.0004197508391250988, 'samples': 7840896, 'steps': 40837, 'loss/train': 1.9184430837631226} -11/07/2021 02:57:52 - INFO - __main__ - Step 40839: {'lr': 0.0004197469432192136, 'samples': 7841088, 'steps': 40838, 'loss/train': 1.3354907035827637} -11/07/2021 02:57:53 - INFO - __main__ - Step 40840: {'lr': 0.000419743047236843, 'samples': 7841280, 'steps': 40839, 'loss/train': 1.261608600616455} -11/07/2021 02:57:53 - INFO - __main__ - Step 40841: {'lr': 0.00041973915117798883, 'samples': 7841472, 'steps': 40840, 'loss/train': 1.2910435199737549} -11/07/2021 02:57:53 - INFO - __main__ - Step 40842: {'lr': 0.0004197352550426528, 'samples': 7841664, 'steps': 40841, 'loss/train': 1.584807276725769} -11/07/2021 02:57:54 - INFO - __main__ - Step 40843: {'lr': 0.0004197313588308367, 'samples': 7841856, 'steps': 40842, 'loss/train': 1.3579699993133545} -11/07/2021 02:57:55 - INFO - __main__ - Step 40844: {'lr': 0.0004197274625425423, 'samples': 7842048, 'steps': 40843, 'loss/train': 1.606826663017273} -11/07/2021 02:57:55 - INFO - __main__ - Step 40845: {'lr': 0.0004197235661777713, 'samples': 7842240, 'steps': 40844, 'loss/train': 1.7265325784683228} -11/07/2021 02:57:55 - INFO - __main__ - Step 40846: {'lr': 0.00041971966973652545, 'samples': 7842432, 'steps': 40845, 'loss/train': 1.2680137157440186} -11/07/2021 02:57:56 - INFO - __main__ - Step 40847: {'lr': 0.00041971577321880656, 'samples': 7842624, 'steps': 40846, 'loss/train': 1.2878777980804443} -11/07/2021 02:57:56 - INFO - __main__ - Step 40848: {'lr': 0.00041971187662461634, 'samples': 7842816, 'steps': 40847, 'loss/train': 1.6605842113494873} -11/07/2021 02:57:57 - INFO - __main__ - Step 40849: {'lr': 0.0004197079799539566, 'samples': 7843008, 'steps': 40848, 'loss/train': 1.651978611946106} -11/07/2021 02:57:57 - INFO - __main__ - Step 40850: {'lr': 0.0004197040832068291, 'samples': 7843200, 'steps': 40849, 'loss/train': 1.6321369409561157} -11/07/2021 02:57:58 - INFO - __main__ - Step 40851: {'lr': 0.00041970018638323546, 'samples': 7843392, 'steps': 40850, 'loss/train': 1.5288792848587036} -11/07/2021 02:57:58 - INFO - __main__ - Step 40852: {'lr': 0.00041969628948317756, 'samples': 7843584, 'steps': 40851, 'loss/train': 1.5668535232543945} -11/07/2021 02:57:58 - INFO - __main__ - Step 40853: {'lr': 0.00041969239250665716, 'samples': 7843776, 'steps': 40852, 'loss/train': 1.402988076210022} -11/07/2021 02:57:59 - INFO - __main__ - Step 40854: {'lr': 0.000419688495453676, 'samples': 7843968, 'steps': 40853, 'loss/train': 1.280922293663025} -11/07/2021 02:58:00 - INFO - __main__ - Step 40855: {'lr': 0.0004196845983242358, 'samples': 7844160, 'steps': 40854, 'loss/train': 1.6631810665130615} -11/07/2021 02:58:00 - INFO - __main__ - Step 40856: {'lr': 0.0004196807011183383, 'samples': 7844352, 'steps': 40855, 'loss/train': 1.41666841506958} -11/07/2021 02:58:00 - INFO - __main__ - Step 40857: {'lr': 0.00041967680383598536, 'samples': 7844544, 'steps': 40856, 'loss/train': 1.7356514930725098} -11/07/2021 02:58:01 - INFO - __main__ - Step 40858: {'lr': 0.00041967290647717864, 'samples': 7844736, 'steps': 40857, 'loss/train': 1.4704985618591309} -11/07/2021 02:58:02 - INFO - __main__ - Step 40859: {'lr': 0.00041966900904191995, 'samples': 7844928, 'steps': 40858, 'loss/train': 1.802902102470398} -11/07/2021 02:58:02 - INFO - __main__ - Step 40860: {'lr': 0.000419665111530211, 'samples': 7845120, 'steps': 40859, 'loss/train': 1.9410536289215088} -11/07/2021 02:58:03 - INFO - __main__ - Step 40861: {'lr': 0.00041966121394205357, 'samples': 7845312, 'steps': 40860, 'loss/train': 1.276798963546753} -11/07/2021 02:58:03 - INFO - __main__ - Step 40862: {'lr': 0.0004196573162774494, 'samples': 7845504, 'steps': 40861, 'loss/train': 0.9696474671363831} -11/07/2021 02:58:03 - INFO - __main__ - Step 40863: {'lr': 0.0004196534185364003, 'samples': 7845696, 'steps': 40862, 'loss/train': 0.7720293998718262} -11/07/2021 02:58:04 - INFO - __main__ - Step 40864: {'lr': 0.00041964952071890795, 'samples': 7845888, 'steps': 40863, 'loss/train': 1.7502236366271973} -11/07/2021 02:58:05 - INFO - __main__ - Step 40865: {'lr': 0.00041964562282497417, 'samples': 7846080, 'steps': 40864, 'loss/train': 1.2578016519546509} -11/07/2021 02:58:05 - INFO - __main__ - Step 40866: {'lr': 0.0004196417248546006, 'samples': 7846272, 'steps': 40865, 'loss/train': 1.572597622871399} -11/07/2021 02:58:05 - INFO - __main__ - Step 40867: {'lr': 0.0004196378268077893, 'samples': 7846464, 'steps': 40866, 'loss/train': 1.2670254707336426} -11/07/2021 02:58:06 - INFO - __main__ - Step 40868: {'lr': 0.00041963392868454163, 'samples': 7846656, 'steps': 40867, 'loss/train': 1.4458591938018799} -11/07/2021 02:58:06 - INFO - __main__ - Step 40869: {'lr': 0.0004196300304848596, 'samples': 7846848, 'steps': 40868, 'loss/train': 1.4543291330337524} -11/07/2021 02:58:07 - INFO - __main__ - Step 40870: {'lr': 0.00041962613220874486, 'samples': 7847040, 'steps': 40869, 'loss/train': 1.6573225259780884} -11/07/2021 02:58:07 - INFO - __main__ - Step 40871: {'lr': 0.0004196222338561992, 'samples': 7847232, 'steps': 40870, 'loss/train': 1.441749930381775} -11/07/2021 02:58:08 - INFO - __main__ - Step 40872: {'lr': 0.0004196183354272244, 'samples': 7847424, 'steps': 40871, 'loss/train': 1.2333451509475708} -11/07/2021 02:58:08 - INFO - __main__ - Step 40873: {'lr': 0.00041961443692182214, 'samples': 7847616, 'steps': 40872, 'loss/train': 1.369896411895752} -11/07/2021 02:58:08 - INFO - __main__ - Step 40874: {'lr': 0.00041961053833999433, 'samples': 7847808, 'steps': 40873, 'loss/train': 1.374863624572754} -11/07/2021 02:58:10 - INFO - __main__ - Step 40875: {'lr': 0.00041960663968174263, 'samples': 7848000, 'steps': 40874, 'loss/train': 1.2193489074707031} -11/07/2021 02:58:10 - INFO - __main__ - Step 40876: {'lr': 0.0004196027409470687, 'samples': 7848192, 'steps': 40875, 'loss/train': 1.4365462064743042} -11/07/2021 02:58:10 - INFO - __main__ - Step 40877: {'lr': 0.00041959884213597443, 'samples': 7848384, 'steps': 40876, 'loss/train': 1.5156211853027344} -11/07/2021 02:58:11 - INFO - __main__ - Step 40878: {'lr': 0.0004195949432484615, 'samples': 7848576, 'steps': 40877, 'loss/train': 1.7335604429244995} -11/07/2021 02:58:11 - INFO - __main__ - Step 40879: {'lr': 0.00041959104428453175, 'samples': 7848768, 'steps': 40878, 'loss/train': 1.2749711275100708} -11/07/2021 02:58:12 - INFO - __main__ - Step 40880: {'lr': 0.000419587145244187, 'samples': 7848960, 'steps': 40879, 'loss/train': 0.626573920249939} -11/07/2021 02:58:12 - INFO - __main__ - Step 40881: {'lr': 0.0004195832461274288, 'samples': 7849152, 'steps': 40880, 'loss/train': 0.25203990936279297} -11/07/2021 02:58:13 - INFO - __main__ - Step 40882: {'lr': 0.00041957934693425894, 'samples': 7849344, 'steps': 40881, 'loss/train': 1.595252513885498} -11/07/2021 02:58:13 - INFO - __main__ - Step 40883: {'lr': 0.0004195754476646793, 'samples': 7849536, 'steps': 40882, 'loss/train': 1.359736442565918} -11/07/2021 02:58:13 - INFO - __main__ - Step 40884: {'lr': 0.0004195715483186916, 'samples': 7849728, 'steps': 40883, 'loss/train': 1.6086974143981934} -11/07/2021 02:58:15 - INFO - __main__ - Step 40885: {'lr': 0.00041956764889629756, 'samples': 7849920, 'steps': 40884, 'loss/train': 1.9066940546035767} -11/07/2021 02:58:15 - INFO - __main__ - Step 40886: {'lr': 0.000419563749397499, 'samples': 7850112, 'steps': 40885, 'loss/train': 1.6675184965133667} -11/07/2021 02:58:15 - INFO - __main__ - Step 40887: {'lr': 0.00041955984982229756, 'samples': 7850304, 'steps': 40886, 'loss/train': 1.6105003356933594} -11/07/2021 02:58:16 - INFO - __main__ - Step 40888: {'lr': 0.0004195559501706951, 'samples': 7850496, 'steps': 40887, 'loss/train': 1.023625373840332} -11/07/2021 02:58:16 - INFO - __main__ - Step 40889: {'lr': 0.0004195520504426933, 'samples': 7850688, 'steps': 40888, 'loss/train': 1.644714593887329} -11/07/2021 02:58:17 - INFO - __main__ - Step 40890: {'lr': 0.000419548150638294, 'samples': 7850880, 'steps': 40889, 'loss/train': 1.4619386196136475} -11/07/2021 02:58:17 - INFO - __main__ - Step 40891: {'lr': 0.0004195442507574989, 'samples': 7851072, 'steps': 40890, 'loss/train': 1.5527533292770386} -11/07/2021 02:58:18 - INFO - __main__ - Step 40892: {'lr': 0.00041954035080030985, 'samples': 7851264, 'steps': 40891, 'loss/train': 1.0924385786056519} -11/07/2021 02:58:18 - INFO - __main__ - Step 40893: {'lr': 0.0004195364507667284, 'samples': 7851456, 'steps': 40892, 'loss/train': 1.4693257808685303} -11/07/2021 02:58:18 - INFO - __main__ - Step 40894: {'lr': 0.0004195325506567566, 'samples': 7851648, 'steps': 40893, 'loss/train': 1.937795877456665} -11/07/2021 02:58:19 - INFO - __main__ - Step 40895: {'lr': 0.00041952865047039604, 'samples': 7851840, 'steps': 40894, 'loss/train': 1.859720230102539} -11/07/2021 02:58:20 - INFO - __main__ - Step 40896: {'lr': 0.00041952475020764834, 'samples': 7852032, 'steps': 40895, 'loss/train': 1.1508278846740723} -11/07/2021 02:58:20 - INFO - __main__ - Step 40897: {'lr': 0.00041952084986851546, 'samples': 7852224, 'steps': 40896, 'loss/train': 1.3395731449127197} -11/07/2021 02:58:21 - INFO - __main__ - Step 40898: {'lr': 0.0004195169494529991, 'samples': 7852416, 'steps': 40897, 'loss/train': 5.83343505859375} -11/07/2021 02:58:21 - INFO - __main__ - Step 40899: {'lr': 0.0004195130489611011, 'samples': 7852608, 'steps': 40898, 'loss/train': 0.18828418850898743} -11/07/2021 02:58:21 - INFO - __main__ - Step 40900: {'lr': 0.0004195091483928231, 'samples': 7852800, 'steps': 40899, 'loss/train': 1.6984916925430298} -11/07/2021 02:58:22 - INFO - __main__ - Step 40901: {'lr': 0.0004195052477481669, 'samples': 7852992, 'steps': 40900, 'loss/train': 1.210571527481079} -11/07/2021 02:58:23 - INFO - __main__ - Step 40902: {'lr': 0.00041950134702713415, 'samples': 7853184, 'steps': 40901, 'loss/train': 1.6256788969039917} -11/07/2021 02:58:23 - INFO - __main__ - Step 40903: {'lr': 0.0004194974462297268, 'samples': 7853376, 'steps': 40902, 'loss/train': 0.6730626821517944} -11/07/2021 02:58:23 - INFO - __main__ - Step 40904: {'lr': 0.00041949354535594655, 'samples': 7853568, 'steps': 40903, 'loss/train': 1.4739363193511963} -11/07/2021 02:58:24 - INFO - __main__ - Step 40905: {'lr': 0.000419489644405795, 'samples': 7853760, 'steps': 40904, 'loss/train': 1.771188497543335} -11/07/2021 02:58:24 - INFO - __main__ - Step 40906: {'lr': 0.00041948574337927414, 'samples': 7853952, 'steps': 40905, 'loss/train': 1.63949453830719} -11/07/2021 02:58:25 - INFO - __main__ - Step 40907: {'lr': 0.0004194818422763856, 'samples': 7854144, 'steps': 40906, 'loss/train': 1.6062594652175903} -11/07/2021 02:58:26 - INFO - __main__ - Step 40908: {'lr': 0.00041947794109713113, 'samples': 7854336, 'steps': 40907, 'loss/train': 1.2813870906829834} -11/07/2021 02:58:26 - INFO - __main__ - Step 40909: {'lr': 0.0004194740398415125, 'samples': 7854528, 'steps': 40908, 'loss/train': 1.4221503734588623} -11/07/2021 02:58:26 - INFO - __main__ - Step 40910: {'lr': 0.00041947013850953156, 'samples': 7854720, 'steps': 40909, 'loss/train': 2.0788793563842773} -11/07/2021 02:58:27 - INFO - __main__ - Step 40911: {'lr': 0.00041946623710118993, 'samples': 7854912, 'steps': 40910, 'loss/train': 1.5028927326202393} -11/07/2021 02:58:28 - INFO - __main__ - Step 40912: {'lr': 0.0004194623356164894, 'samples': 7855104, 'steps': 40911, 'loss/train': 1.2865480184555054} -11/07/2021 02:58:28 - INFO - __main__ - Step 40913: {'lr': 0.0004194584340554318, 'samples': 7855296, 'steps': 40912, 'loss/train': 1.4281774759292603} -11/07/2021 02:58:28 - INFO - __main__ - Step 40914: {'lr': 0.0004194545324180188, 'samples': 7855488, 'steps': 40913, 'loss/train': 1.617722511291504} -11/07/2021 02:58:29 - INFO - __main__ - Step 40915: {'lr': 0.00041945063070425226, 'samples': 7855680, 'steps': 40914, 'loss/train': 1.6741904020309448} -11/07/2021 02:58:29 - INFO - __main__ - Step 40916: {'lr': 0.0004194467289141339, 'samples': 7855872, 'steps': 40915, 'loss/train': 0.865330696105957} -11/07/2021 02:58:30 - INFO - __main__ - Step 40917: {'lr': 0.00041944282704766534, 'samples': 7856064, 'steps': 40916, 'loss/train': 1.5894625186920166} -11/07/2021 02:58:31 - INFO - __main__ - Step 40918: {'lr': 0.0004194389251048486, 'samples': 7856256, 'steps': 40917, 'loss/train': 1.3960907459259033} -11/07/2021 02:58:31 - INFO - __main__ - Step 40919: {'lr': 0.00041943502308568523, 'samples': 7856448, 'steps': 40918, 'loss/train': 1.5175076723098755} -11/07/2021 02:58:31 - INFO - __main__ - Step 40920: {'lr': 0.000419431120990177, 'samples': 7856640, 'steps': 40919, 'loss/train': 1.536737084388733} -11/07/2021 02:58:32 - INFO - __main__ - Step 40921: {'lr': 0.0004194272188183258, 'samples': 7856832, 'steps': 40920, 'loss/train': 1.4177848100662231} -11/07/2021 02:58:33 - INFO - __main__ - Step 40922: {'lr': 0.0004194233165701333, 'samples': 7857024, 'steps': 40921, 'loss/train': 1.6465486288070679} -11/07/2021 02:58:33 - INFO - __main__ - Step 40923: {'lr': 0.0004194194142456013, 'samples': 7857216, 'steps': 40922, 'loss/train': 1.512831211090088} -11/07/2021 02:58:33 - INFO - __main__ - Step 40924: {'lr': 0.00041941551184473144, 'samples': 7857408, 'steps': 40923, 'loss/train': 1.766401767730713} -11/07/2021 02:58:34 - INFO - __main__ - Step 40925: {'lr': 0.0004194116093675256, 'samples': 7857600, 'steps': 40924, 'loss/train': 1.5521842241287231} -11/07/2021 02:58:34 - INFO - __main__ - Step 40926: {'lr': 0.0004194077068139855, 'samples': 7857792, 'steps': 40925, 'loss/train': 1.638545036315918} -11/07/2021 02:58:35 - INFO - __main__ - Step 40927: {'lr': 0.00041940380418411296, 'samples': 7857984, 'steps': 40926, 'loss/train': 1.4787472486495972} -11/07/2021 02:58:35 - INFO - __main__ - Step 40928: {'lr': 0.00041939990147790956, 'samples': 7858176, 'steps': 40927, 'loss/train': 1.639092206954956} -11/07/2021 02:58:36 - INFO - __main__ - Step 40929: {'lr': 0.00041939599869537724, 'samples': 7858368, 'steps': 40928, 'loss/train': 1.7011237144470215} -11/07/2021 02:58:36 - INFO - __main__ - Step 40930: {'lr': 0.00041939209583651774, 'samples': 7858560, 'steps': 40929, 'loss/train': 1.7363842725753784} -11/07/2021 02:58:36 - INFO - __main__ - Step 40931: {'lr': 0.0004193881929013327, 'samples': 7858752, 'steps': 40930, 'loss/train': 1.7511610984802246} -11/07/2021 02:58:37 - INFO - __main__ - Step 40932: {'lr': 0.00041938428988982403, 'samples': 7858944, 'steps': 40931, 'loss/train': 0.9895086884498596} -11/07/2021 02:58:38 - INFO - __main__ - Step 40933: {'lr': 0.00041938038680199333, 'samples': 7859136, 'steps': 40932, 'loss/train': 1.296011209487915} -11/07/2021 02:58:38 - INFO - __main__ - Step 40934: {'lr': 0.0004193764836378425, 'samples': 7859328, 'steps': 40933, 'loss/train': 1.413246989250183} -11/07/2021 02:58:39 - INFO - __main__ - Step 40935: {'lr': 0.0004193725803973732, 'samples': 7859520, 'steps': 40934, 'loss/train': 1.4412325620651245} -11/07/2021 02:58:39 - INFO - __main__ - Step 40936: {'lr': 0.0004193686770805873, 'samples': 7859712, 'steps': 40935, 'loss/train': 1.5362998247146606} -11/07/2021 02:58:40 - INFO - __main__ - Step 40937: {'lr': 0.00041936477368748645, 'samples': 7859904, 'steps': 40936, 'loss/train': 1.3954333066940308} -11/07/2021 02:58:40 - INFO - __main__ - Step 40938: {'lr': 0.00041936087021807243, 'samples': 7860096, 'steps': 40937, 'loss/train': 1.5923043489456177} -11/07/2021 02:58:41 - INFO - __main__ - Step 40939: {'lr': 0.000419356966672347, 'samples': 7860288, 'steps': 40938, 'loss/train': 1.7164502143859863} -11/07/2021 02:58:41 - INFO - __main__ - Step 40940: {'lr': 0.00041935306305031195, 'samples': 7860480, 'steps': 40939, 'loss/train': 0.6994503140449524} -11/07/2021 02:58:41 - INFO - __main__ - Step 40941: {'lr': 0.000419349159351969, 'samples': 7860672, 'steps': 40940, 'loss/train': 1.786657691001892} -11/07/2021 02:58:42 - INFO - __main__ - Step 40942: {'lr': 0.00041934525557732005, 'samples': 7860864, 'steps': 40941, 'loss/train': 1.44952392578125} -11/07/2021 02:58:43 - INFO - __main__ - Step 40943: {'lr': 0.00041934135172636667, 'samples': 7861056, 'steps': 40942, 'loss/train': 2.088534116744995} -11/07/2021 02:58:43 - INFO - __main__ - Step 40944: {'lr': 0.00041933744779911066, 'samples': 7861248, 'steps': 40943, 'loss/train': 1.5122030973434448} -11/07/2021 02:58:43 - INFO - __main__ - Step 40945: {'lr': 0.00041933354379555376, 'samples': 7861440, 'steps': 40944, 'loss/train': 1.540553331375122} -11/07/2021 02:58:44 - INFO - __main__ - Step 40946: {'lr': 0.00041932963971569786, 'samples': 7861632, 'steps': 40945, 'loss/train': 1.1800307035446167} -11/07/2021 02:58:45 - INFO - __main__ - Step 40947: {'lr': 0.0004193257355595446, 'samples': 7861824, 'steps': 40946, 'loss/train': 1.4031745195388794} -11/07/2021 02:58:45 - INFO - __main__ - Step 40948: {'lr': 0.00041932183132709587, 'samples': 7862016, 'steps': 40947, 'loss/train': 1.0483026504516602} -11/07/2021 02:58:46 - INFO - __main__ - Step 40949: {'lr': 0.00041931792701835325, 'samples': 7862208, 'steps': 40948, 'loss/train': 1.5203033685684204} -11/07/2021 02:58:46 - INFO - __main__ - Step 40950: {'lr': 0.00041931402263331856, 'samples': 7862400, 'steps': 40949, 'loss/train': 1.102845549583435} -11/07/2021 02:58:46 - INFO - __main__ - Step 40951: {'lr': 0.0004193101181719936, 'samples': 7862592, 'steps': 40950, 'loss/train': 1.4966281652450562} -11/07/2021 02:58:47 - INFO - __main__ - Step 40952: {'lr': 0.00041930621363438014, 'samples': 7862784, 'steps': 40951, 'loss/train': 1.6106051206588745} -11/07/2021 02:58:47 - INFO - __main__ - Step 40953: {'lr': 0.0004193023090204799, 'samples': 7862976, 'steps': 40952, 'loss/train': 1.6493892669677734} -11/07/2021 02:58:48 - INFO - __main__ - Step 40954: {'lr': 0.0004192984043302947, 'samples': 7863168, 'steps': 40953, 'loss/train': 1.6793699264526367} -11/07/2021 02:58:48 - INFO - __main__ - Step 40955: {'lr': 0.00041929449956382625, 'samples': 7863360, 'steps': 40954, 'loss/train': 1.2445733547210693} -11/07/2021 02:58:49 - INFO - __main__ - Step 40956: {'lr': 0.0004192905947210762, 'samples': 7863552, 'steps': 40955, 'loss/train': 0.526964545249939} -11/07/2021 02:58:49 - INFO - __main__ - Step 40957: {'lr': 0.00041928668980204653, 'samples': 7863744, 'steps': 40956, 'loss/train': 1.0845738649368286} -11/07/2021 02:58:50 - INFO - __main__ - Step 40958: {'lr': 0.00041928278480673884, 'samples': 7863936, 'steps': 40957, 'loss/train': 1.4329932928085327} -11/07/2021 02:58:50 - INFO - __main__ - Step 40959: {'lr': 0.00041927887973515493, 'samples': 7864128, 'steps': 40958, 'loss/train': 1.483497977256775} -11/07/2021 02:58:51 - INFO - __main__ - Step 40960: {'lr': 0.0004192749745872966, 'samples': 7864320, 'steps': 40959, 'loss/train': 1.2724796533584595} -11/07/2021 02:58:51 - INFO - __main__ - Step 40961: {'lr': 0.00041927106936316563, 'samples': 7864512, 'steps': 40960, 'loss/train': 1.6600308418273926} -11/07/2021 02:58:51 - INFO - __main__ - Step 40962: {'lr': 0.00041926716406276367, 'samples': 7864704, 'steps': 40961, 'loss/train': 1.5604661703109741} -11/07/2021 02:58:52 - INFO - __main__ - Step 40963: {'lr': 0.00041926325868609247, 'samples': 7864896, 'steps': 40962, 'loss/train': 1.5598963499069214} -11/07/2021 02:58:53 - INFO - __main__ - Step 40964: {'lr': 0.0004192593532331539, 'samples': 7865088, 'steps': 40963, 'loss/train': 1.7123584747314453} -11/07/2021 02:58:53 - INFO - __main__ - Step 40965: {'lr': 0.00041925544770394976, 'samples': 7865280, 'steps': 40964, 'loss/train': 1.3562514781951904} -11/07/2021 02:58:53 - INFO - __main__ - Step 40966: {'lr': 0.0004192515420984816, 'samples': 7865472, 'steps': 40965, 'loss/train': 1.4312055110931396} -11/07/2021 02:58:54 - INFO - __main__ - Step 40967: {'lr': 0.0004192476364167514, 'samples': 7865664, 'steps': 40966, 'loss/train': 1.754093885421753} -11/07/2021 02:58:55 - INFO - __main__ - Step 40968: {'lr': 0.0004192437306587608, 'samples': 7865856, 'steps': 40967, 'loss/train': 1.5404969453811646} -11/07/2021 02:58:55 - INFO - __main__ - Step 40969: {'lr': 0.0004192398248245116, 'samples': 7866048, 'steps': 40968, 'loss/train': 1.6052510738372803} -11/07/2021 02:58:56 - INFO - __main__ - Step 40970: {'lr': 0.00041923591891400555, 'samples': 7866240, 'steps': 40969, 'loss/train': 0.7481063604354858} -11/07/2021 02:58:56 - INFO - __main__ - Step 40971: {'lr': 0.00041923201292724436, 'samples': 7866432, 'steps': 40970, 'loss/train': 1.8128414154052734} -11/07/2021 02:58:56 - INFO - __main__ - Step 40972: {'lr': 0.00041922810686422987, 'samples': 7866624, 'steps': 40971, 'loss/train': 1.3442429304122925} -11/07/2021 02:58:57 - INFO - __main__ - Step 40973: {'lr': 0.00041922420072496383, 'samples': 7866816, 'steps': 40972, 'loss/train': 1.2182066440582275} -11/07/2021 02:58:58 - INFO - __main__ - Step 40974: {'lr': 0.00041922029450944785, 'samples': 7867008, 'steps': 40973, 'loss/train': 1.3147344589233398} -11/07/2021 02:58:58 - INFO - __main__ - Step 40975: {'lr': 0.000419216388217684, 'samples': 7867200, 'steps': 40974, 'loss/train': 1.1383329629898071} -11/07/2021 02:58:58 - INFO - __main__ - Step 40976: {'lr': 0.00041921248184967374, 'samples': 7867392, 'steps': 40975, 'loss/train': 1.6389542818069458} -11/07/2021 02:58:59 - INFO - __main__ - Step 40977: {'lr': 0.000419208575405419, 'samples': 7867584, 'steps': 40976, 'loss/train': 1.6150141954421997} -11/07/2021 02:59:00 - INFO - __main__ - Step 40978: {'lr': 0.00041920466888492147, 'samples': 7867776, 'steps': 40977, 'loss/train': 0.9776393175125122} -11/07/2021 02:59:00 - INFO - __main__ - Step 40979: {'lr': 0.00041920076228818293, 'samples': 7867968, 'steps': 40978, 'loss/train': 1.7132076025009155} -11/07/2021 02:59:00 - INFO - __main__ - Step 40980: {'lr': 0.0004191968556152051, 'samples': 7868160, 'steps': 40979, 'loss/train': 0.4408467710018158} -11/07/2021 02:59:01 - INFO - __main__ - Step 40981: {'lr': 0.0004191929488659898, 'samples': 7868352, 'steps': 40980, 'loss/train': 1.6313823461532593} -11/07/2021 02:59:01 - INFO - __main__ - Step 40982: {'lr': 0.00041918904204053874, 'samples': 7868544, 'steps': 40981, 'loss/train': 1.7473126649856567} -11/07/2021 02:59:02 - INFO - __main__ - Step 40983: {'lr': 0.0004191851351388538, 'samples': 7868736, 'steps': 40982, 'loss/train': 1.521274209022522} -11/07/2021 02:59:03 - INFO - __main__ - Step 40984: {'lr': 0.0004191812281609366, 'samples': 7868928, 'steps': 40983, 'loss/train': 1.632369875907898} -11/07/2021 02:59:03 - INFO - __main__ - Step 40985: {'lr': 0.00041917732110678896, 'samples': 7869120, 'steps': 40984, 'loss/train': 2.443267822265625} -11/07/2021 02:59:03 - INFO - __main__ - Step 40986: {'lr': 0.0004191734139764126, 'samples': 7869312, 'steps': 40985, 'loss/train': 1.7018356323242188} -11/07/2021 02:59:04 - INFO - __main__ - Step 40987: {'lr': 0.00041916950676980933, 'samples': 7869504, 'steps': 40986, 'loss/train': 1.4859052896499634} -11/07/2021 02:59:04 - INFO - __main__ - Step 40988: {'lr': 0.0004191655994869809, 'samples': 7869696, 'steps': 40987, 'loss/train': 1.4574897289276123} -11/07/2021 02:59:05 - INFO - __main__ - Step 40989: {'lr': 0.000419161692127929, 'samples': 7869888, 'steps': 40988, 'loss/train': 1.970042109489441} -11/07/2021 02:59:05 - INFO - __main__ - Step 40990: {'lr': 0.00041915778469265555, 'samples': 7870080, 'steps': 40989, 'loss/train': 1.6592310667037964} -11/07/2021 02:59:06 - INFO - __main__ - Step 40991: {'lr': 0.0004191538771811621, 'samples': 7870272, 'steps': 40990, 'loss/train': 1.3842103481292725} -11/07/2021 02:59:06 - INFO - __main__ - Step 40992: {'lr': 0.00041914996959345057, 'samples': 7870464, 'steps': 40991, 'loss/train': 1.3491690158843994} -11/07/2021 02:59:06 - INFO - __main__ - Step 40993: {'lr': 0.0004191460619295227, 'samples': 7870656, 'steps': 40992, 'loss/train': 1.3155477046966553} -11/07/2021 02:59:08 - INFO - __main__ - Step 40994: {'lr': 0.0004191421541893802, 'samples': 7870848, 'steps': 40993, 'loss/train': 1.4192020893096924} -11/07/2021 02:59:08 - INFO - __main__ - Step 40995: {'lr': 0.0004191382463730249, 'samples': 7871040, 'steps': 40994, 'loss/train': 0.810729444026947} -11/07/2021 02:59:08 - INFO - __main__ - Step 40996: {'lr': 0.00041913433848045844, 'samples': 7871232, 'steps': 40995, 'loss/train': 1.2763605117797852} -11/07/2021 02:59:09 - INFO - __main__ - Step 40997: {'lr': 0.00041913043051168276, 'samples': 7871424, 'steps': 40996, 'loss/train': 1.5386114120483398} -11/07/2021 02:59:09 - INFO - __main__ - Step 40998: {'lr': 0.00041912652246669943, 'samples': 7871616, 'steps': 40997, 'loss/train': 1.7605671882629395} -11/07/2021 02:59:10 - INFO - __main__ - Step 40999: {'lr': 0.0004191226143455103, 'samples': 7871808, 'steps': 40998, 'loss/train': 1.474281668663025} -11/07/2021 02:59:10 - INFO - __main__ - Step 41000: {'lr': 0.00041911870614811715, 'samples': 7872000, 'steps': 40999, 'loss/train': 1.4995510578155518} -11/07/2021 02:59:11 - INFO - __main__ - Step 41001: {'lr': 0.00041911479787452177, 'samples': 7872192, 'steps': 41000, 'loss/train': 1.3275129795074463} -11/07/2021 02:59:11 - INFO - __main__ - Step 41002: {'lr': 0.0004191108895247258, 'samples': 7872384, 'steps': 41001, 'loss/train': 1.3515865802764893} -11/07/2021 02:59:11 - INFO - __main__ - Step 41003: {'lr': 0.00041910698109873116, 'samples': 7872576, 'steps': 41002, 'loss/train': 1.233052372932434} -11/07/2021 02:59:12 - INFO - __main__ - Step 41004: {'lr': 0.0004191030725965394, 'samples': 7872768, 'steps': 41003, 'loss/train': 1.0532420873641968} -11/07/2021 02:59:13 - INFO - __main__ - Step 41005: {'lr': 0.00041909916401815245, 'samples': 7872960, 'steps': 41004, 'loss/train': 1.5793228149414062} -11/07/2021 02:59:13 - INFO - __main__ - Step 41006: {'lr': 0.00041909525536357206, 'samples': 7873152, 'steps': 41005, 'loss/train': 1.4701327085494995} -11/07/2021 02:59:14 - INFO - __main__ - Step 41007: {'lr': 0.0004190913466327999, 'samples': 7873344, 'steps': 41006, 'loss/train': 1.8696014881134033} -11/07/2021 02:59:14 - INFO - __main__ - Step 41008: {'lr': 0.00041908743782583793, 'samples': 7873536, 'steps': 41007, 'loss/train': 1.466177225112915} -11/07/2021 02:59:14 - INFO - __main__ - Step 41009: {'lr': 0.00041908352894268766, 'samples': 7873728, 'steps': 41008, 'loss/train': 1.524558663368225} -11/07/2021 02:59:15 - INFO - __main__ - Step 41010: {'lr': 0.00041907961998335094, 'samples': 7873920, 'steps': 41009, 'loss/train': 1.7194336652755737} -11/07/2021 02:59:16 - INFO - __main__ - Step 41011: {'lr': 0.0004190757109478296, 'samples': 7874112, 'steps': 41010, 'loss/train': 1.3648717403411865} -11/07/2021 02:59:16 - INFO - __main__ - Step 41012: {'lr': 0.00041907180183612525, 'samples': 7874304, 'steps': 41011, 'loss/train': 1.446285605430603} -11/07/2021 02:59:16 - INFO - __main__ - Step 41013: {'lr': 0.00041906789264823985, 'samples': 7874496, 'steps': 41012, 'loss/train': 1.3314675092697144} -11/07/2021 02:59:17 - INFO - __main__ - Step 41014: {'lr': 0.00041906398338417504, 'samples': 7874688, 'steps': 41013, 'loss/train': 1.8180811405181885} -11/07/2021 02:59:18 - INFO - __main__ - Step 41015: {'lr': 0.00041906007404393273, 'samples': 7874880, 'steps': 41014, 'loss/train': 1.1559853553771973} -11/07/2021 02:59:18 - INFO - __main__ - Step 41016: {'lr': 0.0004190561646275144, 'samples': 7875072, 'steps': 41015, 'loss/train': 1.9799628257751465} -11/07/2021 02:59:18 - INFO - __main__ - Step 41017: {'lr': 0.0004190522551349221, 'samples': 7875264, 'steps': 41016, 'loss/train': 1.4010202884674072} -11/07/2021 02:59:19 - INFO - __main__ - Step 41018: {'lr': 0.00041904834556615733, 'samples': 7875456, 'steps': 41017, 'loss/train': 1.2678967714309692} -11/07/2021 02:59:19 - INFO - __main__ - Step 41019: {'lr': 0.000419044435921222, 'samples': 7875648, 'steps': 41018, 'loss/train': 1.5244847536087036} -11/07/2021 02:59:20 - INFO - __main__ - Step 41020: {'lr': 0.0004190405262001179, 'samples': 7875840, 'steps': 41019, 'loss/train': 1.3021565675735474} -11/07/2021 02:59:21 - INFO - __main__ - Step 41021: {'lr': 0.00041903661640284675, 'samples': 7876032, 'steps': 41020, 'loss/train': 1.822368860244751} -11/07/2021 02:59:21 - INFO - __main__ - Step 41022: {'lr': 0.0004190327065294104, 'samples': 7876224, 'steps': 41021, 'loss/train': 0.6467123627662659} -11/07/2021 02:59:21 - INFO - __main__ - Step 41023: {'lr': 0.00041902879657981036, 'samples': 7876416, 'steps': 41022, 'loss/train': 1.0762028694152832} -11/07/2021 02:59:22 - INFO - __main__ - Step 41024: {'lr': 0.00041902488655404864, 'samples': 7876608, 'steps': 41023, 'loss/train': 1.6476768255233765} -11/07/2021 02:59:23 - INFO - __main__ - Step 41025: {'lr': 0.0004190209764521269, 'samples': 7876800, 'steps': 41024, 'loss/train': 1.7097328901290894} -11/07/2021 02:59:23 - INFO - __main__ - Step 41026: {'lr': 0.0004190170662740469, 'samples': 7876992, 'steps': 41025, 'loss/train': 1.1358178853988647} -11/07/2021 02:59:23 - INFO - __main__ - Step 41027: {'lr': 0.0004190131560198104, 'samples': 7877184, 'steps': 41026, 'loss/train': 1.4658715724945068} -11/07/2021 02:59:24 - INFO - __main__ - Step 41028: {'lr': 0.00041900924568941925, 'samples': 7877376, 'steps': 41027, 'loss/train': 0.515064537525177} -11/07/2021 02:59:24 - INFO - __main__ - Step 41029: {'lr': 0.0004190053352828751, 'samples': 7877568, 'steps': 41028, 'loss/train': 1.1149355173110962} -11/07/2021 02:59:25 - INFO - __main__ - Step 41030: {'lr': 0.00041900142480017974, 'samples': 7877760, 'steps': 41029, 'loss/train': 0.8842067718505859} -11/07/2021 02:59:25 - INFO - __main__ - Step 41031: {'lr': 0.0004189975142413349, 'samples': 7877952, 'steps': 41030, 'loss/train': 1.2230801582336426} -11/07/2021 02:59:26 - INFO - __main__ - Step 41032: {'lr': 0.00041899360360634247, 'samples': 7878144, 'steps': 41031, 'loss/train': 1.5904314517974854} -11/07/2021 02:59:26 - INFO - __main__ - Step 41033: {'lr': 0.0004189896928952041, 'samples': 7878336, 'steps': 41032, 'loss/train': 1.352460265159607} -11/07/2021 02:59:26 - INFO - __main__ - Step 41034: {'lr': 0.0004189857821079216, 'samples': 7878528, 'steps': 41033, 'loss/train': 1.438441514968872} -11/07/2021 02:59:28 - INFO - __main__ - Step 41035: {'lr': 0.0004189818712444967, 'samples': 7878720, 'steps': 41034, 'loss/train': 1.6369142532348633} -11/07/2021 02:59:28 - INFO - __main__ - Step 41036: {'lr': 0.0004189779603049312, 'samples': 7878912, 'steps': 41035, 'loss/train': 0.795782208442688} -11/07/2021 02:59:28 - INFO - __main__ - Step 41037: {'lr': 0.0004189740492892268, 'samples': 7879104, 'steps': 41036, 'loss/train': 1.4832515716552734} -11/07/2021 02:59:29 - INFO - __main__ - Step 41038: {'lr': 0.0004189701381973853, 'samples': 7879296, 'steps': 41037, 'loss/train': 1.3019779920578003} -11/07/2021 02:59:29 - INFO - __main__ - Step 41039: {'lr': 0.00041896622702940846, 'samples': 7879488, 'steps': 41038, 'loss/train': 1.4662656784057617} -11/07/2021 02:59:29 - INFO - __main__ - Step 41040: {'lr': 0.0004189623157852981, 'samples': 7879680, 'steps': 41039, 'loss/train': 1.8899928331375122} -11/07/2021 02:59:30 - INFO - __main__ - Step 41041: {'lr': 0.0004189584044650559, 'samples': 7879872, 'steps': 41040, 'loss/train': 2.035140037536621} -11/07/2021 02:59:31 - INFO - __main__ - Step 41042: {'lr': 0.0004189544930686837, 'samples': 7880064, 'steps': 41041, 'loss/train': 2.037627696990967} -11/07/2021 02:59:31 - INFO - __main__ - Step 41043: {'lr': 0.0004189505815961831, 'samples': 7880256, 'steps': 41042, 'loss/train': 1.5560941696166992} -11/07/2021 02:59:31 - INFO - __main__ - Step 41044: {'lr': 0.000418946670047556, 'samples': 7880448, 'steps': 41043, 'loss/train': 1.392247200012207} -11/07/2021 02:59:32 - INFO - __main__ - Step 41045: {'lr': 0.0004189427584228042, 'samples': 7880640, 'steps': 41044, 'loss/train': 1.5331697463989258} -11/07/2021 02:59:33 - INFO - __main__ - Step 41046: {'lr': 0.0004189388467219294, 'samples': 7880832, 'steps': 41045, 'loss/train': 1.496413230895996} -11/07/2021 02:59:33 - INFO - __main__ - Step 41047: {'lr': 0.0004189349349449333, 'samples': 7881024, 'steps': 41046, 'loss/train': 1.2940542697906494} -11/07/2021 02:59:34 - INFO - __main__ - Step 41048: {'lr': 0.00041893102309181773, 'samples': 7881216, 'steps': 41047, 'loss/train': 1.5159060955047607} -11/07/2021 02:59:34 - INFO - __main__ - Step 41049: {'lr': 0.00041892711116258454, 'samples': 7881408, 'steps': 41048, 'loss/train': 1.2349627017974854} -11/07/2021 02:59:34 - INFO - __main__ - Step 41050: {'lr': 0.00041892319915723533, 'samples': 7881600, 'steps': 41049, 'loss/train': 1.1747950315475464} -11/07/2021 02:59:35 - INFO - __main__ - Step 41051: {'lr': 0.0004189192870757719, 'samples': 7881792, 'steps': 41050, 'loss/train': 1.7542132139205933} -11/07/2021 02:59:36 - INFO - __main__ - Step 41052: {'lr': 0.0004189153749181961, 'samples': 7881984, 'steps': 41051, 'loss/train': 1.3275436162948608} -11/07/2021 02:59:36 - INFO - __main__ - Step 41053: {'lr': 0.00041891146268450963, 'samples': 7882176, 'steps': 41052, 'loss/train': 1.717761516571045} -11/07/2021 02:59:37 - INFO - __main__ - Step 41054: {'lr': 0.0004189075503747142, 'samples': 7882368, 'steps': 41053, 'loss/train': 1.5952472686767578} -11/07/2021 02:59:37 - INFO - __main__ - Step 41055: {'lr': 0.0004189036379888117, 'samples': 7882560, 'steps': 41054, 'loss/train': 1.4856972694396973} -11/07/2021 02:59:37 - INFO - __main__ - Step 41056: {'lr': 0.00041889972552680387, 'samples': 7882752, 'steps': 41055, 'loss/train': 1.6331814527511597} -11/07/2021 02:59:38 - INFO - __main__ - Step 41057: {'lr': 0.0004188958129886924, 'samples': 7882944, 'steps': 41056, 'loss/train': 1.7809665203094482} -11/07/2021 02:59:39 - INFO - __main__ - Step 41058: {'lr': 0.000418891900374479, 'samples': 7883136, 'steps': 41057, 'loss/train': 1.209208369255066} -11/07/2021 02:59:39 - INFO - __main__ - Step 41059: {'lr': 0.0004188879876841656, 'samples': 7883328, 'steps': 41058, 'loss/train': 2.0920801162719727} -11/07/2021 02:59:39 - INFO - __main__ - Step 41060: {'lr': 0.0004188840749177538, 'samples': 7883520, 'steps': 41059, 'loss/train': 1.6948528289794922} -11/07/2021 02:59:40 - INFO - __main__ - Step 41061: {'lr': 0.0004188801620752455, 'samples': 7883712, 'steps': 41060, 'loss/train': 1.7842382192611694} -11/07/2021 02:59:41 - INFO - __main__ - Step 41062: {'lr': 0.00041887624915664247, 'samples': 7883904, 'steps': 41061, 'loss/train': 0.37048017978668213} -11/07/2021 02:59:41 - INFO - __main__ - Step 41063: {'lr': 0.0004188723361619463, 'samples': 7884096, 'steps': 41062, 'loss/train': 1.9038022756576538} -11/07/2021 02:59:41 - INFO - __main__ - Step 41064: {'lr': 0.0004188684230911589, 'samples': 7884288, 'steps': 41063, 'loss/train': 1.2390437126159668} -11/07/2021 02:59:42 - INFO - __main__ - Step 41065: {'lr': 0.00041886450994428197, 'samples': 7884480, 'steps': 41064, 'loss/train': 1.3526166677474976} -11/07/2021 02:59:42 - INFO - __main__ - Step 41066: {'lr': 0.0004188605967213174, 'samples': 7884672, 'steps': 41065, 'loss/train': 0.6758860945701599} -11/07/2021 02:59:43 - INFO - __main__ - Step 41067: {'lr': 0.0004188566834222667, 'samples': 7884864, 'steps': 41066, 'loss/train': 1.5114113092422485} -11/07/2021 02:59:43 - INFO - __main__ - Step 41068: {'lr': 0.00041885277004713185, 'samples': 7885056, 'steps': 41067, 'loss/train': 1.4266055822372437} -11/07/2021 02:59:44 - INFO - __main__ - Step 41069: {'lr': 0.0004188488565959146, 'samples': 7885248, 'steps': 41068, 'loss/train': 1.9119995832443237} -11/07/2021 02:59:44 - INFO - __main__ - Step 41070: {'lr': 0.0004188449430686166, 'samples': 7885440, 'steps': 41069, 'loss/train': 1.4126471281051636} -11/07/2021 02:59:44 - INFO - __main__ - Step 41071: {'lr': 0.00041884102946523964, 'samples': 7885632, 'steps': 41070, 'loss/train': 1.4124705791473389} -11/07/2021 02:59:45 - INFO - __main__ - Step 41072: {'lr': 0.0004188371157857856, 'samples': 7885824, 'steps': 41071, 'loss/train': 2.075404167175293} -11/07/2021 02:59:46 - INFO - __main__ - Step 41073: {'lr': 0.0004188332020302561, 'samples': 7886016, 'steps': 41072, 'loss/train': 1.1294195652008057} -11/07/2021 02:59:46 - INFO - __main__ - Step 41074: {'lr': 0.000418829288198653, 'samples': 7886208, 'steps': 41073, 'loss/train': 1.5374236106872559} -11/07/2021 02:59:47 - INFO - __main__ - Step 41075: {'lr': 0.00041882537429097804, 'samples': 7886400, 'steps': 41074, 'loss/train': 1.0856437683105469} -11/07/2021 02:59:47 - INFO - __main__ - Step 41076: {'lr': 0.00041882146030723297, 'samples': 7886592, 'steps': 41075, 'loss/train': 1.1252588033676147} -11/07/2021 02:59:48 - INFO - __main__ - Step 41077: {'lr': 0.0004188175462474195, 'samples': 7886784, 'steps': 41076, 'loss/train': 1.6488182544708252} -11/07/2021 02:59:48 - INFO - __main__ - Step 41078: {'lr': 0.0004188136321115395, 'samples': 7886976, 'steps': 41077, 'loss/train': 1.5101019144058228} -11/07/2021 02:59:49 - INFO - __main__ - Step 41079: {'lr': 0.00041880971789959466, 'samples': 7887168, 'steps': 41078, 'loss/train': 1.8681154251098633} -11/07/2021 02:59:49 - INFO - __main__ - Step 41080: {'lr': 0.0004188058036115868, 'samples': 7887360, 'steps': 41079, 'loss/train': 1.7132915258407593} -11/07/2021 02:59:49 - INFO - __main__ - Step 41081: {'lr': 0.0004188018892475176, 'samples': 7887552, 'steps': 41080, 'loss/train': 1.715844988822937} -11/07/2021 02:59:50 - INFO - __main__ - Step 41082: {'lr': 0.0004187979748073889, 'samples': 7887744, 'steps': 41081, 'loss/train': 1.5530753135681152} -11/07/2021 02:59:51 - INFO - __main__ - Step 41083: {'lr': 0.0004187940602912024, 'samples': 7887936, 'steps': 41082, 'loss/train': 1.3540942668914795} -11/07/2021 02:59:51 - INFO - __main__ - Step 41084: {'lr': 0.00041879014569895994, 'samples': 7888128, 'steps': 41083, 'loss/train': 1.4271323680877686} -11/07/2021 02:59:51 - INFO - __main__ - Step 41085: {'lr': 0.0004187862310306633, 'samples': 7888320, 'steps': 41084, 'loss/train': 1.9033116102218628} -11/07/2021 02:59:52 - INFO - __main__ - Step 41086: {'lr': 0.00041878231628631406, 'samples': 7888512, 'steps': 41085, 'loss/train': 2.167079448699951} -11/07/2021 02:59:53 - INFO - __main__ - Step 41087: {'lr': 0.0004187784014659142, 'samples': 7888704, 'steps': 41086, 'loss/train': 0.9366491436958313} -11/07/2021 02:59:53 - INFO - __main__ - Step 41088: {'lr': 0.0004187744865694654, 'samples': 7888896, 'steps': 41087, 'loss/train': 1.4434558153152466} -11/07/2021 02:59:54 - INFO - __main__ - Step 41089: {'lr': 0.0004187705715969694, 'samples': 7889088, 'steps': 41088, 'loss/train': 1.1905782222747803} -11/07/2021 02:59:54 - INFO - __main__ - Step 41090: {'lr': 0.0004187666565484279, 'samples': 7889280, 'steps': 41089, 'loss/train': 1.3745850324630737} -11/07/2021 02:59:54 - INFO - __main__ - Step 41091: {'lr': 0.0004187627414238428, 'samples': 7889472, 'steps': 41090, 'loss/train': 0.6837329864501953} -11/07/2021 02:59:55 - INFO - __main__ - Step 41092: {'lr': 0.0004187588262232159, 'samples': 7889664, 'steps': 41091, 'loss/train': 1.574971079826355} -11/07/2021 02:59:56 - INFO - __main__ - Step 41093: {'lr': 0.00041875491094654885, 'samples': 7889856, 'steps': 41092, 'loss/train': 1.2117096185684204} -11/07/2021 02:59:56 - INFO - __main__ - Step 41094: {'lr': 0.0004187509955938434, 'samples': 7890048, 'steps': 41093, 'loss/train': 1.3760145902633667} -11/07/2021 02:59:56 - INFO - __main__ - Step 41095: {'lr': 0.0004187470801651013, 'samples': 7890240, 'steps': 41094, 'loss/train': 1.254813551902771} -11/07/2021 02:59:57 - INFO - __main__ - Step 41096: {'lr': 0.0004187431646603245, 'samples': 7890432, 'steps': 41095, 'loss/train': 1.0888969898223877} -11/07/2021 02:59:58 - INFO - __main__ - Step 41097: {'lr': 0.0004187392490795146, 'samples': 7890624, 'steps': 41096, 'loss/train': 1.7391693592071533} -11/07/2021 02:59:58 - INFO - __main__ - Step 41098: {'lr': 0.00041873533342267336, 'samples': 7890816, 'steps': 41097, 'loss/train': 1.4721550941467285} -11/07/2021 02:59:58 - INFO - __main__ - Step 41099: {'lr': 0.0004187314176898026, 'samples': 7891008, 'steps': 41098, 'loss/train': 1.741350769996643} -11/07/2021 02:59:59 - INFO - __main__ - Step 41100: {'lr': 0.000418727501880904, 'samples': 7891200, 'steps': 41099, 'loss/train': 2.3582005500793457} -11/07/2021 02:59:59 - INFO - __main__ - Step 41101: {'lr': 0.00041872358599597947, 'samples': 7891392, 'steps': 41100, 'loss/train': 1.6507580280303955} -11/07/2021 02:59:59 - INFO - __main__ - Step 41102: {'lr': 0.00041871967003503073, 'samples': 7891584, 'steps': 41101, 'loss/train': 1.177298903465271} -11/07/2021 03:00:01 - INFO - __main__ - Step 41103: {'lr': 0.00041871575399805947, 'samples': 7891776, 'steps': 41102, 'loss/train': 1.187396764755249} -11/07/2021 03:00:01 - INFO - __main__ - Step 41104: {'lr': 0.0004187118378850674, 'samples': 7891968, 'steps': 41103, 'loss/train': 1.6059626340866089} -11/07/2021 03:00:01 - INFO - __main__ - Step 41105: {'lr': 0.00041870792169605654, 'samples': 7892160, 'steps': 41104, 'loss/train': 2.1208462715148926} -11/07/2021 03:00:02 - INFO - __main__ - Step 41106: {'lr': 0.0004187040054310284, 'samples': 7892352, 'steps': 41105, 'loss/train': 1.490696907043457} -11/07/2021 03:00:02 - INFO - __main__ - Step 41107: {'lr': 0.0004187000890899848, 'samples': 7892544, 'steps': 41106, 'loss/train': 1.494994044303894} -11/07/2021 03:00:03 - INFO - __main__ - Step 41108: {'lr': 0.0004186961726729276, 'samples': 7892736, 'steps': 41107, 'loss/train': 1.3582350015640259} -11/07/2021 03:00:03 - INFO - __main__ - Step 41109: {'lr': 0.0004186922561798585, 'samples': 7892928, 'steps': 41108, 'loss/train': 0.9714041948318481} -11/07/2021 03:00:04 - INFO - __main__ - Step 41110: {'lr': 0.00041868833961077935, 'samples': 7893120, 'steps': 41109, 'loss/train': 1.1687935590744019} -11/07/2021 03:00:04 - INFO - __main__ - Step 41111: {'lr': 0.0004186844229656917, 'samples': 7893312, 'steps': 41110, 'loss/train': 1.5238968133926392} -11/07/2021 03:00:04 - INFO - __main__ - Step 41112: {'lr': 0.0004186805062445975, 'samples': 7893504, 'steps': 41111, 'loss/train': 1.8914436101913452} -11/07/2021 03:00:06 - INFO - __main__ - Step 41113: {'lr': 0.00041867658944749856, 'samples': 7893696, 'steps': 41112, 'loss/train': 1.78902006149292} -11/07/2021 03:00:06 - INFO - __main__ - Step 41114: {'lr': 0.00041867267257439644, 'samples': 7893888, 'steps': 41113, 'loss/train': 1.6058887243270874} -11/07/2021 03:00:06 - INFO - __main__ - Step 41115: {'lr': 0.00041866875562529305, 'samples': 7894080, 'steps': 41114, 'loss/train': 1.6523754596710205} -11/07/2021 03:00:07 - INFO - __main__ - Step 41116: {'lr': 0.0004186648386001901, 'samples': 7894272, 'steps': 41115, 'loss/train': 0.9120059013366699} -11/07/2021 03:00:07 - INFO - __main__ - Step 41117: {'lr': 0.0004186609214990894, 'samples': 7894464, 'steps': 41116, 'loss/train': 1.5206637382507324} -11/07/2021 03:00:07 - INFO - __main__ - Step 41118: {'lr': 0.0004186570043219927, 'samples': 7894656, 'steps': 41117, 'loss/train': 1.4369728565216064} -11/07/2021 03:00:08 - INFO - __main__ - Step 41119: {'lr': 0.0004186530870689017, 'samples': 7894848, 'steps': 41118, 'loss/train': 1.2693451642990112} -11/07/2021 03:00:09 - INFO - __main__ - Step 41120: {'lr': 0.00041864916973981833, 'samples': 7895040, 'steps': 41119, 'loss/train': 1.017479419708252} -11/07/2021 03:00:09 - INFO - __main__ - Step 41121: {'lr': 0.0004186452523347442, 'samples': 7895232, 'steps': 41120, 'loss/train': 1.0667365789413452} -11/07/2021 03:00:09 - INFO - __main__ - Step 41122: {'lr': 0.00041864133485368106, 'samples': 7895424, 'steps': 41121, 'loss/train': 1.0865099430084229} -11/07/2021 03:00:10 - INFO - __main__ - Step 41123: {'lr': 0.0004186374172966308, 'samples': 7895616, 'steps': 41122, 'loss/train': 1.5828053951263428} -11/07/2021 03:00:11 - INFO - __main__ - Step 41124: {'lr': 0.0004186334996635951, 'samples': 7895808, 'steps': 41123, 'loss/train': 1.979206919670105} -11/07/2021 03:00:11 - INFO - __main__ - Step 41125: {'lr': 0.00041862958195457574, 'samples': 7896000, 'steps': 41124, 'loss/train': 0.7947288751602173} -11/07/2021 03:00:12 - INFO - __main__ - Step 41126: {'lr': 0.0004186256641695745, 'samples': 7896192, 'steps': 41125, 'loss/train': 0.6448233723640442} -11/07/2021 03:00:12 - INFO - __main__ - Step 41127: {'lr': 0.00041862174630859315, 'samples': 7896384, 'steps': 41126, 'loss/train': 1.4096827507019043} -11/07/2021 03:00:12 - INFO - __main__ - Step 41128: {'lr': 0.0004186178283716334, 'samples': 7896576, 'steps': 41127, 'loss/train': 1.2233763933181763} -11/07/2021 03:00:13 - INFO - __main__ - Step 41129: {'lr': 0.0004186139103586971, 'samples': 7896768, 'steps': 41128, 'loss/train': 1.5383292436599731} -11/07/2021 03:00:14 - INFO - __main__ - Step 41130: {'lr': 0.00041860999226978605, 'samples': 7896960, 'steps': 41129, 'loss/train': 1.4980281591415405} -11/07/2021 03:00:14 - INFO - __main__ - Step 41131: {'lr': 0.0004186060741049018, 'samples': 7897152, 'steps': 41130, 'loss/train': 0.919456958770752} -11/07/2021 03:00:15 - INFO - __main__ - Step 41132: {'lr': 0.00041860215586404624, 'samples': 7897344, 'steps': 41131, 'loss/train': 1.7707819938659668} -11/07/2021 03:00:15 - INFO - __main__ - Step 41133: {'lr': 0.00041859823754722127, 'samples': 7897536, 'steps': 41132, 'loss/train': 1.076181411743164} -11/07/2021 03:00:16 - INFO - __main__ - Step 41134: {'lr': 0.00041859431915442847, 'samples': 7897728, 'steps': 41133, 'loss/train': 1.4806371927261353} -11/07/2021 03:00:16 - INFO - __main__ - Step 41135: {'lr': 0.0004185904006856697, 'samples': 7897920, 'steps': 41134, 'loss/train': 1.6345583200454712} -11/07/2021 03:00:17 - INFO - __main__ - Step 41136: {'lr': 0.0004185864821409467, 'samples': 7898112, 'steps': 41135, 'loss/train': 1.5924763679504395} -11/07/2021 03:00:17 - INFO - __main__ - Step 41137: {'lr': 0.00041858256352026124, 'samples': 7898304, 'steps': 41136, 'loss/train': 1.5258071422576904} -11/07/2021 03:00:17 - INFO - __main__ - Step 41138: {'lr': 0.0004185786448236151, 'samples': 7898496, 'steps': 41137, 'loss/train': 1.2716859579086304} -11/07/2021 03:00:18 - INFO - __main__ - Step 41139: {'lr': 0.0004185747260510099, 'samples': 7898688, 'steps': 41138, 'loss/train': 1.5812559127807617} -11/07/2021 03:00:19 - INFO - __main__ - Step 41140: {'lr': 0.0004185708072024476, 'samples': 7898880, 'steps': 41139, 'loss/train': 1.661331057548523} -11/07/2021 03:00:19 - INFO - __main__ - Step 41141: {'lr': 0.0004185668882779299, 'samples': 7899072, 'steps': 41140, 'loss/train': 1.2637416124343872} -11/07/2021 03:00:19 - INFO - __main__ - Step 41142: {'lr': 0.00041856296927745857, 'samples': 7899264, 'steps': 41141, 'loss/train': 1.122740626335144} -11/07/2021 03:00:20 - INFO - __main__ - Step 41143: {'lr': 0.00041855905020103543, 'samples': 7899456, 'steps': 41142, 'loss/train': 1.4493659734725952} -11/07/2021 03:00:21 - INFO - __main__ - Step 41144: {'lr': 0.00041855513104866203, 'samples': 7899648, 'steps': 41143, 'loss/train': 1.2647788524627686} -11/07/2021 03:00:21 - INFO - __main__ - Step 41145: {'lr': 0.00041855121182034037, 'samples': 7899840, 'steps': 41144, 'loss/train': 1.7006542682647705} -11/07/2021 03:00:22 - INFO - __main__ - Step 41146: {'lr': 0.00041854729251607214, 'samples': 7900032, 'steps': 41145, 'loss/train': 1.4035475254058838} -11/07/2021 03:00:22 - INFO - __main__ - Step 41147: {'lr': 0.00041854337313585913, 'samples': 7900224, 'steps': 41146, 'loss/train': 1.5544965267181396} -11/07/2021 03:00:22 - INFO - __main__ - Step 41148: {'lr': 0.000418539453679703, 'samples': 7900416, 'steps': 41147, 'loss/train': 1.6288424730300903} -11/07/2021 03:00:23 - INFO - __main__ - Step 41149: {'lr': 0.0004185355341476057, 'samples': 7900608, 'steps': 41148, 'loss/train': 1.534730315208435} -11/07/2021 03:00:24 - INFO - __main__ - Step 41150: {'lr': 0.00041853161453956885, 'samples': 7900800, 'steps': 41149, 'loss/train': 1.6405394077301025} -11/07/2021 03:00:24 - INFO - __main__ - Step 41151: {'lr': 0.0004185276948555942, 'samples': 7900992, 'steps': 41150, 'loss/train': 1.3956571817398071} -11/07/2021 03:00:24 - INFO - __main__ - Step 41152: {'lr': 0.0004185237750956836, 'samples': 7901184, 'steps': 41151, 'loss/train': 1.4736276865005493} -11/07/2021 03:00:25 - INFO - __main__ - Step 41153: {'lr': 0.0004185198552598388, 'samples': 7901376, 'steps': 41152, 'loss/train': 1.2600595951080322} -11/07/2021 03:00:26 - INFO - __main__ - Step 41154: {'lr': 0.00041851593534806154, 'samples': 7901568, 'steps': 41153, 'loss/train': 1.4591710567474365} -11/07/2021 03:00:26 - INFO - __main__ - Step 41155: {'lr': 0.0004185120153603536, 'samples': 7901760, 'steps': 41154, 'loss/train': 1.0266485214233398} -11/07/2021 03:00:27 - INFO - __main__ - Step 41156: {'lr': 0.0004185080952967168, 'samples': 7901952, 'steps': 41155, 'loss/train': 1.5074058771133423} -11/07/2021 03:00:27 - INFO - __main__ - Step 41157: {'lr': 0.00041850417515715277, 'samples': 7902144, 'steps': 41156, 'loss/train': 1.0465952157974243} -11/07/2021 03:00:27 - INFO - __main__ - Step 41158: {'lr': 0.00041850025494166346, 'samples': 7902336, 'steps': 41157, 'loss/train': 1.8012182712554932} -11/07/2021 03:00:28 - INFO - __main__ - Step 41159: {'lr': 0.0004184963346502504, 'samples': 7902528, 'steps': 41158, 'loss/train': 1.931903600692749} -11/07/2021 03:00:29 - INFO - __main__ - Step 41160: {'lr': 0.00041849241428291555, 'samples': 7902720, 'steps': 41159, 'loss/train': 0.7333551049232483} -11/07/2021 03:00:29 - INFO - __main__ - Step 41161: {'lr': 0.00041848849383966063, 'samples': 7902912, 'steps': 41160, 'loss/train': 0.9262370467185974} -11/07/2021 03:00:29 - INFO - __main__ - Step 41162: {'lr': 0.0004184845733204874, 'samples': 7903104, 'steps': 41161, 'loss/train': 1.379118800163269} -11/07/2021 03:00:30 - INFO - __main__ - Step 41163: {'lr': 0.00041848065272539765, 'samples': 7903296, 'steps': 41162, 'loss/train': 1.4716529846191406} -11/07/2021 03:00:31 - INFO - __main__ - Step 41164: {'lr': 0.00041847673205439305, 'samples': 7903488, 'steps': 41163, 'loss/train': 1.436081886291504} -11/07/2021 03:00:31 - INFO - __main__ - Step 41165: {'lr': 0.0004184728113074755, 'samples': 7903680, 'steps': 41164, 'loss/train': 1.4125069379806519} -11/07/2021 03:00:31 - INFO - __main__ - Step 41166: {'lr': 0.00041846889048464665, 'samples': 7903872, 'steps': 41165, 'loss/train': 1.7010443210601807} -11/07/2021 03:00:32 - INFO - __main__ - Step 41167: {'lr': 0.0004184649695859083, 'samples': 7904064, 'steps': 41166, 'loss/train': 1.6647261381149292} -11/07/2021 03:00:32 - INFO - __main__ - Step 41168: {'lr': 0.00041846104861126233, 'samples': 7904256, 'steps': 41167, 'loss/train': 2.12406325340271} -11/07/2021 03:00:33 - INFO - __main__ - Step 41169: {'lr': 0.0004184571275607103, 'samples': 7904448, 'steps': 41168, 'loss/train': 1.7294236421585083} -11/07/2021 03:00:34 - INFO - __main__ - Step 41170: {'lr': 0.0004184532064342542, 'samples': 7904640, 'steps': 41169, 'loss/train': 1.4182112216949463} -11/07/2021 03:00:34 - INFO - __main__ - Step 41171: {'lr': 0.0004184492852318956, 'samples': 7904832, 'steps': 41170, 'loss/train': 1.6887729167938232} -11/07/2021 03:00:34 - INFO - __main__ - Step 41172: {'lr': 0.00041844536395363636, 'samples': 7905024, 'steps': 41171, 'loss/train': 1.4426734447479248} -11/07/2021 03:00:35 - INFO - __main__ - Step 41173: {'lr': 0.00041844144259947825, 'samples': 7905216, 'steps': 41172, 'loss/train': 1.449723720550537} -11/07/2021 03:00:36 - INFO - __main__ - Step 41174: {'lr': 0.000418437521169423, 'samples': 7905408, 'steps': 41173, 'loss/train': 1.7111395597457886} -11/07/2021 03:00:36 - INFO - __main__ - Step 41175: {'lr': 0.0004184335996634725, 'samples': 7905600, 'steps': 41174, 'loss/train': 1.5197077989578247} -11/07/2021 03:00:36 - INFO - __main__ - Step 41176: {'lr': 0.00041842967808162834, 'samples': 7905792, 'steps': 41175, 'loss/train': 1.224771499633789} -11/07/2021 03:00:37 - INFO - __main__ - Step 41177: {'lr': 0.0004184257564238924, 'samples': 7905984, 'steps': 41176, 'loss/train': 1.630832314491272} -11/07/2021 03:00:37 - INFO - __main__ - Step 41178: {'lr': 0.0004184218346902663, 'samples': 7906176, 'steps': 41177, 'loss/train': 1.420072078704834} -11/07/2021 03:00:37 - INFO - __main__ - Step 41179: {'lr': 0.00041841791288075203, 'samples': 7906368, 'steps': 41178, 'loss/train': 1.6199049949645996} -11/07/2021 03:00:39 - INFO - __main__ - Step 41180: {'lr': 0.0004184139909953513, 'samples': 7906560, 'steps': 41179, 'loss/train': 1.5802867412567139} -11/07/2021 03:00:39 - INFO - __main__ - Step 41181: {'lr': 0.0004184100690340657, 'samples': 7906752, 'steps': 41180, 'loss/train': 1.0029767751693726} -11/07/2021 03:00:39 - INFO - __main__ - Step 41182: {'lr': 0.00041840614699689715, 'samples': 7906944, 'steps': 41181, 'loss/train': 1.5073751211166382} -11/07/2021 03:00:40 - INFO - __main__ - Step 41183: {'lr': 0.00041840222488384745, 'samples': 7907136, 'steps': 41182, 'loss/train': 1.5685653686523438} -11/07/2021 03:00:40 - INFO - __main__ - Step 41184: {'lr': 0.00041839830269491823, 'samples': 7907328, 'steps': 41183, 'loss/train': 1.391185998916626} -11/07/2021 03:00:41 - INFO - __main__ - Step 41185: {'lr': 0.0004183943804301114, 'samples': 7907520, 'steps': 41184, 'loss/train': 1.2560378313064575} -11/07/2021 03:00:41 - INFO - __main__ - Step 41186: {'lr': 0.0004183904580894287, 'samples': 7907712, 'steps': 41185, 'loss/train': 1.225590467453003} -11/07/2021 03:00:42 - INFO - __main__ - Step 41187: {'lr': 0.0004183865356728717, 'samples': 7907904, 'steps': 41186, 'loss/train': 1.9919193983078003} -11/07/2021 03:00:42 - INFO - __main__ - Step 41188: {'lr': 0.0004183826131804424, 'samples': 7908096, 'steps': 41187, 'loss/train': 1.4859697818756104} -11/07/2021 03:00:42 - INFO - __main__ - Step 41189: {'lr': 0.0004183786906121425, 'samples': 7908288, 'steps': 41188, 'loss/train': 1.4693942070007324} -11/07/2021 03:00:43 - INFO - __main__ - Step 41190: {'lr': 0.0004183747679679738, 'samples': 7908480, 'steps': 41189, 'loss/train': 1.2072123289108276} -11/07/2021 03:00:44 - INFO - __main__ - Step 41191: {'lr': 0.000418370845247938, 'samples': 7908672, 'steps': 41190, 'loss/train': 1.5702741146087646} -11/07/2021 03:00:44 - INFO - __main__ - Step 41192: {'lr': 0.0004183669224520369, 'samples': 7908864, 'steps': 41191, 'loss/train': 1.5912758111953735} -11/07/2021 03:00:44 - INFO - __main__ - Step 41193: {'lr': 0.00041836299958027226, 'samples': 7909056, 'steps': 41192, 'loss/train': 1.2868040800094604} -11/07/2021 03:00:45 - INFO - __main__ - Step 41194: {'lr': 0.00041835907663264585, 'samples': 7909248, 'steps': 41193, 'loss/train': 2.07917857170105} -11/07/2021 03:00:46 - INFO - __main__ - Step 41195: {'lr': 0.0004183551536091594, 'samples': 7909440, 'steps': 41194, 'loss/train': 1.5447174310684204} -11/07/2021 03:00:46 - INFO - __main__ - Step 41196: {'lr': 0.00041835123050981476, 'samples': 7909632, 'steps': 41195, 'loss/train': 1.3635088205337524} -11/07/2021 03:00:47 - INFO - __main__ - Step 41197: {'lr': 0.00041834730733461366, 'samples': 7909824, 'steps': 41196, 'loss/train': 1.5128867626190186} -11/07/2021 03:00:47 - INFO - __main__ - Step 41198: {'lr': 0.0004183433840835578, 'samples': 7910016, 'steps': 41197, 'loss/train': 1.45900297164917} -11/07/2021 03:00:47 - INFO - __main__ - Step 41199: {'lr': 0.0004183394607566491, 'samples': 7910208, 'steps': 41198, 'loss/train': 0.9792979955673218} -11/07/2021 03:00:48 - INFO - __main__ - Step 41200: {'lr': 0.0004183355373538892, 'samples': 7910400, 'steps': 41199, 'loss/train': 0.5584649443626404} -11/07/2021 03:00:49 - INFO - __main__ - Step 41201: {'lr': 0.00041833161387527985, 'samples': 7910592, 'steps': 41200, 'loss/train': 0.9643514156341553} -11/07/2021 03:00:49 - INFO - __main__ - Step 41202: {'lr': 0.0004183276903208228, 'samples': 7910784, 'steps': 41201, 'loss/train': 1.8792955875396729} -11/07/2021 03:00:50 - INFO - __main__ - Step 41203: {'lr': 0.0004183237666905201, 'samples': 7910976, 'steps': 41202, 'loss/train': 1.084418535232544} -11/07/2021 03:00:50 - INFO - __main__ - Step 41204: {'lr': 0.0004183198429843732, 'samples': 7911168, 'steps': 41203, 'loss/train': 1.5909727811813354} -11/07/2021 03:00:50 - INFO - __main__ - Step 41205: {'lr': 0.00041831591920238396, 'samples': 7911360, 'steps': 41204, 'loss/train': 1.7619580030441284} -11/07/2021 03:00:51 - INFO - __main__ - Step 41206: {'lr': 0.0004183119953445542, 'samples': 7911552, 'steps': 41205, 'loss/train': 1.2859710454940796} -11/07/2021 03:00:52 - INFO - __main__ - Step 41207: {'lr': 0.00041830807141088566, 'samples': 7911744, 'steps': 41206, 'loss/train': 1.5500056743621826} -11/07/2021 03:00:52 - INFO - __main__ - Step 41208: {'lr': 0.0004183041474013801, 'samples': 7911936, 'steps': 41207, 'loss/train': 1.6253983974456787} -11/07/2021 03:00:52 - INFO - __main__ - Step 41209: {'lr': 0.00041830022331603925, 'samples': 7912128, 'steps': 41208, 'loss/train': 1.482258915901184} -11/07/2021 03:00:53 - INFO - __main__ - Step 41210: {'lr': 0.000418296299154865, 'samples': 7912320, 'steps': 41209, 'loss/train': 1.3288849592208862} -11/07/2021 03:00:54 - INFO - __main__ - Step 41211: {'lr': 0.000418292374917859, 'samples': 7912512, 'steps': 41210, 'loss/train': 1.7064313888549805} -11/07/2021 03:00:54 - INFO - __main__ - Step 41212: {'lr': 0.00041828845060502297, 'samples': 7912704, 'steps': 41211, 'loss/train': 1.5797468423843384} -11/07/2021 03:00:55 - INFO - __main__ - Step 41213: {'lr': 0.00041828452621635884, 'samples': 7912896, 'steps': 41212, 'loss/train': 0.6790094375610352} -11/07/2021 03:00:55 - INFO - __main__ - Step 41214: {'lr': 0.0004182806017518682, 'samples': 7913088, 'steps': 41213, 'loss/train': 1.4418489933013916} -11/07/2021 03:00:55 - INFO - __main__ - Step 41215: {'lr': 0.00041827667721155303, 'samples': 7913280, 'steps': 41214, 'loss/train': 2.006834030151367} -11/07/2021 03:00:57 - INFO - __main__ - Step 41216: {'lr': 0.000418272752595415, 'samples': 7913472, 'steps': 41215, 'loss/train': 1.6815943717956543} -11/07/2021 03:00:57 - INFO - __main__ - Step 41217: {'lr': 0.00041826882790345577, 'samples': 7913664, 'steps': 41216, 'loss/train': 1.343355417251587} -11/07/2021 03:00:58 - INFO - __main__ - Step 41218: {'lr': 0.00041826490313567725, 'samples': 7913856, 'steps': 41217, 'loss/train': 1.6229034662246704} -11/07/2021 03:00:58 - INFO - __main__ - Step 41219: {'lr': 0.0004182609782920812, 'samples': 7914048, 'steps': 41218, 'loss/train': 1.9552432298660278} -11/07/2021 03:00:58 - INFO - __main__ - Step 41220: {'lr': 0.0004182570533726693, 'samples': 7914240, 'steps': 41219, 'loss/train': 1.3559013605117798} -11/07/2021 03:00:59 - INFO - __main__ - Step 41221: {'lr': 0.00041825312837744333, 'samples': 7914432, 'steps': 41220, 'loss/train': 1.5077816247940063} -11/07/2021 03:01:00 - INFO - __main__ - Step 41222: {'lr': 0.00041824920330640517, 'samples': 7914624, 'steps': 41221, 'loss/train': 0.24105438590049744} -11/07/2021 03:01:00 - INFO - __main__ - Step 41223: {'lr': 0.0004182452781595565, 'samples': 7914816, 'steps': 41222, 'loss/train': 1.7922337055206299} -11/07/2021 03:01:00 - INFO - __main__ - Step 41224: {'lr': 0.0004182413529368991, 'samples': 7915008, 'steps': 41223, 'loss/train': 1.418586015701294} -11/07/2021 03:01:01 - INFO - __main__ - Step 41225: {'lr': 0.0004182374276384347, 'samples': 7915200, 'steps': 41224, 'loss/train': 1.4558976888656616} -11/07/2021 03:01:01 - INFO - __main__ - Step 41226: {'lr': 0.0004182335022641651, 'samples': 7915392, 'steps': 41225, 'loss/train': 1.558049201965332} -11/07/2021 03:01:02 - INFO - __main__ - Step 41227: {'lr': 0.00041822957681409215, 'samples': 7915584, 'steps': 41226, 'loss/train': 1.8619894981384277} -11/07/2021 03:01:03 - INFO - __main__ - Step 41228: {'lr': 0.00041822565128821757, 'samples': 7915776, 'steps': 41227, 'loss/train': 1.5256032943725586} -11/07/2021 03:01:03 - INFO - __main__ - Step 41229: {'lr': 0.00041822172568654306, 'samples': 7915968, 'steps': 41228, 'loss/train': 1.7781447172164917} -11/07/2021 03:01:03 - INFO - __main__ - Step 41230: {'lr': 0.0004182178000090704, 'samples': 7916160, 'steps': 41229, 'loss/train': 1.4191579818725586} -11/07/2021 03:01:04 - INFO - __main__ - Step 41231: {'lr': 0.0004182138742558015, 'samples': 7916352, 'steps': 41230, 'loss/train': 1.6129021644592285} -11/07/2021 03:01:04 - INFO - __main__ - Step 41232: {'lr': 0.00041820994842673787, 'samples': 7916544, 'steps': 41231, 'loss/train': 1.6607749462127686} -11/07/2021 03:01:05 - INFO - __main__ - Step 41233: {'lr': 0.00041820602252188156, 'samples': 7916736, 'steps': 41232, 'loss/train': 1.9180601835250854} -11/07/2021 03:01:05 - INFO - __main__ - Step 41234: {'lr': 0.00041820209654123416, 'samples': 7916928, 'steps': 41233, 'loss/train': 1.4475653171539307} -11/07/2021 03:01:06 - INFO - __main__ - Step 41235: {'lr': 0.00041819817048479745, 'samples': 7917120, 'steps': 41234, 'loss/train': 4.331748008728027} -11/07/2021 03:01:06 - INFO - __main__ - Step 41236: {'lr': 0.0004181942443525734, 'samples': 7917312, 'steps': 41235, 'loss/train': 1.290693759918213} -11/07/2021 03:01:06 - INFO - __main__ - Step 41237: {'lr': 0.00041819031814456346, 'samples': 7917504, 'steps': 41236, 'loss/train': 1.7088333368301392} -11/07/2021 03:01:08 - INFO - __main__ - Step 41238: {'lr': 0.0004181863918607696, 'samples': 7917696, 'steps': 41237, 'loss/train': 1.9867417812347412} -11/07/2021 03:01:08 - INFO - __main__ - Step 41239: {'lr': 0.00041818246550119354, 'samples': 7917888, 'steps': 41238, 'loss/train': 1.6488137245178223} -11/07/2021 03:01:09 - INFO - __main__ - Step 41240: {'lr': 0.00041817853906583706, 'samples': 7918080, 'steps': 41239, 'loss/train': 1.6615079641342163} -11/07/2021 03:01:09 - INFO - __main__ - Step 41241: {'lr': 0.000418174612554702, 'samples': 7918272, 'steps': 41240, 'loss/train': 1.684520959854126} -11/07/2021 03:01:09 - INFO - __main__ - Step 41242: {'lr': 0.00041817068596778994, 'samples': 7918464, 'steps': 41241, 'loss/train': 1.7856652736663818} -11/07/2021 03:01:10 - INFO - __main__ - Step 41243: {'lr': 0.0004181667593051028, 'samples': 7918656, 'steps': 41242, 'loss/train': 1.7953649759292603} -11/07/2021 03:01:10 - INFO - __main__ - Step 41244: {'lr': 0.0004181628325666424, 'samples': 7918848, 'steps': 41243, 'loss/train': 1.7734460830688477} -11/07/2021 03:01:11 - INFO - __main__ - Step 41245: {'lr': 0.0004181589057524103, 'samples': 7919040, 'steps': 41244, 'loss/train': 1.22751784324646} -11/07/2021 03:01:11 - INFO - __main__ - Step 41246: {'lr': 0.0004181549788624085, 'samples': 7919232, 'steps': 41245, 'loss/train': 1.4137510061264038} -11/07/2021 03:01:12 - INFO - __main__ - Step 41247: {'lr': 0.0004181510518966386, 'samples': 7919424, 'steps': 41246, 'loss/train': 1.210434913635254} -11/07/2021 03:01:12 - INFO - __main__ - Step 41248: {'lr': 0.00041814712485510245, 'samples': 7919616, 'steps': 41247, 'loss/train': 0.9829598665237427} -11/07/2021 03:01:13 - INFO - __main__ - Step 41249: {'lr': 0.0004181431977378017, 'samples': 7919808, 'steps': 41248, 'loss/train': 1.560865879058838} -11/07/2021 03:01:14 - INFO - __main__ - Step 41250: {'lr': 0.00041813927054473835, 'samples': 7920000, 'steps': 41249, 'loss/train': 1.2396860122680664} -11/07/2021 03:01:14 - INFO - __main__ - Step 41251: {'lr': 0.000418135343275914, 'samples': 7920192, 'steps': 41250, 'loss/train': 1.5683566331863403} -11/07/2021 03:01:14 - INFO - __main__ - Step 41252: {'lr': 0.0004181314159313305, 'samples': 7920384, 'steps': 41251, 'loss/train': 1.6124900579452515} -11/07/2021 03:01:15 - INFO - __main__ - Step 41253: {'lr': 0.0004181274885109895, 'samples': 7920576, 'steps': 41252, 'loss/train': 0.991035521030426} -11/07/2021 03:01:15 - INFO - __main__ - Step 41254: {'lr': 0.0004181235610148929, 'samples': 7920768, 'steps': 41253, 'loss/train': 1.6612294912338257} -11/07/2021 03:01:16 - INFO - __main__ - Step 41255: {'lr': 0.0004181196334430424, 'samples': 7920960, 'steps': 41254, 'loss/train': 1.5381064414978027} -11/07/2021 03:01:16 - INFO - __main__ - Step 41256: {'lr': 0.00041811570579543977, 'samples': 7921152, 'steps': 41255, 'loss/train': 1.5637043714523315} -11/07/2021 03:01:17 - INFO - __main__ - Step 41257: {'lr': 0.0004181117780720868, 'samples': 7921344, 'steps': 41256, 'loss/train': 1.1258245706558228} -11/07/2021 03:01:17 - INFO - __main__ - Step 41258: {'lr': 0.00041810785027298524, 'samples': 7921536, 'steps': 41257, 'loss/train': 1.58634352684021} -11/07/2021 03:01:17 - INFO - __main__ - Step 41259: {'lr': 0.00041810392239813695, 'samples': 7921728, 'steps': 41258, 'loss/train': 1.0692466497421265} -11/07/2021 03:01:18 - INFO - __main__ - Step 41260: {'lr': 0.00041809999444754353, 'samples': 7921920, 'steps': 41259, 'loss/train': 2.233379602432251} -11/07/2021 03:01:19 - INFO - __main__ - Step 41261: {'lr': 0.0004180960664212069, 'samples': 7922112, 'steps': 41260, 'loss/train': 1.564186453819275} -11/07/2021 03:01:19 - INFO - __main__ - Step 41262: {'lr': 0.00041809213831912884, 'samples': 7922304, 'steps': 41261, 'loss/train': 1.601365089416504} -11/07/2021 03:01:19 - INFO - __main__ - Step 41263: {'lr': 0.0004180882101413109, 'samples': 7922496, 'steps': 41262, 'loss/train': 1.3063501119613647} -11/07/2021 03:01:20 - INFO - __main__ - Step 41264: {'lr': 0.00041808428188775515, 'samples': 7922688, 'steps': 41263, 'loss/train': 1.4315458536148071} -11/07/2021 03:01:20 - INFO - __main__ - Step 41265: {'lr': 0.0004180803535584632, 'samples': 7922880, 'steps': 41264, 'loss/train': 1.7812724113464355} -11/07/2021 03:01:21 - INFO - __main__ - Step 41266: {'lr': 0.0004180764251534368, 'samples': 7923072, 'steps': 41265, 'loss/train': 1.3440953493118286} -11/07/2021 03:01:22 - INFO - __main__ - Step 41267: {'lr': 0.0004180724966726778, 'samples': 7923264, 'steps': 41266, 'loss/train': 1.538791537284851} -11/07/2021 03:01:22 - INFO - __main__ - Step 41268: {'lr': 0.00041806856811618784, 'samples': 7923456, 'steps': 41267, 'loss/train': 1.7029993534088135} -11/07/2021 03:01:22 - INFO - __main__ - Step 41269: {'lr': 0.00041806463948396876, 'samples': 7923648, 'steps': 41268, 'loss/train': 1.508406639099121} -11/07/2021 03:01:23 - INFO - __main__ - Step 41270: {'lr': 0.0004180607107760225, 'samples': 7923840, 'steps': 41269, 'loss/train': 1.4010753631591797} -11/07/2021 03:01:24 - INFO - __main__ - Step 41271: {'lr': 0.0004180567819923505, 'samples': 7924032, 'steps': 41270, 'loss/train': 1.4275845289230347} -11/07/2021 03:01:24 - INFO - __main__ - Step 41272: {'lr': 0.0004180528531329548, 'samples': 7924224, 'steps': 41271, 'loss/train': 1.6024832725524902} -11/07/2021 03:01:24 - INFO - __main__ - Step 41273: {'lr': 0.00041804892419783715, 'samples': 7924416, 'steps': 41272, 'loss/train': 1.3015625476837158} -11/07/2021 03:01:25 - INFO - __main__ - Step 41274: {'lr': 0.0004180449951869991, 'samples': 7924608, 'steps': 41273, 'loss/train': 1.3946226835250854} -11/07/2021 03:01:25 - INFO - __main__ - Step 41275: {'lr': 0.00041804106610044263, 'samples': 7924800, 'steps': 41274, 'loss/train': 1.509242296218872} -11/07/2021 03:01:26 - INFO - __main__ - Step 41276: {'lr': 0.00041803713693816947, 'samples': 7924992, 'steps': 41275, 'loss/train': 1.2228401899337769} -11/07/2021 03:01:26 - INFO - __main__ - Step 41277: {'lr': 0.0004180332077001814, 'samples': 7925184, 'steps': 41276, 'loss/train': 1.587908148765564} -11/07/2021 03:01:27 - INFO - __main__ - Step 41278: {'lr': 0.0004180292783864801, 'samples': 7925376, 'steps': 41277, 'loss/train': 1.5843009948730469} -11/07/2021 03:01:27 - INFO - __main__ - Step 41279: {'lr': 0.00041802534899706734, 'samples': 7925568, 'steps': 41278, 'loss/train': 1.3490830659866333} -11/07/2021 03:01:27 - INFO - __main__ - Step 41280: {'lr': 0.0004180214195319451, 'samples': 7925760, 'steps': 41279, 'loss/train': 1.0151638984680176} -11/07/2021 03:01:28 - INFO - __main__ - Step 41281: {'lr': 0.00041801748999111487, 'samples': 7925952, 'steps': 41280, 'loss/train': 2.370021343231201} -11/07/2021 03:01:29 - INFO - __main__ - Step 41282: {'lr': 0.0004180135603745786, 'samples': 7926144, 'steps': 41281, 'loss/train': 1.8114560842514038} -11/07/2021 03:01:29 - INFO - __main__ - Step 41283: {'lr': 0.000418009630682338, 'samples': 7926336, 'steps': 41282, 'loss/train': 1.4603055715560913} -11/07/2021 03:01:29 - INFO - __main__ - Step 41284: {'lr': 0.00041800570091439493, 'samples': 7926528, 'steps': 41283, 'loss/train': 1.5822771787643433} -11/07/2021 03:01:30 - INFO - __main__ - Step 41285: {'lr': 0.000418001771070751, 'samples': 7926720, 'steps': 41284, 'loss/train': 1.1700141429901123} -11/07/2021 03:01:31 - INFO - __main__ - Step 41286: {'lr': 0.0004179978411514081, 'samples': 7926912, 'steps': 41285, 'loss/train': 1.5586498975753784} -11/07/2021 03:01:31 - INFO - __main__ - Step 41287: {'lr': 0.000417993911156368, 'samples': 7927104, 'steps': 41286, 'loss/train': 1.3684496879577637} -11/07/2021 03:01:32 - INFO - __main__ - Step 41288: {'lr': 0.00041798998108563234, 'samples': 7927296, 'steps': 41287, 'loss/train': 1.536394476890564} -11/07/2021 03:01:32 - INFO - __main__ - Step 41289: {'lr': 0.00041798605093920307, 'samples': 7927488, 'steps': 41288, 'loss/train': 1.71012544631958} -11/07/2021 03:01:32 - INFO - __main__ - Step 41290: {'lr': 0.00041798212071708185, 'samples': 7927680, 'steps': 41289, 'loss/train': 1.1121327877044678} -11/07/2021 03:01:33 - INFO - __main__ - Step 41291: {'lr': 0.0004179781904192704, 'samples': 7927872, 'steps': 41290, 'loss/train': 1.5258047580718994} -11/07/2021 03:01:34 - INFO - __main__ - Step 41292: {'lr': 0.00041797426004577066, 'samples': 7928064, 'steps': 41291, 'loss/train': 1.2911633253097534} -11/07/2021 03:01:34 - INFO - __main__ - Step 41293: {'lr': 0.00041797032959658433, 'samples': 7928256, 'steps': 41292, 'loss/train': 1.5362772941589355} -11/07/2021 03:01:34 - INFO - __main__ - Step 41294: {'lr': 0.0004179663990717131, 'samples': 7928448, 'steps': 41293, 'loss/train': 1.5473556518554688} -11/07/2021 03:01:35 - INFO - __main__ - Step 41295: {'lr': 0.0004179624684711588, 'samples': 7928640, 'steps': 41294, 'loss/train': 1.390834093093872} -11/07/2021 03:01:35 - INFO - __main__ - Step 41296: {'lr': 0.0004179585377949232, 'samples': 7928832, 'steps': 41295, 'loss/train': 1.8194223642349243} -11/07/2021 03:01:36 - INFO - __main__ - Step 41297: {'lr': 0.0004179546070430082, 'samples': 7929024, 'steps': 41296, 'loss/train': 1.2560080289840698} -11/07/2021 03:01:37 - INFO - __main__ - Step 41298: {'lr': 0.0004179506762154153, 'samples': 7929216, 'steps': 41297, 'loss/train': 1.2087020874023438} -11/07/2021 03:01:37 - INFO - __main__ - Step 41299: {'lr': 0.0004179467453121465, 'samples': 7929408, 'steps': 41298, 'loss/train': 1.3658021688461304} -11/07/2021 03:01:37 - INFO - __main__ - Step 41300: {'lr': 0.0004179428143332035, 'samples': 7929600, 'steps': 41299, 'loss/train': 1.672145128250122} -11/07/2021 03:01:38 - INFO - __main__ - Step 41301: {'lr': 0.000417938883278588, 'samples': 7929792, 'steps': 41300, 'loss/train': 1.7102265357971191} -11/07/2021 03:01:39 - INFO - __main__ - Step 41302: {'lr': 0.0004179349521483018, 'samples': 7929984, 'steps': 41301, 'loss/train': 1.1674959659576416} -11/07/2021 03:01:39 - INFO - __main__ - Step 41303: {'lr': 0.00041793102094234673, 'samples': 7930176, 'steps': 41302, 'loss/train': 1.4597300291061401} -11/07/2021 03:01:39 - INFO - __main__ - Step 41304: {'lr': 0.00041792708966072455, 'samples': 7930368, 'steps': 41303, 'loss/train': 1.5141634941101074} -11/07/2021 03:01:40 - INFO - __main__ - Step 41305: {'lr': 0.0004179231583034371, 'samples': 7930560, 'steps': 41304, 'loss/train': 1.7141952514648438} -11/07/2021 03:01:40 - INFO - __main__ - Step 41306: {'lr': 0.0004179192268704859, 'samples': 7930752, 'steps': 41305, 'loss/train': 1.4723738431930542} -11/07/2021 03:01:41 - INFO - __main__ - Step 41307: {'lr': 0.000417915295361873, 'samples': 7930944, 'steps': 41306, 'loss/train': 1.3933378458023071} -11/07/2021 03:01:42 - INFO - __main__ - Step 41308: {'lr': 0.0004179113637776, 'samples': 7931136, 'steps': 41307, 'loss/train': 1.2595709562301636} -11/07/2021 03:01:42 - INFO - __main__ - Step 41309: {'lr': 0.0004179074321176688, 'samples': 7931328, 'steps': 41308, 'loss/train': 1.5110349655151367} -11/07/2021 03:01:42 - INFO - __main__ - Step 41310: {'lr': 0.000417903500382081, 'samples': 7931520, 'steps': 41309, 'loss/train': 1.3963290452957153} -11/07/2021 03:01:43 - INFO - __main__ - Step 41311: {'lr': 0.00041789956857083853, 'samples': 7931712, 'steps': 41310, 'loss/train': 1.7429158687591553} -11/07/2021 03:01:44 - INFO - __main__ - Step 41312: {'lr': 0.00041789563668394314, 'samples': 7931904, 'steps': 41311, 'loss/train': 1.4432523250579834} -11/07/2021 03:01:44 - INFO - __main__ - Step 41313: {'lr': 0.0004178917047213965, 'samples': 7932096, 'steps': 41312, 'loss/train': 1.3484480381011963} -11/07/2021 03:01:44 - INFO - __main__ - Step 41314: {'lr': 0.00041788777268320055, 'samples': 7932288, 'steps': 41313, 'loss/train': 1.684675693511963} -11/07/2021 03:01:45 - INFO - __main__ - Step 41315: {'lr': 0.00041788384056935693, 'samples': 7932480, 'steps': 41314, 'loss/train': 1.4484103918075562} -11/07/2021 03:01:45 - INFO - __main__ - Step 41316: {'lr': 0.0004178799083798673, 'samples': 7932672, 'steps': 41315, 'loss/train': 1.47584068775177} -11/07/2021 03:01:45 - INFO - __main__ - Step 41317: {'lr': 0.00041787597611473375, 'samples': 7932864, 'steps': 41316, 'loss/train': 1.2993026971817017} -11/07/2021 03:01:46 - INFO - __main__ - Step 41318: {'lr': 0.00041787204377395783, 'samples': 7933056, 'steps': 41317, 'loss/train': 1.1744214296340942} -11/07/2021 03:01:47 - INFO - __main__ - Step 41319: {'lr': 0.0004178681113575413, 'samples': 7933248, 'steps': 41318, 'loss/train': 1.6770493984222412} -11/07/2021 03:01:47 - INFO - __main__ - Step 41320: {'lr': 0.00041786417886548606, 'samples': 7933440, 'steps': 41319, 'loss/train': 1.511395812034607} -11/07/2021 03:01:48 - INFO - __main__ - Step 41321: {'lr': 0.0004178602462977937, 'samples': 7933632, 'steps': 41320, 'loss/train': 1.0146536827087402} -11/07/2021 03:01:48 - INFO - __main__ - Step 41322: {'lr': 0.0004178563136544662, 'samples': 7933824, 'steps': 41321, 'loss/train': 1.5325267314910889} -11/07/2021 03:01:49 - INFO - __main__ - Step 41323: {'lr': 0.0004178523809355053, 'samples': 7934016, 'steps': 41322, 'loss/train': 1.431384801864624} -11/07/2021 03:01:49 - INFO - __main__ - Step 41324: {'lr': 0.00041784844814091263, 'samples': 7934208, 'steps': 41323, 'loss/train': 1.2008589506149292} -11/07/2021 03:01:50 - INFO - __main__ - Step 41325: {'lr': 0.00041784451527069, 'samples': 7934400, 'steps': 41324, 'loss/train': 1.5073442459106445} -11/07/2021 03:01:50 - INFO - __main__ - Step 41326: {'lr': 0.0004178405823248392, 'samples': 7934592, 'steps': 41325, 'loss/train': 1.7020225524902344} -11/07/2021 03:01:50 - INFO - __main__ - Step 41327: {'lr': 0.0004178366493033621, 'samples': 7934784, 'steps': 41326, 'loss/train': 1.369020700454712} -11/07/2021 03:01:52 - INFO - __main__ - Step 41328: {'lr': 0.0004178327162062604, 'samples': 7934976, 'steps': 41327, 'loss/train': 0.5613696575164795} -11/07/2021 03:01:52 - INFO - __main__ - Step 41329: {'lr': 0.00041782878303353577, 'samples': 7935168, 'steps': 41328, 'loss/train': 1.6528732776641846} -11/07/2021 03:01:52 - INFO - __main__ - Step 41330: {'lr': 0.0004178248497851902, 'samples': 7935360, 'steps': 41329, 'loss/train': 1.4104169607162476} -11/07/2021 03:01:53 - INFO - __main__ - Step 41331: {'lr': 0.00041782091646122533, 'samples': 7935552, 'steps': 41330, 'loss/train': 1.3062204122543335} -11/07/2021 03:01:53 - INFO - __main__ - Step 41332: {'lr': 0.00041781698306164283, 'samples': 7935744, 'steps': 41331, 'loss/train': 1.29737389087677} -11/07/2021 03:01:54 - INFO - __main__ - Step 41333: {'lr': 0.0004178130495864447, 'samples': 7935936, 'steps': 41332, 'loss/train': 1.2845706939697266} -11/07/2021 03:01:55 - INFO - __main__ - Step 41334: {'lr': 0.00041780911603563254, 'samples': 7936128, 'steps': 41333, 'loss/train': 1.6035759449005127} -11/07/2021 03:01:55 - INFO - __main__ - Step 41335: {'lr': 0.00041780518240920817, 'samples': 7936320, 'steps': 41334, 'loss/train': 1.7680363655090332} -11/07/2021 03:01:55 - INFO - __main__ - Step 41336: {'lr': 0.0004178012487071734, 'samples': 7936512, 'steps': 41335, 'loss/train': 1.8347069025039673} -11/07/2021 03:01:56 - INFO - __main__ - Step 41337: {'lr': 0.00041779731492953, 'samples': 7936704, 'steps': 41336, 'loss/train': 1.4897397756576538} -11/07/2021 03:01:56 - INFO - __main__ - Step 41338: {'lr': 0.0004177933810762797, 'samples': 7936896, 'steps': 41337, 'loss/train': 1.3531194925308228} -11/07/2021 03:01:57 - INFO - __main__ - Step 41339: {'lr': 0.00041778944714742435, 'samples': 7937088, 'steps': 41338, 'loss/train': 1.9024698734283447} -11/07/2021 03:01:59 - INFO - __main__ - Step 41340: {'lr': 0.00041778551314296556, 'samples': 7937280, 'steps': 41339, 'loss/train': 1.5987845659255981} -11/07/2021 03:01:59 - INFO - __main__ - Step 41341: {'lr': 0.00041778157906290525, 'samples': 7937472, 'steps': 41340, 'loss/train': 1.0938655138015747} -11/07/2021 03:02:00 - INFO - __main__ - Step 41342: {'lr': 0.00041777764490724515, 'samples': 7937664, 'steps': 41341, 'loss/train': 1.311763048171997} -11/07/2021 03:02:00 - INFO - __main__ - Step 41343: {'lr': 0.00041777371067598705, 'samples': 7937856, 'steps': 41342, 'loss/train': 1.4340498447418213} -11/07/2021 03:02:00 - INFO - __main__ - Step 41344: {'lr': 0.00041776977636913274, 'samples': 7938048, 'steps': 41343, 'loss/train': 1.6654342412948608} -11/07/2021 03:02:01 - INFO - __main__ - Step 41345: {'lr': 0.0004177658419866839, 'samples': 7938240, 'steps': 41344, 'loss/train': 1.9490320682525635} -11/07/2021 03:02:01 - INFO - __main__ - Step 41346: {'lr': 0.0004177619075286424, 'samples': 7938432, 'steps': 41345, 'loss/train': 1.9665720462799072} -11/07/2021 03:02:01 - INFO - __main__ - Step 41347: {'lr': 0.00041775797299500997, 'samples': 7938624, 'steps': 41346, 'loss/train': 1.7433401346206665} -11/07/2021 03:02:02 - INFO - __main__ - Step 41348: {'lr': 0.0004177540383857883, 'samples': 7938816, 'steps': 41347, 'loss/train': 1.7861980199813843} -11/07/2021 03:02:03 - INFO - __main__ - Step 41349: {'lr': 0.0004177501037009793, 'samples': 7939008, 'steps': 41348, 'loss/train': 1.8376537561416626} -11/07/2021 03:02:03 - INFO - __main__ - Step 41350: {'lr': 0.0004177461689405847, 'samples': 7939200, 'steps': 41349, 'loss/train': 1.8534979820251465} -11/07/2021 03:02:03 - INFO - __main__ - Step 41351: {'lr': 0.00041774223410460633, 'samples': 7939392, 'steps': 41350, 'loss/train': 1.8638612031936646} -11/07/2021 03:02:04 - INFO - __main__ - Step 41352: {'lr': 0.00041773829919304584, 'samples': 7939584, 'steps': 41351, 'loss/train': 1.4559210538864136} -11/07/2021 03:02:05 - INFO - __main__ - Step 41353: {'lr': 0.000417734364205905, 'samples': 7939776, 'steps': 41352, 'loss/train': 1.5426164865493774} -11/07/2021 03:02:05 - INFO - __main__ - Step 41354: {'lr': 0.0004177304291431857, 'samples': 7939968, 'steps': 41353, 'loss/train': 0.13154828548431396} -11/07/2021 03:02:05 - INFO - __main__ - Step 41355: {'lr': 0.00041772649400488967, 'samples': 7940160, 'steps': 41354, 'loss/train': 1.3842164278030396} -11/07/2021 03:02:06 - INFO - __main__ - Step 41356: {'lr': 0.0004177225587910186, 'samples': 7940352, 'steps': 41355, 'loss/train': 1.2309932708740234} -11/07/2021 03:02:06 - INFO - __main__ - Step 41357: {'lr': 0.0004177186235015744, 'samples': 7940544, 'steps': 41356, 'loss/train': 1.4589163064956665} -11/07/2021 03:02:07 - INFO - __main__ - Step 41358: {'lr': 0.0004177146881365588, 'samples': 7940736, 'steps': 41357, 'loss/train': 1.6069822311401367} -11/07/2021 03:02:07 - INFO - __main__ - Step 41359: {'lr': 0.00041771075269597354, 'samples': 7940928, 'steps': 41358, 'loss/train': 0.9026435017585754} -11/07/2021 03:02:08 - INFO - __main__ - Step 41360: {'lr': 0.0004177068171798204, 'samples': 7941120, 'steps': 41359, 'loss/train': 1.3894383907318115} -11/07/2021 03:02:08 - INFO - __main__ - Step 41361: {'lr': 0.0004177028815881011, 'samples': 7941312, 'steps': 41360, 'loss/train': 1.4144057035446167} -11/07/2021 03:02:08 - INFO - __main__ - Step 41362: {'lr': 0.00041769894592081746, 'samples': 7941504, 'steps': 41361, 'loss/train': 1.4857261180877686} -11/07/2021 03:02:10 - INFO - __main__ - Step 41363: {'lr': 0.0004176950101779713, 'samples': 7941696, 'steps': 41362, 'loss/train': 1.717484474182129} -11/07/2021 03:02:10 - INFO - __main__ - Step 41364: {'lr': 0.00041769107435956444, 'samples': 7941888, 'steps': 41363, 'loss/train': 1.5446809530258179} -11/07/2021 03:02:10 - INFO - __main__ - Step 41365: {'lr': 0.00041768713846559844, 'samples': 7942080, 'steps': 41364, 'loss/train': 1.936703085899353} -11/07/2021 03:02:11 - INFO - __main__ - Step 41366: {'lr': 0.00041768320249607527, 'samples': 7942272, 'steps': 41365, 'loss/train': 0.5804887413978577} -11/07/2021 03:02:11 - INFO - __main__ - Step 41367: {'lr': 0.00041767926645099664, 'samples': 7942464, 'steps': 41366, 'loss/train': 1.1168676614761353} -11/07/2021 03:02:12 - INFO - __main__ - Step 41368: {'lr': 0.00041767533033036425, 'samples': 7942656, 'steps': 41367, 'loss/train': 1.2331725358963013} -11/07/2021 03:02:12 - INFO - __main__ - Step 41369: {'lr': 0.00041767139413418, 'samples': 7942848, 'steps': 41368, 'loss/train': 1.3584792613983154} -11/07/2021 03:02:13 - INFO - __main__ - Step 41370: {'lr': 0.00041766745786244564, 'samples': 7943040, 'steps': 41369, 'loss/train': 1.856892704963684} -11/07/2021 03:02:13 - INFO - __main__ - Step 41371: {'lr': 0.00041766352151516284, 'samples': 7943232, 'steps': 41370, 'loss/train': 1.2535980939865112} -11/07/2021 03:02:13 - INFO - __main__ - Step 41372: {'lr': 0.0004176595850923335, 'samples': 7943424, 'steps': 41371, 'loss/train': 1.2640399932861328} -11/07/2021 03:02:14 - INFO - __main__ - Step 41373: {'lr': 0.0004176556485939593, 'samples': 7943616, 'steps': 41372, 'loss/train': 1.373843789100647} -11/07/2021 03:02:15 - INFO - __main__ - Step 41374: {'lr': 0.00041765171202004205, 'samples': 7943808, 'steps': 41373, 'loss/train': 1.3820745944976807} -11/07/2021 03:02:15 - INFO - __main__ - Step 41375: {'lr': 0.00041764777537058354, 'samples': 7944000, 'steps': 41374, 'loss/train': 1.7117164134979248} -11/07/2021 03:02:16 - INFO - __main__ - Step 41376: {'lr': 0.0004176438386455855, 'samples': 7944192, 'steps': 41375, 'loss/train': 0.868809163570404} -11/07/2021 03:02:16 - INFO - __main__ - Step 41377: {'lr': 0.00041763990184504984, 'samples': 7944384, 'steps': 41376, 'loss/train': 1.7543200254440308} -11/07/2021 03:02:16 - INFO - __main__ - Step 41378: {'lr': 0.00041763596496897817, 'samples': 7944576, 'steps': 41377, 'loss/train': 1.489722728729248} -11/07/2021 03:02:17 - INFO - __main__ - Step 41379: {'lr': 0.00041763202801737225, 'samples': 7944768, 'steps': 41378, 'loss/train': 1.531445860862732} -11/07/2021 03:02:18 - INFO - __main__ - Step 41380: {'lr': 0.00041762809099023403, 'samples': 7944960, 'steps': 41379, 'loss/train': 1.4082839488983154} -11/07/2021 03:02:18 - INFO - __main__ - Step 41381: {'lr': 0.00041762415388756514, 'samples': 7945152, 'steps': 41380, 'loss/train': 1.53441321849823} -11/07/2021 03:02:18 - INFO - __main__ - Step 41382: {'lr': 0.00041762021670936736, 'samples': 7945344, 'steps': 41381, 'loss/train': 1.8188769817352295} -11/07/2021 03:02:19 - INFO - __main__ - Step 41383: {'lr': 0.0004176162794556425, 'samples': 7945536, 'steps': 41382, 'loss/train': 1.631960391998291} -11/07/2021 03:02:20 - INFO - __main__ - Step 41384: {'lr': 0.0004176123421263923, 'samples': 7945728, 'steps': 41383, 'loss/train': 1.130538821220398} -11/07/2021 03:02:20 - INFO - __main__ - Step 41385: {'lr': 0.00041760840472161866, 'samples': 7945920, 'steps': 41384, 'loss/train': 1.5905122756958008} -11/07/2021 03:02:20 - INFO - __main__ - Step 41386: {'lr': 0.0004176044672413232, 'samples': 7946112, 'steps': 41385, 'loss/train': 1.7300176620483398} -11/07/2021 03:02:21 - INFO - __main__ - Step 41387: {'lr': 0.00041760052968550776, 'samples': 7946304, 'steps': 41386, 'loss/train': 1.1613948345184326} -11/07/2021 03:02:21 - INFO - __main__ - Step 41388: {'lr': 0.0004175965920541741, 'samples': 7946496, 'steps': 41387, 'loss/train': 1.0157157182693481} -11/07/2021 03:02:22 - INFO - __main__ - Step 41389: {'lr': 0.00041759265434732404, 'samples': 7946688, 'steps': 41388, 'loss/train': 0.9334609508514404} -11/07/2021 03:02:22 - INFO - __main__ - Step 41390: {'lr': 0.00041758871656495927, 'samples': 7946880, 'steps': 41389, 'loss/train': 0.7453952431678772} -11/07/2021 03:02:23 - INFO - __main__ - Step 41391: {'lr': 0.00041758477870708165, 'samples': 7947072, 'steps': 41390, 'loss/train': 1.6157008409500122} -11/07/2021 03:02:23 - INFO - __main__ - Step 41392: {'lr': 0.0004175808407736929, 'samples': 7947264, 'steps': 41391, 'loss/train': 0.9999271035194397} -11/07/2021 03:02:23 - INFO - __main__ - Step 41393: {'lr': 0.00041757690276479474, 'samples': 7947456, 'steps': 41392, 'loss/train': 1.3824840784072876} -11/07/2021 03:02:25 - INFO - __main__ - Step 41394: {'lr': 0.0004175729646803891, 'samples': 7947648, 'steps': 41393, 'loss/train': 1.6060587167739868} -11/07/2021 03:02:25 - INFO - __main__ - Step 41395: {'lr': 0.00041756902652047767, 'samples': 7947840, 'steps': 41394, 'loss/train': 1.4517266750335693} -11/07/2021 03:02:25 - INFO - __main__ - Step 41396: {'lr': 0.0004175650882850622, 'samples': 7948032, 'steps': 41395, 'loss/train': 0.9659159183502197} -11/07/2021 03:02:26 - INFO - __main__ - Step 41397: {'lr': 0.0004175611499741445, 'samples': 7948224, 'steps': 41396, 'loss/train': 1.5996308326721191} -11/07/2021 03:02:26 - INFO - __main__ - Step 41398: {'lr': 0.00041755721158772633, 'samples': 7948416, 'steps': 41397, 'loss/train': 0.12279503047466278} -11/07/2021 03:02:27 - INFO - __main__ - Step 41399: {'lr': 0.00041755327312580944, 'samples': 7948608, 'steps': 41398, 'loss/train': 1.602047324180603} -11/07/2021 03:02:27 - INFO - __main__ - Step 41400: {'lr': 0.0004175493345883956, 'samples': 7948800, 'steps': 41399, 'loss/train': 1.2394378185272217} -11/07/2021 03:02:28 - INFO - __main__ - Step 41401: {'lr': 0.0004175453959754867, 'samples': 7948992, 'steps': 41400, 'loss/train': 1.2604111433029175} -11/07/2021 03:02:28 - INFO - __main__ - Step 41402: {'lr': 0.00041754145728708434, 'samples': 7949184, 'steps': 41401, 'loss/train': 1.337045669555664} -11/07/2021 03:02:28 - INFO - __main__ - Step 41403: {'lr': 0.0004175375185231904, 'samples': 7949376, 'steps': 41402, 'loss/train': 1.2870851755142212} -11/07/2021 03:02:29 - INFO - __main__ - Step 41404: {'lr': 0.00041753357968380675, 'samples': 7949568, 'steps': 41403, 'loss/train': 1.5985771417617798} -11/07/2021 03:02:30 - INFO - __main__ - Step 41405: {'lr': 0.00041752964076893496, 'samples': 7949760, 'steps': 41404, 'loss/train': 1.6936683654785156} -11/07/2021 03:02:30 - INFO - __main__ - Step 41406: {'lr': 0.00041752570177857695, 'samples': 7949952, 'steps': 41405, 'loss/train': 1.5201998949050903} -11/07/2021 03:02:30 - INFO - __main__ - Step 41407: {'lr': 0.0004175217627127344, 'samples': 7950144, 'steps': 41406, 'loss/train': 1.4150969982147217} -11/07/2021 03:02:31 - INFO - __main__ - Step 41408: {'lr': 0.0004175178235714091, 'samples': 7950336, 'steps': 41407, 'loss/train': 1.580664038658142} -11/07/2021 03:02:31 - INFO - __main__ - Step 41409: {'lr': 0.0004175138843546029, 'samples': 7950528, 'steps': 41408, 'loss/train': 1.626002550125122} -11/07/2021 03:02:32 - INFO - __main__ - Step 41410: {'lr': 0.00041750994506231756, 'samples': 7950720, 'steps': 41409, 'loss/train': 0.6695911884307861} -11/07/2021 03:02:32 - INFO - __main__ - Step 41411: {'lr': 0.00041750600569455474, 'samples': 7950912, 'steps': 41410, 'loss/train': 1.4357165098190308} -11/07/2021 03:02:33 - INFO - __main__ - Step 41412: {'lr': 0.0004175020662513164, 'samples': 7951104, 'steps': 41411, 'loss/train': 1.796668291091919} -11/07/2021 03:02:33 - INFO - __main__ - Step 41413: {'lr': 0.0004174981267326041, 'samples': 7951296, 'steps': 41412, 'loss/train': 1.517921805381775} -11/07/2021 03:02:34 - INFO - __main__ - Step 41414: {'lr': 0.0004174941871384198, 'samples': 7951488, 'steps': 41413, 'loss/train': 0.9669694304466248} -11/07/2021 03:02:35 - INFO - __main__ - Step 41415: {'lr': 0.00041749024746876517, 'samples': 7951680, 'steps': 41414, 'loss/train': 1.9053404331207275} -11/07/2021 03:02:35 - INFO - __main__ - Step 41416: {'lr': 0.00041748630772364204, 'samples': 7951872, 'steps': 41415, 'loss/train': 1.4301363229751587} -11/07/2021 03:02:35 - INFO - __main__ - Step 41417: {'lr': 0.00041748236790305215, 'samples': 7952064, 'steps': 41416, 'loss/train': 1.349250078201294} -11/07/2021 03:02:36 - INFO - __main__ - Step 41418: {'lr': 0.0004174784280069973, 'samples': 7952256, 'steps': 41417, 'loss/train': 1.444665551185608} -11/07/2021 03:02:36 - INFO - __main__ - Step 41419: {'lr': 0.00041747448803547925, 'samples': 7952448, 'steps': 41418, 'loss/train': 1.7027661800384521} -11/07/2021 03:02:37 - INFO - __main__ - Step 41420: {'lr': 0.0004174705479884998, 'samples': 7952640, 'steps': 41419, 'loss/train': 0.8072425723075867} -11/07/2021 03:02:37 - INFO - __main__ - Step 41421: {'lr': 0.0004174666078660607, 'samples': 7952832, 'steps': 41420, 'loss/train': 1.1555086374282837} -11/07/2021 03:02:38 - INFO - __main__ - Step 41422: {'lr': 0.00041746266766816377, 'samples': 7953024, 'steps': 41421, 'loss/train': 1.1109774112701416} -11/07/2021 03:02:38 - INFO - __main__ - Step 41423: {'lr': 0.0004174587273948106, 'samples': 7953216, 'steps': 41422, 'loss/train': 1.418365716934204} -11/07/2021 03:02:38 - INFO - __main__ - Step 41424: {'lr': 0.0004174547870460033, 'samples': 7953408, 'steps': 41423, 'loss/train': 1.2630163431167603} -11/07/2021 03:02:39 - INFO - __main__ - Step 41425: {'lr': 0.0004174508466217434, 'samples': 7953600, 'steps': 41424, 'loss/train': 1.473492980003357} -11/07/2021 03:02:40 - INFO - __main__ - Step 41426: {'lr': 0.00041744690612203263, 'samples': 7953792, 'steps': 41425, 'loss/train': 1.6726351976394653} -11/07/2021 03:02:40 - INFO - __main__ - Step 41427: {'lr': 0.00041744296554687294, 'samples': 7953984, 'steps': 41426, 'loss/train': 1.9256874322891235} -11/07/2021 03:02:41 - INFO - __main__ - Step 41428: {'lr': 0.00041743902489626606, 'samples': 7954176, 'steps': 41427, 'loss/train': 1.5032762289047241} -11/07/2021 03:02:41 - INFO - __main__ - Step 41429: {'lr': 0.0004174350841702137, 'samples': 7954368, 'steps': 41428, 'loss/train': 1.2201040983200073} -11/07/2021 03:02:41 - INFO - __main__ - Step 41430: {'lr': 0.0004174311433687177, 'samples': 7954560, 'steps': 41429, 'loss/train': 1.4208319187164307} -11/07/2021 03:02:42 - INFO - __main__ - Step 41431: {'lr': 0.00041742720249177975, 'samples': 7954752, 'steps': 41430, 'loss/train': 1.0522828102111816} -11/07/2021 03:02:43 - INFO - __main__ - Step 41432: {'lr': 0.0004174232615394018, 'samples': 7954944, 'steps': 41431, 'loss/train': 1.4779268503189087} -11/07/2021 03:02:43 - INFO - __main__ - Step 41433: {'lr': 0.00041741932051158535, 'samples': 7955136, 'steps': 41432, 'loss/train': 1.259121060371399} -11/07/2021 03:02:43 - INFO - __main__ - Step 41434: {'lr': 0.00041741537940833247, 'samples': 7955328, 'steps': 41433, 'loss/train': 1.3860517740249634} -11/07/2021 03:02:44 - INFO - __main__ - Step 41435: {'lr': 0.00041741143822964476, 'samples': 7955520, 'steps': 41434, 'loss/train': 1.6901785135269165} -11/07/2021 03:02:45 - INFO - __main__ - Step 41436: {'lr': 0.00041740749697552406, 'samples': 7955712, 'steps': 41435, 'loss/train': 1.1720250844955444} -11/07/2021 03:02:45 - INFO - __main__ - Step 41437: {'lr': 0.0004174035556459721, 'samples': 7955904, 'steps': 41436, 'loss/train': 0.42491212487220764} -11/07/2021 03:02:45 - INFO - __main__ - Step 41438: {'lr': 0.0004173996142409907, 'samples': 7956096, 'steps': 41437, 'loss/train': 1.5557392835617065} -11/07/2021 03:02:46 - INFO - __main__ - Step 41439: {'lr': 0.0004173956727605816, 'samples': 7956288, 'steps': 41438, 'loss/train': 1.436159610748291} -11/07/2021 03:02:46 - INFO - __main__ - Step 41440: {'lr': 0.00041739173120474663, 'samples': 7956480, 'steps': 41439, 'loss/train': 1.266028642654419} -11/07/2021 03:02:47 - INFO - __main__ - Step 41441: {'lr': 0.00041738778957348745, 'samples': 7956672, 'steps': 41440, 'loss/train': 1.7526899576187134} -11/07/2021 03:02:48 - INFO - __main__ - Step 41442: {'lr': 0.00041738384786680596, 'samples': 7956864, 'steps': 41441, 'loss/train': 1.5865671634674072} -11/07/2021 03:02:48 - INFO - __main__ - Step 41443: {'lr': 0.0004173799060847039, 'samples': 7957056, 'steps': 41442, 'loss/train': 1.5946766138076782} -11/07/2021 03:02:48 - INFO - __main__ - Step 41444: {'lr': 0.00041737596422718306, 'samples': 7957248, 'steps': 41443, 'loss/train': 1.0524725914001465} -11/07/2021 03:02:49 - INFO - __main__ - Step 41445: {'lr': 0.0004173720222942452, 'samples': 7957440, 'steps': 41444, 'loss/train': 1.2988440990447998} -11/07/2021 03:02:50 - INFO - __main__ - Step 41446: {'lr': 0.000417368080285892, 'samples': 7957632, 'steps': 41445, 'loss/train': 1.635378360748291} -11/07/2021 03:02:50 - INFO - __main__ - Step 41447: {'lr': 0.0004173641382021254, 'samples': 7957824, 'steps': 41446, 'loss/train': 1.5069023370742798} -11/07/2021 03:02:50 - INFO - __main__ - Step 41448: {'lr': 0.00041736019604294704, 'samples': 7958016, 'steps': 41447, 'loss/train': 1.1068689823150635} -11/07/2021 03:02:51 - INFO - __main__ - Step 41449: {'lr': 0.00041735625380835884, 'samples': 7958208, 'steps': 41448, 'loss/train': 1.2277780771255493} -11/07/2021 03:02:51 - INFO - __main__ - Step 41450: {'lr': 0.0004173523114983624, 'samples': 7958400, 'steps': 41449, 'loss/train': 1.8505853414535522} -11/07/2021 03:02:51 - INFO - __main__ - Step 41451: {'lr': 0.0004173483691129597, 'samples': 7958592, 'steps': 41450, 'loss/train': 0.6934025883674622} -11/07/2021 03:02:52 - INFO - __main__ - Step 41452: {'lr': 0.00041734442665215235, 'samples': 7958784, 'steps': 41451, 'loss/train': 1.4254666566848755} -11/07/2021 03:02:53 - INFO - __main__ - Step 41453: {'lr': 0.00041734048411594214, 'samples': 7958976, 'steps': 41452, 'loss/train': 1.5704346895217896} -11/07/2021 03:02:53 - INFO - __main__ - Step 41454: {'lr': 0.000417336541504331, 'samples': 7959168, 'steps': 41453, 'loss/train': 1.513946533203125} -11/07/2021 03:02:54 - INFO - __main__ - Step 41455: {'lr': 0.0004173325988173205, 'samples': 7959360, 'steps': 41454, 'loss/train': 1.9185298681259155} -11/07/2021 03:02:54 - INFO - __main__ - Step 41456: {'lr': 0.00041732865605491256, 'samples': 7959552, 'steps': 41455, 'loss/train': 1.6555119752883911} -11/07/2021 03:02:55 - INFO - __main__ - Step 41457: {'lr': 0.00041732471321710886, 'samples': 7959744, 'steps': 41456, 'loss/train': 1.1334835290908813} -11/07/2021 03:02:55 - INFO - __main__ - Step 41458: {'lr': 0.00041732077030391126, 'samples': 7959936, 'steps': 41457, 'loss/train': 1.4219813346862793} -11/07/2021 03:02:56 - INFO - __main__ - Step 41459: {'lr': 0.00041731682731532154, 'samples': 7960128, 'steps': 41458, 'loss/train': 1.6092408895492554} -11/07/2021 03:02:56 - INFO - __main__ - Step 41460: {'lr': 0.0004173128842513414, 'samples': 7960320, 'steps': 41459, 'loss/train': 1.670626163482666} -11/07/2021 03:02:56 - INFO - __main__ - Step 41461: {'lr': 0.00041730894111197266, 'samples': 7960512, 'steps': 41460, 'loss/train': 1.2933282852172852} -11/07/2021 03:02:57 - INFO - __main__ - Step 41462: {'lr': 0.0004173049978972171, 'samples': 7960704, 'steps': 41461, 'loss/train': 1.370222568511963} -11/07/2021 03:02:58 - INFO - __main__ - Step 41463: {'lr': 0.0004173010546070765, 'samples': 7960896, 'steps': 41462, 'loss/train': 1.1095010042190552} -11/07/2021 03:02:58 - INFO - __main__ - Step 41464: {'lr': 0.00041729711124155255, 'samples': 7961088, 'steps': 41463, 'loss/train': 1.4668735265731812} -11/07/2021 03:02:58 - INFO - __main__ - Step 41465: {'lr': 0.0004172931678006472, 'samples': 7961280, 'steps': 41464, 'loss/train': 1.5170831680297852} -11/07/2021 03:02:59 - INFO - __main__ - Step 41466: {'lr': 0.00041728922428436213, 'samples': 7961472, 'steps': 41465, 'loss/train': 1.5716190338134766} -11/07/2021 03:03:00 - INFO - __main__ - Step 41467: {'lr': 0.000417285280692699, 'samples': 7961664, 'steps': 41466, 'loss/train': 1.6805745363235474} -11/07/2021 03:03:00 - INFO - __main__ - Step 41468: {'lr': 0.00041728133702565985, 'samples': 7961856, 'steps': 41467, 'loss/train': 1.1384950876235962} -11/07/2021 03:03:01 - INFO - __main__ - Step 41469: {'lr': 0.0004172773932832462, 'samples': 7962048, 'steps': 41468, 'loss/train': 1.230355978012085} -11/07/2021 03:03:01 - INFO - __main__ - Step 41470: {'lr': 0.00041727344946546, 'samples': 7962240, 'steps': 41469, 'loss/train': 1.650503396987915} -11/07/2021 03:03:02 - INFO - __main__ - Step 41471: {'lr': 0.00041726950557230294, 'samples': 7962432, 'steps': 41470, 'loss/train': 1.2427712678909302} -11/07/2021 03:03:02 - INFO - __main__ - Step 41472: {'lr': 0.0004172655616037768, 'samples': 7962624, 'steps': 41471, 'loss/train': 1.4126157760620117} -11/07/2021 03:03:02 - INFO - __main__ - Step 41473: {'lr': 0.0004172616175598835, 'samples': 7962816, 'steps': 41472, 'loss/train': 1.6682500839233398} -11/07/2021 03:03:03 - INFO - __main__ - Step 41474: {'lr': 0.00041725767344062453, 'samples': 7963008, 'steps': 41473, 'loss/train': 1.1578184366226196} -11/07/2021 03:03:04 - INFO - __main__ - Step 41475: {'lr': 0.00041725372924600193, 'samples': 7963200, 'steps': 41474, 'loss/train': 1.4274133443832397} -11/07/2021 03:03:04 - INFO - __main__ - Step 41476: {'lr': 0.00041724978497601736, 'samples': 7963392, 'steps': 41475, 'loss/train': 1.463484287261963} -11/07/2021 03:03:04 - INFO - __main__ - Step 41477: {'lr': 0.0004172458406306726, 'samples': 7963584, 'steps': 41476, 'loss/train': 1.0533301830291748} -11/07/2021 03:03:05 - INFO - __main__ - Step 41478: {'lr': 0.00041724189620996946, 'samples': 7963776, 'steps': 41477, 'loss/train': 1.0579352378845215} -11/07/2021 03:03:06 - INFO - __main__ - Step 41479: {'lr': 0.0004172379517139097, 'samples': 7963968, 'steps': 41478, 'loss/train': 1.7435880899429321} -11/07/2021 03:03:06 - INFO - __main__ - Step 41480: {'lr': 0.0004172340071424951, 'samples': 7964160, 'steps': 41479, 'loss/train': 1.8347982168197632} -11/07/2021 03:03:07 - INFO - __main__ - Step 41481: {'lr': 0.00041723006249572744, 'samples': 7964352, 'steps': 41480, 'loss/train': 1.4495962858200073} -11/07/2021 03:03:07 - INFO - __main__ - Step 41482: {'lr': 0.00041722611777360844, 'samples': 7964544, 'steps': 41481, 'loss/train': 1.658594012260437} -11/07/2021 03:03:07 - INFO - __main__ - Step 41483: {'lr': 0.00041722217297614, 'samples': 7964736, 'steps': 41482, 'loss/train': 1.278537631034851} -11/07/2021 03:03:09 - INFO - __main__ - Step 41484: {'lr': 0.00041721822810332384, 'samples': 7964928, 'steps': 41483, 'loss/train': 1.0990140438079834} -11/07/2021 03:03:09 - INFO - __main__ - Step 41485: {'lr': 0.00041721428315516176, 'samples': 7965120, 'steps': 41484, 'loss/train': 1.4794907569885254} -11/07/2021 03:03:09 - INFO - __main__ - Step 41486: {'lr': 0.00041721033813165543, 'samples': 7965312, 'steps': 41485, 'loss/train': 1.702915906906128} -11/07/2021 03:03:10 - INFO - __main__ - Step 41487: {'lr': 0.0004172063930328067, 'samples': 7965504, 'steps': 41486, 'loss/train': 1.5428369045257568} -11/07/2021 03:03:10 - INFO - __main__ - Step 41488: {'lr': 0.00041720244785861736, 'samples': 7965696, 'steps': 41487, 'loss/train': 1.109743356704712} -11/07/2021 03:03:12 - INFO - __main__ - Step 41489: {'lr': 0.0004171985026090892, 'samples': 7965888, 'steps': 41488, 'loss/train': 1.1824779510498047} -11/07/2021 03:03:12 - INFO - __main__ - Step 41490: {'lr': 0.00041719455728422394, 'samples': 7966080, 'steps': 41489, 'loss/train': 1.8389651775360107} -11/07/2021 03:03:12 - INFO - __main__ - Step 41491: {'lr': 0.0004171906118840234, 'samples': 7966272, 'steps': 41490, 'loss/train': 1.796555519104004} -11/07/2021 03:03:13 - INFO - __main__ - Step 41492: {'lr': 0.00041718666640848937, 'samples': 7966464, 'steps': 41491, 'loss/train': 1.8231583833694458} -11/07/2021 03:03:13 - INFO - __main__ - Step 41493: {'lr': 0.0004171827208576236, 'samples': 7966656, 'steps': 41492, 'loss/train': 1.3844928741455078} -11/07/2021 03:03:14 - INFO - __main__ - Step 41494: {'lr': 0.00041717877523142786, 'samples': 7966848, 'steps': 41493, 'loss/train': 1.3137469291687012} -11/07/2021 03:03:14 - INFO - __main__ - Step 41495: {'lr': 0.00041717482952990394, 'samples': 7967040, 'steps': 41494, 'loss/train': 1.6464651823043823} -11/07/2021 03:03:15 - INFO - __main__ - Step 41496: {'lr': 0.00041717088375305367, 'samples': 7967232, 'steps': 41495, 'loss/train': 0.9370419979095459} -11/07/2021 03:03:15 - INFO - __main__ - Step 41497: {'lr': 0.0004171669379008787, 'samples': 7967424, 'steps': 41496, 'loss/train': 1.5788377523422241} -11/07/2021 03:03:16 - INFO - __main__ - Step 41498: {'lr': 0.00041716299197338093, 'samples': 7967616, 'steps': 41497, 'loss/train': 1.5179771184921265} -11/07/2021 03:03:16 - INFO - __main__ - Step 41499: {'lr': 0.0004171590459705622, 'samples': 7967808, 'steps': 41498, 'loss/train': 1.1437050104141235} -11/07/2021 03:03:16 - INFO - __main__ - Step 41500: {'lr': 0.0004171550998924241, 'samples': 7968000, 'steps': 41499, 'loss/train': 1.9808309078216553} -11/07/2021 03:03:17 - INFO - __main__ - Step 41501: {'lr': 0.0004171511537389684, 'samples': 7968192, 'steps': 41500, 'loss/train': 1.4925646781921387} -11/07/2021 03:03:18 - INFO - __main__ - Step 41502: {'lr': 0.0004171472075101971, 'samples': 7968384, 'steps': 41501, 'loss/train': 1.3484253883361816} -11/07/2021 03:03:18 - INFO - __main__ - Step 41503: {'lr': 0.0004171432612061117, 'samples': 7968576, 'steps': 41502, 'loss/train': 1.1927528381347656} -11/07/2021 03:03:18 - INFO - __main__ - Step 41504: {'lr': 0.00041713931482671425, 'samples': 7968768, 'steps': 41503, 'loss/train': 1.7438743114471436} -11/07/2021 03:03:19 - INFO - __main__ - Step 41505: {'lr': 0.0004171353683720064, 'samples': 7968960, 'steps': 41504, 'loss/train': 1.5354259014129639} -11/07/2021 03:03:20 - INFO - __main__ - Step 41506: {'lr': 0.00041713142184198994, 'samples': 7969152, 'steps': 41505, 'loss/train': 0.9600526690483093} -11/07/2021 03:03:20 - INFO - __main__ - Step 41507: {'lr': 0.0004171274752366665, 'samples': 7969344, 'steps': 41506, 'loss/train': 1.7088255882263184} -11/07/2021 03:03:20 - INFO - __main__ - Step 41508: {'lr': 0.00041712352855603817, 'samples': 7969536, 'steps': 41507, 'loss/train': 0.9700304269790649} -11/07/2021 03:03:21 - INFO - __main__ - Step 41509: {'lr': 0.00041711958180010644, 'samples': 7969728, 'steps': 41508, 'loss/train': 1.4612095355987549} -11/07/2021 03:03:21 - INFO - __main__ - Step 41510: {'lr': 0.0004171156349688733, 'samples': 7969920, 'steps': 41509, 'loss/train': 1.733356237411499} -11/07/2021 03:03:22 - INFO - __main__ - Step 41511: {'lr': 0.0004171116880623404, 'samples': 7970112, 'steps': 41510, 'loss/train': 0.9728167057037354} -11/07/2021 03:03:23 - INFO - __main__ - Step 41512: {'lr': 0.0004171077410805095, 'samples': 7970304, 'steps': 41511, 'loss/train': 2.3415327072143555} -11/07/2021 03:03:23 - INFO - __main__ - Step 41513: {'lr': 0.0004171037940233825, 'samples': 7970496, 'steps': 41512, 'loss/train': 1.5685441493988037} -11/07/2021 03:03:23 - INFO - __main__ - Step 41514: {'lr': 0.0004170998468909611, 'samples': 7970688, 'steps': 41513, 'loss/train': 0.9442493915557861} -11/07/2021 03:03:24 - INFO - __main__ - Step 41515: {'lr': 0.00041709589968324704, 'samples': 7970880, 'steps': 41514, 'loss/train': 1.246776819229126} -11/07/2021 03:03:24 - INFO - __main__ - Step 41516: {'lr': 0.00041709195240024224, 'samples': 7971072, 'steps': 41515, 'loss/train': 1.509366750717163} -11/07/2021 03:03:25 - INFO - __main__ - Step 41517: {'lr': 0.0004170880050419483, 'samples': 7971264, 'steps': 41516, 'loss/train': 1.6185767650604248} -11/07/2021 03:03:25 - INFO - __main__ - Step 41518: {'lr': 0.0004170840576083671, 'samples': 7971456, 'steps': 41517, 'loss/train': 1.701627254486084} -11/07/2021 03:03:26 - INFO - __main__ - Step 41519: {'lr': 0.00041708011009950044, 'samples': 7971648, 'steps': 41518, 'loss/train': 1.5624347925186157} -11/07/2021 03:03:26 - INFO - __main__ - Step 41520: {'lr': 0.00041707616251535, 'samples': 7971840, 'steps': 41519, 'loss/train': 1.5904089212417603} -11/07/2021 03:03:26 - INFO - __main__ - Step 41521: {'lr': 0.0004170722148559176, 'samples': 7972032, 'steps': 41520, 'loss/train': 1.464963674545288} -11/07/2021 03:03:28 - INFO - __main__ - Step 41522: {'lr': 0.0004170682671212051, 'samples': 7972224, 'steps': 41521, 'loss/train': 1.7140016555786133} -11/07/2021 03:03:28 - INFO - __main__ - Step 41523: {'lr': 0.00041706431931121416, 'samples': 7972416, 'steps': 41522, 'loss/train': 1.342008113861084} -11/07/2021 03:03:28 - INFO - __main__ - Step 41524: {'lr': 0.00041706037142594666, 'samples': 7972608, 'steps': 41523, 'loss/train': 1.2205827236175537} -11/07/2021 03:03:29 - INFO - __main__ - Step 41525: {'lr': 0.00041705642346540436, 'samples': 7972800, 'steps': 41524, 'loss/train': 1.8854976892471313} -11/07/2021 03:03:29 - INFO - __main__ - Step 41526: {'lr': 0.00041705247542958904, 'samples': 7972992, 'steps': 41525, 'loss/train': 1.6413252353668213} -11/07/2021 03:03:30 - INFO - __main__ - Step 41527: {'lr': 0.00041704852731850234, 'samples': 7973184, 'steps': 41526, 'loss/train': 1.44478440284729} -11/07/2021 03:03:30 - INFO - __main__ - Step 41528: {'lr': 0.0004170445791321462, 'samples': 7973376, 'steps': 41527, 'loss/train': 1.8444479703903198} -11/07/2021 03:03:31 - INFO - __main__ - Step 41529: {'lr': 0.00041704063087052236, 'samples': 7973568, 'steps': 41528, 'loss/train': 0.33136051893234253} -11/07/2021 03:03:31 - INFO - __main__ - Step 41530: {'lr': 0.0004170366825336326, 'samples': 7973760, 'steps': 41529, 'loss/train': 1.6385127305984497} -11/07/2021 03:03:31 - INFO - __main__ - Step 41531: {'lr': 0.0004170327341214787, 'samples': 7973952, 'steps': 41530, 'loss/train': 1.5817596912384033} -11/07/2021 03:03:33 - INFO - __main__ - Step 41532: {'lr': 0.00041702878563406237, 'samples': 7974144, 'steps': 41531, 'loss/train': 1.5311561822891235} -11/07/2021 03:03:33 - INFO - __main__ - Step 41533: {'lr': 0.0004170248370713855, 'samples': 7974336, 'steps': 41532, 'loss/train': 1.442463994026184} -11/07/2021 03:03:34 - INFO - __main__ - Step 41534: {'lr': 0.0004170208884334498, 'samples': 7974528, 'steps': 41533, 'loss/train': 1.0978189706802368} -11/07/2021 03:03:34 - INFO - __main__ - Step 41535: {'lr': 0.000417016939720257, 'samples': 7974720, 'steps': 41534, 'loss/train': 1.4123374223709106} -11/07/2021 03:03:34 - INFO - __main__ - Step 41536: {'lr': 0.000417012990931809, 'samples': 7974912, 'steps': 41535, 'loss/train': 0.7976887822151184} -11/07/2021 03:03:35 - INFO - __main__ - Step 41537: {'lr': 0.00041700904206810755, 'samples': 7975104, 'steps': 41536, 'loss/train': 1.848340392112732} -11/07/2021 03:03:36 - INFO - __main__ - Step 41538: {'lr': 0.00041700509312915437, 'samples': 7975296, 'steps': 41537, 'loss/train': 1.4981316328048706} -11/07/2021 03:03:36 - INFO - __main__ - Step 41539: {'lr': 0.0004170011441149513, 'samples': 7975488, 'steps': 41538, 'loss/train': 0.8363898396492004} -11/07/2021 03:03:36 - INFO - __main__ - Step 41540: {'lr': 0.0004169971950255001, 'samples': 7975680, 'steps': 41539, 'loss/train': 1.6645216941833496} -11/07/2021 03:03:37 - INFO - __main__ - Step 41541: {'lr': 0.0004169932458608025, 'samples': 7975872, 'steps': 41540, 'loss/train': 1.6828755140304565} -11/07/2021 03:03:37 - INFO - __main__ - Step 41542: {'lr': 0.00041698929662086035, 'samples': 7976064, 'steps': 41541, 'loss/train': 1.5580079555511475} -11/07/2021 03:03:38 - INFO - __main__ - Step 41543: {'lr': 0.0004169853473056754, 'samples': 7976256, 'steps': 41542, 'loss/train': 1.5427733659744263} -11/07/2021 03:03:38 - INFO - __main__ - Step 41544: {'lr': 0.0004169813979152494, 'samples': 7976448, 'steps': 41543, 'loss/train': 1.0188912153244019} -11/07/2021 03:03:39 - INFO - __main__ - Step 41545: {'lr': 0.0004169774484495841, 'samples': 7976640, 'steps': 41544, 'loss/train': 1.597219467163086} -11/07/2021 03:03:39 - INFO - __main__ - Step 41546: {'lr': 0.00041697349890868146, 'samples': 7976832, 'steps': 41545, 'loss/train': 1.5436819791793823} -11/07/2021 03:03:39 - INFO - __main__ - Step 41547: {'lr': 0.0004169695492925431, 'samples': 7977024, 'steps': 41546, 'loss/train': 1.716619610786438} -11/07/2021 03:03:41 - INFO - __main__ - Step 41548: {'lr': 0.0004169655996011708, 'samples': 7977216, 'steps': 41547, 'loss/train': 1.5983400344848633} -11/07/2021 03:03:41 - INFO - __main__ - Step 41549: {'lr': 0.0004169616498345664, 'samples': 7977408, 'steps': 41548, 'loss/train': 0.22941921651363373} -11/07/2021 03:03:42 - INFO - __main__ - Step 41550: {'lr': 0.0004169576999927317, 'samples': 7977600, 'steps': 41549, 'loss/train': 0.8101643323898315} -11/07/2021 03:03:42 - INFO - __main__ - Step 41551: {'lr': 0.00041695375007566837, 'samples': 7977792, 'steps': 41550, 'loss/train': 1.3644152879714966} -11/07/2021 03:03:42 - INFO - __main__ - Step 41552: {'lr': 0.00041694980008337825, 'samples': 7977984, 'steps': 41551, 'loss/train': 1.5691694021224976} -11/07/2021 03:03:43 - INFO - __main__ - Step 41553: {'lr': 0.0004169458500158632, 'samples': 7978176, 'steps': 41552, 'loss/train': 1.4925529956817627} -11/07/2021 03:03:44 - INFO - __main__ - Step 41554: {'lr': 0.0004169418998731249, 'samples': 7978368, 'steps': 41553, 'loss/train': 1.4446444511413574} -11/07/2021 03:03:44 - INFO - __main__ - Step 41555: {'lr': 0.00041693794965516514, 'samples': 7978560, 'steps': 41554, 'loss/train': 1.3788728713989258} -11/07/2021 03:03:45 - INFO - __main__ - Step 41556: {'lr': 0.0004169339993619857, 'samples': 7978752, 'steps': 41555, 'loss/train': 1.3602726459503174} -11/07/2021 03:03:45 - INFO - __main__ - Step 41557: {'lr': 0.0004169300489935884, 'samples': 7978944, 'steps': 41556, 'loss/train': 1.5837068557739258} -11/07/2021 03:03:45 - INFO - __main__ - Step 41558: {'lr': 0.000416926098549975, 'samples': 7979136, 'steps': 41557, 'loss/train': 1.434810996055603} -11/07/2021 03:03:46 - INFO - __main__ - Step 41559: {'lr': 0.00041692214803114725, 'samples': 7979328, 'steps': 41558, 'loss/train': 1.3605402708053589} -11/07/2021 03:03:47 - INFO - __main__ - Step 41560: {'lr': 0.00041691819743710704, 'samples': 7979520, 'steps': 41559, 'loss/train': 1.6383851766586304} -11/07/2021 03:03:47 - INFO - __main__ - Step 41561: {'lr': 0.00041691424676785593, 'samples': 7979712, 'steps': 41560, 'loss/train': 1.891399621963501} -11/07/2021 03:03:47 - INFO - __main__ - Step 41562: {'lr': 0.00041691029602339595, 'samples': 7979904, 'steps': 41561, 'loss/train': 1.7154065370559692} -11/07/2021 03:03:48 - INFO - __main__ - Step 41563: {'lr': 0.00041690634520372865, 'samples': 7980096, 'steps': 41562, 'loss/train': 1.307283878326416} -11/07/2021 03:03:49 - INFO - __main__ - Step 41564: {'lr': 0.000416902394308856, 'samples': 7980288, 'steps': 41563, 'loss/train': 1.3553440570831299} -11/07/2021 03:03:49 - INFO - __main__ - Step 41565: {'lr': 0.00041689844333877966, 'samples': 7980480, 'steps': 41564, 'loss/train': 1.7948700189590454} -11/07/2021 03:03:49 - INFO - __main__ - Step 41566: {'lr': 0.00041689449229350155, 'samples': 7980672, 'steps': 41565, 'loss/train': 1.0878863334655762} -11/07/2021 03:03:50 - INFO - __main__ - Step 41567: {'lr': 0.00041689054117302333, 'samples': 7980864, 'steps': 41566, 'loss/train': 1.3097561597824097} -11/07/2021 03:03:50 - INFO - __main__ - Step 41568: {'lr': 0.00041688658997734675, 'samples': 7981056, 'steps': 41567, 'loss/train': 1.6336743831634521} -11/07/2021 03:03:51 - INFO - __main__ - Step 41569: {'lr': 0.0004168826387064737, 'samples': 7981248, 'steps': 41568, 'loss/train': 1.0773857831954956} -11/07/2021 03:03:51 - INFO - __main__ - Step 41570: {'lr': 0.00041687868736040593, 'samples': 7981440, 'steps': 41569, 'loss/train': 1.6702024936676025} -11/07/2021 03:03:52 - INFO - __main__ - Step 41571: {'lr': 0.0004168747359391451, 'samples': 7981632, 'steps': 41570, 'loss/train': 1.680422067642212} -11/07/2021 03:03:52 - INFO - __main__ - Step 41572: {'lr': 0.00041687078444269316, 'samples': 7981824, 'steps': 41571, 'loss/train': 1.8877520561218262} -11/07/2021 03:03:53 - INFO - __main__ - Step 41573: {'lr': 0.0004168668328710518, 'samples': 7982016, 'steps': 41572, 'loss/train': 1.2095186710357666} -11/07/2021 03:03:53 - INFO - __main__ - Step 41574: {'lr': 0.0004168628812242228, 'samples': 7982208, 'steps': 41573, 'loss/train': 1.69416344165802} -11/07/2021 03:03:54 - INFO - __main__ - Step 41575: {'lr': 0.00041685892950220804, 'samples': 7982400, 'steps': 41574, 'loss/train': 1.6244293451309204} -11/07/2021 03:03:54 - INFO - __main__ - Step 41576: {'lr': 0.0004168549777050091, 'samples': 7982592, 'steps': 41575, 'loss/train': 0.9274775981903076} -11/07/2021 03:03:55 - INFO - __main__ - Step 41577: {'lr': 0.000416851025832628, 'samples': 7982784, 'steps': 41576, 'loss/train': 0.6884801387786865} -11/07/2021 03:03:55 - INFO - __main__ - Step 41578: {'lr': 0.0004168470738850664, 'samples': 7982976, 'steps': 41577, 'loss/train': 1.5503827333450317} -11/07/2021 03:03:56 - INFO - __main__ - Step 41579: {'lr': 0.00041684312186232597, 'samples': 7983168, 'steps': 41578, 'loss/train': 1.9044495820999146} -11/07/2021 03:03:56 - INFO - __main__ - Step 41580: {'lr': 0.0004168391697644087, 'samples': 7983360, 'steps': 41579, 'loss/train': 2.477400064468384} -11/07/2021 03:03:57 - INFO - __main__ - Step 41581: {'lr': 0.0004168352175913163, 'samples': 7983552, 'steps': 41580, 'loss/train': 1.2631022930145264} -11/07/2021 03:03:57 - INFO - __main__ - Step 41582: {'lr': 0.00041683126534305037, 'samples': 7983744, 'steps': 41581, 'loss/train': 1.6071327924728394} -11/07/2021 03:03:57 - INFO - __main__ - Step 41583: {'lr': 0.000416827313019613, 'samples': 7983936, 'steps': 41582, 'loss/train': 1.5428014993667603} -11/07/2021 03:03:58 - INFO - __main__ - Step 41584: {'lr': 0.0004168233606210058, 'samples': 7984128, 'steps': 41583, 'loss/train': 0.9221970438957214} -11/07/2021 03:03:59 - INFO - __main__ - Step 41585: {'lr': 0.0004168194081472305, 'samples': 7984320, 'steps': 41584, 'loss/train': 1.1452103853225708} -11/07/2021 03:03:59 - INFO - __main__ - Step 41586: {'lr': 0.000416815455598289, 'samples': 7984512, 'steps': 41585, 'loss/train': 1.6904128789901733} -11/07/2021 03:03:59 - INFO - __main__ - Step 41587: {'lr': 0.000416811502974183, 'samples': 7984704, 'steps': 41586, 'loss/train': 1.4233283996582031} -11/07/2021 03:04:00 - INFO - __main__ - Step 41588: {'lr': 0.00041680755027491433, 'samples': 7984896, 'steps': 41587, 'loss/train': 1.4579297304153442} -11/07/2021 03:04:00 - INFO - __main__ - Step 41589: {'lr': 0.0004168035975004847, 'samples': 7985088, 'steps': 41588, 'loss/train': 0.9681318402290344} -11/07/2021 03:04:01 - INFO - __main__ - Step 41590: {'lr': 0.00041679964465089596, 'samples': 7985280, 'steps': 41589, 'loss/train': 1.7440179586410522} -11/07/2021 03:04:02 - INFO - __main__ - Step 41591: {'lr': 0.00041679569172614996, 'samples': 7985472, 'steps': 41590, 'loss/train': 1.1505935192108154} -11/07/2021 03:04:02 - INFO - __main__ - Step 41592: {'lr': 0.0004167917387262483, 'samples': 7985664, 'steps': 41591, 'loss/train': 1.8241571187973022} -11/07/2021 03:04:02 - INFO - __main__ - Step 41593: {'lr': 0.0004167877856511929, 'samples': 7985856, 'steps': 41592, 'loss/train': 1.6857103109359741} -11/07/2021 03:04:03 - INFO - __main__ - Step 41594: {'lr': 0.0004167838325009855, 'samples': 7986048, 'steps': 41593, 'loss/train': 1.7244120836257935} -11/07/2021 03:04:04 - INFO - __main__ - Step 41595: {'lr': 0.0004167798792756279, 'samples': 7986240, 'steps': 41594, 'loss/train': 1.451128602027893} -11/07/2021 03:04:04 - INFO - __main__ - Step 41596: {'lr': 0.0004167759259751218, 'samples': 7986432, 'steps': 41595, 'loss/train': 1.5407642126083374} -11/07/2021 03:04:04 - INFO - __main__ - Step 41597: {'lr': 0.0004167719725994691, 'samples': 7986624, 'steps': 41596, 'loss/train': 1.3572611808776855} -11/07/2021 03:04:05 - INFO - __main__ - Step 41598: {'lr': 0.00041676801914867145, 'samples': 7986816, 'steps': 41597, 'loss/train': 1.030824065208435} -11/07/2021 03:04:05 - INFO - __main__ - Step 41599: {'lr': 0.00041676406562273074, 'samples': 7987008, 'steps': 41598, 'loss/train': 1.2116070985794067} -11/07/2021 03:04:06 - INFO - __main__ - Step 41600: {'lr': 0.00041676011202164875, 'samples': 7987200, 'steps': 41599, 'loss/train': 1.7278271913528442} -11/07/2021 03:04:06 - INFO - __main__ - Step 41601: {'lr': 0.00041675615834542716, 'samples': 7987392, 'steps': 41600, 'loss/train': 1.5282822847366333} -11/07/2021 03:04:07 - INFO - __main__ - Step 41602: {'lr': 0.0004167522045940678, 'samples': 7987584, 'steps': 41601, 'loss/train': 1.5136961936950684} -11/07/2021 03:04:07 - INFO - __main__ - Step 41603: {'lr': 0.0004167482507675726, 'samples': 7987776, 'steps': 41602, 'loss/train': 1.5415982007980347} -11/07/2021 03:04:07 - INFO - __main__ - Step 41604: {'lr': 0.0004167442968659431, 'samples': 7987968, 'steps': 41603, 'loss/train': 1.5877426862716675} -11/07/2021 03:04:09 - INFO - __main__ - Step 41605: {'lr': 0.0004167403428891812, 'samples': 7988160, 'steps': 41604, 'loss/train': 1.3433371782302856} -11/07/2021 03:04:09 - INFO - __main__ - Step 41606: {'lr': 0.00041673638883728877, 'samples': 7988352, 'steps': 41605, 'loss/train': 1.543599247932434} -11/07/2021 03:04:09 - INFO - __main__ - Step 41607: {'lr': 0.00041673243471026746, 'samples': 7988544, 'steps': 41606, 'loss/train': 1.7371529340744019} -11/07/2021 03:04:10 - INFO - __main__ - Step 41608: {'lr': 0.000416728480508119, 'samples': 7988736, 'steps': 41607, 'loss/train': 1.6626496315002441} -11/07/2021 03:04:10 - INFO - __main__ - Step 41609: {'lr': 0.00041672452623084535, 'samples': 7988928, 'steps': 41608, 'loss/train': 1.3573652505874634} -11/07/2021 03:04:10 - INFO - __main__ - Step 41610: {'lr': 0.0004167205718784481, 'samples': 7989120, 'steps': 41609, 'loss/train': 1.6693180799484253} -11/07/2021 03:04:11 - INFO - __main__ - Step 41611: {'lr': 0.0004167166174509293, 'samples': 7989312, 'steps': 41610, 'loss/train': 1.1781405210494995} -11/07/2021 03:04:12 - INFO - __main__ - Step 41612: {'lr': 0.00041671266294829036, 'samples': 7989504, 'steps': 41611, 'loss/train': 1.4301857948303223} -11/07/2021 03:04:12 - INFO - __main__ - Step 41613: {'lr': 0.0004167087083705334, 'samples': 7989696, 'steps': 41612, 'loss/train': 1.623382568359375} -11/07/2021 03:04:12 - INFO - __main__ - Step 41614: {'lr': 0.00041670475371766, 'samples': 7989888, 'steps': 41613, 'loss/train': 1.4963102340698242} -11/07/2021 03:04:13 - INFO - __main__ - Step 41615: {'lr': 0.0004167007989896721, 'samples': 7990080, 'steps': 41614, 'loss/train': 1.2779196500778198} -11/07/2021 03:04:14 - INFO - __main__ - Step 41616: {'lr': 0.0004166968441865714, 'samples': 7990272, 'steps': 41615, 'loss/train': 1.5700368881225586} -11/07/2021 03:04:14 - INFO - __main__ - Step 41617: {'lr': 0.00041669288930835957, 'samples': 7990464, 'steps': 41616, 'loss/train': 1.4026747941970825} -11/07/2021 03:04:14 - INFO - __main__ - Step 41618: {'lr': 0.0004166889343550385, 'samples': 7990656, 'steps': 41617, 'loss/train': 1.3232351541519165} -11/07/2021 03:04:15 - INFO - __main__ - Step 41619: {'lr': 0.00041668497932661005, 'samples': 7990848, 'steps': 41618, 'loss/train': 1.4335687160491943} -11/07/2021 03:04:15 - INFO - __main__ - Step 41620: {'lr': 0.00041668102422307593, 'samples': 7991040, 'steps': 41619, 'loss/train': 1.4519500732421875} -11/07/2021 03:04:16 - INFO - __main__ - Step 41621: {'lr': 0.0004166770690444378, 'samples': 7991232, 'steps': 41620, 'loss/train': 0.8947644829750061} -11/07/2021 03:04:16 - INFO - __main__ - Step 41622: {'lr': 0.0004166731137906976, 'samples': 7991424, 'steps': 41621, 'loss/train': 1.49089777469635} -11/07/2021 03:04:17 - INFO - __main__ - Step 41623: {'lr': 0.0004166691584618572, 'samples': 7991616, 'steps': 41622, 'loss/train': 1.4614523649215698} -11/07/2021 03:04:17 - INFO - __main__ - Step 41624: {'lr': 0.00041666520305791806, 'samples': 7991808, 'steps': 41623, 'loss/train': 1.655706524848938} -11/07/2021 03:04:18 - INFO - __main__ - Step 41625: {'lr': 0.00041666124757888223, 'samples': 7992000, 'steps': 41624, 'loss/train': 1.599887490272522} -11/07/2021 03:04:19 - INFO - __main__ - Step 41626: {'lr': 0.0004166572920247514, 'samples': 7992192, 'steps': 41625, 'loss/train': 0.9554967880249023} -11/07/2021 03:04:19 - INFO - __main__ - Step 41627: {'lr': 0.0004166533363955274, 'samples': 7992384, 'steps': 41626, 'loss/train': 1.4879121780395508} -11/07/2021 03:04:19 - INFO - __main__ - Step 41628: {'lr': 0.00041664938069121195, 'samples': 7992576, 'steps': 41627, 'loss/train': 1.5209451913833618} -11/07/2021 03:04:20 - INFO - __main__ - Step 41629: {'lr': 0.00041664542491180685, 'samples': 7992768, 'steps': 41628, 'loss/train': 1.5639281272888184} -11/07/2021 03:04:20 - INFO - __main__ - Step 41630: {'lr': 0.0004166414690573139, 'samples': 7992960, 'steps': 41629, 'loss/train': 1.2982888221740723} -11/07/2021 03:04:20 - INFO - __main__ - Step 41631: {'lr': 0.0004166375131277349, 'samples': 7993152, 'steps': 41630, 'loss/train': 1.4986904859542847} -11/07/2021 03:04:21 - INFO - __main__ - Step 41632: {'lr': 0.0004166335571230716, 'samples': 7993344, 'steps': 41631, 'loss/train': 1.3777761459350586} -11/07/2021 03:04:22 - INFO - __main__ - Step 41633: {'lr': 0.0004166296010433258, 'samples': 7993536, 'steps': 41632, 'loss/train': 1.5161300897598267} -11/07/2021 03:04:22 - INFO - __main__ - Step 41634: {'lr': 0.00041662564488849927, 'samples': 7993728, 'steps': 41633, 'loss/train': 1.3086680173873901} -11/07/2021 03:04:22 - INFO - __main__ - Step 41635: {'lr': 0.00041662168865859374, 'samples': 7993920, 'steps': 41634, 'loss/train': 1.5390034914016724} -11/07/2021 03:04:23 - INFO - __main__ - Step 41636: {'lr': 0.0004166177323536111, 'samples': 7994112, 'steps': 41635, 'loss/train': 1.047380805015564} -11/07/2021 03:04:24 - INFO - __main__ - Step 41637: {'lr': 0.000416613775973553, 'samples': 7994304, 'steps': 41636, 'loss/train': 1.6869618892669678} -11/07/2021 03:04:24 - INFO - __main__ - Step 41638: {'lr': 0.0004166098195184214, 'samples': 7994496, 'steps': 41637, 'loss/train': 1.61757230758667} -11/07/2021 03:04:24 - INFO - __main__ - Step 41639: {'lr': 0.000416605862988218, 'samples': 7994688, 'steps': 41638, 'loss/train': 0.2610689401626587} -11/07/2021 03:04:25 - INFO - __main__ - Step 41640: {'lr': 0.00041660190638294456, 'samples': 7994880, 'steps': 41639, 'loss/train': 1.7146142721176147} -11/07/2021 03:04:25 - INFO - __main__ - Step 41641: {'lr': 0.0004165979497026028, 'samples': 7995072, 'steps': 41640, 'loss/train': 1.8692586421966553} -11/07/2021 03:04:26 - INFO - __main__ - Step 41642: {'lr': 0.00041659399294719456, 'samples': 7995264, 'steps': 41641, 'loss/train': 1.502307415008545} -11/07/2021 03:04:27 - INFO - __main__ - Step 41643: {'lr': 0.00041659003611672175, 'samples': 7995456, 'steps': 41642, 'loss/train': 1.2738826274871826} -11/07/2021 03:04:27 - INFO - __main__ - Step 41644: {'lr': 0.000416586079211186, 'samples': 7995648, 'steps': 41643, 'loss/train': 1.7889599800109863} -11/07/2021 03:04:27 - INFO - __main__ - Step 41645: {'lr': 0.0004165821222305891, 'samples': 7995840, 'steps': 41644, 'loss/train': 1.6064268350601196} -11/07/2021 03:04:28 - INFO - __main__ - Step 41646: {'lr': 0.00041657816517493284, 'samples': 7996032, 'steps': 41645, 'loss/train': 1.5085879564285278} -11/07/2021 03:04:29 - INFO - __main__ - Step 41647: {'lr': 0.00041657420804421907, 'samples': 7996224, 'steps': 41646, 'loss/train': 1.4858813285827637} -11/07/2021 03:04:29 - INFO - __main__ - Step 41648: {'lr': 0.00041657025083844957, 'samples': 7996416, 'steps': 41647, 'loss/train': 1.5819388628005981} -11/07/2021 03:04:29 - INFO - __main__ - Step 41649: {'lr': 0.00041656629355762607, 'samples': 7996608, 'steps': 41648, 'loss/train': 1.721908450126648} -11/07/2021 03:04:30 - INFO - __main__ - Step 41650: {'lr': 0.00041656233620175035, 'samples': 7996800, 'steps': 41649, 'loss/train': 1.5587491989135742} -11/07/2021 03:04:30 - INFO - __main__ - Step 41651: {'lr': 0.0004165583787708242, 'samples': 7996992, 'steps': 41650, 'loss/train': 1.8320040702819824} -11/07/2021 03:04:31 - INFO - __main__ - Step 41652: {'lr': 0.0004165544212648494, 'samples': 7997184, 'steps': 41651, 'loss/train': 1.6275389194488525} -11/07/2021 03:04:31 - INFO - __main__ - Step 41653: {'lr': 0.0004165504636838278, 'samples': 7997376, 'steps': 41652, 'loss/train': 0.7777548432350159} -11/07/2021 03:04:32 - INFO - __main__ - Step 41654: {'lr': 0.0004165465060277611, 'samples': 7997568, 'steps': 41653, 'loss/train': 2.0229907035827637} -11/07/2021 03:04:32 - INFO - __main__ - Step 41655: {'lr': 0.0004165425482966512, 'samples': 7997760, 'steps': 41654, 'loss/train': 1.7797147035598755} -11/07/2021 03:04:33 - INFO - __main__ - Step 41656: {'lr': 0.00041653859049049964, 'samples': 7997952, 'steps': 41655, 'loss/train': 1.5604771375656128} -11/07/2021 03:04:34 - INFO - __main__ - Step 41657: {'lr': 0.00041653463260930845, 'samples': 7998144, 'steps': 41656, 'loss/train': 1.7182575464248657} -11/07/2021 03:04:34 - INFO - __main__ - Step 41658: {'lr': 0.00041653067465307925, 'samples': 7998336, 'steps': 41657, 'loss/train': 1.416732907295227} -11/07/2021 03:04:34 - INFO - __main__ - Step 41659: {'lr': 0.00041652671662181394, 'samples': 7998528, 'steps': 41658, 'loss/train': 1.7493034601211548} -11/07/2021 03:04:35 - INFO - __main__ - Step 41660: {'lr': 0.00041652275851551435, 'samples': 7998720, 'steps': 41659, 'loss/train': 1.145478367805481} -11/07/2021 03:04:35 - INFO - __main__ - Step 41661: {'lr': 0.0004165188003341821, 'samples': 7998912, 'steps': 41660, 'loss/train': 1.4541614055633545} -11/07/2021 03:04:36 - INFO - __main__ - Step 41662: {'lr': 0.0004165148420778191, 'samples': 7999104, 'steps': 41661, 'loss/train': 1.7806086540222168} -11/07/2021 03:04:36 - INFO - __main__ - Step 41663: {'lr': 0.000416510883746427, 'samples': 7999296, 'steps': 41662, 'loss/train': 1.8331174850463867} -11/07/2021 03:04:37 - INFO - __main__ - Step 41664: {'lr': 0.00041650692534000766, 'samples': 7999488, 'steps': 41663, 'loss/train': 1.617154598236084} -11/07/2021 03:04:37 - INFO - __main__ - Step 41665: {'lr': 0.0004165029668585629, 'samples': 7999680, 'steps': 41664, 'loss/train': 1.5130399465560913} -11/07/2021 03:04:37 - INFO - __main__ - Step 41666: {'lr': 0.00041649900830209455, 'samples': 7999872, 'steps': 41665, 'loss/train': 1.3040863275527954} -11/07/2021 03:04:38 - INFO - __main__ - Step 41667: {'lr': 0.00041649504967060423, 'samples': 8000064, 'steps': 41666, 'loss/train': 1.3093539476394653} -11/07/2021 03:04:39 - INFO - __main__ - Step 41668: {'lr': 0.0004164910909640938, 'samples': 8000256, 'steps': 41667, 'loss/train': 1.47370445728302} -11/07/2021 03:04:39 - INFO - __main__ - Step 41669: {'lr': 0.0004164871321825651, 'samples': 8000448, 'steps': 41668, 'loss/train': 0.9638338685035706} -11/07/2021 03:04:39 - INFO - __main__ - Step 41670: {'lr': 0.0004164831733260198, 'samples': 8000640, 'steps': 41669, 'loss/train': 1.4005441665649414} -11/07/2021 03:04:40 - INFO - __main__ - Step 41671: {'lr': 0.0004164792143944598, 'samples': 8000832, 'steps': 41670, 'loss/train': 1.7547717094421387} -11/07/2021 03:04:40 - INFO - __main__ - Step 41672: {'lr': 0.0004164752553878868, 'samples': 8001024, 'steps': 41671, 'loss/train': 1.6093745231628418} -11/07/2021 03:04:41 - INFO - __main__ - Step 41673: {'lr': 0.00041647129630630265, 'samples': 8001216, 'steps': 41672, 'loss/train': 1.2964626550674438} -11/07/2021 03:04:42 - INFO - __main__ - Step 41674: {'lr': 0.0004164673371497092, 'samples': 8001408, 'steps': 41673, 'loss/train': 1.6003328561782837} -11/07/2021 03:04:42 - INFO - __main__ - Step 41675: {'lr': 0.000416463377918108, 'samples': 8001600, 'steps': 41674, 'loss/train': 0.9917303323745728} -11/07/2021 03:04:42 - INFO - __main__ - Step 41676: {'lr': 0.00041645941861150103, 'samples': 8001792, 'steps': 41675, 'loss/train': 2.396070957183838} -11/07/2021 03:04:43 - INFO - __main__ - Step 41677: {'lr': 0.00041645545922989, 'samples': 8001984, 'steps': 41676, 'loss/train': 1.1119292974472046} -11/07/2021 03:04:44 - INFO - __main__ - Step 41678: {'lr': 0.00041645149977327667, 'samples': 8002176, 'steps': 41677, 'loss/train': 0.8787075877189636} -11/07/2021 03:04:44 - INFO - __main__ - Step 41679: {'lr': 0.0004164475402416629, 'samples': 8002368, 'steps': 41678, 'loss/train': 1.0953854322433472} -11/07/2021 03:04:45 - INFO - __main__ - Step 41680: {'lr': 0.0004164435806350505, 'samples': 8002560, 'steps': 41679, 'loss/train': 1.580024003982544} -11/07/2021 03:04:45 - INFO - __main__ - Step 41681: {'lr': 0.00041643962095344107, 'samples': 8002752, 'steps': 41680, 'loss/train': 1.4981598854064941} -11/07/2021 03:04:45 - INFO - __main__ - Step 41682: {'lr': 0.0004164356611968366, 'samples': 8002944, 'steps': 41681, 'loss/train': 1.466947078704834} -11/07/2021 03:04:46 - INFO - __main__ - Step 41683: {'lr': 0.0004164317013652387, 'samples': 8003136, 'steps': 41682, 'loss/train': 1.6721065044403076} -11/07/2021 03:04:47 - INFO - __main__ - Step 41684: {'lr': 0.00041642774145864934, 'samples': 8003328, 'steps': 41683, 'loss/train': 1.6475099325180054} -11/07/2021 03:04:47 - INFO - __main__ - Step 41685: {'lr': 0.00041642378147707014, 'samples': 8003520, 'steps': 41684, 'loss/train': 1.4430322647094727} -11/07/2021 03:04:47 - INFO - __main__ - Step 41686: {'lr': 0.00041641982142050297, 'samples': 8003712, 'steps': 41685, 'loss/train': 1.5093369483947754} -11/07/2021 03:04:48 - INFO - __main__ - Step 41687: {'lr': 0.00041641586128894967, 'samples': 8003904, 'steps': 41686, 'loss/train': 1.529678225517273} -11/07/2021 03:04:48 - INFO - __main__ - Step 41688: {'lr': 0.0004164119010824119, 'samples': 8004096, 'steps': 41687, 'loss/train': 1.4738942384719849} -11/07/2021 03:04:49 - INFO - __main__ - Step 41689: {'lr': 0.00041640794080089144, 'samples': 8004288, 'steps': 41688, 'loss/train': 1.233488917350769} -11/07/2021 03:04:49 - INFO - __main__ - Step 41690: {'lr': 0.0004164039804443902, 'samples': 8004480, 'steps': 41689, 'loss/train': 1.4913170337677002} -11/07/2021 03:04:50 - INFO - __main__ - Step 41691: {'lr': 0.0004164000200129099, 'samples': 8004672, 'steps': 41690, 'loss/train': 1.5144816637039185} -11/07/2021 03:04:50 - INFO - __main__ - Step 41692: {'lr': 0.0004163960595064522, 'samples': 8004864, 'steps': 41691, 'loss/train': 1.6226403713226318} -11/07/2021 03:04:51 - INFO - __main__ - Step 41693: {'lr': 0.00041639209892501913, 'samples': 8005056, 'steps': 41692, 'loss/train': 1.6253248453140259} -11/07/2021 03:04:52 - INFO - __main__ - Step 41694: {'lr': 0.00041638813826861234, 'samples': 8005248, 'steps': 41693, 'loss/train': 1.784563422203064} -11/07/2021 03:04:52 - INFO - __main__ - Step 41695: {'lr': 0.00041638417753723356, 'samples': 8005440, 'steps': 41694, 'loss/train': 0.6529554724693298} -11/07/2021 03:04:53 - INFO - __main__ - Step 41696: {'lr': 0.00041638021673088464, 'samples': 8005632, 'steps': 41695, 'loss/train': 1.8190524578094482} -11/07/2021 03:04:53 - INFO - __main__ - Step 41697: {'lr': 0.0004163762558495674, 'samples': 8005824, 'steps': 41696, 'loss/train': 1.8762617111206055} -11/07/2021 03:04:53 - INFO - __main__ - Step 41698: {'lr': 0.0004163722948932836, 'samples': 8006016, 'steps': 41697, 'loss/train': 0.7908387184143066} -11/07/2021 03:04:54 - INFO - __main__ - Step 41699: {'lr': 0.000416368333862035, 'samples': 8006208, 'steps': 41698, 'loss/train': 1.673041820526123} -11/07/2021 03:04:54 - INFO - __main__ - Step 41700: {'lr': 0.00041636437275582335, 'samples': 8006400, 'steps': 41699, 'loss/train': 1.4131288528442383} -11/07/2021 03:04:55 - INFO - __main__ - Step 41701: {'lr': 0.00041636041157465056, 'samples': 8006592, 'steps': 41700, 'loss/train': 1.3762298822402954} -11/07/2021 03:04:56 - INFO - __main__ - Step 41702: {'lr': 0.00041635645031851826, 'samples': 8006784, 'steps': 41701, 'loss/train': 1.8060678243637085} -11/07/2021 03:04:56 - INFO - __main__ - Step 41703: {'lr': 0.00041635248898742834, 'samples': 8006976, 'steps': 41702, 'loss/train': 1.4579479694366455} -11/07/2021 03:04:56 - INFO - __main__ - Step 41704: {'lr': 0.00041634852758138253, 'samples': 8007168, 'steps': 41703, 'loss/train': 1.565946340560913} -11/07/2021 03:04:57 - INFO - __main__ - Step 41705: {'lr': 0.0004163445661003827, 'samples': 8007360, 'steps': 41704, 'loss/train': 2.0427615642547607} -11/07/2021 03:04:58 - INFO - __main__ - Step 41706: {'lr': 0.0004163406045444306, 'samples': 8007552, 'steps': 41705, 'loss/train': 1.6200158596038818} -11/07/2021 03:04:58 - INFO - __main__ - Step 41707: {'lr': 0.0004163366429135279, 'samples': 8007744, 'steps': 41706, 'loss/train': 1.5748037099838257} -11/07/2021 03:04:58 - INFO - __main__ - Step 41708: {'lr': 0.00041633268120767653, 'samples': 8007936, 'steps': 41707, 'loss/train': 1.799818992614746} -11/07/2021 03:04:59 - INFO - __main__ - Step 41709: {'lr': 0.00041632871942687814, 'samples': 8008128, 'steps': 41708, 'loss/train': 1.4548799991607666} -11/07/2021 03:04:59 - INFO - __main__ - Step 41710: {'lr': 0.00041632475757113466, 'samples': 8008320, 'steps': 41709, 'loss/train': 1.7368544340133667} -11/07/2021 03:05:00 - INFO - __main__ - Step 41711: {'lr': 0.00041632079564044776, 'samples': 8008512, 'steps': 41710, 'loss/train': 1.3731677532196045} -11/07/2021 03:05:01 - INFO - __main__ - Step 41712: {'lr': 0.0004163168336348194, 'samples': 8008704, 'steps': 41711, 'loss/train': 0.9456028342247009} -11/07/2021 03:05:01 - INFO - __main__ - Step 41713: {'lr': 0.00041631287155425114, 'samples': 8008896, 'steps': 41712, 'loss/train': 1.3551782369613647} -11/07/2021 03:05:01 - INFO - __main__ - Step 41714: {'lr': 0.0004163089093987449, 'samples': 8009088, 'steps': 41713, 'loss/train': 1.3990758657455444} -11/07/2021 03:05:02 - INFO - __main__ - Step 41715: {'lr': 0.00041630494716830244, 'samples': 8009280, 'steps': 41714, 'loss/train': 1.2092492580413818} -11/07/2021 03:05:03 - INFO - __main__ - Step 41716: {'lr': 0.00041630098486292546, 'samples': 8009472, 'steps': 41715, 'loss/train': 1.7054479122161865} -11/07/2021 03:05:03 - INFO - __main__ - Step 41717: {'lr': 0.0004162970224826159, 'samples': 8009664, 'steps': 41716, 'loss/train': 1.0781768560409546} -11/07/2021 03:05:03 - INFO - __main__ - Step 41718: {'lr': 0.0004162930600273754, 'samples': 8009856, 'steps': 41717, 'loss/train': 1.3864885568618774} -11/07/2021 03:05:04 - INFO - __main__ - Step 41719: {'lr': 0.0004162890974972059, 'samples': 8010048, 'steps': 41718, 'loss/train': 1.8126137256622314} -11/07/2021 03:05:04 - INFO - __main__ - Step 41720: {'lr': 0.00041628513489210906, 'samples': 8010240, 'steps': 41719, 'loss/train': 1.5357738733291626} -11/07/2021 03:05:05 - INFO - __main__ - Step 41721: {'lr': 0.0004162811722120867, 'samples': 8010432, 'steps': 41720, 'loss/train': 1.2699007987976074} -11/07/2021 03:05:05 - INFO - __main__ - Step 41722: {'lr': 0.00041627720945714065, 'samples': 8010624, 'steps': 41721, 'loss/train': 1.3326258659362793} -11/07/2021 03:05:06 - INFO - __main__ - Step 41723: {'lr': 0.00041627324662727263, 'samples': 8010816, 'steps': 41722, 'loss/train': 1.481400728225708} -11/07/2021 03:05:06 - INFO - __main__ - Step 41724: {'lr': 0.0004162692837224844, 'samples': 8011008, 'steps': 41723, 'loss/train': 1.7024741172790527} -11/07/2021 03:05:06 - INFO - __main__ - Step 41725: {'lr': 0.00041626532074277785, 'samples': 8011200, 'steps': 41724, 'loss/train': 1.259816288948059} -11/07/2021 03:05:07 - INFO - __main__ - Step 41726: {'lr': 0.00041626135768815467, 'samples': 8011392, 'steps': 41725, 'loss/train': 1.537654161453247} -11/07/2021 03:05:08 - INFO - __main__ - Step 41727: {'lr': 0.0004162573945586168, 'samples': 8011584, 'steps': 41726, 'loss/train': 1.597123146057129} -11/07/2021 03:05:08 - INFO - __main__ - Step 41728: {'lr': 0.0004162534313541658, 'samples': 8011776, 'steps': 41727, 'loss/train': 0.8959583044052124} -11/07/2021 03:05:09 - INFO - __main__ - Step 41729: {'lr': 0.00041624946807480357, 'samples': 8011968, 'steps': 41728, 'loss/train': 1.5581363439559937} -11/07/2021 03:05:09 - INFO - __main__ - Step 41730: {'lr': 0.0004162455047205319, 'samples': 8012160, 'steps': 41729, 'loss/train': 0.8903040885925293} -11/07/2021 03:05:10 - INFO - __main__ - Step 41731: {'lr': 0.0004162415412913526, 'samples': 8012352, 'steps': 41730, 'loss/train': 1.7477757930755615} -11/07/2021 03:05:10 - INFO - __main__ - Step 41732: {'lr': 0.00041623757778726743, 'samples': 8012544, 'steps': 41731, 'loss/train': 1.3590712547302246} -11/07/2021 03:05:10 - INFO - __main__ - Step 41733: {'lr': 0.00041623361420827816, 'samples': 8012736, 'steps': 41732, 'loss/train': 0.7484281659126282} -11/07/2021 03:05:11 - INFO - __main__ - Step 41734: {'lr': 0.0004162296505543867, 'samples': 8012928, 'steps': 41733, 'loss/train': 1.5739892721176147} -11/07/2021 03:05:11 - INFO - __main__ - Step 41735: {'lr': 0.00041622568682559455, 'samples': 8013120, 'steps': 41734, 'loss/train': 1.2763605117797852} -11/07/2021 03:05:12 - INFO - __main__ - Step 41736: {'lr': 0.0004162217230219038, 'samples': 8013312, 'steps': 41735, 'loss/train': 1.4866390228271484} -11/07/2021 03:05:13 - INFO - __main__ - Step 41737: {'lr': 0.00041621775914331595, 'samples': 8013504, 'steps': 41736, 'loss/train': 1.272396445274353} -11/07/2021 03:05:14 - INFO - __main__ - Step 41738: {'lr': 0.00041621379518983306, 'samples': 8013696, 'steps': 41737, 'loss/train': 1.5573691129684448} -11/07/2021 03:05:14 - INFO - __main__ - Step 41739: {'lr': 0.00041620983116145673, 'samples': 8013888, 'steps': 41738, 'loss/train': 1.3005025386810303} -11/07/2021 03:05:14 - INFO - __main__ - Step 41740: {'lr': 0.00041620586705818887, 'samples': 8014080, 'steps': 41739, 'loss/train': 0.7410742044448853} -11/07/2021 03:05:15 - INFO - __main__ - Step 41741: {'lr': 0.00041620190288003126, 'samples': 8014272, 'steps': 41740, 'loss/train': 1.2668712139129639} -11/07/2021 03:05:15 - INFO - __main__ - Step 41742: {'lr': 0.00041619793862698553, 'samples': 8014464, 'steps': 41741, 'loss/train': 1.555660367012024} -11/07/2021 03:05:16 - INFO - __main__ - Step 41743: {'lr': 0.00041619397429905363, 'samples': 8014656, 'steps': 41742, 'loss/train': 0.837822675704956} -11/07/2021 03:05:16 - INFO - __main__ - Step 41744: {'lr': 0.0004161900098962373, 'samples': 8014848, 'steps': 41743, 'loss/train': 1.4115031957626343} -11/07/2021 03:05:17 - INFO - __main__ - Step 41745: {'lr': 0.00041618604541853826, 'samples': 8015040, 'steps': 41744, 'loss/train': 1.5460307598114014} -11/07/2021 03:05:17 - INFO - __main__ - Step 41746: {'lr': 0.00041618208086595843, 'samples': 8015232, 'steps': 41745, 'loss/train': 1.339052677154541} -11/07/2021 03:05:17 - INFO - __main__ - Step 41747: {'lr': 0.0004161781162384994, 'samples': 8015424, 'steps': 41746, 'loss/train': 1.7926512956619263} -11/07/2021 03:05:19 - INFO - __main__ - Step 41748: {'lr': 0.00041617415153616323, 'samples': 8015616, 'steps': 41747, 'loss/train': 1.718548059463501} -11/07/2021 03:05:19 - INFO - __main__ - Step 41749: {'lr': 0.00041617018675895145, 'samples': 8015808, 'steps': 41748, 'loss/train': 1.0688071250915527} -11/07/2021 03:05:19 - INFO - __main__ - Step 41750: {'lr': 0.00041616622190686597, 'samples': 8016000, 'steps': 41749, 'loss/train': 1.0594754219055176} -11/07/2021 03:05:20 - INFO - __main__ - Step 41751: {'lr': 0.0004161622569799086, 'samples': 8016192, 'steps': 41750, 'loss/train': 1.49894118309021} -11/07/2021 03:05:20 - INFO - __main__ - Step 41752: {'lr': 0.00041615829197808095, 'samples': 8016384, 'steps': 41751, 'loss/train': 1.7414077520370483} -11/07/2021 03:05:20 - INFO - __main__ - Step 41753: {'lr': 0.0004161543269013851, 'samples': 8016576, 'steps': 41752, 'loss/train': 2.081005096435547} -11/07/2021 03:05:21 - INFO - __main__ - Step 41754: {'lr': 0.0004161503617498226, 'samples': 8016768, 'steps': 41753, 'loss/train': 1.1592674255371094} -11/07/2021 03:05:22 - INFO - __main__ - Step 41755: {'lr': 0.00041614639652339533, 'samples': 8016960, 'steps': 41754, 'loss/train': 0.987359344959259} -11/07/2021 03:05:22 - INFO - __main__ - Step 41756: {'lr': 0.00041614243122210505, 'samples': 8017152, 'steps': 41755, 'loss/train': 1.9649503231048584} -11/07/2021 03:05:22 - INFO - __main__ - Step 41757: {'lr': 0.0004161384658459535, 'samples': 8017344, 'steps': 41756, 'loss/train': 1.4676735401153564} -11/07/2021 03:05:23 - INFO - __main__ - Step 41758: {'lr': 0.0004161345003949426, 'samples': 8017536, 'steps': 41757, 'loss/train': 1.7614989280700684} -11/07/2021 03:05:24 - INFO - __main__ - Step 41759: {'lr': 0.00041613053486907396, 'samples': 8017728, 'steps': 41758, 'loss/train': 1.616061806678772} -11/07/2021 03:05:24 - INFO - __main__ - Step 41760: {'lr': 0.0004161265692683496, 'samples': 8017920, 'steps': 41759, 'loss/train': 1.723777413368225} -11/07/2021 03:05:25 - INFO - __main__ - Step 41761: {'lr': 0.0004161226035927711, 'samples': 8018112, 'steps': 41760, 'loss/train': 2.0317869186401367} -11/07/2021 03:05:25 - INFO - __main__ - Step 41762: {'lr': 0.0004161186378423403, 'samples': 8018304, 'steps': 41761, 'loss/train': 1.7671819925308228} -11/07/2021 03:05:25 - INFO - __main__ - Step 41763: {'lr': 0.000416114672017059, 'samples': 8018496, 'steps': 41762, 'loss/train': 1.7405064105987549} -11/07/2021 03:05:26 - INFO - __main__ - Step 41764: {'lr': 0.000416110706116929, 'samples': 8018688, 'steps': 41763, 'loss/train': 1.5564242601394653} -11/07/2021 03:05:27 - INFO - __main__ - Step 41765: {'lr': 0.0004161067401419521, 'samples': 8018880, 'steps': 41764, 'loss/train': 1.6028566360473633} -11/07/2021 03:05:27 - INFO - __main__ - Step 41766: {'lr': 0.00041610277409213003, 'samples': 8019072, 'steps': 41765, 'loss/train': 0.15148968994617462} -11/07/2021 03:05:27 - INFO - __main__ - Step 41767: {'lr': 0.00041609880796746463, 'samples': 8019264, 'steps': 41766, 'loss/train': 1.4200246334075928} -11/07/2021 03:05:28 - INFO - __main__ - Step 41768: {'lr': 0.00041609484176795774, 'samples': 8019456, 'steps': 41767, 'loss/train': 1.4033209085464478} -11/07/2021 03:05:29 - INFO - __main__ - Step 41769: {'lr': 0.000416090875493611, 'samples': 8019648, 'steps': 41768, 'loss/train': 1.5000132322311401} -11/07/2021 03:05:29 - INFO - __main__ - Step 41770: {'lr': 0.0004160869091444263, 'samples': 8019840, 'steps': 41769, 'loss/train': 1.6210057735443115} -11/07/2021 03:05:29 - INFO - __main__ - Step 41771: {'lr': 0.0004160829427204054, 'samples': 8020032, 'steps': 41770, 'loss/train': 1.5194448232650757} -11/07/2021 03:05:30 - INFO - __main__ - Step 41772: {'lr': 0.00041607897622155006, 'samples': 8020224, 'steps': 41771, 'loss/train': 1.3142369985580444} -11/07/2021 03:05:30 - INFO - __main__ - Step 41773: {'lr': 0.00041607500964786217, 'samples': 8020416, 'steps': 41772, 'loss/train': 1.448745846748352} -11/07/2021 03:05:31 - INFO - __main__ - Step 41774: {'lr': 0.0004160710429993434, 'samples': 8020608, 'steps': 41773, 'loss/train': 2.627546548843384} -11/07/2021 03:05:31 - INFO - __main__ - Step 41775: {'lr': 0.00041606707627599556, 'samples': 8020800, 'steps': 41774, 'loss/train': 1.5680979490280151} -11/07/2021 03:05:32 - INFO - __main__ - Step 41776: {'lr': 0.00041606310947782046, 'samples': 8020992, 'steps': 41775, 'loss/train': 1.5007060766220093} -11/07/2021 03:05:32 - INFO - __main__ - Step 41777: {'lr': 0.0004160591426048199, 'samples': 8021184, 'steps': 41776, 'loss/train': 1.1363593339920044} -11/07/2021 03:05:33 - INFO - __main__ - Step 41778: {'lr': 0.00041605517565699565, 'samples': 8021376, 'steps': 41777, 'loss/train': 1.7209640741348267} -11/07/2021 03:05:34 - INFO - __main__ - Step 41779: {'lr': 0.00041605120863434945, 'samples': 8021568, 'steps': 41778, 'loss/train': 1.527706503868103} -11/07/2021 03:05:34 - INFO - __main__ - Step 41780: {'lr': 0.0004160472415368832, 'samples': 8021760, 'steps': 41779, 'loss/train': 1.049204707145691} -11/07/2021 03:05:35 - INFO - __main__ - Step 41781: {'lr': 0.00041604327436459864, 'samples': 8021952, 'steps': 41780, 'loss/train': 1.3618234395980835} -11/07/2021 03:05:35 - INFO - __main__ - Step 41782: {'lr': 0.0004160393071174975, 'samples': 8022144, 'steps': 41781, 'loss/train': 1.4717530012130737} -11/07/2021 03:05:35 - INFO - __main__ - Step 41783: {'lr': 0.00041603533979558163, 'samples': 8022336, 'steps': 41782, 'loss/train': 1.55155611038208} -11/07/2021 03:05:36 - INFO - __main__ - Step 41784: {'lr': 0.0004160313723988528, 'samples': 8022528, 'steps': 41783, 'loss/train': 1.434744954109192} -11/07/2021 03:05:36 - INFO - __main__ - Step 41785: {'lr': 0.00041602740492731284, 'samples': 8022720, 'steps': 41784, 'loss/train': 5.639638423919678} -11/07/2021 03:05:37 - INFO - __main__ - Step 41786: {'lr': 0.0004160234373809634, 'samples': 8022912, 'steps': 41785, 'loss/train': 5.51109504699707} -11/07/2021 03:05:37 - INFO - __main__ - Step 41787: {'lr': 0.0004160194697598064, 'samples': 8023104, 'steps': 41786, 'loss/train': 1.7458086013793945} -11/07/2021 03:05:38 - INFO - __main__ - Step 41788: {'lr': 0.0004160155020638436, 'samples': 8023296, 'steps': 41787, 'loss/train': 1.6691575050354004} -11/07/2021 03:05:38 - INFO - __main__ - Step 41789: {'lr': 0.0004160115342930768, 'samples': 8023488, 'steps': 41788, 'loss/train': 1.4780073165893555} -11/07/2021 03:05:38 - INFO - __main__ - Step 41790: {'lr': 0.0004160075664475077, 'samples': 8023680, 'steps': 41789, 'loss/train': 1.584285020828247} -11/07/2021 03:05:39 - INFO - __main__ - Step 41791: {'lr': 0.0004160035985271382, 'samples': 8023872, 'steps': 41790, 'loss/train': 1.6199537515640259} -11/07/2021 03:05:40 - INFO - __main__ - Step 41792: {'lr': 0.00041599963053196997, 'samples': 8024064, 'steps': 41791, 'loss/train': 1.8177478313446045} -11/07/2021 03:05:40 - INFO - __main__ - Step 41793: {'lr': 0.0004159956624620049, 'samples': 8024256, 'steps': 41792, 'loss/train': 1.2697099447250366} -11/07/2021 03:05:41 - INFO - __main__ - Step 41794: {'lr': 0.0004159916943172448, 'samples': 8024448, 'steps': 41793, 'loss/train': 1.3568118810653687} -11/07/2021 03:05:41 - INFO - __main__ - Step 41795: {'lr': 0.0004159877260976914, 'samples': 8024640, 'steps': 41794, 'loss/train': 1.1664894819259644} -11/07/2021 03:05:41 - INFO - __main__ - Step 41796: {'lr': 0.00041598375780334653, 'samples': 8024832, 'steps': 41795, 'loss/train': 1.419095516204834} -11/07/2021 03:05:42 - INFO - __main__ - Step 41797: {'lr': 0.0004159797894342118, 'samples': 8025024, 'steps': 41796, 'loss/train': 1.4277313947677612} -11/07/2021 03:05:43 - INFO - __main__ - Step 41798: {'lr': 0.0004159758209902892, 'samples': 8025216, 'steps': 41797, 'loss/train': 1.4310158491134644} -11/07/2021 03:05:43 - INFO - __main__ - Step 41799: {'lr': 0.00041597185247158053, 'samples': 8025408, 'steps': 41798, 'loss/train': 1.2442349195480347} -11/07/2021 03:05:43 - INFO - __main__ - Step 41800: {'lr': 0.0004159678838780874, 'samples': 8025600, 'steps': 41799, 'loss/train': 1.3497828245162964} -11/07/2021 03:05:44 - INFO - __main__ - Step 41801: {'lr': 0.0004159639152098118, 'samples': 8025792, 'steps': 41800, 'loss/train': 1.1749296188354492} -11/07/2021 03:05:45 - INFO - __main__ - Step 41802: {'lr': 0.00041595994646675537, 'samples': 8025984, 'steps': 41801, 'loss/train': 1.4512723684310913} -11/07/2021 03:05:45 - INFO - __main__ - Step 41803: {'lr': 0.0004159559776489199, 'samples': 8026176, 'steps': 41802, 'loss/train': 1.5854878425598145} -11/07/2021 03:05:45 - INFO - __main__ - Step 41804: {'lr': 0.00041595200875630734, 'samples': 8026368, 'steps': 41803, 'loss/train': 1.5534003973007202} -11/07/2021 03:05:46 - INFO - __main__ - Step 41805: {'lr': 0.00041594803978891925, 'samples': 8026560, 'steps': 41804, 'loss/train': 1.3734766244888306} -11/07/2021 03:05:46 - INFO - __main__ - Step 41806: {'lr': 0.00041594407074675753, 'samples': 8026752, 'steps': 41805, 'loss/train': 1.9073400497436523} -11/07/2021 03:05:47 - INFO - __main__ - Step 41807: {'lr': 0.0004159401016298241, 'samples': 8026944, 'steps': 41806, 'loss/train': 1.948595404624939} -11/07/2021 03:05:48 - INFO - __main__ - Step 41808: {'lr': 0.0004159361324381206, 'samples': 8027136, 'steps': 41807, 'loss/train': 1.5608607530593872} -11/07/2021 03:05:48 - INFO - __main__ - Step 41809: {'lr': 0.0004159321631716487, 'samples': 8027328, 'steps': 41808, 'loss/train': 2.098839521408081} -11/07/2021 03:05:49 - INFO - __main__ - Step 41810: {'lr': 0.00041592819383041047, 'samples': 8027520, 'steps': 41809, 'loss/train': 1.6151118278503418} -11/07/2021 03:05:49 - INFO - __main__ - Step 41811: {'lr': 0.0004159242244144075, 'samples': 8027712, 'steps': 41810, 'loss/train': 1.6768019199371338} -11/07/2021 03:05:50 - INFO - __main__ - Step 41812: {'lr': 0.0004159202549236416, 'samples': 8027904, 'steps': 41811, 'loss/train': 1.2156720161437988} -11/07/2021 03:05:50 - INFO - __main__ - Step 41813: {'lr': 0.00041591628535811464, 'samples': 8028096, 'steps': 41812, 'loss/train': 1.1023814678192139} -11/07/2021 03:05:51 - INFO - __main__ - Step 41814: {'lr': 0.00041591231571782834, 'samples': 8028288, 'steps': 41813, 'loss/train': 1.4737012386322021} -11/07/2021 03:05:51 - INFO - __main__ - Step 41815: {'lr': 0.0004159083460027845, 'samples': 8028480, 'steps': 41814, 'loss/train': 1.6790229082107544} -11/07/2021 03:05:51 - INFO - __main__ - Step 41816: {'lr': 0.000415904376212985, 'samples': 8028672, 'steps': 41815, 'loss/train': 1.4413472414016724} -11/07/2021 03:05:52 - INFO - __main__ - Step 41817: {'lr': 0.00041590040634843144, 'samples': 8028864, 'steps': 41816, 'loss/train': 2.422144889831543} -11/07/2021 03:05:53 - INFO - __main__ - Step 41818: {'lr': 0.00041589643640912576, 'samples': 8029056, 'steps': 41817, 'loss/train': 1.58564031124115} -11/07/2021 03:05:53 - INFO - __main__ - Step 41819: {'lr': 0.0004158924663950697, 'samples': 8029248, 'steps': 41818, 'loss/train': 1.575334072113037} -11/07/2021 03:05:53 - INFO - __main__ - Step 41820: {'lr': 0.00041588849630626513, 'samples': 8029440, 'steps': 41819, 'loss/train': 1.7191028594970703} -11/07/2021 03:05:54 - INFO - __main__ - Step 41821: {'lr': 0.00041588452614271364, 'samples': 8029632, 'steps': 41820, 'loss/train': 1.5590040683746338} -11/07/2021 03:05:54 - INFO - __main__ - Step 41822: {'lr': 0.00041588055590441726, 'samples': 8029824, 'steps': 41821, 'loss/train': 1.3510241508483887} -11/07/2021 03:05:55 - INFO - __main__ - Step 41823: {'lr': 0.0004158765855913776, 'samples': 8030016, 'steps': 41822, 'loss/train': 1.5703097581863403} -11/07/2021 03:05:56 - INFO - __main__ - Step 41824: {'lr': 0.0004158726152035965, 'samples': 8030208, 'steps': 41823, 'loss/train': 1.4530744552612305} -11/07/2021 03:05:56 - INFO - __main__ - Step 41825: {'lr': 0.00041586864474107575, 'samples': 8030400, 'steps': 41824, 'loss/train': 1.1881881952285767} -11/07/2021 03:05:56 - INFO - __main__ - Step 41826: {'lr': 0.0004158646742038172, 'samples': 8030592, 'steps': 41825, 'loss/train': 1.6617271900177002} -11/07/2021 03:05:57 - INFO - __main__ - Step 41827: {'lr': 0.00041586070359182255, 'samples': 8030784, 'steps': 41826, 'loss/train': 1.8090656995773315} -11/07/2021 03:05:58 - INFO - __main__ - Step 41828: {'lr': 0.00041585673290509364, 'samples': 8030976, 'steps': 41827, 'loss/train': 1.0655546188354492} -11/07/2021 03:05:58 - INFO - __main__ - Step 41829: {'lr': 0.0004158527621436322, 'samples': 8031168, 'steps': 41828, 'loss/train': 1.5067369937896729} -11/07/2021 03:05:58 - INFO - __main__ - Step 41830: {'lr': 0.0004158487913074401, 'samples': 8031360, 'steps': 41829, 'loss/train': 1.3611478805541992} -11/07/2021 03:05:59 - INFO - __main__ - Step 41831: {'lr': 0.0004158448203965192, 'samples': 8031552, 'steps': 41830, 'loss/train': 1.7292866706848145} -11/07/2021 03:05:59 - INFO - __main__ - Step 41832: {'lr': 0.000415840849410871, 'samples': 8031744, 'steps': 41831, 'loss/train': 1.2231707572937012} -11/07/2021 03:06:00 - INFO - __main__ - Step 41833: {'lr': 0.0004158368783504975, 'samples': 8031936, 'steps': 41832, 'loss/train': 0.8280168175697327} -11/07/2021 03:06:00 - INFO - __main__ - Step 41834: {'lr': 0.00041583290721540055, 'samples': 8032128, 'steps': 41833, 'loss/train': 1.269150733947754} -11/07/2021 03:06:01 - INFO - __main__ - Step 41835: {'lr': 0.0004158289360055819, 'samples': 8032320, 'steps': 41834, 'loss/train': 0.977594256401062} -11/07/2021 03:06:01 - INFO - __main__ - Step 41836: {'lr': 0.00041582496472104314, 'samples': 8032512, 'steps': 41835, 'loss/train': 2.1492388248443604} -11/07/2021 03:06:01 - INFO - __main__ - Step 41837: {'lr': 0.0004158209933617863, 'samples': 8032704, 'steps': 41836, 'loss/train': 1.4113600254058838} -11/07/2021 03:06:02 - INFO - __main__ - Step 41838: {'lr': 0.00041581702192781305, 'samples': 8032896, 'steps': 41837, 'loss/train': 1.2576713562011719} -11/07/2021 03:06:03 - INFO - __main__ - Step 41839: {'lr': 0.0004158130504191252, 'samples': 8033088, 'steps': 41838, 'loss/train': 1.7074604034423828} -11/07/2021 03:06:03 - INFO - __main__ - Step 41840: {'lr': 0.0004158090788357246, 'samples': 8033280, 'steps': 41839, 'loss/train': 1.8725475072860718} -11/07/2021 03:06:03 - INFO - __main__ - Step 41841: {'lr': 0.0004158051071776129, 'samples': 8033472, 'steps': 41840, 'loss/train': 1.3763138055801392} -11/07/2021 03:06:04 - INFO - __main__ - Step 41842: {'lr': 0.00041580113544479203, 'samples': 8033664, 'steps': 41841, 'loss/train': 1.4608910083770752} -11/07/2021 03:06:05 - INFO - __main__ - Step 41843: {'lr': 0.00041579716363726376, 'samples': 8033856, 'steps': 41842, 'loss/train': 1.999753713607788} -11/07/2021 03:06:05 - INFO - __main__ - Step 41844: {'lr': 0.00041579319175502985, 'samples': 8034048, 'steps': 41843, 'loss/train': 0.8875548243522644} -11/07/2021 03:06:05 - INFO - __main__ - Step 41845: {'lr': 0.000415789219798092, 'samples': 8034240, 'steps': 41844, 'loss/train': 1.5030208826065063} -11/07/2021 03:06:06 - INFO - __main__ - Step 41846: {'lr': 0.00041578524776645216, 'samples': 8034432, 'steps': 41845, 'loss/train': 1.609982967376709} -11/07/2021 03:06:06 - INFO - __main__ - Step 41847: {'lr': 0.00041578127566011203, 'samples': 8034624, 'steps': 41846, 'loss/train': 1.7222378253936768} -11/07/2021 03:06:07 - INFO - __main__ - Step 41848: {'lr': 0.0004157773034790734, 'samples': 8034816, 'steps': 41847, 'loss/train': 1.5789622068405151} -11/07/2021 03:06:08 - INFO - __main__ - Step 41849: {'lr': 0.00041577333122333807, 'samples': 8035008, 'steps': 41848, 'loss/train': 0.21003803610801697} -11/07/2021 03:06:08 - INFO - __main__ - Step 41850: {'lr': 0.00041576935889290777, 'samples': 8035200, 'steps': 41849, 'loss/train': 1.580950140953064} -11/07/2021 03:06:08 - INFO - __main__ - Step 41851: {'lr': 0.0004157653864877845, 'samples': 8035392, 'steps': 41850, 'loss/train': 1.5882028341293335} -11/07/2021 03:06:09 - INFO - __main__ - Step 41852: {'lr': 0.00041576141400796984, 'samples': 8035584, 'steps': 41851, 'loss/train': 1.2623769044876099} -11/07/2021 03:06:09 - INFO - __main__ - Step 41853: {'lr': 0.00041575744145346563, 'samples': 8035776, 'steps': 41852, 'loss/train': 1.2826652526855469} -11/07/2021 03:06:10 - INFO - __main__ - Step 41854: {'lr': 0.00041575346882427366, 'samples': 8035968, 'steps': 41853, 'loss/train': 1.4938825368881226} -11/07/2021 03:06:10 - INFO - __main__ - Step 41855: {'lr': 0.00041574949612039583, 'samples': 8036160, 'steps': 41854, 'loss/train': 1.9276888370513916} -11/07/2021 03:06:11 - INFO - __main__ - Step 41856: {'lr': 0.0004157455233418337, 'samples': 8036352, 'steps': 41855, 'loss/train': 1.6604562997817993} -11/07/2021 03:06:11 - INFO - __main__ - Step 41857: {'lr': 0.0004157415504885893, 'samples': 8036544, 'steps': 41856, 'loss/train': 1.363741159439087} -11/07/2021 03:06:11 - INFO - __main__ - Step 41858: {'lr': 0.00041573757756066423, 'samples': 8036736, 'steps': 41857, 'loss/train': 0.9199839234352112} -11/07/2021 03:06:13 - INFO - __main__ - Step 41859: {'lr': 0.0004157336045580604, 'samples': 8036928, 'steps': 41858, 'loss/train': 1.5329149961471558} -11/07/2021 03:06:13 - INFO - __main__ - Step 41860: {'lr': 0.0004157296314807796, 'samples': 8037120, 'steps': 41859, 'loss/train': 1.2419116497039795} -11/07/2021 03:06:13 - INFO - __main__ - Step 41861: {'lr': 0.0004157256583288235, 'samples': 8037312, 'steps': 41860, 'loss/train': 0.6708611249923706} -11/07/2021 03:06:14 - INFO - __main__ - Step 41862: {'lr': 0.0004157216851021941, 'samples': 8037504, 'steps': 41861, 'loss/train': 2.5971829891204834} -11/07/2021 03:06:14 - INFO - __main__ - Step 41863: {'lr': 0.00041571771180089304, 'samples': 8037696, 'steps': 41862, 'loss/train': 1.778261423110962} -11/07/2021 03:06:15 - INFO - __main__ - Step 41864: {'lr': 0.0004157137384249221, 'samples': 8037888, 'steps': 41863, 'loss/train': 1.4639763832092285} -11/07/2021 03:06:15 - INFO - __main__ - Step 41865: {'lr': 0.00041570976497428303, 'samples': 8038080, 'steps': 41864, 'loss/train': 1.5496078729629517} -11/07/2021 03:06:16 - INFO - __main__ - Step 41866: {'lr': 0.0004157057914489778, 'samples': 8038272, 'steps': 41865, 'loss/train': 1.4821267127990723} -11/07/2021 03:06:16 - INFO - __main__ - Step 41867: {'lr': 0.00041570181784900806, 'samples': 8038464, 'steps': 41866, 'loss/train': 1.4663201570510864} -11/07/2021 03:06:16 - INFO - __main__ - Step 41868: {'lr': 0.0004156978441743756, 'samples': 8038656, 'steps': 41867, 'loss/train': 1.65707528591156} -11/07/2021 03:06:17 - INFO - __main__ - Step 41869: {'lr': 0.00041569387042508235, 'samples': 8038848, 'steps': 41868, 'loss/train': 1.712996244430542} -11/07/2021 03:06:18 - INFO - __main__ - Step 41870: {'lr': 0.0004156898966011299, 'samples': 8039040, 'steps': 41869, 'loss/train': 1.2954154014587402} -11/07/2021 03:06:18 - INFO - __main__ - Step 41871: {'lr': 0.0004156859227025202, 'samples': 8039232, 'steps': 41870, 'loss/train': 1.9032760858535767} -11/07/2021 03:06:18 - INFO - __main__ - Step 41872: {'lr': 0.0004156819487292549, 'samples': 8039424, 'steps': 41871, 'loss/train': 1.3794838190078735} -11/07/2021 03:06:19 - INFO - __main__ - Step 41873: {'lr': 0.00041567797468133595, 'samples': 8039616, 'steps': 41872, 'loss/train': 1.5694235563278198} -11/07/2021 03:06:20 - INFO - __main__ - Step 41874: {'lr': 0.00041567400055876505, 'samples': 8039808, 'steps': 41873, 'loss/train': 2.1152632236480713} -11/07/2021 03:06:20 - INFO - __main__ - Step 41875: {'lr': 0.00041567002636154406, 'samples': 8040000, 'steps': 41874, 'loss/train': 1.4536792039871216} -11/07/2021 03:06:21 - INFO - __main__ - Step 41876: {'lr': 0.0004156660520896746, 'samples': 8040192, 'steps': 41875, 'loss/train': 1.0573084354400635} -11/07/2021 03:06:21 - INFO - __main__ - Step 41877: {'lr': 0.00041566207774315866, 'samples': 8040384, 'steps': 41876, 'loss/train': 1.8460909128189087} -11/07/2021 03:06:21 - INFO - __main__ - Step 41878: {'lr': 0.0004156581033219979, 'samples': 8040576, 'steps': 41877, 'loss/train': 1.110854983329773} -11/07/2021 03:06:22 - INFO - __main__ - Step 41879: {'lr': 0.0004156541288261941, 'samples': 8040768, 'steps': 41878, 'loss/train': 1.5497623682022095} -11/07/2021 03:06:23 - INFO - __main__ - Step 41880: {'lr': 0.00041565015425574917, 'samples': 8040960, 'steps': 41879, 'loss/train': 1.6084986925125122} -11/07/2021 03:06:23 - INFO - __main__ - Step 41881: {'lr': 0.00041564617961066487, 'samples': 8041152, 'steps': 41880, 'loss/train': 1.2137629985809326} -11/07/2021 03:06:23 - INFO - __main__ - Step 41882: {'lr': 0.00041564220489094295, 'samples': 8041344, 'steps': 41881, 'loss/train': 1.3202635049819946} -11/07/2021 03:06:24 - INFO - __main__ - Step 41883: {'lr': 0.00041563823009658514, 'samples': 8041536, 'steps': 41882, 'loss/train': 1.5626225471496582} -11/07/2021 03:06:24 - INFO - __main__ - Step 41884: {'lr': 0.00041563425522759336, 'samples': 8041728, 'steps': 41883, 'loss/train': 1.4322011470794678} -11/07/2021 03:06:25 - INFO - __main__ - Step 41885: {'lr': 0.0004156302802839693, 'samples': 8041920, 'steps': 41884, 'loss/train': 1.412869930267334} -11/07/2021 03:06:25 - INFO - __main__ - Step 41886: {'lr': 0.0004156263052657148, 'samples': 8042112, 'steps': 41885, 'loss/train': 1.515254259109497} -11/07/2021 03:06:26 - INFO - __main__ - Step 41887: {'lr': 0.0004156223301728316, 'samples': 8042304, 'steps': 41886, 'loss/train': 1.881744146347046} -11/07/2021 03:06:26 - INFO - __main__ - Step 41888: {'lr': 0.0004156183550053216, 'samples': 8042496, 'steps': 41887, 'loss/train': 1.3872469663619995} -11/07/2021 03:06:26 - INFO - __main__ - Step 41889: {'lr': 0.0004156143797631866, 'samples': 8042688, 'steps': 41888, 'loss/train': 1.8121181726455688} -11/07/2021 03:06:28 - INFO - __main__ - Step 41890: {'lr': 0.0004156104044464282, 'samples': 8042880, 'steps': 41889, 'loss/train': 1.5599640607833862} -11/07/2021 03:06:28 - INFO - __main__ - Step 41891: {'lr': 0.00041560642905504833, 'samples': 8043072, 'steps': 41890, 'loss/train': 3.547255039215088} -11/07/2021 03:06:28 - INFO - __main__ - Step 41892: {'lr': 0.0004156024535890487, 'samples': 8043264, 'steps': 41891, 'loss/train': 1.33156156539917} -11/07/2021 03:06:29 - INFO - __main__ - Step 41893: {'lr': 0.00041559847804843123, 'samples': 8043456, 'steps': 41892, 'loss/train': 1.6302646398544312} -11/07/2021 03:06:29 - INFO - __main__ - Step 41894: {'lr': 0.0004155945024331976, 'samples': 8043648, 'steps': 41893, 'loss/train': 1.2952686548233032} -11/07/2021 03:06:30 - INFO - __main__ - Step 41895: {'lr': 0.00041559052674334975, 'samples': 8043840, 'steps': 41894, 'loss/train': 1.4727513790130615} -11/07/2021 03:06:30 - INFO - __main__ - Step 41896: {'lr': 0.0004155865509788893, 'samples': 8044032, 'steps': 41895, 'loss/train': 0.39268600940704346} -11/07/2021 03:06:31 - INFO - __main__ - Step 41897: {'lr': 0.00041558257513981805, 'samples': 8044224, 'steps': 41896, 'loss/train': 1.482244849205017} -11/07/2021 03:06:31 - INFO - __main__ - Step 41898: {'lr': 0.00041557859922613795, 'samples': 8044416, 'steps': 41897, 'loss/train': 1.8280117511749268} -11/07/2021 03:06:31 - INFO - __main__ - Step 41899: {'lr': 0.00041557462323785053, 'samples': 8044608, 'steps': 41898, 'loss/train': 1.4932671785354614} -11/07/2021 03:06:32 - INFO - __main__ - Step 41900: {'lr': 0.00041557064717495786, 'samples': 8044800, 'steps': 41899, 'loss/train': 1.7836129665374756} -11/07/2021 03:06:33 - INFO - __main__ - Step 41901: {'lr': 0.00041556667103746157, 'samples': 8044992, 'steps': 41900, 'loss/train': 1.612501859664917} -11/07/2021 03:06:33 - INFO - __main__ - Step 41902: {'lr': 0.00041556269482536355, 'samples': 8045184, 'steps': 41901, 'loss/train': 1.2717280387878418} -11/07/2021 03:06:34 - INFO - __main__ - Step 41903: {'lr': 0.00041555871853866553, 'samples': 8045376, 'steps': 41902, 'loss/train': 1.4974288940429688} -11/07/2021 03:06:34 - INFO - __main__ - Step 41904: {'lr': 0.00041555474217736926, 'samples': 8045568, 'steps': 41903, 'loss/train': 1.5328596830368042} -11/07/2021 03:06:34 - INFO - __main__ - Step 41905: {'lr': 0.0004155507657414766, 'samples': 8045760, 'steps': 41904, 'loss/train': 1.8202886581420898} -11/07/2021 03:06:35 - INFO - __main__ - Step 41906: {'lr': 0.0004155467892309893, 'samples': 8045952, 'steps': 41905, 'loss/train': 1.405146837234497} -11/07/2021 03:06:36 - INFO - __main__ - Step 41907: {'lr': 0.0004155428126459092, 'samples': 8046144, 'steps': 41906, 'loss/train': 1.0993465185165405} -11/07/2021 03:06:36 - INFO - __main__ - Step 41908: {'lr': 0.00041553883598623804, 'samples': 8046336, 'steps': 41907, 'loss/train': 1.3472046852111816} -11/07/2021 03:06:36 - INFO - __main__ - Step 41909: {'lr': 0.00041553485925197763, 'samples': 8046528, 'steps': 41908, 'loss/train': 2.0090084075927734} -11/07/2021 03:06:37 - INFO - __main__ - Step 41910: {'lr': 0.00041553088244312975, 'samples': 8046720, 'steps': 41909, 'loss/train': 1.7823117971420288} -11/07/2021 03:06:38 - INFO - __main__ - Step 41911: {'lr': 0.0004155269055596963, 'samples': 8046912, 'steps': 41910, 'loss/train': 0.9449849128723145} -11/07/2021 03:06:38 - INFO - __main__ - Step 41912: {'lr': 0.0004155229286016789, 'samples': 8047104, 'steps': 41911, 'loss/train': 1.4676487445831299} -11/07/2021 03:06:39 - INFO - __main__ - Step 41913: {'lr': 0.0004155189515690794, 'samples': 8047296, 'steps': 41912, 'loss/train': 1.838443636894226} -11/07/2021 03:06:39 - INFO - __main__ - Step 41914: {'lr': 0.0004155149744618997, 'samples': 8047488, 'steps': 41913, 'loss/train': 1.6639630794525146} -11/07/2021 03:06:39 - INFO - __main__ - Step 41915: {'lr': 0.0004155109972801414, 'samples': 8047680, 'steps': 41914, 'loss/train': 1.3994457721710205} -11/07/2021 03:06:40 - INFO - __main__ - Step 41916: {'lr': 0.0004155070200238065, 'samples': 8047872, 'steps': 41915, 'loss/train': 1.8797807693481445} -11/07/2021 03:06:41 - INFO - __main__ - Step 41917: {'lr': 0.00041550304269289664, 'samples': 8048064, 'steps': 41916, 'loss/train': 1.755118489265442} -11/07/2021 03:06:41 - INFO - __main__ - Step 41918: {'lr': 0.00041549906528741366, 'samples': 8048256, 'steps': 41917, 'loss/train': 2.0328023433685303} -11/07/2021 03:06:41 - INFO - __main__ - Step 41919: {'lr': 0.0004154950878073594, 'samples': 8048448, 'steps': 41918, 'loss/train': 1.6511229276657104} -11/07/2021 03:06:42 - INFO - __main__ - Step 41920: {'lr': 0.0004154911102527356, 'samples': 8048640, 'steps': 41919, 'loss/train': 1.6904728412628174} -11/07/2021 03:06:42 - INFO - __main__ - Step 41921: {'lr': 0.00041548713262354396, 'samples': 8048832, 'steps': 41920, 'loss/train': 1.1226547956466675} -11/07/2021 03:06:43 - INFO - __main__ - Step 41922: {'lr': 0.0004154831549197865, 'samples': 8049024, 'steps': 41921, 'loss/train': 1.5018033981323242} -11/07/2021 03:06:43 - INFO - __main__ - Step 41923: {'lr': 0.0004154791771414648, 'samples': 8049216, 'steps': 41922, 'loss/train': 2.225022077560425} -11/07/2021 03:06:44 - INFO - __main__ - Step 41924: {'lr': 0.0004154751992885808, 'samples': 8049408, 'steps': 41923, 'loss/train': 0.46176427602767944} -11/07/2021 03:06:44 - INFO - __main__ - Step 41925: {'lr': 0.0004154712213611362, 'samples': 8049600, 'steps': 41924, 'loss/train': 1.9820481538772583} -11/07/2021 03:06:44 - INFO - __main__ - Step 41926: {'lr': 0.0004154672433591328, 'samples': 8049792, 'steps': 41925, 'loss/train': 1.159741997718811} -11/07/2021 03:06:46 - INFO - __main__ - Step 41927: {'lr': 0.0004154632652825724, 'samples': 8049984, 'steps': 41926, 'loss/train': 1.5462394952774048} -11/07/2021 03:06:46 - INFO - __main__ - Step 41928: {'lr': 0.00041545928713145687, 'samples': 8050176, 'steps': 41927, 'loss/train': 1.55469810962677} -11/07/2021 03:06:46 - INFO - __main__ - Step 41929: {'lr': 0.00041545530890578784, 'samples': 8050368, 'steps': 41928, 'loss/train': 1.1376702785491943} -11/07/2021 03:06:47 - INFO - __main__ - Step 41930: {'lr': 0.00041545133060556734, 'samples': 8050560, 'steps': 41929, 'loss/train': 1.464155912399292} -11/07/2021 03:06:47 - INFO - __main__ - Step 41931: {'lr': 0.00041544735223079693, 'samples': 8050752, 'steps': 41930, 'loss/train': 1.6106220483779907} -11/07/2021 03:06:48 - INFO - __main__ - Step 41932: {'lr': 0.0004154433737814786, 'samples': 8050944, 'steps': 41931, 'loss/train': 1.9208873510360718} -11/07/2021 03:06:48 - INFO - __main__ - Step 41933: {'lr': 0.0004154393952576139, 'samples': 8051136, 'steps': 41932, 'loss/train': 1.5260471105575562} -11/07/2021 03:06:49 - INFO - __main__ - Step 41934: {'lr': 0.00041543541665920483, 'samples': 8051328, 'steps': 41933, 'loss/train': 1.2168070077896118} -11/07/2021 03:06:49 - INFO - __main__ - Step 41935: {'lr': 0.000415431437986253, 'samples': 8051520, 'steps': 41934, 'loss/train': 1.0677088499069214} -11/07/2021 03:06:49 - INFO - __main__ - Step 41936: {'lr': 0.00041542745923876047, 'samples': 8051712, 'steps': 41935, 'loss/train': 0.22388498485088348} -11/07/2021 03:06:51 - INFO - __main__ - Step 41937: {'lr': 0.00041542348041672886, 'samples': 8051904, 'steps': 41936, 'loss/train': 0.9962683916091919} -11/07/2021 03:06:51 - INFO - __main__ - Step 41938: {'lr': 0.00041541950152015997, 'samples': 8052096, 'steps': 41937, 'loss/train': 1.61919105052948} -11/07/2021 03:06:51 - INFO - __main__ - Step 41939: {'lr': 0.0004154155225490555, 'samples': 8052288, 'steps': 41938, 'loss/train': 2.00990629196167} -11/07/2021 03:06:52 - INFO - __main__ - Step 41940: {'lr': 0.0004154115435034175, 'samples': 8052480, 'steps': 41939, 'loss/train': 1.5125808715820312} -11/07/2021 03:06:52 - INFO - __main__ - Step 41941: {'lr': 0.00041540756438324746, 'samples': 8052672, 'steps': 41940, 'loss/train': 2.0472888946533203} -11/07/2021 03:06:52 - INFO - __main__ - Step 41942: {'lr': 0.0004154035851885474, 'samples': 8052864, 'steps': 41941, 'loss/train': 1.1914267539978027} -11/07/2021 03:06:54 - INFO - __main__ - Step 41943: {'lr': 0.0004153996059193191, 'samples': 8053056, 'steps': 41942, 'loss/train': 0.6326480507850647} -11/07/2021 03:06:54 - INFO - __main__ - Step 41944: {'lr': 0.0004153956265755642, 'samples': 8053248, 'steps': 41943, 'loss/train': 1.6083602905273438} -11/07/2021 03:06:54 - INFO - __main__ - Step 41945: {'lr': 0.0004153916471572846, 'samples': 8053440, 'steps': 41944, 'loss/train': 0.9648074507713318} -11/07/2021 03:06:55 - INFO - __main__ - Step 41946: {'lr': 0.0004153876676644821, 'samples': 8053632, 'steps': 41945, 'loss/train': 1.5843206644058228} -11/07/2021 03:06:55 - INFO - __main__ - Step 41947: {'lr': 0.0004153836880971585, 'samples': 8053824, 'steps': 41946, 'loss/train': 0.8655702471733093} -11/07/2021 03:06:56 - INFO - __main__ - Step 41948: {'lr': 0.00041537970845531547, 'samples': 8054016, 'steps': 41947, 'loss/train': 1.5090172290802002} -11/07/2021 03:06:56 - INFO - __main__ - Step 41949: {'lr': 0.00041537572873895503, 'samples': 8054208, 'steps': 41948, 'loss/train': 1.765095829963684} -11/07/2021 03:06:57 - INFO - __main__ - Step 41950: {'lr': 0.00041537174894807873, 'samples': 8054400, 'steps': 41949, 'loss/train': 1.4930294752120972} -11/07/2021 03:06:57 - INFO - __main__ - Step 41951: {'lr': 0.00041536776908268847, 'samples': 8054592, 'steps': 41950, 'loss/train': 1.2215300798416138} -11/07/2021 03:06:57 - INFO - __main__ - Step 41952: {'lr': 0.00041536378914278603, 'samples': 8054784, 'steps': 41951, 'loss/train': 1.7548632621765137} -11/07/2021 03:06:58 - INFO - __main__ - Step 41953: {'lr': 0.00041535980912837326, 'samples': 8054976, 'steps': 41952, 'loss/train': 1.6592971086502075} -11/07/2021 03:07:00 - INFO - __main__ - Step 41954: {'lr': 0.00041535582903945195, 'samples': 8055168, 'steps': 41953, 'loss/train': 1.9381015300750732} -11/07/2021 03:07:00 - INFO - __main__ - Step 41955: {'lr': 0.00041535184887602384, 'samples': 8055360, 'steps': 41954, 'loss/train': 1.328749656677246} -11/07/2021 03:07:00 - INFO - __main__ - Step 41956: {'lr': 0.0004153478686380907, 'samples': 8055552, 'steps': 41955, 'loss/train': 1.5953503847122192} -11/07/2021 03:07:01 - INFO - __main__ - Step 41957: {'lr': 0.0004153438883256544, 'samples': 8055744, 'steps': 41956, 'loss/train': 1.5133731365203857} -11/07/2021 03:07:01 - INFO - __main__ - Step 41958: {'lr': 0.0004153399079387167, 'samples': 8055936, 'steps': 41957, 'loss/train': 1.5228304862976074} -11/07/2021 03:07:01 - INFO - __main__ - Step 41959: {'lr': 0.00041533592747727935, 'samples': 8056128, 'steps': 41958, 'loss/train': 1.3258435726165771} -11/07/2021 03:07:02 - INFO - __main__ - Step 41960: {'lr': 0.00041533194694134414, 'samples': 8056320, 'steps': 41959, 'loss/train': 1.7467302083969116} -11/07/2021 03:07:03 - INFO - __main__ - Step 41961: {'lr': 0.00041532796633091297, 'samples': 8056512, 'steps': 41960, 'loss/train': 1.7610151767730713} -11/07/2021 03:07:03 - INFO - __main__ - Step 41962: {'lr': 0.00041532398564598757, 'samples': 8056704, 'steps': 41961, 'loss/train': 1.536446213722229} -11/07/2021 03:07:03 - INFO - __main__ - Step 41963: {'lr': 0.0004153200048865697, 'samples': 8056896, 'steps': 41962, 'loss/train': 1.8210513591766357} -11/07/2021 03:07:04 - INFO - __main__ - Step 41964: {'lr': 0.0004153160240526612, 'samples': 8057088, 'steps': 41963, 'loss/train': 1.6114858388900757} -11/07/2021 03:07:04 - INFO - __main__ - Step 41965: {'lr': 0.0004153120431442639, 'samples': 8057280, 'steps': 41964, 'loss/train': 1.4403822422027588} -11/07/2021 03:07:05 - INFO - __main__ - Step 41966: {'lr': 0.00041530806216137953, 'samples': 8057472, 'steps': 41965, 'loss/train': 1.6566977500915527} -11/07/2021 03:07:06 - INFO - __main__ - Step 41967: {'lr': 0.00041530408110400987, 'samples': 8057664, 'steps': 41966, 'loss/train': 1.118053913116455} -11/07/2021 03:07:06 - INFO - __main__ - Step 41968: {'lr': 0.00041530009997215665, 'samples': 8057856, 'steps': 41967, 'loss/train': 1.4030784368515015} -11/07/2021 03:07:06 - INFO - __main__ - Step 41969: {'lr': 0.00041529611876582194, 'samples': 8058048, 'steps': 41968, 'loss/train': 1.3769654035568237} -11/07/2021 03:07:07 - INFO - __main__ - Step 41970: {'lr': 0.00041529213748500726, 'samples': 8058240, 'steps': 41969, 'loss/train': 1.3986589908599854} -11/07/2021 03:07:07 - INFO - __main__ - Step 41971: {'lr': 0.0004152881561297145, 'samples': 8058432, 'steps': 41970, 'loss/train': 1.9423401355743408} -11/07/2021 03:07:08 - INFO - __main__ - Step 41972: {'lr': 0.0004152841746999454, 'samples': 8058624, 'steps': 41971, 'loss/train': 1.5982258319854736} -11/07/2021 03:07:08 - INFO - __main__ - Step 41973: {'lr': 0.00041528019319570186, 'samples': 8058816, 'steps': 41972, 'loss/train': 1.6509596109390259} -11/07/2021 03:07:09 - INFO - __main__ - Step 41974: {'lr': 0.0004152762116169856, 'samples': 8059008, 'steps': 41973, 'loss/train': 1.199228048324585} -11/07/2021 03:07:09 - INFO - __main__ - Step 41975: {'lr': 0.00041527222996379844, 'samples': 8059200, 'steps': 41974, 'loss/train': 1.4981478452682495} -11/07/2021 03:07:09 - INFO - __main__ - Step 41976: {'lr': 0.0004152682482361422, 'samples': 8059392, 'steps': 41975, 'loss/train': 1.662643313407898} -11/07/2021 03:07:11 - INFO - __main__ - Step 41977: {'lr': 0.0004152642664340185, 'samples': 8059584, 'steps': 41976, 'loss/train': 1.1987229585647583} -11/07/2021 03:07:11 - INFO - __main__ - Step 41978: {'lr': 0.00041526028455742936, 'samples': 8059776, 'steps': 41977, 'loss/train': 0.48487409949302673} -11/07/2021 03:07:12 - INFO - __main__ - Step 41979: {'lr': 0.0004152563026063765, 'samples': 8059968, 'steps': 41978, 'loss/train': 1.4140325784683228} -11/07/2021 03:07:12 - INFO - __main__ - Step 41980: {'lr': 0.00041525232058086173, 'samples': 8060160, 'steps': 41979, 'loss/train': 1.611794114112854} -11/07/2021 03:07:12 - INFO - __main__ - Step 41981: {'lr': 0.0004152483384808867, 'samples': 8060352, 'steps': 41980, 'loss/train': 1.3852312564849854} -11/07/2021 03:07:13 - INFO - __main__ - Step 41982: {'lr': 0.0004152443563064534, 'samples': 8060544, 'steps': 41981, 'loss/train': 0.39391547441482544} -11/07/2021 03:07:14 - INFO - __main__ - Step 41983: {'lr': 0.00041524037405756356, 'samples': 8060736, 'steps': 41982, 'loss/train': 1.5800052881240845} -11/07/2021 03:07:14 - INFO - __main__ - Step 41984: {'lr': 0.0004152363917342189, 'samples': 8060928, 'steps': 41983, 'loss/train': 1.337543249130249} -11/07/2021 03:07:15 - INFO - __main__ - Step 41985: {'lr': 0.00041523240933642134, 'samples': 8061120, 'steps': 41984, 'loss/train': 1.818328857421875} -11/07/2021 03:07:15 - INFO - __main__ - Step 41986: {'lr': 0.00041522842686417255, 'samples': 8061312, 'steps': 41985, 'loss/train': 1.1234190464019775} -11/07/2021 03:07:15 - INFO - __main__ - Step 41987: {'lr': 0.0004152244443174744, 'samples': 8061504, 'steps': 41986, 'loss/train': 0.8166891932487488} -11/07/2021 03:07:16 - INFO - __main__ - Step 41988: {'lr': 0.00041522046169632863, 'samples': 8061696, 'steps': 41987, 'loss/train': 2.011791706085205} -11/07/2021 03:07:16 - INFO - __main__ - Step 41989: {'lr': 0.0004152164790007371, 'samples': 8061888, 'steps': 41988, 'loss/train': 1.5016108751296997} -11/07/2021 03:07:17 - INFO - __main__ - Step 41990: {'lr': 0.00041521249623070164, 'samples': 8062080, 'steps': 41989, 'loss/train': 1.6521884202957153} -11/07/2021 03:07:17 - INFO - __main__ - Step 41991: {'lr': 0.0004152085133862239, 'samples': 8062272, 'steps': 41990, 'loss/train': 1.3991754055023193} -11/07/2021 03:07:18 - INFO - __main__ - Step 41992: {'lr': 0.0004152045304673058, 'samples': 8062464, 'steps': 41991, 'loss/train': 1.167265772819519} -11/07/2021 03:07:18 - INFO - __main__ - Step 41993: {'lr': 0.000415200547473949, 'samples': 8062656, 'steps': 41992, 'loss/train': 1.5853790044784546} -11/07/2021 03:07:19 - INFO - __main__ - Step 41994: {'lr': 0.00041519656440615544, 'samples': 8062848, 'steps': 41993, 'loss/train': 1.2686554193496704} -11/07/2021 03:07:20 - INFO - __main__ - Step 41995: {'lr': 0.00041519258126392685, 'samples': 8063040, 'steps': 41994, 'loss/train': 1.9380366802215576} -11/07/2021 03:07:20 - INFO - __main__ - Step 41996: {'lr': 0.00041518859804726507, 'samples': 8063232, 'steps': 41995, 'loss/train': 1.2416760921478271} -11/07/2021 03:07:20 - INFO - __main__ - Step 41997: {'lr': 0.00041518461475617183, 'samples': 8063424, 'steps': 41996, 'loss/train': 1.2034986019134521} -11/07/2021 03:07:21 - INFO - __main__ - Step 41998: {'lr': 0.00041518063139064893, 'samples': 8063616, 'steps': 41997, 'loss/train': 1.7212826013565063} -11/07/2021 03:07:21 - INFO - __main__ - Step 41999: {'lr': 0.0004151766479506982, 'samples': 8063808, 'steps': 41998, 'loss/train': 1.2917431592941284} -11/07/2021 03:07:23 - INFO - __main__ - Step 42000: {'lr': 0.0004151726644363214, 'samples': 8064000, 'steps': 41999, 'loss/train': 1.8012648820877075} -11/07/2021 03:07:23 - INFO - __main__ - Step 42001: {'lr': 0.00041516868084752034, 'samples': 8064192, 'steps': 42000, 'loss/train': 1.4202122688293457} -11/07/2021 03:07:23 - INFO - __main__ - Step 42002: {'lr': 0.0004151646971842968, 'samples': 8064384, 'steps': 42001, 'loss/train': 1.7842530012130737} -11/07/2021 03:07:24 - INFO - __main__ - Step 42003: {'lr': 0.00041516071344665275, 'samples': 8064576, 'steps': 42002, 'loss/train': 1.8126933574676514} -11/07/2021 03:07:24 - INFO - __main__ - Step 42004: {'lr': 0.00041515672963458975, 'samples': 8064768, 'steps': 42003, 'loss/train': 1.757590413093567} -11/07/2021 03:07:25 - INFO - __main__ - Step 42005: {'lr': 0.00041515274574810965, 'samples': 8064960, 'steps': 42004, 'loss/train': 1.5378392934799194} -11/07/2021 03:07:25 - INFO - __main__ - Step 42006: {'lr': 0.00041514876178721426, 'samples': 8065152, 'steps': 42005, 'loss/train': 1.984458565711975} -11/07/2021 03:07:25 - INFO - __main__ - Step 42007: {'lr': 0.0004151447777519054, 'samples': 8065344, 'steps': 42006, 'loss/train': 1.7512965202331543} -11/07/2021 03:07:26 - INFO - __main__ - Step 42008: {'lr': 0.00041514079364218483, 'samples': 8065536, 'steps': 42007, 'loss/train': 1.270204782485962} -11/07/2021 03:07:27 - INFO - __main__ - Step 42009: {'lr': 0.0004151368094580544, 'samples': 8065728, 'steps': 42008, 'loss/train': 1.3795816898345947} -11/07/2021 03:07:27 - INFO - __main__ - Step 42010: {'lr': 0.0004151328251995159, 'samples': 8065920, 'steps': 42009, 'loss/train': 1.1478238105773926} -11/07/2021 03:07:27 - INFO - __main__ - Step 42011: {'lr': 0.000415128840866571, 'samples': 8066112, 'steps': 42010, 'loss/train': 5.797067642211914} -11/07/2021 03:07:28 - INFO - __main__ - Step 42012: {'lr': 0.00041512485645922164, 'samples': 8066304, 'steps': 42011, 'loss/train': 1.7063237428665161} -11/07/2021 03:07:28 - INFO - __main__ - Step 42013: {'lr': 0.0004151208719774696, 'samples': 8066496, 'steps': 42012, 'loss/train': 1.5984175205230713} -11/07/2021 03:07:29 - INFO - __main__ - Step 42014: {'lr': 0.0004151168874213166, 'samples': 8066688, 'steps': 42013, 'loss/train': 1.807763934135437} -11/07/2021 03:07:29 - INFO - __main__ - Step 42015: {'lr': 0.00041511290279076454, 'samples': 8066880, 'steps': 42014, 'loss/train': 1.4820877313613892} -11/07/2021 03:07:30 - INFO - __main__ - Step 42016: {'lr': 0.0004151089180858151, 'samples': 8067072, 'steps': 42015, 'loss/train': 1.1027518510818481} -11/07/2021 03:07:30 - INFO - __main__ - Step 42017: {'lr': 0.00041510493330647015, 'samples': 8067264, 'steps': 42016, 'loss/train': 1.7387123107910156} -11/07/2021 03:07:31 - INFO - __main__ - Step 42018: {'lr': 0.00041510094845273145, 'samples': 8067456, 'steps': 42017, 'loss/train': 1.5490429401397705} -11/07/2021 03:07:32 - INFO - __main__ - Step 42019: {'lr': 0.0004150969635246008, 'samples': 8067648, 'steps': 42018, 'loss/train': 1.4055429697036743} -11/07/2021 03:07:32 - INFO - __main__ - Step 42020: {'lr': 0.00041509297852208003, 'samples': 8067840, 'steps': 42019, 'loss/train': 1.8538402318954468} -11/07/2021 03:07:32 - INFO - __main__ - Step 42021: {'lr': 0.00041508899344517094, 'samples': 8068032, 'steps': 42020, 'loss/train': 1.2977536916732788} -11/07/2021 03:07:33 - INFO - __main__ - Step 42022: {'lr': 0.0004150850082938752, 'samples': 8068224, 'steps': 42021, 'loss/train': 1.055382251739502} -11/07/2021 03:07:33 - INFO - __main__ - Step 42023: {'lr': 0.00041508102306819485, 'samples': 8068416, 'steps': 42022, 'loss/train': 1.807405710220337} -11/07/2021 03:07:34 - INFO - __main__ - Step 42024: {'lr': 0.0004150770377681314, 'samples': 8068608, 'steps': 42023, 'loss/train': 1.8987107276916504} -11/07/2021 03:07:34 - INFO - __main__ - Step 42025: {'lr': 0.00041507305239368684, 'samples': 8068800, 'steps': 42024, 'loss/train': 1.1936386823654175} -11/07/2021 03:07:35 - INFO - __main__ - Step 42026: {'lr': 0.0004150690669448629, 'samples': 8068992, 'steps': 42025, 'loss/train': 1.6065560579299927} -11/07/2021 03:07:35 - INFO - __main__ - Step 42027: {'lr': 0.0004150650814216614, 'samples': 8069184, 'steps': 42026, 'loss/train': 2.0050127506256104} -11/07/2021 03:07:36 - INFO - __main__ - Step 42028: {'lr': 0.0004150610958240841, 'samples': 8069376, 'steps': 42027, 'loss/train': 1.268518328666687} -11/07/2021 03:07:36 - INFO - __main__ - Step 42029: {'lr': 0.00041505711015213284, 'samples': 8069568, 'steps': 42028, 'loss/train': 1.7336264848709106} -11/07/2021 03:07:37 - INFO - __main__ - Step 42030: {'lr': 0.0004150531244058094, 'samples': 8069760, 'steps': 42029, 'loss/train': 1.4684981107711792} -11/07/2021 03:07:37 - INFO - __main__ - Step 42031: {'lr': 0.00041504913858511557, 'samples': 8069952, 'steps': 42030, 'loss/train': 1.1485469341278076} -11/07/2021 03:07:38 - INFO - __main__ - Step 42032: {'lr': 0.0004150451526900531, 'samples': 8070144, 'steps': 42031, 'loss/train': 1.8169656991958618} -11/07/2021 03:07:38 - INFO - __main__ - Step 42033: {'lr': 0.00041504116672062385, 'samples': 8070336, 'steps': 42032, 'loss/train': 1.820695400238037} -11/07/2021 03:07:38 - INFO - __main__ - Step 42034: {'lr': 0.0004150371806768296, 'samples': 8070528, 'steps': 42033, 'loss/train': 1.4767593145370483} -11/07/2021 03:07:39 - INFO - __main__ - Step 42035: {'lr': 0.00041503319455867216, 'samples': 8070720, 'steps': 42034, 'loss/train': 1.8394572734832764} -11/07/2021 03:07:40 - INFO - __main__ - Step 42036: {'lr': 0.0004150292083661533, 'samples': 8070912, 'steps': 42035, 'loss/train': 1.9457099437713623} -11/07/2021 03:07:40 - INFO - __main__ - Step 42037: {'lr': 0.00041502522209927486, 'samples': 8071104, 'steps': 42036, 'loss/train': 2.1062285900115967} -11/07/2021 03:07:40 - INFO - __main__ - Step 42038: {'lr': 0.00041502123575803854, 'samples': 8071296, 'steps': 42037, 'loss/train': 1.010448932647705} -11/07/2021 03:07:41 - INFO - __main__ - Step 42039: {'lr': 0.0004150172493424462, 'samples': 8071488, 'steps': 42038, 'loss/train': 1.797959804534912} -11/07/2021 03:07:41 - INFO - __main__ - Step 42040: {'lr': 0.00041501326285249963, 'samples': 8071680, 'steps': 42039, 'loss/train': 1.6893484592437744} -11/07/2021 03:07:42 - INFO - __main__ - Step 42041: {'lr': 0.0004150092762882007, 'samples': 8071872, 'steps': 42040, 'loss/train': 1.5143741369247437} -11/07/2021 03:07:43 - INFO - __main__ - Step 42042: {'lr': 0.00041500528964955106, 'samples': 8072064, 'steps': 42041, 'loss/train': 1.83730149269104} -11/07/2021 03:07:43 - INFO - __main__ - Step 42043: {'lr': 0.0004150013029365527, 'samples': 8072256, 'steps': 42042, 'loss/train': 1.7041666507720947} -11/07/2021 03:07:43 - INFO - __main__ - Step 42044: {'lr': 0.0004149973161492072, 'samples': 8072448, 'steps': 42043, 'loss/train': 1.4257150888442993} -11/07/2021 03:07:44 - INFO - __main__ - Step 42045: {'lr': 0.0004149933292875164, 'samples': 8072640, 'steps': 42044, 'loss/train': 1.5595922470092773} -11/07/2021 03:07:44 - INFO - __main__ - Step 42046: {'lr': 0.0004149893423514822, 'samples': 8072832, 'steps': 42045, 'loss/train': 1.4120824337005615} -11/07/2021 03:07:45 - INFO - __main__ - Step 42047: {'lr': 0.0004149853553411064, 'samples': 8073024, 'steps': 42046, 'loss/train': 1.8442844152450562} -11/07/2021 03:07:45 - INFO - __main__ - Step 42048: {'lr': 0.00041498136825639074, 'samples': 8073216, 'steps': 42047, 'loss/train': 1.3788831233978271} -11/07/2021 03:07:46 - INFO - __main__ - Step 42049: {'lr': 0.000414977381097337, 'samples': 8073408, 'steps': 42048, 'loss/train': 0.8893455862998962} -11/07/2021 03:07:46 - INFO - __main__ - Step 42050: {'lr': 0.000414973393863947, 'samples': 8073600, 'steps': 42049, 'loss/train': 1.5420819520950317} -11/07/2021 03:07:46 - INFO - __main__ - Step 42051: {'lr': 0.0004149694065562225, 'samples': 8073792, 'steps': 42050, 'loss/train': 0.9688058495521545} -11/07/2021 03:07:48 - INFO - __main__ - Step 42052: {'lr': 0.0004149654191741654, 'samples': 8073984, 'steps': 42051, 'loss/train': 1.6391124725341797} -11/07/2021 03:07:48 - INFO - __main__ - Step 42053: {'lr': 0.0004149614317177774, 'samples': 8074176, 'steps': 42052, 'loss/train': 1.605303168296814} -11/07/2021 03:07:48 - INFO - __main__ - Step 42054: {'lr': 0.00041495744418706027, 'samples': 8074368, 'steps': 42053, 'loss/train': 1.5720794200897217} -11/07/2021 03:07:49 - INFO - __main__ - Step 42055: {'lr': 0.00041495345658201587, 'samples': 8074560, 'steps': 42054, 'loss/train': 1.0581259727478027} -11/07/2021 03:07:49 - INFO - __main__ - Step 42056: {'lr': 0.00041494946890264606, 'samples': 8074752, 'steps': 42055, 'loss/train': 1.635392189025879} -11/07/2021 03:07:50 - INFO - __main__ - Step 42057: {'lr': 0.00041494548114895255, 'samples': 8074944, 'steps': 42056, 'loss/train': 1.5409810543060303} -11/07/2021 03:07:51 - INFO - __main__ - Step 42058: {'lr': 0.0004149414933209371, 'samples': 8075136, 'steps': 42057, 'loss/train': 1.8882447481155396} -11/07/2021 03:07:51 - INFO - __main__ - Step 42059: {'lr': 0.00041493750541860165, 'samples': 8075328, 'steps': 42058, 'loss/train': 0.4278101921081543} -11/07/2021 03:07:51 - INFO - __main__ - Step 42060: {'lr': 0.0004149335174419478, 'samples': 8075520, 'steps': 42059, 'loss/train': 1.5596524477005005} -11/07/2021 03:07:52 - INFO - __main__ - Step 42061: {'lr': 0.0004149295293909775, 'samples': 8075712, 'steps': 42060, 'loss/train': 1.5847713947296143} -11/07/2021 03:07:53 - INFO - __main__ - Step 42062: {'lr': 0.0004149255412656925, 'samples': 8075904, 'steps': 42061, 'loss/train': 1.6529903411865234} -11/07/2021 03:07:53 - INFO - __main__ - Step 42063: {'lr': 0.00041492155306609456, 'samples': 8076096, 'steps': 42062, 'loss/train': 2.4510741233825684} -11/07/2021 03:07:53 - INFO - __main__ - Step 42064: {'lr': 0.00041491756479218557, 'samples': 8076288, 'steps': 42063, 'loss/train': 1.7397103309631348} -11/07/2021 03:07:54 - INFO - __main__ - Step 42065: {'lr': 0.0004149135764439672, 'samples': 8076480, 'steps': 42064, 'loss/train': 1.273585557937622} -11/07/2021 03:07:54 - INFO - __main__ - Step 42066: {'lr': 0.0004149095880214414, 'samples': 8076672, 'steps': 42065, 'loss/train': 1.6326723098754883} -11/07/2021 03:07:55 - INFO - __main__ - Step 42067: {'lr': 0.00041490559952460983, 'samples': 8076864, 'steps': 42066, 'loss/train': 1.0523433685302734} -11/07/2021 03:07:55 - INFO - __main__ - Step 42068: {'lr': 0.00041490161095347435, 'samples': 8077056, 'steps': 42067, 'loss/train': 1.2187541723251343} -11/07/2021 03:07:56 - INFO - __main__ - Step 42069: {'lr': 0.00041489762230803676, 'samples': 8077248, 'steps': 42068, 'loss/train': 1.519520878791809} -11/07/2021 03:07:56 - INFO - __main__ - Step 42070: {'lr': 0.00041489363358829885, 'samples': 8077440, 'steps': 42069, 'loss/train': 1.3521915674209595} -11/07/2021 03:07:57 - INFO - __main__ - Step 42071: {'lr': 0.0004148896447942624, 'samples': 8077632, 'steps': 42070, 'loss/train': 1.5754438638687134} -11/07/2021 03:07:57 - INFO - __main__ - Step 42072: {'lr': 0.00041488565592592917, 'samples': 8077824, 'steps': 42071, 'loss/train': 1.6142688989639282} -11/07/2021 03:07:58 - INFO - __main__ - Step 42073: {'lr': 0.0004148816669833011, 'samples': 8078016, 'steps': 42072, 'loss/train': 2.0739517211914062} -11/07/2021 03:07:58 - INFO - __main__ - Step 42074: {'lr': 0.0004148776779663799, 'samples': 8078208, 'steps': 42073, 'loss/train': 1.590319275856018} -11/07/2021 03:07:59 - INFO - __main__ - Step 42075: {'lr': 0.00041487368887516726, 'samples': 8078400, 'steps': 42074, 'loss/train': 1.4445720911026} -11/07/2021 03:07:59 - INFO - __main__ - Step 42076: {'lr': 0.00041486969970966516, 'samples': 8078592, 'steps': 42075, 'loss/train': 1.8851046562194824} -11/07/2021 03:07:59 - INFO - __main__ - Step 42077: {'lr': 0.0004148657104698753, 'samples': 8078784, 'steps': 42076, 'loss/train': 1.7685871124267578} -11/07/2021 03:08:00 - INFO - __main__ - Step 42078: {'lr': 0.00041486172115579945, 'samples': 8078976, 'steps': 42077, 'loss/train': 1.370727777481079} -11/07/2021 03:08:01 - INFO - __main__ - Step 42079: {'lr': 0.00041485773176743953, 'samples': 8079168, 'steps': 42078, 'loss/train': 1.630990743637085} -11/07/2021 03:08:01 - INFO - __main__ - Step 42080: {'lr': 0.00041485374230479724, 'samples': 8079360, 'steps': 42079, 'loss/train': 1.9803260564804077} -11/07/2021 03:08:01 - INFO - __main__ - Step 42081: {'lr': 0.00041484975276787436, 'samples': 8079552, 'steps': 42080, 'loss/train': 1.5335677862167358} -11/07/2021 03:08:02 - INFO - __main__ - Step 42082: {'lr': 0.00041484576315667273, 'samples': 8079744, 'steps': 42081, 'loss/train': 1.72471284866333} -11/07/2021 03:08:03 - INFO - __main__ - Step 42083: {'lr': 0.0004148417734711941, 'samples': 8079936, 'steps': 42082, 'loss/train': 0.442223459482193} -11/07/2021 03:08:03 - INFO - __main__ - Step 42084: {'lr': 0.00041483778371144046, 'samples': 8080128, 'steps': 42083, 'loss/train': 1.3410874605178833} -11/07/2021 03:08:04 - INFO - __main__ - Step 42085: {'lr': 0.0004148337938774134, 'samples': 8080320, 'steps': 42084, 'loss/train': 1.4568349123001099} -11/07/2021 03:08:04 - INFO - __main__ - Step 42086: {'lr': 0.00041482980396911467, 'samples': 8080512, 'steps': 42085, 'loss/train': 0.7727944850921631} -11/07/2021 03:08:04 - INFO - __main__ - Step 42087: {'lr': 0.0004148258139865463, 'samples': 8080704, 'steps': 42086, 'loss/train': 2.0954015254974365} -11/07/2021 03:08:05 - INFO - __main__ - Step 42088: {'lr': 0.00041482182392970984, 'samples': 8080896, 'steps': 42087, 'loss/train': 1.3977972269058228} -11/07/2021 03:08:06 - INFO - __main__ - Step 42089: {'lr': 0.00041481783379860725, 'samples': 8081088, 'steps': 42088, 'loss/train': 1.567556381225586} -11/07/2021 03:08:06 - INFO - __main__ - Step 42090: {'lr': 0.0004148138435932404, 'samples': 8081280, 'steps': 42089, 'loss/train': 1.4468871355056763} -11/07/2021 03:08:06 - INFO - __main__ - Step 42091: {'lr': 0.0004148098533136109, 'samples': 8081472, 'steps': 42090, 'loss/train': 2.4713995456695557} -11/07/2021 03:08:07 - INFO - __main__ - Step 42092: {'lr': 0.0004148058629597206, 'samples': 8081664, 'steps': 42091, 'loss/train': 1.3342759609222412} -11/07/2021 03:08:07 - INFO - __main__ - Step 42093: {'lr': 0.0004148018725315713, 'samples': 8081856, 'steps': 42092, 'loss/train': 1.1993120908737183} -11/07/2021 03:08:08 - INFO - __main__ - Step 42094: {'lr': 0.00041479788202916483, 'samples': 8082048, 'steps': 42093, 'loss/train': 1.8482271432876587} -11/07/2021 03:08:09 - INFO - __main__ - Step 42095: {'lr': 0.000414793891452503, 'samples': 8082240, 'steps': 42094, 'loss/train': 1.5280399322509766} -11/07/2021 03:08:09 - INFO - __main__ - Step 42096: {'lr': 0.0004147899008015876, 'samples': 8082432, 'steps': 42095, 'loss/train': 1.5832175016403198} -11/07/2021 03:08:09 - INFO - __main__ - Step 42097: {'lr': 0.0004147859100764204, 'samples': 8082624, 'steps': 42096, 'loss/train': 1.7992056608200073} -11/07/2021 03:08:10 - INFO - __main__ - Step 42098: {'lr': 0.0004147819192770033, 'samples': 8082816, 'steps': 42097, 'loss/train': 1.5658690929412842} -11/07/2021 03:08:11 - INFO - __main__ - Step 42099: {'lr': 0.00041477792840333784, 'samples': 8083008, 'steps': 42098, 'loss/train': 1.2517671585083008} -11/07/2021 03:08:11 - INFO - __main__ - Step 42100: {'lr': 0.00041477393745542607, 'samples': 8083200, 'steps': 42099, 'loss/train': 1.3536474704742432} -11/07/2021 03:08:11 - INFO - __main__ - Step 42101: {'lr': 0.0004147699464332697, 'samples': 8083392, 'steps': 42100, 'loss/train': 1.4670751094818115} -11/07/2021 03:08:12 - INFO - __main__ - Step 42102: {'lr': 0.0004147659553368706, 'samples': 8083584, 'steps': 42101, 'loss/train': 2.541309118270874} -11/07/2021 03:08:12 - INFO - __main__ - Step 42103: {'lr': 0.00041476196416623034, 'samples': 8083776, 'steps': 42102, 'loss/train': 1.3247640132904053} -11/07/2021 03:08:13 - INFO - __main__ - Step 42104: {'lr': 0.0004147579729213511, 'samples': 8083968, 'steps': 42103, 'loss/train': 1.835842251777649} -11/07/2021 03:08:13 - INFO - __main__ - Step 42105: {'lr': 0.0004147539816022343, 'samples': 8084160, 'steps': 42104, 'loss/train': 1.3662902116775513} -11/07/2021 03:08:14 - INFO - __main__ - Step 42106: {'lr': 0.0004147499902088819, 'samples': 8084352, 'steps': 42105, 'loss/train': 1.5861386060714722} -11/07/2021 03:08:14 - INFO - __main__ - Step 42107: {'lr': 0.0004147459987412958, 'samples': 8084544, 'steps': 42106, 'loss/train': 1.6038364171981812} -11/07/2021 03:08:14 - INFO - __main__ - Step 42108: {'lr': 0.0004147420071994776, 'samples': 8084736, 'steps': 42107, 'loss/train': 1.1665230989456177} -11/07/2021 03:08:16 - INFO - __main__ - Step 42109: {'lr': 0.0004147380155834293, 'samples': 8084928, 'steps': 42108, 'loss/train': 1.8599544763565063} -11/07/2021 03:08:16 - INFO - __main__ - Step 42110: {'lr': 0.0004147340238931525, 'samples': 8085120, 'steps': 42109, 'loss/train': 1.515739917755127} -11/07/2021 03:08:16 - INFO - __main__ - Step 42111: {'lr': 0.0004147300321286491, 'samples': 8085312, 'steps': 42110, 'loss/train': 1.7114287614822388} -11/07/2021 03:08:17 - INFO - __main__ - Step 42112: {'lr': 0.0004147260402899209, 'samples': 8085504, 'steps': 42111, 'loss/train': 1.681444764137268} -11/07/2021 03:08:17 - INFO - __main__ - Step 42113: {'lr': 0.0004147220483769697, 'samples': 8085696, 'steps': 42112, 'loss/train': 1.788677453994751} -11/07/2021 03:08:18 - INFO - __main__ - Step 42114: {'lr': 0.0004147180563897972, 'samples': 8085888, 'steps': 42113, 'loss/train': 2.0268678665161133} -11/07/2021 03:08:18 - INFO - __main__ - Step 42115: {'lr': 0.0004147140643284054, 'samples': 8086080, 'steps': 42114, 'loss/train': 1.668137550354004} -11/07/2021 03:08:19 - INFO - __main__ - Step 42116: {'lr': 0.00041471007219279595, 'samples': 8086272, 'steps': 42115, 'loss/train': 1.519972562789917} -11/07/2021 03:08:19 - INFO - __main__ - Step 42117: {'lr': 0.0004147060799829707, 'samples': 8086464, 'steps': 42116, 'loss/train': 1.638015627861023} -11/07/2021 03:08:19 - INFO - __main__ - Step 42118: {'lr': 0.00041470208769893137, 'samples': 8086656, 'steps': 42117, 'loss/train': 1.7440546751022339} -11/07/2021 03:08:20 - INFO - __main__ - Step 42119: {'lr': 0.0004146980953406799, 'samples': 8086848, 'steps': 42118, 'loss/train': 0.6300422549247742} -11/07/2021 03:08:21 - INFO - __main__ - Step 42120: {'lr': 0.000414694102908218, 'samples': 8087040, 'steps': 42119, 'loss/train': 0.47657132148742676} -11/07/2021 03:08:21 - INFO - __main__ - Step 42121: {'lr': 0.0004146901104015474, 'samples': 8087232, 'steps': 42120, 'loss/train': 1.5050257444381714} -11/07/2021 03:08:21 - INFO - __main__ - Step 42122: {'lr': 0.00041468611782067, 'samples': 8087424, 'steps': 42121, 'loss/train': 1.2551136016845703} -11/07/2021 03:08:22 - INFO - __main__ - Step 42123: {'lr': 0.0004146821251655877, 'samples': 8087616, 'steps': 42122, 'loss/train': 1.520211100578308} -11/07/2021 03:08:22 - INFO - __main__ - Step 42124: {'lr': 0.000414678132436302, 'samples': 8087808, 'steps': 42123, 'loss/train': 0.9685293436050415} -11/07/2021 03:08:23 - INFO - __main__ - Step 42125: {'lr': 0.000414674139632815, 'samples': 8088000, 'steps': 42124, 'loss/train': 1.4324889183044434} -11/07/2021 03:08:23 - INFO - __main__ - Step 42126: {'lr': 0.0004146701467551283, 'samples': 8088192, 'steps': 42125, 'loss/train': 1.3058773279190063} -11/07/2021 03:08:24 - INFO - __main__ - Step 42127: {'lr': 0.0004146661538032438, 'samples': 8088384, 'steps': 42126, 'loss/train': 1.5557634830474854} -11/07/2021 03:08:24 - INFO - __main__ - Step 42128: {'lr': 0.0004146621607771633, 'samples': 8088576, 'steps': 42127, 'loss/train': 1.6212557554244995} -11/07/2021 03:08:25 - INFO - __main__ - Step 42129: {'lr': 0.00041465816767688853, 'samples': 8088768, 'steps': 42128, 'loss/train': 1.4947006702423096} -11/07/2021 03:08:26 - INFO - __main__ - Step 42130: {'lr': 0.0004146541745024214, 'samples': 8088960, 'steps': 42129, 'loss/train': 1.1805391311645508} -11/07/2021 03:08:26 - INFO - __main__ - Step 42131: {'lr': 0.00041465018125376354, 'samples': 8089152, 'steps': 42130, 'loss/train': 1.5250442028045654} -11/07/2021 03:08:26 - INFO - __main__ - Step 42132: {'lr': 0.0004146461879309169, 'samples': 8089344, 'steps': 42131, 'loss/train': 1.5029743909835815} -11/07/2021 03:08:27 - INFO - __main__ - Step 42133: {'lr': 0.0004146421945338832, 'samples': 8089536, 'steps': 42132, 'loss/train': 1.6332733631134033} -11/07/2021 03:08:27 - INFO - __main__ - Step 42134: {'lr': 0.0004146382010626643, 'samples': 8089728, 'steps': 42133, 'loss/train': 1.3687775135040283} -11/07/2021 03:08:28 - INFO - __main__ - Step 42135: {'lr': 0.000414634207517262, 'samples': 8089920, 'steps': 42134, 'loss/train': 1.0351780652999878} -11/07/2021 03:08:28 - INFO - __main__ - Step 42136: {'lr': 0.000414630213897678, 'samples': 8090112, 'steps': 42135, 'loss/train': 1.5677454471588135} -11/07/2021 03:08:29 - INFO - __main__ - Step 42137: {'lr': 0.00041462622020391416, 'samples': 8090304, 'steps': 42136, 'loss/train': 1.659880518913269} -11/07/2021 03:08:29 - INFO - __main__ - Step 42138: {'lr': 0.00041462222643597236, 'samples': 8090496, 'steps': 42137, 'loss/train': 1.4060335159301758} -11/07/2021 03:08:29 - INFO - __main__ - Step 42139: {'lr': 0.00041461823259385423, 'samples': 8090688, 'steps': 42138, 'loss/train': 1.3353675603866577} -11/07/2021 03:08:30 - INFO - __main__ - Step 42140: {'lr': 0.00041461423867756176, 'samples': 8090880, 'steps': 42139, 'loss/train': 1.480120301246643} -11/07/2021 03:08:31 - INFO - __main__ - Step 42141: {'lr': 0.00041461024468709664, 'samples': 8091072, 'steps': 42140, 'loss/train': 1.1149752140045166} -11/07/2021 03:08:31 - INFO - __main__ - Step 42142: {'lr': 0.0004146062506224606, 'samples': 8091264, 'steps': 42141, 'loss/train': 1.4817534685134888} -11/07/2021 03:08:31 - INFO - __main__ - Step 42143: {'lr': 0.0004146022564836556, 'samples': 8091456, 'steps': 42142, 'loss/train': 1.6729769706726074} -11/07/2021 03:08:32 - INFO - __main__ - Step 42144: {'lr': 0.0004145982622706833, 'samples': 8091648, 'steps': 42143, 'loss/train': 1.3165689706802368} -11/07/2021 03:08:33 - INFO - __main__ - Step 42145: {'lr': 0.00041459426798354563, 'samples': 8091840, 'steps': 42144, 'loss/train': 1.4829295873641968} -11/07/2021 03:08:33 - INFO - __main__ - Step 42146: {'lr': 0.00041459027362224433, 'samples': 8092032, 'steps': 42145, 'loss/train': 1.44984769821167} -11/07/2021 03:08:34 - INFO - __main__ - Step 42147: {'lr': 0.00041458627918678116, 'samples': 8092224, 'steps': 42146, 'loss/train': 1.9205005168914795} -11/07/2021 03:08:34 - INFO - __main__ - Step 42148: {'lr': 0.00041458228467715786, 'samples': 8092416, 'steps': 42147, 'loss/train': 1.452275037765503} -11/07/2021 03:08:34 - INFO - __main__ - Step 42149: {'lr': 0.00041457829009337643, 'samples': 8092608, 'steps': 42148, 'loss/train': 1.1981793642044067} -11/07/2021 03:08:35 - INFO - __main__ - Step 42150: {'lr': 0.00041457429543543856, 'samples': 8092800, 'steps': 42149, 'loss/train': 1.450162410736084} -11/07/2021 03:08:36 - INFO - __main__ - Step 42151: {'lr': 0.0004145703007033461, 'samples': 8092992, 'steps': 42150, 'loss/train': 1.1431949138641357} -11/07/2021 03:08:36 - INFO - __main__ - Step 42152: {'lr': 0.00041456630589710073, 'samples': 8093184, 'steps': 42151, 'loss/train': 1.1344993114471436} -11/07/2021 03:08:36 - INFO - __main__ - Step 42153: {'lr': 0.0004145623110167043, 'samples': 8093376, 'steps': 42152, 'loss/train': 1.4127930402755737} -11/07/2021 03:08:37 - INFO - __main__ - Step 42154: {'lr': 0.00041455831606215863, 'samples': 8093568, 'steps': 42153, 'loss/train': 1.4258630275726318} -11/07/2021 03:08:37 - INFO - __main__ - Step 42155: {'lr': 0.0004145543210334656, 'samples': 8093760, 'steps': 42154, 'loss/train': 1.334218144416809} -11/07/2021 03:08:38 - INFO - __main__ - Step 42156: {'lr': 0.00041455032593062685, 'samples': 8093952, 'steps': 42155, 'loss/train': 1.757309913635254} -11/07/2021 03:08:39 - INFO - __main__ - Step 42157: {'lr': 0.00041454633075364427, 'samples': 8094144, 'steps': 42156, 'loss/train': 1.4084231853485107} -11/07/2021 03:08:39 - INFO - __main__ - Step 42158: {'lr': 0.00041454233550251976, 'samples': 8094336, 'steps': 42157, 'loss/train': 1.2516793012619019} -11/07/2021 03:08:39 - INFO - __main__ - Step 42159: {'lr': 0.0004145383401772549, 'samples': 8094528, 'steps': 42158, 'loss/train': 1.6665518283843994} -11/07/2021 03:08:40 - INFO - __main__ - Step 42160: {'lr': 0.00041453434477785165, 'samples': 8094720, 'steps': 42159, 'loss/train': 1.5540876388549805} -11/07/2021 03:08:41 - INFO - __main__ - Step 42161: {'lr': 0.0004145303493043118, 'samples': 8094912, 'steps': 42160, 'loss/train': 1.2934569120407104} -11/07/2021 03:08:41 - INFO - __main__ - Step 42162: {'lr': 0.000414526353756637, 'samples': 8095104, 'steps': 42161, 'loss/train': 2.090319871902466} -11/07/2021 03:08:41 - INFO - __main__ - Step 42163: {'lr': 0.0004145223581348292, 'samples': 8095296, 'steps': 42162, 'loss/train': 1.8299297094345093} -11/07/2021 03:08:42 - INFO - __main__ - Step 42164: {'lr': 0.00041451836243889027, 'samples': 8095488, 'steps': 42163, 'loss/train': 1.2692837715148926} -11/07/2021 03:08:42 - INFO - __main__ - Step 42165: {'lr': 0.0004145143666688218, 'samples': 8095680, 'steps': 42164, 'loss/train': 1.8240784406661987} -11/07/2021 03:08:43 - INFO - __main__ - Step 42166: {'lr': 0.0004145103708246257, 'samples': 8095872, 'steps': 42165, 'loss/train': 1.1021740436553955} -11/07/2021 03:08:43 - INFO - __main__ - Step 42167: {'lr': 0.0004145063749063038, 'samples': 8096064, 'steps': 42166, 'loss/train': 1.6214840412139893} -11/07/2021 03:08:44 - INFO - __main__ - Step 42168: {'lr': 0.00041450237891385783, 'samples': 8096256, 'steps': 42167, 'loss/train': 1.618085265159607} -11/07/2021 03:08:44 - INFO - __main__ - Step 42169: {'lr': 0.00041449838284728964, 'samples': 8096448, 'steps': 42168, 'loss/train': 1.386372685432434} -11/07/2021 03:08:45 - INFO - __main__ - Step 42170: {'lr': 0.000414494386706601, 'samples': 8096640, 'steps': 42169, 'loss/train': 1.309335708618164} -11/07/2021 03:08:45 - INFO - __main__ - Step 42171: {'lr': 0.00041449039049179385, 'samples': 8096832, 'steps': 42170, 'loss/train': 1.3361847400665283} -11/07/2021 03:08:46 - INFO - __main__ - Step 42172: {'lr': 0.0004144863942028697, 'samples': 8097024, 'steps': 42171, 'loss/train': 1.3556065559387207} -11/07/2021 03:08:46 - INFO - __main__ - Step 42173: {'lr': 0.0004144823978398306, 'samples': 8097216, 'steps': 42172, 'loss/train': 1.8618935346603394} -11/07/2021 03:08:47 - INFO - __main__ - Step 42174: {'lr': 0.0004144784014026782, 'samples': 8097408, 'steps': 42173, 'loss/train': 1.6203159093856812} -11/07/2021 03:08:47 - INFO - __main__ - Step 42175: {'lr': 0.0004144744048914145, 'samples': 8097600, 'steps': 42174, 'loss/train': 1.4742738008499146} -11/07/2021 03:08:47 - INFO - __main__ - Step 42176: {'lr': 0.0004144704083060411, 'samples': 8097792, 'steps': 42175, 'loss/train': 1.5544403791427612} -11/07/2021 03:08:48 - INFO - __main__ - Step 42177: {'lr': 0.00041446641164655983, 'samples': 8097984, 'steps': 42176, 'loss/train': 1.346947431564331} -11/07/2021 03:08:49 - INFO - __main__ - Step 42178: {'lr': 0.0004144624149129727, 'samples': 8098176, 'steps': 42177, 'loss/train': 1.5605933666229248} -11/07/2021 03:08:49 - INFO - __main__ - Step 42179: {'lr': 0.00041445841810528117, 'samples': 8098368, 'steps': 42178, 'loss/train': 1.7424789667129517} -11/07/2021 03:08:49 - INFO - __main__ - Step 42180: {'lr': 0.00041445442122348727, 'samples': 8098560, 'steps': 42179, 'loss/train': 0.6647708415985107} -11/07/2021 03:08:50 - INFO - __main__ - Step 42181: {'lr': 0.0004144504242675927, 'samples': 8098752, 'steps': 42180, 'loss/train': 1.6002750396728516} -11/07/2021 03:08:50 - INFO - __main__ - Step 42182: {'lr': 0.0004144464272375994, 'samples': 8098944, 'steps': 42181, 'loss/train': 1.1403971910476685} -11/07/2021 03:08:51 - INFO - __main__ - Step 42183: {'lr': 0.000414442430133509, 'samples': 8099136, 'steps': 42182, 'loss/train': 1.608879566192627} -11/07/2021 03:08:52 - INFO - __main__ - Step 42184: {'lr': 0.00041443843295532333, 'samples': 8099328, 'steps': 42183, 'loss/train': 1.4282817840576172} -11/07/2021 03:08:52 - INFO - __main__ - Step 42185: {'lr': 0.0004144344357030444, 'samples': 8099520, 'steps': 42184, 'loss/train': 1.5298147201538086} -11/07/2021 03:08:52 - INFO - __main__ - Step 42186: {'lr': 0.0004144304383766737, 'samples': 8099712, 'steps': 42185, 'loss/train': 1.4202641248703003} -11/07/2021 03:08:53 - INFO - __main__ - Step 42187: {'lr': 0.0004144264409762133, 'samples': 8099904, 'steps': 42186, 'loss/train': 1.4413903951644897} -11/07/2021 03:08:54 - INFO - __main__ - Step 42188: {'lr': 0.0004144224435016648, 'samples': 8100096, 'steps': 42187, 'loss/train': 1.535606861114502} -11/07/2021 03:08:54 - INFO - __main__ - Step 42189: {'lr': 0.00041441844595303015, 'samples': 8100288, 'steps': 42188, 'loss/train': 1.5828893184661865} -11/07/2021 03:08:54 - INFO - __main__ - Step 42190: {'lr': 0.0004144144483303111, 'samples': 8100480, 'steps': 42189, 'loss/train': 1.4190727472305298} -11/07/2021 03:08:55 - INFO - __main__ - Step 42191: {'lr': 0.00041441045063350933, 'samples': 8100672, 'steps': 42190, 'loss/train': 1.7690839767456055} -11/07/2021 03:08:55 - INFO - __main__ - Step 42192: {'lr': 0.00041440645286262677, 'samples': 8100864, 'steps': 42191, 'loss/train': 1.7696083784103394} -11/07/2021 03:08:56 - INFO - __main__ - Step 42193: {'lr': 0.0004144024550176653, 'samples': 8101056, 'steps': 42192, 'loss/train': 1.3551652431488037} -11/07/2021 03:08:57 - INFO - __main__ - Step 42194: {'lr': 0.0004143984570986265, 'samples': 8101248, 'steps': 42193, 'loss/train': 1.4273933172225952} -11/07/2021 03:08:57 - INFO - __main__ - Step 42195: {'lr': 0.00041439445910551235, 'samples': 8101440, 'steps': 42194, 'loss/train': 1.6295689344406128} -11/07/2021 03:08:57 - INFO - __main__ - Step 42196: {'lr': 0.00041439046103832454, 'samples': 8101632, 'steps': 42195, 'loss/train': 1.0149160623550415} -11/07/2021 03:08:58 - INFO - __main__ - Step 42197: {'lr': 0.000414386462897065, 'samples': 8101824, 'steps': 42196, 'loss/train': 1.359559416770935} -11/07/2021 03:08:59 - INFO - __main__ - Step 42198: {'lr': 0.00041438246468173545, 'samples': 8102016, 'steps': 42197, 'loss/train': 1.8362070322036743} -11/07/2021 03:08:59 - INFO - __main__ - Step 42199: {'lr': 0.0004143784663923377, 'samples': 8102208, 'steps': 42198, 'loss/train': 1.4988839626312256} -11/07/2021 03:08:59 - INFO - __main__ - Step 42200: {'lr': 0.00041437446802887354, 'samples': 8102400, 'steps': 42199, 'loss/train': 0.7154588103294373} -11/07/2021 03:09:00 - INFO - __main__ - Step 42201: {'lr': 0.0004143704695913447, 'samples': 8102592, 'steps': 42200, 'loss/train': 1.3718774318695068} -11/07/2021 03:09:00 - INFO - __main__ - Step 42202: {'lr': 0.0004143664710797531, 'samples': 8102784, 'steps': 42201, 'loss/train': 1.7068943977355957} -11/07/2021 03:09:01 - INFO - __main__ - Step 42203: {'lr': 0.0004143624724941006, 'samples': 8102976, 'steps': 42202, 'loss/train': 1.0936533212661743} -11/07/2021 03:09:01 - INFO - __main__ - Step 42204: {'lr': 0.00041435847383438886, 'samples': 8103168, 'steps': 42203, 'loss/train': 1.7383671998977661} -11/07/2021 03:09:02 - INFO - __main__ - Step 42205: {'lr': 0.0004143544751006197, 'samples': 8103360, 'steps': 42204, 'loss/train': 1.5881863832473755} -11/07/2021 03:09:02 - INFO - __main__ - Step 42206: {'lr': 0.000414350476292795, 'samples': 8103552, 'steps': 42205, 'loss/train': 1.4384769201278687} -11/07/2021 03:09:02 - INFO - __main__ - Step 42207: {'lr': 0.0004143464774109164, 'samples': 8103744, 'steps': 42206, 'loss/train': 1.3117130994796753} -11/07/2021 03:09:03 - INFO - __main__ - Step 42208: {'lr': 0.0004143424784549859, 'samples': 8103936, 'steps': 42207, 'loss/train': 0.45743227005004883} -11/07/2021 03:09:04 - INFO - __main__ - Step 42209: {'lr': 0.00041433847942500516, 'samples': 8104128, 'steps': 42208, 'loss/train': 1.2702810764312744} -11/07/2021 03:09:04 - INFO - __main__ - Step 42210: {'lr': 0.0004143344803209761, 'samples': 8104320, 'steps': 42209, 'loss/train': 1.4717539548873901} -11/07/2021 03:09:04 - INFO - __main__ - Step 42211: {'lr': 0.0004143304811429005, 'samples': 8104512, 'steps': 42210, 'loss/train': 1.5789469480514526} -11/07/2021 03:09:05 - INFO - __main__ - Step 42212: {'lr': 0.00041432648189078006, 'samples': 8104704, 'steps': 42211, 'loss/train': 1.544179081916809} -11/07/2021 03:09:06 - INFO - __main__ - Step 42213: {'lr': 0.0004143224825646166, 'samples': 8104896, 'steps': 42212, 'loss/train': 1.3781150579452515} -11/07/2021 03:09:06 - INFO - __main__ - Step 42214: {'lr': 0.000414318483164412, 'samples': 8105088, 'steps': 42213, 'loss/train': 1.4762358665466309} -11/07/2021 03:09:07 - INFO - __main__ - Step 42215: {'lr': 0.000414314483690168, 'samples': 8105280, 'steps': 42214, 'loss/train': 1.572849988937378} -11/07/2021 03:09:07 - INFO - __main__ - Step 42216: {'lr': 0.00041431048414188645, 'samples': 8105472, 'steps': 42215, 'loss/train': 1.6689866781234741} -11/07/2021 03:09:07 - INFO - __main__ - Step 42217: {'lr': 0.00041430648451956913, 'samples': 8105664, 'steps': 42216, 'loss/train': 1.4321280717849731} -11/07/2021 03:09:08 - INFO - __main__ - Step 42218: {'lr': 0.00041430248482321794, 'samples': 8105856, 'steps': 42217, 'loss/train': 1.486643671989441} -11/07/2021 03:09:09 - INFO - __main__ - Step 42219: {'lr': 0.00041429848505283444, 'samples': 8106048, 'steps': 42218, 'loss/train': 1.625313401222229} -11/07/2021 03:09:09 - INFO - __main__ - Step 42220: {'lr': 0.00041429448520842064, 'samples': 8106240, 'steps': 42219, 'loss/train': 1.6230796575546265} -11/07/2021 03:09:09 - INFO - __main__ - Step 42221: {'lr': 0.0004142904852899783, 'samples': 8106432, 'steps': 42220, 'loss/train': 1.590558409690857} -11/07/2021 03:09:10 - INFO - __main__ - Step 42222: {'lr': 0.0004142864852975092, 'samples': 8106624, 'steps': 42221, 'loss/train': 1.4351541996002197} -11/07/2021 03:09:10 - INFO - __main__ - Step 42223: {'lr': 0.00041428248523101507, 'samples': 8106816, 'steps': 42222, 'loss/train': 1.552646279335022} -11/07/2021 03:09:11 - INFO - __main__ - Step 42224: {'lr': 0.0004142784850904978, 'samples': 8107008, 'steps': 42223, 'loss/train': 1.7166039943695068} -11/07/2021 03:09:11 - INFO - __main__ - Step 42225: {'lr': 0.00041427448487595933, 'samples': 8107200, 'steps': 42224, 'loss/train': 1.5216922760009766} -11/07/2021 03:09:12 - INFO - __main__ - Step 42226: {'lr': 0.0004142704845874012, 'samples': 8107392, 'steps': 42225, 'loss/train': 1.6146934032440186} -11/07/2021 03:09:12 - INFO - __main__ - Step 42227: {'lr': 0.00041426648422482527, 'samples': 8107584, 'steps': 42226, 'loss/train': 1.2154557704925537} -11/07/2021 03:09:12 - INFO - __main__ - Step 42228: {'lr': 0.0004142624837882335, 'samples': 8107776, 'steps': 42227, 'loss/train': 1.4375699758529663} -11/07/2021 03:09:14 - INFO - __main__ - Step 42229: {'lr': 0.0004142584832776275, 'samples': 8107968, 'steps': 42228, 'loss/train': 1.8489353656768799} -11/07/2021 03:09:14 - INFO - __main__ - Step 42230: {'lr': 0.00041425448269300923, 'samples': 8108160, 'steps': 42229, 'loss/train': 1.63296377658844} -11/07/2021 03:09:14 - INFO - __main__ - Step 42231: {'lr': 0.00041425048203438036, 'samples': 8108352, 'steps': 42230, 'loss/train': 2.0668020248413086} -11/07/2021 03:09:15 - INFO - __main__ - Step 42232: {'lr': 0.0004142464813017429, 'samples': 8108544, 'steps': 42231, 'loss/train': 1.516548752784729} -11/07/2021 03:09:15 - INFO - __main__ - Step 42233: {'lr': 0.0004142424804950984, 'samples': 8108736, 'steps': 42232, 'loss/train': 1.2571018934249878} -11/07/2021 03:09:16 - INFO - __main__ - Step 42234: {'lr': 0.00041423847961444873, 'samples': 8108928, 'steps': 42233, 'loss/train': 1.8132482767105103} -11/07/2021 03:09:16 - INFO - __main__ - Step 42235: {'lr': 0.0004142344786597958, 'samples': 8109120, 'steps': 42234, 'loss/train': 1.7678147554397583} -11/07/2021 03:09:17 - INFO - __main__ - Step 42236: {'lr': 0.0004142304776311413, 'samples': 8109312, 'steps': 42235, 'loss/train': 1.5495364665985107} -11/07/2021 03:09:17 - INFO - __main__ - Step 42237: {'lr': 0.0004142264765284871, 'samples': 8109504, 'steps': 42236, 'loss/train': 1.6588215827941895} -11/07/2021 03:09:17 - INFO - __main__ - Step 42238: {'lr': 0.0004142224753518351, 'samples': 8109696, 'steps': 42237, 'loss/train': 1.3605972528457642} -11/07/2021 03:09:18 - INFO - __main__ - Step 42239: {'lr': 0.00041421847410118685, 'samples': 8109888, 'steps': 42238, 'loss/train': 1.2603652477264404} -11/07/2021 03:09:19 - INFO - __main__ - Step 42240: {'lr': 0.00041421447277654436, 'samples': 8110080, 'steps': 42239, 'loss/train': 1.2082425355911255} -11/07/2021 03:09:19 - INFO - __main__ - Step 42241: {'lr': 0.0004142104713779093, 'samples': 8110272, 'steps': 42240, 'loss/train': 1.4556949138641357} -11/07/2021 03:09:20 - INFO - __main__ - Step 42242: {'lr': 0.00041420646990528355, 'samples': 8110464, 'steps': 42241, 'loss/train': 1.4256129264831543} -11/07/2021 03:09:20 - INFO - __main__ - Step 42243: {'lr': 0.0004142024683586689, 'samples': 8110656, 'steps': 42242, 'loss/train': 1.448241114616394} -11/07/2021 03:09:20 - INFO - __main__ - Step 42244: {'lr': 0.00041419846673806715, 'samples': 8110848, 'steps': 42243, 'loss/train': 1.2812025547027588} -11/07/2021 03:09:21 - INFO - __main__ - Step 42245: {'lr': 0.0004141944650434801, 'samples': 8111040, 'steps': 42244, 'loss/train': 1.5415171384811401} -11/07/2021 03:09:22 - INFO - __main__ - Step 42246: {'lr': 0.00041419046327490964, 'samples': 8111232, 'steps': 42245, 'loss/train': 1.428864598274231} -11/07/2021 03:09:22 - INFO - __main__ - Step 42247: {'lr': 0.00041418646143235737, 'samples': 8111424, 'steps': 42246, 'loss/train': 2.096343517303467} -11/07/2021 03:09:22 - INFO - __main__ - Step 42248: {'lr': 0.0004141824595158253, 'samples': 8111616, 'steps': 42247, 'loss/train': 1.5350630283355713} -11/07/2021 03:09:23 - INFO - __main__ - Step 42249: {'lr': 0.0004141784575253151, 'samples': 8111808, 'steps': 42248, 'loss/train': 1.8915627002716064} -11/07/2021 03:09:24 - INFO - __main__ - Step 42250: {'lr': 0.0004141744554608287, 'samples': 8112000, 'steps': 42249, 'loss/train': 1.0861523151397705} -11/07/2021 03:09:24 - INFO - __main__ - Step 42251: {'lr': 0.00041417045332236776, 'samples': 8112192, 'steps': 42250, 'loss/train': 1.1745171546936035} -11/07/2021 03:09:24 - INFO - __main__ - Step 42252: {'lr': 0.0004141664511099341, 'samples': 8112384, 'steps': 42251, 'loss/train': 1.573246955871582} -11/07/2021 03:09:25 - INFO - __main__ - Step 42253: {'lr': 0.00041416244882352965, 'samples': 8112576, 'steps': 42252, 'loss/train': 0.9070172905921936} -11/07/2021 03:09:25 - INFO - __main__ - Step 42254: {'lr': 0.00041415844646315613, 'samples': 8112768, 'steps': 42253, 'loss/train': 1.758210301399231} -11/07/2021 03:09:26 - INFO - __main__ - Step 42255: {'lr': 0.0004141544440288153, 'samples': 8112960, 'steps': 42254, 'loss/train': 2.242783546447754} -11/07/2021 03:09:26 - INFO - __main__ - Step 42256: {'lr': 0.0004141504415205091, 'samples': 8113152, 'steps': 42255, 'loss/train': 1.3303405046463013} -11/07/2021 03:09:27 - INFO - __main__ - Step 42257: {'lr': 0.0004141464389382391, 'samples': 8113344, 'steps': 42256, 'loss/train': 1.8815373182296753} -11/07/2021 03:09:27 - INFO - __main__ - Step 42258: {'lr': 0.0004141424362820073, 'samples': 8113536, 'steps': 42257, 'loss/train': 1.2732740640640259} -11/07/2021 03:09:28 - INFO - __main__ - Step 42259: {'lr': 0.0004141384335518155, 'samples': 8113728, 'steps': 42258, 'loss/train': 1.6466920375823975} -11/07/2021 03:09:28 - INFO - __main__ - Step 42260: {'lr': 0.00041413443074766543, 'samples': 8113920, 'steps': 42259, 'loss/train': 1.194049596786499} -11/07/2021 03:09:29 - INFO - __main__ - Step 42261: {'lr': 0.000414130427869559, 'samples': 8114112, 'steps': 42260, 'loss/train': 1.1260548830032349} -11/07/2021 03:09:29 - INFO - __main__ - Step 42262: {'lr': 0.0004141264249174978, 'samples': 8114304, 'steps': 42261, 'loss/train': 1.7151681184768677} -11/07/2021 03:09:30 - INFO - __main__ - Step 42263: {'lr': 0.00041412242189148383, 'samples': 8114496, 'steps': 42262, 'loss/train': 1.5122243165969849} -11/07/2021 03:09:30 - INFO - __main__ - Step 42264: {'lr': 0.00041411841879151877, 'samples': 8114688, 'steps': 42263, 'loss/train': 1.6099839210510254} -11/07/2021 03:09:30 - INFO - __main__ - Step 42265: {'lr': 0.00041411441561760455, 'samples': 8114880, 'steps': 42264, 'loss/train': 1.6253814697265625} -11/07/2021 03:09:31 - INFO - __main__ - Step 42266: {'lr': 0.0004141104123697429, 'samples': 8115072, 'steps': 42265, 'loss/train': 1.6564679145812988} -11/07/2021 03:09:32 - INFO - __main__ - Step 42267: {'lr': 0.00041410640904793563, 'samples': 8115264, 'steps': 42266, 'loss/train': 0.8678615093231201} -11/07/2021 03:09:32 - INFO - __main__ - Step 42268: {'lr': 0.0004141024056521845, 'samples': 8115456, 'steps': 42267, 'loss/train': 0.7243680357933044} -11/07/2021 03:09:32 - INFO - __main__ - Step 42269: {'lr': 0.0004140984021824914, 'samples': 8115648, 'steps': 42268, 'loss/train': 1.637137770652771} -11/07/2021 03:09:33 - INFO - __main__ - Step 42270: {'lr': 0.0004140943986388581, 'samples': 8115840, 'steps': 42269, 'loss/train': 1.5717798471450806} -11/07/2021 03:09:34 - INFO - __main__ - Step 42271: {'lr': 0.00041409039502128634, 'samples': 8116032, 'steps': 42270, 'loss/train': 1.5168558359146118} -11/07/2021 03:09:35 - INFO - __main__ - Step 42272: {'lr': 0.000414086391329778, 'samples': 8116224, 'steps': 42271, 'loss/train': 1.1119903326034546} -11/07/2021 03:09:35 - INFO - __main__ - Step 42273: {'lr': 0.0004140823875643349, 'samples': 8116416, 'steps': 42272, 'loss/train': 1.3936454057693481} -11/07/2021 03:09:36 - INFO - __main__ - Step 42274: {'lr': 0.00041407838372495883, 'samples': 8116608, 'steps': 42273, 'loss/train': 1.0360863208770752} -11/07/2021 03:09:36 - INFO - __main__ - Step 42275: {'lr': 0.00041407437981165154, 'samples': 8116800, 'steps': 42274, 'loss/train': 1.3648031949996948} -11/07/2021 03:09:36 - INFO - __main__ - Step 42276: {'lr': 0.0004140703758244148, 'samples': 8116992, 'steps': 42275, 'loss/train': 1.9282615184783936} -11/07/2021 03:09:37 - INFO - __main__ - Step 42277: {'lr': 0.00041406637176325054, 'samples': 8117184, 'steps': 42276, 'loss/train': 1.2744916677474976} -11/07/2021 03:09:38 - INFO - __main__ - Step 42278: {'lr': 0.00041406236762816053, 'samples': 8117376, 'steps': 42277, 'loss/train': 1.9428569078445435} -11/07/2021 03:09:38 - INFO - __main__ - Step 42279: {'lr': 0.0004140583634191465, 'samples': 8117568, 'steps': 42278, 'loss/train': 1.5542657375335693} -11/07/2021 03:09:38 - INFO - __main__ - Step 42280: {'lr': 0.00041405435913621037, 'samples': 8117760, 'steps': 42279, 'loss/train': 0.7622489333152771} -11/07/2021 03:09:39 - INFO - __main__ - Step 42281: {'lr': 0.0004140503547793538, 'samples': 8117952, 'steps': 42280, 'loss/train': 1.6333931684494019} -11/07/2021 03:09:39 - INFO - __main__ - Step 42282: {'lr': 0.00041404635034857876, 'samples': 8118144, 'steps': 42281, 'loss/train': 1.736616849899292} -11/07/2021 03:09:40 - INFO - __main__ - Step 42283: {'lr': 0.00041404234584388683, 'samples': 8118336, 'steps': 42282, 'loss/train': 1.5493872165679932} -11/07/2021 03:09:40 - INFO - __main__ - Step 42284: {'lr': 0.00041403834126528007, 'samples': 8118528, 'steps': 42283, 'loss/train': 1.6267235279083252} -11/07/2021 03:09:41 - INFO - __main__ - Step 42285: {'lr': 0.00041403433661276015, 'samples': 8118720, 'steps': 42284, 'loss/train': 1.4420843124389648} -11/07/2021 03:09:41 - INFO - __main__ - Step 42286: {'lr': 0.0004140303318863288, 'samples': 8118912, 'steps': 42285, 'loss/train': 1.6940083503723145} -11/07/2021 03:09:41 - INFO - __main__ - Step 42287: {'lr': 0.00041402632708598797, 'samples': 8119104, 'steps': 42286, 'loss/train': 1.706137776374817} -11/07/2021 03:09:43 - INFO - __main__ - Step 42288: {'lr': 0.0004140223222117394, 'samples': 8119296, 'steps': 42287, 'loss/train': 1.910693883895874} -11/07/2021 03:09:43 - INFO - __main__ - Step 42289: {'lr': 0.00041401831726358497, 'samples': 8119488, 'steps': 42288, 'loss/train': 1.5870105028152466} -11/07/2021 03:09:43 - INFO - __main__ - Step 42290: {'lr': 0.0004140143122415263, 'samples': 8119680, 'steps': 42289, 'loss/train': 1.8212772607803345} -11/07/2021 03:09:44 - INFO - __main__ - Step 42291: {'lr': 0.0004140103071455654, 'samples': 8119872, 'steps': 42290, 'loss/train': 1.7726240158081055} -11/07/2021 03:09:44 - INFO - __main__ - Step 42292: {'lr': 0.000414006301975704, 'samples': 8120064, 'steps': 42291, 'loss/train': 1.9648642539978027} -11/07/2021 03:09:44 - INFO - __main__ - Step 42293: {'lr': 0.0004140022967319439, 'samples': 8120256, 'steps': 42292, 'loss/train': 1.6367963552474976} -11/07/2021 03:09:45 - INFO - __main__ - Step 42294: {'lr': 0.0004139982914142868, 'samples': 8120448, 'steps': 42293, 'loss/train': 1.9807569980621338} -11/07/2021 03:09:46 - INFO - __main__ - Step 42295: {'lr': 0.0004139942860227346, 'samples': 8120640, 'steps': 42294, 'loss/train': 1.6433264017105103} -11/07/2021 03:09:46 - INFO - __main__ - Step 42296: {'lr': 0.00041399028055728914, 'samples': 8120832, 'steps': 42295, 'loss/train': 1.5786479711532593} -11/07/2021 03:09:46 - INFO - __main__ - Step 42297: {'lr': 0.0004139862750179523, 'samples': 8121024, 'steps': 42296, 'loss/train': 1.858721375465393} -11/07/2021 03:09:47 - INFO - __main__ - Step 42298: {'lr': 0.0004139822694047256, 'samples': 8121216, 'steps': 42297, 'loss/train': 1.4344762563705444} -11/07/2021 03:09:48 - INFO - __main__ - Step 42299: {'lr': 0.0004139782637176112, 'samples': 8121408, 'steps': 42298, 'loss/train': 1.577717900276184} -11/07/2021 03:09:48 - INFO - __main__ - Step 42300: {'lr': 0.0004139742579566106, 'samples': 8121600, 'steps': 42299, 'loss/train': 1.0138734579086304} -11/07/2021 03:09:49 - INFO - __main__ - Step 42301: {'lr': 0.00041397025212172573, 'samples': 8121792, 'steps': 42300, 'loss/train': 1.2797232866287231} -11/07/2021 03:09:49 - INFO - __main__ - Step 42302: {'lr': 0.00041396624621295843, 'samples': 8121984, 'steps': 42301, 'loss/train': 1.844573974609375} -11/07/2021 03:09:49 - INFO - __main__ - Step 42303: {'lr': 0.00041396224023031045, 'samples': 8122176, 'steps': 42302, 'loss/train': 1.121030569076538} -11/07/2021 03:09:50 - INFO - __main__ - Step 42304: {'lr': 0.0004139582341737836, 'samples': 8122368, 'steps': 42303, 'loss/train': 1.6290957927703857} -11/07/2021 03:09:51 - INFO - __main__ - Step 42305: {'lr': 0.0004139542280433797, 'samples': 8122560, 'steps': 42304, 'loss/train': 1.3857667446136475} -11/07/2021 03:09:51 - INFO - __main__ - Step 42306: {'lr': 0.00041395022183910064, 'samples': 8122752, 'steps': 42305, 'loss/train': 1.6097029447555542} -11/07/2021 03:09:51 - INFO - __main__ - Step 42307: {'lr': 0.00041394621556094805, 'samples': 8122944, 'steps': 42306, 'loss/train': 1.5338916778564453} -11/07/2021 03:09:52 - INFO - __main__ - Step 42308: {'lr': 0.0004139422092089239, 'samples': 8123136, 'steps': 42307, 'loss/train': 1.7702220678329468} -11/07/2021 03:09:53 - INFO - __main__ - Step 42309: {'lr': 0.0004139382027830298, 'samples': 8123328, 'steps': 42308, 'loss/train': 1.5488650798797607} -11/07/2021 03:09:53 - INFO - __main__ - Step 42310: {'lr': 0.00041393419628326777, 'samples': 8123520, 'steps': 42309, 'loss/train': 1.628334879875183} -11/07/2021 03:09:54 - INFO - __main__ - Step 42311: {'lr': 0.00041393018970963945, 'samples': 8123712, 'steps': 42310, 'loss/train': 1.7775880098342896} -11/07/2021 03:09:54 - INFO - __main__ - Step 42312: {'lr': 0.00041392618306214683, 'samples': 8123904, 'steps': 42311, 'loss/train': 1.2932323217391968} -11/07/2021 03:09:54 - INFO - __main__ - Step 42313: {'lr': 0.0004139221763407915, 'samples': 8124096, 'steps': 42312, 'loss/train': 1.6325318813323975} -11/07/2021 03:09:55 - INFO - __main__ - Step 42314: {'lr': 0.00041391816954557543, 'samples': 8124288, 'steps': 42313, 'loss/train': 0.11254347860813141} -11/07/2021 03:09:56 - INFO - __main__ - Step 42315: {'lr': 0.00041391416267650034, 'samples': 8124480, 'steps': 42314, 'loss/train': 1.9047186374664307} -11/07/2021 03:09:56 - INFO - __main__ - Step 42316: {'lr': 0.00041391015573356805, 'samples': 8124672, 'steps': 42315, 'loss/train': 1.5465834140777588} -11/07/2021 03:09:56 - INFO - __main__ - Step 42317: {'lr': 0.0004139061487167804, 'samples': 8124864, 'steps': 42316, 'loss/train': 1.3714628219604492} -11/07/2021 03:09:57 - INFO - __main__ - Step 42318: {'lr': 0.00041390214162613916, 'samples': 8125056, 'steps': 42317, 'loss/train': 1.8584504127502441} -11/07/2021 03:09:57 - INFO - __main__ - Step 42319: {'lr': 0.00041389813446164614, 'samples': 8125248, 'steps': 42318, 'loss/train': 1.3471084833145142} -11/07/2021 03:09:58 - INFO - __main__ - Step 42320: {'lr': 0.0004138941272233031, 'samples': 8125440, 'steps': 42319, 'loss/train': 1.346096396446228} -11/07/2021 03:09:58 - INFO - __main__ - Step 42321: {'lr': 0.0004138901199111119, 'samples': 8125632, 'steps': 42320, 'loss/train': 1.64899480342865} -11/07/2021 03:09:59 - INFO - __main__ - Step 42322: {'lr': 0.00041388611252507446, 'samples': 8125824, 'steps': 42321, 'loss/train': 1.300271987915039} -11/07/2021 03:09:59 - INFO - __main__ - Step 42323: {'lr': 0.0004138821050651923, 'samples': 8126016, 'steps': 42322, 'loss/train': 1.3816546201705933} -11/07/2021 03:10:00 - INFO - __main__ - Step 42324: {'lr': 0.00041387809753146756, 'samples': 8126208, 'steps': 42323, 'loss/train': 1.7210004329681396} -11/07/2021 03:10:00 - INFO - __main__ - Step 42325: {'lr': 0.00041387408992390177, 'samples': 8126400, 'steps': 42324, 'loss/train': 1.4438029527664185} -11/07/2021 03:10:01 - INFO - __main__ - Step 42326: {'lr': 0.0004138700822424968, 'samples': 8126592, 'steps': 42325, 'loss/train': 1.495758056640625} -11/07/2021 03:10:01 - INFO - __main__ - Step 42327: {'lr': 0.0004138660744872547, 'samples': 8126784, 'steps': 42326, 'loss/train': 1.3418431282043457} -11/07/2021 03:10:02 - INFO - __main__ - Step 42328: {'lr': 0.00041386206665817684, 'samples': 8126976, 'steps': 42327, 'loss/train': 5.740207195281982} -11/07/2021 03:10:02 - INFO - __main__ - Step 42329: {'lr': 0.0004138580587552654, 'samples': 8127168, 'steps': 42328, 'loss/train': 1.4846197366714478} -11/07/2021 03:10:02 - INFO - __main__ - Step 42330: {'lr': 0.000413854050778522, 'samples': 8127360, 'steps': 42329, 'loss/train': 1.207411289215088} -11/07/2021 03:10:03 - INFO - __main__ - Step 42331: {'lr': 0.00041385004272794846, 'samples': 8127552, 'steps': 42330, 'loss/train': 1.4573063850402832} -11/07/2021 03:10:04 - INFO - __main__ - Step 42332: {'lr': 0.0004138460346035467, 'samples': 8127744, 'steps': 42331, 'loss/train': 1.7764642238616943} -11/07/2021 03:10:04 - INFO - __main__ - Step 42333: {'lr': 0.0004138420264053184, 'samples': 8127936, 'steps': 42332, 'loss/train': 1.7020927667617798} -11/07/2021 03:10:05 - INFO - __main__ - Step 42334: {'lr': 0.00041383801813326543, 'samples': 8128128, 'steps': 42333, 'loss/train': 1.3734804391860962} -11/07/2021 03:10:05 - INFO - __main__ - Step 42335: {'lr': 0.00041383400978738956, 'samples': 8128320, 'steps': 42334, 'loss/train': 1.374592900276184} -11/07/2021 03:10:05 - INFO - __main__ - Step 42336: {'lr': 0.0004138300013676926, 'samples': 8128512, 'steps': 42335, 'loss/train': 1.3566697835922241} -11/07/2021 03:10:06 - INFO - __main__ - Step 42337: {'lr': 0.0004138259928741764, 'samples': 8128704, 'steps': 42336, 'loss/train': 1.46265709400177} -11/07/2021 03:10:07 - INFO - __main__ - Step 42338: {'lr': 0.0004138219843068427, 'samples': 8128896, 'steps': 42337, 'loss/train': 1.2423937320709229} -11/07/2021 03:10:07 - INFO - __main__ - Step 42339: {'lr': 0.00041381797566569345, 'samples': 8129088, 'steps': 42338, 'loss/train': 1.4230663776397705} -11/07/2021 03:10:07 - INFO - __main__ - Step 42340: {'lr': 0.0004138139669507303, 'samples': 8129280, 'steps': 42339, 'loss/train': 1.0463687181472778} -11/07/2021 03:10:08 - INFO - __main__ - Step 42341: {'lr': 0.000413809958161955, 'samples': 8129472, 'steps': 42340, 'loss/train': 1.5473113059997559} -11/07/2021 03:10:09 - INFO - __main__ - Step 42342: {'lr': 0.0004138059492993695, 'samples': 8129664, 'steps': 42341, 'loss/train': 1.9287792444229126} -11/07/2021 03:10:09 - INFO - __main__ - Step 42343: {'lr': 0.0004138019403629756, 'samples': 8129856, 'steps': 42342, 'loss/train': 1.5084797143936157} -11/07/2021 03:10:09 - INFO - __main__ - Step 42344: {'lr': 0.0004137979313527751, 'samples': 8130048, 'steps': 42343, 'loss/train': 1.1683118343353271} -11/07/2021 03:10:10 - INFO - __main__ - Step 42345: {'lr': 0.00041379392226876974, 'samples': 8130240, 'steps': 42344, 'loss/train': 1.669350028038025} -11/07/2021 03:10:10 - INFO - __main__ - Step 42346: {'lr': 0.0004137899131109614, 'samples': 8130432, 'steps': 42345, 'loss/train': 1.6195399761199951} -11/07/2021 03:10:11 - INFO - __main__ - Step 42347: {'lr': 0.0004137859038793518, 'samples': 8130624, 'steps': 42346, 'loss/train': 2.136760950088501} -11/07/2021 03:10:12 - INFO - __main__ - Step 42348: {'lr': 0.0004137818945739428, 'samples': 8130816, 'steps': 42347, 'loss/train': 1.791646122932434} -11/07/2021 03:10:12 - INFO - __main__ - Step 42349: {'lr': 0.00041377788519473624, 'samples': 8131008, 'steps': 42348, 'loss/train': 1.6567926406860352} -11/07/2021 03:10:12 - INFO - __main__ - Step 42350: {'lr': 0.0004137738757417339, 'samples': 8131200, 'steps': 42349, 'loss/train': 1.6222318410873413} -11/07/2021 03:10:13 - INFO - __main__ - Step 42351: {'lr': 0.0004137698662149375, 'samples': 8131392, 'steps': 42350, 'loss/train': 0.6834756135940552} -11/07/2021 03:10:14 - INFO - __main__ - Step 42352: {'lr': 0.00041376585661434903, 'samples': 8131584, 'steps': 42351, 'loss/train': 1.8909810781478882} -11/07/2021 03:10:14 - INFO - __main__ - Step 42353: {'lr': 0.0004137618469399702, 'samples': 8131776, 'steps': 42352, 'loss/train': 1.8924025297164917} -11/07/2021 03:10:15 - INFO - __main__ - Step 42354: {'lr': 0.0004137578371918027, 'samples': 8131968, 'steps': 42353, 'loss/train': 1.5220388174057007} -11/07/2021 03:10:15 - INFO - __main__ - Step 42355: {'lr': 0.00041375382736984857, 'samples': 8132160, 'steps': 42354, 'loss/train': 1.323188066482544} -11/07/2021 03:10:15 - INFO - __main__ - Step 42356: {'lr': 0.0004137498174741094, 'samples': 8132352, 'steps': 42355, 'loss/train': 1.8916676044464111} -11/07/2021 03:10:16 - INFO - __main__ - Step 42357: {'lr': 0.0004137458075045871, 'samples': 8132544, 'steps': 42356, 'loss/train': 0.9286091923713684} -11/07/2021 03:10:17 - INFO - __main__ - Step 42358: {'lr': 0.0004137417974612835, 'samples': 8132736, 'steps': 42357, 'loss/train': 1.803433895111084} -11/07/2021 03:10:18 - INFO - __main__ - Step 42359: {'lr': 0.0004137377873442004, 'samples': 8132928, 'steps': 42358, 'loss/train': 1.3678960800170898} -11/07/2021 03:10:18 - INFO - __main__ - Step 42360: {'lr': 0.00041373377715333946, 'samples': 8133120, 'steps': 42359, 'loss/train': 1.5719913244247437} -11/07/2021 03:10:19 - INFO - __main__ - Step 42361: {'lr': 0.00041372976688870266, 'samples': 8133312, 'steps': 42360, 'loss/train': 1.2116249799728394} -11/07/2021 03:10:19 - INFO - __main__ - Step 42362: {'lr': 0.0004137257565502918, 'samples': 8133504, 'steps': 42361, 'loss/train': 1.4815484285354614} -11/07/2021 03:10:19 - INFO - __main__ - Step 42363: {'lr': 0.00041372174613810863, 'samples': 8133696, 'steps': 42362, 'loss/train': 1.6371750831604004} -11/07/2021 03:10:20 - INFO - __main__ - Step 42364: {'lr': 0.00041371773565215494, 'samples': 8133888, 'steps': 42363, 'loss/train': 1.8453580141067505} -11/07/2021 03:10:21 - INFO - __main__ - Step 42365: {'lr': 0.00041371372509243256, 'samples': 8134080, 'steps': 42364, 'loss/train': 1.7084465026855469} -11/07/2021 03:10:21 - INFO - __main__ - Step 42366: {'lr': 0.00041370971445894335, 'samples': 8134272, 'steps': 42365, 'loss/train': 1.9868760108947754} -11/07/2021 03:10:21 - INFO - __main__ - Step 42367: {'lr': 0.00041370570375168903, 'samples': 8134464, 'steps': 42366, 'loss/train': 1.4556933641433716} -11/07/2021 03:10:22 - INFO - __main__ - Step 42368: {'lr': 0.00041370169297067145, 'samples': 8134656, 'steps': 42367, 'loss/train': 2.0079658031463623} -11/07/2021 03:10:22 - INFO - __main__ - Step 42369: {'lr': 0.00041369768211589245, 'samples': 8134848, 'steps': 42368, 'loss/train': 1.5647902488708496} -11/07/2021 03:10:22 - INFO - __main__ - Step 42370: {'lr': 0.0004136936711873537, 'samples': 8135040, 'steps': 42369, 'loss/train': 1.5075159072875977} -11/07/2021 03:10:23 - INFO - __main__ - Step 42371: {'lr': 0.0004136896601850572, 'samples': 8135232, 'steps': 42370, 'loss/train': 1.371673345565796} -11/07/2021 03:10:24 - INFO - __main__ - Step 42372: {'lr': 0.0004136856491090046, 'samples': 8135424, 'steps': 42371, 'loss/train': 1.6827363967895508} -11/07/2021 03:10:24 - INFO - __main__ - Step 42373: {'lr': 0.0004136816379591979, 'samples': 8135616, 'steps': 42372, 'loss/train': 2.1556642055511475} -11/07/2021 03:10:24 - INFO - __main__ - Step 42374: {'lr': 0.0004136776267356387, 'samples': 8135808, 'steps': 42373, 'loss/train': 1.7191283702850342} -11/07/2021 03:10:25 - INFO - __main__ - Step 42375: {'lr': 0.0004136736154383288, 'samples': 8136000, 'steps': 42374, 'loss/train': 1.7905488014221191} -11/07/2021 03:10:26 - INFO - __main__ - Step 42376: {'lr': 0.00041366960406727024, 'samples': 8136192, 'steps': 42375, 'loss/train': 1.4930577278137207} -11/07/2021 03:10:26 - INFO - __main__ - Step 42377: {'lr': 0.00041366559262246463, 'samples': 8136384, 'steps': 42376, 'loss/train': 1.5554438829421997} -11/07/2021 03:10:27 - INFO - __main__ - Step 42378: {'lr': 0.00041366158110391375, 'samples': 8136576, 'steps': 42377, 'loss/train': 1.5728462934494019} -11/07/2021 03:10:27 - INFO - __main__ - Step 42379: {'lr': 0.0004136575695116196, 'samples': 8136768, 'steps': 42378, 'loss/train': 1.3974881172180176} -11/07/2021 03:10:27 - INFO - __main__ - Step 42380: {'lr': 0.0004136535578455838, 'samples': 8136960, 'steps': 42379, 'loss/train': 1.3594677448272705} -11/07/2021 03:10:28 - INFO - __main__ - Step 42381: {'lr': 0.0004136495461058083, 'samples': 8137152, 'steps': 42380, 'loss/train': 1.4582617282867432} -11/07/2021 03:10:29 - INFO - __main__ - Step 42382: {'lr': 0.0004136455342922948, 'samples': 8137344, 'steps': 42381, 'loss/train': 1.524465799331665} -11/07/2021 03:10:29 - INFO - __main__ - Step 42383: {'lr': 0.0004136415224050451, 'samples': 8137536, 'steps': 42382, 'loss/train': 1.5900578498840332} -11/07/2021 03:10:29 - INFO - __main__ - Step 42384: {'lr': 0.0004136375104440611, 'samples': 8137728, 'steps': 42383, 'loss/train': 1.1075342893600464} -11/07/2021 03:10:30 - INFO - __main__ - Step 42385: {'lr': 0.0004136334984093446, 'samples': 8137920, 'steps': 42384, 'loss/train': 0.9145182967185974} -11/07/2021 03:10:31 - INFO - __main__ - Step 42386: {'lr': 0.0004136294863008974, 'samples': 8138112, 'steps': 42385, 'loss/train': 5.843629837036133} -11/07/2021 03:10:31 - INFO - __main__ - Step 42387: {'lr': 0.00041362547411872116, 'samples': 8138304, 'steps': 42386, 'loss/train': 0.8810856342315674} -11/07/2021 03:10:31 - INFO - __main__ - Step 42388: {'lr': 0.00041362146186281777, 'samples': 8138496, 'steps': 42387, 'loss/train': 1.6148850917816162} -11/07/2021 03:10:32 - INFO - __main__ - Step 42389: {'lr': 0.00041361744953318923, 'samples': 8138688, 'steps': 42388, 'loss/train': 1.2505319118499756} -11/07/2021 03:10:32 - INFO - __main__ - Step 42390: {'lr': 0.0004136134371298371, 'samples': 8138880, 'steps': 42389, 'loss/train': 1.6921306848526} -11/07/2021 03:10:33 - INFO - __main__ - Step 42391: {'lr': 0.0004136094246527633, 'samples': 8139072, 'steps': 42390, 'loss/train': 1.567236065864563} -11/07/2021 03:10:34 - INFO - __main__ - Step 42392: {'lr': 0.0004136054121019697, 'samples': 8139264, 'steps': 42391, 'loss/train': 1.408864140510559} -11/07/2021 03:10:34 - INFO - __main__ - Step 42393: {'lr': 0.0004136013994774579, 'samples': 8139456, 'steps': 42392, 'loss/train': 1.432043194770813} -11/07/2021 03:10:34 - INFO - __main__ - Step 42394: {'lr': 0.00041359738677922993, 'samples': 8139648, 'steps': 42393, 'loss/train': 1.5740227699279785} -11/07/2021 03:10:35 - INFO - __main__ - Step 42395: {'lr': 0.00041359337400728746, 'samples': 8139840, 'steps': 42394, 'loss/train': 0.7346595525741577} -11/07/2021 03:10:35 - INFO - __main__ - Step 42396: {'lr': 0.00041358936116163224, 'samples': 8140032, 'steps': 42395, 'loss/train': 1.6192106008529663} -11/07/2021 03:10:36 - INFO - __main__ - Step 42397: {'lr': 0.00041358534824226635, 'samples': 8140224, 'steps': 42396, 'loss/train': 1.6648677587509155} -11/07/2021 03:10:36 - INFO - __main__ - Step 42398: {'lr': 0.0004135813352491913, 'samples': 8140416, 'steps': 42397, 'loss/train': 1.7205020189285278} -11/07/2021 03:10:37 - INFO - __main__ - Step 42399: {'lr': 0.00041357732218240905, 'samples': 8140608, 'steps': 42398, 'loss/train': 1.6916424036026} -11/07/2021 03:10:37 - INFO - __main__ - Step 42400: {'lr': 0.0004135733090419215, 'samples': 8140800, 'steps': 42399, 'loss/train': 1.7660330533981323} -11/07/2021 03:10:37 - INFO - __main__ - Step 42401: {'lr': 0.00041356929582773023, 'samples': 8140992, 'steps': 42400, 'loss/train': 1.6983288526535034} -11/07/2021 03:10:38 - INFO - __main__ - Step 42402: {'lr': 0.00041356528253983714, 'samples': 8141184, 'steps': 42401, 'loss/train': 1.5337250232696533} -11/07/2021 03:10:39 - INFO - __main__ - Step 42403: {'lr': 0.0004135612691782441, 'samples': 8141376, 'steps': 42402, 'loss/train': 2.1747608184814453} -11/07/2021 03:10:39 - INFO - __main__ - Step 42404: {'lr': 0.0004135572557429529, 'samples': 8141568, 'steps': 42403, 'loss/train': 1.6874691247940063} -11/07/2021 03:10:39 - INFO - __main__ - Step 42405: {'lr': 0.0004135532422339653, 'samples': 8141760, 'steps': 42404, 'loss/train': 1.4186465740203857} -11/07/2021 03:10:40 - INFO - __main__ - Step 42406: {'lr': 0.00041354922865128316, 'samples': 8141952, 'steps': 42405, 'loss/train': 1.2541090250015259} -11/07/2021 03:10:41 - INFO - __main__ - Step 42407: {'lr': 0.00041354521499490813, 'samples': 8142144, 'steps': 42406, 'loss/train': 1.4607620239257812} -11/07/2021 03:10:41 - INFO - __main__ - Step 42408: {'lr': 0.00041354120126484227, 'samples': 8142336, 'steps': 42407, 'loss/train': 1.6432466506958008} -11/07/2021 03:10:42 - INFO - __main__ - Step 42409: {'lr': 0.00041353718746108724, 'samples': 8142528, 'steps': 42408, 'loss/train': 1.1523303985595703} -11/07/2021 03:10:42 - INFO - __main__ - Step 42410: {'lr': 0.00041353317358364496, 'samples': 8142720, 'steps': 42409, 'loss/train': 1.0971400737762451} -11/07/2021 03:10:42 - INFO - __main__ - Step 42411: {'lr': 0.00041352915963251705, 'samples': 8142912, 'steps': 42410, 'loss/train': 1.179257869720459} -11/07/2021 03:10:43 - INFO - __main__ - Step 42412: {'lr': 0.00041352514560770545, 'samples': 8143104, 'steps': 42411, 'loss/train': 1.554078459739685} -11/07/2021 03:10:44 - INFO - __main__ - Step 42413: {'lr': 0.000413521131509212, 'samples': 8143296, 'steps': 42412, 'loss/train': 1.9412667751312256} -11/07/2021 03:10:44 - INFO - __main__ - Step 42414: {'lr': 0.0004135171173370383, 'samples': 8143488, 'steps': 42413, 'loss/train': 1.1289230585098267} -11/07/2021 03:10:44 - INFO - __main__ - Step 42415: {'lr': 0.00041351310309118653, 'samples': 8143680, 'steps': 42414, 'loss/train': 0.7985998392105103} -11/07/2021 03:10:45 - INFO - __main__ - Step 42416: {'lr': 0.00041350908877165805, 'samples': 8143872, 'steps': 42415, 'loss/train': 1.303896188735962} -11/07/2021 03:10:46 - INFO - __main__ - Step 42417: {'lr': 0.00041350507437845505, 'samples': 8144064, 'steps': 42416, 'loss/train': 1.6557601690292358} -11/07/2021 03:10:46 - INFO - __main__ - Step 42418: {'lr': 0.00041350105991157915, 'samples': 8144256, 'steps': 42417, 'loss/train': 1.5549960136413574} -11/07/2021 03:10:46 - INFO - __main__ - Step 42419: {'lr': 0.00041349704537103216, 'samples': 8144448, 'steps': 42418, 'loss/train': 1.4929468631744385} -11/07/2021 03:10:47 - INFO - __main__ - Step 42420: {'lr': 0.000413493030756816, 'samples': 8144640, 'steps': 42419, 'loss/train': 1.7966359853744507} -11/07/2021 03:10:47 - INFO - __main__ - Step 42421: {'lr': 0.0004134890160689323, 'samples': 8144832, 'steps': 42420, 'loss/train': 1.2032808065414429} -11/07/2021 03:10:48 - INFO - __main__ - Step 42422: {'lr': 0.000413485001307383, 'samples': 8145024, 'steps': 42421, 'loss/train': 1.6719205379486084} -11/07/2021 03:10:49 - INFO - __main__ - Step 42423: {'lr': 0.00041348098647216993, 'samples': 8145216, 'steps': 42422, 'loss/train': 1.4168541431427002} -11/07/2021 03:10:49 - INFO - __main__ - Step 42424: {'lr': 0.00041347697156329485, 'samples': 8145408, 'steps': 42423, 'loss/train': 1.4836190938949585} -11/07/2021 03:10:49 - INFO - __main__ - Step 42425: {'lr': 0.00041347295658075955, 'samples': 8145600, 'steps': 42424, 'loss/train': 1.6768486499786377} -11/07/2021 03:10:50 - INFO - __main__ - Step 42426: {'lr': 0.00041346894152456584, 'samples': 8145792, 'steps': 42425, 'loss/train': 1.65650475025177} -11/07/2021 03:10:50 - INFO - __main__ - Step 42427: {'lr': 0.00041346492639471555, 'samples': 8145984, 'steps': 42426, 'loss/train': 1.1028519868850708} -11/07/2021 03:10:51 - INFO - __main__ - Step 42428: {'lr': 0.0004134609111912105, 'samples': 8146176, 'steps': 42427, 'loss/train': 0.635445773601532} -11/07/2021 03:10:51 - INFO - __main__ - Step 42429: {'lr': 0.00041345689591405256, 'samples': 8146368, 'steps': 42428, 'loss/train': 1.371331810951233} -11/07/2021 03:10:52 - INFO - __main__ - Step 42430: {'lr': 0.0004134528805632434, 'samples': 8146560, 'steps': 42429, 'loss/train': 1.5687236785888672} -11/07/2021 03:10:52 - INFO - __main__ - Step 42431: {'lr': 0.00041344886513878485, 'samples': 8146752, 'steps': 42430, 'loss/train': 1.7651448249816895} -11/07/2021 03:10:52 - INFO - __main__ - Step 42432: {'lr': 0.00041344484964067873, 'samples': 8146944, 'steps': 42431, 'loss/train': 1.099167823791504} -11/07/2021 03:10:54 - INFO - __main__ - Step 42433: {'lr': 0.00041344083406892704, 'samples': 8147136, 'steps': 42432, 'loss/train': 1.468461513519287} -11/07/2021 03:10:54 - INFO - __main__ - Step 42434: {'lr': 0.0004134368184235313, 'samples': 8147328, 'steps': 42433, 'loss/train': 1.3953205347061157} -11/07/2021 03:10:54 - INFO - __main__ - Step 42435: {'lr': 0.0004134328027044935, 'samples': 8147520, 'steps': 42434, 'loss/train': 1.4772852659225464} -11/07/2021 03:10:55 - INFO - __main__ - Step 42436: {'lr': 0.0004134287869118154, 'samples': 8147712, 'steps': 42435, 'loss/train': 1.740281343460083} -11/07/2021 03:10:55 - INFO - __main__ - Step 42437: {'lr': 0.0004134247710454988, 'samples': 8147904, 'steps': 42436, 'loss/train': 1.4107420444488525} -11/07/2021 03:10:55 - INFO - __main__ - Step 42438: {'lr': 0.00041342075510554554, 'samples': 8148096, 'steps': 42437, 'loss/train': 1.4461491107940674} -11/07/2021 03:10:56 - INFO - __main__ - Step 42439: {'lr': 0.0004134167390919574, 'samples': 8148288, 'steps': 42438, 'loss/train': 1.2683757543563843} -11/07/2021 03:10:57 - INFO - __main__ - Step 42440: {'lr': 0.0004134127230047362, 'samples': 8148480, 'steps': 42439, 'loss/train': 1.5026410818099976} -11/07/2021 03:10:57 - INFO - __main__ - Step 42441: {'lr': 0.00041340870684388375, 'samples': 8148672, 'steps': 42440, 'loss/train': 1.4890927076339722} -11/07/2021 03:10:57 - INFO - __main__ - Step 42442: {'lr': 0.00041340469060940183, 'samples': 8148864, 'steps': 42441, 'loss/train': 1.7618567943572998} -11/07/2021 03:10:58 - INFO - __main__ - Step 42443: {'lr': 0.0004134006743012923, 'samples': 8149056, 'steps': 42442, 'loss/train': 1.6861194372177124} -11/07/2021 03:10:59 - INFO - __main__ - Step 42444: {'lr': 0.00041339665791955695, 'samples': 8149248, 'steps': 42443, 'loss/train': 1.6956210136413574} -11/07/2021 03:10:59 - INFO - __main__ - Step 42445: {'lr': 0.00041339264146419757, 'samples': 8149440, 'steps': 42444, 'loss/train': 1.5215418338775635} -11/07/2021 03:10:59 - INFO - __main__ - Step 42446: {'lr': 0.000413388624935216, 'samples': 8149632, 'steps': 42445, 'loss/train': 1.765880823135376} -11/07/2021 03:11:00 - INFO - __main__ - Step 42447: {'lr': 0.00041338460833261403, 'samples': 8149824, 'steps': 42446, 'loss/train': 1.688170075416565} -11/07/2021 03:11:00 - INFO - __main__ - Step 42448: {'lr': 0.0004133805916563935, 'samples': 8150016, 'steps': 42447, 'loss/train': 1.2641940116882324} -11/07/2021 03:11:01 - INFO - __main__ - Step 42449: {'lr': 0.00041337657490655625, 'samples': 8150208, 'steps': 42448, 'loss/train': 1.819398283958435} -11/07/2021 03:11:01 - INFO - __main__ - Step 42450: {'lr': 0.00041337255808310394, 'samples': 8150400, 'steps': 42449, 'loss/train': 1.7530895471572876} -11/07/2021 03:11:02 - INFO - __main__ - Step 42451: {'lr': 0.0004133685411860385, 'samples': 8150592, 'steps': 42450, 'loss/train': 1.6568763256072998} -11/07/2021 03:11:02 - INFO - __main__ - Step 42452: {'lr': 0.0004133645242153617, 'samples': 8150784, 'steps': 42451, 'loss/train': 1.6520686149597168} -11/07/2021 03:11:03 - INFO - __main__ - Step 42453: {'lr': 0.0004133605071710754, 'samples': 8150976, 'steps': 42452, 'loss/train': 1.8637690544128418} -11/07/2021 03:11:04 - INFO - __main__ - Step 42454: {'lr': 0.00041335649005318133, 'samples': 8151168, 'steps': 42453, 'loss/train': 2.0649642944335938} -11/07/2021 03:11:04 - INFO - __main__ - Step 42455: {'lr': 0.0004133524728616814, 'samples': 8151360, 'steps': 42454, 'loss/train': 1.7693240642547607} -11/07/2021 03:11:04 - INFO - __main__ - Step 42456: {'lr': 0.00041334845559657735, 'samples': 8151552, 'steps': 42455, 'loss/train': 1.2166308164596558} -11/07/2021 03:11:05 - INFO - __main__ - Step 42457: {'lr': 0.00041334443825787097, 'samples': 8151744, 'steps': 42456, 'loss/train': 1.0859808921813965} -11/07/2021 03:11:05 - INFO - __main__ - Step 42458: {'lr': 0.0004133404208455642, 'samples': 8151936, 'steps': 42457, 'loss/train': 1.2377136945724487} -11/07/2021 03:11:06 - INFO - __main__ - Step 42459: {'lr': 0.00041333640335965865, 'samples': 8152128, 'steps': 42458, 'loss/train': 1.615179181098938} -11/07/2021 03:11:06 - INFO - __main__ - Step 42460: {'lr': 0.0004133323858001563, 'samples': 8152320, 'steps': 42459, 'loss/train': 1.0365239381790161} -11/07/2021 03:11:07 - INFO - __main__ - Step 42461: {'lr': 0.0004133283681670589, 'samples': 8152512, 'steps': 42460, 'loss/train': 1.2702975273132324} -11/07/2021 03:11:07 - INFO - __main__ - Step 42462: {'lr': 0.0004133243504603682, 'samples': 8152704, 'steps': 42461, 'loss/train': 1.4783105850219727} -11/07/2021 03:11:07 - INFO - __main__ - Step 42463: {'lr': 0.0004133203326800861, 'samples': 8152896, 'steps': 42462, 'loss/train': 1.4924323558807373} -11/07/2021 03:11:08 - INFO - __main__ - Step 42464: {'lr': 0.0004133163148262144, 'samples': 8153088, 'steps': 42463, 'loss/train': 1.103530764579773} -11/07/2021 03:11:09 - INFO - __main__ - Step 42465: {'lr': 0.00041331229689875487, 'samples': 8153280, 'steps': 42464, 'loss/train': 1.96661376953125} -11/07/2021 03:11:09 - INFO - __main__ - Step 42466: {'lr': 0.0004133082788977093, 'samples': 8153472, 'steps': 42465, 'loss/train': 1.1008806228637695} -11/07/2021 03:11:10 - INFO - __main__ - Step 42467: {'lr': 0.00041330426082307963, 'samples': 8153664, 'steps': 42466, 'loss/train': 1.5295052528381348} -11/07/2021 03:11:10 - INFO - __main__ - Step 42468: {'lr': 0.0004133002426748675, 'samples': 8153856, 'steps': 42467, 'loss/train': 1.3837577104568481} -11/07/2021 03:11:10 - INFO - __main__ - Step 42469: {'lr': 0.0004132962244530749, 'samples': 8154048, 'steps': 42468, 'loss/train': 1.902879238128662} -11/07/2021 03:11:11 - INFO - __main__ - Step 42470: {'lr': 0.0004132922061577035, 'samples': 8154240, 'steps': 42469, 'loss/train': 1.6521797180175781} -11/07/2021 03:11:12 - INFO - __main__ - Step 42471: {'lr': 0.0004132881877887551, 'samples': 8154432, 'steps': 42470, 'loss/train': 1.247977375984192} -11/07/2021 03:11:12 - INFO - __main__ - Step 42472: {'lr': 0.0004132841693462315, 'samples': 8154624, 'steps': 42471, 'loss/train': 1.312026858329773} -11/07/2021 03:11:12 - INFO - __main__ - Step 42473: {'lr': 0.0004132801508301347, 'samples': 8154816, 'steps': 42472, 'loss/train': 1.3885867595672607} -11/07/2021 03:11:13 - INFO - __main__ - Step 42474: {'lr': 0.0004132761322404663, 'samples': 8155008, 'steps': 42473, 'loss/train': 0.9789870977401733} -11/07/2021 03:11:14 - INFO - __main__ - Step 42475: {'lr': 0.00041327211357722825, 'samples': 8155200, 'steps': 42474, 'loss/train': 0.8852501511573792} -11/07/2021 03:11:14 - INFO - __main__ - Step 42476: {'lr': 0.00041326809484042235, 'samples': 8155392, 'steps': 42475, 'loss/train': 1.377720594406128} -11/07/2021 03:11:15 - INFO - __main__ - Step 42477: {'lr': 0.0004132640760300503, 'samples': 8155584, 'steps': 42476, 'loss/train': 1.496697187423706} -11/07/2021 03:11:15 - INFO - __main__ - Step 42478: {'lr': 0.000413260057146114, 'samples': 8155776, 'steps': 42477, 'loss/train': 1.9076615571975708} -11/07/2021 03:11:15 - INFO - __main__ - Step 42479: {'lr': 0.00041325603818861517, 'samples': 8155968, 'steps': 42478, 'loss/train': 1.923953652381897} -11/07/2021 03:11:16 - INFO - __main__ - Step 42480: {'lr': 0.0004132520191575558, 'samples': 8156160, 'steps': 42479, 'loss/train': 1.850592017173767} -11/07/2021 03:11:16 - INFO - __main__ - Step 42481: {'lr': 0.0004132480000529375, 'samples': 8156352, 'steps': 42480, 'loss/train': 1.101906180381775} -11/07/2021 03:11:17 - INFO - __main__ - Step 42482: {'lr': 0.0004132439808747622, 'samples': 8156544, 'steps': 42481, 'loss/train': 1.372361421585083} -11/07/2021 03:11:17 - INFO - __main__ - Step 42483: {'lr': 0.00041323996162303167, 'samples': 8156736, 'steps': 42482, 'loss/train': 1.4120784997940063} -11/07/2021 03:11:18 - INFO - __main__ - Step 42484: {'lr': 0.0004132359422977477, 'samples': 8156928, 'steps': 42483, 'loss/train': 1.6222646236419678} -11/07/2021 03:11:19 - INFO - __main__ - Step 42485: {'lr': 0.0004132319228989122, 'samples': 8157120, 'steps': 42484, 'loss/train': 1.6639920473098755} -11/07/2021 03:11:19 - INFO - __main__ - Step 42486: {'lr': 0.00041322790342652695, 'samples': 8157312, 'steps': 42485, 'loss/train': 0.6607436537742615} -11/07/2021 03:11:19 - INFO - __main__ - Step 42487: {'lr': 0.00041322388388059366, 'samples': 8157504, 'steps': 42486, 'loss/train': 1.8186523914337158} -11/07/2021 03:11:20 - INFO - __main__ - Step 42488: {'lr': 0.0004132198642611142, 'samples': 8157696, 'steps': 42487, 'loss/train': 0.4286053478717804} -11/07/2021 03:11:20 - INFO - __main__ - Step 42489: {'lr': 0.0004132158445680904, 'samples': 8157888, 'steps': 42488, 'loss/train': 1.5934503078460693} -11/07/2021 03:11:21 - INFO - __main__ - Step 42490: {'lr': 0.0004132118248015241, 'samples': 8158080, 'steps': 42489, 'loss/train': 1.6939036846160889} -11/07/2021 03:11:21 - INFO - __main__ - Step 42491: {'lr': 0.000413207804961417, 'samples': 8158272, 'steps': 42490, 'loss/train': 1.4884772300720215} -11/07/2021 03:11:22 - INFO - __main__ - Step 42492: {'lr': 0.000413203785047771, 'samples': 8158464, 'steps': 42491, 'loss/train': 1.7436952590942383} -11/07/2021 03:11:22 - INFO - __main__ - Step 42493: {'lr': 0.00041319976506058785, 'samples': 8158656, 'steps': 42492, 'loss/train': 0.9843049049377441} -11/07/2021 03:11:22 - INFO - __main__ - Step 42494: {'lr': 0.00041319574499986957, 'samples': 8158848, 'steps': 42493, 'loss/train': 1.8652119636535645} -11/07/2021 03:11:23 - INFO - __main__ - Step 42495: {'lr': 0.0004131917248656177, 'samples': 8159040, 'steps': 42494, 'loss/train': 1.465429663658142} -11/07/2021 03:11:24 - INFO - __main__ - Step 42496: {'lr': 0.0004131877046578341, 'samples': 8159232, 'steps': 42495, 'loss/train': 1.3295153379440308} -11/07/2021 03:11:24 - INFO - __main__ - Step 42497: {'lr': 0.0004131836843765207, 'samples': 8159424, 'steps': 42496, 'loss/train': 1.6745126247406006} -11/07/2021 03:11:24 - INFO - __main__ - Step 42498: {'lr': 0.00041317966402167923, 'samples': 8159616, 'steps': 42497, 'loss/train': 1.2073416709899902} -11/07/2021 03:11:25 - INFO - __main__ - Step 42499: {'lr': 0.0004131756435933115, 'samples': 8159808, 'steps': 42498, 'loss/train': 1.2210643291473389} -11/07/2021 03:11:25 - INFO - __main__ - Step 42500: {'lr': 0.00041317162309141944, 'samples': 8160000, 'steps': 42499, 'loss/train': 1.4471495151519775} -11/07/2021 03:11:26 - INFO - __main__ - Step 42501: {'lr': 0.00041316760251600474, 'samples': 8160192, 'steps': 42500, 'loss/train': 1.6119571924209595} -11/07/2021 03:11:27 - INFO - __main__ - Step 42502: {'lr': 0.00041316358186706915, 'samples': 8160384, 'steps': 42501, 'loss/train': 0.9305280447006226} -11/07/2021 03:11:27 - INFO - __main__ - Step 42503: {'lr': 0.0004131595611446146, 'samples': 8160576, 'steps': 42502, 'loss/train': 1.4976180791854858} -11/07/2021 03:11:27 - INFO - __main__ - Step 42504: {'lr': 0.0004131555403486429, 'samples': 8160768, 'steps': 42503, 'loss/train': 1.690905213356018} -11/07/2021 03:11:28 - INFO - __main__ - Step 42505: {'lr': 0.00041315151947915577, 'samples': 8160960, 'steps': 42504, 'loss/train': 1.7861652374267578} -11/07/2021 03:11:29 - INFO - __main__ - Step 42506: {'lr': 0.0004131474985361551, 'samples': 8161152, 'steps': 42505, 'loss/train': 1.7889028787612915} -11/07/2021 03:11:29 - INFO - __main__ - Step 42507: {'lr': 0.0004131434775196428, 'samples': 8161344, 'steps': 42506, 'loss/train': 1.2052451372146606} -11/07/2021 03:11:29 - INFO - __main__ - Step 42508: {'lr': 0.0004131394564296205, 'samples': 8161536, 'steps': 42507, 'loss/train': 1.2064223289489746} -11/07/2021 03:11:30 - INFO - __main__ - Step 42509: {'lr': 0.00041313543526609, 'samples': 8161728, 'steps': 42508, 'loss/train': 1.6265215873718262} -11/07/2021 03:11:30 - INFO - __main__ - Step 42510: {'lr': 0.00041313141402905324, 'samples': 8161920, 'steps': 42509, 'loss/train': 1.6610273122787476} -11/07/2021 03:11:31 - INFO - __main__ - Step 42511: {'lr': 0.00041312739271851196, 'samples': 8162112, 'steps': 42510, 'loss/train': 1.5313423871994019} -11/07/2021 03:11:31 - INFO - __main__ - Step 42512: {'lr': 0.0004131233713344681, 'samples': 8162304, 'steps': 42511, 'loss/train': 1.8610824346542358} -11/07/2021 03:11:32 - INFO - __main__ - Step 42513: {'lr': 0.0004131193498769232, 'samples': 8162496, 'steps': 42512, 'loss/train': 1.57438325881958} -11/07/2021 03:11:32 - INFO - __main__ - Step 42514: {'lr': 0.0004131153283458794, 'samples': 8162688, 'steps': 42513, 'loss/train': 1.455344796180725} -11/07/2021 03:11:32 - INFO - __main__ - Step 42515: {'lr': 0.00041311130674133824, 'samples': 8162880, 'steps': 42514, 'loss/train': 1.7059967517852783} -11/07/2021 03:11:33 - INFO - __main__ - Step 42516: {'lr': 0.0004131072850633017, 'samples': 8163072, 'steps': 42515, 'loss/train': 1.568089246749878} -11/07/2021 03:11:34 - INFO - __main__ - Step 42517: {'lr': 0.0004131032633117715, 'samples': 8163264, 'steps': 42516, 'loss/train': 1.0315004587173462} -11/07/2021 03:11:34 - INFO - __main__ - Step 42518: {'lr': 0.0004130992414867495, 'samples': 8163456, 'steps': 42517, 'loss/train': 1.199580430984497} -11/07/2021 03:11:35 - INFO - __main__ - Step 42519: {'lr': 0.0004130952195882375, 'samples': 8163648, 'steps': 42518, 'loss/train': 1.2123099565505981} -11/07/2021 03:11:35 - INFO - __main__ - Step 42520: {'lr': 0.0004130911976162373, 'samples': 8163840, 'steps': 42519, 'loss/train': 1.5549166202545166} -11/07/2021 03:11:36 - INFO - __main__ - Step 42521: {'lr': 0.0004130871755707508, 'samples': 8164032, 'steps': 42520, 'loss/train': 1.4823044538497925} -11/07/2021 03:11:36 - INFO - __main__ - Step 42522: {'lr': 0.0004130831534517796, 'samples': 8164224, 'steps': 42521, 'loss/train': 1.6366355419158936} -11/07/2021 03:11:37 - INFO - __main__ - Step 42523: {'lr': 0.00041307913125932574, 'samples': 8164416, 'steps': 42522, 'loss/train': 1.189083456993103} -11/07/2021 03:11:37 - INFO - __main__ - Step 42524: {'lr': 0.00041307510899339097, 'samples': 8164608, 'steps': 42523, 'loss/train': 1.2785511016845703} -11/07/2021 03:11:37 - INFO - __main__ - Step 42525: {'lr': 0.00041307108665397695, 'samples': 8164800, 'steps': 42524, 'loss/train': 1.7492245435714722} -11/07/2021 03:11:39 - INFO - __main__ - Step 42526: {'lr': 0.00041306706424108563, 'samples': 8164992, 'steps': 42525, 'loss/train': 1.626507043838501} -11/07/2021 03:11:39 - INFO - __main__ - Step 42527: {'lr': 0.0004130630417547189, 'samples': 8165184, 'steps': 42526, 'loss/train': 1.6828103065490723} -11/07/2021 03:11:39 - INFO - __main__ - Step 42528: {'lr': 0.00041305901919487845, 'samples': 8165376, 'steps': 42527, 'loss/train': 1.7451270818710327} -11/07/2021 03:11:40 - INFO - __main__ - Step 42529: {'lr': 0.0004130549965615661, 'samples': 8165568, 'steps': 42528, 'loss/train': 1.639512538909912} -11/07/2021 03:11:40 - INFO - __main__ - Step 42530: {'lr': 0.00041305097385478375, 'samples': 8165760, 'steps': 42529, 'loss/train': 1.508062481880188} -11/07/2021 03:11:40 - INFO - __main__ - Step 42531: {'lr': 0.00041304695107453307, 'samples': 8165952, 'steps': 42530, 'loss/train': 1.6047009229660034} -11/07/2021 03:11:41 - INFO - __main__ - Step 42532: {'lr': 0.000413042928220816, 'samples': 8166144, 'steps': 42531, 'loss/train': 0.9355162978172302} -11/07/2021 03:11:42 - INFO - __main__ - Step 42533: {'lr': 0.0004130389052936342, 'samples': 8166336, 'steps': 42532, 'loss/train': 1.5015809535980225} -11/07/2021 03:11:42 - INFO - __main__ - Step 42534: {'lr': 0.0004130348822929897, 'samples': 8166528, 'steps': 42533, 'loss/train': 1.8318469524383545} -11/07/2021 03:11:42 - INFO - __main__ - Step 42535: {'lr': 0.0004130308592188842, 'samples': 8166720, 'steps': 42534, 'loss/train': 1.5886842012405396} -11/07/2021 03:11:43 - INFO - __main__ - Step 42536: {'lr': 0.0004130268360713194, 'samples': 8166912, 'steps': 42535, 'loss/train': 1.339535117149353} -11/07/2021 03:11:44 - INFO - __main__ - Step 42537: {'lr': 0.0004130228128502973, 'samples': 8167104, 'steps': 42536, 'loss/train': 0.9194119572639465} -11/07/2021 03:11:44 - INFO - __main__ - Step 42538: {'lr': 0.0004130187895558196, 'samples': 8167296, 'steps': 42537, 'loss/train': 1.4769353866577148} -11/07/2021 03:11:44 - INFO - __main__ - Step 42539: {'lr': 0.00041301476618788827, 'samples': 8167488, 'steps': 42538, 'loss/train': 0.9612076282501221} -11/07/2021 03:11:45 - INFO - __main__ - Step 42540: {'lr': 0.0004130107427465049, 'samples': 8167680, 'steps': 42539, 'loss/train': 1.7081719636917114} -11/07/2021 03:11:45 - INFO - __main__ - Step 42541: {'lr': 0.00041300671923167145, 'samples': 8167872, 'steps': 42540, 'loss/train': 1.4179370403289795} -11/07/2021 03:11:46 - INFO - __main__ - Step 42542: {'lr': 0.00041300269564338956, 'samples': 8168064, 'steps': 42541, 'loss/train': 1.123705267906189} -11/07/2021 03:11:47 - INFO - __main__ - Step 42543: {'lr': 0.0004129986719816613, 'samples': 8168256, 'steps': 42542, 'loss/train': 1.6389899253845215} -11/07/2021 03:11:47 - INFO - __main__ - Step 42544: {'lr': 0.0004129946482464883, 'samples': 8168448, 'steps': 42543, 'loss/train': 0.9306034445762634} -11/07/2021 03:11:47 - INFO - __main__ - Step 42545: {'lr': 0.0004129906244378724, 'samples': 8168640, 'steps': 42544, 'loss/train': 1.734245777130127} -11/07/2021 03:11:48 - INFO - __main__ - Step 42546: {'lr': 0.0004129866005558155, 'samples': 8168832, 'steps': 42545, 'loss/train': 1.7263352870941162} -11/07/2021 03:11:49 - INFO - __main__ - Step 42547: {'lr': 0.00041298257660031935, 'samples': 8169024, 'steps': 42546, 'loss/train': 0.9408368468284607} -11/07/2021 03:11:49 - INFO - __main__ - Step 42548: {'lr': 0.00041297855257138577, 'samples': 8169216, 'steps': 42547, 'loss/train': 1.384551763534546} -11/07/2021 03:11:49 - INFO - __main__ - Step 42549: {'lr': 0.0004129745284690165, 'samples': 8169408, 'steps': 42548, 'loss/train': 1.6924649477005005} -11/07/2021 03:11:50 - INFO - __main__ - Step 42550: {'lr': 0.0004129705042932135, 'samples': 8169600, 'steps': 42549, 'loss/train': 1.3338024616241455} -11/07/2021 03:11:50 - INFO - __main__ - Step 42551: {'lr': 0.0004129664800439785, 'samples': 8169792, 'steps': 42550, 'loss/train': 1.6320832967758179} -11/07/2021 03:11:51 - INFO - __main__ - Step 42552: {'lr': 0.0004129624557213133, 'samples': 8169984, 'steps': 42551, 'loss/train': 1.28696870803833} -11/07/2021 03:11:51 - INFO - __main__ - Step 42553: {'lr': 0.00041295843132521973, 'samples': 8170176, 'steps': 42552, 'loss/train': 1.7522774934768677} -11/07/2021 03:11:52 - INFO - __main__ - Step 42554: {'lr': 0.0004129544068556996, 'samples': 8170368, 'steps': 42553, 'loss/train': 1.6836118698120117} -11/07/2021 03:11:52 - INFO - __main__ - Step 42555: {'lr': 0.00041295038231275473, 'samples': 8170560, 'steps': 42554, 'loss/train': 1.6868772506713867} -11/07/2021 03:11:53 - INFO - __main__ - Step 42556: {'lr': 0.0004129463576963869, 'samples': 8170752, 'steps': 42555, 'loss/train': 1.503050446510315} -11/07/2021 03:11:54 - INFO - __main__ - Step 42557: {'lr': 0.000412942333006598, 'samples': 8170944, 'steps': 42556, 'loss/train': 1.6459203958511353} -11/07/2021 03:11:54 - INFO - __main__ - Step 42558: {'lr': 0.0004129383082433898, 'samples': 8171136, 'steps': 42557, 'loss/train': 1.4009777307510376} -11/07/2021 03:11:54 - INFO - __main__ - Step 42559: {'lr': 0.0004129342834067641, 'samples': 8171328, 'steps': 42558, 'loss/train': 1.706690788269043} -11/07/2021 03:11:55 - INFO - __main__ - Step 42560: {'lr': 0.0004129302584967227, 'samples': 8171520, 'steps': 42559, 'loss/train': 1.6396253108978271} -11/07/2021 03:11:55 - INFO - __main__ - Step 42561: {'lr': 0.0004129262335132675, 'samples': 8171712, 'steps': 42560, 'loss/train': 0.891944408416748} -11/07/2021 03:11:55 - INFO - __main__ - Step 42562: {'lr': 0.00041292220845640023, 'samples': 8171904, 'steps': 42561, 'loss/train': 1.710152506828308} -11/07/2021 03:11:56 - INFO - __main__ - Step 42563: {'lr': 0.00041291818332612275, 'samples': 8172096, 'steps': 42562, 'loss/train': 1.7914820909500122} -11/07/2021 03:11:57 - INFO - __main__ - Step 42564: {'lr': 0.00041291415812243676, 'samples': 8172288, 'steps': 42563, 'loss/train': 1.2920377254486084} -11/07/2021 03:11:57 - INFO - __main__ - Step 42565: {'lr': 0.0004129101328453442, 'samples': 8172480, 'steps': 42564, 'loss/train': 1.6780205965042114} -11/07/2021 03:11:57 - INFO - __main__ - Step 42566: {'lr': 0.0004129061074948469, 'samples': 8172672, 'steps': 42565, 'loss/train': 1.525704264640808} -11/07/2021 03:11:58 - INFO - __main__ - Step 42567: {'lr': 0.0004129020820709466, 'samples': 8172864, 'steps': 42566, 'loss/train': 1.5468403100967407} -11/07/2021 03:11:59 - INFO - __main__ - Step 42568: {'lr': 0.00041289805657364516, 'samples': 8173056, 'steps': 42567, 'loss/train': 1.4239075183868408} -11/07/2021 03:11:59 - INFO - __main__ - Step 42569: {'lr': 0.0004128940310029443, 'samples': 8173248, 'steps': 42568, 'loss/train': 1.1596369743347168} -11/07/2021 03:12:00 - INFO - __main__ - Step 42570: {'lr': 0.0004128900053588459, 'samples': 8173440, 'steps': 42569, 'loss/train': 1.5229151248931885} -11/07/2021 03:12:00 - INFO - __main__ - Step 42571: {'lr': 0.00041288597964135186, 'samples': 8173632, 'steps': 42570, 'loss/train': 1.7631556987762451} -11/07/2021 03:12:00 - INFO - __main__ - Step 42572: {'lr': 0.0004128819538504639, 'samples': 8173824, 'steps': 42571, 'loss/train': 1.4214872121810913} -11/07/2021 03:12:01 - INFO - __main__ - Step 42573: {'lr': 0.00041287792798618374, 'samples': 8174016, 'steps': 42572, 'loss/train': 0.9737385511398315} -11/07/2021 03:12:02 - INFO - __main__ - Step 42574: {'lr': 0.00041287390204851343, 'samples': 8174208, 'steps': 42573, 'loss/train': 1.2740235328674316} -11/07/2021 03:12:02 - INFO - __main__ - Step 42575: {'lr': 0.0004128698760374546, 'samples': 8174400, 'steps': 42574, 'loss/train': 1.4505579471588135} -11/07/2021 03:12:02 - INFO - __main__ - Step 42576: {'lr': 0.0004128658499530091, 'samples': 8174592, 'steps': 42575, 'loss/train': 1.3641626834869385} -11/07/2021 03:12:03 - INFO - __main__ - Step 42577: {'lr': 0.00041286182379517876, 'samples': 8174784, 'steps': 42576, 'loss/train': 1.3425848484039307} -11/07/2021 03:12:04 - INFO - __main__ - Step 42578: {'lr': 0.00041285779756396543, 'samples': 8174976, 'steps': 42577, 'loss/train': 1.4676402807235718} -11/07/2021 03:12:04 - INFO - __main__ - Step 42579: {'lr': 0.00041285377125937085, 'samples': 8175168, 'steps': 42578, 'loss/train': 1.6525946855545044} -11/07/2021 03:12:04 - INFO - __main__ - Step 42580: {'lr': 0.0004128497448813969, 'samples': 8175360, 'steps': 42579, 'loss/train': 1.211531400680542} -11/07/2021 03:12:05 - INFO - __main__ - Step 42581: {'lr': 0.0004128457184300454, 'samples': 8175552, 'steps': 42580, 'loss/train': 0.8959876894950867} -11/07/2021 03:12:05 - INFO - __main__ - Step 42582: {'lr': 0.0004128416919053181, 'samples': 8175744, 'steps': 42581, 'loss/train': 1.1853410005569458} -11/07/2021 03:12:06 - INFO - __main__ - Step 42583: {'lr': 0.0004128376653072168, 'samples': 8175936, 'steps': 42582, 'loss/train': 1.5495693683624268} -11/07/2021 03:12:07 - INFO - __main__ - Step 42584: {'lr': 0.0004128336386357434, 'samples': 8176128, 'steps': 42583, 'loss/train': 1.5811612606048584} -11/07/2021 03:12:07 - INFO - __main__ - Step 42585: {'lr': 0.0004128296118908997, 'samples': 8176320, 'steps': 42584, 'loss/train': 1.4197684526443481} -11/07/2021 03:12:07 - INFO - __main__ - Step 42586: {'lr': 0.0004128255850726874, 'samples': 8176512, 'steps': 42585, 'loss/train': 1.4086215496063232} -11/07/2021 03:12:08 - INFO - __main__ - Step 42587: {'lr': 0.0004128215581811085, 'samples': 8176704, 'steps': 42586, 'loss/train': 1.300828456878662} -11/07/2021 03:12:09 - INFO - __main__ - Step 42588: {'lr': 0.0004128175312161647, 'samples': 8176896, 'steps': 42587, 'loss/train': 0.3088771402835846} -11/07/2021 03:12:09 - INFO - __main__ - Step 42589: {'lr': 0.00041281350417785777, 'samples': 8177088, 'steps': 42588, 'loss/train': 1.5267343521118164} -11/07/2021 03:12:09 - INFO - __main__ - Step 42590: {'lr': 0.00041280947706618965, 'samples': 8177280, 'steps': 42589, 'loss/train': 1.41680109500885} -11/07/2021 03:12:10 - INFO - __main__ - Step 42591: {'lr': 0.0004128054498811621, 'samples': 8177472, 'steps': 42590, 'loss/train': 0.8744376301765442} -11/07/2021 03:12:10 - INFO - __main__ - Step 42592: {'lr': 0.0004128014226227769, 'samples': 8177664, 'steps': 42591, 'loss/train': 1.8009610176086426} -11/07/2021 03:12:11 - INFO - __main__ - Step 42593: {'lr': 0.00041279739529103586, 'samples': 8177856, 'steps': 42592, 'loss/train': 2.0615074634552} -11/07/2021 03:12:11 - INFO - __main__ - Step 42594: {'lr': 0.0004127933678859409, 'samples': 8178048, 'steps': 42593, 'loss/train': 1.7933173179626465} -11/07/2021 03:12:12 - INFO - __main__ - Step 42595: {'lr': 0.00041278934040749375, 'samples': 8178240, 'steps': 42594, 'loss/train': 1.6331143379211426} -11/07/2021 03:12:12 - INFO - __main__ - Step 42596: {'lr': 0.0004127853128556962, 'samples': 8178432, 'steps': 42595, 'loss/train': 1.4697948694229126} -11/07/2021 03:12:12 - INFO - __main__ - Step 42597: {'lr': 0.00041278128523055015, 'samples': 8178624, 'steps': 42596, 'loss/train': 1.5395692586898804} -11/07/2021 03:12:13 - INFO - __main__ - Step 42598: {'lr': 0.0004127772575320573, 'samples': 8178816, 'steps': 42597, 'loss/train': 1.289622187614441} -11/07/2021 03:12:15 - INFO - __main__ - Step 42599: {'lr': 0.0004127732297602196, 'samples': 8179008, 'steps': 42598, 'loss/train': 0.9867827296257019} -11/07/2021 03:12:15 - INFO - __main__ - Step 42600: {'lr': 0.0004127692019150387, 'samples': 8179200, 'steps': 42599, 'loss/train': 1.7771762609481812} -11/07/2021 03:12:15 - INFO - __main__ - Step 42601: {'lr': 0.00041276517399651657, 'samples': 8179392, 'steps': 42600, 'loss/train': 1.8227523565292358} -11/07/2021 03:12:16 - INFO - __main__ - Step 42602: {'lr': 0.00041276114600465497, 'samples': 8179584, 'steps': 42601, 'loss/train': 1.7748034000396729} -11/07/2021 03:12:16 - INFO - __main__ - Step 42603: {'lr': 0.0004127571179394557, 'samples': 8179776, 'steps': 42602, 'loss/train': 1.3474419116973877} -11/07/2021 03:12:16 - INFO - __main__ - Step 42604: {'lr': 0.0004127530898009205, 'samples': 8179968, 'steps': 42603, 'loss/train': 1.3940340280532837} -11/07/2021 03:12:17 - INFO - __main__ - Step 42605: {'lr': 0.00041274906158905137, 'samples': 8180160, 'steps': 42604, 'loss/train': 2.1176109313964844} -11/07/2021 03:12:18 - INFO - __main__ - Step 42606: {'lr': 0.00041274503330384997, 'samples': 8180352, 'steps': 42605, 'loss/train': 1.880507469177246} -11/07/2021 03:12:18 - INFO - __main__ - Step 42607: {'lr': 0.0004127410049453182, 'samples': 8180544, 'steps': 42606, 'loss/train': 1.521466612815857} -11/07/2021 03:12:18 - INFO - __main__ - Step 42608: {'lr': 0.00041273697651345785, 'samples': 8180736, 'steps': 42607, 'loss/train': 1.7024065256118774} -11/07/2021 03:12:19 - INFO - __main__ - Step 42609: {'lr': 0.00041273294800827075, 'samples': 8180928, 'steps': 42608, 'loss/train': 1.6238617897033691} -11/07/2021 03:12:20 - INFO - __main__ - Step 42610: {'lr': 0.00041272891942975863, 'samples': 8181120, 'steps': 42609, 'loss/train': 1.1740303039550781} -11/07/2021 03:12:20 - INFO - __main__ - Step 42611: {'lr': 0.00041272489077792343, 'samples': 8181312, 'steps': 42610, 'loss/train': 1.7574613094329834} -11/07/2021 03:12:21 - INFO - __main__ - Step 42612: {'lr': 0.0004127208620527669, 'samples': 8181504, 'steps': 42611, 'loss/train': 1.3476653099060059} -11/07/2021 03:12:21 - INFO - __main__ - Step 42613: {'lr': 0.00041271683325429075, 'samples': 8181696, 'steps': 42612, 'loss/train': 0.977882981300354} -11/07/2021 03:12:21 - INFO - __main__ - Step 42614: {'lr': 0.00041271280438249705, 'samples': 8181888, 'steps': 42613, 'loss/train': 1.575322151184082} -11/07/2021 03:12:22 - INFO - __main__ - Step 42615: {'lr': 0.00041270877543738744, 'samples': 8182080, 'steps': 42614, 'loss/train': 1.1944984197616577} -11/07/2021 03:12:23 - INFO - __main__ - Step 42616: {'lr': 0.0004127047464189637, 'samples': 8182272, 'steps': 42615, 'loss/train': 0.4800504446029663} -11/07/2021 03:12:23 - INFO - __main__ - Step 42617: {'lr': 0.0004127007173272278, 'samples': 8182464, 'steps': 42616, 'loss/train': 1.5213189125061035} -11/07/2021 03:12:23 - INFO - __main__ - Step 42618: {'lr': 0.0004126966881621814, 'samples': 8182656, 'steps': 42617, 'loss/train': 1.9201672077178955} -11/07/2021 03:12:24 - INFO - __main__ - Step 42619: {'lr': 0.0004126926589238264, 'samples': 8182848, 'steps': 42618, 'loss/train': 1.2446012496948242} -11/07/2021 03:12:24 - INFO - __main__ - Step 42620: {'lr': 0.00041268862961216457, 'samples': 8183040, 'steps': 42619, 'loss/train': 1.7546820640563965} -11/07/2021 03:12:25 - INFO - __main__ - Step 42621: {'lr': 0.00041268460022719783, 'samples': 8183232, 'steps': 42620, 'loss/train': 1.547313928604126} -11/07/2021 03:12:25 - INFO - __main__ - Step 42622: {'lr': 0.0004126805707689279, 'samples': 8183424, 'steps': 42621, 'loss/train': 1.7227954864501953} -11/07/2021 03:12:26 - INFO - __main__ - Step 42623: {'lr': 0.0004126765412373566, 'samples': 8183616, 'steps': 42622, 'loss/train': 2.0326387882232666} -11/07/2021 03:12:26 - INFO - __main__ - Step 42624: {'lr': 0.0004126725116324858, 'samples': 8183808, 'steps': 42623, 'loss/train': 1.348909854888916} -11/07/2021 03:12:26 - INFO - __main__ - Step 42625: {'lr': 0.00041266848195431715, 'samples': 8184000, 'steps': 42624, 'loss/train': 1.6020936965942383} -11/07/2021 03:12:27 - INFO - __main__ - Step 42626: {'lr': 0.00041266445220285267, 'samples': 8184192, 'steps': 42625, 'loss/train': 0.6952012181282043} -11/07/2021 03:12:28 - INFO - __main__ - Step 42627: {'lr': 0.0004126604223780941, 'samples': 8184384, 'steps': 42626, 'loss/train': 1.5037245750427246} -11/07/2021 03:12:28 - INFO - __main__ - Step 42628: {'lr': 0.00041265639248004327, 'samples': 8184576, 'steps': 42627, 'loss/train': 1.6028532981872559} -11/07/2021 03:12:29 - INFO - __main__ - Step 42629: {'lr': 0.000412652362508702, 'samples': 8184768, 'steps': 42628, 'loss/train': 0.7027224898338318} -11/07/2021 03:12:29 - INFO - __main__ - Step 42630: {'lr': 0.000412648332464072, 'samples': 8184960, 'steps': 42629, 'loss/train': 1.5392451286315918} -11/07/2021 03:12:30 - INFO - __main__ - Step 42631: {'lr': 0.00041264430234615526, 'samples': 8185152, 'steps': 42630, 'loss/train': 1.8497998714447021} -11/07/2021 03:12:30 - INFO - __main__ - Step 42632: {'lr': 0.0004126402721549535, 'samples': 8185344, 'steps': 42631, 'loss/train': 1.470371127128601} -11/07/2021 03:12:31 - INFO - __main__ - Step 42633: {'lr': 0.00041263624189046846, 'samples': 8185536, 'steps': 42632, 'loss/train': 1.7528550624847412} -11/07/2021 03:12:31 - INFO - __main__ - Step 42634: {'lr': 0.0004126322115527021, 'samples': 8185728, 'steps': 42633, 'loss/train': 1.517307996749878} -11/07/2021 03:12:31 - INFO - __main__ - Step 42635: {'lr': 0.00041262818114165615, 'samples': 8185920, 'steps': 42634, 'loss/train': 1.2638063430786133} -11/07/2021 03:12:32 - INFO - __main__ - Step 42636: {'lr': 0.0004126241506573325, 'samples': 8186112, 'steps': 42635, 'loss/train': 1.5525659322738647} -11/07/2021 03:12:33 - INFO - __main__ - Step 42637: {'lr': 0.00041262012009973283, 'samples': 8186304, 'steps': 42636, 'loss/train': 1.163089394569397} -11/07/2021 03:12:33 - INFO - __main__ - Step 42638: {'lr': 0.0004126160894688591, 'samples': 8186496, 'steps': 42637, 'loss/train': 1.1772278547286987} -11/07/2021 03:12:33 - INFO - __main__ - Step 42639: {'lr': 0.00041261205876471307, 'samples': 8186688, 'steps': 42638, 'loss/train': 1.3485753536224365} -11/07/2021 03:12:34 - INFO - __main__ - Step 42640: {'lr': 0.0004126080279872966, 'samples': 8186880, 'steps': 42639, 'loss/train': 1.5482761859893799} -11/07/2021 03:12:34 - INFO - __main__ - Step 42641: {'lr': 0.0004126039971366114, 'samples': 8187072, 'steps': 42640, 'loss/train': 1.2749180793762207} -11/07/2021 03:12:35 - INFO - __main__ - Step 42642: {'lr': 0.0004125999662126594, 'samples': 8187264, 'steps': 42641, 'loss/train': 1.9490081071853638} -11/07/2021 03:12:35 - INFO - __main__ - Step 42643: {'lr': 0.00041259593521544223, 'samples': 8187456, 'steps': 42642, 'loss/train': 1.4983640909194946} -11/07/2021 03:12:36 - INFO - __main__ - Step 42644: {'lr': 0.00041259190414496194, 'samples': 8187648, 'steps': 42643, 'loss/train': 1.4390331506729126} -11/07/2021 03:12:36 - INFO - __main__ - Step 42645: {'lr': 0.00041258787300122026, 'samples': 8187840, 'steps': 42644, 'loss/train': 1.4660903215408325} -11/07/2021 03:12:36 - INFO - __main__ - Step 42646: {'lr': 0.000412583841784219, 'samples': 8188032, 'steps': 42645, 'loss/train': 1.397388219833374} -11/07/2021 03:12:37 - INFO - __main__ - Step 42647: {'lr': 0.00041257981049395997, 'samples': 8188224, 'steps': 42646, 'loss/train': 1.726476788520813} -11/07/2021 03:12:38 - INFO - __main__ - Step 42648: {'lr': 0.000412575779130445, 'samples': 8188416, 'steps': 42647, 'loss/train': 1.4296152591705322} -11/07/2021 03:12:38 - INFO - __main__ - Step 42649: {'lr': 0.0004125717476936758, 'samples': 8188608, 'steps': 42648, 'loss/train': 0.9558641910552979} -11/07/2021 03:12:39 - INFO - __main__ - Step 42650: {'lr': 0.0004125677161836543, 'samples': 8188800, 'steps': 42649, 'loss/train': 1.4704724550247192} -11/07/2021 03:12:39 - INFO - __main__ - Step 42651: {'lr': 0.00041256368460038237, 'samples': 8188992, 'steps': 42650, 'loss/train': 1.8188363313674927} -11/07/2021 03:12:40 - INFO - __main__ - Step 42652: {'lr': 0.00041255965294386174, 'samples': 8189184, 'steps': 42651, 'loss/train': 1.3506090641021729} -11/07/2021 03:12:40 - INFO - __main__ - Step 42653: {'lr': 0.00041255562121409416, 'samples': 8189376, 'steps': 42652, 'loss/train': 0.8035365343093872} -11/07/2021 03:12:41 - INFO - __main__ - Step 42654: {'lr': 0.0004125515894110816, 'samples': 8189568, 'steps': 42653, 'loss/train': 1.6913963556289673} -11/07/2021 03:12:41 - INFO - __main__ - Step 42655: {'lr': 0.00041254755753482574, 'samples': 8189760, 'steps': 42654, 'loss/train': 1.364007830619812} -11/07/2021 03:12:41 - INFO - __main__ - Step 42656: {'lr': 0.00041254352558532854, 'samples': 8189952, 'steps': 42655, 'loss/train': 1.3132096529006958} -11/07/2021 03:12:42 - INFO - __main__ - Step 42657: {'lr': 0.0004125394935625917, 'samples': 8190144, 'steps': 42656, 'loss/train': 0.9017446041107178} -11/07/2021 03:12:43 - INFO - __main__ - Step 42658: {'lr': 0.00041253546146661704, 'samples': 8190336, 'steps': 42657, 'loss/train': 1.883015513420105} -11/07/2021 03:12:43 - INFO - __main__ - Step 42659: {'lr': 0.00041253142929740643, 'samples': 8190528, 'steps': 42658, 'loss/train': 1.9374349117279053} -11/07/2021 03:12:43 - INFO - __main__ - Step 42660: {'lr': 0.00041252739705496165, 'samples': 8190720, 'steps': 42659, 'loss/train': 1.5369181632995605} -11/07/2021 03:12:44 - INFO - __main__ - Step 42661: {'lr': 0.00041252336473928455, 'samples': 8190912, 'steps': 42660, 'loss/train': 1.5200303792953491} -11/07/2021 03:12:45 - INFO - __main__ - Step 42662: {'lr': 0.00041251933235037695, 'samples': 8191104, 'steps': 42661, 'loss/train': 1.5997662544250488} -11/07/2021 03:12:45 - INFO - __main__ - Step 42663: {'lr': 0.00041251529988824067, 'samples': 8191296, 'steps': 42662, 'loss/train': 1.662327766418457} -11/07/2021 03:12:46 - INFO - __main__ - Step 42664: {'lr': 0.0004125112673528775, 'samples': 8191488, 'steps': 42663, 'loss/train': 1.5672930479049683} -11/07/2021 03:12:46 - INFO - __main__ - Step 42665: {'lr': 0.0004125072347442892, 'samples': 8191680, 'steps': 42664, 'loss/train': 1.6102161407470703} -11/07/2021 03:12:46 - INFO - __main__ - Step 42666: {'lr': 0.0004125032020624776, 'samples': 8191872, 'steps': 42665, 'loss/train': 1.5029171705245972} -11/07/2021 03:12:47 - INFO - __main__ - Step 42667: {'lr': 0.0004124991693074447, 'samples': 8192064, 'steps': 42666, 'loss/train': 1.9619196653366089} -11/07/2021 03:12:48 - INFO - __main__ - Step 42668: {'lr': 0.00041249513647919207, 'samples': 8192256, 'steps': 42667, 'loss/train': 2.0680155754089355} -11/07/2021 03:12:48 - INFO - __main__ - Step 42669: {'lr': 0.00041249110357772167, 'samples': 8192448, 'steps': 42668, 'loss/train': 1.3066715002059937} -11/07/2021 03:12:48 - INFO - __main__ - Step 42670: {'lr': 0.00041248707060303536, 'samples': 8192640, 'steps': 42669, 'loss/train': 1.6666626930236816} -11/07/2021 03:12:49 - INFO - __main__ - Step 42671: {'lr': 0.00041248303755513484, 'samples': 8192832, 'steps': 42670, 'loss/train': 1.66847562789917} -11/07/2021 03:12:49 - INFO - __main__ - Step 42672: {'lr': 0.00041247900443402194, 'samples': 8193024, 'steps': 42671, 'loss/train': 1.0965551137924194} -11/07/2021 03:12:50 - INFO - __main__ - Step 42673: {'lr': 0.00041247497123969844, 'samples': 8193216, 'steps': 42672, 'loss/train': 1.3833045959472656} -11/07/2021 03:12:50 - INFO - __main__ - Step 42674: {'lr': 0.00041247093797216637, 'samples': 8193408, 'steps': 42673, 'loss/train': 1.230155348777771} -11/07/2021 03:12:51 - INFO - __main__ - Step 42675: {'lr': 0.00041246690463142733, 'samples': 8193600, 'steps': 42674, 'loss/train': 0.7003434896469116} -11/07/2021 03:12:51 - INFO - __main__ - Step 42676: {'lr': 0.0004124628712174833, 'samples': 8193792, 'steps': 42675, 'loss/train': 1.5358424186706543} -11/07/2021 03:12:51 - INFO - __main__ - Step 42677: {'lr': 0.0004124588377303359, 'samples': 8193984, 'steps': 42676, 'loss/train': 1.5736559629440308} -11/07/2021 03:12:52 - INFO - __main__ - Step 42678: {'lr': 0.00041245480416998704, 'samples': 8194176, 'steps': 42677, 'loss/train': 1.054282307624817} -11/07/2021 03:12:53 - INFO - __main__ - Step 42679: {'lr': 0.00041245077053643866, 'samples': 8194368, 'steps': 42678, 'loss/train': 1.107468605041504} -11/07/2021 03:12:53 - INFO - __main__ - Step 42680: {'lr': 0.0004124467368296924, 'samples': 8194560, 'steps': 42679, 'loss/train': 1.5272530317306519} -11/07/2021 03:12:54 - INFO - __main__ - Step 42681: {'lr': 0.00041244270304975004, 'samples': 8194752, 'steps': 42680, 'loss/train': 0.5860555768013} -11/07/2021 03:12:54 - INFO - __main__ - Step 42682: {'lr': 0.0004124386691966137, 'samples': 8194944, 'steps': 42681, 'loss/train': 1.4744832515716553} -11/07/2021 03:12:55 - INFO - __main__ - Step 42683: {'lr': 0.00041243463527028493, 'samples': 8195136, 'steps': 42682, 'loss/train': 1.290229320526123} -11/07/2021 03:12:55 - INFO - __main__ - Step 42684: {'lr': 0.0004124306012707656, 'samples': 8195328, 'steps': 42683, 'loss/train': 1.3682605028152466} -11/07/2021 03:12:56 - INFO - __main__ - Step 42685: {'lr': 0.00041242656719805754, 'samples': 8195520, 'steps': 42684, 'loss/train': 1.3809823989868164} -11/07/2021 03:12:56 - INFO - __main__ - Step 42686: {'lr': 0.0004124225330521626, 'samples': 8195712, 'steps': 42685, 'loss/train': 1.5804864168167114} -11/07/2021 03:12:56 - INFO - __main__ - Step 42687: {'lr': 0.0004124184988330826, 'samples': 8195904, 'steps': 42686, 'loss/train': 0.9367903470993042} -11/07/2021 03:12:57 - INFO - __main__ - Step 42688: {'lr': 0.0004124144645408192, 'samples': 8196096, 'steps': 42687, 'loss/train': 1.4681004285812378} -11/07/2021 03:12:58 - INFO - __main__ - Step 42689: {'lr': 0.0004124104301753745, 'samples': 8196288, 'steps': 42688, 'loss/train': 1.3483312129974365} -11/07/2021 03:12:58 - INFO - __main__ - Step 42690: {'lr': 0.0004124063957367501, 'samples': 8196480, 'steps': 42689, 'loss/train': 1.2217729091644287} -11/07/2021 03:12:58 - INFO - __main__ - Step 42691: {'lr': 0.0004124023612249479, 'samples': 8196672, 'steps': 42690, 'loss/train': 1.4882365465164185} -11/07/2021 03:12:59 - INFO - __main__ - Step 42692: {'lr': 0.0004123983266399697, 'samples': 8196864, 'steps': 42691, 'loss/train': 1.5725913047790527} -11/07/2021 03:13:00 - INFO - __main__ - Step 42693: {'lr': 0.0004123942919818173, 'samples': 8197056, 'steps': 42692, 'loss/train': 1.2359098196029663} -11/07/2021 03:13:00 - INFO - __main__ - Step 42694: {'lr': 0.00041239025725049256, 'samples': 8197248, 'steps': 42693, 'loss/train': 1.1791036128997803} -11/07/2021 03:13:01 - INFO - __main__ - Step 42695: {'lr': 0.0004123862224459973, 'samples': 8197440, 'steps': 42694, 'loss/train': 1.843918800354004} -11/07/2021 03:13:01 - INFO - __main__ - Step 42696: {'lr': 0.0004123821875683333, 'samples': 8197632, 'steps': 42695, 'loss/train': 1.4438482522964478} -11/07/2021 03:13:01 - INFO - __main__ - Step 42697: {'lr': 0.0004123781526175023, 'samples': 8197824, 'steps': 42696, 'loss/train': 1.5149061679840088} -11/07/2021 03:13:02 - INFO - __main__ - Step 42698: {'lr': 0.0004123741175935063, 'samples': 8198016, 'steps': 42697, 'loss/train': 1.6861848831176758} -11/07/2021 03:13:03 - INFO - __main__ - Step 42699: {'lr': 0.000412370082496347, 'samples': 8198208, 'steps': 42698, 'loss/train': 1.707339882850647} -11/07/2021 03:13:03 - INFO - __main__ - Step 42700: {'lr': 0.0004123660473260263, 'samples': 8198400, 'steps': 42699, 'loss/train': 0.6675590872764587} -11/07/2021 03:13:03 - INFO - __main__ - Step 42701: {'lr': 0.0004123620120825459, 'samples': 8198592, 'steps': 42700, 'loss/train': 1.6229008436203003} -11/07/2021 03:13:04 - INFO - __main__ - Step 42702: {'lr': 0.00041235797676590776, 'samples': 8198784, 'steps': 42701, 'loss/train': 1.2133471965789795} -11/07/2021 03:13:04 - INFO - __main__ - Step 42703: {'lr': 0.0004123539413761136, 'samples': 8198976, 'steps': 42702, 'loss/train': 0.5439752340316772} -11/07/2021 03:13:05 - INFO - __main__ - Step 42704: {'lr': 0.0004123499059131652, 'samples': 8199168, 'steps': 42703, 'loss/train': 1.476960301399231} -11/07/2021 03:13:06 - INFO - __main__ - Step 42705: {'lr': 0.00041234587037706447, 'samples': 8199360, 'steps': 42704, 'loss/train': 1.2985483407974243} -11/07/2021 03:13:06 - INFO - __main__ - Step 42706: {'lr': 0.0004123418347678132, 'samples': 8199552, 'steps': 42705, 'loss/train': 1.567990779876709} -11/07/2021 03:13:06 - INFO - __main__ - Step 42707: {'lr': 0.00041233779908541316, 'samples': 8199744, 'steps': 42706, 'loss/train': 1.5503088235855103} -11/07/2021 03:13:07 - INFO - __main__ - Step 42708: {'lr': 0.0004123337633298662, 'samples': 8199936, 'steps': 42707, 'loss/train': 1.386027455329895} -11/07/2021 03:13:08 - INFO - __main__ - Step 42709: {'lr': 0.0004123297275011743, 'samples': 8200128, 'steps': 42708, 'loss/train': 1.4431533813476562} -11/07/2021 03:13:08 - INFO - __main__ - Step 42710: {'lr': 0.00041232569159933895, 'samples': 8200320, 'steps': 42709, 'loss/train': 1.3087667226791382} -11/07/2021 03:13:08 - INFO - __main__ - Step 42711: {'lr': 0.00041232165562436225, 'samples': 8200512, 'steps': 42710, 'loss/train': 1.0742384195327759} -11/07/2021 03:13:09 - INFO - __main__ - Step 42712: {'lr': 0.00041231761957624593, 'samples': 8200704, 'steps': 42711, 'loss/train': 1.6528187990188599} -11/07/2021 03:13:09 - INFO - __main__ - Step 42713: {'lr': 0.0004123135834549917, 'samples': 8200896, 'steps': 42712, 'loss/train': 1.6122461557388306} -11/07/2021 03:13:10 - INFO - __main__ - Step 42714: {'lr': 0.00041230954726060155, 'samples': 8201088, 'steps': 42713, 'loss/train': 1.4251964092254639} -11/07/2021 03:13:11 - INFO - __main__ - Step 42715: {'lr': 0.00041230551099307724, 'samples': 8201280, 'steps': 42714, 'loss/train': 1.4186371564865112} -11/07/2021 03:13:11 - INFO - __main__ - Step 42716: {'lr': 0.0004123014746524205, 'samples': 8201472, 'steps': 42715, 'loss/train': 1.5294647216796875} -11/07/2021 03:13:11 - INFO - __main__ - Step 42717: {'lr': 0.0004122974382386333, 'samples': 8201664, 'steps': 42716, 'loss/train': 1.4531598091125488} -11/07/2021 03:13:12 - INFO - __main__ - Step 42718: {'lr': 0.00041229340175171733, 'samples': 8201856, 'steps': 42717, 'loss/train': 1.565722942352295} -11/07/2021 03:13:13 - INFO - __main__ - Step 42719: {'lr': 0.00041228936519167446, 'samples': 8202048, 'steps': 42718, 'loss/train': 1.530666708946228} -11/07/2021 03:13:13 - INFO - __main__ - Step 42720: {'lr': 0.00041228532855850655, 'samples': 8202240, 'steps': 42719, 'loss/train': 1.1392285823822021} -11/07/2021 03:13:13 - INFO - __main__ - Step 42721: {'lr': 0.0004122812918522153, 'samples': 8202432, 'steps': 42720, 'loss/train': 0.7674376368522644} -11/07/2021 03:13:14 - INFO - __main__ - Step 42722: {'lr': 0.0004122772550728027, 'samples': 8202624, 'steps': 42721, 'loss/train': 1.3797781467437744} -11/07/2021 03:13:14 - INFO - __main__ - Step 42723: {'lr': 0.0004122732182202703, 'samples': 8202816, 'steps': 42722, 'loss/train': 1.799514651298523} -11/07/2021 03:13:15 - INFO - __main__ - Step 42724: {'lr': 0.0004122691812946202, 'samples': 8203008, 'steps': 42723, 'loss/train': 1.4491488933563232} -11/07/2021 03:13:16 - INFO - __main__ - Step 42725: {'lr': 0.00041226514429585417, 'samples': 8203200, 'steps': 42724, 'loss/train': 1.598483920097351} -11/07/2021 03:13:16 - INFO - __main__ - Step 42726: {'lr': 0.0004122611072239739, 'samples': 8203392, 'steps': 42725, 'loss/train': 1.3325248956680298} -11/07/2021 03:13:17 - INFO - __main__ - Step 42727: {'lr': 0.00041225707007898127, 'samples': 8203584, 'steps': 42726, 'loss/train': 1.7285935878753662} -11/07/2021 03:13:17 - INFO - __main__ - Step 42728: {'lr': 0.0004122530328608781, 'samples': 8203776, 'steps': 42727, 'loss/train': 1.6887344121932983} -11/07/2021 03:13:17 - INFO - __main__ - Step 42729: {'lr': 0.00041224899556966635, 'samples': 8203968, 'steps': 42728, 'loss/train': 1.861165165901184} -11/07/2021 03:13:18 - INFO - __main__ - Step 42730: {'lr': 0.00041224495820534757, 'samples': 8204160, 'steps': 42729, 'loss/train': 0.25296056270599365} -11/07/2021 03:13:19 - INFO - __main__ - Step 42731: {'lr': 0.00041224092076792374, 'samples': 8204352, 'steps': 42730, 'loss/train': 1.3531886339187622} -11/07/2021 03:13:19 - INFO - __main__ - Step 42732: {'lr': 0.0004122368832573967, 'samples': 8204544, 'steps': 42731, 'loss/train': 1.4255421161651611} -11/07/2021 03:13:19 - INFO - __main__ - Step 42733: {'lr': 0.00041223284567376816, 'samples': 8204736, 'steps': 42732, 'loss/train': 1.5796672105789185} -11/07/2021 03:13:20 - INFO - __main__ - Step 42734: {'lr': 0.00041222880801704005, 'samples': 8204928, 'steps': 42733, 'loss/train': 1.8132939338684082} -11/07/2021 03:13:21 - INFO - __main__ - Step 42735: {'lr': 0.0004122247702872141, 'samples': 8205120, 'steps': 42734, 'loss/train': 2.2760121822357178} -11/07/2021 03:13:21 - INFO - __main__ - Step 42736: {'lr': 0.0004122207324842923, 'samples': 8205312, 'steps': 42735, 'loss/train': 1.2232327461242676} -11/07/2021 03:13:22 - INFO - __main__ - Step 42737: {'lr': 0.00041221669460827614, 'samples': 8205504, 'steps': 42736, 'loss/train': 1.5809918642044067} -11/07/2021 03:13:22 - INFO - __main__ - Step 42738: {'lr': 0.00041221265665916776, 'samples': 8205696, 'steps': 42737, 'loss/train': 1.5916699171066284} -11/07/2021 03:13:22 - INFO - __main__ - Step 42739: {'lr': 0.00041220861863696886, 'samples': 8205888, 'steps': 42738, 'loss/train': 1.396811604499817} -11/07/2021 03:13:23 - INFO - __main__ - Step 42740: {'lr': 0.0004122045805416812, 'samples': 8206080, 'steps': 42739, 'loss/train': 1.6565934419631958} -11/07/2021 03:13:24 - INFO - __main__ - Step 42741: {'lr': 0.00041220054237330674, 'samples': 8206272, 'steps': 42740, 'loss/train': 1.755387783050537} -11/07/2021 03:13:24 - INFO - __main__ - Step 42742: {'lr': 0.00041219650413184714, 'samples': 8206464, 'steps': 42741, 'loss/train': 1.520103096961975} -11/07/2021 03:13:24 - INFO - __main__ - Step 42743: {'lr': 0.00041219246581730435, 'samples': 8206656, 'steps': 42742, 'loss/train': 1.721859097480774} -11/07/2021 03:13:25 - INFO - __main__ - Step 42744: {'lr': 0.0004121884274296801, 'samples': 8206848, 'steps': 42743, 'loss/train': 1.856993556022644} -11/07/2021 03:13:26 - INFO - __main__ - Step 42745: {'lr': 0.00041218438896897623, 'samples': 8207040, 'steps': 42744, 'loss/train': 1.4189162254333496} -11/07/2021 03:13:26 - INFO - __main__ - Step 42746: {'lr': 0.00041218035043519464, 'samples': 8207232, 'steps': 42745, 'loss/train': 1.5349032878875732} -11/07/2021 03:13:27 - INFO - __main__ - Step 42747: {'lr': 0.00041217631182833707, 'samples': 8207424, 'steps': 42746, 'loss/train': 1.169258713722229} -11/07/2021 03:13:27 - INFO - __main__ - Step 42748: {'lr': 0.00041217227314840535, 'samples': 8207616, 'steps': 42747, 'loss/train': 2.701878547668457} -11/07/2021 03:13:27 - INFO - __main__ - Step 42749: {'lr': 0.00041216823439540134, 'samples': 8207808, 'steps': 42748, 'loss/train': 1.5812207460403442} -11/07/2021 03:13:28 - INFO - __main__ - Step 42750: {'lr': 0.0004121641955693268, 'samples': 8208000, 'steps': 42749, 'loss/train': 1.693583369255066} -11/07/2021 03:13:29 - INFO - __main__ - Step 42751: {'lr': 0.00041216015667018357, 'samples': 8208192, 'steps': 42750, 'loss/train': 1.6943845748901367} -11/07/2021 03:13:29 - INFO - __main__ - Step 42752: {'lr': 0.00041215611769797344, 'samples': 8208384, 'steps': 42751, 'loss/train': 1.8799508810043335} -11/07/2021 03:13:29 - INFO - __main__ - Step 42753: {'lr': 0.00041215207865269833, 'samples': 8208576, 'steps': 42752, 'loss/train': 2.027010917663574} -11/07/2021 03:13:30 - INFO - __main__ - Step 42754: {'lr': 0.00041214803953435993, 'samples': 8208768, 'steps': 42753, 'loss/train': 1.3380992412567139} -11/07/2021 03:13:30 - INFO - __main__ - Step 42755: {'lr': 0.0004121440003429602, 'samples': 8208960, 'steps': 42754, 'loss/train': 1.271234393119812} -11/07/2021 03:13:31 - INFO - __main__ - Step 42756: {'lr': 0.0004121399610785008, 'samples': 8209152, 'steps': 42755, 'loss/train': 1.6511046886444092} -11/07/2021 03:13:32 - INFO - __main__ - Step 42757: {'lr': 0.00041213592174098367, 'samples': 8209344, 'steps': 42756, 'loss/train': 1.5800201892852783} -11/07/2021 03:13:32 - INFO - __main__ - Step 42758: {'lr': 0.00041213188233041065, 'samples': 8209536, 'steps': 42757, 'loss/train': 1.890745759010315} -11/07/2021 03:13:32 - INFO - __main__ - Step 42759: {'lr': 0.00041212784284678345, 'samples': 8209728, 'steps': 42758, 'loss/train': 1.4945995807647705} -11/07/2021 03:13:33 - INFO - __main__ - Step 42760: {'lr': 0.0004121238032901039, 'samples': 8209920, 'steps': 42759, 'loss/train': 1.3198996782302856} -11/07/2021 03:13:34 - INFO - __main__ - Step 42761: {'lr': 0.00041211976366037394, 'samples': 8210112, 'steps': 42760, 'loss/train': 0.8576481342315674} -11/07/2021 03:13:34 - INFO - __main__ - Step 42762: {'lr': 0.0004121157239575953, 'samples': 8210304, 'steps': 42761, 'loss/train': 1.662672758102417} -11/07/2021 03:13:35 - INFO - __main__ - Step 42763: {'lr': 0.0004121116841817699, 'samples': 8210496, 'steps': 42762, 'loss/train': 0.672544002532959} -11/07/2021 03:13:35 - INFO - __main__ - Step 42764: {'lr': 0.00041210764433289936, 'samples': 8210688, 'steps': 42763, 'loss/train': 1.4414068460464478} -11/07/2021 03:13:35 - INFO - __main__ - Step 42765: {'lr': 0.0004121036044109856, 'samples': 8210880, 'steps': 42764, 'loss/train': 1.4708746671676636} -11/07/2021 03:13:36 - INFO - __main__ - Step 42766: {'lr': 0.00041209956441603054, 'samples': 8211072, 'steps': 42765, 'loss/train': 1.7228068113327026} -11/07/2021 03:13:37 - INFO - __main__ - Step 42767: {'lr': 0.0004120955243480359, 'samples': 8211264, 'steps': 42766, 'loss/train': 1.7478610277175903} -11/07/2021 03:13:37 - INFO - __main__ - Step 42768: {'lr': 0.0004120914842070035, 'samples': 8211456, 'steps': 42767, 'loss/train': 1.1757432222366333} -11/07/2021 03:13:37 - INFO - __main__ - Step 42769: {'lr': 0.0004120874439929352, 'samples': 8211648, 'steps': 42768, 'loss/train': 1.5053163766860962} -11/07/2021 03:13:38 - INFO - __main__ - Step 42770: {'lr': 0.00041208340370583275, 'samples': 8211840, 'steps': 42769, 'loss/train': 0.9787638783454895} -11/07/2021 03:13:39 - INFO - __main__ - Step 42771: {'lr': 0.0004120793633456981, 'samples': 8212032, 'steps': 42770, 'loss/train': 1.8949719667434692} -11/07/2021 03:13:39 - INFO - __main__ - Step 42772: {'lr': 0.0004120753229125329, 'samples': 8212224, 'steps': 42771, 'loss/train': 1.3817518949508667} -11/07/2021 03:13:40 - INFO - __main__ - Step 42773: {'lr': 0.00041207128240633906, 'samples': 8212416, 'steps': 42772, 'loss/train': 1.1997261047363281} -11/07/2021 03:13:40 - INFO - __main__ - Step 42774: {'lr': 0.0004120672418271184, 'samples': 8212608, 'steps': 42773, 'loss/train': 1.54781174659729} -11/07/2021 03:13:40 - INFO - __main__ - Step 42775: {'lr': 0.0004120632011748728, 'samples': 8212800, 'steps': 42774, 'loss/train': 1.4456589221954346} -11/07/2021 03:13:41 - INFO - __main__ - Step 42776: {'lr': 0.00041205916044960406, 'samples': 8212992, 'steps': 42775, 'loss/train': 3.485616683959961} -11/07/2021 03:13:42 - INFO - __main__ - Step 42777: {'lr': 0.0004120551196513139, 'samples': 8213184, 'steps': 42776, 'loss/train': 1.132140040397644} -11/07/2021 03:13:42 - INFO - __main__ - Step 42778: {'lr': 0.0004120510787800042, 'samples': 8213376, 'steps': 42777, 'loss/train': 1.948042869567871} -11/07/2021 03:13:42 - INFO - __main__ - Step 42779: {'lr': 0.0004120470378356768, 'samples': 8213568, 'steps': 42778, 'loss/train': 1.4851789474487305} -11/07/2021 03:13:43 - INFO - __main__ - Step 42780: {'lr': 0.00041204299681833344, 'samples': 8213760, 'steps': 42779, 'loss/train': 1.4981358051300049} -11/07/2021 03:13:43 - INFO - __main__ - Step 42781: {'lr': 0.00041203895572797613, 'samples': 8213952, 'steps': 42780, 'loss/train': 1.876665472984314} -11/07/2021 03:13:44 - INFO - __main__ - Step 42782: {'lr': 0.00041203491456460653, 'samples': 8214144, 'steps': 42781, 'loss/train': 1.4150429964065552} -11/07/2021 03:13:44 - INFO - __main__ - Step 42783: {'lr': 0.00041203087332822644, 'samples': 8214336, 'steps': 42782, 'loss/train': 1.4986529350280762} -11/07/2021 03:13:45 - INFO - __main__ - Step 42784: {'lr': 0.0004120268320188378, 'samples': 8214528, 'steps': 42783, 'loss/train': 1.3611279726028442} -11/07/2021 03:13:45 - INFO - __main__ - Step 42785: {'lr': 0.00041202279063644234, 'samples': 8214720, 'steps': 42784, 'loss/train': 1.2365634441375732} -11/07/2021 03:13:45 - INFO - __main__ - Step 42786: {'lr': 0.00041201874918104185, 'samples': 8214912, 'steps': 42785, 'loss/train': 1.448770523071289} -11/07/2021 03:13:47 - INFO - __main__ - Step 42787: {'lr': 0.0004120147076526383, 'samples': 8215104, 'steps': 42786, 'loss/train': 1.3730212450027466} -11/07/2021 03:13:47 - INFO - __main__ - Step 42788: {'lr': 0.0004120106660512334, 'samples': 8215296, 'steps': 42787, 'loss/train': 1.5505905151367188} -11/07/2021 03:13:48 - INFO - __main__ - Step 42789: {'lr': 0.000412006624376829, 'samples': 8215488, 'steps': 42788, 'loss/train': 1.574457049369812} -11/07/2021 03:13:48 - INFO - __main__ - Step 42790: {'lr': 0.0004120025826294269, 'samples': 8215680, 'steps': 42789, 'loss/train': 1.6592400074005127} -11/07/2021 03:13:48 - INFO - __main__ - Step 42791: {'lr': 0.00041199854080902897, 'samples': 8215872, 'steps': 42790, 'loss/train': 1.792243242263794} -11/07/2021 03:13:49 - INFO - __main__ - Step 42792: {'lr': 0.00041199449891563694, 'samples': 8216064, 'steps': 42791, 'loss/train': 1.2733299732208252} -11/07/2021 03:13:50 - INFO - __main__ - Step 42793: {'lr': 0.00041199045694925273, 'samples': 8216256, 'steps': 42792, 'loss/train': 1.6514403820037842} -11/07/2021 03:13:50 - INFO - __main__ - Step 42794: {'lr': 0.0004119864149098781, 'samples': 8216448, 'steps': 42793, 'loss/train': 2.1267051696777344} -11/07/2021 03:13:50 - INFO - __main__ - Step 42795: {'lr': 0.0004119823727975149, 'samples': 8216640, 'steps': 42794, 'loss/train': 1.120583176612854} -11/07/2021 03:13:51 - INFO - __main__ - Step 42796: {'lr': 0.00041197833061216494, 'samples': 8216832, 'steps': 42795, 'loss/train': 1.3337584733963013} -11/07/2021 03:13:51 - INFO - __main__ - Step 42797: {'lr': 0.00041197428835383, 'samples': 8217024, 'steps': 42796, 'loss/train': 0.7551344037055969} -11/07/2021 03:13:52 - INFO - __main__ - Step 42798: {'lr': 0.00041197024602251204, 'samples': 8217216, 'steps': 42797, 'loss/train': 1.4640302658081055} -11/07/2021 03:13:53 - INFO - __main__ - Step 42799: {'lr': 0.0004119662036182127, 'samples': 8217408, 'steps': 42798, 'loss/train': 1.2800933122634888} -11/07/2021 03:13:53 - INFO - __main__ - Step 42800: {'lr': 0.00041196216114093397, 'samples': 8217600, 'steps': 42799, 'loss/train': 1.4961788654327393} -11/07/2021 03:13:53 - INFO - __main__ - Step 42801: {'lr': 0.00041195811859067756, 'samples': 8217792, 'steps': 42800, 'loss/train': 1.5047647953033447} -11/07/2021 03:13:54 - INFO - __main__ - Step 42802: {'lr': 0.0004119540759674453, 'samples': 8217984, 'steps': 42801, 'loss/train': 1.2064974308013916} -11/07/2021 03:13:54 - INFO - __main__ - Step 42803: {'lr': 0.000411950033271239, 'samples': 8218176, 'steps': 42802, 'loss/train': 1.220013976097107} -11/07/2021 03:13:55 - INFO - __main__ - Step 42804: {'lr': 0.0004119459905020606, 'samples': 8218368, 'steps': 42803, 'loss/train': 1.2036381959915161} -11/07/2021 03:13:55 - INFO - __main__ - Step 42805: {'lr': 0.0004119419476599118, 'samples': 8218560, 'steps': 42804, 'loss/train': 1.4537402391433716} -11/07/2021 03:13:56 - INFO - __main__ - Step 42806: {'lr': 0.0004119379047447944, 'samples': 8218752, 'steps': 42805, 'loss/train': 1.662406086921692} -11/07/2021 03:13:56 - INFO - __main__ - Step 42807: {'lr': 0.00041193386175671033, 'samples': 8218944, 'steps': 42806, 'loss/train': 1.4320244789123535} -11/07/2021 03:13:56 - INFO - __main__ - Step 42808: {'lr': 0.0004119298186956613, 'samples': 8219136, 'steps': 42807, 'loss/train': 1.7451808452606201} -11/07/2021 03:13:57 - INFO - __main__ - Step 42809: {'lr': 0.00041192577556164924, 'samples': 8219328, 'steps': 42808, 'loss/train': 3.0425539016723633} -11/07/2021 03:13:58 - INFO - __main__ - Step 42810: {'lr': 0.000411921732354676, 'samples': 8219520, 'steps': 42809, 'loss/train': 1.4344040155410767} -11/07/2021 03:13:58 - INFO - __main__ - Step 42811: {'lr': 0.00041191768907474326, 'samples': 8219712, 'steps': 42810, 'loss/train': 1.871738314628601} -11/07/2021 03:13:58 - INFO - __main__ - Step 42812: {'lr': 0.00041191364572185286, 'samples': 8219904, 'steps': 42811, 'loss/train': 1.4439513683319092} -11/07/2021 03:13:59 - INFO - __main__ - Step 42813: {'lr': 0.0004119096022960067, 'samples': 8220096, 'steps': 42812, 'loss/train': 1.6381014585494995} -11/07/2021 03:14:00 - INFO - __main__ - Step 42814: {'lr': 0.0004119055587972066, 'samples': 8220288, 'steps': 42813, 'loss/train': 1.3307337760925293} -11/07/2021 03:14:00 - INFO - __main__ - Step 42815: {'lr': 0.0004119015152254543, 'samples': 8220480, 'steps': 42814, 'loss/train': 1.7919366359710693} -11/07/2021 03:14:01 - INFO - __main__ - Step 42816: {'lr': 0.00041189747158075176, 'samples': 8220672, 'steps': 42815, 'loss/train': 1.4417839050292969} -11/07/2021 03:14:01 - INFO - __main__ - Step 42817: {'lr': 0.00041189342786310067, 'samples': 8220864, 'steps': 42816, 'loss/train': 1.1310538053512573} -11/07/2021 03:14:01 - INFO - __main__ - Step 42818: {'lr': 0.0004118893840725029, 'samples': 8221056, 'steps': 42817, 'loss/train': 1.6472176313400269} -11/07/2021 03:14:02 - INFO - __main__ - Step 42819: {'lr': 0.0004118853402089603, 'samples': 8221248, 'steps': 42818, 'loss/train': 0.6757338643074036} -11/07/2021 03:14:03 - INFO - __main__ - Step 42820: {'lr': 0.0004118812962724746, 'samples': 8221440, 'steps': 42819, 'loss/train': 1.600584626197815} -11/07/2021 03:14:03 - INFO - __main__ - Step 42821: {'lr': 0.00041187725226304775, 'samples': 8221632, 'steps': 42820, 'loss/train': 1.9334253072738647} -11/07/2021 03:14:04 - INFO - __main__ - Step 42822: {'lr': 0.0004118732081806814, 'samples': 8221824, 'steps': 42821, 'loss/train': 1.7592384815216064} -11/07/2021 03:14:04 - INFO - __main__ - Step 42823: {'lr': 0.0004118691640253777, 'samples': 8222016, 'steps': 42822, 'loss/train': 0.5113934874534607} -11/07/2021 03:14:04 - INFO - __main__ - Step 42824: {'lr': 0.00041186511979713806, 'samples': 8222208, 'steps': 42823, 'loss/train': 1.31758451461792} -11/07/2021 03:14:05 - INFO - __main__ - Step 42825: {'lr': 0.00041186107549596453, 'samples': 8222400, 'steps': 42824, 'loss/train': 1.43822181224823} -11/07/2021 03:14:06 - INFO - __main__ - Step 42826: {'lr': 0.0004118570311218589, 'samples': 8222592, 'steps': 42825, 'loss/train': 1.5050877332687378} -11/07/2021 03:14:06 - INFO - __main__ - Step 42827: {'lr': 0.00041185298667482294, 'samples': 8222784, 'steps': 42826, 'loss/train': 1.505362868309021} -11/07/2021 03:14:06 - INFO - __main__ - Step 42828: {'lr': 0.0004118489421548586, 'samples': 8222976, 'steps': 42827, 'loss/train': 0.5131959915161133} -11/07/2021 03:14:07 - INFO - __main__ - Step 42829: {'lr': 0.00041184489756196764, 'samples': 8223168, 'steps': 42828, 'loss/train': 1.1229454278945923} -11/07/2021 03:14:07 - INFO - __main__ - Step 42830: {'lr': 0.0004118408528961519, 'samples': 8223360, 'steps': 42829, 'loss/train': 1.5232681035995483} -11/07/2021 03:14:08 - INFO - __main__ - Step 42831: {'lr': 0.00041183680815741307, 'samples': 8223552, 'steps': 42830, 'loss/train': 1.2058498859405518} -11/07/2021 03:14:08 - INFO - __main__ - Step 42832: {'lr': 0.0004118327633457531, 'samples': 8223744, 'steps': 42831, 'loss/train': 0.5994836688041687} -11/07/2021 03:14:09 - INFO - __main__ - Step 42833: {'lr': 0.00041182871846117373, 'samples': 8223936, 'steps': 42832, 'loss/train': 1.479069471359253} -11/07/2021 03:14:09 - INFO - __main__ - Step 42834: {'lr': 0.0004118246735036769, 'samples': 8224128, 'steps': 42833, 'loss/train': 1.2316757440567017} -11/07/2021 03:14:09 - INFO - __main__ - Step 42835: {'lr': 0.0004118206284732644, 'samples': 8224320, 'steps': 42834, 'loss/train': 1.3874062299728394} -11/07/2021 03:14:10 - INFO - __main__ - Step 42836: {'lr': 0.000411816583369938, 'samples': 8224512, 'steps': 42835, 'loss/train': 1.6726195812225342} -11/07/2021 03:14:11 - INFO - __main__ - Step 42837: {'lr': 0.0004118125381936996, 'samples': 8224704, 'steps': 42836, 'loss/train': 1.5835198163986206} -11/07/2021 03:14:11 - INFO - __main__ - Step 42838: {'lr': 0.0004118084929445508, 'samples': 8224896, 'steps': 42837, 'loss/train': 1.3595654964447021} -11/07/2021 03:14:11 - INFO - __main__ - Step 42839: {'lr': 0.0004118044476224937, 'samples': 8225088, 'steps': 42838, 'loss/train': 1.2652711868286133} -11/07/2021 03:14:12 - INFO - __main__ - Step 42840: {'lr': 0.00041180040222753, 'samples': 8225280, 'steps': 42839, 'loss/train': 1.5912714004516602} -11/07/2021 03:14:13 - INFO - __main__ - Step 42841: {'lr': 0.00041179635675966155, 'samples': 8225472, 'steps': 42840, 'loss/train': 1.1543596982955933} -11/07/2021 03:14:13 - INFO - __main__ - Step 42842: {'lr': 0.00041179231121889014, 'samples': 8225664, 'steps': 42841, 'loss/train': 0.6163930892944336} -11/07/2021 03:14:14 - INFO - __main__ - Step 42843: {'lr': 0.0004117882656052176, 'samples': 8225856, 'steps': 42842, 'loss/train': 1.5155036449432373} -11/07/2021 03:14:14 - INFO - __main__ - Step 42844: {'lr': 0.0004117842199186458, 'samples': 8226048, 'steps': 42843, 'loss/train': 1.2637860774993896} -11/07/2021 03:14:14 - INFO - __main__ - Step 42845: {'lr': 0.00041178017415917655, 'samples': 8226240, 'steps': 42844, 'loss/train': 1.3483153581619263} -11/07/2021 03:14:15 - INFO - __main__ - Step 42846: {'lr': 0.00041177612832681156, 'samples': 8226432, 'steps': 42845, 'loss/train': 1.0798571109771729} -11/07/2021 03:14:16 - INFO - __main__ - Step 42847: {'lr': 0.00041177208242155285, 'samples': 8226624, 'steps': 42846, 'loss/train': 1.6547551155090332} -11/07/2021 03:14:16 - INFO - __main__ - Step 42848: {'lr': 0.000411768036443402, 'samples': 8226816, 'steps': 42847, 'loss/train': 2.1480069160461426} -11/07/2021 03:14:17 - INFO - __main__ - Step 42849: {'lr': 0.0004117639903923611, 'samples': 8227008, 'steps': 42848, 'loss/train': 0.9353717565536499} -11/07/2021 03:14:17 - INFO - __main__ - Step 42850: {'lr': 0.00041175994426843177, 'samples': 8227200, 'steps': 42849, 'loss/train': 1.4175337553024292} -11/07/2021 03:14:18 - INFO - __main__ - Step 42851: {'lr': 0.00041175589807161597, 'samples': 8227392, 'steps': 42850, 'loss/train': 1.5138330459594727} -11/07/2021 03:14:18 - INFO - __main__ - Step 42852: {'lr': 0.0004117518518019154, 'samples': 8227584, 'steps': 42851, 'loss/train': 1.3619396686553955} -11/07/2021 03:14:19 - INFO - __main__ - Step 42853: {'lr': 0.00041174780545933195, 'samples': 8227776, 'steps': 42852, 'loss/train': 1.7273114919662476} -11/07/2021 03:14:19 - INFO - __main__ - Step 42854: {'lr': 0.0004117437590438674, 'samples': 8227968, 'steps': 42853, 'loss/train': 1.7855308055877686} -11/07/2021 03:14:19 - INFO - __main__ - Step 42855: {'lr': 0.0004117397125555237, 'samples': 8228160, 'steps': 42854, 'loss/train': 1.7407039403915405} -11/07/2021 03:14:21 - INFO - __main__ - Step 42856: {'lr': 0.00041173566599430245, 'samples': 8228352, 'steps': 42855, 'loss/train': 1.6007099151611328} -11/07/2021 03:14:22 - INFO - __main__ - Step 42857: {'lr': 0.00041173161936020573, 'samples': 8228544, 'steps': 42856, 'loss/train': 1.495436668395996} -11/07/2021 03:14:22 - INFO - __main__ - Step 42858: {'lr': 0.0004117275726532352, 'samples': 8228736, 'steps': 42857, 'loss/train': 1.219700574874878} -11/07/2021 03:14:22 - INFO - __main__ - Step 42859: {'lr': 0.0004117235258733927, 'samples': 8228928, 'steps': 42858, 'loss/train': 1.6199307441711426} -11/07/2021 03:14:23 - INFO - __main__ - Step 42860: {'lr': 0.00041171947902068006, 'samples': 8229120, 'steps': 42859, 'loss/train': 1.9934972524642944} -11/07/2021 03:14:23 - INFO - __main__ - Step 42861: {'lr': 0.00041171543209509923, 'samples': 8229312, 'steps': 42860, 'loss/train': 1.7413346767425537} -11/07/2021 03:14:23 - INFO - __main__ - Step 42862: {'lr': 0.0004117113850966517, 'samples': 8229504, 'steps': 42861, 'loss/train': 1.840273141860962} -11/07/2021 03:14:24 - INFO - __main__ - Step 42863: {'lr': 0.00041170733802533974, 'samples': 8229696, 'steps': 42862, 'loss/train': 1.7821216583251953} -11/07/2021 03:14:25 - INFO - __main__ - Step 42864: {'lr': 0.0004117032908811649, 'samples': 8229888, 'steps': 42863, 'loss/train': 1.765580177307129} -11/07/2021 03:14:25 - INFO - __main__ - Step 42865: {'lr': 0.000411699243664129, 'samples': 8230080, 'steps': 42864, 'loss/train': 0.8765882253646851} -11/07/2021 03:14:26 - INFO - __main__ - Step 42866: {'lr': 0.00041169519637423394, 'samples': 8230272, 'steps': 42865, 'loss/train': 1.6690140962600708} -11/07/2021 03:14:26 - INFO - __main__ - Step 42867: {'lr': 0.0004116911490114815, 'samples': 8230464, 'steps': 42866, 'loss/train': 0.9538524150848389} -11/07/2021 03:14:26 - INFO - __main__ - Step 42868: {'lr': 0.0004116871015758735, 'samples': 8230656, 'steps': 42867, 'loss/train': 1.6665130853652954} -11/07/2021 03:14:27 - INFO - __main__ - Step 42869: {'lr': 0.0004116830540674118, 'samples': 8230848, 'steps': 42868, 'loss/train': 1.5690141916275024} -11/07/2021 03:14:28 - INFO - __main__ - Step 42870: {'lr': 0.00041167900648609825, 'samples': 8231040, 'steps': 42869, 'loss/train': 1.5212374925613403} -11/07/2021 03:14:28 - INFO - __main__ - Step 42871: {'lr': 0.00041167495883193464, 'samples': 8231232, 'steps': 42870, 'loss/train': 1.4287992715835571} -11/07/2021 03:14:28 - INFO - __main__ - Step 42872: {'lr': 0.00041167091110492273, 'samples': 8231424, 'steps': 42871, 'loss/train': 1.6299023628234863} -11/07/2021 03:14:29 - INFO - __main__ - Step 42873: {'lr': 0.0004116668633050644, 'samples': 8231616, 'steps': 42872, 'loss/train': 1.3518669605255127} -11/07/2021 03:14:29 - INFO - __main__ - Step 42874: {'lr': 0.0004116628154323616, 'samples': 8231808, 'steps': 42873, 'loss/train': 1.5255669355392456} -11/07/2021 03:14:30 - INFO - __main__ - Step 42875: {'lr': 0.0004116587674868159, 'samples': 8232000, 'steps': 42874, 'loss/train': 1.3380085229873657} -11/07/2021 03:14:31 - INFO - __main__ - Step 42876: {'lr': 0.00041165471946842924, 'samples': 8232192, 'steps': 42875, 'loss/train': 1.9206820726394653} -11/07/2021 03:14:31 - INFO - __main__ - Step 42877: {'lr': 0.00041165067137720356, 'samples': 8232384, 'steps': 42876, 'loss/train': 1.344838261604309} -11/07/2021 03:14:31 - INFO - __main__ - Step 42878: {'lr': 0.00041164662321314054, 'samples': 8232576, 'steps': 42877, 'loss/train': 1.2000056505203247} -11/07/2021 03:14:32 - INFO - __main__ - Step 42879: {'lr': 0.000411642574976242, 'samples': 8232768, 'steps': 42878, 'loss/train': 1.7511587142944336} -11/07/2021 03:14:33 - INFO - __main__ - Step 42880: {'lr': 0.0004116385266665099, 'samples': 8232960, 'steps': 42879, 'loss/train': 0.9567857384681702} -11/07/2021 03:14:33 - INFO - __main__ - Step 42881: {'lr': 0.0004116344782839459, 'samples': 8233152, 'steps': 42880, 'loss/train': 1.3815840482711792} -11/07/2021 03:14:33 - INFO - __main__ - Step 42882: {'lr': 0.00041163042982855194, 'samples': 8233344, 'steps': 42881, 'loss/train': 1.416580080986023} -11/07/2021 03:14:34 - INFO - __main__ - Step 42883: {'lr': 0.00041162638130032975, 'samples': 8233536, 'steps': 42882, 'loss/train': 1.3377119302749634} -11/07/2021 03:14:34 - INFO - __main__ - Step 42884: {'lr': 0.00041162233269928126, 'samples': 8233728, 'steps': 42883, 'loss/train': 1.66068434715271} -11/07/2021 03:14:35 - INFO - __main__ - Step 42885: {'lr': 0.0004116182840254082, 'samples': 8233920, 'steps': 42884, 'loss/train': 1.219361662864685} -11/07/2021 03:14:35 - INFO - __main__ - Step 42886: {'lr': 0.0004116142352787125, 'samples': 8234112, 'steps': 42885, 'loss/train': 1.7923866510391235} -11/07/2021 03:14:36 - INFO - __main__ - Step 42887: {'lr': 0.00041161018645919593, 'samples': 8234304, 'steps': 42886, 'loss/train': 1.2530755996704102} -11/07/2021 03:14:36 - INFO - __main__ - Step 42888: {'lr': 0.00041160613756686015, 'samples': 8234496, 'steps': 42887, 'loss/train': 1.4656062126159668} -11/07/2021 03:14:37 - INFO - __main__ - Step 42889: {'lr': 0.00041160208860170725, 'samples': 8234688, 'steps': 42888, 'loss/train': 1.395034670829773} -11/07/2021 03:14:38 - INFO - __main__ - Step 42890: {'lr': 0.000411598039563739, 'samples': 8234880, 'steps': 42889, 'loss/train': 1.0422735214233398} -11/07/2021 03:14:38 - INFO - __main__ - Step 42891: {'lr': 0.0004115939904529571, 'samples': 8235072, 'steps': 42890, 'loss/train': 1.6529215574264526} -11/07/2021 03:14:38 - INFO - __main__ - Step 42892: {'lr': 0.00041158994126936347, 'samples': 8235264, 'steps': 42891, 'loss/train': 1.6952149868011475} -11/07/2021 03:14:39 - INFO - __main__ - Step 42893: {'lr': 0.0004115858920129598, 'samples': 8235456, 'steps': 42892, 'loss/train': 1.9112871885299683} -11/07/2021 03:14:39 - INFO - __main__ - Step 42894: {'lr': 0.0004115818426837481, 'samples': 8235648, 'steps': 42893, 'loss/train': 1.6131938695907593} -11/07/2021 03:14:39 - INFO - __main__ - Step 42895: {'lr': 0.0004115777932817301, 'samples': 8235840, 'steps': 42894, 'loss/train': 1.5090101957321167} -11/07/2021 03:14:41 - INFO - __main__ - Step 42896: {'lr': 0.00041157374380690765, 'samples': 8236032, 'steps': 42895, 'loss/train': 4.94158935546875} -11/07/2021 03:14:41 - INFO - __main__ - Step 42897: {'lr': 0.0004115696942592826, 'samples': 8236224, 'steps': 42896, 'loss/train': 1.6551597118377686} -11/07/2021 03:14:41 - INFO - __main__ - Step 42898: {'lr': 0.0004115656446388567, 'samples': 8236416, 'steps': 42897, 'loss/train': 1.551294207572937} -11/07/2021 03:14:42 - INFO - __main__ - Step 42899: {'lr': 0.00041156159494563183, 'samples': 8236608, 'steps': 42898, 'loss/train': 1.627911925315857} -11/07/2021 03:14:42 - INFO - __main__ - Step 42900: {'lr': 0.00041155754517960974, 'samples': 8236800, 'steps': 42899, 'loss/train': 1.7276084423065186} -11/07/2021 03:14:42 - INFO - __main__ - Step 42901: {'lr': 0.00041155349534079236, 'samples': 8236992, 'steps': 42900, 'loss/train': 1.9185916185379028} -11/07/2021 03:14:43 - INFO - __main__ - Step 42902: {'lr': 0.0004115494454291815, 'samples': 8237184, 'steps': 42901, 'loss/train': 1.4276373386383057} -11/07/2021 03:14:44 - INFO - __main__ - Step 42903: {'lr': 0.0004115453954447789, 'samples': 8237376, 'steps': 42902, 'loss/train': 1.8472546339035034} -11/07/2021 03:14:44 - INFO - __main__ - Step 42904: {'lr': 0.0004115413453875865, 'samples': 8237568, 'steps': 42903, 'loss/train': 0.8522806167602539} -11/07/2021 03:14:44 - INFO - __main__ - Step 42905: {'lr': 0.000411537295257606, 'samples': 8237760, 'steps': 42904, 'loss/train': 1.500504493713379} -11/07/2021 03:14:45 - INFO - __main__ - Step 42906: {'lr': 0.00041153324505483933, 'samples': 8237952, 'steps': 42905, 'loss/train': 1.5426833629608154} -11/07/2021 03:14:46 - INFO - __main__ - Step 42907: {'lr': 0.0004115291947792882, 'samples': 8238144, 'steps': 42906, 'loss/train': 1.536191463470459} -11/07/2021 03:14:46 - INFO - __main__ - Step 42908: {'lr': 0.00041152514443095454, 'samples': 8238336, 'steps': 42907, 'loss/train': 1.0617425441741943} -11/07/2021 03:14:46 - INFO - __main__ - Step 42909: {'lr': 0.00041152109400984015, 'samples': 8238528, 'steps': 42908, 'loss/train': 2.1334660053253174} -11/07/2021 03:14:47 - INFO - __main__ - Step 42910: {'lr': 0.0004115170435159469, 'samples': 8238720, 'steps': 42909, 'loss/train': 1.8392415046691895} -11/07/2021 03:14:47 - INFO - __main__ - Step 42911: {'lr': 0.00041151299294927657, 'samples': 8238912, 'steps': 42910, 'loss/train': 1.5095146894454956} -11/07/2021 03:14:48 - INFO - __main__ - Step 42912: {'lr': 0.0004115089423098309, 'samples': 8239104, 'steps': 42911, 'loss/train': 1.5403552055358887} -11/07/2021 03:14:49 - INFO - __main__ - Step 42913: {'lr': 0.00041150489159761186, 'samples': 8239296, 'steps': 42912, 'loss/train': 1.5937893390655518} -11/07/2021 03:14:49 - INFO - __main__ - Step 42914: {'lr': 0.00041150084081262105, 'samples': 8239488, 'steps': 42913, 'loss/train': 1.7277464866638184} -11/07/2021 03:14:49 - INFO - __main__ - Step 42915: {'lr': 0.0004114967899548606, 'samples': 8239680, 'steps': 42914, 'loss/train': 1.2665598392486572} -11/07/2021 03:14:50 - INFO - __main__ - Step 42916: {'lr': 0.0004114927390243322, 'samples': 8239872, 'steps': 42915, 'loss/train': 1.7183034420013428} -11/07/2021 03:14:51 - INFO - __main__ - Step 42917: {'lr': 0.00041148868802103766, 'samples': 8240064, 'steps': 42916, 'loss/train': 1.6050708293914795} -11/07/2021 03:14:51 - INFO - __main__ - Step 42918: {'lr': 0.00041148463694497874, 'samples': 8240256, 'steps': 42917, 'loss/train': 1.6935396194458008} -11/07/2021 03:14:51 - INFO - __main__ - Step 42919: {'lr': 0.00041148058579615733, 'samples': 8240448, 'steps': 42918, 'loss/train': 1.258515477180481} -11/07/2021 03:14:52 - INFO - __main__ - Step 42920: {'lr': 0.00041147653457457534, 'samples': 8240640, 'steps': 42919, 'loss/train': 1.4335256814956665} -11/07/2021 03:14:52 - INFO - __main__ - Step 42921: {'lr': 0.0004114724832802345, 'samples': 8240832, 'steps': 42920, 'loss/train': 1.331539511680603} -11/07/2021 03:14:52 - INFO - __main__ - Step 42922: {'lr': 0.0004114684319131366, 'samples': 8241024, 'steps': 42921, 'loss/train': 0.9531698822975159} -11/07/2021 03:14:53 - INFO - __main__ - Step 42923: {'lr': 0.00041146438047328347, 'samples': 8241216, 'steps': 42922, 'loss/train': 1.325085163116455} -11/07/2021 03:14:54 - INFO - __main__ - Step 42924: {'lr': 0.0004114603289606771, 'samples': 8241408, 'steps': 42923, 'loss/train': 2.0017459392547607} -11/07/2021 03:14:54 - INFO - __main__ - Step 42925: {'lr': 0.00041145627737531915, 'samples': 8241600, 'steps': 42924, 'loss/train': 1.332912802696228} -11/07/2021 03:14:55 - INFO - __main__ - Step 42926: {'lr': 0.0004114522257172115, 'samples': 8241792, 'steps': 42925, 'loss/train': 1.446260929107666} -11/07/2021 03:14:55 - INFO - __main__ - Step 42927: {'lr': 0.000411448173986356, 'samples': 8241984, 'steps': 42926, 'loss/train': 1.5102177858352661} -11/07/2021 03:14:56 - INFO - __main__ - Step 42928: {'lr': 0.0004114441221827544, 'samples': 8242176, 'steps': 42927, 'loss/train': 1.4338157176971436} -11/07/2021 03:14:56 - INFO - __main__ - Step 42929: {'lr': 0.0004114400703064085, 'samples': 8242368, 'steps': 42928, 'loss/train': 1.3309646844863892} -11/07/2021 03:14:57 - INFO - __main__ - Step 42930: {'lr': 0.0004114360183573203, 'samples': 8242560, 'steps': 42929, 'loss/train': 1.402104139328003} -11/07/2021 03:14:57 - INFO - __main__ - Step 42931: {'lr': 0.0004114319663354915, 'samples': 8242752, 'steps': 42930, 'loss/train': 1.8404631614685059} -11/07/2021 03:14:57 - INFO - __main__ - Step 42932: {'lr': 0.000411427914240924, 'samples': 8242944, 'steps': 42931, 'loss/train': 1.820628046989441} -11/07/2021 03:14:58 - INFO - __main__ - Step 42933: {'lr': 0.0004114238620736195, 'samples': 8243136, 'steps': 42932, 'loss/train': 1.276533603668213} -11/07/2021 03:14:59 - INFO - __main__ - Step 42934: {'lr': 0.00041141980983357986, 'samples': 8243328, 'steps': 42933, 'loss/train': 1.1286767721176147} -11/07/2021 03:14:59 - INFO - __main__ - Step 42935: {'lr': 0.000411415757520807, 'samples': 8243520, 'steps': 42934, 'loss/train': 1.6131216287612915} -11/07/2021 03:14:59 - INFO - __main__ - Step 42936: {'lr': 0.00041141170513530267, 'samples': 8243712, 'steps': 42935, 'loss/train': 1.4220731258392334} -11/07/2021 03:15:00 - INFO - __main__ - Step 42937: {'lr': 0.0004114076526770688, 'samples': 8243904, 'steps': 42936, 'loss/train': 1.399277687072754} -11/07/2021 03:15:01 - INFO - __main__ - Step 42938: {'lr': 0.000411403600146107, 'samples': 8244096, 'steps': 42937, 'loss/train': 2.115095376968384} -11/07/2021 03:15:01 - INFO - __main__ - Step 42939: {'lr': 0.0004113995475424193, 'samples': 8244288, 'steps': 42938, 'loss/train': 1.4036604166030884} -11/07/2021 03:15:02 - INFO - __main__ - Step 42940: {'lr': 0.0004113954948660075, 'samples': 8244480, 'steps': 42939, 'loss/train': 1.0579941272735596} -11/07/2021 03:15:02 - INFO - __main__ - Step 42941: {'lr': 0.00041139144211687327, 'samples': 8244672, 'steps': 42940, 'loss/train': 1.5197367668151855} -11/07/2021 03:15:02 - INFO - __main__ - Step 42942: {'lr': 0.0004113873892950186, 'samples': 8244864, 'steps': 42941, 'loss/train': 1.0686310529708862} -11/07/2021 03:15:03 - INFO - __main__ - Step 42943: {'lr': 0.00041138333640044523, 'samples': 8245056, 'steps': 42942, 'loss/train': 1.4850374460220337} -11/07/2021 03:15:04 - INFO - __main__ - Step 42944: {'lr': 0.0004113792834331551, 'samples': 8245248, 'steps': 42943, 'loss/train': 1.482663869857788} -11/07/2021 03:15:04 - INFO - __main__ - Step 42945: {'lr': 0.00041137523039314994, 'samples': 8245440, 'steps': 42944, 'loss/train': 1.2159746885299683} -11/07/2021 03:15:05 - INFO - __main__ - Step 42946: {'lr': 0.0004113711772804315, 'samples': 8245632, 'steps': 42945, 'loss/train': 1.1424510478973389} -11/07/2021 03:15:05 - INFO - __main__ - Step 42947: {'lr': 0.0004113671240950018, 'samples': 8245824, 'steps': 42946, 'loss/train': 1.3112131357192993} -11/07/2021 03:15:06 - INFO - __main__ - Step 42948: {'lr': 0.0004113630708368625, 'samples': 8246016, 'steps': 42947, 'loss/train': 1.9154735803604126} -11/07/2021 03:15:06 - INFO - __main__ - Step 42949: {'lr': 0.0004113590175060155, 'samples': 8246208, 'steps': 42948, 'loss/train': 1.2409237623214722} -11/07/2021 03:15:07 - INFO - __main__ - Step 42950: {'lr': 0.00041135496410246264, 'samples': 8246400, 'steps': 42949, 'loss/train': 1.1103994846343994} -11/07/2021 03:15:07 - INFO - __main__ - Step 42951: {'lr': 0.0004113509106262058, 'samples': 8246592, 'steps': 42950, 'loss/train': 1.343586802482605} -11/07/2021 03:15:07 - INFO - __main__ - Step 42952: {'lr': 0.00041134685707724656, 'samples': 8246784, 'steps': 42951, 'loss/train': 1.314520239830017} -11/07/2021 03:15:08 - INFO - __main__ - Step 42953: {'lr': 0.000411342803455587, 'samples': 8246976, 'steps': 42952, 'loss/train': 1.8426026105880737} -11/07/2021 03:15:09 - INFO - __main__ - Step 42954: {'lr': 0.0004113387497612289, 'samples': 8247168, 'steps': 42953, 'loss/train': 1.7123295068740845} -11/07/2021 03:15:09 - INFO - __main__ - Step 42955: {'lr': 0.00041133469599417393, 'samples': 8247360, 'steps': 42954, 'loss/train': 1.0952670574188232} -11/07/2021 03:15:09 - INFO - __main__ - Step 42956: {'lr': 0.00041133064215442415, 'samples': 8247552, 'steps': 42955, 'loss/train': 2.494164228439331} -11/07/2021 03:15:10 - INFO - __main__ - Step 42957: {'lr': 0.0004113265882419812, 'samples': 8247744, 'steps': 42956, 'loss/train': 1.4035422801971436} -11/07/2021 03:15:10 - INFO - __main__ - Step 42958: {'lr': 0.0004113225342568471, 'samples': 8247936, 'steps': 42957, 'loss/train': 1.3970733880996704} -11/07/2021 03:15:11 - INFO - __main__ - Step 42959: {'lr': 0.00041131848019902343, 'samples': 8248128, 'steps': 42958, 'loss/train': 1.5247231721878052} -11/07/2021 03:15:11 - INFO - __main__ - Step 42960: {'lr': 0.0004113144260685122, 'samples': 8248320, 'steps': 42959, 'loss/train': 1.2599166631698608} -11/07/2021 03:15:12 - INFO - __main__ - Step 42961: {'lr': 0.00041131037186531514, 'samples': 8248512, 'steps': 42960, 'loss/train': 1.5106650590896606} -11/07/2021 03:15:12 - INFO - __main__ - Step 42962: {'lr': 0.00041130631758943414, 'samples': 8248704, 'steps': 42961, 'loss/train': 1.5878769159317017} -11/07/2021 03:15:13 - INFO - __main__ - Step 42963: {'lr': 0.00041130226324087094, 'samples': 8248896, 'steps': 42962, 'loss/train': 1.6092218160629272} -11/07/2021 03:15:14 - INFO - __main__ - Step 42964: {'lr': 0.00041129820881962754, 'samples': 8249088, 'steps': 42963, 'loss/train': 1.5334964990615845} -11/07/2021 03:15:14 - INFO - __main__ - Step 42965: {'lr': 0.0004112941543257056, 'samples': 8249280, 'steps': 42964, 'loss/train': 1.873719573020935} -11/07/2021 03:15:14 - INFO - __main__ - Step 42966: {'lr': 0.00041129009975910704, 'samples': 8249472, 'steps': 42965, 'loss/train': 1.4746450185775757} -11/07/2021 03:15:15 - INFO - __main__ - Step 42967: {'lr': 0.00041128604511983356, 'samples': 8249664, 'steps': 42966, 'loss/train': 2.0043632984161377} -11/07/2021 03:15:15 - INFO - __main__ - Step 42968: {'lr': 0.00041128199040788715, 'samples': 8249856, 'steps': 42967, 'loss/train': 1.3230992555618286} -11/07/2021 03:15:16 - INFO - __main__ - Step 42969: {'lr': 0.00041127793562326955, 'samples': 8250048, 'steps': 42968, 'loss/train': 1.7417832612991333} -11/07/2021 03:15:16 - INFO - __main__ - Step 42970: {'lr': 0.0004112738807659826, 'samples': 8250240, 'steps': 42969, 'loss/train': 1.4938559532165527} -11/07/2021 03:15:17 - INFO - __main__ - Step 42971: {'lr': 0.00041126982583602817, 'samples': 8250432, 'steps': 42970, 'loss/train': 1.7032666206359863} -11/07/2021 03:15:17 - INFO - __main__ - Step 42972: {'lr': 0.00041126577083340797, 'samples': 8250624, 'steps': 42971, 'loss/train': 1.1354724168777466} -11/07/2021 03:15:17 - INFO - __main__ - Step 42973: {'lr': 0.000411261715758124, 'samples': 8250816, 'steps': 42972, 'loss/train': 1.4441967010498047} -11/07/2021 03:15:18 - INFO - __main__ - Step 42974: {'lr': 0.0004112576606101779, 'samples': 8251008, 'steps': 42973, 'loss/train': 1.3982219696044922} -11/07/2021 03:15:19 - INFO - __main__ - Step 42975: {'lr': 0.0004112536053895716, 'samples': 8251200, 'steps': 42974, 'loss/train': 1.5185602903366089} -11/07/2021 03:15:19 - INFO - __main__ - Step 42976: {'lr': 0.0004112495500963069, 'samples': 8251392, 'steps': 42975, 'loss/train': 1.5261902809143066} -11/07/2021 03:15:19 - INFO - __main__ - Step 42977: {'lr': 0.00041124549473038564, 'samples': 8251584, 'steps': 42976, 'loss/train': 1.7653063535690308} -11/07/2021 03:15:20 - INFO - __main__ - Step 42978: {'lr': 0.0004112414392918097, 'samples': 8251776, 'steps': 42977, 'loss/train': 1.3035284280776978} -11/07/2021 03:15:20 - INFO - __main__ - Step 42979: {'lr': 0.00041123738378058083, 'samples': 8251968, 'steps': 42978, 'loss/train': 1.7096556425094604} -11/07/2021 03:15:21 - INFO - __main__ - Step 42980: {'lr': 0.0004112333281967009, 'samples': 8252160, 'steps': 42979, 'loss/train': 1.40980863571167} -11/07/2021 03:15:22 - INFO - __main__ - Step 42981: {'lr': 0.00041122927254017173, 'samples': 8252352, 'steps': 42980, 'loss/train': 1.3556780815124512} -11/07/2021 03:15:22 - INFO - __main__ - Step 42982: {'lr': 0.0004112252168109951, 'samples': 8252544, 'steps': 42981, 'loss/train': 1.8229740858078003} -11/07/2021 03:15:22 - INFO - __main__ - Step 42983: {'lr': 0.0004112211610091728, 'samples': 8252736, 'steps': 42982, 'loss/train': 2.1034083366394043} -11/07/2021 03:15:23 - INFO - __main__ - Step 42984: {'lr': 0.0004112171051347069, 'samples': 8252928, 'steps': 42983, 'loss/train': 1.8783169984817505} -11/07/2021 03:15:24 - INFO - __main__ - Step 42985: {'lr': 0.00041121304918759893, 'samples': 8253120, 'steps': 42984, 'loss/train': 1.5309916734695435} -11/07/2021 03:15:24 - INFO - __main__ - Step 42986: {'lr': 0.00041120899316785095, 'samples': 8253312, 'steps': 42985, 'loss/train': 1.4424855709075928} -11/07/2021 03:15:24 - INFO - __main__ - Step 42987: {'lr': 0.00041120493707546456, 'samples': 8253504, 'steps': 42986, 'loss/train': 1.3083442449569702} -11/07/2021 03:15:25 - INFO - __main__ - Step 42988: {'lr': 0.00041120088091044183, 'samples': 8253696, 'steps': 42987, 'loss/train': 1.4893476963043213} -11/07/2021 03:15:25 - INFO - __main__ - Step 42989: {'lr': 0.0004111968246727844, 'samples': 8253888, 'steps': 42988, 'loss/train': 1.3382315635681152} -11/07/2021 03:15:26 - INFO - __main__ - Step 42990: {'lr': 0.0004111927683624942, 'samples': 8254080, 'steps': 42989, 'loss/train': 0.8450368046760559} -11/07/2021 03:15:27 - INFO - __main__ - Step 42991: {'lr': 0.00041118871197957306, 'samples': 8254272, 'steps': 42990, 'loss/train': 0.8592576384544373} -11/07/2021 03:15:27 - INFO - __main__ - Step 42992: {'lr': 0.00041118465552402274, 'samples': 8254464, 'steps': 42991, 'loss/train': 2.1071560382843018} -11/07/2021 03:15:27 - INFO - __main__ - Step 42993: {'lr': 0.00041118059899584503, 'samples': 8254656, 'steps': 42992, 'loss/train': 1.7796658277511597} -11/07/2021 03:15:28 - INFO - __main__ - Step 42994: {'lr': 0.00041117654239504193, 'samples': 8254848, 'steps': 42993, 'loss/train': 1.23753023147583} -11/07/2021 03:15:29 - INFO - __main__ - Step 42995: {'lr': 0.0004111724857216151, 'samples': 8255040, 'steps': 42994, 'loss/train': 1.5601799488067627} -11/07/2021 03:15:29 - INFO - __main__ - Step 42996: {'lr': 0.0004111684289755665, 'samples': 8255232, 'steps': 42995, 'loss/train': 1.4935163259506226} -11/07/2021 03:15:29 - INFO - __main__ - Step 42997: {'lr': 0.00041116437215689785, 'samples': 8255424, 'steps': 42996, 'loss/train': 1.6728167533874512} -11/07/2021 03:15:30 - INFO - __main__ - Step 42998: {'lr': 0.000411160315265611, 'samples': 8255616, 'steps': 42997, 'loss/train': 1.5341050624847412} -11/07/2021 03:15:30 - INFO - __main__ - Step 42999: {'lr': 0.0004111562583017079, 'samples': 8255808, 'steps': 42998, 'loss/train': 1.1012388467788696} -11/07/2021 03:15:31 - INFO - __main__ - Step 43000: {'lr': 0.00041115220126519014, 'samples': 8256000, 'steps': 42999, 'loss/train': 1.7845770120620728} -11/07/2021 03:15:31 - INFO - __main__ - Step 43001: {'lr': 0.00041114814415605977, 'samples': 8256192, 'steps': 43000, 'loss/train': 0.8801016807556152} -11/07/2021 03:15:32 - INFO - __main__ - Step 43002: {'lr': 0.0004111440869743185, 'samples': 8256384, 'steps': 43001, 'loss/train': 1.5452907085418701} -11/07/2021 03:15:32 - INFO - __main__ - Step 43003: {'lr': 0.00041114002971996824, 'samples': 8256576, 'steps': 43002, 'loss/train': 0.9452287554740906} -11/07/2021 03:15:33 - INFO - __main__ - Step 43004: {'lr': 0.0004111359723930107, 'samples': 8256768, 'steps': 43003, 'loss/train': 0.4670843183994293} -11/07/2021 03:15:33 - INFO - __main__ - Step 43005: {'lr': 0.00041113191499344784, 'samples': 8256960, 'steps': 43004, 'loss/train': 1.4178489446640015} -11/07/2021 03:15:34 - INFO - __main__ - Step 43006: {'lr': 0.0004111278575212814, 'samples': 8257152, 'steps': 43005, 'loss/train': 1.4189621210098267} -11/07/2021 03:15:34 - INFO - __main__ - Step 43007: {'lr': 0.0004111237999765132, 'samples': 8257344, 'steps': 43006, 'loss/train': 1.805106520652771} -11/07/2021 03:15:35 - INFO - __main__ - Step 43008: {'lr': 0.0004111197423591452, 'samples': 8257536, 'steps': 43007, 'loss/train': 1.9079796075820923} -11/07/2021 03:15:35 - INFO - __main__ - Step 43009: {'lr': 0.000411115684669179, 'samples': 8257728, 'steps': 43008, 'loss/train': 1.5675806999206543} -11/07/2021 03:15:35 - INFO - __main__ - Step 43010: {'lr': 0.00041111162690661665, 'samples': 8257920, 'steps': 43009, 'loss/train': 1.6696821451187134} -11/07/2021 03:15:36 - INFO - __main__ - Step 43011: {'lr': 0.00041110756907145984, 'samples': 8258112, 'steps': 43010, 'loss/train': 1.4286752939224243} -11/07/2021 03:15:37 - INFO - __main__ - Step 43012: {'lr': 0.0004111035111637105, 'samples': 8258304, 'steps': 43011, 'loss/train': 1.3758095502853394} -11/07/2021 03:15:37 - INFO - __main__ - Step 43013: {'lr': 0.00041109945318337034, 'samples': 8258496, 'steps': 43012, 'loss/train': 1.6210780143737793} -11/07/2021 03:15:37 - INFO - __main__ - Step 43014: {'lr': 0.00041109539513044127, 'samples': 8258688, 'steps': 43013, 'loss/train': 1.3206629753112793} -11/07/2021 03:15:38 - INFO - __main__ - Step 43015: {'lr': 0.0004110913370049251, 'samples': 8258880, 'steps': 43014, 'loss/train': 1.639256238937378} -11/07/2021 03:15:39 - INFO - __main__ - Step 43016: {'lr': 0.00041108727880682363, 'samples': 8259072, 'steps': 43015, 'loss/train': 0.8471148014068604} -11/07/2021 03:15:39 - INFO - __main__ - Step 43017: {'lr': 0.0004110832205361388, 'samples': 8259264, 'steps': 43016, 'loss/train': 1.240605354309082} -11/07/2021 03:15:40 - INFO - __main__ - Step 43018: {'lr': 0.0004110791621928723, 'samples': 8259456, 'steps': 43017, 'loss/train': 1.4540150165557861} -11/07/2021 03:15:40 - INFO - __main__ - Step 43019: {'lr': 0.00041107510377702604, 'samples': 8259648, 'steps': 43018, 'loss/train': 1.5557411909103394} -11/07/2021 03:15:40 - INFO - __main__ - Step 43020: {'lr': 0.00041107104528860186, 'samples': 8259840, 'steps': 43019, 'loss/train': 1.4920012950897217} -11/07/2021 03:15:41 - INFO - __main__ - Step 43021: {'lr': 0.00041106698672760145, 'samples': 8260032, 'steps': 43020, 'loss/train': 1.1121315956115723} -11/07/2021 03:15:42 - INFO - __main__ - Step 43022: {'lr': 0.0004110629280940268, 'samples': 8260224, 'steps': 43021, 'loss/train': 1.8375533819198608} -11/07/2021 03:15:42 - INFO - __main__ - Step 43023: {'lr': 0.0004110588693878796, 'samples': 8260416, 'steps': 43022, 'loss/train': 1.7017621994018555} -11/07/2021 03:15:42 - INFO - __main__ - Step 43024: {'lr': 0.0004110548106091619, 'samples': 8260608, 'steps': 43023, 'loss/train': 1.8397775888442993} -11/07/2021 03:15:43 - INFO - __main__ - Step 43025: {'lr': 0.00041105075175787534, 'samples': 8260800, 'steps': 43024, 'loss/train': 1.5974022150039673} -11/07/2021 03:15:43 - INFO - __main__ - Step 43026: {'lr': 0.00041104669283402174, 'samples': 8260992, 'steps': 43025, 'loss/train': 1.4904776811599731} -11/07/2021 03:15:44 - INFO - __main__ - Step 43027: {'lr': 0.00041104263383760304, 'samples': 8261184, 'steps': 43026, 'loss/train': 1.4006849527359009} -11/07/2021 03:15:45 - INFO - __main__ - Step 43028: {'lr': 0.000411038574768621, 'samples': 8261376, 'steps': 43027, 'loss/train': 1.6243817806243896} -11/07/2021 03:15:45 - INFO - __main__ - Step 43029: {'lr': 0.00041103451562707745, 'samples': 8261568, 'steps': 43028, 'loss/train': 1.3424921035766602} -11/07/2021 03:15:45 - INFO - __main__ - Step 43030: {'lr': 0.0004110304564129742, 'samples': 8261760, 'steps': 43029, 'loss/train': 1.4041417837142944} -11/07/2021 03:15:46 - INFO - __main__ - Step 43031: {'lr': 0.00041102639712631316, 'samples': 8261952, 'steps': 43030, 'loss/train': 1.4108160734176636} -11/07/2021 03:15:47 - INFO - __main__ - Step 43032: {'lr': 0.0004110223377670962, 'samples': 8262144, 'steps': 43031, 'loss/train': 1.3687145709991455} -11/07/2021 03:15:47 - INFO - __main__ - Step 43033: {'lr': 0.0004110182783353249, 'samples': 8262336, 'steps': 43032, 'loss/train': 1.0869172811508179} -11/07/2021 03:15:47 - INFO - __main__ - Step 43034: {'lr': 0.0004110142188310013, 'samples': 8262528, 'steps': 43033, 'loss/train': 1.3496339321136475} -11/07/2021 03:15:48 - INFO - __main__ - Step 43035: {'lr': 0.0004110101592541272, 'samples': 8262720, 'steps': 43034, 'loss/train': 1.3196594715118408} -11/07/2021 03:15:48 - INFO - __main__ - Step 43036: {'lr': 0.0004110060996047044, 'samples': 8262912, 'steps': 43035, 'loss/train': 1.082405686378479} -11/07/2021 03:15:50 - INFO - __main__ - Step 43037: {'lr': 0.00041100203988273475, 'samples': 8263104, 'steps': 43036, 'loss/train': 1.2167576551437378} -11/07/2021 03:15:50 - INFO - __main__ - Step 43038: {'lr': 0.0004109979800882201, 'samples': 8263296, 'steps': 43037, 'loss/train': 1.5957521200180054} -11/07/2021 03:15:50 - INFO - __main__ - Step 43039: {'lr': 0.00041099392022116214, 'samples': 8263488, 'steps': 43038, 'loss/train': 1.3459219932556152} -11/07/2021 03:15:51 - INFO - __main__ - Step 43040: {'lr': 0.0004109898602815629, 'samples': 8263680, 'steps': 43039, 'loss/train': 1.0219038724899292} -11/07/2021 03:15:51 - INFO - __main__ - Step 43041: {'lr': 0.000410985800269424, 'samples': 8263872, 'steps': 43040, 'loss/train': 1.612999439239502} -11/07/2021 03:15:51 - INFO - __main__ - Step 43042: {'lr': 0.00041098174018474747, 'samples': 8264064, 'steps': 43041, 'loss/train': 1.31856369972229} -11/07/2021 03:15:52 - INFO - __main__ - Step 43043: {'lr': 0.000410977680027535, 'samples': 8264256, 'steps': 43042, 'loss/train': 1.392549991607666} -11/07/2021 03:15:53 - INFO - __main__ - Step 43044: {'lr': 0.00041097361979778853, 'samples': 8264448, 'steps': 43043, 'loss/train': 1.1940284967422485} -11/07/2021 03:15:53 - INFO - __main__ - Step 43045: {'lr': 0.00041096955949550983, 'samples': 8264640, 'steps': 43044, 'loss/train': 1.3849601745605469} -11/07/2021 03:15:54 - INFO - __main__ - Step 43046: {'lr': 0.00041096549912070067, 'samples': 8264832, 'steps': 43045, 'loss/train': 1.7899335622787476} -11/07/2021 03:15:54 - INFO - __main__ - Step 43047: {'lr': 0.000410961438673363, 'samples': 8265024, 'steps': 43046, 'loss/train': 1.868234395980835} -11/07/2021 03:15:55 - INFO - __main__ - Step 43048: {'lr': 0.0004109573781534985, 'samples': 8265216, 'steps': 43047, 'loss/train': 1.6222096681594849} -11/07/2021 03:15:56 - INFO - __main__ - Step 43049: {'lr': 0.0004109533175611092, 'samples': 8265408, 'steps': 43048, 'loss/train': 1.1791523694992065} -11/07/2021 03:15:56 - INFO - __main__ - Step 43050: {'lr': 0.0004109492568961968, 'samples': 8265600, 'steps': 43049, 'loss/train': 1.5527454614639282} -11/07/2021 03:15:56 - INFO - __main__ - Step 43051: {'lr': 0.00041094519615876313, 'samples': 8265792, 'steps': 43050, 'loss/train': 1.4125049114227295} -11/07/2021 03:15:57 - INFO - __main__ - Step 43052: {'lr': 0.0004109411353488101, 'samples': 8265984, 'steps': 43051, 'loss/train': 1.371485948562622} -11/07/2021 03:15:58 - INFO - __main__ - Step 43053: {'lr': 0.00041093707446633934, 'samples': 8266176, 'steps': 43052, 'loss/train': 1.9206199645996094} -11/07/2021 03:15:58 - INFO - __main__ - Step 43054: {'lr': 0.00041093301351135294, 'samples': 8266368, 'steps': 43053, 'loss/train': 2.1060402393341064} -11/07/2021 03:15:58 - INFO - __main__ - Step 43055: {'lr': 0.00041092895248385255, 'samples': 8266560, 'steps': 43054, 'loss/train': 1.3890399932861328} -11/07/2021 03:15:59 - INFO - __main__ - Step 43056: {'lr': 0.00041092489138384, 'samples': 8266752, 'steps': 43055, 'loss/train': 5.796188831329346} -11/07/2021 03:15:59 - INFO - __main__ - Step 43057: {'lr': 0.0004109208302113173, 'samples': 8266944, 'steps': 43056, 'loss/train': 1.612684965133667} -11/07/2021 03:16:00 - INFO - __main__ - Step 43058: {'lr': 0.00041091676896628604, 'samples': 8267136, 'steps': 43057, 'loss/train': 5.75294828414917} -11/07/2021 03:16:01 - INFO - __main__ - Step 43059: {'lr': 0.00041091270764874823, 'samples': 8267328, 'steps': 43058, 'loss/train': 1.6078474521636963} -11/07/2021 03:16:01 - INFO - __main__ - Step 43060: {'lr': 0.0004109086462587056, 'samples': 8267520, 'steps': 43059, 'loss/train': 1.4386402368545532} -11/07/2021 03:16:01 - INFO - __main__ - Step 43061: {'lr': 0.0004109045847961601, 'samples': 8267712, 'steps': 43060, 'loss/train': 1.534162163734436} -11/07/2021 03:16:02 - INFO - __main__ - Step 43062: {'lr': 0.0004109005232611134, 'samples': 8267904, 'steps': 43061, 'loss/train': 1.4820033311843872} -11/07/2021 03:16:02 - INFO - __main__ - Step 43063: {'lr': 0.00041089646165356743, 'samples': 8268096, 'steps': 43062, 'loss/train': 0.9905995726585388} -11/07/2021 03:16:03 - INFO - __main__ - Step 43064: {'lr': 0.000410892399973524, 'samples': 8268288, 'steps': 43063, 'loss/train': 1.497308373451233} -11/07/2021 03:16:03 - INFO - __main__ - Step 43065: {'lr': 0.00041088833822098495, 'samples': 8268480, 'steps': 43064, 'loss/train': 1.0966325998306274} -11/07/2021 03:16:04 - INFO - __main__ - Step 43066: {'lr': 0.00041088427639595206, 'samples': 8268672, 'steps': 43065, 'loss/train': 1.3141721487045288} -11/07/2021 03:16:04 - INFO - __main__ - Step 43067: {'lr': 0.0004108802144984273, 'samples': 8268864, 'steps': 43066, 'loss/train': 1.7734742164611816} -11/07/2021 03:16:04 - INFO - __main__ - Step 43068: {'lr': 0.0004108761525284123, 'samples': 8269056, 'steps': 43067, 'loss/train': 1.7632601261138916} -11/07/2021 03:16:05 - INFO - __main__ - Step 43069: {'lr': 0.000410872090485909, 'samples': 8269248, 'steps': 43068, 'loss/train': 1.366463541984558} -11/07/2021 03:16:06 - INFO - __main__ - Step 43070: {'lr': 0.00041086802837091916, 'samples': 8269440, 'steps': 43069, 'loss/train': 2.006185293197632} -11/07/2021 03:16:06 - INFO - __main__ - Step 43071: {'lr': 0.00041086396618344475, 'samples': 8269632, 'steps': 43070, 'loss/train': 1.924782395362854} -11/07/2021 03:16:06 - INFO - __main__ - Step 43072: {'lr': 0.0004108599039234875, 'samples': 8269824, 'steps': 43071, 'loss/train': 1.1278479099273682} -11/07/2021 03:16:07 - INFO - __main__ - Step 43073: {'lr': 0.00041085584159104925, 'samples': 8270016, 'steps': 43072, 'loss/train': 1.4849249124526978} -11/07/2021 03:16:08 - INFO - __main__ - Step 43074: {'lr': 0.00041085177918613185, 'samples': 8270208, 'steps': 43073, 'loss/train': 1.31929612159729} -11/07/2021 03:16:08 - INFO - __main__ - Step 43075: {'lr': 0.0004108477167087371, 'samples': 8270400, 'steps': 43074, 'loss/train': 1.661223292350769} -11/07/2021 03:16:09 - INFO - __main__ - Step 43076: {'lr': 0.0004108436541588669, 'samples': 8270592, 'steps': 43075, 'loss/train': 1.6085768938064575} -11/07/2021 03:16:09 - INFO - __main__ - Step 43077: {'lr': 0.000410839591536523, 'samples': 8270784, 'steps': 43076, 'loss/train': 1.5742981433868408} -11/07/2021 03:16:09 - INFO - __main__ - Step 43078: {'lr': 0.00041083552884170726, 'samples': 8270976, 'steps': 43077, 'loss/train': 1.8481992483139038} -11/07/2021 03:16:10 - INFO - __main__ - Step 43079: {'lr': 0.0004108314660744216, 'samples': 8271168, 'steps': 43078, 'loss/train': 1.462916612625122} -11/07/2021 03:16:11 - INFO - __main__ - Step 43080: {'lr': 0.0004108274032346676, 'samples': 8271360, 'steps': 43079, 'loss/train': 2.329413890838623} -11/07/2021 03:16:11 - INFO - __main__ - Step 43081: {'lr': 0.0004108233403224474, 'samples': 8271552, 'steps': 43080, 'loss/train': 1.365371823310852} -11/07/2021 03:16:11 - INFO - __main__ - Step 43082: {'lr': 0.0004108192773377626, 'samples': 8271744, 'steps': 43081, 'loss/train': 1.0467580556869507} -11/07/2021 03:16:12 - INFO - __main__ - Step 43083: {'lr': 0.0004108152142806151, 'samples': 8271936, 'steps': 43082, 'loss/train': 1.5733226537704468} -11/07/2021 03:16:12 - INFO - __main__ - Step 43084: {'lr': 0.00041081115115100677, 'samples': 8272128, 'steps': 43083, 'loss/train': 1.3022276163101196} -11/07/2021 03:16:13 - INFO - __main__ - Step 43085: {'lr': 0.0004108070879489395, 'samples': 8272320, 'steps': 43084, 'loss/train': 1.8730179071426392} -11/07/2021 03:16:13 - INFO - __main__ - Step 43086: {'lr': 0.0004108030246744149, 'samples': 8272512, 'steps': 43085, 'loss/train': 1.9628807306289673} -11/07/2021 03:16:14 - INFO - __main__ - Step 43087: {'lr': 0.00041079896132743506, 'samples': 8272704, 'steps': 43086, 'loss/train': 1.5374175310134888} -11/07/2021 03:16:14 - INFO - __main__ - Step 43088: {'lr': 0.0004107948979080016, 'samples': 8272896, 'steps': 43087, 'loss/train': 1.434190273284912} -11/07/2021 03:16:14 - INFO - __main__ - Step 43089: {'lr': 0.00041079083441611646, 'samples': 8273088, 'steps': 43088, 'loss/train': 0.9195286631584167} -11/07/2021 03:16:16 - INFO - __main__ - Step 43090: {'lr': 0.0004107867708517815, 'samples': 8273280, 'steps': 43089, 'loss/train': 1.2906053066253662} -11/07/2021 03:16:16 - INFO - __main__ - Step 43091: {'lr': 0.0004107827072149984, 'samples': 8273472, 'steps': 43090, 'loss/train': 1.2737891674041748} -11/07/2021 03:16:16 - INFO - __main__ - Step 43092: {'lr': 0.0004107786435057692, 'samples': 8273664, 'steps': 43091, 'loss/train': 1.444359302520752} -11/07/2021 03:16:17 - INFO - __main__ - Step 43093: {'lr': 0.0004107745797240956, 'samples': 8273856, 'steps': 43092, 'loss/train': 1.8389931917190552} -11/07/2021 03:16:17 - INFO - __main__ - Step 43094: {'lr': 0.0004107705158699794, 'samples': 8274048, 'steps': 43093, 'loss/train': 0.8773282170295715} -11/07/2021 03:16:18 - INFO - __main__ - Step 43095: {'lr': 0.00041076645194342254, 'samples': 8274240, 'steps': 43094, 'loss/train': 2.0294175148010254} -11/07/2021 03:16:18 - INFO - __main__ - Step 43096: {'lr': 0.00041076238794442675, 'samples': 8274432, 'steps': 43095, 'loss/train': 1.283133864402771} -11/07/2021 03:16:19 - INFO - __main__ - Step 43097: {'lr': 0.00041075832387299396, 'samples': 8274624, 'steps': 43096, 'loss/train': 1.3659342527389526} -11/07/2021 03:16:19 - INFO - __main__ - Step 43098: {'lr': 0.00041075425972912595, 'samples': 8274816, 'steps': 43097, 'loss/train': 1.7125060558319092} -11/07/2021 03:16:19 - INFO - __main__ - Step 43099: {'lr': 0.00041075019551282455, 'samples': 8275008, 'steps': 43098, 'loss/train': 1.3746939897537231} -11/07/2021 03:16:20 - INFO - __main__ - Step 43100: {'lr': 0.00041074613122409157, 'samples': 8275200, 'steps': 43099, 'loss/train': 1.4970327615737915} -11/07/2021 03:16:21 - INFO - __main__ - Step 43101: {'lr': 0.0004107420668629289, 'samples': 8275392, 'steps': 43100, 'loss/train': 1.3181568384170532} -11/07/2021 03:16:21 - INFO - __main__ - Step 43102: {'lr': 0.00041073800242933826, 'samples': 8275584, 'steps': 43101, 'loss/train': 1.4100422859191895} -11/07/2021 03:16:21 - INFO - __main__ - Step 43103: {'lr': 0.00041073393792332157, 'samples': 8275776, 'steps': 43102, 'loss/train': 1.6294130086898804} -11/07/2021 03:16:22 - INFO - __main__ - Step 43104: {'lr': 0.0004107298733448807, 'samples': 8275968, 'steps': 43103, 'loss/train': 1.350721001625061} -11/07/2021 03:16:23 - INFO - __main__ - Step 43105: {'lr': 0.0004107258086940174, 'samples': 8276160, 'steps': 43104, 'loss/train': 1.189432978630066} -11/07/2021 03:16:23 - INFO - __main__ - Step 43106: {'lr': 0.0004107217439707336, 'samples': 8276352, 'steps': 43105, 'loss/train': 1.315584659576416} -11/07/2021 03:16:23 - INFO - __main__ - Step 43107: {'lr': 0.000410717679175031, 'samples': 8276544, 'steps': 43106, 'loss/train': 1.1594332456588745} -11/07/2021 03:16:24 - INFO - __main__ - Step 43108: {'lr': 0.00041071361430691143, 'samples': 8276736, 'steps': 43107, 'loss/train': 1.5375863313674927} -11/07/2021 03:16:24 - INFO - __main__ - Step 43109: {'lr': 0.00041070954936637687, 'samples': 8276928, 'steps': 43108, 'loss/train': 1.8577443361282349} -11/07/2021 03:16:25 - INFO - __main__ - Step 43110: {'lr': 0.00041070548435342903, 'samples': 8277120, 'steps': 43109, 'loss/train': 1.6667335033416748} -11/07/2021 03:16:25 - INFO - __main__ - Step 43111: {'lr': 0.00041070141926806983, 'samples': 8277312, 'steps': 43110, 'loss/train': 1.0912951231002808} -11/07/2021 03:16:26 - INFO - __main__ - Step 43112: {'lr': 0.00041069735411030105, 'samples': 8277504, 'steps': 43111, 'loss/train': 1.5038973093032837} -11/07/2021 03:16:26 - INFO - __main__ - Step 43113: {'lr': 0.00041069328888012447, 'samples': 8277696, 'steps': 43112, 'loss/train': 1.277441382408142} -11/07/2021 03:16:26 - INFO - __main__ - Step 43114: {'lr': 0.000410689223577542, 'samples': 8277888, 'steps': 43113, 'loss/train': 1.4587876796722412} -11/07/2021 03:16:27 - INFO - __main__ - Step 43115: {'lr': 0.00041068515820255543, 'samples': 8278080, 'steps': 43114, 'loss/train': 1.666568636894226} -11/07/2021 03:16:28 - INFO - __main__ - Step 43116: {'lr': 0.00041068109275516665, 'samples': 8278272, 'steps': 43115, 'loss/train': 1.3361376523971558} -11/07/2021 03:16:28 - INFO - __main__ - Step 43117: {'lr': 0.0004106770272353774, 'samples': 8278464, 'steps': 43116, 'loss/train': 1.3129546642303467} -11/07/2021 03:16:29 - INFO - __main__ - Step 43118: {'lr': 0.00041067296164318956, 'samples': 8278656, 'steps': 43117, 'loss/train': 1.4723830223083496} -11/07/2021 03:16:29 - INFO - __main__ - Step 43119: {'lr': 0.000410668895978605, 'samples': 8278848, 'steps': 43118, 'loss/train': 1.167095422744751} -11/07/2021 03:16:29 - INFO - __main__ - Step 43120: {'lr': 0.0004106648302416255, 'samples': 8279040, 'steps': 43119, 'loss/train': 1.4202436208724976} -11/07/2021 03:16:30 - INFO - __main__ - Step 43121: {'lr': 0.0004106607644322529, 'samples': 8279232, 'steps': 43120, 'loss/train': 1.5817418098449707} -11/07/2021 03:16:31 - INFO - __main__ - Step 43122: {'lr': 0.00041065669855048896, 'samples': 8279424, 'steps': 43121, 'loss/train': 1.5932525396347046} -11/07/2021 03:16:31 - INFO - __main__ - Step 43123: {'lr': 0.0004106526325963357, 'samples': 8279616, 'steps': 43122, 'loss/train': 1.3598804473876953} -11/07/2021 03:16:31 - INFO - __main__ - Step 43124: {'lr': 0.0004106485665697948, 'samples': 8279808, 'steps': 43123, 'loss/train': 1.0472019910812378} -11/07/2021 03:16:32 - INFO - __main__ - Step 43125: {'lr': 0.00041064450047086814, 'samples': 8280000, 'steps': 43124, 'loss/train': 1.4605704545974731} -11/07/2021 03:16:33 - INFO - __main__ - Step 43126: {'lr': 0.00041064043429955756, 'samples': 8280192, 'steps': 43125, 'loss/train': 1.3245314359664917} -11/07/2021 03:16:33 - INFO - __main__ - Step 43127: {'lr': 0.0004106363680558649, 'samples': 8280384, 'steps': 43126, 'loss/train': 1.6327924728393555} -11/07/2021 03:16:33 - INFO - __main__ - Step 43128: {'lr': 0.0004106323017397919, 'samples': 8280576, 'steps': 43127, 'loss/train': 1.4311386346817017} -11/07/2021 03:16:34 - INFO - __main__ - Step 43129: {'lr': 0.00041062823535134053, 'samples': 8280768, 'steps': 43128, 'loss/train': 1.6788736581802368} -11/07/2021 03:16:34 - INFO - __main__ - Step 43130: {'lr': 0.0004106241688905126, 'samples': 8280960, 'steps': 43129, 'loss/train': 1.4539369344711304} -11/07/2021 03:16:35 - INFO - __main__ - Step 43131: {'lr': 0.00041062010235730974, 'samples': 8281152, 'steps': 43130, 'loss/train': 1.5070507526397705} -11/07/2021 03:16:36 - INFO - __main__ - Step 43132: {'lr': 0.0004106160357517341, 'samples': 8281344, 'steps': 43131, 'loss/train': 1.384362816810608} -11/07/2021 03:16:36 - INFO - __main__ - Step 43133: {'lr': 0.00041061196907378727, 'samples': 8281536, 'steps': 43132, 'loss/train': 0.20600904524326324} -11/07/2021 03:16:36 - INFO - __main__ - Step 43134: {'lr': 0.00041060790232347116, 'samples': 8281728, 'steps': 43133, 'loss/train': 1.1068603992462158} -11/07/2021 03:16:37 - INFO - __main__ - Step 43135: {'lr': 0.00041060383550078764, 'samples': 8281920, 'steps': 43134, 'loss/train': 1.7642035484313965} -11/07/2021 03:16:37 - INFO - __main__ - Step 43136: {'lr': 0.00041059976860573845, 'samples': 8282112, 'steps': 43135, 'loss/train': 1.1896979808807373} -11/07/2021 03:16:38 - INFO - __main__ - Step 43137: {'lr': 0.00041059570163832555, 'samples': 8282304, 'steps': 43136, 'loss/train': 0.7403428554534912} -11/07/2021 03:16:38 - INFO - __main__ - Step 43138: {'lr': 0.00041059163459855066, 'samples': 8282496, 'steps': 43137, 'loss/train': 1.6915414333343506} -11/07/2021 03:16:39 - INFO - __main__ - Step 43139: {'lr': 0.00041058756748641573, 'samples': 8282688, 'steps': 43138, 'loss/train': 1.559566855430603} -11/07/2021 03:16:39 - INFO - __main__ - Step 43140: {'lr': 0.0004105835003019225, 'samples': 8282880, 'steps': 43139, 'loss/train': 1.4372590780258179} -11/07/2021 03:16:39 - INFO - __main__ - Step 43141: {'lr': 0.00041057943304507273, 'samples': 8283072, 'steps': 43140, 'loss/train': 1.3585083484649658} -11/07/2021 03:16:41 - INFO - __main__ - Step 43142: {'lr': 0.0004105753657158684, 'samples': 8283264, 'steps': 43141, 'loss/train': 1.2696479558944702} -11/07/2021 03:16:41 - INFO - __main__ - Step 43143: {'lr': 0.00041057129831431133, 'samples': 8283456, 'steps': 43142, 'loss/train': 1.361433982849121} -11/07/2021 03:16:41 - INFO - __main__ - Step 43144: {'lr': 0.00041056723084040324, 'samples': 8283648, 'steps': 43143, 'loss/train': 1.8104569911956787} -11/07/2021 03:16:42 - INFO - __main__ - Step 43145: {'lr': 0.00041056316329414613, 'samples': 8283840, 'steps': 43144, 'loss/train': 1.4259611368179321} -11/07/2021 03:16:42 - INFO - __main__ - Step 43146: {'lr': 0.00041055909567554166, 'samples': 8284032, 'steps': 43145, 'loss/train': 1.4371272325515747} -11/07/2021 03:16:43 - INFO - __main__ - Step 43147: {'lr': 0.00041055502798459175, 'samples': 8284224, 'steps': 43146, 'loss/train': 1.4179667234420776} -11/07/2021 03:16:43 - INFO - __main__ - Step 43148: {'lr': 0.00041055096022129823, 'samples': 8284416, 'steps': 43147, 'loss/train': 1.4169361591339111} -11/07/2021 03:16:44 - INFO - __main__ - Step 43149: {'lr': 0.0004105468923856629, 'samples': 8284608, 'steps': 43148, 'loss/train': 1.2737438678741455} -11/07/2021 03:16:44 - INFO - __main__ - Step 43150: {'lr': 0.00041054282447768763, 'samples': 8284800, 'steps': 43149, 'loss/train': 1.6200916767120361} -11/07/2021 03:16:44 - INFO - __main__ - Step 43151: {'lr': 0.00041053875649737424, 'samples': 8284992, 'steps': 43150, 'loss/train': 1.7988002300262451} -11/07/2021 03:16:45 - INFO - __main__ - Step 43152: {'lr': 0.0004105346884447246, 'samples': 8285184, 'steps': 43151, 'loss/train': 1.8118313550949097} -11/07/2021 03:16:46 - INFO - __main__ - Step 43153: {'lr': 0.00041053062031974055, 'samples': 8285376, 'steps': 43152, 'loss/train': 1.5103808641433716} -11/07/2021 03:16:46 - INFO - __main__ - Step 43154: {'lr': 0.00041052655212242377, 'samples': 8285568, 'steps': 43153, 'loss/train': 1.352491021156311} -11/07/2021 03:16:46 - INFO - __main__ - Step 43155: {'lr': 0.00041052248385277623, 'samples': 8285760, 'steps': 43154, 'loss/train': 1.6922416687011719} -11/07/2021 03:16:47 - INFO - __main__ - Step 43156: {'lr': 0.0004105184155107998, 'samples': 8285952, 'steps': 43155, 'loss/train': 1.8941594362258911} -11/07/2021 03:16:48 - INFO - __main__ - Step 43157: {'lr': 0.00041051434709649614, 'samples': 8286144, 'steps': 43156, 'loss/train': 1.6118606328964233} -11/07/2021 03:16:48 - INFO - __main__ - Step 43158: {'lr': 0.0004105102786098672, 'samples': 8286336, 'steps': 43157, 'loss/train': 1.1860041618347168} -11/07/2021 03:16:49 - INFO - __main__ - Step 43159: {'lr': 0.0004105062100509149, 'samples': 8286528, 'steps': 43158, 'loss/train': 1.4262062311172485} -11/07/2021 03:16:49 - INFO - __main__ - Step 43160: {'lr': 0.000410502141419641, 'samples': 8286720, 'steps': 43159, 'loss/train': 1.2417993545532227} -11/07/2021 03:16:49 - INFO - __main__ - Step 43161: {'lr': 0.00041049807271604724, 'samples': 8286912, 'steps': 43160, 'loss/train': 1.6057826280593872} -11/07/2021 03:16:50 - INFO - __main__ - Step 43162: {'lr': 0.00041049400394013545, 'samples': 8287104, 'steps': 43161, 'loss/train': 0.7456337809562683} -11/07/2021 03:16:51 - INFO - __main__ - Step 43163: {'lr': 0.0004104899350919077, 'samples': 8287296, 'steps': 43162, 'loss/train': 1.8297420740127563} -11/07/2021 03:16:52 - INFO - __main__ - Step 43164: {'lr': 0.0004104858661713655, 'samples': 8287488, 'steps': 43163, 'loss/train': 1.7945384979248047} -11/07/2021 03:16:52 - INFO - __main__ - Step 43165: {'lr': 0.00041048179717851095, 'samples': 8287680, 'steps': 43164, 'loss/train': 0.2556303143501282} -11/07/2021 03:16:52 - INFO - __main__ - Step 43166: {'lr': 0.00041047772811334584, 'samples': 8287872, 'steps': 43165, 'loss/train': 1.3993481397628784} -11/07/2021 03:16:53 - INFO - __main__ - Step 43167: {'lr': 0.0004104736589758719, 'samples': 8288064, 'steps': 43166, 'loss/train': 0.8999582529067993} -11/07/2021 03:16:53 - INFO - __main__ - Step 43168: {'lr': 0.0004104695897660909, 'samples': 8288256, 'steps': 43167, 'loss/train': 1.4187109470367432} -11/07/2021 03:16:54 - INFO - __main__ - Step 43169: {'lr': 0.0004104655204840048, 'samples': 8288448, 'steps': 43168, 'loss/train': 1.7086986303329468} -11/07/2021 03:16:54 - INFO - __main__ - Step 43170: {'lr': 0.0004104614511296155, 'samples': 8288640, 'steps': 43169, 'loss/train': 1.5957424640655518} -11/07/2021 03:16:55 - INFO - __main__ - Step 43171: {'lr': 0.00041045738170292467, 'samples': 8288832, 'steps': 43170, 'loss/train': 1.7372387647628784} -11/07/2021 03:16:55 - INFO - __main__ - Step 43172: {'lr': 0.0004104533122039342, 'samples': 8289024, 'steps': 43171, 'loss/train': 1.630563735961914} -11/07/2021 03:16:55 - INFO - __main__ - Step 43173: {'lr': 0.00041044924263264603, 'samples': 8289216, 'steps': 43172, 'loss/train': 1.5493334531784058} -11/07/2021 03:16:56 - INFO - __main__ - Step 43174: {'lr': 0.00041044517298906194, 'samples': 8289408, 'steps': 43173, 'loss/train': 1.1043447256088257} -11/07/2021 03:16:57 - INFO - __main__ - Step 43175: {'lr': 0.0004104411032731836, 'samples': 8289600, 'steps': 43174, 'loss/train': 1.4027479887008667} -11/07/2021 03:16:57 - INFO - __main__ - Step 43176: {'lr': 0.00041043703348501304, 'samples': 8289792, 'steps': 43175, 'loss/train': 0.8495373129844666} -11/07/2021 03:16:57 - INFO - __main__ - Step 43177: {'lr': 0.0004104329636245521, 'samples': 8289984, 'steps': 43176, 'loss/train': 0.77286696434021} -11/07/2021 03:16:58 - INFO - __main__ - Step 43178: {'lr': 0.0004104288936918024, 'samples': 8290176, 'steps': 43177, 'loss/train': 1.7297497987747192} -11/07/2021 03:16:59 - INFO - __main__ - Step 43179: {'lr': 0.00041042482368676604, 'samples': 8290368, 'steps': 43178, 'loss/train': 1.2108728885650635} -11/07/2021 03:16:59 - INFO - __main__ - Step 43180: {'lr': 0.00041042075360944464, 'samples': 8290560, 'steps': 43179, 'loss/train': 1.4625720977783203} -11/07/2021 03:17:00 - INFO - __main__ - Step 43181: {'lr': 0.0004104166834598402, 'samples': 8290752, 'steps': 43180, 'loss/train': 1.3745132684707642} -11/07/2021 03:17:00 - INFO - __main__ - Step 43182: {'lr': 0.00041041261323795437, 'samples': 8290944, 'steps': 43181, 'loss/train': 1.5282878875732422} -11/07/2021 03:17:00 - INFO - __main__ - Step 43183: {'lr': 0.0004104085429437892, 'samples': 8291136, 'steps': 43182, 'loss/train': 1.267673373222351} -11/07/2021 03:17:01 - INFO - __main__ - Step 43184: {'lr': 0.00041040447257734635, 'samples': 8291328, 'steps': 43183, 'loss/train': 1.4752342700958252} -11/07/2021 03:17:02 - INFO - __main__ - Step 43185: {'lr': 0.00041040040213862774, 'samples': 8291520, 'steps': 43184, 'loss/train': 2.0098776817321777} -11/07/2021 03:17:02 - INFO - __main__ - Step 43186: {'lr': 0.00041039633162763523, 'samples': 8291712, 'steps': 43185, 'loss/train': 1.0623544454574585} -11/07/2021 03:17:02 - INFO - __main__ - Step 43187: {'lr': 0.00041039226104437056, 'samples': 8291904, 'steps': 43186, 'loss/train': 1.8754194974899292} -11/07/2021 03:17:03 - INFO - __main__ - Step 43188: {'lr': 0.0004103881903888356, 'samples': 8292096, 'steps': 43187, 'loss/train': 1.6514359712600708} -11/07/2021 03:17:04 - INFO - __main__ - Step 43189: {'lr': 0.0004103841196610322, 'samples': 8292288, 'steps': 43188, 'loss/train': 2.032471179962158} -11/07/2021 03:17:04 - INFO - __main__ - Step 43190: {'lr': 0.0004103800488609622, 'samples': 8292480, 'steps': 43189, 'loss/train': 1.1504318714141846} -11/07/2021 03:17:04 - INFO - __main__ - Step 43191: {'lr': 0.0004103759779886274, 'samples': 8292672, 'steps': 43190, 'loss/train': 1.742537021636963} -11/07/2021 03:17:05 - INFO - __main__ - Step 43192: {'lr': 0.0004103719070440297, 'samples': 8292864, 'steps': 43191, 'loss/train': 0.9761320352554321} -11/07/2021 03:17:05 - INFO - __main__ - Step 43193: {'lr': 0.00041036783602717086, 'samples': 8293056, 'steps': 43192, 'loss/train': 1.222903847694397} -11/07/2021 03:17:06 - INFO - __main__ - Step 43194: {'lr': 0.00041036376493805286, 'samples': 8293248, 'steps': 43193, 'loss/train': 2.652095317840576} -11/07/2021 03:17:07 - INFO - __main__ - Step 43195: {'lr': 0.0004103596937766773, 'samples': 8293440, 'steps': 43194, 'loss/train': 1.6091325283050537} -11/07/2021 03:17:07 - INFO - __main__ - Step 43196: {'lr': 0.00041035562254304614, 'samples': 8293632, 'steps': 43195, 'loss/train': 1.3011974096298218} -11/07/2021 03:17:07 - INFO - __main__ - Step 43197: {'lr': 0.00041035155123716127, 'samples': 8293824, 'steps': 43196, 'loss/train': 0.3642762005329132} -11/07/2021 03:17:08 - INFO - __main__ - Step 43198: {'lr': 0.00041034747985902446, 'samples': 8294016, 'steps': 43197, 'loss/train': 2.0115673542022705} -11/07/2021 03:17:08 - INFO - __main__ - Step 43199: {'lr': 0.0004103434084086375, 'samples': 8294208, 'steps': 43198, 'loss/train': 1.4424716234207153} -11/07/2021 03:17:09 - INFO - __main__ - Step 43200: {'lr': 0.0004103393368860023, 'samples': 8294400, 'steps': 43199, 'loss/train': 1.7488442659378052} -11/07/2021 03:17:09 - INFO - __main__ - Step 43201: {'lr': 0.0004103352652911206, 'samples': 8294592, 'steps': 43200, 'loss/train': 1.2876766920089722} -11/07/2021 03:17:10 - INFO - __main__ - Step 43202: {'lr': 0.0004103311936239944, 'samples': 8294784, 'steps': 43201, 'loss/train': 1.2778476476669312} -11/07/2021 03:17:10 - INFO - __main__ - Step 43203: {'lr': 0.0004103271218846254, 'samples': 8294976, 'steps': 43202, 'loss/train': 1.2290693521499634} -11/07/2021 03:17:10 - INFO - __main__ - Step 43204: {'lr': 0.00041032305007301554, 'samples': 8295168, 'steps': 43203, 'loss/train': 1.2880079746246338} -11/07/2021 03:17:11 - INFO - __main__ - Step 43205: {'lr': 0.00041031897818916645, 'samples': 8295360, 'steps': 43204, 'loss/train': 1.504037618637085} -11/07/2021 03:17:12 - INFO - __main__ - Step 43206: {'lr': 0.0004103149062330802, 'samples': 8295552, 'steps': 43205, 'loss/train': 1.6308549642562866} -11/07/2021 03:17:12 - INFO - __main__ - Step 43207: {'lr': 0.00041031083420475854, 'samples': 8295744, 'steps': 43206, 'loss/train': 1.379603624343872} -11/07/2021 03:17:12 - INFO - __main__ - Step 43208: {'lr': 0.00041030676210420324, 'samples': 8295936, 'steps': 43207, 'loss/train': 1.3084861040115356} -11/07/2021 03:17:13 - INFO - __main__ - Step 43209: {'lr': 0.0004103026899314162, 'samples': 8296128, 'steps': 43208, 'loss/train': 1.4617557525634766} -11/07/2021 03:17:14 - INFO - __main__ - Step 43210: {'lr': 0.00041029861768639934, 'samples': 8296320, 'steps': 43209, 'loss/train': 1.5682384967803955} -11/07/2021 03:17:14 - INFO - __main__ - Step 43211: {'lr': 0.0004102945453691542, 'samples': 8296512, 'steps': 43210, 'loss/train': 1.2275004386901855} -11/07/2021 03:17:15 - INFO - __main__ - Step 43212: {'lr': 0.00041029047297968293, 'samples': 8296704, 'steps': 43211, 'loss/train': 1.4966442584991455} -11/07/2021 03:17:15 - INFO - __main__ - Step 43213: {'lr': 0.00041028640051798726, 'samples': 8296896, 'steps': 43212, 'loss/train': 1.5281322002410889} -11/07/2021 03:17:15 - INFO - __main__ - Step 43214: {'lr': 0.000410282327984069, 'samples': 8297088, 'steps': 43213, 'loss/train': 1.1413795948028564} -11/07/2021 03:17:16 - INFO - __main__ - Step 43215: {'lr': 0.00041027825537792993, 'samples': 8297280, 'steps': 43214, 'loss/train': 1.04563307762146} -11/07/2021 03:17:17 - INFO - __main__ - Step 43216: {'lr': 0.0004102741826995721, 'samples': 8297472, 'steps': 43215, 'loss/train': 1.8254573345184326} -11/07/2021 03:17:17 - INFO - __main__ - Step 43217: {'lr': 0.000410270109948997, 'samples': 8297664, 'steps': 43216, 'loss/train': 1.4102542400360107} -11/07/2021 03:17:17 - INFO - __main__ - Step 43218: {'lr': 0.0004102660371262068, 'samples': 8297856, 'steps': 43217, 'loss/train': 1.1999146938323975} -11/07/2021 03:17:18 - INFO - __main__ - Step 43219: {'lr': 0.0004102619642312031, 'samples': 8298048, 'steps': 43218, 'loss/train': 1.255764365196228} -11/07/2021 03:17:18 - INFO - __main__ - Step 43220: {'lr': 0.00041025789126398793, 'samples': 8298240, 'steps': 43219, 'loss/train': 1.6038835048675537} -11/07/2021 03:17:20 - INFO - __main__ - Step 43221: {'lr': 0.000410253818224563, 'samples': 8298432, 'steps': 43220, 'loss/train': 1.781392216682434} -11/07/2021 03:17:20 - INFO - __main__ - Step 43222: {'lr': 0.0004102497451129302, 'samples': 8298624, 'steps': 43221, 'loss/train': 1.4568729400634766} -11/07/2021 03:17:20 - INFO - __main__ - Step 43223: {'lr': 0.00041024567192909125, 'samples': 8298816, 'steps': 43222, 'loss/train': 1.552573561668396} -11/07/2021 03:17:21 - INFO - __main__ - Step 43224: {'lr': 0.0004102415986730481, 'samples': 8299008, 'steps': 43223, 'loss/train': 0.9100706577301025} -11/07/2021 03:17:21 - INFO - __main__ - Step 43225: {'lr': 0.0004102375253448026, 'samples': 8299200, 'steps': 43224, 'loss/train': 1.3224427700042725} -11/07/2021 03:17:21 - INFO - __main__ - Step 43226: {'lr': 0.0004102334519443565, 'samples': 8299392, 'steps': 43225, 'loss/train': 0.4940943717956543} -11/07/2021 03:17:23 - INFO - __main__ - Step 43227: {'lr': 0.0004102293784717117, 'samples': 8299584, 'steps': 43226, 'loss/train': 0.4784579575061798} -11/07/2021 03:17:23 - INFO - __main__ - Step 43228: {'lr': 0.00041022530492687006, 'samples': 8299776, 'steps': 43227, 'loss/train': 1.7686057090759277} -11/07/2021 03:17:24 - INFO - __main__ - Step 43229: {'lr': 0.0004102212313098333, 'samples': 8299968, 'steps': 43228, 'loss/train': 1.4608936309814453} -11/07/2021 03:17:24 - INFO - __main__ - Step 43230: {'lr': 0.00041021715762060336, 'samples': 8300160, 'steps': 43229, 'loss/train': 1.6046879291534424} -11/07/2021 03:17:24 - INFO - __main__ - Step 43231: {'lr': 0.000410213083859182, 'samples': 8300352, 'steps': 43230, 'loss/train': 1.4580544233322144} -11/07/2021 03:17:25 - INFO - __main__ - Step 43232: {'lr': 0.0004102090100255711, 'samples': 8300544, 'steps': 43231, 'loss/train': 4.313381195068359} -11/07/2021 03:17:26 - INFO - __main__ - Step 43233: {'lr': 0.00041020493611977263, 'samples': 8300736, 'steps': 43232, 'loss/train': 3.5713274478912354} -11/07/2021 03:17:26 - INFO - __main__ - Step 43234: {'lr': 0.0004102008621417881, 'samples': 8300928, 'steps': 43233, 'loss/train': 1.7774174213409424} -11/07/2021 03:17:26 - INFO - __main__ - Step 43235: {'lr': 0.0004101967880916196, 'samples': 8301120, 'steps': 43234, 'loss/train': 1.1446168422698975} -11/07/2021 03:17:27 - INFO - __main__ - Step 43236: {'lr': 0.00041019271396926894, 'samples': 8301312, 'steps': 43235, 'loss/train': 1.3731508255004883} -11/07/2021 03:17:27 - INFO - __main__ - Step 43237: {'lr': 0.0004101886397747379, 'samples': 8301504, 'steps': 43236, 'loss/train': 1.533296823501587} -11/07/2021 03:17:28 - INFO - __main__ - Step 43238: {'lr': 0.0004101845655080283, 'samples': 8301696, 'steps': 43237, 'loss/train': 1.5787715911865234} -11/07/2021 03:17:28 - INFO - __main__ - Step 43239: {'lr': 0.00041018049116914204, 'samples': 8301888, 'steps': 43238, 'loss/train': 1.5141563415527344} -11/07/2021 03:17:29 - INFO - __main__ - Step 43240: {'lr': 0.00041017641675808095, 'samples': 8302080, 'steps': 43239, 'loss/train': 0.6786595582962036} -11/07/2021 03:17:29 - INFO - __main__ - Step 43241: {'lr': 0.00041017234227484675, 'samples': 8302272, 'steps': 43240, 'loss/train': 1.649290919303894} -11/07/2021 03:17:29 - INFO - __main__ - Step 43242: {'lr': 0.0004101682677194414, 'samples': 8302464, 'steps': 43241, 'loss/train': 1.368617057800293} -11/07/2021 03:17:30 - INFO - __main__ - Step 43243: {'lr': 0.0004101641930918667, 'samples': 8302656, 'steps': 43242, 'loss/train': 1.4992783069610596} -11/07/2021 03:17:31 - INFO - __main__ - Step 43244: {'lr': 0.00041016011839212446, 'samples': 8302848, 'steps': 43243, 'loss/train': 1.781638503074646} -11/07/2021 03:17:31 - INFO - __main__ - Step 43245: {'lr': 0.0004101560436202166, 'samples': 8303040, 'steps': 43244, 'loss/train': 1.5576189756393433} -11/07/2021 03:17:31 - INFO - __main__ - Step 43246: {'lr': 0.0004101519687761449, 'samples': 8303232, 'steps': 43245, 'loss/train': 1.2122910022735596} -11/07/2021 03:17:32 - INFO - __main__ - Step 43247: {'lr': 0.00041014789385991114, 'samples': 8303424, 'steps': 43246, 'loss/train': 1.5584133863449097} -11/07/2021 03:17:33 - INFO - __main__ - Step 43248: {'lr': 0.00041014381887151727, 'samples': 8303616, 'steps': 43247, 'loss/train': 1.2769432067871094} -11/07/2021 03:17:33 - INFO - __main__ - Step 43249: {'lr': 0.00041013974381096503, 'samples': 8303808, 'steps': 43248, 'loss/train': 1.1447575092315674} -11/07/2021 03:17:34 - INFO - __main__ - Step 43250: {'lr': 0.00041013566867825627, 'samples': 8304000, 'steps': 43249, 'loss/train': 1.616087794303894} -11/07/2021 03:17:34 - INFO - __main__ - Step 43251: {'lr': 0.00041013159347339293, 'samples': 8304192, 'steps': 43250, 'loss/train': 0.3687068819999695} -11/07/2021 03:17:34 - INFO - __main__ - Step 43252: {'lr': 0.0004101275181963767, 'samples': 8304384, 'steps': 43251, 'loss/train': 1.7518508434295654} -11/07/2021 03:17:35 - INFO - __main__ - Step 43253: {'lr': 0.0004101234428472095, 'samples': 8304576, 'steps': 43252, 'loss/train': 2.2655272483825684} -11/07/2021 03:17:36 - INFO - __main__ - Step 43254: {'lr': 0.0004101193674258931, 'samples': 8304768, 'steps': 43253, 'loss/train': 1.2787197828292847} -11/07/2021 03:17:36 - INFO - __main__ - Step 43255: {'lr': 0.00041011529193242947, 'samples': 8304960, 'steps': 43254, 'loss/train': 1.5614346265792847} -11/07/2021 03:17:36 - INFO - __main__ - Step 43256: {'lr': 0.00041011121636682024, 'samples': 8305152, 'steps': 43255, 'loss/train': 1.4917633533477783} -11/07/2021 03:17:37 - INFO - __main__ - Step 43257: {'lr': 0.0004101071407290675, 'samples': 8305344, 'steps': 43256, 'loss/train': 1.564497709274292} -11/07/2021 03:17:37 - INFO - __main__ - Step 43258: {'lr': 0.00041010306501917287, 'samples': 8305536, 'steps': 43257, 'loss/train': 1.4174599647521973} -11/07/2021 03:17:38 - INFO - __main__ - Step 43259: {'lr': 0.0004100989892371383, 'samples': 8305728, 'steps': 43258, 'loss/train': 1.2914807796478271} -11/07/2021 03:17:38 - INFO - __main__ - Step 43260: {'lr': 0.00041009491338296557, 'samples': 8305920, 'steps': 43259, 'loss/train': 1.1329169273376465} -11/07/2021 03:17:39 - INFO - __main__ - Step 43261: {'lr': 0.00041009083745665654, 'samples': 8306112, 'steps': 43260, 'loss/train': 1.5572667121887207} -11/07/2021 03:17:39 - INFO - __main__ - Step 43262: {'lr': 0.0004100867614582131, 'samples': 8306304, 'steps': 43261, 'loss/train': 1.5937113761901855} -11/07/2021 03:17:40 - INFO - __main__ - Step 43263: {'lr': 0.00041008268538763703, 'samples': 8306496, 'steps': 43262, 'loss/train': 1.6277613639831543} -11/07/2021 03:17:41 - INFO - __main__ - Step 43264: {'lr': 0.00041007860924493014, 'samples': 8306688, 'steps': 43263, 'loss/train': 1.5388847589492798} -11/07/2021 03:17:41 - INFO - __main__ - Step 43265: {'lr': 0.0004100745330300943, 'samples': 8306880, 'steps': 43264, 'loss/train': 1.5251654386520386} -11/07/2021 03:17:42 - INFO - __main__ - Step 43266: {'lr': 0.0004100704567431314, 'samples': 8307072, 'steps': 43265, 'loss/train': 1.2249115705490112} -11/07/2021 03:17:42 - INFO - __main__ - Step 43267: {'lr': 0.0004100663803840431, 'samples': 8307264, 'steps': 43266, 'loss/train': 0.8777159452438354} -11/07/2021 03:17:42 - INFO - __main__ - Step 43268: {'lr': 0.0004100623039528315, 'samples': 8307456, 'steps': 43267, 'loss/train': 0.4611353874206543} -11/07/2021 03:17:43 - INFO - __main__ - Step 43269: {'lr': 0.0004100582274494982, 'samples': 8307648, 'steps': 43268, 'loss/train': 1.3887360095977783} -11/07/2021 03:17:44 - INFO - __main__ - Step 43270: {'lr': 0.00041005415087404516, 'samples': 8307840, 'steps': 43269, 'loss/train': 1.452347993850708} -11/07/2021 03:17:44 - INFO - __main__ - Step 43271: {'lr': 0.0004100500742264742, 'samples': 8308032, 'steps': 43270, 'loss/train': 0.9966098070144653} -11/07/2021 03:17:44 - INFO - __main__ - Step 43272: {'lr': 0.0004100459975067871, 'samples': 8308224, 'steps': 43271, 'loss/train': 0.7639972567558289} -11/07/2021 03:17:45 - INFO - __main__ - Step 43273: {'lr': 0.0004100419207149858, 'samples': 8308416, 'steps': 43272, 'loss/train': 1.5415605306625366} -11/07/2021 03:17:46 - INFO - __main__ - Step 43274: {'lr': 0.0004100378438510721, 'samples': 8308608, 'steps': 43273, 'loss/train': 1.5262449979782104} -11/07/2021 03:17:46 - INFO - __main__ - Step 43275: {'lr': 0.00041003376691504777, 'samples': 8308800, 'steps': 43274, 'loss/train': 1.361143708229065} -11/07/2021 03:17:47 - INFO - __main__ - Step 43276: {'lr': 0.0004100296899069147, 'samples': 8308992, 'steps': 43275, 'loss/train': 1.4873331785202026} -11/07/2021 03:17:47 - INFO - __main__ - Step 43277: {'lr': 0.0004100256128266747, 'samples': 8309184, 'steps': 43276, 'loss/train': 1.2578943967819214} -11/07/2021 03:17:47 - INFO - __main__ - Step 43278: {'lr': 0.00041002153567432965, 'samples': 8309376, 'steps': 43277, 'loss/train': 1.4881389141082764} -11/07/2021 03:17:49 - INFO - __main__ - Step 43279: {'lr': 0.00041001745844988134, 'samples': 8309568, 'steps': 43278, 'loss/train': 1.335159182548523} -11/07/2021 03:17:49 - INFO - __main__ - Step 43280: {'lr': 0.00041001338115333175, 'samples': 8309760, 'steps': 43279, 'loss/train': 1.672161340713501} -11/07/2021 03:17:49 - INFO - __main__ - Step 43281: {'lr': 0.0004100093037846825, 'samples': 8309952, 'steps': 43280, 'loss/train': 0.9645368456840515} -11/07/2021 03:17:50 - INFO - __main__ - Step 43282: {'lr': 0.0004100052263439355, 'samples': 8310144, 'steps': 43281, 'loss/train': 1.6344153881072998} -11/07/2021 03:17:50 - INFO - __main__ - Step 43283: {'lr': 0.00041000114883109264, 'samples': 8310336, 'steps': 43282, 'loss/train': 1.7180469036102295} -11/07/2021 03:17:51 - INFO - __main__ - Step 43284: {'lr': 0.00040999707124615573, 'samples': 8310528, 'steps': 43283, 'loss/train': 1.3519318103790283} -11/07/2021 03:17:52 - INFO - __main__ - Step 43285: {'lr': 0.00040999299358912664, 'samples': 8310720, 'steps': 43284, 'loss/train': 1.628510594367981} -11/07/2021 03:17:52 - INFO - __main__ - Step 43286: {'lr': 0.00040998891586000716, 'samples': 8310912, 'steps': 43285, 'loss/train': 1.4235750436782837} -11/07/2021 03:17:52 - INFO - __main__ - Step 43287: {'lr': 0.0004099848380587992, 'samples': 8311104, 'steps': 43286, 'loss/train': 1.61976957321167} -11/07/2021 03:17:53 - INFO - __main__ - Step 43288: {'lr': 0.00040998076018550444, 'samples': 8311296, 'steps': 43287, 'loss/train': 1.476173758506775} -11/07/2021 03:17:54 - INFO - __main__ - Step 43289: {'lr': 0.00040997668224012485, 'samples': 8311488, 'steps': 43288, 'loss/train': 1.4979326725006104} -11/07/2021 03:17:54 - INFO - __main__ - Step 43290: {'lr': 0.00040997260422266223, 'samples': 8311680, 'steps': 43289, 'loss/train': 1.5309162139892578} -11/07/2021 03:17:54 - INFO - __main__ - Step 43291: {'lr': 0.00040996852613311844, 'samples': 8311872, 'steps': 43290, 'loss/train': 1.7398695945739746} -11/07/2021 03:17:55 - INFO - __main__ - Step 43292: {'lr': 0.00040996444797149526, 'samples': 8312064, 'steps': 43291, 'loss/train': 1.7311522960662842} -11/07/2021 03:17:55 - INFO - __main__ - Step 43293: {'lr': 0.0004099603697377946, 'samples': 8312256, 'steps': 43292, 'loss/train': 1.2518097162246704} -11/07/2021 03:17:55 - INFO - __main__ - Step 43294: {'lr': 0.0004099562914320183, 'samples': 8312448, 'steps': 43293, 'loss/train': 1.6182531118392944} -11/07/2021 03:17:57 - INFO - __main__ - Step 43295: {'lr': 0.0004099522130541681, 'samples': 8312640, 'steps': 43294, 'loss/train': 1.4488192796707153} -11/07/2021 03:17:57 - INFO - __main__ - Step 43296: {'lr': 0.000409948134604246, 'samples': 8312832, 'steps': 43295, 'loss/train': 1.589702844619751} -11/07/2021 03:17:57 - INFO - __main__ - Step 43297: {'lr': 0.0004099440560822536, 'samples': 8313024, 'steps': 43296, 'loss/train': 1.4996671676635742} -11/07/2021 03:17:58 - INFO - __main__ - Step 43298: {'lr': 0.000409939977488193, 'samples': 8313216, 'steps': 43297, 'loss/train': 2.0168118476867676} -11/07/2021 03:17:58 - INFO - __main__ - Step 43299: {'lr': 0.0004099358988220658, 'samples': 8313408, 'steps': 43298, 'loss/train': 1.5424015522003174} -11/07/2021 03:18:00 - INFO - __main__ - Step 43300: {'lr': 0.00040993182008387406, 'samples': 8313600, 'steps': 43299, 'loss/train': 1.5230618715286255} -11/07/2021 03:18:00 - INFO - __main__ - Step 43301: {'lr': 0.0004099277412736195, 'samples': 8313792, 'steps': 43300, 'loss/train': 0.788213312625885} -11/07/2021 03:18:01 - INFO - __main__ - Step 43302: {'lr': 0.0004099236623913039, 'samples': 8313984, 'steps': 43301, 'loss/train': 1.7703386545181274} -11/07/2021 03:18:01 - INFO - __main__ - Step 43303: {'lr': 0.0004099195834369292, 'samples': 8314176, 'steps': 43302, 'loss/train': 1.5457040071487427} -11/07/2021 03:18:02 - INFO - __main__ - Step 43304: {'lr': 0.0004099155044104972, 'samples': 8314368, 'steps': 43303, 'loss/train': 0.8869584202766418} -11/07/2021 03:18:02 - INFO - __main__ - Step 43305: {'lr': 0.00040991142531200973, 'samples': 8314560, 'steps': 43304, 'loss/train': 1.570747971534729} -11/07/2021 03:18:02 - INFO - __main__ - Step 43306: {'lr': 0.0004099073461414686, 'samples': 8314752, 'steps': 43305, 'loss/train': 1.8002310991287231} -11/07/2021 03:18:03 - INFO - __main__ - Step 43307: {'lr': 0.0004099032668988758, 'samples': 8314944, 'steps': 43306, 'loss/train': 2.0311312675476074} -11/07/2021 03:18:04 - INFO - __main__ - Step 43308: {'lr': 0.00040989918758423306, 'samples': 8315136, 'steps': 43307, 'loss/train': 1.678662896156311} -11/07/2021 03:18:04 - INFO - __main__ - Step 43309: {'lr': 0.0004098951081975421, 'samples': 8315328, 'steps': 43308, 'loss/train': 1.566868782043457} -11/07/2021 03:18:04 - INFO - __main__ - Step 43310: {'lr': 0.0004098910287388049, 'samples': 8315520, 'steps': 43309, 'loss/train': 1.680838942527771} -11/07/2021 03:18:05 - INFO - __main__ - Step 43311: {'lr': 0.00040988694920802326, 'samples': 8315712, 'steps': 43310, 'loss/train': 1.9421578645706177} -11/07/2021 03:18:05 - INFO - __main__ - Step 43312: {'lr': 0.0004098828696051991, 'samples': 8315904, 'steps': 43311, 'loss/train': 0.9963335990905762} -11/07/2021 03:18:06 - INFO - __main__ - Step 43313: {'lr': 0.00040987878993033417, 'samples': 8316096, 'steps': 43312, 'loss/train': 1.7013061046600342} -11/07/2021 03:18:06 - INFO - __main__ - Step 43314: {'lr': 0.0004098747101834303, 'samples': 8316288, 'steps': 43313, 'loss/train': 1.45722234249115} -11/07/2021 03:18:07 - INFO - __main__ - Step 43315: {'lr': 0.00040987063036448934, 'samples': 8316480, 'steps': 43314, 'loss/train': 1.5777240991592407} -11/07/2021 03:18:07 - INFO - __main__ - Step 43316: {'lr': 0.0004098665504735132, 'samples': 8316672, 'steps': 43315, 'loss/train': 1.9435744285583496} -11/07/2021 03:18:07 - INFO - __main__ - Step 43317: {'lr': 0.0004098624705105036, 'samples': 8316864, 'steps': 43316, 'loss/train': 1.5735280513763428} -11/07/2021 03:18:08 - INFO - __main__ - Step 43318: {'lr': 0.00040985839047546243, 'samples': 8317056, 'steps': 43317, 'loss/train': 2.057516574859619} -11/07/2021 03:18:09 - INFO - __main__ - Step 43319: {'lr': 0.00040985431036839155, 'samples': 8317248, 'steps': 43318, 'loss/train': 1.3936246633529663} -11/07/2021 03:18:09 - INFO - __main__ - Step 43320: {'lr': 0.00040985023018929277, 'samples': 8317440, 'steps': 43319, 'loss/train': 1.7613195180892944} -11/07/2021 03:18:09 - INFO - __main__ - Step 43321: {'lr': 0.000409846149938168, 'samples': 8317632, 'steps': 43320, 'loss/train': 1.836496114730835} -11/07/2021 03:18:10 - INFO - __main__ - Step 43322: {'lr': 0.000409842069615019, 'samples': 8317824, 'steps': 43321, 'loss/train': 1.7254339456558228} -11/07/2021 03:18:11 - INFO - __main__ - Step 43323: {'lr': 0.0004098379892198476, 'samples': 8318016, 'steps': 43322, 'loss/train': 1.6206070184707642} -11/07/2021 03:18:11 - INFO - __main__ - Step 43324: {'lr': 0.0004098339087526557, 'samples': 8318208, 'steps': 43323, 'loss/train': 2.0613462924957275} -11/07/2021 03:18:12 - INFO - __main__ - Step 43325: {'lr': 0.00040982982821344505, 'samples': 8318400, 'steps': 43324, 'loss/train': 0.8795347213745117} -11/07/2021 03:18:12 - INFO - __main__ - Step 43326: {'lr': 0.0004098257476022176, 'samples': 8318592, 'steps': 43325, 'loss/train': 1.7156808376312256} -11/07/2021 03:18:12 - INFO - __main__ - Step 43327: {'lr': 0.00040982166691897517, 'samples': 8318784, 'steps': 43326, 'loss/train': 1.533298373222351} -11/07/2021 03:18:13 - INFO - __main__ - Step 43328: {'lr': 0.00040981758616371943, 'samples': 8318976, 'steps': 43327, 'loss/train': 1.332958459854126} -11/07/2021 03:18:14 - INFO - __main__ - Step 43329: {'lr': 0.00040981350533645245, 'samples': 8319168, 'steps': 43328, 'loss/train': 1.8397305011749268} -11/07/2021 03:18:14 - INFO - __main__ - Step 43330: {'lr': 0.00040980942443717596, 'samples': 8319360, 'steps': 43329, 'loss/train': 1.0857611894607544} -11/07/2021 03:18:14 - INFO - __main__ - Step 43331: {'lr': 0.0004098053434658918, 'samples': 8319552, 'steps': 43330, 'loss/train': 1.4920378923416138} -11/07/2021 03:18:15 - INFO - __main__ - Step 43332: {'lr': 0.0004098012624226018, 'samples': 8319744, 'steps': 43331, 'loss/train': 1.2828925848007202} -11/07/2021 03:18:15 - INFO - __main__ - Step 43333: {'lr': 0.00040979718130730786, 'samples': 8319936, 'steps': 43332, 'loss/train': 0.9293913841247559} -11/07/2021 03:18:16 - INFO - __main__ - Step 43334: {'lr': 0.0004097931001200118, 'samples': 8320128, 'steps': 43333, 'loss/train': 1.555694818496704} -11/07/2021 03:18:16 - INFO - __main__ - Step 43335: {'lr': 0.00040978901886071543, 'samples': 8320320, 'steps': 43334, 'loss/train': 1.77414071559906} -11/07/2021 03:18:17 - INFO - __main__ - Step 43336: {'lr': 0.0004097849375294205, 'samples': 8320512, 'steps': 43335, 'loss/train': 1.270373821258545} -11/07/2021 03:18:17 - INFO - __main__ - Step 43337: {'lr': 0.000409780856126129, 'samples': 8320704, 'steps': 43336, 'loss/train': 1.5385404825210571} -11/07/2021 03:18:17 - INFO - __main__ - Step 43338: {'lr': 0.00040977677465084275, 'samples': 8320896, 'steps': 43337, 'loss/train': 1.318015217781067} -11/07/2021 03:18:18 - INFO - __main__ - Step 43339: {'lr': 0.00040977269310356345, 'samples': 8321088, 'steps': 43338, 'loss/train': 1.5474750995635986} -11/07/2021 03:18:19 - INFO - __main__ - Step 43340: {'lr': 0.00040976861148429313, 'samples': 8321280, 'steps': 43339, 'loss/train': 1.669358491897583} -11/07/2021 03:18:19 - INFO - __main__ - Step 43341: {'lr': 0.0004097645297930335, 'samples': 8321472, 'steps': 43340, 'loss/train': 1.5698802471160889} -11/07/2021 03:18:20 - INFO - __main__ - Step 43342: {'lr': 0.00040976044802978645, 'samples': 8321664, 'steps': 43341, 'loss/train': 1.496842622756958} -11/07/2021 03:18:20 - INFO - __main__ - Step 43343: {'lr': 0.0004097563661945538, 'samples': 8321856, 'steps': 43342, 'loss/train': 5.575445652008057} -11/07/2021 03:18:21 - INFO - __main__ - Step 43344: {'lr': 0.0004097522842873374, 'samples': 8322048, 'steps': 43343, 'loss/train': 1.5706019401550293} -11/07/2021 03:18:21 - INFO - __main__ - Step 43345: {'lr': 0.0004097482023081391, 'samples': 8322240, 'steps': 43344, 'loss/train': 1.1677210330963135} -11/07/2021 03:18:22 - INFO - __main__ - Step 43346: {'lr': 0.00040974412025696067, 'samples': 8322432, 'steps': 43345, 'loss/train': 1.5173113346099854} -11/07/2021 03:18:22 - INFO - __main__ - Step 43347: {'lr': 0.0004097400381338041, 'samples': 8322624, 'steps': 43346, 'loss/train': 1.7230134010314941} -11/07/2021 03:18:22 - INFO - __main__ - Step 43348: {'lr': 0.0004097359559386711, 'samples': 8322816, 'steps': 43347, 'loss/train': 1.76523756980896} -11/07/2021 03:18:23 - INFO - __main__ - Step 43349: {'lr': 0.0004097318736715635, 'samples': 8323008, 'steps': 43348, 'loss/train': 0.9458571076393127} -11/07/2021 03:18:24 - INFO - __main__ - Step 43350: {'lr': 0.0004097277913324832, 'samples': 8323200, 'steps': 43349, 'loss/train': 1.1856716871261597} -11/07/2021 03:18:24 - INFO - __main__ - Step 43351: {'lr': 0.000409723708921432, 'samples': 8323392, 'steps': 43350, 'loss/train': 2.379688024520874} -11/07/2021 03:18:24 - INFO - __main__ - Step 43352: {'lr': 0.0004097196264384118, 'samples': 8323584, 'steps': 43351, 'loss/train': 1.0327445268630981} -11/07/2021 03:18:25 - INFO - __main__ - Step 43353: {'lr': 0.00040971554388342436, 'samples': 8323776, 'steps': 43352, 'loss/train': 1.4225362539291382} -11/07/2021 03:18:26 - INFO - __main__ - Step 43354: {'lr': 0.00040971146125647165, 'samples': 8323968, 'steps': 43353, 'loss/train': 1.3241119384765625} -11/07/2021 03:18:26 - INFO - __main__ - Step 43355: {'lr': 0.00040970737855755535, 'samples': 8324160, 'steps': 43354, 'loss/train': 1.253584384918213} -11/07/2021 03:18:26 - INFO - __main__ - Step 43356: {'lr': 0.00040970329578667735, 'samples': 8324352, 'steps': 43355, 'loss/train': 1.532841444015503} -11/07/2021 03:18:27 - INFO - __main__ - Step 43357: {'lr': 0.00040969921294383956, 'samples': 8324544, 'steps': 43356, 'loss/train': 0.44970759749412537} -11/07/2021 03:18:27 - INFO - __main__ - Step 43358: {'lr': 0.00040969513002904375, 'samples': 8324736, 'steps': 43357, 'loss/train': 1.4711352586746216} -11/07/2021 03:18:27 - INFO - __main__ - Step 43359: {'lr': 0.0004096910470422918, 'samples': 8324928, 'steps': 43358, 'loss/train': 0.8249011635780334} -11/07/2021 03:18:29 - INFO - __main__ - Step 43360: {'lr': 0.0004096869639835855, 'samples': 8325120, 'steps': 43359, 'loss/train': 1.2207739353179932} -11/07/2021 03:18:29 - INFO - __main__ - Step 43361: {'lr': 0.0004096828808529267, 'samples': 8325312, 'steps': 43360, 'loss/train': 1.2354450225830078} -11/07/2021 03:18:29 - INFO - __main__ - Step 43362: {'lr': 0.0004096787976503173, 'samples': 8325504, 'steps': 43361, 'loss/train': 1.9712218046188354} -11/07/2021 03:18:30 - INFO - __main__ - Step 43363: {'lr': 0.0004096747143757591, 'samples': 8325696, 'steps': 43362, 'loss/train': 0.833960771560669} -11/07/2021 03:18:30 - INFO - __main__ - Step 43364: {'lr': 0.0004096706310292539, 'samples': 8325888, 'steps': 43363, 'loss/train': 1.145098328590393} -11/07/2021 03:18:31 - INFO - __main__ - Step 43365: {'lr': 0.0004096665476108036, 'samples': 8326080, 'steps': 43364, 'loss/train': 1.7072386741638184} -11/07/2021 03:18:32 - INFO - __main__ - Step 43366: {'lr': 0.00040966246412040995, 'samples': 8326272, 'steps': 43365, 'loss/train': 1.7308281660079956} -11/07/2021 03:18:32 - INFO - __main__ - Step 43367: {'lr': 0.00040965838055807493, 'samples': 8326464, 'steps': 43366, 'loss/train': 1.5208653211593628} -11/07/2021 03:18:32 - INFO - __main__ - Step 43368: {'lr': 0.00040965429692380034, 'samples': 8326656, 'steps': 43367, 'loss/train': 1.3145965337753296} -11/07/2021 03:18:33 - INFO - __main__ - Step 43369: {'lr': 0.00040965021321758796, 'samples': 8326848, 'steps': 43368, 'loss/train': 1.3993343114852905} -11/07/2021 03:18:34 - INFO - __main__ - Step 43370: {'lr': 0.00040964612943943964, 'samples': 8327040, 'steps': 43369, 'loss/train': 1.4707213640213013} -11/07/2021 03:18:34 - INFO - __main__ - Step 43371: {'lr': 0.00040964204558935726, 'samples': 8327232, 'steps': 43370, 'loss/train': 1.248171329498291} -11/07/2021 03:18:34 - INFO - __main__ - Step 43372: {'lr': 0.00040963796166734257, 'samples': 8327424, 'steps': 43371, 'loss/train': 1.6246415376663208} -11/07/2021 03:18:35 - INFO - __main__ - Step 43373: {'lr': 0.00040963387767339757, 'samples': 8327616, 'steps': 43372, 'loss/train': 1.0944591760635376} -11/07/2021 03:18:35 - INFO - __main__ - Step 43374: {'lr': 0.00040962979360752394, 'samples': 8327808, 'steps': 43373, 'loss/train': 1.5124233961105347} -11/07/2021 03:18:36 - INFO - __main__ - Step 43375: {'lr': 0.0004096257094697236, 'samples': 8328000, 'steps': 43374, 'loss/train': 1.634065866470337} -11/07/2021 03:18:36 - INFO - __main__ - Step 43376: {'lr': 0.00040962162525999833, 'samples': 8328192, 'steps': 43375, 'loss/train': 0.593380868434906} -11/07/2021 03:18:37 - INFO - __main__ - Step 43377: {'lr': 0.00040961754097835015, 'samples': 8328384, 'steps': 43376, 'loss/train': 1.536962866783142} -11/07/2021 03:18:37 - INFO - __main__ - Step 43378: {'lr': 0.00040961345662478065, 'samples': 8328576, 'steps': 43377, 'loss/train': 1.2107462882995605} -11/07/2021 03:18:37 - INFO - __main__ - Step 43379: {'lr': 0.00040960937219929186, 'samples': 8328768, 'steps': 43378, 'loss/train': 1.471487045288086} -11/07/2021 03:18:38 - INFO - __main__ - Step 43380: {'lr': 0.00040960528770188554, 'samples': 8328960, 'steps': 43379, 'loss/train': 1.4032756090164185} -11/07/2021 03:18:39 - INFO - __main__ - Step 43381: {'lr': 0.00040960120313256356, 'samples': 8329152, 'steps': 43380, 'loss/train': 1.7656457424163818} -11/07/2021 03:18:39 - INFO - __main__ - Step 43382: {'lr': 0.0004095971184913277, 'samples': 8329344, 'steps': 43381, 'loss/train': 1.5677131414413452} -11/07/2021 03:18:39 - INFO - __main__ - Step 43383: {'lr': 0.0004095930337781798, 'samples': 8329536, 'steps': 43382, 'loss/train': 0.2914910912513733} -11/07/2021 03:18:40 - INFO - __main__ - Step 43384: {'lr': 0.00040958894899312183, 'samples': 8329728, 'steps': 43383, 'loss/train': 1.640594244003296} -11/07/2021 03:18:40 - INFO - __main__ - Step 43385: {'lr': 0.0004095848641361555, 'samples': 8329920, 'steps': 43384, 'loss/train': 1.6570206880569458} -11/07/2021 03:18:41 - INFO - __main__ - Step 43386: {'lr': 0.0004095807792072827, 'samples': 8330112, 'steps': 43385, 'loss/train': 0.9187992811203003} -11/07/2021 03:18:42 - INFO - __main__ - Step 43387: {'lr': 0.00040957669420650525, 'samples': 8330304, 'steps': 43386, 'loss/train': 1.5217148065567017} -11/07/2021 03:18:42 - INFO - __main__ - Step 43388: {'lr': 0.000409572609133825, 'samples': 8330496, 'steps': 43387, 'loss/train': 1.2924803495407104} -11/07/2021 03:18:42 - INFO - __main__ - Step 43389: {'lr': 0.00040956852398924383, 'samples': 8330688, 'steps': 43388, 'loss/train': 1.3369059562683105} -11/07/2021 03:18:43 - INFO - __main__ - Step 43390: {'lr': 0.0004095644387727635, 'samples': 8330880, 'steps': 43389, 'loss/train': 1.7199703454971313} -11/07/2021 03:18:44 - INFO - __main__ - Step 43391: {'lr': 0.0004095603534843859, 'samples': 8331072, 'steps': 43390, 'loss/train': 2.3008205890655518} -11/07/2021 03:18:44 - INFO - __main__ - Step 43392: {'lr': 0.00040955626812411297, 'samples': 8331264, 'steps': 43391, 'loss/train': 1.1952695846557617} -11/07/2021 03:18:44 - INFO - __main__ - Step 43393: {'lr': 0.0004095521826919463, 'samples': 8331456, 'steps': 43392, 'loss/train': 1.5825469493865967} -11/07/2021 03:18:45 - INFO - __main__ - Step 43394: {'lr': 0.0004095480971878879, 'samples': 8331648, 'steps': 43393, 'loss/train': 1.059404730796814} -11/07/2021 03:18:45 - INFO - __main__ - Step 43395: {'lr': 0.0004095440116119397, 'samples': 8331840, 'steps': 43394, 'loss/train': 1.9554314613342285} -11/07/2021 03:18:46 - INFO - __main__ - Step 43396: {'lr': 0.00040953992596410335, 'samples': 8332032, 'steps': 43395, 'loss/train': 1.4320061206817627} -11/07/2021 03:18:46 - INFO - __main__ - Step 43397: {'lr': 0.0004095358402443808, 'samples': 8332224, 'steps': 43396, 'loss/train': 0.6256570219993591} -11/07/2021 03:18:47 - INFO - __main__ - Step 43398: {'lr': 0.0004095317544527738, 'samples': 8332416, 'steps': 43397, 'loss/train': 1.4908761978149414} -11/07/2021 03:18:47 - INFO - __main__ - Step 43399: {'lr': 0.00040952766858928433, 'samples': 8332608, 'steps': 43398, 'loss/train': 1.5086199045181274} -11/07/2021 03:18:47 - INFO - __main__ - Step 43400: {'lr': 0.0004095235826539141, 'samples': 8332800, 'steps': 43399, 'loss/train': 1.3647236824035645} -11/07/2021 03:18:49 - INFO - __main__ - Step 43401: {'lr': 0.00040951949664666504, 'samples': 8332992, 'steps': 43400, 'loss/train': 1.3735185861587524} -11/07/2021 03:18:49 - INFO - __main__ - Step 43402: {'lr': 0.00040951541056753895, 'samples': 8333184, 'steps': 43401, 'loss/train': 1.4975714683532715} -11/07/2021 03:18:50 - INFO - __main__ - Step 43403: {'lr': 0.00040951132441653773, 'samples': 8333376, 'steps': 43402, 'loss/train': 1.4579033851623535} -11/07/2021 03:18:50 - INFO - __main__ - Step 43404: {'lr': 0.00040950723819366307, 'samples': 8333568, 'steps': 43403, 'loss/train': 1.461193323135376} -11/07/2021 03:18:50 - INFO - __main__ - Step 43405: {'lr': 0.000409503151898917, 'samples': 8333760, 'steps': 43404, 'loss/train': 0.5103493928909302} -11/07/2021 03:18:51 - INFO - __main__ - Step 43406: {'lr': 0.0004094990655323012, 'samples': 8333952, 'steps': 43405, 'loss/train': 0.9520642161369324} -11/07/2021 03:18:52 - INFO - __main__ - Step 43407: {'lr': 0.00040949497909381757, 'samples': 8334144, 'steps': 43406, 'loss/train': 1.6208157539367676} -11/07/2021 03:18:52 - INFO - __main__ - Step 43408: {'lr': 0.000409490892583468, 'samples': 8334336, 'steps': 43407, 'loss/train': 1.2611219882965088} -11/07/2021 03:18:52 - INFO - __main__ - Step 43409: {'lr': 0.0004094868060012543, 'samples': 8334528, 'steps': 43408, 'loss/train': 1.7201714515686035} -11/07/2021 03:18:53 - INFO - __main__ - Step 43410: {'lr': 0.0004094827193471783, 'samples': 8334720, 'steps': 43409, 'loss/train': 1.157602071762085} -11/07/2021 03:18:53 - INFO - __main__ - Step 43411: {'lr': 0.00040947863262124186, 'samples': 8334912, 'steps': 43410, 'loss/train': 1.817247748374939} -11/07/2021 03:18:54 - INFO - __main__ - Step 43412: {'lr': 0.0004094745458234468, 'samples': 8335104, 'steps': 43411, 'loss/train': 1.3322869539260864} -11/07/2021 03:18:55 - INFO - __main__ - Step 43413: {'lr': 0.00040947045895379494, 'samples': 8335296, 'steps': 43412, 'loss/train': 1.4618539810180664} -11/07/2021 03:18:55 - INFO - __main__ - Step 43414: {'lr': 0.00040946637201228815, 'samples': 8335488, 'steps': 43413, 'loss/train': 0.8857395052909851} -11/07/2021 03:18:55 - INFO - __main__ - Step 43415: {'lr': 0.00040946228499892835, 'samples': 8335680, 'steps': 43414, 'loss/train': 0.5324795246124268} -11/07/2021 03:18:56 - INFO - __main__ - Step 43416: {'lr': 0.0004094581979137172, 'samples': 8335872, 'steps': 43415, 'loss/train': 1.338943362236023} -11/07/2021 03:18:57 - INFO - __main__ - Step 43417: {'lr': 0.00040945411075665674, 'samples': 8336064, 'steps': 43416, 'loss/train': 1.0641642808914185} -11/07/2021 03:18:57 - INFO - __main__ - Step 43418: {'lr': 0.0004094500235277486, 'samples': 8336256, 'steps': 43417, 'loss/train': 1.5129536390304565} -11/07/2021 03:18:57 - INFO - __main__ - Step 43419: {'lr': 0.0004094459362269949, 'samples': 8336448, 'steps': 43418, 'loss/train': 1.694779396057129} -11/07/2021 03:18:58 - INFO - __main__ - Step 43420: {'lr': 0.0004094418488543972, 'samples': 8336640, 'steps': 43419, 'loss/train': 1.850289225578308} -11/07/2021 03:18:58 - INFO - __main__ - Step 43421: {'lr': 0.00040943776140995756, 'samples': 8336832, 'steps': 43420, 'loss/train': 1.336556077003479} -11/07/2021 03:18:58 - INFO - __main__ - Step 43422: {'lr': 0.0004094336738936777, 'samples': 8337024, 'steps': 43421, 'loss/train': 1.7144724130630493} -11/07/2021 03:18:59 - INFO - __main__ - Step 43423: {'lr': 0.0004094295863055594, 'samples': 8337216, 'steps': 43422, 'loss/train': 1.6323271989822388} -11/07/2021 03:19:00 - INFO - __main__ - Step 43424: {'lr': 0.0004094254986456046, 'samples': 8337408, 'steps': 43423, 'loss/train': 1.2456058263778687} -11/07/2021 03:19:00 - INFO - __main__ - Step 43425: {'lr': 0.0004094214109138152, 'samples': 8337600, 'steps': 43424, 'loss/train': 1.344637155532837} -11/07/2021 03:19:00 - INFO - __main__ - Step 43426: {'lr': 0.000409417323110193, 'samples': 8337792, 'steps': 43425, 'loss/train': 1.5101417303085327} -11/07/2021 03:19:01 - INFO - __main__ - Step 43427: {'lr': 0.00040941323523473975, 'samples': 8337984, 'steps': 43426, 'loss/train': 1.7929035425186157} -11/07/2021 03:19:02 - INFO - __main__ - Step 43428: {'lr': 0.00040940914728745736, 'samples': 8338176, 'steps': 43427, 'loss/train': 0.9796424508094788} -11/07/2021 03:19:02 - INFO - __main__ - Step 43429: {'lr': 0.0004094050592683477, 'samples': 8338368, 'steps': 43428, 'loss/train': 1.762089729309082} -11/07/2021 03:19:03 - INFO - __main__ - Step 43430: {'lr': 0.00040940097117741255, 'samples': 8338560, 'steps': 43429, 'loss/train': 1.084628939628601} -11/07/2021 03:19:03 - INFO - __main__ - Step 43431: {'lr': 0.00040939688301465377, 'samples': 8338752, 'steps': 43430, 'loss/train': 1.2713582515716553} -11/07/2021 03:19:03 - INFO - __main__ - Step 43432: {'lr': 0.0004093927947800732, 'samples': 8338944, 'steps': 43431, 'loss/train': 1.6452714204788208} -11/07/2021 03:19:04 - INFO - __main__ - Step 43433: {'lr': 0.00040938870647367275, 'samples': 8339136, 'steps': 43432, 'loss/train': 1.3768030405044556} -11/07/2021 03:19:05 - INFO - __main__ - Step 43434: {'lr': 0.0004093846180954542, 'samples': 8339328, 'steps': 43433, 'loss/train': 1.5188106298446655} -11/07/2021 03:19:05 - INFO - __main__ - Step 43435: {'lr': 0.00040938052964541936, 'samples': 8339520, 'steps': 43434, 'loss/train': 1.2342990636825562} -11/07/2021 03:19:05 - INFO - __main__ - Step 43436: {'lr': 0.0004093764411235702, 'samples': 8339712, 'steps': 43435, 'loss/train': 1.8071941137313843} -11/07/2021 03:19:06 - INFO - __main__ - Step 43437: {'lr': 0.00040937235252990834, 'samples': 8339904, 'steps': 43436, 'loss/train': 1.6887180805206299} -11/07/2021 03:19:07 - INFO - __main__ - Step 43438: {'lr': 0.00040936826386443585, 'samples': 8340096, 'steps': 43437, 'loss/train': 1.5172128677368164} -11/07/2021 03:19:07 - INFO - __main__ - Step 43439: {'lr': 0.00040936417512715454, 'samples': 8340288, 'steps': 43438, 'loss/train': 1.392961025238037} -11/07/2021 03:19:07 - INFO - __main__ - Step 43440: {'lr': 0.00040936008631806603, 'samples': 8340480, 'steps': 43439, 'loss/train': 1.736971378326416} -11/07/2021 03:19:08 - INFO - __main__ - Step 43441: {'lr': 0.00040935599743717243, 'samples': 8340672, 'steps': 43440, 'loss/train': 1.6567108631134033} -11/07/2021 03:19:08 - INFO - __main__ - Step 43442: {'lr': 0.00040935190848447544, 'samples': 8340864, 'steps': 43441, 'loss/train': 1.3322232961654663} -11/07/2021 03:19:09 - INFO - __main__ - Step 43443: {'lr': 0.000409347819459977, 'samples': 8341056, 'steps': 43442, 'loss/train': 1.6457480192184448} -11/07/2021 03:19:09 - INFO - __main__ - Step 43444: {'lr': 0.0004093437303636788, 'samples': 8341248, 'steps': 43443, 'loss/train': 1.3809614181518555} -11/07/2021 03:19:10 - INFO - __main__ - Step 43445: {'lr': 0.0004093396411955829, 'samples': 8341440, 'steps': 43444, 'loss/train': 1.338553547859192} -11/07/2021 03:19:10 - INFO - __main__ - Step 43446: {'lr': 0.0004093355519556908, 'samples': 8341632, 'steps': 43445, 'loss/train': 1.2826430797576904} -11/07/2021 03:19:10 - INFO - __main__ - Step 43447: {'lr': 0.0004093314626440048, 'samples': 8341824, 'steps': 43446, 'loss/train': 1.4386062622070312} -11/07/2021 03:19:11 - INFO - __main__ - Step 43448: {'lr': 0.0004093273732605264, 'samples': 8342016, 'steps': 43447, 'loss/train': 1.561930775642395} -11/07/2021 03:19:12 - INFO - __main__ - Step 43449: {'lr': 0.0004093232838052575, 'samples': 8342208, 'steps': 43448, 'loss/train': 1.3393933773040771} -11/07/2021 03:19:12 - INFO - __main__ - Step 43450: {'lr': 0.0004093191942782001, 'samples': 8342400, 'steps': 43449, 'loss/train': 1.4493123292922974} -11/07/2021 03:19:13 - INFO - __main__ - Step 43451: {'lr': 0.0004093151046793558, 'samples': 8342592, 'steps': 43450, 'loss/train': 4.328895568847656} -11/07/2021 03:19:13 - INFO - __main__ - Step 43452: {'lr': 0.00040931101500872656, 'samples': 8342784, 'steps': 43451, 'loss/train': 1.560447096824646} -11/07/2021 03:19:14 - INFO - __main__ - Step 43453: {'lr': 0.00040930692526631443, 'samples': 8342976, 'steps': 43452, 'loss/train': 1.3717985153198242} -11/07/2021 03:19:14 - INFO - __main__ - Step 43454: {'lr': 0.0004093028354521209, 'samples': 8343168, 'steps': 43453, 'loss/train': 1.4804021120071411} -11/07/2021 03:19:15 - INFO - __main__ - Step 43455: {'lr': 0.000409298745566148, 'samples': 8343360, 'steps': 43454, 'loss/train': 1.7922828197479248} -11/07/2021 03:19:15 - INFO - __main__ - Step 43456: {'lr': 0.00040929465560839753, 'samples': 8343552, 'steps': 43455, 'loss/train': 1.7526626586914062} -11/07/2021 03:19:15 - INFO - __main__ - Step 43457: {'lr': 0.00040929056557887137, 'samples': 8343744, 'steps': 43456, 'loss/train': 1.7522269487380981} -11/07/2021 03:19:16 - INFO - __main__ - Step 43458: {'lr': 0.0004092864754775713, 'samples': 8343936, 'steps': 43457, 'loss/train': 1.1358518600463867} -11/07/2021 03:19:17 - INFO - __main__ - Step 43459: {'lr': 0.00040928238530449926, 'samples': 8344128, 'steps': 43458, 'loss/train': 1.2265043258666992} -11/07/2021 03:19:17 - INFO - __main__ - Step 43460: {'lr': 0.00040927829505965694, 'samples': 8344320, 'steps': 43459, 'loss/train': 1.6911441087722778} -11/07/2021 03:19:17 - INFO - __main__ - Step 43461: {'lr': 0.00040927420474304646, 'samples': 8344512, 'steps': 43460, 'loss/train': 0.21975359320640564} -11/07/2021 03:19:18 - INFO - __main__ - Step 43462: {'lr': 0.00040927011435466933, 'samples': 8344704, 'steps': 43461, 'loss/train': 1.3408634662628174} -11/07/2021 03:19:18 - INFO - __main__ - Step 43463: {'lr': 0.0004092660238945276, 'samples': 8344896, 'steps': 43462, 'loss/train': 1.6607204675674438} -11/07/2021 03:19:19 - INFO - __main__ - Step 43464: {'lr': 0.00040926193336262304, 'samples': 8345088, 'steps': 43463, 'loss/train': 1.8812296390533447} -11/07/2021 03:19:20 - INFO - __main__ - Step 43465: {'lr': 0.0004092578427589575, 'samples': 8345280, 'steps': 43464, 'loss/train': 1.7003211975097656} -11/07/2021 03:19:20 - INFO - __main__ - Step 43466: {'lr': 0.0004092537520835328, 'samples': 8345472, 'steps': 43465, 'loss/train': 1.2302883863449097} -11/07/2021 03:19:20 - INFO - __main__ - Step 43467: {'lr': 0.0004092496613363509, 'samples': 8345664, 'steps': 43466, 'loss/train': 1.0020233392715454} -11/07/2021 03:19:21 - INFO - __main__ - Step 43468: {'lr': 0.0004092455705174135, 'samples': 8345856, 'steps': 43467, 'loss/train': 1.6291698217391968} -11/07/2021 03:19:22 - INFO - __main__ - Step 43469: {'lr': 0.00040924147962672253, 'samples': 8346048, 'steps': 43468, 'loss/train': 3.498680353164673} -11/07/2021 03:19:22 - INFO - __main__ - Step 43470: {'lr': 0.00040923738866427986, 'samples': 8346240, 'steps': 43469, 'loss/train': 1.2424981594085693} -11/07/2021 03:19:23 - INFO - __main__ - Step 43471: {'lr': 0.00040923329763008714, 'samples': 8346432, 'steps': 43470, 'loss/train': 1.70469331741333} -11/07/2021 03:19:23 - INFO - __main__ - Step 43472: {'lr': 0.0004092292065241464, 'samples': 8346624, 'steps': 43471, 'loss/train': 1.1266168355941772} -11/07/2021 03:19:23 - INFO - __main__ - Step 43473: {'lr': 0.00040922511534645953, 'samples': 8346816, 'steps': 43472, 'loss/train': 1.3175348043441772} -11/07/2021 03:19:24 - INFO - __main__ - Step 43474: {'lr': 0.0004092210240970282, 'samples': 8347008, 'steps': 43473, 'loss/train': 1.4208704233169556} -11/07/2021 03:19:25 - INFO - __main__ - Step 43475: {'lr': 0.0004092169327758544, 'samples': 8347200, 'steps': 43474, 'loss/train': 1.222894549369812} -11/07/2021 03:19:25 - INFO - __main__ - Step 43476: {'lr': 0.0004092128413829398, 'samples': 8347392, 'steps': 43475, 'loss/train': 1.2349470853805542} -11/07/2021 03:19:25 - INFO - __main__ - Step 43477: {'lr': 0.0004092087499182864, 'samples': 8347584, 'steps': 43476, 'loss/train': 1.730302333831787} -11/07/2021 03:19:26 - INFO - __main__ - Step 43478: {'lr': 0.000409204658381896, 'samples': 8347776, 'steps': 43477, 'loss/train': 1.6098095178604126} -11/07/2021 03:19:26 - INFO - __main__ - Step 43479: {'lr': 0.00040920056677377047, 'samples': 8347968, 'steps': 43478, 'loss/train': 1.6416910886764526} -11/07/2021 03:19:27 - INFO - __main__ - Step 43480: {'lr': 0.00040919647509391155, 'samples': 8348160, 'steps': 43479, 'loss/train': 1.114418387413025} -11/07/2021 03:19:28 - INFO - __main__ - Step 43481: {'lr': 0.0004091923833423212, 'samples': 8348352, 'steps': 43480, 'loss/train': 1.4143720865249634} -11/07/2021 03:19:28 - INFO - __main__ - Step 43482: {'lr': 0.00040918829151900127, 'samples': 8348544, 'steps': 43481, 'loss/train': 1.4186195135116577} -11/07/2021 03:19:28 - INFO - __main__ - Step 43483: {'lr': 0.0004091841996239535, 'samples': 8348736, 'steps': 43482, 'loss/train': 1.563791275024414} -11/07/2021 03:19:29 - INFO - __main__ - Step 43484: {'lr': 0.00040918010765717976, 'samples': 8348928, 'steps': 43483, 'loss/train': 1.2986820936203003} -11/07/2021 03:19:30 - INFO - __main__ - Step 43485: {'lr': 0.00040917601561868194, 'samples': 8349120, 'steps': 43484, 'loss/train': 1.6048474311828613} -11/07/2021 03:19:30 - INFO - __main__ - Step 43486: {'lr': 0.00040917192350846187, 'samples': 8349312, 'steps': 43485, 'loss/train': 1.2884235382080078} -11/07/2021 03:19:31 - INFO - __main__ - Step 43487: {'lr': 0.00040916783132652134, 'samples': 8349504, 'steps': 43486, 'loss/train': 1.8406164646148682} -11/07/2021 03:19:31 - INFO - __main__ - Step 43488: {'lr': 0.0004091637390728623, 'samples': 8349696, 'steps': 43487, 'loss/train': 1.7488003969192505} -11/07/2021 03:19:31 - INFO - __main__ - Step 43489: {'lr': 0.00040915964674748665, 'samples': 8349888, 'steps': 43488, 'loss/train': 1.1958898305892944} -11/07/2021 03:19:32 - INFO - __main__ - Step 43490: {'lr': 0.0004091555543503959, 'samples': 8350080, 'steps': 43489, 'loss/train': 1.5925389528274536} -11/07/2021 03:19:33 - INFO - __main__ - Step 43491: {'lr': 0.00040915146188159223, 'samples': 8350272, 'steps': 43490, 'loss/train': 0.8500160574913025} -11/07/2021 03:19:33 - INFO - __main__ - Step 43492: {'lr': 0.0004091473693410773, 'samples': 8350464, 'steps': 43491, 'loss/train': 1.240749716758728} -11/07/2021 03:19:33 - INFO - __main__ - Step 43493: {'lr': 0.0004091432767288531, 'samples': 8350656, 'steps': 43492, 'loss/train': 1.4671683311462402} -11/07/2021 03:19:34 - INFO - __main__ - Step 43494: {'lr': 0.0004091391840449213, 'samples': 8350848, 'steps': 43493, 'loss/train': 1.5638720989227295} -11/07/2021 03:19:34 - INFO - __main__ - Step 43495: {'lr': 0.00040913509128928394, 'samples': 8351040, 'steps': 43494, 'loss/train': 1.8460904359817505} -11/07/2021 03:19:35 - INFO - __main__ - Step 43496: {'lr': 0.00040913099846194274, 'samples': 8351232, 'steps': 43495, 'loss/train': 1.6968833208084106} -11/07/2021 03:19:35 - INFO - __main__ - Step 43497: {'lr': 0.00040912690556289957, 'samples': 8351424, 'steps': 43496, 'loss/train': 0.21595387160778046} -11/07/2021 03:19:36 - INFO - __main__ - Step 43498: {'lr': 0.0004091228125921562, 'samples': 8351616, 'steps': 43497, 'loss/train': 1.8241119384765625} -11/07/2021 03:19:36 - INFO - __main__ - Step 43499: {'lr': 0.0004091187195497146, 'samples': 8351808, 'steps': 43498, 'loss/train': 2.1405017375946045} -11/07/2021 03:19:36 - INFO - __main__ - Step 43500: {'lr': 0.00040911462643557656, 'samples': 8352000, 'steps': 43499, 'loss/train': 1.618061900138855} -11/07/2021 03:19:37 - INFO - __main__ - Step 43501: {'lr': 0.0004091105332497439, 'samples': 8352192, 'steps': 43500, 'loss/train': 1.3820098638534546} -11/07/2021 03:19:38 - INFO - __main__ - Step 43502: {'lr': 0.0004091064399922185, 'samples': 8352384, 'steps': 43501, 'loss/train': 1.3085178136825562} -11/07/2021 03:19:38 - INFO - __main__ - Step 43503: {'lr': 0.0004091023466630023, 'samples': 8352576, 'steps': 43502, 'loss/train': 1.8581750392913818} -11/07/2021 03:19:38 - INFO - __main__ - Step 43504: {'lr': 0.00040909825326209694, 'samples': 8352768, 'steps': 43503, 'loss/train': 1.267033576965332} -11/07/2021 03:19:39 - INFO - __main__ - Step 43505: {'lr': 0.0004090941597895043, 'samples': 8352960, 'steps': 43504, 'loss/train': 1.826012134552002} -11/07/2021 03:19:40 - INFO - __main__ - Step 43506: {'lr': 0.0004090900662452264, 'samples': 8353152, 'steps': 43505, 'loss/train': 1.538798451423645} -11/07/2021 03:19:40 - INFO - __main__ - Step 43507: {'lr': 0.00040908597262926484, 'samples': 8353344, 'steps': 43506, 'loss/train': 1.5585148334503174} -11/07/2021 03:19:41 - INFO - __main__ - Step 43508: {'lr': 0.0004090818789416217, 'samples': 8353536, 'steps': 43507, 'loss/train': 1.1718560457229614} -11/07/2021 03:19:41 - INFO - __main__ - Step 43509: {'lr': 0.0004090777851822988, 'samples': 8353728, 'steps': 43508, 'loss/train': 1.2051889896392822} -11/07/2021 03:19:41 - INFO - __main__ - Step 43510: {'lr': 0.0004090736913512977, 'samples': 8353920, 'steps': 43509, 'loss/train': 1.932144284248352} -11/07/2021 03:19:42 - INFO - __main__ - Step 43511: {'lr': 0.0004090695974486206, 'samples': 8354112, 'steps': 43510, 'loss/train': 1.5004621744155884} -11/07/2021 03:19:43 - INFO - __main__ - Step 43512: {'lr': 0.00040906550347426907, 'samples': 8354304, 'steps': 43511, 'loss/train': 0.28656384348869324} -11/07/2021 03:19:43 - INFO - __main__ - Step 43513: {'lr': 0.0004090614094282452, 'samples': 8354496, 'steps': 43512, 'loss/train': 1.5482137203216553} -11/07/2021 03:19:43 - INFO - __main__ - Step 43514: {'lr': 0.00040905731531055067, 'samples': 8354688, 'steps': 43513, 'loss/train': 1.636155366897583} -11/07/2021 03:19:44 - INFO - __main__ - Step 43515: {'lr': 0.0004090532211211874, 'samples': 8354880, 'steps': 43514, 'loss/train': 1.1567301750183105} -11/07/2021 03:19:44 - INFO - __main__ - Step 43516: {'lr': 0.0004090491268601572, 'samples': 8355072, 'steps': 43515, 'loss/train': 1.7579503059387207} -11/07/2021 03:19:45 - INFO - __main__ - Step 43517: {'lr': 0.0004090450325274618, 'samples': 8355264, 'steps': 43516, 'loss/train': 1.4337153434753418} -11/07/2021 03:19:45 - INFO - __main__ - Step 43518: {'lr': 0.0004090409381231033, 'samples': 8355456, 'steps': 43517, 'loss/train': 0.9164023399353027} -11/07/2021 03:19:46 - INFO - __main__ - Step 43519: {'lr': 0.0004090368436470833, 'samples': 8355648, 'steps': 43518, 'loss/train': 1.3550169467926025} -11/07/2021 03:19:46 - INFO - __main__ - Step 43520: {'lr': 0.0004090327490994038, 'samples': 8355840, 'steps': 43519, 'loss/train': 1.3841397762298584} -11/07/2021 03:19:47 - INFO - __main__ - Step 43521: {'lr': 0.00040902865448006663, 'samples': 8356032, 'steps': 43520, 'loss/train': 1.8165466785430908} -11/07/2021 03:19:48 - INFO - __main__ - Step 43522: {'lr': 0.0004090245597890736, 'samples': 8356224, 'steps': 43521, 'loss/train': 1.598728895187378} -11/07/2021 03:19:48 - INFO - __main__ - Step 43523: {'lr': 0.00040902046502642656, 'samples': 8356416, 'steps': 43522, 'loss/train': 1.8639800548553467} -11/07/2021 03:19:48 - INFO - __main__ - Step 43524: {'lr': 0.0004090163701921273, 'samples': 8356608, 'steps': 43523, 'loss/train': 1.2822519540786743} -11/07/2021 03:19:49 - INFO - __main__ - Step 43525: {'lr': 0.0004090122752861777, 'samples': 8356800, 'steps': 43524, 'loss/train': 1.387771725654602} -11/07/2021 03:19:49 - INFO - __main__ - Step 43526: {'lr': 0.0004090081803085797, 'samples': 8356992, 'steps': 43525, 'loss/train': 1.2362226247787476} -11/07/2021 03:19:50 - INFO - __main__ - Step 43527: {'lr': 0.00040900408525933505, 'samples': 8357184, 'steps': 43526, 'loss/train': 1.8942064046859741} -11/07/2021 03:19:51 - INFO - __main__ - Step 43528: {'lr': 0.0004089999901384456, 'samples': 8357376, 'steps': 43527, 'loss/train': 1.1758595705032349} -11/07/2021 03:19:51 - INFO - __main__ - Step 43529: {'lr': 0.00040899589494591316, 'samples': 8357568, 'steps': 43528, 'loss/train': 1.031545639038086} -11/07/2021 03:19:51 - INFO - __main__ - Step 43530: {'lr': 0.0004089917996817397, 'samples': 8357760, 'steps': 43529, 'loss/train': 1.3493149280548096} -11/07/2021 03:19:52 - INFO - __main__ - Step 43531: {'lr': 0.00040898770434592694, 'samples': 8357952, 'steps': 43530, 'loss/train': 1.3495090007781982} -11/07/2021 03:19:53 - INFO - __main__ - Step 43532: {'lr': 0.0004089836089384768, 'samples': 8358144, 'steps': 43531, 'loss/train': 1.5462332963943481} -11/07/2021 03:19:53 - INFO - __main__ - Step 43533: {'lr': 0.0004089795134593911, 'samples': 8358336, 'steps': 43532, 'loss/train': 1.2180896997451782} -11/07/2021 03:19:54 - INFO - __main__ - Step 43534: {'lr': 0.00040897541790867165, 'samples': 8358528, 'steps': 43533, 'loss/train': 2.5205626487731934} -11/07/2021 03:19:54 - INFO - __main__ - Step 43535: {'lr': 0.00040897132228632035, 'samples': 8358720, 'steps': 43534, 'loss/train': 1.61453115940094} -11/07/2021 03:19:54 - INFO - __main__ - Step 43536: {'lr': 0.000408967226592339, 'samples': 8358912, 'steps': 43535, 'loss/train': 1.846745252609253} -11/07/2021 03:19:56 - INFO - __main__ - Step 43537: {'lr': 0.00040896313082672953, 'samples': 8359104, 'steps': 43536, 'loss/train': 0.9068235754966736} -11/07/2021 03:19:56 - INFO - __main__ - Step 43538: {'lr': 0.0004089590349894937, 'samples': 8359296, 'steps': 43537, 'loss/train': 1.7170244455337524} -11/07/2021 03:19:56 - INFO - __main__ - Step 43539: {'lr': 0.0004089549390806334, 'samples': 8359488, 'steps': 43538, 'loss/train': 1.5198299884796143} -11/07/2021 03:19:57 - INFO - __main__ - Step 43540: {'lr': 0.0004089508431001504, 'samples': 8359680, 'steps': 43539, 'loss/train': 1.860291600227356} -11/07/2021 03:19:57 - INFO - __main__ - Step 43541: {'lr': 0.00040894674704804667, 'samples': 8359872, 'steps': 43540, 'loss/train': 1.6128144264221191} -11/07/2021 03:19:57 - INFO - __main__ - Step 43542: {'lr': 0.00040894265092432397, 'samples': 8360064, 'steps': 43541, 'loss/train': 1.2706501483917236} -11/07/2021 03:19:58 - INFO - __main__ - Step 43543: {'lr': 0.0004089385547289841, 'samples': 8360256, 'steps': 43542, 'loss/train': 0.9065102338790894} -11/07/2021 03:19:59 - INFO - __main__ - Step 43544: {'lr': 0.00040893445846202904, 'samples': 8360448, 'steps': 43543, 'loss/train': 1.482672929763794} -11/07/2021 03:19:59 - INFO - __main__ - Step 43545: {'lr': 0.00040893036212346056, 'samples': 8360640, 'steps': 43544, 'loss/train': 1.546755075454712} -11/07/2021 03:19:59 - INFO - __main__ - Step 43546: {'lr': 0.00040892626571328053, 'samples': 8360832, 'steps': 43545, 'loss/train': 1.0674269199371338} -11/07/2021 03:20:00 - INFO - __main__ - Step 43547: {'lr': 0.00040892216923149073, 'samples': 8361024, 'steps': 43546, 'loss/train': 1.7720543146133423} -11/07/2021 03:20:01 - INFO - __main__ - Step 43548: {'lr': 0.000408918072678093, 'samples': 8361216, 'steps': 43547, 'loss/train': 1.5051828622817993} -11/07/2021 03:20:01 - INFO - __main__ - Step 43549: {'lr': 0.0004089139760530893, 'samples': 8361408, 'steps': 43548, 'loss/train': 1.3326727151870728} -11/07/2021 03:20:02 - INFO - __main__ - Step 43550: {'lr': 0.0004089098793564815, 'samples': 8361600, 'steps': 43549, 'loss/train': 1.5760725736618042} -11/07/2021 03:20:02 - INFO - __main__ - Step 43551: {'lr': 0.00040890578258827125, 'samples': 8361792, 'steps': 43550, 'loss/train': 1.712302327156067} -11/07/2021 03:20:02 - INFO - __main__ - Step 43552: {'lr': 0.00040890168574846055, 'samples': 8361984, 'steps': 43551, 'loss/train': 1.5927711725234985} -11/07/2021 03:20:03 - INFO - __main__ - Step 43553: {'lr': 0.0004088975888370512, 'samples': 8362176, 'steps': 43552, 'loss/train': 1.4326268434524536} -11/07/2021 03:20:04 - INFO - __main__ - Step 43554: {'lr': 0.00040889349185404503, 'samples': 8362368, 'steps': 43553, 'loss/train': 1.8387601375579834} -11/07/2021 03:20:04 - INFO - __main__ - Step 43555: {'lr': 0.00040888939479944385, 'samples': 8362560, 'steps': 43554, 'loss/train': 1.3779672384262085} -11/07/2021 03:20:04 - INFO - __main__ - Step 43556: {'lr': 0.00040888529767324966, 'samples': 8362752, 'steps': 43555, 'loss/train': 1.569291114807129} -11/07/2021 03:20:05 - INFO - __main__ - Step 43557: {'lr': 0.0004088812004754642, 'samples': 8362944, 'steps': 43556, 'loss/train': 0.6441032886505127} -11/07/2021 03:20:06 - INFO - __main__ - Step 43558: {'lr': 0.00040887710320608927, 'samples': 8363136, 'steps': 43557, 'loss/train': 0.5327775478363037} -11/07/2021 03:20:06 - INFO - __main__ - Step 43559: {'lr': 0.00040887300586512677, 'samples': 8363328, 'steps': 43558, 'loss/train': 1.2207534313201904} -11/07/2021 03:20:06 - INFO - __main__ - Step 43560: {'lr': 0.0004088689084525786, 'samples': 8363520, 'steps': 43559, 'loss/train': 1.6354135274887085} -11/07/2021 03:20:07 - INFO - __main__ - Step 43561: {'lr': 0.0004088648109684465, 'samples': 8363712, 'steps': 43560, 'loss/train': 1.0811123847961426} -11/07/2021 03:20:07 - INFO - __main__ - Step 43562: {'lr': 0.00040886071341273236, 'samples': 8363904, 'steps': 43561, 'loss/train': 1.5641906261444092} -11/07/2021 03:20:08 - INFO - __main__ - Step 43563: {'lr': 0.0004088566157854381, 'samples': 8364096, 'steps': 43562, 'loss/train': 0.8359418511390686} -11/07/2021 03:20:08 - INFO - __main__ - Step 43564: {'lr': 0.0004088525180865654, 'samples': 8364288, 'steps': 43563, 'loss/train': 1.4746079444885254} -11/07/2021 03:20:09 - INFO - __main__ - Step 43565: {'lr': 0.0004088484203161163, 'samples': 8364480, 'steps': 43564, 'loss/train': 1.2377235889434814} -11/07/2021 03:20:09 - INFO - __main__ - Step 43566: {'lr': 0.0004088443224740925, 'samples': 8364672, 'steps': 43565, 'loss/train': 0.6066043972969055} -11/07/2021 03:20:09 - INFO - __main__ - Step 43567: {'lr': 0.00040884022456049595, 'samples': 8364864, 'steps': 43566, 'loss/train': 1.4646358489990234} -11/07/2021 03:20:10 - INFO - __main__ - Step 43568: {'lr': 0.00040883612657532844, 'samples': 8365056, 'steps': 43567, 'loss/train': 0.7460005879402161} -11/07/2021 03:20:11 - INFO - __main__ - Step 43569: {'lr': 0.0004088320285185918, 'samples': 8365248, 'steps': 43568, 'loss/train': 1.2883244752883911} -11/07/2021 03:20:11 - INFO - __main__ - Step 43570: {'lr': 0.0004088279303902879, 'samples': 8365440, 'steps': 43569, 'loss/train': 1.4460668563842773} -11/07/2021 03:20:12 - INFO - __main__ - Step 43571: {'lr': 0.0004088238321904185, 'samples': 8365632, 'steps': 43570, 'loss/train': 1.7092125415802002} -11/07/2021 03:20:12 - INFO - __main__ - Step 43572: {'lr': 0.00040881973391898563, 'samples': 8365824, 'steps': 43571, 'loss/train': 1.3663840293884277} -11/07/2021 03:20:12 - INFO - __main__ - Step 43573: {'lr': 0.00040881563557599107, 'samples': 8366016, 'steps': 43572, 'loss/train': 1.221165418624878} -11/07/2021 03:20:13 - INFO - __main__ - Step 43574: {'lr': 0.00040881153716143656, 'samples': 8366208, 'steps': 43573, 'loss/train': 1.2819992303848267} -11/07/2021 03:20:14 - INFO - __main__ - Step 43575: {'lr': 0.000408807438675324, 'samples': 8366400, 'steps': 43574, 'loss/train': 1.6424840688705444} -11/07/2021 03:20:14 - INFO - __main__ - Step 43576: {'lr': 0.0004088033401176554, 'samples': 8366592, 'steps': 43575, 'loss/train': 1.4731272459030151} -11/07/2021 03:20:14 - INFO - __main__ - Step 43577: {'lr': 0.00040879924148843233, 'samples': 8366784, 'steps': 43576, 'loss/train': 1.5095930099487305} -11/07/2021 03:20:15 - INFO - __main__ - Step 43578: {'lr': 0.00040879514278765685, 'samples': 8366976, 'steps': 43577, 'loss/train': 1.735713005065918} -11/07/2021 03:20:16 - INFO - __main__ - Step 43579: {'lr': 0.00040879104401533064, 'samples': 8367168, 'steps': 43578, 'loss/train': 1.2982885837554932} -11/07/2021 03:20:16 - INFO - __main__ - Step 43580: {'lr': 0.0004087869451714557, 'samples': 8367360, 'steps': 43579, 'loss/train': 1.4081155061721802} -11/07/2021 03:20:16 - INFO - __main__ - Step 43581: {'lr': 0.0004087828462560338, 'samples': 8367552, 'steps': 43580, 'loss/train': 1.8157951831817627} -11/07/2021 03:20:17 - INFO - __main__ - Step 43582: {'lr': 0.0004087787472690668, 'samples': 8367744, 'steps': 43581, 'loss/train': 1.1368916034698486} -11/07/2021 03:20:17 - INFO - __main__ - Step 43583: {'lr': 0.00040877464821055656, 'samples': 8367936, 'steps': 43582, 'loss/train': 1.5306081771850586} -11/07/2021 03:20:18 - INFO - __main__ - Step 43584: {'lr': 0.00040877054908050495, 'samples': 8368128, 'steps': 43583, 'loss/train': 1.5217291116714478} -11/07/2021 03:20:18 - INFO - __main__ - Step 43585: {'lr': 0.0004087664498789137, 'samples': 8368320, 'steps': 43584, 'loss/train': 1.1860651969909668} -11/07/2021 03:20:19 - INFO - __main__ - Step 43586: {'lr': 0.00040876235060578476, 'samples': 8368512, 'steps': 43585, 'loss/train': 1.665792465209961} -11/07/2021 03:20:19 - INFO - __main__ - Step 43587: {'lr': 0.00040875825126112, 'samples': 8368704, 'steps': 43586, 'loss/train': 1.4056962728500366} -11/07/2021 03:20:19 - INFO - __main__ - Step 43588: {'lr': 0.00040875415184492113, 'samples': 8368896, 'steps': 43587, 'loss/train': 1.6160039901733398} -11/07/2021 03:20:21 - INFO - __main__ - Step 43589: {'lr': 0.0004087500523571902, 'samples': 8369088, 'steps': 43588, 'loss/train': 1.5002211332321167} -11/07/2021 03:20:21 - INFO - __main__ - Step 43590: {'lr': 0.00040874595279792884, 'samples': 8369280, 'steps': 43589, 'loss/train': 1.3868716955184937} -11/07/2021 03:20:21 - INFO - __main__ - Step 43591: {'lr': 0.00040874185316713905, 'samples': 8369472, 'steps': 43590, 'loss/train': 1.3115204572677612} -11/07/2021 03:20:22 - INFO - __main__ - Step 43592: {'lr': 0.00040873775346482265, 'samples': 8369664, 'steps': 43591, 'loss/train': 0.7397732734680176} -11/07/2021 03:20:22 - INFO - __main__ - Step 43593: {'lr': 0.0004087336536909815, 'samples': 8369856, 'steps': 43592, 'loss/train': 1.7234948873519897} -11/07/2021 03:20:24 - INFO - __main__ - Step 43594: {'lr': 0.00040872955384561735, 'samples': 8370048, 'steps': 43593, 'loss/train': 1.3786344528198242} -11/07/2021 03:20:24 - INFO - __main__ - Step 43595: {'lr': 0.00040872545392873214, 'samples': 8370240, 'steps': 43594, 'loss/train': 1.480933427810669} -11/07/2021 03:20:24 - INFO - __main__ - Step 43596: {'lr': 0.00040872135394032764, 'samples': 8370432, 'steps': 43595, 'loss/train': 1.488183856010437} -11/07/2021 03:20:25 - INFO - __main__ - Step 43597: {'lr': 0.0004087172538804058, 'samples': 8370624, 'steps': 43596, 'loss/train': 1.3239374160766602} -11/07/2021 03:20:25 - INFO - __main__ - Step 43598: {'lr': 0.0004087131537489685, 'samples': 8370816, 'steps': 43597, 'loss/train': 1.4526338577270508} -11/07/2021 03:20:25 - INFO - __main__ - Step 43599: {'lr': 0.00040870905354601733, 'samples': 8371008, 'steps': 43598, 'loss/train': 1.9269925355911255} -11/07/2021 03:20:26 - INFO - __main__ - Step 43600: {'lr': 0.0004087049532715544, 'samples': 8371200, 'steps': 43599, 'loss/train': 0.2446974217891693} -11/07/2021 03:20:27 - INFO - __main__ - Step 43601: {'lr': 0.00040870085292558147, 'samples': 8371392, 'steps': 43600, 'loss/train': 1.1627293825149536} -11/07/2021 03:20:27 - INFO - __main__ - Step 43602: {'lr': 0.0004086967525081003, 'samples': 8371584, 'steps': 43601, 'loss/train': 1.3988213539123535} -11/07/2021 03:20:27 - INFO - __main__ - Step 43603: {'lr': 0.00040869265201911285, 'samples': 8371776, 'steps': 43602, 'loss/train': 0.8341631889343262} -11/07/2021 03:20:28 - INFO - __main__ - Step 43604: {'lr': 0.00040868855145862105, 'samples': 8371968, 'steps': 43603, 'loss/train': 1.744335412979126} -11/07/2021 03:20:29 - INFO - __main__ - Step 43605: {'lr': 0.00040868445082662655, 'samples': 8372160, 'steps': 43604, 'loss/train': 1.4655396938323975} -11/07/2021 03:20:29 - INFO - __main__ - Step 43606: {'lr': 0.0004086803501231313, 'samples': 8372352, 'steps': 43605, 'loss/train': 1.306358814239502} -11/07/2021 03:20:29 - INFO - __main__ - Step 43607: {'lr': 0.00040867624934813715, 'samples': 8372544, 'steps': 43606, 'loss/train': 2.9461324214935303} -11/07/2021 03:20:30 - INFO - __main__ - Step 43608: {'lr': 0.00040867214850164594, 'samples': 8372736, 'steps': 43607, 'loss/train': 0.9181822538375854} -11/07/2021 03:20:30 - INFO - __main__ - Step 43609: {'lr': 0.0004086680475836594, 'samples': 8372928, 'steps': 43608, 'loss/train': 0.5646260976791382} -11/07/2021 03:20:31 - INFO - __main__ - Step 43610: {'lr': 0.0004086639465941796, 'samples': 8373120, 'steps': 43609, 'loss/train': 1.3706705570220947} -11/07/2021 03:20:32 - INFO - __main__ - Step 43611: {'lr': 0.00040865984553320825, 'samples': 8373312, 'steps': 43610, 'loss/train': 1.3446487188339233} -11/07/2021 03:20:32 - INFO - __main__ - Step 43612: {'lr': 0.0004086557444007472, 'samples': 8373504, 'steps': 43611, 'loss/train': 1.6764800548553467} -11/07/2021 03:20:32 - INFO - __main__ - Step 43613: {'lr': 0.0004086516431967984, 'samples': 8373696, 'steps': 43612, 'loss/train': 1.6255570650100708} -11/07/2021 03:20:33 - INFO - __main__ - Step 43614: {'lr': 0.0004086475419213635, 'samples': 8373888, 'steps': 43613, 'loss/train': 1.2821707725524902} -11/07/2021 03:20:33 - INFO - __main__ - Step 43615: {'lr': 0.0004086434405744445, 'samples': 8374080, 'steps': 43614, 'loss/train': 1.3963944911956787} -11/07/2021 03:20:34 - INFO - __main__ - Step 43616: {'lr': 0.00040863933915604323, 'samples': 8374272, 'steps': 43615, 'loss/train': 0.8696134686470032} -11/07/2021 03:20:34 - INFO - __main__ - Step 43617: {'lr': 0.00040863523766616157, 'samples': 8374464, 'steps': 43616, 'loss/train': 1.4096627235412598} -11/07/2021 03:20:35 - INFO - __main__ - Step 43618: {'lr': 0.0004086311361048012, 'samples': 8374656, 'steps': 43617, 'loss/train': 1.5101468563079834} -11/07/2021 03:20:35 - INFO - __main__ - Step 43619: {'lr': 0.0004086270344719642, 'samples': 8374848, 'steps': 43618, 'loss/train': 1.7593225240707397} -11/07/2021 03:20:35 - INFO - __main__ - Step 43620: {'lr': 0.00040862293276765227, 'samples': 8375040, 'steps': 43619, 'loss/train': 1.3444418907165527} -11/07/2021 03:20:36 - INFO - __main__ - Step 43621: {'lr': 0.00040861883099186725, 'samples': 8375232, 'steps': 43620, 'loss/train': 1.2412489652633667} -11/07/2021 03:20:37 - INFO - __main__ - Step 43622: {'lr': 0.0004086147291446111, 'samples': 8375424, 'steps': 43621, 'loss/train': 1.0515379905700684} -11/07/2021 03:20:37 - INFO - __main__ - Step 43623: {'lr': 0.0004086106272258856, 'samples': 8375616, 'steps': 43622, 'loss/train': 0.8363951444625854} -11/07/2021 03:20:37 - INFO - __main__ - Step 43624: {'lr': 0.0004086065252356925, 'samples': 8375808, 'steps': 43623, 'loss/train': 1.4724141359329224} -11/07/2021 03:20:38 - INFO - __main__ - Step 43625: {'lr': 0.00040860242317403383, 'samples': 8376000, 'steps': 43624, 'loss/train': 1.4095970392227173} -11/07/2021 03:20:39 - INFO - __main__ - Step 43626: {'lr': 0.0004085983210409114, 'samples': 8376192, 'steps': 43625, 'loss/train': 1.4020105600357056} -11/07/2021 03:20:40 - INFO - __main__ - Step 43627: {'lr': 0.00040859421883632696, 'samples': 8376384, 'steps': 43626, 'loss/train': 1.2069751024246216} -11/07/2021 03:20:40 - INFO - __main__ - Step 43628: {'lr': 0.0004085901165602824, 'samples': 8376576, 'steps': 43627, 'loss/train': 1.2861889600753784} -11/07/2021 03:20:40 - INFO - __main__ - Step 43629: {'lr': 0.00040858601421277956, 'samples': 8376768, 'steps': 43628, 'loss/train': 1.0271927118301392} -11/07/2021 03:20:41 - INFO - __main__ - Step 43630: {'lr': 0.00040858191179382044, 'samples': 8376960, 'steps': 43629, 'loss/train': 1.1741310358047485} -11/07/2021 03:20:41 - INFO - __main__ - Step 43631: {'lr': 0.0004085778093034066, 'samples': 8377152, 'steps': 43630, 'loss/train': 1.7343759536743164} -11/07/2021 03:20:42 - INFO - __main__ - Step 43632: {'lr': 0.0004085737067415401, 'samples': 8377344, 'steps': 43631, 'loss/train': 1.6797895431518555} -11/07/2021 03:20:42 - INFO - __main__ - Step 43633: {'lr': 0.00040856960410822277, 'samples': 8377536, 'steps': 43632, 'loss/train': 1.4149872064590454} -11/07/2021 03:20:43 - INFO - __main__ - Step 43634: {'lr': 0.0004085655014034564, 'samples': 8377728, 'steps': 43633, 'loss/train': 1.6078990697860718} -11/07/2021 03:20:43 - INFO - __main__ - Step 43635: {'lr': 0.0004085613986272428, 'samples': 8377920, 'steps': 43634, 'loss/train': 5.793621063232422} -11/07/2021 03:20:43 - INFO - __main__ - Step 43636: {'lr': 0.0004085572957795839, 'samples': 8378112, 'steps': 43635, 'loss/train': 1.4916640520095825} -11/07/2021 03:20:44 - INFO - __main__ - Step 43637: {'lr': 0.00040855319286048163, 'samples': 8378304, 'steps': 43636, 'loss/train': 1.4157909154891968} -11/07/2021 03:20:45 - INFO - __main__ - Step 43638: {'lr': 0.0004085490898699377, 'samples': 8378496, 'steps': 43637, 'loss/train': 1.3781392574310303} -11/07/2021 03:20:45 - INFO - __main__ - Step 43639: {'lr': 0.0004085449868079539, 'samples': 8378688, 'steps': 43638, 'loss/train': 1.5037422180175781} -11/07/2021 03:20:46 - INFO - __main__ - Step 43640: {'lr': 0.00040854088367453225, 'samples': 8378880, 'steps': 43639, 'loss/train': 1.285473346710205} -11/07/2021 03:20:46 - INFO - __main__ - Step 43641: {'lr': 0.00040853678046967454, 'samples': 8379072, 'steps': 43640, 'loss/train': 1.3737177848815918} -11/07/2021 03:20:46 - INFO - __main__ - Step 43642: {'lr': 0.00040853267719338256, 'samples': 8379264, 'steps': 43641, 'loss/train': 1.3150479793548584} -11/07/2021 03:20:47 - INFO - __main__ - Step 43643: {'lr': 0.00040852857384565824, 'samples': 8379456, 'steps': 43642, 'loss/train': 1.0506174564361572} -11/07/2021 03:20:48 - INFO - __main__ - Step 43644: {'lr': 0.00040852447042650337, 'samples': 8379648, 'steps': 43643, 'loss/train': 1.6337863206863403} -11/07/2021 03:20:48 - INFO - __main__ - Step 43645: {'lr': 0.0004085203669359198, 'samples': 8379840, 'steps': 43644, 'loss/train': 1.521552324295044} -11/07/2021 03:20:48 - INFO - __main__ - Step 43646: {'lr': 0.0004085162633739095, 'samples': 8380032, 'steps': 43645, 'loss/train': 1.760745882987976} -11/07/2021 03:20:49 - INFO - __main__ - Step 43647: {'lr': 0.0004085121597404741, 'samples': 8380224, 'steps': 43646, 'loss/train': 1.9856324195861816} -11/07/2021 03:20:50 - INFO - __main__ - Step 43648: {'lr': 0.0004085080560356156, 'samples': 8380416, 'steps': 43647, 'loss/train': 1.5533442497253418} -11/07/2021 03:20:50 - INFO - __main__ - Step 43649: {'lr': 0.0004085039522593358, 'samples': 8380608, 'steps': 43648, 'loss/train': 1.524967908859253} -11/07/2021 03:20:51 - INFO - __main__ - Step 43650: {'lr': 0.0004084998484116366, 'samples': 8380800, 'steps': 43649, 'loss/train': 1.6469630002975464} -11/07/2021 03:20:51 - INFO - __main__ - Step 43651: {'lr': 0.0004084957444925198, 'samples': 8380992, 'steps': 43650, 'loss/train': 1.450783371925354} -11/07/2021 03:20:51 - INFO - __main__ - Step 43652: {'lr': 0.0004084916405019873, 'samples': 8381184, 'steps': 43651, 'loss/train': 1.3922834396362305} -11/07/2021 03:20:52 - INFO - __main__ - Step 43653: {'lr': 0.0004084875364400409, 'samples': 8381376, 'steps': 43652, 'loss/train': 1.9974443912506104} -11/07/2021 03:20:53 - INFO - __main__ - Step 43654: {'lr': 0.0004084834323066824, 'samples': 8381568, 'steps': 43653, 'loss/train': 1.7659012079238892} -11/07/2021 03:20:53 - INFO - __main__ - Step 43655: {'lr': 0.00040847932810191375, 'samples': 8381760, 'steps': 43654, 'loss/train': 1.340469479560852} -11/07/2021 03:20:53 - INFO - __main__ - Step 43656: {'lr': 0.00040847522382573675, 'samples': 8381952, 'steps': 43655, 'loss/train': 1.574964165687561} -11/07/2021 03:20:54 - INFO - __main__ - Step 43657: {'lr': 0.0004084711194781533, 'samples': 8382144, 'steps': 43656, 'loss/train': 1.0405417680740356} -11/07/2021 03:20:54 - INFO - __main__ - Step 43658: {'lr': 0.00040846701505916516, 'samples': 8382336, 'steps': 43657, 'loss/train': 1.6210185289382935} -11/07/2021 03:20:55 - INFO - __main__ - Step 43659: {'lr': 0.00040846291056877425, 'samples': 8382528, 'steps': 43658, 'loss/train': 1.4585506916046143} -11/07/2021 03:20:55 - INFO - __main__ - Step 43660: {'lr': 0.0004084588060069824, 'samples': 8382720, 'steps': 43659, 'loss/train': 1.3846935033798218} -11/07/2021 03:20:56 - INFO - __main__ - Step 43661: {'lr': 0.0004084547013737915, 'samples': 8382912, 'steps': 43660, 'loss/train': 1.5579522848129272} -11/07/2021 03:20:56 - INFO - __main__ - Step 43662: {'lr': 0.00040845059666920323, 'samples': 8383104, 'steps': 43661, 'loss/train': 1.7791005373001099} -11/07/2021 03:20:57 - INFO - __main__ - Step 43663: {'lr': 0.0004084464918932197, 'samples': 8383296, 'steps': 43662, 'loss/train': 1.4406996965408325} -11/07/2021 03:20:58 - INFO - __main__ - Step 43664: {'lr': 0.0004084423870458426, 'samples': 8383488, 'steps': 43663, 'loss/train': 1.6090887784957886} -11/07/2021 03:20:58 - INFO - __main__ - Step 43665: {'lr': 0.00040843828212707366, 'samples': 8383680, 'steps': 43664, 'loss/train': 1.5177305936813354} -11/07/2021 03:20:58 - INFO - __main__ - Step 43666: {'lr': 0.00040843417713691505, 'samples': 8383872, 'steps': 43665, 'loss/train': 0.8475781083106995} -11/07/2021 03:20:59 - INFO - __main__ - Step 43667: {'lr': 0.0004084300720753684, 'samples': 8384064, 'steps': 43666, 'loss/train': 1.6888883113861084} -11/07/2021 03:20:59 - INFO - __main__ - Step 43668: {'lr': 0.0004084259669424356, 'samples': 8384256, 'steps': 43667, 'loss/train': 1.521574854850769} -11/07/2021 03:21:00 - INFO - __main__ - Step 43669: {'lr': 0.0004084218617381185, 'samples': 8384448, 'steps': 43668, 'loss/train': 1.4842170476913452} -11/07/2021 03:21:00 - INFO - __main__ - Step 43670: {'lr': 0.00040841775646241897, 'samples': 8384640, 'steps': 43669, 'loss/train': 0.7249814867973328} -11/07/2021 03:21:01 - INFO - __main__ - Step 43671: {'lr': 0.0004084136511153388, 'samples': 8384832, 'steps': 43670, 'loss/train': 1.9210768938064575} -11/07/2021 03:21:01 - INFO - __main__ - Step 43672: {'lr': 0.0004084095456968799, 'samples': 8385024, 'steps': 43671, 'loss/train': 1.5453283786773682} -11/07/2021 03:21:02 - INFO - __main__ - Step 43673: {'lr': 0.0004084054402070441, 'samples': 8385216, 'steps': 43672, 'loss/train': 1.5406078100204468} -11/07/2021 03:21:02 - INFO - __main__ - Step 43674: {'lr': 0.0004084013346458333, 'samples': 8385408, 'steps': 43673, 'loss/train': 1.7233799695968628} -11/07/2021 03:21:03 - INFO - __main__ - Step 43675: {'lr': 0.00040839722901324924, 'samples': 8385600, 'steps': 43674, 'loss/train': 0.7722538709640503} -11/07/2021 03:21:03 - INFO - __main__ - Step 43676: {'lr': 0.00040839312330929377, 'samples': 8385792, 'steps': 43675, 'loss/train': 1.3467720746994019} -11/07/2021 03:21:04 - INFO - __main__ - Step 43677: {'lr': 0.00040838901753396896, 'samples': 8385984, 'steps': 43676, 'loss/train': 1.4793387651443481} -11/07/2021 03:21:04 - INFO - __main__ - Step 43678: {'lr': 0.0004083849116872764, 'samples': 8386176, 'steps': 43677, 'loss/train': 1.6407707929611206} -11/07/2021 03:21:05 - INFO - __main__ - Step 43679: {'lr': 0.0004083808057692181, 'samples': 8386368, 'steps': 43678, 'loss/train': 1.5521893501281738} -11/07/2021 03:21:05 - INFO - __main__ - Step 43680: {'lr': 0.00040837669977979586, 'samples': 8386560, 'steps': 43679, 'loss/train': 1.1769499778747559} -11/07/2021 03:21:06 - INFO - __main__ - Step 43681: {'lr': 0.00040837259371901145, 'samples': 8386752, 'steps': 43680, 'loss/train': 1.577649474143982} -11/07/2021 03:21:06 - INFO - __main__ - Step 43682: {'lr': 0.00040836848758686687, 'samples': 8386944, 'steps': 43681, 'loss/train': 1.474136233329773} -11/07/2021 03:21:06 - INFO - __main__ - Step 43683: {'lr': 0.00040836438138336384, 'samples': 8387136, 'steps': 43682, 'loss/train': 1.5819343328475952} -11/07/2021 03:21:07 - INFO - __main__ - Step 43684: {'lr': 0.00040836027510850426, 'samples': 8387328, 'steps': 43683, 'loss/train': 1.250996708869934} -11/07/2021 03:21:08 - INFO - __main__ - Step 43685: {'lr': 0.00040835616876229, 'samples': 8387520, 'steps': 43684, 'loss/train': 1.6471080780029297} -11/07/2021 03:21:08 - INFO - __main__ - Step 43686: {'lr': 0.00040835206234472287, 'samples': 8387712, 'steps': 43685, 'loss/train': 1.461700439453125} -11/07/2021 03:21:08 - INFO - __main__ - Step 43687: {'lr': 0.0004083479558558048, 'samples': 8387904, 'steps': 43686, 'loss/train': 1.5194342136383057} -11/07/2021 03:21:09 - INFO - __main__ - Step 43688: {'lr': 0.0004083438492955376, 'samples': 8388096, 'steps': 43687, 'loss/train': 1.0905221700668335} -11/07/2021 03:21:10 - INFO - __main__ - Step 43689: {'lr': 0.00040833974266392306, 'samples': 8388288, 'steps': 43688, 'loss/train': 1.6670489311218262} -11/07/2021 03:21:10 - INFO - __main__ - Step 43690: {'lr': 0.00040833563596096305, 'samples': 8388480, 'steps': 43689, 'loss/train': 1.2590972185134888} -11/07/2021 03:21:10 - INFO - __main__ - Step 43691: {'lr': 0.0004083315291866595, 'samples': 8388672, 'steps': 43690, 'loss/train': 1.5689071416854858} -11/07/2021 03:21:11 - INFO - __main__ - Step 43692: {'lr': 0.00040832742234101415, 'samples': 8388864, 'steps': 43691, 'loss/train': 1.4217921495437622} -11/07/2021 03:21:11 - INFO - __main__ - Step 43693: {'lr': 0.00040832331542402895, 'samples': 8389056, 'steps': 43692, 'loss/train': 1.8546339273452759} -11/07/2021 03:21:12 - INFO - __main__ - Step 43694: {'lr': 0.0004083192084357057, 'samples': 8389248, 'steps': 43693, 'loss/train': 1.5490301847457886} -11/07/2021 03:21:13 - INFO - __main__ - Step 43695: {'lr': 0.0004083151013760462, 'samples': 8389440, 'steps': 43694, 'loss/train': 1.5929126739501953} -11/07/2021 03:21:13 - INFO - __main__ - Step 43696: {'lr': 0.0004083109942450524, 'samples': 8389632, 'steps': 43695, 'loss/train': 1.4311790466308594} -11/07/2021 03:21:13 - INFO - __main__ - Step 43697: {'lr': 0.00040830688704272615, 'samples': 8389824, 'steps': 43696, 'loss/train': 1.2046213150024414} -11/07/2021 03:21:14 - INFO - __main__ - Step 43698: {'lr': 0.0004083027797690693, 'samples': 8390016, 'steps': 43697, 'loss/train': 1.4289475679397583} -11/07/2021 03:21:14 - INFO - __main__ - Step 43699: {'lr': 0.0004082986724240835, 'samples': 8390208, 'steps': 43698, 'loss/train': 1.9071747064590454} -11/07/2021 03:21:15 - INFO - __main__ - Step 43700: {'lr': 0.00040829456500777084, 'samples': 8390400, 'steps': 43699, 'loss/train': 1.3858799934387207} -11/07/2021 03:21:15 - INFO - __main__ - Step 43701: {'lr': 0.00040829045752013317, 'samples': 8390592, 'steps': 43700, 'loss/train': 1.8750146627426147} -11/07/2021 03:21:16 - INFO - __main__ - Step 43702: {'lr': 0.00040828634996117213, 'samples': 8390784, 'steps': 43701, 'loss/train': 1.3986989259719849} -11/07/2021 03:21:16 - INFO - __main__ - Step 43703: {'lr': 0.0004082822423308897, 'samples': 8390976, 'steps': 43702, 'loss/train': 0.9039545059204102} -11/07/2021 03:21:16 - INFO - __main__ - Step 43704: {'lr': 0.00040827813462928784, 'samples': 8391168, 'steps': 43703, 'loss/train': 1.2571094036102295} -11/07/2021 03:21:17 - INFO - __main__ - Step 43705: {'lr': 0.0004082740268563683, 'samples': 8391360, 'steps': 43704, 'loss/train': 1.4285101890563965} -11/07/2021 03:21:18 - INFO - __main__ - Step 43706: {'lr': 0.0004082699190121329, 'samples': 8391552, 'steps': 43705, 'loss/train': 0.6200053691864014} -11/07/2021 03:21:18 - INFO - __main__ - Step 43707: {'lr': 0.00040826581109658345, 'samples': 8391744, 'steps': 43706, 'loss/train': 1.3370939493179321} -11/07/2021 03:21:19 - INFO - __main__ - Step 43708: {'lr': 0.00040826170310972196, 'samples': 8391936, 'steps': 43707, 'loss/train': 1.3259520530700684} -11/07/2021 03:21:19 - INFO - __main__ - Step 43709: {'lr': 0.0004082575950515501, 'samples': 8392128, 'steps': 43708, 'loss/train': 1.5314348936080933} -11/07/2021 03:21:19 - INFO - __main__ - Step 43710: {'lr': 0.00040825348692206985, 'samples': 8392320, 'steps': 43709, 'loss/train': 1.7945643663406372} -11/07/2021 03:21:20 - INFO - __main__ - Step 43711: {'lr': 0.0004082493787212831, 'samples': 8392512, 'steps': 43710, 'loss/train': 1.4325158596038818} -11/07/2021 03:21:21 - INFO - __main__ - Step 43712: {'lr': 0.00040824527044919153, 'samples': 8392704, 'steps': 43711, 'loss/train': 1.5164660215377808} -11/07/2021 03:21:21 - INFO - __main__ - Step 43713: {'lr': 0.0004082411621057971, 'samples': 8392896, 'steps': 43712, 'loss/train': 1.6946877241134644} -11/07/2021 03:21:21 - INFO - __main__ - Step 43714: {'lr': 0.00040823705369110163, 'samples': 8393088, 'steps': 43713, 'loss/train': 0.49761763215065} -11/07/2021 03:21:22 - INFO - __main__ - Step 43715: {'lr': 0.000408232945205107, 'samples': 8393280, 'steps': 43714, 'loss/train': 1.9720444679260254} -11/07/2021 03:21:23 - INFO - __main__ - Step 43716: {'lr': 0.00040822883664781506, 'samples': 8393472, 'steps': 43715, 'loss/train': 0.9192848205566406} -11/07/2021 03:21:23 - INFO - __main__ - Step 43717: {'lr': 0.0004082247280192276, 'samples': 8393664, 'steps': 43716, 'loss/train': 1.2968155145645142} -11/07/2021 03:21:23 - INFO - __main__ - Step 43718: {'lr': 0.00040822061931934656, 'samples': 8393856, 'steps': 43717, 'loss/train': 1.8738207817077637} -11/07/2021 03:21:24 - INFO - __main__ - Step 43719: {'lr': 0.00040821651054817376, 'samples': 8394048, 'steps': 43718, 'loss/train': 1.6693713665008545} -11/07/2021 03:21:24 - INFO - __main__ - Step 43720: {'lr': 0.000408212401705711, 'samples': 8394240, 'steps': 43719, 'loss/train': 1.4084855318069458} -11/07/2021 03:21:25 - INFO - __main__ - Step 43721: {'lr': 0.0004082082927919602, 'samples': 8394432, 'steps': 43720, 'loss/train': 0.9644858241081238} -11/07/2021 03:21:25 - INFO - __main__ - Step 43722: {'lr': 0.0004082041838069232, 'samples': 8394624, 'steps': 43721, 'loss/train': 1.4714794158935547} -11/07/2021 03:21:26 - INFO - __main__ - Step 43723: {'lr': 0.0004082000747506018, 'samples': 8394816, 'steps': 43722, 'loss/train': 1.086302638053894} -11/07/2021 03:21:26 - INFO - __main__ - Step 43724: {'lr': 0.00040819596562299793, 'samples': 8395008, 'steps': 43723, 'loss/train': 0.6590692400932312} -11/07/2021 03:21:27 - INFO - __main__ - Step 43725: {'lr': 0.0004081918564241134, 'samples': 8395200, 'steps': 43724, 'loss/train': 1.3129510879516602} -11/07/2021 03:21:29 - INFO - __main__ - Step 43726: {'lr': 0.00040818774715395, 'samples': 8395392, 'steps': 43725, 'loss/train': 1.5787527561187744} -11/07/2021 03:21:29 - INFO - __main__ - Step 43727: {'lr': 0.0004081836378125097, 'samples': 8395584, 'steps': 43726, 'loss/train': 1.050729751586914} -11/07/2021 03:21:29 - INFO - __main__ - Step 43728: {'lr': 0.00040817952839979424, 'samples': 8395776, 'steps': 43727, 'loss/train': 1.8111873865127563} -11/07/2021 03:21:30 - INFO - __main__ - Step 43729: {'lr': 0.00040817541891580557, 'samples': 8395968, 'steps': 43728, 'loss/train': 0.9503833055496216} -11/07/2021 03:21:30 - INFO - __main__ - Step 43730: {'lr': 0.00040817130936054546, 'samples': 8396160, 'steps': 43729, 'loss/train': 1.7883265018463135} -11/07/2021 03:21:30 - INFO - __main__ - Step 43731: {'lr': 0.00040816719973401586, 'samples': 8396352, 'steps': 43730, 'loss/train': 1.64004647731781} -11/07/2021 03:21:31 - INFO - __main__ - Step 43732: {'lr': 0.0004081630900362185, 'samples': 8396544, 'steps': 43731, 'loss/train': 1.5553715229034424} -11/07/2021 03:21:32 - INFO - __main__ - Step 43733: {'lr': 0.0004081589802671553, 'samples': 8396736, 'steps': 43732, 'loss/train': 1.3468505144119263} -11/07/2021 03:21:32 - INFO - __main__ - Step 43734: {'lr': 0.00040815487042682814, 'samples': 8396928, 'steps': 43733, 'loss/train': 1.5261868238449097} -11/07/2021 03:21:32 - INFO - __main__ - Step 43735: {'lr': 0.0004081507605152388, 'samples': 8397120, 'steps': 43734, 'loss/train': 0.9943277835845947} -11/07/2021 03:21:33 - INFO - __main__ - Step 43736: {'lr': 0.0004081466505323892, 'samples': 8397312, 'steps': 43735, 'loss/train': 0.5817473530769348} -11/07/2021 03:21:33 - INFO - __main__ - Step 43737: {'lr': 0.0004081425404782811, 'samples': 8397504, 'steps': 43736, 'loss/train': 1.6696367263793945} -11/07/2021 03:21:34 - INFO - __main__ - Step 43738: {'lr': 0.00040813843035291655, 'samples': 8397696, 'steps': 43737, 'loss/train': 1.6473397016525269} -11/07/2021 03:21:35 - INFO - __main__ - Step 43739: {'lr': 0.00040813432015629714, 'samples': 8397888, 'steps': 43738, 'loss/train': 1.7417515516281128} -11/07/2021 03:21:35 - INFO - __main__ - Step 43740: {'lr': 0.0004081302098884249, 'samples': 8398080, 'steps': 43739, 'loss/train': 0.8534517288208008} -11/07/2021 03:21:35 - INFO - __main__ - Step 43741: {'lr': 0.0004081260995493015, 'samples': 8398272, 'steps': 43740, 'loss/train': 2.0336036682128906} -11/07/2021 03:21:36 - INFO - __main__ - Step 43742: {'lr': 0.0004081219891389291, 'samples': 8398464, 'steps': 43741, 'loss/train': 1.8651096820831299} -11/07/2021 03:21:36 - INFO - __main__ - Step 43743: {'lr': 0.0004081178786573092, 'samples': 8398656, 'steps': 43742, 'loss/train': 1.3008315563201904} -11/07/2021 03:21:37 - INFO - __main__ - Step 43744: {'lr': 0.000408113768104444, 'samples': 8398848, 'steps': 43743, 'loss/train': 1.471579909324646} -11/07/2021 03:21:38 - INFO - __main__ - Step 43745: {'lr': 0.0004081096574803351, 'samples': 8399040, 'steps': 43744, 'loss/train': 1.38153076171875} -11/07/2021 03:21:38 - INFO - __main__ - Step 43746: {'lr': 0.00040810554678498434, 'samples': 8399232, 'steps': 43745, 'loss/train': 1.2050849199295044} -11/07/2021 03:21:38 - INFO - __main__ - Step 43747: {'lr': 0.00040810143601839377, 'samples': 8399424, 'steps': 43746, 'loss/train': 1.6005651950836182} -11/07/2021 03:21:39 - INFO - __main__ - Step 43748: {'lr': 0.0004080973251805651, 'samples': 8399616, 'steps': 43747, 'loss/train': 1.2557823657989502} -11/07/2021 03:21:40 - INFO - __main__ - Step 43749: {'lr': 0.0004080932142715002, 'samples': 8399808, 'steps': 43748, 'loss/train': 1.5913665294647217} -11/07/2021 03:21:40 - INFO - __main__ - Step 43750: {'lr': 0.000408089103291201, 'samples': 8400000, 'steps': 43749, 'loss/train': 1.661261796951294} -11/07/2021 03:21:40 - INFO - __main__ - Step 43751: {'lr': 0.0004080849922396692, 'samples': 8400192, 'steps': 43750, 'loss/train': 1.527084231376648} -11/07/2021 03:21:41 - INFO - __main__ - Step 43752: {'lr': 0.00040808088111690677, 'samples': 8400384, 'steps': 43751, 'loss/train': 1.6774927377700806} -11/07/2021 03:21:41 - INFO - __main__ - Step 43753: {'lr': 0.00040807676992291557, 'samples': 8400576, 'steps': 43752, 'loss/train': 1.3135204315185547} -11/07/2021 03:21:42 - INFO - __main__ - Step 43754: {'lr': 0.0004080726586576974, 'samples': 8400768, 'steps': 43753, 'loss/train': 1.443676471710205} -11/07/2021 03:21:42 - INFO - __main__ - Step 43755: {'lr': 0.0004080685473212541, 'samples': 8400960, 'steps': 43754, 'loss/train': 1.5122127532958984} -11/07/2021 03:21:43 - INFO - __main__ - Step 43756: {'lr': 0.0004080644359135876, 'samples': 8401152, 'steps': 43755, 'loss/train': 1.314313530921936} -11/07/2021 03:21:43 - INFO - __main__ - Step 43757: {'lr': 0.00040806032443469967, 'samples': 8401344, 'steps': 43756, 'loss/train': 1.472224473953247} -11/07/2021 03:21:44 - INFO - __main__ - Step 43758: {'lr': 0.0004080562128845923, 'samples': 8401536, 'steps': 43757, 'loss/train': 1.3135592937469482} -11/07/2021 03:21:44 - INFO - __main__ - Step 43759: {'lr': 0.0004080521012632671, 'samples': 8401728, 'steps': 43758, 'loss/train': 1.6687555313110352} -11/07/2021 03:21:45 - INFO - __main__ - Step 43760: {'lr': 0.00040804798957072607, 'samples': 8401920, 'steps': 43759, 'loss/train': 1.6299394369125366} -11/07/2021 03:21:45 - INFO - __main__ - Step 43761: {'lr': 0.0004080438778069711, 'samples': 8402112, 'steps': 43760, 'loss/train': 1.4132717847824097} -11/07/2021 03:21:46 - INFO - __main__ - Step 43762: {'lr': 0.000408039765972004, 'samples': 8402304, 'steps': 43761, 'loss/train': 1.6096906661987305} -11/07/2021 03:21:46 - INFO - __main__ - Step 43763: {'lr': 0.0004080356540658266, 'samples': 8402496, 'steps': 43762, 'loss/train': 1.373243808746338} -11/07/2021 03:21:46 - INFO - __main__ - Step 43764: {'lr': 0.00040803154208844086, 'samples': 8402688, 'steps': 43763, 'loss/train': 1.814076542854309} -11/07/2021 03:21:47 - INFO - __main__ - Step 43765: {'lr': 0.00040802743003984845, 'samples': 8402880, 'steps': 43764, 'loss/train': 1.7175999879837036} -11/07/2021 03:21:48 - INFO - __main__ - Step 43766: {'lr': 0.0004080233179200513, 'samples': 8403072, 'steps': 43765, 'loss/train': 1.591747522354126} -11/07/2021 03:21:48 - INFO - __main__ - Step 43767: {'lr': 0.00040801920572905133, 'samples': 8403264, 'steps': 43766, 'loss/train': 1.5183857679367065} -11/07/2021 03:21:49 - INFO - __main__ - Step 43768: {'lr': 0.0004080150934668503, 'samples': 8403456, 'steps': 43767, 'loss/train': 1.1555874347686768} -11/07/2021 03:21:49 - INFO - __main__ - Step 43769: {'lr': 0.00040801098113345014, 'samples': 8403648, 'steps': 43768, 'loss/train': 1.8131109476089478} -11/07/2021 03:21:50 - INFO - __main__ - Step 43770: {'lr': 0.00040800686872885267, 'samples': 8403840, 'steps': 43769, 'loss/train': 0.3235270082950592} -11/07/2021 03:21:50 - INFO - __main__ - Step 43771: {'lr': 0.0004080027562530598, 'samples': 8404032, 'steps': 43770, 'loss/train': 1.4960527420043945} -11/07/2021 03:21:51 - INFO - __main__ - Step 43772: {'lr': 0.0004079986437060733, 'samples': 8404224, 'steps': 43771, 'loss/train': 2.1998274326324463} -11/07/2021 03:21:51 - INFO - __main__ - Step 43773: {'lr': 0.00040799453108789497, 'samples': 8404416, 'steps': 43772, 'loss/train': 1.7890753746032715} -11/07/2021 03:21:51 - INFO - __main__ - Step 43774: {'lr': 0.0004079904183985268, 'samples': 8404608, 'steps': 43773, 'loss/train': 1.5287282466888428} -11/07/2021 03:21:52 - INFO - __main__ - Step 43775: {'lr': 0.00040798630563797055, 'samples': 8404800, 'steps': 43774, 'loss/train': 1.4617946147918701} -11/07/2021 03:21:53 - INFO - __main__ - Step 43776: {'lr': 0.00040798219280622816, 'samples': 8404992, 'steps': 43775, 'loss/train': 1.5505151748657227} -11/07/2021 03:21:53 - INFO - __main__ - Step 43777: {'lr': 0.0004079780799033014, 'samples': 8405184, 'steps': 43776, 'loss/train': 1.1835485696792603} -11/07/2021 03:21:53 - INFO - __main__ - Step 43778: {'lr': 0.0004079739669291922, 'samples': 8405376, 'steps': 43777, 'loss/train': 1.4083938598632812} -11/07/2021 03:21:54 - INFO - __main__ - Step 43779: {'lr': 0.0004079698538839023, 'samples': 8405568, 'steps': 43778, 'loss/train': 1.3506239652633667} -11/07/2021 03:21:55 - INFO - __main__ - Step 43780: {'lr': 0.00040796574076743366, 'samples': 8405760, 'steps': 43779, 'loss/train': 1.6787636280059814} -11/07/2021 03:21:55 - INFO - __main__ - Step 43781: {'lr': 0.00040796162757978803, 'samples': 8405952, 'steps': 43780, 'loss/train': 2.036315679550171} -11/07/2021 03:21:55 - INFO - __main__ - Step 43782: {'lr': 0.00040795751432096746, 'samples': 8406144, 'steps': 43781, 'loss/train': 1.39372980594635} -11/07/2021 03:21:56 - INFO - __main__ - Step 43783: {'lr': 0.00040795340099097357, 'samples': 8406336, 'steps': 43782, 'loss/train': 1.23551607131958} -11/07/2021 03:21:56 - INFO - __main__ - Step 43784: {'lr': 0.00040794928758980837, 'samples': 8406528, 'steps': 43783, 'loss/train': 1.1073113679885864} -11/07/2021 03:21:56 - INFO - __main__ - Step 43785: {'lr': 0.0004079451741174737, 'samples': 8406720, 'steps': 43784, 'loss/train': 1.5919462442398071} -11/07/2021 03:21:58 - INFO - __main__ - Step 43786: {'lr': 0.00040794106057397123, 'samples': 8406912, 'steps': 43785, 'loss/train': 1.5587059259414673} -11/07/2021 03:21:58 - INFO - __main__ - Step 43787: {'lr': 0.00040793694695930304, 'samples': 8407104, 'steps': 43786, 'loss/train': 1.360137701034546} -11/07/2021 03:21:59 - INFO - __main__ - Step 43788: {'lr': 0.00040793283327347085, 'samples': 8407296, 'steps': 43787, 'loss/train': 1.580074667930603} -11/07/2021 03:21:59 - INFO - __main__ - Step 43789: {'lr': 0.00040792871951647657, 'samples': 8407488, 'steps': 43788, 'loss/train': 1.572245478630066} -11/07/2021 03:21:59 - INFO - __main__ - Step 43790: {'lr': 0.00040792460568832214, 'samples': 8407680, 'steps': 43789, 'loss/train': 1.5273981094360352} -11/07/2021 03:22:00 - INFO - __main__ - Step 43791: {'lr': 0.00040792049178900924, 'samples': 8407872, 'steps': 43790, 'loss/train': 1.3839747905731201} -11/07/2021 03:22:01 - INFO - __main__ - Step 43792: {'lr': 0.00040791637781853983, 'samples': 8408064, 'steps': 43791, 'loss/train': 1.33804190158844} -11/07/2021 03:22:01 - INFO - __main__ - Step 43793: {'lr': 0.0004079122637769157, 'samples': 8408256, 'steps': 43792, 'loss/train': 1.3798296451568604} -11/07/2021 03:22:02 - INFO - __main__ - Step 43794: {'lr': 0.0004079081496641388, 'samples': 8408448, 'steps': 43793, 'loss/train': 1.4129741191864014} -11/07/2021 03:22:02 - INFO - __main__ - Step 43795: {'lr': 0.0004079040354802109, 'samples': 8408640, 'steps': 43794, 'loss/train': 0.3329477906227112} -11/07/2021 03:22:03 - INFO - __main__ - Step 43796: {'lr': 0.00040789992122513386, 'samples': 8408832, 'steps': 43795, 'loss/train': 0.7639191150665283} -11/07/2021 03:22:04 - INFO - __main__ - Step 43797: {'lr': 0.00040789580689890953, 'samples': 8409024, 'steps': 43796, 'loss/train': 1.3062173128128052} -11/07/2021 03:22:04 - INFO - __main__ - Step 43798: {'lr': 0.00040789169250153985, 'samples': 8409216, 'steps': 43797, 'loss/train': 1.3329349756240845} -11/07/2021 03:22:04 - INFO - __main__ - Step 43799: {'lr': 0.00040788757803302656, 'samples': 8409408, 'steps': 43798, 'loss/train': 1.2266077995300293} -11/07/2021 03:22:05 - INFO - __main__ - Step 43800: {'lr': 0.00040788346349337156, 'samples': 8409600, 'steps': 43799, 'loss/train': 1.3185638189315796} -11/07/2021 03:22:05 - INFO - __main__ - Step 43801: {'lr': 0.00040787934888257673, 'samples': 8409792, 'steps': 43800, 'loss/train': 1.1510093212127686} -11/07/2021 03:22:06 - INFO - __main__ - Step 43802: {'lr': 0.00040787523420064394, 'samples': 8409984, 'steps': 43801, 'loss/train': 1.5760995149612427} -11/07/2021 03:22:06 - INFO - __main__ - Step 43803: {'lr': 0.00040787111944757496, 'samples': 8410176, 'steps': 43802, 'loss/train': 1.4465820789337158} -11/07/2021 03:22:07 - INFO - __main__ - Step 43804: {'lr': 0.0004078670046233717, 'samples': 8410368, 'steps': 43803, 'loss/train': 1.5060796737670898} -11/07/2021 03:22:07 - INFO - __main__ - Step 43805: {'lr': 0.000407862889728036, 'samples': 8410560, 'steps': 43804, 'loss/train': 1.6155372858047485} -11/07/2021 03:22:07 - INFO - __main__ - Step 43806: {'lr': 0.0004078587747615697, 'samples': 8410752, 'steps': 43805, 'loss/train': 1.4102935791015625} -11/07/2021 03:22:08 - INFO - __main__ - Step 43807: {'lr': 0.00040785465972397475, 'samples': 8410944, 'steps': 43806, 'loss/train': 1.7546608448028564} -11/07/2021 03:22:09 - INFO - __main__ - Step 43808: {'lr': 0.0004078505446152528, 'samples': 8411136, 'steps': 43807, 'loss/train': 1.7220182418823242} -11/07/2021 03:22:09 - INFO - __main__ - Step 43809: {'lr': 0.0004078464294354059, 'samples': 8411328, 'steps': 43808, 'loss/train': 1.6403729915618896} -11/07/2021 03:22:09 - INFO - __main__ - Step 43810: {'lr': 0.00040784231418443585, 'samples': 8411520, 'steps': 43809, 'loss/train': 1.6539579629898071} -11/07/2021 03:22:10 - INFO - __main__ - Step 43811: {'lr': 0.00040783819886234445, 'samples': 8411712, 'steps': 43810, 'loss/train': 1.6177512407302856} -11/07/2021 03:22:11 - INFO - __main__ - Step 43812: {'lr': 0.00040783408346913366, 'samples': 8411904, 'steps': 43811, 'loss/train': 1.1286613941192627} -11/07/2021 03:22:11 - INFO - __main__ - Step 43813: {'lr': 0.00040782996800480523, 'samples': 8412096, 'steps': 43812, 'loss/train': 1.3283767700195312} -11/07/2021 03:22:12 - INFO - __main__ - Step 43814: {'lr': 0.000407825852469361, 'samples': 8412288, 'steps': 43813, 'loss/train': 1.4667810201644897} -11/07/2021 03:22:12 - INFO - __main__ - Step 43815: {'lr': 0.00040782173686280287, 'samples': 8412480, 'steps': 43814, 'loss/train': 1.4546928405761719} -11/07/2021 03:22:12 - INFO - __main__ - Step 43816: {'lr': 0.0004078176211851328, 'samples': 8412672, 'steps': 43815, 'loss/train': 1.089661717414856} -11/07/2021 03:22:13 - INFO - __main__ - Step 43817: {'lr': 0.0004078135054363524, 'samples': 8412864, 'steps': 43816, 'loss/train': 1.2308920621871948} -11/07/2021 03:22:14 - INFO - __main__ - Step 43818: {'lr': 0.00040780938961646385, 'samples': 8413056, 'steps': 43817, 'loss/train': 1.5190150737762451} -11/07/2021 03:22:14 - INFO - __main__ - Step 43819: {'lr': 0.00040780527372546874, 'samples': 8413248, 'steps': 43818, 'loss/train': 1.7634469270706177} -11/07/2021 03:22:14 - INFO - __main__ - Step 43820: {'lr': 0.000407801157763369, 'samples': 8413440, 'steps': 43819, 'loss/train': 1.3441243171691895} -11/07/2021 03:22:15 - INFO - __main__ - Step 43821: {'lr': 0.0004077970417301665, 'samples': 8413632, 'steps': 43820, 'loss/train': 1.578310251235962} -11/07/2021 03:22:15 - INFO - __main__ - Step 43822: {'lr': 0.00040779292562586304, 'samples': 8413824, 'steps': 43821, 'loss/train': 1.3511230945587158} -11/07/2021 03:22:16 - INFO - __main__ - Step 43823: {'lr': 0.0004077888094504606, 'samples': 8414016, 'steps': 43822, 'loss/train': 1.7738044261932373} -11/07/2021 03:22:16 - INFO - __main__ - Step 43824: {'lr': 0.0004077846932039609, 'samples': 8414208, 'steps': 43823, 'loss/train': 1.5807143449783325} -11/07/2021 03:22:17 - INFO - __main__ - Step 43825: {'lr': 0.00040778057688636594, 'samples': 8414400, 'steps': 43824, 'loss/train': 1.0032193660736084} -11/07/2021 03:22:17 - INFO - __main__ - Step 43826: {'lr': 0.00040777646049767736, 'samples': 8414592, 'steps': 43825, 'loss/train': 1.5744746923446655} -11/07/2021 03:22:17 - INFO - __main__ - Step 43827: {'lr': 0.0004077723440378972, 'samples': 8414784, 'steps': 43826, 'loss/train': 1.5103524923324585} -11/07/2021 03:22:18 - INFO - __main__ - Step 43828: {'lr': 0.0004077682275070273, 'samples': 8414976, 'steps': 43827, 'loss/train': 1.714619517326355} -11/07/2021 03:22:19 - INFO - __main__ - Step 43829: {'lr': 0.00040776411090506944, 'samples': 8415168, 'steps': 43828, 'loss/train': 4.008372783660889} -11/07/2021 03:22:19 - INFO - __main__ - Step 43830: {'lr': 0.0004077599942320255, 'samples': 8415360, 'steps': 43829, 'loss/train': 1.4760822057724} -11/07/2021 03:22:19 - INFO - __main__ - Step 43831: {'lr': 0.00040775587748789733, 'samples': 8415552, 'steps': 43830, 'loss/train': 1.6377016305923462} -11/07/2021 03:22:20 - INFO - __main__ - Step 43832: {'lr': 0.0004077517606726868, 'samples': 8415744, 'steps': 43831, 'loss/train': 1.2174091339111328} -11/07/2021 03:22:21 - INFO - __main__ - Step 43833: {'lr': 0.0004077476437863958, 'samples': 8415936, 'steps': 43832, 'loss/train': 1.558376431465149} -11/07/2021 03:22:22 - INFO - __main__ - Step 43834: {'lr': 0.0004077435268290261, 'samples': 8416128, 'steps': 43833, 'loss/train': 1.772778034210205} -11/07/2021 03:22:22 - INFO - __main__ - Step 43835: {'lr': 0.0004077394098005796, 'samples': 8416320, 'steps': 43834, 'loss/train': 1.7632755041122437} -11/07/2021 03:22:22 - INFO - __main__ - Step 43836: {'lr': 0.00040773529270105816, 'samples': 8416512, 'steps': 43835, 'loss/train': 0.5030577182769775} -11/07/2021 03:22:23 - INFO - __main__ - Step 43837: {'lr': 0.0004077311755304637, 'samples': 8416704, 'steps': 43836, 'loss/train': 1.724934458732605} -11/07/2021 03:22:24 - INFO - __main__ - Step 43838: {'lr': 0.000407727058288798, 'samples': 8416896, 'steps': 43837, 'loss/train': 1.2645070552825928} -11/07/2021 03:22:24 - INFO - __main__ - Step 43839: {'lr': 0.00040772294097606276, 'samples': 8417088, 'steps': 43838, 'loss/train': 1.1850857734680176} -11/07/2021 03:22:24 - INFO - __main__ - Step 43840: {'lr': 0.0004077188235922601, 'samples': 8417280, 'steps': 43839, 'loss/train': 1.8185043334960938} -11/07/2021 03:22:25 - INFO - __main__ - Step 43841: {'lr': 0.0004077147061373918, 'samples': 8417472, 'steps': 43840, 'loss/train': 1.5139338970184326} -11/07/2021 03:22:25 - INFO - __main__ - Step 43842: {'lr': 0.00040771058861145963, 'samples': 8417664, 'steps': 43841, 'loss/train': 1.6452528238296509} -11/07/2021 03:22:25 - INFO - __main__ - Step 43843: {'lr': 0.0004077064710144656, 'samples': 8417856, 'steps': 43842, 'loss/train': 2.128436326980591} -11/07/2021 03:22:27 - INFO - __main__ - Step 43844: {'lr': 0.0004077023533464114, 'samples': 8418048, 'steps': 43843, 'loss/train': 1.321452260017395} -11/07/2021 03:22:27 - INFO - __main__ - Step 43845: {'lr': 0.000407698235607299, 'samples': 8418240, 'steps': 43844, 'loss/train': 1.3933018445968628} -11/07/2021 03:22:27 - INFO - __main__ - Step 43846: {'lr': 0.0004076941177971301, 'samples': 8418432, 'steps': 43845, 'loss/train': 1.6112278699874878} -11/07/2021 03:22:28 - INFO - __main__ - Step 43847: {'lr': 0.0004076899999159067, 'samples': 8418624, 'steps': 43846, 'loss/train': 1.155909538269043} -11/07/2021 03:22:28 - INFO - __main__ - Step 43848: {'lr': 0.0004076858819636307, 'samples': 8418816, 'steps': 43847, 'loss/train': 1.2335573434829712} -11/07/2021 03:22:29 - INFO - __main__ - Step 43849: {'lr': 0.0004076817639403038, 'samples': 8419008, 'steps': 43848, 'loss/train': 1.659220576286316} -11/07/2021 03:22:29 - INFO - __main__ - Step 43850: {'lr': 0.0004076776458459279, 'samples': 8419200, 'steps': 43849, 'loss/train': 1.4065468311309814} -11/07/2021 03:22:30 - INFO - __main__ - Step 43851: {'lr': 0.00040767352768050503, 'samples': 8419392, 'steps': 43850, 'loss/train': 1.8235328197479248} -11/07/2021 03:22:30 - INFO - __main__ - Step 43852: {'lr': 0.0004076694094440368, 'samples': 8419584, 'steps': 43851, 'loss/train': 1.302893042564392} -11/07/2021 03:22:30 - INFO - __main__ - Step 43853: {'lr': 0.0004076652911365252, 'samples': 8419776, 'steps': 43852, 'loss/train': 1.7538639307022095} -11/07/2021 03:22:32 - INFO - __main__ - Step 43854: {'lr': 0.00040766117275797196, 'samples': 8419968, 'steps': 43853, 'loss/train': 2.043196201324463} -11/07/2021 03:22:32 - INFO - __main__ - Step 43855: {'lr': 0.0004076570543083792, 'samples': 8420160, 'steps': 43854, 'loss/train': 1.650506615638733} -11/07/2021 03:22:32 - INFO - __main__ - Step 43856: {'lr': 0.0004076529357877485, 'samples': 8420352, 'steps': 43855, 'loss/train': 1.1953593492507935} -11/07/2021 03:22:33 - INFO - __main__ - Step 43857: {'lr': 0.00040764881719608184, 'samples': 8420544, 'steps': 43856, 'loss/train': 1.5082013607025146} -11/07/2021 03:22:33 - INFO - __main__ - Step 43858: {'lr': 0.000407644698533381, 'samples': 8420736, 'steps': 43857, 'loss/train': 1.5169827938079834} -11/07/2021 03:22:34 - INFO - __main__ - Step 43859: {'lr': 0.00040764057979964793, 'samples': 8420928, 'steps': 43858, 'loss/train': 1.1407544612884521} -11/07/2021 03:22:34 - INFO - __main__ - Step 43860: {'lr': 0.0004076364609948844, 'samples': 8421120, 'steps': 43859, 'loss/train': 1.04957115650177} -11/07/2021 03:22:35 - INFO - __main__ - Step 43861: {'lr': 0.0004076323421190924, 'samples': 8421312, 'steps': 43860, 'loss/train': 1.3893458843231201} -11/07/2021 03:22:35 - INFO - __main__ - Step 43862: {'lr': 0.0004076282231722737, 'samples': 8421504, 'steps': 43861, 'loss/train': 1.1427700519561768} -11/07/2021 03:22:35 - INFO - __main__ - Step 43863: {'lr': 0.0004076241041544301, 'samples': 8421696, 'steps': 43862, 'loss/train': 1.4993537664413452} -11/07/2021 03:22:36 - INFO - __main__ - Step 43864: {'lr': 0.00040761998506556353, 'samples': 8421888, 'steps': 43863, 'loss/train': 1.5167622566223145} -11/07/2021 03:22:37 - INFO - __main__ - Step 43865: {'lr': 0.0004076158659056758, 'samples': 8422080, 'steps': 43864, 'loss/train': 1.1694954633712769} -11/07/2021 03:22:37 - INFO - __main__ - Step 43866: {'lr': 0.00040761174667476883, 'samples': 8422272, 'steps': 43865, 'loss/train': 1.4639588594436646} -11/07/2021 03:22:37 - INFO - __main__ - Step 43867: {'lr': 0.0004076076273728444, 'samples': 8422464, 'steps': 43866, 'loss/train': 1.7881133556365967} -11/07/2021 03:22:38 - INFO - __main__ - Step 43868: {'lr': 0.0004076035079999045, 'samples': 8422656, 'steps': 43867, 'loss/train': 1.3311805725097656} -11/07/2021 03:22:39 - INFO - __main__ - Step 43869: {'lr': 0.0004075993885559508, 'samples': 8422848, 'steps': 43868, 'loss/train': 1.6587876081466675} -11/07/2021 03:22:39 - INFO - __main__ - Step 43870: {'lr': 0.0004075952690409852, 'samples': 8423040, 'steps': 43869, 'loss/train': 1.6615227460861206} -11/07/2021 03:22:39 - INFO - __main__ - Step 43871: {'lr': 0.00040759114945500974, 'samples': 8423232, 'steps': 43870, 'loss/train': 1.629590392112732} -11/07/2021 03:22:40 - INFO - __main__ - Step 43872: {'lr': 0.0004075870297980261, 'samples': 8423424, 'steps': 43871, 'loss/train': 1.5323020219802856} -11/07/2021 03:22:40 - INFO - __main__ - Step 43873: {'lr': 0.0004075829100700361, 'samples': 8423616, 'steps': 43872, 'loss/train': 1.6959728002548218} -11/07/2021 03:22:41 - INFO - __main__ - Step 43874: {'lr': 0.0004075787902710417, 'samples': 8423808, 'steps': 43873, 'loss/train': 1.9394711256027222} -11/07/2021 03:22:42 - INFO - __main__ - Step 43875: {'lr': 0.0004075746704010448, 'samples': 8424000, 'steps': 43874, 'loss/train': 1.5391508340835571} -11/07/2021 03:22:42 - INFO - __main__ - Step 43876: {'lr': 0.0004075705504600471, 'samples': 8424192, 'steps': 43875, 'loss/train': 1.6477059125900269} -11/07/2021 03:22:42 - INFO - __main__ - Step 43877: {'lr': 0.00040756643044805057, 'samples': 8424384, 'steps': 43876, 'loss/train': 2.9302780628204346} -11/07/2021 03:22:43 - INFO - __main__ - Step 43878: {'lr': 0.0004075623103650571, 'samples': 8424576, 'steps': 43877, 'loss/train': 1.6522893905639648} -11/07/2021 03:22:44 - INFO - __main__ - Step 43879: {'lr': 0.00040755819021106844, 'samples': 8424768, 'steps': 43878, 'loss/train': 1.4377820491790771} -11/07/2021 03:22:44 - INFO - __main__ - Step 43880: {'lr': 0.00040755406998608645, 'samples': 8424960, 'steps': 43879, 'loss/train': 1.9909913539886475} -11/07/2021 03:22:44 - INFO - __main__ - Step 43881: {'lr': 0.00040754994969011306, 'samples': 8425152, 'steps': 43880, 'loss/train': 0.9266546964645386} -11/07/2021 03:22:45 - INFO - __main__ - Step 43882: {'lr': 0.00040754582932315007, 'samples': 8425344, 'steps': 43881, 'loss/train': 2.1872682571411133} -11/07/2021 03:22:45 - INFO - __main__ - Step 43883: {'lr': 0.0004075417088851994, 'samples': 8425536, 'steps': 43882, 'loss/train': 1.6716867685317993} -11/07/2021 03:22:46 - INFO - __main__ - Step 43884: {'lr': 0.0004075375883762629, 'samples': 8425728, 'steps': 43883, 'loss/train': 1.638662338256836} -11/07/2021 03:22:47 - INFO - __main__ - Step 43885: {'lr': 0.0004075334677963423, 'samples': 8425920, 'steps': 43884, 'loss/train': 1.7723662853240967} -11/07/2021 03:22:47 - INFO - __main__ - Step 43886: {'lr': 0.0004075293471454396, 'samples': 8426112, 'steps': 43885, 'loss/train': 1.765032172203064} -11/07/2021 03:22:47 - INFO - __main__ - Step 43887: {'lr': 0.0004075252264235566, 'samples': 8426304, 'steps': 43886, 'loss/train': 1.8197784423828125} -11/07/2021 03:22:48 - INFO - __main__ - Step 43888: {'lr': 0.0004075211056306951, 'samples': 8426496, 'steps': 43887, 'loss/train': 1.9503345489501953} -11/07/2021 03:22:48 - INFO - __main__ - Step 43889: {'lr': 0.00040751698476685716, 'samples': 8426688, 'steps': 43888, 'loss/train': 1.4646555185317993} -11/07/2021 03:22:49 - INFO - __main__ - Step 43890: {'lr': 0.00040751286383204437, 'samples': 8426880, 'steps': 43889, 'loss/train': 1.5433449745178223} -11/07/2021 03:22:49 - INFO - __main__ - Step 43891: {'lr': 0.0004075087428262588, 'samples': 8427072, 'steps': 43890, 'loss/train': 1.3730559349060059} -11/07/2021 03:22:50 - INFO - __main__ - Step 43892: {'lr': 0.0004075046217495022, 'samples': 8427264, 'steps': 43891, 'loss/train': 0.6554791331291199} -11/07/2021 03:22:50 - INFO - __main__ - Step 43893: {'lr': 0.00040750050060177643, 'samples': 8427456, 'steps': 43892, 'loss/train': 1.933127760887146} -11/07/2021 03:22:50 - INFO - __main__ - Step 43894: {'lr': 0.00040749637938308336, 'samples': 8427648, 'steps': 43893, 'loss/train': 1.17872953414917} -11/07/2021 03:22:51 - INFO - __main__ - Step 43895: {'lr': 0.00040749225809342485, 'samples': 8427840, 'steps': 43894, 'loss/train': 1.7261704206466675} -11/07/2021 03:22:52 - INFO - __main__ - Step 43896: {'lr': 0.00040748813673280277, 'samples': 8428032, 'steps': 43895, 'loss/train': 1.2042407989501953} -11/07/2021 03:22:52 - INFO - __main__ - Step 43897: {'lr': 0.0004074840153012189, 'samples': 8428224, 'steps': 43896, 'loss/train': 1.368628978729248} -11/07/2021 03:22:52 - INFO - __main__ - Step 43898: {'lr': 0.0004074798937986753, 'samples': 8428416, 'steps': 43897, 'loss/train': 1.738026738166809} -11/07/2021 03:22:53 - INFO - __main__ - Step 43899: {'lr': 0.00040747577222517364, 'samples': 8428608, 'steps': 43898, 'loss/train': 1.714708685874939} -11/07/2021 03:22:54 - INFO - __main__ - Step 43900: {'lr': 0.0004074716505807158, 'samples': 8428800, 'steps': 43899, 'loss/train': 1.4866786003112793} -11/07/2021 03:22:55 - INFO - __main__ - Step 43901: {'lr': 0.0004074675288653037, 'samples': 8428992, 'steps': 43900, 'loss/train': 1.5645619630813599} -11/07/2021 03:22:55 - INFO - __main__ - Step 43902: {'lr': 0.0004074634070789391, 'samples': 8429184, 'steps': 43901, 'loss/train': 0.1000712662935257} -11/07/2021 03:22:55 - INFO - __main__ - Step 43903: {'lr': 0.0004074592852216239, 'samples': 8429376, 'steps': 43902, 'loss/train': 1.6530612707138062} -11/07/2021 03:22:56 - INFO - __main__ - Step 43904: {'lr': 0.0004074551632933601, 'samples': 8429568, 'steps': 43903, 'loss/train': 1.089402437210083} -11/07/2021 03:22:56 - INFO - __main__ - Step 43905: {'lr': 0.00040745104129414933, 'samples': 8429760, 'steps': 43904, 'loss/train': 0.9136307835578918} -11/07/2021 03:22:57 - INFO - __main__ - Step 43906: {'lr': 0.0004074469192239936, 'samples': 8429952, 'steps': 43905, 'loss/train': 1.4113155603408813} -11/07/2021 03:22:57 - INFO - __main__ - Step 43907: {'lr': 0.0004074427970828947, 'samples': 8430144, 'steps': 43906, 'loss/train': 1.4035757780075073} -11/07/2021 03:22:58 - INFO - __main__ - Step 43908: {'lr': 0.00040743867487085444, 'samples': 8430336, 'steps': 43907, 'loss/train': 1.4519786834716797} -11/07/2021 03:22:58 - INFO - __main__ - Step 43909: {'lr': 0.0004074345525878748, 'samples': 8430528, 'steps': 43908, 'loss/train': 1.6051146984100342} -11/07/2021 03:22:58 - INFO - __main__ - Step 43910: {'lr': 0.0004074304302339576, 'samples': 8430720, 'steps': 43909, 'loss/train': 1.672196388244629} -11/07/2021 03:22:59 - INFO - __main__ - Step 43911: {'lr': 0.0004074263078091046, 'samples': 8430912, 'steps': 43910, 'loss/train': 1.1506792306900024} -11/07/2021 03:23:00 - INFO - __main__ - Step 43912: {'lr': 0.00040742218531331786, 'samples': 8431104, 'steps': 43911, 'loss/train': 2.5236992835998535} -11/07/2021 03:23:00 - INFO - __main__ - Step 43913: {'lr': 0.0004074180627465991, 'samples': 8431296, 'steps': 43912, 'loss/train': 1.912400245666504} -11/07/2021 03:23:00 - INFO - __main__ - Step 43914: {'lr': 0.00040741394010895013, 'samples': 8431488, 'steps': 43913, 'loss/train': 1.4635186195373535} -11/07/2021 03:23:01 - INFO - __main__ - Step 43915: {'lr': 0.0004074098174003729, 'samples': 8431680, 'steps': 43914, 'loss/train': 1.7027950286865234} -11/07/2021 03:23:02 - INFO - __main__ - Step 43916: {'lr': 0.0004074056946208692, 'samples': 8431872, 'steps': 43915, 'loss/train': 1.5679969787597656} -11/07/2021 03:23:02 - INFO - __main__ - Step 43917: {'lr': 0.0004074015717704409, 'samples': 8432064, 'steps': 43916, 'loss/train': 1.717900037765503} -11/07/2021 03:23:03 - INFO - __main__ - Step 43918: {'lr': 0.00040739744884908994, 'samples': 8432256, 'steps': 43917, 'loss/train': 1.867804765701294} -11/07/2021 03:23:03 - INFO - __main__ - Step 43919: {'lr': 0.00040739332585681807, 'samples': 8432448, 'steps': 43918, 'loss/train': 1.896952509880066} -11/07/2021 03:23:03 - INFO - __main__ - Step 43920: {'lr': 0.00040738920279362724, 'samples': 8432640, 'steps': 43919, 'loss/train': 1.7845344543457031} -11/07/2021 03:23:04 - INFO - __main__ - Step 43921: {'lr': 0.00040738507965951923, 'samples': 8432832, 'steps': 43920, 'loss/train': 1.416855812072754} -11/07/2021 03:23:05 - INFO - __main__ - Step 43922: {'lr': 0.0004073809564544959, 'samples': 8433024, 'steps': 43921, 'loss/train': 2.4920897483825684} -11/07/2021 03:23:05 - INFO - __main__ - Step 43923: {'lr': 0.0004073768331785592, 'samples': 8433216, 'steps': 43922, 'loss/train': 1.7586002349853516} -11/07/2021 03:23:05 - INFO - __main__ - Step 43924: {'lr': 0.0004073727098317109, 'samples': 8433408, 'steps': 43923, 'loss/train': 1.983863353729248} -11/07/2021 03:23:06 - INFO - __main__ - Step 43925: {'lr': 0.0004073685864139529, 'samples': 8433600, 'steps': 43924, 'loss/train': 1.6089143753051758} -11/07/2021 03:23:07 - INFO - __main__ - Step 43926: {'lr': 0.00040736446292528704, 'samples': 8433792, 'steps': 43925, 'loss/train': 2.148613214492798} -11/07/2021 03:23:07 - INFO - __main__ - Step 43927: {'lr': 0.0004073603393657152, 'samples': 8433984, 'steps': 43926, 'loss/train': 1.701894998550415} -11/07/2021 03:23:08 - INFO - __main__ - Step 43928: {'lr': 0.0004073562157352392, 'samples': 8434176, 'steps': 43927, 'loss/train': 1.439337968826294} -11/07/2021 03:23:08 - INFO - __main__ - Step 43929: {'lr': 0.00040735209203386093, 'samples': 8434368, 'steps': 43928, 'loss/train': 1.6041038036346436} -11/07/2021 03:23:08 - INFO - __main__ - Step 43930: {'lr': 0.00040734796826158226, 'samples': 8434560, 'steps': 43929, 'loss/train': 1.6103554964065552} -11/07/2021 03:23:09 - INFO - __main__ - Step 43931: {'lr': 0.000407343844418405, 'samples': 8434752, 'steps': 43930, 'loss/train': 1.2818981409072876} -11/07/2021 03:23:10 - INFO - __main__ - Step 43932: {'lr': 0.000407339720504331, 'samples': 8434944, 'steps': 43931, 'loss/train': 1.7273222208023071} -11/07/2021 03:23:10 - INFO - __main__ - Step 43933: {'lr': 0.00040733559651936216, 'samples': 8435136, 'steps': 43932, 'loss/train': 9.138843536376953} -11/07/2021 03:23:11 - INFO - __main__ - Step 43934: {'lr': 0.0004073314724635003, 'samples': 8435328, 'steps': 43933, 'loss/train': 0.8566093444824219} -11/07/2021 03:23:11 - INFO - __main__ - Step 43935: {'lr': 0.0004073273483367474, 'samples': 8435520, 'steps': 43934, 'loss/train': 0.11346945911645889} -11/07/2021 03:23:11 - INFO - __main__ - Step 43936: {'lr': 0.0004073232241391052, 'samples': 8435712, 'steps': 43935, 'loss/train': 1.9948738813400269} -11/07/2021 03:23:12 - INFO - __main__ - Step 43937: {'lr': 0.00040731909987057547, 'samples': 8435904, 'steps': 43936, 'loss/train': 1.584019660949707} -11/07/2021 03:23:13 - INFO - __main__ - Step 43938: {'lr': 0.0004073149755311603, 'samples': 8436096, 'steps': 43937, 'loss/train': 1.7624531984329224} -11/07/2021 03:23:13 - INFO - __main__ - Step 43939: {'lr': 0.0004073108511208614, 'samples': 8436288, 'steps': 43938, 'loss/train': 1.6295770406723022} -11/07/2021 03:23:13 - INFO - __main__ - Step 43940: {'lr': 0.0004073067266396807, 'samples': 8436480, 'steps': 43939, 'loss/train': 1.6054798364639282} -11/07/2021 03:23:14 - INFO - __main__ - Step 43941: {'lr': 0.00040730260208761995, 'samples': 8436672, 'steps': 43940, 'loss/train': 1.169405460357666} -11/07/2021 03:23:15 - INFO - __main__ - Step 43942: {'lr': 0.0004072984774646811, 'samples': 8436864, 'steps': 43941, 'loss/train': 1.4220243692398071} -11/07/2021 03:23:15 - INFO - __main__ - Step 43943: {'lr': 0.0004072943527708659, 'samples': 8437056, 'steps': 43942, 'loss/train': 1.10098397731781} -11/07/2021 03:23:15 - INFO - __main__ - Step 43944: {'lr': 0.00040729022800617637, 'samples': 8437248, 'steps': 43943, 'loss/train': 1.892876148223877} -11/07/2021 03:23:16 - INFO - __main__ - Step 43945: {'lr': 0.00040728610317061433, 'samples': 8437440, 'steps': 43944, 'loss/train': 1.7797027826309204} -11/07/2021 03:23:16 - INFO - __main__ - Step 43946: {'lr': 0.0004072819782641816, 'samples': 8437632, 'steps': 43945, 'loss/train': 2.0013530254364014} -11/07/2021 03:23:17 - INFO - __main__ - Step 43947: {'lr': 0.00040727785328687995, 'samples': 8437824, 'steps': 43946, 'loss/train': 1.4861782789230347} -11/07/2021 03:23:17 - INFO - __main__ - Step 43948: {'lr': 0.00040727372823871135, 'samples': 8438016, 'steps': 43947, 'loss/train': 1.3490138053894043} -11/07/2021 03:23:18 - INFO - __main__ - Step 43949: {'lr': 0.00040726960311967766, 'samples': 8438208, 'steps': 43948, 'loss/train': 1.4066849946975708} -11/07/2021 03:23:18 - INFO - __main__ - Step 43950: {'lr': 0.0004072654779297807, 'samples': 8438400, 'steps': 43949, 'loss/train': 1.1034836769104004} -11/07/2021 03:23:19 - INFO - __main__ - Step 43951: {'lr': 0.0004072613526690223, 'samples': 8438592, 'steps': 43950, 'loss/train': 1.2344754934310913} -11/07/2021 03:23:19 - INFO - __main__ - Step 43952: {'lr': 0.00040725722733740444, 'samples': 8438784, 'steps': 43951, 'loss/train': 1.6640533208847046} -11/07/2021 03:23:20 - INFO - __main__ - Step 43953: {'lr': 0.0004072531019349289, 'samples': 8438976, 'steps': 43952, 'loss/train': 0.542209267616272} -11/07/2021 03:23:21 - INFO - __main__ - Step 43954: {'lr': 0.00040724897646159753, 'samples': 8439168, 'steps': 43953, 'loss/train': 1.1740684509277344} -11/07/2021 03:23:21 - INFO - __main__ - Step 43955: {'lr': 0.0004072448509174121, 'samples': 8439360, 'steps': 43954, 'loss/train': 1.7182492017745972} -11/07/2021 03:23:21 - INFO - __main__ - Step 43956: {'lr': 0.00040724072530237465, 'samples': 8439552, 'steps': 43955, 'loss/train': 1.1453046798706055} -11/07/2021 03:23:22 - INFO - __main__ - Step 43957: {'lr': 0.00040723659961648694, 'samples': 8439744, 'steps': 43956, 'loss/train': 2.543769598007202} -11/07/2021 03:23:22 - INFO - __main__ - Step 43958: {'lr': 0.0004072324738597509, 'samples': 8439936, 'steps': 43957, 'loss/train': 0.9986402988433838} -11/07/2021 03:23:23 - INFO - __main__ - Step 43959: {'lr': 0.00040722834803216834, 'samples': 8440128, 'steps': 43958, 'loss/train': 1.1566802263259888} -11/07/2021 03:23:23 - INFO - __main__ - Step 43960: {'lr': 0.000407224222133741, 'samples': 8440320, 'steps': 43959, 'loss/train': 2.107487440109253} -11/07/2021 03:23:24 - INFO - __main__ - Step 43961: {'lr': 0.00040722009616447094, 'samples': 8440512, 'steps': 43960, 'loss/train': 1.6063014268875122} -11/07/2021 03:23:24 - INFO - __main__ - Step 43962: {'lr': 0.0004072159701243599, 'samples': 8440704, 'steps': 43961, 'loss/train': 1.5708634853363037} -11/07/2021 03:23:24 - INFO - __main__ - Step 43963: {'lr': 0.00040721184401340977, 'samples': 8440896, 'steps': 43962, 'loss/train': 1.6888006925582886} -11/07/2021 03:23:25 - INFO - __main__ - Step 43964: {'lr': 0.00040720771783162236, 'samples': 8441088, 'steps': 43963, 'loss/train': 1.2426689863204956} -11/07/2021 03:23:26 - INFO - __main__ - Step 43965: {'lr': 0.0004072035915789997, 'samples': 8441280, 'steps': 43964, 'loss/train': 1.6193268299102783} -11/07/2021 03:23:26 - INFO - __main__ - Step 43966: {'lr': 0.0004071994652555434, 'samples': 8441472, 'steps': 43965, 'loss/train': 1.2662886381149292} -11/07/2021 03:23:27 - INFO - __main__ - Step 43967: {'lr': 0.0004071953388612555, 'samples': 8441664, 'steps': 43966, 'loss/train': 1.4906792640686035} -11/07/2021 03:23:27 - INFO - __main__ - Step 43968: {'lr': 0.0004071912123961379, 'samples': 8441856, 'steps': 43967, 'loss/train': 1.512399435043335} -11/07/2021 03:23:28 - INFO - __main__ - Step 43969: {'lr': 0.00040718708586019226, 'samples': 8442048, 'steps': 43968, 'loss/train': 0.19833578169345856} -11/07/2021 03:23:28 - INFO - __main__ - Step 43970: {'lr': 0.00040718295925342053, 'samples': 8442240, 'steps': 43969, 'loss/train': 1.3765857219696045} -11/07/2021 03:23:29 - INFO - __main__ - Step 43971: {'lr': 0.0004071788325758246, 'samples': 8442432, 'steps': 43970, 'loss/train': 0.7994476556777954} -11/07/2021 03:23:29 - INFO - __main__ - Step 43972: {'lr': 0.00040717470582740634, 'samples': 8442624, 'steps': 43971, 'loss/train': 1.7003074884414673} -11/07/2021 03:23:29 - INFO - __main__ - Step 43973: {'lr': 0.0004071705790081676, 'samples': 8442816, 'steps': 43972, 'loss/train': 1.42214834690094} -11/07/2021 03:23:30 - INFO - __main__ - Step 43974: {'lr': 0.0004071664521181102, 'samples': 8443008, 'steps': 43973, 'loss/train': 1.4173136949539185} -11/07/2021 03:23:31 - INFO - __main__ - Step 43975: {'lr': 0.00040716232515723596, 'samples': 8443200, 'steps': 43974, 'loss/train': 1.5742828845977783} -11/07/2021 03:23:31 - INFO - __main__ - Step 43976: {'lr': 0.00040715819812554686, 'samples': 8443392, 'steps': 43975, 'loss/train': 1.956968069076538} -11/07/2021 03:23:31 - INFO - __main__ - Step 43977: {'lr': 0.0004071540710230447, 'samples': 8443584, 'steps': 43976, 'loss/train': 1.3919167518615723} -11/07/2021 03:23:32 - INFO - __main__ - Step 43978: {'lr': 0.0004071499438497314, 'samples': 8443776, 'steps': 43977, 'loss/train': 1.4417613744735718} -11/07/2021 03:23:32 - INFO - __main__ - Step 43979: {'lr': 0.0004071458166056087, 'samples': 8443968, 'steps': 43978, 'loss/train': 1.6836180686950684} -11/07/2021 03:23:34 - INFO - __main__ - Step 43980: {'lr': 0.00040714168929067854, 'samples': 8444160, 'steps': 43979, 'loss/train': 1.9319530725479126} -11/07/2021 03:23:34 - INFO - __main__ - Step 43981: {'lr': 0.0004071375619049427, 'samples': 8444352, 'steps': 43980, 'loss/train': 1.5899041891098022} -11/07/2021 03:23:34 - INFO - __main__ - Step 43982: {'lr': 0.0004071334344484031, 'samples': 8444544, 'steps': 43981, 'loss/train': 2.048292636871338} -11/07/2021 03:23:35 - INFO - __main__ - Step 43983: {'lr': 0.00040712930692106164, 'samples': 8444736, 'steps': 43982, 'loss/train': 1.5842952728271484} -11/07/2021 03:23:35 - INFO - __main__ - Step 43984: {'lr': 0.00040712517932292016, 'samples': 8444928, 'steps': 43983, 'loss/train': 1.2995017766952515} -11/07/2021 03:23:36 - INFO - __main__ - Step 43985: {'lr': 0.00040712105165398044, 'samples': 8445120, 'steps': 43984, 'loss/train': 0.8532267808914185} -11/07/2021 03:23:36 - INFO - __main__ - Step 43986: {'lr': 0.0004071169239142445, 'samples': 8445312, 'steps': 43985, 'loss/train': 1.5599069595336914} -11/07/2021 03:23:37 - INFO - __main__ - Step 43987: {'lr': 0.000407112796103714, 'samples': 8445504, 'steps': 43986, 'loss/train': 1.4275630712509155} -11/07/2021 03:23:37 - INFO - __main__ - Step 43988: {'lr': 0.0004071086682223909, 'samples': 8445696, 'steps': 43987, 'loss/train': 1.1857975721359253} -11/07/2021 03:23:37 - INFO - __main__ - Step 43989: {'lr': 0.0004071045402702771, 'samples': 8445888, 'steps': 43988, 'loss/train': 1.6939241886138916} -11/07/2021 03:23:38 - INFO - __main__ - Step 43990: {'lr': 0.0004071004122473744, 'samples': 8446080, 'steps': 43989, 'loss/train': 1.6355971097946167} -11/07/2021 03:23:39 - INFO - __main__ - Step 43991: {'lr': 0.0004070962841536847, 'samples': 8446272, 'steps': 43990, 'loss/train': 1.6357855796813965} -11/07/2021 03:23:39 - INFO - __main__ - Step 43992: {'lr': 0.0004070921559892098, 'samples': 8446464, 'steps': 43991, 'loss/train': 1.360775113105774} -11/07/2021 03:23:39 - INFO - __main__ - Step 43993: {'lr': 0.00040708802775395165, 'samples': 8446656, 'steps': 43992, 'loss/train': 1.4375793933868408} -11/07/2021 03:23:40 - INFO - __main__ - Step 43994: {'lr': 0.000407083899447912, 'samples': 8446848, 'steps': 43993, 'loss/train': 1.5229673385620117} -11/07/2021 03:23:41 - INFO - __main__ - Step 43995: {'lr': 0.00040707977107109285, 'samples': 8447040, 'steps': 43994, 'loss/train': 1.6514801979064941} -11/07/2021 03:23:41 - INFO - __main__ - Step 43996: {'lr': 0.00040707564262349594, 'samples': 8447232, 'steps': 43995, 'loss/train': 1.9328930377960205} -11/07/2021 03:23:42 - INFO - __main__ - Step 43997: {'lr': 0.0004070715141051231, 'samples': 8447424, 'steps': 43996, 'loss/train': 1.518604040145874} -11/07/2021 03:23:42 - INFO - __main__ - Step 43998: {'lr': 0.00040706738551597634, 'samples': 8447616, 'steps': 43997, 'loss/train': 1.8714951276779175} -11/07/2021 03:23:42 - INFO - __main__ - Step 43999: {'lr': 0.0004070632568560574, 'samples': 8447808, 'steps': 43998, 'loss/train': 1.267977237701416} -11/07/2021 03:23:43 - INFO - __main__ - Step 44000: {'lr': 0.0004070591281253682, 'samples': 8448000, 'steps': 43999, 'loss/train': 1.512953519821167} -11/07/2021 03:23:44 - INFO - __main__ - Step 44001: {'lr': 0.0004070549993239106, 'samples': 8448192, 'steps': 44000, 'loss/train': 0.831805408000946} -11/07/2021 03:23:44 - INFO - __main__ - Step 44002: {'lr': 0.0004070508704516864, 'samples': 8448384, 'steps': 44001, 'loss/train': 1.5522176027297974} -11/07/2021 03:23:44 - INFO - __main__ - Step 44003: {'lr': 0.00040704674150869753, 'samples': 8448576, 'steps': 44002, 'loss/train': 1.5985102653503418} -11/07/2021 03:23:45 - INFO - __main__ - Step 44004: {'lr': 0.0004070426124949458, 'samples': 8448768, 'steps': 44003, 'loss/train': 1.6318305730819702} -11/07/2021 03:23:45 - INFO - __main__ - Step 44005: {'lr': 0.00040703848341043313, 'samples': 8448960, 'steps': 44004, 'loss/train': 1.3904163837432861} -11/07/2021 03:23:46 - INFO - __main__ - Step 44006: {'lr': 0.00040703435425516136, 'samples': 8449152, 'steps': 44005, 'loss/train': 1.818678855895996} -11/07/2021 03:23:46 - INFO - __main__ - Step 44007: {'lr': 0.0004070302250291322, 'samples': 8449344, 'steps': 44006, 'loss/train': 1.2677369117736816} -11/07/2021 03:23:47 - INFO - __main__ - Step 44008: {'lr': 0.0004070260957323478, 'samples': 8449536, 'steps': 44007, 'loss/train': 1.5789427757263184} -11/07/2021 03:23:47 - INFO - __main__ - Step 44009: {'lr': 0.0004070219663648098, 'samples': 8449728, 'steps': 44008, 'loss/train': 1.146945595741272} -11/07/2021 03:23:47 - INFO - __main__ - Step 44010: {'lr': 0.0004070178369265201, 'samples': 8449920, 'steps': 44009, 'loss/train': 1.254859447479248} -11/07/2021 03:23:49 - INFO - __main__ - Step 44011: {'lr': 0.00040701370741748057, 'samples': 8450112, 'steps': 44010, 'loss/train': 1.4340729713439941} -11/07/2021 03:23:49 - INFO - __main__ - Step 44012: {'lr': 0.0004070095778376932, 'samples': 8450304, 'steps': 44011, 'loss/train': 1.708217978477478} -11/07/2021 03:23:49 - INFO - __main__ - Step 44013: {'lr': 0.0004070054481871597, 'samples': 8450496, 'steps': 44012, 'loss/train': 1.3653974533081055} -11/07/2021 03:23:50 - INFO - __main__ - Step 44014: {'lr': 0.00040700131846588185, 'samples': 8450688, 'steps': 44013, 'loss/train': 0.32702651619911194} -11/07/2021 03:23:50 - INFO - __main__ - Step 44015: {'lr': 0.0004069971886738617, 'samples': 8450880, 'steps': 44014, 'loss/train': 1.6158820390701294} -11/07/2021 03:23:51 - INFO - __main__ - Step 44016: {'lr': 0.00040699305881110103, 'samples': 8451072, 'steps': 44015, 'loss/train': 1.2307311296463013} -11/07/2021 03:23:52 - INFO - __main__ - Step 44017: {'lr': 0.00040698892887760174, 'samples': 8451264, 'steps': 44016, 'loss/train': 2.1337993144989014} -11/07/2021 03:23:52 - INFO - __main__ - Step 44018: {'lr': 0.00040698479887336567, 'samples': 8451456, 'steps': 44017, 'loss/train': 1.6925996541976929} -11/07/2021 03:23:52 - INFO - __main__ - Step 44019: {'lr': 0.00040698066879839463, 'samples': 8451648, 'steps': 44018, 'loss/train': 1.8600653409957886} -11/07/2021 03:23:53 - INFO - __main__ - Step 44020: {'lr': 0.00040697653865269057, 'samples': 8451840, 'steps': 44019, 'loss/train': 0.4142761826515198} -11/07/2021 03:23:54 - INFO - __main__ - Step 44021: {'lr': 0.00040697240843625527, 'samples': 8452032, 'steps': 44020, 'loss/train': 1.5758490562438965} -11/07/2021 03:23:54 - INFO - __main__ - Step 44022: {'lr': 0.00040696827814909063, 'samples': 8452224, 'steps': 44021, 'loss/train': 1.2229807376861572} -11/07/2021 03:23:54 - INFO - __main__ - Step 44023: {'lr': 0.0004069641477911985, 'samples': 8452416, 'steps': 44022, 'loss/train': 1.3245600461959839} -11/07/2021 03:23:55 - INFO - __main__ - Step 44024: {'lr': 0.00040696001736258077, 'samples': 8452608, 'steps': 44023, 'loss/train': 1.4945148229599} -11/07/2021 03:23:55 - INFO - __main__ - Step 44025: {'lr': 0.0004069558868632393, 'samples': 8452800, 'steps': 44024, 'loss/train': 1.1728746891021729} -11/07/2021 03:23:56 - INFO - __main__ - Step 44026: {'lr': 0.0004069517562931759, 'samples': 8452992, 'steps': 44025, 'loss/train': 1.3753551244735718} -11/07/2021 03:23:56 - INFO - __main__ - Step 44027: {'lr': 0.0004069476256523924, 'samples': 8453184, 'steps': 44026, 'loss/train': 1.3952306509017944} -11/07/2021 03:23:57 - INFO - __main__ - Step 44028: {'lr': 0.0004069434949408908, 'samples': 8453376, 'steps': 44027, 'loss/train': 1.2849841117858887} -11/07/2021 03:23:57 - INFO - __main__ - Step 44029: {'lr': 0.0004069393641586728, 'samples': 8453568, 'steps': 44028, 'loss/train': 1.9058088064193726} -11/07/2021 03:23:57 - INFO - __main__ - Step 44030: {'lr': 0.00040693523330574043, 'samples': 8453760, 'steps': 44029, 'loss/train': 1.7052431106567383} -11/07/2021 03:23:58 - INFO - __main__ - Step 44031: {'lr': 0.0004069311023820954, 'samples': 8453952, 'steps': 44030, 'loss/train': 0.7730574011802673} -11/07/2021 03:23:59 - INFO - __main__ - Step 44032: {'lr': 0.0004069269713877397, 'samples': 8454144, 'steps': 44031, 'loss/train': 1.3204773664474487} -11/07/2021 03:23:59 - INFO - __main__ - Step 44033: {'lr': 0.00040692284032267515, 'samples': 8454336, 'steps': 44032, 'loss/train': 1.355200171470642} -11/07/2021 03:24:00 - INFO - __main__ - Step 44034: {'lr': 0.0004069187091869035, 'samples': 8454528, 'steps': 44033, 'loss/train': 1.5818285942077637} -11/07/2021 03:24:00 - INFO - __main__ - Step 44035: {'lr': 0.00040691457798042673, 'samples': 8454720, 'steps': 44034, 'loss/train': 1.3490406274795532} -11/07/2021 03:24:01 - INFO - __main__ - Step 44036: {'lr': 0.00040691044670324673, 'samples': 8454912, 'steps': 44035, 'loss/train': 1.9681199789047241} -11/07/2021 03:24:01 - INFO - __main__ - Step 44037: {'lr': 0.00040690631535536526, 'samples': 8455104, 'steps': 44036, 'loss/train': 1.5073906183242798} -11/07/2021 03:24:02 - INFO - __main__ - Step 44038: {'lr': 0.00040690218393678426, 'samples': 8455296, 'steps': 44037, 'loss/train': 1.4101229906082153} -11/07/2021 03:24:02 - INFO - __main__ - Step 44039: {'lr': 0.0004068980524475054, 'samples': 8455488, 'steps': 44038, 'loss/train': 1.77540123462677} -11/07/2021 03:24:03 - INFO - __main__ - Step 44040: {'lr': 0.00040689392088753097, 'samples': 8455680, 'steps': 44039, 'loss/train': 5.637470245361328} -11/07/2021 03:24:03 - INFO - __main__ - Step 44041: {'lr': 0.00040688978925686235, 'samples': 8455872, 'steps': 44040, 'loss/train': 1.8101271390914917} -11/07/2021 03:24:04 - INFO - __main__ - Step 44042: {'lr': 0.00040688565755550164, 'samples': 8456064, 'steps': 44041, 'loss/train': 1.7539114952087402} -11/07/2021 03:24:04 - INFO - __main__ - Step 44043: {'lr': 0.00040688152578345074, 'samples': 8456256, 'steps': 44042, 'loss/train': 1.4729076623916626} -11/07/2021 03:24:05 - INFO - __main__ - Step 44044: {'lr': 0.0004068773939407114, 'samples': 8456448, 'steps': 44043, 'loss/train': 1.6007177829742432} -11/07/2021 03:24:05 - INFO - __main__ - Step 44045: {'lr': 0.0004068732620272856, 'samples': 8456640, 'steps': 44044, 'loss/train': 1.4922720193862915} -11/07/2021 03:24:05 - INFO - __main__ - Step 44046: {'lr': 0.000406869130043175, 'samples': 8456832, 'steps': 44045, 'loss/train': 1.3924622535705566} -11/07/2021 03:24:06 - INFO - __main__ - Step 44047: {'lr': 0.0004068649979883817, 'samples': 8457024, 'steps': 44046, 'loss/train': 1.539118766784668} -11/07/2021 03:24:07 - INFO - __main__ - Step 44048: {'lr': 0.0004068608658629074, 'samples': 8457216, 'steps': 44047, 'loss/train': 1.7003668546676636} -11/07/2021 03:24:07 - INFO - __main__ - Step 44049: {'lr': 0.000406856733666754, 'samples': 8457408, 'steps': 44048, 'loss/train': 1.2621194124221802} -11/07/2021 03:24:07 - INFO - __main__ - Step 44050: {'lr': 0.00040685260139992343, 'samples': 8457600, 'steps': 44049, 'loss/train': 1.989881157875061} -11/07/2021 03:24:08 - INFO - __main__ - Step 44051: {'lr': 0.00040684846906241745, 'samples': 8457792, 'steps': 44050, 'loss/train': 1.3429982662200928} -11/07/2021 03:24:09 - INFO - __main__ - Step 44052: {'lr': 0.000406844336654238, 'samples': 8457984, 'steps': 44051, 'loss/train': 1.6912051439285278} -11/07/2021 03:24:09 - INFO - __main__ - Step 44053: {'lr': 0.00040684020417538694, 'samples': 8458176, 'steps': 44052, 'loss/train': 1.2079888582229614} -11/07/2021 03:24:09 - INFO - __main__ - Step 44054: {'lr': 0.00040683607162586604, 'samples': 8458368, 'steps': 44053, 'loss/train': 1.5336663722991943} -11/07/2021 03:24:10 - INFO - __main__ - Step 44055: {'lr': 0.00040683193900567727, 'samples': 8458560, 'steps': 44054, 'loss/train': 1.1132365465164185} -11/07/2021 03:24:10 - INFO - __main__ - Step 44056: {'lr': 0.00040682780631482243, 'samples': 8458752, 'steps': 44055, 'loss/train': 1.7476736307144165} -11/07/2021 03:24:10 - INFO - __main__ - Step 44057: {'lr': 0.0004068236735533034, 'samples': 8458944, 'steps': 44056, 'loss/train': 1.392434000968933} -11/07/2021 03:24:11 - INFO - __main__ - Step 44058: {'lr': 0.00040681954072112206, 'samples': 8459136, 'steps': 44057, 'loss/train': 1.7331249713897705} -11/07/2021 03:24:12 - INFO - __main__ - Step 44059: {'lr': 0.0004068154078182802, 'samples': 8459328, 'steps': 44058, 'loss/train': 0.8346248269081116} -11/07/2021 03:24:12 - INFO - __main__ - Step 44060: {'lr': 0.00040681127484477983, 'samples': 8459520, 'steps': 44059, 'loss/train': 1.481729507446289} -11/07/2021 03:24:12 - INFO - __main__ - Step 44061: {'lr': 0.0004068071418006226, 'samples': 8459712, 'steps': 44060, 'loss/train': 1.9142131805419922} -11/07/2021 03:24:13 - INFO - __main__ - Step 44062: {'lr': 0.0004068030086858106, 'samples': 8459904, 'steps': 44061, 'loss/train': 1.3857892751693726} -11/07/2021 03:24:14 - INFO - __main__ - Step 44063: {'lr': 0.00040679887550034555, 'samples': 8460096, 'steps': 44062, 'loss/train': 1.4364193677902222} -11/07/2021 03:24:14 - INFO - __main__ - Step 44064: {'lr': 0.0004067947422442293, 'samples': 8460288, 'steps': 44063, 'loss/train': 1.6256428956985474} -11/07/2021 03:24:15 - INFO - __main__ - Step 44065: {'lr': 0.00040679060891746384, 'samples': 8460480, 'steps': 44064, 'loss/train': 1.7078979015350342} -11/07/2021 03:24:15 - INFO - __main__ - Step 44066: {'lr': 0.00040678647552005087, 'samples': 8460672, 'steps': 44065, 'loss/train': 1.907792329788208} -11/07/2021 03:24:15 - INFO - __main__ - Step 44067: {'lr': 0.00040678234205199237, 'samples': 8460864, 'steps': 44066, 'loss/train': 1.3730069398880005} -11/07/2021 03:24:16 - INFO - __main__ - Step 44068: {'lr': 0.0004067782085132902, 'samples': 8461056, 'steps': 44067, 'loss/train': 1.428218960762024} -11/07/2021 03:24:17 - INFO - __main__ - Step 44069: {'lr': 0.00040677407490394616, 'samples': 8461248, 'steps': 44068, 'loss/train': 1.4499595165252686} -11/07/2021 03:24:17 - INFO - __main__ - Step 44070: {'lr': 0.0004067699412239622, 'samples': 8461440, 'steps': 44069, 'loss/train': 1.5239028930664062} -11/07/2021 03:24:17 - INFO - __main__ - Step 44071: {'lr': 0.00040676580747334, 'samples': 8461632, 'steps': 44070, 'loss/train': 1.042952537536621} -11/07/2021 03:24:18 - INFO - __main__ - Step 44072: {'lr': 0.0004067616736520816, 'samples': 8461824, 'steps': 44071, 'loss/train': 1.2719451189041138} -11/07/2021 03:24:19 - INFO - __main__ - Step 44073: {'lr': 0.0004067575397601888, 'samples': 8462016, 'steps': 44072, 'loss/train': 1.175555944442749} -11/07/2021 03:24:19 - INFO - __main__ - Step 44074: {'lr': 0.0004067534057976635, 'samples': 8462208, 'steps': 44073, 'loss/train': 1.5510388612747192} -11/07/2021 03:24:19 - INFO - __main__ - Step 44075: {'lr': 0.0004067492717645075, 'samples': 8462400, 'steps': 44074, 'loss/train': 1.422773003578186} -11/07/2021 03:24:20 - INFO - __main__ - Step 44076: {'lr': 0.00040674513766072274, 'samples': 8462592, 'steps': 44075, 'loss/train': 0.9936408996582031} -11/07/2021 03:24:20 - INFO - __main__ - Step 44077: {'lr': 0.000406741003486311, 'samples': 8462784, 'steps': 44076, 'loss/train': 1.760259985923767} -11/07/2021 03:24:21 - INFO - __main__ - Step 44078: {'lr': 0.00040673686924127416, 'samples': 8462976, 'steps': 44077, 'loss/train': 1.571046233177185} -11/07/2021 03:24:22 - INFO - __main__ - Step 44079: {'lr': 0.0004067327349256142, 'samples': 8463168, 'steps': 44078, 'loss/train': 1.288905382156372} -11/07/2021 03:24:22 - INFO - __main__ - Step 44080: {'lr': 0.00040672860053933286, 'samples': 8463360, 'steps': 44079, 'loss/train': 1.5099854469299316} -11/07/2021 03:24:22 - INFO - __main__ - Step 44081: {'lr': 0.00040672446608243194, 'samples': 8463552, 'steps': 44080, 'loss/train': 1.4610154628753662} -11/07/2021 03:24:23 - INFO - __main__ - Step 44082: {'lr': 0.0004067203315549135, 'samples': 8463744, 'steps': 44081, 'loss/train': 1.413544774055481} -11/07/2021 03:24:24 - INFO - __main__ - Step 44083: {'lr': 0.00040671619695677923, 'samples': 8463936, 'steps': 44082, 'loss/train': 1.3504700660705566} -11/07/2021 03:24:24 - INFO - __main__ - Step 44084: {'lr': 0.00040671206228803117, 'samples': 8464128, 'steps': 44083, 'loss/train': 1.6227068901062012} -11/07/2021 03:24:24 - INFO - __main__ - Step 44085: {'lr': 0.0004067079275486709, 'samples': 8464320, 'steps': 44084, 'loss/train': 0.2816094756126404} -11/07/2021 03:24:25 - INFO - __main__ - Step 44086: {'lr': 0.00040670379273870054, 'samples': 8464512, 'steps': 44085, 'loss/train': 1.8726481199264526} -11/07/2021 03:24:25 - INFO - __main__ - Step 44087: {'lr': 0.00040669965785812193, 'samples': 8464704, 'steps': 44086, 'loss/train': 1.5070987939834595} -11/07/2021 03:24:25 - INFO - __main__ - Step 44088: {'lr': 0.00040669552290693677, 'samples': 8464896, 'steps': 44087, 'loss/train': 1.7143826484680176} -11/07/2021 03:24:27 - INFO - __main__ - Step 44089: {'lr': 0.0004066913878851471, 'samples': 8465088, 'steps': 44088, 'loss/train': 1.077122688293457} -11/07/2021 03:24:27 - INFO - __main__ - Step 44090: {'lr': 0.00040668725279275464, 'samples': 8465280, 'steps': 44089, 'loss/train': 1.257422685623169} -11/07/2021 03:24:27 - INFO - __main__ - Step 44091: {'lr': 0.0004066831176297614, 'samples': 8465472, 'steps': 44090, 'loss/train': 1.3948299884796143} -11/07/2021 03:24:28 - INFO - __main__ - Step 44092: {'lr': 0.0004066789823961691, 'samples': 8465664, 'steps': 44091, 'loss/train': 1.5024408102035522} -11/07/2021 03:24:28 - INFO - __main__ - Step 44093: {'lr': 0.00040667484709197967, 'samples': 8465856, 'steps': 44092, 'loss/train': 0.9710264205932617} -11/07/2021 03:24:29 - INFO - __main__ - Step 44094: {'lr': 0.00040667071171719503, 'samples': 8466048, 'steps': 44093, 'loss/train': 1.559989094734192} -11/07/2021 03:24:29 - INFO - __main__ - Step 44095: {'lr': 0.00040666657627181697, 'samples': 8466240, 'steps': 44094, 'loss/train': 1.1567920446395874} -11/07/2021 03:24:30 - INFO - __main__ - Step 44096: {'lr': 0.00040666244075584736, 'samples': 8466432, 'steps': 44095, 'loss/train': 1.9180774688720703} -11/07/2021 03:24:30 - INFO - __main__ - Step 44097: {'lr': 0.000406658305169288, 'samples': 8466624, 'steps': 44096, 'loss/train': 1.5806243419647217} -11/07/2021 03:24:30 - INFO - __main__ - Step 44098: {'lr': 0.000406654169512141, 'samples': 8466816, 'steps': 44097, 'loss/train': 1.4634579420089722} -11/07/2021 03:24:32 - INFO - __main__ - Step 44099: {'lr': 0.0004066500337844078, 'samples': 8467008, 'steps': 44098, 'loss/train': 1.3353631496429443} -11/07/2021 03:24:32 - INFO - __main__ - Step 44100: {'lr': 0.0004066458979860907, 'samples': 8467200, 'steps': 44099, 'loss/train': 1.8623902797698975} -11/07/2021 03:24:33 - INFO - __main__ - Step 44101: {'lr': 0.00040664176211719136, 'samples': 8467392, 'steps': 44100, 'loss/train': 1.426758885383606} -11/07/2021 03:24:33 - INFO - __main__ - Step 44102: {'lr': 0.00040663762617771163, 'samples': 8467584, 'steps': 44101, 'loss/train': 1.5183041095733643} -11/07/2021 03:24:33 - INFO - __main__ - Step 44103: {'lr': 0.00040663349016765337, 'samples': 8467776, 'steps': 44102, 'loss/train': 1.2168281078338623} -11/07/2021 03:24:34 - INFO - __main__ - Step 44104: {'lr': 0.00040662935408701853, 'samples': 8467968, 'steps': 44103, 'loss/train': 1.5888041257858276} -11/07/2021 03:24:35 - INFO - __main__ - Step 44105: {'lr': 0.00040662521793580886, 'samples': 8468160, 'steps': 44104, 'loss/train': 0.3741858899593353} -11/07/2021 03:24:35 - INFO - __main__ - Step 44106: {'lr': 0.0004066210817140263, 'samples': 8468352, 'steps': 44105, 'loss/train': 1.7300732135772705} -11/07/2021 03:24:35 - INFO - __main__ - Step 44107: {'lr': 0.0004066169454216727, 'samples': 8468544, 'steps': 44106, 'loss/train': 2.1087207794189453} -11/07/2021 03:24:36 - INFO - __main__ - Step 44108: {'lr': 0.00040661280905875, 'samples': 8468736, 'steps': 44107, 'loss/train': 1.2548373937606812} -11/07/2021 03:24:36 - INFO - __main__ - Step 44109: {'lr': 0.0004066086726252599, 'samples': 8468928, 'steps': 44108, 'loss/train': 1.4089781045913696} -11/07/2021 03:24:37 - INFO - __main__ - Step 44110: {'lr': 0.0004066045361212043, 'samples': 8469120, 'steps': 44109, 'loss/train': 0.9372249245643616} -11/07/2021 03:24:37 - INFO - __main__ - Step 44111: {'lr': 0.00040660039954658523, 'samples': 8469312, 'steps': 44110, 'loss/train': 1.983938455581665} -11/07/2021 03:24:38 - INFO - __main__ - Step 44112: {'lr': 0.0004065962629014044, 'samples': 8469504, 'steps': 44111, 'loss/train': 1.4359891414642334} -11/07/2021 03:24:38 - INFO - __main__ - Step 44113: {'lr': 0.00040659212618566364, 'samples': 8469696, 'steps': 44112, 'loss/train': 1.4150471687316895} -11/07/2021 03:24:39 - INFO - __main__ - Step 44114: {'lr': 0.000406587989399365, 'samples': 8469888, 'steps': 44113, 'loss/train': 1.5617057085037231} -11/07/2021 03:24:40 - INFO - __main__ - Step 44115: {'lr': 0.0004065838525425102, 'samples': 8470080, 'steps': 44114, 'loss/train': 0.9213770031929016} -11/07/2021 03:24:40 - INFO - __main__ - Step 44116: {'lr': 0.00040657971561510104, 'samples': 8470272, 'steps': 44115, 'loss/train': 1.8451734781265259} -11/07/2021 03:24:40 - INFO - __main__ - Step 44117: {'lr': 0.00040657557861713956, 'samples': 8470464, 'steps': 44116, 'loss/train': 1.2429790496826172} -11/07/2021 03:24:41 - INFO - __main__ - Step 44118: {'lr': 0.00040657144154862746, 'samples': 8470656, 'steps': 44117, 'loss/train': 1.3513708114624023} -11/07/2021 03:24:41 - INFO - __main__ - Step 44119: {'lr': 0.00040656730440956677, 'samples': 8470848, 'steps': 44118, 'loss/train': 1.3201446533203125} -11/07/2021 03:24:42 - INFO - __main__ - Step 44120: {'lr': 0.0004065631671999592, 'samples': 8471040, 'steps': 44119, 'loss/train': 1.51387357711792} -11/07/2021 03:24:43 - INFO - __main__ - Step 44121: {'lr': 0.0004065590299198068, 'samples': 8471232, 'steps': 44120, 'loss/train': 1.7190121412277222} -11/07/2021 03:24:43 - INFO - __main__ - Step 44122: {'lr': 0.00040655489256911123, 'samples': 8471424, 'steps': 44121, 'loss/train': 1.5446957349777222} -11/07/2021 03:24:43 - INFO - __main__ - Step 44123: {'lr': 0.00040655075514787445, 'samples': 8471616, 'steps': 44122, 'loss/train': 1.3534348011016846} -11/07/2021 03:24:44 - INFO - __main__ - Step 44124: {'lr': 0.0004065466176560983, 'samples': 8471808, 'steps': 44123, 'loss/train': 1.3408905267715454} -11/07/2021 03:24:45 - INFO - __main__ - Step 44125: {'lr': 0.0004065424800937847, 'samples': 8472000, 'steps': 44124, 'loss/train': 1.0104137659072876} -11/07/2021 03:24:45 - INFO - __main__ - Step 44126: {'lr': 0.0004065383424609354, 'samples': 8472192, 'steps': 44125, 'loss/train': 1.5084606409072876} -11/07/2021 03:24:45 - INFO - __main__ - Step 44127: {'lr': 0.00040653420475755245, 'samples': 8472384, 'steps': 44126, 'loss/train': 1.3555549383163452} -11/07/2021 03:24:46 - INFO - __main__ - Step 44128: {'lr': 0.0004065300669836375, 'samples': 8472576, 'steps': 44127, 'loss/train': 1.8347290754318237} -11/07/2021 03:24:46 - INFO - __main__ - Step 44129: {'lr': 0.0004065259291391926, 'samples': 8472768, 'steps': 44128, 'loss/train': 1.2331953048706055} -11/07/2021 03:24:47 - INFO - __main__ - Step 44130: {'lr': 0.0004065217912242195, 'samples': 8472960, 'steps': 44129, 'loss/train': 1.6485356092453003} -11/07/2021 03:24:47 - INFO - __main__ - Step 44131: {'lr': 0.00040651765323872, 'samples': 8473152, 'steps': 44130, 'loss/train': 1.753224492073059} -11/07/2021 03:24:48 - INFO - __main__ - Step 44132: {'lr': 0.0004065135151826962, 'samples': 8473344, 'steps': 44131, 'loss/train': 1.2589049339294434} -11/07/2021 03:24:48 - INFO - __main__ - Step 44133: {'lr': 0.00040650937705614975, 'samples': 8473536, 'steps': 44132, 'loss/train': 1.6444562673568726} -11/07/2021 03:24:48 - INFO - __main__ - Step 44134: {'lr': 0.0004065052388590826, 'samples': 8473728, 'steps': 44133, 'loss/train': 1.6255830526351929} -11/07/2021 03:24:50 - INFO - __main__ - Step 44135: {'lr': 0.00040650110059149664, 'samples': 8473920, 'steps': 44134, 'loss/train': 1.9925587177276611} -11/07/2021 03:24:50 - INFO - __main__ - Step 44136: {'lr': 0.0004064969622533937, 'samples': 8474112, 'steps': 44135, 'loss/train': 1.1963980197906494} -11/07/2021 03:24:50 - INFO - __main__ - Step 44137: {'lr': 0.0004064928238447756, 'samples': 8474304, 'steps': 44136, 'loss/train': 1.5025725364685059} -11/07/2021 03:24:51 - INFO - __main__ - Step 44138: {'lr': 0.00040648868536564427, 'samples': 8474496, 'steps': 44137, 'loss/train': 1.430065631866455} -11/07/2021 03:24:51 - INFO - __main__ - Step 44139: {'lr': 0.00040648454681600153, 'samples': 8474688, 'steps': 44138, 'loss/train': 1.4614596366882324} -11/07/2021 03:24:51 - INFO - __main__ - Step 44140: {'lr': 0.0004064804081958493, 'samples': 8474880, 'steps': 44139, 'loss/train': 1.4588491916656494} -11/07/2021 03:24:52 - INFO - __main__ - Step 44141: {'lr': 0.00040647626950518945, 'samples': 8475072, 'steps': 44140, 'loss/train': 1.6638232469558716} -11/07/2021 03:24:53 - INFO - __main__ - Step 44142: {'lr': 0.00040647213074402374, 'samples': 8475264, 'steps': 44141, 'loss/train': 1.2178179025650024} -11/07/2021 03:24:53 - INFO - __main__ - Step 44143: {'lr': 0.0004064679919123541, 'samples': 8475456, 'steps': 44142, 'loss/train': 1.2608200311660767} -11/07/2021 03:24:53 - INFO - __main__ - Step 44144: {'lr': 0.00040646385301018243, 'samples': 8475648, 'steps': 44143, 'loss/train': 1.7908116579055786} -11/07/2021 03:24:54 - INFO - __main__ - Step 44145: {'lr': 0.0004064597140375105, 'samples': 8475840, 'steps': 44144, 'loss/train': 0.6181836128234863} -11/07/2021 03:24:55 - INFO - __main__ - Step 44146: {'lr': 0.00040645557499434035, 'samples': 8476032, 'steps': 44145, 'loss/train': 1.198376178741455} -11/07/2021 03:24:55 - INFO - __main__ - Step 44147: {'lr': 0.0004064514358806737, 'samples': 8476224, 'steps': 44146, 'loss/train': 1.6143416166305542} -11/07/2021 03:24:55 - INFO - __main__ - Step 44148: {'lr': 0.00040644729669651235, 'samples': 8476416, 'steps': 44147, 'loss/train': 1.154239535331726} -11/07/2021 03:24:56 - INFO - __main__ - Step 44149: {'lr': 0.0004064431574418583, 'samples': 8476608, 'steps': 44148, 'loss/train': 1.6307626962661743} -11/07/2021 03:24:56 - INFO - __main__ - Step 44150: {'lr': 0.00040643901811671345, 'samples': 8476800, 'steps': 44149, 'loss/train': 1.8045600652694702} -11/07/2021 03:24:57 - INFO - __main__ - Step 44151: {'lr': 0.0004064348787210795, 'samples': 8476992, 'steps': 44150, 'loss/train': 0.6478796005249023} -11/07/2021 03:24:58 - INFO - __main__ - Step 44152: {'lr': 0.0004064307392549585, 'samples': 8477184, 'steps': 44151, 'loss/train': 1.6127792596817017} -11/07/2021 03:24:58 - INFO - __main__ - Step 44153: {'lr': 0.00040642659971835217, 'samples': 8477376, 'steps': 44152, 'loss/train': 1.827341079711914} -11/07/2021 03:24:58 - INFO - __main__ - Step 44154: {'lr': 0.0004064224601112625, 'samples': 8477568, 'steps': 44153, 'loss/train': 1.2901002168655396} -11/07/2021 03:24:59 - INFO - __main__ - Step 44155: {'lr': 0.0004064183204336912, 'samples': 8477760, 'steps': 44154, 'loss/train': 2.1328094005584717} -11/07/2021 03:25:00 - INFO - __main__ - Step 44156: {'lr': 0.00040641418068564024, 'samples': 8477952, 'steps': 44155, 'loss/train': 1.2231348752975464} -11/07/2021 03:25:00 - INFO - __main__ - Step 44157: {'lr': 0.0004064100408671114, 'samples': 8478144, 'steps': 44156, 'loss/train': 1.8266414403915405} -11/07/2021 03:25:00 - INFO - __main__ - Step 44158: {'lr': 0.0004064059009781067, 'samples': 8478336, 'steps': 44157, 'loss/train': 1.670493245124817} -11/07/2021 03:25:01 - INFO - __main__ - Step 44159: {'lr': 0.0004064017610186279, 'samples': 8478528, 'steps': 44158, 'loss/train': 1.9124197959899902} -11/07/2021 03:25:01 - INFO - __main__ - Step 44160: {'lr': 0.00040639762098867684, 'samples': 8478720, 'steps': 44159, 'loss/train': 1.1427425146102905} -11/07/2021 03:25:02 - INFO - __main__ - Step 44161: {'lr': 0.0004063934808882555, 'samples': 8478912, 'steps': 44160, 'loss/train': 1.389540433883667} -11/07/2021 03:25:02 - INFO - __main__ - Step 44162: {'lr': 0.0004063893407173656, 'samples': 8479104, 'steps': 44161, 'loss/train': 1.037030577659607} -11/07/2021 03:25:03 - INFO - __main__ - Step 44163: {'lr': 0.00040638520047600916, 'samples': 8479296, 'steps': 44162, 'loss/train': 1.5312376022338867} -11/07/2021 03:25:03 - INFO - __main__ - Step 44164: {'lr': 0.00040638106016418785, 'samples': 8479488, 'steps': 44163, 'loss/train': 1.4833199977874756} -11/07/2021 03:25:03 - INFO - __main__ - Step 44165: {'lr': 0.0004063769197819037, 'samples': 8479680, 'steps': 44164, 'loss/train': 1.6046035289764404} -11/07/2021 03:25:05 - INFO - __main__ - Step 44166: {'lr': 0.0004063727793291585, 'samples': 8479872, 'steps': 44165, 'loss/train': 1.6139516830444336} -11/07/2021 03:25:05 - INFO - __main__ - Step 44167: {'lr': 0.00040636863880595415, 'samples': 8480064, 'steps': 44166, 'loss/train': 1.361234426498413} -11/07/2021 03:25:05 - INFO - __main__ - Step 44168: {'lr': 0.0004063644982122926, 'samples': 8480256, 'steps': 44167, 'loss/train': 1.920316457748413} -11/07/2021 03:25:06 - INFO - __main__ - Step 44169: {'lr': 0.00040636035754817545, 'samples': 8480448, 'steps': 44168, 'loss/train': 1.5258365869522095} -11/07/2021 03:25:06 - INFO - __main__ - Step 44170: {'lr': 0.00040635621681360485, 'samples': 8480640, 'steps': 44169, 'loss/train': 1.5655819177627563} -11/07/2021 03:25:06 - INFO - __main__ - Step 44171: {'lr': 0.00040635207600858247, 'samples': 8480832, 'steps': 44170, 'loss/train': 1.3133772611618042} -11/07/2021 03:25:07 - INFO - __main__ - Step 44172: {'lr': 0.00040634793513311037, 'samples': 8481024, 'steps': 44171, 'loss/train': 1.8161416053771973} -11/07/2021 03:25:08 - INFO - __main__ - Step 44173: {'lr': 0.0004063437941871903, 'samples': 8481216, 'steps': 44172, 'loss/train': 0.9237746000289917} -11/07/2021 03:25:08 - INFO - __main__ - Step 44174: {'lr': 0.000406339653170824, 'samples': 8481408, 'steps': 44173, 'loss/train': 1.6315330266952515} -11/07/2021 03:25:08 - INFO - __main__ - Step 44175: {'lr': 0.00040633551208401356, 'samples': 8481600, 'steps': 44174, 'loss/train': 1.2439640760421753} -11/07/2021 03:25:09 - INFO - __main__ - Step 44176: {'lr': 0.0004063313709267607, 'samples': 8481792, 'steps': 44175, 'loss/train': 1.1543171405792236} -11/07/2021 03:25:10 - INFO - __main__ - Step 44177: {'lr': 0.0004063272296990674, 'samples': 8481984, 'steps': 44176, 'loss/train': 1.2038911581039429} -11/07/2021 03:25:10 - INFO - __main__ - Step 44178: {'lr': 0.00040632308840093533, 'samples': 8482176, 'steps': 44177, 'loss/train': 1.9420859813690186} -11/07/2021 03:25:10 - INFO - __main__ - Step 44179: {'lr': 0.0004063189470323666, 'samples': 8482368, 'steps': 44178, 'loss/train': 1.3965636491775513} -11/07/2021 03:25:11 - INFO - __main__ - Step 44180: {'lr': 0.000406314805593363, 'samples': 8482560, 'steps': 44179, 'loss/train': 1.4306188821792603} -11/07/2021 03:25:11 - INFO - __main__ - Step 44181: {'lr': 0.00040631066408392636, 'samples': 8482752, 'steps': 44180, 'loss/train': 0.47852659225463867} -11/07/2021 03:25:12 - INFO - __main__ - Step 44182: {'lr': 0.0004063065225040584, 'samples': 8482944, 'steps': 44181, 'loss/train': 1.3241499662399292} -11/07/2021 03:25:12 - INFO - __main__ - Step 44183: {'lr': 0.0004063023808537613, 'samples': 8483136, 'steps': 44182, 'loss/train': 1.2116507291793823} -11/07/2021 03:25:13 - INFO - __main__ - Step 44184: {'lr': 0.00040629823913303665, 'samples': 8483328, 'steps': 44183, 'loss/train': 0.8394481539726257} -11/07/2021 03:25:13 - INFO - __main__ - Step 44185: {'lr': 0.0004062940973418865, 'samples': 8483520, 'steps': 44184, 'loss/train': 1.467079758644104} -11/07/2021 03:25:14 - INFO - __main__ - Step 44186: {'lr': 0.00040628995548031254, 'samples': 8483712, 'steps': 44185, 'loss/train': 1.486828327178955} -11/07/2021 03:25:15 - INFO - __main__ - Step 44187: {'lr': 0.00040628581354831687, 'samples': 8483904, 'steps': 44186, 'loss/train': 1.712790608406067} -11/07/2021 03:25:15 - INFO - __main__ - Step 44188: {'lr': 0.0004062816715459011, 'samples': 8484096, 'steps': 44187, 'loss/train': 1.5028607845306396} -11/07/2021 03:25:15 - INFO - __main__ - Step 44189: {'lr': 0.0004062775294730673, 'samples': 8484288, 'steps': 44188, 'loss/train': 1.4444500207901} -11/07/2021 03:25:16 - INFO - __main__ - Step 44190: {'lr': 0.0004062733873298172, 'samples': 8484480, 'steps': 44189, 'loss/train': 1.873066782951355} -11/07/2021 03:25:16 - INFO - __main__ - Step 44191: {'lr': 0.0004062692451161528, 'samples': 8484672, 'steps': 44190, 'loss/train': 1.6633840799331665} -11/07/2021 03:25:17 - INFO - __main__ - Step 44192: {'lr': 0.00040626510283207586, 'samples': 8484864, 'steps': 44191, 'loss/train': 1.141286015510559} -11/07/2021 03:25:18 - INFO - __main__ - Step 44193: {'lr': 0.00040626096047758823, 'samples': 8485056, 'steps': 44192, 'loss/train': 1.1355482339859009} -11/07/2021 03:25:18 - INFO - __main__ - Step 44194: {'lr': 0.0004062568180526919, 'samples': 8485248, 'steps': 44193, 'loss/train': 0.19759449362754822} -11/07/2021 03:25:18 - INFO - __main__ - Step 44195: {'lr': 0.0004062526755573886, 'samples': 8485440, 'steps': 44194, 'loss/train': 1.320232629776001} -11/07/2021 03:25:19 - INFO - __main__ - Step 44196: {'lr': 0.00040624853299168025, 'samples': 8485632, 'steps': 44195, 'loss/train': 1.5903716087341309} -11/07/2021 03:25:20 - INFO - __main__ - Step 44197: {'lr': 0.0004062443903555687, 'samples': 8485824, 'steps': 44196, 'loss/train': 1.3376597166061401} -11/07/2021 03:25:20 - INFO - __main__ - Step 44198: {'lr': 0.0004062402476490559, 'samples': 8486016, 'steps': 44197, 'loss/train': 1.3712801933288574} -11/07/2021 03:25:20 - INFO - __main__ - Step 44199: {'lr': 0.00040623610487214366, 'samples': 8486208, 'steps': 44198, 'loss/train': 1.0875322818756104} -11/07/2021 03:25:21 - INFO - __main__ - Step 44200: {'lr': 0.0004062319620248338, 'samples': 8486400, 'steps': 44199, 'loss/train': 1.6165579557418823} -11/07/2021 03:25:21 - INFO - __main__ - Step 44201: {'lr': 0.00040622781910712826, 'samples': 8486592, 'steps': 44200, 'loss/train': 1.1684272289276123} -11/07/2021 03:25:22 - INFO - __main__ - Step 44202: {'lr': 0.00040622367611902886, 'samples': 8486784, 'steps': 44201, 'loss/train': 1.704862117767334} -11/07/2021 03:25:23 - INFO - __main__ - Step 44203: {'lr': 0.0004062195330605375, 'samples': 8486976, 'steps': 44202, 'loss/train': 1.402276873588562} -11/07/2021 03:25:23 - INFO - __main__ - Step 44204: {'lr': 0.000406215389931656, 'samples': 8487168, 'steps': 44203, 'loss/train': 1.4944804906845093} -11/07/2021 03:25:23 - INFO - __main__ - Step 44205: {'lr': 0.0004062112467323863, 'samples': 8487360, 'steps': 44204, 'loss/train': 1.7162210941314697} -11/07/2021 03:25:24 - INFO - __main__ - Step 44206: {'lr': 0.00040620710346273015, 'samples': 8487552, 'steps': 44205, 'loss/train': 1.2356802225112915} -11/07/2021 03:25:24 - INFO - __main__ - Step 44207: {'lr': 0.00040620296012268956, 'samples': 8487744, 'steps': 44206, 'loss/train': 1.6394577026367188} -11/07/2021 03:25:25 - INFO - __main__ - Step 44208: {'lr': 0.0004061988167122663, 'samples': 8487936, 'steps': 44207, 'loss/train': 0.7263883352279663} -11/07/2021 03:25:25 - INFO - __main__ - Step 44209: {'lr': 0.00040619467323146224, 'samples': 8488128, 'steps': 44208, 'loss/train': 0.44673678278923035} -11/07/2021 03:25:26 - INFO - __main__ - Step 44210: {'lr': 0.0004061905296802793, 'samples': 8488320, 'steps': 44209, 'loss/train': 1.4260218143463135} -11/07/2021 03:25:26 - INFO - __main__ - Step 44211: {'lr': 0.00040618638605871934, 'samples': 8488512, 'steps': 44210, 'loss/train': 0.9377465844154358} -11/07/2021 03:25:27 - INFO - __main__ - Step 44212: {'lr': 0.00040618224236678413, 'samples': 8488704, 'steps': 44211, 'loss/train': 1.746358871459961} -11/07/2021 03:25:27 - INFO - __main__ - Step 44213: {'lr': 0.00040617809860447564, 'samples': 8488896, 'steps': 44212, 'loss/train': 0.8359420299530029} -11/07/2021 03:25:28 - INFO - __main__ - Step 44214: {'lr': 0.00040617395477179577, 'samples': 8489088, 'steps': 44213, 'loss/train': 1.3058966398239136} -11/07/2021 03:25:29 - INFO - __main__ - Step 44215: {'lr': 0.0004061698108687463, 'samples': 8489280, 'steps': 44214, 'loss/train': 1.6434102058410645} -11/07/2021 03:25:29 - INFO - __main__ - Step 44216: {'lr': 0.00040616566689532905, 'samples': 8489472, 'steps': 44215, 'loss/train': 1.4960986375808716} -11/07/2021 03:25:29 - INFO - __main__ - Step 44217: {'lr': 0.00040616152285154607, 'samples': 8489664, 'steps': 44216, 'loss/train': 1.7768678665161133} -11/07/2021 03:25:30 - INFO - __main__ - Step 44218: {'lr': 0.000406157378737399, 'samples': 8489856, 'steps': 44217, 'loss/train': 1.7725777626037598} -11/07/2021 03:25:30 - INFO - __main__ - Step 44219: {'lr': 0.0004061532345528899, 'samples': 8490048, 'steps': 44218, 'loss/train': 1.3695653676986694} -11/07/2021 03:25:31 - INFO - __main__ - Step 44220: {'lr': 0.00040614909029802054, 'samples': 8490240, 'steps': 44219, 'loss/train': 1.4920202493667603} -11/07/2021 03:25:32 - INFO - __main__ - Step 44221: {'lr': 0.0004061449459727928, 'samples': 8490432, 'steps': 44220, 'loss/train': 1.9846137762069702} -11/07/2021 03:25:32 - INFO - __main__ - Step 44222: {'lr': 0.0004061408015772086, 'samples': 8490624, 'steps': 44221, 'loss/train': 1.5419899225234985} -11/07/2021 03:25:32 - INFO - __main__ - Step 44223: {'lr': 0.0004061366571112698, 'samples': 8490816, 'steps': 44222, 'loss/train': 1.380388617515564} -11/07/2021 03:25:33 - INFO - __main__ - Step 44224: {'lr': 0.0004061325125749781, 'samples': 8491008, 'steps': 44223, 'loss/train': 1.3789750337600708} -11/07/2021 03:25:34 - INFO - __main__ - Step 44225: {'lr': 0.00040612836796833556, 'samples': 8491200, 'steps': 44224, 'loss/train': 1.9082430601119995} -11/07/2021 03:25:34 - INFO - __main__ - Step 44226: {'lr': 0.000406124223291344, 'samples': 8491392, 'steps': 44225, 'loss/train': 2.0185680389404297} -11/07/2021 03:25:34 - INFO - __main__ - Step 44227: {'lr': 0.0004061200785440052, 'samples': 8491584, 'steps': 44226, 'loss/train': 1.3868499994277954} -11/07/2021 03:25:35 - INFO - __main__ - Step 44228: {'lr': 0.0004061159337263213, 'samples': 8491776, 'steps': 44227, 'loss/train': 1.6316428184509277} -11/07/2021 03:25:35 - INFO - __main__ - Step 44229: {'lr': 0.0004061117888382938, 'samples': 8491968, 'steps': 44228, 'loss/train': 1.5498803853988647} -11/07/2021 03:25:36 - INFO - __main__ - Step 44230: {'lr': 0.00040610764387992475, 'samples': 8492160, 'steps': 44229, 'loss/train': 1.3144543170928955} -11/07/2021 03:25:37 - INFO - __main__ - Step 44231: {'lr': 0.0004061034988512161, 'samples': 8492352, 'steps': 44230, 'loss/train': 1.8794748783111572} -11/07/2021 03:25:37 - INFO - __main__ - Step 44232: {'lr': 0.0004060993537521695, 'samples': 8492544, 'steps': 44231, 'loss/train': 5.840709686279297} -11/07/2021 03:25:37 - INFO - __main__ - Step 44233: {'lr': 0.00040609520858278704, 'samples': 8492736, 'steps': 44232, 'loss/train': 1.6199346780776978} -11/07/2021 03:25:38 - INFO - __main__ - Step 44234: {'lr': 0.0004060910633430704, 'samples': 8492928, 'steps': 44233, 'loss/train': 1.3364590406417847} -11/07/2021 03:25:38 - INFO - __main__ - Step 44235: {'lr': 0.0004060869180330216, 'samples': 8493120, 'steps': 44234, 'loss/train': 1.4359380006790161} -11/07/2021 03:25:39 - INFO - __main__ - Step 44236: {'lr': 0.00040608277265264243, 'samples': 8493312, 'steps': 44235, 'loss/train': 1.476361870765686} -11/07/2021 03:25:39 - INFO - __main__ - Step 44237: {'lr': 0.0004060786272019348, 'samples': 8493504, 'steps': 44236, 'loss/train': 1.8258213996887207} -11/07/2021 03:25:40 - INFO - __main__ - Step 44238: {'lr': 0.00040607448168090044, 'samples': 8493696, 'steps': 44237, 'loss/train': 1.4443018436431885} -11/07/2021 03:25:40 - INFO - __main__ - Step 44239: {'lr': 0.00040607033608954136, 'samples': 8493888, 'steps': 44238, 'loss/train': 1.3991117477416992} -11/07/2021 03:25:40 - INFO - __main__ - Step 44240: {'lr': 0.0004060661904278595, 'samples': 8494080, 'steps': 44239, 'loss/train': 0.4276210069656372} -11/07/2021 03:25:41 - INFO - __main__ - Step 44241: {'lr': 0.0004060620446958565, 'samples': 8494272, 'steps': 44240, 'loss/train': 1.401721715927124} -11/07/2021 03:25:42 - INFO - __main__ - Step 44242: {'lr': 0.00040605789889353445, 'samples': 8494464, 'steps': 44241, 'loss/train': 1.4835010766983032} -11/07/2021 03:25:42 - INFO - __main__ - Step 44243: {'lr': 0.00040605375302089507, 'samples': 8494656, 'steps': 44242, 'loss/train': 1.3869136571884155} -11/07/2021 03:25:42 - INFO - __main__ - Step 44244: {'lr': 0.00040604960707794023, 'samples': 8494848, 'steps': 44243, 'loss/train': 1.373746395111084} -11/07/2021 03:25:43 - INFO - __main__ - Step 44245: {'lr': 0.00040604546106467196, 'samples': 8495040, 'steps': 44244, 'loss/train': 1.4466519355773926} -11/07/2021 03:25:43 - INFO - __main__ - Step 44246: {'lr': 0.00040604131498109193, 'samples': 8495232, 'steps': 44245, 'loss/train': 1.67646062374115} -11/07/2021 03:25:44 - INFO - __main__ - Step 44247: {'lr': 0.0004060371688272021, 'samples': 8495424, 'steps': 44246, 'loss/train': 1.4390851259231567} -11/07/2021 03:25:45 - INFO - __main__ - Step 44248: {'lr': 0.00040603302260300435, 'samples': 8495616, 'steps': 44247, 'loss/train': 1.0876033306121826} -11/07/2021 03:25:45 - INFO - __main__ - Step 44249: {'lr': 0.00040602887630850055, 'samples': 8495808, 'steps': 44248, 'loss/train': 1.3555651903152466} -11/07/2021 03:25:45 - INFO - __main__ - Step 44250: {'lr': 0.0004060247299436925, 'samples': 8496000, 'steps': 44249, 'loss/train': 2.00783371925354} -11/07/2021 03:25:46 - INFO - __main__ - Step 44251: {'lr': 0.0004060205835085821, 'samples': 8496192, 'steps': 44250, 'loss/train': 1.2769891023635864} -11/07/2021 03:25:46 - INFO - __main__ - Step 44252: {'lr': 0.00040601643700317126, 'samples': 8496384, 'steps': 44251, 'loss/train': 1.2505950927734375} -11/07/2021 03:25:47 - INFO - __main__ - Step 44253: {'lr': 0.0004060122904274618, 'samples': 8496576, 'steps': 44252, 'loss/train': 1.2134746313095093} -11/07/2021 03:25:47 - INFO - __main__ - Step 44254: {'lr': 0.0004060081437814557, 'samples': 8496768, 'steps': 44253, 'loss/train': 1.798974633216858} -11/07/2021 03:25:48 - INFO - __main__ - Step 44255: {'lr': 0.00040600399706515466, 'samples': 8496960, 'steps': 44254, 'loss/train': 1.435835599899292} -11/07/2021 03:25:48 - INFO - __main__ - Step 44256: {'lr': 0.0004059998502785606, 'samples': 8497152, 'steps': 44255, 'loss/train': 1.6909722089767456} -11/07/2021 03:25:49 - INFO - __main__ - Step 44257: {'lr': 0.0004059957034216755, 'samples': 8497344, 'steps': 44256, 'loss/train': 1.5016534328460693} -11/07/2021 03:25:49 - INFO - __main__ - Step 44258: {'lr': 0.00040599155649450106, 'samples': 8497536, 'steps': 44257, 'loss/train': 1.8113622665405273} -11/07/2021 03:25:50 - INFO - __main__ - Step 44259: {'lr': 0.00040598740949703927, 'samples': 8497728, 'steps': 44258, 'loss/train': 1.6369322538375854} -11/07/2021 03:25:50 - INFO - __main__ - Step 44260: {'lr': 0.00040598326242929195, 'samples': 8497920, 'steps': 44259, 'loss/train': 1.4528487920761108} -11/07/2021 03:25:50 - INFO - __main__ - Step 44261: {'lr': 0.00040597911529126096, 'samples': 8498112, 'steps': 44260, 'loss/train': 1.588715672492981} -11/07/2021 03:25:52 - INFO - __main__ - Step 44262: {'lr': 0.00040597496808294825, 'samples': 8498304, 'steps': 44261, 'loss/train': 1.552764654159546} -11/07/2021 03:25:52 - INFO - __main__ - Step 44263: {'lr': 0.0004059708208043556, 'samples': 8498496, 'steps': 44262, 'loss/train': 2.3060762882232666} -11/07/2021 03:25:52 - INFO - __main__ - Step 44264: {'lr': 0.00040596667345548486, 'samples': 8498688, 'steps': 44263, 'loss/train': 0.9599685668945312} -11/07/2021 03:25:53 - INFO - __main__ - Step 44265: {'lr': 0.00040596252603633797, 'samples': 8498880, 'steps': 44264, 'loss/train': 1.3154436349868774} -11/07/2021 03:25:53 - INFO - __main__ - Step 44266: {'lr': 0.0004059583785469168, 'samples': 8499072, 'steps': 44265, 'loss/train': 1.1292322874069214} -11/07/2021 03:25:54 - INFO - __main__ - Step 44267: {'lr': 0.00040595423098722315, 'samples': 8499264, 'steps': 44266, 'loss/train': 1.3291518688201904} -11/07/2021 03:25:54 - INFO - __main__ - Step 44268: {'lr': 0.000405950083357259, 'samples': 8499456, 'steps': 44267, 'loss/train': 1.5495879650115967} -11/07/2021 03:25:55 - INFO - __main__ - Step 44269: {'lr': 0.0004059459356570261, 'samples': 8499648, 'steps': 44268, 'loss/train': 1.3936069011688232} -11/07/2021 03:25:55 - INFO - __main__ - Step 44270: {'lr': 0.00040594178788652636, 'samples': 8499840, 'steps': 44269, 'loss/train': 1.0680961608886719} -11/07/2021 03:25:55 - INFO - __main__ - Step 44271: {'lr': 0.00040593764004576166, 'samples': 8500032, 'steps': 44270, 'loss/train': 0.7102341651916504} -11/07/2021 03:25:57 - INFO - __main__ - Step 44272: {'lr': 0.0004059334921347339, 'samples': 8500224, 'steps': 44271, 'loss/train': 1.6032512187957764} -11/07/2021 03:25:57 - INFO - __main__ - Step 44273: {'lr': 0.00040592934415344486, 'samples': 8500416, 'steps': 44272, 'loss/train': 1.1632397174835205} -11/07/2021 03:25:57 - INFO - __main__ - Step 44274: {'lr': 0.0004059251961018965, 'samples': 8500608, 'steps': 44273, 'loss/train': 1.0936400890350342} -11/07/2021 03:25:58 - INFO - __main__ - Step 44275: {'lr': 0.00040592104798009066, 'samples': 8500800, 'steps': 44274, 'loss/train': 1.1963216066360474} -11/07/2021 03:25:58 - INFO - __main__ - Step 44276: {'lr': 0.00040591689978802917, 'samples': 8500992, 'steps': 44275, 'loss/train': 1.8550727367401123} -11/07/2021 03:26:00 - INFO - __main__ - Step 44277: {'lr': 0.0004059127515257139, 'samples': 8501184, 'steps': 44276, 'loss/train': 1.220307469367981} -11/07/2021 03:26:00 - INFO - __main__ - Step 44278: {'lr': 0.0004059086031931468, 'samples': 8501376, 'steps': 44277, 'loss/train': 1.9647818803787231} -11/07/2021 03:26:00 - INFO - __main__ - Step 44279: {'lr': 0.00040590445479032965, 'samples': 8501568, 'steps': 44278, 'loss/train': 1.5263757705688477} -11/07/2021 03:26:01 - INFO - __main__ - Step 44280: {'lr': 0.0004059003063172644, 'samples': 8501760, 'steps': 44279, 'loss/train': 1.7530311346054077} -11/07/2021 03:26:01 - INFO - __main__ - Step 44281: {'lr': 0.0004058961577739529, 'samples': 8501952, 'steps': 44280, 'loss/train': 1.3085688352584839} -11/07/2021 03:26:01 - INFO - __main__ - Step 44282: {'lr': 0.00040589200916039703, 'samples': 8502144, 'steps': 44281, 'loss/train': 1.7258718013763428} -11/07/2021 03:26:02 - INFO - __main__ - Step 44283: {'lr': 0.0004058878604765985, 'samples': 8502336, 'steps': 44282, 'loss/train': 2.434744119644165} -11/07/2021 03:26:03 - INFO - __main__ - Step 44284: {'lr': 0.00040588371172255936, 'samples': 8502528, 'steps': 44283, 'loss/train': 2.6195433139801025} -11/07/2021 03:26:03 - INFO - __main__ - Step 44285: {'lr': 0.0004058795628982814, 'samples': 8502720, 'steps': 44284, 'loss/train': 1.3945242166519165} -11/07/2021 03:26:03 - INFO - __main__ - Step 44286: {'lr': 0.0004058754140037666, 'samples': 8502912, 'steps': 44285, 'loss/train': 1.7013885974884033} -11/07/2021 03:26:04 - INFO - __main__ - Step 44287: {'lr': 0.00040587126503901664, 'samples': 8503104, 'steps': 44286, 'loss/train': 1.5036070346832275} -11/07/2021 03:26:04 - INFO - __main__ - Step 44288: {'lr': 0.0004058671160040336, 'samples': 8503296, 'steps': 44287, 'loss/train': 1.908082365989685} -11/07/2021 03:26:05 - INFO - __main__ - Step 44289: {'lr': 0.0004058629668988192, 'samples': 8503488, 'steps': 44288, 'loss/train': 1.5681588649749756} -11/07/2021 03:26:05 - INFO - __main__ - Step 44290: {'lr': 0.0004058588177233753, 'samples': 8503680, 'steps': 44289, 'loss/train': 1.7509156465530396} -11/07/2021 03:26:06 - INFO - __main__ - Step 44291: {'lr': 0.0004058546684777039, 'samples': 8503872, 'steps': 44290, 'loss/train': 1.3371413946151733} -11/07/2021 03:26:06 - INFO - __main__ - Step 44292: {'lr': 0.0004058505191618067, 'samples': 8504064, 'steps': 44291, 'loss/train': 1.466626763343811} -11/07/2021 03:26:07 - INFO - __main__ - Step 44293: {'lr': 0.00040584636977568573, 'samples': 8504256, 'steps': 44292, 'loss/train': 1.5148591995239258} -11/07/2021 03:26:07 - INFO - __main__ - Step 44294: {'lr': 0.0004058422203193428, 'samples': 8504448, 'steps': 44293, 'loss/train': 2.143653392791748} -11/07/2021 03:26:08 - INFO - __main__ - Step 44295: {'lr': 0.0004058380707927798, 'samples': 8504640, 'steps': 44294, 'loss/train': 1.8551056385040283} -11/07/2021 03:26:08 - INFO - __main__ - Step 44296: {'lr': 0.00040583392119599847, 'samples': 8504832, 'steps': 44295, 'loss/train': 1.5859216451644897} -11/07/2021 03:26:09 - INFO - __main__ - Step 44297: {'lr': 0.0004058297715290008, 'samples': 8505024, 'steps': 44296, 'loss/train': 1.3397605419158936} -11/07/2021 03:26:09 - INFO - __main__ - Step 44298: {'lr': 0.00040582562179178864, 'samples': 8505216, 'steps': 44297, 'loss/train': 1.5907195806503296} -11/07/2021 03:26:10 - INFO - __main__ - Step 44299: {'lr': 0.0004058214719843639, 'samples': 8505408, 'steps': 44298, 'loss/train': 1.302096962928772} -11/07/2021 03:26:11 - INFO - __main__ - Step 44300: {'lr': 0.0004058173221067284, 'samples': 8505600, 'steps': 44299, 'loss/train': 1.5051329135894775} -11/07/2021 03:26:11 - INFO - __main__ - Step 44301: {'lr': 0.00040581317215888403, 'samples': 8505792, 'steps': 44300, 'loss/train': 1.4881658554077148} -11/07/2021 03:26:11 - INFO - __main__ - Step 44302: {'lr': 0.0004058090221408326, 'samples': 8505984, 'steps': 44301, 'loss/train': 1.6845630407333374} -11/07/2021 03:26:12 - INFO - __main__ - Step 44303: {'lr': 0.0004058048720525761, 'samples': 8506176, 'steps': 44302, 'loss/train': 1.5862226486206055} -11/07/2021 03:26:13 - INFO - __main__ - Step 44304: {'lr': 0.00040580072189411626, 'samples': 8506368, 'steps': 44303, 'loss/train': 0.34425705671310425} -11/07/2021 03:26:13 - INFO - __main__ - Step 44305: {'lr': 0.00040579657166545503, 'samples': 8506560, 'steps': 44304, 'loss/train': 1.3707748651504517} -11/07/2021 03:26:13 - INFO - __main__ - Step 44306: {'lr': 0.0004057924213665943, 'samples': 8506752, 'steps': 44305, 'loss/train': 1.7618228197097778} -11/07/2021 03:26:14 - INFO - __main__ - Step 44307: {'lr': 0.0004057882709975359, 'samples': 8506944, 'steps': 44306, 'loss/train': 1.6465903520584106} -11/07/2021 03:26:14 - INFO - __main__ - Step 44308: {'lr': 0.0004057841205582817, 'samples': 8507136, 'steps': 44307, 'loss/train': 1.5074667930603027} -11/07/2021 03:26:15 - INFO - __main__ - Step 44309: {'lr': 0.0004057799700488336, 'samples': 8507328, 'steps': 44308, 'loss/train': 1.3298178911209106} -11/07/2021 03:26:16 - INFO - __main__ - Step 44310: {'lr': 0.0004057758194691934, 'samples': 8507520, 'steps': 44309, 'loss/train': 1.3904099464416504} -11/07/2021 03:26:16 - INFO - __main__ - Step 44311: {'lr': 0.00040577166881936304, 'samples': 8507712, 'steps': 44310, 'loss/train': 1.4899998903274536} -11/07/2021 03:26:16 - INFO - __main__ - Step 44312: {'lr': 0.0004057675180993444, 'samples': 8507904, 'steps': 44311, 'loss/train': 1.7797423601150513} -11/07/2021 03:26:17 - INFO - __main__ - Step 44313: {'lr': 0.00040576336730913933, 'samples': 8508096, 'steps': 44312, 'loss/train': 1.3314696550369263} -11/07/2021 03:26:17 - INFO - __main__ - Step 44314: {'lr': 0.00040575921644874966, 'samples': 8508288, 'steps': 44313, 'loss/train': 1.326983094215393} -11/07/2021 03:26:19 - INFO - __main__ - Step 44315: {'lr': 0.00040575506551817725, 'samples': 8508480, 'steps': 44314, 'loss/train': 0.7640935778617859} -11/07/2021 03:26:19 - INFO - __main__ - Step 44316: {'lr': 0.00040575091451742405, 'samples': 8508672, 'steps': 44315, 'loss/train': 1.2644010782241821} -11/07/2021 03:26:19 - INFO - __main__ - Step 44317: {'lr': 0.0004057467634464919, 'samples': 8508864, 'steps': 44316, 'loss/train': 1.4013490676879883} -11/07/2021 03:26:20 - INFO - __main__ - Step 44318: {'lr': 0.00040574261230538267, 'samples': 8509056, 'steps': 44317, 'loss/train': 1.2443079948425293} -11/07/2021 03:26:20 - INFO - __main__ - Step 44319: {'lr': 0.0004057384610940982, 'samples': 8509248, 'steps': 44318, 'loss/train': 1.4569404125213623} -11/07/2021 03:26:20 - INFO - __main__ - Step 44320: {'lr': 0.0004057343098126404, 'samples': 8509440, 'steps': 44319, 'loss/train': 1.319869041442871} -11/07/2021 03:26:21 - INFO - __main__ - Step 44321: {'lr': 0.0004057301584610111, 'samples': 8509632, 'steps': 44320, 'loss/train': 1.4804351329803467} -11/07/2021 03:26:22 - INFO - __main__ - Step 44322: {'lr': 0.00040572600703921223, 'samples': 8509824, 'steps': 44321, 'loss/train': 3.2597482204437256} -11/07/2021 03:26:22 - INFO - __main__ - Step 44323: {'lr': 0.0004057218555472456, 'samples': 8510016, 'steps': 44322, 'loss/train': 1.5574032068252563} -11/07/2021 03:26:22 - INFO - __main__ - Step 44324: {'lr': 0.0004057177039851131, 'samples': 8510208, 'steps': 44323, 'loss/train': 1.564391016960144} -11/07/2021 03:26:23 - INFO - __main__ - Step 44325: {'lr': 0.00040571355235281657, 'samples': 8510400, 'steps': 44324, 'loss/train': 1.9127159118652344} -11/07/2021 03:26:24 - INFO - __main__ - Step 44326: {'lr': 0.00040570940065035797, 'samples': 8510592, 'steps': 44325, 'loss/train': 1.2782944440841675} -11/07/2021 03:26:24 - INFO - __main__ - Step 44327: {'lr': 0.0004057052488777392, 'samples': 8510784, 'steps': 44326, 'loss/train': 1.6044999361038208} -11/07/2021 03:26:25 - INFO - __main__ - Step 44328: {'lr': 0.0004057010970349619, 'samples': 8510976, 'steps': 44327, 'loss/train': 1.5265976190567017} -11/07/2021 03:26:25 - INFO - __main__ - Step 44329: {'lr': 0.00040569694512202815, 'samples': 8511168, 'steps': 44328, 'loss/train': 1.3547221422195435} -11/07/2021 03:26:25 - INFO - __main__ - Step 44330: {'lr': 0.00040569279313893976, 'samples': 8511360, 'steps': 44329, 'loss/train': 1.4769420623779297} -11/07/2021 03:26:26 - INFO - __main__ - Step 44331: {'lr': 0.0004056886410856986, 'samples': 8511552, 'steps': 44330, 'loss/train': 0.3407726585865021} -11/07/2021 03:26:27 - INFO - __main__ - Step 44332: {'lr': 0.0004056844889623065, 'samples': 8511744, 'steps': 44331, 'loss/train': 1.1814073324203491} -11/07/2021 03:26:27 - INFO - __main__ - Step 44333: {'lr': 0.0004056803367687654, 'samples': 8511936, 'steps': 44332, 'loss/train': 1.6243948936462402} -11/07/2021 03:26:27 - INFO - __main__ - Step 44334: {'lr': 0.0004056761845050772, 'samples': 8512128, 'steps': 44333, 'loss/train': 0.6642376184463501} -11/07/2021 03:26:28 - INFO - __main__ - Step 44335: {'lr': 0.0004056720321712436, 'samples': 8512320, 'steps': 44334, 'loss/train': 1.2679871320724487} -11/07/2021 03:26:29 - INFO - __main__ - Step 44336: {'lr': 0.00040566787976726665, 'samples': 8512512, 'steps': 44335, 'loss/train': 1.2967005968093872} -11/07/2021 03:26:29 - INFO - __main__ - Step 44337: {'lr': 0.00040566372729314813, 'samples': 8512704, 'steps': 44336, 'loss/train': 1.4064103364944458} -11/07/2021 03:26:29 - INFO - __main__ - Step 44338: {'lr': 0.00040565957474889, 'samples': 8512896, 'steps': 44337, 'loss/train': 1.4833481311798096} -11/07/2021 03:26:30 - INFO - __main__ - Step 44339: {'lr': 0.000405655422134494, 'samples': 8513088, 'steps': 44338, 'loss/train': 2.3924691677093506} -11/07/2021 03:26:30 - INFO - __main__ - Step 44340: {'lr': 0.0004056512694499621, 'samples': 8513280, 'steps': 44339, 'loss/train': 0.9818007946014404} -11/07/2021 03:26:31 - INFO - __main__ - Step 44341: {'lr': 0.0004056471166952961, 'samples': 8513472, 'steps': 44340, 'loss/train': 1.5734854936599731} -11/07/2021 03:26:32 - INFO - __main__ - Step 44342: {'lr': 0.0004056429638704979, 'samples': 8513664, 'steps': 44341, 'loss/train': 1.7564226388931274} -11/07/2021 03:26:32 - INFO - __main__ - Step 44343: {'lr': 0.0004056388109755695, 'samples': 8513856, 'steps': 44342, 'loss/train': 1.9729844331741333} -11/07/2021 03:26:32 - INFO - __main__ - Step 44344: {'lr': 0.0004056346580105126, 'samples': 8514048, 'steps': 44343, 'loss/train': 0.17679743468761444} -11/07/2021 03:26:33 - INFO - __main__ - Step 44345: {'lr': 0.00040563050497532905, 'samples': 8514240, 'steps': 44344, 'loss/train': 1.5594099760055542} -11/07/2021 03:26:33 - INFO - __main__ - Step 44346: {'lr': 0.00040562635187002083, 'samples': 8514432, 'steps': 44345, 'loss/train': 1.5085008144378662} -11/07/2021 03:26:34 - INFO - __main__ - Step 44347: {'lr': 0.0004056221986945898, 'samples': 8514624, 'steps': 44346, 'loss/train': 0.818427562713623} -11/07/2021 03:26:35 - INFO - __main__ - Step 44348: {'lr': 0.0004056180454490378, 'samples': 8514816, 'steps': 44347, 'loss/train': 0.6687682867050171} -11/07/2021 03:26:35 - INFO - __main__ - Step 44349: {'lr': 0.00040561389213336673, 'samples': 8515008, 'steps': 44348, 'loss/train': 1.2913715839385986} -11/07/2021 03:26:35 - INFO - __main__ - Step 44350: {'lr': 0.00040560973874757844, 'samples': 8515200, 'steps': 44349, 'loss/train': 1.7278624773025513} -11/07/2021 03:26:36 - INFO - __main__ - Step 44351: {'lr': 0.0004056055852916748, 'samples': 8515392, 'steps': 44350, 'loss/train': 1.3829728364944458} -11/07/2021 03:26:37 - INFO - __main__ - Step 44352: {'lr': 0.0004056014317656577, 'samples': 8515584, 'steps': 44351, 'loss/train': 1.8176770210266113} -11/07/2021 03:26:37 - INFO - __main__ - Step 44353: {'lr': 0.00040559727816952897, 'samples': 8515776, 'steps': 44352, 'loss/train': 1.4659550189971924} -11/07/2021 03:26:37 - INFO - __main__ - Step 44354: {'lr': 0.0004055931245032904, 'samples': 8515968, 'steps': 44353, 'loss/train': 1.4851115942001343} -11/07/2021 03:26:38 - INFO - __main__ - Step 44355: {'lr': 0.0004055889707669441, 'samples': 8516160, 'steps': 44354, 'loss/train': 1.867988109588623} -11/07/2021 03:26:38 - INFO - __main__ - Step 44356: {'lr': 0.0004055848169604919, 'samples': 8516352, 'steps': 44355, 'loss/train': 1.2548911571502686} -11/07/2021 03:26:39 - INFO - __main__ - Step 44357: {'lr': 0.00040558066308393536, 'samples': 8516544, 'steps': 44356, 'loss/train': 1.6776759624481201} -11/07/2021 03:26:40 - INFO - __main__ - Step 44358: {'lr': 0.0004055765091372767, 'samples': 8516736, 'steps': 44357, 'loss/train': 1.2604798078536987} -11/07/2021 03:26:40 - INFO - __main__ - Step 44359: {'lr': 0.0004055723551205177, 'samples': 8516928, 'steps': 44358, 'loss/train': 2.0085549354553223} -11/07/2021 03:26:40 - INFO - __main__ - Step 44360: {'lr': 0.0004055682010336601, 'samples': 8517120, 'steps': 44359, 'loss/train': 1.4113619327545166} -11/07/2021 03:26:41 - INFO - __main__ - Step 44361: {'lr': 0.0004055640468767059, 'samples': 8517312, 'steps': 44360, 'loss/train': 1.4180389642715454} -11/07/2021 03:26:42 - INFO - __main__ - Step 44362: {'lr': 0.000405559892649657, 'samples': 8517504, 'steps': 44361, 'loss/train': 1.191287875175476} -11/07/2021 03:26:42 - INFO - __main__ - Step 44363: {'lr': 0.00040555573835251513, 'samples': 8517696, 'steps': 44362, 'loss/train': 1.7261238098144531} -11/07/2021 03:26:42 - INFO - __main__ - Step 44364: {'lr': 0.00040555158398528237, 'samples': 8517888, 'steps': 44363, 'loss/train': 1.5277279615402222} -11/07/2021 03:26:43 - INFO - __main__ - Step 44365: {'lr': 0.0004055474295479603, 'samples': 8518080, 'steps': 44364, 'loss/train': 1.3089200258255005} -11/07/2021 03:26:43 - INFO - __main__ - Step 44366: {'lr': 0.00040554327504055106, 'samples': 8518272, 'steps': 44365, 'loss/train': 1.2779258489608765} -11/07/2021 03:26:45 - INFO - __main__ - Step 44367: {'lr': 0.0004055391204630564, 'samples': 8518464, 'steps': 44366, 'loss/train': 1.3282432556152344} -11/07/2021 03:26:45 - INFO - __main__ - Step 44368: {'lr': 0.0004055349658154782, 'samples': 8518656, 'steps': 44367, 'loss/train': 1.0060210227966309} -11/07/2021 03:26:46 - INFO - __main__ - Step 44369: {'lr': 0.00040553081109781844, 'samples': 8518848, 'steps': 44368, 'loss/train': 1.7433545589447021} -11/07/2021 03:26:46 - INFO - __main__ - Step 44370: {'lr': 0.0004055266563100788, 'samples': 8519040, 'steps': 44369, 'loss/train': 1.9142252206802368} -11/07/2021 03:26:46 - INFO - __main__ - Step 44371: {'lr': 0.00040552250145226124, 'samples': 8519232, 'steps': 44370, 'loss/train': 1.2746949195861816} -11/07/2021 03:26:47 - INFO - __main__ - Step 44372: {'lr': 0.0004055183465243676, 'samples': 8519424, 'steps': 44371, 'loss/train': 0.8926762938499451} -11/07/2021 03:26:47 - INFO - __main__ - Step 44373: {'lr': 0.0004055141915263999, 'samples': 8519616, 'steps': 44372, 'loss/train': 1.221543788909912} -11/07/2021 03:26:48 - INFO - __main__ - Step 44374: {'lr': 0.0004055100364583598, 'samples': 8519808, 'steps': 44373, 'loss/train': 1.3261895179748535} -11/07/2021 03:26:48 - INFO - __main__ - Step 44375: {'lr': 0.0004055058813202493, 'samples': 8520000, 'steps': 44374, 'loss/train': 2.2200098037719727} -11/07/2021 03:26:49 - INFO - __main__ - Step 44376: {'lr': 0.0004055017261120704, 'samples': 8520192, 'steps': 44375, 'loss/train': 2.082080125808716} -11/07/2021 03:26:49 - INFO - __main__ - Step 44377: {'lr': 0.00040549757083382465, 'samples': 8520384, 'steps': 44376, 'loss/train': 1.1706246137619019} -11/07/2021 03:26:50 - INFO - __main__ - Step 44378: {'lr': 0.00040549341548551415, 'samples': 8520576, 'steps': 44377, 'loss/train': 1.8282917737960815} -11/07/2021 03:26:51 - INFO - __main__ - Step 44379: {'lr': 0.0004054892600671407, 'samples': 8520768, 'steps': 44378, 'loss/train': 1.7403497695922852} -11/07/2021 03:26:51 - INFO - __main__ - Step 44380: {'lr': 0.00040548510457870623, 'samples': 8520960, 'steps': 44379, 'loss/train': 1.3733513355255127} -11/07/2021 03:26:51 - INFO - __main__ - Step 44381: {'lr': 0.00040548094902021257, 'samples': 8521152, 'steps': 44380, 'loss/train': 1.5659174919128418} -11/07/2021 03:26:52 - INFO - __main__ - Step 44382: {'lr': 0.00040547679339166155, 'samples': 8521344, 'steps': 44381, 'loss/train': 1.7189534902572632} -11/07/2021 03:26:52 - INFO - __main__ - Step 44383: {'lr': 0.0004054726376930551, 'samples': 8521536, 'steps': 44382, 'loss/train': 1.4297466278076172} -11/07/2021 03:26:53 - INFO - __main__ - Step 44384: {'lr': 0.0004054684819243951, 'samples': 8521728, 'steps': 44383, 'loss/train': 1.544453501701355} -11/07/2021 03:26:53 - INFO - __main__ - Step 44385: {'lr': 0.0004054643260856834, 'samples': 8521920, 'steps': 44384, 'loss/train': 1.738171935081482} -11/07/2021 03:26:54 - INFO - __main__ - Step 44386: {'lr': 0.00040546017017692183, 'samples': 8522112, 'steps': 44385, 'loss/train': 1.7193278074264526} -11/07/2021 03:26:54 - INFO - __main__ - Step 44387: {'lr': 0.00040545601419811236, 'samples': 8522304, 'steps': 44386, 'loss/train': 1.71592378616333} -11/07/2021 03:26:54 - INFO - __main__ - Step 44388: {'lr': 0.00040545185814925676, 'samples': 8522496, 'steps': 44387, 'loss/train': 1.3953267335891724} -11/07/2021 03:26:55 - INFO - __main__ - Step 44389: {'lr': 0.00040544770203035705, 'samples': 8522688, 'steps': 44388, 'loss/train': 1.3401683568954468} -11/07/2021 03:26:56 - INFO - __main__ - Step 44390: {'lr': 0.0004054435458414149, 'samples': 8522880, 'steps': 44389, 'loss/train': 1.2182083129882812} -11/07/2021 03:26:56 - INFO - __main__ - Step 44391: {'lr': 0.0004054393895824323, 'samples': 8523072, 'steps': 44390, 'loss/train': 1.2936636209487915} -11/07/2021 03:26:56 - INFO - __main__ - Step 44392: {'lr': 0.00040543523325341116, 'samples': 8523264, 'steps': 44391, 'loss/train': 1.199650764465332} -11/07/2021 03:26:57 - INFO - __main__ - Step 44393: {'lr': 0.0004054310768543532, 'samples': 8523456, 'steps': 44392, 'loss/train': 0.5333095788955688} -11/07/2021 03:26:58 - INFO - __main__ - Step 44394: {'lr': 0.00040542692038526054, 'samples': 8523648, 'steps': 44393, 'loss/train': 1.777122139930725} -11/07/2021 03:26:58 - INFO - __main__ - Step 44395: {'lr': 0.0004054227638461348, 'samples': 8523840, 'steps': 44394, 'loss/train': 1.1267532110214233} -11/07/2021 03:26:59 - INFO - __main__ - Step 44396: {'lr': 0.000405418607236978, 'samples': 8524032, 'steps': 44395, 'loss/train': 1.3103433847427368} -11/07/2021 03:26:59 - INFO - __main__ - Step 44397: {'lr': 0.00040541445055779197, 'samples': 8524224, 'steps': 44396, 'loss/train': 1.1464890241622925} -11/07/2021 03:26:59 - INFO - __main__ - Step 44398: {'lr': 0.0004054102938085786, 'samples': 8524416, 'steps': 44397, 'loss/train': 1.3520127534866333} -11/07/2021 03:27:01 - INFO - __main__ - Step 44399: {'lr': 0.0004054061369893397, 'samples': 8524608, 'steps': 44398, 'loss/train': 1.9427788257598877} -11/07/2021 03:27:01 - INFO - __main__ - Step 44400: {'lr': 0.0004054019801000772, 'samples': 8524800, 'steps': 44399, 'loss/train': 1.9333767890930176} -11/07/2021 03:27:01 - INFO - __main__ - Step 44401: {'lr': 0.00040539782314079304, 'samples': 8524992, 'steps': 44400, 'loss/train': 1.6394872665405273} -11/07/2021 03:27:02 - INFO - __main__ - Step 44402: {'lr': 0.000405393666111489, 'samples': 8525184, 'steps': 44401, 'loss/train': 1.2938517332077026} -11/07/2021 03:27:02 - INFO - __main__ - Step 44403: {'lr': 0.0004053895090121669, 'samples': 8525376, 'steps': 44402, 'loss/train': 1.545699119567871} -11/07/2021 03:27:03 - INFO - __main__ - Step 44404: {'lr': 0.00040538535184282877, 'samples': 8525568, 'steps': 44403, 'loss/train': 0.23328112065792084} -11/07/2021 03:27:03 - INFO - __main__ - Step 44405: {'lr': 0.00040538119460347636, 'samples': 8525760, 'steps': 44404, 'loss/train': 1.5613592863082886} -11/07/2021 03:27:04 - INFO - __main__ - Step 44406: {'lr': 0.0004053770372941116, 'samples': 8525952, 'steps': 44405, 'loss/train': 1.7085882425308228} -11/07/2021 03:27:04 - INFO - __main__ - Step 44407: {'lr': 0.00040537287991473627, 'samples': 8526144, 'steps': 44406, 'loss/train': 1.5492923259735107} -11/07/2021 03:27:04 - INFO - __main__ - Step 44408: {'lr': 0.0004053687224653524, 'samples': 8526336, 'steps': 44407, 'loss/train': 1.4747073650360107} -11/07/2021 03:27:05 - INFO - __main__ - Step 44409: {'lr': 0.0004053645649459617, 'samples': 8526528, 'steps': 44408, 'loss/train': 1.1547192335128784} -11/07/2021 03:27:06 - INFO - __main__ - Step 44410: {'lr': 0.0004053604073565662, 'samples': 8526720, 'steps': 44409, 'loss/train': 1.2398037910461426} -11/07/2021 03:27:06 - INFO - __main__ - Step 44411: {'lr': 0.0004053562496971677, 'samples': 8526912, 'steps': 44410, 'loss/train': 2.591552972793579} -11/07/2021 03:27:07 - INFO - __main__ - Step 44412: {'lr': 0.00040535209196776803, 'samples': 8527104, 'steps': 44411, 'loss/train': 1.2528629302978516} -11/07/2021 03:27:07 - INFO - __main__ - Step 44413: {'lr': 0.00040534793416836915, 'samples': 8527296, 'steps': 44412, 'loss/train': 1.191092610359192} -11/07/2021 03:27:07 - INFO - __main__ - Step 44414: {'lr': 0.00040534377629897276, 'samples': 8527488, 'steps': 44413, 'loss/train': 0.8791242241859436} -11/07/2021 03:27:08 - INFO - __main__ - Step 44415: {'lr': 0.000405339618359581, 'samples': 8527680, 'steps': 44414, 'loss/train': 0.21375149488449097} -11/07/2021 03:27:09 - INFO - __main__ - Step 44416: {'lr': 0.0004053354603501956, 'samples': 8527872, 'steps': 44415, 'loss/train': 1.3721272945404053} -11/07/2021 03:27:09 - INFO - __main__ - Step 44417: {'lr': 0.0004053313022708184, 'samples': 8528064, 'steps': 44416, 'loss/train': 0.752591609954834} -11/07/2021 03:27:09 - INFO - __main__ - Step 44418: {'lr': 0.00040532714412145135, 'samples': 8528256, 'steps': 44417, 'loss/train': 2.0578362941741943} -11/07/2021 03:27:10 - INFO - __main__ - Step 44419: {'lr': 0.0004053229859020962, 'samples': 8528448, 'steps': 44418, 'loss/train': 1.4786136150360107} -11/07/2021 03:27:11 - INFO - __main__ - Step 44420: {'lr': 0.00040531882761275496, 'samples': 8528640, 'steps': 44419, 'loss/train': 1.2803568840026855} -11/07/2021 03:27:12 - INFO - __main__ - Step 44421: {'lr': 0.00040531466925342947, 'samples': 8528832, 'steps': 44420, 'loss/train': 1.6242843866348267} -11/07/2021 03:27:12 - INFO - __main__ - Step 44422: {'lr': 0.0004053105108241216, 'samples': 8529024, 'steps': 44421, 'loss/train': 1.488799810409546} -11/07/2021 03:27:12 - INFO - __main__ - Step 44423: {'lr': 0.0004053063523248331, 'samples': 8529216, 'steps': 44422, 'loss/train': 1.6097091436386108} -11/07/2021 03:27:13 - INFO - __main__ - Step 44424: {'lr': 0.0004053021937555661, 'samples': 8529408, 'steps': 44423, 'loss/train': 1.3957725763320923} -11/07/2021 03:27:13 - INFO - __main__ - Step 44425: {'lr': 0.00040529803511632224, 'samples': 8529600, 'steps': 44424, 'loss/train': 0.8210239410400391} -11/07/2021 03:27:14 - INFO - __main__ - Step 44426: {'lr': 0.0004052938764071035, 'samples': 8529792, 'steps': 44425, 'loss/train': 0.4482980966567993} -11/07/2021 03:27:14 - INFO - __main__ - Step 44427: {'lr': 0.00040528971762791177, 'samples': 8529984, 'steps': 44426, 'loss/train': 1.7034776210784912} -11/07/2021 03:27:15 - INFO - __main__ - Step 44428: {'lr': 0.0004052855587787488, 'samples': 8530176, 'steps': 44427, 'loss/train': 1.948665976524353} -11/07/2021 03:27:15 - INFO - __main__ - Step 44429: {'lr': 0.0004052813998596167, 'samples': 8530368, 'steps': 44428, 'loss/train': 1.4644088745117188} -11/07/2021 03:27:15 - INFO - __main__ - Step 44430: {'lr': 0.0004052772408705171, 'samples': 8530560, 'steps': 44429, 'loss/train': 1.6136597394943237} -11/07/2021 03:27:17 - INFO - __main__ - Step 44431: {'lr': 0.000405273081811452, 'samples': 8530752, 'steps': 44430, 'loss/train': 1.1703969240188599} -11/07/2021 03:27:17 - INFO - __main__ - Step 44432: {'lr': 0.0004052689226824232, 'samples': 8530944, 'steps': 44431, 'loss/train': 1.5301213264465332} -11/07/2021 03:27:17 - INFO - __main__ - Step 44433: {'lr': 0.0004052647634834327, 'samples': 8531136, 'steps': 44432, 'loss/train': 1.528038501739502} -11/07/2021 03:27:18 - INFO - __main__ - Step 44434: {'lr': 0.00040526060421448216, 'samples': 8531328, 'steps': 44433, 'loss/train': 1.3487976789474487} -11/07/2021 03:27:18 - INFO - __main__ - Step 44435: {'lr': 0.00040525644487557366, 'samples': 8531520, 'steps': 44434, 'loss/train': 1.7728455066680908} -11/07/2021 03:27:19 - INFO - __main__ - Step 44436: {'lr': 0.000405252285466709, 'samples': 8531712, 'steps': 44435, 'loss/train': 1.8397818803787231} -11/07/2021 03:27:19 - INFO - __main__ - Step 44437: {'lr': 0.0004052481259878901, 'samples': 8531904, 'steps': 44436, 'loss/train': 1.6660261154174805} -11/07/2021 03:27:20 - INFO - __main__ - Step 44438: {'lr': 0.00040524396643911874, 'samples': 8532096, 'steps': 44437, 'loss/train': 1.6685140132904053} -11/07/2021 03:27:20 - INFO - __main__ - Step 44439: {'lr': 0.00040523980682039684, 'samples': 8532288, 'steps': 44438, 'loss/train': 1.6078511476516724} -11/07/2021 03:27:20 - INFO - __main__ - Step 44440: {'lr': 0.00040523564713172634, 'samples': 8532480, 'steps': 44439, 'loss/train': 1.8439935445785522} -11/07/2021 03:27:21 - INFO - __main__ - Step 44441: {'lr': 0.000405231487373109, 'samples': 8532672, 'steps': 44440, 'loss/train': 0.8348057866096497} -11/07/2021 03:27:22 - INFO - __main__ - Step 44442: {'lr': 0.00040522732754454674, 'samples': 8532864, 'steps': 44441, 'loss/train': 1.5335814952850342} -11/07/2021 03:27:22 - INFO - __main__ - Step 44443: {'lr': 0.0004052231676460415, 'samples': 8533056, 'steps': 44442, 'loss/train': 1.5462127923965454} -11/07/2021 03:27:22 - INFO - __main__ - Step 44444: {'lr': 0.000405219007677595, 'samples': 8533248, 'steps': 44443, 'loss/train': 1.638048529624939} -11/07/2021 03:27:23 - INFO - __main__ - Step 44445: {'lr': 0.0004052148476392093, 'samples': 8533440, 'steps': 44444, 'loss/train': 1.5250041484832764} -11/07/2021 03:27:23 - INFO - __main__ - Step 44446: {'lr': 0.00040521068753088615, 'samples': 8533632, 'steps': 44445, 'loss/train': 1.178097128868103} -11/07/2021 03:27:26 - INFO - __main__ - Step 44447: {'lr': 0.0004052065273526274, 'samples': 8533824, 'steps': 44446, 'loss/train': 1.603786587715149} -11/07/2021 03:27:26 - INFO - __main__ - Step 44448: {'lr': 0.0004052023671044351, 'samples': 8534016, 'steps': 44447, 'loss/train': 1.2792620658874512} -11/07/2021 03:27:26 - INFO - __main__ - Step 44449: {'lr': 0.0004051982067863109, 'samples': 8534208, 'steps': 44448, 'loss/train': 1.9062073230743408} -11/07/2021 03:27:27 - INFO - __main__ - Step 44450: {'lr': 0.0004051940463982569, 'samples': 8534400, 'steps': 44449, 'loss/train': 1.2241114377975464} -11/07/2021 03:27:27 - INFO - __main__ - Step 44451: {'lr': 0.0004051898859402748, 'samples': 8534592, 'steps': 44450, 'loss/train': 1.7529017925262451} -11/07/2021 03:27:27 - INFO - __main__ - Step 44452: {'lr': 0.00040518572541236653, 'samples': 8534784, 'steps': 44451, 'loss/train': 1.7296701669692993} -11/07/2021 03:27:28 - INFO - __main__ - Step 44453: {'lr': 0.00040518156481453397, 'samples': 8534976, 'steps': 44452, 'loss/train': 1.0338215827941895} -11/07/2021 03:27:29 - INFO - __main__ - Step 44454: {'lr': 0.0004051774041467789, 'samples': 8535168, 'steps': 44453, 'loss/train': 1.2485108375549316} -11/07/2021 03:27:29 - INFO - __main__ - Step 44455: {'lr': 0.00040517324340910347, 'samples': 8535360, 'steps': 44454, 'loss/train': 1.7952251434326172} -11/07/2021 03:27:29 - INFO - __main__ - Step 44456: {'lr': 0.0004051690826015092, 'samples': 8535552, 'steps': 44455, 'loss/train': 1.1251962184906006} -11/07/2021 03:27:30 - INFO - __main__ - Step 44457: {'lr': 0.0004051649217239982, 'samples': 8535744, 'steps': 44456, 'loss/train': 1.3085439205169678} -11/07/2021 03:27:30 - INFO - __main__ - Step 44458: {'lr': 0.00040516076077657233, 'samples': 8535936, 'steps': 44457, 'loss/train': 1.619061827659607} -11/07/2021 03:27:31 - INFO - __main__ - Step 44459: {'lr': 0.0004051565997592334, 'samples': 8536128, 'steps': 44458, 'loss/train': 1.7020214796066284} -11/07/2021 03:27:32 - INFO - __main__ - Step 44460: {'lr': 0.0004051524386719832, 'samples': 8536320, 'steps': 44459, 'loss/train': 1.3638756275177002} -11/07/2021 03:27:32 - INFO - __main__ - Step 44461: {'lr': 0.0004051482775148238, 'samples': 8536512, 'steps': 44460, 'loss/train': 1.798329472541809} -11/07/2021 03:27:32 - INFO - __main__ - Step 44462: {'lr': 0.00040514411628775695, 'samples': 8536704, 'steps': 44461, 'loss/train': 1.083493709564209} -11/07/2021 03:27:33 - INFO - __main__ - Step 44463: {'lr': 0.0004051399549907846, 'samples': 8536896, 'steps': 44462, 'loss/train': 1.439456582069397} -11/07/2021 03:27:33 - INFO - __main__ - Step 44464: {'lr': 0.0004051357936239085, 'samples': 8537088, 'steps': 44463, 'loss/train': 0.927096962928772} -11/07/2021 03:27:34 - INFO - __main__ - Step 44465: {'lr': 0.0004051316321871307, 'samples': 8537280, 'steps': 44464, 'loss/train': 1.1415132284164429} -11/07/2021 03:27:35 - INFO - __main__ - Step 44466: {'lr': 0.0004051274706804529, 'samples': 8537472, 'steps': 44465, 'loss/train': 0.8037278056144714} -11/07/2021 03:27:35 - INFO - __main__ - Step 44467: {'lr': 0.00040512330910387706, 'samples': 8537664, 'steps': 44466, 'loss/train': 2.71468186378479} -11/07/2021 03:27:35 - INFO - __main__ - Step 44468: {'lr': 0.0004051191474574051, 'samples': 8537856, 'steps': 44467, 'loss/train': 1.15324068069458} -11/07/2021 03:27:36 - INFO - __main__ - Step 44469: {'lr': 0.0004051149857410388, 'samples': 8538048, 'steps': 44468, 'loss/train': 1.7898513078689575} -11/07/2021 03:27:37 - INFO - __main__ - Step 44470: {'lr': 0.00040511082395478014, 'samples': 8538240, 'steps': 44469, 'loss/train': 1.243414282798767} -11/07/2021 03:27:37 - INFO - __main__ - Step 44471: {'lr': 0.0004051066620986309, 'samples': 8538432, 'steps': 44470, 'loss/train': 2.240720510482788} -11/07/2021 03:27:37 - INFO - __main__ - Step 44472: {'lr': 0.00040510250017259297, 'samples': 8538624, 'steps': 44471, 'loss/train': 1.2709674835205078} -11/07/2021 03:27:38 - INFO - __main__ - Step 44473: {'lr': 0.0004050983381766683, 'samples': 8538816, 'steps': 44472, 'loss/train': 1.600716233253479} -11/07/2021 03:27:38 - INFO - __main__ - Step 44474: {'lr': 0.00040509417611085864, 'samples': 8539008, 'steps': 44473, 'loss/train': 1.0161057710647583} -11/07/2021 03:27:40 - INFO - __main__ - Step 44475: {'lr': 0.000405090013975166, 'samples': 8539200, 'steps': 44474, 'loss/train': 1.0554980039596558} -11/07/2021 03:27:40 - INFO - __main__ - Step 44476: {'lr': 0.0004050858517695921, 'samples': 8539392, 'steps': 44475, 'loss/train': 2.087064027786255} -11/07/2021 03:27:40 - INFO - __main__ - Step 44477: {'lr': 0.00040508168949413904, 'samples': 8539584, 'steps': 44476, 'loss/train': 1.0634537935256958} -11/07/2021 03:27:41 - INFO - __main__ - Step 44478: {'lr': 0.00040507752714880854, 'samples': 8539776, 'steps': 44477, 'loss/train': 1.3781660795211792} -11/07/2021 03:27:41 - INFO - __main__ - Step 44479: {'lr': 0.0004050733647336024, 'samples': 8539968, 'steps': 44478, 'loss/train': 1.4802095890045166} -11/07/2021 03:27:42 - INFO - __main__ - Step 44480: {'lr': 0.00040506920224852265, 'samples': 8540160, 'steps': 44479, 'loss/train': 1.452307105064392} -11/07/2021 03:27:43 - INFO - __main__ - Step 44481: {'lr': 0.0004050650396935711, 'samples': 8540352, 'steps': 44480, 'loss/train': 1.2733694314956665} -11/07/2021 03:27:43 - INFO - __main__ - Step 44482: {'lr': 0.00040506087706874966, 'samples': 8540544, 'steps': 44481, 'loss/train': 1.220317006111145} -11/07/2021 03:27:43 - INFO - __main__ - Step 44483: {'lr': 0.00040505671437406017, 'samples': 8540736, 'steps': 44482, 'loss/train': 0.8834923505783081} -11/07/2021 03:27:44 - INFO - __main__ - Step 44484: {'lr': 0.00040505255160950453, 'samples': 8540928, 'steps': 44483, 'loss/train': 1.421524167060852} -11/07/2021 03:27:44 - INFO - __main__ - Step 44485: {'lr': 0.00040504838877508464, 'samples': 8541120, 'steps': 44484, 'loss/train': 1.5100693702697754} -11/07/2021 03:27:44 - INFO - __main__ - Step 44486: {'lr': 0.0004050442258708022, 'samples': 8541312, 'steps': 44485, 'loss/train': 0.9665480256080627} -11/07/2021 03:27:45 - INFO - __main__ - Step 44487: {'lr': 0.0004050400628966594, 'samples': 8541504, 'steps': 44486, 'loss/train': 1.4220572710037231} -11/07/2021 03:27:46 - INFO - __main__ - Step 44488: {'lr': 0.0004050358998526578, 'samples': 8541696, 'steps': 44487, 'loss/train': 1.3052656650543213} -11/07/2021 03:27:46 - INFO - __main__ - Step 44489: {'lr': 0.00040503173673879945, 'samples': 8541888, 'steps': 44488, 'loss/train': 1.27193021774292} -11/07/2021 03:27:46 - INFO - __main__ - Step 44490: {'lr': 0.00040502757355508626, 'samples': 8542080, 'steps': 44489, 'loss/train': 0.7407692670822144} -11/07/2021 03:27:47 - INFO - __main__ - Step 44491: {'lr': 0.00040502341030152, 'samples': 8542272, 'steps': 44490, 'loss/train': 1.129051923751831} -11/07/2021 03:27:48 - INFO - __main__ - Step 44492: {'lr': 0.0004050192469781025, 'samples': 8542464, 'steps': 44491, 'loss/train': 1.6179014444351196} -11/07/2021 03:27:48 - INFO - __main__ - Step 44493: {'lr': 0.00040501508358483583, 'samples': 8542656, 'steps': 44492, 'loss/train': 1.8394125699996948} -11/07/2021 03:27:49 - INFO - __main__ - Step 44494: {'lr': 0.00040501092012172173, 'samples': 8542848, 'steps': 44493, 'loss/train': 1.7730039358139038} -11/07/2021 03:27:49 - INFO - __main__ - Step 44495: {'lr': 0.0004050067565887621, 'samples': 8543040, 'steps': 44494, 'loss/train': 1.4558534622192383} -11/07/2021 03:27:49 - INFO - __main__ - Step 44496: {'lr': 0.00040500259298595874, 'samples': 8543232, 'steps': 44495, 'loss/train': 1.5732234716415405} -11/07/2021 03:27:50 - INFO - __main__ - Step 44497: {'lr': 0.00040499842931331374, 'samples': 8543424, 'steps': 44496, 'loss/train': 1.3753433227539062} -11/07/2021 03:27:51 - INFO - __main__ - Step 44498: {'lr': 0.0004049942655708287, 'samples': 8543616, 'steps': 44497, 'loss/train': 1.4764783382415771} -11/07/2021 03:27:51 - INFO - __main__ - Step 44499: {'lr': 0.0004049901017585058, 'samples': 8543808, 'steps': 44498, 'loss/train': 1.58024263381958} -11/07/2021 03:27:51 - INFO - __main__ - Step 44500: {'lr': 0.00040498593787634664, 'samples': 8544000, 'steps': 44499, 'loss/train': 1.0468982458114624} -11/07/2021 03:27:52 - INFO - __main__ - Step 44501: {'lr': 0.0004049817739243532, 'samples': 8544192, 'steps': 44500, 'loss/train': 1.7301188707351685} -11/07/2021 03:27:53 - INFO - __main__ - Step 44502: {'lr': 0.0004049776099025274, 'samples': 8544384, 'steps': 44501, 'loss/train': 1.7797633409500122} -11/07/2021 03:27:53 - INFO - __main__ - Step 44503: {'lr': 0.000404973445810871, 'samples': 8544576, 'steps': 44502, 'loss/train': 1.3407477140426636} -11/07/2021 03:27:53 - INFO - __main__ - Step 44504: {'lr': 0.00040496928164938614, 'samples': 8544768, 'steps': 44503, 'loss/train': 1.2654181718826294} -11/07/2021 03:27:54 - INFO - __main__ - Step 44505: {'lr': 0.0004049651174180744, 'samples': 8544960, 'steps': 44504, 'loss/train': 1.4537317752838135} -11/07/2021 03:27:54 - INFO - __main__ - Step 44506: {'lr': 0.00040496095311693775, 'samples': 8545152, 'steps': 44505, 'loss/train': 1.857408881187439} -11/07/2021 03:27:55 - INFO - __main__ - Step 44507: {'lr': 0.0004049567887459781, 'samples': 8545344, 'steps': 44506, 'loss/train': 1.611707091331482} -11/07/2021 03:27:56 - INFO - __main__ - Step 44508: {'lr': 0.0004049526243051973, 'samples': 8545536, 'steps': 44507, 'loss/train': 1.5558937788009644} -11/07/2021 03:27:56 - INFO - __main__ - Step 44509: {'lr': 0.0004049484597945973, 'samples': 8545728, 'steps': 44508, 'loss/train': 2.009676218032837} -11/07/2021 03:27:56 - INFO - __main__ - Step 44510: {'lr': 0.00040494429521417983, 'samples': 8545920, 'steps': 44509, 'loss/train': 1.0804678201675415} -11/07/2021 03:27:57 - INFO - __main__ - Step 44511: {'lr': 0.0004049401305639469, 'samples': 8546112, 'steps': 44510, 'loss/train': 1.7514135837554932} -11/07/2021 03:27:57 - INFO - __main__ - Step 44512: {'lr': 0.00040493596584390034, 'samples': 8546304, 'steps': 44511, 'loss/train': 1.0365068912506104} -11/07/2021 03:27:58 - INFO - __main__ - Step 44513: {'lr': 0.00040493180105404203, 'samples': 8546496, 'steps': 44512, 'loss/train': 1.2823036909103394} -11/07/2021 03:27:58 - INFO - __main__ - Step 44514: {'lr': 0.0004049276361943738, 'samples': 8546688, 'steps': 44513, 'loss/train': 1.1235660314559937} -11/07/2021 03:27:59 - INFO - __main__ - Step 44515: {'lr': 0.0004049234712648976, 'samples': 8546880, 'steps': 44514, 'loss/train': 1.4431331157684326} -11/07/2021 03:27:59 - INFO - __main__ - Step 44516: {'lr': 0.00040491930626561525, 'samples': 8547072, 'steps': 44515, 'loss/train': 1.423165202140808} -11/07/2021 03:27:59 - INFO - __main__ - Step 44517: {'lr': 0.00040491514119652875, 'samples': 8547264, 'steps': 44516, 'loss/train': 1.4906201362609863} -11/07/2021 03:28:01 - INFO - __main__ - Step 44518: {'lr': 0.00040491097605763974, 'samples': 8547456, 'steps': 44517, 'loss/train': 1.781027913093567} -11/07/2021 03:28:01 - INFO - __main__ - Step 44519: {'lr': 0.00040490681084895034, 'samples': 8547648, 'steps': 44518, 'loss/train': 1.086724042892456} -11/07/2021 03:28:01 - INFO - __main__ - Step 44520: {'lr': 0.00040490264557046217, 'samples': 8547840, 'steps': 44519, 'loss/train': 1.5045785903930664} -11/07/2021 03:28:02 - INFO - __main__ - Step 44521: {'lr': 0.0004048984802221774, 'samples': 8548032, 'steps': 44520, 'loss/train': 1.6920466423034668} -11/07/2021 03:28:02 - INFO - __main__ - Step 44522: {'lr': 0.0004048943148040977, 'samples': 8548224, 'steps': 44521, 'loss/train': 1.6950204372406006} -11/07/2021 03:28:03 - INFO - __main__ - Step 44523: {'lr': 0.0004048901493162251, 'samples': 8548416, 'steps': 44522, 'loss/train': 1.0734343528747559} -11/07/2021 03:28:03 - INFO - __main__ - Step 44524: {'lr': 0.00040488598375856133, 'samples': 8548608, 'steps': 44523, 'loss/train': 1.0315029621124268} -11/07/2021 03:28:04 - INFO - __main__ - Step 44525: {'lr': 0.0004048818181311083, 'samples': 8548800, 'steps': 44524, 'loss/train': 1.529782772064209} -11/07/2021 03:28:04 - INFO - __main__ - Step 44526: {'lr': 0.000404877652433868, 'samples': 8548992, 'steps': 44525, 'loss/train': 1.3307926654815674} -11/07/2021 03:28:04 - INFO - __main__ - Step 44527: {'lr': 0.0004048734866668421, 'samples': 8549184, 'steps': 44526, 'loss/train': 1.581064224243164} -11/07/2021 03:28:05 - INFO - __main__ - Step 44528: {'lr': 0.0004048693208300327, 'samples': 8549376, 'steps': 44527, 'loss/train': 1.7866863012313843} -11/07/2021 03:28:06 - INFO - __main__ - Step 44529: {'lr': 0.00040486515492344145, 'samples': 8549568, 'steps': 44528, 'loss/train': 1.6121472120285034} -11/07/2021 03:28:06 - INFO - __main__ - Step 44530: {'lr': 0.00040486098894707044, 'samples': 8549760, 'steps': 44529, 'loss/train': 0.9334121346473694} -11/07/2021 03:28:06 - INFO - __main__ - Step 44531: {'lr': 0.00040485682290092144, 'samples': 8549952, 'steps': 44530, 'loss/train': 1.5065734386444092} -11/07/2021 03:28:07 - INFO - __main__ - Step 44532: {'lr': 0.0004048526567849964, 'samples': 8550144, 'steps': 44531, 'loss/train': 1.7208983898162842} -11/07/2021 03:28:08 - INFO - __main__ - Step 44533: {'lr': 0.00040484849059929705, 'samples': 8550336, 'steps': 44532, 'loss/train': 1.720125436782837} -11/07/2021 03:28:08 - INFO - __main__ - Step 44534: {'lr': 0.00040484432434382547, 'samples': 8550528, 'steps': 44533, 'loss/train': 1.2826281785964966} -11/07/2021 03:28:09 - INFO - __main__ - Step 44535: {'lr': 0.0004048401580185833, 'samples': 8550720, 'steps': 44534, 'loss/train': 1.655936598777771} -11/07/2021 03:28:09 - INFO - __main__ - Step 44536: {'lr': 0.00040483599162357257, 'samples': 8550912, 'steps': 44535, 'loss/train': 1.1506872177124023} -11/07/2021 03:28:09 - INFO - __main__ - Step 44537: {'lr': 0.0004048318251587952, 'samples': 8551104, 'steps': 44536, 'loss/train': 1.6509345769882202} -11/07/2021 03:28:10 - INFO - __main__ - Step 44538: {'lr': 0.000404827658624253, 'samples': 8551296, 'steps': 44537, 'loss/train': 1.1471433639526367} -11/07/2021 03:28:11 - INFO - __main__ - Step 44539: {'lr': 0.00040482349201994785, 'samples': 8551488, 'steps': 44538, 'loss/train': 1.1694883108139038} -11/07/2021 03:28:11 - INFO - __main__ - Step 44540: {'lr': 0.00040481932534588153, 'samples': 8551680, 'steps': 44539, 'loss/train': 1.3767096996307373} -11/07/2021 03:28:11 - INFO - __main__ - Step 44541: {'lr': 0.00040481515860205607, 'samples': 8551872, 'steps': 44540, 'loss/train': 1.4552617073059082} -11/07/2021 03:28:12 - INFO - __main__ - Step 44542: {'lr': 0.00040481099178847326, 'samples': 8552064, 'steps': 44541, 'loss/train': 1.4863961935043335} -11/07/2021 03:28:12 - INFO - __main__ - Step 44543: {'lr': 0.000404806824905135, 'samples': 8552256, 'steps': 44542, 'loss/train': 1.2956562042236328} -11/07/2021 03:28:13 - INFO - __main__ - Step 44544: {'lr': 0.0004048026579520433, 'samples': 8552448, 'steps': 44543, 'loss/train': 1.751367449760437} -11/07/2021 03:28:13 - INFO - __main__ - Step 44545: {'lr': 0.00040479849092919974, 'samples': 8552640, 'steps': 44544, 'loss/train': 1.4386411905288696} -11/07/2021 03:28:14 - INFO - __main__ - Step 44546: {'lr': 0.00040479432383660644, 'samples': 8552832, 'steps': 44545, 'loss/train': 1.5601409673690796} -11/07/2021 03:28:14 - INFO - __main__ - Step 44547: {'lr': 0.00040479015667426523, 'samples': 8553024, 'steps': 44546, 'loss/train': 1.5965445041656494} -11/07/2021 03:28:14 - INFO - __main__ - Step 44548: {'lr': 0.00040478598944217794, 'samples': 8553216, 'steps': 44547, 'loss/train': 1.6914118528366089} -11/07/2021 03:28:15 - INFO - __main__ - Step 44549: {'lr': 0.0004047818221403464, 'samples': 8553408, 'steps': 44548, 'loss/train': 1.3184523582458496} -11/07/2021 03:28:16 - INFO - __main__ - Step 44550: {'lr': 0.0004047776547687727, 'samples': 8553600, 'steps': 44549, 'loss/train': 1.451835036277771} -11/07/2021 03:28:16 - INFO - __main__ - Step 44551: {'lr': 0.00040477348732745853, 'samples': 8553792, 'steps': 44550, 'loss/train': 1.5977486371994019} -11/07/2021 03:28:17 - INFO - __main__ - Step 44552: {'lr': 0.0004047693198164058, 'samples': 8553984, 'steps': 44551, 'loss/train': 1.5908708572387695} -11/07/2021 03:28:17 - INFO - __main__ - Step 44553: {'lr': 0.0004047651522356164, 'samples': 8554176, 'steps': 44552, 'loss/train': 1.6753019094467163} -11/07/2021 03:28:17 - INFO - __main__ - Step 44554: {'lr': 0.0004047609845850922, 'samples': 8554368, 'steps': 44553, 'loss/train': 1.3718253374099731} -11/07/2021 03:28:19 - INFO - __main__ - Step 44555: {'lr': 0.0004047568168648351, 'samples': 8554560, 'steps': 44554, 'loss/train': 1.522674798965454} -11/07/2021 03:28:19 - INFO - __main__ - Step 44556: {'lr': 0.00040475264907484696, 'samples': 8554752, 'steps': 44555, 'loss/train': 1.0965365171432495} -11/07/2021 03:28:19 - INFO - __main__ - Step 44557: {'lr': 0.0004047484812151296, 'samples': 8554944, 'steps': 44556, 'loss/train': 1.554131269454956} -11/07/2021 03:28:20 - INFO - __main__ - Step 44558: {'lr': 0.00040474431328568506, 'samples': 8555136, 'steps': 44557, 'loss/train': 1.3718769550323486} -11/07/2021 03:28:20 - INFO - __main__ - Step 44559: {'lr': 0.00040474014528651514, 'samples': 8555328, 'steps': 44558, 'loss/train': 1.8229775428771973} -11/07/2021 03:28:20 - INFO - __main__ - Step 44560: {'lr': 0.00040473597721762164, 'samples': 8555520, 'steps': 44559, 'loss/train': 0.5324205756187439} -11/07/2021 03:28:22 - INFO - __main__ - Step 44561: {'lr': 0.00040473180907900645, 'samples': 8555712, 'steps': 44560, 'loss/train': 0.978965699672699} -11/07/2021 03:28:22 - INFO - __main__ - Step 44562: {'lr': 0.0004047276408706716, 'samples': 8555904, 'steps': 44561, 'loss/train': 1.4872220754623413} -11/07/2021 03:28:22 - INFO - __main__ - Step 44563: {'lr': 0.00040472347259261875, 'samples': 8556096, 'steps': 44562, 'loss/train': 1.306357741355896} -11/07/2021 03:28:23 - INFO - __main__ - Step 44564: {'lr': 0.00040471930424485, 'samples': 8556288, 'steps': 44563, 'loss/train': 0.8524765968322754} -11/07/2021 03:28:23 - INFO - __main__ - Step 44565: {'lr': 0.0004047151358273671, 'samples': 8556480, 'steps': 44564, 'loss/train': 1.5363770723342896} -11/07/2021 03:28:24 - INFO - __main__ - Step 44566: {'lr': 0.00040471096734017185, 'samples': 8556672, 'steps': 44565, 'loss/train': 0.9901103377342224} -11/07/2021 03:28:24 - INFO - __main__ - Step 44567: {'lr': 0.0004047067987832663, 'samples': 8556864, 'steps': 44566, 'loss/train': 1.4449656009674072} -11/07/2021 03:28:25 - INFO - __main__ - Step 44568: {'lr': 0.00040470263015665234, 'samples': 8557056, 'steps': 44567, 'loss/train': 1.0699820518493652} -11/07/2021 03:28:25 - INFO - __main__ - Step 44569: {'lr': 0.00040469846146033164, 'samples': 8557248, 'steps': 44568, 'loss/train': 0.8161872625350952} -11/07/2021 03:28:25 - INFO - __main__ - Step 44570: {'lr': 0.00040469429269430617, 'samples': 8557440, 'steps': 44569, 'loss/train': 0.8928823471069336} -11/07/2021 03:28:26 - INFO - __main__ - Step 44571: {'lr': 0.00040469012385857794, 'samples': 8557632, 'steps': 44570, 'loss/train': 1.259041428565979} -11/07/2021 03:28:27 - INFO - __main__ - Step 44572: {'lr': 0.0004046859549531487, 'samples': 8557824, 'steps': 44571, 'loss/train': 1.3198877573013306} -11/07/2021 03:28:27 - INFO - __main__ - Step 44573: {'lr': 0.0004046817859780203, 'samples': 8558016, 'steps': 44572, 'loss/train': 1.0246363878250122} -11/07/2021 03:28:28 - INFO - __main__ - Step 44574: {'lr': 0.00040467761693319473, 'samples': 8558208, 'steps': 44573, 'loss/train': 1.1041311025619507} -11/07/2021 03:28:28 - INFO - __main__ - Step 44575: {'lr': 0.0004046734478186738, 'samples': 8558400, 'steps': 44574, 'loss/train': 1.3575173616409302} -11/07/2021 03:28:29 - INFO - __main__ - Step 44576: {'lr': 0.0004046692786344594, 'samples': 8558592, 'steps': 44575, 'loss/train': 1.237064003944397} -11/07/2021 03:28:29 - INFO - __main__ - Step 44577: {'lr': 0.0004046651093805534, 'samples': 8558784, 'steps': 44576, 'loss/train': 1.3218896389007568} -11/07/2021 03:28:30 - INFO - __main__ - Step 44578: {'lr': 0.0004046609400569577, 'samples': 8558976, 'steps': 44577, 'loss/train': 1.2574677467346191} -11/07/2021 03:28:30 - INFO - __main__ - Step 44579: {'lr': 0.00040465677066367424, 'samples': 8559168, 'steps': 44578, 'loss/train': 1.6030867099761963} -11/07/2021 03:28:30 - INFO - __main__ - Step 44580: {'lr': 0.0004046526012007047, 'samples': 8559360, 'steps': 44579, 'loss/train': 1.4407395124435425} -11/07/2021 03:28:31 - INFO - __main__ - Step 44581: {'lr': 0.0004046484316680511, 'samples': 8559552, 'steps': 44580, 'loss/train': 0.8182333111763} -11/07/2021 03:28:32 - INFO - __main__ - Step 44582: {'lr': 0.0004046442620657154, 'samples': 8559744, 'steps': 44581, 'loss/train': 1.3196399211883545} -11/07/2021 03:28:32 - INFO - __main__ - Step 44583: {'lr': 0.00040464009239369925, 'samples': 8559936, 'steps': 44582, 'loss/train': 1.4967689514160156} -11/07/2021 03:28:32 - INFO - __main__ - Step 44584: {'lr': 0.0004046359226520048, 'samples': 8560128, 'steps': 44583, 'loss/train': 1.42673921585083} -11/07/2021 03:28:33 - INFO - __main__ - Step 44585: {'lr': 0.0004046317528406337, 'samples': 8560320, 'steps': 44584, 'loss/train': 0.9684894680976868} -11/07/2021 03:28:34 - INFO - __main__ - Step 44586: {'lr': 0.0004046275829595879, 'samples': 8560512, 'steps': 44585, 'loss/train': 1.9079174995422363} -11/07/2021 03:28:34 - INFO - __main__ - Step 44587: {'lr': 0.0004046234130088694, 'samples': 8560704, 'steps': 44586, 'loss/train': 1.0878044366836548} -11/07/2021 03:28:34 - INFO - __main__ - Step 44588: {'lr': 0.00040461924298847987, 'samples': 8560896, 'steps': 44587, 'loss/train': 2.121105432510376} -11/07/2021 03:28:35 - INFO - __main__ - Step 44589: {'lr': 0.0004046150728984214, 'samples': 8561088, 'steps': 44588, 'loss/train': 1.2639451026916504} -11/07/2021 03:28:35 - INFO - __main__ - Step 44590: {'lr': 0.00040461090273869566, 'samples': 8561280, 'steps': 44589, 'loss/train': 1.383887529373169} -11/07/2021 03:28:36 - INFO - __main__ - Step 44591: {'lr': 0.0004046067325093047, 'samples': 8561472, 'steps': 44590, 'loss/train': 1.1634901762008667} -11/07/2021 03:28:37 - INFO - __main__ - Step 44592: {'lr': 0.00040460256221025025, 'samples': 8561664, 'steps': 44591, 'loss/train': 1.2618054151535034} -11/07/2021 03:28:37 - INFO - __main__ - Step 44593: {'lr': 0.00040459839184153436, 'samples': 8561856, 'steps': 44592, 'loss/train': 1.6785650253295898} -11/07/2021 03:28:37 - INFO - __main__ - Step 44594: {'lr': 0.00040459422140315876, 'samples': 8562048, 'steps': 44593, 'loss/train': 1.0582304000854492} -11/07/2021 03:28:38 - INFO - __main__ - Step 44595: {'lr': 0.00040459005089512544, 'samples': 8562240, 'steps': 44594, 'loss/train': 1.5507423877716064} -11/07/2021 03:28:38 - INFO - __main__ - Step 44596: {'lr': 0.0004045858803174362, 'samples': 8562432, 'steps': 44595, 'loss/train': 1.3976720571517944} -11/07/2021 03:28:39 - INFO - __main__ - Step 44597: {'lr': 0.0004045817096700929, 'samples': 8562624, 'steps': 44596, 'loss/train': 1.7540621757507324} -11/07/2021 03:28:39 - INFO - __main__ - Step 44598: {'lr': 0.0004045775389530976, 'samples': 8562816, 'steps': 44597, 'loss/train': 1.73148512840271} -11/07/2021 03:28:40 - INFO - __main__ - Step 44599: {'lr': 0.00040457336816645195, 'samples': 8563008, 'steps': 44598, 'loss/train': 1.1353774070739746} -11/07/2021 03:28:40 - INFO - __main__ - Step 44600: {'lr': 0.000404569197310158, 'samples': 8563200, 'steps': 44599, 'loss/train': 1.5680984258651733} -11/07/2021 03:28:40 - INFO - __main__ - Step 44601: {'lr': 0.0004045650263842174, 'samples': 8563392, 'steps': 44600, 'loss/train': 1.0853443145751953} -11/07/2021 03:28:41 - INFO - __main__ - Step 44602: {'lr': 0.0004045608553886323, 'samples': 8563584, 'steps': 44601, 'loss/train': 1.4845424890518188} -11/07/2021 03:28:42 - INFO - __main__ - Step 44603: {'lr': 0.0004045566843234044, 'samples': 8563776, 'steps': 44602, 'loss/train': 1.0669195652008057} -11/07/2021 03:28:42 - INFO - __main__ - Step 44604: {'lr': 0.0004045525131885357, 'samples': 8563968, 'steps': 44603, 'loss/train': 1.5860636234283447} -11/07/2021 03:28:42 - INFO - __main__ - Step 44605: {'lr': 0.0004045483419840281, 'samples': 8564160, 'steps': 44604, 'loss/train': 1.49483060836792} -11/07/2021 03:28:43 - INFO - __main__ - Step 44606: {'lr': 0.00040454417070988325, 'samples': 8564352, 'steps': 44605, 'loss/train': 1.434079647064209} -11/07/2021 03:28:44 - INFO - __main__ - Step 44607: {'lr': 0.0004045399993661033, 'samples': 8564544, 'steps': 44606, 'loss/train': 1.501473069190979} -11/07/2021 03:28:44 - INFO - __main__ - Step 44608: {'lr': 0.00040453582795268994, 'samples': 8564736, 'steps': 44607, 'loss/train': 0.5401839017868042} -11/07/2021 03:28:45 - INFO - __main__ - Step 44609: {'lr': 0.00040453165646964505, 'samples': 8564928, 'steps': 44608, 'loss/train': 1.4329159259796143} -11/07/2021 03:28:45 - INFO - __main__ - Step 44610: {'lr': 0.00040452748491697074, 'samples': 8565120, 'steps': 44609, 'loss/train': 1.2819854021072388} -11/07/2021 03:28:46 - INFO - __main__ - Step 44611: {'lr': 0.00040452331329466864, 'samples': 8565312, 'steps': 44610, 'loss/train': 1.503104329109192} -11/07/2021 03:28:46 - INFO - __main__ - Step 44612: {'lr': 0.0004045191416027407, 'samples': 8565504, 'steps': 44611, 'loss/train': 0.9699654579162598} -11/07/2021 03:28:47 - INFO - __main__ - Step 44613: {'lr': 0.0004045149698411889, 'samples': 8565696, 'steps': 44612, 'loss/train': 0.3859573304653168} -11/07/2021 03:28:47 - INFO - __main__ - Step 44614: {'lr': 0.000404510798010015, 'samples': 8565888, 'steps': 44613, 'loss/train': 2.097834587097168} -11/07/2021 03:28:48 - INFO - __main__ - Step 44615: {'lr': 0.0004045066261092209, 'samples': 8566080, 'steps': 44614, 'loss/train': 1.0142295360565186} -11/07/2021 03:28:48 - INFO - __main__ - Step 44616: {'lr': 0.0004045024541388085, 'samples': 8566272, 'steps': 44615, 'loss/train': 1.4237236976623535} -11/07/2021 03:28:48 - INFO - __main__ - Step 44617: {'lr': 0.0004044982820987797, 'samples': 8566464, 'steps': 44616, 'loss/train': 1.5492023229599} -11/07/2021 03:28:49 - INFO - __main__ - Step 44618: {'lr': 0.0004044941099891364, 'samples': 8566656, 'steps': 44617, 'loss/train': 1.244526743888855} -11/07/2021 03:28:50 - INFO - __main__ - Step 44619: {'lr': 0.0004044899378098803, 'samples': 8566848, 'steps': 44618, 'loss/train': 1.1378777027130127} -11/07/2021 03:28:50 - INFO - __main__ - Step 44620: {'lr': 0.00040448576556101356, 'samples': 8567040, 'steps': 44619, 'loss/train': 1.8612985610961914} -11/07/2021 03:28:51 - INFO - __main__ - Step 44621: {'lr': 0.0004044815932425379, 'samples': 8567232, 'steps': 44620, 'loss/train': 2.050100088119507} -11/07/2021 03:28:51 - INFO - __main__ - Step 44622: {'lr': 0.0004044774208544551, 'samples': 8567424, 'steps': 44621, 'loss/train': 1.3216272592544556} -11/07/2021 03:28:52 - INFO - __main__ - Step 44623: {'lr': 0.00040447324839676727, 'samples': 8567616, 'steps': 44622, 'loss/train': 1.1530163288116455} -11/07/2021 03:28:52 - INFO - __main__ - Step 44624: {'lr': 0.00040446907586947614, 'samples': 8567808, 'steps': 44623, 'loss/train': 1.5983481407165527} -11/07/2021 03:28:53 - INFO - __main__ - Step 44625: {'lr': 0.0004044649032725836, 'samples': 8568000, 'steps': 44624, 'loss/train': 1.199302315711975} -11/07/2021 03:28:53 - INFO - __main__ - Step 44626: {'lr': 0.00040446073060609156, 'samples': 8568192, 'steps': 44625, 'loss/train': 1.1727397441864014} -11/07/2021 03:28:53 - INFO - __main__ - Step 44627: {'lr': 0.00040445655787000196, 'samples': 8568384, 'steps': 44626, 'loss/train': 1.0947909355163574} -11/07/2021 03:28:54 - INFO - __main__ - Step 44628: {'lr': 0.0004044523850643166, 'samples': 8568576, 'steps': 44627, 'loss/train': 1.65569269657135} -11/07/2021 03:28:55 - INFO - __main__ - Step 44629: {'lr': 0.0004044482121890374, 'samples': 8568768, 'steps': 44628, 'loss/train': 1.7430261373519897} -11/07/2021 03:28:55 - INFO - __main__ - Step 44630: {'lr': 0.00040444403924416614, 'samples': 8568960, 'steps': 44629, 'loss/train': 1.1327166557312012} -11/07/2021 03:28:55 - INFO - __main__ - Step 44631: {'lr': 0.00040443986622970486, 'samples': 8569152, 'steps': 44630, 'loss/train': 1.8160648345947266} -11/07/2021 03:28:56 - INFO - __main__ - Step 44632: {'lr': 0.0004044356931456553, 'samples': 8569344, 'steps': 44631, 'loss/train': 1.0969573259353638} -11/07/2021 03:28:57 - INFO - __main__ - Step 44633: {'lr': 0.00040443151999201946, 'samples': 8569536, 'steps': 44632, 'loss/train': 1.370672345161438} -11/07/2021 03:28:57 - INFO - __main__ - Step 44634: {'lr': 0.00040442734676879907, 'samples': 8569728, 'steps': 44633, 'loss/train': 1.0866888761520386} -11/07/2021 03:28:57 - INFO - __main__ - Step 44635: {'lr': 0.0004044231734759961, 'samples': 8569920, 'steps': 44634, 'loss/train': 1.5982840061187744} -11/07/2021 03:28:58 - INFO - __main__ - Step 44636: {'lr': 0.00040441900011361256, 'samples': 8570112, 'steps': 44635, 'loss/train': 1.1409536600112915} -11/07/2021 03:28:58 - INFO - __main__ - Step 44637: {'lr': 0.0004044148266816501, 'samples': 8570304, 'steps': 44636, 'loss/train': 1.6011314392089844} -11/07/2021 03:28:59 - INFO - __main__ - Step 44638: {'lr': 0.0004044106531801107, 'samples': 8570496, 'steps': 44637, 'loss/train': 1.7269203662872314} -11/07/2021 03:29:00 - INFO - __main__ - Step 44639: {'lr': 0.0004044064796089963, 'samples': 8570688, 'steps': 44638, 'loss/train': 1.596115231513977} -11/07/2021 03:29:00 - INFO - __main__ - Step 44640: {'lr': 0.0004044023059683087, 'samples': 8570880, 'steps': 44639, 'loss/train': 1.7004880905151367} -11/07/2021 03:29:00 - INFO - __main__ - Step 44641: {'lr': 0.00040439813225804977, 'samples': 8571072, 'steps': 44640, 'loss/train': 1.777889609336853} -11/07/2021 03:29:01 - INFO - __main__ - Step 44642: {'lr': 0.00040439395847822145, 'samples': 8571264, 'steps': 44641, 'loss/train': 1.8670952320098877} -11/07/2021 03:29:02 - INFO - __main__ - Step 44643: {'lr': 0.00040438978462882557, 'samples': 8571456, 'steps': 44642, 'loss/train': 1.3878732919692993} -11/07/2021 03:29:02 - INFO - __main__ - Step 44644: {'lr': 0.0004043856107098641, 'samples': 8571648, 'steps': 44643, 'loss/train': 1.3951754570007324} -11/07/2021 03:29:02 - INFO - __main__ - Step 44645: {'lr': 0.0004043814367213388, 'samples': 8571840, 'steps': 44644, 'loss/train': 1.39116370677948} -11/07/2021 03:29:03 - INFO - __main__ - Step 44646: {'lr': 0.00040437726266325164, 'samples': 8572032, 'steps': 44645, 'loss/train': 1.547196388244629} -11/07/2021 03:29:03 - INFO - __main__ - Step 44647: {'lr': 0.00040437308853560444, 'samples': 8572224, 'steps': 44646, 'loss/train': 1.3838136196136475} -11/07/2021 03:29:04 - INFO - __main__ - Step 44648: {'lr': 0.0004043689143383991, 'samples': 8572416, 'steps': 44647, 'loss/train': 1.6577091217041016} -11/07/2021 03:29:04 - INFO - __main__ - Step 44649: {'lr': 0.00040436474007163754, 'samples': 8572608, 'steps': 44648, 'loss/train': 1.0719048976898193} -11/07/2021 03:29:05 - INFO - __main__ - Step 44650: {'lr': 0.0004043605657353216, 'samples': 8572800, 'steps': 44649, 'loss/train': 1.302512288093567} -11/07/2021 03:29:05 - INFO - __main__ - Step 44651: {'lr': 0.00040435639132945314, 'samples': 8572992, 'steps': 44650, 'loss/train': 1.2456927299499512} -11/07/2021 03:29:05 - INFO - __main__ - Step 44652: {'lr': 0.0004043522168540341, 'samples': 8573184, 'steps': 44651, 'loss/train': 1.5196424722671509} -11/07/2021 03:29:06 - INFO - __main__ - Step 44653: {'lr': 0.0004043480423090664, 'samples': 8573376, 'steps': 44652, 'loss/train': 1.4495714902877808} -11/07/2021 03:29:07 - INFO - __main__ - Step 44654: {'lr': 0.0004043438676945518, 'samples': 8573568, 'steps': 44653, 'loss/train': 1.6864550113677979} -11/07/2021 03:29:07 - INFO - __main__ - Step 44655: {'lr': 0.0004043396930104922, 'samples': 8573760, 'steps': 44654, 'loss/train': 1.440232515335083} -11/07/2021 03:29:07 - INFO - __main__ - Step 44656: {'lr': 0.0004043355182568895, 'samples': 8573952, 'steps': 44655, 'loss/train': 1.5735957622528076} -11/07/2021 03:29:08 - INFO - __main__ - Step 44657: {'lr': 0.00040433134343374565, 'samples': 8574144, 'steps': 44656, 'loss/train': 1.6642217636108398} -11/07/2021 03:29:08 - INFO - __main__ - Step 44658: {'lr': 0.0004043271685410625, 'samples': 8574336, 'steps': 44657, 'loss/train': 1.1298478841781616} -11/07/2021 03:29:09 - INFO - __main__ - Step 44659: {'lr': 0.00040432299357884185, 'samples': 8574528, 'steps': 44658, 'loss/train': 1.385873794555664} -11/07/2021 03:29:10 - INFO - __main__ - Step 44660: {'lr': 0.0004043188185470856, 'samples': 8574720, 'steps': 44659, 'loss/train': 1.2078728675842285} -11/07/2021 03:29:10 - INFO - __main__ - Step 44661: {'lr': 0.00040431464344579585, 'samples': 8574912, 'steps': 44660, 'loss/train': 1.7153549194335938} -11/07/2021 03:29:10 - INFO - __main__ - Step 44662: {'lr': 0.00040431046827497415, 'samples': 8575104, 'steps': 44661, 'loss/train': 1.582525610923767} -11/07/2021 03:29:11 - INFO - __main__ - Step 44663: {'lr': 0.00040430629303462256, 'samples': 8575296, 'steps': 44662, 'loss/train': 1.4888883829116821} -11/07/2021 03:29:12 - INFO - __main__ - Step 44664: {'lr': 0.000404302117724743, 'samples': 8575488, 'steps': 44663, 'loss/train': 1.955739974975586} -11/07/2021 03:29:12 - INFO - __main__ - Step 44665: {'lr': 0.00040429794234533726, 'samples': 8575680, 'steps': 44664, 'loss/train': 1.2550443410873413} -11/07/2021 03:29:12 - INFO - __main__ - Step 44666: {'lr': 0.0004042937668964072, 'samples': 8575872, 'steps': 44665, 'loss/train': 2.086137056350708} -11/07/2021 03:29:13 - INFO - __main__ - Step 44667: {'lr': 0.00040428959137795475, 'samples': 8576064, 'steps': 44666, 'loss/train': 1.512468695640564} -11/07/2021 03:29:13 - INFO - __main__ - Step 44668: {'lr': 0.0004042854157899818, 'samples': 8576256, 'steps': 44667, 'loss/train': 1.9976961612701416} -11/07/2021 03:29:13 - INFO - __main__ - Step 44669: {'lr': 0.0004042812401324902, 'samples': 8576448, 'steps': 44668, 'loss/train': 1.7271101474761963} -11/07/2021 03:29:14 - INFO - __main__ - Step 44670: {'lr': 0.0004042770644054819, 'samples': 8576640, 'steps': 44669, 'loss/train': 1.6623976230621338} -11/07/2021 03:29:15 - INFO - __main__ - Step 44671: {'lr': 0.0004042728886089587, 'samples': 8576832, 'steps': 44670, 'loss/train': 1.8340626955032349} -11/07/2021 03:29:15 - INFO - __main__ - Step 44672: {'lr': 0.00040426871274292257, 'samples': 8577024, 'steps': 44671, 'loss/train': 1.5917364358901978} -11/07/2021 03:29:16 - INFO - __main__ - Step 44673: {'lr': 0.00040426453680737534, 'samples': 8577216, 'steps': 44672, 'loss/train': 1.7523205280303955} -11/07/2021 03:29:16 - INFO - __main__ - Step 44674: {'lr': 0.0004042603608023189, 'samples': 8577408, 'steps': 44673, 'loss/train': 1.5502620935440063} -11/07/2021 03:29:17 - INFO - __main__ - Step 44675: {'lr': 0.00040425618472775504, 'samples': 8577600, 'steps': 44674, 'loss/train': 1.4467202425003052} -11/07/2021 03:29:17 - INFO - __main__ - Step 44676: {'lr': 0.0004042520085836857, 'samples': 8577792, 'steps': 44675, 'loss/train': 1.835953712463379} -11/07/2021 03:29:18 - INFO - __main__ - Step 44677: {'lr': 0.0004042478323701129, 'samples': 8577984, 'steps': 44676, 'loss/train': 1.275037169456482} -11/07/2021 03:29:18 - INFO - __main__ - Step 44678: {'lr': 0.00040424365608703836, 'samples': 8578176, 'steps': 44677, 'loss/train': 1.4688793420791626} -11/07/2021 03:29:18 - INFO - __main__ - Step 44679: {'lr': 0.00040423947973446404, 'samples': 8578368, 'steps': 44678, 'loss/train': 1.7626153230667114} -11/07/2021 03:29:19 - INFO - __main__ - Step 44680: {'lr': 0.00040423530331239177, 'samples': 8578560, 'steps': 44679, 'loss/train': 1.0789210796356201} -11/07/2021 03:29:20 - INFO - __main__ - Step 44681: {'lr': 0.0004042311268208234, 'samples': 8578752, 'steps': 44680, 'loss/train': 2.3214893341064453} -11/07/2021 03:29:20 - INFO - __main__ - Step 44682: {'lr': 0.00040422695025976084, 'samples': 8578944, 'steps': 44681, 'loss/train': 1.3355746269226074} -11/07/2021 03:29:21 - INFO - __main__ - Step 44683: {'lr': 0.00040422277362920614, 'samples': 8579136, 'steps': 44682, 'loss/train': 0.9555754661560059} -11/07/2021 03:29:21 - INFO - __main__ - Step 44684: {'lr': 0.0004042185969291609, 'samples': 8579328, 'steps': 44683, 'loss/train': 1.8307428359985352} -11/07/2021 03:29:22 - INFO - __main__ - Step 44685: {'lr': 0.00040421442015962727, 'samples': 8579520, 'steps': 44684, 'loss/train': 1.598419189453125} -11/07/2021 03:29:22 - INFO - __main__ - Step 44686: {'lr': 0.0004042102433206069, 'samples': 8579712, 'steps': 44685, 'loss/train': 1.1682043075561523} -11/07/2021 03:29:23 - INFO - __main__ - Step 44687: {'lr': 0.0004042060664121018, 'samples': 8579904, 'steps': 44686, 'loss/train': 0.7249529361724854} -11/07/2021 03:29:23 - INFO - __main__ - Step 44688: {'lr': 0.00040420188943411385, 'samples': 8580096, 'steps': 44687, 'loss/train': 1.834280014038086} -11/07/2021 03:29:23 - INFO - __main__ - Step 44689: {'lr': 0.0004041977123866448, 'samples': 8580288, 'steps': 44688, 'loss/train': 1.1947107315063477} -11/07/2021 03:29:24 - INFO - __main__ - Step 44690: {'lr': 0.0004041935352696968, 'samples': 8580480, 'steps': 44689, 'loss/train': 1.2123805284500122} -11/07/2021 03:29:25 - INFO - __main__ - Step 44691: {'lr': 0.00040418935808327153, 'samples': 8580672, 'steps': 44690, 'loss/train': 0.9247638583183289} -11/07/2021 03:29:25 - INFO - __main__ - Step 44692: {'lr': 0.00040418518082737087, 'samples': 8580864, 'steps': 44691, 'loss/train': 1.1153234243392944} -11/07/2021 03:29:25 - INFO - __main__ - Step 44693: {'lr': 0.0004041810035019967, 'samples': 8581056, 'steps': 44692, 'loss/train': 1.3872288465499878} -11/07/2021 03:29:26 - INFO - __main__ - Step 44694: {'lr': 0.00040417682610715107, 'samples': 8581248, 'steps': 44693, 'loss/train': 1.0482349395751953} -11/07/2021 03:29:27 - INFO - __main__ - Step 44695: {'lr': 0.00040417264864283563, 'samples': 8581440, 'steps': 44694, 'loss/train': 1.252543568611145} -11/07/2021 03:29:27 - INFO - __main__ - Step 44696: {'lr': 0.00040416847110905243, 'samples': 8581632, 'steps': 44695, 'loss/train': 1.1403671503067017} -11/07/2021 03:29:28 - INFO - __main__ - Step 44697: {'lr': 0.0004041642935058033, 'samples': 8581824, 'steps': 44696, 'loss/train': 1.35580313205719} -11/07/2021 03:29:28 - INFO - __main__ - Step 44698: {'lr': 0.0004041601158330901, 'samples': 8582016, 'steps': 44697, 'loss/train': 1.7104305028915405} -11/07/2021 03:29:28 - INFO - __main__ - Step 44699: {'lr': 0.0004041559380909148, 'samples': 8582208, 'steps': 44698, 'loss/train': 1.700950264930725} -11/07/2021 03:29:29 - INFO - __main__ - Step 44700: {'lr': 0.00040415176027927915, 'samples': 8582400, 'steps': 44699, 'loss/train': 1.3662071228027344} -11/07/2021 03:29:31 - INFO - __main__ - Step 44701: {'lr': 0.00040414758239818506, 'samples': 8582592, 'steps': 44700, 'loss/train': 1.6446884870529175} -11/07/2021 03:29:31 - INFO - __main__ - Step 44702: {'lr': 0.00040414340444763455, 'samples': 8582784, 'steps': 44701, 'loss/train': 1.5361683368682861} -11/07/2021 03:29:32 - INFO - __main__ - Step 44703: {'lr': 0.0004041392264276292, 'samples': 8582976, 'steps': 44702, 'loss/train': 1.8980095386505127} -11/07/2021 03:29:32 - INFO - __main__ - Step 44704: {'lr': 0.00040413504833817127, 'samples': 8583168, 'steps': 44703, 'loss/train': 1.8210697174072266} -11/07/2021 03:29:32 - INFO - __main__ - Step 44705: {'lr': 0.0004041308701792625, 'samples': 8583360, 'steps': 44704, 'loss/train': 1.8195379972457886} -11/07/2021 03:29:33 - INFO - __main__ - Step 44706: {'lr': 0.00040412669195090466, 'samples': 8583552, 'steps': 44705, 'loss/train': 1.787896752357483} -11/07/2021 03:29:33 - INFO - __main__ - Step 44707: {'lr': 0.0004041225136530997, 'samples': 8583744, 'steps': 44706, 'loss/train': 1.7658010721206665} -11/07/2021 03:29:34 - INFO - __main__ - Step 44708: {'lr': 0.0004041183352858495, 'samples': 8583936, 'steps': 44707, 'loss/train': 1.7904207706451416} -11/07/2021 03:29:34 - INFO - __main__ - Step 44709: {'lr': 0.00040411415684915596, 'samples': 8584128, 'steps': 44708, 'loss/train': 1.2527177333831787} -11/07/2021 03:29:35 - INFO - __main__ - Step 44710: {'lr': 0.000404109978343021, 'samples': 8584320, 'steps': 44709, 'loss/train': 1.5017738342285156} -11/07/2021 03:29:35 - INFO - __main__ - Step 44711: {'lr': 0.0004041057997674464, 'samples': 8584512, 'steps': 44710, 'loss/train': 1.3378225564956665} -11/07/2021 03:29:36 - INFO - __main__ - Step 44712: {'lr': 0.0004041016211224342, 'samples': 8584704, 'steps': 44711, 'loss/train': 1.3807090520858765} -11/07/2021 03:29:37 - INFO - __main__ - Step 44713: {'lr': 0.0004040974424079862, 'samples': 8584896, 'steps': 44712, 'loss/train': 1.5382866859436035} -11/07/2021 03:29:37 - INFO - __main__ - Step 44714: {'lr': 0.00040409326362410416, 'samples': 8585088, 'steps': 44713, 'loss/train': 1.2872508764266968} -11/07/2021 03:29:37 - INFO - __main__ - Step 44715: {'lr': 0.0004040890847707901, 'samples': 8585280, 'steps': 44714, 'loss/train': 1.6032570600509644} -11/07/2021 03:29:38 - INFO - __main__ - Step 44716: {'lr': 0.0004040849058480459, 'samples': 8585472, 'steps': 44715, 'loss/train': 0.18380995094776154} -11/07/2021 03:29:38 - INFO - __main__ - Step 44717: {'lr': 0.0004040807268558734, 'samples': 8585664, 'steps': 44716, 'loss/train': 1.8361215591430664} -11/07/2021 03:29:38 - INFO - __main__ - Step 44718: {'lr': 0.0004040765477942745, 'samples': 8585856, 'steps': 44717, 'loss/train': 1.7135276794433594} -11/07/2021 03:29:39 - INFO - __main__ - Step 44719: {'lr': 0.0004040723686632512, 'samples': 8586048, 'steps': 44718, 'loss/train': 1.422973394393921} -11/07/2021 03:29:40 - INFO - __main__ - Step 44720: {'lr': 0.00040406818946280514, 'samples': 8586240, 'steps': 44719, 'loss/train': 0.0921250507235527} -11/07/2021 03:29:40 - INFO - __main__ - Step 44721: {'lr': 0.0004040640101929384, 'samples': 8586432, 'steps': 44720, 'loss/train': 1.2875210046768188} -11/07/2021 03:29:41 - INFO - __main__ - Step 44722: {'lr': 0.0004040598308536527, 'samples': 8586624, 'steps': 44721, 'loss/train': 1.5017659664154053} -11/07/2021 03:29:41 - INFO - __main__ - Step 44723: {'lr': 0.0004040556514449501, 'samples': 8586816, 'steps': 44722, 'loss/train': 1.0461225509643555} -11/07/2021 03:29:42 - INFO - __main__ - Step 44724: {'lr': 0.0004040514719668324, 'samples': 8587008, 'steps': 44723, 'loss/train': 1.646589756011963} -11/07/2021 03:29:42 - INFO - __main__ - Step 44725: {'lr': 0.00040404729241930144, 'samples': 8587200, 'steps': 44724, 'loss/train': 1.349840521812439} -11/07/2021 03:29:43 - INFO - __main__ - Step 44726: {'lr': 0.0004040431128023592, 'samples': 8587392, 'steps': 44725, 'loss/train': 1.336923599243164} -11/07/2021 03:29:43 - INFO - __main__ - Step 44727: {'lr': 0.0004040389331160075, 'samples': 8587584, 'steps': 44726, 'loss/train': 1.6357241868972778} -11/07/2021 03:29:43 - INFO - __main__ - Step 44728: {'lr': 0.00040403475336024816, 'samples': 8587776, 'steps': 44727, 'loss/train': 1.8353484869003296} -11/07/2021 03:29:45 - INFO - __main__ - Step 44729: {'lr': 0.0004040305735350832, 'samples': 8587968, 'steps': 44728, 'loss/train': 1.692384123802185} -11/07/2021 03:29:45 - INFO - __main__ - Step 44730: {'lr': 0.00040402639364051443, 'samples': 8588160, 'steps': 44729, 'loss/train': 1.8110960721969604} -11/07/2021 03:29:45 - INFO - __main__ - Step 44731: {'lr': 0.0004040222136765437, 'samples': 8588352, 'steps': 44730, 'loss/train': 1.1847339868545532} -11/07/2021 03:29:46 - INFO - __main__ - Step 44732: {'lr': 0.000404018033643173, 'samples': 8588544, 'steps': 44731, 'loss/train': 1.5125484466552734} -11/07/2021 03:29:46 - INFO - __main__ - Step 44733: {'lr': 0.00040401385354040415, 'samples': 8588736, 'steps': 44732, 'loss/train': 1.4958770275115967} -11/07/2021 03:29:46 - INFO - __main__ - Step 44734: {'lr': 0.00040400967336823903, 'samples': 8588928, 'steps': 44733, 'loss/train': 1.5879772901535034} -11/07/2021 03:29:47 - INFO - __main__ - Step 44735: {'lr': 0.0004040054931266795, 'samples': 8589120, 'steps': 44734, 'loss/train': 1.4642417430877686} -11/07/2021 03:29:48 - INFO - __main__ - Step 44736: {'lr': 0.0004040013128157275, 'samples': 8589312, 'steps': 44735, 'loss/train': 1.6132031679153442} -11/07/2021 03:29:48 - INFO - __main__ - Step 44737: {'lr': 0.00040399713243538483, 'samples': 8589504, 'steps': 44736, 'loss/train': 0.6882599592208862} -11/07/2021 03:29:48 - INFO - __main__ - Step 44738: {'lr': 0.00040399295198565344, 'samples': 8589696, 'steps': 44737, 'loss/train': 1.5418144464492798} -11/07/2021 03:29:49 - INFO - __main__ - Step 44739: {'lr': 0.0004039887714665352, 'samples': 8589888, 'steps': 44738, 'loss/train': 1.4107799530029297} -11/07/2021 03:29:50 - INFO - __main__ - Step 44740: {'lr': 0.0004039845908780321, 'samples': 8590080, 'steps': 44739, 'loss/train': 1.3109534978866577} -11/07/2021 03:29:50 - INFO - __main__ - Step 44741: {'lr': 0.00040398041022014585, 'samples': 8590272, 'steps': 44740, 'loss/train': 1.3458914756774902} -11/07/2021 03:29:51 - INFO - __main__ - Step 44742: {'lr': 0.0004039762294928784, 'samples': 8590464, 'steps': 44741, 'loss/train': 1.0974065065383911} -11/07/2021 03:29:51 - INFO - __main__ - Step 44743: {'lr': 0.0004039720486962316, 'samples': 8590656, 'steps': 44742, 'loss/train': 1.3014174699783325} -11/07/2021 03:29:51 - INFO - __main__ - Step 44744: {'lr': 0.00040396786783020747, 'samples': 8590848, 'steps': 44743, 'loss/train': 1.29957115650177} -11/07/2021 03:29:52 - INFO - __main__ - Step 44745: {'lr': 0.00040396368689480766, 'samples': 8591040, 'steps': 44744, 'loss/train': 1.4198511838912964} -11/07/2021 03:29:53 - INFO - __main__ - Step 44746: {'lr': 0.00040395950589003425, 'samples': 8591232, 'steps': 44745, 'loss/train': 1.7467460632324219} -11/07/2021 03:29:53 - INFO - __main__ - Step 44747: {'lr': 0.00040395532481588914, 'samples': 8591424, 'steps': 44746, 'loss/train': 1.654396414756775} -11/07/2021 03:29:53 - INFO - __main__ - Step 44748: {'lr': 0.00040395114367237407, 'samples': 8591616, 'steps': 44747, 'loss/train': 1.1026297807693481} -11/07/2021 03:29:54 - INFO - __main__ - Step 44749: {'lr': 0.00040394696245949093, 'samples': 8591808, 'steps': 44748, 'loss/train': 1.638931155204773} -11/07/2021 03:29:55 - INFO - __main__ - Step 44750: {'lr': 0.0004039427811772417, 'samples': 8592000, 'steps': 44749, 'loss/train': 1.6664801836013794} -11/07/2021 03:29:55 - INFO - __main__ - Step 44751: {'lr': 0.0004039385998256283, 'samples': 8592192, 'steps': 44750, 'loss/train': 1.2520142793655396} -11/07/2021 03:29:55 - INFO - __main__ - Step 44752: {'lr': 0.0004039344184046525, 'samples': 8592384, 'steps': 44751, 'loss/train': 1.4764256477355957} -11/07/2021 03:29:56 - INFO - __main__ - Step 44753: {'lr': 0.00040393023691431617, 'samples': 8592576, 'steps': 44752, 'loss/train': 1.5981147289276123} -11/07/2021 03:29:56 - INFO - __main__ - Step 44754: {'lr': 0.00040392605535462137, 'samples': 8592768, 'steps': 44753, 'loss/train': 1.1540776491165161} -11/07/2021 03:29:57 - INFO - __main__ - Step 44755: {'lr': 0.00040392187372556977, 'samples': 8592960, 'steps': 44754, 'loss/train': 1.6268656253814697} -11/07/2021 03:29:57 - INFO - __main__ - Step 44756: {'lr': 0.00040391769202716333, 'samples': 8593152, 'steps': 44755, 'loss/train': 1.6105319261550903} -11/07/2021 03:29:58 - INFO - __main__ - Step 44757: {'lr': 0.00040391351025940406, 'samples': 8593344, 'steps': 44756, 'loss/train': 1.4816174507141113} -11/07/2021 03:29:58 - INFO - __main__ - Step 44758: {'lr': 0.00040390932842229363, 'samples': 8593536, 'steps': 44757, 'loss/train': 1.7078075408935547} -11/07/2021 03:29:59 - INFO - __main__ - Step 44759: {'lr': 0.0004039051465158341, 'samples': 8593728, 'steps': 44758, 'loss/train': 1.6025429964065552} -11/07/2021 03:29:59 - INFO - __main__ - Step 44760: {'lr': 0.0004039009645400272, 'samples': 8593920, 'steps': 44759, 'loss/train': 1.4869424104690552} -11/07/2021 03:30:00 - INFO - __main__ - Step 44761: {'lr': 0.00040389678249487504, 'samples': 8594112, 'steps': 44760, 'loss/train': 1.7148278951644897} -11/07/2021 03:30:00 - INFO - __main__ - Step 44762: {'lr': 0.00040389260038037924, 'samples': 8594304, 'steps': 44761, 'loss/train': 0.8487159609794617} -11/07/2021 03:30:01 - INFO - __main__ - Step 44763: {'lr': 0.0004038884181965419, 'samples': 8594496, 'steps': 44762, 'loss/train': 1.2550697326660156} -11/07/2021 03:30:01 - INFO - __main__ - Step 44764: {'lr': 0.0004038842359433647, 'samples': 8594688, 'steps': 44763, 'loss/train': 1.3257486820220947} -11/07/2021 03:30:01 - INFO - __main__ - Step 44765: {'lr': 0.0004038800536208497, 'samples': 8594880, 'steps': 44764, 'loss/train': 1.4142779111862183} -11/07/2021 03:30:02 - INFO - __main__ - Step 44766: {'lr': 0.00040387587122899877, 'samples': 8595072, 'steps': 44765, 'loss/train': 1.2997912168502808} -11/07/2021 03:30:03 - INFO - __main__ - Step 44767: {'lr': 0.0004038716887678137, 'samples': 8595264, 'steps': 44766, 'loss/train': 1.6130790710449219} -11/07/2021 03:30:03 - INFO - __main__ - Step 44768: {'lr': 0.0004038675062372964, 'samples': 8595456, 'steps': 44767, 'loss/train': 1.2441644668579102} -11/07/2021 03:30:03 - INFO - __main__ - Step 44769: {'lr': 0.00040386332363744884, 'samples': 8595648, 'steps': 44768, 'loss/train': 1.7680883407592773} -11/07/2021 03:30:04 - INFO - __main__ - Step 44770: {'lr': 0.0004038591409682728, 'samples': 8595840, 'steps': 44769, 'loss/train': 1.4171826839447021} -11/07/2021 03:30:05 - INFO - __main__ - Step 44771: {'lr': 0.00040385495822977015, 'samples': 8596032, 'steps': 44770, 'loss/train': 1.5394569635391235} -11/07/2021 03:30:05 - INFO - __main__ - Step 44772: {'lr': 0.00040385077542194294, 'samples': 8596224, 'steps': 44771, 'loss/train': 1.4642919301986694} -11/07/2021 03:30:05 - INFO - __main__ - Step 44773: {'lr': 0.0004038465925447929, 'samples': 8596416, 'steps': 44772, 'loss/train': 1.5884572267532349} -11/07/2021 03:30:06 - INFO - __main__ - Step 44774: {'lr': 0.00040384240959832196, 'samples': 8596608, 'steps': 44773, 'loss/train': 1.3437590599060059} -11/07/2021 03:30:06 - INFO - __main__ - Step 44775: {'lr': 0.000403838226582532, 'samples': 8596800, 'steps': 44774, 'loss/train': 1.4359939098358154} -11/07/2021 03:30:07 - INFO - __main__ - Step 44776: {'lr': 0.00040383404349742484, 'samples': 8596992, 'steps': 44775, 'loss/train': 1.4305771589279175} -11/07/2021 03:30:08 - INFO - __main__ - Step 44777: {'lr': 0.0004038298603430025, 'samples': 8597184, 'steps': 44776, 'loss/train': 1.1964409351348877} -11/07/2021 03:30:08 - INFO - __main__ - Step 44778: {'lr': 0.0004038256771192668, 'samples': 8597376, 'steps': 44777, 'loss/train': 1.8335461616516113} -11/07/2021 03:30:08 - INFO - __main__ - Step 44779: {'lr': 0.00040382149382621967, 'samples': 8597568, 'steps': 44778, 'loss/train': 1.5217831134796143} -11/07/2021 03:30:09 - INFO - __main__ - Step 44780: {'lr': 0.00040381731046386295, 'samples': 8597760, 'steps': 44779, 'loss/train': 1.361086130142212} -11/07/2021 03:30:10 - INFO - __main__ - Step 44781: {'lr': 0.0004038131270321984, 'samples': 8597952, 'steps': 44780, 'loss/train': 1.297823429107666} -11/07/2021 03:30:10 - INFO - __main__ - Step 44782: {'lr': 0.0004038089435312281, 'samples': 8598144, 'steps': 44781, 'loss/train': 1.009280800819397} -11/07/2021 03:30:10 - INFO - __main__ - Step 44783: {'lr': 0.0004038047599609539, 'samples': 8598336, 'steps': 44782, 'loss/train': 0.9909611344337463} -11/07/2021 03:30:11 - INFO - __main__ - Step 44784: {'lr': 0.00040380057632137756, 'samples': 8598528, 'steps': 44783, 'loss/train': 1.3801733255386353} -11/07/2021 03:30:11 - INFO - __main__ - Step 44785: {'lr': 0.0004037963926125011, 'samples': 8598720, 'steps': 44784, 'loss/train': 1.8758233785629272} -11/07/2021 03:30:12 - INFO - __main__ - Step 44786: {'lr': 0.00040379220883432644, 'samples': 8598912, 'steps': 44785, 'loss/train': 1.2698369026184082} -11/07/2021 03:30:12 - INFO - __main__ - Step 44787: {'lr': 0.0004037880249868553, 'samples': 8599104, 'steps': 44786, 'loss/train': 1.7087428569793701} -11/07/2021 03:30:13 - INFO - __main__ - Step 44788: {'lr': 0.00040378384107008967, 'samples': 8599296, 'steps': 44787, 'loss/train': 1.9226173162460327} -11/07/2021 03:30:13 - INFO - __main__ - Step 44789: {'lr': 0.00040377965708403133, 'samples': 8599488, 'steps': 44788, 'loss/train': 1.6939905881881714} -11/07/2021 03:30:13 - INFO - __main__ - Step 44790: {'lr': 0.00040377547302868235, 'samples': 8599680, 'steps': 44789, 'loss/train': 5.499805927276611} -11/07/2021 03:30:14 - INFO - __main__ - Step 44791: {'lr': 0.00040377128890404444, 'samples': 8599872, 'steps': 44790, 'loss/train': 1.661346435546875} -11/07/2021 03:30:15 - INFO - __main__ - Step 44792: {'lr': 0.00040376710471011967, 'samples': 8600064, 'steps': 44791, 'loss/train': 1.880703091621399} -11/07/2021 03:30:15 - INFO - __main__ - Step 44793: {'lr': 0.0004037629204469098, 'samples': 8600256, 'steps': 44792, 'loss/train': 1.6165194511413574} -11/07/2021 03:30:16 - INFO - __main__ - Step 44794: {'lr': 0.0004037587361144166, 'samples': 8600448, 'steps': 44793, 'loss/train': 1.1653132438659668} -11/07/2021 03:30:16 - INFO - __main__ - Step 44795: {'lr': 0.0004037545517126422, 'samples': 8600640, 'steps': 44794, 'loss/train': 1.2117013931274414} -11/07/2021 03:30:16 - INFO - __main__ - Step 44796: {'lr': 0.0004037503672415883, 'samples': 8600832, 'steps': 44795, 'loss/train': 1.3438433408737183} -11/07/2021 03:30:17 - INFO - __main__ - Step 44797: {'lr': 0.000403746182701257, 'samples': 8601024, 'steps': 44796, 'loss/train': 1.2403674125671387} -11/07/2021 03:30:18 - INFO - __main__ - Step 44798: {'lr': 0.0004037419980916499, 'samples': 8601216, 'steps': 44797, 'loss/train': 1.3725799322128296} -11/07/2021 03:30:18 - INFO - __main__ - Step 44799: {'lr': 0.00040373781341276904, 'samples': 8601408, 'steps': 44798, 'loss/train': 1.3333415985107422} -11/07/2021 03:30:18 - INFO - __main__ - Step 44800: {'lr': 0.00040373362866461633, 'samples': 8601600, 'steps': 44799, 'loss/train': 1.6242492198944092} -11/07/2021 03:30:19 - INFO - __main__ - Step 44801: {'lr': 0.0004037294438471936, 'samples': 8601792, 'steps': 44800, 'loss/train': 1.2437806129455566} -11/07/2021 03:30:20 - INFO - __main__ - Step 44802: {'lr': 0.00040372525896050285, 'samples': 8601984, 'steps': 44801, 'loss/train': 1.6958515644073486} -11/07/2021 03:30:20 - INFO - __main__ - Step 44803: {'lr': 0.0004037210740045457, 'samples': 8602176, 'steps': 44802, 'loss/train': 1.30084228515625} -11/07/2021 03:30:21 - INFO - __main__ - Step 44804: {'lr': 0.0004037168889793243, 'samples': 8602368, 'steps': 44803, 'loss/train': 1.8645272254943848} -11/07/2021 03:30:21 - INFO - __main__ - Step 44805: {'lr': 0.0004037127038848404, 'samples': 8602560, 'steps': 44804, 'loss/train': 1.5042856931686401} -11/07/2021 03:30:21 - INFO - __main__ - Step 44806: {'lr': 0.00040370851872109604, 'samples': 8602752, 'steps': 44805, 'loss/train': 1.5103329420089722} -11/07/2021 03:30:22 - INFO - __main__ - Step 44807: {'lr': 0.0004037043334880929, 'samples': 8602944, 'steps': 44806, 'loss/train': 1.3800625801086426} -11/07/2021 03:30:23 - INFO - __main__ - Step 44808: {'lr': 0.000403700148185833, 'samples': 8603136, 'steps': 44807, 'loss/train': 1.4422687292099} -11/07/2021 03:30:23 - INFO - __main__ - Step 44809: {'lr': 0.00040369596281431816, 'samples': 8603328, 'steps': 44808, 'loss/train': 1.1962133646011353} -11/07/2021 03:30:23 - INFO - __main__ - Step 44810: {'lr': 0.0004036917773735502, 'samples': 8603520, 'steps': 44809, 'loss/train': 1.5136005878448486} -11/07/2021 03:30:24 - INFO - __main__ - Step 44811: {'lr': 0.00040368759186353123, 'samples': 8603712, 'steps': 44810, 'loss/train': 1.7433708906173706} -11/07/2021 03:30:25 - INFO - __main__ - Step 44812: {'lr': 0.0004036834062842629, 'samples': 8603904, 'steps': 44811, 'loss/train': 1.8308992385864258} -11/07/2021 03:30:25 - INFO - __main__ - Step 44813: {'lr': 0.00040367922063574735, 'samples': 8604096, 'steps': 44812, 'loss/train': 1.7019158601760864} -11/07/2021 03:30:26 - INFO - __main__ - Step 44814: {'lr': 0.0004036750349179862, 'samples': 8604288, 'steps': 44813, 'loss/train': 1.2187209129333496} -11/07/2021 03:30:26 - INFO - __main__ - Step 44815: {'lr': 0.00040367084913098153, 'samples': 8604480, 'steps': 44814, 'loss/train': 1.3914854526519775} -11/07/2021 03:30:26 - INFO - __main__ - Step 44816: {'lr': 0.000403666663274735, 'samples': 8604672, 'steps': 44815, 'loss/train': 1.2438373565673828} -11/07/2021 03:30:27 - INFO - __main__ - Step 44817: {'lr': 0.0004036624773492488, 'samples': 8604864, 'steps': 44816, 'loss/train': 1.1171629428863525} -11/07/2021 03:30:28 - INFO - __main__ - Step 44818: {'lr': 0.0004036582913545246, 'samples': 8605056, 'steps': 44817, 'loss/train': 1.2431228160858154} -11/07/2021 03:30:28 - INFO - __main__ - Step 44819: {'lr': 0.0004036541052905643, 'samples': 8605248, 'steps': 44818, 'loss/train': 1.629530906677246} -11/07/2021 03:30:28 - INFO - __main__ - Step 44820: {'lr': 0.0004036499191573699, 'samples': 8605440, 'steps': 44819, 'loss/train': 2.1798417568206787} -11/07/2021 03:30:29 - INFO - __main__ - Step 44821: {'lr': 0.00040364573295494316, 'samples': 8605632, 'steps': 44820, 'loss/train': 1.426156997680664} -11/07/2021 03:30:30 - INFO - __main__ - Step 44822: {'lr': 0.00040364154668328604, 'samples': 8605824, 'steps': 44821, 'loss/train': 1.6849960088729858} -11/07/2021 03:30:30 - INFO - __main__ - Step 44823: {'lr': 0.0004036373603424004, 'samples': 8606016, 'steps': 44822, 'loss/train': 1.3584458827972412} -11/07/2021 03:30:30 - INFO - __main__ - Step 44824: {'lr': 0.00040363317393228814, 'samples': 8606208, 'steps': 44823, 'loss/train': 0.9686586260795593} -11/07/2021 03:30:31 - INFO - __main__ - Step 44825: {'lr': 0.00040362898745295117, 'samples': 8606400, 'steps': 44824, 'loss/train': 1.492126703262329} -11/07/2021 03:30:31 - INFO - __main__ - Step 44826: {'lr': 0.00040362480090439136, 'samples': 8606592, 'steps': 44825, 'loss/train': 1.4815083742141724} -11/07/2021 03:30:32 - INFO - __main__ - Step 44827: {'lr': 0.00040362061428661055, 'samples': 8606784, 'steps': 44826, 'loss/train': 1.5363249778747559} -11/07/2021 03:30:33 - INFO - __main__ - Step 44828: {'lr': 0.0004036164275996107, 'samples': 8606976, 'steps': 44827, 'loss/train': 1.1376135349273682} -11/07/2021 03:30:33 - INFO - __main__ - Step 44829: {'lr': 0.00040361224084339365, 'samples': 8607168, 'steps': 44828, 'loss/train': 1.5848695039749146} -11/07/2021 03:30:33 - INFO - __main__ - Step 44830: {'lr': 0.00040360805401796124, 'samples': 8607360, 'steps': 44829, 'loss/train': 1.6936755180358887} -11/07/2021 03:30:34 - INFO - __main__ - Step 44831: {'lr': 0.0004036038671233154, 'samples': 8607552, 'steps': 44830, 'loss/train': 1.593983769416809} -11/07/2021 03:30:34 - INFO - __main__ - Step 44832: {'lr': 0.00040359968015945814, 'samples': 8607744, 'steps': 44831, 'loss/train': 1.419744849205017} -11/07/2021 03:30:35 - INFO - __main__ - Step 44833: {'lr': 0.0004035954931263912, 'samples': 8607936, 'steps': 44832, 'loss/train': 1.3327523469924927} -11/07/2021 03:30:35 - INFO - __main__ - Step 44834: {'lr': 0.00040359130602411644, 'samples': 8608128, 'steps': 44833, 'loss/train': 1.508933186531067} -11/07/2021 03:30:36 - INFO - __main__ - Step 44835: {'lr': 0.0004035871188526358, 'samples': 8608320, 'steps': 44834, 'loss/train': 1.6264845132827759} -11/07/2021 03:30:36 - INFO - __main__ - Step 44836: {'lr': 0.00040358293161195125, 'samples': 8608512, 'steps': 44835, 'loss/train': 1.378198266029358} -11/07/2021 03:30:37 - INFO - __main__ - Step 44837: {'lr': 0.0004035787443020645, 'samples': 8608704, 'steps': 44836, 'loss/train': 1.2456293106079102} -11/07/2021 03:30:37 - INFO - __main__ - Step 44838: {'lr': 0.00040357455692297765, 'samples': 8608896, 'steps': 44837, 'loss/train': 1.5283297300338745} -11/07/2021 03:30:38 - INFO - __main__ - Step 44839: {'lr': 0.0004035703694746924, 'samples': 8609088, 'steps': 44838, 'loss/train': 1.4481676816940308} -11/07/2021 03:30:38 - INFO - __main__ - Step 44840: {'lr': 0.0004035661819572108, 'samples': 8609280, 'steps': 44839, 'loss/train': 1.4853111505508423} -11/07/2021 03:30:39 - INFO - __main__ - Step 44841: {'lr': 0.0004035619943705345, 'samples': 8609472, 'steps': 44840, 'loss/train': 1.4644232988357544} -11/07/2021 03:30:39 - INFO - __main__ - Step 44842: {'lr': 0.0004035578067146657, 'samples': 8609664, 'steps': 44841, 'loss/train': 0.952649712562561} -11/07/2021 03:30:40 - INFO - __main__ - Step 44843: {'lr': 0.000403553618989606, 'samples': 8609856, 'steps': 44842, 'loss/train': 1.4051940441131592} -11/07/2021 03:30:40 - INFO - __main__ - Step 44844: {'lr': 0.0004035494311953575, 'samples': 8610048, 'steps': 44843, 'loss/train': 1.7837588787078857} -11/07/2021 03:30:41 - INFO - __main__ - Step 44845: {'lr': 0.0004035452433319219, 'samples': 8610240, 'steps': 44844, 'loss/train': 1.64267897605896} -11/07/2021 03:30:41 - INFO - __main__ - Step 44846: {'lr': 0.0004035410553993012, 'samples': 8610432, 'steps': 44845, 'loss/train': 1.8207674026489258} -11/07/2021 03:30:41 - INFO - __main__ - Step 44847: {'lr': 0.00040353686739749733, 'samples': 8610624, 'steps': 44846, 'loss/train': 1.419385552406311} -11/07/2021 03:30:42 - INFO - __main__ - Step 44848: {'lr': 0.0004035326793265121, 'samples': 8610816, 'steps': 44847, 'loss/train': 1.539034366607666} -11/07/2021 03:30:43 - INFO - __main__ - Step 44849: {'lr': 0.0004035284911863474, 'samples': 8611008, 'steps': 44848, 'loss/train': 1.7744563817977905} -11/07/2021 03:30:43 - INFO - __main__ - Step 44850: {'lr': 0.00040352430297700513, 'samples': 8611200, 'steps': 44849, 'loss/train': 1.3370999097824097} -11/07/2021 03:30:43 - INFO - __main__ - Step 44851: {'lr': 0.00040352011469848713, 'samples': 8611392, 'steps': 44850, 'loss/train': 0.7737088203430176} -11/07/2021 03:30:44 - INFO - __main__ - Step 44852: {'lr': 0.00040351592635079535, 'samples': 8611584, 'steps': 44851, 'loss/train': 1.7571678161621094} -11/07/2021 03:30:45 - INFO - __main__ - Step 44853: {'lr': 0.0004035117379339318, 'samples': 8611776, 'steps': 44852, 'loss/train': 1.7419499158859253} -11/07/2021 03:30:45 - INFO - __main__ - Step 44854: {'lr': 0.00040350754944789815, 'samples': 8611968, 'steps': 44853, 'loss/train': 1.3507704734802246} -11/07/2021 03:30:45 - INFO - __main__ - Step 44855: {'lr': 0.0004035033608926963, 'samples': 8612160, 'steps': 44854, 'loss/train': 1.4348763227462769} -11/07/2021 03:30:46 - INFO - __main__ - Step 44856: {'lr': 0.0004034991722683282, 'samples': 8612352, 'steps': 44855, 'loss/train': 1.1511130332946777} -11/07/2021 03:30:46 - INFO - __main__ - Step 44857: {'lr': 0.0004034949835747958, 'samples': 8612544, 'steps': 44856, 'loss/train': 1.2454063892364502} -11/07/2021 03:30:47 - INFO - __main__ - Step 44858: {'lr': 0.00040349079481210096, 'samples': 8612736, 'steps': 44857, 'loss/train': 1.4043110609054565} -11/07/2021 03:30:48 - INFO - __main__ - Step 44859: {'lr': 0.00040348660598024547, 'samples': 8612928, 'steps': 44858, 'loss/train': 1.4020954370498657} -11/07/2021 03:30:48 - INFO - __main__ - Step 44860: {'lr': 0.0004034824170792313, 'samples': 8613120, 'steps': 44859, 'loss/train': 0.940532386302948} -11/07/2021 03:30:48 - INFO - __main__ - Step 44861: {'lr': 0.0004034782281090603, 'samples': 8613312, 'steps': 44860, 'loss/train': 1.7690776586532593} -11/07/2021 03:30:49 - INFO - __main__ - Step 44862: {'lr': 0.00040347403906973445, 'samples': 8613504, 'steps': 44861, 'loss/train': 1.2716156244277954} -11/07/2021 03:30:49 - INFO - __main__ - Step 44863: {'lr': 0.0004034698499612555, 'samples': 8613696, 'steps': 44862, 'loss/train': 1.0258671045303345} -11/07/2021 03:30:50 - INFO - __main__ - Step 44864: {'lr': 0.00040346566078362545, 'samples': 8613888, 'steps': 44863, 'loss/train': 1.5426487922668457} -11/07/2021 03:30:50 - INFO - __main__ - Step 44865: {'lr': 0.0004034614715368461, 'samples': 8614080, 'steps': 44864, 'loss/train': 1.569562554359436} -11/07/2021 03:30:51 - INFO - __main__ - Step 44866: {'lr': 0.0004034572822209194, 'samples': 8614272, 'steps': 44865, 'loss/train': 1.3128806352615356} -11/07/2021 03:30:51 - INFO - __main__ - Step 44867: {'lr': 0.00040345309283584726, 'samples': 8614464, 'steps': 44866, 'loss/train': 1.4803099632263184} -11/07/2021 03:30:51 - INFO - __main__ - Step 44868: {'lr': 0.0004034489033816314, 'samples': 8614656, 'steps': 44867, 'loss/train': 1.3495128154754639} -11/07/2021 03:30:52 - INFO - __main__ - Step 44869: {'lr': 0.00040344471385827396, 'samples': 8614848, 'steps': 44868, 'loss/train': 1.1803743839263916} -11/07/2021 03:30:53 - INFO - __main__ - Step 44870: {'lr': 0.00040344052426577665, 'samples': 8615040, 'steps': 44869, 'loss/train': 1.2572747468948364} -11/07/2021 03:30:53 - INFO - __main__ - Step 44871: {'lr': 0.0004034363346041414, 'samples': 8615232, 'steps': 44870, 'loss/train': 1.3079253435134888} -11/07/2021 03:30:53 - INFO - __main__ - Step 44872: {'lr': 0.0004034321448733701, 'samples': 8615424, 'steps': 44871, 'loss/train': 1.5915842056274414} -11/07/2021 03:30:54 - INFO - __main__ - Step 44873: {'lr': 0.00040342795507346464, 'samples': 8615616, 'steps': 44872, 'loss/train': 1.5641024112701416} -11/07/2021 03:30:55 - INFO - __main__ - Step 44874: {'lr': 0.000403423765204427, 'samples': 8615808, 'steps': 44873, 'loss/train': 1.731332540512085} -11/07/2021 03:30:55 - INFO - __main__ - Step 44875: {'lr': 0.0004034195752662589, 'samples': 8616000, 'steps': 44874, 'loss/train': 1.3966073989868164} -11/07/2021 03:30:55 - INFO - __main__ - Step 44876: {'lr': 0.00040341538525896233, 'samples': 8616192, 'steps': 44875, 'loss/train': 1.4717856645584106} -11/07/2021 03:30:56 - INFO - __main__ - Step 44877: {'lr': 0.0004034111951825391, 'samples': 8616384, 'steps': 44876, 'loss/train': 1.5354030132293701} -11/07/2021 03:30:56 - INFO - __main__ - Step 44878: {'lr': 0.00040340700503699116, 'samples': 8616576, 'steps': 44877, 'loss/train': 1.6030645370483398} -11/07/2021 03:30:57 - INFO - __main__ - Step 44879: {'lr': 0.0004034028148223204, 'samples': 8616768, 'steps': 44878, 'loss/train': 1.5579181909561157} -11/07/2021 03:30:58 - INFO - __main__ - Step 44880: {'lr': 0.0004033986245385288, 'samples': 8616960, 'steps': 44879, 'loss/train': 1.655372977256775} -11/07/2021 03:30:58 - INFO - __main__ - Step 44881: {'lr': 0.0004033944341856181, 'samples': 8617152, 'steps': 44880, 'loss/train': 1.4386367797851562} -11/07/2021 03:30:58 - INFO - __main__ - Step 44882: {'lr': 0.00040339024376359015, 'samples': 8617344, 'steps': 44881, 'loss/train': 0.927916407585144} -11/07/2021 03:30:59 - INFO - __main__ - Step 44883: {'lr': 0.000403386053272447, 'samples': 8617536, 'steps': 44882, 'loss/train': 1.5074671506881714} -11/07/2021 03:31:00 - INFO - __main__ - Step 44884: {'lr': 0.0004033818627121904, 'samples': 8617728, 'steps': 44883, 'loss/train': 1.0531666278839111} -11/07/2021 03:31:00 - INFO - __main__ - Step 44885: {'lr': 0.00040337767208282235, 'samples': 8617920, 'steps': 44884, 'loss/train': 1.7778396606445312} -11/07/2021 03:31:00 - INFO - __main__ - Step 44886: {'lr': 0.00040337348138434466, 'samples': 8618112, 'steps': 44885, 'loss/train': 0.8337576389312744} -11/07/2021 03:31:01 - INFO - __main__ - Step 44887: {'lr': 0.00040336929061675933, 'samples': 8618304, 'steps': 44886, 'loss/train': 1.292196273803711} -11/07/2021 03:31:01 - INFO - __main__ - Step 44888: {'lr': 0.0004033650997800681, 'samples': 8618496, 'steps': 44887, 'loss/train': 1.5180169343948364} -11/07/2021 03:31:02 - INFO - __main__ - Step 44889: {'lr': 0.00040336090887427284, 'samples': 8618688, 'steps': 44888, 'loss/train': 1.934960126876831} -11/07/2021 03:31:02 - INFO - __main__ - Step 44890: {'lr': 0.00040335671789937564, 'samples': 8618880, 'steps': 44889, 'loss/train': 1.5152138471603394} -11/07/2021 03:31:03 - INFO - __main__ - Step 44891: {'lr': 0.00040335252685537817, 'samples': 8619072, 'steps': 44890, 'loss/train': 0.4493248760700226} -11/07/2021 03:31:03 - INFO - __main__ - Step 44892: {'lr': 0.0004033483357422825, 'samples': 8619264, 'steps': 44891, 'loss/train': 1.8648028373718262} -11/07/2021 03:31:03 - INFO - __main__ - Step 44893: {'lr': 0.0004033441445600904, 'samples': 8619456, 'steps': 44892, 'loss/train': 1.6660622358322144} -11/07/2021 03:31:04 - INFO - __main__ - Step 44894: {'lr': 0.0004033399533088038, 'samples': 8619648, 'steps': 44893, 'loss/train': 1.3583667278289795} -11/07/2021 03:31:05 - INFO - __main__ - Step 44895: {'lr': 0.00040333576198842456, 'samples': 8619840, 'steps': 44894, 'loss/train': 1.1685876846313477} -11/07/2021 03:31:05 - INFO - __main__ - Step 44896: {'lr': 0.00040333157059895463, 'samples': 8620032, 'steps': 44895, 'loss/train': 1.2783938646316528} -11/07/2021 03:31:06 - INFO - __main__ - Step 44897: {'lr': 0.0004033273791403959, 'samples': 8620224, 'steps': 44896, 'loss/train': 1.4491678476333618} -11/07/2021 03:31:06 - INFO - __main__ - Step 44898: {'lr': 0.0004033231876127501, 'samples': 8620416, 'steps': 44897, 'loss/train': 1.4834508895874023} -11/07/2021 03:31:06 - INFO - __main__ - Step 44899: {'lr': 0.00040331899601601934, 'samples': 8620608, 'steps': 44898, 'loss/train': 0.9562569856643677} -11/07/2021 03:31:07 - INFO - __main__ - Step 44900: {'lr': 0.0004033148043502054, 'samples': 8620800, 'steps': 44899, 'loss/train': 1.7440876960754395} -11/07/2021 03:31:08 - INFO - __main__ - Step 44901: {'lr': 0.00040331061261531014, 'samples': 8620992, 'steps': 44900, 'loss/train': 1.2397050857543945} -11/07/2021 03:31:08 - INFO - __main__ - Step 44902: {'lr': 0.0004033064208113355, 'samples': 8621184, 'steps': 44901, 'loss/train': 1.4030208587646484} -11/07/2021 03:31:08 - INFO - __main__ - Step 44903: {'lr': 0.00040330222893828334, 'samples': 8621376, 'steps': 44902, 'loss/train': 1.8505945205688477} -11/07/2021 03:31:09 - INFO - __main__ - Step 44904: {'lr': 0.0004032980369961555, 'samples': 8621568, 'steps': 44903, 'loss/train': 1.1294523477554321} -11/07/2021 03:31:10 - INFO - __main__ - Step 44905: {'lr': 0.000403293844984954, 'samples': 8621760, 'steps': 44904, 'loss/train': 0.1676974892616272} -11/07/2021 03:31:10 - INFO - __main__ - Step 44906: {'lr': 0.00040328965290468066, 'samples': 8621952, 'steps': 44905, 'loss/train': 1.710390329360962} -11/07/2021 03:31:10 - INFO - __main__ - Step 44907: {'lr': 0.00040328546075533745, 'samples': 8622144, 'steps': 44906, 'loss/train': 1.4258091449737549} -11/07/2021 03:31:11 - INFO - __main__ - Step 44908: {'lr': 0.00040328126853692606, 'samples': 8622336, 'steps': 44907, 'loss/train': 1.154900312423706} -11/07/2021 03:31:11 - INFO - __main__ - Step 44909: {'lr': 0.00040327707624944855, 'samples': 8622528, 'steps': 44908, 'loss/train': 1.5896992683410645} -11/07/2021 03:31:12 - INFO - __main__ - Step 44910: {'lr': 0.0004032728838929067, 'samples': 8622720, 'steps': 44909, 'loss/train': 0.9224819540977478} -11/07/2021 03:31:13 - INFO - __main__ - Step 44911: {'lr': 0.0004032686914673025, 'samples': 8622912, 'steps': 44910, 'loss/train': 1.7258622646331787} -11/07/2021 03:31:13 - INFO - __main__ - Step 44912: {'lr': 0.00040326449897263775, 'samples': 8623104, 'steps': 44911, 'loss/train': 1.3852179050445557} -11/07/2021 03:31:13 - INFO - __main__ - Step 44913: {'lr': 0.0004032603064089144, 'samples': 8623296, 'steps': 44912, 'loss/train': 0.12013912200927734} -11/07/2021 03:31:14 - INFO - __main__ - Step 44914: {'lr': 0.00040325611377613435, 'samples': 8623488, 'steps': 44913, 'loss/train': 2.0965540409088135} -11/07/2021 03:31:15 - INFO - __main__ - Step 44915: {'lr': 0.00040325192107429944, 'samples': 8623680, 'steps': 44914, 'loss/train': 1.8563235998153687} -11/07/2021 03:31:15 - INFO - __main__ - Step 44916: {'lr': 0.00040324772830341163, 'samples': 8623872, 'steps': 44915, 'loss/train': 1.5661081075668335} -11/07/2021 03:31:15 - INFO - __main__ - Step 44917: {'lr': 0.0004032435354634726, 'samples': 8624064, 'steps': 44916, 'loss/train': 1.2690373659133911} -11/07/2021 03:31:16 - INFO - __main__ - Step 44918: {'lr': 0.00040323934255448457, 'samples': 8624256, 'steps': 44917, 'loss/train': 1.1036372184753418} -11/07/2021 03:31:16 - INFO - __main__ - Step 44919: {'lr': 0.00040323514957644915, 'samples': 8624448, 'steps': 44918, 'loss/train': 1.6021407842636108} -11/07/2021 03:31:17 - INFO - __main__ - Step 44920: {'lr': 0.00040323095652936843, 'samples': 8624640, 'steps': 44919, 'loss/train': 1.4129055738449097} -11/07/2021 03:31:17 - INFO - __main__ - Step 44921: {'lr': 0.00040322676341324415, 'samples': 8624832, 'steps': 44920, 'loss/train': 1.3669313192367554} -11/07/2021 03:31:18 - INFO - __main__ - Step 44922: {'lr': 0.0004032225702280783, 'samples': 8625024, 'steps': 44921, 'loss/train': 1.6862813234329224} -11/07/2021 03:31:18 - INFO - __main__ - Step 44923: {'lr': 0.00040321837697387264, 'samples': 8625216, 'steps': 44922, 'loss/train': 1.9148911237716675} -11/07/2021 03:31:18 - INFO - __main__ - Step 44924: {'lr': 0.00040321418365062915, 'samples': 8625408, 'steps': 44923, 'loss/train': 0.8510093688964844} -11/07/2021 03:31:19 - INFO - __main__ - Step 44925: {'lr': 0.00040320999025834973, 'samples': 8625600, 'steps': 44924, 'loss/train': 1.509555459022522} -11/07/2021 03:31:20 - INFO - __main__ - Step 44926: {'lr': 0.0004032057967970363, 'samples': 8625792, 'steps': 44925, 'loss/train': 1.7970837354660034} -11/07/2021 03:31:20 - INFO - __main__ - Step 44927: {'lr': 0.0004032016032666907, 'samples': 8625984, 'steps': 44926, 'loss/train': 1.5563510656356812} -11/07/2021 03:31:21 - INFO - __main__ - Step 44928: {'lr': 0.00040319740966731477, 'samples': 8626176, 'steps': 44927, 'loss/train': 1.2547262907028198} -11/07/2021 03:31:21 - INFO - __main__ - Step 44929: {'lr': 0.0004031932159989105, 'samples': 8626368, 'steps': 44928, 'loss/train': 1.417038917541504} -11/07/2021 03:31:21 - INFO - __main__ - Step 44930: {'lr': 0.0004031890222614797, 'samples': 8626560, 'steps': 44929, 'loss/train': 1.4200637340545654} -11/07/2021 03:31:22 - INFO - __main__ - Step 44931: {'lr': 0.0004031848284550243, 'samples': 8626752, 'steps': 44930, 'loss/train': 1.3945986032485962} -11/07/2021 03:31:23 - INFO - __main__ - Step 44932: {'lr': 0.0004031806345795462, 'samples': 8626944, 'steps': 44931, 'loss/train': 0.8418196439743042} -11/07/2021 03:31:23 - INFO - __main__ - Step 44933: {'lr': 0.0004031764406350472, 'samples': 8627136, 'steps': 44932, 'loss/train': 1.5948578119277954} -11/07/2021 03:31:23 - INFO - __main__ - Step 44934: {'lr': 0.0004031722466215293, 'samples': 8627328, 'steps': 44933, 'loss/train': 1.464234709739685} -11/07/2021 03:31:24 - INFO - __main__ - Step 44935: {'lr': 0.00040316805253899434, 'samples': 8627520, 'steps': 44934, 'loss/train': 0.7063742280006409} -11/07/2021 03:31:25 - INFO - __main__ - Step 44936: {'lr': 0.0004031638583874443, 'samples': 8627712, 'steps': 44935, 'loss/train': 1.4003729820251465} -11/07/2021 03:31:25 - INFO - __main__ - Step 44937: {'lr': 0.0004031596641668809, 'samples': 8627904, 'steps': 44936, 'loss/train': 1.2112001180648804} -11/07/2021 03:31:26 - INFO - __main__ - Step 44938: {'lr': 0.0004031554698773061, 'samples': 8628096, 'steps': 44937, 'loss/train': 1.67475426197052} -11/07/2021 03:31:26 - INFO - __main__ - Step 44939: {'lr': 0.0004031512755187219, 'samples': 8628288, 'steps': 44938, 'loss/train': 1.6906245946884155} -11/07/2021 03:31:26 - INFO - __main__ - Step 44940: {'lr': 0.00040314708109113003, 'samples': 8628480, 'steps': 44939, 'loss/train': 1.8159323930740356} -11/07/2021 03:31:28 - INFO - __main__ - Step 44941: {'lr': 0.0004031428865945325, 'samples': 8628672, 'steps': 44940, 'loss/train': 1.7222596406936646} -11/07/2021 03:31:28 - INFO - __main__ - Step 44942: {'lr': 0.0004031386920289311, 'samples': 8628864, 'steps': 44941, 'loss/train': 0.9303457736968994} -11/07/2021 03:31:28 - INFO - __main__ - Step 44943: {'lr': 0.0004031344973943278, 'samples': 8629056, 'steps': 44942, 'loss/train': 1.8656607866287231} -11/07/2021 03:31:29 - INFO - __main__ - Step 44944: {'lr': 0.00040313030269072445, 'samples': 8629248, 'steps': 44943, 'loss/train': 0.9886725544929504} -11/07/2021 03:31:29 - INFO - __main__ - Step 44945: {'lr': 0.00040312610791812286, 'samples': 8629440, 'steps': 44944, 'loss/train': 1.2826176881790161} -11/07/2021 03:31:30 - INFO - __main__ - Step 44946: {'lr': 0.00040312191307652513, 'samples': 8629632, 'steps': 44945, 'loss/train': 0.7697887420654297} -11/07/2021 03:31:30 - INFO - __main__ - Step 44947: {'lr': 0.000403117718165933, 'samples': 8629824, 'steps': 44946, 'loss/train': 0.953285276889801} -11/07/2021 03:31:31 - INFO - __main__ - Step 44948: {'lr': 0.00040311352318634844, 'samples': 8630016, 'steps': 44947, 'loss/train': 5.663651466369629} -11/07/2021 03:31:31 - INFO - __main__ - Step 44949: {'lr': 0.00040310932813777316, 'samples': 8630208, 'steps': 44948, 'loss/train': 1.1987284421920776} -11/07/2021 03:31:31 - INFO - __main__ - Step 44950: {'lr': 0.0004031051330202092, 'samples': 8630400, 'steps': 44949, 'loss/train': 1.4727267026901245} -11/07/2021 03:31:32 - INFO - __main__ - Step 44951: {'lr': 0.00040310093783365854, 'samples': 8630592, 'steps': 44950, 'loss/train': 1.728103756904602} -11/07/2021 03:31:33 - INFO - __main__ - Step 44952: {'lr': 0.0004030967425781229, 'samples': 8630784, 'steps': 44951, 'loss/train': 1.317302942276001} -11/07/2021 03:31:33 - INFO - __main__ - Step 44953: {'lr': 0.0004030925472536042, 'samples': 8630976, 'steps': 44952, 'loss/train': 1.6258738040924072} -11/07/2021 03:31:34 - INFO - __main__ - Step 44954: {'lr': 0.0004030883518601044, 'samples': 8631168, 'steps': 44953, 'loss/train': 1.1118228435516357} -11/07/2021 03:31:34 - INFO - __main__ - Step 44955: {'lr': 0.0004030841563976254, 'samples': 8631360, 'steps': 44954, 'loss/train': 1.2092745304107666} -11/07/2021 03:31:35 - INFO - __main__ - Step 44956: {'lr': 0.00040307996086616895, 'samples': 8631552, 'steps': 44955, 'loss/train': 1.5450530052185059} -11/07/2021 03:31:35 - INFO - __main__ - Step 44957: {'lr': 0.00040307576526573704, 'samples': 8631744, 'steps': 44956, 'loss/train': 1.7838172912597656} -11/07/2021 03:31:36 - INFO - __main__ - Step 44958: {'lr': 0.00040307156959633154, 'samples': 8631936, 'steps': 44957, 'loss/train': 1.2368890047073364} -11/07/2021 03:31:36 - INFO - __main__ - Step 44959: {'lr': 0.00040306737385795437, 'samples': 8632128, 'steps': 44958, 'loss/train': 1.431859016418457} -11/07/2021 03:31:36 - INFO - __main__ - Step 44960: {'lr': 0.00040306317805060746, 'samples': 8632320, 'steps': 44959, 'loss/train': 1.3809988498687744} -11/07/2021 03:31:37 - INFO - __main__ - Step 44961: {'lr': 0.0004030589821742926, 'samples': 8632512, 'steps': 44960, 'loss/train': 1.3988364934921265} -11/07/2021 03:31:38 - INFO - __main__ - Step 44962: {'lr': 0.00040305478622901177, 'samples': 8632704, 'steps': 44961, 'loss/train': 1.5435221195220947} -11/07/2021 03:31:38 - INFO - __main__ - Step 44963: {'lr': 0.0004030505902147668, 'samples': 8632896, 'steps': 44962, 'loss/train': 1.8923532962799072} -11/07/2021 03:31:38 - INFO - __main__ - Step 44964: {'lr': 0.00040304639413155953, 'samples': 8633088, 'steps': 44963, 'loss/train': 1.4311248064041138} -11/07/2021 03:31:39 - INFO - __main__ - Step 44965: {'lr': 0.0004030421979793919, 'samples': 8633280, 'steps': 44964, 'loss/train': 1.5051273107528687} -11/07/2021 03:31:40 - INFO - __main__ - Step 44966: {'lr': 0.0004030380017582659, 'samples': 8633472, 'steps': 44965, 'loss/train': 1.7004728317260742} -11/07/2021 03:31:40 - INFO - __main__ - Step 44967: {'lr': 0.0004030338054681833, 'samples': 8633664, 'steps': 44966, 'loss/train': 1.6326181888580322} -11/07/2021 03:31:40 - INFO - __main__ - Step 44968: {'lr': 0.0004030296091091461, 'samples': 8633856, 'steps': 44967, 'loss/train': 1.38742995262146} -11/07/2021 03:31:41 - INFO - __main__ - Step 44969: {'lr': 0.000403025412681156, 'samples': 8634048, 'steps': 44968, 'loss/train': 1.190015196800232} -11/07/2021 03:31:41 - INFO - __main__ - Step 44970: {'lr': 0.00040302121618421505, 'samples': 8634240, 'steps': 44969, 'loss/train': 1.7225620746612549} -11/07/2021 03:31:42 - INFO - __main__ - Step 44971: {'lr': 0.0004030170196183252, 'samples': 8634432, 'steps': 44970, 'loss/train': 1.1247191429138184} -11/07/2021 03:31:42 - INFO - __main__ - Step 44972: {'lr': 0.00040301282298348806, 'samples': 8634624, 'steps': 44971, 'loss/train': 1.6943212747573853} -11/07/2021 03:31:43 - INFO - __main__ - Step 44973: {'lr': 0.0004030086262797058, 'samples': 8634816, 'steps': 44972, 'loss/train': 1.40690279006958} -11/07/2021 03:31:43 - INFO - __main__ - Step 44974: {'lr': 0.0004030044295069803, 'samples': 8635008, 'steps': 44973, 'loss/train': 1.1578707695007324} -11/07/2021 03:31:43 - INFO - __main__ - Step 44975: {'lr': 0.00040300023266531327, 'samples': 8635200, 'steps': 44974, 'loss/train': 1.1108335256576538} -11/07/2021 03:31:45 - INFO - __main__ - Step 44976: {'lr': 0.0004029960357547067, 'samples': 8635392, 'steps': 44975, 'loss/train': 1.3263057470321655} -11/07/2021 03:31:45 - INFO - __main__ - Step 44977: {'lr': 0.0004029918387751625, 'samples': 8635584, 'steps': 44976, 'loss/train': 1.6945290565490723} -11/07/2021 03:31:45 - INFO - __main__ - Step 44978: {'lr': 0.00040298764172668253, 'samples': 8635776, 'steps': 44977, 'loss/train': 1.4941730499267578} -11/07/2021 03:31:46 - INFO - __main__ - Step 44979: {'lr': 0.00040298344460926866, 'samples': 8635968, 'steps': 44978, 'loss/train': 1.4797956943511963} -11/07/2021 03:31:46 - INFO - __main__ - Step 44980: {'lr': 0.0004029792474229228, 'samples': 8636160, 'steps': 44979, 'loss/train': 1.5584986209869385} -11/07/2021 03:31:46 - INFO - __main__ - Step 44981: {'lr': 0.00040297505016764697, 'samples': 8636352, 'steps': 44980, 'loss/train': 1.4460642337799072} -11/07/2021 03:31:47 - INFO - __main__ - Step 44982: {'lr': 0.00040297085284344284, 'samples': 8636544, 'steps': 44981, 'loss/train': 1.5774402618408203} -11/07/2021 03:31:48 - INFO - __main__ - Step 44983: {'lr': 0.0004029666554503124, 'samples': 8636736, 'steps': 44982, 'loss/train': 1.447740077972412} -11/07/2021 03:31:48 - INFO - __main__ - Step 44984: {'lr': 0.0004029624579882576, 'samples': 8636928, 'steps': 44983, 'loss/train': 2.202698230743408} -11/07/2021 03:31:48 - INFO - __main__ - Step 44985: {'lr': 0.00040295826045728023, 'samples': 8637120, 'steps': 44984, 'loss/train': 0.47387027740478516} -11/07/2021 03:31:49 - INFO - __main__ - Step 44986: {'lr': 0.00040295406285738224, 'samples': 8637312, 'steps': 44985, 'loss/train': 1.4053353071212769} -11/07/2021 03:31:50 - INFO - __main__ - Step 44987: {'lr': 0.00040294986518856553, 'samples': 8637504, 'steps': 44986, 'loss/train': 1.6060630083084106} -11/07/2021 03:31:50 - INFO - __main__ - Step 44988: {'lr': 0.00040294566745083195, 'samples': 8637696, 'steps': 44987, 'loss/train': 1.1187083721160889} -11/07/2021 03:31:51 - INFO - __main__ - Step 44989: {'lr': 0.00040294146964418344, 'samples': 8637888, 'steps': 44988, 'loss/train': 1.3277955055236816} -11/07/2021 03:31:51 - INFO - __main__ - Step 44990: {'lr': 0.00040293727176862184, 'samples': 8638080, 'steps': 44989, 'loss/train': 1.8343409299850464} -11/07/2021 03:31:51 - INFO - __main__ - Step 44991: {'lr': 0.000402933073824149, 'samples': 8638272, 'steps': 44990, 'loss/train': 0.9720051288604736} -11/07/2021 03:31:52 - INFO - __main__ - Step 44992: {'lr': 0.000402928875810767, 'samples': 8638464, 'steps': 44991, 'loss/train': 1.4146634340286255} -11/07/2021 03:31:53 - INFO - __main__ - Step 44993: {'lr': 0.00040292467772847754, 'samples': 8638656, 'steps': 44992, 'loss/train': 1.0446237325668335} -11/07/2021 03:31:53 - INFO - __main__ - Step 44994: {'lr': 0.00040292047957728264, 'samples': 8638848, 'steps': 44993, 'loss/train': 1.6617484092712402} -11/07/2021 03:31:53 - INFO - __main__ - Step 44995: {'lr': 0.00040291628135718404, 'samples': 8639040, 'steps': 44994, 'loss/train': 1.681424617767334} -11/07/2021 03:31:54 - INFO - __main__ - Step 44996: {'lr': 0.0004029120830681838, 'samples': 8639232, 'steps': 44995, 'loss/train': 1.5093427896499634} -11/07/2021 03:31:55 - INFO - __main__ - Step 44997: {'lr': 0.0004029078847102837, 'samples': 8639424, 'steps': 44996, 'loss/train': 1.4904605150222778} -11/07/2021 03:31:55 - INFO - __main__ - Step 44998: {'lr': 0.00040290368628348564, 'samples': 8639616, 'steps': 44997, 'loss/train': 0.495597243309021} -11/07/2021 03:31:56 - INFO - __main__ - Step 44999: {'lr': 0.00040289948778779157, 'samples': 8639808, 'steps': 44998, 'loss/train': 1.3495784997940063} -11/07/2021 03:31:56 - INFO - __main__ - Step 45000: {'lr': 0.00040289528922320334, 'samples': 8640000, 'steps': 44999, 'loss/train': 0.798037052154541} -11/07/2021 03:31:56 - INFO - __main__ - Evaluating and saving model checkpoint -11/07/2021 03:35:09 - INFO - __main__ - Step 45000: {'loss/eval': 1.406919240951538, 'perplexity': 4.0833563804626465} -11/07/2021 03:35:20 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20211106_211610-dtkf2u0m/run-dtkf2u0m.wandb']. This may take a bit of time if the files are large. -11/07/2021 03:35:24 - WARNING - huggingface_hub.repository - Several commits (3) will be pushed upstream. -11/07/2021 03:35:24 - WARNING - huggingface_hub.repository - The progress bars may be unreliable. -11/07/2021 03:35:49 - WARNING - huggingface_hub.repository - To https://huggingface.co/lvwerra/codeparrot-small - d425b2d..5ed0776 proud-haze-135 -> proud-haze-135 - -11/07/2021 03:35:50 - INFO - __main__ - Step 45001: {'lr': 0.00040289109058972285, 'samples': 8640192, 'steps': 45000, 'loss/train': 1.378940463066101} -11/07/2021 03:35:51 - INFO - __main__ - Step 45002: {'lr': 0.000402886891887352, 'samples': 8640384, 'steps': 45001, 'loss/train': 0.7639281749725342} -11/07/2021 03:35:52 - INFO - __main__ - Step 45003: {'lr': 0.0004028826931160927, 'samples': 8640576, 'steps': 45002, 'loss/train': 1.7666077613830566} -11/07/2021 03:35:52 - INFO - __main__ - Step 45004: {'lr': 0.0004028784942759468, 'samples': 8640768, 'steps': 45003, 'loss/train': 1.9681998491287231} -11/07/2021 03:35:53 - INFO - __main__ - Step 45005: {'lr': 0.0004028742953669162, 'samples': 8640960, 'steps': 45004, 'loss/train': 1.333229899406433} -11/07/2021 03:35:53 - INFO - __main__ - Step 45006: {'lr': 0.0004028700963890028, 'samples': 8641152, 'steps': 45005, 'loss/train': 1.756109356880188} -11/07/2021 03:35:53 - INFO - __main__ - Step 45007: {'lr': 0.0004028658973422085, 'samples': 8641344, 'steps': 45006, 'loss/train': 1.7226879596710205} -11/07/2021 03:35:54 - INFO - __main__ - Step 45008: {'lr': 0.0004028616982265352, 'samples': 8641536, 'steps': 45007, 'loss/train': 1.0147008895874023} -11/07/2021 03:35:55 - INFO - __main__ - Step 45009: {'lr': 0.0004028574990419848, 'samples': 8641728, 'steps': 45008, 'loss/train': 1.5768661499023438} -11/07/2021 03:35:55 - INFO - __main__ - Step 45010: {'lr': 0.0004028532997885591, 'samples': 8641920, 'steps': 45009, 'loss/train': 1.1671724319458008} -11/07/2021 03:35:55 - INFO - __main__ - Step 45011: {'lr': 0.0004028491004662601, 'samples': 8642112, 'steps': 45010, 'loss/train': 1.2716879844665527} -11/07/2021 03:35:56 - INFO - __main__ - Step 45012: {'lr': 0.0004028449010750896, 'samples': 8642304, 'steps': 45011, 'loss/train': 1.6644291877746582} -11/07/2021 03:35:57 - INFO - __main__ - Step 45013: {'lr': 0.0004028407016150496, 'samples': 8642496, 'steps': 45012, 'loss/train': 1.2869713306427002} -11/07/2021 03:35:57 - INFO - __main__ - Step 45014: {'lr': 0.000402836502086142, 'samples': 8642688, 'steps': 45013, 'loss/train': 1.0818111896514893} -11/07/2021 03:35:57 - INFO - __main__ - Step 45015: {'lr': 0.00040283230248836855, 'samples': 8642880, 'steps': 45014, 'loss/train': 1.1113263368606567} -11/07/2021 03:35:58 - INFO - __main__ - Step 45016: {'lr': 0.0004028281028217312, 'samples': 8643072, 'steps': 45015, 'loss/train': 1.3489185571670532} -11/07/2021 03:35:58 - INFO - __main__ - Step 45017: {'lr': 0.00040282390308623195, 'samples': 8643264, 'steps': 45016, 'loss/train': 1.355971336364746} -11/07/2021 03:35:59 - INFO - __main__ - Step 45018: {'lr': 0.0004028197032818726, 'samples': 8643456, 'steps': 45017, 'loss/train': 1.0107563734054565} -11/07/2021 03:36:00 - INFO - __main__ - Step 45019: {'lr': 0.00040281550340865493, 'samples': 8643648, 'steps': 45018, 'loss/train': 1.496358871459961} -11/07/2021 03:36:00 - INFO - __main__ - Step 45020: {'lr': 0.000402811303466581, 'samples': 8643840, 'steps': 45019, 'loss/train': 1.4261424541473389} -11/07/2021 03:36:00 - INFO - __main__ - Step 45021: {'lr': 0.00040280710345565277, 'samples': 8644032, 'steps': 45020, 'loss/train': 1.3391042947769165} -11/07/2021 03:36:01 - INFO - __main__ - Step 45022: {'lr': 0.0004028029033758719, 'samples': 8644224, 'steps': 45021, 'loss/train': 1.426767349243164} -11/07/2021 03:36:02 - INFO - __main__ - Step 45023: {'lr': 0.00040279870322724044, 'samples': 8644416, 'steps': 45022, 'loss/train': 1.71662175655365} -11/07/2021 03:36:02 - INFO - __main__ - Step 45024: {'lr': 0.00040279450300976025, 'samples': 8644608, 'steps': 45023, 'loss/train': 1.476520299911499} -11/07/2021 03:36:02 - INFO - __main__ - Step 45025: {'lr': 0.0004027903027234332, 'samples': 8644800, 'steps': 45024, 'loss/train': 1.5499037504196167} -11/07/2021 03:36:03 - INFO - __main__ - Step 45026: {'lr': 0.0004027861023682612, 'samples': 8644992, 'steps': 45025, 'loss/train': 0.5358538031578064} -11/07/2021 03:36:03 - INFO - __main__ - Step 45027: {'lr': 0.00040278190194424613, 'samples': 8645184, 'steps': 45026, 'loss/train': 0.8318495750427246} -11/07/2021 03:36:04 - INFO - __main__ - Step 45028: {'lr': 0.0004027777014513899, 'samples': 8645376, 'steps': 45027, 'loss/train': 1.6739071607589722} -11/07/2021 03:36:04 - INFO - __main__ - Step 45029: {'lr': 0.0004027735008896944, 'samples': 8645568, 'steps': 45028, 'loss/train': 1.6734158992767334} -11/07/2021 03:36:05 - INFO - __main__ - Step 45030: {'lr': 0.0004027693002591615, 'samples': 8645760, 'steps': 45029, 'loss/train': 1.218596339225769} -11/07/2021 03:36:05 - INFO - __main__ - Step 45031: {'lr': 0.0004027650995597931, 'samples': 8645952, 'steps': 45030, 'loss/train': 1.261763572692871} -11/07/2021 03:36:05 - INFO - __main__ - Step 45032: {'lr': 0.0004027608987915912, 'samples': 8646144, 'steps': 45031, 'loss/train': 1.4001818895339966} -11/07/2021 03:36:06 - INFO - __main__ - Step 45033: {'lr': 0.0004027566979545574, 'samples': 8646336, 'steps': 45032, 'loss/train': 1.6564899682998657} -11/07/2021 03:36:07 - INFO - __main__ - Step 45034: {'lr': 0.000402752497048694, 'samples': 8646528, 'steps': 45033, 'loss/train': 1.373465657234192} -11/07/2021 03:36:07 - INFO - __main__ - Step 45035: {'lr': 0.0004027482960740026, 'samples': 8646720, 'steps': 45034, 'loss/train': 1.378868818283081} -11/07/2021 03:36:08 - INFO - __main__ - Step 45036: {'lr': 0.00040274409503048513, 'samples': 8646912, 'steps': 45035, 'loss/train': 1.5058993101119995} -11/07/2021 03:36:08 - INFO - __main__ - Step 45037: {'lr': 0.0004027398939181436, 'samples': 8647104, 'steps': 45036, 'loss/train': 1.4314427375793457} -11/07/2021 03:36:08 - INFO - __main__ - Step 45038: {'lr': 0.00040273569273697974, 'samples': 8647296, 'steps': 45037, 'loss/train': 1.5494295358657837} -11/07/2021 03:36:09 - INFO - __main__ - Step 45039: {'lr': 0.0004027314914869956, 'samples': 8647488, 'steps': 45038, 'loss/train': 1.506453514099121} -11/07/2021 03:36:10 - INFO - __main__ - Step 45040: {'lr': 0.000402727290168193, 'samples': 8647680, 'steps': 45039, 'loss/train': 1.688452959060669} -11/07/2021 03:36:10 - INFO - __main__ - Step 45041: {'lr': 0.00040272308878057383, 'samples': 8647872, 'steps': 45040, 'loss/train': 1.3499056100845337} -11/07/2021 03:36:10 - INFO - __main__ - Step 45042: {'lr': 0.0004027188873241401, 'samples': 8648064, 'steps': 45041, 'loss/train': 1.4158624410629272} -11/07/2021 03:36:11 - INFO - __main__ - Step 45043: {'lr': 0.00040271468579889346, 'samples': 8648256, 'steps': 45042, 'loss/train': 1.4179600477218628} -11/07/2021 03:36:12 - INFO - __main__ - Step 45044: {'lr': 0.0004027104842048359, 'samples': 8648448, 'steps': 45043, 'loss/train': 2.341157913208008} -11/07/2021 03:36:12 - INFO - __main__ - Step 45045: {'lr': 0.0004027062825419695, 'samples': 8648640, 'steps': 45044, 'loss/train': 1.744893193244934} -11/07/2021 03:36:12 - INFO - __main__ - Step 45046: {'lr': 0.0004027020808102959, 'samples': 8648832, 'steps': 45045, 'loss/train': 0.9090373516082764} -11/07/2021 03:36:13 - INFO - __main__ - Step 45047: {'lr': 0.0004026978790098171, 'samples': 8649024, 'steps': 45046, 'loss/train': 0.878197193145752} -11/07/2021 03:36:13 - INFO - __main__ - Step 45048: {'lr': 0.0004026936771405351, 'samples': 8649216, 'steps': 45047, 'loss/train': 1.6723681688308716} -11/07/2021 03:36:14 - INFO - __main__ - Step 45049: {'lr': 0.0004026894752024516, 'samples': 8649408, 'steps': 45048, 'loss/train': 1.3421533107757568} -11/07/2021 03:36:14 - INFO - __main__ - Step 45050: {'lr': 0.00040268527319556856, 'samples': 8649600, 'steps': 45049, 'loss/train': 1.3463534116744995} -11/07/2021 03:36:15 - INFO - __main__ - Step 45051: {'lr': 0.0004026810711198879, 'samples': 8649792, 'steps': 45050, 'loss/train': 1.0824987888336182} -11/07/2021 03:36:15 - INFO - __main__ - Step 45052: {'lr': 0.00040267686897541157, 'samples': 8649984, 'steps': 45051, 'loss/train': 1.6015963554382324} -11/07/2021 03:36:15 - INFO - __main__ - Step 45053: {'lr': 0.0004026726667621413, 'samples': 8650176, 'steps': 45052, 'loss/train': 1.3904969692230225} -11/07/2021 03:36:16 - INFO - __main__ - Step 45054: {'lr': 0.00040266846448007914, 'samples': 8650368, 'steps': 45053, 'loss/train': 1.6913669109344482} -11/07/2021 03:36:17 - INFO - __main__ - Step 45055: {'lr': 0.00040266426212922697, 'samples': 8650560, 'steps': 45054, 'loss/train': 1.5606504678726196} -11/07/2021 03:36:17 - INFO - __main__ - Step 45056: {'lr': 0.00040266005970958656, 'samples': 8650752, 'steps': 45055, 'loss/train': 1.2225046157836914} -11/07/2021 03:36:17 - INFO - __main__ - Step 45057: {'lr': 0.0004026558572211599, 'samples': 8650944, 'steps': 45056, 'loss/train': 1.4816373586654663} -11/07/2021 03:36:18 - INFO - __main__ - Step 45058: {'lr': 0.00040265165466394894, 'samples': 8651136, 'steps': 45057, 'loss/train': 1.6577447652816772} -11/07/2021 03:36:19 - INFO - __main__ - Step 45059: {'lr': 0.00040264745203795536, 'samples': 8651328, 'steps': 45058, 'loss/train': 1.5056010484695435} -11/07/2021 03:36:19 - INFO - __main__ - Step 45060: {'lr': 0.0004026432493431813, 'samples': 8651520, 'steps': 45059, 'loss/train': 1.4441595077514648} -11/07/2021 03:36:20 - INFO - __main__ - Step 45061: {'lr': 0.0004026390465796286, 'samples': 8651712, 'steps': 45060, 'loss/train': 1.7447130680084229} -11/07/2021 03:36:20 - INFO - __main__ - Step 45062: {'lr': 0.000402634843747299, 'samples': 8651904, 'steps': 45061, 'loss/train': 1.3498313426971436} -11/07/2021 03:36:20 - INFO - __main__ - Step 45063: {'lr': 0.0004026306408461945, 'samples': 8652096, 'steps': 45062, 'loss/train': 1.6140329837799072} -11/07/2021 03:36:21 - INFO - __main__ - Step 45064: {'lr': 0.000402626437876317, 'samples': 8652288, 'steps': 45063, 'loss/train': 1.8729219436645508} -11/07/2021 03:36:22 - INFO - __main__ - Step 45065: {'lr': 0.00040262223483766835, 'samples': 8652480, 'steps': 45064, 'loss/train': 1.4350508451461792} -11/07/2021 03:36:22 - INFO - __main__ - Step 45066: {'lr': 0.0004026180317302506, 'samples': 8652672, 'steps': 45065, 'loss/train': 1.5817408561706543} -11/07/2021 03:36:22 - INFO - __main__ - Step 45067: {'lr': 0.0004026138285540654, 'samples': 8652864, 'steps': 45066, 'loss/train': 1.3502610921859741} -11/07/2021 03:36:23 - INFO - __main__ - Step 45068: {'lr': 0.0004026096253091148, 'samples': 8653056, 'steps': 45067, 'loss/train': 1.4997808933258057} -11/07/2021 03:36:23 - INFO - __main__ - Step 45069: {'lr': 0.00040260542199540064, 'samples': 8653248, 'steps': 45068, 'loss/train': 1.4410582780838013} -11/07/2021 03:36:24 - INFO - __main__ - Step 45070: {'lr': 0.00040260121861292484, 'samples': 8653440, 'steps': 45069, 'loss/train': 1.253722071647644} -11/07/2021 03:36:25 - INFO - __main__ - Step 45071: {'lr': 0.0004025970151616893, 'samples': 8653632, 'steps': 45070, 'loss/train': 1.573169469833374} -11/07/2021 03:36:25 - INFO - __main__ - Step 45072: {'lr': 0.0004025928116416959, 'samples': 8653824, 'steps': 45071, 'loss/train': 1.4829283952713013} -11/07/2021 03:36:25 - INFO - __main__ - Step 45073: {'lr': 0.0004025886080529465, 'samples': 8654016, 'steps': 45072, 'loss/train': 2.308427095413208} -11/07/2021 03:36:26 - INFO - __main__ - Step 45074: {'lr': 0.00040258440439544307, 'samples': 8654208, 'steps': 45073, 'loss/train': 1.4862397909164429} -11/07/2021 03:36:27 - INFO - __main__ - Step 45075: {'lr': 0.0004025802006691874, 'samples': 8654400, 'steps': 45074, 'loss/train': 1.362560510635376} -11/07/2021 03:36:27 - INFO - __main__ - Step 45076: {'lr': 0.0004025759968741816, 'samples': 8654592, 'steps': 45075, 'loss/train': 1.7087560892105103} -11/07/2021 03:36:27 - INFO - __main__ - Step 45077: {'lr': 0.00040257179301042724, 'samples': 8654784, 'steps': 45076, 'loss/train': 1.1875423192977905} -11/07/2021 03:36:28 - INFO - __main__ - Step 45078: {'lr': 0.00040256758907792646, 'samples': 8654976, 'steps': 45077, 'loss/train': 1.640230417251587} -11/07/2021 03:36:28 - INFO - __main__ - Step 45079: {'lr': 0.0004025633850766811, 'samples': 8655168, 'steps': 45078, 'loss/train': 0.8937728404998779} -11/07/2021 03:36:29 - INFO - __main__ - Step 45080: {'lr': 0.00040255918100669296, 'samples': 8655360, 'steps': 45079, 'loss/train': 1.7140698432922363} -11/07/2021 03:36:30 - INFO - __main__ - Step 45081: {'lr': 0.000402554976867964, 'samples': 8655552, 'steps': 45080, 'loss/train': 2.8504831790924072} -11/07/2021 03:36:30 - INFO - __main__ - Step 45082: {'lr': 0.00040255077266049624, 'samples': 8655744, 'steps': 45081, 'loss/train': 1.5986260175704956} -11/07/2021 03:36:30 - INFO - __main__ - Step 45083: {'lr': 0.0004025465683842914, 'samples': 8655936, 'steps': 45082, 'loss/train': 1.4731183052062988} -11/07/2021 03:36:31 - INFO - __main__ - Step 45084: {'lr': 0.0004025423640393514, 'samples': 8656128, 'steps': 45083, 'loss/train': 1.6889382600784302} -11/07/2021 03:36:31 - INFO - __main__ - Step 45085: {'lr': 0.0004025381596256782, 'samples': 8656320, 'steps': 45084, 'loss/train': 1.5213496685028076} -11/07/2021 03:36:32 - INFO - __main__ - Step 45086: {'lr': 0.0004025339551432736, 'samples': 8656512, 'steps': 45085, 'loss/train': 1.6633069515228271} -11/07/2021 03:36:32 - INFO - __main__ - Step 45087: {'lr': 0.0004025297505921396, 'samples': 8656704, 'steps': 45086, 'loss/train': 1.361456036567688} -11/07/2021 03:36:33 - INFO - __main__ - Step 45088: {'lr': 0.00040252554597227795, 'samples': 8656896, 'steps': 45087, 'loss/train': 1.7299543619155884} -11/07/2021 03:36:33 - INFO - __main__ - Step 45089: {'lr': 0.00040252134128369085, 'samples': 8657088, 'steps': 45088, 'loss/train': 1.6604050397872925} -11/07/2021 03:36:34 - INFO - __main__ - Step 45090: {'lr': 0.00040251713652637985, 'samples': 8657280, 'steps': 45089, 'loss/train': 1.785449743270874} -11/07/2021 03:36:34 - INFO - __main__ - Step 45091: {'lr': 0.00040251293170034697, 'samples': 8657472, 'steps': 45090, 'loss/train': 1.5653769969940186} -11/07/2021 03:36:35 - INFO - __main__ - Step 45092: {'lr': 0.00040250872680559416, 'samples': 8657664, 'steps': 45091, 'loss/train': 1.049634337425232} -11/07/2021 03:36:35 - INFO - __main__ - Step 45093: {'lr': 0.00040250452184212326, 'samples': 8657856, 'steps': 45092, 'loss/train': 1.2109078168869019} -11/07/2021 03:36:36 - INFO - __main__ - Step 45094: {'lr': 0.00040250031680993617, 'samples': 8658048, 'steps': 45093, 'loss/train': 1.3026163578033447} -11/07/2021 03:36:36 - INFO - __main__ - Step 45095: {'lr': 0.0004024961117090348, 'samples': 8658240, 'steps': 45094, 'loss/train': 1.310563087463379} -11/07/2021 03:36:36 - INFO - __main__ - Step 45096: {'lr': 0.00040249190653942105, 'samples': 8658432, 'steps': 45095, 'loss/train': 1.729379415512085} -11/07/2021 03:36:37 - INFO - __main__ - Step 45097: {'lr': 0.00040248770130109677, 'samples': 8658624, 'steps': 45096, 'loss/train': 1.745119571685791} -11/07/2021 03:36:38 - INFO - __main__ - Step 45098: {'lr': 0.0004024834959940639, 'samples': 8658816, 'steps': 45097, 'loss/train': 1.3489664793014526} -11/07/2021 03:36:38 - INFO - __main__ - Step 45099: {'lr': 0.0004024792906183243, 'samples': 8659008, 'steps': 45098, 'loss/train': 1.7792701721191406} -11/07/2021 03:36:38 - INFO - __main__ - Step 45100: {'lr': 0.0004024750851738799, 'samples': 8659200, 'steps': 45099, 'loss/train': 1.3792343139648438} -11/07/2021 03:36:39 - INFO - __main__ - Step 45101: {'lr': 0.00040247087966073253, 'samples': 8659392, 'steps': 45100, 'loss/train': 0.5739343762397766} -11/07/2021 03:36:40 - INFO - __main__ - Step 45102: {'lr': 0.00040246667407888427, 'samples': 8659584, 'steps': 45101, 'loss/train': 1.3865184783935547} -11/07/2021 03:36:40 - INFO - __main__ - Step 45103: {'lr': 0.0004024624684283368, 'samples': 8659776, 'steps': 45102, 'loss/train': 1.595341682434082} -11/07/2021 03:36:40 - INFO - __main__ - Step 45104: {'lr': 0.000402458262709092, 'samples': 8659968, 'steps': 45103, 'loss/train': 1.605851650238037} -11/07/2021 03:36:41 - INFO - __main__ - Step 45105: {'lr': 0.00040245405692115193, 'samples': 8660160, 'steps': 45104, 'loss/train': 1.5262550115585327} -11/07/2021 03:36:41 - INFO - __main__ - Step 45106: {'lr': 0.0004024498510645185, 'samples': 8660352, 'steps': 45105, 'loss/train': 1.4625663757324219} -11/07/2021 03:36:42 - INFO - __main__ - Step 45107: {'lr': 0.0004024456451391934, 'samples': 8660544, 'steps': 45106, 'loss/train': 0.90992271900177} -11/07/2021 03:36:43 - INFO - __main__ - Step 45108: {'lr': 0.0004024414391451787, 'samples': 8660736, 'steps': 45107, 'loss/train': 1.426047921180725} -11/07/2021 03:36:43 - INFO - __main__ - Step 45109: {'lr': 0.00040243723308247624, 'samples': 8660928, 'steps': 45108, 'loss/train': 1.5061769485473633} -11/07/2021 03:36:43 - INFO - __main__ - Step 45110: {'lr': 0.0004024330269510879, 'samples': 8661120, 'steps': 45109, 'loss/train': 1.8153321743011475} -11/07/2021 03:36:44 - INFO - __main__ - Step 45111: {'lr': 0.00040242882075101563, 'samples': 8661312, 'steps': 45110, 'loss/train': 1.7206075191497803} -11/07/2021 03:36:45 - INFO - __main__ - Step 45112: {'lr': 0.0004024246144822612, 'samples': 8661504, 'steps': 45111, 'loss/train': 1.9978528022766113} -11/07/2021 03:36:45 - INFO - __main__ - Step 45113: {'lr': 0.00040242040814482665, 'samples': 8661696, 'steps': 45112, 'loss/train': 1.1356459856033325} -11/07/2021 03:36:45 - INFO - __main__ - Step 45114: {'lr': 0.00040241620173871385, 'samples': 8661888, 'steps': 45113, 'loss/train': 1.4631052017211914} -11/07/2021 03:36:46 - INFO - __main__ - Step 45115: {'lr': 0.0004024119952639246, 'samples': 8662080, 'steps': 45114, 'loss/train': 1.5599628686904907} -11/07/2021 03:36:46 - INFO - __main__ - Step 45116: {'lr': 0.00040240778872046093, 'samples': 8662272, 'steps': 45115, 'loss/train': 1.4171319007873535} -11/07/2021 03:36:47 - INFO - __main__ - Step 45117: {'lr': 0.00040240358210832456, 'samples': 8662464, 'steps': 45116, 'loss/train': 1.6910568475723267} -11/07/2021 03:36:47 - INFO - __main__ - Step 45118: {'lr': 0.00040239937542751753, 'samples': 8662656, 'steps': 45117, 'loss/train': 1.4217894077301025} -11/07/2021 03:36:48 - INFO - __main__ - Step 45119: {'lr': 0.0004023951686780417, 'samples': 8662848, 'steps': 45118, 'loss/train': 1.3507628440856934} -11/07/2021 03:36:48 - INFO - __main__ - Step 45120: {'lr': 0.000402390961859899, 'samples': 8663040, 'steps': 45119, 'loss/train': 1.2889933586120605} -11/07/2021 03:36:48 - INFO - __main__ - Step 45121: {'lr': 0.00040238675497309117, 'samples': 8663232, 'steps': 45120, 'loss/train': 1.2425684928894043} -11/07/2021 03:36:50 - INFO - __main__ - Step 45122: {'lr': 0.0004023825480176204, 'samples': 8663424, 'steps': 45121, 'loss/train': 1.8090465068817139} -11/07/2021 03:36:50 - INFO - __main__ - Step 45123: {'lr': 0.0004023783409934882, 'samples': 8663616, 'steps': 45122, 'loss/train': 1.250329613685608} -11/07/2021 03:36:50 - INFO - __main__ - Step 45124: {'lr': 0.00040237413390069684, 'samples': 8663808, 'steps': 45123, 'loss/train': 1.3898934125900269} -11/07/2021 03:36:51 - INFO - __main__ - Step 45125: {'lr': 0.000402369926739248, 'samples': 8664000, 'steps': 45124, 'loss/train': 1.5924787521362305} -11/07/2021 03:36:51 - INFO - __main__ - Step 45126: {'lr': 0.0004023657195091436, 'samples': 8664192, 'steps': 45125, 'loss/train': 1.8747450113296509} -11/07/2021 03:36:52 - INFO - __main__ - Step 45127: {'lr': 0.00040236151221038555, 'samples': 8664384, 'steps': 45126, 'loss/train': 1.515708327293396} -11/07/2021 03:36:52 - INFO - __main__ - Step 45128: {'lr': 0.00040235730484297573, 'samples': 8664576, 'steps': 45127, 'loss/train': 1.0064326524734497} -11/07/2021 03:36:53 - INFO - __main__ - Step 45129: {'lr': 0.00040235309740691607, 'samples': 8664768, 'steps': 45128, 'loss/train': 1.7677335739135742} -11/07/2021 03:36:53 - INFO - __main__ - Step 45130: {'lr': 0.0004023488899022085, 'samples': 8664960, 'steps': 45129, 'loss/train': 1.232685923576355} -11/07/2021 03:36:53 - INFO - __main__ - Step 45131: {'lr': 0.00040234468232885483, 'samples': 8665152, 'steps': 45130, 'loss/train': 1.8822057247161865} -11/07/2021 03:36:54 - INFO - __main__ - Step 45132: {'lr': 0.00040234047468685704, 'samples': 8665344, 'steps': 45131, 'loss/train': 0.13900701701641083} -11/07/2021 03:36:55 - INFO - __main__ - Step 45133: {'lr': 0.00040233626697621695, 'samples': 8665536, 'steps': 45132, 'loss/train': 1.5698128938674927} -11/07/2021 03:36:55 - INFO - __main__ - Step 45134: {'lr': 0.0004023320591969365, 'samples': 8665728, 'steps': 45133, 'loss/train': 1.1442500352859497} -11/07/2021 03:36:55 - INFO - __main__ - Step 45135: {'lr': 0.00040232785134901755, 'samples': 8665920, 'steps': 45134, 'loss/train': 1.6900111436843872} -11/07/2021 03:36:56 - INFO - __main__ - Step 45136: {'lr': 0.0004023236434324621, 'samples': 8666112, 'steps': 45135, 'loss/train': 1.533385157585144} -11/07/2021 03:36:56 - INFO - __main__ - Step 45137: {'lr': 0.0004023194354472719, 'samples': 8666304, 'steps': 45136, 'loss/train': 1.4602547883987427} -11/07/2021 03:36:57 - INFO - __main__ - Step 45138: {'lr': 0.0004023152273934489, 'samples': 8666496, 'steps': 45137, 'loss/train': 1.6864073276519775} -11/07/2021 03:36:58 - INFO - __main__ - Step 45139: {'lr': 0.000402311019270995, 'samples': 8666688, 'steps': 45138, 'loss/train': 1.7880440950393677} -11/07/2021 03:36:58 - INFO - __main__ - Step 45140: {'lr': 0.00040230681107991217, 'samples': 8666880, 'steps': 45139, 'loss/train': 0.9193914532661438} -11/07/2021 03:36:58 - INFO - __main__ - Step 45141: {'lr': 0.0004023026028202021, 'samples': 8667072, 'steps': 45140, 'loss/train': 1.1637225151062012} -11/07/2021 03:36:59 - INFO - __main__ - Step 45142: {'lr': 0.000402298394491867, 'samples': 8667264, 'steps': 45141, 'loss/train': 1.384219765663147} -11/07/2021 03:37:00 - INFO - __main__ - Step 45143: {'lr': 0.0004022941860949085, 'samples': 8667456, 'steps': 45142, 'loss/train': 1.5145856142044067} -11/07/2021 03:37:00 - INFO - __main__ - Step 45144: {'lr': 0.0004022899776293287, 'samples': 8667648, 'steps': 45143, 'loss/train': 1.5330946445465088} -11/07/2021 03:37:00 - INFO - __main__ - Step 45145: {'lr': 0.00040228576909512927, 'samples': 8667840, 'steps': 45144, 'loss/train': 1.4673269987106323} -11/07/2021 03:37:01 - INFO - __main__ - Step 45146: {'lr': 0.0004022815604923122, 'samples': 8668032, 'steps': 45145, 'loss/train': 1.427357792854309} -11/07/2021 03:37:01 - INFO - __main__ - Step 45147: {'lr': 0.00040227735182087954, 'samples': 8668224, 'steps': 45146, 'loss/train': 1.6355878114700317} -11/07/2021 03:37:02 - INFO - __main__ - Step 45148: {'lr': 0.00040227314308083296, 'samples': 8668416, 'steps': 45147, 'loss/train': 1.5041543245315552} -11/07/2021 03:37:03 - INFO - __main__ - Step 45149: {'lr': 0.0004022689342721745, 'samples': 8668608, 'steps': 45148, 'loss/train': 1.401368498802185} -11/07/2021 03:37:03 - INFO - __main__ - Step 45150: {'lr': 0.000402264725394906, 'samples': 8668800, 'steps': 45149, 'loss/train': 1.3359441757202148} -11/07/2021 03:37:03 - INFO - __main__ - Step 45151: {'lr': 0.00040226051644902925, 'samples': 8668992, 'steps': 45150, 'loss/train': 1.7657395601272583} -11/07/2021 03:37:04 - INFO - __main__ - Step 45152: {'lr': 0.0004022563074345464, 'samples': 8669184, 'steps': 45151, 'loss/train': 1.005380630493164} -11/07/2021 03:37:05 - INFO - __main__ - Step 45153: {'lr': 0.00040225209835145916, 'samples': 8669376, 'steps': 45152, 'loss/train': 1.4632766246795654} -11/07/2021 03:37:05 - INFO - __main__ - Step 45154: {'lr': 0.0004022478891997695, 'samples': 8669568, 'steps': 45153, 'loss/train': 1.425004243850708} -11/07/2021 03:37:05 - INFO - __main__ - Step 45155: {'lr': 0.0004022436799794792, 'samples': 8669760, 'steps': 45154, 'loss/train': 1.634901523590088} -11/07/2021 03:37:06 - INFO - __main__ - Step 45156: {'lr': 0.0004022394706905904, 'samples': 8669952, 'steps': 45155, 'loss/train': 1.547129511833191} -11/07/2021 03:37:06 - INFO - __main__ - Step 45157: {'lr': 0.0004022352613331047, 'samples': 8670144, 'steps': 45156, 'loss/train': 1.5003315210342407} -11/07/2021 03:37:07 - INFO - __main__ - Step 45158: {'lr': 0.0004022310519070242, 'samples': 8670336, 'steps': 45157, 'loss/train': 1.1571340560913086} -11/07/2021 03:37:07 - INFO - __main__ - Step 45159: {'lr': 0.00040222684241235075, 'samples': 8670528, 'steps': 45158, 'loss/train': 1.305799961090088} -11/07/2021 03:37:08 - INFO - __main__ - Step 45160: {'lr': 0.00040222263284908616, 'samples': 8670720, 'steps': 45159, 'loss/train': 1.6285111904144287} -11/07/2021 03:37:08 - INFO - __main__ - Step 45161: {'lr': 0.00040221842321723245, 'samples': 8670912, 'steps': 45160, 'loss/train': 1.3914912939071655} -11/07/2021 03:37:08 - INFO - __main__ - Step 45162: {'lr': 0.0004022142135167915, 'samples': 8671104, 'steps': 45161, 'loss/train': 1.4020293951034546} -11/07/2021 03:37:09 - INFO - __main__ - Step 45163: {'lr': 0.0004022100037477652, 'samples': 8671296, 'steps': 45162, 'loss/train': 1.3243298530578613} -11/07/2021 03:37:10 - INFO - __main__ - Step 45164: {'lr': 0.0004022057939101553, 'samples': 8671488, 'steps': 45163, 'loss/train': 1.6081992387771606} -11/07/2021 03:37:10 - INFO - __main__ - Step 45165: {'lr': 0.0004022015840039639, 'samples': 8671680, 'steps': 45164, 'loss/train': 0.20652131736278534} -11/07/2021 03:37:11 - INFO - __main__ - Step 45166: {'lr': 0.00040219737402919284, 'samples': 8671872, 'steps': 45165, 'loss/train': 1.3107188940048218} -11/07/2021 03:37:11 - INFO - __main__ - Step 45167: {'lr': 0.0004021931639858439, 'samples': 8672064, 'steps': 45166, 'loss/train': 1.767072081565857} -11/07/2021 03:37:11 - INFO - __main__ - Step 45168: {'lr': 0.00040218895387391913, 'samples': 8672256, 'steps': 45167, 'loss/train': 1.615883708000183} -11/07/2021 03:37:12 - INFO - __main__ - Step 45169: {'lr': 0.0004021847436934204, 'samples': 8672448, 'steps': 45168, 'loss/train': 1.5700477361679077} -11/07/2021 03:37:13 - INFO - __main__ - Step 45170: {'lr': 0.0004021805334443496, 'samples': 8672640, 'steps': 45169, 'loss/train': 1.1653289794921875} -11/07/2021 03:37:13 - INFO - __main__ - Step 45171: {'lr': 0.00040217632312670846, 'samples': 8672832, 'steps': 45170, 'loss/train': 1.2083021402359009} -11/07/2021 03:37:13 - INFO - __main__ - Step 45172: {'lr': 0.0004021721127404991, 'samples': 8673024, 'steps': 45171, 'loss/train': 1.7216506004333496} -11/07/2021 03:37:14 - INFO - __main__ - Step 45173: {'lr': 0.0004021679022857233, 'samples': 8673216, 'steps': 45172, 'loss/train': 1.6763455867767334} -11/07/2021 03:37:15 - INFO - __main__ - Step 45174: {'lr': 0.000402163691762383, 'samples': 8673408, 'steps': 45173, 'loss/train': 1.2438222169876099} -11/07/2021 03:37:15 - INFO - __main__ - Step 45175: {'lr': 0.00040215948117048006, 'samples': 8673600, 'steps': 45174, 'loss/train': 1.4948920011520386} -11/07/2021 03:37:15 - INFO - __main__ - Step 45176: {'lr': 0.00040215527051001653, 'samples': 8673792, 'steps': 45175, 'loss/train': 1.5023847818374634} -11/07/2021 03:37:16 - INFO - __main__ - Step 45177: {'lr': 0.00040215105978099407, 'samples': 8673984, 'steps': 45176, 'loss/train': 1.5538227558135986} -11/07/2021 03:37:16 - INFO - __main__ - Step 45178: {'lr': 0.00040214684898341475, 'samples': 8674176, 'steps': 45177, 'loss/train': 1.6242763996124268} -11/07/2021 03:37:18 - INFO - __main__ - Step 45179: {'lr': 0.00040214263811728034, 'samples': 8674368, 'steps': 45178, 'loss/train': 1.148213267326355} -11/07/2021 03:37:18 - INFO - __main__ - Step 45180: {'lr': 0.00040213842718259287, 'samples': 8674560, 'steps': 45179, 'loss/train': 1.8194248676300049} -11/07/2021 03:37:19 - INFO - __main__ - Step 45181: {'lr': 0.00040213421617935416, 'samples': 8674752, 'steps': 45180, 'loss/train': 1.411015510559082} -11/07/2021 03:37:19 - INFO - __main__ - Step 45182: {'lr': 0.000402130005107566, 'samples': 8674944, 'steps': 45181, 'loss/train': 3.0634677410125732} -11/07/2021 03:37:19 - INFO - __main__ - Step 45183: {'lr': 0.0004021257939672306, 'samples': 8675136, 'steps': 45182, 'loss/train': 1.4965283870697021} -11/07/2021 03:37:20 - INFO - __main__ - Step 45184: {'lr': 0.0004021215827583496, 'samples': 8675328, 'steps': 45183, 'loss/train': 1.5582106113433838} -11/07/2021 03:37:21 - INFO - __main__ - Step 45185: {'lr': 0.0004021173714809249, 'samples': 8675520, 'steps': 45184, 'loss/train': 1.5984597206115723} -11/07/2021 03:37:21 - INFO - __main__ - Step 45186: {'lr': 0.0004021131601349585, 'samples': 8675712, 'steps': 45185, 'loss/train': 1.2047393321990967} -11/07/2021 03:37:21 - INFO - __main__ - Step 45187: {'lr': 0.0004021089487204522, 'samples': 8675904, 'steps': 45186, 'loss/train': 1.9748467206954956} -11/07/2021 03:37:22 - INFO - __main__ - Step 45188: {'lr': 0.00040210473723740803, 'samples': 8676096, 'steps': 45187, 'loss/train': 1.7441582679748535} -11/07/2021 03:37:22 - INFO - __main__ - Step 45189: {'lr': 0.0004021005256858279, 'samples': 8676288, 'steps': 45188, 'loss/train': 1.3486766815185547} -11/07/2021 03:37:23 - INFO - __main__ - Step 45190: {'lr': 0.00040209631406571344, 'samples': 8676480, 'steps': 45189, 'loss/train': 2.29198956489563} -11/07/2021 03:37:23 - INFO - __main__ - Step 45191: {'lr': 0.00040209210237706684, 'samples': 8676672, 'steps': 45190, 'loss/train': 1.65663743019104} -11/07/2021 03:37:24 - INFO - __main__ - Step 45192: {'lr': 0.0004020878906198898, 'samples': 8676864, 'steps': 45191, 'loss/train': 1.2061249017715454} -11/07/2021 03:37:24 - INFO - __main__ - Step 45193: {'lr': 0.0004020836787941844, 'samples': 8677056, 'steps': 45192, 'loss/train': 1.2055654525756836} -11/07/2021 03:37:25 - INFO - __main__ - Step 45194: {'lr': 0.0004020794668999524, 'samples': 8677248, 'steps': 45193, 'loss/train': 1.764271855354309} -11/07/2021 03:37:26 - INFO - __main__ - Step 45195: {'lr': 0.0004020752549371957, 'samples': 8677440, 'steps': 45194, 'loss/train': 1.267154335975647} -11/07/2021 03:37:26 - INFO - __main__ - Step 45196: {'lr': 0.00040207104290591633, 'samples': 8677632, 'steps': 45195, 'loss/train': 1.8496373891830444} -11/07/2021 03:37:26 - INFO - __main__ - Step 45197: {'lr': 0.000402066830806116, 'samples': 8677824, 'steps': 45196, 'loss/train': 1.0303630828857422} -11/07/2021 03:37:27 - INFO - __main__ - Step 45198: {'lr': 0.0004020626186377967, 'samples': 8678016, 'steps': 45197, 'loss/train': 1.5434365272521973} -11/07/2021 03:37:27 - INFO - __main__ - Step 45199: {'lr': 0.00040205840640096036, 'samples': 8678208, 'steps': 45198, 'loss/train': 1.3023549318313599} -11/07/2021 03:37:27 - INFO - __main__ - Step 45200: {'lr': 0.0004020541940956089, 'samples': 8678400, 'steps': 45199, 'loss/train': 1.1285649538040161} -11/07/2021 03:37:28 - INFO - __main__ - Step 45201: {'lr': 0.0004020499817217441, 'samples': 8678592, 'steps': 45200, 'loss/train': 1.0267317295074463} -11/07/2021 03:37:29 - INFO - __main__ - Step 45202: {'lr': 0.000402045769279368, 'samples': 8678784, 'steps': 45201, 'loss/train': 1.3042110204696655} -11/07/2021 03:37:29 - INFO - __main__ - Step 45203: {'lr': 0.0004020415567684823, 'samples': 8678976, 'steps': 45202, 'loss/train': 1.1630033254623413} -11/07/2021 03:37:30 - INFO - __main__ - Step 45204: {'lr': 0.0004020373441890891, 'samples': 8679168, 'steps': 45203, 'loss/train': 2.08655047416687} -11/07/2021 03:37:30 - INFO - __main__ - Step 45205: {'lr': 0.00040203313154119026, 'samples': 8679360, 'steps': 45204, 'loss/train': 1.9520084857940674} -11/07/2021 03:37:32 - INFO - __main__ - Step 45206: {'lr': 0.00040202891882478754, 'samples': 8679552, 'steps': 45205, 'loss/train': 1.7195074558258057} -11/07/2021 03:37:32 - INFO - __main__ - Step 45207: {'lr': 0.000402024706039883, 'samples': 8679744, 'steps': 45206, 'loss/train': 1.6180075407028198} -11/07/2021 03:37:33 - INFO - __main__ - Step 45208: {'lr': 0.0004020204931864785, 'samples': 8679936, 'steps': 45207, 'loss/train': 1.2656595706939697} -11/07/2021 03:37:33 - INFO - __main__ - Step 45209: {'lr': 0.0004020162802645758, 'samples': 8680128, 'steps': 45208, 'loss/train': 1.5247958898544312} -11/07/2021 03:37:33 - INFO - __main__ - Step 45210: {'lr': 0.000402012067274177, 'samples': 8680320, 'steps': 45209, 'loss/train': 1.5917531251907349} -11/07/2021 03:37:34 - INFO - __main__ - Step 45211: {'lr': 0.0004020078542152839, 'samples': 8680512, 'steps': 45210, 'loss/train': 2.631469249725342} -11/07/2021 03:37:34 - INFO - __main__ - Step 45212: {'lr': 0.0004020036410878984, 'samples': 8680704, 'steps': 45211, 'loss/train': 1.7594704627990723} -11/07/2021 03:37:35 - INFO - __main__ - Step 45213: {'lr': 0.0004019994278920224, 'samples': 8680896, 'steps': 45212, 'loss/train': 1.6504069566726685} -11/07/2021 03:37:35 - INFO - __main__ - Step 45214: {'lr': 0.00040199521462765776, 'samples': 8681088, 'steps': 45213, 'loss/train': 1.2237399816513062} -11/07/2021 03:37:36 - INFO - __main__ - Step 45215: {'lr': 0.0004019910012948065, 'samples': 8681280, 'steps': 45214, 'loss/train': 1.6197471618652344} -11/07/2021 03:37:36 - INFO - __main__ - Step 45216: {'lr': 0.0004019867878934704, 'samples': 8681472, 'steps': 45215, 'loss/train': 1.4788774251937866} -11/07/2021 03:37:36 - INFO - __main__ - Step 45217: {'lr': 0.0004019825744236514, 'samples': 8681664, 'steps': 45216, 'loss/train': 1.4490773677825928} -11/07/2021 03:37:37 - INFO - __main__ - Step 45218: {'lr': 0.0004019783608853513, 'samples': 8681856, 'steps': 45217, 'loss/train': 1.8118454217910767} -11/07/2021 03:37:38 - INFO - __main__ - Step 45219: {'lr': 0.0004019741472785723, 'samples': 8682048, 'steps': 45218, 'loss/train': 1.7203056812286377} -11/07/2021 03:37:38 - INFO - __main__ - Step 45220: {'lr': 0.0004019699336033159, 'samples': 8682240, 'steps': 45219, 'loss/train': 1.4860272407531738} -11/07/2021 03:37:39 - INFO - __main__ - Step 45221: {'lr': 0.0004019657198595843, 'samples': 8682432, 'steps': 45220, 'loss/train': 1.7316553592681885} -11/07/2021 03:37:39 - INFO - __main__ - Step 45222: {'lr': 0.00040196150604737924, 'samples': 8682624, 'steps': 45221, 'loss/train': 1.0518038272857666} -11/07/2021 03:37:39 - INFO - __main__ - Step 45223: {'lr': 0.0004019572921667027, 'samples': 8682816, 'steps': 45222, 'loss/train': 1.50096595287323} -11/07/2021 03:37:40 - INFO - __main__ - Step 45224: {'lr': 0.0004019530782175566, 'samples': 8683008, 'steps': 45223, 'loss/train': 1.5049973726272583} -11/07/2021 03:37:41 - INFO - __main__ - Step 45225: {'lr': 0.00040194886419994274, 'samples': 8683200, 'steps': 45224, 'loss/train': 1.1065824031829834} -11/07/2021 03:37:41 - INFO - __main__ - Step 45226: {'lr': 0.0004019446501138631, 'samples': 8683392, 'steps': 45225, 'loss/train': 1.344346046447754} -11/07/2021 03:37:41 - INFO - __main__ - Step 45227: {'lr': 0.0004019404359593195, 'samples': 8683584, 'steps': 45226, 'loss/train': 0.24694529175758362} -11/07/2021 03:37:42 - INFO - __main__ - Step 45228: {'lr': 0.0004019362217363138, 'samples': 8683776, 'steps': 45227, 'loss/train': 1.2918033599853516} -11/07/2021 03:37:43 - INFO - __main__ - Step 45229: {'lr': 0.00040193200744484815, 'samples': 8683968, 'steps': 45228, 'loss/train': 1.40713632106781} -11/07/2021 03:37:43 - INFO - __main__ - Step 45230: {'lr': 0.00040192779308492423, 'samples': 8684160, 'steps': 45229, 'loss/train': 1.5547404289245605} -11/07/2021 03:37:44 - INFO - __main__ - Step 45231: {'lr': 0.00040192357865654395, 'samples': 8684352, 'steps': 45230, 'loss/train': 1.2795825004577637} -11/07/2021 03:37:44 - INFO - __main__ - Step 45232: {'lr': 0.00040191936415970926, 'samples': 8684544, 'steps': 45231, 'loss/train': 1.4769785404205322} -11/07/2021 03:37:44 - INFO - __main__ - Step 45233: {'lr': 0.00040191514959442206, 'samples': 8684736, 'steps': 45232, 'loss/train': 1.2793304920196533} -11/07/2021 03:37:45 - INFO - __main__ - Step 45234: {'lr': 0.0004019109349606842, 'samples': 8684928, 'steps': 45233, 'loss/train': 1.544562578201294} -11/07/2021 03:37:46 - INFO - __main__ - Step 45235: {'lr': 0.0004019067202584977, 'samples': 8685120, 'steps': 45234, 'loss/train': 2.054046392440796} -11/07/2021 03:37:46 - INFO - __main__ - Step 45236: {'lr': 0.0004019025054878643, 'samples': 8685312, 'steps': 45235, 'loss/train': 3.486762762069702} -11/07/2021 03:37:46 - INFO - __main__ - Step 45237: {'lr': 0.00040189829064878605, 'samples': 8685504, 'steps': 45236, 'loss/train': 1.7212954759597778} -11/07/2021 03:37:47 - INFO - __main__ - Step 45238: {'lr': 0.0004018940757412647, 'samples': 8685696, 'steps': 45237, 'loss/train': 0.9980286359786987} -11/07/2021 03:37:48 - INFO - __main__ - Step 45239: {'lr': 0.0004018898607653022, 'samples': 8685888, 'steps': 45238, 'loss/train': 1.3442773818969727} -11/07/2021 03:37:48 - INFO - __main__ - Step 45240: {'lr': 0.00040188564572090057, 'samples': 8686080, 'steps': 45239, 'loss/train': 1.4004093408584595} -11/07/2021 03:37:48 - INFO - __main__ - Step 45241: {'lr': 0.00040188143060806156, 'samples': 8686272, 'steps': 45240, 'loss/train': 1.0079407691955566} -11/07/2021 03:37:49 - INFO - __main__ - Step 45242: {'lr': 0.0004018772154267871, 'samples': 8686464, 'steps': 45241, 'loss/train': 1.5502294301986694} -11/07/2021 03:37:49 - INFO - __main__ - Step 45243: {'lr': 0.0004018730001770792, 'samples': 8686656, 'steps': 45242, 'loss/train': 1.4918146133422852} -11/07/2021 03:37:50 - INFO - __main__ - Step 45244: {'lr': 0.00040186878485893955, 'samples': 8686848, 'steps': 45243, 'loss/train': 1.7983713150024414} -11/07/2021 03:37:50 - INFO - __main__ - Step 45245: {'lr': 0.0004018645694723703, 'samples': 8687040, 'steps': 45244, 'loss/train': 1.4935053586959839} -11/07/2021 03:37:51 - INFO - __main__ - Step 45246: {'lr': 0.00040186035401737307, 'samples': 8687232, 'steps': 45245, 'loss/train': 1.4526677131652832} -11/07/2021 03:37:51 - INFO - __main__ - Step 45247: {'lr': 0.00040185613849395, 'samples': 8687424, 'steps': 45246, 'loss/train': 1.2876986265182495} -11/07/2021 03:37:51 - INFO - __main__ - Step 45248: {'lr': 0.0004018519229021029, 'samples': 8687616, 'steps': 45247, 'loss/train': 0.5878735780715942} -11/07/2021 03:37:53 - INFO - __main__ - Step 45249: {'lr': 0.0004018477072418336, 'samples': 8687808, 'steps': 45248, 'loss/train': 1.623437523841858} -11/07/2021 03:37:53 - INFO - __main__ - Step 45250: {'lr': 0.00040184349151314413, 'samples': 8688000, 'steps': 45249, 'loss/train': 1.5730112791061401} -11/07/2021 03:37:53 - INFO - __main__ - Step 45251: {'lr': 0.0004018392757160363, 'samples': 8688192, 'steps': 45250, 'loss/train': 0.9747245907783508} -11/07/2021 03:37:54 - INFO - __main__ - Step 45252: {'lr': 0.00040183505985051204, 'samples': 8688384, 'steps': 45251, 'loss/train': 1.9808520078659058} -11/07/2021 03:37:54 - INFO - __main__ - Step 45253: {'lr': 0.0004018308439165733, 'samples': 8688576, 'steps': 45252, 'loss/train': 0.8069427609443665} -11/07/2021 03:37:54 - INFO - __main__ - Step 45254: {'lr': 0.00040182662791422185, 'samples': 8688768, 'steps': 45253, 'loss/train': 1.6230127811431885} -11/07/2021 03:37:55 - INFO - __main__ - Step 45255: {'lr': 0.0004018224118434597, 'samples': 8688960, 'steps': 45254, 'loss/train': 1.6706337928771973} -11/07/2021 03:37:56 - INFO - __main__ - Step 45256: {'lr': 0.0004018181957042887, 'samples': 8689152, 'steps': 45255, 'loss/train': 1.0620611906051636} -11/07/2021 03:37:56 - INFO - __main__ - Step 45257: {'lr': 0.00040181397949671073, 'samples': 8689344, 'steps': 45256, 'loss/train': 1.2024199962615967} -11/07/2021 03:37:56 - INFO - __main__ - Step 45258: {'lr': 0.00040180976322072776, 'samples': 8689536, 'steps': 45257, 'loss/train': 1.508073091506958} -11/07/2021 03:37:57 - INFO - __main__ - Step 45259: {'lr': 0.0004018055468763416, 'samples': 8689728, 'steps': 45258, 'loss/train': 1.4503211975097656} -11/07/2021 03:37:58 - INFO - __main__ - Step 45260: {'lr': 0.0004018013304635543, 'samples': 8689920, 'steps': 45259, 'loss/train': 1.3935219049453735} -11/07/2021 03:37:58 - INFO - __main__ - Step 45261: {'lr': 0.0004017971139823676, 'samples': 8690112, 'steps': 45260, 'loss/train': 1.8210779428482056} -11/07/2021 03:37:59 - INFO - __main__ - Step 45262: {'lr': 0.0004017928974327835, 'samples': 8690304, 'steps': 45261, 'loss/train': 1.3265295028686523} -11/07/2021 03:37:59 - INFO - __main__ - Step 45263: {'lr': 0.00040178868081480393, 'samples': 8690496, 'steps': 45262, 'loss/train': 1.6089332103729248} -11/07/2021 03:37:59 - INFO - __main__ - Step 45264: {'lr': 0.00040178446412843054, 'samples': 8690688, 'steps': 45263, 'loss/train': 1.2602695226669312} -11/07/2021 03:38:00 - INFO - __main__ - Step 45265: {'lr': 0.0004017802473736655, 'samples': 8690880, 'steps': 45264, 'loss/train': 1.212044358253479} -11/07/2021 03:38:01 - INFO - __main__ - Step 45266: {'lr': 0.00040177603055051065, 'samples': 8691072, 'steps': 45265, 'loss/train': 1.4239474534988403} -11/07/2021 03:38:01 - INFO - __main__ - Step 45267: {'lr': 0.0004017718136589679, 'samples': 8691264, 'steps': 45266, 'loss/train': 1.1865142583847046} -11/07/2021 03:38:01 - INFO - __main__ - Step 45268: {'lr': 0.000401767596699039, 'samples': 8691456, 'steps': 45267, 'loss/train': 1.5081130266189575} -11/07/2021 03:38:02 - INFO - __main__ - Step 45269: {'lr': 0.00040176337967072603, 'samples': 8691648, 'steps': 45268, 'loss/train': 1.8244184255599976} -11/07/2021 03:38:03 - INFO - __main__ - Step 45270: {'lr': 0.0004017591625740308, 'samples': 8691840, 'steps': 45269, 'loss/train': 1.4279512166976929} -11/07/2021 03:38:03 - INFO - __main__ - Step 45271: {'lr': 0.0004017549454089553, 'samples': 8692032, 'steps': 45270, 'loss/train': 1.4407144784927368} -11/07/2021 03:38:03 - INFO - __main__ - Step 45272: {'lr': 0.00040175072817550127, 'samples': 8692224, 'steps': 45271, 'loss/train': 1.6822588443756104} -11/07/2021 03:38:04 - INFO - __main__ - Step 45273: {'lr': 0.00040174651087367076, 'samples': 8692416, 'steps': 45272, 'loss/train': 1.109861969947815} -11/07/2021 03:38:04 - INFO - __main__ - Step 45274: {'lr': 0.0004017422935034656, 'samples': 8692608, 'steps': 45273, 'loss/train': 1.4292773008346558} -11/07/2021 03:38:05 - INFO - __main__ - Step 45275: {'lr': 0.00040173807606488763, 'samples': 8692800, 'steps': 45274, 'loss/train': 0.8860165476799011} -11/07/2021 03:38:06 - INFO - __main__ - Step 45276: {'lr': 0.0004017338585579389, 'samples': 8692992, 'steps': 45275, 'loss/train': 1.3372459411621094} -11/07/2021 03:38:06 - INFO - __main__ - Step 45277: {'lr': 0.0004017296409826213, 'samples': 8693184, 'steps': 45276, 'loss/train': 1.598120927810669} -11/07/2021 03:38:06 - INFO - __main__ - Step 45278: {'lr': 0.00040172542333893657, 'samples': 8693376, 'steps': 45277, 'loss/train': 2.6153388023376465} -11/07/2021 03:38:07 - INFO - __main__ - Step 45279: {'lr': 0.00040172120562688673, 'samples': 8693568, 'steps': 45278, 'loss/train': 1.7494827508926392} -11/07/2021 03:38:07 - INFO - __main__ - Step 45280: {'lr': 0.00040171698784647366, 'samples': 8693760, 'steps': 45279, 'loss/train': 1.1776270866394043} -11/07/2021 03:38:08 - INFO - __main__ - Step 45281: {'lr': 0.00040171276999769926, 'samples': 8693952, 'steps': 45280, 'loss/train': 1.368177056312561} -11/07/2021 03:38:08 - INFO - __main__ - Step 45282: {'lr': 0.00040170855208056537, 'samples': 8694144, 'steps': 45281, 'loss/train': 1.5612167119979858} -11/07/2021 03:38:09 - INFO - __main__ - Step 45283: {'lr': 0.000401704334095074, 'samples': 8694336, 'steps': 45282, 'loss/train': 1.2405672073364258} -11/07/2021 03:38:09 - INFO - __main__ - Step 45284: {'lr': 0.00040170011604122704, 'samples': 8694528, 'steps': 45283, 'loss/train': 1.4168163537979126} -11/07/2021 03:38:09 - INFO - __main__ - Step 45285: {'lr': 0.0004016958979190263, 'samples': 8694720, 'steps': 45284, 'loss/train': 1.6693315505981445} -11/07/2021 03:38:11 - INFO - __main__ - Step 45286: {'lr': 0.0004016916797284738, 'samples': 8694912, 'steps': 45285, 'loss/train': 1.5633200407028198} -11/07/2021 03:38:11 - INFO - __main__ - Step 45287: {'lr': 0.00040168746146957123, 'samples': 8695104, 'steps': 45286, 'loss/train': 1.2865655422210693} -11/07/2021 03:38:11 - INFO - __main__ - Step 45288: {'lr': 0.0004016832431423207, 'samples': 8695296, 'steps': 45287, 'loss/train': 1.1564030647277832} -11/07/2021 03:38:12 - INFO - __main__ - Step 45289: {'lr': 0.00040167902474672404, 'samples': 8695488, 'steps': 45288, 'loss/train': 1.4032548666000366} -11/07/2021 03:38:12 - INFO - __main__ - Step 45290: {'lr': 0.0004016748062827832, 'samples': 8695680, 'steps': 45289, 'loss/train': 1.2627499103546143} -11/07/2021 03:38:13 - INFO - __main__ - Step 45291: {'lr': 0.00040167058775049993, 'samples': 8695872, 'steps': 45290, 'loss/train': 1.611716628074646} -11/07/2021 03:38:13 - INFO - __main__ - Step 45292: {'lr': 0.0004016663691498763, 'samples': 8696064, 'steps': 45291, 'loss/train': 1.4768520593643188} -11/07/2021 03:38:14 - INFO - __main__ - Step 45293: {'lr': 0.00040166215048091414, 'samples': 8696256, 'steps': 45292, 'loss/train': 1.205528974533081} -11/07/2021 03:38:14 - INFO - __main__ - Step 45294: {'lr': 0.0004016579317436153, 'samples': 8696448, 'steps': 45293, 'loss/train': 1.9122101068496704} -11/07/2021 03:38:14 - INFO - __main__ - Step 45295: {'lr': 0.0004016537129379818, 'samples': 8696640, 'steps': 45294, 'loss/train': 1.5891315937042236} -11/07/2021 03:38:15 - INFO - __main__ - Step 45296: {'lr': 0.0004016494940640155, 'samples': 8696832, 'steps': 45295, 'loss/train': 1.4022443294525146} -11/07/2021 03:38:16 - INFO - __main__ - Step 45297: {'lr': 0.0004016452751217183, 'samples': 8697024, 'steps': 45296, 'loss/train': 1.3902982473373413} -11/07/2021 03:38:16 - INFO - __main__ - Step 45298: {'lr': 0.00040164105611109195, 'samples': 8697216, 'steps': 45297, 'loss/train': 1.7416541576385498} -11/07/2021 03:38:17 - INFO - __main__ - Step 45299: {'lr': 0.0004016368370321386, 'samples': 8697408, 'steps': 45298, 'loss/train': 1.1704825162887573} -11/07/2021 03:38:17 - INFO - __main__ - Step 45300: {'lr': 0.00040163261788485994, 'samples': 8697600, 'steps': 45299, 'loss/train': 1.501841425895691} -11/07/2021 03:38:18 - INFO - __main__ - Step 45301: {'lr': 0.00040162839866925804, 'samples': 8697792, 'steps': 45300, 'loss/train': 1.65465247631073} -11/07/2021 03:38:18 - INFO - __main__ - Step 45302: {'lr': 0.0004016241793853347, 'samples': 8697984, 'steps': 45301, 'loss/train': 1.2076376676559448} -11/07/2021 03:38:19 - INFO - __main__ - Step 45303: {'lr': 0.00040161996003309174, 'samples': 8698176, 'steps': 45302, 'loss/train': 1.5029069185256958} -11/07/2021 03:38:19 - INFO - __main__ - Step 45304: {'lr': 0.00040161574061253134, 'samples': 8698368, 'steps': 45303, 'loss/train': 1.6785801649093628} -11/07/2021 03:38:19 - INFO - __main__ - Step 45305: {'lr': 0.0004016115211236552, 'samples': 8698560, 'steps': 45304, 'loss/train': 1.2267104387283325} -11/07/2021 03:38:20 - INFO - __main__ - Step 45306: {'lr': 0.0004016073015664651, 'samples': 8698752, 'steps': 45305, 'loss/train': 1.4622952938079834} -11/07/2021 03:38:21 - INFO - __main__ - Step 45307: {'lr': 0.0004016030819409632, 'samples': 8698944, 'steps': 45306, 'loss/train': 1.6274431943893433} -11/07/2021 03:38:21 - INFO - __main__ - Step 45308: {'lr': 0.00040159886224715126, 'samples': 8699136, 'steps': 45307, 'loss/train': 1.5141170024871826} -11/07/2021 03:38:21 - INFO - __main__ - Step 45309: {'lr': 0.0004015946424850312, 'samples': 8699328, 'steps': 45308, 'loss/train': 1.6308294534683228} -11/07/2021 03:38:22 - INFO - __main__ - Step 45310: {'lr': 0.000401590422654605, 'samples': 8699520, 'steps': 45309, 'loss/train': 1.4504419565200806} -11/07/2021 03:38:23 - INFO - __main__ - Step 45311: {'lr': 0.00040158620275587443, 'samples': 8699712, 'steps': 45310, 'loss/train': 0.8374848961830139} -11/07/2021 03:38:23 - INFO - __main__ - Step 45312: {'lr': 0.0004015819827888415, 'samples': 8699904, 'steps': 45311, 'loss/train': 1.1242897510528564} -11/07/2021 03:38:23 - INFO - __main__ - Step 45313: {'lr': 0.00040157776275350805, 'samples': 8700096, 'steps': 45312, 'loss/train': 1.6858326196670532} -11/07/2021 03:38:24 - INFO - __main__ - Step 45314: {'lr': 0.000401573542649876, 'samples': 8700288, 'steps': 45313, 'loss/train': 1.314355731010437} -11/07/2021 03:38:24 - INFO - __main__ - Step 45315: {'lr': 0.0004015693224779472, 'samples': 8700480, 'steps': 45314, 'loss/train': 1.3788398504257202} -11/07/2021 03:38:24 - INFO - __main__ - Step 45316: {'lr': 0.0004015651022377237, 'samples': 8700672, 'steps': 45315, 'loss/train': 1.6739813089370728} -11/07/2021 03:38:26 - INFO - __main__ - Step 45317: {'lr': 0.00040156088192920726, 'samples': 8700864, 'steps': 45316, 'loss/train': 1.5884895324707031} -11/07/2021 03:38:26 - INFO - __main__ - Step 45318: {'lr': 0.0004015566615523998, 'samples': 8701056, 'steps': 45317, 'loss/train': 1.2685041427612305} -11/07/2021 03:38:26 - INFO - __main__ - Step 45319: {'lr': 0.00040155244110730325, 'samples': 8701248, 'steps': 45318, 'loss/train': 2.00679349899292} -11/07/2021 03:38:27 - INFO - __main__ - Step 45320: {'lr': 0.00040154822059391954, 'samples': 8701440, 'steps': 45319, 'loss/train': 1.6689691543579102} -11/07/2021 03:38:27 - INFO - __main__ - Step 45321: {'lr': 0.00040154400001225055, 'samples': 8701632, 'steps': 45320, 'loss/train': 1.1222220659255981} -11/07/2021 03:38:28 - INFO - __main__ - Step 45322: {'lr': 0.00040153977936229813, 'samples': 8701824, 'steps': 45321, 'loss/train': 1.3170971870422363} -11/07/2021 03:38:28 - INFO - __main__ - Step 45323: {'lr': 0.00040153555864406423, 'samples': 8702016, 'steps': 45322, 'loss/train': 0.9419315457344055} -11/07/2021 03:38:29 - INFO - __main__ - Step 45324: {'lr': 0.0004015313378575508, 'samples': 8702208, 'steps': 45323, 'loss/train': 1.348008394241333} -11/07/2021 03:38:29 - INFO - __main__ - Step 45325: {'lr': 0.00040152711700275963, 'samples': 8702400, 'steps': 45324, 'loss/train': 1.7534323930740356} -11/07/2021 03:38:29 - INFO - __main__ - Step 45326: {'lr': 0.0004015228960796927, 'samples': 8702592, 'steps': 45325, 'loss/train': 1.7659834623336792} -11/07/2021 03:38:30 - INFO - __main__ - Step 45327: {'lr': 0.0004015186750883518, 'samples': 8702784, 'steps': 45326, 'loss/train': 0.9564913511276245} -11/07/2021 03:38:31 - INFO - __main__ - Step 45328: {'lr': 0.0004015144540287391, 'samples': 8702976, 'steps': 45327, 'loss/train': 1.4444808959960938} -11/07/2021 03:38:31 - INFO - __main__ - Step 45329: {'lr': 0.0004015102329008562, 'samples': 8703168, 'steps': 45328, 'loss/train': 0.23689793050289154} -11/07/2021 03:38:31 - INFO - __main__ - Step 45330: {'lr': 0.0004015060117047051, 'samples': 8703360, 'steps': 45329, 'loss/train': 1.4495890140533447} -11/07/2021 03:38:32 - INFO - __main__ - Step 45331: {'lr': 0.0004015017904402879, 'samples': 8703552, 'steps': 45330, 'loss/train': 1.1690396070480347} -11/07/2021 03:38:33 - INFO - __main__ - Step 45332: {'lr': 0.00040149756910760616, 'samples': 8703744, 'steps': 45331, 'loss/train': 1.6938713788986206} -11/07/2021 03:38:33 - INFO - __main__ - Step 45333: {'lr': 0.000401493347706662, 'samples': 8703936, 'steps': 45332, 'loss/train': 1.1185976266860962} -11/07/2021 03:38:33 - INFO - __main__ - Step 45334: {'lr': 0.00040148912623745733, 'samples': 8704128, 'steps': 45333, 'loss/train': 1.6920937299728394} -11/07/2021 03:38:34 - INFO - __main__ - Step 45335: {'lr': 0.0004014849046999939, 'samples': 8704320, 'steps': 45334, 'loss/train': 1.3867719173431396} -11/07/2021 03:38:34 - INFO - __main__ - Step 45336: {'lr': 0.00040148068309427376, 'samples': 8704512, 'steps': 45335, 'loss/train': 1.4321553707122803} -11/07/2021 03:38:35 - INFO - __main__ - Step 45337: {'lr': 0.00040147646142029884, 'samples': 8704704, 'steps': 45336, 'loss/train': 1.781887173652649} -11/07/2021 03:38:36 - INFO - __main__ - Step 45338: {'lr': 0.0004014722396780709, 'samples': 8704896, 'steps': 45337, 'loss/train': 1.198248267173767} -11/07/2021 03:38:36 - INFO - __main__ - Step 45339: {'lr': 0.00040146801786759183, 'samples': 8705088, 'steps': 45338, 'loss/train': 1.3500672578811646} -11/07/2021 03:38:36 - INFO - __main__ - Step 45340: {'lr': 0.00040146379598886376, 'samples': 8705280, 'steps': 45339, 'loss/train': 1.4676085710525513} -11/07/2021 03:38:37 - INFO - __main__ - Step 45341: {'lr': 0.00040145957404188825, 'samples': 8705472, 'steps': 45340, 'loss/train': 1.3935436010360718} -11/07/2021 03:38:38 - INFO - __main__ - Step 45342: {'lr': 0.00040145535202666747, 'samples': 8705664, 'steps': 45341, 'loss/train': 0.6357443332672119} -11/07/2021 03:38:38 - INFO - __main__ - Step 45343: {'lr': 0.0004014511299432033, 'samples': 8705856, 'steps': 45342, 'loss/train': 1.6631529331207275} -11/07/2021 03:38:39 - INFO - __main__ - Step 45344: {'lr': 0.0004014469077914976, 'samples': 8706048, 'steps': 45343, 'loss/train': 1.384961485862732} -11/07/2021 03:38:39 - INFO - __main__ - Step 45345: {'lr': 0.0004014426855715523, 'samples': 8706240, 'steps': 45344, 'loss/train': 1.0772547721862793} -11/07/2021 03:38:39 - INFO - __main__ - Step 45346: {'lr': 0.00040143846328336913, 'samples': 8706432, 'steps': 45345, 'loss/train': 1.3336265087127686} -11/07/2021 03:38:40 - INFO - __main__ - Step 45347: {'lr': 0.00040143424092695015, 'samples': 8706624, 'steps': 45346, 'loss/train': 1.4853858947753906} -11/07/2021 03:38:40 - INFO - __main__ - Step 45348: {'lr': 0.00040143001850229733, 'samples': 8706816, 'steps': 45347, 'loss/train': 2.2581679821014404} -11/07/2021 03:38:41 - INFO - __main__ - Step 45349: {'lr': 0.00040142579600941237, 'samples': 8707008, 'steps': 45348, 'loss/train': 1.3928520679473877} -11/07/2021 03:38:41 - INFO - __main__ - Step 45350: {'lr': 0.0004014215734482973, 'samples': 8707200, 'steps': 45349, 'loss/train': 1.4989149570465088} -11/07/2021 03:38:42 - INFO - __main__ - Step 45351: {'lr': 0.00040141735081895407, 'samples': 8707392, 'steps': 45350, 'loss/train': 1.6037946939468384} -11/07/2021 03:38:42 - INFO - __main__ - Step 45352: {'lr': 0.00040141312812138453, 'samples': 8707584, 'steps': 45351, 'loss/train': 1.6483333110809326} -11/07/2021 03:38:42 - INFO - __main__ - Step 45353: {'lr': 0.0004014089053555905, 'samples': 8707776, 'steps': 45352, 'loss/train': 1.1922721862792969} -11/07/2021 03:38:44 - INFO - __main__ - Step 45354: {'lr': 0.000401404682521574, 'samples': 8707968, 'steps': 45353, 'loss/train': 1.1696412563323975} -11/07/2021 03:38:44 - INFO - __main__ - Step 45355: {'lr': 0.0004014004596193368, 'samples': 8708160, 'steps': 45354, 'loss/train': 1.2211811542510986} -11/07/2021 03:38:44 - INFO - __main__ - Step 45356: {'lr': 0.000401396236648881, 'samples': 8708352, 'steps': 45355, 'loss/train': 1.2534793615341187} -11/07/2021 03:38:45 - INFO - __main__ - Step 45357: {'lr': 0.00040139201361020827, 'samples': 8708544, 'steps': 45356, 'loss/train': 1.3304888010025024} -11/07/2021 03:38:45 - INFO - __main__ - Step 45358: {'lr': 0.0004013877905033208, 'samples': 8708736, 'steps': 45357, 'loss/train': 0.8877719044685364} -11/07/2021 03:38:46 - INFO - __main__ - Step 45359: {'lr': 0.0004013835673282202, 'samples': 8708928, 'steps': 45358, 'loss/train': 1.0555520057678223} -11/07/2021 03:38:46 - INFO - __main__ - Step 45360: {'lr': 0.00040137934408490856, 'samples': 8709120, 'steps': 45359, 'loss/train': 1.185915231704712} -11/07/2021 03:38:47 - INFO - __main__ - Step 45361: {'lr': 0.0004013751207733877, 'samples': 8709312, 'steps': 45360, 'loss/train': 1.7336360216140747} -11/07/2021 03:38:47 - INFO - __main__ - Step 45362: {'lr': 0.0004013708973936595, 'samples': 8709504, 'steps': 45361, 'loss/train': 1.5897088050842285} -11/07/2021 03:38:47 - INFO - __main__ - Step 45363: {'lr': 0.000401366673945726, 'samples': 8709696, 'steps': 45362, 'loss/train': 1.6161272525787354} -11/07/2021 03:38:49 - INFO - __main__ - Step 45364: {'lr': 0.00040136245042958897, 'samples': 8709888, 'steps': 45363, 'loss/train': 1.0643367767333984} -11/07/2021 03:38:49 - INFO - __main__ - Step 45365: {'lr': 0.00040135822684525036, 'samples': 8710080, 'steps': 45364, 'loss/train': 1.150641679763794} -11/07/2021 03:38:50 - INFO - __main__ - Step 45366: {'lr': 0.0004013540031927121, 'samples': 8710272, 'steps': 45365, 'loss/train': 1.0963282585144043} -11/07/2021 03:38:50 - INFO - __main__ - Step 45367: {'lr': 0.000401349779471976, 'samples': 8710464, 'steps': 45366, 'loss/train': 1.2358239889144897} -11/07/2021 03:38:50 - INFO - __main__ - Step 45368: {'lr': 0.000401345555683044, 'samples': 8710656, 'steps': 45367, 'loss/train': 1.6147366762161255} -11/07/2021 03:38:51 - INFO - __main__ - Step 45369: {'lr': 0.00040134133182591813, 'samples': 8710848, 'steps': 45368, 'loss/train': 1.0666077136993408} -11/07/2021 03:38:52 - INFO - __main__ - Step 45370: {'lr': 0.0004013371079006001, 'samples': 8711040, 'steps': 45369, 'loss/train': 0.46323254704475403} -11/07/2021 03:38:52 - INFO - __main__ - Step 45371: {'lr': 0.000401332883907092, 'samples': 8711232, 'steps': 45370, 'loss/train': 1.4854381084442139} -11/07/2021 03:38:52 - INFO - __main__ - Step 45372: {'lr': 0.00040132865984539556, 'samples': 8711424, 'steps': 45371, 'loss/train': 1.0855177640914917} -11/07/2021 03:38:53 - INFO - __main__ - Step 45373: {'lr': 0.0004013244357155128, 'samples': 8711616, 'steps': 45372, 'loss/train': 1.092380404472351} -11/07/2021 03:38:53 - INFO - __main__ - Step 45374: {'lr': 0.0004013202115174456, 'samples': 8711808, 'steps': 45373, 'loss/train': 0.912677526473999} -11/07/2021 03:38:54 - INFO - __main__ - Step 45375: {'lr': 0.0004013159872511958, 'samples': 8712000, 'steps': 45374, 'loss/train': 1.3166635036468506} -11/07/2021 03:38:55 - INFO - __main__ - Step 45376: {'lr': 0.0004013117629167653, 'samples': 8712192, 'steps': 45375, 'loss/train': 1.071495771408081} -11/07/2021 03:38:55 - INFO - __main__ - Step 45377: {'lr': 0.0004013075385141561, 'samples': 8712384, 'steps': 45376, 'loss/train': 1.6424611806869507} -11/07/2021 03:38:55 - INFO - __main__ - Step 45378: {'lr': 0.0004013033140433702, 'samples': 8712576, 'steps': 45377, 'loss/train': 0.13290008902549744} -11/07/2021 03:38:56 - INFO - __main__ - Step 45379: {'lr': 0.0004012990895044092, 'samples': 8712768, 'steps': 45378, 'loss/train': 1.250949740409851} -11/07/2021 03:38:57 - INFO - __main__ - Step 45380: {'lr': 0.0004012948648972752, 'samples': 8712960, 'steps': 45379, 'loss/train': 0.9296746253967285} -11/07/2021 03:38:57 - INFO - __main__ - Step 45381: {'lr': 0.00040129064022197006, 'samples': 8713152, 'steps': 45380, 'loss/train': 1.6221343278884888} -11/07/2021 03:38:58 - INFO - __main__ - Step 45382: {'lr': 0.0004012864154784957, 'samples': 8713344, 'steps': 45381, 'loss/train': 1.529241681098938} -11/07/2021 03:38:58 - INFO - __main__ - Step 45383: {'lr': 0.00040128219066685403, 'samples': 8713536, 'steps': 45382, 'loss/train': 1.508192539215088} -11/07/2021 03:38:58 - INFO - __main__ - Step 45384: {'lr': 0.00040127796578704703, 'samples': 8713728, 'steps': 45383, 'loss/train': 1.7660785913467407} -11/07/2021 03:38:59 - INFO - __main__ - Step 45385: {'lr': 0.00040127374083907634, 'samples': 8713920, 'steps': 45384, 'loss/train': 1.0196280479431152} -11/07/2021 03:39:00 - INFO - __main__ - Step 45386: {'lr': 0.00040126951582294414, 'samples': 8714112, 'steps': 45385, 'loss/train': 0.7238351106643677} -11/07/2021 03:39:00 - INFO - __main__ - Step 45387: {'lr': 0.00040126529073865216, 'samples': 8714304, 'steps': 45386, 'loss/train': 3.4579100608825684} -11/07/2021 03:39:00 - INFO - __main__ - Step 45388: {'lr': 0.00040126106558620246, 'samples': 8714496, 'steps': 45387, 'loss/train': 0.8059271574020386} -11/07/2021 03:39:01 - INFO - __main__ - Step 45389: {'lr': 0.0004012568403655967, 'samples': 8714688, 'steps': 45388, 'loss/train': 1.2644438743591309} -11/07/2021 03:39:01 - INFO - __main__ - Step 45390: {'lr': 0.00040125261507683706, 'samples': 8714880, 'steps': 45389, 'loss/train': 0.9288297891616821} -11/07/2021 03:39:02 - INFO - __main__ - Step 45391: {'lr': 0.0004012483897199254, 'samples': 8715072, 'steps': 45390, 'loss/train': 1.1532604694366455} -11/07/2021 03:39:03 - INFO - __main__ - Step 45392: {'lr': 0.0004012441642948635, 'samples': 8715264, 'steps': 45391, 'loss/train': 1.7337646484375} -11/07/2021 03:39:03 - INFO - __main__ - Step 45393: {'lr': 0.0004012399388016533, 'samples': 8715456, 'steps': 45392, 'loss/train': 1.607285499572754} -11/07/2021 03:39:03 - INFO - __main__ - Step 45394: {'lr': 0.00040123571324029663, 'samples': 8715648, 'steps': 45393, 'loss/train': 0.2502501606941223} -11/07/2021 03:39:04 - INFO - __main__ - Step 45395: {'lr': 0.0004012314876107956, 'samples': 8715840, 'steps': 45394, 'loss/train': 1.7108367681503296} -11/07/2021 03:39:04 - INFO - __main__ - Step 45396: {'lr': 0.00040122726191315196, 'samples': 8716032, 'steps': 45395, 'loss/train': 1.3642891645431519} -11/07/2021 03:39:05 - INFO - __main__ - Step 45397: {'lr': 0.00040122303614736763, 'samples': 8716224, 'steps': 45396, 'loss/train': 1.5683138370513916} -11/07/2021 03:39:05 - INFO - __main__ - Step 45398: {'lr': 0.00040121881031344455, 'samples': 8716416, 'steps': 45397, 'loss/train': 1.4296704530715942} -11/07/2021 03:39:06 - INFO - __main__ - Step 45399: {'lr': 0.00040121458441138457, 'samples': 8716608, 'steps': 45398, 'loss/train': 1.3734186887741089} -11/07/2021 03:39:06 - INFO - __main__ - Step 45400: {'lr': 0.0004012103584411897, 'samples': 8716800, 'steps': 45399, 'loss/train': 1.0634467601776123} -11/07/2021 03:39:06 - INFO - __main__ - Step 45401: {'lr': 0.0004012061324028617, 'samples': 8716992, 'steps': 45400, 'loss/train': 1.677510380744934} -11/07/2021 03:39:07 - INFO - __main__ - Step 45402: {'lr': 0.0004012019062964026, 'samples': 8717184, 'steps': 45401, 'loss/train': 1.3154534101486206} -11/07/2021 03:39:08 - INFO - __main__ - Step 45403: {'lr': 0.00040119768012181423, 'samples': 8717376, 'steps': 45402, 'loss/train': 1.3625843524932861} -11/07/2021 03:39:08 - INFO - __main__ - Step 45404: {'lr': 0.0004011934538790986, 'samples': 8717568, 'steps': 45403, 'loss/train': 1.2091530561447144} -11/07/2021 03:39:08 - INFO - __main__ - Step 45405: {'lr': 0.00040118922756825735, 'samples': 8717760, 'steps': 45404, 'loss/train': 1.4153841733932495} -11/07/2021 03:39:09 - INFO - __main__ - Step 45406: {'lr': 0.00040118500118929267, 'samples': 8717952, 'steps': 45405, 'loss/train': 1.504854679107666} -11/07/2021 03:39:10 - INFO - __main__ - Step 45407: {'lr': 0.00040118077474220643, 'samples': 8718144, 'steps': 45406, 'loss/train': 1.545736312866211} -11/07/2021 03:39:10 - INFO - __main__ - Step 45408: {'lr': 0.00040117654822700047, 'samples': 8718336, 'steps': 45407, 'loss/train': 0.8987617492675781} -11/07/2021 03:39:11 - INFO - __main__ - Step 45409: {'lr': 0.0004011723216436766, 'samples': 8718528, 'steps': 45408, 'loss/train': 1.142067313194275} -11/07/2021 03:39:11 - INFO - __main__ - Step 45410: {'lr': 0.0004011680949922368, 'samples': 8718720, 'steps': 45409, 'loss/train': 1.677101492881775} -11/07/2021 03:39:11 - INFO - __main__ - Step 45411: {'lr': 0.00040116386827268304, 'samples': 8718912, 'steps': 45410, 'loss/train': 1.656983733177185} -11/07/2021 03:39:13 - INFO - __main__ - Step 45412: {'lr': 0.0004011596414850172, 'samples': 8719104, 'steps': 45411, 'loss/train': 1.2456414699554443} -11/07/2021 03:39:14 - INFO - __main__ - Step 45413: {'lr': 0.0004011554146292411, 'samples': 8719296, 'steps': 45412, 'loss/train': 1.2986106872558594} -11/07/2021 03:39:14 - INFO - __main__ - Step 45414: {'lr': 0.0004011511877053567, 'samples': 8719488, 'steps': 45413, 'loss/train': 1.574819803237915} -11/07/2021 03:39:14 - INFO - __main__ - Step 45415: {'lr': 0.0004011469607133659, 'samples': 8719680, 'steps': 45414, 'loss/train': 0.9463472962379456} -11/07/2021 03:39:15 - INFO - __main__ - Step 45416: {'lr': 0.0004011427336532707, 'samples': 8719872, 'steps': 45415, 'loss/train': 2.732780694961548} -11/07/2021 03:39:15 - INFO - __main__ - Step 45417: {'lr': 0.00040113850652507286, 'samples': 8720064, 'steps': 45416, 'loss/train': 2.6750824451446533} -11/07/2021 03:39:15 - INFO - __main__ - Step 45418: {'lr': 0.00040113427932877434, 'samples': 8720256, 'steps': 45417, 'loss/train': 2.024507522583008} -11/07/2021 03:39:16 - INFO - __main__ - Step 45419: {'lr': 0.00040113005206437704, 'samples': 8720448, 'steps': 45418, 'loss/train': 1.1875247955322266} -11/07/2021 03:39:17 - INFO - __main__ - Step 45420: {'lr': 0.00040112582473188284, 'samples': 8720640, 'steps': 45419, 'loss/train': 1.6446876525878906} -11/07/2021 03:39:17 - INFO - __main__ - Step 45421: {'lr': 0.00040112159733129375, 'samples': 8720832, 'steps': 45420, 'loss/train': 1.5601922273635864} -11/07/2021 03:39:17 - INFO - __main__ - Step 45422: {'lr': 0.00040111736986261155, 'samples': 8721024, 'steps': 45421, 'loss/train': 1.513543963432312} -11/07/2021 03:39:18 - INFO - __main__ - Step 45423: {'lr': 0.00040111314232583816, 'samples': 8721216, 'steps': 45422, 'loss/train': 1.7309056520462036} -11/07/2021 03:39:19 - INFO - __main__ - Step 45424: {'lr': 0.0004011089147209756, 'samples': 8721408, 'steps': 45423, 'loss/train': 1.6408305168151855} -11/07/2021 03:39:19 - INFO - __main__ - Step 45425: {'lr': 0.00040110468704802573, 'samples': 8721600, 'steps': 45424, 'loss/train': 1.5653102397918701} -11/07/2021 03:39:20 - INFO - __main__ - Step 45426: {'lr': 0.00040110045930699033, 'samples': 8721792, 'steps': 45425, 'loss/train': 1.1400521993637085} -11/07/2021 03:39:20 - INFO - __main__ - Step 45427: {'lr': 0.00040109623149787137, 'samples': 8721984, 'steps': 45426, 'loss/train': 1.363743782043457} -11/07/2021 03:39:20 - INFO - __main__ - Step 45428: {'lr': 0.0004010920036206709, 'samples': 8722176, 'steps': 45427, 'loss/train': 1.199953317642212} -11/07/2021 03:39:22 - INFO - __main__ - Step 45429: {'lr': 0.00040108777567539057, 'samples': 8722368, 'steps': 45428, 'loss/train': 1.6662077903747559} -11/07/2021 03:39:22 - INFO - __main__ - Step 45430: {'lr': 0.00040108354766203247, 'samples': 8722560, 'steps': 45429, 'loss/train': 1.6846674680709839} -11/07/2021 03:39:22 - INFO - __main__ - Step 45431: {'lr': 0.0004010793195805985, 'samples': 8722752, 'steps': 45430, 'loss/train': 1.2505202293395996} -11/07/2021 03:39:23 - INFO - __main__ - Step 45432: {'lr': 0.0004010750914310905, 'samples': 8722944, 'steps': 45431, 'loss/train': 1.168033480644226} -11/07/2021 03:39:23 - INFO - __main__ - Step 45433: {'lr': 0.0004010708632135104, 'samples': 8723136, 'steps': 45432, 'loss/train': 1.0324722528457642} -11/07/2021 03:39:23 - INFO - __main__ - Step 45434: {'lr': 0.00040106663492786007, 'samples': 8723328, 'steps': 45433, 'loss/train': 5.603840351104736} -11/07/2021 03:39:24 - INFO - __main__ - Step 45435: {'lr': 0.00040106240657414137, 'samples': 8723520, 'steps': 45434, 'loss/train': 5.6717705726623535} -11/07/2021 03:39:25 - INFO - __main__ - Step 45436: {'lr': 0.0004010581781523564, 'samples': 8723712, 'steps': 45435, 'loss/train': 5.517861366271973} -11/07/2021 03:39:25 - INFO - __main__ - Step 45437: {'lr': 0.0004010539496625069, 'samples': 8723904, 'steps': 45436, 'loss/train': 1.426464557647705} -11/07/2021 03:39:26 - INFO - __main__ - Step 45438: {'lr': 0.00040104972110459493, 'samples': 8724096, 'steps': 45437, 'loss/train': 1.9749648571014404} -11/07/2021 03:39:26 - INFO - __main__ - Step 45439: {'lr': 0.00040104549247862217, 'samples': 8724288, 'steps': 45438, 'loss/train': 1.8147975206375122} -11/07/2021 03:39:26 - INFO - __main__ - Step 45440: {'lr': 0.0004010412637845906, 'samples': 8724480, 'steps': 45439, 'loss/train': 1.4899234771728516} -11/07/2021 03:39:27 - INFO - __main__ - Step 45441: {'lr': 0.00040103703502250223, 'samples': 8724672, 'steps': 45440, 'loss/train': 1.7324793338775635} -11/07/2021 03:39:28 - INFO - __main__ - Step 45442: {'lr': 0.0004010328061923589, 'samples': 8724864, 'steps': 45441, 'loss/train': 1.6355983018875122} -11/07/2021 03:39:28 - INFO - __main__ - Step 45443: {'lr': 0.00040102857729416256, 'samples': 8725056, 'steps': 45442, 'loss/train': 1.6216485500335693} -11/07/2021 03:39:28 - INFO - __main__ - Step 45444: {'lr': 0.000401024348327915, 'samples': 8725248, 'steps': 45443, 'loss/train': 1.4130525588989258} -11/07/2021 03:39:29 - INFO - __main__ - Step 45445: {'lr': 0.00040102011929361826, 'samples': 8725440, 'steps': 45444, 'loss/train': 1.080099105834961} -11/07/2021 03:39:30 - INFO - __main__ - Step 45446: {'lr': 0.00040101589019127416, 'samples': 8725632, 'steps': 45445, 'loss/train': 1.3785549402236938} -11/07/2021 03:39:30 - INFO - __main__ - Step 45447: {'lr': 0.0004010116610208846, 'samples': 8725824, 'steps': 45446, 'loss/train': 1.7756900787353516} -11/07/2021 03:39:30 - INFO - __main__ - Step 45448: {'lr': 0.0004010074317824516, 'samples': 8726016, 'steps': 45447, 'loss/train': 1.0014840364456177} -11/07/2021 03:39:31 - INFO - __main__ - Step 45449: {'lr': 0.0004010032024759769, 'samples': 8726208, 'steps': 45448, 'loss/train': 1.5262198448181152} -11/07/2021 03:39:31 - INFO - __main__ - Step 45450: {'lr': 0.0004009989731014625, 'samples': 8726400, 'steps': 45449, 'loss/train': 1.2290147542953491} -11/07/2021 03:39:33 - INFO - __main__ - Step 45451: {'lr': 0.00040099474365891033, 'samples': 8726592, 'steps': 45450, 'loss/train': 1.4418271780014038} -11/07/2021 03:39:33 - INFO - __main__ - Step 45452: {'lr': 0.0004009905141483222, 'samples': 8726784, 'steps': 45451, 'loss/train': 1.9713292121887207} -11/07/2021 03:39:33 - INFO - __main__ - Step 45453: {'lr': 0.0004009862845697001, 'samples': 8726976, 'steps': 45452, 'loss/train': 1.6822173595428467} -11/07/2021 03:39:34 - INFO - __main__ - Step 45454: {'lr': 0.00040098205492304596, 'samples': 8727168, 'steps': 45453, 'loss/train': 1.695788860321045} -11/07/2021 03:39:34 - INFO - __main__ - Step 45455: {'lr': 0.00040097782520836156, 'samples': 8727360, 'steps': 45454, 'loss/train': 1.7513108253479004} -11/07/2021 03:39:34 - INFO - __main__ - Step 45456: {'lr': 0.00040097359542564894, 'samples': 8727552, 'steps': 45455, 'loss/train': 1.728674292564392} -11/07/2021 03:39:35 - INFO - __main__ - Step 45457: {'lr': 0.0004009693655749099, 'samples': 8727744, 'steps': 45456, 'loss/train': 1.1296839714050293} -11/07/2021 03:39:36 - INFO - __main__ - Step 45458: {'lr': 0.00040096513565614645, 'samples': 8727936, 'steps': 45457, 'loss/train': 1.2750709056854248} -11/07/2021 03:39:36 - INFO - __main__ - Step 45459: {'lr': 0.00040096090566936037, 'samples': 8728128, 'steps': 45458, 'loss/train': 0.9658198952674866} -11/07/2021 03:39:37 - INFO - __main__ - Step 45460: {'lr': 0.00040095667561455367, 'samples': 8728320, 'steps': 45459, 'loss/train': 1.7042561769485474} -11/07/2021 03:39:37 - INFO - __main__ - Step 45461: {'lr': 0.00040095244549172824, 'samples': 8728512, 'steps': 45460, 'loss/train': 1.1562546491622925} -11/07/2021 03:39:37 - INFO - __main__ - Step 45462: {'lr': 0.00040094821530088594, 'samples': 8728704, 'steps': 45461, 'loss/train': 1.7081876993179321} -11/07/2021 03:39:38 - INFO - __main__ - Step 45463: {'lr': 0.0004009439850420287, 'samples': 8728896, 'steps': 45462, 'loss/train': 1.6255519390106201} -11/07/2021 03:39:39 - INFO - __main__ - Step 45464: {'lr': 0.00040093975471515843, 'samples': 8729088, 'steps': 45463, 'loss/train': 1.6070562601089478} -11/07/2021 03:39:39 - INFO - __main__ - Step 45465: {'lr': 0.00040093552432027713, 'samples': 8729280, 'steps': 45464, 'loss/train': 1.1172105073928833} -11/07/2021 03:39:39 - INFO - __main__ - Step 45466: {'lr': 0.0004009312938573865, 'samples': 8729472, 'steps': 45465, 'loss/train': 1.5569968223571777} -11/07/2021 03:39:40 - INFO - __main__ - Step 45467: {'lr': 0.00040092706332648856, 'samples': 8729664, 'steps': 45466, 'loss/train': 1.3887341022491455} -11/07/2021 03:39:41 - INFO - __main__ - Step 45468: {'lr': 0.00040092283272758525, 'samples': 8729856, 'steps': 45467, 'loss/train': 1.8437894582748413} -11/07/2021 03:39:41 - INFO - __main__ - Step 45469: {'lr': 0.00040091860206067844, 'samples': 8730048, 'steps': 45468, 'loss/train': 1.4862357378005981} -11/07/2021 03:39:41 - INFO - __main__ - Step 45470: {'lr': 0.00040091437132577004, 'samples': 8730240, 'steps': 45469, 'loss/train': 1.660348653793335} -11/07/2021 03:39:42 - INFO - __main__ - Step 45471: {'lr': 0.0004009101405228619, 'samples': 8730432, 'steps': 45470, 'loss/train': 1.6826940774917603} -11/07/2021 03:39:42 - INFO - __main__ - Step 45472: {'lr': 0.00040090590965195604, 'samples': 8730624, 'steps': 45471, 'loss/train': 0.5386844873428345} -11/07/2021 03:39:42 - INFO - __main__ - Step 45473: {'lr': 0.0004009016787130543, 'samples': 8730816, 'steps': 45472, 'loss/train': 6.135570049285889} -11/07/2021 03:39:43 - INFO - __main__ - Step 45474: {'lr': 0.0004008974477061586, 'samples': 8731008, 'steps': 45473, 'loss/train': 0.7260832786560059} -11/07/2021 03:39:44 - INFO - __main__ - Step 45475: {'lr': 0.0004008932166312708, 'samples': 8731200, 'steps': 45474, 'loss/train': 1.4672410488128662} -11/07/2021 03:39:44 - INFO - __main__ - Step 45476: {'lr': 0.0004008889854883929, 'samples': 8731392, 'steps': 45475, 'loss/train': 0.9254458546638489} -11/07/2021 03:39:45 - INFO - __main__ - Step 45477: {'lr': 0.0004008847542775267, 'samples': 8731584, 'steps': 45476, 'loss/train': 1.8162497282028198} -11/07/2021 03:39:45 - INFO - __main__ - Step 45478: {'lr': 0.00040088052299867415, 'samples': 8731776, 'steps': 45477, 'loss/train': 1.2034556865692139} -11/07/2021 03:39:46 - INFO - __main__ - Step 45479: {'lr': 0.0004008762916518372, 'samples': 8731968, 'steps': 45478, 'loss/train': 1.6396222114562988} -11/07/2021 03:39:46 - INFO - __main__ - Step 45480: {'lr': 0.0004008720602370177, 'samples': 8732160, 'steps': 45479, 'loss/train': 1.153206467628479} -11/07/2021 03:39:47 - INFO - __main__ - Step 45481: {'lr': 0.00040086782875421755, 'samples': 8732352, 'steps': 45480, 'loss/train': 1.8851182460784912} -11/07/2021 03:39:47 - INFO - __main__ - Step 45482: {'lr': 0.0004008635972034388, 'samples': 8732544, 'steps': 45481, 'loss/train': 1.4990321397781372} -11/07/2021 03:39:47 - INFO - __main__ - Step 45483: {'lr': 0.0004008593655846831, 'samples': 8732736, 'steps': 45482, 'loss/train': 1.3766307830810547} -11/07/2021 03:39:48 - INFO - __main__ - Step 45484: {'lr': 0.0004008551338979526, 'samples': 8732928, 'steps': 45483, 'loss/train': 0.743320643901825} -11/07/2021 03:39:49 - INFO - __main__ - Step 45485: {'lr': 0.00040085090214324906, 'samples': 8733120, 'steps': 45484, 'loss/train': 1.4501512050628662} -11/07/2021 03:39:49 - INFO - __main__ - Step 45486: {'lr': 0.00040084667032057444, 'samples': 8733312, 'steps': 45485, 'loss/train': 1.6061315536499023} -11/07/2021 03:39:49 - INFO - __main__ - Step 45487: {'lr': 0.00040084243842993065, 'samples': 8733504, 'steps': 45486, 'loss/train': 1.3426865339279175} -11/07/2021 03:39:50 - INFO - __main__ - Step 45488: {'lr': 0.0004008382064713195, 'samples': 8733696, 'steps': 45487, 'loss/train': 1.6358917951583862} -11/07/2021 03:39:51 - INFO - __main__ - Step 45489: {'lr': 0.0004008339744447431, 'samples': 8733888, 'steps': 45488, 'loss/train': 1.4708629846572876} -11/07/2021 03:39:51 - INFO - __main__ - Step 45490: {'lr': 0.0004008297423502032, 'samples': 8734080, 'steps': 45489, 'loss/train': 1.5823044776916504} -11/07/2021 03:39:52 - INFO - __main__ - Step 45491: {'lr': 0.0004008255101877017, 'samples': 8734272, 'steps': 45490, 'loss/train': 1.4473228454589844} -11/07/2021 03:39:52 - INFO - __main__ - Step 45492: {'lr': 0.00040082127795724066, 'samples': 8734464, 'steps': 45491, 'loss/train': 1.4682440757751465} -11/07/2021 03:39:52 - INFO - __main__ - Step 45493: {'lr': 0.00040081704565882176, 'samples': 8734656, 'steps': 45492, 'loss/train': 1.3882434368133545} -11/07/2021 03:39:53 - INFO - __main__ - Step 45494: {'lr': 0.00040081281329244707, 'samples': 8734848, 'steps': 45493, 'loss/train': 6.106868743896484} -11/07/2021 03:39:54 - INFO - __main__ - Step 45495: {'lr': 0.00040080858085811844, 'samples': 8735040, 'steps': 45494, 'loss/train': 0.2559010982513428} -11/07/2021 03:39:54 - INFO - __main__ - Step 45496: {'lr': 0.00040080434835583777, 'samples': 8735232, 'steps': 45495, 'loss/train': 0.9081894159317017} -11/07/2021 03:39:54 - INFO - __main__ - Step 45497: {'lr': 0.00040080011578560705, 'samples': 8735424, 'steps': 45496, 'loss/train': 1.5792264938354492} -11/07/2021 03:39:55 - INFO - __main__ - Step 45498: {'lr': 0.0004007958831474281, 'samples': 8735616, 'steps': 45497, 'loss/train': 1.1584725379943848} -11/07/2021 03:39:55 - INFO - __main__ - Step 45499: {'lr': 0.0004007916504413029, 'samples': 8735808, 'steps': 45498, 'loss/train': 0.7571787238121033} -11/07/2021 03:39:56 - INFO - __main__ - Step 45500: {'lr': 0.00040078741766723326, 'samples': 8736000, 'steps': 45499, 'loss/train': 1.438258171081543} -11/07/2021 03:39:56 - INFO - __main__ - Step 45501: {'lr': 0.00040078318482522114, 'samples': 8736192, 'steps': 45500, 'loss/train': 1.6170825958251953} -11/07/2021 03:39:57 - INFO - __main__ - Step 45502: {'lr': 0.0004007789519152684, 'samples': 8736384, 'steps': 45501, 'loss/train': 1.430743932723999} -11/07/2021 03:39:57 - INFO - __main__ - Step 45503: {'lr': 0.00040077471893737703, 'samples': 8736576, 'steps': 45502, 'loss/train': 1.7867926359176636} -11/07/2021 03:39:58 - INFO - __main__ - Step 45504: {'lr': 0.0004007704858915489, 'samples': 8736768, 'steps': 45503, 'loss/train': 1.342382788658142} -11/07/2021 03:39:59 - INFO - __main__ - Step 45505: {'lr': 0.00040076625277778594, 'samples': 8736960, 'steps': 45504, 'loss/train': 1.2320177555084229} -11/07/2021 03:39:59 - INFO - __main__ - Step 45506: {'lr': 0.00040076201959609003, 'samples': 8737152, 'steps': 45505, 'loss/train': 1.6842968463897705} -11/07/2021 03:39:59 - INFO - __main__ - Step 45507: {'lr': 0.00040075778634646305, 'samples': 8737344, 'steps': 45506, 'loss/train': 1.3534555435180664} -11/07/2021 03:40:00 - INFO - __main__ - Step 45508: {'lr': 0.0004007535530289069, 'samples': 8737536, 'steps': 45507, 'loss/train': 1.2427611351013184} -11/07/2021 03:40:00 - INFO - __main__ - Step 45509: {'lr': 0.0004007493196434236, 'samples': 8737728, 'steps': 45508, 'loss/train': 1.5556435585021973} -11/07/2021 03:40:01 - INFO - __main__ - Step 45510: {'lr': 0.0004007450861900149, 'samples': 8737920, 'steps': 45509, 'loss/train': 1.7099498510360718} -11/07/2021 03:40:02 - INFO - __main__ - Step 45511: {'lr': 0.00040074085266868285, 'samples': 8738112, 'steps': 45510, 'loss/train': 1.4670841693878174} -11/07/2021 03:40:02 - INFO - __main__ - Step 45512: {'lr': 0.0004007366190794294, 'samples': 8738304, 'steps': 45511, 'loss/train': 1.3476924896240234} -11/07/2021 03:40:02 - INFO - __main__ - Step 45513: {'lr': 0.00040073238542225623, 'samples': 8738496, 'steps': 45512, 'loss/train': 1.453534483909607} -11/07/2021 03:40:03 - INFO - __main__ - Step 45514: {'lr': 0.00040072815169716534, 'samples': 8738688, 'steps': 45513, 'loss/train': 1.599866509437561} -11/07/2021 03:40:03 - INFO - __main__ - Step 45515: {'lr': 0.00040072391790415873, 'samples': 8738880, 'steps': 45514, 'loss/train': 1.2118515968322754} -11/07/2021 03:40:04 - INFO - __main__ - Step 45516: {'lr': 0.00040071968404323824, 'samples': 8739072, 'steps': 45515, 'loss/train': 1.3849482536315918} -11/07/2021 03:40:04 - INFO - __main__ - Step 45517: {'lr': 0.0004007154501144058, 'samples': 8739264, 'steps': 45516, 'loss/train': 1.4673330783843994} -11/07/2021 03:40:05 - INFO - __main__ - Step 45518: {'lr': 0.00040071121611766325, 'samples': 8739456, 'steps': 45517, 'loss/train': 1.6368898153305054} -11/07/2021 03:40:05 - INFO - __main__ - Step 45519: {'lr': 0.00040070698205301266, 'samples': 8739648, 'steps': 45518, 'loss/train': 1.6441377401351929} -11/07/2021 03:40:05 - INFO - __main__ - Step 45520: {'lr': 0.0004007027479204557, 'samples': 8739840, 'steps': 45519, 'loss/train': 1.7209645509719849} -11/07/2021 03:40:06 - INFO - __main__ - Step 45521: {'lr': 0.0004006985137199945, 'samples': 8740032, 'steps': 45520, 'loss/train': 1.7317477464675903} -11/07/2021 03:40:07 - INFO - __main__ - Step 45522: {'lr': 0.00040069427945163083, 'samples': 8740224, 'steps': 45521, 'loss/train': 1.6250065565109253} -11/07/2021 03:40:07 - INFO - __main__ - Step 45523: {'lr': 0.00040069004511536667, 'samples': 8740416, 'steps': 45522, 'loss/train': 1.2221133708953857} -11/07/2021 03:40:07 - INFO - __main__ - Step 45524: {'lr': 0.00040068581071120386, 'samples': 8740608, 'steps': 45523, 'loss/train': 1.7659928798675537} -11/07/2021 03:40:08 - INFO - __main__ - Step 45525: {'lr': 0.00040068157623914435, 'samples': 8740800, 'steps': 45524, 'loss/train': 1.4572179317474365} -11/07/2021 03:40:09 - INFO - __main__ - Step 45526: {'lr': 0.0004006773416991901, 'samples': 8740992, 'steps': 45525, 'loss/train': 0.5819351077079773} -11/07/2021 03:40:09 - INFO - __main__ - Step 45527: {'lr': 0.00040067310709134295, 'samples': 8741184, 'steps': 45526, 'loss/train': 1.801347017288208} -11/07/2021 03:40:09 - INFO - __main__ - Step 45528: {'lr': 0.0004006688724156048, 'samples': 8741376, 'steps': 45527, 'loss/train': 1.456350326538086} -11/07/2021 03:40:10 - INFO - __main__ - Step 45529: {'lr': 0.00040066463767197757, 'samples': 8741568, 'steps': 45528, 'loss/train': 1.5421572923660278} -11/07/2021 03:40:10 - INFO - __main__ - Step 45530: {'lr': 0.00040066040286046325, 'samples': 8741760, 'steps': 45529, 'loss/train': 1.0882627964019775} -11/07/2021 03:40:11 - INFO - __main__ - Step 45531: {'lr': 0.0004006561679810636, 'samples': 8741952, 'steps': 45530, 'loss/train': 1.636697769165039} -11/07/2021 03:40:12 - INFO - __main__ - Step 45532: {'lr': 0.0004006519330337807, 'samples': 8742144, 'steps': 45531, 'loss/train': 1.5281553268432617} -11/07/2021 03:40:12 - INFO - __main__ - Step 45533: {'lr': 0.0004006476980186163, 'samples': 8742336, 'steps': 45532, 'loss/train': 0.9776030778884888} -11/07/2021 03:40:12 - INFO - __main__ - Step 45534: {'lr': 0.0004006434629355723, 'samples': 8742528, 'steps': 45533, 'loss/train': 1.47916841506958} -11/07/2021 03:40:13 - INFO - __main__ - Step 45535: {'lr': 0.0004006392277846508, 'samples': 8742720, 'steps': 45534, 'loss/train': 1.5749417543411255} -11/07/2021 03:40:14 - INFO - __main__ - Step 45536: {'lr': 0.00040063499256585354, 'samples': 8742912, 'steps': 45535, 'loss/train': 1.0047314167022705} -11/07/2021 03:40:14 - INFO - __main__ - Step 45537: {'lr': 0.00040063075727918247, 'samples': 8743104, 'steps': 45536, 'loss/train': 1.3174585103988647} -11/07/2021 03:40:14 - INFO - __main__ - Step 45538: {'lr': 0.0004006265219246395, 'samples': 8743296, 'steps': 45537, 'loss/train': 1.3374698162078857} -11/07/2021 03:40:15 - INFO - __main__ - Step 45539: {'lr': 0.00040062228650222657, 'samples': 8743488, 'steps': 45538, 'loss/train': 1.4565569162368774} -11/07/2021 03:40:15 - INFO - __main__ - Step 45540: {'lr': 0.00040061805101194553, 'samples': 8743680, 'steps': 45539, 'loss/train': 1.4614648818969727} -11/07/2021 03:40:16 - INFO - __main__ - Step 45541: {'lr': 0.00040061381545379837, 'samples': 8743872, 'steps': 45540, 'loss/train': 1.1748137474060059} -11/07/2021 03:40:17 - INFO - __main__ - Step 45542: {'lr': 0.00040060957982778687, 'samples': 8744064, 'steps': 45541, 'loss/train': 1.3833144903182983} -11/07/2021 03:40:17 - INFO - __main__ - Step 45543: {'lr': 0.0004006053441339131, 'samples': 8744256, 'steps': 45542, 'loss/train': 1.6318830251693726} -11/07/2021 03:40:17 - INFO - __main__ - Step 45544: {'lr': 0.00040060110837217885, 'samples': 8744448, 'steps': 45543, 'loss/train': 1.6543395519256592} -11/07/2021 03:40:18 - INFO - __main__ - Step 45545: {'lr': 0.000400596872542586, 'samples': 8744640, 'steps': 45544, 'loss/train': 1.4727685451507568} -11/07/2021 03:40:18 - INFO - __main__ - Step 45546: {'lr': 0.0004005926366451367, 'samples': 8744832, 'steps': 45545, 'loss/train': 1.6064571142196655} -11/07/2021 03:40:19 - INFO - __main__ - Step 45547: {'lr': 0.0004005884006798325, 'samples': 8745024, 'steps': 45546, 'loss/train': 1.4628363847732544} -11/07/2021 03:40:19 - INFO - __main__ - Step 45548: {'lr': 0.0004005841646466756, 'samples': 8745216, 'steps': 45547, 'loss/train': 1.2657325267791748} -11/07/2021 03:40:20 - INFO - __main__ - Step 45549: {'lr': 0.00040057992854566774, 'samples': 8745408, 'steps': 45548, 'loss/train': 1.6489057540893555} -11/07/2021 03:40:20 - INFO - __main__ - Step 45550: {'lr': 0.0004005756923768109, 'samples': 8745600, 'steps': 45549, 'loss/train': 1.4323945045471191} -11/07/2021 03:40:21 - INFO - __main__ - Step 45551: {'lr': 0.0004005714561401069, 'samples': 8745792, 'steps': 45550, 'loss/train': 1.2886767387390137} -11/07/2021 03:40:21 - INFO - __main__ - Step 45552: {'lr': 0.0004005672198355579, 'samples': 8745984, 'steps': 45551, 'loss/train': 1.3043690919876099} -11/07/2021 03:40:22 - INFO - __main__ - Step 45553: {'lr': 0.00040056298346316554, 'samples': 8746176, 'steps': 45552, 'loss/train': 1.378745675086975} -11/07/2021 03:40:22 - INFO - __main__ - Step 45554: {'lr': 0.0004005587470229318, 'samples': 8746368, 'steps': 45553, 'loss/train': 1.0702617168426514} -11/07/2021 03:40:23 - INFO - __main__ - Step 45555: {'lr': 0.00040055451051485865, 'samples': 8746560, 'steps': 45554, 'loss/train': 2.052830457687378} -11/07/2021 03:40:23 - INFO - __main__ - Step 45556: {'lr': 0.0004005502739389479, 'samples': 8746752, 'steps': 45555, 'loss/train': 1.501568078994751} -11/07/2021 03:40:24 - INFO - __main__ - Step 45557: {'lr': 0.00040054603729520154, 'samples': 8746944, 'steps': 45556, 'loss/train': 1.662977933883667} -11/07/2021 03:40:24 - INFO - __main__ - Step 45558: {'lr': 0.00040054180058362156, 'samples': 8747136, 'steps': 45557, 'loss/train': 1.621247410774231} -11/07/2021 03:40:25 - INFO - __main__ - Step 45559: {'lr': 0.0004005375638042097, 'samples': 8747328, 'steps': 45558, 'loss/train': 1.490097999572754} -11/07/2021 03:40:25 - INFO - __main__ - Step 45560: {'lr': 0.0004005333269569679, 'samples': 8747520, 'steps': 45559, 'loss/train': 1.5717151165008545} -11/07/2021 03:40:25 - INFO - __main__ - Step 45561: {'lr': 0.0004005290900418982, 'samples': 8747712, 'steps': 45560, 'loss/train': 1.599551796913147} -11/07/2021 03:40:26 - INFO - __main__ - Step 45562: {'lr': 0.0004005248530590023, 'samples': 8747904, 'steps': 45561, 'loss/train': 1.0087416172027588} -11/07/2021 03:40:27 - INFO - __main__ - Step 45563: {'lr': 0.0004005206160082823, 'samples': 8748096, 'steps': 45562, 'loss/train': 1.5920844078063965} -11/07/2021 03:40:27 - INFO - __main__ - Step 45564: {'lr': 0.00040051637888973996, 'samples': 8748288, 'steps': 45563, 'loss/train': 1.5179200172424316} -11/07/2021 03:40:28 - INFO - __main__ - Step 45565: {'lr': 0.0004005121417033773, 'samples': 8748480, 'steps': 45564, 'loss/train': 0.9567902088165283} -11/07/2021 03:40:28 - INFO - __main__ - Step 45566: {'lr': 0.0004005079044491963, 'samples': 8748672, 'steps': 45565, 'loss/train': 0.9599171280860901} -11/07/2021 03:40:28 - INFO - __main__ - Step 45567: {'lr': 0.0004005036671271986, 'samples': 8748864, 'steps': 45566, 'loss/train': 1.2490531206130981} -11/07/2021 03:40:29 - INFO - __main__ - Step 45568: {'lr': 0.00040049942973738626, 'samples': 8749056, 'steps': 45567, 'loss/train': 1.963448405265808} -11/07/2021 03:40:30 - INFO - __main__ - Step 45569: {'lr': 0.00040049519227976135, 'samples': 8749248, 'steps': 45568, 'loss/train': 1.647210955619812} -11/07/2021 03:40:30 - INFO - __main__ - Step 45570: {'lr': 0.0004004909547543255, 'samples': 8749440, 'steps': 45569, 'loss/train': 1.090729832649231} -11/07/2021 03:40:30 - INFO - __main__ - Step 45571: {'lr': 0.0004004867171610808, 'samples': 8749632, 'steps': 45570, 'loss/train': 1.408889651298523} -11/07/2021 03:40:31 - INFO - __main__ - Step 45572: {'lr': 0.00040048247950002917, 'samples': 8749824, 'steps': 45571, 'loss/train': 1.5346219539642334} -11/07/2021 03:40:32 - INFO - __main__ - Step 45573: {'lr': 0.0004004782417711724, 'samples': 8750016, 'steps': 45572, 'loss/train': 0.6711319088935852} -11/07/2021 03:40:32 - INFO - __main__ - Step 45574: {'lr': 0.0004004740039745124, 'samples': 8750208, 'steps': 45573, 'loss/train': 1.6857950687408447} -11/07/2021 03:40:33 - INFO - __main__ - Step 45575: {'lr': 0.0004004697661100512, 'samples': 8750400, 'steps': 45574, 'loss/train': 1.100041151046753} -11/07/2021 03:40:33 - INFO - __main__ - Step 45576: {'lr': 0.0004004655281777906, 'samples': 8750592, 'steps': 45575, 'loss/train': 1.2100518941879272} -11/07/2021 03:40:33 - INFO - __main__ - Step 45577: {'lr': 0.0004004612901777326, 'samples': 8750784, 'steps': 45576, 'loss/train': 1.9163987636566162} -11/07/2021 03:40:34 - INFO - __main__ - Step 45578: {'lr': 0.000400457052109879, 'samples': 8750976, 'steps': 45577, 'loss/train': 1.7235652208328247} -11/07/2021 03:40:35 - INFO - __main__ - Step 45579: {'lr': 0.0004004528139742319, 'samples': 8751168, 'steps': 45578, 'loss/train': 1.5605733394622803} -11/07/2021 03:40:35 - INFO - __main__ - Step 45580: {'lr': 0.00040044857577079294, 'samples': 8751360, 'steps': 45579, 'loss/train': 1.3955143690109253} -11/07/2021 03:40:35 - INFO - __main__ - Step 45581: {'lr': 0.00040044433749956434, 'samples': 8751552, 'steps': 45580, 'loss/train': 1.2570422887802124} -11/07/2021 03:40:36 - INFO - __main__ - Step 45582: {'lr': 0.0004004400991605477, 'samples': 8751744, 'steps': 45581, 'loss/train': 0.8221997618675232} -11/07/2021 03:40:36 - INFO - __main__ - Step 45583: {'lr': 0.0004004358607537451, 'samples': 8751936, 'steps': 45582, 'loss/train': 1.2752317190170288} -11/07/2021 03:40:37 - INFO - __main__ - Step 45584: {'lr': 0.0004004316222791584, 'samples': 8752128, 'steps': 45583, 'loss/train': 1.6482517719268799} -11/07/2021 03:40:38 - INFO - __main__ - Step 45585: {'lr': 0.00040042738373678954, 'samples': 8752320, 'steps': 45584, 'loss/train': 1.456422209739685} -11/07/2021 03:40:38 - INFO - __main__ - Step 45586: {'lr': 0.0004004231451266406, 'samples': 8752512, 'steps': 45585, 'loss/train': 1.0222355127334595} -11/07/2021 03:40:38 - INFO - __main__ - Step 45587: {'lr': 0.0004004189064487131, 'samples': 8752704, 'steps': 45586, 'loss/train': 0.8327646255493164} -11/07/2021 03:40:39 - INFO - __main__ - Step 45588: {'lr': 0.00040041466770300923, 'samples': 8752896, 'steps': 45587, 'loss/train': 1.407906413078308} -11/07/2021 03:40:40 - INFO - __main__ - Step 45589: {'lr': 0.00040041042888953085, 'samples': 8753088, 'steps': 45588, 'loss/train': 1.678365707397461} -11/07/2021 03:40:40 - INFO - __main__ - Step 45590: {'lr': 0.0004004061900082798, 'samples': 8753280, 'steps': 45589, 'loss/train': 1.6984779834747314} -11/07/2021 03:40:41 - INFO - __main__ - Step 45591: {'lr': 0.00040040195105925803, 'samples': 8753472, 'steps': 45590, 'loss/train': 1.6859689950942993} -11/07/2021 03:40:41 - INFO - __main__ - Step 45592: {'lr': 0.00040039771204246756, 'samples': 8753664, 'steps': 45591, 'loss/train': 2.851062536239624} -11/07/2021 03:40:41 - INFO - __main__ - Step 45593: {'lr': 0.0004003934729579101, 'samples': 8753856, 'steps': 45592, 'loss/train': 1.8652925491333008} -11/07/2021 03:40:42 - INFO - __main__ - Step 45594: {'lr': 0.0004003892338055877, 'samples': 8754048, 'steps': 45593, 'loss/train': 1.4023840427398682} -11/07/2021 03:40:43 - INFO - __main__ - Step 45595: {'lr': 0.0004003849945855023, 'samples': 8754240, 'steps': 45594, 'loss/train': 1.2967686653137207} -11/07/2021 03:40:43 - INFO - __main__ - Step 45596: {'lr': 0.0004003807552976556, 'samples': 8754432, 'steps': 45595, 'loss/train': 0.9110772013664246} -11/07/2021 03:40:43 - INFO - __main__ - Step 45597: {'lr': 0.00040037651594204975, 'samples': 8754624, 'steps': 45596, 'loss/train': 1.5004764795303345} -11/07/2021 03:40:44 - INFO - __main__ - Step 45598: {'lr': 0.00040037227651868655, 'samples': 8754816, 'steps': 45597, 'loss/train': 0.45010626316070557} -11/07/2021 03:40:44 - INFO - __main__ - Step 45599: {'lr': 0.000400368037027568, 'samples': 8755008, 'steps': 45598, 'loss/train': 1.6588164567947388} -11/07/2021 03:40:45 - INFO - __main__ - Step 45600: {'lr': 0.0004003637974686958, 'samples': 8755200, 'steps': 45599, 'loss/train': 1.6795395612716675} -11/07/2021 03:40:46 - INFO - __main__ - Step 45601: {'lr': 0.000400359557842072, 'samples': 8755392, 'steps': 45600, 'loss/train': 1.6923891305923462} -11/07/2021 03:40:46 - INFO - __main__ - Step 45602: {'lr': 0.00040035531814769853, 'samples': 8755584, 'steps': 45601, 'loss/train': 1.6309795379638672} -11/07/2021 03:40:46 - INFO - __main__ - Step 45603: {'lr': 0.0004003510783855774, 'samples': 8755776, 'steps': 45602, 'loss/train': 1.6606926918029785} -11/07/2021 03:40:47 - INFO - __main__ - Step 45604: {'lr': 0.00040034683855571027, 'samples': 8755968, 'steps': 45603, 'loss/train': 1.921417236328125} -11/07/2021 03:40:48 - INFO - __main__ - Step 45605: {'lr': 0.00040034259865809915, 'samples': 8756160, 'steps': 45604, 'loss/train': 1.2512096166610718} -11/07/2021 03:40:48 - INFO - __main__ - Step 45606: {'lr': 0.00040033835869274605, 'samples': 8756352, 'steps': 45605, 'loss/train': 0.9501252174377441} -11/07/2021 03:40:48 - INFO - __main__ - Step 45607: {'lr': 0.00040033411865965276, 'samples': 8756544, 'steps': 45606, 'loss/train': 1.3827056884765625} -11/07/2021 03:40:49 - INFO - __main__ - Step 45608: {'lr': 0.0004003298785588212, 'samples': 8756736, 'steps': 45607, 'loss/train': 1.574720025062561} -11/07/2021 03:40:49 - INFO - __main__ - Step 45609: {'lr': 0.00040032563839025335, 'samples': 8756928, 'steps': 45608, 'loss/train': 1.3279770612716675} -11/07/2021 03:40:50 - INFO - __main__ - Step 45610: {'lr': 0.00040032139815395114, 'samples': 8757120, 'steps': 45609, 'loss/train': 1.8429594039916992} -11/07/2021 03:40:51 - INFO - __main__ - Step 45611: {'lr': 0.00040031715784991643, 'samples': 8757312, 'steps': 45610, 'loss/train': 1.3361419439315796} -11/07/2021 03:40:51 - INFO - __main__ - Step 45612: {'lr': 0.000400312917478151, 'samples': 8757504, 'steps': 45611, 'loss/train': 1.6061185598373413} -11/07/2021 03:40:51 - INFO - __main__ - Step 45613: {'lr': 0.000400308677038657, 'samples': 8757696, 'steps': 45612, 'loss/train': 1.4026153087615967} -11/07/2021 03:40:52 - INFO - __main__ - Step 45614: {'lr': 0.0004003044365314362, 'samples': 8757888, 'steps': 45613, 'loss/train': 1.5190362930297852} -11/07/2021 03:40:53 - INFO - __main__ - Step 45615: {'lr': 0.0004003001959564906, 'samples': 8758080, 'steps': 45614, 'loss/train': 0.32917556166648865} -11/07/2021 03:40:54 - INFO - __main__ - Step 45616: {'lr': 0.000400295955313822, 'samples': 8758272, 'steps': 45615, 'loss/train': 1.3965507745742798} -11/07/2021 03:40:54 - INFO - __main__ - Step 45617: {'lr': 0.0004002917146034323, 'samples': 8758464, 'steps': 45616, 'loss/train': 1.3469103574752808} -11/07/2021 03:40:54 - INFO - __main__ - Step 45618: {'lr': 0.0004002874738253235, 'samples': 8758656, 'steps': 45617, 'loss/train': 1.355541467666626} -11/07/2021 03:40:55 - INFO - __main__ - Step 45619: {'lr': 0.00040028323297949754, 'samples': 8758848, 'steps': 45618, 'loss/train': 1.3055799007415771} -11/07/2021 03:40:55 - INFO - __main__ - Step 45620: {'lr': 0.0004002789920659563, 'samples': 8759040, 'steps': 45619, 'loss/train': 1.5339677333831787} -11/07/2021 03:40:56 - INFO - __main__ - Step 45621: {'lr': 0.0004002747510847016, 'samples': 8759232, 'steps': 45620, 'loss/train': 1.6751906871795654} -11/07/2021 03:40:57 - INFO - __main__ - Step 45622: {'lr': 0.0004002705100357354, 'samples': 8759424, 'steps': 45621, 'loss/train': 1.5554715394973755} -11/07/2021 03:40:57 - INFO - __main__ - Step 45623: {'lr': 0.00040026626891905963, 'samples': 8759616, 'steps': 45622, 'loss/train': 1.5582956075668335} -11/07/2021 03:40:57 - INFO - __main__ - Step 45624: {'lr': 0.00040026202773467623, 'samples': 8759808, 'steps': 45623, 'loss/train': 1.737872838973999} -11/07/2021 03:40:58 - INFO - __main__ - Step 45625: {'lr': 0.00040025778648258706, 'samples': 8760000, 'steps': 45624, 'loss/train': 1.5353635549545288} -11/07/2021 03:40:59 - INFO - __main__ - Step 45626: {'lr': 0.00040025354516279413, 'samples': 8760192, 'steps': 45625, 'loss/train': 0.9963065981864929} -11/07/2021 03:40:59 - INFO - __main__ - Step 45627: {'lr': 0.0004002493037752992, 'samples': 8760384, 'steps': 45626, 'loss/train': 1.507947564125061} -11/07/2021 03:40:59 - INFO - __main__ - Step 45628: {'lr': 0.0004002450623201043, 'samples': 8760576, 'steps': 45627, 'loss/train': 1.379876732826233} -11/07/2021 03:41:00 - INFO - __main__ - Step 45629: {'lr': 0.0004002408207972111, 'samples': 8760768, 'steps': 45628, 'loss/train': 2.1403496265411377} -11/07/2021 03:41:00 - INFO - __main__ - Step 45630: {'lr': 0.00040023657920662195, 'samples': 8760960, 'steps': 45629, 'loss/train': 1.431511402130127} -11/07/2021 03:41:00 - INFO - __main__ - Step 45631: {'lr': 0.0004002323375483384, 'samples': 8761152, 'steps': 45630, 'loss/train': 1.7480183839797974} -11/07/2021 03:41:01 - INFO - __main__ - Step 45632: {'lr': 0.00040022809582236245, 'samples': 8761344, 'steps': 45631, 'loss/train': 2.1796576976776123} -11/07/2021 03:41:02 - INFO - __main__ - Step 45633: {'lr': 0.0004002238540286961, 'samples': 8761536, 'steps': 45632, 'loss/train': 1.638445258140564} -11/07/2021 03:41:02 - INFO - __main__ - Step 45634: {'lr': 0.00040021961216734123, 'samples': 8761728, 'steps': 45633, 'loss/train': 1.6624153852462769} -11/07/2021 03:41:03 - INFO - __main__ - Step 45635: {'lr': 0.0004002153702382997, 'samples': 8761920, 'steps': 45634, 'loss/train': 1.3904660940170288} -11/07/2021 03:41:03 - INFO - __main__ - Step 45636: {'lr': 0.0004002111282415734, 'samples': 8762112, 'steps': 45635, 'loss/train': 0.7281976342201233} -11/07/2021 03:41:04 - INFO - __main__ - Step 45637: {'lr': 0.00040020688617716427, 'samples': 8762304, 'steps': 45636, 'loss/train': 1.0489119291305542} -11/07/2021 03:41:04 - INFO - __main__ - Step 45638: {'lr': 0.0004002026440450742, 'samples': 8762496, 'steps': 45637, 'loss/train': 1.5963797569274902} -11/07/2021 03:41:05 - INFO - __main__ - Step 45639: {'lr': 0.0004001984018453052, 'samples': 8762688, 'steps': 45638, 'loss/train': 1.5868746042251587} -11/07/2021 03:41:05 - INFO - __main__ - Step 45640: {'lr': 0.0004001941595778592, 'samples': 8762880, 'steps': 45639, 'loss/train': 1.3480441570281982} -11/07/2021 03:41:05 - INFO - __main__ - Step 45641: {'lr': 0.0004001899172427379, 'samples': 8763072, 'steps': 45640, 'loss/train': 1.348357081413269} -11/07/2021 03:41:06 - INFO - __main__ - Step 45642: {'lr': 0.00040018567483994337, 'samples': 8763264, 'steps': 45641, 'loss/train': 1.5343412160873413} -11/07/2021 03:41:07 - INFO - __main__ - Step 45643: {'lr': 0.00040018143236947756, 'samples': 8763456, 'steps': 45642, 'loss/train': 1.5094057321548462} -11/07/2021 03:41:07 - INFO - __main__ - Step 45644: {'lr': 0.0004001771898313422, 'samples': 8763648, 'steps': 45643, 'loss/train': 1.577721357345581} -11/07/2021 03:41:07 - INFO - __main__ - Step 45645: {'lr': 0.00040017294722553945, 'samples': 8763840, 'steps': 45644, 'loss/train': 1.5198816061019897} -11/07/2021 03:41:08 - INFO - __main__ - Step 45646: {'lr': 0.000400168704552071, 'samples': 8764032, 'steps': 45645, 'loss/train': 1.4890958070755005} -11/07/2021 03:41:09 - INFO - __main__ - Step 45647: {'lr': 0.0004001644618109389, 'samples': 8764224, 'steps': 45646, 'loss/train': 2.0204715728759766} -11/07/2021 03:41:09 - INFO - __main__ - Step 45648: {'lr': 0.00040016021900214497, 'samples': 8764416, 'steps': 45647, 'loss/train': 1.0654419660568237} -11/07/2021 03:41:09 - INFO - __main__ - Step 45649: {'lr': 0.00040015597612569115, 'samples': 8764608, 'steps': 45648, 'loss/train': 1.324616551399231} -11/07/2021 03:41:10 - INFO - __main__ - Step 45650: {'lr': 0.00040015173318157937, 'samples': 8764800, 'steps': 45649, 'loss/train': 1.0149785280227661} -11/07/2021 03:41:10 - INFO - __main__ - Step 45651: {'lr': 0.00040014749016981154, 'samples': 8764992, 'steps': 45650, 'loss/train': 1.5370380878448486} -11/07/2021 03:41:11 - INFO - __main__ - Step 45652: {'lr': 0.00040014324709038965, 'samples': 8765184, 'steps': 45651, 'loss/train': 1.5011380910873413} -11/07/2021 03:41:12 - INFO - __main__ - Step 45653: {'lr': 0.00040013900394331544, 'samples': 8765376, 'steps': 45652, 'loss/train': 1.340386152267456} -11/07/2021 03:41:12 - INFO - __main__ - Step 45654: {'lr': 0.0004001347607285909, 'samples': 8765568, 'steps': 45653, 'loss/train': 1.6123696565628052} -11/07/2021 03:41:12 - INFO - __main__ - Step 45655: {'lr': 0.000400130517446218, 'samples': 8765760, 'steps': 45654, 'loss/train': 1.710909128189087} -11/07/2021 03:41:13 - INFO - __main__ - Step 45656: {'lr': 0.00040012627409619853, 'samples': 8765952, 'steps': 45655, 'loss/train': 1.3030675649642944} -11/07/2021 03:41:13 - INFO - __main__ - Step 45657: {'lr': 0.00040012203067853457, 'samples': 8766144, 'steps': 45656, 'loss/train': 1.6493674516677856} -11/07/2021 03:41:14 - INFO - __main__ - Step 45658: {'lr': 0.0004001177871932279, 'samples': 8766336, 'steps': 45657, 'loss/train': 1.0549403429031372} -11/07/2021 03:41:15 - INFO - __main__ - Step 45659: {'lr': 0.00040011354364028053, 'samples': 8766528, 'steps': 45658, 'loss/train': 1.245045781135559} -11/07/2021 03:41:15 - INFO - __main__ - Step 45660: {'lr': 0.00040010930001969426, 'samples': 8766720, 'steps': 45659, 'loss/train': 0.8746814727783203} -11/07/2021 03:41:15 - INFO - __main__ - Step 45661: {'lr': 0.00040010505633147106, 'samples': 8766912, 'steps': 45660, 'loss/train': 0.6673946976661682} -11/07/2021 03:41:16 - INFO - __main__ - Step 45662: {'lr': 0.00040010081257561283, 'samples': 8767104, 'steps': 45661, 'loss/train': 0.17925159633159637} -11/07/2021 03:41:17 - INFO - __main__ - Step 45663: {'lr': 0.0004000965687521215, 'samples': 8767296, 'steps': 45662, 'loss/train': 1.4898158311843872} -11/07/2021 03:41:17 - INFO - __main__ - Step 45664: {'lr': 0.0004000923248609989, 'samples': 8767488, 'steps': 45663, 'loss/train': 1.8594963550567627} -11/07/2021 03:41:17 - INFO - __main__ - Step 45665: {'lr': 0.00040008808090224714, 'samples': 8767680, 'steps': 45664, 'loss/train': 1.7202855348587036} -11/07/2021 03:41:18 - INFO - __main__ - Step 45666: {'lr': 0.0004000838368758679, 'samples': 8767872, 'steps': 45665, 'loss/train': 1.6891522407531738} -11/07/2021 03:41:18 - INFO - __main__ - Step 45667: {'lr': 0.00040007959278186327, 'samples': 8768064, 'steps': 45666, 'loss/train': 1.3225188255310059} -11/07/2021 03:41:19 - INFO - __main__ - Step 45668: {'lr': 0.0004000753486202351, 'samples': 8768256, 'steps': 45667, 'loss/train': 1.238524317741394} -11/07/2021 03:41:20 - INFO - __main__ - Step 45669: {'lr': 0.0004000711043909853, 'samples': 8768448, 'steps': 45668, 'loss/train': 1.3674970865249634} -11/07/2021 03:41:20 - INFO - __main__ - Step 45670: {'lr': 0.0004000668600941157, 'samples': 8768640, 'steps': 45669, 'loss/train': 1.4492086172103882} -11/07/2021 03:41:20 - INFO - __main__ - Step 45671: {'lr': 0.00040006261572962833, 'samples': 8768832, 'steps': 45670, 'loss/train': 1.239437222480774} -11/07/2021 03:41:21 - INFO - __main__ - Step 45672: {'lr': 0.00040005837129752496, 'samples': 8769024, 'steps': 45671, 'loss/train': 1.1618527173995972} -11/07/2021 03:41:22 - INFO - __main__ - Step 45673: {'lr': 0.00040005412679780777, 'samples': 8769216, 'steps': 45672, 'loss/train': 1.4424184560775757} -11/07/2021 03:41:22 - INFO - __main__ - Step 45674: {'lr': 0.00040004988223047843, 'samples': 8769408, 'steps': 45673, 'loss/train': 1.3270950317382812} -11/07/2021 03:41:22 - INFO - __main__ - Step 45675: {'lr': 0.0004000456375955389, 'samples': 8769600, 'steps': 45674, 'loss/train': 1.350642442703247} -11/07/2021 03:41:23 - INFO - __main__ - Step 45676: {'lr': 0.00040004139289299127, 'samples': 8769792, 'steps': 45675, 'loss/train': 1.709375023841858} -11/07/2021 03:41:23 - INFO - __main__ - Step 45677: {'lr': 0.0004000371481228371, 'samples': 8769984, 'steps': 45676, 'loss/train': 1.4423998594284058} -11/07/2021 03:41:24 - INFO - __main__ - Step 45678: {'lr': 0.00040003290328507855, 'samples': 8770176, 'steps': 45677, 'loss/train': 1.486462116241455} -11/07/2021 03:41:25 - INFO - __main__ - Step 45679: {'lr': 0.0004000286583797176, 'samples': 8770368, 'steps': 45678, 'loss/train': 1.642520546913147} -11/07/2021 03:41:25 - INFO - __main__ - Step 45680: {'lr': 0.000400024413406756, 'samples': 8770560, 'steps': 45679, 'loss/train': 1.4172120094299316} -11/07/2021 03:41:25 - INFO - __main__ - Step 45681: {'lr': 0.0004000201683661957, 'samples': 8770752, 'steps': 45680, 'loss/train': 1.7763307094573975} -11/07/2021 03:41:26 - INFO - __main__ - Step 45682: {'lr': 0.0004000159232580386, 'samples': 8770944, 'steps': 45681, 'loss/train': 1.6562503576278687} -11/07/2021 03:41:27 - INFO - __main__ - Step 45683: {'lr': 0.0004000116780822867, 'samples': 8771136, 'steps': 45682, 'loss/train': 1.8312898874282837} -11/07/2021 03:41:27 - INFO - __main__ - Step 45684: {'lr': 0.0004000074328389418, 'samples': 8771328, 'steps': 45683, 'loss/train': 1.7056604623794556} -11/07/2021 03:41:28 - INFO - __main__ - Step 45685: {'lr': 0.0004000031875280059, 'samples': 8771520, 'steps': 45684, 'loss/train': 1.4973245859146118} -11/07/2021 03:41:28 - INFO - __main__ - Step 45686: {'lr': 0.00039999894214948087, 'samples': 8771712, 'steps': 45685, 'loss/train': 1.3996328115463257} -11/07/2021 03:41:28 - INFO - __main__ - Step 45687: {'lr': 0.00039999469670336864, 'samples': 8771904, 'steps': 45686, 'loss/train': 0.9094541072845459} -11/07/2021 03:41:29 - INFO - __main__ - Step 45688: {'lr': 0.0003999904511896711, 'samples': 8772096, 'steps': 45687, 'loss/train': 1.5477782487869263} -11/07/2021 03:41:30 - INFO - __main__ - Step 45689: {'lr': 0.00039998620560839014, 'samples': 8772288, 'steps': 45688, 'loss/train': 1.755375862121582} -11/07/2021 03:41:30 - INFO - __main__ - Step 45690: {'lr': 0.0003999819599595278, 'samples': 8772480, 'steps': 45689, 'loss/train': 1.5153800249099731} -11/07/2021 03:41:30 - INFO - __main__ - Step 45691: {'lr': 0.00039997771424308583, 'samples': 8772672, 'steps': 45690, 'loss/train': 1.8970978260040283} -11/07/2021 03:41:31 - INFO - __main__ - Step 45692: {'lr': 0.0003999734684590662, 'samples': 8772864, 'steps': 45691, 'loss/train': 1.9008773565292358} -11/07/2021 03:41:31 - INFO - __main__ - Step 45693: {'lr': 0.0003999692226074709, 'samples': 8773056, 'steps': 45692, 'loss/train': 1.364372968673706} -11/07/2021 03:41:32 - INFO - __main__ - Step 45694: {'lr': 0.0003999649766883018, 'samples': 8773248, 'steps': 45693, 'loss/train': 1.855595588684082} -11/07/2021 03:41:32 - INFO - __main__ - Step 45695: {'lr': 0.0003999607307015607, 'samples': 8773440, 'steps': 45694, 'loss/train': 0.847008466720581} -11/07/2021 03:41:33 - INFO - __main__ - Step 45696: {'lr': 0.00039995648464724966, 'samples': 8773632, 'steps': 45695, 'loss/train': 1.5284357070922852} -11/07/2021 03:41:33 - INFO - __main__ - Step 45697: {'lr': 0.00039995223852537054, 'samples': 8773824, 'steps': 45696, 'loss/train': 1.5149009227752686} -11/07/2021 03:41:34 - INFO - __main__ - Step 45698: {'lr': 0.0003999479923359253, 'samples': 8774016, 'steps': 45697, 'loss/train': 1.5185508728027344} -11/07/2021 03:41:34 - INFO - __main__ - Step 45699: {'lr': 0.0003999437460789157, 'samples': 8774208, 'steps': 45698, 'loss/train': 1.335496425628662} -11/07/2021 03:41:35 - INFO - __main__ - Step 45700: {'lr': 0.0003999394997543439, 'samples': 8774400, 'steps': 45699, 'loss/train': 0.5011448264122009} -11/07/2021 03:41:35 - INFO - __main__ - Step 45701: {'lr': 0.0003999352533622116, 'samples': 8774592, 'steps': 45700, 'loss/train': 2.193835973739624} -11/07/2021 03:41:36 - INFO - __main__ - Step 45702: {'lr': 0.00039993100690252084, 'samples': 8774784, 'steps': 45701, 'loss/train': 1.5538792610168457} -11/07/2021 03:41:36 - INFO - __main__ - Step 45703: {'lr': 0.00039992676037527337, 'samples': 8774976, 'steps': 45702, 'loss/train': 1.1894370317459106} -11/07/2021 03:41:36 - INFO - __main__ - Step 45704: {'lr': 0.0003999225137804713, 'samples': 8775168, 'steps': 45703, 'loss/train': 1.1973448991775513} -11/07/2021 03:41:37 - INFO - __main__ - Step 45705: {'lr': 0.0003999182671181164, 'samples': 8775360, 'steps': 45704, 'loss/train': 1.148694396018982} -11/07/2021 03:41:38 - INFO - __main__ - Step 45706: {'lr': 0.00039991402038821067, 'samples': 8775552, 'steps': 45705, 'loss/train': 1.6992937326431274} -11/07/2021 03:41:38 - INFO - __main__ - Step 45707: {'lr': 0.00039990977359075607, 'samples': 8775744, 'steps': 45706, 'loss/train': 1.647392988204956} -11/07/2021 03:41:38 - INFO - __main__ - Step 45708: {'lr': 0.00039990552672575436, 'samples': 8775936, 'steps': 45707, 'loss/train': 1.611392617225647} -11/07/2021 03:41:39 - INFO - __main__ - Step 45709: {'lr': 0.00039990127979320757, 'samples': 8776128, 'steps': 45708, 'loss/train': 1.4701683521270752} -11/07/2021 03:41:39 - INFO - __main__ - Step 45710: {'lr': 0.00039989703279311753, 'samples': 8776320, 'steps': 45709, 'loss/train': 1.3313275575637817} -11/07/2021 03:41:40 - INFO - __main__ - Step 45711: {'lr': 0.00039989278572548625, 'samples': 8776512, 'steps': 45710, 'loss/train': 1.3801134824752808} -11/07/2021 03:41:41 - INFO - __main__ - Step 45712: {'lr': 0.00039988853859031557, 'samples': 8776704, 'steps': 45711, 'loss/train': 1.8523447513580322} -11/07/2021 03:41:41 - INFO - __main__ - Step 45713: {'lr': 0.0003998842913876074, 'samples': 8776896, 'steps': 45712, 'loss/train': 1.0423424243927002} -11/07/2021 03:41:41 - INFO - __main__ - Step 45714: {'lr': 0.0003998800441173637, 'samples': 8777088, 'steps': 45713, 'loss/train': 1.2443095445632935} -11/07/2021 03:41:42 - INFO - __main__ - Step 45715: {'lr': 0.00039987579677958643, 'samples': 8777280, 'steps': 45714, 'loss/train': 1.7403079271316528} -11/07/2021 03:41:42 - INFO - __main__ - Step 45716: {'lr': 0.0003998715493742774, 'samples': 8777472, 'steps': 45715, 'loss/train': 1.786270260810852} -11/07/2021 03:41:43 - INFO - __main__ - Step 45717: {'lr': 0.0003998673019014385, 'samples': 8777664, 'steps': 45716, 'loss/train': 1.768802523612976} -11/07/2021 03:41:43 - INFO - __main__ - Step 45718: {'lr': 0.0003998630543610717, 'samples': 8777856, 'steps': 45717, 'loss/train': 1.3839589357376099} -11/07/2021 03:41:44 - INFO - __main__ - Step 45719: {'lr': 0.00039985880675317897, 'samples': 8778048, 'steps': 45718, 'loss/train': 1.6259337663650513} -11/07/2021 03:41:44 - INFO - __main__ - Step 45720: {'lr': 0.0003998545590777622, 'samples': 8778240, 'steps': 45719, 'loss/train': 1.936063289642334} -11/07/2021 03:41:45 - INFO - __main__ - Step 45721: {'lr': 0.0003998503113348233, 'samples': 8778432, 'steps': 45720, 'loss/train': 1.554116129875183} -11/07/2021 03:41:46 - INFO - __main__ - Step 45722: {'lr': 0.0003998460635243641, 'samples': 8778624, 'steps': 45721, 'loss/train': 1.700764536857605} -11/07/2021 03:41:46 - INFO - __main__ - Step 45723: {'lr': 0.00039984181564638654, 'samples': 8778816, 'steps': 45722, 'loss/train': 1.6266900300979614} -11/07/2021 03:41:46 - INFO - __main__ - Step 45724: {'lr': 0.00039983756770089264, 'samples': 8779008, 'steps': 45723, 'loss/train': 0.8411117792129517} -11/07/2021 03:41:47 - INFO - __main__ - Step 45725: {'lr': 0.0003998333196878843, 'samples': 8779200, 'steps': 45724, 'loss/train': 1.3577433824539185} -11/07/2021 03:41:47 - INFO - __main__ - Step 45726: {'lr': 0.00039982907160736325, 'samples': 8779392, 'steps': 45725, 'loss/train': 1.300414800643921} -11/07/2021 03:41:47 - INFO - __main__ - Step 45727: {'lr': 0.00039982482345933155, 'samples': 8779584, 'steps': 45726, 'loss/train': 1.2126566171646118} -11/07/2021 03:41:48 - INFO - __main__ - Step 45728: {'lr': 0.00039982057524379124, 'samples': 8779776, 'steps': 45727, 'loss/train': 1.459671974182129} -11/07/2021 03:41:49 - INFO - __main__ - Step 45729: {'lr': 0.00039981632696074396, 'samples': 8779968, 'steps': 45728, 'loss/train': 1.786897897720337} -11/07/2021 03:41:49 - INFO - __main__ - Step 45730: {'lr': 0.00039981207861019175, 'samples': 8780160, 'steps': 45729, 'loss/train': 1.1281368732452393} -11/07/2021 03:41:49 - INFO - __main__ - Step 45731: {'lr': 0.0003998078301921365, 'samples': 8780352, 'steps': 45730, 'loss/train': 1.603014349937439} -11/07/2021 03:41:50 - INFO - __main__ - Step 45732: {'lr': 0.00039980358170658026, 'samples': 8780544, 'steps': 45731, 'loss/train': 1.6706631183624268} -11/07/2021 03:41:51 - INFO - __main__ - Step 45733: {'lr': 0.0003997993331535248, 'samples': 8780736, 'steps': 45732, 'loss/train': 1.5991101264953613} -11/07/2021 03:41:51 - INFO - __main__ - Step 45734: {'lr': 0.0003997950845329721, 'samples': 8780928, 'steps': 45733, 'loss/train': 1.6309759616851807} -11/07/2021 03:41:52 - INFO - __main__ - Step 45735: {'lr': 0.000399790835844924, 'samples': 8781120, 'steps': 45734, 'loss/train': 1.2797209024429321} -11/07/2021 03:41:52 - INFO - __main__ - Step 45736: {'lr': 0.00039978658708938244, 'samples': 8781312, 'steps': 45735, 'loss/train': 1.7494573593139648} -11/07/2021 03:41:52 - INFO - __main__ - Step 45737: {'lr': 0.00039978233826634934, 'samples': 8781504, 'steps': 45736, 'loss/train': 1.0572928190231323} -11/07/2021 03:41:54 - INFO - __main__ - Step 45738: {'lr': 0.0003997780893758267, 'samples': 8781696, 'steps': 45737, 'loss/train': 1.5383487939834595} -11/07/2021 03:41:54 - INFO - __main__ - Step 45739: {'lr': 0.0003997738404178164, 'samples': 8781888, 'steps': 45738, 'loss/train': 2.2209999561309814} -11/07/2021 03:41:54 - INFO - __main__ - Step 45740: {'lr': 0.00039976959139232017, 'samples': 8782080, 'steps': 45739, 'loss/train': 1.2510405778884888} -11/07/2021 03:41:55 - INFO - __main__ - Step 45741: {'lr': 0.0003997653422993402, 'samples': 8782272, 'steps': 45740, 'loss/train': 1.1893982887268066} -11/07/2021 03:41:55 - INFO - __main__ - Step 45742: {'lr': 0.0003997610931388782, 'samples': 8782464, 'steps': 45741, 'loss/train': 1.5910414457321167} -11/07/2021 03:41:56 - INFO - __main__ - Step 45743: {'lr': 0.0003997568439109363, 'samples': 8782656, 'steps': 45742, 'loss/train': 1.802226185798645} -11/07/2021 03:41:56 - INFO - __main__ - Step 45744: {'lr': 0.00039975259461551613, 'samples': 8782848, 'steps': 45743, 'loss/train': 1.9506511688232422} -11/07/2021 03:41:57 - INFO - __main__ - Step 45745: {'lr': 0.0003997483452526198, 'samples': 8783040, 'steps': 45744, 'loss/train': 1.4046062231063843} -11/07/2021 03:41:57 - INFO - __main__ - Step 45746: {'lr': 0.0003997440958222491, 'samples': 8783232, 'steps': 45745, 'loss/train': 1.6467649936676025} -11/07/2021 03:41:57 - INFO - __main__ - Step 45747: {'lr': 0.0003997398463244062, 'samples': 8783424, 'steps': 45746, 'loss/train': 1.4050190448760986} -11/07/2021 03:41:59 - INFO - __main__ - Step 45748: {'lr': 0.00039973559675909274, 'samples': 8783616, 'steps': 45747, 'loss/train': 1.5863054990768433} -11/07/2021 03:41:59 - INFO - __main__ - Step 45749: {'lr': 0.00039973134712631067, 'samples': 8783808, 'steps': 45748, 'loss/train': 1.5905817747116089} -11/07/2021 03:41:59 - INFO - __main__ - Step 45750: {'lr': 0.00039972709742606207, 'samples': 8784000, 'steps': 45749, 'loss/train': 1.5976406335830688} -11/07/2021 03:42:00 - INFO - __main__ - Step 45751: {'lr': 0.00039972284765834866, 'samples': 8784192, 'steps': 45750, 'loss/train': 1.4078799486160278} -11/07/2021 03:42:00 - INFO - __main__ - Step 45752: {'lr': 0.00039971859782317245, 'samples': 8784384, 'steps': 45751, 'loss/train': 0.5994760990142822} -11/07/2021 03:42:01 - INFO - __main__ - Step 45753: {'lr': 0.0003997143479205354, 'samples': 8784576, 'steps': 45752, 'loss/train': 1.6960455179214478} -11/07/2021 03:42:01 - INFO - __main__ - Step 45754: {'lr': 0.0003997100979504394, 'samples': 8784768, 'steps': 45753, 'loss/train': 1.2282835245132446} -11/07/2021 03:42:02 - INFO - __main__ - Step 45755: {'lr': 0.00039970584791288626, 'samples': 8784960, 'steps': 45754, 'loss/train': 1.7166662216186523} -11/07/2021 03:42:02 - INFO - __main__ - Step 45756: {'lr': 0.000399701597807878, 'samples': 8785152, 'steps': 45755, 'loss/train': 1.2824113368988037} -11/07/2021 03:42:02 - INFO - __main__ - Step 45757: {'lr': 0.00039969734763541657, 'samples': 8785344, 'steps': 45756, 'loss/train': 0.9290876984596252} -11/07/2021 03:42:03 - INFO - __main__ - Step 45758: {'lr': 0.00039969309739550373, 'samples': 8785536, 'steps': 45757, 'loss/train': 1.5645976066589355} -11/07/2021 03:42:04 - INFO - __main__ - Step 45759: {'lr': 0.0003996888470881416, 'samples': 8785728, 'steps': 45758, 'loss/train': 1.6670734882354736} -11/07/2021 03:42:04 - INFO - __main__ - Step 45760: {'lr': 0.0003996845967133319, 'samples': 8785920, 'steps': 45759, 'loss/train': 1.7307648658752441} -11/07/2021 03:42:04 - INFO - __main__ - Step 45761: {'lr': 0.0003996803462710766, 'samples': 8786112, 'steps': 45760, 'loss/train': 1.9626553058624268} -11/07/2021 03:42:05 - INFO - __main__ - Step 45762: {'lr': 0.00039967609576137774, 'samples': 8786304, 'steps': 45761, 'loss/train': 1.5805244445800781} -11/07/2021 03:42:05 - INFO - __main__ - Step 45763: {'lr': 0.0003996718451842371, 'samples': 8786496, 'steps': 45762, 'loss/train': 1.5933947563171387} -11/07/2021 03:42:06 - INFO - __main__ - Step 45764: {'lr': 0.00039966759453965664, 'samples': 8786688, 'steps': 45763, 'loss/train': 2.0527541637420654} -11/07/2021 03:42:07 - INFO - __main__ - Step 45765: {'lr': 0.00039966334382763826, 'samples': 8786880, 'steps': 45764, 'loss/train': 1.156002402305603} -11/07/2021 03:42:07 - INFO - __main__ - Step 45766: {'lr': 0.00039965909304818387, 'samples': 8787072, 'steps': 45765, 'loss/train': 0.7822408080101013} -11/07/2021 03:42:07 - INFO - __main__ - Step 45767: {'lr': 0.00039965484220129546, 'samples': 8787264, 'steps': 45766, 'loss/train': 1.55080246925354} -11/07/2021 03:42:08 - INFO - __main__ - Step 45768: {'lr': 0.0003996505912869749, 'samples': 8787456, 'steps': 45767, 'loss/train': 1.7155765295028687} -11/07/2021 03:42:09 - INFO - __main__ - Step 45769: {'lr': 0.000399646340305224, 'samples': 8787648, 'steps': 45768, 'loss/train': 1.4348912239074707} -11/07/2021 03:42:09 - INFO - __main__ - Step 45770: {'lr': 0.00039964208925604485, 'samples': 8787840, 'steps': 45769, 'loss/train': 0.3281099200248718} -11/07/2021 03:42:09 - INFO - __main__ - Step 45771: {'lr': 0.0003996378381394392, 'samples': 8788032, 'steps': 45770, 'loss/train': 1.5719586610794067} -11/07/2021 03:42:10 - INFO - __main__ - Step 45772: {'lr': 0.00039963358695540907, 'samples': 8788224, 'steps': 45771, 'loss/train': 1.2992075681686401} -11/07/2021 03:42:10 - INFO - __main__ - Step 45773: {'lr': 0.0003996293357039564, 'samples': 8788416, 'steps': 45772, 'loss/train': 1.2013145685195923} -11/07/2021 03:42:11 - INFO - __main__ - Step 45774: {'lr': 0.0003996250843850831, 'samples': 8788608, 'steps': 45773, 'loss/train': 1.9157236814498901} -11/07/2021 03:42:11 - INFO - __main__ - Step 45775: {'lr': 0.000399620832998791, 'samples': 8788800, 'steps': 45774, 'loss/train': 1.9511425495147705} -11/07/2021 03:42:12 - INFO - __main__ - Step 45776: {'lr': 0.000399616581545082, 'samples': 8788992, 'steps': 45775, 'loss/train': 1.366453766822815} -11/07/2021 03:42:12 - INFO - __main__ - Step 45777: {'lr': 0.0003996123300239581, 'samples': 8789184, 'steps': 45776, 'loss/train': 1.2759289741516113} -11/07/2021 03:42:12 - INFO - __main__ - Step 45778: {'lr': 0.0003996080784354212, 'samples': 8789376, 'steps': 45777, 'loss/train': 1.4267598390579224} -11/07/2021 03:42:13 - INFO - __main__ - Step 45779: {'lr': 0.0003996038267794733, 'samples': 8789568, 'steps': 45778, 'loss/train': 1.9631978273391724} -11/07/2021 03:42:14 - INFO - __main__ - Step 45780: {'lr': 0.0003995995750561161, 'samples': 8789760, 'steps': 45779, 'loss/train': 1.7855234146118164} -11/07/2021 03:42:14 - INFO - __main__ - Step 45781: {'lr': 0.00039959532326535175, 'samples': 8789952, 'steps': 45780, 'loss/train': 1.3308883905410767} -11/07/2021 03:42:15 - INFO - __main__ - Step 45782: {'lr': 0.000399591071407182, 'samples': 8790144, 'steps': 45781, 'loss/train': 1.2953991889953613} -11/07/2021 03:42:15 - INFO - __main__ - Step 45783: {'lr': 0.0003995868194816088, 'samples': 8790336, 'steps': 45782, 'loss/train': 1.6726969480514526} -11/07/2021 03:42:15 - INFO - __main__ - Step 45784: {'lr': 0.0003995825674886341, 'samples': 8790528, 'steps': 45783, 'loss/train': 1.6071983575820923} -11/07/2021 03:42:16 - INFO - __main__ - Step 45785: {'lr': 0.00039957831542825983, 'samples': 8790720, 'steps': 45784, 'loss/train': 1.026556372642517} -11/07/2021 03:42:17 - INFO - __main__ - Step 45786: {'lr': 0.0003995740633004878, 'samples': 8790912, 'steps': 45785, 'loss/train': 1.1194347143173218} -11/07/2021 03:42:17 - INFO - __main__ - Step 45787: {'lr': 0.00039956981110532007, 'samples': 8791104, 'steps': 45786, 'loss/train': 1.8880589008331299} -11/07/2021 03:42:17 - INFO - __main__ - Step 45788: {'lr': 0.0003995655588427586, 'samples': 8791296, 'steps': 45787, 'loss/train': 1.363681674003601} -11/07/2021 03:42:18 - INFO - __main__ - Step 45789: {'lr': 0.00039956130651280504, 'samples': 8791488, 'steps': 45788, 'loss/train': 1.6982097625732422} -11/07/2021 03:42:19 - INFO - __main__ - Step 45790: {'lr': 0.0003995570541154615, 'samples': 8791680, 'steps': 45789, 'loss/train': 1.8806573152542114} -11/07/2021 03:42:19 - INFO - __main__ - Step 45791: {'lr': 0.0003995528016507298, 'samples': 8791872, 'steps': 45790, 'loss/train': 1.3060063123703003} -11/07/2021 03:42:19 - INFO - __main__ - Step 45792: {'lr': 0.000399548549118612, 'samples': 8792064, 'steps': 45791, 'loss/train': 1.6437419652938843} -11/07/2021 03:42:20 - INFO - __main__ - Step 45793: {'lr': 0.00039954429651910993, 'samples': 8792256, 'steps': 45792, 'loss/train': 1.2622495889663696} -11/07/2021 03:42:20 - INFO - __main__ - Step 45794: {'lr': 0.00039954004385222555, 'samples': 8792448, 'steps': 45793, 'loss/train': 1.5217324495315552} -11/07/2021 03:42:21 - INFO - __main__ - Step 45795: {'lr': 0.00039953579111796065, 'samples': 8792640, 'steps': 45794, 'loss/train': 1.6628124713897705} -11/07/2021 03:42:21 - INFO - __main__ - Step 45796: {'lr': 0.00039953153831631726, 'samples': 8792832, 'steps': 45795, 'loss/train': 1.499194622039795} -11/07/2021 03:42:22 - INFO - __main__ - Step 45797: {'lr': 0.0003995272854472972, 'samples': 8793024, 'steps': 45796, 'loss/train': 1.5747181177139282} -11/07/2021 03:42:22 - INFO - __main__ - Step 45798: {'lr': 0.00039952303251090254, 'samples': 8793216, 'steps': 45797, 'loss/train': 1.9704207181930542} -11/07/2021 03:42:22 - INFO - __main__ - Step 45799: {'lr': 0.00039951877950713513, 'samples': 8793408, 'steps': 45798, 'loss/train': 1.6811201572418213} -11/07/2021 03:42:23 - INFO - __main__ - Step 45800: {'lr': 0.0003995145264359968, 'samples': 8793600, 'steps': 45799, 'loss/train': 1.8199926614761353} -11/07/2021 03:42:24 - INFO - __main__ - Step 45801: {'lr': 0.00039951027329748957, 'samples': 8793792, 'steps': 45800, 'loss/train': 1.422680377960205} -11/07/2021 03:42:24 - INFO - __main__ - Step 45802: {'lr': 0.0003995060200916153, 'samples': 8793984, 'steps': 45801, 'loss/train': 1.3478022813796997} -11/07/2021 03:42:24 - INFO - __main__ - Step 45803: {'lr': 0.0003995017668183759, 'samples': 8794176, 'steps': 45802, 'loss/train': 1.246759057044983} -11/07/2021 03:42:25 - INFO - __main__ - Step 45804: {'lr': 0.0003994975134777733, 'samples': 8794368, 'steps': 45803, 'loss/train': 1.6146609783172607} -11/07/2021 03:42:26 - INFO - __main__ - Step 45805: {'lr': 0.00039949326006980944, 'samples': 8794560, 'steps': 45804, 'loss/train': 1.7832012176513672} -11/07/2021 03:42:26 - INFO - __main__ - Step 45806: {'lr': 0.0003994890065944863, 'samples': 8794752, 'steps': 45805, 'loss/train': 1.466225504875183} -11/07/2021 03:42:27 - INFO - __main__ - Step 45807: {'lr': 0.00039948475305180567, 'samples': 8794944, 'steps': 45806, 'loss/train': 1.4615516662597656} -11/07/2021 03:42:27 - INFO - __main__ - Step 45808: {'lr': 0.0003994804994417695, 'samples': 8795136, 'steps': 45807, 'loss/train': 1.4964948892593384} -11/07/2021 03:42:27 - INFO - __main__ - Step 45809: {'lr': 0.0003994762457643797, 'samples': 8795328, 'steps': 45808, 'loss/train': 1.6247048377990723} -11/07/2021 03:42:28 - INFO - __main__ - Step 45810: {'lr': 0.0003994719920196383, 'samples': 8795520, 'steps': 45809, 'loss/train': 1.7376784086227417} -11/07/2021 03:42:29 - INFO - __main__ - Step 45811: {'lr': 0.00039946773820754704, 'samples': 8795712, 'steps': 45810, 'loss/train': 1.5790966749191284} -11/07/2021 03:42:29 - INFO - __main__ - Step 45812: {'lr': 0.00039946348432810797, 'samples': 8795904, 'steps': 45811, 'loss/train': 1.4171829223632812} -11/07/2021 03:42:29 - INFO - __main__ - Step 45813: {'lr': 0.0003994592303813229, 'samples': 8796096, 'steps': 45812, 'loss/train': 1.3879013061523438} -11/07/2021 03:42:30 - INFO - __main__ - Step 45814: {'lr': 0.00039945497636719384, 'samples': 8796288, 'steps': 45813, 'loss/train': 1.4347091913223267} -11/07/2021 03:42:30 - INFO - __main__ - Step 45815: {'lr': 0.00039945072228572275, 'samples': 8796480, 'steps': 45814, 'loss/train': 0.9813772439956665} -11/07/2021 03:42:31 - INFO - __main__ - Step 45816: {'lr': 0.0003994464681369114, 'samples': 8796672, 'steps': 45815, 'loss/train': 1.7121654748916626} -11/07/2021 03:42:32 - INFO - __main__ - Step 45817: {'lr': 0.0003994422139207618, 'samples': 8796864, 'steps': 45816, 'loss/train': 1.9688409566879272} -11/07/2021 03:42:32 - INFO - __main__ - Step 45818: {'lr': 0.00039943795963727583, 'samples': 8797056, 'steps': 45817, 'loss/train': 1.3847655057907104} -11/07/2021 03:42:32 - INFO - __main__ - Step 45819: {'lr': 0.0003994337052864554, 'samples': 8797248, 'steps': 45818, 'loss/train': 1.5700711011886597} -11/07/2021 03:42:33 - INFO - __main__ - Step 45820: {'lr': 0.00039942945086830246, 'samples': 8797440, 'steps': 45819, 'loss/train': 2.300741195678711} -11/07/2021 03:42:34 - INFO - __main__ - Step 45821: {'lr': 0.00039942519638281893, 'samples': 8797632, 'steps': 45820, 'loss/train': 1.5391618013381958} -11/07/2021 03:42:34 - INFO - __main__ - Step 45822: {'lr': 0.0003994209418300068, 'samples': 8797824, 'steps': 45821, 'loss/train': 1.2126270532608032} -11/07/2021 03:42:34 - INFO - __main__ - Step 45823: {'lr': 0.0003994166872098677, 'samples': 8798016, 'steps': 45822, 'loss/train': 1.7054393291473389} -11/07/2021 03:42:35 - INFO - __main__ - Step 45824: {'lr': 0.0003994124325224039, 'samples': 8798208, 'steps': 45823, 'loss/train': 1.7563220262527466} -11/07/2021 03:42:35 - INFO - __main__ - Step 45825: {'lr': 0.00039940817776761706, 'samples': 8798400, 'steps': 45824, 'loss/train': 1.543555498123169} -11/07/2021 03:42:37 - INFO - __main__ - Step 45826: {'lr': 0.0003994039229455093, 'samples': 8798592, 'steps': 45825, 'loss/train': 1.7660768032073975} -11/07/2021 03:42:37 - INFO - __main__ - Step 45827: {'lr': 0.00039939966805608234, 'samples': 8798784, 'steps': 45826, 'loss/train': 0.9904483556747437} -11/07/2021 03:42:38 - INFO - __main__ - Step 45828: {'lr': 0.0003993954130993383, 'samples': 8798976, 'steps': 45827, 'loss/train': 1.0330867767333984} -11/07/2021 03:42:38 - INFO - __main__ - Step 45829: {'lr': 0.0003993911580752789, 'samples': 8799168, 'steps': 45828, 'loss/train': 1.1959236860275269} -11/07/2021 03:42:38 - INFO - __main__ - Step 45830: {'lr': 0.00039938690298390624, 'samples': 8799360, 'steps': 45829, 'loss/train': 1.4125633239746094} -11/07/2021 03:42:39 - INFO - __main__ - Step 45831: {'lr': 0.00039938264782522206, 'samples': 8799552, 'steps': 45830, 'loss/train': 1.7893304824829102} -11/07/2021 03:42:39 - INFO - __main__ - Step 45832: {'lr': 0.0003993783925992284, 'samples': 8799744, 'steps': 45831, 'loss/train': 0.11289530247449875} -11/07/2021 03:42:40 - INFO - __main__ - Step 45833: {'lr': 0.00039937413730592713, 'samples': 8799936, 'steps': 45832, 'loss/train': 1.5255755186080933} -11/07/2021 03:42:40 - INFO - __main__ - Step 45834: {'lr': 0.0003993698819453202, 'samples': 8800128, 'steps': 45833, 'loss/train': 1.3934648036956787} -11/07/2021 03:42:41 - INFO - __main__ - Step 45835: {'lr': 0.00039936562651740956, 'samples': 8800320, 'steps': 45834, 'loss/train': 1.3922640085220337} -11/07/2021 03:42:41 - INFO - __main__ - Step 45836: {'lr': 0.00039936137102219695, 'samples': 8800512, 'steps': 45835, 'loss/train': 1.3778247833251953} -11/07/2021 03:42:41 - INFO - __main__ - Step 45837: {'lr': 0.0003993571154596845, 'samples': 8800704, 'steps': 45836, 'loss/train': 1.7465338706970215} -11/07/2021 03:42:43 - INFO - __main__ - Step 45838: {'lr': 0.00039935285982987403, 'samples': 8800896, 'steps': 45837, 'loss/train': 1.6409074068069458} -11/07/2021 03:42:43 - INFO - __main__ - Step 45839: {'lr': 0.0003993486041327674, 'samples': 8801088, 'steps': 45838, 'loss/train': 1.664171814918518} -11/07/2021 03:42:43 - INFO - __main__ - Step 45840: {'lr': 0.00039934434836836664, 'samples': 8801280, 'steps': 45839, 'loss/train': 1.5493240356445312} -11/07/2021 03:42:44 - INFO - __main__ - Step 45841: {'lr': 0.00039934009253667356, 'samples': 8801472, 'steps': 45840, 'loss/train': 1.693857192993164} -11/07/2021 03:42:44 - INFO - __main__ - Step 45842: {'lr': 0.0003993358366376903, 'samples': 8801664, 'steps': 45841, 'loss/train': 0.4450680911540985} -11/07/2021 03:42:44 - INFO - __main__ - Step 45843: {'lr': 0.0003993315806714185, 'samples': 8801856, 'steps': 45842, 'loss/train': 1.3008158206939697} -11/07/2021 03:42:45 - INFO - __main__ - Step 45844: {'lr': 0.0003993273246378602, 'samples': 8802048, 'steps': 45843, 'loss/train': 0.5249027609825134} -11/07/2021 03:42:46 - INFO - __main__ - Step 45845: {'lr': 0.00039932306853701735, 'samples': 8802240, 'steps': 45844, 'loss/train': 1.738145351409912} -11/07/2021 03:42:46 - INFO - __main__ - Step 45846: {'lr': 0.0003993188123688918, 'samples': 8802432, 'steps': 45845, 'loss/train': 1.5204349756240845} -11/07/2021 03:42:46 - INFO - __main__ - Step 45847: {'lr': 0.00039931455613348546, 'samples': 8802624, 'steps': 45846, 'loss/train': 1.2769067287445068} -11/07/2021 03:42:47 - INFO - __main__ - Step 45848: {'lr': 0.0003993102998308004, 'samples': 8802816, 'steps': 45847, 'loss/train': 1.755358099937439} -11/07/2021 03:42:48 - INFO - __main__ - Step 45849: {'lr': 0.0003993060434608383, 'samples': 8803008, 'steps': 45848, 'loss/train': 1.435434341430664} -11/07/2021 03:42:48 - INFO - __main__ - Step 45850: {'lr': 0.0003993017870236012, 'samples': 8803200, 'steps': 45849, 'loss/train': 1.9264001846313477} -11/07/2021 03:42:48 - INFO - __main__ - Step 45851: {'lr': 0.0003992975305190911, 'samples': 8803392, 'steps': 45850, 'loss/train': 1.6069012880325317} -11/07/2021 03:42:49 - INFO - __main__ - Step 45852: {'lr': 0.0003992932739473098, 'samples': 8803584, 'steps': 45851, 'loss/train': 1.504792332649231} -11/07/2021 03:42:49 - INFO - __main__ - Step 45853: {'lr': 0.0003992890173082593, 'samples': 8803776, 'steps': 45852, 'loss/train': 1.418312430381775} -11/07/2021 03:42:50 - INFO - __main__ - Step 45854: {'lr': 0.00039928476060194137, 'samples': 8803968, 'steps': 45853, 'loss/train': 1.2826389074325562} -11/07/2021 03:42:50 - INFO - __main__ - Step 45855: {'lr': 0.0003992805038283581, 'samples': 8804160, 'steps': 45854, 'loss/train': 1.3450167179107666} -11/07/2021 03:42:51 - INFO - __main__ - Step 45856: {'lr': 0.0003992762469875113, 'samples': 8804352, 'steps': 45855, 'loss/train': 0.4302082359790802} -11/07/2021 03:42:51 - INFO - __main__ - Step 45857: {'lr': 0.00039927199007940294, 'samples': 8804544, 'steps': 45856, 'loss/train': 1.6461188793182373} -11/07/2021 03:42:52 - INFO - __main__ - Step 45858: {'lr': 0.00039926773310403497, 'samples': 8804736, 'steps': 45857, 'loss/train': 2.005046844482422} -11/07/2021 03:42:53 - INFO - __main__ - Step 45859: {'lr': 0.0003992634760614092, 'samples': 8804928, 'steps': 45858, 'loss/train': 1.6766897439956665} -11/07/2021 03:42:53 - INFO - __main__ - Step 45860: {'lr': 0.00039925921895152765, 'samples': 8805120, 'steps': 45859, 'loss/train': 1.3352468013763428} -11/07/2021 03:42:53 - INFO - __main__ - Step 45861: {'lr': 0.00039925496177439226, 'samples': 8805312, 'steps': 45860, 'loss/train': 1.4517005681991577} -11/07/2021 03:42:54 - INFO - __main__ - Step 45862: {'lr': 0.0003992507045300048, 'samples': 8805504, 'steps': 45861, 'loss/train': 1.3755040168762207} -11/07/2021 03:42:54 - INFO - __main__ - Step 45863: {'lr': 0.00039924644721836734, 'samples': 8805696, 'steps': 45862, 'loss/train': 2.094545602798462} -11/07/2021 03:42:55 - INFO - __main__ - Step 45864: {'lr': 0.0003992421898394817, 'samples': 8805888, 'steps': 45863, 'loss/train': 1.4637939929962158} -11/07/2021 03:42:55 - INFO - __main__ - Step 45865: {'lr': 0.00039923793239334974, 'samples': 8806080, 'steps': 45864, 'loss/train': 1.7148493528366089} -11/07/2021 03:42:56 - INFO - __main__ - Step 45866: {'lr': 0.0003992336748799736, 'samples': 8806272, 'steps': 45865, 'loss/train': 1.241485595703125} -11/07/2021 03:42:56 - INFO - __main__ - Step 45867: {'lr': 0.00039922941729935503, 'samples': 8806464, 'steps': 45866, 'loss/train': 1.6325886249542236} -11/07/2021 03:42:56 - INFO - __main__ - Step 45868: {'lr': 0.000399225159651496, 'samples': 8806656, 'steps': 45867, 'loss/train': 1.3532395362854004} -11/07/2021 03:42:58 - INFO - __main__ - Step 45869: {'lr': 0.0003992209019363984, 'samples': 8806848, 'steps': 45868, 'loss/train': 1.514560580253601} -11/07/2021 03:42:58 - INFO - __main__ - Step 45870: {'lr': 0.0003992166441540641, 'samples': 8807040, 'steps': 45869, 'loss/train': 1.3086159229278564} -11/07/2021 03:42:58 - INFO - __main__ - Step 45871: {'lr': 0.00039921238630449515, 'samples': 8807232, 'steps': 45870, 'loss/train': 1.616173505783081} -11/07/2021 03:42:59 - INFO - __main__ - Step 45872: {'lr': 0.0003992081283876934, 'samples': 8807424, 'steps': 45871, 'loss/train': 1.00423264503479} -11/07/2021 03:42:59 - INFO - __main__ - Step 45873: {'lr': 0.00039920387040366076, 'samples': 8807616, 'steps': 45872, 'loss/train': 1.6508270502090454} -11/07/2021 03:43:00 - INFO - __main__ - Step 45874: {'lr': 0.00039919961235239913, 'samples': 8807808, 'steps': 45873, 'loss/train': 0.48083221912384033} -11/07/2021 03:43:01 - INFO - __main__ - Step 45875: {'lr': 0.0003991953542339105, 'samples': 8808000, 'steps': 45874, 'loss/train': 1.726269006729126} -11/07/2021 03:43:01 - INFO - __main__ - Step 45876: {'lr': 0.00039919109604819676, 'samples': 8808192, 'steps': 45875, 'loss/train': 0.335126668214798} -11/07/2021 03:43:01 - INFO - __main__ - Step 45877: {'lr': 0.00039918683779525976, 'samples': 8808384, 'steps': 45876, 'loss/train': 1.3062458038330078} -11/07/2021 03:43:02 - INFO - __main__ - Step 45878: {'lr': 0.0003991825794751015, 'samples': 8808576, 'steps': 45877, 'loss/train': 1.2087069749832153} -11/07/2021 03:43:02 - INFO - __main__ - Step 45879: {'lr': 0.0003991783210877239, 'samples': 8808768, 'steps': 45878, 'loss/train': 1.5349632501602173} -11/07/2021 03:43:03 - INFO - __main__ - Step 45880: {'lr': 0.00039917406263312885, 'samples': 8808960, 'steps': 45879, 'loss/train': 1.3000528812408447} -11/07/2021 03:43:03 - INFO - __main__ - Step 45881: {'lr': 0.0003991698041113182, 'samples': 8809152, 'steps': 45880, 'loss/train': 1.5514869689941406} -11/07/2021 03:43:04 - INFO - __main__ - Step 45882: {'lr': 0.000399165545522294, 'samples': 8809344, 'steps': 45881, 'loss/train': 1.4706882238388062} -11/07/2021 03:43:04 - INFO - __main__ - Step 45883: {'lr': 0.0003991612868660581, 'samples': 8809536, 'steps': 45882, 'loss/train': 1.2744070291519165} -11/07/2021 03:43:04 - INFO - __main__ - Step 45884: {'lr': 0.0003991570281426124, 'samples': 8809728, 'steps': 45883, 'loss/train': 2.4730279445648193} -11/07/2021 03:43:05 - INFO - __main__ - Step 45885: {'lr': 0.0003991527693519589, 'samples': 8809920, 'steps': 45884, 'loss/train': 1.9310436248779297} -11/07/2021 03:43:06 - INFO - __main__ - Step 45886: {'lr': 0.0003991485104940994, 'samples': 8810112, 'steps': 45885, 'loss/train': 1.477452039718628} -11/07/2021 03:43:06 - INFO - __main__ - Step 45887: {'lr': 0.0003991442515690359, 'samples': 8810304, 'steps': 45886, 'loss/train': 1.0899360179901123} -11/07/2021 03:43:06 - INFO - __main__ - Step 45888: {'lr': 0.00039913999257677025, 'samples': 8810496, 'steps': 45887, 'loss/train': 2.2320735454559326} -11/07/2021 03:43:07 - INFO - __main__ - Step 45889: {'lr': 0.0003991357335173045, 'samples': 8810688, 'steps': 45888, 'loss/train': 1.5972838401794434} -11/07/2021 03:43:08 - INFO - __main__ - Step 45890: {'lr': 0.0003991314743906405, 'samples': 8810880, 'steps': 45889, 'loss/train': 1.3330001831054688} -11/07/2021 03:43:08 - INFO - __main__ - Step 45891: {'lr': 0.0003991272151967801, 'samples': 8811072, 'steps': 45890, 'loss/train': 1.6927576065063477} -11/07/2021 03:43:08 - INFO - __main__ - Step 45892: {'lr': 0.0003991229559357253, 'samples': 8811264, 'steps': 45891, 'loss/train': 1.166650414466858} -11/07/2021 03:43:09 - INFO - __main__ - Step 45893: {'lr': 0.00039911869660747804, 'samples': 8811456, 'steps': 45892, 'loss/train': 1.2685664892196655} -11/07/2021 03:43:09 - INFO - __main__ - Step 45894: {'lr': 0.0003991144372120401, 'samples': 8811648, 'steps': 45893, 'loss/train': 1.2748992443084717} -11/07/2021 03:43:10 - INFO - __main__ - Step 45895: {'lr': 0.0003991101777494136, 'samples': 8811840, 'steps': 45894, 'loss/train': 1.6891132593154907} -11/07/2021 03:43:11 - INFO - __main__ - Step 45896: {'lr': 0.0003991059182196003, 'samples': 8812032, 'steps': 45895, 'loss/train': 1.1875171661376953} -11/07/2021 03:43:11 - INFO - __main__ - Step 45897: {'lr': 0.00039910165862260216, 'samples': 8812224, 'steps': 45896, 'loss/train': 1.4112639427185059} -11/07/2021 03:43:11 - INFO - __main__ - Step 45898: {'lr': 0.0003990973989584211, 'samples': 8812416, 'steps': 45897, 'loss/train': 1.9724289178848267} -11/07/2021 03:43:12 - INFO - __main__ - Step 45899: {'lr': 0.00039909313922705913, 'samples': 8812608, 'steps': 45898, 'loss/train': 1.9549881219863892} -11/07/2021 03:43:13 - INFO - __main__ - Step 45900: {'lr': 0.000399088879428518, 'samples': 8812800, 'steps': 45899, 'loss/train': 2.485609531402588} -11/07/2021 03:43:13 - INFO - __main__ - Step 45901: {'lr': 0.0003990846195627998, 'samples': 8812992, 'steps': 45900, 'loss/train': 1.1123993396759033} -11/07/2021 03:43:13 - INFO - __main__ - Step 45902: {'lr': 0.0003990803596299064, 'samples': 8813184, 'steps': 45901, 'loss/train': 1.7796376943588257} -11/07/2021 03:43:14 - INFO - __main__ - Step 45903: {'lr': 0.0003990760996298396, 'samples': 8813376, 'steps': 45902, 'loss/train': 1.5923742055892944} -11/07/2021 03:43:14 - INFO - __main__ - Step 45904: {'lr': 0.0003990718395626014, 'samples': 8813568, 'steps': 45903, 'loss/train': 1.4409897327423096} -11/07/2021 03:43:14 - INFO - __main__ - Step 45905: {'lr': 0.0003990675794281938, 'samples': 8813760, 'steps': 45904, 'loss/train': 1.350804090499878} -11/07/2021 03:43:15 - INFO - __main__ - Step 45906: {'lr': 0.00039906331922661857, 'samples': 8813952, 'steps': 45905, 'loss/train': 1.6716240644454956} -11/07/2021 03:43:16 - INFO - __main__ - Step 45907: {'lr': 0.00039905905895787775, 'samples': 8814144, 'steps': 45906, 'loss/train': 1.2691327333450317} -11/07/2021 03:43:16 - INFO - __main__ - Step 45908: {'lr': 0.00039905479862197327, 'samples': 8814336, 'steps': 45907, 'loss/train': 1.3989278078079224} -11/07/2021 03:43:16 - INFO - __main__ - Step 45909: {'lr': 0.00039905053821890697, 'samples': 8814528, 'steps': 45908, 'loss/train': 1.3683829307556152} -11/07/2021 03:43:17 - INFO - __main__ - Step 45910: {'lr': 0.0003990462777486808, 'samples': 8814720, 'steps': 45909, 'loss/train': 0.9254510402679443} -11/07/2021 03:43:18 - INFO - __main__ - Step 45911: {'lr': 0.00039904201721129663, 'samples': 8814912, 'steps': 45910, 'loss/train': 1.3869608640670776} -11/07/2021 03:43:18 - INFO - __main__ - Step 45912: {'lr': 0.00039903775660675645, 'samples': 8815104, 'steps': 45911, 'loss/train': 1.241188883781433} -11/07/2021 03:43:18 - INFO - __main__ - Step 45913: {'lr': 0.00039903349593506214, 'samples': 8815296, 'steps': 45912, 'loss/train': 1.3880771398544312} -11/07/2021 03:43:19 - INFO - __main__ - Step 45914: {'lr': 0.0003990292351962157, 'samples': 8815488, 'steps': 45913, 'loss/train': 1.409548044204712} -11/07/2021 03:43:19 - INFO - __main__ - Step 45915: {'lr': 0.00039902497439021895, 'samples': 8815680, 'steps': 45914, 'loss/train': 1.898686170578003} -11/07/2021 03:43:20 - INFO - __main__ - Step 45916: {'lr': 0.0003990207135170738, 'samples': 8815872, 'steps': 45915, 'loss/train': 1.645846962928772} -11/07/2021 03:43:21 - INFO - __main__ - Step 45917: {'lr': 0.00039901645257678234, 'samples': 8816064, 'steps': 45916, 'loss/train': 1.190329909324646} -11/07/2021 03:43:21 - INFO - __main__ - Step 45918: {'lr': 0.0003990121915693462, 'samples': 8816256, 'steps': 45917, 'loss/train': 1.5712729692459106} -11/07/2021 03:43:21 - INFO - __main__ - Step 45919: {'lr': 0.0003990079304947676, 'samples': 8816448, 'steps': 45918, 'loss/train': 1.7502552270889282} -11/07/2021 03:43:22 - INFO - __main__ - Step 45920: {'lr': 0.00039900366935304824, 'samples': 8816640, 'steps': 45919, 'loss/train': 1.6001427173614502} -11/07/2021 03:43:23 - INFO - __main__ - Step 45921: {'lr': 0.0003989994081441902, 'samples': 8816832, 'steps': 45920, 'loss/train': 1.2713396549224854} -11/07/2021 03:43:23 - INFO - __main__ - Step 45922: {'lr': 0.00039899514686819526, 'samples': 8817024, 'steps': 45921, 'loss/train': 1.0933136940002441} -11/07/2021 03:43:23 - INFO - __main__ - Step 45923: {'lr': 0.00039899088552506544, 'samples': 8817216, 'steps': 45922, 'loss/train': 1.9176268577575684} -11/07/2021 03:43:24 - INFO - __main__ - Step 45924: {'lr': 0.00039898662411480264, 'samples': 8817408, 'steps': 45923, 'loss/train': 1.3488006591796875} -11/07/2021 03:43:24 - INFO - __main__ - Step 45925: {'lr': 0.00039898236263740875, 'samples': 8817600, 'steps': 45924, 'loss/train': 1.6533674001693726} -11/07/2021 03:43:25 - INFO - __main__ - Step 45926: {'lr': 0.00039897810109288566, 'samples': 8817792, 'steps': 45925, 'loss/train': 0.8493460416793823} -11/07/2021 03:43:26 - INFO - __main__ - Step 45927: {'lr': 0.0003989738394812354, 'samples': 8817984, 'steps': 45926, 'loss/train': 1.268776535987854} -11/07/2021 03:43:26 - INFO - __main__ - Step 45928: {'lr': 0.0003989695778024598, 'samples': 8818176, 'steps': 45927, 'loss/train': 1.2660177946090698} -11/07/2021 03:43:26 - INFO - __main__ - Step 45929: {'lr': 0.00039896531605656085, 'samples': 8818368, 'steps': 45928, 'loss/train': 1.4705090522766113} -11/07/2021 03:43:27 - INFO - __main__ - Step 45930: {'lr': 0.00039896105424354035, 'samples': 8818560, 'steps': 45929, 'loss/train': 1.8615349531173706} -11/07/2021 03:43:28 - INFO - __main__ - Step 45931: {'lr': 0.0003989567923634003, 'samples': 8818752, 'steps': 45930, 'loss/train': 1.7084077596664429} -11/07/2021 03:43:28 - INFO - __main__ - Step 45932: {'lr': 0.00039895253041614265, 'samples': 8818944, 'steps': 45931, 'loss/train': 1.4123179912567139} -11/07/2021 03:43:28 - INFO - __main__ - Step 45933: {'lr': 0.00039894826840176933, 'samples': 8819136, 'steps': 45932, 'loss/train': 1.1559531688690186} -11/07/2021 03:43:29 - INFO - __main__ - Step 45934: {'lr': 0.00039894400632028217, 'samples': 8819328, 'steps': 45933, 'loss/train': 1.6073169708251953} -11/07/2021 03:43:29 - INFO - __main__ - Step 45935: {'lr': 0.00039893974417168316, 'samples': 8819520, 'steps': 45934, 'loss/train': 1.4241822957992554} -11/07/2021 03:43:30 - INFO - __main__ - Step 45936: {'lr': 0.00039893548195597415, 'samples': 8819712, 'steps': 45935, 'loss/train': 1.7503966093063354} -11/07/2021 03:43:31 - INFO - __main__ - Step 45937: {'lr': 0.0003989312196731572, 'samples': 8819904, 'steps': 45936, 'loss/train': 1.5599544048309326} -11/07/2021 03:43:31 - INFO - __main__ - Step 45938: {'lr': 0.0003989269573232341, 'samples': 8820096, 'steps': 45937, 'loss/train': 1.580369234085083} -11/07/2021 03:43:31 - INFO - __main__ - Step 45939: {'lr': 0.0003989226949062068, 'samples': 8820288, 'steps': 45938, 'loss/train': 1.3357412815093994} -11/07/2021 03:43:32 - INFO - __main__ - Step 45940: {'lr': 0.00039891843242207726, 'samples': 8820480, 'steps': 45939, 'loss/train': 1.5565556287765503} -11/07/2021 03:43:32 - INFO - __main__ - Step 45941: {'lr': 0.00039891416987084726, 'samples': 8820672, 'steps': 45940, 'loss/train': 1.424456238746643} -11/07/2021 03:43:33 - INFO - __main__ - Step 45942: {'lr': 0.00039890990725251896, 'samples': 8820864, 'steps': 45941, 'loss/train': 2.265129327774048} -11/07/2021 03:43:34 - INFO - __main__ - Step 45943: {'lr': 0.0003989056445670941, 'samples': 8821056, 'steps': 45942, 'loss/train': 1.5895918607711792} -11/07/2021 03:43:34 - INFO - __main__ - Step 45944: {'lr': 0.0003989013818145747, 'samples': 8821248, 'steps': 45943, 'loss/train': 1.706114649772644} -11/07/2021 03:43:34 - INFO - __main__ - Step 45945: {'lr': 0.0003988971189949626, 'samples': 8821440, 'steps': 45944, 'loss/train': 1.637607216835022} -11/07/2021 03:43:35 - INFO - __main__ - Step 45946: {'lr': 0.0003988928561082598, 'samples': 8821632, 'steps': 45945, 'loss/train': 1.3578442335128784} -11/07/2021 03:43:35 - INFO - __main__ - Step 45947: {'lr': 0.0003988885931544681, 'samples': 8821824, 'steps': 45946, 'loss/train': 1.0622464418411255} -11/07/2021 03:43:37 - INFO - __main__ - Step 45948: {'lr': 0.0003988843301335895, 'samples': 8822016, 'steps': 45947, 'loss/train': 1.4858222007751465} -11/07/2021 03:43:37 - INFO - __main__ - Step 45949: {'lr': 0.00039888006704562594, 'samples': 8822208, 'steps': 45948, 'loss/train': 1.3465840816497803} -11/07/2021 03:43:37 - INFO - __main__ - Step 45950: {'lr': 0.0003988758038905794, 'samples': 8822400, 'steps': 45949, 'loss/train': 1.2762097120285034} -11/07/2021 03:43:38 - INFO - __main__ - Step 45951: {'lr': 0.00039887154066845166, 'samples': 8822592, 'steps': 45950, 'loss/train': 1.5280088186264038} -11/07/2021 03:43:38 - INFO - __main__ - Step 45952: {'lr': 0.00039886727737924464, 'samples': 8822784, 'steps': 45951, 'loss/train': 0.44151145219802856} -11/07/2021 03:43:39 - INFO - __main__ - Step 45953: {'lr': 0.00039886301402296037, 'samples': 8822976, 'steps': 45952, 'loss/train': 0.2146332859992981} -11/07/2021 03:43:39 - INFO - __main__ - Step 45954: {'lr': 0.00039885875059960074, 'samples': 8823168, 'steps': 45953, 'loss/train': 1.481507420539856} -11/07/2021 03:43:40 - INFO - __main__ - Step 45955: {'lr': 0.0003988544871091676, 'samples': 8823360, 'steps': 45954, 'loss/train': 1.226210355758667} -11/07/2021 03:43:40 - INFO - __main__ - Step 45956: {'lr': 0.000398850223551663, 'samples': 8823552, 'steps': 45955, 'loss/train': 1.7058351039886475} -11/07/2021 03:43:40 - INFO - __main__ - Step 45957: {'lr': 0.00039884595992708877, 'samples': 8823744, 'steps': 45956, 'loss/train': 1.4703701734542847} -11/07/2021 03:43:41 - INFO - __main__ - Step 45958: {'lr': 0.00039884169623544683, 'samples': 8823936, 'steps': 45957, 'loss/train': 1.5774255990982056} -11/07/2021 03:43:42 - INFO - __main__ - Step 45959: {'lr': 0.0003988374324767391, 'samples': 8824128, 'steps': 45958, 'loss/train': 1.3722915649414062} -11/07/2021 03:43:42 - INFO - __main__ - Step 45960: {'lr': 0.0003988331686509675, 'samples': 8824320, 'steps': 45959, 'loss/train': 1.1074728965759277} -11/07/2021 03:43:42 - INFO - __main__ - Step 45961: {'lr': 0.000398828904758134, 'samples': 8824512, 'steps': 45960, 'loss/train': 1.7804874181747437} -11/07/2021 03:43:43 - INFO - __main__ - Step 45962: {'lr': 0.0003988246407982405, 'samples': 8824704, 'steps': 45961, 'loss/train': 1.5980979204177856} -11/07/2021 03:43:43 - INFO - __main__ - Step 45963: {'lr': 0.00039882037677128895, 'samples': 8824896, 'steps': 45962, 'loss/train': 2.0666005611419678} -11/07/2021 03:43:44 - INFO - __main__ - Step 45964: {'lr': 0.0003988161126772812, 'samples': 8825088, 'steps': 45963, 'loss/train': 0.9492558240890503} -11/07/2021 03:43:44 - INFO - __main__ - Step 45965: {'lr': 0.0003988118485162192, 'samples': 8825280, 'steps': 45964, 'loss/train': 1.4683305025100708} -11/07/2021 03:43:45 - INFO - __main__ - Step 45966: {'lr': 0.00039880758428810487, 'samples': 8825472, 'steps': 45965, 'loss/train': 1.331489086151123} -11/07/2021 03:43:45 - INFO - __main__ - Step 45967: {'lr': 0.00039880331999294017, 'samples': 8825664, 'steps': 45966, 'loss/train': 1.5512917041778564} -11/07/2021 03:43:46 - INFO - __main__ - Step 45968: {'lr': 0.00039879905563072694, 'samples': 8825856, 'steps': 45967, 'loss/train': 0.9686439037322998} -11/07/2021 03:43:47 - INFO - __main__ - Step 45969: {'lr': 0.00039879479120146725, 'samples': 8826048, 'steps': 45968, 'loss/train': 1.2109235525131226} -11/07/2021 03:43:47 - INFO - __main__ - Step 45970: {'lr': 0.0003987905267051628, 'samples': 8826240, 'steps': 45969, 'loss/train': 1.4375460147857666} -11/07/2021 03:43:47 - INFO - __main__ - Step 45971: {'lr': 0.0003987862621418157, 'samples': 8826432, 'steps': 45970, 'loss/train': 1.5557785034179688} -11/07/2021 03:43:48 - INFO - __main__ - Step 45972: {'lr': 0.0003987819975114278, 'samples': 8826624, 'steps': 45971, 'loss/train': 1.1495202779769897} -11/07/2021 03:43:48 - INFO - __main__ - Step 45973: {'lr': 0.000398777732814001, 'samples': 8826816, 'steps': 45972, 'loss/train': 1.341982126235962} -11/07/2021 03:43:49 - INFO - __main__ - Step 45974: {'lr': 0.0003987734680495373, 'samples': 8827008, 'steps': 45973, 'loss/train': 1.3633899688720703} -11/07/2021 03:43:49 - INFO - __main__ - Step 45975: {'lr': 0.0003987692032180385, 'samples': 8827200, 'steps': 45974, 'loss/train': 0.8215121030807495} -11/07/2021 03:43:50 - INFO - __main__ - Step 45976: {'lr': 0.00039876493831950664, 'samples': 8827392, 'steps': 45975, 'loss/train': 1.5936977863311768} -11/07/2021 03:43:50 - INFO - __main__ - Step 45977: {'lr': 0.00039876067335394363, 'samples': 8827584, 'steps': 45976, 'loss/train': 1.0867680311203003} -11/07/2021 03:43:50 - INFO - __main__ - Step 45978: {'lr': 0.0003987564083213513, 'samples': 8827776, 'steps': 45977, 'loss/train': 1.5268322229385376} -11/07/2021 03:43:51 - INFO - __main__ - Step 45979: {'lr': 0.00039875214322173167, 'samples': 8827968, 'steps': 45978, 'loss/train': 1.3771189451217651} -11/07/2021 03:43:52 - INFO - __main__ - Step 45980: {'lr': 0.00039874787805508656, 'samples': 8828160, 'steps': 45979, 'loss/train': 1.4589320421218872} -11/07/2021 03:43:52 - INFO - __main__ - Step 45981: {'lr': 0.000398743612821418, 'samples': 8828352, 'steps': 45980, 'loss/train': 1.7522274255752563} -11/07/2021 03:43:52 - INFO - __main__ - Step 45982: {'lr': 0.0003987393475207278, 'samples': 8828544, 'steps': 45981, 'loss/train': 1.7427177429199219} -11/07/2021 03:43:53 - INFO - __main__ - Step 45983: {'lr': 0.000398735082153018, 'samples': 8828736, 'steps': 45982, 'loss/train': 1.525829792022705} -11/07/2021 03:43:54 - INFO - __main__ - Step 45984: {'lr': 0.00039873081671829046, 'samples': 8828928, 'steps': 45983, 'loss/train': 2.171912670135498} -11/07/2021 03:43:54 - INFO - __main__ - Step 45985: {'lr': 0.0003987265512165471, 'samples': 8829120, 'steps': 45984, 'loss/train': 1.4670724868774414} -11/07/2021 03:43:55 - INFO - __main__ - Step 45986: {'lr': 0.0003987222856477899, 'samples': 8829312, 'steps': 45985, 'loss/train': 1.321970820426941} -11/07/2021 03:43:55 - INFO - __main__ - Step 45987: {'lr': 0.0003987180200120207, 'samples': 8829504, 'steps': 45986, 'loss/train': 1.2274272441864014} -11/07/2021 03:43:56 - INFO - __main__ - Step 45988: {'lr': 0.0003987137543092414, 'samples': 8829696, 'steps': 45987, 'loss/train': 1.7335909605026245} -11/07/2021 03:43:56 - INFO - __main__ - Step 45989: {'lr': 0.0003987094885394541, 'samples': 8829888, 'steps': 45988, 'loss/train': 1.610555648803711} -11/07/2021 03:43:57 - INFO - __main__ - Step 45990: {'lr': 0.0003987052227026605, 'samples': 8830080, 'steps': 45989, 'loss/train': 1.0616350173950195} -11/07/2021 03:43:57 - INFO - __main__ - Step 45991: {'lr': 0.0003987009567988626, 'samples': 8830272, 'steps': 45990, 'loss/train': 1.3533833026885986} -11/07/2021 03:43:58 - INFO - __main__ - Step 45992: {'lr': 0.00039869669082806243, 'samples': 8830464, 'steps': 45991, 'loss/train': 0.27393484115600586} -11/07/2021 03:43:58 - INFO - __main__ - Step 45993: {'lr': 0.0003986924247902618, 'samples': 8830656, 'steps': 45992, 'loss/train': 1.3827497959136963} -11/07/2021 03:43:59 - INFO - __main__ - Step 45994: {'lr': 0.00039868815868546257, 'samples': 8830848, 'steps': 45993, 'loss/train': 2.0358173847198486} -11/07/2021 03:43:59 - INFO - __main__ - Step 45995: {'lr': 0.00039868389251366686, 'samples': 8831040, 'steps': 45994, 'loss/train': 2.121223211288452} -11/07/2021 03:44:00 - INFO - __main__ - Step 45996: {'lr': 0.00039867962627487645, 'samples': 8831232, 'steps': 45995, 'loss/train': 1.6265567541122437} -11/07/2021 03:44:00 - INFO - __main__ - Step 45997: {'lr': 0.0003986753599690933, 'samples': 8831424, 'steps': 45996, 'loss/train': 1.1627484560012817} -11/07/2021 03:44:00 - INFO - __main__ - Step 45998: {'lr': 0.00039867109359631935, 'samples': 8831616, 'steps': 45997, 'loss/train': 1.7465667724609375} -11/07/2021 03:44:01 - INFO - __main__ - Step 45999: {'lr': 0.00039866682715655646, 'samples': 8831808, 'steps': 45998, 'loss/train': 1.0794578790664673} -11/07/2021 03:44:02 - INFO - __main__ - Step 46000: {'lr': 0.00039866256064980657, 'samples': 8832000, 'steps': 45999, 'loss/train': 1.949453592300415} -11/07/2021 03:44:02 - INFO - __main__ - Step 46001: {'lr': 0.0003986582940760717, 'samples': 8832192, 'steps': 46000, 'loss/train': 1.27757728099823} -11/07/2021 03:44:02 - INFO - __main__ - Step 46002: {'lr': 0.0003986540274353536, 'samples': 8832384, 'steps': 46001, 'loss/train': 1.7763686180114746} -11/07/2021 03:44:03 - INFO - __main__ - Step 46003: {'lr': 0.00039864976072765437, 'samples': 8832576, 'steps': 46002, 'loss/train': 1.5143035650253296} -11/07/2021 03:44:03 - INFO - __main__ - Step 46004: {'lr': 0.0003986454939529758, 'samples': 8832768, 'steps': 46003, 'loss/train': 1.384948968887329} -11/07/2021 03:44:04 - INFO - __main__ - Step 46005: {'lr': 0.0003986412271113199, 'samples': 8832960, 'steps': 46004, 'loss/train': 1.4078046083450317} -11/07/2021 03:44:04 - INFO - __main__ - Step 46006: {'lr': 0.0003986369602026886, 'samples': 8833152, 'steps': 46005, 'loss/train': 1.493535041809082} -11/07/2021 03:44:05 - INFO - __main__ - Step 46007: {'lr': 0.0003986326932270836, 'samples': 8833344, 'steps': 46006, 'loss/train': 1.1166813373565674} -11/07/2021 03:44:05 - INFO - __main__ - Step 46008: {'lr': 0.00039862842618450717, 'samples': 8833536, 'steps': 46007, 'loss/train': 2.2529072761535645} -11/07/2021 03:44:05 - INFO - __main__ - Step 46009: {'lr': 0.00039862415907496103, 'samples': 8833728, 'steps': 46008, 'loss/train': 1.8821719884872437} -11/07/2021 03:44:07 - INFO - __main__ - Step 46010: {'lr': 0.00039861989189844715, 'samples': 8833920, 'steps': 46009, 'loss/train': 1.2184703350067139} -11/07/2021 03:44:07 - INFO - __main__ - Step 46011: {'lr': 0.00039861562465496735, 'samples': 8834112, 'steps': 46010, 'loss/train': 1.2818342447280884} -11/07/2021 03:44:07 - INFO - __main__ - Step 46012: {'lr': 0.00039861135734452376, 'samples': 8834304, 'steps': 46011, 'loss/train': 1.7484780550003052} -11/07/2021 03:44:08 - INFO - __main__ - Step 46013: {'lr': 0.00039860708996711816, 'samples': 8834496, 'steps': 46012, 'loss/train': 1.7105348110198975} -11/07/2021 03:44:08 - INFO - __main__ - Step 46014: {'lr': 0.00039860282252275245, 'samples': 8834688, 'steps': 46013, 'loss/train': 0.4886361360549927} -11/07/2021 03:44:09 - INFO - __main__ - Step 46015: {'lr': 0.0003985985550114286, 'samples': 8834880, 'steps': 46014, 'loss/train': 1.743740439414978} -11/07/2021 03:44:10 - INFO - __main__ - Step 46016: {'lr': 0.00039859428743314857, 'samples': 8835072, 'steps': 46015, 'loss/train': 1.7782355546951294} -11/07/2021 03:44:10 - INFO - __main__ - Step 46017: {'lr': 0.0003985900197879142, 'samples': 8835264, 'steps': 46016, 'loss/train': 2.0538876056671143} -11/07/2021 03:44:10 - INFO - __main__ - Step 46018: {'lr': 0.00039858575207572756, 'samples': 8835456, 'steps': 46017, 'loss/train': 1.385968804359436} -11/07/2021 03:44:11 - INFO - __main__ - Step 46019: {'lr': 0.00039858148429659036, 'samples': 8835648, 'steps': 46018, 'loss/train': 1.4984182119369507} -11/07/2021 03:44:11 - INFO - __main__ - Step 46020: {'lr': 0.0003985772164505047, 'samples': 8835840, 'steps': 46019, 'loss/train': 0.7730764746665955} -11/07/2021 03:44:11 - INFO - __main__ - Step 46021: {'lr': 0.0003985729485374724, 'samples': 8836032, 'steps': 46020, 'loss/train': 1.6437476873397827} -11/07/2021 03:44:13 - INFO - __main__ - Step 46022: {'lr': 0.0003985686805574954, 'samples': 8836224, 'steps': 46021, 'loss/train': 1.77516770362854} -11/07/2021 03:44:13 - INFO - __main__ - Step 46023: {'lr': 0.00039856441251057573, 'samples': 8836416, 'steps': 46022, 'loss/train': 1.629174828529358} -11/07/2021 03:44:13 - INFO - __main__ - Step 46024: {'lr': 0.0003985601443967152, 'samples': 8836608, 'steps': 46023, 'loss/train': 1.600903868675232} -11/07/2021 03:44:14 - INFO - __main__ - Step 46025: {'lr': 0.0003985558762159157, 'samples': 8836800, 'steps': 46024, 'loss/train': 1.515991449356079} -11/07/2021 03:44:14 - INFO - __main__ - Step 46026: {'lr': 0.0003985516079681793, 'samples': 8836992, 'steps': 46025, 'loss/train': 1.7451043128967285} -11/07/2021 03:44:15 - INFO - __main__ - Step 46027: {'lr': 0.0003985473396535078, 'samples': 8837184, 'steps': 46026, 'loss/train': 1.4028428792953491} -11/07/2021 03:44:15 - INFO - __main__ - Step 46028: {'lr': 0.00039854307127190316, 'samples': 8837376, 'steps': 46027, 'loss/train': 1.4161070585250854} -11/07/2021 03:44:16 - INFO - __main__ - Step 46029: {'lr': 0.0003985388028233673, 'samples': 8837568, 'steps': 46028, 'loss/train': 1.7701877355575562} -11/07/2021 03:44:16 - INFO - __main__ - Step 46030: {'lr': 0.0003985345343079022, 'samples': 8837760, 'steps': 46029, 'loss/train': 1.0398225784301758} -11/07/2021 03:44:16 - INFO - __main__ - Step 46031: {'lr': 0.00039853026572550965, 'samples': 8837952, 'steps': 46030, 'loss/train': 2.184058666229248} -11/07/2021 03:44:17 - INFO - __main__ - Step 46032: {'lr': 0.0003985259970761917, 'samples': 8838144, 'steps': 46031, 'loss/train': 1.8846038579940796} -11/07/2021 03:44:18 - INFO - __main__ - Step 46033: {'lr': 0.0003985217283599502, 'samples': 8838336, 'steps': 46032, 'loss/train': 1.2859147787094116} -11/07/2021 03:44:18 - INFO - __main__ - Step 46034: {'lr': 0.0003985174595767871, 'samples': 8838528, 'steps': 46033, 'loss/train': 1.7278329133987427} -11/07/2021 03:44:18 - INFO - __main__ - Step 46035: {'lr': 0.0003985131907267043, 'samples': 8838720, 'steps': 46034, 'loss/train': 1.7227964401245117} -11/07/2021 03:44:19 - INFO - __main__ - Step 46036: {'lr': 0.00039850892180970387, 'samples': 8838912, 'steps': 46035, 'loss/train': 2.0506961345672607} -11/07/2021 03:44:20 - INFO - __main__ - Step 46037: {'lr': 0.0003985046528257875, 'samples': 8839104, 'steps': 46036, 'loss/train': 0.9985599517822266} -11/07/2021 03:44:20 - INFO - __main__ - Step 46038: {'lr': 0.00039850038377495727, 'samples': 8839296, 'steps': 46037, 'loss/train': 1.7415443658828735} -11/07/2021 03:44:21 - INFO - __main__ - Step 46039: {'lr': 0.000398496114657215, 'samples': 8839488, 'steps': 46038, 'loss/train': 1.8762344121932983} -11/07/2021 03:44:21 - INFO - __main__ - Step 46040: {'lr': 0.0003984918454725628, 'samples': 8839680, 'steps': 46039, 'loss/train': 1.3955578804016113} -11/07/2021 03:44:21 - INFO - __main__ - Step 46041: {'lr': 0.0003984875762210023, 'samples': 8839872, 'steps': 46040, 'loss/train': 1.3260287046432495} -11/07/2021 03:44:22 - INFO - __main__ - Step 46042: {'lr': 0.0003984833069025357, 'samples': 8840064, 'steps': 46041, 'loss/train': 1.4703521728515625} -11/07/2021 03:44:23 - INFO - __main__ - Step 46043: {'lr': 0.00039847903751716486, 'samples': 8840256, 'steps': 46042, 'loss/train': 1.4357061386108398} -11/07/2021 03:44:23 - INFO - __main__ - Step 46044: {'lr': 0.00039847476806489153, 'samples': 8840448, 'steps': 46043, 'loss/train': 0.6424424052238464} -11/07/2021 03:44:23 - INFO - __main__ - Step 46045: {'lr': 0.00039847049854571784, 'samples': 8840640, 'steps': 46044, 'loss/train': 1.3334059715270996} -11/07/2021 03:44:24 - INFO - __main__ - Step 46046: {'lr': 0.00039846622895964556, 'samples': 8840832, 'steps': 46045, 'loss/train': 1.4812532663345337} -11/07/2021 03:44:25 - INFO - __main__ - Step 46047: {'lr': 0.0003984619593066767, 'samples': 8841024, 'steps': 46046, 'loss/train': 1.4225276708602905} -11/07/2021 03:44:25 - INFO - __main__ - Step 46048: {'lr': 0.0003984576895868132, 'samples': 8841216, 'steps': 46047, 'loss/train': 1.6545523405075073} -11/07/2021 03:44:25 - INFO - __main__ - Step 46049: {'lr': 0.000398453419800057, 'samples': 8841408, 'steps': 46048, 'loss/train': 1.4333152770996094} -11/07/2021 03:44:26 - INFO - __main__ - Step 46050: {'lr': 0.00039844914994640994, 'samples': 8841600, 'steps': 46049, 'loss/train': 1.543885350227356} -11/07/2021 03:44:26 - INFO - __main__ - Step 46051: {'lr': 0.00039844488002587397, 'samples': 8841792, 'steps': 46050, 'loss/train': 1.1068906784057617} -11/07/2021 03:44:27 - INFO - __main__ - Step 46052: {'lr': 0.00039844061003845114, 'samples': 8841984, 'steps': 46051, 'loss/train': 1.8480699062347412} -11/07/2021 03:44:28 - INFO - __main__ - Step 46053: {'lr': 0.00039843633998414306, 'samples': 8842176, 'steps': 46052, 'loss/train': 1.6766722202301025} -11/07/2021 03:44:28 - INFO - __main__ - Step 46054: {'lr': 0.000398432069862952, 'samples': 8842368, 'steps': 46053, 'loss/train': 1.7152425050735474} -11/07/2021 03:44:29 - INFO - __main__ - Step 46055: {'lr': 0.00039842779967487967, 'samples': 8842560, 'steps': 46054, 'loss/train': 0.5176750421524048} -11/07/2021 03:44:29 - INFO - __main__ - Step 46056: {'lr': 0.0003984235294199281, 'samples': 8842752, 'steps': 46055, 'loss/train': 0.8775113821029663} -11/07/2021 03:44:29 - INFO - __main__ - Step 46057: {'lr': 0.0003984192590980992, 'samples': 8842944, 'steps': 46056, 'loss/train': 1.3182798624038696} -11/07/2021 03:44:30 - INFO - __main__ - Step 46058: {'lr': 0.00039841498870939483, 'samples': 8843136, 'steps': 46057, 'loss/train': 0.20144513249397278} -11/07/2021 03:44:31 - INFO - __main__ - Step 46059: {'lr': 0.000398410718253817, 'samples': 8843328, 'steps': 46058, 'loss/train': 1.1564953327178955} -11/07/2021 03:44:31 - INFO - __main__ - Step 46060: {'lr': 0.00039840644773136757, 'samples': 8843520, 'steps': 46059, 'loss/train': 1.2651718854904175} -11/07/2021 03:44:31 - INFO - __main__ - Step 46061: {'lr': 0.0003984021771420484, 'samples': 8843712, 'steps': 46060, 'loss/train': 1.7208924293518066} -11/07/2021 03:44:32 - INFO - __main__ - Step 46062: {'lr': 0.0003983979064858616, 'samples': 8843904, 'steps': 46061, 'loss/train': 1.408997654914856} -11/07/2021 03:44:33 - INFO - __main__ - Step 46063: {'lr': 0.000398393635762809, 'samples': 8844096, 'steps': 46062, 'loss/train': 1.4301825761795044} -11/07/2021 03:44:33 - INFO - __main__ - Step 46064: {'lr': 0.0003983893649728925, 'samples': 8844288, 'steps': 46063, 'loss/train': 1.620592474937439} -11/07/2021 03:44:34 - INFO - __main__ - Step 46065: {'lr': 0.000398385094116114, 'samples': 8844480, 'steps': 46064, 'loss/train': 1.2645494937896729} -11/07/2021 03:44:34 - INFO - __main__ - Step 46066: {'lr': 0.0003983808231924755, 'samples': 8844672, 'steps': 46065, 'loss/train': 1.045702338218689} -11/07/2021 03:44:34 - INFO - __main__ - Step 46067: {'lr': 0.0003983765522019789, 'samples': 8844864, 'steps': 46066, 'loss/train': 1.748497486114502} -11/07/2021 03:44:35 - INFO - __main__ - Step 46068: {'lr': 0.0003983722811446261, 'samples': 8845056, 'steps': 46067, 'loss/train': 1.3432093858718872} -11/07/2021 03:44:36 - INFO - __main__ - Step 46069: {'lr': 0.00039836801002041903, 'samples': 8845248, 'steps': 46068, 'loss/train': 1.3738770484924316} -11/07/2021 03:44:36 - INFO - __main__ - Step 46070: {'lr': 0.00039836373882935967, 'samples': 8845440, 'steps': 46069, 'loss/train': 1.4351294040679932} -11/07/2021 03:44:36 - INFO - __main__ - Step 46071: {'lr': 0.0003983594675714498, 'samples': 8845632, 'steps': 46070, 'loss/train': 1.1481633186340332} -11/07/2021 03:44:37 - INFO - __main__ - Step 46072: {'lr': 0.0003983551962466915, 'samples': 8845824, 'steps': 46071, 'loss/train': 1.5206433534622192} -11/07/2021 03:44:37 - INFO - __main__ - Step 46073: {'lr': 0.0003983509248550867, 'samples': 8846016, 'steps': 46072, 'loss/train': 1.1233588457107544} -11/07/2021 03:44:38 - INFO - __main__ - Step 46074: {'lr': 0.00039834665339663725, 'samples': 8846208, 'steps': 46073, 'loss/train': 1.2450916767120361} -11/07/2021 03:44:38 - INFO - __main__ - Step 46075: {'lr': 0.00039834238187134497, 'samples': 8846400, 'steps': 46074, 'loss/train': 1.1505430936813354} -11/07/2021 03:44:39 - INFO - __main__ - Step 46076: {'lr': 0.00039833811027921196, 'samples': 8846592, 'steps': 46075, 'loss/train': 1.3425941467285156} -11/07/2021 03:44:39 - INFO - __main__ - Step 46077: {'lr': 0.00039833383862024016, 'samples': 8846784, 'steps': 46076, 'loss/train': 1.7394100427627563} -11/07/2021 03:44:39 - INFO - __main__ - Step 46078: {'lr': 0.00039832956689443135, 'samples': 8846976, 'steps': 46077, 'loss/train': 1.5554648637771606} -11/07/2021 03:44:40 - INFO - __main__ - Step 46079: {'lr': 0.00039832529510178756, 'samples': 8847168, 'steps': 46078, 'loss/train': 1.199279546737671} -11/07/2021 03:44:41 - INFO - __main__ - Step 46080: {'lr': 0.0003983210232423107, 'samples': 8847360, 'steps': 46079, 'loss/train': 1.7897357940673828} -11/07/2021 03:44:41 - INFO - __main__ - Step 46081: {'lr': 0.00039831675131600253, 'samples': 8847552, 'steps': 46080, 'loss/train': 1.701612949371338} -11/07/2021 03:44:41 - INFO - __main__ - Step 46082: {'lr': 0.0003983124793228653, 'samples': 8847744, 'steps': 46081, 'loss/train': 1.5686990022659302} -11/07/2021 03:44:42 - INFO - __main__ - Step 46083: {'lr': 0.00039830820726290063, 'samples': 8847936, 'steps': 46082, 'loss/train': 1.6925108432769775} -11/07/2021 03:44:43 - INFO - __main__ - Step 46084: {'lr': 0.0003983039351361106, 'samples': 8848128, 'steps': 46083, 'loss/train': 1.5960572957992554} -11/07/2021 03:44:43 - INFO - __main__ - Step 46085: {'lr': 0.0003982996629424972, 'samples': 8848320, 'steps': 46084, 'loss/train': 1.156279444694519} -11/07/2021 03:44:43 - INFO - __main__ - Step 46086: {'lr': 0.0003982953906820622, 'samples': 8848512, 'steps': 46085, 'loss/train': 1.071182131767273} -11/07/2021 03:44:44 - INFO - __main__ - Step 46087: {'lr': 0.0003982911183548075, 'samples': 8848704, 'steps': 46086, 'loss/train': 1.5461595058441162} -11/07/2021 03:44:44 - INFO - __main__ - Step 46088: {'lr': 0.0003982868459607352, 'samples': 8848896, 'steps': 46087, 'loss/train': 1.517485499382019} -11/07/2021 03:44:45 - INFO - __main__ - Step 46089: {'lr': 0.0003982825734998471, 'samples': 8849088, 'steps': 46088, 'loss/train': 1.4021140336990356} -11/07/2021 03:44:46 - INFO - __main__ - Step 46090: {'lr': 0.0003982783009721452, 'samples': 8849280, 'steps': 46089, 'loss/train': 1.940238118171692} -11/07/2021 03:44:46 - INFO - __main__ - Step 46091: {'lr': 0.00039827402837763136, 'samples': 8849472, 'steps': 46090, 'loss/train': 1.4375869035720825} -11/07/2021 03:44:46 - INFO - __main__ - Step 46092: {'lr': 0.00039826975571630754, 'samples': 8849664, 'steps': 46091, 'loss/train': 0.8164916634559631} -11/07/2021 03:44:47 - INFO - __main__ - Step 46093: {'lr': 0.0003982654829881757, 'samples': 8849856, 'steps': 46092, 'loss/train': 0.9763711094856262} -11/07/2021 03:44:48 - INFO - __main__ - Step 46094: {'lr': 0.0003982612101932376, 'samples': 8850048, 'steps': 46093, 'loss/train': 1.353725790977478} -11/07/2021 03:44:48 - INFO - __main__ - Step 46095: {'lr': 0.0003982569373314954, 'samples': 8850240, 'steps': 46094, 'loss/train': 1.9268068075180054} -11/07/2021 03:44:48 - INFO - __main__ - Step 46096: {'lr': 0.0003982526644029508, 'samples': 8850432, 'steps': 46095, 'loss/train': 1.31769859790802} -11/07/2021 03:44:49 - INFO - __main__ - Step 46097: {'lr': 0.000398248391407606, 'samples': 8850624, 'steps': 46096, 'loss/train': 1.2756290435791016} -11/07/2021 03:44:49 - INFO - __main__ - Step 46098: {'lr': 0.0003982441183454627, 'samples': 8850816, 'steps': 46097, 'loss/train': 1.1033422946929932} -11/07/2021 03:44:49 - INFO - __main__ - Step 46099: {'lr': 0.0003982398452165228, 'samples': 8851008, 'steps': 46098, 'loss/train': 1.5437897443771362} -11/07/2021 03:44:50 - INFO - __main__ - Step 46100: {'lr': 0.0003982355720207884, 'samples': 8851200, 'steps': 46099, 'loss/train': 1.0908828973770142} -11/07/2021 03:44:51 - INFO - __main__ - Step 46101: {'lr': 0.00039823129875826127, 'samples': 8851392, 'steps': 46100, 'loss/train': 1.4641016721725464} -11/07/2021 03:44:51 - INFO - __main__ - Step 46102: {'lr': 0.0003982270254289435, 'samples': 8851584, 'steps': 46101, 'loss/train': 1.1825180053710938} -11/07/2021 03:44:51 - INFO - __main__ - Step 46103: {'lr': 0.0003982227520328368, 'samples': 8851776, 'steps': 46102, 'loss/train': 1.260934829711914} -11/07/2021 03:44:52 - INFO - __main__ - Step 46104: {'lr': 0.0003982184785699433, 'samples': 8851968, 'steps': 46103, 'loss/train': 1.7066675424575806} -11/07/2021 03:44:53 - INFO - __main__ - Step 46105: {'lr': 0.00039821420504026486, 'samples': 8852160, 'steps': 46104, 'loss/train': 1.4572490453720093} -11/07/2021 03:44:53 - INFO - __main__ - Step 46106: {'lr': 0.00039820993144380333, 'samples': 8852352, 'steps': 46105, 'loss/train': 1.6005284786224365} -11/07/2021 03:44:54 - INFO - __main__ - Step 46107: {'lr': 0.0003982056577805607, 'samples': 8852544, 'steps': 46106, 'loss/train': 1.1769062280654907} -11/07/2021 03:44:54 - INFO - __main__ - Step 46108: {'lr': 0.00039820138405053887, 'samples': 8852736, 'steps': 46107, 'loss/train': 1.3909072875976562} -11/07/2021 03:44:54 - INFO - __main__ - Step 46109: {'lr': 0.0003981971102537398, 'samples': 8852928, 'steps': 46108, 'loss/train': 1.658613920211792} -11/07/2021 03:44:55 - INFO - __main__ - Step 46110: {'lr': 0.00039819283639016547, 'samples': 8853120, 'steps': 46109, 'loss/train': 1.5829380750656128} -11/07/2021 03:44:56 - INFO - __main__ - Step 46111: {'lr': 0.00039818856245981766, 'samples': 8853312, 'steps': 46110, 'loss/train': 2.1844825744628906} -11/07/2021 03:44:56 - INFO - __main__ - Step 46112: {'lr': 0.0003981842884626984, 'samples': 8853504, 'steps': 46111, 'loss/train': 0.8375652432441711} -11/07/2021 03:44:56 - INFO - __main__ - Step 46113: {'lr': 0.0003981800143988095, 'samples': 8853696, 'steps': 46112, 'loss/train': 1.705703854560852} -11/07/2021 03:44:57 - INFO - __main__ - Step 46114: {'lr': 0.00039817574026815305, 'samples': 8853888, 'steps': 46113, 'loss/train': 1.6477971076965332} -11/07/2021 03:44:58 - INFO - __main__ - Step 46115: {'lr': 0.0003981714660707309, 'samples': 8854080, 'steps': 46114, 'loss/train': 1.4718902111053467} -11/07/2021 03:44:58 - INFO - __main__ - Step 46116: {'lr': 0.00039816719180654493, 'samples': 8854272, 'steps': 46115, 'loss/train': 0.8173640370368958} -11/07/2021 03:44:58 - INFO - __main__ - Step 46117: {'lr': 0.0003981629174755972, 'samples': 8854464, 'steps': 46116, 'loss/train': 1.6102850437164307} -11/07/2021 03:44:59 - INFO - __main__ - Step 46118: {'lr': 0.0003981586430778895, 'samples': 8854656, 'steps': 46117, 'loss/train': 1.548747181892395} -11/07/2021 03:44:59 - INFO - __main__ - Step 46119: {'lr': 0.0003981543686134238, 'samples': 8854848, 'steps': 46118, 'loss/train': 1.253394603729248} -11/07/2021 03:45:00 - INFO - __main__ - Step 46120: {'lr': 0.000398150094082202, 'samples': 8855040, 'steps': 46119, 'loss/train': 1.7422831058502197} -11/07/2021 03:45:00 - INFO - __main__ - Step 46121: {'lr': 0.000398145819484226, 'samples': 8855232, 'steps': 46120, 'loss/train': 1.6735376119613647} -11/07/2021 03:45:01 - INFO - __main__ - Step 46122: {'lr': 0.00039814154481949786, 'samples': 8855424, 'steps': 46121, 'loss/train': 1.60072660446167} -11/07/2021 03:45:01 - INFO - __main__ - Step 46123: {'lr': 0.00039813727008801945, 'samples': 8855616, 'steps': 46122, 'loss/train': 1.3049921989440918} -11/07/2021 03:45:02 - INFO - __main__ - Step 46124: {'lr': 0.00039813299528979263, 'samples': 8855808, 'steps': 46123, 'loss/train': 1.8983211517333984} -11/07/2021 03:45:03 - INFO - __main__ - Step 46125: {'lr': 0.0003981287204248194, 'samples': 8856000, 'steps': 46124, 'loss/train': 1.713747262954712} -11/07/2021 03:45:03 - INFO - __main__ - Step 46126: {'lr': 0.0003981244454931017, 'samples': 8856192, 'steps': 46125, 'loss/train': 1.5147662162780762} -11/07/2021 03:45:03 - INFO - __main__ - Step 46127: {'lr': 0.00039812017049464126, 'samples': 8856384, 'steps': 46126, 'loss/train': 1.7749470472335815} -11/07/2021 03:45:04 - INFO - __main__ - Step 46128: {'lr': 0.0003981158954294403, 'samples': 8856576, 'steps': 46127, 'loss/train': 1.315519094467163} -11/07/2021 03:45:04 - INFO - __main__ - Step 46129: {'lr': 0.00039811162029750047, 'samples': 8856768, 'steps': 46128, 'loss/train': 1.5389231443405151} -11/07/2021 03:45:04 - INFO - __main__ - Step 46130: {'lr': 0.00039810734509882395, 'samples': 8856960, 'steps': 46129, 'loss/train': 1.6367995738983154} -11/07/2021 03:45:05 - INFO - __main__ - Step 46131: {'lr': 0.0003981030698334125, 'samples': 8857152, 'steps': 46130, 'loss/train': 0.968117892742157} -11/07/2021 03:45:06 - INFO - __main__ - Step 46132: {'lr': 0.00039809879450126805, 'samples': 8857344, 'steps': 46131, 'loss/train': 1.5910096168518066} -11/07/2021 03:45:06 - INFO - __main__ - Step 46133: {'lr': 0.00039809451910239257, 'samples': 8857536, 'steps': 46132, 'loss/train': 1.5100864171981812} -11/07/2021 03:45:06 - INFO - __main__ - Step 46134: {'lr': 0.000398090243636788, 'samples': 8857728, 'steps': 46133, 'loss/train': 1.3803400993347168} -11/07/2021 03:45:07 - INFO - __main__ - Step 46135: {'lr': 0.00039808596810445636, 'samples': 8857920, 'steps': 46134, 'loss/train': 1.642842411994934} -11/07/2021 03:45:08 - INFO - __main__ - Step 46136: {'lr': 0.0003980816925053994, 'samples': 8858112, 'steps': 46135, 'loss/train': 1.5238131284713745} -11/07/2021 03:45:08 - INFO - __main__ - Step 46137: {'lr': 0.0003980774168396191, 'samples': 8858304, 'steps': 46136, 'loss/train': 1.399741291999817} -11/07/2021 03:45:08 - INFO - __main__ - Step 46138: {'lr': 0.00039807314110711735, 'samples': 8858496, 'steps': 46137, 'loss/train': 1.3536529541015625} -11/07/2021 03:45:09 - INFO - __main__ - Step 46139: {'lr': 0.0003980688653078962, 'samples': 8858688, 'steps': 46138, 'loss/train': 1.0252282619476318} -11/07/2021 03:45:09 - INFO - __main__ - Step 46140: {'lr': 0.00039806458944195743, 'samples': 8858880, 'steps': 46139, 'loss/train': 2.035419464111328} -11/07/2021 03:45:10 - INFO - __main__ - Step 46141: {'lr': 0.00039806031350930315, 'samples': 8859072, 'steps': 46140, 'loss/train': 1.6623613834381104} -11/07/2021 03:45:11 - INFO - __main__ - Step 46142: {'lr': 0.00039805603750993514, 'samples': 8859264, 'steps': 46141, 'loss/train': 1.3882590532302856} -11/07/2021 03:45:11 - INFO - __main__ - Step 46143: {'lr': 0.0003980517614438553, 'samples': 8859456, 'steps': 46142, 'loss/train': 2.1687562465667725} -11/07/2021 03:45:11 - INFO - __main__ - Step 46144: {'lr': 0.00039804748531106565, 'samples': 8859648, 'steps': 46143, 'loss/train': 1.4556162357330322} -11/07/2021 03:45:12 - INFO - __main__ - Step 46145: {'lr': 0.0003980432091115681, 'samples': 8859840, 'steps': 46144, 'loss/train': 1.7229753732681274} -11/07/2021 03:45:13 - INFO - __main__ - Step 46146: {'lr': 0.0003980389328453646, 'samples': 8860032, 'steps': 46145, 'loss/train': 1.2073771953582764} -11/07/2021 03:45:13 - INFO - __main__ - Step 46147: {'lr': 0.00039803465651245694, 'samples': 8860224, 'steps': 46146, 'loss/train': 1.692874550819397} -11/07/2021 03:45:13 - INFO - __main__ - Step 46148: {'lr': 0.00039803038011284724, 'samples': 8860416, 'steps': 46147, 'loss/train': 1.5015639066696167} -11/07/2021 03:45:14 - INFO - __main__ - Step 46149: {'lr': 0.00039802610364653737, 'samples': 8860608, 'steps': 46148, 'loss/train': 1.696057915687561} -11/07/2021 03:45:14 - INFO - __main__ - Step 46150: {'lr': 0.00039802182711352906, 'samples': 8860800, 'steps': 46149, 'loss/train': 1.4315892457962036} -11/07/2021 03:45:15 - INFO - __main__ - Step 46151: {'lr': 0.0003980175505138246, 'samples': 8860992, 'steps': 46150, 'loss/train': 1.3779420852661133} -11/07/2021 03:45:15 - INFO - __main__ - Step 46152: {'lr': 0.0003980132738474256, 'samples': 8861184, 'steps': 46151, 'loss/train': 1.1602864265441895} -11/07/2021 03:45:16 - INFO - __main__ - Step 46153: {'lr': 0.0003980089971143341, 'samples': 8861376, 'steps': 46152, 'loss/train': 1.6327952146530151} -11/07/2021 03:45:16 - INFO - __main__ - Step 46154: {'lr': 0.000398004720314552, 'samples': 8861568, 'steps': 46153, 'loss/train': 2.127473831176758} -11/07/2021 03:45:17 - INFO - __main__ - Step 46155: {'lr': 0.00039800044344808134, 'samples': 8861760, 'steps': 46154, 'loss/train': 1.058316707611084} -11/07/2021 03:45:18 - INFO - __main__ - Step 46156: {'lr': 0.00039799616651492394, 'samples': 8861952, 'steps': 46155, 'loss/train': 1.5582176446914673} -11/07/2021 03:45:18 - INFO - __main__ - Step 46157: {'lr': 0.00039799188951508176, 'samples': 8862144, 'steps': 46156, 'loss/train': 1.5612353086471558} -11/07/2021 03:45:18 - INFO - __main__ - Step 46158: {'lr': 0.0003979876124485567, 'samples': 8862336, 'steps': 46157, 'loss/train': 0.9640724062919617} -11/07/2021 03:45:19 - INFO - __main__ - Step 46159: {'lr': 0.0003979833353153507, 'samples': 8862528, 'steps': 46158, 'loss/train': 1.6415303945541382} -11/07/2021 03:45:19 - INFO - __main__ - Step 46160: {'lr': 0.00039797905811546564, 'samples': 8862720, 'steps': 46159, 'loss/train': 1.5795783996582031} -11/07/2021 03:45:19 - INFO - __main__ - Step 46161: {'lr': 0.0003979747808489036, 'samples': 8862912, 'steps': 46160, 'loss/train': 1.205873727798462} -11/07/2021 03:45:20 - INFO - __main__ - Step 46162: {'lr': 0.0003979705035156663, 'samples': 8863104, 'steps': 46161, 'loss/train': 1.7263001203536987} -11/07/2021 03:45:21 - INFO - __main__ - Step 46163: {'lr': 0.0003979662261157558, 'samples': 8863296, 'steps': 46162, 'loss/train': 1.7620081901550293} -11/07/2021 03:45:21 - INFO - __main__ - Step 46164: {'lr': 0.00039796194864917414, 'samples': 8863488, 'steps': 46163, 'loss/train': 1.6041735410690308} -11/07/2021 03:45:21 - INFO - __main__ - Step 46165: {'lr': 0.00039795767111592303, 'samples': 8863680, 'steps': 46164, 'loss/train': 1.8693697452545166} -11/07/2021 03:45:22 - INFO - __main__ - Step 46166: {'lr': 0.00039795339351600444, 'samples': 8863872, 'steps': 46165, 'loss/train': 1.9089528322219849} -11/07/2021 03:45:23 - INFO - __main__ - Step 46167: {'lr': 0.0003979491158494203, 'samples': 8864064, 'steps': 46166, 'loss/train': 1.438377022743225} -11/07/2021 03:45:23 - INFO - __main__ - Step 46168: {'lr': 0.00039794483811617267, 'samples': 8864256, 'steps': 46167, 'loss/train': 1.8377418518066406} -11/07/2021 03:45:23 - INFO - __main__ - Step 46169: {'lr': 0.0003979405603162633, 'samples': 8864448, 'steps': 46168, 'loss/train': 1.2616311311721802} -11/07/2021 03:45:24 - INFO - __main__ - Step 46170: {'lr': 0.0003979362824496942, 'samples': 8864640, 'steps': 46169, 'loss/train': 1.7195957899093628} -11/07/2021 03:45:24 - INFO - __main__ - Step 46171: {'lr': 0.00039793200451646737, 'samples': 8864832, 'steps': 46170, 'loss/train': 1.6643671989440918} -11/07/2021 03:45:25 - INFO - __main__ - Step 46172: {'lr': 0.0003979277265165846, 'samples': 8865024, 'steps': 46171, 'loss/train': 1.4506498575210571} -11/07/2021 03:45:26 - INFO - __main__ - Step 46173: {'lr': 0.00039792344845004793, 'samples': 8865216, 'steps': 46172, 'loss/train': 1.3304592370986938} -11/07/2021 03:45:26 - INFO - __main__ - Step 46174: {'lr': 0.00039791917031685914, 'samples': 8865408, 'steps': 46173, 'loss/train': 1.5090699195861816} -11/07/2021 03:45:26 - INFO - __main__ - Step 46175: {'lr': 0.0003979148921170203, 'samples': 8865600, 'steps': 46174, 'loss/train': 1.5561892986297607} -11/07/2021 03:45:27 - INFO - __main__ - Step 46176: {'lr': 0.0003979106138505333, 'samples': 8865792, 'steps': 46175, 'loss/train': 1.3784784078598022} -11/07/2021 03:45:28 - INFO - __main__ - Step 46177: {'lr': 0.00039790633551740006, 'samples': 8865984, 'steps': 46176, 'loss/train': 1.4233170747756958} -11/07/2021 03:45:28 - INFO - __main__ - Step 46178: {'lr': 0.0003979020571176226, 'samples': 8866176, 'steps': 46177, 'loss/train': 1.3791457414627075} -11/07/2021 03:45:28 - INFO - __main__ - Step 46179: {'lr': 0.00039789777865120257, 'samples': 8866368, 'steps': 46178, 'loss/train': 1.4233858585357666} -11/07/2021 03:45:29 - INFO - __main__ - Step 46180: {'lr': 0.0003978935001181422, 'samples': 8866560, 'steps': 46179, 'loss/train': 1.8352843523025513} -11/07/2021 03:45:29 - INFO - __main__ - Step 46181: {'lr': 0.0003978892215184433, 'samples': 8866752, 'steps': 46180, 'loss/train': 1.3255808353424072} -11/07/2021 03:45:30 - INFO - __main__ - Step 46182: {'lr': 0.00039788494285210774, 'samples': 8866944, 'steps': 46181, 'loss/train': 1.5028743743896484} -11/07/2021 03:45:31 - INFO - __main__ - Step 46183: {'lr': 0.0003978806641191376, 'samples': 8867136, 'steps': 46182, 'loss/train': 1.8030539751052856} -11/07/2021 03:45:31 - INFO - __main__ - Step 46184: {'lr': 0.0003978763853195346, 'samples': 8867328, 'steps': 46183, 'loss/train': 1.3502064943313599} -11/07/2021 03:45:31 - INFO - __main__ - Step 46185: {'lr': 0.0003978721064533009, 'samples': 8867520, 'steps': 46184, 'loss/train': 1.466660976409912} -11/07/2021 03:45:32 - INFO - __main__ - Step 46186: {'lr': 0.0003978678275204383, 'samples': 8867712, 'steps': 46185, 'loss/train': 1.0451267957687378} -11/07/2021 03:45:32 - INFO - __main__ - Step 46187: {'lr': 0.00039786354852094864, 'samples': 8867904, 'steps': 46186, 'loss/train': 1.3738776445388794} -11/07/2021 03:45:33 - INFO - __main__ - Step 46188: {'lr': 0.00039785926945483396, 'samples': 8868096, 'steps': 46187, 'loss/train': 1.433671236038208} -11/07/2021 03:45:33 - INFO - __main__ - Step 46189: {'lr': 0.00039785499032209625, 'samples': 8868288, 'steps': 46188, 'loss/train': 1.3277513980865479} -11/07/2021 03:45:34 - INFO - __main__ - Step 46190: {'lr': 0.0003978507111227373, 'samples': 8868480, 'steps': 46189, 'loss/train': 1.5594428777694702} -11/07/2021 03:45:34 - INFO - __main__ - Step 46191: {'lr': 0.00039784643185675916, 'samples': 8868672, 'steps': 46190, 'loss/train': 1.5130149126052856} -11/07/2021 03:45:34 - INFO - __main__ - Step 46192: {'lr': 0.0003978421525241637, 'samples': 8868864, 'steps': 46191, 'loss/train': 1.791502833366394} -11/07/2021 03:45:35 - INFO - __main__ - Step 46193: {'lr': 0.00039783787312495277, 'samples': 8869056, 'steps': 46192, 'loss/train': 1.1747045516967773} -11/07/2021 03:45:36 - INFO - __main__ - Step 46194: {'lr': 0.0003978335936591284, 'samples': 8869248, 'steps': 46193, 'loss/train': 1.7039309740066528} -11/07/2021 03:45:36 - INFO - __main__ - Step 46195: {'lr': 0.00039782931412669253, 'samples': 8869440, 'steps': 46194, 'loss/train': 1.482157826423645} -11/07/2021 03:45:36 - INFO - __main__ - Step 46196: {'lr': 0.000397825034527647, 'samples': 8869632, 'steps': 46195, 'loss/train': 1.8387107849121094} -11/07/2021 03:45:37 - INFO - __main__ - Step 46197: {'lr': 0.0003978207548619939, 'samples': 8869824, 'steps': 46196, 'loss/train': 1.5056120157241821} -11/07/2021 03:45:38 - INFO - __main__ - Step 46198: {'lr': 0.000397816475129735, 'samples': 8870016, 'steps': 46197, 'loss/train': 1.4632428884506226} -11/07/2021 03:45:38 - INFO - __main__ - Step 46199: {'lr': 0.0003978121953308722, 'samples': 8870208, 'steps': 46198, 'loss/train': 1.8056995868682861} -11/07/2021 03:45:38 - INFO - __main__ - Step 46200: {'lr': 0.0003978079154654075, 'samples': 8870400, 'steps': 46199, 'loss/train': 1.4516160488128662} -11/07/2021 03:45:39 - INFO - __main__ - Step 46201: {'lr': 0.000397803635533343, 'samples': 8870592, 'steps': 46200, 'loss/train': 1.0014290809631348} -11/07/2021 03:45:39 - INFO - __main__ - Step 46202: {'lr': 0.00039779935553468026, 'samples': 8870784, 'steps': 46201, 'loss/train': 1.3329901695251465} -11/07/2021 03:45:40 - INFO - __main__ - Step 46203: {'lr': 0.0003977950754694215, 'samples': 8870976, 'steps': 46202, 'loss/train': 1.5694855451583862} -11/07/2021 03:45:41 - INFO - __main__ - Step 46204: {'lr': 0.00039779079533756856, 'samples': 8871168, 'steps': 46203, 'loss/train': 1.2100770473480225} -11/07/2021 03:45:41 - INFO - __main__ - Step 46205: {'lr': 0.00039778651513912343, 'samples': 8871360, 'steps': 46204, 'loss/train': 1.1733067035675049} -11/07/2021 03:45:41 - INFO - __main__ - Step 46206: {'lr': 0.00039778223487408796, 'samples': 8871552, 'steps': 46205, 'loss/train': 0.9480448961257935} -11/07/2021 03:45:42 - INFO - __main__ - Step 46207: {'lr': 0.000397777954542464, 'samples': 8871744, 'steps': 46206, 'loss/train': 1.1663490533828735} -11/07/2021 03:45:43 - INFO - __main__ - Step 46208: {'lr': 0.0003977736741442537, 'samples': 8871936, 'steps': 46207, 'loss/train': 1.4362285137176514} -11/07/2021 03:45:43 - INFO - __main__ - Step 46209: {'lr': 0.00039776939367945874, 'samples': 8872128, 'steps': 46208, 'loss/train': 1.7439661026000977} -11/07/2021 03:45:44 - INFO - __main__ - Step 46210: {'lr': 0.00039776511314808125, 'samples': 8872320, 'steps': 46209, 'loss/train': 1.4757336378097534} -11/07/2021 03:45:44 - INFO - __main__ - Step 46211: {'lr': 0.00039776083255012307, 'samples': 8872512, 'steps': 46210, 'loss/train': 1.7445675134658813} -11/07/2021 03:45:44 - INFO - __main__ - Step 46212: {'lr': 0.0003977565518855861, 'samples': 8872704, 'steps': 46211, 'loss/train': 1.7271639108657837} -11/07/2021 03:45:45 - INFO - __main__ - Step 46213: {'lr': 0.0003977522711544723, 'samples': 8872896, 'steps': 46212, 'loss/train': 1.2396310567855835} -11/07/2021 03:45:46 - INFO - __main__ - Step 46214: {'lr': 0.00039774799035678367, 'samples': 8873088, 'steps': 46213, 'loss/train': 1.4215750694274902} -11/07/2021 03:45:46 - INFO - __main__ - Step 46215: {'lr': 0.000397743709492522, 'samples': 8873280, 'steps': 46214, 'loss/train': 1.7732235193252563} -11/07/2021 03:45:46 - INFO - __main__ - Step 46216: {'lr': 0.0003977394285616893, 'samples': 8873472, 'steps': 46215, 'loss/train': 1.045384407043457} -11/07/2021 03:45:47 - INFO - __main__ - Step 46217: {'lr': 0.0003977351475642876, 'samples': 8873664, 'steps': 46216, 'loss/train': 0.8771900534629822} -11/07/2021 03:45:47 - INFO - __main__ - Step 46218: {'lr': 0.00039773086650031866, 'samples': 8873856, 'steps': 46217, 'loss/train': 0.9818655848503113} -11/07/2021 03:45:48 - INFO - __main__ - Step 46219: {'lr': 0.00039772658536978443, 'samples': 8874048, 'steps': 46218, 'loss/train': 1.6137886047363281} -11/07/2021 03:45:48 - INFO - __main__ - Step 46220: {'lr': 0.00039772230417268697, 'samples': 8874240, 'steps': 46219, 'loss/train': 1.6870713233947754} -11/07/2021 03:45:49 - INFO - __main__ - Step 46221: {'lr': 0.00039771802290902806, 'samples': 8874432, 'steps': 46220, 'loss/train': 1.9500912427902222} -11/07/2021 03:45:49 - INFO - __main__ - Step 46222: {'lr': 0.0003977137415788097, 'samples': 8874624, 'steps': 46221, 'loss/train': 1.2778922319412231} -11/07/2021 03:45:49 - INFO - __main__ - Step 46223: {'lr': 0.00039770946018203375, 'samples': 8874816, 'steps': 46222, 'loss/train': 1.569501519203186} -11/07/2021 03:45:51 - INFO - __main__ - Step 46224: {'lr': 0.00039770517871870226, 'samples': 8875008, 'steps': 46223, 'loss/train': 1.6372594833374023} -11/07/2021 03:45:51 - INFO - __main__ - Step 46225: {'lr': 0.00039770089718881707, 'samples': 8875200, 'steps': 46224, 'loss/train': 0.9442867040634155} -11/07/2021 03:45:51 - INFO - __main__ - Step 46226: {'lr': 0.00039769661559238014, 'samples': 8875392, 'steps': 46225, 'loss/train': 1.5672374963760376} -11/07/2021 03:45:52 - INFO - __main__ - Step 46227: {'lr': 0.0003976923339293934, 'samples': 8875584, 'steps': 46226, 'loss/train': 1.2659668922424316} -11/07/2021 03:45:52 - INFO - __main__ - Step 46228: {'lr': 0.0003976880521998588, 'samples': 8875776, 'steps': 46227, 'loss/train': 1.7109959125518799} -11/07/2021 03:45:52 - INFO - __main__ - Step 46229: {'lr': 0.00039768377040377823, 'samples': 8875968, 'steps': 46228, 'loss/train': 1.5612633228302002} -11/07/2021 03:45:53 - INFO - __main__ - Step 46230: {'lr': 0.00039767948854115356, 'samples': 8876160, 'steps': 46229, 'loss/train': 3.5253870487213135} -11/07/2021 03:45:54 - INFO - __main__ - Step 46231: {'lr': 0.0003976752066119869, 'samples': 8876352, 'steps': 46230, 'loss/train': 1.3928388357162476} -11/07/2021 03:45:54 - INFO - __main__ - Step 46232: {'lr': 0.00039767092461628, 'samples': 8876544, 'steps': 46231, 'loss/train': 1.063865303993225} -11/07/2021 03:45:55 - INFO - __main__ - Step 46233: {'lr': 0.0003976666425540349, 'samples': 8876736, 'steps': 46232, 'loss/train': 1.5887515544891357} -11/07/2021 03:45:55 - INFO - __main__ - Step 46234: {'lr': 0.00039766236042525346, 'samples': 8876928, 'steps': 46233, 'loss/train': 1.708302617073059} -11/07/2021 03:45:56 - INFO - __main__ - Step 46235: {'lr': 0.0003976580782299376, 'samples': 8877120, 'steps': 46234, 'loss/train': 1.5173242092132568} -11/07/2021 03:45:56 - INFO - __main__ - Step 46236: {'lr': 0.0003976537959680894, 'samples': 8877312, 'steps': 46235, 'loss/train': 1.6224896907806396} -11/07/2021 03:45:57 - INFO - __main__ - Step 46237: {'lr': 0.0003976495136397106, 'samples': 8877504, 'steps': 46236, 'loss/train': 1.1167081594467163} -11/07/2021 03:45:57 - INFO - __main__ - Step 46238: {'lr': 0.0003976452312448032, 'samples': 8877696, 'steps': 46237, 'loss/train': 1.2795268297195435} -11/07/2021 03:45:57 - INFO - __main__ - Step 46239: {'lr': 0.0003976409487833692, 'samples': 8877888, 'steps': 46238, 'loss/train': 1.6856943368911743} -11/07/2021 03:45:58 - INFO - __main__ - Step 46240: {'lr': 0.0003976366662554104, 'samples': 8878080, 'steps': 46239, 'loss/train': 0.9027916789054871} -11/07/2021 03:45:59 - INFO - __main__ - Step 46241: {'lr': 0.0003976323836609288, 'samples': 8878272, 'steps': 46240, 'loss/train': 1.8561947345733643} -11/07/2021 03:45:59 - INFO - __main__ - Step 46242: {'lr': 0.00039762810099992644, 'samples': 8878464, 'steps': 46241, 'loss/train': 1.3961539268493652} -11/07/2021 03:46:00 - INFO - __main__ - Step 46243: {'lr': 0.00039762381827240496, 'samples': 8878656, 'steps': 46242, 'loss/train': 0.9099176526069641} -11/07/2021 03:46:00 - INFO - __main__ - Step 46244: {'lr': 0.00039761953547836655, 'samples': 8878848, 'steps': 46243, 'loss/train': 2.1442995071411133} -11/07/2021 03:46:01 - INFO - __main__ - Step 46245: {'lr': 0.00039761525261781304, 'samples': 8879040, 'steps': 46244, 'loss/train': 1.3313018083572388} -11/07/2021 03:46:01 - INFO - __main__ - Step 46246: {'lr': 0.00039761096969074644, 'samples': 8879232, 'steps': 46245, 'loss/train': 1.868284821510315} -11/07/2021 03:46:02 - INFO - __main__ - Step 46247: {'lr': 0.0003976066866971686, 'samples': 8879424, 'steps': 46246, 'loss/train': 1.4452598094940186} -11/07/2021 03:46:02 - INFO - __main__ - Step 46248: {'lr': 0.0003976024036370814, 'samples': 8879616, 'steps': 46247, 'loss/train': 1.410376787185669} -11/07/2021 03:46:02 - INFO - __main__ - Step 46249: {'lr': 0.0003975981205104868, 'samples': 8879808, 'steps': 46248, 'loss/train': 0.6749045252799988} -11/07/2021 03:46:03 - INFO - __main__ - Step 46250: {'lr': 0.0003975938373173868, 'samples': 8880000, 'steps': 46249, 'loss/train': 1.77179753780365} -11/07/2021 03:46:04 - INFO - __main__ - Step 46251: {'lr': 0.00039758955405778344, 'samples': 8880192, 'steps': 46250, 'loss/train': 1.5711568593978882} -11/07/2021 03:46:04 - INFO - __main__ - Step 46252: {'lr': 0.0003975852707316784, 'samples': 8880384, 'steps': 46251, 'loss/train': 1.2575101852416992} -11/07/2021 03:46:05 - INFO - __main__ - Step 46253: {'lr': 0.00039758098733907364, 'samples': 8880576, 'steps': 46252, 'loss/train': 1.2835415601730347} -11/07/2021 03:46:05 - INFO - __main__ - Step 46254: {'lr': 0.00039757670387997125, 'samples': 8880768, 'steps': 46253, 'loss/train': 1.1759365797042847} -11/07/2021 03:46:05 - INFO - __main__ - Step 46255: {'lr': 0.000397572420354373, 'samples': 8880960, 'steps': 46254, 'loss/train': 1.6075844764709473} -11/07/2021 03:46:06 - INFO - __main__ - Step 46256: {'lr': 0.00039756813676228097, 'samples': 8881152, 'steps': 46255, 'loss/train': 1.6370705366134644} -11/07/2021 03:46:07 - INFO - __main__ - Step 46257: {'lr': 0.00039756385310369703, 'samples': 8881344, 'steps': 46256, 'loss/train': 1.8248659372329712} -11/07/2021 03:46:07 - INFO - __main__ - Step 46258: {'lr': 0.00039755956937862305, 'samples': 8881536, 'steps': 46257, 'loss/train': 1.6447463035583496} -11/07/2021 03:46:07 - INFO - __main__ - Step 46259: {'lr': 0.000397555285587061, 'samples': 8881728, 'steps': 46258, 'loss/train': 1.0949921607971191} -11/07/2021 03:46:08 - INFO - __main__ - Step 46260: {'lr': 0.0003975510017290128, 'samples': 8881920, 'steps': 46259, 'loss/train': 1.5389002561569214} -11/07/2021 03:46:08 - INFO - __main__ - Step 46261: {'lr': 0.00039754671780448044, 'samples': 8882112, 'steps': 46260, 'loss/train': 1.0770015716552734} -11/07/2021 03:46:09 - INFO - __main__ - Step 46262: {'lr': 0.00039754243381346575, 'samples': 8882304, 'steps': 46261, 'loss/train': 1.4575480222702026} -11/07/2021 03:46:10 - INFO - __main__ - Step 46263: {'lr': 0.0003975381497559708, 'samples': 8882496, 'steps': 46262, 'loss/train': 0.6957834959030151} -11/07/2021 03:46:10 - INFO - __main__ - Step 46264: {'lr': 0.00039753386563199733, 'samples': 8882688, 'steps': 46263, 'loss/train': 1.280260443687439} -11/07/2021 03:46:10 - INFO - __main__ - Step 46265: {'lr': 0.0003975295814415475, 'samples': 8882880, 'steps': 46264, 'loss/train': 1.0015782117843628} -11/07/2021 03:46:11 - INFO - __main__ - Step 46266: {'lr': 0.000397525297184623, 'samples': 8883072, 'steps': 46265, 'loss/train': 1.1495505571365356} -11/07/2021 03:46:12 - INFO - __main__ - Step 46267: {'lr': 0.000397521012861226, 'samples': 8883264, 'steps': 46266, 'loss/train': 1.4827730655670166} -11/07/2021 03:46:12 - INFO - __main__ - Step 46268: {'lr': 0.0003975167284713582, 'samples': 8883456, 'steps': 46267, 'loss/train': 0.9695247411727905} -11/07/2021 03:46:12 - INFO - __main__ - Step 46269: {'lr': 0.0003975124440150217, 'samples': 8883648, 'steps': 46268, 'loss/train': 1.5522502660751343} -11/07/2021 03:46:13 - INFO - __main__ - Step 46270: {'lr': 0.0003975081594922183, 'samples': 8883840, 'steps': 46269, 'loss/train': 1.0997180938720703} -11/07/2021 03:46:13 - INFO - __main__ - Step 46271: {'lr': 0.00039750387490295006, 'samples': 8884032, 'steps': 46270, 'loss/train': 1.3116071224212646} -11/07/2021 03:46:14 - INFO - __main__ - Step 46272: {'lr': 0.00039749959024721883, 'samples': 8884224, 'steps': 46271, 'loss/train': 1.546545386314392} -11/07/2021 03:46:14 - INFO - __main__ - Step 46273: {'lr': 0.00039749530552502654, 'samples': 8884416, 'steps': 46272, 'loss/train': 1.332622766494751} -11/07/2021 03:46:15 - INFO - __main__ - Step 46274: {'lr': 0.0003974910207363752, 'samples': 8884608, 'steps': 46273, 'loss/train': 1.4993009567260742} -11/07/2021 03:46:15 - INFO - __main__ - Step 46275: {'lr': 0.00039748673588126674, 'samples': 8884800, 'steps': 46274, 'loss/train': 1.944024682044983} -11/07/2021 03:46:16 - INFO - __main__ - Step 46276: {'lr': 0.00039748245095970285, 'samples': 8884992, 'steps': 46275, 'loss/train': 1.0248795747756958} -11/07/2021 03:46:17 - INFO - __main__ - Step 46277: {'lr': 0.0003974781659716857, 'samples': 8885184, 'steps': 46276, 'loss/train': 1.0836387872695923} -11/07/2021 03:46:17 - INFO - __main__ - Step 46278: {'lr': 0.00039747388091721723, 'samples': 8885376, 'steps': 46277, 'loss/train': 1.4748361110687256} -11/07/2021 03:46:17 - INFO - __main__ - Step 46279: {'lr': 0.00039746959579629924, 'samples': 8885568, 'steps': 46278, 'loss/train': 1.4609371423721313} -11/07/2021 03:46:18 - INFO - __main__ - Step 46280: {'lr': 0.00039746531060893387, 'samples': 8885760, 'steps': 46279, 'loss/train': 1.255275845527649} -11/07/2021 03:46:18 - INFO - __main__ - Step 46281: {'lr': 0.00039746102535512273, 'samples': 8885952, 'steps': 46280, 'loss/train': 1.3065893650054932} -11/07/2021 03:46:19 - INFO - __main__ - Step 46282: {'lr': 0.000397456740034868, 'samples': 8886144, 'steps': 46281, 'loss/train': 1.4119219779968262} -11/07/2021 03:46:19 - INFO - __main__ - Step 46283: {'lr': 0.00039745245464817156, 'samples': 8886336, 'steps': 46282, 'loss/train': 1.323103666305542} -11/07/2021 03:46:20 - INFO - __main__ - Step 46284: {'lr': 0.0003974481691950352, 'samples': 8886528, 'steps': 46283, 'loss/train': 1.300934910774231} -11/07/2021 03:46:20 - INFO - __main__ - Step 46285: {'lr': 0.00039744388367546113, 'samples': 8886720, 'steps': 46284, 'loss/train': 1.2084866762161255} -11/07/2021 03:46:20 - INFO - __main__ - Step 46286: {'lr': 0.0003974395980894511, 'samples': 8886912, 'steps': 46285, 'loss/train': 1.968017339706421} -11/07/2021 03:46:21 - INFO - __main__ - Step 46287: {'lr': 0.000397435312437007, 'samples': 8887104, 'steps': 46286, 'loss/train': 1.5359374284744263} -11/07/2021 03:46:22 - INFO - __main__ - Step 46288: {'lr': 0.0003974310267181308, 'samples': 8887296, 'steps': 46287, 'loss/train': 1.4335994720458984} -11/07/2021 03:46:22 - INFO - __main__ - Step 46289: {'lr': 0.00039742674093282447, 'samples': 8887488, 'steps': 46288, 'loss/train': 0.9824011921882629} -11/07/2021 03:46:23 - INFO - __main__ - Step 46290: {'lr': 0.00039742245508109, 'samples': 8887680, 'steps': 46289, 'loss/train': 1.5129871368408203} -11/07/2021 03:46:23 - INFO - __main__ - Step 46291: {'lr': 0.0003974181691629292, 'samples': 8887872, 'steps': 46290, 'loss/train': 0.4517260491847992} -11/07/2021 03:46:23 - INFO - __main__ - Step 46292: {'lr': 0.00039741388317834404, 'samples': 8888064, 'steps': 46291, 'loss/train': 0.2578364312648773} -11/07/2021 03:46:24 - INFO - __main__ - Step 46293: {'lr': 0.0003974095971273365, 'samples': 8888256, 'steps': 46292, 'loss/train': 1.7126384973526} -11/07/2021 03:46:25 - INFO - __main__ - Step 46294: {'lr': 0.0003974053110099084, 'samples': 8888448, 'steps': 46293, 'loss/train': 1.5983866453170776} -11/07/2021 03:46:25 - INFO - __main__ - Step 46295: {'lr': 0.00039740102482606175, 'samples': 8888640, 'steps': 46294, 'loss/train': 1.3725718259811401} -11/07/2021 03:46:25 - INFO - __main__ - Step 46296: {'lr': 0.0003973967385757985, 'samples': 8888832, 'steps': 46295, 'loss/train': 1.0838935375213623} -11/07/2021 03:46:26 - INFO - __main__ - Step 46297: {'lr': 0.00039739245225912055, 'samples': 8889024, 'steps': 46296, 'loss/train': 1.899027943611145} -11/07/2021 03:46:27 - INFO - __main__ - Step 46298: {'lr': 0.0003973881658760298, 'samples': 8889216, 'steps': 46297, 'loss/train': 1.5178961753845215} -11/07/2021 03:46:27 - INFO - __main__ - Step 46299: {'lr': 0.0003973838794265283, 'samples': 8889408, 'steps': 46298, 'loss/train': 1.2332338094711304} -11/07/2021 03:46:27 - INFO - __main__ - Step 46300: {'lr': 0.00039737959291061785, 'samples': 8889600, 'steps': 46299, 'loss/train': 1.6719191074371338} -11/07/2021 03:46:28 - INFO - __main__ - Step 46301: {'lr': 0.00039737530632830045, 'samples': 8889792, 'steps': 46300, 'loss/train': 1.134166955947876} -11/07/2021 03:46:28 - INFO - __main__ - Step 46302: {'lr': 0.000397371019679578, 'samples': 8889984, 'steps': 46301, 'loss/train': 1.2153406143188477} -11/07/2021 03:46:29 - INFO - __main__ - Step 46303: {'lr': 0.00039736673296445233, 'samples': 8890176, 'steps': 46302, 'loss/train': 1.4334412813186646} -11/07/2021 03:46:30 - INFO - __main__ - Step 46304: {'lr': 0.00039736244618292563, 'samples': 8890368, 'steps': 46303, 'loss/train': 1.919948935508728} -11/07/2021 03:46:30 - INFO - __main__ - Step 46305: {'lr': 0.0003973581593349997, 'samples': 8890560, 'steps': 46304, 'loss/train': 1.259997010231018} -11/07/2021 03:46:30 - INFO - __main__ - Step 46306: {'lr': 0.00039735387242067637, 'samples': 8890752, 'steps': 46305, 'loss/train': 1.6165543794631958} -11/07/2021 03:46:31 - INFO - __main__ - Step 46307: {'lr': 0.0003973495854399577, 'samples': 8890944, 'steps': 46306, 'loss/train': 1.770179271697998} -11/07/2021 03:46:32 - INFO - __main__ - Step 46308: {'lr': 0.0003973452983928456, 'samples': 8891136, 'steps': 46307, 'loss/train': 1.8767409324645996} -11/07/2021 03:46:32 - INFO - __main__ - Step 46309: {'lr': 0.00039734101127934194, 'samples': 8891328, 'steps': 46308, 'loss/train': 1.3616315126419067} -11/07/2021 03:46:32 - INFO - __main__ - Step 46310: {'lr': 0.0003973367240994487, 'samples': 8891520, 'steps': 46309, 'loss/train': 1.2925238609313965} -11/07/2021 03:46:33 - INFO - __main__ - Step 46311: {'lr': 0.00039733243685316776, 'samples': 8891712, 'steps': 46310, 'loss/train': 1.692766547203064} -11/07/2021 03:46:33 - INFO - __main__ - Step 46312: {'lr': 0.00039732814954050125, 'samples': 8891904, 'steps': 46311, 'loss/train': 1.7525407075881958} -11/07/2021 03:46:34 - INFO - __main__ - Step 46313: {'lr': 0.0003973238621614508, 'samples': 8892096, 'steps': 46312, 'loss/train': 1.7229480743408203} -11/07/2021 03:46:34 - INFO - __main__ - Step 46314: {'lr': 0.0003973195747160185, 'samples': 8892288, 'steps': 46313, 'loss/train': 1.8279120922088623} -11/07/2021 03:46:35 - INFO - __main__ - Step 46315: {'lr': 0.00039731528720420635, 'samples': 8892480, 'steps': 46314, 'loss/train': 1.6845635175704956} -11/07/2021 03:46:35 - INFO - __main__ - Step 46316: {'lr': 0.00039731099962601613, 'samples': 8892672, 'steps': 46315, 'loss/train': 1.5683223009109497} -11/07/2021 03:46:35 - INFO - __main__ - Step 46317: {'lr': 0.0003973067119814499, 'samples': 8892864, 'steps': 46316, 'loss/train': 1.3998371362686157} -11/07/2021 03:46:36 - INFO - __main__ - Step 46318: {'lr': 0.00039730242427050955, 'samples': 8893056, 'steps': 46317, 'loss/train': 1.473682165145874} -11/07/2021 03:46:37 - INFO - __main__ - Step 46319: {'lr': 0.00039729813649319704, 'samples': 8893248, 'steps': 46318, 'loss/train': 1.5312484502792358} -11/07/2021 03:46:37 - INFO - __main__ - Step 46320: {'lr': 0.0003972938486495141, 'samples': 8893440, 'steps': 46319, 'loss/train': 1.6194556951522827} -11/07/2021 03:46:38 - INFO - __main__ - Step 46321: {'lr': 0.000397289560739463, 'samples': 8893632, 'steps': 46320, 'loss/train': 0.7224371433258057} -11/07/2021 03:46:38 - INFO - __main__ - Step 46322: {'lr': 0.0003972852727630454, 'samples': 8893824, 'steps': 46321, 'loss/train': 1.4943556785583496} -11/07/2021 03:46:39 - INFO - __main__ - Step 46323: {'lr': 0.0003972809847202633, 'samples': 8894016, 'steps': 46322, 'loss/train': 1.1739274263381958} -11/07/2021 03:46:39 - INFO - __main__ - Step 46324: {'lr': 0.0003972766966111187, 'samples': 8894208, 'steps': 46323, 'loss/train': 1.3836803436279297} -11/07/2021 03:46:40 - INFO - __main__ - Step 46325: {'lr': 0.0003972724084356135, 'samples': 8894400, 'steps': 46324, 'loss/train': 1.1018271446228027} -11/07/2021 03:46:40 - INFO - __main__ - Step 46326: {'lr': 0.0003972681201937497, 'samples': 8894592, 'steps': 46325, 'loss/train': 1.9598287343978882} -11/07/2021 03:46:40 - INFO - __main__ - Step 46327: {'lr': 0.00039726383188552907, 'samples': 8894784, 'steps': 46326, 'loss/train': 0.4965382516384125} -11/07/2021 03:46:41 - INFO - __main__ - Step 46328: {'lr': 0.0003972595435109536, 'samples': 8894976, 'steps': 46327, 'loss/train': 1.0187140703201294} -11/07/2021 03:46:42 - INFO - __main__ - Step 46329: {'lr': 0.0003972552550700253, 'samples': 8895168, 'steps': 46328, 'loss/train': 1.9053086042404175} -11/07/2021 03:46:42 - INFO - __main__ - Step 46330: {'lr': 0.00039725096656274605, 'samples': 8895360, 'steps': 46329, 'loss/train': 1.474176287651062} -11/07/2021 03:46:42 - INFO - __main__ - Step 46331: {'lr': 0.0003972466779891178, 'samples': 8895552, 'steps': 46330, 'loss/train': 1.58558988571167} -11/07/2021 03:46:43 - INFO - __main__ - Step 46332: {'lr': 0.00039724238934914246, 'samples': 8895744, 'steps': 46331, 'loss/train': 1.1344085931777954} -11/07/2021 03:46:43 - INFO - __main__ - Step 46333: {'lr': 0.00039723810064282194, 'samples': 8895936, 'steps': 46332, 'loss/train': 1.906126856803894} -11/07/2021 03:46:44 - INFO - __main__ - Step 46334: {'lr': 0.00039723381187015827, 'samples': 8896128, 'steps': 46333, 'loss/train': 1.4070894718170166} -11/07/2021 03:46:44 - INFO - __main__ - Step 46335: {'lr': 0.00039722952303115325, 'samples': 8896320, 'steps': 46334, 'loss/train': 1.662004828453064} -11/07/2021 03:46:45 - INFO - __main__ - Step 46336: {'lr': 0.00039722523412580893, 'samples': 8896512, 'steps': 46335, 'loss/train': 1.8109190464019775} -11/07/2021 03:46:45 - INFO - __main__ - Step 46337: {'lr': 0.00039722094515412716, 'samples': 8896704, 'steps': 46336, 'loss/train': 1.2489622831344604} -11/07/2021 03:46:45 - INFO - __main__ - Step 46338: {'lr': 0.0003972166561161099, 'samples': 8896896, 'steps': 46337, 'loss/train': 1.6360827684402466} -11/07/2021 03:46:46 - INFO - __main__ - Step 46339: {'lr': 0.0003972123670117591, 'samples': 8897088, 'steps': 46338, 'loss/train': 1.5947308540344238} -11/07/2021 03:46:47 - INFO - __main__ - Step 46340: {'lr': 0.0003972080778410767, 'samples': 8897280, 'steps': 46339, 'loss/train': 1.5650063753128052} -11/07/2021 03:46:47 - INFO - __main__ - Step 46341: {'lr': 0.0003972037886040646, 'samples': 8897472, 'steps': 46340, 'loss/train': 1.557324767112732} -11/07/2021 03:46:47 - INFO - __main__ - Step 46342: {'lr': 0.0003971994993007247, 'samples': 8897664, 'steps': 46341, 'loss/train': 1.0299310684204102} -11/07/2021 03:46:48 - INFO - __main__ - Step 46343: {'lr': 0.000397195209931059, 'samples': 8897856, 'steps': 46342, 'loss/train': 1.5515167713165283} -11/07/2021 03:46:49 - INFO - __main__ - Step 46344: {'lr': 0.00039719092049506945, 'samples': 8898048, 'steps': 46343, 'loss/train': 1.3159284591674805} -11/07/2021 03:46:49 - INFO - __main__ - Step 46345: {'lr': 0.0003971866309927579, 'samples': 8898240, 'steps': 46344, 'loss/train': 1.5566840171813965} -11/07/2021 03:46:50 - INFO - __main__ - Step 46346: {'lr': 0.0003971823414241263, 'samples': 8898432, 'steps': 46345, 'loss/train': 1.3025474548339844} -11/07/2021 03:46:50 - INFO - __main__ - Step 46347: {'lr': 0.00039717805178917666, 'samples': 8898624, 'steps': 46346, 'loss/train': 0.9771838188171387} -11/07/2021 03:46:50 - INFO - __main__ - Step 46348: {'lr': 0.0003971737620879109, 'samples': 8898816, 'steps': 46347, 'loss/train': 1.1943190097808838} -11/07/2021 03:46:52 - INFO - __main__ - Step 46349: {'lr': 0.00039716947232033086, 'samples': 8899008, 'steps': 46348, 'loss/train': 1.3805917501449585} -11/07/2021 03:46:52 - INFO - __main__ - Step 46350: {'lr': 0.0003971651824864385, 'samples': 8899200, 'steps': 46349, 'loss/train': 1.2455881834030151} -11/07/2021 03:46:52 - INFO - __main__ - Step 46351: {'lr': 0.0003971608925862358, 'samples': 8899392, 'steps': 46350, 'loss/train': 0.6013545393943787} -11/07/2021 03:46:53 - INFO - __main__ - Step 46352: {'lr': 0.0003971566026197247, 'samples': 8899584, 'steps': 46351, 'loss/train': 1.3850561380386353} -11/07/2021 03:46:53 - INFO - __main__ - Step 46353: {'lr': 0.0003971523125869071, 'samples': 8899776, 'steps': 46352, 'loss/train': 1.5100414752960205} -11/07/2021 03:46:54 - INFO - __main__ - Step 46354: {'lr': 0.0003971480224877849, 'samples': 8899968, 'steps': 46353, 'loss/train': 1.7108681201934814} -11/07/2021 03:46:54 - INFO - __main__ - Step 46355: {'lr': 0.0003971437323223601, 'samples': 8900160, 'steps': 46354, 'loss/train': 1.50070321559906} -11/07/2021 03:46:55 - INFO - __main__ - Step 46356: {'lr': 0.0003971394420906346, 'samples': 8900352, 'steps': 46355, 'loss/train': 1.4882370233535767} -11/07/2021 03:46:55 - INFO - __main__ - Step 46357: {'lr': 0.0003971351517926103, 'samples': 8900544, 'steps': 46356, 'loss/train': 1.826380729675293} -11/07/2021 03:46:55 - INFO - __main__ - Step 46358: {'lr': 0.00039713086142828926, 'samples': 8900736, 'steps': 46357, 'loss/train': 1.4136426448822021} -11/07/2021 03:46:56 - INFO - __main__ - Step 46359: {'lr': 0.0003971265709976732, 'samples': 8900928, 'steps': 46358, 'loss/train': 1.0631334781646729} -11/07/2021 03:46:57 - INFO - __main__ - Step 46360: {'lr': 0.0003971222805007643, 'samples': 8901120, 'steps': 46359, 'loss/train': 1.5096248388290405} -11/07/2021 03:46:57 - INFO - __main__ - Step 46361: {'lr': 0.0003971179899375643, 'samples': 8901312, 'steps': 46360, 'loss/train': 1.5115386247634888} -11/07/2021 03:46:57 - INFO - __main__ - Step 46362: {'lr': 0.0003971136993080753, 'samples': 8901504, 'steps': 46361, 'loss/train': 1.3785995244979858} -11/07/2021 03:46:58 - INFO - __main__ - Step 46363: {'lr': 0.000397109408612299, 'samples': 8901696, 'steps': 46362, 'loss/train': 1.4775710105895996} -11/07/2021 03:46:58 - INFO - __main__ - Step 46364: {'lr': 0.0003971051178502375, 'samples': 8901888, 'steps': 46363, 'loss/train': 1.3644808530807495} -11/07/2021 03:46:59 - INFO - __main__ - Step 46365: {'lr': 0.00039710082702189276, 'samples': 8902080, 'steps': 46364, 'loss/train': 0.9544762372970581} -11/07/2021 03:46:59 - INFO - __main__ - Step 46366: {'lr': 0.0003970965361272667, 'samples': 8902272, 'steps': 46365, 'loss/train': 1.3058061599731445} -11/07/2021 03:47:00 - INFO - __main__ - Step 46367: {'lr': 0.0003970922451663611, 'samples': 8902464, 'steps': 46366, 'loss/train': 1.5385879278182983} -11/07/2021 03:47:00 - INFO - __main__ - Step 46368: {'lr': 0.0003970879541391781, 'samples': 8902656, 'steps': 46367, 'loss/train': 1.2907299995422363} -11/07/2021 03:47:01 - INFO - __main__ - Step 46369: {'lr': 0.0003970836630457194, 'samples': 8902848, 'steps': 46368, 'loss/train': 1.6435942649841309} -11/07/2021 03:47:02 - INFO - __main__ - Step 46370: {'lr': 0.00039707937188598717, 'samples': 8903040, 'steps': 46369, 'loss/train': 1.3786275386810303} -11/07/2021 03:47:02 - INFO - __main__ - Step 46371: {'lr': 0.00039707508065998324, 'samples': 8903232, 'steps': 46370, 'loss/train': 1.4974207878112793} -11/07/2021 03:47:03 - INFO - __main__ - Step 46372: {'lr': 0.0003970707893677095, 'samples': 8903424, 'steps': 46371, 'loss/train': 1.7725350856781006} -11/07/2021 03:47:03 - INFO - __main__ - Step 46373: {'lr': 0.00039706649800916804, 'samples': 8903616, 'steps': 46372, 'loss/train': 1.5043054819107056} -11/07/2021 03:47:03 - INFO - __main__ - Step 46374: {'lr': 0.0003970622065843607, 'samples': 8903808, 'steps': 46373, 'loss/train': 5.2578558921813965} -11/07/2021 03:47:04 - INFO - __main__ - Step 46375: {'lr': 0.00039705791509328926, 'samples': 8904000, 'steps': 46374, 'loss/train': 1.6006724834442139} -11/07/2021 03:47:05 - INFO - __main__ - Step 46376: {'lr': 0.0003970536235359558, 'samples': 8904192, 'steps': 46375, 'loss/train': 1.1772557497024536} -11/07/2021 03:47:05 - INFO - __main__ - Step 46377: {'lr': 0.00039704933191236225, 'samples': 8904384, 'steps': 46376, 'loss/train': 1.2849663496017456} -11/07/2021 03:47:05 - INFO - __main__ - Step 46378: {'lr': 0.00039704504022251066, 'samples': 8904576, 'steps': 46377, 'loss/train': 1.5546324253082275} -11/07/2021 03:47:06 - INFO - __main__ - Step 46379: {'lr': 0.00039704074846640277, 'samples': 8904768, 'steps': 46378, 'loss/train': 1.1840581893920898} -11/07/2021 03:47:06 - INFO - __main__ - Step 46380: {'lr': 0.0003970364566440406, 'samples': 8904960, 'steps': 46379, 'loss/train': 1.5081672668457031} -11/07/2021 03:47:07 - INFO - __main__ - Step 46381: {'lr': 0.000397032164755426, 'samples': 8905152, 'steps': 46380, 'loss/train': 1.852556824684143} -11/07/2021 03:47:07 - INFO - __main__ - Step 46382: {'lr': 0.0003970278728005611, 'samples': 8905344, 'steps': 46381, 'loss/train': 1.6030914783477783} -11/07/2021 03:47:08 - INFO - __main__ - Step 46383: {'lr': 0.0003970235807794476, 'samples': 8905536, 'steps': 46382, 'loss/train': 1.5848695039749146} -11/07/2021 03:47:08 - INFO - __main__ - Step 46384: {'lr': 0.00039701928869208757, 'samples': 8905728, 'steps': 46383, 'loss/train': 2.116671323776245} -11/07/2021 03:47:09 - INFO - __main__ - Step 46385: {'lr': 0.0003970149965384829, 'samples': 8905920, 'steps': 46384, 'loss/train': 1.5274428129196167} -11/07/2021 03:47:10 - INFO - __main__ - Step 46386: {'lr': 0.00039701070431863564, 'samples': 8906112, 'steps': 46385, 'loss/train': 1.8301100730895996} -11/07/2021 03:47:10 - INFO - __main__ - Step 46387: {'lr': 0.00039700641203254755, 'samples': 8906304, 'steps': 46386, 'loss/train': 1.2952507734298706} -11/07/2021 03:47:10 - INFO - __main__ - Step 46388: {'lr': 0.0003970021196802206, 'samples': 8906496, 'steps': 46387, 'loss/train': 1.4825998544692993} -11/07/2021 03:47:11 - INFO - __main__ - Step 46389: {'lr': 0.0003969978272616569, 'samples': 8906688, 'steps': 46388, 'loss/train': 1.300925612449646} -11/07/2021 03:47:11 - INFO - __main__ - Step 46390: {'lr': 0.0003969935347768581, 'samples': 8906880, 'steps': 46389, 'loss/train': 1.5207626819610596} -11/07/2021 03:47:12 - INFO - __main__ - Step 46391: {'lr': 0.00039698924222582636, 'samples': 8907072, 'steps': 46390, 'loss/train': 1.572201132774353} -11/07/2021 03:47:12 - INFO - __main__ - Step 46392: {'lr': 0.00039698494960856346, 'samples': 8907264, 'steps': 46391, 'loss/train': 1.227784276008606} -11/07/2021 03:47:13 - INFO - __main__ - Step 46393: {'lr': 0.0003969806569250716, 'samples': 8907456, 'steps': 46392, 'loss/train': 0.8939191102981567} -11/07/2021 03:47:13 - INFO - __main__ - Step 46394: {'lr': 0.0003969763641753523, 'samples': 8907648, 'steps': 46393, 'loss/train': 1.826757788658142} -11/07/2021 03:47:14 - INFO - __main__ - Step 46395: {'lr': 0.00039697207135940785, 'samples': 8907840, 'steps': 46394, 'loss/train': 0.6387439370155334} -11/07/2021 03:47:14 - INFO - __main__ - Step 46396: {'lr': 0.00039696777847724, 'samples': 8908032, 'steps': 46395, 'loss/train': 1.2974773645401} -11/07/2021 03:47:15 - INFO - __main__ - Step 46397: {'lr': 0.00039696348552885075, 'samples': 8908224, 'steps': 46396, 'loss/train': 1.2351579666137695} -11/07/2021 03:47:15 - INFO - __main__ - Step 46398: {'lr': 0.000396959192514242, 'samples': 8908416, 'steps': 46397, 'loss/train': 1.7253797054290771} -11/07/2021 03:47:16 - INFO - __main__ - Step 46399: {'lr': 0.0003969548994334158, 'samples': 8908608, 'steps': 46398, 'loss/train': 1.3931994438171387} -11/07/2021 03:47:16 - INFO - __main__ - Step 46400: {'lr': 0.0003969506062863739, 'samples': 8908800, 'steps': 46399, 'loss/train': 1.0712485313415527} -11/07/2021 03:47:16 - INFO - __main__ - Step 46401: {'lr': 0.0003969463130731183, 'samples': 8908992, 'steps': 46400, 'loss/train': 1.5049532651901245} -11/07/2021 03:47:17 - INFO - __main__ - Step 46402: {'lr': 0.00039694201979365094, 'samples': 8909184, 'steps': 46401, 'loss/train': 1.2959758043289185} -11/07/2021 03:47:18 - INFO - __main__ - Step 46403: {'lr': 0.00039693772644797386, 'samples': 8909376, 'steps': 46402, 'loss/train': 1.4447095394134521} -11/07/2021 03:47:18 - INFO - __main__ - Step 46404: {'lr': 0.0003969334330360889, 'samples': 8909568, 'steps': 46403, 'loss/train': 1.9214714765548706} -11/07/2021 03:47:18 - INFO - __main__ - Step 46405: {'lr': 0.000396929139557998, 'samples': 8909760, 'steps': 46404, 'loss/train': 1.6759204864501953} -11/07/2021 03:47:19 - INFO - __main__ - Step 46406: {'lr': 0.00039692484601370305, 'samples': 8909952, 'steps': 46405, 'loss/train': 1.6240415573120117} -11/07/2021 03:47:20 - INFO - __main__ - Step 46407: {'lr': 0.0003969205524032061, 'samples': 8910144, 'steps': 46406, 'loss/train': 1.2875351905822754} -11/07/2021 03:47:20 - INFO - __main__ - Step 46408: {'lr': 0.00039691625872650895, 'samples': 8910336, 'steps': 46407, 'loss/train': 1.4437205791473389} -11/07/2021 03:47:20 - INFO - __main__ - Step 46409: {'lr': 0.00039691196498361364, 'samples': 8910528, 'steps': 46408, 'loss/train': 1.4613850116729736} -11/07/2021 03:47:21 - INFO - __main__ - Step 46410: {'lr': 0.0003969076711745221, 'samples': 8910720, 'steps': 46409, 'loss/train': 1.6706717014312744} -11/07/2021 03:47:21 - INFO - __main__ - Step 46411: {'lr': 0.00039690337729923617, 'samples': 8910912, 'steps': 46410, 'loss/train': 1.7761319875717163} -11/07/2021 03:47:22 - INFO - __main__ - Step 46412: {'lr': 0.0003968990833577578, 'samples': 8911104, 'steps': 46411, 'loss/train': 1.0088707208633423} -11/07/2021 03:47:23 - INFO - __main__ - Step 46413: {'lr': 0.00039689478935008905, 'samples': 8911296, 'steps': 46412, 'loss/train': 1.9144214391708374} -11/07/2021 03:47:23 - INFO - __main__ - Step 46414: {'lr': 0.00039689049527623176, 'samples': 8911488, 'steps': 46413, 'loss/train': 1.185842752456665} -11/07/2021 03:47:23 - INFO - __main__ - Step 46415: {'lr': 0.0003968862011361879, 'samples': 8911680, 'steps': 46414, 'loss/train': 1.3232680559158325} -11/07/2021 03:47:24 - INFO - __main__ - Step 46416: {'lr': 0.0003968819069299593, 'samples': 8911872, 'steps': 46415, 'loss/train': 1.2034891843795776} -11/07/2021 03:47:25 - INFO - __main__ - Step 46417: {'lr': 0.0003968776126575481, 'samples': 8912064, 'steps': 46416, 'loss/train': 1.278905987739563} -11/07/2021 03:47:25 - INFO - __main__ - Step 46418: {'lr': 0.000396873318318956, 'samples': 8912256, 'steps': 46417, 'loss/train': 1.3681342601776123} -11/07/2021 03:47:25 - INFO - __main__ - Step 46419: {'lr': 0.00039686902391418514, 'samples': 8912448, 'steps': 46418, 'loss/train': 1.267077088356018} -11/07/2021 03:47:26 - INFO - __main__ - Step 46420: {'lr': 0.00039686472944323734, 'samples': 8912640, 'steps': 46419, 'loss/train': 1.7939561605453491} -11/07/2021 03:47:26 - INFO - __main__ - Step 46421: {'lr': 0.0003968604349061145, 'samples': 8912832, 'steps': 46420, 'loss/train': 1.28379487991333} -11/07/2021 03:47:26 - INFO - __main__ - Step 46422: {'lr': 0.0003968561403028187, 'samples': 8913024, 'steps': 46421, 'loss/train': 1.4254707098007202} -11/07/2021 03:47:27 - INFO - __main__ - Step 46423: {'lr': 0.00039685184563335174, 'samples': 8913216, 'steps': 46422, 'loss/train': 1.5502345561981201} -11/07/2021 03:47:28 - INFO - __main__ - Step 46424: {'lr': 0.00039684755089771555, 'samples': 8913408, 'steps': 46423, 'loss/train': 1.2274820804595947} -11/07/2021 03:47:28 - INFO - __main__ - Step 46425: {'lr': 0.0003968432560959122, 'samples': 8913600, 'steps': 46424, 'loss/train': 1.656483769416809} -11/07/2021 03:47:28 - INFO - __main__ - Step 46426: {'lr': 0.00039683896122794354, 'samples': 8913792, 'steps': 46425, 'loss/train': 1.4895061254501343} -11/07/2021 03:47:29 - INFO - __main__ - Step 46427: {'lr': 0.0003968346662938115, 'samples': 8913984, 'steps': 46426, 'loss/train': 1.6468385457992554} -11/07/2021 03:47:30 - INFO - __main__ - Step 46428: {'lr': 0.00039683037129351805, 'samples': 8914176, 'steps': 46427, 'loss/train': 1.4098467826843262} -11/07/2021 03:47:30 - INFO - __main__ - Step 46429: {'lr': 0.000396826076227065, 'samples': 8914368, 'steps': 46428, 'loss/train': 1.276272177696228} -11/07/2021 03:47:31 - INFO - __main__ - Step 46430: {'lr': 0.00039682178109445447, 'samples': 8914560, 'steps': 46429, 'loss/train': 1.4634912014007568} -11/07/2021 03:47:31 - INFO - __main__ - Step 46431: {'lr': 0.0003968174858956883, 'samples': 8914752, 'steps': 46430, 'loss/train': 1.4141737222671509} -11/07/2021 03:47:31 - INFO - __main__ - Step 46432: {'lr': 0.0003968131906307684, 'samples': 8914944, 'steps': 46431, 'loss/train': 1.7467100620269775} -11/07/2021 03:47:32 - INFO - __main__ - Step 46433: {'lr': 0.00039680889529969686, 'samples': 8915136, 'steps': 46432, 'loss/train': 1.4590861797332764} -11/07/2021 03:47:33 - INFO - __main__ - Step 46434: {'lr': 0.0003968045999024754, 'samples': 8915328, 'steps': 46433, 'loss/train': 1.3307888507843018} -11/07/2021 03:47:33 - INFO - __main__ - Step 46435: {'lr': 0.0003968003044391061, 'samples': 8915520, 'steps': 46434, 'loss/train': 1.1671562194824219} -11/07/2021 03:47:33 - INFO - __main__ - Step 46436: {'lr': 0.00039679600890959077, 'samples': 8915712, 'steps': 46435, 'loss/train': 1.6333740949630737} -11/07/2021 03:47:34 - INFO - __main__ - Step 46437: {'lr': 0.0003967917133139315, 'samples': 8915904, 'steps': 46436, 'loss/train': 1.6342260837554932} -11/07/2021 03:47:35 - INFO - __main__ - Step 46438: {'lr': 0.00039678741765213006, 'samples': 8916096, 'steps': 46437, 'loss/train': 1.4422754049301147} -11/07/2021 03:47:35 - INFO - __main__ - Step 46439: {'lr': 0.0003967831219241885, 'samples': 8916288, 'steps': 46438, 'loss/train': 0.8115842938423157} -11/07/2021 03:47:35 - INFO - __main__ - Step 46440: {'lr': 0.00039677882613010885, 'samples': 8916480, 'steps': 46439, 'loss/train': 1.4022616147994995} -11/07/2021 03:47:36 - INFO - __main__ - Step 46441: {'lr': 0.0003967745302698928, 'samples': 8916672, 'steps': 46440, 'loss/train': 1.2536962032318115} -11/07/2021 03:47:36 - INFO - __main__ - Step 46442: {'lr': 0.0003967702343435424, 'samples': 8916864, 'steps': 46441, 'loss/train': 1.6496021747589111} -11/07/2021 03:47:37 - INFO - __main__ - Step 46443: {'lr': 0.00039676593835105966, 'samples': 8917056, 'steps': 46442, 'loss/train': 1.66366446018219} -11/07/2021 03:47:37 - INFO - __main__ - Step 46444: {'lr': 0.0003967616422924465, 'samples': 8917248, 'steps': 46443, 'loss/train': 0.9641647934913635} -11/07/2021 03:47:38 - INFO - __main__ - Step 46445: {'lr': 0.0003967573461677047, 'samples': 8917440, 'steps': 46444, 'loss/train': 1.5705403089523315} -11/07/2021 03:47:38 - INFO - __main__ - Step 46446: {'lr': 0.0003967530499768364, 'samples': 8917632, 'steps': 46445, 'loss/train': 1.5934021472930908} -11/07/2021 03:47:39 - INFO - __main__ - Step 46447: {'lr': 0.00039674875371984336, 'samples': 8917824, 'steps': 46446, 'loss/train': 1.6371523141860962} -11/07/2021 03:47:39 - INFO - __main__ - Step 46448: {'lr': 0.0003967444573967277, 'samples': 8918016, 'steps': 46447, 'loss/train': 1.5475355386734009} -11/07/2021 03:47:40 - INFO - __main__ - Step 46449: {'lr': 0.0003967401610074911, 'samples': 8918208, 'steps': 46448, 'loss/train': 1.378336787223816} -11/07/2021 03:47:40 - INFO - __main__ - Step 46450: {'lr': 0.0003967358645521357, 'samples': 8918400, 'steps': 46449, 'loss/train': 1.6174300909042358} -11/07/2021 03:47:41 - INFO - __main__ - Step 46451: {'lr': 0.00039673156803066346, 'samples': 8918592, 'steps': 46450, 'loss/train': 1.4035089015960693} -11/07/2021 03:47:41 - INFO - __main__ - Step 46452: {'lr': 0.00039672727144307617, 'samples': 8918784, 'steps': 46451, 'loss/train': 1.4450703859329224} -11/07/2021 03:47:41 - INFO - __main__ - Step 46453: {'lr': 0.0003967229747893759, 'samples': 8918976, 'steps': 46452, 'loss/train': 1.6976627111434937} -11/07/2021 03:47:42 - INFO - __main__ - Step 46454: {'lr': 0.0003967186780695645, 'samples': 8919168, 'steps': 46453, 'loss/train': 1.2306568622589111} -11/07/2021 03:47:43 - INFO - __main__ - Step 46455: {'lr': 0.0003967143812836439, 'samples': 8919360, 'steps': 46454, 'loss/train': 1.285661220550537} -11/07/2021 03:47:43 - INFO - __main__ - Step 46456: {'lr': 0.00039671008443161604, 'samples': 8919552, 'steps': 46455, 'loss/train': 1.6329265832901} -11/07/2021 03:47:43 - INFO - __main__ - Step 46457: {'lr': 0.00039670578751348283, 'samples': 8919744, 'steps': 46456, 'loss/train': 1.6372334957122803} -11/07/2021 03:47:44 - INFO - __main__ - Step 46458: {'lr': 0.0003967014905292464, 'samples': 8919936, 'steps': 46457, 'loss/train': 0.9876204133033752} -11/07/2021 03:47:45 - INFO - __main__ - Step 46459: {'lr': 0.0003966971934789084, 'samples': 8920128, 'steps': 46458, 'loss/train': 1.5900052785873413} -11/07/2021 03:47:45 - INFO - __main__ - Step 46460: {'lr': 0.0003966928963624711, 'samples': 8920320, 'steps': 46459, 'loss/train': 1.9930756092071533} -11/07/2021 03:47:46 - INFO - __main__ - Step 46461: {'lr': 0.0003966885991799361, 'samples': 8920512, 'steps': 46460, 'loss/train': 1.638953685760498} -11/07/2021 03:47:46 - INFO - __main__ - Step 46462: {'lr': 0.0003966843019313055, 'samples': 8920704, 'steps': 46461, 'loss/train': 1.3511921167373657} -11/07/2021 03:47:46 - INFO - __main__ - Step 46463: {'lr': 0.00039668000461658126, 'samples': 8920896, 'steps': 46462, 'loss/train': 0.6511127948760986} -11/07/2021 03:47:47 - INFO - __main__ - Step 46464: {'lr': 0.00039667570723576516, 'samples': 8921088, 'steps': 46463, 'loss/train': 0.8745549917221069} -11/07/2021 03:47:48 - INFO - __main__ - Step 46465: {'lr': 0.0003966714097888594, 'samples': 8921280, 'steps': 46464, 'loss/train': 1.5564099550247192} -11/07/2021 03:47:48 - INFO - __main__ - Step 46466: {'lr': 0.0003966671122758657, 'samples': 8921472, 'steps': 46465, 'loss/train': 1.396647334098816} -11/07/2021 03:47:48 - INFO - __main__ - Step 46467: {'lr': 0.00039666281469678604, 'samples': 8921664, 'steps': 46466, 'loss/train': 1.562657356262207} -11/07/2021 03:47:49 - INFO - __main__ - Step 46468: {'lr': 0.0003966585170516224, 'samples': 8921856, 'steps': 46467, 'loss/train': 1.7159804105758667} -11/07/2021 03:47:49 - INFO - __main__ - Step 46469: {'lr': 0.0003966542193403767, 'samples': 8922048, 'steps': 46468, 'loss/train': 1.0989930629730225} -11/07/2021 03:47:50 - INFO - __main__ - Step 46470: {'lr': 0.00039664992156305086, 'samples': 8922240, 'steps': 46469, 'loss/train': 1.3452023267745972} -11/07/2021 03:47:50 - INFO - __main__ - Step 46471: {'lr': 0.00039664562371964683, 'samples': 8922432, 'steps': 46470, 'loss/train': 1.5813894271850586} -11/07/2021 03:47:51 - INFO - __main__ - Step 46472: {'lr': 0.00039664132581016654, 'samples': 8922624, 'steps': 46471, 'loss/train': 1.7242380380630493} -11/07/2021 03:47:51 - INFO - __main__ - Step 46473: {'lr': 0.000396637027834612, 'samples': 8922816, 'steps': 46472, 'loss/train': 1.4563004970550537} -11/07/2021 03:47:51 - INFO - __main__ - Step 46474: {'lr': 0.000396632729792985, 'samples': 8923008, 'steps': 46473, 'loss/train': 1.0452595949172974} -11/07/2021 03:47:52 - INFO - __main__ - Step 46475: {'lr': 0.00039662843168528756, 'samples': 8923200, 'steps': 46474, 'loss/train': 1.0003538131713867} -11/07/2021 03:47:53 - INFO - __main__ - Step 46476: {'lr': 0.0003966241335115216, 'samples': 8923392, 'steps': 46475, 'loss/train': 1.5979691743850708} -11/07/2021 03:47:53 - INFO - __main__ - Step 46477: {'lr': 0.0003966198352716891, 'samples': 8923584, 'steps': 46476, 'loss/train': 1.578640341758728} -11/07/2021 03:47:54 - INFO - __main__ - Step 46478: {'lr': 0.000396615536965792, 'samples': 8923776, 'steps': 46477, 'loss/train': 1.4766262769699097} -11/07/2021 03:47:54 - INFO - __main__ - Step 46479: {'lr': 0.00039661123859383214, 'samples': 8923968, 'steps': 46478, 'loss/train': 1.2574434280395508} -11/07/2021 03:47:55 - INFO - __main__ - Step 46480: {'lr': 0.0003966069401558116, 'samples': 8924160, 'steps': 46479, 'loss/train': 1.872518539428711} -11/07/2021 03:47:55 - INFO - __main__ - Step 46481: {'lr': 0.0003966026416517321, 'samples': 8924352, 'steps': 46480, 'loss/train': 1.8166900873184204} -11/07/2021 03:47:56 - INFO - __main__ - Step 46482: {'lr': 0.0003965983430815958, 'samples': 8924544, 'steps': 46481, 'loss/train': 1.5014415979385376} -11/07/2021 03:47:56 - INFO - __main__ - Step 46483: {'lr': 0.00039659404444540456, 'samples': 8924736, 'steps': 46482, 'loss/train': 1.8454792499542236} -11/07/2021 03:47:57 - INFO - __main__ - Step 46484: {'lr': 0.0003965897457431602, 'samples': 8924928, 'steps': 46483, 'loss/train': 1.2768256664276123} -11/07/2021 03:47:57 - INFO - __main__ - Step 46485: {'lr': 0.00039658544697486486, 'samples': 8925120, 'steps': 46484, 'loss/train': 0.8908268213272095} -11/07/2021 03:47:58 - INFO - __main__ - Step 46486: {'lr': 0.0003965811481405204, 'samples': 8925312, 'steps': 46485, 'loss/train': 1.6718217134475708} -11/07/2021 03:47:58 - INFO - __main__ - Step 46487: {'lr': 0.00039657684924012873, 'samples': 8925504, 'steps': 46486, 'loss/train': 1.548094391822815} -11/07/2021 03:47:59 - INFO - __main__ - Step 46488: {'lr': 0.0003965725502736917, 'samples': 8925696, 'steps': 46487, 'loss/train': 1.6084216833114624} -11/07/2021 03:47:59 - INFO - __main__ - Step 46489: {'lr': 0.0003965682512412114, 'samples': 8925888, 'steps': 46488, 'loss/train': 1.1312930583953857} -11/07/2021 03:47:59 - INFO - __main__ - Step 46490: {'lr': 0.0003965639521426897, 'samples': 8926080, 'steps': 46489, 'loss/train': 1.8306597471237183} -11/07/2021 03:48:00 - INFO - __main__ - Step 46491: {'lr': 0.0003965596529781286, 'samples': 8926272, 'steps': 46490, 'loss/train': 1.3911941051483154} -11/07/2021 03:48:01 - INFO - __main__ - Step 46492: {'lr': 0.0003965553537475299, 'samples': 8926464, 'steps': 46491, 'loss/train': 2.3198862075805664} -11/07/2021 03:48:01 - INFO - __main__ - Step 46493: {'lr': 0.0003965510544508957, 'samples': 8926656, 'steps': 46492, 'loss/train': 1.6831574440002441} -11/07/2021 03:48:01 - INFO - __main__ - Step 46494: {'lr': 0.0003965467550882278, 'samples': 8926848, 'steps': 46493, 'loss/train': 1.5054762363433838} -11/07/2021 03:48:02 - INFO - __main__ - Step 46495: {'lr': 0.0003965424556595282, 'samples': 8927040, 'steps': 46494, 'loss/train': 1.6593341827392578} -11/07/2021 03:48:03 - INFO - __main__ - Step 46496: {'lr': 0.0003965381561647988, 'samples': 8927232, 'steps': 46495, 'loss/train': 1.6570336818695068} -11/07/2021 03:48:03 - INFO - __main__ - Step 46497: {'lr': 0.0003965338566040416, 'samples': 8927424, 'steps': 46496, 'loss/train': 1.7234264612197876} -11/07/2021 03:48:03 - INFO - __main__ - Step 46498: {'lr': 0.0003965295569772585, 'samples': 8927616, 'steps': 46497, 'loss/train': 1.8450464010238647} -11/07/2021 03:48:04 - INFO - __main__ - Step 46499: {'lr': 0.00039652525728445145, 'samples': 8927808, 'steps': 46498, 'loss/train': 1.6731663942337036} -11/07/2021 03:48:04 - INFO - __main__ - Step 46500: {'lr': 0.00039652095752562246, 'samples': 8928000, 'steps': 46499, 'loss/train': 1.2277780771255493} -11/07/2021 03:48:05 - INFO - __main__ - Step 46501: {'lr': 0.00039651665770077326, 'samples': 8928192, 'steps': 46500, 'loss/train': 1.7918261289596558} -11/07/2021 03:48:06 - INFO - __main__ - Step 46502: {'lr': 0.00039651235780990596, 'samples': 8928384, 'steps': 46501, 'loss/train': 1.228326678276062} -11/07/2021 03:48:06 - INFO - __main__ - Step 46503: {'lr': 0.00039650805785302245, 'samples': 8928576, 'steps': 46502, 'loss/train': 1.630692481994629} -11/07/2021 03:48:07 - INFO - __main__ - Step 46504: {'lr': 0.0003965037578301247, 'samples': 8928768, 'steps': 46503, 'loss/train': 1.2357648611068726} -11/07/2021 03:48:07 - INFO - __main__ - Step 46505: {'lr': 0.00039649945774121453, 'samples': 8928960, 'steps': 46504, 'loss/train': 1.0091569423675537} -11/07/2021 03:48:07 - INFO - __main__ - Step 46506: {'lr': 0.0003964951575862941, 'samples': 8929152, 'steps': 46505, 'loss/train': 1.7667460441589355} -11/07/2021 03:48:08 - INFO - __main__ - Step 46507: {'lr': 0.00039649085736536517, 'samples': 8929344, 'steps': 46506, 'loss/train': 0.6111887693405151} -11/07/2021 03:48:09 - INFO - __main__ - Step 46508: {'lr': 0.0003964865570784296, 'samples': 8929536, 'steps': 46507, 'loss/train': 1.2216861248016357} -11/07/2021 03:48:09 - INFO - __main__ - Step 46509: {'lr': 0.00039648225672548953, 'samples': 8929728, 'steps': 46508, 'loss/train': 1.1576570272445679} -11/07/2021 03:48:09 - INFO - __main__ - Step 46510: {'lr': 0.00039647795630654687, 'samples': 8929920, 'steps': 46509, 'loss/train': 1.639652132987976} -11/07/2021 03:48:10 - INFO - __main__ - Step 46511: {'lr': 0.00039647365582160345, 'samples': 8930112, 'steps': 46510, 'loss/train': 1.9230080842971802} -11/07/2021 03:48:12 - INFO - __main__ - Step 46512: {'lr': 0.00039646935527066124, 'samples': 8930304, 'steps': 46511, 'loss/train': 1.6091551780700684} -11/07/2021 03:48:13 - INFO - __main__ - Step 46513: {'lr': 0.00039646505465372223, 'samples': 8930496, 'steps': 46512, 'loss/train': 1.5849133729934692} -11/07/2021 03:48:13 - INFO - __main__ - Step 46514: {'lr': 0.0003964607539707884, 'samples': 8930688, 'steps': 46513, 'loss/train': 3.213456392288208} -11/07/2021 03:48:13 - INFO - __main__ - Step 46515: {'lr': 0.0003964564532218615, 'samples': 8930880, 'steps': 46514, 'loss/train': 3.0650737285614014} -11/07/2021 03:48:14 - INFO - __main__ - Step 46516: {'lr': 0.0003964521524069436, 'samples': 8931072, 'steps': 46515, 'loss/train': 3.095937967300415} -11/07/2021 03:48:14 - INFO - __main__ - Step 46517: {'lr': 0.00039644785152603666, 'samples': 8931264, 'steps': 46516, 'loss/train': 3.1416046619415283} -11/07/2021 03:48:14 - INFO - __main__ - Step 46518: {'lr': 0.0003964435505791425, 'samples': 8931456, 'steps': 46517, 'loss/train': 1.620643973350525} -11/07/2021 03:48:15 - INFO - __main__ - Step 46519: {'lr': 0.0003964392495662632, 'samples': 8931648, 'steps': 46518, 'loss/train': 1.5931931734085083} -11/07/2021 03:48:16 - INFO - __main__ - Step 46520: {'lr': 0.0003964349484874007, 'samples': 8931840, 'steps': 46519, 'loss/train': 1.1818599700927734} -11/07/2021 03:48:16 - INFO - __main__ - Step 46521: {'lr': 0.00039643064734255675, 'samples': 8932032, 'steps': 46520, 'loss/train': 1.839593529701233} -11/07/2021 03:48:16 - INFO - __main__ - Step 46522: {'lr': 0.0003964263461317334, 'samples': 8932224, 'steps': 46521, 'loss/train': 1.2800414562225342} -11/07/2021 03:48:17 - INFO - __main__ - Step 46523: {'lr': 0.0003964220448549327, 'samples': 8932416, 'steps': 46522, 'loss/train': 1.3235206604003906} -11/07/2021 03:48:17 - INFO - __main__ - Step 46524: {'lr': 0.0003964177435121565, 'samples': 8932608, 'steps': 46523, 'loss/train': 1.8287054300308228} -11/07/2021 03:48:18 - INFO - __main__ - Step 46525: {'lr': 0.00039641344210340665, 'samples': 8932800, 'steps': 46524, 'loss/train': 1.641908049583435} -11/07/2021 03:48:18 - INFO - __main__ - Step 46526: {'lr': 0.00039640914062868515, 'samples': 8932992, 'steps': 46525, 'loss/train': 1.56090247631073} -11/07/2021 03:48:19 - INFO - __main__ - Step 46527: {'lr': 0.000396404839087994, 'samples': 8933184, 'steps': 46526, 'loss/train': 0.6343189477920532} -11/07/2021 03:48:19 - INFO - __main__ - Step 46528: {'lr': 0.0003964005374813351, 'samples': 8933376, 'steps': 46527, 'loss/train': 1.3692983388900757} -11/07/2021 03:48:20 - INFO - __main__ - Step 46529: {'lr': 0.0003963962358087103, 'samples': 8933568, 'steps': 46528, 'loss/train': 1.516156554222107} -11/07/2021 03:48:21 - INFO - __main__ - Step 46530: {'lr': 0.00039639193407012166, 'samples': 8933760, 'steps': 46529, 'loss/train': 1.586659550666809} -11/07/2021 03:48:21 - INFO - __main__ - Step 46531: {'lr': 0.00039638763226557106, 'samples': 8933952, 'steps': 46530, 'loss/train': 1.5941252708435059} -11/07/2021 03:48:21 - INFO - __main__ - Step 46532: {'lr': 0.0003963833303950605, 'samples': 8934144, 'steps': 46531, 'loss/train': 1.4129873514175415} -11/07/2021 03:48:22 - INFO - __main__ - Step 46533: {'lr': 0.00039637902845859185, 'samples': 8934336, 'steps': 46532, 'loss/train': 1.332977294921875} -11/07/2021 03:48:22 - INFO - __main__ - Step 46534: {'lr': 0.00039637472645616704, 'samples': 8934528, 'steps': 46533, 'loss/train': 1.740139126777649} -11/07/2021 03:48:23 - INFO - __main__ - Step 46535: {'lr': 0.00039637042438778804, 'samples': 8934720, 'steps': 46534, 'loss/train': 1.2434988021850586} -11/07/2021 03:48:24 - INFO - __main__ - Step 46536: {'lr': 0.0003963661222534568, 'samples': 8934912, 'steps': 46535, 'loss/train': 1.1036967039108276} -11/07/2021 03:48:24 - INFO - __main__ - Step 46537: {'lr': 0.00039636182005317524, 'samples': 8935104, 'steps': 46536, 'loss/train': 1.4403520822525024} -11/07/2021 03:48:24 - INFO - __main__ - Step 46538: {'lr': 0.0003963575177869453, 'samples': 8935296, 'steps': 46537, 'loss/train': 1.4397002458572388} -11/07/2021 03:48:25 - INFO - __main__ - Step 46539: {'lr': 0.00039635321545476894, 'samples': 8935488, 'steps': 46538, 'loss/train': 1.5650548934936523} -11/07/2021 03:48:26 - INFO - __main__ - Step 46540: {'lr': 0.00039634891305664806, 'samples': 8935680, 'steps': 46539, 'loss/train': 2.071367025375366} -11/07/2021 03:48:26 - INFO - __main__ - Step 46541: {'lr': 0.00039634461059258466, 'samples': 8935872, 'steps': 46540, 'loss/train': 1.7746798992156982} -11/07/2021 03:48:26 - INFO - __main__ - Step 46542: {'lr': 0.0003963403080625806, 'samples': 8936064, 'steps': 46541, 'loss/train': 1.6014556884765625} -11/07/2021 03:48:27 - INFO - __main__ - Step 46543: {'lr': 0.00039633600546663784, 'samples': 8936256, 'steps': 46542, 'loss/train': 1.584721326828003} -11/07/2021 03:48:27 - INFO - __main__ - Step 46544: {'lr': 0.00039633170280475833, 'samples': 8936448, 'steps': 46543, 'loss/train': 1.3739217519760132} -11/07/2021 03:48:28 - INFO - __main__ - Step 46545: {'lr': 0.000396327400076944, 'samples': 8936640, 'steps': 46544, 'loss/train': 1.6864553689956665} -11/07/2021 03:48:28 - INFO - __main__ - Step 46546: {'lr': 0.0003963230972831968, 'samples': 8936832, 'steps': 46545, 'loss/train': 1.6099401712417603} -11/07/2021 03:48:29 - INFO - __main__ - Step 46547: {'lr': 0.0003963187944235188, 'samples': 8937024, 'steps': 46546, 'loss/train': 1.7182683944702148} -11/07/2021 03:48:29 - INFO - __main__ - Step 46548: {'lr': 0.00039631449149791164, 'samples': 8937216, 'steps': 46547, 'loss/train': 1.5881284475326538} -11/07/2021 03:48:29 - INFO - __main__ - Step 46549: {'lr': 0.0003963101885063776, 'samples': 8937408, 'steps': 46548, 'loss/train': 1.5946006774902344} -11/07/2021 03:48:31 - INFO - __main__ - Step 46550: {'lr': 0.00039630588544891835, 'samples': 8937600, 'steps': 46549, 'loss/train': 1.1868088245391846} -11/07/2021 03:48:31 - INFO - __main__ - Step 46551: {'lr': 0.0003963015823255359, 'samples': 8937792, 'steps': 46550, 'loss/train': 1.6669026613235474} -11/07/2021 03:48:31 - INFO - __main__ - Step 46552: {'lr': 0.00039629727913623213, 'samples': 8937984, 'steps': 46551, 'loss/train': 1.6167420148849487} -11/07/2021 03:48:32 - INFO - __main__ - Step 46553: {'lr': 0.0003962929758810092, 'samples': 8938176, 'steps': 46552, 'loss/train': 1.8316158056259155} -11/07/2021 03:48:32 - INFO - __main__ - Step 46554: {'lr': 0.00039628867255986887, 'samples': 8938368, 'steps': 46553, 'loss/train': 2.182403087615967} -11/07/2021 03:48:33 - INFO - __main__ - Step 46555: {'lr': 0.0003962843691728132, 'samples': 8938560, 'steps': 46554, 'loss/train': 1.6754432916641235} -11/07/2021 03:48:33 - INFO - __main__ - Step 46556: {'lr': 0.000396280065719844, 'samples': 8938752, 'steps': 46555, 'loss/train': 1.8905868530273438} -11/07/2021 03:48:34 - INFO - __main__ - Step 46557: {'lr': 0.0003962757622009632, 'samples': 8938944, 'steps': 46556, 'loss/train': 1.4807912111282349} -11/07/2021 03:48:34 - INFO - __main__ - Step 46558: {'lr': 0.0003962714586161729, 'samples': 8939136, 'steps': 46557, 'loss/train': 1.1115580797195435} -11/07/2021 03:48:34 - INFO - __main__ - Step 46559: {'lr': 0.0003962671549654748, 'samples': 8939328, 'steps': 46558, 'loss/train': 0.7697739601135254} -11/07/2021 03:48:35 - INFO - __main__ - Step 46560: {'lr': 0.00039626285124887107, 'samples': 8939520, 'steps': 46559, 'loss/train': 1.631230115890503} -11/07/2021 03:48:36 - INFO - __main__ - Step 46561: {'lr': 0.00039625854746636356, 'samples': 8939712, 'steps': 46560, 'loss/train': 1.4189014434814453} -11/07/2021 03:48:36 - INFO - __main__ - Step 46562: {'lr': 0.0003962542436179542, 'samples': 8939904, 'steps': 46561, 'loss/train': 1.2800192832946777} -11/07/2021 03:48:37 - INFO - __main__ - Step 46563: {'lr': 0.0003962499397036449, 'samples': 8940096, 'steps': 46562, 'loss/train': 1.153496503829956} -11/07/2021 03:48:37 - INFO - __main__ - Step 46564: {'lr': 0.0003962456357234377, 'samples': 8940288, 'steps': 46563, 'loss/train': 1.1571232080459595} -11/07/2021 03:48:38 - INFO - __main__ - Step 46565: {'lr': 0.0003962413316773344, 'samples': 8940480, 'steps': 46564, 'loss/train': 1.484740138053894} -11/07/2021 03:48:38 - INFO - __main__ - Step 46566: {'lr': 0.000396237027565337, 'samples': 8940672, 'steps': 46565, 'loss/train': 2.0003304481506348} -11/07/2021 03:48:39 - INFO - __main__ - Step 46567: {'lr': 0.00039623272338744754, 'samples': 8940864, 'steps': 46566, 'loss/train': 1.615573763847351} -11/07/2021 03:48:39 - INFO - __main__ - Step 46568: {'lr': 0.00039622841914366784, 'samples': 8941056, 'steps': 46567, 'loss/train': 1.545198917388916} -11/07/2021 03:48:39 - INFO - __main__ - Step 46569: {'lr': 0.0003962241148339999, 'samples': 8941248, 'steps': 46568, 'loss/train': 1.480456829071045} -11/07/2021 03:48:40 - INFO - __main__ - Step 46570: {'lr': 0.0003962198104584456, 'samples': 8941440, 'steps': 46569, 'loss/train': 1.4060744047164917} -11/07/2021 03:48:41 - INFO - __main__ - Step 46571: {'lr': 0.00039621550601700683, 'samples': 8941632, 'steps': 46570, 'loss/train': 1.5286009311676025} -11/07/2021 03:48:41 - INFO - __main__ - Step 46572: {'lr': 0.0003962112015096857, 'samples': 8941824, 'steps': 46571, 'loss/train': 1.2991770505905151} -11/07/2021 03:48:42 - INFO - __main__ - Step 46573: {'lr': 0.00039620689693648404, 'samples': 8942016, 'steps': 46572, 'loss/train': 0.5695983171463013} -11/07/2021 03:48:42 - INFO - __main__ - Step 46574: {'lr': 0.0003962025922974038, 'samples': 8942208, 'steps': 46573, 'loss/train': 1.6276212930679321} -11/07/2021 03:48:42 - INFO - __main__ - Step 46575: {'lr': 0.00039619828759244693, 'samples': 8942400, 'steps': 46574, 'loss/train': 1.5821086168289185} -11/07/2021 03:48:43 - INFO - __main__ - Step 46576: {'lr': 0.00039619398282161536, 'samples': 8942592, 'steps': 46575, 'loss/train': 1.1809090375900269} -11/07/2021 03:48:44 - INFO - __main__ - Step 46577: {'lr': 0.000396189677984911, 'samples': 8942784, 'steps': 46576, 'loss/train': 1.2262035608291626} -11/07/2021 03:48:44 - INFO - __main__ - Step 46578: {'lr': 0.00039618537308233593, 'samples': 8942976, 'steps': 46577, 'loss/train': 1.1441209316253662} -11/07/2021 03:48:44 - INFO - __main__ - Step 46579: {'lr': 0.00039618106811389187, 'samples': 8943168, 'steps': 46578, 'loss/train': 1.8602534532546997} -11/07/2021 03:48:45 - INFO - __main__ - Step 46580: {'lr': 0.00039617676307958095, 'samples': 8943360, 'steps': 46579, 'loss/train': 1.4358470439910889} -11/07/2021 03:48:46 - INFO - __main__ - Step 46581: {'lr': 0.000396172457979405, 'samples': 8943552, 'steps': 46580, 'loss/train': 0.9704254269599915} -11/07/2021 03:48:46 - INFO - __main__ - Step 46582: {'lr': 0.0003961681528133661, 'samples': 8943744, 'steps': 46581, 'loss/train': 1.5471473932266235} -11/07/2021 03:48:46 - INFO - __main__ - Step 46583: {'lr': 0.00039616384758146594, 'samples': 8943936, 'steps': 46582, 'loss/train': 1.4239884614944458} -11/07/2021 03:48:47 - INFO - __main__ - Step 46584: {'lr': 0.0003961595422837067, 'samples': 8944128, 'steps': 46583, 'loss/train': 1.2873655557632446} -11/07/2021 03:48:47 - INFO - __main__ - Step 46585: {'lr': 0.0003961552369200902, 'samples': 8944320, 'steps': 46584, 'loss/train': 1.6000466346740723} -11/07/2021 03:48:49 - INFO - __main__ - Step 46586: {'lr': 0.0003961509314906184, 'samples': 8944512, 'steps': 46585, 'loss/train': 1.4519565105438232} -11/07/2021 03:48:49 - INFO - __main__ - Step 46587: {'lr': 0.00039614662599529325, 'samples': 8944704, 'steps': 46586, 'loss/train': 1.7165050506591797} -11/07/2021 03:48:49 - INFO - __main__ - Step 46588: {'lr': 0.0003961423204341167, 'samples': 8944896, 'steps': 46587, 'loss/train': 1.883649230003357} -11/07/2021 03:48:50 - INFO - __main__ - Step 46589: {'lr': 0.00039613801480709065, 'samples': 8945088, 'steps': 46588, 'loss/train': 1.7284959554672241} -11/07/2021 03:48:50 - INFO - __main__ - Step 46590: {'lr': 0.00039613370911421706, 'samples': 8945280, 'steps': 46589, 'loss/train': 1.1167792081832886} -11/07/2021 03:48:50 - INFO - __main__ - Step 46591: {'lr': 0.00039612940335549793, 'samples': 8945472, 'steps': 46590, 'loss/train': 1.5884649753570557} -11/07/2021 03:48:51 - INFO - __main__ - Step 46592: {'lr': 0.0003961250975309351, 'samples': 8945664, 'steps': 46591, 'loss/train': 1.5987987518310547} -11/07/2021 03:48:52 - INFO - __main__ - Step 46593: {'lr': 0.0003961207916405305, 'samples': 8945856, 'steps': 46592, 'loss/train': 1.3909083604812622} -11/07/2021 03:48:52 - INFO - __main__ - Step 46594: {'lr': 0.00039611648568428626, 'samples': 8946048, 'steps': 46593, 'loss/train': 1.7174088954925537} -11/07/2021 03:48:52 - INFO - __main__ - Step 46595: {'lr': 0.0003961121796622041, 'samples': 8946240, 'steps': 46594, 'loss/train': 1.463890552520752} -11/07/2021 03:48:53 - INFO - __main__ - Step 46596: {'lr': 0.000396107873574286, 'samples': 8946432, 'steps': 46595, 'loss/train': 1.6015509366989136} -11/07/2021 03:48:54 - INFO - __main__ - Step 46597: {'lr': 0.00039610356742053403, 'samples': 8946624, 'steps': 46596, 'loss/train': 0.988956868648529} -11/07/2021 03:48:54 - INFO - __main__ - Step 46598: {'lr': 0.0003960992612009501, 'samples': 8946816, 'steps': 46597, 'loss/train': 1.4584623575210571} -11/07/2021 03:48:54 - INFO - __main__ - Step 46599: {'lr': 0.0003960949549155359, 'samples': 8947008, 'steps': 46598, 'loss/train': 1.323596715927124} -11/07/2021 03:48:55 - INFO - __main__ - Step 46600: {'lr': 0.0003960906485642938, 'samples': 8947200, 'steps': 46599, 'loss/train': 1.269243597984314} -11/07/2021 03:48:55 - INFO - __main__ - Step 46601: {'lr': 0.0003960863421472254, 'samples': 8947392, 'steps': 46600, 'loss/train': 1.7932299375534058} -11/07/2021 03:48:56 - INFO - __main__ - Step 46602: {'lr': 0.00039608203566433273, 'samples': 8947584, 'steps': 46601, 'loss/train': 1.4171199798583984} -11/07/2021 03:48:57 - INFO - __main__ - Step 46603: {'lr': 0.00039607772911561776, 'samples': 8947776, 'steps': 46602, 'loss/train': 1.5545135736465454} -11/07/2021 03:48:57 - INFO - __main__ - Step 46604: {'lr': 0.00039607342250108234, 'samples': 8947968, 'steps': 46603, 'loss/train': 1.7056605815887451} -11/07/2021 03:48:57 - INFO - __main__ - Step 46605: {'lr': 0.0003960691158207287, 'samples': 8948160, 'steps': 46604, 'loss/train': 1.4816783666610718} -11/07/2021 03:48:58 - INFO - __main__ - Step 46606: {'lr': 0.0003960648090745584, 'samples': 8948352, 'steps': 46605, 'loss/train': 1.4529831409454346} -11/07/2021 03:48:59 - INFO - __main__ - Step 46607: {'lr': 0.00039606050226257354, 'samples': 8948544, 'steps': 46606, 'loss/train': 2.054903030395508} -11/07/2021 03:48:59 - INFO - __main__ - Step 46608: {'lr': 0.00039605619538477617, 'samples': 8948736, 'steps': 46607, 'loss/train': 1.7597931623458862} -11/07/2021 03:49:00 - INFO - __main__ - Step 46609: {'lr': 0.00039605188844116815, 'samples': 8948928, 'steps': 46608, 'loss/train': 1.247678279876709} -11/07/2021 03:49:00 - INFO - __main__ - Step 46610: {'lr': 0.0003960475814317512, 'samples': 8949120, 'steps': 46609, 'loss/train': 2.0703155994415283} -11/07/2021 03:49:00 - INFO - __main__ - Step 46611: {'lr': 0.0003960432743565277, 'samples': 8949312, 'steps': 46610, 'loss/train': 1.2479217052459717} -11/07/2021 03:49:01 - INFO - __main__ - Step 46612: {'lr': 0.00039603896721549924, 'samples': 8949504, 'steps': 46611, 'loss/train': 0.7806252837181091} -11/07/2021 03:49:02 - INFO - __main__ - Step 46613: {'lr': 0.0003960346600086679, 'samples': 8949696, 'steps': 46612, 'loss/train': 1.7482831478118896} -11/07/2021 03:49:02 - INFO - __main__ - Step 46614: {'lr': 0.0003960303527360356, 'samples': 8949888, 'steps': 46613, 'loss/train': 1.7881076335906982} -11/07/2021 03:49:02 - INFO - __main__ - Step 46615: {'lr': 0.00039602604539760425, 'samples': 8950080, 'steps': 46614, 'loss/train': 1.4864344596862793} -11/07/2021 03:49:03 - INFO - __main__ - Step 46616: {'lr': 0.0003960217379933758, 'samples': 8950272, 'steps': 46615, 'loss/train': 0.23502303659915924} -11/07/2021 03:49:03 - INFO - __main__ - Step 46617: {'lr': 0.00039601743052335224, 'samples': 8950464, 'steps': 46616, 'loss/train': 1.6170903444290161} -11/07/2021 03:49:04 - INFO - __main__ - Step 46618: {'lr': 0.00039601312298753554, 'samples': 8950656, 'steps': 46617, 'loss/train': 1.5993255376815796} -11/07/2021 03:49:04 - INFO - __main__ - Step 46619: {'lr': 0.0003960088153859275, 'samples': 8950848, 'steps': 46618, 'loss/train': 1.3210651874542236} -11/07/2021 03:49:05 - INFO - __main__ - Step 46620: {'lr': 0.0003960045077185301, 'samples': 8951040, 'steps': 46619, 'loss/train': 1.428301453590393} -11/07/2021 03:49:05 - INFO - __main__ - Step 46621: {'lr': 0.0003960001999853454, 'samples': 8951232, 'steps': 46620, 'loss/train': 1.6477384567260742} -11/07/2021 03:49:06 - INFO - __main__ - Step 46622: {'lr': 0.00039599589218637535, 'samples': 8951424, 'steps': 46621, 'loss/train': 1.698339581489563} -11/07/2021 03:49:06 - INFO - __main__ - Step 46623: {'lr': 0.00039599158432162163, 'samples': 8951616, 'steps': 46622, 'loss/train': 1.2999848127365112} -11/07/2021 03:49:07 - INFO - __main__ - Step 46624: {'lr': 0.00039598727639108644, 'samples': 8951808, 'steps': 46623, 'loss/train': 1.4000439643859863} -11/07/2021 03:49:07 - INFO - __main__ - Step 46625: {'lr': 0.00039598296839477167, 'samples': 8952000, 'steps': 46624, 'loss/train': 1.7494179010391235} -11/07/2021 03:49:08 - INFO - __main__ - Step 46626: {'lr': 0.00039597866033267917, 'samples': 8952192, 'steps': 46625, 'loss/train': 1.659546136856079} -11/07/2021 03:49:08 - INFO - __main__ - Step 46627: {'lr': 0.00039597435220481094, 'samples': 8952384, 'steps': 46626, 'loss/train': 1.4539217948913574} -11/07/2021 03:49:09 - INFO - __main__ - Step 46628: {'lr': 0.0003959700440111689, 'samples': 8952576, 'steps': 46627, 'loss/train': 1.1460973024368286} -11/07/2021 03:49:10 - INFO - __main__ - Step 46629: {'lr': 0.00039596573575175506, 'samples': 8952768, 'steps': 46628, 'loss/train': 1.5490814447402954} -11/07/2021 03:49:10 - INFO - __main__ - Step 46630: {'lr': 0.00039596142742657125, 'samples': 8952960, 'steps': 46629, 'loss/train': 0.5390429496765137} -11/07/2021 03:49:10 - INFO - __main__ - Step 46631: {'lr': 0.00039595711903561947, 'samples': 8953152, 'steps': 46630, 'loss/train': 1.2273478507995605} -11/07/2021 03:49:11 - INFO - __main__ - Step 46632: {'lr': 0.0003959528105789018, 'samples': 8953344, 'steps': 46631, 'loss/train': 2.5275912284851074} -11/07/2021 03:49:11 - INFO - __main__ - Step 46633: {'lr': 0.00039594850205641985, 'samples': 8953536, 'steps': 46632, 'loss/train': 2.9538755416870117} -11/07/2021 03:49:12 - INFO - __main__ - Step 46634: {'lr': 0.0003959441934681759, 'samples': 8953728, 'steps': 46633, 'loss/train': 1.9540854692459106} -11/07/2021 03:49:12 - INFO - __main__ - Step 46635: {'lr': 0.00039593988481417174, 'samples': 8953920, 'steps': 46634, 'loss/train': 1.362870454788208} -11/07/2021 03:49:13 - INFO - __main__ - Step 46636: {'lr': 0.0003959355760944093, 'samples': 8954112, 'steps': 46635, 'loss/train': 1.3720383644104004} -11/07/2021 03:49:13 - INFO - __main__ - Step 46637: {'lr': 0.0003959312673088905, 'samples': 8954304, 'steps': 46636, 'loss/train': 1.8665322065353394} -11/07/2021 03:49:13 - INFO - __main__ - Step 46638: {'lr': 0.0003959269584576173, 'samples': 8954496, 'steps': 46637, 'loss/train': 1.192275881767273} -11/07/2021 03:49:14 - INFO - __main__ - Step 46639: {'lr': 0.00039592264954059177, 'samples': 8954688, 'steps': 46638, 'loss/train': 1.9641491174697876} -11/07/2021 03:49:15 - INFO - __main__ - Step 46640: {'lr': 0.00039591834055781566, 'samples': 8954880, 'steps': 46639, 'loss/train': 1.2691432237625122} -11/07/2021 03:49:15 - INFO - __main__ - Step 46641: {'lr': 0.0003959140315092911, 'samples': 8955072, 'steps': 46640, 'loss/train': 1.4783892631530762} -11/07/2021 03:49:16 - INFO - __main__ - Step 46642: {'lr': 0.00039590972239501984, 'samples': 8955264, 'steps': 46641, 'loss/train': 1.8274744749069214} -11/07/2021 03:49:16 - INFO - __main__ - Step 46643: {'lr': 0.0003959054132150039, 'samples': 8955456, 'steps': 46642, 'loss/train': 1.2819947004318237} -11/07/2021 03:49:16 - INFO - __main__ - Step 46644: {'lr': 0.00039590110396924526, 'samples': 8955648, 'steps': 46643, 'loss/train': 2.006920337677002} -11/07/2021 03:49:17 - INFO - __main__ - Step 46645: {'lr': 0.0003958967946577459, 'samples': 8955840, 'steps': 46644, 'loss/train': 1.395865797996521} -11/07/2021 03:49:18 - INFO - __main__ - Step 46646: {'lr': 0.0003958924852805076, 'samples': 8956032, 'steps': 46645, 'loss/train': 1.7654708623886108} -11/07/2021 03:49:18 - INFO - __main__ - Step 46647: {'lr': 0.00039588817583753236, 'samples': 8956224, 'steps': 46646, 'loss/train': 1.3263219594955444} -11/07/2021 03:49:18 - INFO - __main__ - Step 46648: {'lr': 0.0003958838663288223, 'samples': 8956416, 'steps': 46647, 'loss/train': 1.6043410301208496} -11/07/2021 03:49:19 - INFO - __main__ - Step 46649: {'lr': 0.00039587955675437917, 'samples': 8956608, 'steps': 46648, 'loss/train': 1.3933658599853516} -11/07/2021 03:49:20 - INFO - __main__ - Step 46650: {'lr': 0.00039587524711420487, 'samples': 8956800, 'steps': 46649, 'loss/train': 1.3795287609100342} -11/07/2021 03:49:20 - INFO - __main__ - Step 46651: {'lr': 0.00039587093740830147, 'samples': 8956992, 'steps': 46650, 'loss/train': 0.8048598766326904} -11/07/2021 03:49:20 - INFO - __main__ - Step 46652: {'lr': 0.0003958666276366709, 'samples': 8957184, 'steps': 46651, 'loss/train': 1.2594974040985107} -11/07/2021 03:49:21 - INFO - __main__ - Step 46653: {'lr': 0.00039586231779931516, 'samples': 8957376, 'steps': 46652, 'loss/train': 0.3006884753704071} -11/07/2021 03:49:21 - INFO - __main__ - Step 46654: {'lr': 0.000395858007896236, 'samples': 8957568, 'steps': 46653, 'loss/train': 1.400397777557373} -11/07/2021 03:49:22 - INFO - __main__ - Step 46655: {'lr': 0.0003958536979274355, 'samples': 8957760, 'steps': 46654, 'loss/train': 1.100865125656128} -11/07/2021 03:49:23 - INFO - __main__ - Step 46656: {'lr': 0.00039584938789291563, 'samples': 8957952, 'steps': 46655, 'loss/train': 1.5183429718017578} -11/07/2021 03:49:23 - INFO - __main__ - Step 46657: {'lr': 0.0003958450777926782, 'samples': 8958144, 'steps': 46656, 'loss/train': 1.4449796676635742} -11/07/2021 03:49:23 - INFO - __main__ - Step 46658: {'lr': 0.00039584076762672526, 'samples': 8958336, 'steps': 46657, 'loss/train': 1.4669604301452637} -11/07/2021 03:49:24 - INFO - __main__ - Step 46659: {'lr': 0.0003958364573950587, 'samples': 8958528, 'steps': 46658, 'loss/train': 1.6107738018035889} -11/07/2021 03:49:25 - INFO - __main__ - Step 46660: {'lr': 0.00039583214709768054, 'samples': 8958720, 'steps': 46659, 'loss/train': 1.4138153791427612} -11/07/2021 03:49:25 - INFO - __main__ - Step 46661: {'lr': 0.0003958278367345926, 'samples': 8958912, 'steps': 46660, 'loss/train': 1.656166911125183} -11/07/2021 03:49:25 - INFO - __main__ - Step 46662: {'lr': 0.00039582352630579697, 'samples': 8959104, 'steps': 46661, 'loss/train': 1.3021039962768555} -11/07/2021 03:49:26 - INFO - __main__ - Step 46663: {'lr': 0.00039581921581129543, 'samples': 8959296, 'steps': 46662, 'loss/train': 1.5526115894317627} -11/07/2021 03:49:26 - INFO - __main__ - Step 46664: {'lr': 0.00039581490525109005, 'samples': 8959488, 'steps': 46663, 'loss/train': 1.0968859195709229} -11/07/2021 03:49:27 - INFO - __main__ - Step 46665: {'lr': 0.00039581059462518266, 'samples': 8959680, 'steps': 46664, 'loss/train': 1.296531081199646} -11/07/2021 03:49:27 - INFO - __main__ - Step 46666: {'lr': 0.00039580628393357534, 'samples': 8959872, 'steps': 46665, 'loss/train': 1.4447951316833496} -11/07/2021 03:49:28 - INFO - __main__ - Step 46667: {'lr': 0.0003958019731762699, 'samples': 8960064, 'steps': 46666, 'loss/train': 1.739152193069458} -11/07/2021 03:49:28 - INFO - __main__ - Step 46668: {'lr': 0.0003957976623532684, 'samples': 8960256, 'steps': 46667, 'loss/train': 1.4870009422302246} -11/07/2021 03:49:29 - INFO - __main__ - Step 46669: {'lr': 0.0003957933514645727, 'samples': 8960448, 'steps': 46668, 'loss/train': 1.5848653316497803} -11/07/2021 03:49:30 - INFO - __main__ - Step 46670: {'lr': 0.00039578904051018474, 'samples': 8960640, 'steps': 46669, 'loss/train': 1.4008269309997559} -11/07/2021 03:49:30 - INFO - __main__ - Step 46671: {'lr': 0.00039578472949010644, 'samples': 8960832, 'steps': 46670, 'loss/train': 1.578660249710083} -11/07/2021 03:49:30 - INFO - __main__ - Step 46672: {'lr': 0.00039578041840433986, 'samples': 8961024, 'steps': 46671, 'loss/train': 1.870067834854126} -11/07/2021 03:49:31 - INFO - __main__ - Step 46673: {'lr': 0.00039577610725288694, 'samples': 8961216, 'steps': 46672, 'loss/train': 1.4752981662750244} -11/07/2021 03:49:31 - INFO - __main__ - Step 46674: {'lr': 0.0003957717960357494, 'samples': 8961408, 'steps': 46673, 'loss/train': 1.3758714199066162} -11/07/2021 03:49:31 - INFO - __main__ - Step 46675: {'lr': 0.0003957674847529295, 'samples': 8961600, 'steps': 46674, 'loss/train': 1.70477294921875} -11/07/2021 03:49:32 - INFO - __main__ - Step 46676: {'lr': 0.00039576317340442893, 'samples': 8961792, 'steps': 46675, 'loss/train': 1.4040971994400024} -11/07/2021 03:49:33 - INFO - __main__ - Step 46677: {'lr': 0.00039575886199024976, 'samples': 8961984, 'steps': 46676, 'loss/train': 1.8378627300262451} -11/07/2021 03:49:33 - INFO - __main__ - Step 46678: {'lr': 0.0003957545505103939, 'samples': 8962176, 'steps': 46677, 'loss/train': 2.1272621154785156} -11/07/2021 03:49:33 - INFO - __main__ - Step 46679: {'lr': 0.0003957502389648632, 'samples': 8962368, 'steps': 46678, 'loss/train': 0.7058058381080627} -11/07/2021 03:49:34 - INFO - __main__ - Step 46680: {'lr': 0.00039574592735365976, 'samples': 8962560, 'steps': 46679, 'loss/train': 1.6294348239898682} -11/07/2021 03:49:35 - INFO - __main__ - Step 46681: {'lr': 0.00039574161567678545, 'samples': 8962752, 'steps': 46680, 'loss/train': 0.8606553673744202} -11/07/2021 03:49:35 - INFO - __main__ - Step 46682: {'lr': 0.00039573730393424226, 'samples': 8962944, 'steps': 46681, 'loss/train': 1.6506311893463135} -11/07/2021 03:49:36 - INFO - __main__ - Step 46683: {'lr': 0.000395732992126032, 'samples': 8963136, 'steps': 46682, 'loss/train': 1.470301866531372} -11/07/2021 03:49:36 - INFO - __main__ - Step 46684: {'lr': 0.00039572868025215677, 'samples': 8963328, 'steps': 46683, 'loss/train': 1.0998947620391846} -11/07/2021 03:49:36 - INFO - __main__ - Step 46685: {'lr': 0.0003957243683126184, 'samples': 8963520, 'steps': 46684, 'loss/train': 1.2275121212005615} -11/07/2021 03:49:37 - INFO - __main__ - Step 46686: {'lr': 0.00039572005630741886, 'samples': 8963712, 'steps': 46685, 'loss/train': 1.9175535440444946} -11/07/2021 03:49:38 - INFO - __main__ - Step 46687: {'lr': 0.00039571574423656017, 'samples': 8963904, 'steps': 46686, 'loss/train': 1.5435117483139038} -11/07/2021 03:49:38 - INFO - __main__ - Step 46688: {'lr': 0.0003957114321000442, 'samples': 8964096, 'steps': 46687, 'loss/train': 1.4155611991882324} -11/07/2021 03:49:38 - INFO - __main__ - Step 46689: {'lr': 0.0003957071198978729, 'samples': 8964288, 'steps': 46688, 'loss/train': 1.3612478971481323} -11/07/2021 03:49:39 - INFO - __main__ - Step 46690: {'lr': 0.00039570280763004823, 'samples': 8964480, 'steps': 46689, 'loss/train': 1.7550060749053955} -11/07/2021 03:49:40 - INFO - __main__ - Step 46691: {'lr': 0.0003956984952965721, 'samples': 8964672, 'steps': 46690, 'loss/train': 1.3893109560012817} -11/07/2021 03:49:40 - INFO - __main__ - Step 46692: {'lr': 0.0003956941828974465, 'samples': 8964864, 'steps': 46691, 'loss/train': 1.536023497581482} -11/07/2021 03:49:40 - INFO - __main__ - Step 46693: {'lr': 0.0003956898704326733, 'samples': 8965056, 'steps': 46692, 'loss/train': 1.3925052881240845} -11/07/2021 03:49:41 - INFO - __main__ - Step 46694: {'lr': 0.00039568555790225456, 'samples': 8965248, 'steps': 46693, 'loss/train': 1.4903935194015503} -11/07/2021 03:49:41 - INFO - __main__ - Step 46695: {'lr': 0.00039568124530619213, 'samples': 8965440, 'steps': 46694, 'loss/train': 1.5666130781173706} -11/07/2021 03:49:41 - INFO - __main__ - Step 46696: {'lr': 0.00039567693264448803, 'samples': 8965632, 'steps': 46695, 'loss/train': 0.9935513138771057} -11/07/2021 03:49:42 - INFO - __main__ - Step 46697: {'lr': 0.00039567261991714406, 'samples': 8965824, 'steps': 46696, 'loss/train': 1.3019336462020874} -11/07/2021 03:49:43 - INFO - __main__ - Step 46698: {'lr': 0.00039566830712416226, 'samples': 8966016, 'steps': 46697, 'loss/train': 1.6125619411468506} -11/07/2021 03:49:43 - INFO - __main__ - Step 46699: {'lr': 0.0003956639942655446, 'samples': 8966208, 'steps': 46698, 'loss/train': 1.5985229015350342} -11/07/2021 03:49:44 - INFO - __main__ - Step 46700: {'lr': 0.000395659681341293, 'samples': 8966400, 'steps': 46699, 'loss/train': 1.6518969535827637} -11/07/2021 03:49:44 - INFO - __main__ - Step 46701: {'lr': 0.00039565536835140934, 'samples': 8966592, 'steps': 46700, 'loss/train': 1.3528852462768555} -11/07/2021 03:49:45 - INFO - __main__ - Step 46702: {'lr': 0.00039565105529589575, 'samples': 8966784, 'steps': 46701, 'loss/train': 1.752949833869934} -11/07/2021 03:49:45 - INFO - __main__ - Step 46703: {'lr': 0.00039564674217475393, 'samples': 8966976, 'steps': 46702, 'loss/train': 2.194688558578491} -11/07/2021 03:49:46 - INFO - __main__ - Step 46704: {'lr': 0.00039564242898798595, 'samples': 8967168, 'steps': 46703, 'loss/train': 1.578883409500122} -11/07/2021 03:49:46 - INFO - __main__ - Step 46705: {'lr': 0.00039563811573559377, 'samples': 8967360, 'steps': 46704, 'loss/train': 1.5374468564987183} -11/07/2021 03:49:46 - INFO - __main__ - Step 46706: {'lr': 0.00039563380241757927, 'samples': 8967552, 'steps': 46705, 'loss/train': 1.447409749031067} -11/07/2021 03:49:47 - INFO - __main__ - Step 46707: {'lr': 0.00039562948903394446, 'samples': 8967744, 'steps': 46706, 'loss/train': 1.3885626792907715} -11/07/2021 03:49:48 - INFO - __main__ - Step 46708: {'lr': 0.00039562517558469124, 'samples': 8967936, 'steps': 46707, 'loss/train': 1.3380175828933716} -11/07/2021 03:49:48 - INFO - __main__ - Step 46709: {'lr': 0.00039562086206982157, 'samples': 8968128, 'steps': 46708, 'loss/train': 1.9125405550003052} -11/07/2021 03:49:48 - INFO - __main__ - Step 46710: {'lr': 0.0003956165484893374, 'samples': 8968320, 'steps': 46709, 'loss/train': 1.4979057312011719} -11/07/2021 03:49:49 - INFO - __main__ - Step 46711: {'lr': 0.0003956122348432406, 'samples': 8968512, 'steps': 46710, 'loss/train': 1.2842931747436523} -11/07/2021 03:49:50 - INFO - __main__ - Step 46712: {'lr': 0.0003956079211315332, 'samples': 8968704, 'steps': 46711, 'loss/train': 1.184146523475647} -11/07/2021 03:49:50 - INFO - __main__ - Step 46713: {'lr': 0.00039560360735421706, 'samples': 8968896, 'steps': 46712, 'loss/train': 1.3897055387496948} -11/07/2021 03:49:51 - INFO - __main__ - Step 46714: {'lr': 0.0003955992935112943, 'samples': 8969088, 'steps': 46713, 'loss/train': 1.3282452821731567} -11/07/2021 03:49:51 - INFO - __main__ - Step 46715: {'lr': 0.00039559497960276667, 'samples': 8969280, 'steps': 46714, 'loss/train': 0.5708993673324585} -11/07/2021 03:49:51 - INFO - __main__ - Step 46716: {'lr': 0.0003955906656286362, 'samples': 8969472, 'steps': 46715, 'loss/train': 1.396579623222351} -11/07/2021 03:49:53 - INFO - __main__ - Step 46717: {'lr': 0.00039558635158890487, 'samples': 8969664, 'steps': 46716, 'loss/train': 1.4984301328659058} -11/07/2021 03:49:53 - INFO - __main__ - Step 46718: {'lr': 0.0003955820374835745, 'samples': 8969856, 'steps': 46717, 'loss/train': 1.558255672454834} -11/07/2021 03:49:53 - INFO - __main__ - Step 46719: {'lr': 0.0003955777233126472, 'samples': 8970048, 'steps': 46718, 'loss/train': 1.1341357231140137} -11/07/2021 03:49:54 - INFO - __main__ - Step 46720: {'lr': 0.00039557340907612473, 'samples': 8970240, 'steps': 46719, 'loss/train': 1.982488989830017} -11/07/2021 03:49:54 - INFO - __main__ - Step 46721: {'lr': 0.00039556909477400914, 'samples': 8970432, 'steps': 46720, 'loss/train': 1.388935923576355} -11/07/2021 03:49:55 - INFO - __main__ - Step 46722: {'lr': 0.00039556478040630246, 'samples': 8970624, 'steps': 46721, 'loss/train': 1.6528886556625366} -11/07/2021 03:49:55 - INFO - __main__ - Step 46723: {'lr': 0.0003955604659730064, 'samples': 8970816, 'steps': 46722, 'loss/train': 1.4015668630599976} -11/07/2021 03:49:56 - INFO - __main__ - Step 46724: {'lr': 0.00039555615147412315, 'samples': 8971008, 'steps': 46723, 'loss/train': 1.8984806537628174} -11/07/2021 03:49:56 - INFO - __main__ - Step 46725: {'lr': 0.00039555183690965454, 'samples': 8971200, 'steps': 46724, 'loss/train': 1.2106280326843262} -11/07/2021 03:49:56 - INFO - __main__ - Step 46726: {'lr': 0.00039554752227960243, 'samples': 8971392, 'steps': 46725, 'loss/train': 1.5564759969711304} -11/07/2021 03:49:57 - INFO - __main__ - Step 46727: {'lr': 0.0003955432075839689, 'samples': 8971584, 'steps': 46726, 'loss/train': 1.1629358530044556} -11/07/2021 03:49:58 - INFO - __main__ - Step 46728: {'lr': 0.00039553889282275585, 'samples': 8971776, 'steps': 46727, 'loss/train': 0.1853945404291153} -11/07/2021 03:49:58 - INFO - __main__ - Step 46729: {'lr': 0.0003955345779959653, 'samples': 8971968, 'steps': 46728, 'loss/train': 0.9729139804840088} -11/07/2021 03:49:59 - INFO - __main__ - Step 46730: {'lr': 0.00039553026310359897, 'samples': 8972160, 'steps': 46729, 'loss/train': 2.072021961212158} -11/07/2021 03:49:59 - INFO - __main__ - Step 46731: {'lr': 0.000395525948145659, 'samples': 8972352, 'steps': 46730, 'loss/train': 1.3280072212219238} -11/07/2021 03:50:00 - INFO - __main__ - Step 46732: {'lr': 0.0003955216331221473, 'samples': 8972544, 'steps': 46731, 'loss/train': 1.6797558069229126} -11/07/2021 03:50:00 - INFO - __main__ - Step 46733: {'lr': 0.00039551731803306577, 'samples': 8972736, 'steps': 46732, 'loss/train': 1.758447527885437} -11/07/2021 03:50:01 - INFO - __main__ - Step 46734: {'lr': 0.0003955130028784165, 'samples': 8972928, 'steps': 46733, 'loss/train': 2.373305559158325} -11/07/2021 03:50:01 - INFO - __main__ - Step 46735: {'lr': 0.0003955086876582012, 'samples': 8973120, 'steps': 46734, 'loss/train': 1.5346252918243408} -11/07/2021 03:50:01 - INFO - __main__ - Step 46736: {'lr': 0.000395504372372422, 'samples': 8973312, 'steps': 46735, 'loss/train': 1.6995505094528198} -11/07/2021 03:50:02 - INFO - __main__ - Step 46737: {'lr': 0.0003955000570210807, 'samples': 8973504, 'steps': 46736, 'loss/train': 1.3359993696212769} -11/07/2021 03:50:03 - INFO - __main__ - Step 46738: {'lr': 0.0003954957416041793, 'samples': 8973696, 'steps': 46737, 'loss/train': 1.7690136432647705} -11/07/2021 03:50:03 - INFO - __main__ - Step 46739: {'lr': 0.0003954914261217198, 'samples': 8973888, 'steps': 46738, 'loss/train': 1.6240804195404053} -11/07/2021 03:50:03 - INFO - __main__ - Step 46740: {'lr': 0.0003954871105737042, 'samples': 8974080, 'steps': 46739, 'loss/train': 1.0496690273284912} -11/07/2021 03:50:04 - INFO - __main__ - Step 46741: {'lr': 0.00039548279496013424, 'samples': 8974272, 'steps': 46740, 'loss/train': 0.8729541301727295} -11/07/2021 03:50:04 - INFO - __main__ - Step 46742: {'lr': 0.000395478479281012, 'samples': 8974464, 'steps': 46741, 'loss/train': 1.4796406030654907} -11/07/2021 03:50:05 - INFO - __main__ - Step 46743: {'lr': 0.00039547416353633946, 'samples': 8974656, 'steps': 46742, 'loss/train': 1.3999308347702026} -11/07/2021 03:50:06 - INFO - __main__ - Step 46744: {'lr': 0.00039546984772611843, 'samples': 8974848, 'steps': 46743, 'loss/train': 1.0811153650283813} -11/07/2021 03:50:06 - INFO - __main__ - Step 46745: {'lr': 0.00039546553185035093, 'samples': 8975040, 'steps': 46744, 'loss/train': 1.0817866325378418} -11/07/2021 03:50:06 - INFO - __main__ - Step 46746: {'lr': 0.00039546121590903897, 'samples': 8975232, 'steps': 46745, 'loss/train': 1.5537179708480835} -11/07/2021 03:50:07 - INFO - __main__ - Step 46747: {'lr': 0.0003954568999021844, 'samples': 8975424, 'steps': 46746, 'loss/train': 1.363145351409912} -11/07/2021 03:50:08 - INFO - __main__ - Step 46748: {'lr': 0.0003954525838297892, 'samples': 8975616, 'steps': 46747, 'loss/train': 1.4305704832077026} -11/07/2021 03:50:08 - INFO - __main__ - Step 46749: {'lr': 0.0003954482676918553, 'samples': 8975808, 'steps': 46748, 'loss/train': 1.5961601734161377} -11/07/2021 03:50:08 - INFO - __main__ - Step 46750: {'lr': 0.00039544395148838465, 'samples': 8976000, 'steps': 46749, 'loss/train': 1.72967529296875} -11/07/2021 03:50:09 - INFO - __main__ - Step 46751: {'lr': 0.0003954396352193792, 'samples': 8976192, 'steps': 46750, 'loss/train': 2.361015796661377} -11/07/2021 03:50:09 - INFO - __main__ - Step 46752: {'lr': 0.000395435318884841, 'samples': 8976384, 'steps': 46751, 'loss/train': 1.7659987211227417} -11/07/2021 03:50:10 - INFO - __main__ - Step 46753: {'lr': 0.0003954310024847717, 'samples': 8976576, 'steps': 46752, 'loss/train': 1.489812970161438} -11/07/2021 03:50:10 - INFO - __main__ - Step 46754: {'lr': 0.00039542668601917353, 'samples': 8976768, 'steps': 46753, 'loss/train': 1.301104187965393} -11/07/2021 03:50:11 - INFO - __main__ - Step 46755: {'lr': 0.0003954223694880483, 'samples': 8976960, 'steps': 46754, 'loss/train': 1.5028026103973389} -11/07/2021 03:50:11 - INFO - __main__ - Step 46756: {'lr': 0.0003954180528913981, 'samples': 8977152, 'steps': 46755, 'loss/train': 1.4305599927902222} -11/07/2021 03:50:11 - INFO - __main__ - Step 46757: {'lr': 0.0003954137362292247, 'samples': 8977344, 'steps': 46756, 'loss/train': 1.4253391027450562} -11/07/2021 03:50:12 - INFO - __main__ - Step 46758: {'lr': 0.0003954094195015301, 'samples': 8977536, 'steps': 46757, 'loss/train': 1.3867909908294678} -11/07/2021 03:50:13 - INFO - __main__ - Step 46759: {'lr': 0.0003954051027083163, 'samples': 8977728, 'steps': 46758, 'loss/train': 1.9530441761016846} -11/07/2021 03:50:13 - INFO - __main__ - Step 46760: {'lr': 0.0003954007858495852, 'samples': 8977920, 'steps': 46759, 'loss/train': 1.2998592853546143} -11/07/2021 03:50:13 - INFO - __main__ - Step 46761: {'lr': 0.00039539646892533867, 'samples': 8978112, 'steps': 46760, 'loss/train': 1.5191389322280884} -11/07/2021 03:50:14 - INFO - __main__ - Step 46762: {'lr': 0.00039539215193557886, 'samples': 8978304, 'steps': 46761, 'loss/train': 1.5478785037994385} -11/07/2021 03:50:14 - INFO - __main__ - Step 46763: {'lr': 0.0003953878348803075, 'samples': 8978496, 'steps': 46762, 'loss/train': 1.9524608850479126} -11/07/2021 03:50:15 - INFO - __main__ - Step 46764: {'lr': 0.0003953835177595266, 'samples': 8978688, 'steps': 46763, 'loss/train': 1.666530966758728} -11/07/2021 03:50:16 - INFO - __main__ - Step 46765: {'lr': 0.0003953792005732382, 'samples': 8978880, 'steps': 46764, 'loss/train': 1.1611963510513306} -11/07/2021 03:50:16 - INFO - __main__ - Step 46766: {'lr': 0.0003953748833214442, 'samples': 8979072, 'steps': 46765, 'loss/train': 1.4376670122146606} -11/07/2021 03:50:16 - INFO - __main__ - Step 46767: {'lr': 0.00039537056600414647, 'samples': 8979264, 'steps': 46766, 'loss/train': 1.1385133266448975} -11/07/2021 03:50:17 - INFO - __main__ - Step 46768: {'lr': 0.00039536624862134695, 'samples': 8979456, 'steps': 46767, 'loss/train': 1.679625391960144} -11/07/2021 03:50:18 - INFO - __main__ - Step 46769: {'lr': 0.00039536193117304774, 'samples': 8979648, 'steps': 46768, 'loss/train': 1.402443766593933} -11/07/2021 03:50:18 - INFO - __main__ - Step 46770: {'lr': 0.0003953576136592507, 'samples': 8979840, 'steps': 46769, 'loss/train': 1.2000861167907715} -11/07/2021 03:50:18 - INFO - __main__ - Step 46771: {'lr': 0.0003953532960799577, 'samples': 8980032, 'steps': 46770, 'loss/train': 1.1951671838760376} -11/07/2021 03:50:19 - INFO - __main__ - Step 46772: {'lr': 0.0003953489784351707, 'samples': 8980224, 'steps': 46771, 'loss/train': 1.7271140813827515} -11/07/2021 03:50:19 - INFO - __main__ - Step 46773: {'lr': 0.0003953446607248918, 'samples': 8980416, 'steps': 46772, 'loss/train': 1.2765376567840576} -11/07/2021 03:50:20 - INFO - __main__ - Step 46774: {'lr': 0.00039534034294912276, 'samples': 8980608, 'steps': 46773, 'loss/train': 1.1294169425964355} -11/07/2021 03:50:20 - INFO - __main__ - Step 46775: {'lr': 0.0003953360251078656, 'samples': 8980800, 'steps': 46774, 'loss/train': 1.6824162006378174} -11/07/2021 03:50:21 - INFO - __main__ - Step 46776: {'lr': 0.0003953317072011224, 'samples': 8980992, 'steps': 46775, 'loss/train': 1.4009029865264893} -11/07/2021 03:50:21 - INFO - __main__ - Step 46777: {'lr': 0.0003953273892288949, 'samples': 8981184, 'steps': 46776, 'loss/train': 0.33751192688941956} -11/07/2021 03:50:21 - INFO - __main__ - Step 46778: {'lr': 0.00039532307119118505, 'samples': 8981376, 'steps': 46777, 'loss/train': 1.763453722000122} -11/07/2021 03:50:23 - INFO - __main__ - Step 46779: {'lr': 0.00039531875308799493, 'samples': 8981568, 'steps': 46778, 'loss/train': 1.458613634109497} -11/07/2021 03:50:23 - INFO - __main__ - Step 46780: {'lr': 0.0003953144349193264, 'samples': 8981760, 'steps': 46779, 'loss/train': 1.495517373085022} -11/07/2021 03:50:23 - INFO - __main__ - Step 46781: {'lr': 0.0003953101166851814, 'samples': 8981952, 'steps': 46780, 'loss/train': 1.5929330587387085} -11/07/2021 03:50:24 - INFO - __main__ - Step 46782: {'lr': 0.0003953057983855619, 'samples': 8982144, 'steps': 46781, 'loss/train': 1.6176116466522217} -11/07/2021 03:50:24 - INFO - __main__ - Step 46783: {'lr': 0.00039530148002046996, 'samples': 8982336, 'steps': 46782, 'loss/train': 1.8476134538650513} -11/07/2021 03:50:25 - INFO - __main__ - Step 46784: {'lr': 0.0003952971615899074, 'samples': 8982528, 'steps': 46783, 'loss/train': 1.4362748861312866} -11/07/2021 03:50:25 - INFO - __main__ - Step 46785: {'lr': 0.00039529284309387607, 'samples': 8982720, 'steps': 46784, 'loss/train': 1.153825283050537} -11/07/2021 03:50:26 - INFO - __main__ - Step 46786: {'lr': 0.0003952885245323781, 'samples': 8982912, 'steps': 46785, 'loss/train': 1.3790760040283203} -11/07/2021 03:50:26 - INFO - __main__ - Step 46787: {'lr': 0.00039528420590541536, 'samples': 8983104, 'steps': 46786, 'loss/train': 1.3740510940551758} -11/07/2021 03:50:26 - INFO - __main__ - Step 46788: {'lr': 0.0003952798872129897, 'samples': 8983296, 'steps': 46787, 'loss/train': 0.6646178960800171} -11/07/2021 03:50:28 - INFO - __main__ - Step 46789: {'lr': 0.00039527556845510336, 'samples': 8983488, 'steps': 46788, 'loss/train': 1.5769122838974} -11/07/2021 03:50:28 - INFO - __main__ - Step 46790: {'lr': 0.00039527124963175796, 'samples': 8983680, 'steps': 46789, 'loss/train': 1.3731993436813354} -11/07/2021 03:50:28 - INFO - __main__ - Step 46791: {'lr': 0.0003952669307429556, 'samples': 8983872, 'steps': 46790, 'loss/train': 2.1312155723571777} -11/07/2021 03:50:29 - INFO - __main__ - Step 46792: {'lr': 0.00039526261178869816, 'samples': 8984064, 'steps': 46791, 'loss/train': 1.5580544471740723} -11/07/2021 03:50:29 - INFO - __main__ - Step 46793: {'lr': 0.0003952582927689877, 'samples': 8984256, 'steps': 46792, 'loss/train': 1.2427005767822266} -11/07/2021 03:50:29 - INFO - __main__ - Step 46794: {'lr': 0.00039525397368382604, 'samples': 8984448, 'steps': 46793, 'loss/train': 1.6376162767410278} -11/07/2021 03:50:30 - INFO - __main__ - Step 46795: {'lr': 0.0003952496545332152, 'samples': 8984640, 'steps': 46794, 'loss/train': 1.7411525249481201} -11/07/2021 03:50:31 - INFO - __main__ - Step 46796: {'lr': 0.00039524533531715714, 'samples': 8984832, 'steps': 46795, 'loss/train': 1.1954646110534668} -11/07/2021 03:50:31 - INFO - __main__ - Step 46797: {'lr': 0.00039524101603565377, 'samples': 8985024, 'steps': 46796, 'loss/train': 1.771838903427124} -11/07/2021 03:50:31 - INFO - __main__ - Step 46798: {'lr': 0.000395236696688707, 'samples': 8985216, 'steps': 46797, 'loss/train': 1.5596638917922974} -11/07/2021 03:50:32 - INFO - __main__ - Step 46799: {'lr': 0.0003952323772763188, 'samples': 8985408, 'steps': 46798, 'loss/train': 1.5280567407608032} -11/07/2021 03:50:33 - INFO - __main__ - Step 46800: {'lr': 0.00039522805779849116, 'samples': 8985600, 'steps': 46799, 'loss/train': 1.419503092765808} -11/07/2021 03:50:33 - INFO - __main__ - Step 46801: {'lr': 0.000395223738255226, 'samples': 8985792, 'steps': 46800, 'loss/train': 1.2403419017791748} -11/07/2021 03:50:33 - INFO - __main__ - Step 46802: {'lr': 0.00039521941864652525, 'samples': 8985984, 'steps': 46801, 'loss/train': 1.4845149517059326} -11/07/2021 03:50:34 - INFO - __main__ - Step 46803: {'lr': 0.0003952150989723909, 'samples': 8986176, 'steps': 46802, 'loss/train': 1.7280097007751465} -11/07/2021 03:50:34 - INFO - __main__ - Step 46804: {'lr': 0.00039521077923282486, 'samples': 8986368, 'steps': 46803, 'loss/train': 1.6100494861602783} -11/07/2021 03:50:35 - INFO - __main__ - Step 46805: {'lr': 0.00039520645942782906, 'samples': 8986560, 'steps': 46804, 'loss/train': 1.4668149948120117} -11/07/2021 03:50:36 - INFO - __main__ - Step 46806: {'lr': 0.00039520213955740555, 'samples': 8986752, 'steps': 46805, 'loss/train': 1.8643771409988403} -11/07/2021 03:50:36 - INFO - __main__ - Step 46807: {'lr': 0.0003951978196215561, 'samples': 8986944, 'steps': 46806, 'loss/train': 2.0712478160858154} -11/07/2021 03:50:36 - INFO - __main__ - Step 46808: {'lr': 0.00039519349962028276, 'samples': 8987136, 'steps': 46807, 'loss/train': 0.9385669231414795} -11/07/2021 03:50:37 - INFO - __main__ - Step 46809: {'lr': 0.0003951891795535875, 'samples': 8987328, 'steps': 46808, 'loss/train': 1.5247825384140015} -11/07/2021 03:50:38 - INFO - __main__ - Step 46810: {'lr': 0.00039518485942147233, 'samples': 8987520, 'steps': 46809, 'loss/train': 1.3851916790008545} -11/07/2021 03:50:38 - INFO - __main__ - Step 46811: {'lr': 0.0003951805392239389, 'samples': 8987712, 'steps': 46810, 'loss/train': 0.7063491940498352} -11/07/2021 03:50:39 - INFO - __main__ - Step 46812: {'lr': 0.00039517621896098954, 'samples': 8987904, 'steps': 46811, 'loss/train': 1.5973904132843018} -11/07/2021 03:50:39 - INFO - __main__ - Step 46813: {'lr': 0.00039517189863262593, 'samples': 8988096, 'steps': 46812, 'loss/train': 1.5485116243362427} -11/07/2021 03:50:39 - INFO - __main__ - Step 46814: {'lr': 0.00039516757823885006, 'samples': 8988288, 'steps': 46813, 'loss/train': 1.8475719690322876} -11/07/2021 03:50:40 - INFO - __main__ - Step 46815: {'lr': 0.000395163257779664, 'samples': 8988480, 'steps': 46814, 'loss/train': 1.8050289154052734} -11/07/2021 03:50:41 - INFO - __main__ - Step 46816: {'lr': 0.00039515893725506956, 'samples': 8988672, 'steps': 46815, 'loss/train': 1.5417001247406006} -11/07/2021 03:50:42 - INFO - __main__ - Step 46817: {'lr': 0.0003951546166650688, 'samples': 8988864, 'steps': 46816, 'loss/train': 4.985804557800293} -11/07/2021 03:50:42 - INFO - __main__ - Step 46818: {'lr': 0.0003951502960096636, 'samples': 8989056, 'steps': 46817, 'loss/train': 5.222023010253906} -11/07/2021 03:50:42 - INFO - __main__ - Step 46819: {'lr': 0.00039514597528885587, 'samples': 8989248, 'steps': 46818, 'loss/train': 1.0148247480392456} -11/07/2021 03:50:43 - INFO - __main__ - Step 46820: {'lr': 0.0003951416545026476, 'samples': 8989440, 'steps': 46819, 'loss/train': 1.453107237815857} -11/07/2021 03:50:43 - INFO - __main__ - Step 46821: {'lr': 0.0003951373336510408, 'samples': 8989632, 'steps': 46820, 'loss/train': 1.2581894397735596} -11/07/2021 03:50:44 - INFO - __main__ - Step 46822: {'lr': 0.00039513301273403733, 'samples': 8989824, 'steps': 46821, 'loss/train': 1.9668676853179932} -11/07/2021 03:50:44 - INFO - __main__ - Step 46823: {'lr': 0.0003951286917516392, 'samples': 8990016, 'steps': 46822, 'loss/train': 1.7566052675247192} -11/07/2021 03:50:45 - INFO - __main__ - Step 46824: {'lr': 0.00039512437070384827, 'samples': 8990208, 'steps': 46823, 'loss/train': 1.5792790651321411} -11/07/2021 03:50:45 - INFO - __main__ - Step 46825: {'lr': 0.00039512004959066653, 'samples': 8990400, 'steps': 46824, 'loss/train': 1.590653419494629} -11/07/2021 03:50:45 - INFO - __main__ - Step 46826: {'lr': 0.00039511572841209597, 'samples': 8990592, 'steps': 46825, 'loss/train': 1.6206929683685303} -11/07/2021 03:50:46 - INFO - __main__ - Step 46827: {'lr': 0.00039511140716813847, 'samples': 8990784, 'steps': 46826, 'loss/train': 1.5135914087295532} -11/07/2021 03:50:47 - INFO - __main__ - Step 46828: {'lr': 0.00039510708585879605, 'samples': 8990976, 'steps': 46827, 'loss/train': 1.8345533609390259} -11/07/2021 03:50:47 - INFO - __main__ - Step 46829: {'lr': 0.00039510276448407054, 'samples': 8991168, 'steps': 46828, 'loss/train': 1.2339359521865845} -11/07/2021 03:50:47 - INFO - __main__ - Step 46830: {'lr': 0.00039509844304396407, 'samples': 8991360, 'steps': 46829, 'loss/train': 0.958311140537262} -11/07/2021 03:50:48 - INFO - __main__ - Step 46831: {'lr': 0.00039509412153847847, 'samples': 8991552, 'steps': 46830, 'loss/train': 1.6364647150039673} -11/07/2021 03:50:48 - INFO - __main__ - Step 46832: {'lr': 0.00039508979996761564, 'samples': 8991744, 'steps': 46831, 'loss/train': 1.422149896621704} -11/07/2021 03:50:49 - INFO - __main__ - Step 46833: {'lr': 0.00039508547833137753, 'samples': 8991936, 'steps': 46832, 'loss/train': 1.893943190574646} -11/07/2021 03:50:50 - INFO - __main__ - Step 46834: {'lr': 0.0003950811566297662, 'samples': 8992128, 'steps': 46833, 'loss/train': 1.193856120109558} -11/07/2021 03:50:50 - INFO - __main__ - Step 46835: {'lr': 0.00039507683486278357, 'samples': 8992320, 'steps': 46834, 'loss/train': 2.5559275150299072} -11/07/2021 03:50:50 - INFO - __main__ - Step 46836: {'lr': 0.00039507251303043156, 'samples': 8992512, 'steps': 46835, 'loss/train': 1.5294876098632812} -11/07/2021 03:50:51 - INFO - __main__ - Step 46837: {'lr': 0.0003950681911327121, 'samples': 8992704, 'steps': 46836, 'loss/train': 1.7873066663742065} -11/07/2021 03:50:52 - INFO - __main__ - Step 46838: {'lr': 0.00039506386916962714, 'samples': 8992896, 'steps': 46837, 'loss/train': 1.2543444633483887} -11/07/2021 03:50:52 - INFO - __main__ - Step 46839: {'lr': 0.0003950595471411786, 'samples': 8993088, 'steps': 46838, 'loss/train': 1.2466020584106445} -11/07/2021 03:50:52 - INFO - __main__ - Step 46840: {'lr': 0.00039505522504736855, 'samples': 8993280, 'steps': 46839, 'loss/train': 1.3969309329986572} -11/07/2021 03:50:53 - INFO - __main__ - Step 46841: {'lr': 0.00039505090288819876, 'samples': 8993472, 'steps': 46840, 'loss/train': 2.016864776611328} -11/07/2021 03:50:53 - INFO - __main__ - Step 46842: {'lr': 0.00039504658066367136, 'samples': 8993664, 'steps': 46841, 'loss/train': 1.4573959112167358} -11/07/2021 03:50:54 - INFO - __main__ - Step 46843: {'lr': 0.0003950422583737882, 'samples': 8993856, 'steps': 46842, 'loss/train': 1.6924041509628296} -11/07/2021 03:50:54 - INFO - __main__ - Step 46844: {'lr': 0.0003950379360185512, 'samples': 8994048, 'steps': 46843, 'loss/train': 1.1295289993286133} -11/07/2021 03:50:55 - INFO - __main__ - Step 46845: {'lr': 0.00039503361359796235, 'samples': 8994240, 'steps': 46844, 'loss/train': 0.9984075427055359} -11/07/2021 03:50:55 - INFO - __main__ - Step 46846: {'lr': 0.00039502929111202357, 'samples': 8994432, 'steps': 46845, 'loss/train': 1.9570423364639282} -11/07/2021 03:50:55 - INFO - __main__ - Step 46847: {'lr': 0.0003950249685607369, 'samples': 8994624, 'steps': 46846, 'loss/train': 1.361639142036438} -11/07/2021 03:50:56 - INFO - __main__ - Step 46848: {'lr': 0.00039502064594410414, 'samples': 8994816, 'steps': 46847, 'loss/train': 1.080751895904541} -11/07/2021 03:50:57 - INFO - __main__ - Step 46849: {'lr': 0.00039501632326212734, 'samples': 8995008, 'steps': 46848, 'loss/train': 1.4507310390472412} -11/07/2021 03:50:57 - INFO - __main__ - Step 46850: {'lr': 0.00039501200051480844, 'samples': 8995200, 'steps': 46849, 'loss/train': 1.6919381618499756} -11/07/2021 03:50:57 - INFO - __main__ - Step 46851: {'lr': 0.0003950076777021494, 'samples': 8995392, 'steps': 46850, 'loss/train': 1.6522619724273682} -11/07/2021 03:50:58 - INFO - __main__ - Step 46852: {'lr': 0.00039500335482415205, 'samples': 8995584, 'steps': 46851, 'loss/train': 1.5006636381149292} -11/07/2021 03:50:58 - INFO - __main__ - Step 46853: {'lr': 0.00039499903188081856, 'samples': 8995776, 'steps': 46852, 'loss/train': 1.6721848249435425} -11/07/2021 03:50:59 - INFO - __main__ - Step 46854: {'lr': 0.0003949947088721506, 'samples': 8995968, 'steps': 46853, 'loss/train': 1.4820759296417236} -11/07/2021 03:51:00 - INFO - __main__ - Step 46855: {'lr': 0.0003949903857981503, 'samples': 8996160, 'steps': 46854, 'loss/train': 1.4208883047103882} -11/07/2021 03:51:00 - INFO - __main__ - Step 46856: {'lr': 0.0003949860626588196, 'samples': 8996352, 'steps': 46855, 'loss/train': 1.5806963443756104} -11/07/2021 03:51:00 - INFO - __main__ - Step 46857: {'lr': 0.0003949817394541604, 'samples': 8996544, 'steps': 46856, 'loss/train': 1.4058988094329834} -11/07/2021 03:51:01 - INFO - __main__ - Step 46858: {'lr': 0.0003949774161841747, 'samples': 8996736, 'steps': 46857, 'loss/train': 2.2320330142974854} -11/07/2021 03:51:02 - INFO - __main__ - Step 46859: {'lr': 0.0003949730928488644, 'samples': 8996928, 'steps': 46858, 'loss/train': 1.3717622756958008} -11/07/2021 03:51:02 - INFO - __main__ - Step 46860: {'lr': 0.0003949687694482314, 'samples': 8997120, 'steps': 46859, 'loss/train': 1.7184524536132812} -11/07/2021 03:51:02 - INFO - __main__ - Step 46861: {'lr': 0.0003949644459822778, 'samples': 8997312, 'steps': 46860, 'loss/train': 1.2574100494384766} -11/07/2021 03:51:03 - INFO - __main__ - Step 46862: {'lr': 0.00039496012245100536, 'samples': 8997504, 'steps': 46861, 'loss/train': 1.7844125032424927} -11/07/2021 03:51:03 - INFO - __main__ - Step 46863: {'lr': 0.0003949557988544162, 'samples': 8997696, 'steps': 46862, 'loss/train': 1.4378299713134766} -11/07/2021 03:51:04 - INFO - __main__ - Step 46864: {'lr': 0.0003949514751925122, 'samples': 8997888, 'steps': 46863, 'loss/train': 1.038225769996643} -11/07/2021 03:51:04 - INFO - __main__ - Step 46865: {'lr': 0.00039494715146529526, 'samples': 8998080, 'steps': 46864, 'loss/train': 1.1390782594680786} -11/07/2021 03:51:05 - INFO - __main__ - Step 46866: {'lr': 0.00039494282767276736, 'samples': 8998272, 'steps': 46865, 'loss/train': 1.4852098226547241} -11/07/2021 03:51:05 - INFO - __main__ - Step 46867: {'lr': 0.0003949385038149305, 'samples': 8998464, 'steps': 46866, 'loss/train': 1.7658873796463013} -11/07/2021 03:51:06 - INFO - __main__ - Step 46868: {'lr': 0.0003949341798917866, 'samples': 8998656, 'steps': 46867, 'loss/train': 0.9245157837867737} -11/07/2021 03:51:07 - INFO - __main__ - Step 46869: {'lr': 0.00039492985590333754, 'samples': 8998848, 'steps': 46868, 'loss/train': 1.5905011892318726} -11/07/2021 03:51:08 - INFO - __main__ - Step 46870: {'lr': 0.00039492553184958533, 'samples': 8999040, 'steps': 46869, 'loss/train': 0.830938458442688} -11/07/2021 03:51:08 - INFO - __main__ - Step 46871: {'lr': 0.00039492120773053195, 'samples': 8999232, 'steps': 46870, 'loss/train': 1.3371855020523071} -11/07/2021 03:51:09 - INFO - __main__ - Step 46872: {'lr': 0.0003949168835461793, 'samples': 8999424, 'steps': 46871, 'loss/train': 1.7193821668624878} -11/07/2021 03:51:09 - INFO - __main__ - Step 46873: {'lr': 0.0003949125592965293, 'samples': 8999616, 'steps': 46872, 'loss/train': 1.5219018459320068} -11/07/2021 03:51:09 - INFO - __main__ - Step 46874: {'lr': 0.000394908234981584, 'samples': 8999808, 'steps': 46873, 'loss/train': 1.4934570789337158} -11/07/2021 03:51:10 - INFO - __main__ - Step 46875: {'lr': 0.00039490391060134525, 'samples': 9000000, 'steps': 46874, 'loss/train': 1.3278827667236328} -11/07/2021 03:51:11 - INFO - __main__ - Step 46876: {'lr': 0.000394899586155815, 'samples': 9000192, 'steps': 46875, 'loss/train': 1.5030622482299805} -11/07/2021 03:51:11 - INFO - __main__ - Step 46877: {'lr': 0.00039489526164499536, 'samples': 9000384, 'steps': 46876, 'loss/train': 1.18563973903656} -11/07/2021 03:51:11 - INFO - __main__ - Step 46878: {'lr': 0.000394890937068888, 'samples': 9000576, 'steps': 46877, 'loss/train': 1.779812216758728} -11/07/2021 03:51:12 - INFO - __main__ - Step 46879: {'lr': 0.00039488661242749506, 'samples': 9000768, 'steps': 46878, 'loss/train': 1.6924418210983276} -11/07/2021 03:51:12 - INFO - __main__ - Step 46880: {'lr': 0.00039488228772081846, 'samples': 9000960, 'steps': 46879, 'loss/train': 0.20111282169818878} -11/07/2021 03:51:13 - INFO - __main__ - Step 46881: {'lr': 0.00039487796294886016, 'samples': 9001152, 'steps': 46880, 'loss/train': 1.9703088998794556} -11/07/2021 03:51:14 - INFO - __main__ - Step 46882: {'lr': 0.0003948736381116221, 'samples': 9001344, 'steps': 46881, 'loss/train': 1.535144329071045} -11/07/2021 03:51:14 - INFO - __main__ - Step 46883: {'lr': 0.0003948693132091061, 'samples': 9001536, 'steps': 46882, 'loss/train': 1.4550069570541382} -11/07/2021 03:51:14 - INFO - __main__ - Step 46884: {'lr': 0.00039486498824131434, 'samples': 9001728, 'steps': 46883, 'loss/train': 1.181460976600647} -11/07/2021 03:51:15 - INFO - __main__ - Step 46885: {'lr': 0.00039486066320824865, 'samples': 9001920, 'steps': 46884, 'loss/train': 0.7617834806442261} -11/07/2021 03:51:16 - INFO - __main__ - Step 46886: {'lr': 0.00039485633810991096, 'samples': 9002112, 'steps': 46885, 'loss/train': 1.6075130701065063} -11/07/2021 03:51:16 - INFO - __main__ - Step 46887: {'lr': 0.0003948520129463032, 'samples': 9002304, 'steps': 46886, 'loss/train': 1.8204573392868042} -11/07/2021 03:51:16 - INFO - __main__ - Step 46888: {'lr': 0.0003948476877174274, 'samples': 9002496, 'steps': 46887, 'loss/train': 1.8663369417190552} -11/07/2021 03:51:17 - INFO - __main__ - Step 46889: {'lr': 0.0003948433624232854, 'samples': 9002688, 'steps': 46888, 'loss/train': 2.045262098312378} -11/07/2021 03:51:17 - INFO - __main__ - Step 46890: {'lr': 0.0003948390370638794, 'samples': 9002880, 'steps': 46889, 'loss/train': 1.6313608884811401} -11/07/2021 03:51:17 - INFO - __main__ - Step 46891: {'lr': 0.000394834711639211, 'samples': 9003072, 'steps': 46890, 'loss/train': 1.6466128826141357} -11/07/2021 03:51:19 - INFO - __main__ - Step 46892: {'lr': 0.00039483038614928235, 'samples': 9003264, 'steps': 46891, 'loss/train': 1.4804253578186035} -11/07/2021 03:51:19 - INFO - __main__ - Step 46893: {'lr': 0.0003948260605940953, 'samples': 9003456, 'steps': 46892, 'loss/train': 1.5738805532455444} -11/07/2021 03:51:19 - INFO - __main__ - Step 46894: {'lr': 0.00039482173497365193, 'samples': 9003648, 'steps': 46893, 'loss/train': 1.5786223411560059} -11/07/2021 03:51:20 - INFO - __main__ - Step 46895: {'lr': 0.0003948174092879541, 'samples': 9003840, 'steps': 46894, 'loss/train': 1.8035955429077148} -11/07/2021 03:51:20 - INFO - __main__ - Step 46896: {'lr': 0.0003948130835370038, 'samples': 9004032, 'steps': 46895, 'loss/train': 1.8617504835128784} -11/07/2021 03:51:21 - INFO - __main__ - Step 46897: {'lr': 0.000394808757720803, 'samples': 9004224, 'steps': 46896, 'loss/train': 0.9014905691146851} -11/07/2021 03:51:21 - INFO - __main__ - Step 46898: {'lr': 0.00039480443183935357, 'samples': 9004416, 'steps': 46897, 'loss/train': 1.4515459537506104} -11/07/2021 03:51:22 - INFO - __main__ - Step 46899: {'lr': 0.0003948001058926575, 'samples': 9004608, 'steps': 46898, 'loss/train': 2.697383403778076} -11/07/2021 03:51:22 - INFO - __main__ - Step 46900: {'lr': 0.0003947957798807167, 'samples': 9004800, 'steps': 46899, 'loss/train': 1.7489532232284546} -11/07/2021 03:51:22 - INFO - __main__ - Step 46901: {'lr': 0.00039479145380353313, 'samples': 9004992, 'steps': 46900, 'loss/train': 1.0459482669830322} -11/07/2021 03:51:24 - INFO - __main__ - Step 46902: {'lr': 0.0003947871276611088, 'samples': 9005184, 'steps': 46901, 'loss/train': 1.5989751815795898} -11/07/2021 03:51:24 - INFO - __main__ - Step 46903: {'lr': 0.0003947828014534457, 'samples': 9005376, 'steps': 46902, 'loss/train': 1.4633909463882446} -11/07/2021 03:51:24 - INFO - __main__ - Step 46904: {'lr': 0.00039477847518054566, 'samples': 9005568, 'steps': 46903, 'loss/train': 1.4922444820404053} -11/07/2021 03:51:25 - INFO - __main__ - Step 46905: {'lr': 0.00039477414884241064, 'samples': 9005760, 'steps': 46904, 'loss/train': 1.4760546684265137} -11/07/2021 03:51:25 - INFO - __main__ - Step 46906: {'lr': 0.0003947698224390426, 'samples': 9005952, 'steps': 46905, 'loss/train': 2.0090863704681396} -11/07/2021 03:51:25 - INFO - __main__ - Step 46907: {'lr': 0.0003947654959704435, 'samples': 9006144, 'steps': 46906, 'loss/train': 1.7975330352783203} -11/07/2021 03:51:26 - INFO - __main__ - Step 46908: {'lr': 0.00039476116943661544, 'samples': 9006336, 'steps': 46907, 'loss/train': 1.886009931564331} -11/07/2021 03:51:27 - INFO - __main__ - Step 46909: {'lr': 0.00039475684283756007, 'samples': 9006528, 'steps': 46908, 'loss/train': 0.6918396949768066} -11/07/2021 03:51:27 - INFO - __main__ - Step 46910: {'lr': 0.0003947525161732797, 'samples': 9006720, 'steps': 46909, 'loss/train': 1.0997514724731445} -11/07/2021 03:51:27 - INFO - __main__ - Step 46911: {'lr': 0.0003947481894437759, 'samples': 9006912, 'steps': 46910, 'loss/train': 1.4464973211288452} -11/07/2021 03:51:28 - INFO - __main__ - Step 46912: {'lr': 0.0003947438626490508, 'samples': 9007104, 'steps': 46911, 'loss/train': 1.5185309648513794} -11/07/2021 03:51:29 - INFO - __main__ - Step 46913: {'lr': 0.0003947395357891064, 'samples': 9007296, 'steps': 46912, 'loss/train': 0.4749510586261749} -11/07/2021 03:51:29 - INFO - __main__ - Step 46914: {'lr': 0.00039473520886394465, 'samples': 9007488, 'steps': 46913, 'loss/train': 1.6673336029052734} -11/07/2021 03:51:29 - INFO - __main__ - Step 46915: {'lr': 0.00039473088187356737, 'samples': 9007680, 'steps': 46914, 'loss/train': 1.1993536949157715} -11/07/2021 03:51:30 - INFO - __main__ - Step 46916: {'lr': 0.0003947265548179766, 'samples': 9007872, 'steps': 46915, 'loss/train': 1.507056474685669} -11/07/2021 03:51:30 - INFO - __main__ - Step 46917: {'lr': 0.00039472222769717434, 'samples': 9008064, 'steps': 46916, 'loss/train': 1.8981199264526367} -11/07/2021 03:51:31 - INFO - __main__ - Step 46918: {'lr': 0.00039471790051116243, 'samples': 9008256, 'steps': 46917, 'loss/train': 1.3224080801010132} -11/07/2021 03:51:32 - INFO - __main__ - Step 46919: {'lr': 0.0003947135732599428, 'samples': 9008448, 'steps': 46918, 'loss/train': 1.5564310550689697} -11/07/2021 03:51:32 - INFO - __main__ - Step 46920: {'lr': 0.0003947092459435176, 'samples': 9008640, 'steps': 46919, 'loss/train': 0.5554118752479553} -11/07/2021 03:51:32 - INFO - __main__ - Step 46921: {'lr': 0.0003947049185618886, 'samples': 9008832, 'steps': 46920, 'loss/train': 0.7767159342765808} -11/07/2021 03:51:33 - INFO - __main__ - Step 46922: {'lr': 0.0003947005911150577, 'samples': 9009024, 'steps': 46921, 'loss/train': 1.5369144678115845} -11/07/2021 03:51:34 - INFO - __main__ - Step 46923: {'lr': 0.0003946962636030271, 'samples': 9009216, 'steps': 46922, 'loss/train': 1.928104281425476} -11/07/2021 03:51:34 - INFO - __main__ - Step 46924: {'lr': 0.00039469193602579856, 'samples': 9009408, 'steps': 46923, 'loss/train': 1.6119428873062134} -11/07/2021 03:51:34 - INFO - __main__ - Step 46925: {'lr': 0.000394687608383374, 'samples': 9009600, 'steps': 46924, 'loss/train': 1.768648386001587} -11/07/2021 03:51:35 - INFO - __main__ - Step 46926: {'lr': 0.0003946832806757554, 'samples': 9009792, 'steps': 46925, 'loss/train': 1.144248127937317} -11/07/2021 03:51:35 - INFO - __main__ - Step 46927: {'lr': 0.00039467895290294484, 'samples': 9009984, 'steps': 46926, 'loss/train': 1.4360101222991943} -11/07/2021 03:51:36 - INFO - __main__ - Step 46928: {'lr': 0.00039467462506494416, 'samples': 9010176, 'steps': 46927, 'loss/train': 1.2297422885894775} -11/07/2021 03:51:37 - INFO - __main__ - Step 46929: {'lr': 0.0003946702971617553, 'samples': 9010368, 'steps': 46928, 'loss/train': 1.675126075744629} -11/07/2021 03:51:37 - INFO - __main__ - Step 46930: {'lr': 0.00039466596919338027, 'samples': 9010560, 'steps': 46929, 'loss/train': 1.154676079750061} -11/07/2021 03:51:37 - INFO - __main__ - Step 46931: {'lr': 0.000394661641159821, 'samples': 9010752, 'steps': 46930, 'loss/train': 1.3921693563461304} -11/07/2021 03:51:38 - INFO - __main__ - Step 46932: {'lr': 0.00039465731306107937, 'samples': 9010944, 'steps': 46931, 'loss/train': 1.4811137914657593} -11/07/2021 03:51:39 - INFO - __main__ - Step 46933: {'lr': 0.0003946529848971574, 'samples': 9011136, 'steps': 46932, 'loss/train': 0.9219220280647278} -11/07/2021 03:51:39 - INFO - __main__ - Step 46934: {'lr': 0.00039464865666805706, 'samples': 9011328, 'steps': 46933, 'loss/train': 1.5291695594787598} -11/07/2021 03:51:39 - INFO - __main__ - Step 46935: {'lr': 0.00039464432837378025, 'samples': 9011520, 'steps': 46934, 'loss/train': 1.7101067304611206} -11/07/2021 03:51:40 - INFO - __main__ - Step 46936: {'lr': 0.0003946400000143289, 'samples': 9011712, 'steps': 46935, 'loss/train': 1.0490752458572388} -11/07/2021 03:51:40 - INFO - __main__ - Step 46937: {'lr': 0.000394635671589705, 'samples': 9011904, 'steps': 46936, 'loss/train': 1.351618766784668} -11/07/2021 03:51:41 - INFO - __main__ - Step 46938: {'lr': 0.0003946313430999106, 'samples': 9012096, 'steps': 46937, 'loss/train': 1.6533046960830688} -11/07/2021 03:51:41 - INFO - __main__ - Step 46939: {'lr': 0.0003946270145449475, 'samples': 9012288, 'steps': 46938, 'loss/train': 1.3199681043624878} -11/07/2021 03:51:42 - INFO - __main__ - Step 46940: {'lr': 0.00039462268592481767, 'samples': 9012480, 'steps': 46939, 'loss/train': 0.9378066062927246} -11/07/2021 03:51:42 - INFO - __main__ - Step 46941: {'lr': 0.00039461835723952313, 'samples': 9012672, 'steps': 46940, 'loss/train': 1.3353723287582397} -11/07/2021 03:51:43 - INFO - __main__ - Step 46942: {'lr': 0.0003946140284890657, 'samples': 9012864, 'steps': 46941, 'loss/train': 1.2372130155563354} -11/07/2021 03:51:44 - INFO - __main__ - Step 46943: {'lr': 0.0003946096996734475, 'samples': 9013056, 'steps': 46942, 'loss/train': 1.3074778318405151} -11/07/2021 03:51:44 - INFO - __main__ - Step 46944: {'lr': 0.00039460537079267035, 'samples': 9013248, 'steps': 46943, 'loss/train': 1.737030267715454} -11/07/2021 03:51:44 - INFO - __main__ - Step 46945: {'lr': 0.00039460104184673627, 'samples': 9013440, 'steps': 46944, 'loss/train': 1.4304100275039673} -11/07/2021 03:51:45 - INFO - __main__ - Step 46946: {'lr': 0.00039459671283564727, 'samples': 9013632, 'steps': 46945, 'loss/train': 1.438733696937561} -11/07/2021 03:51:45 - INFO - __main__ - Step 46947: {'lr': 0.0003945923837594051, 'samples': 9013824, 'steps': 46946, 'loss/train': 1.9903538227081299} -11/07/2021 03:51:46 - INFO - __main__ - Step 46948: {'lr': 0.0003945880546180119, 'samples': 9014016, 'steps': 46947, 'loss/train': 1.6213985681533813} -11/07/2021 03:51:46 - INFO - __main__ - Step 46949: {'lr': 0.00039458372541146955, 'samples': 9014208, 'steps': 46948, 'loss/train': 1.5832176208496094} -11/07/2021 03:51:47 - INFO - __main__ - Step 46950: {'lr': 0.00039457939613978, 'samples': 9014400, 'steps': 46949, 'loss/train': 1.7206088304519653} -11/07/2021 03:51:47 - INFO - __main__ - Step 46951: {'lr': 0.0003945750668029452, 'samples': 9014592, 'steps': 46950, 'loss/train': 1.3618377447128296} -11/07/2021 03:51:47 - INFO - __main__ - Step 46952: {'lr': 0.0003945707374009671, 'samples': 9014784, 'steps': 46951, 'loss/train': 1.8693825006484985} -11/07/2021 03:51:48 - INFO - __main__ - Step 46953: {'lr': 0.0003945664079338477, 'samples': 9014976, 'steps': 46952, 'loss/train': 1.589695930480957} -11/07/2021 03:51:49 - INFO - __main__ - Step 46954: {'lr': 0.0003945620784015888, 'samples': 9015168, 'steps': 46953, 'loss/train': 1.9525930881500244} -11/07/2021 03:51:49 - INFO - __main__ - Step 46955: {'lr': 0.00039455774880419256, 'samples': 9015360, 'steps': 46954, 'loss/train': 1.226714849472046} -11/07/2021 03:51:49 - INFO - __main__ - Step 46956: {'lr': 0.00039455341914166074, 'samples': 9015552, 'steps': 46955, 'loss/train': 0.9247803688049316} -11/07/2021 03:51:50 - INFO - __main__ - Step 46957: {'lr': 0.0003945490894139955, 'samples': 9015744, 'steps': 46956, 'loss/train': 1.0902832746505737} -11/07/2021 03:51:50 - INFO - __main__ - Step 46958: {'lr': 0.0003945447596211986, 'samples': 9015936, 'steps': 46957, 'loss/train': 1.6723014116287231} -11/07/2021 03:51:51 - INFO - __main__ - Step 46959: {'lr': 0.0003945404297632721, 'samples': 9016128, 'steps': 46958, 'loss/train': 1.616858959197998} -11/07/2021 03:51:52 - INFO - __main__ - Step 46960: {'lr': 0.00039453609984021787, 'samples': 9016320, 'steps': 46959, 'loss/train': 1.7943397760391235} -11/07/2021 03:51:52 - INFO - __main__ - Step 46961: {'lr': 0.00039453176985203785, 'samples': 9016512, 'steps': 46960, 'loss/train': 1.3130934238433838} -11/07/2021 03:51:52 - INFO - __main__ - Step 46962: {'lr': 0.0003945274397987342, 'samples': 9016704, 'steps': 46961, 'loss/train': 1.7671287059783936} -11/07/2021 03:51:53 - INFO - __main__ - Step 46963: {'lr': 0.0003945231096803086, 'samples': 9016896, 'steps': 46962, 'loss/train': 1.2953639030456543} -11/07/2021 03:51:54 - INFO - __main__ - Step 46964: {'lr': 0.0003945187794967632, 'samples': 9017088, 'steps': 46963, 'loss/train': 1.5047909021377563} -11/07/2021 03:51:54 - INFO - __main__ - Step 46965: {'lr': 0.00039451444924809976, 'samples': 9017280, 'steps': 46964, 'loss/train': 1.5116136074066162} -11/07/2021 03:51:54 - INFO - __main__ - Step 46966: {'lr': 0.0003945101189343204, 'samples': 9017472, 'steps': 46965, 'loss/train': 1.4135128259658813} -11/07/2021 03:51:55 - INFO - __main__ - Step 46967: {'lr': 0.000394505788555427, 'samples': 9017664, 'steps': 46966, 'loss/train': 1.447141408920288} -11/07/2021 03:51:55 - INFO - __main__ - Step 46968: {'lr': 0.0003945014581114215, 'samples': 9017856, 'steps': 46967, 'loss/train': 1.9308451414108276} -11/07/2021 03:51:56 - INFO - __main__ - Step 46969: {'lr': 0.00039449712760230584, 'samples': 9018048, 'steps': 46968, 'loss/train': 1.1975317001342773} -11/07/2021 03:51:56 - INFO - __main__ - Step 46970: {'lr': 0.0003944927970280821, 'samples': 9018240, 'steps': 46969, 'loss/train': 1.501655101776123} -11/07/2021 03:51:57 - INFO - __main__ - Step 46971: {'lr': 0.00039448846638875213, 'samples': 9018432, 'steps': 46970, 'loss/train': 1.0903911590576172} -11/07/2021 03:51:57 - INFO - __main__ - Step 46972: {'lr': 0.00039448413568431785, 'samples': 9018624, 'steps': 46971, 'loss/train': 1.5875543355941772} -11/07/2021 03:51:57 - INFO - __main__ - Step 46973: {'lr': 0.0003944798049147812, 'samples': 9018816, 'steps': 46972, 'loss/train': 1.8218967914581299} -11/07/2021 03:51:58 - INFO - __main__ - Step 46974: {'lr': 0.00039447547408014426, 'samples': 9019008, 'steps': 46973, 'loss/train': 1.572045087814331} -11/07/2021 03:51:59 - INFO - __main__ - Step 46975: {'lr': 0.00039447114318040885, 'samples': 9019200, 'steps': 46974, 'loss/train': 1.3558261394500732} -11/07/2021 03:51:59 - INFO - __main__ - Step 46976: {'lr': 0.000394466812215577, 'samples': 9019392, 'steps': 46975, 'loss/train': 1.5541266202926636} -11/07/2021 03:51:59 - INFO - __main__ - Step 46977: {'lr': 0.0003944624811856506, 'samples': 9019584, 'steps': 46976, 'loss/train': 1.6195271015167236} -11/07/2021 03:52:00 - INFO - __main__ - Step 46978: {'lr': 0.0003944581500906317, 'samples': 9019776, 'steps': 46977, 'loss/train': 1.519793152809143} -11/07/2021 03:52:01 - INFO - __main__ - Step 46979: {'lr': 0.00039445381893052215, 'samples': 9019968, 'steps': 46978, 'loss/train': 1.248785376548767} -11/07/2021 03:52:01 - INFO - __main__ - Step 46980: {'lr': 0.0003944494877053239, 'samples': 9020160, 'steps': 46979, 'loss/train': 1.2922887802124023} -11/07/2021 03:52:01 - INFO - __main__ - Step 46981: {'lr': 0.00039444515641503896, 'samples': 9020352, 'steps': 46980, 'loss/train': 1.960410237312317} -11/07/2021 03:52:02 - INFO - __main__ - Step 46982: {'lr': 0.00039444082505966926, 'samples': 9020544, 'steps': 46981, 'loss/train': 1.441537857055664} -11/07/2021 03:52:02 - INFO - __main__ - Step 46983: {'lr': 0.0003944364936392168, 'samples': 9020736, 'steps': 46982, 'loss/train': 1.4293638467788696} -11/07/2021 03:52:02 - INFO - __main__ - Step 46984: {'lr': 0.0003944321621536835, 'samples': 9020928, 'steps': 46983, 'loss/train': 1.1249370574951172} -11/07/2021 03:52:04 - INFO - __main__ - Step 46985: {'lr': 0.00039442783060307117, 'samples': 9021120, 'steps': 46984, 'loss/train': 1.44890296459198} -11/07/2021 03:52:04 - INFO - __main__ - Step 46986: {'lr': 0.00039442349898738204, 'samples': 9021312, 'steps': 46985, 'loss/train': 1.7546148300170898} -11/07/2021 03:52:04 - INFO - __main__ - Step 46987: {'lr': 0.0003944191673066178, 'samples': 9021504, 'steps': 46986, 'loss/train': 1.1470195055007935} -11/07/2021 03:52:05 - INFO - __main__ - Step 46988: {'lr': 0.00039441483556078055, 'samples': 9021696, 'steps': 46987, 'loss/train': 1.1848145723342896} -11/07/2021 03:52:05 - INFO - __main__ - Step 46989: {'lr': 0.0003944105037498722, 'samples': 9021888, 'steps': 46988, 'loss/train': 1.8253114223480225} -11/07/2021 03:52:06 - INFO - __main__ - Step 46990: {'lr': 0.0003944061718738947, 'samples': 9022080, 'steps': 46989, 'loss/train': 1.395495891571045} -11/07/2021 03:52:06 - INFO - __main__ - Step 46991: {'lr': 0.00039440183993285006, 'samples': 9022272, 'steps': 46990, 'loss/train': 1.5553473234176636} -11/07/2021 03:52:07 - INFO - __main__ - Step 46992: {'lr': 0.0003943975079267401, 'samples': 9022464, 'steps': 46991, 'loss/train': 1.4578441381454468} -11/07/2021 03:52:07 - INFO - __main__ - Step 46993: {'lr': 0.0003943931758555669, 'samples': 9022656, 'steps': 46992, 'loss/train': 1.4696886539459229} -11/07/2021 03:52:07 - INFO - __main__ - Step 46994: {'lr': 0.0003943888437193324, 'samples': 9022848, 'steps': 46993, 'loss/train': 1.2073811292648315} -11/07/2021 03:52:08 - INFO - __main__ - Step 46995: {'lr': 0.00039438451151803844, 'samples': 9023040, 'steps': 46994, 'loss/train': 1.1929799318313599} -11/07/2021 03:52:09 - INFO - __main__ - Step 46996: {'lr': 0.000394380179251687, 'samples': 9023232, 'steps': 46995, 'loss/train': 1.5996979475021362} -11/07/2021 03:52:09 - INFO - __main__ - Step 46997: {'lr': 0.0003943758469202802, 'samples': 9023424, 'steps': 46996, 'loss/train': 1.0800632238388062} -11/07/2021 03:52:09 - INFO - __main__ - Step 46998: {'lr': 0.0003943715145238198, 'samples': 9023616, 'steps': 46997, 'loss/train': 1.2664647102355957} -11/07/2021 03:52:10 - INFO - __main__ - Step 46999: {'lr': 0.00039436718206230795, 'samples': 9023808, 'steps': 46998, 'loss/train': 1.4994295835494995} -11/07/2021 03:52:11 - INFO - __main__ - Step 47000: {'lr': 0.0003943628495357463, 'samples': 9024000, 'steps': 46999, 'loss/train': 1.680883765220642} -11/07/2021 03:52:11 - INFO - __main__ - Step 47001: {'lr': 0.00039435851694413705, 'samples': 9024192, 'steps': 47000, 'loss/train': 2.1149520874023438} -11/07/2021 03:52:12 - INFO - __main__ - Step 47002: {'lr': 0.00039435418428748206, 'samples': 9024384, 'steps': 47001, 'loss/train': 1.675614833831787} -11/07/2021 03:52:12 - INFO - __main__ - Step 47003: {'lr': 0.00039434985156578333, 'samples': 9024576, 'steps': 47002, 'loss/train': 1.2153077125549316} -11/07/2021 03:52:12 - INFO - __main__ - Step 47004: {'lr': 0.0003943455187790428, 'samples': 9024768, 'steps': 47003, 'loss/train': 1.455561637878418} -11/07/2021 03:52:13 - INFO - __main__ - Step 47005: {'lr': 0.0003943411859272624, 'samples': 9024960, 'steps': 47004, 'loss/train': 1.614766001701355} -11/07/2021 03:52:14 - INFO - __main__ - Step 47006: {'lr': 0.0003943368530104441, 'samples': 9025152, 'steps': 47005, 'loss/train': 1.222779631614685} -11/07/2021 03:52:14 - INFO - __main__ - Step 47007: {'lr': 0.00039433252002858975, 'samples': 9025344, 'steps': 47006, 'loss/train': 1.3408775329589844} -11/07/2021 03:52:14 - INFO - __main__ - Step 47008: {'lr': 0.0003943281869817015, 'samples': 9025536, 'steps': 47007, 'loss/train': 0.7637006640434265} -11/07/2021 03:52:15 - INFO - __main__ - Step 47009: {'lr': 0.0003943238538697811, 'samples': 9025728, 'steps': 47008, 'loss/train': 1.2307101488113403} -11/07/2021 03:52:15 - INFO - __main__ - Step 47010: {'lr': 0.00039431952069283067, 'samples': 9025920, 'steps': 47009, 'loss/train': 1.1147801876068115} -11/07/2021 03:52:16 - INFO - __main__ - Step 47011: {'lr': 0.00039431518745085205, 'samples': 9026112, 'steps': 47010, 'loss/train': 1.3025678396224976} -11/07/2021 03:52:16 - INFO - __main__ - Step 47012: {'lr': 0.00039431085414384727, 'samples': 9026304, 'steps': 47011, 'loss/train': 1.6826845407485962} -11/07/2021 03:52:17 - INFO - __main__ - Step 47013: {'lr': 0.0003943065207718182, 'samples': 9026496, 'steps': 47012, 'loss/train': 1.8111188411712646} -11/07/2021 03:52:17 - INFO - __main__ - Step 47014: {'lr': 0.0003943021873347669, 'samples': 9026688, 'steps': 47013, 'loss/train': 1.3840372562408447} -11/07/2021 03:52:18 - INFO - __main__ - Step 47015: {'lr': 0.00039429785383269524, 'samples': 9026880, 'steps': 47014, 'loss/train': 1.157009482383728} -11/07/2021 03:52:19 - INFO - __main__ - Step 47016: {'lr': 0.00039429352026560516, 'samples': 9027072, 'steps': 47015, 'loss/train': 1.1459460258483887} -11/07/2021 03:52:19 - INFO - __main__ - Step 47017: {'lr': 0.0003942891866334987, 'samples': 9027264, 'steps': 47016, 'loss/train': 1.6639070510864258} -11/07/2021 03:52:19 - INFO - __main__ - Step 47018: {'lr': 0.00039428485293637773, 'samples': 9027456, 'steps': 47017, 'loss/train': 1.348271131515503} -11/07/2021 03:52:20 - INFO - __main__ - Step 47019: {'lr': 0.00039428051917424423, 'samples': 9027648, 'steps': 47018, 'loss/train': 1.3297394514083862} -11/07/2021 03:52:20 - INFO - __main__ - Step 47020: {'lr': 0.0003942761853471002, 'samples': 9027840, 'steps': 47019, 'loss/train': 1.7127476930618286} -11/07/2021 03:52:21 - INFO - __main__ - Step 47021: {'lr': 0.0003942718514549475, 'samples': 9028032, 'steps': 47020, 'loss/train': 1.5943137407302856} -11/07/2021 03:52:21 - INFO - __main__ - Step 47022: {'lr': 0.0003942675174977881, 'samples': 9028224, 'steps': 47021, 'loss/train': 1.2140249013900757} -11/07/2021 03:52:22 - INFO - __main__ - Step 47023: {'lr': 0.000394263183475624, 'samples': 9028416, 'steps': 47022, 'loss/train': 1.5225287675857544} -11/07/2021 03:52:22 - INFO - __main__ - Step 47024: {'lr': 0.0003942588493884571, 'samples': 9028608, 'steps': 47023, 'loss/train': 1.6169816255569458} -11/07/2021 03:52:22 - INFO - __main__ - Step 47025: {'lr': 0.00039425451523628953, 'samples': 9028800, 'steps': 47024, 'loss/train': 1.2692021131515503} -11/07/2021 03:52:23 - INFO - __main__ - Step 47026: {'lr': 0.00039425018101912305, 'samples': 9028992, 'steps': 47025, 'loss/train': 1.7158222198486328} -11/07/2021 03:52:24 - INFO - __main__ - Step 47027: {'lr': 0.00039424584673695956, 'samples': 9029184, 'steps': 47026, 'loss/train': 1.682454228401184} -11/07/2021 03:52:24 - INFO - __main__ - Step 47028: {'lr': 0.0003942415123898012, 'samples': 9029376, 'steps': 47027, 'loss/train': 1.6168550252914429} -11/07/2021 03:52:24 - INFO - __main__ - Step 47029: {'lr': 0.0003942371779776498, 'samples': 9029568, 'steps': 47028, 'loss/train': 1.5480886697769165} -11/07/2021 03:52:25 - INFO - __main__ - Step 47030: {'lr': 0.00039423284350050735, 'samples': 9029760, 'steps': 47029, 'loss/train': 1.8418940305709839} -11/07/2021 03:52:26 - INFO - __main__ - Step 47031: {'lr': 0.0003942285089583759, 'samples': 9029952, 'steps': 47030, 'loss/train': 1.7178999185562134} -11/07/2021 03:52:26 - INFO - __main__ - Step 47032: {'lr': 0.0003942241743512572, 'samples': 9030144, 'steps': 47031, 'loss/train': 1.4074722528457642} -11/07/2021 03:52:26 - INFO - __main__ - Step 47033: {'lr': 0.00039421983967915337, 'samples': 9030336, 'steps': 47032, 'loss/train': 1.7305998802185059} -11/07/2021 03:52:27 - INFO - __main__ - Step 47034: {'lr': 0.00039421550494206625, 'samples': 9030528, 'steps': 47033, 'loss/train': 1.7071924209594727} -11/07/2021 03:52:27 - INFO - __main__ - Step 47035: {'lr': 0.0003942111701399979, 'samples': 9030720, 'steps': 47034, 'loss/train': 1.5228930711746216} -11/07/2021 03:52:28 - INFO - __main__ - Step 47036: {'lr': 0.0003942068352729502, 'samples': 9030912, 'steps': 47035, 'loss/train': 1.6422492265701294} -11/07/2021 03:52:29 - INFO - __main__ - Step 47037: {'lr': 0.0003942025003409252, 'samples': 9031104, 'steps': 47036, 'loss/train': 1.4419137239456177} -11/07/2021 03:52:29 - INFO - __main__ - Step 47038: {'lr': 0.0003941981653439247, 'samples': 9031296, 'steps': 47037, 'loss/train': 1.5991615056991577} -11/07/2021 03:52:29 - INFO - __main__ - Step 47039: {'lr': 0.00039419383028195076, 'samples': 9031488, 'steps': 47038, 'loss/train': 1.3113130331039429} -11/07/2021 03:52:30 - INFO - __main__ - Step 47040: {'lr': 0.00039418949515500524, 'samples': 9031680, 'steps': 47039, 'loss/train': 1.5550031661987305} -11/07/2021 03:52:31 - INFO - __main__ - Step 47041: {'lr': 0.0003941851599630902, 'samples': 9031872, 'steps': 47040, 'loss/train': 1.4652179479599} -11/07/2021 03:52:31 - INFO - __main__ - Step 47042: {'lr': 0.00039418082470620756, 'samples': 9032064, 'steps': 47041, 'loss/train': 1.7316834926605225} -11/07/2021 03:52:32 - INFO - __main__ - Step 47043: {'lr': 0.0003941764893843593, 'samples': 9032256, 'steps': 47042, 'loss/train': 1.5148168802261353} -11/07/2021 03:52:32 - INFO - __main__ - Step 47044: {'lr': 0.0003941721539975473, 'samples': 9032448, 'steps': 47043, 'loss/train': 1.3945996761322021} -11/07/2021 03:52:32 - INFO - __main__ - Step 47045: {'lr': 0.0003941678185457736, 'samples': 9032640, 'steps': 47044, 'loss/train': 1.6497108936309814} -11/07/2021 03:52:33 - INFO - __main__ - Step 47046: {'lr': 0.00039416348302904005, 'samples': 9032832, 'steps': 47045, 'loss/train': 1.4801838397979736} -11/07/2021 03:52:34 - INFO - __main__ - Step 47047: {'lr': 0.0003941591474473487, 'samples': 9033024, 'steps': 47046, 'loss/train': 1.6212077140808105} -11/07/2021 03:52:34 - INFO - __main__ - Step 47048: {'lr': 0.0003941548118007014, 'samples': 9033216, 'steps': 47047, 'loss/train': 1.920916199684143} -11/07/2021 03:52:34 - INFO - __main__ - Step 47049: {'lr': 0.00039415047608910023, 'samples': 9033408, 'steps': 47048, 'loss/train': 1.437896966934204} -11/07/2021 03:52:35 - INFO - __main__ - Step 47050: {'lr': 0.000394146140312547, 'samples': 9033600, 'steps': 47049, 'loss/train': 1.3306047916412354} -11/07/2021 03:52:35 - INFO - __main__ - Step 47051: {'lr': 0.0003941418044710438, 'samples': 9033792, 'steps': 47050, 'loss/train': 1.4316445589065552} -11/07/2021 03:52:36 - INFO - __main__ - Step 47052: {'lr': 0.00039413746856459253, 'samples': 9033984, 'steps': 47051, 'loss/train': 0.7563554644584656} -11/07/2021 03:52:37 - INFO - __main__ - Step 47053: {'lr': 0.0003941331325931952, 'samples': 9034176, 'steps': 47052, 'loss/train': 1.5452617406845093} -11/07/2021 03:52:37 - INFO - __main__ - Step 47054: {'lr': 0.0003941287965568536, 'samples': 9034368, 'steps': 47053, 'loss/train': 1.8800292015075684} -11/07/2021 03:52:37 - INFO - __main__ - Step 47055: {'lr': 0.0003941244604555698, 'samples': 9034560, 'steps': 47054, 'loss/train': 1.7606195211410522} -11/07/2021 03:52:38 - INFO - __main__ - Step 47056: {'lr': 0.0003941201242893457, 'samples': 9034752, 'steps': 47055, 'loss/train': 1.5376604795455933} -11/07/2021 03:52:39 - INFO - __main__ - Step 47057: {'lr': 0.00039411578805818344, 'samples': 9034944, 'steps': 47056, 'loss/train': 1.383442997932434} -11/07/2021 03:52:39 - INFO - __main__ - Step 47058: {'lr': 0.00039411145176208477, 'samples': 9035136, 'steps': 47057, 'loss/train': 1.3758971691131592} -11/07/2021 03:52:39 - INFO - __main__ - Step 47059: {'lr': 0.0003941071154010517, 'samples': 9035328, 'steps': 47058, 'loss/train': 1.4077143669128418} -11/07/2021 03:52:40 - INFO - __main__ - Step 47060: {'lr': 0.00039410277897508617, 'samples': 9035520, 'steps': 47059, 'loss/train': 1.337977647781372} -11/07/2021 03:52:40 - INFO - __main__ - Step 47061: {'lr': 0.00039409844248419014, 'samples': 9035712, 'steps': 47060, 'loss/train': 1.5199073553085327} -11/07/2021 03:52:41 - INFO - __main__ - Step 47062: {'lr': 0.0003940941059283656, 'samples': 9035904, 'steps': 47061, 'loss/train': 1.421905517578125} -11/07/2021 03:52:41 - INFO - __main__ - Step 47063: {'lr': 0.00039408976930761444, 'samples': 9036096, 'steps': 47062, 'loss/train': 1.5089776515960693} -11/07/2021 03:52:42 - INFO - __main__ - Step 47064: {'lr': 0.00039408543262193867, 'samples': 9036288, 'steps': 47063, 'loss/train': 1.375567078590393} -11/07/2021 03:52:42 - INFO - __main__ - Step 47065: {'lr': 0.00039408109587134034, 'samples': 9036480, 'steps': 47064, 'loss/train': 0.798215925693512} -11/07/2021 03:52:42 - INFO - __main__ - Step 47066: {'lr': 0.00039407675905582117, 'samples': 9036672, 'steps': 47065, 'loss/train': 1.7782467603683472} -11/07/2021 03:52:44 - INFO - __main__ - Step 47067: {'lr': 0.00039407242217538317, 'samples': 9036864, 'steps': 47066, 'loss/train': 1.2912510633468628} -11/07/2021 03:52:44 - INFO - __main__ - Step 47068: {'lr': 0.0003940680852300285, 'samples': 9037056, 'steps': 47067, 'loss/train': 1.5498754978179932} -11/07/2021 03:52:44 - INFO - __main__ - Step 47069: {'lr': 0.00039406374821975893, 'samples': 9037248, 'steps': 47068, 'loss/train': 1.6175334453582764} -11/07/2021 03:52:45 - INFO - __main__ - Step 47070: {'lr': 0.00039405941114457644, 'samples': 9037440, 'steps': 47069, 'loss/train': 1.3006986379623413} -11/07/2021 03:52:45 - INFO - __main__ - Step 47071: {'lr': 0.000394055074004483, 'samples': 9037632, 'steps': 47070, 'loss/train': 1.5169404745101929} -11/07/2021 03:52:46 - INFO - __main__ - Step 47072: {'lr': 0.0003940507367994806, 'samples': 9037824, 'steps': 47071, 'loss/train': 0.5934475660324097} -11/07/2021 03:52:46 - INFO - __main__ - Step 47073: {'lr': 0.00039404639952957116, 'samples': 9038016, 'steps': 47072, 'loss/train': 1.216092586517334} -11/07/2021 03:52:47 - INFO - __main__ - Step 47074: {'lr': 0.00039404206219475655, 'samples': 9038208, 'steps': 47073, 'loss/train': 1.2290641069412231} -11/07/2021 03:52:47 - INFO - __main__ - Step 47075: {'lr': 0.00039403772479503895, 'samples': 9038400, 'steps': 47074, 'loss/train': 1.8244417905807495} -11/07/2021 03:52:47 - INFO - __main__ - Step 47076: {'lr': 0.0003940333873304201, 'samples': 9038592, 'steps': 47075, 'loss/train': 0.9801872968673706} -11/07/2021 03:52:49 - INFO - __main__ - Step 47077: {'lr': 0.000394029049800902, 'samples': 9038784, 'steps': 47076, 'loss/train': 1.3451482057571411} -11/07/2021 03:52:49 - INFO - __main__ - Step 47078: {'lr': 0.00039402471220648675, 'samples': 9038976, 'steps': 47077, 'loss/train': 1.9589600563049316} -11/07/2021 03:52:49 - INFO - __main__ - Step 47079: {'lr': 0.000394020374547176, 'samples': 9039168, 'steps': 47078, 'loss/train': 1.6597225666046143} -11/07/2021 03:52:50 - INFO - __main__ - Step 47080: {'lr': 0.00039401603682297204, 'samples': 9039360, 'steps': 47079, 'loss/train': 1.3895072937011719} -11/07/2021 03:52:50 - INFO - __main__ - Step 47081: {'lr': 0.0003940116990338766, 'samples': 9039552, 'steps': 47080, 'loss/train': 2.7593445777893066} -11/07/2021 03:52:50 - INFO - __main__ - Step 47082: {'lr': 0.00039400736117989175, 'samples': 9039744, 'steps': 47081, 'loss/train': 1.3985692262649536} -11/07/2021 03:52:51 - INFO - __main__ - Step 47083: {'lr': 0.0003940030232610194, 'samples': 9039936, 'steps': 47082, 'loss/train': 1.3660260438919067} -11/07/2021 03:52:52 - INFO - __main__ - Step 47084: {'lr': 0.0003939986852772615, 'samples': 9040128, 'steps': 47083, 'loss/train': 1.7843916416168213} -11/07/2021 03:52:52 - INFO - __main__ - Step 47085: {'lr': 0.00039399434722862004, 'samples': 9040320, 'steps': 47084, 'loss/train': 1.2024017572402954} -11/07/2021 03:52:53 - INFO - __main__ - Step 47086: {'lr': 0.00039399000911509685, 'samples': 9040512, 'steps': 47085, 'loss/train': 1.2676604986190796} -11/07/2021 03:52:53 - INFO - __main__ - Step 47087: {'lr': 0.00039398567093669413, 'samples': 9040704, 'steps': 47086, 'loss/train': 1.5416532754898071} -11/07/2021 03:52:54 - INFO - __main__ - Step 47088: {'lr': 0.00039398133269341357, 'samples': 9040896, 'steps': 47087, 'loss/train': 1.261775016784668} -11/07/2021 03:52:54 - INFO - __main__ - Step 47089: {'lr': 0.0003939769943852573, 'samples': 9041088, 'steps': 47088, 'loss/train': 1.8220853805541992} -11/07/2021 03:52:55 - INFO - __main__ - Step 47090: {'lr': 0.0003939726560122272, 'samples': 9041280, 'steps': 47089, 'loss/train': 0.8334203362464905} -11/07/2021 03:52:55 - INFO - __main__ - Step 47091: {'lr': 0.00039396831757432526, 'samples': 9041472, 'steps': 47090, 'loss/train': 1.4785126447677612} -11/07/2021 03:52:55 - INFO - __main__ - Step 47092: {'lr': 0.0003939639790715535, 'samples': 9041664, 'steps': 47091, 'loss/train': 1.4800597429275513} -11/07/2021 03:52:56 - INFO - __main__ - Step 47093: {'lr': 0.0003939596405039136, 'samples': 9041856, 'steps': 47092, 'loss/train': 1.4908806085586548} -11/07/2021 03:52:57 - INFO - __main__ - Step 47094: {'lr': 0.00039395530187140784, 'samples': 9042048, 'steps': 47093, 'loss/train': 1.5633057355880737} -11/07/2021 03:52:57 - INFO - __main__ - Step 47095: {'lr': 0.000393950963174038, 'samples': 9042240, 'steps': 47094, 'loss/train': 1.6771138906478882} -11/07/2021 03:52:57 - INFO - __main__ - Step 47096: {'lr': 0.00039394662441180606, 'samples': 9042432, 'steps': 47095, 'loss/train': 1.8062840700149536} -11/07/2021 03:52:58 - INFO - __main__ - Step 47097: {'lr': 0.000393942285584714, 'samples': 9042624, 'steps': 47096, 'loss/train': 1.3849742412567139} -11/07/2021 03:52:58 - INFO - __main__ - Step 47098: {'lr': 0.00039393794669276386, 'samples': 9042816, 'steps': 47097, 'loss/train': 1.4430208206176758} -11/07/2021 03:52:59 - INFO - __main__ - Step 47099: {'lr': 0.00039393360773595744, 'samples': 9043008, 'steps': 47098, 'loss/train': 1.518402099609375} -11/07/2021 03:52:59 - INFO - __main__ - Step 47100: {'lr': 0.0003939292687142967, 'samples': 9043200, 'steps': 47099, 'loss/train': 1.5874766111373901} -11/07/2021 03:53:00 - INFO - __main__ - Step 47101: {'lr': 0.0003939249296277837, 'samples': 9043392, 'steps': 47100, 'loss/train': 1.4214836359024048} -11/07/2021 03:53:00 - INFO - __main__ - Step 47102: {'lr': 0.0003939205904764204, 'samples': 9043584, 'steps': 47101, 'loss/train': 1.459752082824707} -11/07/2021 03:53:01 - INFO - __main__ - Step 47103: {'lr': 0.00039391625126020856, 'samples': 9043776, 'steps': 47102, 'loss/train': 1.505184292793274} -11/07/2021 03:53:02 - INFO - __main__ - Step 47104: {'lr': 0.0003939119119791504, 'samples': 9043968, 'steps': 47103, 'loss/train': 1.4024347066879272} -11/07/2021 03:53:02 - INFO - __main__ - Step 47105: {'lr': 0.0003939075726332477, 'samples': 9044160, 'steps': 47104, 'loss/train': 1.4824903011322021} -11/07/2021 03:53:02 - INFO - __main__ - Step 47106: {'lr': 0.00039390323322250253, 'samples': 9044352, 'steps': 47105, 'loss/train': 0.8480738997459412} -11/07/2021 03:53:03 - INFO - __main__ - Step 47107: {'lr': 0.0003938988937469168, 'samples': 9044544, 'steps': 47106, 'loss/train': 1.2670586109161377} -11/07/2021 03:53:03 - INFO - __main__ - Step 47108: {'lr': 0.0003938945542064923, 'samples': 9044736, 'steps': 47107, 'loss/train': 1.4854414463043213} -11/07/2021 03:53:04 - INFO - __main__ - Step 47109: {'lr': 0.00039389021460123125, 'samples': 9044928, 'steps': 47108, 'loss/train': 1.1902029514312744} -11/07/2021 03:53:04 - INFO - __main__ - Step 47110: {'lr': 0.0003938858749311355, 'samples': 9045120, 'steps': 47109, 'loss/train': 1.9038214683532715} -11/07/2021 03:53:05 - INFO - __main__ - Step 47111: {'lr': 0.00039388153519620696, 'samples': 9045312, 'steps': 47110, 'loss/train': 1.5505082607269287} -11/07/2021 03:53:05 - INFO - __main__ - Step 47112: {'lr': 0.0003938771953964476, 'samples': 9045504, 'steps': 47111, 'loss/train': 1.3920332193374634} -11/07/2021 03:53:05 - INFO - __main__ - Step 47113: {'lr': 0.0003938728555318594, 'samples': 9045696, 'steps': 47112, 'loss/train': 2.713216543197632} -11/07/2021 03:53:06 - INFO - __main__ - Step 47114: {'lr': 0.00039386851560244433, 'samples': 9045888, 'steps': 47113, 'loss/train': 1.6680505275726318} -11/07/2021 03:53:07 - INFO - __main__ - Step 47115: {'lr': 0.0003938641756082043, 'samples': 9046080, 'steps': 47114, 'loss/train': 1.3867429494857788} -11/07/2021 03:53:07 - INFO - __main__ - Step 47116: {'lr': 0.00039385983554914136, 'samples': 9046272, 'steps': 47115, 'loss/train': 1.3547860383987427} -11/07/2021 03:53:08 - INFO - __main__ - Step 47117: {'lr': 0.0003938554954252573, 'samples': 9046464, 'steps': 47116, 'loss/train': 1.5629254579544067} -11/07/2021 03:53:08 - INFO - __main__ - Step 47118: {'lr': 0.00039385115523655426, 'samples': 9046656, 'steps': 47117, 'loss/train': 1.1610107421875} -11/07/2021 03:53:09 - INFO - __main__ - Step 47119: {'lr': 0.00039384681498303407, 'samples': 9046848, 'steps': 47118, 'loss/train': 1.762439489364624} -11/07/2021 03:53:09 - INFO - __main__ - Step 47120: {'lr': 0.0003938424746646988, 'samples': 9047040, 'steps': 47119, 'loss/train': 1.3170665502548218} -11/07/2021 03:53:10 - INFO - __main__ - Step 47121: {'lr': 0.00039383813428155027, 'samples': 9047232, 'steps': 47120, 'loss/train': 2.4549214839935303} -11/07/2021 03:53:10 - INFO - __main__ - Step 47122: {'lr': 0.0003938337938335904, 'samples': 9047424, 'steps': 47121, 'loss/train': 1.5323492288589478} -11/07/2021 03:53:10 - INFO - __main__ - Step 47123: {'lr': 0.00039382945332082136, 'samples': 9047616, 'steps': 47122, 'loss/train': 1.4084267616271973} -11/07/2021 03:53:11 - INFO - __main__ - Step 47124: {'lr': 0.00039382511274324496, 'samples': 9047808, 'steps': 47123, 'loss/train': 1.4346362352371216} -11/07/2021 03:53:12 - INFO - __main__ - Step 47125: {'lr': 0.0003938207721008632, 'samples': 9048000, 'steps': 47124, 'loss/train': 1.3514961004257202} -11/07/2021 03:53:12 - INFO - __main__ - Step 47126: {'lr': 0.00039381643139367806, 'samples': 9048192, 'steps': 47125, 'loss/train': 1.743735909461975} -11/07/2021 03:53:12 - INFO - __main__ - Step 47127: {'lr': 0.00039381209062169136, 'samples': 9048384, 'steps': 47126, 'loss/train': 1.2722545862197876} -11/07/2021 03:53:13 - INFO - __main__ - Step 47128: {'lr': 0.0003938077497849052, 'samples': 9048576, 'steps': 47127, 'loss/train': 1.4940422773361206} -11/07/2021 03:53:13 - INFO - __main__ - Step 47129: {'lr': 0.00039380340888332143, 'samples': 9048768, 'steps': 47128, 'loss/train': 1.303487777709961} -11/07/2021 03:53:14 - INFO - __main__ - Step 47130: {'lr': 0.0003937990679169421, 'samples': 9048960, 'steps': 47129, 'loss/train': 2.0714499950408936} -11/07/2021 03:53:15 - INFO - __main__ - Step 47131: {'lr': 0.0003937947268857692, 'samples': 9049152, 'steps': 47130, 'loss/train': 1.6812490224838257} -11/07/2021 03:53:15 - INFO - __main__ - Step 47132: {'lr': 0.00039379038578980454, 'samples': 9049344, 'steps': 47131, 'loss/train': 1.5768859386444092} -11/07/2021 03:53:15 - INFO - __main__ - Step 47133: {'lr': 0.0003937860446290502, 'samples': 9049536, 'steps': 47132, 'loss/train': 1.3159254789352417} -11/07/2021 03:53:16 - INFO - __main__ - Step 47134: {'lr': 0.0003937817034035081, 'samples': 9049728, 'steps': 47133, 'loss/train': 1.0606609582901} -11/07/2021 03:53:17 - INFO - __main__ - Step 47135: {'lr': 0.00039377736211318004, 'samples': 9049920, 'steps': 47134, 'loss/train': 2.44612717628479} -11/07/2021 03:53:17 - INFO - __main__ - Step 47136: {'lr': 0.0003937730207580682, 'samples': 9050112, 'steps': 47135, 'loss/train': 1.7027770280838013} -11/07/2021 03:53:17 - INFO - __main__ - Step 47137: {'lr': 0.0003937686793381745, 'samples': 9050304, 'steps': 47136, 'loss/train': 0.6332939863204956} -11/07/2021 03:53:18 - INFO - __main__ - Step 47138: {'lr': 0.0003937643378535009, 'samples': 9050496, 'steps': 47137, 'loss/train': 1.0706485509872437} -11/07/2021 03:53:18 - INFO - __main__ - Step 47139: {'lr': 0.0003937599963040491, 'samples': 9050688, 'steps': 47138, 'loss/train': 0.40077632665634155} -11/07/2021 03:53:19 - INFO - __main__ - Step 47140: {'lr': 0.0003937556546898214, 'samples': 9050880, 'steps': 47139, 'loss/train': 1.3255983591079712} -11/07/2021 03:53:20 - INFO - __main__ - Step 47141: {'lr': 0.0003937513130108197, 'samples': 9051072, 'steps': 47140, 'loss/train': 1.567197322845459} -11/07/2021 03:53:20 - INFO - __main__ - Step 47142: {'lr': 0.00039374697126704573, 'samples': 9051264, 'steps': 47141, 'loss/train': 1.435327172279358} -11/07/2021 03:53:20 - INFO - __main__ - Step 47143: {'lr': 0.0003937426294585017, 'samples': 9051456, 'steps': 47142, 'loss/train': 0.9999099373817444} -11/07/2021 03:53:21 - INFO - __main__ - Step 47144: {'lr': 0.00039373828758518936, 'samples': 9051648, 'steps': 47143, 'loss/train': 0.8797643780708313} -11/07/2021 03:53:21 - INFO - __main__ - Step 47145: {'lr': 0.00039373394564711086, 'samples': 9051840, 'steps': 47144, 'loss/train': 0.6948489546775818} -11/07/2021 03:53:22 - INFO - __main__ - Step 47146: {'lr': 0.00039372960364426803, 'samples': 9052032, 'steps': 47145, 'loss/train': 1.5431687831878662} -11/07/2021 03:53:22 - INFO - __main__ - Step 47147: {'lr': 0.0003937252615766628, 'samples': 9052224, 'steps': 47146, 'loss/train': 1.4942766427993774} -11/07/2021 03:53:23 - INFO - __main__ - Step 47148: {'lr': 0.0003937209194442973, 'samples': 9052416, 'steps': 47147, 'loss/train': 1.663383960723877} -11/07/2021 03:53:23 - INFO - __main__ - Step 47149: {'lr': 0.00039371657724717325, 'samples': 9052608, 'steps': 47148, 'loss/train': 1.6548125743865967} -11/07/2021 03:53:24 - INFO - __main__ - Step 47150: {'lr': 0.0003937122349852928, 'samples': 9052800, 'steps': 47149, 'loss/train': 1.6805589199066162} -11/07/2021 03:53:24 - INFO - __main__ - Step 47151: {'lr': 0.0003937078926586578, 'samples': 9052992, 'steps': 47150, 'loss/train': 1.630454421043396} -11/07/2021 03:53:25 - INFO - __main__ - Step 47152: {'lr': 0.0003937035502672703, 'samples': 9053184, 'steps': 47151, 'loss/train': 1.3253780603408813} -11/07/2021 03:53:25 - INFO - __main__ - Step 47153: {'lr': 0.0003936992078111321, 'samples': 9053376, 'steps': 47152, 'loss/train': 2.368971109390259} -11/07/2021 03:53:26 - INFO - __main__ - Step 47154: {'lr': 0.0003936948652902453, 'samples': 9053568, 'steps': 47153, 'loss/train': 1.6653461456298828} -11/07/2021 03:53:26 - INFO - __main__ - Step 47155: {'lr': 0.0003936905227046119, 'samples': 9053760, 'steps': 47154, 'loss/train': 1.3452043533325195} -11/07/2021 03:53:27 - INFO - __main__ - Step 47156: {'lr': 0.00039368618005423365, 'samples': 9053952, 'steps': 47155, 'loss/train': 1.4380110502243042} -11/07/2021 03:53:27 - INFO - __main__ - Step 47157: {'lr': 0.00039368183733911265, 'samples': 9054144, 'steps': 47156, 'loss/train': 1.4627124071121216} -11/07/2021 03:53:28 - INFO - __main__ - Step 47158: {'lr': 0.00039367749455925086, 'samples': 9054336, 'steps': 47157, 'loss/train': 1.1693251132965088} -11/07/2021 03:53:28 - INFO - __main__ - Step 47159: {'lr': 0.0003936731517146502, 'samples': 9054528, 'steps': 47158, 'loss/train': 1.4604130983352661} -11/07/2021 03:53:28 - INFO - __main__ - Step 47160: {'lr': 0.0003936688088053126, 'samples': 9054720, 'steps': 47159, 'loss/train': 1.8615742921829224} -11/07/2021 03:53:29 - INFO - __main__ - Step 47161: {'lr': 0.0003936644658312401, 'samples': 9054912, 'steps': 47160, 'loss/train': 1.6003049612045288} -11/07/2021 03:53:30 - INFO - __main__ - Step 47162: {'lr': 0.0003936601227924346, 'samples': 9055104, 'steps': 47161, 'loss/train': 0.5940176248550415} -11/07/2021 03:53:30 - INFO - __main__ - Step 47163: {'lr': 0.00039365577968889805, 'samples': 9055296, 'steps': 47162, 'loss/train': 1.779089093208313} -11/07/2021 03:53:30 - INFO - __main__ - Step 47164: {'lr': 0.0003936514365206324, 'samples': 9055488, 'steps': 47163, 'loss/train': 1.7254983186721802} -11/07/2021 03:53:31 - INFO - __main__ - Step 47165: {'lr': 0.00039364709328763966, 'samples': 9055680, 'steps': 47164, 'loss/train': 1.2700613737106323} -11/07/2021 03:53:31 - INFO - __main__ - Step 47166: {'lr': 0.00039364274998992177, 'samples': 9055872, 'steps': 47165, 'loss/train': 1.04393470287323} -11/07/2021 03:53:32 - INFO - __main__ - Step 47167: {'lr': 0.00039363840662748063, 'samples': 9056064, 'steps': 47166, 'loss/train': 0.7460552453994751} -11/07/2021 03:53:32 - INFO - __main__ - Step 47168: {'lr': 0.0003936340632003183, 'samples': 9056256, 'steps': 47167, 'loss/train': 1.065807580947876} -11/07/2021 03:53:33 - INFO - __main__ - Step 47169: {'lr': 0.0003936297197084366, 'samples': 9056448, 'steps': 47168, 'loss/train': 1.5235415697097778} -11/07/2021 03:53:33 - INFO - __main__ - Step 47170: {'lr': 0.00039362537615183764, 'samples': 9056640, 'steps': 47169, 'loss/train': 1.1110341548919678} -11/07/2021 03:53:33 - INFO - __main__ - Step 47171: {'lr': 0.0003936210325305233, 'samples': 9056832, 'steps': 47170, 'loss/train': 1.6105690002441406} -11/07/2021 03:53:35 - INFO - __main__ - Step 47172: {'lr': 0.0003936166888444954, 'samples': 9057024, 'steps': 47171, 'loss/train': 1.2022067308425903} -11/07/2021 03:53:35 - INFO - __main__ - Step 47173: {'lr': 0.0003936123450937562, 'samples': 9057216, 'steps': 47172, 'loss/train': 1.0590406656265259} -11/07/2021 03:53:35 - INFO - __main__ - Step 47174: {'lr': 0.0003936080012783075, 'samples': 9057408, 'steps': 47173, 'loss/train': 1.7635650634765625} -11/07/2021 03:53:36 - INFO - __main__ - Step 47175: {'lr': 0.0003936036573981512, 'samples': 9057600, 'steps': 47174, 'loss/train': 1.543225884437561} -11/07/2021 03:53:36 - INFO - __main__ - Step 47176: {'lr': 0.00039359931345328927, 'samples': 9057792, 'steps': 47175, 'loss/train': 1.3579483032226562} -11/07/2021 03:53:37 - INFO - __main__ - Step 47177: {'lr': 0.0003935949694437237, 'samples': 9057984, 'steps': 47176, 'loss/train': 1.6006814241409302} -11/07/2021 03:53:37 - INFO - __main__ - Step 47178: {'lr': 0.00039359062536945645, 'samples': 9058176, 'steps': 47177, 'loss/train': 0.7601653933525085} -11/07/2021 03:53:38 - INFO - __main__ - Step 47179: {'lr': 0.00039358628123048955, 'samples': 9058368, 'steps': 47178, 'loss/train': 1.717115044593811} -11/07/2021 03:53:38 - INFO - __main__ - Step 47180: {'lr': 0.0003935819370268249, 'samples': 9058560, 'steps': 47179, 'loss/train': 1.3778393268585205} -11/07/2021 03:53:38 - INFO - __main__ - Step 47181: {'lr': 0.00039357759275846437, 'samples': 9058752, 'steps': 47180, 'loss/train': 1.2944941520690918} -11/07/2021 03:53:40 - INFO - __main__ - Step 47182: {'lr': 0.00039357324842541, 'samples': 9058944, 'steps': 47181, 'loss/train': 1.4966262578964233} -11/07/2021 03:53:40 - INFO - __main__ - Step 47183: {'lr': 0.0003935689040276638, 'samples': 9059136, 'steps': 47182, 'loss/train': 2.011629104614258} -11/07/2021 03:53:40 - INFO - __main__ - Step 47184: {'lr': 0.0003935645595652276, 'samples': 9059328, 'steps': 47183, 'loss/train': 1.5474724769592285} -11/07/2021 03:53:41 - INFO - __main__ - Step 47185: {'lr': 0.0003935602150381034, 'samples': 9059520, 'steps': 47184, 'loss/train': 1.3871104717254639} -11/07/2021 03:53:41 - INFO - __main__ - Step 47186: {'lr': 0.00039355587044629325, 'samples': 9059712, 'steps': 47185, 'loss/train': 2.540052652359009} -11/07/2021 03:53:42 - INFO - __main__ - Step 47187: {'lr': 0.00039355152578979903, 'samples': 9059904, 'steps': 47186, 'loss/train': 1.1637755632400513} -11/07/2021 03:53:42 - INFO - __main__ - Step 47188: {'lr': 0.0003935471810686228, 'samples': 9060096, 'steps': 47187, 'loss/train': 1.387712001800537} -11/07/2021 03:53:43 - INFO - __main__ - Step 47189: {'lr': 0.0003935428362827662, 'samples': 9060288, 'steps': 47188, 'loss/train': 1.6322131156921387} -11/07/2021 03:53:43 - INFO - __main__ - Step 47190: {'lr': 0.0003935384914322316, 'samples': 9060480, 'steps': 47189, 'loss/train': 0.8436173796653748} -11/07/2021 03:53:44 - INFO - __main__ - Step 47191: {'lr': 0.0003935341465170207, 'samples': 9060672, 'steps': 47190, 'loss/train': 1.3562065362930298} -11/07/2021 03:53:44 - INFO - __main__ - Step 47192: {'lr': 0.0003935298015371355, 'samples': 9060864, 'steps': 47191, 'loss/train': 1.4174747467041016} -11/07/2021 03:53:46 - INFO - __main__ - Step 47193: {'lr': 0.0003935254564925781, 'samples': 9061056, 'steps': 47192, 'loss/train': 1.27580988407135} -11/07/2021 03:53:46 - INFO - __main__ - Step 47194: {'lr': 0.0003935211113833502, 'samples': 9061248, 'steps': 47193, 'loss/train': 1.6711721420288086} -11/07/2021 03:53:47 - INFO - __main__ - Step 47195: {'lr': 0.00039351676620945396, 'samples': 9061440, 'steps': 47194, 'loss/train': 0.5922019481658936} -11/07/2021 03:53:47 - INFO - __main__ - Step 47196: {'lr': 0.00039351242097089133, 'samples': 9061632, 'steps': 47195, 'loss/train': 1.8144773244857788} -11/07/2021 03:53:47 - INFO - __main__ - Step 47197: {'lr': 0.0003935080756676641, 'samples': 9061824, 'steps': 47196, 'loss/train': 1.7800637483596802} -11/07/2021 03:53:48 - INFO - __main__ - Step 47198: {'lr': 0.0003935037302997745, 'samples': 9062016, 'steps': 47197, 'loss/train': 1.7908663749694824} -11/07/2021 03:53:48 - INFO - __main__ - Step 47199: {'lr': 0.00039349938486722425, 'samples': 9062208, 'steps': 47198, 'loss/train': 1.4536714553833008} -11/07/2021 03:53:48 - INFO - __main__ - Step 47200: {'lr': 0.0003934950393700154, 'samples': 9062400, 'steps': 47199, 'loss/train': 1.3902226686477661} -11/07/2021 03:53:49 - INFO - __main__ - Step 47201: {'lr': 0.0003934906938081499, 'samples': 9062592, 'steps': 47200, 'loss/train': 1.2590264081954956} -11/07/2021 03:53:50 - INFO - __main__ - Step 47202: {'lr': 0.0003934863481816297, 'samples': 9062784, 'steps': 47201, 'loss/train': 1.6010756492614746} -11/07/2021 03:53:50 - INFO - __main__ - Step 47203: {'lr': 0.00039348200249045675, 'samples': 9062976, 'steps': 47202, 'loss/train': 1.2708886861801147} -11/07/2021 03:53:51 - INFO - __main__ - Step 47204: {'lr': 0.000393477656734633, 'samples': 9063168, 'steps': 47203, 'loss/train': 2.0616767406463623} -11/07/2021 03:53:51 - INFO - __main__ - Step 47205: {'lr': 0.0003934733109141605, 'samples': 9063360, 'steps': 47204, 'loss/train': 1.5255537033081055} -11/07/2021 03:53:52 - INFO - __main__ - Step 47206: {'lr': 0.00039346896502904117, 'samples': 9063552, 'steps': 47205, 'loss/train': 1.4788717031478882} -11/07/2021 03:53:52 - INFO - __main__ - Step 47207: {'lr': 0.0003934646190792769, 'samples': 9063744, 'steps': 47206, 'loss/train': 1.8538322448730469} -11/07/2021 03:53:53 - INFO - __main__ - Step 47208: {'lr': 0.00039346027306486964, 'samples': 9063936, 'steps': 47207, 'loss/train': 1.713992714881897} -11/07/2021 03:53:53 - INFO - __main__ - Step 47209: {'lr': 0.00039345592698582146, 'samples': 9064128, 'steps': 47208, 'loss/train': 1.1504381895065308} -11/07/2021 03:53:53 - INFO - __main__ - Step 47210: {'lr': 0.00039345158084213417, 'samples': 9064320, 'steps': 47209, 'loss/train': 1.6446284055709839} -11/07/2021 03:53:54 - INFO - __main__ - Step 47211: {'lr': 0.0003934472346338099, 'samples': 9064512, 'steps': 47210, 'loss/train': 1.9809157848358154} -11/07/2021 03:53:55 - INFO - __main__ - Step 47212: {'lr': 0.00039344288836085046, 'samples': 9064704, 'steps': 47211, 'loss/train': 1.4329661130905151} -11/07/2021 03:53:55 - INFO - __main__ - Step 47213: {'lr': 0.0003934385420232579, 'samples': 9064896, 'steps': 47212, 'loss/train': 1.3324871063232422} -11/07/2021 03:53:55 - INFO - __main__ - Step 47214: {'lr': 0.0003934341956210341, 'samples': 9065088, 'steps': 47213, 'loss/train': 1.3765357732772827} -11/07/2021 03:53:56 - INFO - __main__ - Step 47215: {'lr': 0.0003934298491541811, 'samples': 9065280, 'steps': 47214, 'loss/train': 1.4130184650421143} -11/07/2021 03:53:57 - INFO - __main__ - Step 47216: {'lr': 0.0003934255026227008, 'samples': 9065472, 'steps': 47215, 'loss/train': 1.6666706800460815} -11/07/2021 03:53:57 - INFO - __main__ - Step 47217: {'lr': 0.0003934211560265952, 'samples': 9065664, 'steps': 47216, 'loss/train': 1.3997408151626587} -11/07/2021 03:53:58 - INFO - __main__ - Step 47218: {'lr': 0.0003934168093658663, 'samples': 9065856, 'steps': 47217, 'loss/train': 2.0830512046813965} -11/07/2021 03:53:58 - INFO - __main__ - Step 47219: {'lr': 0.0003934124626405159, 'samples': 9066048, 'steps': 47218, 'loss/train': 1.5073606967926025} -11/07/2021 03:53:58 - INFO - __main__ - Step 47220: {'lr': 0.00039340811585054615, 'samples': 9066240, 'steps': 47219, 'loss/train': 1.524347186088562} -11/07/2021 03:53:59 - INFO - __main__ - Step 47221: {'lr': 0.0003934037689959589, 'samples': 9066432, 'steps': 47220, 'loss/train': 1.5292742252349854} -11/07/2021 03:54:00 - INFO - __main__ - Step 47222: {'lr': 0.00039339942207675604, 'samples': 9066624, 'steps': 47221, 'loss/train': 1.8891303539276123} -11/07/2021 03:54:00 - INFO - __main__ - Step 47223: {'lr': 0.0003933950750929397, 'samples': 9066816, 'steps': 47222, 'loss/train': 0.27736398577690125} -11/07/2021 03:54:00 - INFO - __main__ - Step 47224: {'lr': 0.0003933907280445117, 'samples': 9067008, 'steps': 47223, 'loss/train': 1.1352673768997192} -11/07/2021 03:54:01 - INFO - __main__ - Step 47225: {'lr': 0.00039338638093147404, 'samples': 9067200, 'steps': 47224, 'loss/train': 0.9194772839546204} -11/07/2021 03:54:02 - INFO - __main__ - Step 47226: {'lr': 0.00039338203375382873, 'samples': 9067392, 'steps': 47225, 'loss/train': 1.056955099105835} -11/07/2021 03:54:02 - INFO - __main__ - Step 47227: {'lr': 0.00039337768651157766, 'samples': 9067584, 'steps': 47226, 'loss/train': 1.5889086723327637} -11/07/2021 03:54:02 - INFO - __main__ - Step 47228: {'lr': 0.0003933733392047228, 'samples': 9067776, 'steps': 47227, 'loss/train': 1.2220077514648438} -11/07/2021 03:54:03 - INFO - __main__ - Step 47229: {'lr': 0.0003933689918332662, 'samples': 9067968, 'steps': 47228, 'loss/train': 1.3765571117401123} -11/07/2021 03:54:03 - INFO - __main__ - Step 47230: {'lr': 0.0003933646443972097, 'samples': 9068160, 'steps': 47229, 'loss/train': 0.5726089477539062} -11/07/2021 03:54:03 - INFO - __main__ - Step 47231: {'lr': 0.0003933602968965553, 'samples': 9068352, 'steps': 47230, 'loss/train': 1.0503922700881958} -11/07/2021 03:54:05 - INFO - __main__ - Step 47232: {'lr': 0.00039335594933130494, 'samples': 9068544, 'steps': 47231, 'loss/train': 1.624923586845398} -11/07/2021 03:54:06 - INFO - __main__ - Step 47233: {'lr': 0.0003933516017014607, 'samples': 9068736, 'steps': 47232, 'loss/train': 1.2353731393814087} -11/07/2021 03:54:06 - INFO - __main__ - Step 47234: {'lr': 0.0003933472540070243, 'samples': 9068928, 'steps': 47233, 'loss/train': 2.365288019180298} -11/07/2021 03:54:06 - INFO - __main__ - Step 47235: {'lr': 0.00039334290624799795, 'samples': 9069120, 'steps': 47234, 'loss/train': 3.6028764247894287} -11/07/2021 03:54:07 - INFO - __main__ - Step 47236: {'lr': 0.0003933385584243834, 'samples': 9069312, 'steps': 47235, 'loss/train': 2.2998764514923096} -11/07/2021 03:54:07 - INFO - __main__ - Step 47237: {'lr': 0.0003933342105361828, 'samples': 9069504, 'steps': 47236, 'loss/train': 1.322514295578003} -11/07/2021 03:54:08 - INFO - __main__ - Step 47238: {'lr': 0.000393329862583398, 'samples': 9069696, 'steps': 47237, 'loss/train': 1.5863367319107056} -11/07/2021 03:54:09 - INFO - __main__ - Step 47239: {'lr': 0.00039332551456603093, 'samples': 9069888, 'steps': 47238, 'loss/train': 1.2961407899856567} -11/07/2021 03:54:09 - INFO - __main__ - Step 47240: {'lr': 0.00039332116648408365, 'samples': 9070080, 'steps': 47239, 'loss/train': 2.511929988861084} -11/07/2021 03:54:10 - INFO - __main__ - Step 47241: {'lr': 0.00039331681833755804, 'samples': 9070272, 'steps': 47240, 'loss/train': 1.450066089630127} -11/07/2021 03:54:10 - INFO - __main__ - Step 47242: {'lr': 0.00039331247012645604, 'samples': 9070464, 'steps': 47241, 'loss/train': 0.961763858795166} -11/07/2021 03:54:10 - INFO - __main__ - Step 47243: {'lr': 0.00039330812185077967, 'samples': 9070656, 'steps': 47242, 'loss/train': 1.3809430599212646} -11/07/2021 03:54:11 - INFO - __main__ - Step 47244: {'lr': 0.0003933037735105309, 'samples': 9070848, 'steps': 47243, 'loss/train': 1.3170738220214844} -11/07/2021 03:54:12 - INFO - __main__ - Step 47245: {'lr': 0.00039329942510571165, 'samples': 9071040, 'steps': 47244, 'loss/train': 1.5395973920822144} -11/07/2021 03:54:12 - INFO - __main__ - Step 47246: {'lr': 0.0003932950766363239, 'samples': 9071232, 'steps': 47245, 'loss/train': 1.5195993185043335} -11/07/2021 03:54:12 - INFO - __main__ - Step 47247: {'lr': 0.00039329072810236965, 'samples': 9071424, 'steps': 47246, 'loss/train': 0.65678471326828} -11/07/2021 03:54:13 - INFO - __main__ - Step 47248: {'lr': 0.0003932863795038507, 'samples': 9071616, 'steps': 47247, 'loss/train': 0.8310577273368835} -11/07/2021 03:54:14 - INFO - __main__ - Step 47249: {'lr': 0.0003932820308407692, 'samples': 9071808, 'steps': 47248, 'loss/train': 1.3056358098983765} -11/07/2021 03:54:14 - INFO - __main__ - Step 47250: {'lr': 0.000393277682113127, 'samples': 9072000, 'steps': 47249, 'loss/train': 1.0573945045471191} -11/07/2021 03:54:14 - INFO - __main__ - Step 47251: {'lr': 0.00039327333332092606, 'samples': 9072192, 'steps': 47250, 'loss/train': 1.5271329879760742} -11/07/2021 03:54:15 - INFO - __main__ - Step 47252: {'lr': 0.0003932689844641684, 'samples': 9072384, 'steps': 47251, 'loss/train': 1.4134752750396729} -11/07/2021 03:54:15 - INFO - __main__ - Step 47253: {'lr': 0.00039326463554285597, 'samples': 9072576, 'steps': 47252, 'loss/train': 1.1137325763702393} -11/07/2021 03:54:15 - INFO - __main__ - Step 47254: {'lr': 0.00039326028655699063, 'samples': 9072768, 'steps': 47253, 'loss/train': 1.1397970914840698} -11/07/2021 03:54:17 - INFO - __main__ - Step 47255: {'lr': 0.0003932559375065745, 'samples': 9072960, 'steps': 47254, 'loss/train': 1.6555663347244263} -11/07/2021 03:54:17 - INFO - __main__ - Step 47256: {'lr': 0.00039325158839160937, 'samples': 9073152, 'steps': 47255, 'loss/train': 1.5813300609588623} -11/07/2021 03:54:17 - INFO - __main__ - Step 47257: {'lr': 0.0003932472392120974, 'samples': 9073344, 'steps': 47256, 'loss/train': 1.7237550020217896} -11/07/2021 03:54:18 - INFO - __main__ - Step 47258: {'lr': 0.00039324288996804026, 'samples': 9073536, 'steps': 47257, 'loss/train': 1.1574243307113647} -11/07/2021 03:54:18 - INFO - __main__ - Step 47259: {'lr': 0.0003932385406594402, 'samples': 9073728, 'steps': 47258, 'loss/train': 1.146239161491394} -11/07/2021 03:54:19 - INFO - __main__ - Step 47260: {'lr': 0.0003932341912862991, 'samples': 9073920, 'steps': 47259, 'loss/train': 0.8379764556884766} -11/07/2021 03:54:19 - INFO - __main__ - Step 47261: {'lr': 0.0003932298418486188, 'samples': 9074112, 'steps': 47260, 'loss/train': 1.6379982233047485} -11/07/2021 03:54:20 - INFO - __main__ - Step 47262: {'lr': 0.00039322549234640136, 'samples': 9074304, 'steps': 47261, 'loss/train': 1.5093833208084106} -11/07/2021 03:54:20 - INFO - __main__ - Step 47263: {'lr': 0.00039322114277964875, 'samples': 9074496, 'steps': 47262, 'loss/train': 1.1236997842788696} -11/07/2021 03:54:20 - INFO - __main__ - Step 47264: {'lr': 0.0003932167931483629, 'samples': 9074688, 'steps': 47263, 'loss/train': 1.0301036834716797} -11/07/2021 03:54:21 - INFO - __main__ - Step 47265: {'lr': 0.00039321244345254583, 'samples': 9074880, 'steps': 47264, 'loss/train': 1.3616799116134644} -11/07/2021 03:54:22 - INFO - __main__ - Step 47266: {'lr': 0.0003932080936921993, 'samples': 9075072, 'steps': 47265, 'loss/train': 1.1745116710662842} -11/07/2021 03:54:22 - INFO - __main__ - Step 47267: {'lr': 0.00039320374386732555, 'samples': 9075264, 'steps': 47266, 'loss/train': 1.5966567993164062} -11/07/2021 03:54:22 - INFO - __main__ - Step 47268: {'lr': 0.00039319939397792635, 'samples': 9075456, 'steps': 47267, 'loss/train': 1.515926480293274} -11/07/2021 03:54:23 - INFO - __main__ - Step 47269: {'lr': 0.00039319504402400367, 'samples': 9075648, 'steps': 47268, 'loss/train': 0.9507867097854614} -11/07/2021 03:54:24 - INFO - __main__ - Step 47270: {'lr': 0.0003931906940055596, 'samples': 9075840, 'steps': 47269, 'loss/train': 1.687520146369934} -11/07/2021 03:54:24 - INFO - __main__ - Step 47271: {'lr': 0.00039318634392259593, 'samples': 9076032, 'steps': 47270, 'loss/train': 1.403967022895813} -11/07/2021 03:54:24 - INFO - __main__ - Step 47272: {'lr': 0.00039318199377511476, 'samples': 9076224, 'steps': 47271, 'loss/train': 1.505491852760315} -11/07/2021 03:54:25 - INFO - __main__ - Step 47273: {'lr': 0.00039317764356311803, 'samples': 9076416, 'steps': 47272, 'loss/train': 1.9129726886749268} -11/07/2021 03:54:25 - INFO - __main__ - Step 47274: {'lr': 0.00039317329328660754, 'samples': 9076608, 'steps': 47273, 'loss/train': 1.8173123598098755} -11/07/2021 03:54:26 - INFO - __main__ - Step 47275: {'lr': 0.0003931689429455855, 'samples': 9076800, 'steps': 47274, 'loss/train': 1.7296642065048218} -11/07/2021 03:54:27 - INFO - __main__ - Step 47276: {'lr': 0.00039316459254005364, 'samples': 9076992, 'steps': 47275, 'loss/train': 1.330780029296875} -11/07/2021 03:54:27 - INFO - __main__ - Step 47277: {'lr': 0.00039316024207001403, 'samples': 9077184, 'steps': 47276, 'loss/train': 1.7858941555023193} -11/07/2021 03:54:27 - INFO - __main__ - Step 47278: {'lr': 0.0003931558915354687, 'samples': 9077376, 'steps': 47277, 'loss/train': 1.0815973281860352} -11/07/2021 03:54:28 - INFO - __main__ - Step 47279: {'lr': 0.00039315154093641947, 'samples': 9077568, 'steps': 47278, 'loss/train': 1.7182049751281738} -11/07/2021 03:54:28 - INFO - __main__ - Step 47280: {'lr': 0.00039314719027286837, 'samples': 9077760, 'steps': 47279, 'loss/train': 1.3329108953475952} -11/07/2021 03:54:29 - INFO - __main__ - Step 47281: {'lr': 0.00039314283954481737, 'samples': 9077952, 'steps': 47280, 'loss/train': 1.2826067209243774} -11/07/2021 03:54:29 - INFO - __main__ - Step 47282: {'lr': 0.00039313848875226844, 'samples': 9078144, 'steps': 47281, 'loss/train': 1.6733689308166504} -11/07/2021 03:54:30 - INFO - __main__ - Step 47283: {'lr': 0.0003931341378952235, 'samples': 9078336, 'steps': 47282, 'loss/train': 1.5830260515213013} -11/07/2021 03:54:30 - INFO - __main__ - Step 47284: {'lr': 0.0003931297869736845, 'samples': 9078528, 'steps': 47283, 'loss/train': 1.3615508079528809} -11/07/2021 03:54:30 - INFO - __main__ - Step 47285: {'lr': 0.0003931254359876535, 'samples': 9078720, 'steps': 47284, 'loss/train': 1.4981908798217773} -11/07/2021 03:54:31 - INFO - __main__ - Step 47286: {'lr': 0.00039312108493713227, 'samples': 9078912, 'steps': 47285, 'loss/train': 1.6365206241607666} -11/07/2021 03:54:32 - INFO - __main__ - Step 47287: {'lr': 0.00039311673382212296, 'samples': 9079104, 'steps': 47286, 'loss/train': 1.4383234977722168} -11/07/2021 03:54:32 - INFO - __main__ - Step 47288: {'lr': 0.0003931123826426275, 'samples': 9079296, 'steps': 47287, 'loss/train': 1.3046178817749023} -11/07/2021 03:54:33 - INFO - __main__ - Step 47289: {'lr': 0.00039310803139864777, 'samples': 9079488, 'steps': 47288, 'loss/train': 1.2773518562316895} -11/07/2021 03:54:33 - INFO - __main__ - Step 47290: {'lr': 0.0003931036800901857, 'samples': 9079680, 'steps': 47289, 'loss/train': 1.4533926248550415} -11/07/2021 03:54:34 - INFO - __main__ - Step 47291: {'lr': 0.0003930993287172434, 'samples': 9079872, 'steps': 47290, 'loss/train': 1.3367587327957153} -11/07/2021 03:54:34 - INFO - __main__ - Step 47292: {'lr': 0.0003930949772798227, 'samples': 9080064, 'steps': 47291, 'loss/train': 1.9066798686981201} -11/07/2021 03:54:35 - INFO - __main__ - Step 47293: {'lr': 0.00039309062577792565, 'samples': 9080256, 'steps': 47292, 'loss/train': 1.4607013463974} -11/07/2021 03:54:35 - INFO - __main__ - Step 47294: {'lr': 0.0003930862742115542, 'samples': 9080448, 'steps': 47293, 'loss/train': 1.6229429244995117} -11/07/2021 03:54:35 - INFO - __main__ - Step 47295: {'lr': 0.0003930819225807102, 'samples': 9080640, 'steps': 47294, 'loss/train': 1.2199546098709106} -11/07/2021 03:54:37 - INFO - __main__ - Step 47296: {'lr': 0.00039307757088539574, 'samples': 9080832, 'steps': 47295, 'loss/train': 1.463995099067688} -11/07/2021 03:54:37 - INFO - __main__ - Step 47297: {'lr': 0.0003930732191256128, 'samples': 9081024, 'steps': 47296, 'loss/train': 1.3913321495056152} -11/07/2021 03:54:37 - INFO - __main__ - Step 47298: {'lr': 0.00039306886730136316, 'samples': 9081216, 'steps': 47297, 'loss/train': 1.3702958822250366} -11/07/2021 03:54:38 - INFO - __main__ - Step 47299: {'lr': 0.00039306451541264896, 'samples': 9081408, 'steps': 47298, 'loss/train': 1.3876159191131592} -11/07/2021 03:54:38 - INFO - __main__ - Step 47300: {'lr': 0.0003930601634594721, 'samples': 9081600, 'steps': 47299, 'loss/train': 1.3369739055633545} -11/07/2021 03:54:38 - INFO - __main__ - Step 47301: {'lr': 0.0003930558114418345, 'samples': 9081792, 'steps': 47300, 'loss/train': 1.3893908262252808} -11/07/2021 03:54:39 - INFO - __main__ - Step 47302: {'lr': 0.0003930514593597382, 'samples': 9081984, 'steps': 47301, 'loss/train': 1.543992519378662} -11/07/2021 03:54:40 - INFO - __main__ - Step 47303: {'lr': 0.00039304710721318505, 'samples': 9082176, 'steps': 47302, 'loss/train': 1.5732660293579102} -11/07/2021 03:54:40 - INFO - __main__ - Step 47304: {'lr': 0.0003930427550021771, 'samples': 9082368, 'steps': 47303, 'loss/train': 1.4729195833206177} -11/07/2021 03:54:40 - INFO - __main__ - Step 47305: {'lr': 0.00039303840272671636, 'samples': 9082560, 'steps': 47304, 'loss/train': 2.4504709243774414} -11/07/2021 03:54:41 - INFO - __main__ - Step 47306: {'lr': 0.00039303405038680465, 'samples': 9082752, 'steps': 47305, 'loss/train': 1.43690824508667} -11/07/2021 03:54:42 - INFO - __main__ - Step 47307: {'lr': 0.00039302969798244407, 'samples': 9082944, 'steps': 47306, 'loss/train': 1.5622464418411255} -11/07/2021 03:54:42 - INFO - __main__ - Step 47308: {'lr': 0.0003930253455136365, 'samples': 9083136, 'steps': 47307, 'loss/train': 1.2252328395843506} -11/07/2021 03:54:42 - INFO - __main__ - Step 47309: {'lr': 0.0003930209929803839, 'samples': 9083328, 'steps': 47308, 'loss/train': 1.747268557548523} -11/07/2021 03:54:43 - INFO - __main__ - Step 47310: {'lr': 0.0003930166403826883, 'samples': 9083520, 'steps': 47309, 'loss/train': 1.8754584789276123} -11/07/2021 03:54:43 - INFO - __main__ - Step 47311: {'lr': 0.00039301228772055147, 'samples': 9083712, 'steps': 47310, 'loss/train': 1.5060009956359863} -11/07/2021 03:54:44 - INFO - __main__ - Step 47312: {'lr': 0.0003930079349939756, 'samples': 9083904, 'steps': 47311, 'loss/train': 1.5311397314071655} -11/07/2021 03:54:44 - INFO - __main__ - Step 47313: {'lr': 0.00039300358220296255, 'samples': 9084096, 'steps': 47312, 'loss/train': 1.609533667564392} -11/07/2021 03:54:45 - INFO - __main__ - Step 47314: {'lr': 0.0003929992293475143, 'samples': 9084288, 'steps': 47313, 'loss/train': 1.5221704244613647} -11/07/2021 03:54:45 - INFO - __main__ - Step 47315: {'lr': 0.00039299487642763286, 'samples': 9084480, 'steps': 47314, 'loss/train': 0.9802134037017822} -11/07/2021 03:54:46 - INFO - __main__ - Step 47316: {'lr': 0.00039299052344332, 'samples': 9084672, 'steps': 47315, 'loss/train': 1.5102630853652954} -11/07/2021 03:54:47 - INFO - __main__ - Step 47317: {'lr': 0.00039298617039457796, 'samples': 9084864, 'steps': 47316, 'loss/train': 1.2505311965942383} -11/07/2021 03:54:47 - INFO - __main__ - Step 47318: {'lr': 0.0003929818172814085, 'samples': 9085056, 'steps': 47317, 'loss/train': 1.1996872425079346} -11/07/2021 03:54:47 - INFO - __main__ - Step 47319: {'lr': 0.00039297746410381357, 'samples': 9085248, 'steps': 47318, 'loss/train': 1.3600307703018188} -11/07/2021 03:54:48 - INFO - __main__ - Step 47320: {'lr': 0.00039297311086179535, 'samples': 9085440, 'steps': 47319, 'loss/train': 1.2544894218444824} -11/07/2021 03:54:48 - INFO - __main__ - Step 47321: {'lr': 0.00039296875755535557, 'samples': 9085632, 'steps': 47320, 'loss/train': 1.227154016494751} -11/07/2021 03:54:48 - INFO - __main__ - Step 47322: {'lr': 0.0003929644041844962, 'samples': 9085824, 'steps': 47321, 'loss/train': 1.1505377292633057} -11/07/2021 03:54:50 - INFO - __main__ - Step 47323: {'lr': 0.00039296005074921937, 'samples': 9086016, 'steps': 47322, 'loss/train': 1.7143731117248535} -11/07/2021 03:54:50 - INFO - __main__ - Step 47324: {'lr': 0.0003929556972495269, 'samples': 9086208, 'steps': 47323, 'loss/train': 1.8348923921585083} -11/07/2021 03:54:50 - INFO - __main__ - Step 47325: {'lr': 0.00039295134368542083, 'samples': 9086400, 'steps': 47324, 'loss/train': 1.1800689697265625} -11/07/2021 03:54:51 - INFO - __main__ - Step 47326: {'lr': 0.000392946990056903, 'samples': 9086592, 'steps': 47325, 'loss/train': 1.5850028991699219} -11/07/2021 03:54:51 - INFO - __main__ - Step 47327: {'lr': 0.00039294263636397564, 'samples': 9086784, 'steps': 47326, 'loss/train': 1.642444133758545} -11/07/2021 03:54:52 - INFO - __main__ - Step 47328: {'lr': 0.00039293828260664047, 'samples': 9086976, 'steps': 47327, 'loss/train': 2.3432319164276123} -11/07/2021 03:54:52 - INFO - __main__ - Step 47329: {'lr': 0.0003929339287848994, 'samples': 9087168, 'steps': 47328, 'loss/train': 1.3766820430755615} -11/07/2021 03:54:53 - INFO - __main__ - Step 47330: {'lr': 0.00039292957489875456, 'samples': 9087360, 'steps': 47329, 'loss/train': 1.3282623291015625} -11/07/2021 03:54:53 - INFO - __main__ - Step 47331: {'lr': 0.00039292522094820794, 'samples': 9087552, 'steps': 47330, 'loss/train': 2.0509135723114014} -11/07/2021 03:54:53 - INFO - __main__ - Step 47332: {'lr': 0.00039292086693326134, 'samples': 9087744, 'steps': 47331, 'loss/train': 1.2490166425704956} -11/07/2021 03:54:54 - INFO - __main__ - Step 47333: {'lr': 0.0003929165128539168, 'samples': 9087936, 'steps': 47332, 'loss/train': 1.6519125699996948} -11/07/2021 03:54:55 - INFO - __main__ - Step 47334: {'lr': 0.0003929121587101764, 'samples': 9088128, 'steps': 47333, 'loss/train': 1.5916945934295654} -11/07/2021 03:54:55 - INFO - __main__ - Step 47335: {'lr': 0.00039290780450204187, 'samples': 9088320, 'steps': 47334, 'loss/train': 1.6293517351150513} -11/07/2021 03:54:55 - INFO - __main__ - Step 47336: {'lr': 0.00039290345022951535, 'samples': 9088512, 'steps': 47335, 'loss/train': 2.4737918376922607} -11/07/2021 03:54:56 - INFO - __main__ - Step 47337: {'lr': 0.0003928990958925987, 'samples': 9088704, 'steps': 47336, 'loss/train': 1.8430202007293701} -11/07/2021 03:54:57 - INFO - __main__ - Step 47338: {'lr': 0.0003928947414912939, 'samples': 9088896, 'steps': 47337, 'loss/train': 1.7198305130004883} -11/07/2021 03:54:57 - INFO - __main__ - Step 47339: {'lr': 0.00039289038702560304, 'samples': 9089088, 'steps': 47338, 'loss/train': 1.2610658407211304} -11/07/2021 03:54:58 - INFO - __main__ - Step 47340: {'lr': 0.0003928860324955279, 'samples': 9089280, 'steps': 47339, 'loss/train': 1.1008061170578003} -11/07/2021 03:54:58 - INFO - __main__ - Step 47341: {'lr': 0.00039288167790107055, 'samples': 9089472, 'steps': 47340, 'loss/train': 1.7525180578231812} -11/07/2021 03:54:58 - INFO - __main__ - Step 47342: {'lr': 0.00039287732324223287, 'samples': 9089664, 'steps': 47341, 'loss/train': 1.2478035688400269} -11/07/2021 03:54:59 - INFO - __main__ - Step 47343: {'lr': 0.0003928729685190169, 'samples': 9089856, 'steps': 47342, 'loss/train': 1.0368107557296753} -11/07/2021 03:55:00 - INFO - __main__ - Step 47344: {'lr': 0.00039286861373142456, 'samples': 9090048, 'steps': 47343, 'loss/train': 1.490264892578125} -11/07/2021 03:55:00 - INFO - __main__ - Step 47345: {'lr': 0.0003928642588794579, 'samples': 9090240, 'steps': 47344, 'loss/train': 1.3091282844543457} -11/07/2021 03:55:00 - INFO - __main__ - Step 47346: {'lr': 0.0003928599039631187, 'samples': 9090432, 'steps': 47345, 'loss/train': 1.1811167001724243} -11/07/2021 03:55:01 - INFO - __main__ - Step 47347: {'lr': 0.00039285554898240907, 'samples': 9090624, 'steps': 47346, 'loss/train': 1.5830038785934448} -11/07/2021 03:55:01 - INFO - __main__ - Step 47348: {'lr': 0.0003928511939373309, 'samples': 9090816, 'steps': 47347, 'loss/train': 1.7371083498001099} -11/07/2021 03:55:02 - INFO - __main__ - Step 47349: {'lr': 0.0003928468388278863, 'samples': 9091008, 'steps': 47348, 'loss/train': 1.4600836038589478} -11/07/2021 03:55:03 - INFO - __main__ - Step 47350: {'lr': 0.00039284248365407704, 'samples': 9091200, 'steps': 47349, 'loss/train': 1.5137965679168701} -11/07/2021 03:55:03 - INFO - __main__ - Step 47351: {'lr': 0.00039283812841590514, 'samples': 9091392, 'steps': 47350, 'loss/train': 1.3401132822036743} -11/07/2021 03:55:03 - INFO - __main__ - Step 47352: {'lr': 0.0003928337731133727, 'samples': 9091584, 'steps': 47351, 'loss/train': 0.8940303921699524} -11/07/2021 03:55:04 - INFO - __main__ - Step 47353: {'lr': 0.0003928294177464814, 'samples': 9091776, 'steps': 47352, 'loss/train': 1.344061017036438} -11/07/2021 03:55:05 - INFO - __main__ - Step 47354: {'lr': 0.0003928250623152335, 'samples': 9091968, 'steps': 47353, 'loss/train': 1.3783444166183472} -11/07/2021 03:55:05 - INFO - __main__ - Step 47355: {'lr': 0.00039282070681963076, 'samples': 9092160, 'steps': 47354, 'loss/train': 0.9003660678863525} -11/07/2021 03:55:05 - INFO - __main__ - Step 47356: {'lr': 0.00039281635125967525, 'samples': 9092352, 'steps': 47355, 'loss/train': 1.6121208667755127} -11/07/2021 03:55:06 - INFO - __main__ - Step 47357: {'lr': 0.00039281199563536887, 'samples': 9092544, 'steps': 47356, 'loss/train': 1.4227135181427002} -11/07/2021 03:55:06 - INFO - __main__ - Step 47358: {'lr': 0.00039280763994671363, 'samples': 9092736, 'steps': 47357, 'loss/train': 1.783883810043335} -11/07/2021 03:55:07 - INFO - __main__ - Step 47359: {'lr': 0.0003928032841937115, 'samples': 9092928, 'steps': 47358, 'loss/train': 0.9126694202423096} -11/07/2021 03:55:07 - INFO - __main__ - Step 47360: {'lr': 0.0003927989283763643, 'samples': 9093120, 'steps': 47359, 'loss/train': 0.3783952295780182} -11/07/2021 03:55:08 - INFO - __main__ - Step 47361: {'lr': 0.0003927945724946742, 'samples': 9093312, 'steps': 47360, 'loss/train': 1.4427589178085327} -11/07/2021 03:55:08 - INFO - __main__ - Step 47362: {'lr': 0.00039279021654864307, 'samples': 9093504, 'steps': 47361, 'loss/train': 1.2977060079574585} -11/07/2021 03:55:08 - INFO - __main__ - Step 47363: {'lr': 0.0003927858605382728, 'samples': 9093696, 'steps': 47362, 'loss/train': 1.5949335098266602} -11/07/2021 03:55:09 - INFO - __main__ - Step 47364: {'lr': 0.0003927815044635655, 'samples': 9093888, 'steps': 47363, 'loss/train': 1.5859639644622803} -11/07/2021 03:55:10 - INFO - __main__ - Step 47365: {'lr': 0.00039277714832452304, 'samples': 9094080, 'steps': 47364, 'loss/train': 0.8822575807571411} -11/07/2021 03:55:10 - INFO - __main__ - Step 47366: {'lr': 0.0003927727921211474, 'samples': 9094272, 'steps': 47365, 'loss/train': 1.8432468175888062} -11/07/2021 03:55:11 - INFO - __main__ - Step 47367: {'lr': 0.00039276843585344046, 'samples': 9094464, 'steps': 47366, 'loss/train': 0.81095951795578} -11/07/2021 03:55:11 - INFO - __main__ - Step 47368: {'lr': 0.0003927640795214044, 'samples': 9094656, 'steps': 47367, 'loss/train': 1.6812350749969482} -11/07/2021 03:55:11 - INFO - __main__ - Step 47369: {'lr': 0.00039275972312504103, 'samples': 9094848, 'steps': 47368, 'loss/train': 1.4239321947097778} -11/07/2021 03:55:13 - INFO - __main__ - Step 47370: {'lr': 0.0003927553666643523, 'samples': 9095040, 'steps': 47369, 'loss/train': 1.0802626609802246} -11/07/2021 03:55:13 - INFO - __main__ - Step 47371: {'lr': 0.0003927510101393401, 'samples': 9095232, 'steps': 47370, 'loss/train': 1.0999367237091064} -11/07/2021 03:55:13 - INFO - __main__ - Step 47372: {'lr': 0.0003927466535500066, 'samples': 9095424, 'steps': 47371, 'loss/train': 1.2307920455932617} -11/07/2021 03:55:14 - INFO - __main__ - Step 47373: {'lr': 0.00039274229689635365, 'samples': 9095616, 'steps': 47372, 'loss/train': 1.0841302871704102} -11/07/2021 03:55:14 - INFO - __main__ - Step 47374: {'lr': 0.00039273794017838327, 'samples': 9095808, 'steps': 47373, 'loss/train': 1.7814555168151855} -11/07/2021 03:55:15 - INFO - __main__ - Step 47375: {'lr': 0.0003927335833960973, 'samples': 9096000, 'steps': 47374, 'loss/train': 1.539723515510559} -11/07/2021 03:55:15 - INFO - __main__ - Step 47376: {'lr': 0.00039272922654949783, 'samples': 9096192, 'steps': 47375, 'loss/train': 1.4435195922851562} -11/07/2021 03:55:16 - INFO - __main__ - Step 47377: {'lr': 0.0003927248696385868, 'samples': 9096384, 'steps': 47376, 'loss/train': 1.781643271446228} -11/07/2021 03:55:16 - INFO - __main__ - Step 47378: {'lr': 0.00039272051266336607, 'samples': 9096576, 'steps': 47377, 'loss/train': 1.3502711057662964} -11/07/2021 03:55:16 - INFO - __main__ - Step 47379: {'lr': 0.00039271615562383775, 'samples': 9096768, 'steps': 47378, 'loss/train': 0.17254693806171417} -11/07/2021 03:55:18 - INFO - __main__ - Step 47380: {'lr': 0.00039271179852000366, 'samples': 9096960, 'steps': 47379, 'loss/train': 1.5878491401672363} -11/07/2021 03:55:18 - INFO - __main__ - Step 47381: {'lr': 0.0003927074413518659, 'samples': 9097152, 'steps': 47380, 'loss/train': 1.3975498676300049} -11/07/2021 03:55:18 - INFO - __main__ - Step 47382: {'lr': 0.0003927030841194263, 'samples': 9097344, 'steps': 47381, 'loss/train': 1.100394606590271} -11/07/2021 03:55:19 - INFO - __main__ - Step 47383: {'lr': 0.00039269872682268697, 'samples': 9097536, 'steps': 47382, 'loss/train': 1.9096540212631226} -11/07/2021 03:55:19 - INFO - __main__ - Step 47384: {'lr': 0.00039269436946164977, 'samples': 9097728, 'steps': 47383, 'loss/train': 1.53835928440094} -11/07/2021 03:55:20 - INFO - __main__ - Step 47385: {'lr': 0.00039269001203631667, 'samples': 9097920, 'steps': 47384, 'loss/train': 1.1829365491867065} -11/07/2021 03:55:20 - INFO - __main__ - Step 47386: {'lr': 0.0003926856545466896, 'samples': 9098112, 'steps': 47385, 'loss/train': 1.4961042404174805} -11/07/2021 03:55:21 - INFO - __main__ - Step 47387: {'lr': 0.0003926812969927707, 'samples': 9098304, 'steps': 47386, 'loss/train': 1.2566967010498047} -11/07/2021 03:55:21 - INFO - __main__ - Step 47388: {'lr': 0.0003926769393745617, 'samples': 9098496, 'steps': 47387, 'loss/train': 1.3491863012313843} -11/07/2021 03:55:21 - INFO - __main__ - Step 47389: {'lr': 0.0003926725816920648, 'samples': 9098688, 'steps': 47388, 'loss/train': 1.4302196502685547} -11/07/2021 03:55:22 - INFO - __main__ - Step 47390: {'lr': 0.0003926682239452817, 'samples': 9098880, 'steps': 47389, 'loss/train': 1.1231874227523804} -11/07/2021 03:55:23 - INFO - __main__ - Step 47391: {'lr': 0.00039266386613421455, 'samples': 9099072, 'steps': 47390, 'loss/train': 1.0468133687973022} -11/07/2021 03:55:23 - INFO - __main__ - Step 47392: {'lr': 0.00039265950825886523, 'samples': 9099264, 'steps': 47391, 'loss/train': 1.6112629175186157} -11/07/2021 03:55:23 - INFO - __main__ - Step 47393: {'lr': 0.00039265515031923585, 'samples': 9099456, 'steps': 47392, 'loss/train': 1.6024153232574463} -11/07/2021 03:55:24 - INFO - __main__ - Step 47394: {'lr': 0.0003926507923153282, 'samples': 9099648, 'steps': 47393, 'loss/train': 1.5982778072357178} -11/07/2021 03:55:24 - INFO - __main__ - Step 47395: {'lr': 0.0003926464342471443, 'samples': 9099840, 'steps': 47394, 'loss/train': 1.7416530847549438} -11/07/2021 03:55:25 - INFO - __main__ - Step 47396: {'lr': 0.00039264207611468607, 'samples': 9100032, 'steps': 47395, 'loss/train': 1.781440019607544} -11/07/2021 03:55:26 - INFO - __main__ - Step 47397: {'lr': 0.00039263771791795554, 'samples': 9100224, 'steps': 47396, 'loss/train': 1.5347706079483032} -11/07/2021 03:55:26 - INFO - __main__ - Step 47398: {'lr': 0.0003926333596569547, 'samples': 9100416, 'steps': 47397, 'loss/train': 1.39937162399292} -11/07/2021 03:55:26 - INFO - __main__ - Step 47399: {'lr': 0.00039262900133168544, 'samples': 9100608, 'steps': 47398, 'loss/train': 1.6870687007904053} -11/07/2021 03:55:27 - INFO - __main__ - Step 47400: {'lr': 0.0003926246429421497, 'samples': 9100800, 'steps': 47399, 'loss/train': 1.5279653072357178} -11/07/2021 03:55:28 - INFO - __main__ - Step 47401: {'lr': 0.00039262028448834964, 'samples': 9100992, 'steps': 47400, 'loss/train': 1.6076257228851318} -11/07/2021 03:55:28 - INFO - __main__ - Step 47402: {'lr': 0.00039261592597028696, 'samples': 9101184, 'steps': 47401, 'loss/train': 1.4856348037719727} -11/07/2021 03:55:28 - INFO - __main__ - Step 47403: {'lr': 0.0003926115673879638, 'samples': 9101376, 'steps': 47402, 'loss/train': 1.4722977876663208} -11/07/2021 03:55:29 - INFO - __main__ - Step 47404: {'lr': 0.000392607208741382, 'samples': 9101568, 'steps': 47403, 'loss/train': 1.549590826034546} -11/07/2021 03:55:29 - INFO - __main__ - Step 47405: {'lr': 0.00039260285003054365, 'samples': 9101760, 'steps': 47404, 'loss/train': 1.8400324583053589} -11/07/2021 03:55:30 - INFO - __main__ - Step 47406: {'lr': 0.0003925984912554507, 'samples': 9101952, 'steps': 47405, 'loss/train': 1.9346383810043335} -11/07/2021 03:55:31 - INFO - __main__ - Step 47407: {'lr': 0.00039259413241610495, 'samples': 9102144, 'steps': 47406, 'loss/train': 1.3195863962173462} -11/07/2021 03:55:31 - INFO - __main__ - Step 47408: {'lr': 0.0003925897735125086, 'samples': 9102336, 'steps': 47407, 'loss/train': 5.765100479125977} -11/07/2021 03:55:31 - INFO - __main__ - Step 47409: {'lr': 0.00039258541454466344, 'samples': 9102528, 'steps': 47408, 'loss/train': 1.1543376445770264} -11/07/2021 03:55:32 - INFO - __main__ - Step 47410: {'lr': 0.0003925810555125715, 'samples': 9102720, 'steps': 47409, 'loss/train': 1.2631092071533203} -11/07/2021 03:55:33 - INFO - __main__ - Step 47411: {'lr': 0.00039257669641623474, 'samples': 9102912, 'steps': 47410, 'loss/train': 1.3123632669448853} -11/07/2021 03:55:33 - INFO - __main__ - Step 47412: {'lr': 0.0003925723372556551, 'samples': 9103104, 'steps': 47411, 'loss/train': 2.1971917152404785} -11/07/2021 03:55:34 - INFO - __main__ - Step 47413: {'lr': 0.00039256797803083457, 'samples': 9103296, 'steps': 47412, 'loss/train': 0.8656166791915894} -11/07/2021 03:55:34 - INFO - __main__ - Step 47414: {'lr': 0.00039256361874177517, 'samples': 9103488, 'steps': 47413, 'loss/train': 1.8716926574707031} -11/07/2021 03:55:34 - INFO - __main__ - Step 47415: {'lr': 0.0003925592593884787, 'samples': 9103680, 'steps': 47414, 'loss/train': 1.5350236892700195} -11/07/2021 03:55:35 - INFO - __main__ - Step 47416: {'lr': 0.0003925548999709473, 'samples': 9103872, 'steps': 47415, 'loss/train': 1.506656527519226} -11/07/2021 03:55:36 - INFO - __main__ - Step 47417: {'lr': 0.00039255054048918284, 'samples': 9104064, 'steps': 47416, 'loss/train': 0.6237403154373169} -11/07/2021 03:55:36 - INFO - __main__ - Step 47418: {'lr': 0.00039254618094318726, 'samples': 9104256, 'steps': 47417, 'loss/train': 1.6589988470077515} -11/07/2021 03:55:36 - INFO - __main__ - Step 47419: {'lr': 0.0003925418213329627, 'samples': 9104448, 'steps': 47418, 'loss/train': 1.7542097568511963} -11/07/2021 03:55:37 - INFO - __main__ - Step 47420: {'lr': 0.0003925374616585109, 'samples': 9104640, 'steps': 47419, 'loss/train': 1.64899480342865} -11/07/2021 03:55:37 - INFO - __main__ - Step 47421: {'lr': 0.00039253310191983393, 'samples': 9104832, 'steps': 47420, 'loss/train': 1.9085698127746582} -11/07/2021 03:55:38 - INFO - __main__ - Step 47422: {'lr': 0.0003925287421169337, 'samples': 9105024, 'steps': 47421, 'loss/train': 1.615214228630066} -11/07/2021 03:55:38 - INFO - __main__ - Step 47423: {'lr': 0.00039252438224981237, 'samples': 9105216, 'steps': 47422, 'loss/train': 1.4789481163024902} -11/07/2021 03:55:39 - INFO - __main__ - Step 47424: {'lr': 0.0003925200223184716, 'samples': 9105408, 'steps': 47423, 'loss/train': 1.1823432445526123} -11/07/2021 03:55:39 - INFO - __main__ - Step 47425: {'lr': 0.0003925156623229136, 'samples': 9105600, 'steps': 47424, 'loss/train': 1.7379939556121826} -11/07/2021 03:55:40 - INFO - __main__ - Step 47426: {'lr': 0.00039251130226314015, 'samples': 9105792, 'steps': 47425, 'loss/train': 1.4799647331237793} -11/07/2021 03:55:41 - INFO - __main__ - Step 47427: {'lr': 0.00039250694213915335, 'samples': 9105984, 'steps': 47426, 'loss/train': 1.6108179092407227} -11/07/2021 03:55:41 - INFO - __main__ - Step 47428: {'lr': 0.0003925025819509551, 'samples': 9106176, 'steps': 47427, 'loss/train': 1.475036382675171} -11/07/2021 03:55:41 - INFO - __main__ - Step 47429: {'lr': 0.00039249822169854745, 'samples': 9106368, 'steps': 47428, 'loss/train': 0.7688894271850586} -11/07/2021 03:55:42 - INFO - __main__ - Step 47430: {'lr': 0.0003924938613819322, 'samples': 9106560, 'steps': 47429, 'loss/train': 1.7876664400100708} -11/07/2021 03:55:42 - INFO - __main__ - Step 47431: {'lr': 0.0003924895010011115, 'samples': 9106752, 'steps': 47430, 'loss/train': 0.8254964351654053} -11/07/2021 03:55:43 - INFO - __main__ - Step 47432: {'lr': 0.0003924851405560872, 'samples': 9106944, 'steps': 47431, 'loss/train': 1.0238627195358276} -11/07/2021 03:55:43 - INFO - __main__ - Step 47433: {'lr': 0.00039248078004686126, 'samples': 9107136, 'steps': 47432, 'loss/train': 1.3875761032104492} -11/07/2021 03:55:44 - INFO - __main__ - Step 47434: {'lr': 0.00039247641947343575, 'samples': 9107328, 'steps': 47433, 'loss/train': 1.2660794258117676} -11/07/2021 03:55:44 - INFO - __main__ - Step 47435: {'lr': 0.0003924720588358126, 'samples': 9107520, 'steps': 47434, 'loss/train': 1.3477479219436646} -11/07/2021 03:55:45 - INFO - __main__ - Step 47436: {'lr': 0.0003924676981339936, 'samples': 9107712, 'steps': 47435, 'loss/train': 1.7307621240615845} -11/07/2021 03:55:45 - INFO - __main__ - Step 47437: {'lr': 0.00039246333736798095, 'samples': 9107904, 'steps': 47436, 'loss/train': 1.5367916822433472} -11/07/2021 03:55:46 - INFO - __main__ - Step 47438: {'lr': 0.0003924589765377765, 'samples': 9108096, 'steps': 47437, 'loss/train': 1.5305283069610596} -11/07/2021 03:55:46 - INFO - __main__ - Step 47439: {'lr': 0.00039245461564338223, 'samples': 9108288, 'steps': 47438, 'loss/train': 1.7045104503631592} -11/07/2021 03:55:47 - INFO - __main__ - Step 47440: {'lr': 0.00039245025468480013, 'samples': 9108480, 'steps': 47439, 'loss/train': 1.171530842781067} -11/07/2021 03:55:47 - INFO - __main__ - Step 47441: {'lr': 0.00039244589366203207, 'samples': 9108672, 'steps': 47440, 'loss/train': 0.5102721452713013} -11/07/2021 03:55:47 - INFO - __main__ - Step 47442: {'lr': 0.0003924415325750802, 'samples': 9108864, 'steps': 47441, 'loss/train': 1.3438969850540161} -11/07/2021 03:55:48 - INFO - __main__ - Step 47443: {'lr': 0.0003924371714239463, 'samples': 9109056, 'steps': 47442, 'loss/train': 1.5555357933044434} -11/07/2021 03:55:49 - INFO - __main__ - Step 47444: {'lr': 0.0003924328102086324, 'samples': 9109248, 'steps': 47443, 'loss/train': 1.4037777185440063} -11/07/2021 03:55:49 - INFO - __main__ - Step 47445: {'lr': 0.0003924284489291405, 'samples': 9109440, 'steps': 47444, 'loss/train': 1.8709050416946411} -11/07/2021 03:55:49 - INFO - __main__ - Step 47446: {'lr': 0.00039242408758547256, 'samples': 9109632, 'steps': 47445, 'loss/train': 1.5296556949615479} -11/07/2021 03:55:50 - INFO - __main__ - Step 47447: {'lr': 0.0003924197261776304, 'samples': 9109824, 'steps': 47446, 'loss/train': 1.7294964790344238} -11/07/2021 03:55:50 - INFO - __main__ - Step 47448: {'lr': 0.0003924153647056163, 'samples': 9110016, 'steps': 47447, 'loss/train': 1.8322336673736572} -11/07/2021 03:55:51 - INFO - __main__ - Step 47449: {'lr': 0.0003924110031694319, 'samples': 9110208, 'steps': 47448, 'loss/train': 1.8327605724334717} -11/07/2021 03:55:51 - INFO - __main__ - Step 47450: {'lr': 0.00039240664156907937, 'samples': 9110400, 'steps': 47449, 'loss/train': 1.2270948886871338} -11/07/2021 03:55:52 - INFO - __main__ - Step 47451: {'lr': 0.00039240227990456055, 'samples': 9110592, 'steps': 47450, 'loss/train': 1.0061084032058716} -11/07/2021 03:55:52 - INFO - __main__ - Step 47452: {'lr': 0.00039239791817587746, 'samples': 9110784, 'steps': 47451, 'loss/train': 1.542582631111145} -11/07/2021 03:55:52 - INFO - __main__ - Step 47453: {'lr': 0.0003923935563830321, 'samples': 9110976, 'steps': 47452, 'loss/train': 1.3199650049209595} -11/07/2021 03:55:53 - INFO - __main__ - Step 47454: {'lr': 0.0003923891945260264, 'samples': 9111168, 'steps': 47453, 'loss/train': 1.102708101272583} -11/07/2021 03:55:54 - INFO - __main__ - Step 47455: {'lr': 0.00039238483260486235, 'samples': 9111360, 'steps': 47454, 'loss/train': 0.989068865776062} -11/07/2021 03:55:54 - INFO - __main__ - Step 47456: {'lr': 0.0003923804706195418, 'samples': 9111552, 'steps': 47455, 'loss/train': 1.8135876655578613} -11/07/2021 03:55:54 - INFO - __main__ - Step 47457: {'lr': 0.0003923761085700669, 'samples': 9111744, 'steps': 47456, 'loss/train': 1.2370156049728394} -11/07/2021 03:55:55 - INFO - __main__ - Step 47458: {'lr': 0.0003923717464564395, 'samples': 9111936, 'steps': 47457, 'loss/train': 0.9308407306671143} -11/07/2021 03:55:56 - INFO - __main__ - Step 47459: {'lr': 0.00039236738427866154, 'samples': 9112128, 'steps': 47458, 'loss/train': 0.8917006850242615} -11/07/2021 03:55:56 - INFO - __main__ - Step 47460: {'lr': 0.000392363022036735, 'samples': 9112320, 'steps': 47459, 'loss/train': 1.387584924697876} -11/07/2021 03:55:57 - INFO - __main__ - Step 47461: {'lr': 0.00039235865973066196, 'samples': 9112512, 'steps': 47460, 'loss/train': 1.2784820795059204} -11/07/2021 03:55:57 - INFO - __main__ - Step 47462: {'lr': 0.00039235429736044435, 'samples': 9112704, 'steps': 47461, 'loss/train': 1.7527347803115845} -11/07/2021 03:55:58 - INFO - __main__ - Step 47463: {'lr': 0.00039234993492608404, 'samples': 9112896, 'steps': 47462, 'loss/train': 1.625871181488037} -11/07/2021 03:55:58 - INFO - __main__ - Step 47464: {'lr': 0.0003923455724275831, 'samples': 9113088, 'steps': 47463, 'loss/train': 1.7436282634735107} -11/07/2021 03:55:59 - INFO - __main__ - Step 47465: {'lr': 0.0003923412098649433, 'samples': 9113280, 'steps': 47464, 'loss/train': 1.4446229934692383} -11/07/2021 03:55:59 - INFO - __main__ - Step 47466: {'lr': 0.0003923368472381668, 'samples': 9113472, 'steps': 47465, 'loss/train': 1.7699695825576782} -11/07/2021 03:56:00 - INFO - __main__ - Step 47467: {'lr': 0.0003923324845472556, 'samples': 9113664, 'steps': 47466, 'loss/train': 1.5300990343093872} -11/07/2021 03:56:00 - INFO - __main__ - Step 47468: {'lr': 0.0003923281217922115, 'samples': 9113856, 'steps': 47467, 'loss/train': 1.4730432033538818} -11/07/2021 03:56:01 - INFO - __main__ - Step 47469: {'lr': 0.0003923237589730366, 'samples': 9114048, 'steps': 47468, 'loss/train': 1.4974443912506104} -11/07/2021 03:56:01 - INFO - __main__ - Step 47470: {'lr': 0.00039231939608973276, 'samples': 9114240, 'steps': 47469, 'loss/train': 1.9974877834320068} -11/07/2021 03:56:02 - INFO - __main__ - Step 47471: {'lr': 0.000392315033142302, 'samples': 9114432, 'steps': 47470, 'loss/train': 1.3896907567977905} -11/07/2021 03:56:02 - INFO - __main__ - Step 47472: {'lr': 0.0003923106701307463, 'samples': 9114624, 'steps': 47471, 'loss/train': 1.5565924644470215} -11/07/2021 03:56:02 - INFO - __main__ - Step 47473: {'lr': 0.0003923063070550676, 'samples': 9114816, 'steps': 47472, 'loss/train': 1.4438856840133667} -11/07/2021 03:56:03 - INFO - __main__ - Step 47474: {'lr': 0.00039230194391526784, 'samples': 9115008, 'steps': 47473, 'loss/train': 1.4795085191726685} -11/07/2021 03:56:04 - INFO - __main__ - Step 47475: {'lr': 0.00039229758071134907, 'samples': 9115200, 'steps': 47474, 'loss/train': 2.37557053565979} -11/07/2021 03:56:04 - INFO - __main__ - Step 47476: {'lr': 0.0003922932174433132, 'samples': 9115392, 'steps': 47475, 'loss/train': 1.6281499862670898} -11/07/2021 03:56:04 - INFO - __main__ - Step 47477: {'lr': 0.0003922888541111622, 'samples': 9115584, 'steps': 47476, 'loss/train': 1.0745799541473389} -11/07/2021 03:56:05 - INFO - __main__ - Step 47478: {'lr': 0.00039228449071489804, 'samples': 9115776, 'steps': 47477, 'loss/train': 1.604480266571045} -11/07/2021 03:56:06 - INFO - __main__ - Step 47479: {'lr': 0.0003922801272545227, 'samples': 9115968, 'steps': 47478, 'loss/train': 1.740954041481018} -11/07/2021 03:56:06 - INFO - __main__ - Step 47480: {'lr': 0.000392275763730038, 'samples': 9116160, 'steps': 47479, 'loss/train': 1.3065632581710815} -11/07/2021 03:56:07 - INFO - __main__ - Step 47481: {'lr': 0.00039227140014144615, 'samples': 9116352, 'steps': 47480, 'loss/train': 1.776518702507019} -11/07/2021 03:56:07 - INFO - __main__ - Step 47482: {'lr': 0.00039226703648874905, 'samples': 9116544, 'steps': 47481, 'loss/train': 1.07040274143219} -11/07/2021 03:56:07 - INFO - __main__ - Step 47483: {'lr': 0.00039226267277194855, 'samples': 9116736, 'steps': 47482, 'loss/train': 1.2167857885360718} -11/07/2021 03:56:08 - INFO - __main__ - Step 47484: {'lr': 0.0003922583089910467, 'samples': 9116928, 'steps': 47483, 'loss/train': 1.297946810722351} -11/07/2021 03:56:09 - INFO - __main__ - Step 47485: {'lr': 0.0003922539451460454, 'samples': 9117120, 'steps': 47484, 'loss/train': 1.4696154594421387} -11/07/2021 03:56:09 - INFO - __main__ - Step 47486: {'lr': 0.00039224958123694676, 'samples': 9117312, 'steps': 47485, 'loss/train': 1.5161038637161255} -11/07/2021 03:56:09 - INFO - __main__ - Step 47487: {'lr': 0.0003922452172637526, 'samples': 9117504, 'steps': 47486, 'loss/train': 0.7221962809562683} -11/07/2021 03:56:10 - INFO - __main__ - Step 47488: {'lr': 0.000392240853226465, 'samples': 9117696, 'steps': 47487, 'loss/train': 1.6920087337493896} -11/07/2021 03:56:11 - INFO - __main__ - Step 47489: {'lr': 0.0003922364891250858, 'samples': 9117888, 'steps': 47488, 'loss/train': 1.1007860898971558} -11/07/2021 03:56:11 - INFO - __main__ - Step 47490: {'lr': 0.00039223212495961704, 'samples': 9118080, 'steps': 47489, 'loss/train': 1.5745450258255005} -11/07/2021 03:56:11 - INFO - __main__ - Step 47491: {'lr': 0.0003922277607300607, 'samples': 9118272, 'steps': 47490, 'loss/train': 0.9680019021034241} -11/07/2021 03:56:12 - INFO - __main__ - Step 47492: {'lr': 0.0003922233964364187, 'samples': 9118464, 'steps': 47491, 'loss/train': 1.7139664888381958} -11/07/2021 03:56:12 - INFO - __main__ - Step 47493: {'lr': 0.000392219032078693, 'samples': 9118656, 'steps': 47492, 'loss/train': 1.9633903503417969} -11/07/2021 03:56:13 - INFO - __main__ - Step 47494: {'lr': 0.0003922146676568856, 'samples': 9118848, 'steps': 47493, 'loss/train': 1.7013767957687378} -11/07/2021 03:56:13 - INFO - __main__ - Step 47495: {'lr': 0.0003922103031709986, 'samples': 9119040, 'steps': 47494, 'loss/train': 1.2616795301437378} -11/07/2021 03:56:14 - INFO - __main__ - Step 47496: {'lr': 0.0003922059386210337, 'samples': 9119232, 'steps': 47495, 'loss/train': 1.4971474409103394} -11/07/2021 03:56:14 - INFO - __main__ - Step 47497: {'lr': 0.0003922015740069931, 'samples': 9119424, 'steps': 47496, 'loss/train': 0.1893942803144455} -11/07/2021 03:56:15 - INFO - __main__ - Step 47498: {'lr': 0.0003921972093288786, 'samples': 9119616, 'steps': 47497, 'loss/train': 1.8189650774002075} -11/07/2021 03:56:15 - INFO - __main__ - Step 47499: {'lr': 0.00039219284458669217, 'samples': 9119808, 'steps': 47498, 'loss/train': 1.4831254482269287} -11/07/2021 03:56:16 - INFO - __main__ - Step 47500: {'lr': 0.00039218847978043594, 'samples': 9120000, 'steps': 47499, 'loss/train': 1.6738368272781372} -11/07/2021 03:56:16 - INFO - __main__ - Step 47501: {'lr': 0.00039218411491011176, 'samples': 9120192, 'steps': 47500, 'loss/train': 1.4098420143127441} -11/07/2021 03:56:17 - INFO - __main__ - Step 47502: {'lr': 0.0003921797499757216, 'samples': 9120384, 'steps': 47501, 'loss/train': 1.5153719186782837} -11/07/2021 03:56:17 - INFO - __main__ - Step 47503: {'lr': 0.0003921753849772674, 'samples': 9120576, 'steps': 47502, 'loss/train': 1.432418942451477} -11/07/2021 03:56:17 - INFO - __main__ - Step 47504: {'lr': 0.0003921710199147512, 'samples': 9120768, 'steps': 47503, 'loss/train': 1.4112839698791504} -11/07/2021 03:56:18 - INFO - __main__ - Step 47505: {'lr': 0.0003921666547881749, 'samples': 9120960, 'steps': 47504, 'loss/train': 1.5197889804840088} -11/07/2021 03:56:19 - INFO - __main__ - Step 47506: {'lr': 0.00039216228959754055, 'samples': 9121152, 'steps': 47505, 'loss/train': 1.8048980236053467} -11/07/2021 03:56:19 - INFO - __main__ - Step 47507: {'lr': 0.00039215792434285, 'samples': 9121344, 'steps': 47506, 'loss/train': 1.5157513618469238} -11/07/2021 03:56:19 - INFO - __main__ - Step 47508: {'lr': 0.00039215355902410534, 'samples': 9121536, 'steps': 47507, 'loss/train': 1.1093748807907104} -11/07/2021 03:56:20 - INFO - __main__ - Step 47509: {'lr': 0.0003921491936413085, 'samples': 9121728, 'steps': 47508, 'loss/train': 1.6741187572479248} -11/07/2021 03:56:21 - INFO - __main__ - Step 47510: {'lr': 0.0003921448281944614, 'samples': 9121920, 'steps': 47509, 'loss/train': 1.2055332660675049} -11/07/2021 03:56:21 - INFO - __main__ - Step 47511: {'lr': 0.000392140462683566, 'samples': 9122112, 'steps': 47510, 'loss/train': 1.3611558675765991} -11/07/2021 03:56:22 - INFO - __main__ - Step 47512: {'lr': 0.0003921360971086243, 'samples': 9122304, 'steps': 47511, 'loss/train': 1.3768153190612793} -11/07/2021 03:56:22 - INFO - __main__ - Step 47513: {'lr': 0.0003921317314696383, 'samples': 9122496, 'steps': 47512, 'loss/train': 1.7975044250488281} -11/07/2021 03:56:22 - INFO - __main__ - Step 47514: {'lr': 0.0003921273657666099, 'samples': 9122688, 'steps': 47513, 'loss/train': 1.3423588275909424} -11/07/2021 03:56:23 - INFO - __main__ - Step 47515: {'lr': 0.0003921229999995412, 'samples': 9122880, 'steps': 47514, 'loss/train': 1.1245650053024292} -11/07/2021 03:56:24 - INFO - __main__ - Step 47516: {'lr': 0.000392118634168434, 'samples': 9123072, 'steps': 47515, 'loss/train': 0.41801056265830994} -11/07/2021 03:56:24 - INFO - __main__ - Step 47517: {'lr': 0.00039211426827329035, 'samples': 9123264, 'steps': 47516, 'loss/train': 0.7599082589149475} -11/07/2021 03:56:24 - INFO - __main__ - Step 47518: {'lr': 0.0003921099023141121, 'samples': 9123456, 'steps': 47517, 'loss/train': 1.2782249450683594} -11/07/2021 03:56:25 - INFO - __main__ - Step 47519: {'lr': 0.0003921055362909015, 'samples': 9123648, 'steps': 47518, 'loss/train': 1.3840163946151733} -11/07/2021 03:56:25 - INFO - __main__ - Step 47520: {'lr': 0.0003921011702036602, 'samples': 9123840, 'steps': 47519, 'loss/train': 0.9894071817398071} -11/07/2021 03:56:26 - INFO - __main__ - Step 47521: {'lr': 0.00039209680405239035, 'samples': 9124032, 'steps': 47520, 'loss/train': 1.6704676151275635} -11/07/2021 03:56:26 - INFO - __main__ - Step 47522: {'lr': 0.0003920924378370939, 'samples': 9124224, 'steps': 47521, 'loss/train': 1.1027514934539795} -11/07/2021 03:56:27 - INFO - __main__ - Step 47523: {'lr': 0.0003920880715577728, 'samples': 9124416, 'steps': 47522, 'loss/train': 1.4846141338348389} -11/07/2021 03:56:27 - INFO - __main__ - Step 47524: {'lr': 0.00039208370521442895, 'samples': 9124608, 'steps': 47523, 'loss/train': 1.6287258863449097} -11/07/2021 03:56:28 - INFO - __main__ - Step 47525: {'lr': 0.0003920793388070644, 'samples': 9124800, 'steps': 47524, 'loss/train': 0.7328007221221924} -11/07/2021 03:56:29 - INFO - __main__ - Step 47526: {'lr': 0.0003920749723356811, 'samples': 9124992, 'steps': 47525, 'loss/train': 1.7460342645645142} -11/07/2021 03:56:29 - INFO - __main__ - Step 47527: {'lr': 0.000392070605800281, 'samples': 9125184, 'steps': 47526, 'loss/train': 1.5260841846466064} -11/07/2021 03:56:29 - INFO - __main__ - Step 47528: {'lr': 0.00039206623920086603, 'samples': 9125376, 'steps': 47527, 'loss/train': 1.522653579711914} -11/07/2021 03:56:30 - INFO - __main__ - Step 47529: {'lr': 0.0003920618725374383, 'samples': 9125568, 'steps': 47528, 'loss/train': 1.4565163850784302} -11/07/2021 03:56:30 - INFO - __main__ - Step 47530: {'lr': 0.00039205750580999964, 'samples': 9125760, 'steps': 47529, 'loss/train': 1.4106204509735107} -11/07/2021 03:56:31 - INFO - __main__ - Step 47531: {'lr': 0.0003920531390185521, 'samples': 9125952, 'steps': 47530, 'loss/train': 1.9258077144622803} -11/07/2021 03:56:31 - INFO - __main__ - Step 47532: {'lr': 0.00039204877216309755, 'samples': 9126144, 'steps': 47531, 'loss/train': 1.7408628463745117} -11/07/2021 03:56:32 - INFO - __main__ - Step 47533: {'lr': 0.00039204440524363805, 'samples': 9126336, 'steps': 47532, 'loss/train': 1.299311637878418} -11/07/2021 03:56:32 - INFO - __main__ - Step 47534: {'lr': 0.0003920400382601755, 'samples': 9126528, 'steps': 47533, 'loss/train': 1.6594051122665405} -11/07/2021 03:56:32 - INFO - __main__ - Step 47535: {'lr': 0.00039203567121271187, 'samples': 9126720, 'steps': 47534, 'loss/train': 1.7957714796066284} -11/07/2021 03:56:34 - INFO - __main__ - Step 47536: {'lr': 0.00039203130410124927, 'samples': 9126912, 'steps': 47535, 'loss/train': 2.0496859550476074} -11/07/2021 03:56:34 - INFO - __main__ - Step 47537: {'lr': 0.0003920269369257895, 'samples': 9127104, 'steps': 47536, 'loss/train': 1.5177720785140991} -11/07/2021 03:56:34 - INFO - __main__ - Step 47538: {'lr': 0.0003920225696863345, 'samples': 9127296, 'steps': 47537, 'loss/train': 1.370882272720337} -11/07/2021 03:56:35 - INFO - __main__ - Step 47539: {'lr': 0.00039201820238288644, 'samples': 9127488, 'steps': 47538, 'loss/train': 1.5021008253097534} -11/07/2021 03:56:35 - INFO - __main__ - Step 47540: {'lr': 0.00039201383501544706, 'samples': 9127680, 'steps': 47539, 'loss/train': 1.5323901176452637} -11/07/2021 03:56:36 - INFO - __main__ - Step 47541: {'lr': 0.00039200946758401856, 'samples': 9127872, 'steps': 47540, 'loss/train': 1.6588393449783325} -11/07/2021 03:56:36 - INFO - __main__ - Step 47542: {'lr': 0.00039200510008860273, 'samples': 9128064, 'steps': 47541, 'loss/train': 1.0969041585922241} -11/07/2021 03:56:37 - INFO - __main__ - Step 47543: {'lr': 0.0003920007325292016, 'samples': 9128256, 'steps': 47542, 'loss/train': 1.2662030458450317} -11/07/2021 03:56:37 - INFO - __main__ - Step 47544: {'lr': 0.00039199636490581713, 'samples': 9128448, 'steps': 47543, 'loss/train': 1.4820476770401} -11/07/2021 03:56:37 - INFO - __main__ - Step 47545: {'lr': 0.00039199199721845127, 'samples': 9128640, 'steps': 47544, 'loss/train': 0.8880251049995422} -11/07/2021 03:56:38 - INFO - __main__ - Step 47546: {'lr': 0.000391987629467106, 'samples': 9128832, 'steps': 47545, 'loss/train': 1.5734833478927612} -11/07/2021 03:56:39 - INFO - __main__ - Step 47547: {'lr': 0.00039198326165178335, 'samples': 9129024, 'steps': 47546, 'loss/train': 1.2641962766647339} -11/07/2021 03:56:39 - INFO - __main__ - Step 47548: {'lr': 0.0003919788937724852, 'samples': 9129216, 'steps': 47547, 'loss/train': 1.4985029697418213} -11/07/2021 03:56:39 - INFO - __main__ - Step 47549: {'lr': 0.0003919745258292135, 'samples': 9129408, 'steps': 47548, 'loss/train': 1.4992035627365112} -11/07/2021 03:56:40 - INFO - __main__ - Step 47550: {'lr': 0.00039197015782197034, 'samples': 9129600, 'steps': 47549, 'loss/train': 1.4774483442306519} -11/07/2021 03:56:40 - INFO - __main__ - Step 47551: {'lr': 0.0003919657897507576, 'samples': 9129792, 'steps': 47550, 'loss/train': 1.6427239179611206} -11/07/2021 03:56:41 - INFO - __main__ - Step 47552: {'lr': 0.0003919614216155772, 'samples': 9129984, 'steps': 47551, 'loss/train': 1.5218361616134644} -11/07/2021 03:56:42 - INFO - __main__ - Step 47553: {'lr': 0.0003919570534164313, 'samples': 9130176, 'steps': 47552, 'loss/train': 1.2969653606414795} -11/07/2021 03:56:42 - INFO - __main__ - Step 47554: {'lr': 0.0003919526851533216, 'samples': 9130368, 'steps': 47553, 'loss/train': 1.785011887550354} -11/07/2021 03:56:42 - INFO - __main__ - Step 47555: {'lr': 0.00039194831682625033, 'samples': 9130560, 'steps': 47554, 'loss/train': 1.4270840883255005} -11/07/2021 03:56:43 - INFO - __main__ - Step 47556: {'lr': 0.0003919439484352193, 'samples': 9130752, 'steps': 47555, 'loss/train': 0.7276812791824341} -11/07/2021 03:56:44 - INFO - __main__ - Step 47557: {'lr': 0.00039193957998023057, 'samples': 9130944, 'steps': 47556, 'loss/train': 1.7058446407318115} -11/07/2021 03:56:44 - INFO - __main__ - Step 47558: {'lr': 0.000391935211461286, 'samples': 9131136, 'steps': 47557, 'loss/train': 1.4903485774993896} -11/07/2021 03:56:44 - INFO - __main__ - Step 47559: {'lr': 0.00039193084287838755, 'samples': 9131328, 'steps': 47558, 'loss/train': 1.2844045162200928} -11/07/2021 03:56:45 - INFO - __main__ - Step 47560: {'lr': 0.0003919264742315373, 'samples': 9131520, 'steps': 47559, 'loss/train': 1.8127259016036987} -11/07/2021 03:56:45 - INFO - __main__ - Step 47561: {'lr': 0.00039192210552073723, 'samples': 9131712, 'steps': 47560, 'loss/train': 1.9596339464187622} -11/07/2021 03:56:46 - INFO - __main__ - Step 47562: {'lr': 0.0003919177367459892, 'samples': 9131904, 'steps': 47561, 'loss/train': 1.9238076210021973} -11/07/2021 03:56:47 - INFO - __main__ - Step 47563: {'lr': 0.00039191336790729526, 'samples': 9132096, 'steps': 47562, 'loss/train': 1.9140310287475586} -11/07/2021 03:56:47 - INFO - __main__ - Step 47564: {'lr': 0.00039190899900465727, 'samples': 9132288, 'steps': 47563, 'loss/train': 1.6951509714126587} -11/07/2021 03:56:47 - INFO - __main__ - Step 47565: {'lr': 0.0003919046300380773, 'samples': 9132480, 'steps': 47564, 'loss/train': 0.3123338520526886} -11/07/2021 03:56:48 - INFO - __main__ - Step 47566: {'lr': 0.00039190026100755735, 'samples': 9132672, 'steps': 47565, 'loss/train': 1.3794103860855103} -11/07/2021 03:56:49 - INFO - __main__ - Step 47567: {'lr': 0.00039189589191309927, 'samples': 9132864, 'steps': 47566, 'loss/train': 0.9913450479507446} -11/07/2021 03:56:49 - INFO - __main__ - Step 47568: {'lr': 0.00039189152275470514, 'samples': 9133056, 'steps': 47567, 'loss/train': 0.6241242289543152} -11/07/2021 03:56:49 - INFO - __main__ - Step 47569: {'lr': 0.0003918871535323769, 'samples': 9133248, 'steps': 47568, 'loss/train': 1.2644298076629639} -11/07/2021 03:56:50 - INFO - __main__ - Step 47570: {'lr': 0.0003918827842461165, 'samples': 9133440, 'steps': 47569, 'loss/train': 1.5793612003326416} -11/07/2021 03:56:50 - INFO - __main__ - Step 47571: {'lr': 0.0003918784148959258, 'samples': 9133632, 'steps': 47570, 'loss/train': 0.8174675107002258} -11/07/2021 03:56:51 - INFO - __main__ - Step 47572: {'lr': 0.0003918740454818069, 'samples': 9133824, 'steps': 47571, 'loss/train': 1.1769851446151733} -11/07/2021 03:56:52 - INFO - __main__ - Step 47573: {'lr': 0.0003918696760037618, 'samples': 9134016, 'steps': 47572, 'loss/train': 1.6718579530715942} -11/07/2021 03:56:52 - INFO - __main__ - Step 47574: {'lr': 0.0003918653064617924, 'samples': 9134208, 'steps': 47573, 'loss/train': 1.5838192701339722} -11/07/2021 03:56:52 - INFO - __main__ - Step 47575: {'lr': 0.00039186093685590064, 'samples': 9134400, 'steps': 47574, 'loss/train': 1.1955496072769165} -11/07/2021 03:56:53 - INFO - __main__ - Step 47576: {'lr': 0.0003918565671860886, 'samples': 9134592, 'steps': 47575, 'loss/train': 1.5702279806137085} -11/07/2021 03:56:53 - INFO - __main__ - Step 47577: {'lr': 0.00039185219745235816, 'samples': 9134784, 'steps': 47576, 'loss/train': 1.6203112602233887} -11/07/2021 03:56:54 - INFO - __main__ - Step 47578: {'lr': 0.0003918478276547113, 'samples': 9134976, 'steps': 47577, 'loss/train': 1.670324444770813} -11/07/2021 03:56:54 - INFO - __main__ - Step 47579: {'lr': 0.00039184345779315, 'samples': 9135168, 'steps': 47578, 'loss/train': 1.572860836982727} -11/07/2021 03:56:55 - INFO - __main__ - Step 47580: {'lr': 0.0003918390878676762, 'samples': 9135360, 'steps': 47579, 'loss/train': 1.5355112552642822} -11/07/2021 03:56:55 - INFO - __main__ - Step 47581: {'lr': 0.00039183471787829194, 'samples': 9135552, 'steps': 47580, 'loss/train': 1.6907731294631958} -11/07/2021 03:56:56 - INFO - __main__ - Step 47582: {'lr': 0.0003918303478249991, 'samples': 9135744, 'steps': 47581, 'loss/train': 1.6832005977630615} -11/07/2021 03:56:57 - INFO - __main__ - Step 47583: {'lr': 0.0003918259777077997, 'samples': 9135936, 'steps': 47582, 'loss/train': 1.2778152227401733} -11/07/2021 03:56:57 - INFO - __main__ - Step 47584: {'lr': 0.00039182160752669577, 'samples': 9136128, 'steps': 47583, 'loss/train': 1.6662622690200806} -11/07/2021 03:56:58 - INFO - __main__ - Step 47585: {'lr': 0.0003918172372816892, 'samples': 9136320, 'steps': 47584, 'loss/train': 1.4052339792251587} -11/07/2021 03:56:58 - INFO - __main__ - Step 47586: {'lr': 0.0003918128669727818, 'samples': 9136512, 'steps': 47585, 'loss/train': 0.2713298201560974} -11/07/2021 03:56:58 - INFO - __main__ - Step 47587: {'lr': 0.00039180849659997593, 'samples': 9136704, 'steps': 47586, 'loss/train': 0.8063874840736389} -11/07/2021 03:57:00 - INFO - __main__ - Step 47588: {'lr': 0.00039180412616327323, 'samples': 9136896, 'steps': 47587, 'loss/train': 1.20669424533844} -11/07/2021 03:57:00 - INFO - __main__ - Step 47589: {'lr': 0.00039179975566267585, 'samples': 9137088, 'steps': 47588, 'loss/train': 1.0589284896850586} -11/07/2021 03:57:00 - INFO - __main__ - Step 47590: {'lr': 0.00039179538509818556, 'samples': 9137280, 'steps': 47589, 'loss/train': 1.230054259300232} -11/07/2021 03:57:01 - INFO - __main__ - Step 47591: {'lr': 0.0003917910144698046, 'samples': 9137472, 'steps': 47590, 'loss/train': 2.2915971279144287} -11/07/2021 03:57:01 - INFO - __main__ - Step 47592: {'lr': 0.0003917866437775347, 'samples': 9137664, 'steps': 47591, 'loss/train': 1.0403106212615967} -11/07/2021 03:57:02 - INFO - __main__ - Step 47593: {'lr': 0.000391782273021378, 'samples': 9137856, 'steps': 47592, 'loss/train': 1.5003052949905396} -11/07/2021 03:57:02 - INFO - __main__ - Step 47594: {'lr': 0.00039177790220133637, 'samples': 9138048, 'steps': 47593, 'loss/train': 1.8745750188827515} -11/07/2021 03:57:03 - INFO - __main__ - Step 47595: {'lr': 0.0003917735313174117, 'samples': 9138240, 'steps': 47594, 'loss/train': 1.5211420059204102} -11/07/2021 03:57:03 - INFO - __main__ - Step 47596: {'lr': 0.0003917691603696062, 'samples': 9138432, 'steps': 47595, 'loss/train': 1.5756067037582397} -11/07/2021 03:57:03 - INFO - __main__ - Step 47597: {'lr': 0.0003917647893579217, 'samples': 9138624, 'steps': 47596, 'loss/train': 1.660907506942749} -11/07/2021 03:57:04 - INFO - __main__ - Step 47598: {'lr': 0.0003917604182823601, 'samples': 9138816, 'steps': 47597, 'loss/train': 1.3687254190444946} -11/07/2021 03:57:05 - INFO - __main__ - Step 47599: {'lr': 0.00039175604714292346, 'samples': 9139008, 'steps': 47598, 'loss/train': 1.4359571933746338} -11/07/2021 03:57:05 - INFO - __main__ - Step 47600: {'lr': 0.00039175167593961377, 'samples': 9139200, 'steps': 47599, 'loss/train': 1.042655110359192} -11/07/2021 03:57:06 - INFO - __main__ - Step 47601: {'lr': 0.0003917473046724329, 'samples': 9139392, 'steps': 47600, 'loss/train': 1.4571832418441772} -11/07/2021 03:57:06 - INFO - __main__ - Step 47602: {'lr': 0.000391742933341383, 'samples': 9139584, 'steps': 47601, 'loss/train': 1.5106868743896484} -11/07/2021 03:57:06 - INFO - __main__ - Step 47603: {'lr': 0.00039173856194646585, 'samples': 9139776, 'steps': 47602, 'loss/train': 1.426308035850525} -11/07/2021 03:57:08 - INFO - __main__ - Step 47604: {'lr': 0.00039173419048768343, 'samples': 9139968, 'steps': 47603, 'loss/train': 1.333543300628662} -11/07/2021 03:57:08 - INFO - __main__ - Step 47605: {'lr': 0.0003917298189650378, 'samples': 9140160, 'steps': 47604, 'loss/train': 2.3469433784484863} -11/07/2021 03:57:08 - INFO - __main__ - Step 47606: {'lr': 0.00039172544737853097, 'samples': 9140352, 'steps': 47605, 'loss/train': 0.9758121967315674} -11/07/2021 03:57:09 - INFO - __main__ - Step 47607: {'lr': 0.00039172107572816477, 'samples': 9140544, 'steps': 47606, 'loss/train': 1.5648424625396729} -11/07/2021 03:57:09 - INFO - __main__ - Step 47608: {'lr': 0.00039171670401394134, 'samples': 9140736, 'steps': 47607, 'loss/train': 0.8682147860527039} -11/07/2021 03:57:10 - INFO - __main__ - Step 47609: {'lr': 0.00039171233223586247, 'samples': 9140928, 'steps': 47608, 'loss/train': 1.2661722898483276} -11/07/2021 03:57:10 - INFO - __main__ - Step 47610: {'lr': 0.0003917079603939302, 'samples': 9141120, 'steps': 47609, 'loss/train': 2.0972232818603516} -11/07/2021 03:57:11 - INFO - __main__ - Step 47611: {'lr': 0.0003917035884881465, 'samples': 9141312, 'steps': 47610, 'loss/train': 0.6600740551948547} -11/07/2021 03:57:11 - INFO - __main__ - Step 47612: {'lr': 0.00039169921651851337, 'samples': 9141504, 'steps': 47611, 'loss/train': 1.7421717643737793} -11/07/2021 03:57:11 - INFO - __main__ - Step 47613: {'lr': 0.0003916948444850328, 'samples': 9141696, 'steps': 47612, 'loss/train': 1.5109429359436035} -11/07/2021 03:57:12 - INFO - __main__ - Step 47614: {'lr': 0.0003916904723877067, 'samples': 9141888, 'steps': 47613, 'loss/train': 1.4767059087753296} -11/07/2021 03:57:13 - INFO - __main__ - Step 47615: {'lr': 0.000391686100226537, 'samples': 9142080, 'steps': 47614, 'loss/train': 1.5321447849273682} -11/07/2021 03:57:13 - INFO - __main__ - Step 47616: {'lr': 0.00039168172800152577, 'samples': 9142272, 'steps': 47615, 'loss/train': 1.3128496408462524} -11/07/2021 03:57:14 - INFO - __main__ - Step 47617: {'lr': 0.0003916773557126749, 'samples': 9142464, 'steps': 47616, 'loss/train': 1.225580096244812} -11/07/2021 03:57:14 - INFO - __main__ - Step 47618: {'lr': 0.00039167298335998646, 'samples': 9142656, 'steps': 47617, 'loss/train': 1.678581953048706} -11/07/2021 03:57:15 - INFO - __main__ - Step 47619: {'lr': 0.0003916686109434624, 'samples': 9142848, 'steps': 47618, 'loss/train': 1.4629886150360107} -11/07/2021 03:57:15 - INFO - __main__ - Step 47620: {'lr': 0.00039166423846310463, 'samples': 9143040, 'steps': 47619, 'loss/train': 1.1578612327575684} -11/07/2021 03:57:16 - INFO - __main__ - Step 47621: {'lr': 0.00039165986591891506, 'samples': 9143232, 'steps': 47620, 'loss/train': 1.5875498056411743} -11/07/2021 03:57:16 - INFO - __main__ - Step 47622: {'lr': 0.0003916554933108958, 'samples': 9143424, 'steps': 47621, 'loss/train': 1.1253294944763184} -11/07/2021 03:57:16 - INFO - __main__ - Step 47623: {'lr': 0.00039165112063904874, 'samples': 9143616, 'steps': 47622, 'loss/train': 0.9231517314910889} -11/07/2021 03:57:18 - INFO - __main__ - Step 47624: {'lr': 0.0003916467479033759, 'samples': 9143808, 'steps': 47623, 'loss/train': 1.4769951105117798} -11/07/2021 03:57:18 - INFO - __main__ - Step 47625: {'lr': 0.00039164237510387915, 'samples': 9144000, 'steps': 47624, 'loss/train': 1.0370756387710571} -11/07/2021 03:57:18 - INFO - __main__ - Step 47626: {'lr': 0.0003916380022405606, 'samples': 9144192, 'steps': 47625, 'loss/train': 1.2719224691390991} -11/07/2021 03:57:19 - INFO - __main__ - Step 47627: {'lr': 0.0003916336293134222, 'samples': 9144384, 'steps': 47626, 'loss/train': 2.3809704780578613} -11/07/2021 03:57:19 - INFO - __main__ - Step 47628: {'lr': 0.0003916292563224657, 'samples': 9144576, 'steps': 47627, 'loss/train': 1.146511197090149} -11/07/2021 03:57:19 - INFO - __main__ - Step 47629: {'lr': 0.00039162488326769334, 'samples': 9144768, 'steps': 47628, 'loss/train': 2.0270538330078125} -11/07/2021 03:57:21 - INFO - __main__ - Step 47630: {'lr': 0.00039162051014910706, 'samples': 9144960, 'steps': 47629, 'loss/train': 2.115088939666748} -11/07/2021 03:57:21 - INFO - __main__ - Step 47631: {'lr': 0.0003916161369667087, 'samples': 9145152, 'steps': 47630, 'loss/train': 1.8053927421569824} -11/07/2021 03:57:21 - INFO - __main__ - Step 47632: {'lr': 0.0003916117637205003, 'samples': 9145344, 'steps': 47631, 'loss/train': 1.1802260875701904} -11/07/2021 03:57:22 - INFO - __main__ - Step 47633: {'lr': 0.00039160739041048376, 'samples': 9145536, 'steps': 47632, 'loss/train': 0.5280793309211731} -11/07/2021 03:57:22 - INFO - __main__ - Step 47634: {'lr': 0.0003916030170366612, 'samples': 9145728, 'steps': 47633, 'loss/train': 1.577242136001587} -11/07/2021 03:57:23 - INFO - __main__ - Step 47635: {'lr': 0.0003915986435990345, 'samples': 9145920, 'steps': 47634, 'loss/train': 1.6110584735870361} -11/07/2021 03:57:23 - INFO - __main__ - Step 47636: {'lr': 0.0003915942700976056, 'samples': 9146112, 'steps': 47635, 'loss/train': 1.3024262189865112} -11/07/2021 03:57:24 - INFO - __main__ - Step 47637: {'lr': 0.0003915898965323765, 'samples': 9146304, 'steps': 47636, 'loss/train': 1.7504475116729736} -11/07/2021 03:57:24 - INFO - __main__ - Step 47638: {'lr': 0.00039158552290334927, 'samples': 9146496, 'steps': 47637, 'loss/train': 1.4919499158859253} -11/07/2021 03:57:24 - INFO - __main__ - Step 47639: {'lr': 0.00039158114921052567, 'samples': 9146688, 'steps': 47638, 'loss/train': 1.6135183572769165} -11/07/2021 03:57:25 - INFO - __main__ - Step 47640: {'lr': 0.0003915767754539078, 'samples': 9146880, 'steps': 47639, 'loss/train': 1.364461898803711} -11/07/2021 03:57:26 - INFO - __main__ - Step 47641: {'lr': 0.0003915724016334977, 'samples': 9147072, 'steps': 47640, 'loss/train': 1.3528691530227661} -11/07/2021 03:57:26 - INFO - __main__ - Step 47642: {'lr': 0.00039156802774929723, 'samples': 9147264, 'steps': 47641, 'loss/train': 1.877328634262085} -11/07/2021 03:57:26 - INFO - __main__ - Step 47643: {'lr': 0.00039156365380130844, 'samples': 9147456, 'steps': 47642, 'loss/train': 1.2187020778656006} -11/07/2021 03:57:27 - INFO - __main__ - Step 47644: {'lr': 0.00039155927978953316, 'samples': 9147648, 'steps': 47643, 'loss/train': 1.3663796186447144} -11/07/2021 03:57:28 - INFO - __main__ - Step 47645: {'lr': 0.00039155490571397345, 'samples': 9147840, 'steps': 47644, 'loss/train': 1.871665596961975} -11/07/2021 03:57:29 - INFO - __main__ - Step 47646: {'lr': 0.0003915505315746313, 'samples': 9148032, 'steps': 47645, 'loss/train': 2.014326333999634} -11/07/2021 03:57:29 - INFO - __main__ - Step 47647: {'lr': 0.00039154615737150867, 'samples': 9148224, 'steps': 47646, 'loss/train': 1.3724406957626343} -11/07/2021 03:57:29 - INFO - __main__ - Step 47648: {'lr': 0.00039154178310460755, 'samples': 9148416, 'steps': 47647, 'loss/train': 1.3263518810272217} -11/07/2021 03:57:30 - INFO - __main__ - Step 47649: {'lr': 0.00039153740877392987, 'samples': 9148608, 'steps': 47648, 'loss/train': 0.2772655189037323} -11/07/2021 03:57:31 - INFO - __main__ - Step 47650: {'lr': 0.0003915330343794777, 'samples': 9148800, 'steps': 47649, 'loss/train': 1.6966464519500732} -11/07/2021 03:57:31 - INFO - __main__ - Step 47651: {'lr': 0.0003915286599212529, 'samples': 9148992, 'steps': 47650, 'loss/train': 1.5087082386016846} -11/07/2021 03:57:32 - INFO - __main__ - Step 47652: {'lr': 0.0003915242853992573, 'samples': 9149184, 'steps': 47651, 'loss/train': 1.1331799030303955} -11/07/2021 03:57:32 - INFO - __main__ - Step 47653: {'lr': 0.0003915199108134932, 'samples': 9149376, 'steps': 47652, 'loss/train': 0.2149980217218399} -11/07/2021 03:57:32 - INFO - __main__ - Step 47654: {'lr': 0.00039151553616396234, 'samples': 9149568, 'steps': 47653, 'loss/train': 5.551827430725098} -11/07/2021 03:57:33 - INFO - __main__ - Step 47655: {'lr': 0.0003915111614506668, 'samples': 9149760, 'steps': 47654, 'loss/train': 1.6605746746063232} -11/07/2021 03:57:34 - INFO - __main__ - Step 47656: {'lr': 0.0003915067866736085, 'samples': 9149952, 'steps': 47655, 'loss/train': 1.5566972494125366} -11/07/2021 03:57:34 - INFO - __main__ - Step 47657: {'lr': 0.0003915024118327895, 'samples': 9150144, 'steps': 47656, 'loss/train': 1.962587594985962} -11/07/2021 03:57:34 - INFO - __main__ - Step 47658: {'lr': 0.0003914980369282116, 'samples': 9150336, 'steps': 47657, 'loss/train': 1.4869587421417236} -11/07/2021 03:57:35 - INFO - __main__ - Step 47659: {'lr': 0.0003914936619598769, 'samples': 9150528, 'steps': 47658, 'loss/train': 1.1580917835235596} -11/07/2021 03:57:36 - INFO - __main__ - Step 47660: {'lr': 0.0003914892869277873, 'samples': 9150720, 'steps': 47659, 'loss/train': 1.6406500339508057} -11/07/2021 03:57:36 - INFO - __main__ - Step 47661: {'lr': 0.0003914849118319449, 'samples': 9150912, 'steps': 47660, 'loss/train': 1.7226920127868652} -11/07/2021 03:57:37 - INFO - __main__ - Step 47662: {'lr': 0.0003914805366723515, 'samples': 9151104, 'steps': 47661, 'loss/train': 1.6189788579940796} -11/07/2021 03:57:37 - INFO - __main__ - Step 47663: {'lr': 0.0003914761614490092, 'samples': 9151296, 'steps': 47662, 'loss/train': 1.6396089792251587} -11/07/2021 03:57:37 - INFO - __main__ - Step 47664: {'lr': 0.0003914717861619199, 'samples': 9151488, 'steps': 47663, 'loss/train': 1.578438639640808} -11/07/2021 03:57:38 - INFO - __main__ - Step 47665: {'lr': 0.00039146741081108567, 'samples': 9151680, 'steps': 47664, 'loss/train': 1.9214646816253662} -11/07/2021 03:57:39 - INFO - __main__ - Step 47666: {'lr': 0.0003914630353965083, 'samples': 9151872, 'steps': 47665, 'loss/train': 1.3176829814910889} -11/07/2021 03:57:39 - INFO - __main__ - Step 47667: {'lr': 0.00039145865991818994, 'samples': 9152064, 'steps': 47666, 'loss/train': 1.5965214967727661} -11/07/2021 03:57:39 - INFO - __main__ - Step 47668: {'lr': 0.00039145428437613246, 'samples': 9152256, 'steps': 47667, 'loss/train': 1.41964852809906} -11/07/2021 03:57:40 - INFO - __main__ - Step 47669: {'lr': 0.0003914499087703379, 'samples': 9152448, 'steps': 47668, 'loss/train': 1.509716510772705} -11/07/2021 03:57:40 - INFO - __main__ - Step 47670: {'lr': 0.00039144553310080816, 'samples': 9152640, 'steps': 47669, 'loss/train': 1.100142002105713} -11/07/2021 03:57:41 - INFO - __main__ - Step 47671: {'lr': 0.0003914411573675453, 'samples': 9152832, 'steps': 47670, 'loss/train': 1.584984302520752} -11/07/2021 03:57:42 - INFO - __main__ - Step 47672: {'lr': 0.0003914367815705511, 'samples': 9153024, 'steps': 47671, 'loss/train': 1.3642358779907227} -11/07/2021 03:57:42 - INFO - __main__ - Step 47673: {'lr': 0.00039143240570982776, 'samples': 9153216, 'steps': 47672, 'loss/train': 1.5138477087020874} -11/07/2021 03:57:42 - INFO - __main__ - Step 47674: {'lr': 0.00039142802978537716, 'samples': 9153408, 'steps': 47673, 'loss/train': 1.6956623792648315} -11/07/2021 03:57:43 - INFO - __main__ - Step 47675: {'lr': 0.00039142365379720123, 'samples': 9153600, 'steps': 47674, 'loss/train': 1.4973416328430176} -11/07/2021 03:57:44 - INFO - __main__ - Step 47676: {'lr': 0.0003914192777453021, 'samples': 9153792, 'steps': 47675, 'loss/train': 1.4953629970550537} -11/07/2021 03:57:44 - INFO - __main__ - Step 47677: {'lr': 0.00039141490162968154, 'samples': 9153984, 'steps': 47676, 'loss/train': 1.174144983291626} -11/07/2021 03:57:44 - INFO - __main__ - Step 47678: {'lr': 0.0003914105254503416, 'samples': 9154176, 'steps': 47677, 'loss/train': 1.7978628873825073} -11/07/2021 03:57:45 - INFO - __main__ - Step 47679: {'lr': 0.00039140614920728424, 'samples': 9154368, 'steps': 47678, 'loss/train': 1.5725959539413452} -11/07/2021 03:57:45 - INFO - __main__ - Step 47680: {'lr': 0.0003914017729005115, 'samples': 9154560, 'steps': 47679, 'loss/train': 1.680406928062439} -11/07/2021 03:57:46 - INFO - __main__ - Step 47681: {'lr': 0.00039139739653002527, 'samples': 9154752, 'steps': 47680, 'loss/train': 0.5801538825035095} -11/07/2021 03:57:46 - INFO - __main__ - Step 47682: {'lr': 0.00039139302009582753, 'samples': 9154944, 'steps': 47681, 'loss/train': 1.4638181924819946} -11/07/2021 03:57:47 - INFO - __main__ - Step 47683: {'lr': 0.00039138864359792035, 'samples': 9155136, 'steps': 47682, 'loss/train': 1.611740231513977} -11/07/2021 03:57:47 - INFO - __main__ - Step 47684: {'lr': 0.0003913842670363056, 'samples': 9155328, 'steps': 47683, 'loss/train': 0.9025747776031494} -11/07/2021 03:57:47 - INFO - __main__ - Step 47685: {'lr': 0.0003913798904109853, 'samples': 9155520, 'steps': 47684, 'loss/train': 1.3374627828598022} -11/07/2021 03:57:49 - INFO - __main__ - Step 47686: {'lr': 0.0003913755137219614, 'samples': 9155712, 'steps': 47685, 'loss/train': 1.321630597114563} -11/07/2021 03:57:49 - INFO - __main__ - Step 47687: {'lr': 0.00039137113696923587, 'samples': 9155904, 'steps': 47686, 'loss/train': 1.7227809429168701} -11/07/2021 03:57:49 - INFO - __main__ - Step 47688: {'lr': 0.00039136676015281063, 'samples': 9156096, 'steps': 47687, 'loss/train': 0.8350129723548889} -11/07/2021 03:57:50 - INFO - __main__ - Step 47689: {'lr': 0.00039136238327268776, 'samples': 9156288, 'steps': 47688, 'loss/train': 1.270866870880127} -11/07/2021 03:57:50 - INFO - __main__ - Step 47690: {'lr': 0.0003913580063288692, 'samples': 9156480, 'steps': 47689, 'loss/train': 1.9323718547821045} -11/07/2021 03:57:51 - INFO - __main__ - Step 47691: {'lr': 0.0003913536293213569, 'samples': 9156672, 'steps': 47690, 'loss/train': 1.5638900995254517} -11/07/2021 03:57:51 - INFO - __main__ - Step 47692: {'lr': 0.00039134925225015277, 'samples': 9156864, 'steps': 47691, 'loss/train': 1.785346269607544} -11/07/2021 03:57:52 - INFO - __main__ - Step 47693: {'lr': 0.0003913448751152589, 'samples': 9157056, 'steps': 47692, 'loss/train': 0.6156972050666809} -11/07/2021 03:57:52 - INFO - __main__ - Step 47694: {'lr': 0.0003913404979166772, 'samples': 9157248, 'steps': 47693, 'loss/train': 1.6768780946731567} -11/07/2021 03:57:53 - INFO - __main__ - Step 47695: {'lr': 0.00039133612065440964, 'samples': 9157440, 'steps': 47694, 'loss/train': 1.6212339401245117} -11/07/2021 03:57:53 - INFO - __main__ - Step 47696: {'lr': 0.0003913317433284582, 'samples': 9157632, 'steps': 47695, 'loss/train': 1.614753246307373} -11/07/2021 03:57:53 - INFO - __main__ - Step 47697: {'lr': 0.0003913273659388249, 'samples': 9157824, 'steps': 47696, 'loss/train': 1.357269287109375} -11/07/2021 03:57:54 - INFO - __main__ - Step 47698: {'lr': 0.0003913229884855117, 'samples': 9158016, 'steps': 47697, 'loss/train': 0.7561484575271606} -11/07/2021 03:57:55 - INFO - __main__ - Step 47699: {'lr': 0.00039131861096852044, 'samples': 9158208, 'steps': 47698, 'loss/train': 1.6597344875335693} -11/07/2021 03:57:55 - INFO - __main__ - Step 47700: {'lr': 0.0003913142333878533, 'samples': 9158400, 'steps': 47699, 'loss/train': 1.3496906757354736} -11/07/2021 03:57:55 - INFO - __main__ - Step 47701: {'lr': 0.0003913098557435121, 'samples': 9158592, 'steps': 47700, 'loss/train': 1.3063585758209229} -11/07/2021 03:57:56 - INFO - __main__ - Step 47702: {'lr': 0.00039130547803549877, 'samples': 9158784, 'steps': 47701, 'loss/train': 1.5292190313339233} -11/07/2021 03:57:57 - INFO - __main__ - Step 47703: {'lr': 0.00039130110026381547, 'samples': 9158976, 'steps': 47702, 'loss/train': 1.587748408317566} -11/07/2021 03:57:57 - INFO - __main__ - Step 47704: {'lr': 0.00039129672242846407, 'samples': 9159168, 'steps': 47703, 'loss/train': 0.2601267695426941} -11/07/2021 03:57:58 - INFO - __main__ - Step 47705: {'lr': 0.0003912923445294465, 'samples': 9159360, 'steps': 47704, 'loss/train': 1.6256636381149292} -11/07/2021 03:57:58 - INFO - __main__ - Step 47706: {'lr': 0.00039128796656676487, 'samples': 9159552, 'steps': 47705, 'loss/train': 1.1044323444366455} -11/07/2021 03:57:58 - INFO - __main__ - Step 47707: {'lr': 0.000391283588540421, 'samples': 9159744, 'steps': 47706, 'loss/train': 1.5699584484100342} -11/07/2021 03:57:59 - INFO - __main__ - Step 47708: {'lr': 0.00039127921045041693, 'samples': 9159936, 'steps': 47707, 'loss/train': 1.3472719192504883} -11/07/2021 03:58:00 - INFO - __main__ - Step 47709: {'lr': 0.00039127483229675457, 'samples': 9160128, 'steps': 47708, 'loss/train': 1.4134140014648438} -11/07/2021 03:58:00 - INFO - __main__ - Step 47710: {'lr': 0.0003912704540794361, 'samples': 9160320, 'steps': 47709, 'loss/train': 1.2979545593261719} -11/07/2021 03:58:00 - INFO - __main__ - Step 47711: {'lr': 0.0003912660757984632, 'samples': 9160512, 'steps': 47710, 'loss/train': 1.8867838382720947} -11/07/2021 03:58:01 - INFO - __main__ - Step 47712: {'lr': 0.00039126169745383807, 'samples': 9160704, 'steps': 47711, 'loss/train': 0.4019244313240051} -11/07/2021 03:58:01 - INFO - __main__ - Step 47713: {'lr': 0.00039125731904556254, 'samples': 9160896, 'steps': 47712, 'loss/train': 1.565820336341858} -11/07/2021 03:58:02 - INFO - __main__ - Step 47714: {'lr': 0.0003912529405736387, 'samples': 9161088, 'steps': 47713, 'loss/train': 1.0823204517364502} -11/07/2021 03:58:02 - INFO - __main__ - Step 47715: {'lr': 0.00039124856203806834, 'samples': 9161280, 'steps': 47714, 'loss/train': 1.3622620105743408} -11/07/2021 03:58:03 - INFO - __main__ - Step 47716: {'lr': 0.0003912441834388537, 'samples': 9161472, 'steps': 47715, 'loss/train': 1.5373780727386475} -11/07/2021 03:58:03 - INFO - __main__ - Step 47717: {'lr': 0.00039123980477599664, 'samples': 9161664, 'steps': 47716, 'loss/train': 1.94687020778656} -11/07/2021 03:58:04 - INFO - __main__ - Step 47718: {'lr': 0.00039123542604949904, 'samples': 9161856, 'steps': 47717, 'loss/train': 1.64690363407135} -11/07/2021 03:58:04 - INFO - __main__ - Step 47719: {'lr': 0.0003912310472593629, 'samples': 9162048, 'steps': 47718, 'loss/train': 1.5679748058319092} -11/07/2021 03:58:05 - INFO - __main__ - Step 47720: {'lr': 0.0003912266684055902, 'samples': 9162240, 'steps': 47719, 'loss/train': 1.5285804271697998} -11/07/2021 03:58:05 - INFO - __main__ - Step 47721: {'lr': 0.000391222289488183, 'samples': 9162432, 'steps': 47720, 'loss/train': 1.8171290159225464} -11/07/2021 03:58:06 - INFO - __main__ - Step 47722: {'lr': 0.00039121791050714317, 'samples': 9162624, 'steps': 47721, 'loss/train': 1.580133318901062} -11/07/2021 03:58:06 - INFO - __main__ - Step 47723: {'lr': 0.0003912135314624728, 'samples': 9162816, 'steps': 47722, 'loss/train': 1.504193902015686} -11/07/2021 03:58:07 - INFO - __main__ - Step 47724: {'lr': 0.00039120915235417377, 'samples': 9163008, 'steps': 47723, 'loss/train': 1.044930100440979} -11/07/2021 03:58:07 - INFO - __main__ - Step 47725: {'lr': 0.0003912047731822481, 'samples': 9163200, 'steps': 47724, 'loss/train': 1.6905770301818848} -11/07/2021 03:58:08 - INFO - __main__ - Step 47726: {'lr': 0.0003912003939466977, 'samples': 9163392, 'steps': 47725, 'loss/train': 1.3502663373947144} -11/07/2021 03:58:08 - INFO - __main__ - Step 47727: {'lr': 0.0003911960146475245, 'samples': 9163584, 'steps': 47726, 'loss/train': 0.49609217047691345} -11/07/2021 03:58:08 - INFO - __main__ - Step 47728: {'lr': 0.0003911916352847307, 'samples': 9163776, 'steps': 47727, 'loss/train': 1.264794945716858} -11/07/2021 03:58:10 - INFO - __main__ - Step 47729: {'lr': 0.0003911872558583181, 'samples': 9163968, 'steps': 47728, 'loss/train': 1.5488823652267456} -11/07/2021 03:58:10 - INFO - __main__ - Step 47730: {'lr': 0.00039118287636828866, 'samples': 9164160, 'steps': 47729, 'loss/train': 1.5856084823608398} -11/07/2021 03:58:10 - INFO - __main__ - Step 47731: {'lr': 0.0003911784968146444, 'samples': 9164352, 'steps': 47730, 'loss/train': 1.1186045408248901} -11/07/2021 03:58:11 - INFO - __main__ - Step 47732: {'lr': 0.00039117411719738726, 'samples': 9164544, 'steps': 47731, 'loss/train': 1.676872968673706} -11/07/2021 03:58:11 - INFO - __main__ - Step 47733: {'lr': 0.0003911697375165193, 'samples': 9164736, 'steps': 47732, 'loss/train': 1.6229221820831299} -11/07/2021 03:58:12 - INFO - __main__ - Step 47734: {'lr': 0.00039116535777204237, 'samples': 9164928, 'steps': 47733, 'loss/train': 1.2042266130447388} -11/07/2021 03:58:12 - INFO - __main__ - Step 47735: {'lr': 0.00039116097796395856, 'samples': 9165120, 'steps': 47734, 'loss/train': 1.3100491762161255} -11/07/2021 03:58:13 - INFO - __main__ - Step 47736: {'lr': 0.00039115659809226975, 'samples': 9165312, 'steps': 47735, 'loss/train': 1.545833706855774} -11/07/2021 03:58:13 - INFO - __main__ - Step 47737: {'lr': 0.00039115221815697797, 'samples': 9165504, 'steps': 47736, 'loss/train': 1.6659634113311768} -11/07/2021 03:58:13 - INFO - __main__ - Step 47738: {'lr': 0.00039114783815808526, 'samples': 9165696, 'steps': 47737, 'loss/train': 1.2204612493515015} -11/07/2021 03:58:14 - INFO - __main__ - Step 47739: {'lr': 0.0003911434580955934, 'samples': 9165888, 'steps': 47738, 'loss/train': 1.8816306591033936} -11/07/2021 03:58:15 - INFO - __main__ - Step 47740: {'lr': 0.00039113907796950453, 'samples': 9166080, 'steps': 47739, 'loss/train': 1.467585802078247} -11/07/2021 03:58:15 - INFO - __main__ - Step 47741: {'lr': 0.0003911346977798206, 'samples': 9166272, 'steps': 47740, 'loss/train': 0.9358709454536438} -11/07/2021 03:58:16 - INFO - __main__ - Step 47742: {'lr': 0.0003911303175265435, 'samples': 9166464, 'steps': 47741, 'loss/train': 1.3167362213134766} -11/07/2021 03:58:16 - INFO - __main__ - Step 47743: {'lr': 0.00039112593720967524, 'samples': 9166656, 'steps': 47742, 'loss/train': 1.5671089887619019} -11/07/2021 03:58:16 - INFO - __main__ - Step 47744: {'lr': 0.00039112155682921785, 'samples': 9166848, 'steps': 47743, 'loss/train': 1.520840048789978} -11/07/2021 03:58:17 - INFO - __main__ - Step 47745: {'lr': 0.00039111717638517325, 'samples': 9167040, 'steps': 47744, 'loss/train': 1.286608099937439} -11/07/2021 03:58:18 - INFO - __main__ - Step 47746: {'lr': 0.00039111279587754344, 'samples': 9167232, 'steps': 47745, 'loss/train': 1.2636497020721436} -11/07/2021 03:58:18 - INFO - __main__ - Step 47747: {'lr': 0.0003911084153063303, 'samples': 9167424, 'steps': 47746, 'loss/train': 1.6070020198822021} -11/07/2021 03:58:18 - INFO - __main__ - Step 47748: {'lr': 0.000391104034671536, 'samples': 9167616, 'steps': 47747, 'loss/train': 1.3143073320388794} -11/07/2021 03:58:19 - INFO - __main__ - Step 47749: {'lr': 0.00039109965397316236, 'samples': 9167808, 'steps': 47748, 'loss/train': 1.0709642171859741} -11/07/2021 03:58:20 - INFO - __main__ - Step 47750: {'lr': 0.0003910952732112114, 'samples': 9168000, 'steps': 47749, 'loss/train': 1.06427800655365} -11/07/2021 03:58:20 - INFO - __main__ - Step 47751: {'lr': 0.00039109089238568507, 'samples': 9168192, 'steps': 47750, 'loss/train': 1.802921175956726} -11/07/2021 03:58:20 - INFO - __main__ - Step 47752: {'lr': 0.00039108651149658534, 'samples': 9168384, 'steps': 47751, 'loss/train': 1.2981460094451904} -11/07/2021 03:58:21 - INFO - __main__ - Step 47753: {'lr': 0.0003910821305439143, 'samples': 9168576, 'steps': 47752, 'loss/train': 1.3508820533752441} -11/07/2021 03:58:21 - INFO - __main__ - Step 47754: {'lr': 0.00039107774952767374, 'samples': 9168768, 'steps': 47753, 'loss/train': 4.926101207733154} -11/07/2021 03:58:22 - INFO - __main__ - Step 47755: {'lr': 0.0003910733684478657, 'samples': 9168960, 'steps': 47754, 'loss/train': 1.0816140174865723} -11/07/2021 03:58:23 - INFO - __main__ - Step 47756: {'lr': 0.00039106898730449223, 'samples': 9169152, 'steps': 47755, 'loss/train': 1.4479185342788696} -11/07/2021 03:58:23 - INFO - __main__ - Step 47757: {'lr': 0.0003910646060975553, 'samples': 9169344, 'steps': 47756, 'loss/train': 1.2211220264434814} -11/07/2021 03:58:23 - INFO - __main__ - Step 47758: {'lr': 0.00039106022482705675, 'samples': 9169536, 'steps': 47757, 'loss/train': 1.4629676342010498} -11/07/2021 03:58:24 - INFO - __main__ - Step 47759: {'lr': 0.0003910558434929987, 'samples': 9169728, 'steps': 47758, 'loss/train': 1.2839739322662354} -11/07/2021 03:58:25 - INFO - __main__ - Step 47760: {'lr': 0.000391051462095383, 'samples': 9169920, 'steps': 47759, 'loss/train': 1.7330576181411743} -11/07/2021 03:58:25 - INFO - __main__ - Step 47761: {'lr': 0.0003910470806342117, 'samples': 9170112, 'steps': 47760, 'loss/train': 1.3753608465194702} -11/07/2021 03:58:25 - INFO - __main__ - Step 47762: {'lr': 0.00039104269910948675, 'samples': 9170304, 'steps': 47761, 'loss/train': 1.8073952198028564} -11/07/2021 03:58:26 - INFO - __main__ - Step 47763: {'lr': 0.00039103831752121024, 'samples': 9170496, 'steps': 47762, 'loss/train': 1.5527784824371338} -11/07/2021 03:58:26 - INFO - __main__ - Step 47764: {'lr': 0.00039103393586938394, 'samples': 9170688, 'steps': 47763, 'loss/train': 1.7788493633270264} -11/07/2021 03:58:26 - INFO - __main__ - Step 47765: {'lr': 0.00039102955415401, 'samples': 9170880, 'steps': 47764, 'loss/train': 1.4334397315979004} -11/07/2021 03:58:27 - INFO - __main__ - Step 47766: {'lr': 0.00039102517237509025, 'samples': 9171072, 'steps': 47765, 'loss/train': 1.1334584951400757} -11/07/2021 03:58:28 - INFO - __main__ - Step 47767: {'lr': 0.0003910207905326267, 'samples': 9171264, 'steps': 47766, 'loss/train': 1.5549800395965576} -11/07/2021 03:58:28 - INFO - __main__ - Step 47768: {'lr': 0.00039101640862662147, 'samples': 9171456, 'steps': 47767, 'loss/train': 1.2709290981292725} -11/07/2021 03:58:28 - INFO - __main__ - Step 47769: {'lr': 0.0003910120266570764, 'samples': 9171648, 'steps': 47768, 'loss/train': 2.0093159675598145} -11/07/2021 03:58:29 - INFO - __main__ - Step 47770: {'lr': 0.0003910076446239934, 'samples': 9171840, 'steps': 47769, 'loss/train': 1.5359703302383423} -11/07/2021 03:58:30 - INFO - __main__ - Step 47771: {'lr': 0.00039100326252737463, 'samples': 9172032, 'steps': 47770, 'loss/train': 1.9358810186386108} -11/07/2021 03:58:30 - INFO - __main__ - Step 47772: {'lr': 0.00039099888036722187, 'samples': 9172224, 'steps': 47771, 'loss/train': 1.156240701675415} -11/07/2021 03:58:31 - INFO - __main__ - Step 47773: {'lr': 0.00039099449814353725, 'samples': 9172416, 'steps': 47772, 'loss/train': 0.9753404259681702} -11/07/2021 03:58:31 - INFO - __main__ - Step 47774: {'lr': 0.00039099011585632266, 'samples': 9172608, 'steps': 47773, 'loss/train': 1.1997112035751343} -11/07/2021 03:58:31 - INFO - __main__ - Step 47775: {'lr': 0.0003909857335055801, 'samples': 9172800, 'steps': 47774, 'loss/train': 1.3026461601257324} -11/07/2021 03:58:32 - INFO - __main__ - Step 47776: {'lr': 0.00039098135109131156, 'samples': 9172992, 'steps': 47775, 'loss/train': 1.5997029542922974} -11/07/2021 03:58:33 - INFO - __main__ - Step 47777: {'lr': 0.00039097696861351895, 'samples': 9173184, 'steps': 47776, 'loss/train': 1.5098634958267212} -11/07/2021 03:58:33 - INFO - __main__ - Step 47778: {'lr': 0.00039097258607220445, 'samples': 9173376, 'steps': 47777, 'loss/train': 1.658744215965271} -11/07/2021 03:58:33 - INFO - __main__ - Step 47779: {'lr': 0.00039096820346736974, 'samples': 9173568, 'steps': 47778, 'loss/train': 1.496510624885559} -11/07/2021 03:58:34 - INFO - __main__ - Step 47780: {'lr': 0.00039096382079901695, 'samples': 9173760, 'steps': 47779, 'loss/train': 1.2784366607666016} -11/07/2021 03:58:35 - INFO - __main__ - Step 47781: {'lr': 0.000390959438067148, 'samples': 9173952, 'steps': 47780, 'loss/train': 1.5558462142944336} -11/07/2021 03:58:35 - INFO - __main__ - Step 47782: {'lr': 0.000390955055271765, 'samples': 9174144, 'steps': 47781, 'loss/train': 1.5842334032058716} -11/07/2021 03:58:35 - INFO - __main__ - Step 47783: {'lr': 0.00039095067241286973, 'samples': 9174336, 'steps': 47782, 'loss/train': 1.5696221590042114} -11/07/2021 03:58:36 - INFO - __main__ - Step 47784: {'lr': 0.00039094628949046435, 'samples': 9174528, 'steps': 47783, 'loss/train': 1.2933385372161865} -11/07/2021 03:58:36 - INFO - __main__ - Step 47785: {'lr': 0.0003909419065045507, 'samples': 9174720, 'steps': 47784, 'loss/train': 1.1484545469284058} -11/07/2021 03:58:37 - INFO - __main__ - Step 47786: {'lr': 0.0003909375234551308, 'samples': 9174912, 'steps': 47785, 'loss/train': 1.266628623008728} -11/07/2021 03:58:37 - INFO - __main__ - Step 47787: {'lr': 0.0003909331403422066, 'samples': 9175104, 'steps': 47786, 'loss/train': 1.4414047002792358} -11/07/2021 03:58:38 - INFO - __main__ - Step 47788: {'lr': 0.00039092875716578013, 'samples': 9175296, 'steps': 47787, 'loss/train': 1.4967223405838013} -11/07/2021 03:58:38 - INFO - __main__ - Step 47789: {'lr': 0.00039092437392585335, 'samples': 9175488, 'steps': 47788, 'loss/train': 1.2454779148101807} -11/07/2021 03:58:39 - INFO - __main__ - Step 47790: {'lr': 0.0003909199906224282, 'samples': 9175680, 'steps': 47789, 'loss/train': 1.5636887550354004} -11/07/2021 03:58:40 - INFO - __main__ - Step 47791: {'lr': 0.00039091560725550676, 'samples': 9175872, 'steps': 47790, 'loss/train': 1.3521119356155396} -11/07/2021 03:58:40 - INFO - __main__ - Step 47792: {'lr': 0.0003909112238250908, 'samples': 9176064, 'steps': 47791, 'loss/train': 1.4724849462509155} -11/07/2021 03:58:40 - INFO - __main__ - Step 47793: {'lr': 0.0003909068403311825, 'samples': 9176256, 'steps': 47792, 'loss/train': 1.5105748176574707} -11/07/2021 03:58:41 - INFO - __main__ - Step 47794: {'lr': 0.0003909024567737837, 'samples': 9176448, 'steps': 47793, 'loss/train': 1.4884341955184937} -11/07/2021 03:58:41 - INFO - __main__ - Step 47795: {'lr': 0.0003908980731528965, 'samples': 9176640, 'steps': 47794, 'loss/train': 1.392460584640503} -11/07/2021 03:58:42 - INFO - __main__ - Step 47796: {'lr': 0.0003908936894685227, 'samples': 9176832, 'steps': 47795, 'loss/train': 1.4147835969924927} -11/07/2021 03:58:42 - INFO - __main__ - Step 47797: {'lr': 0.0003908893057206644, 'samples': 9177024, 'steps': 47796, 'loss/train': 1.644497036933899} -11/07/2021 03:58:43 - INFO - __main__ - Step 47798: {'lr': 0.00039088492190932365, 'samples': 9177216, 'steps': 47797, 'loss/train': 1.58420729637146} -11/07/2021 03:58:43 - INFO - __main__ - Step 47799: {'lr': 0.00039088053803450223, 'samples': 9177408, 'steps': 47798, 'loss/train': 1.7875009775161743} -11/07/2021 03:58:43 - INFO - __main__ - Step 47800: {'lr': 0.00039087615409620223, 'samples': 9177600, 'steps': 47799, 'loss/train': 1.3872160911560059} -11/07/2021 03:58:44 - INFO - __main__ - Step 47801: {'lr': 0.00039087177009442567, 'samples': 9177792, 'steps': 47800, 'loss/train': 1.6980464458465576} -11/07/2021 03:58:45 - INFO - __main__ - Step 47802: {'lr': 0.0003908673860291744, 'samples': 9177984, 'steps': 47801, 'loss/train': 1.910475254058838} -11/07/2021 03:58:45 - INFO - __main__ - Step 47803: {'lr': 0.0003908630019004504, 'samples': 9178176, 'steps': 47802, 'loss/train': 1.361932396888733} -11/07/2021 03:58:45 - INFO - __main__ - Step 47804: {'lr': 0.00039085861770825586, 'samples': 9178368, 'steps': 47803, 'loss/train': 1.6999609470367432} -11/07/2021 03:58:46 - INFO - __main__ - Step 47805: {'lr': 0.00039085423345259254, 'samples': 9178560, 'steps': 47804, 'loss/train': 1.305261492729187} -11/07/2021 03:58:46 - INFO - __main__ - Step 47806: {'lr': 0.00039084984913346246, 'samples': 9178752, 'steps': 47805, 'loss/train': 1.737400770187378} -11/07/2021 03:58:47 - INFO - __main__ - Step 47807: {'lr': 0.0003908454647508676, 'samples': 9178944, 'steps': 47806, 'loss/train': 1.7078434228897095} -11/07/2021 03:58:48 - INFO - __main__ - Step 47808: {'lr': 0.0003908410803048099, 'samples': 9179136, 'steps': 47807, 'loss/train': 0.9526119232177734} -11/07/2021 03:58:48 - INFO - __main__ - Step 47809: {'lr': 0.0003908366957952915, 'samples': 9179328, 'steps': 47808, 'loss/train': 1.8848559856414795} -11/07/2021 03:58:48 - INFO - __main__ - Step 47810: {'lr': 0.0003908323112223142, 'samples': 9179520, 'steps': 47809, 'loss/train': 1.385873556137085} -11/07/2021 03:58:49 - INFO - __main__ - Step 47811: {'lr': 0.0003908279265858801, 'samples': 9179712, 'steps': 47810, 'loss/train': 1.7560125589370728} -11/07/2021 03:58:50 - INFO - __main__ - Step 47812: {'lr': 0.00039082354188599094, 'samples': 9179904, 'steps': 47811, 'loss/train': 0.9998289942741394} -11/07/2021 03:58:50 - INFO - __main__ - Step 47813: {'lr': 0.00039081915712264897, 'samples': 9180096, 'steps': 47812, 'loss/train': 1.5740004777908325} -11/07/2021 03:58:50 - INFO - __main__ - Step 47814: {'lr': 0.000390814772295856, 'samples': 9180288, 'steps': 47813, 'loss/train': 0.9608702063560486} -11/07/2021 03:58:51 - INFO - __main__ - Step 47815: {'lr': 0.0003908103874056142, 'samples': 9180480, 'steps': 47814, 'loss/train': 1.3893488645553589} -11/07/2021 03:58:51 - INFO - __main__ - Step 47816: {'lr': 0.0003908060024519253, 'samples': 9180672, 'steps': 47815, 'loss/train': 1.414729118347168} -11/07/2021 03:58:51 - INFO - __main__ - Step 47817: {'lr': 0.0003908016174347915, 'samples': 9180864, 'steps': 47816, 'loss/train': 1.5888200998306274} -11/07/2021 03:58:52 - INFO - __main__ - Step 47818: {'lr': 0.00039079723235421456, 'samples': 9181056, 'steps': 47817, 'loss/train': 1.9803375005722046} -11/07/2021 03:58:53 - INFO - __main__ - Step 47819: {'lr': 0.0003907928472101966, 'samples': 9181248, 'steps': 47818, 'loss/train': 1.477423071861267} -11/07/2021 03:58:53 - INFO - __main__ - Step 47820: {'lr': 0.00039078846200273955, 'samples': 9181440, 'steps': 47819, 'loss/train': 1.858801007270813} -11/07/2021 03:58:53 - INFO - __main__ - Step 47821: {'lr': 0.00039078407673184536, 'samples': 9181632, 'steps': 47820, 'loss/train': 1.4473891258239746} -11/07/2021 03:58:54 - INFO - __main__ - Step 47822: {'lr': 0.000390779691397516, 'samples': 9181824, 'steps': 47821, 'loss/train': 1.2635656595230103} -11/07/2021 03:58:55 - INFO - __main__ - Step 47823: {'lr': 0.0003907753059997536, 'samples': 9182016, 'steps': 47822, 'loss/train': 1.6431529521942139} -11/07/2021 03:58:55 - INFO - __main__ - Step 47824: {'lr': 0.00039077092053855996, 'samples': 9182208, 'steps': 47823, 'loss/train': 1.7903770208358765} -11/07/2021 03:58:56 - INFO - __main__ - Step 47825: {'lr': 0.0003907665350139371, 'samples': 9182400, 'steps': 47824, 'loss/train': 1.5683518648147583} -11/07/2021 03:58:56 - INFO - __main__ - Step 47826: {'lr': 0.00039076214942588704, 'samples': 9182592, 'steps': 47825, 'loss/train': 1.5268745422363281} -11/07/2021 03:58:56 - INFO - __main__ - Step 47827: {'lr': 0.00039075776377441176, 'samples': 9182784, 'steps': 47826, 'loss/train': 1.1185357570648193} -11/07/2021 03:58:57 - INFO - __main__ - Step 47828: {'lr': 0.00039075337805951314, 'samples': 9182976, 'steps': 47827, 'loss/train': 5.700735092163086} -11/07/2021 03:58:58 - INFO - __main__ - Step 47829: {'lr': 0.0003907489922811932, 'samples': 9183168, 'steps': 47828, 'loss/train': 1.038259744644165} -11/07/2021 03:58:58 - INFO - __main__ - Step 47830: {'lr': 0.000390744606439454, 'samples': 9183360, 'steps': 47829, 'loss/train': 1.5854010581970215} -11/07/2021 03:58:58 - INFO - __main__ - Step 47831: {'lr': 0.00039074022053429746, 'samples': 9183552, 'steps': 47830, 'loss/train': 1.1093767881393433} -11/07/2021 03:58:59 - INFO - __main__ - Step 47832: {'lr': 0.00039073583456572547, 'samples': 9183744, 'steps': 47831, 'loss/train': 1.3338769674301147} -11/07/2021 03:59:00 - INFO - __main__ - Step 47833: {'lr': 0.0003907314485337402, 'samples': 9183936, 'steps': 47832, 'loss/train': 1.903498649597168} -11/07/2021 03:59:00 - INFO - __main__ - Step 47834: {'lr': 0.00039072706243834345, 'samples': 9184128, 'steps': 47833, 'loss/train': 1.6174588203430176} -11/07/2021 03:59:01 - INFO - __main__ - Step 47835: {'lr': 0.0003907226762795372, 'samples': 9184320, 'steps': 47834, 'loss/train': 1.1398457288742065} -11/07/2021 03:59:01 - INFO - __main__ - Step 47836: {'lr': 0.0003907182900573235, 'samples': 9184512, 'steps': 47835, 'loss/train': 1.6860932111740112} -11/07/2021 03:59:01 - INFO - __main__ - Step 47837: {'lr': 0.00039071390377170434, 'samples': 9184704, 'steps': 47836, 'loss/train': 1.1040606498718262} -11/07/2021 03:59:02 - INFO - __main__ - Step 47838: {'lr': 0.00039070951742268173, 'samples': 9184896, 'steps': 47837, 'loss/train': 1.4555193185806274} -11/07/2021 03:59:03 - INFO - __main__ - Step 47839: {'lr': 0.00039070513101025753, 'samples': 9185088, 'steps': 47838, 'loss/train': 1.118199348449707} -11/07/2021 03:59:03 - INFO - __main__ - Step 47840: {'lr': 0.00039070074453443374, 'samples': 9185280, 'steps': 47839, 'loss/train': 1.9513616561889648} -11/07/2021 03:59:03 - INFO - __main__ - Step 47841: {'lr': 0.0003906963579952124, 'samples': 9185472, 'steps': 47840, 'loss/train': 1.395675539970398} -11/07/2021 03:59:04 - INFO - __main__ - Step 47842: {'lr': 0.0003906919713925954, 'samples': 9185664, 'steps': 47841, 'loss/train': 1.8071616888046265} -11/07/2021 03:59:04 - INFO - __main__ - Step 47843: {'lr': 0.00039068758472658483, 'samples': 9185856, 'steps': 47842, 'loss/train': 1.3935356140136719} -11/07/2021 03:59:05 - INFO - __main__ - Step 47844: {'lr': 0.0003906831979971826, 'samples': 9186048, 'steps': 47843, 'loss/train': 1.501913070678711} -11/07/2021 03:59:05 - INFO - __main__ - Step 47845: {'lr': 0.0003906788112043907, 'samples': 9186240, 'steps': 47844, 'loss/train': 1.1235847473144531} -11/07/2021 03:59:06 - INFO - __main__ - Step 47846: {'lr': 0.00039067442434821106, 'samples': 9186432, 'steps': 47845, 'loss/train': 0.49357911944389343} -11/07/2021 03:59:06 - INFO - __main__ - Step 47847: {'lr': 0.0003906700374286457, 'samples': 9186624, 'steps': 47846, 'loss/train': 1.6865296363830566} -11/07/2021 03:59:06 - INFO - __main__ - Step 47848: {'lr': 0.0003906656504456966, 'samples': 9186816, 'steps': 47847, 'loss/train': 1.388684868812561} -11/07/2021 03:59:08 - INFO - __main__ - Step 47849: {'lr': 0.0003906612633993657, 'samples': 9187008, 'steps': 47848, 'loss/train': 0.9301236867904663} -11/07/2021 03:59:08 - INFO - __main__ - Step 47850: {'lr': 0.00039065687628965506, 'samples': 9187200, 'steps': 47849, 'loss/train': 1.4606879949569702} -11/07/2021 03:59:08 - INFO - __main__ - Step 47851: {'lr': 0.0003906524891165666, 'samples': 9187392, 'steps': 47850, 'loss/train': 1.518761157989502} -11/07/2021 03:59:09 - INFO - __main__ - Step 47852: {'lr': 0.00039064810188010223, 'samples': 9187584, 'steps': 47851, 'loss/train': 1.4743632078170776} -11/07/2021 03:59:09 - INFO - __main__ - Step 47853: {'lr': 0.000390643714580264, 'samples': 9187776, 'steps': 47852, 'loss/train': 2.037034511566162} -11/07/2021 03:59:10 - INFO - __main__ - Step 47854: {'lr': 0.000390639327217054, 'samples': 9187968, 'steps': 47853, 'loss/train': 1.6816785335540771} -11/07/2021 03:59:10 - INFO - __main__ - Step 47855: {'lr': 0.000390634939790474, 'samples': 9188160, 'steps': 47854, 'loss/train': 1.4877616167068481} -11/07/2021 03:59:11 - INFO - __main__ - Step 47856: {'lr': 0.00039063055230052605, 'samples': 9188352, 'steps': 47855, 'loss/train': 1.093326210975647} -11/07/2021 03:59:11 - INFO - __main__ - Step 47857: {'lr': 0.00039062616474721217, 'samples': 9188544, 'steps': 47856, 'loss/train': 1.781771183013916} -11/07/2021 03:59:11 - INFO - __main__ - Step 47858: {'lr': 0.00039062177713053436, 'samples': 9188736, 'steps': 47857, 'loss/train': 1.5823264122009277} -11/07/2021 03:59:12 - INFO - __main__ - Step 47859: {'lr': 0.00039061738945049454, 'samples': 9188928, 'steps': 47858, 'loss/train': 4.710807800292969} -11/07/2021 03:59:12 - INFO - __main__ - Step 47860: {'lr': 0.0003906130017070946, 'samples': 9189120, 'steps': 47859, 'loss/train': 1.006072759628296} -11/07/2021 03:59:13 - INFO - __main__ - Step 47861: {'lr': 0.0003906086139003366, 'samples': 9189312, 'steps': 47860, 'loss/train': 1.132124662399292} -11/07/2021 03:59:14 - INFO - __main__ - Step 47862: {'lr': 0.00039060422603022266, 'samples': 9189504, 'steps': 47861, 'loss/train': 1.6611148118972778} -11/07/2021 03:59:14 - INFO - __main__ - Step 47863: {'lr': 0.0003905998380967546, 'samples': 9189696, 'steps': 47862, 'loss/train': 1.276165246963501} -11/07/2021 03:59:14 - INFO - __main__ - Step 47864: {'lr': 0.00039059545009993436, 'samples': 9189888, 'steps': 47863, 'loss/train': 1.817383885383606} -11/07/2021 03:59:15 - INFO - __main__ - Step 47865: {'lr': 0.00039059106203976403, 'samples': 9190080, 'steps': 47864, 'loss/train': 1.0590981245040894} -11/07/2021 03:59:16 - INFO - __main__ - Step 47866: {'lr': 0.00039058667391624546, 'samples': 9190272, 'steps': 47865, 'loss/train': 1.774393916130066} -11/07/2021 03:59:17 - INFO - __main__ - Step 47867: {'lr': 0.00039058228572938074, 'samples': 9190464, 'steps': 47866, 'loss/train': 1.5428546667099} -11/07/2021 03:59:17 - INFO - __main__ - Step 47868: {'lr': 0.00039057789747917184, 'samples': 9190656, 'steps': 47867, 'loss/train': 0.7667586207389832} -11/07/2021 03:59:17 - INFO - __main__ - Step 47869: {'lr': 0.00039057350916562065, 'samples': 9190848, 'steps': 47868, 'loss/train': 1.5777109861373901} -11/07/2021 03:59:18 - INFO - __main__ - Step 47870: {'lr': 0.0003905691207887293, 'samples': 9191040, 'steps': 47869, 'loss/train': 2.0030999183654785} -11/07/2021 03:59:18 - INFO - __main__ - Step 47871: {'lr': 0.00039056473234849964, 'samples': 9191232, 'steps': 47870, 'loss/train': 1.908658742904663} -11/07/2021 03:59:18 - INFO - __main__ - Step 47872: {'lr': 0.0003905603438449337, 'samples': 9191424, 'steps': 47871, 'loss/train': 1.2018303871154785} -11/07/2021 03:59:19 - INFO - __main__ - Step 47873: {'lr': 0.00039055595527803333, 'samples': 9191616, 'steps': 47872, 'loss/train': 1.4805277585983276} -11/07/2021 03:59:20 - INFO - __main__ - Step 47874: {'lr': 0.00039055156664780067, 'samples': 9191808, 'steps': 47873, 'loss/train': 0.9325542449951172} -11/07/2021 03:59:20 - INFO - __main__ - Step 47875: {'lr': 0.00039054717795423765, 'samples': 9192000, 'steps': 47874, 'loss/train': 1.3526469469070435} -11/07/2021 03:59:20 - INFO - __main__ - Step 47876: {'lr': 0.0003905427891973463, 'samples': 9192192, 'steps': 47875, 'loss/train': 1.7165586948394775} -11/07/2021 03:59:21 - INFO - __main__ - Step 47877: {'lr': 0.0003905384003771285, 'samples': 9192384, 'steps': 47876, 'loss/train': 1.5303162336349487} -11/07/2021 03:59:22 - INFO - __main__ - Step 47878: {'lr': 0.00039053401149358625, 'samples': 9192576, 'steps': 47877, 'loss/train': 1.5087376832962036} -11/07/2021 03:59:22 - INFO - __main__ - Step 47879: {'lr': 0.0003905296225467215, 'samples': 9192768, 'steps': 47878, 'loss/train': 1.519276738166809} -11/07/2021 03:59:23 - INFO - __main__ - Step 47880: {'lr': 0.0003905252335365364, 'samples': 9192960, 'steps': 47879, 'loss/train': 1.481291651725769} -11/07/2021 03:59:23 - INFO - __main__ - Step 47881: {'lr': 0.00039052084446303264, 'samples': 9193152, 'steps': 47880, 'loss/train': 1.1391723155975342} -11/07/2021 03:59:23 - INFO - __main__ - Step 47882: {'lr': 0.0003905164553262125, 'samples': 9193344, 'steps': 47881, 'loss/train': 0.9642443656921387} -11/07/2021 03:59:24 - INFO - __main__ - Step 47883: {'lr': 0.0003905120661260777, 'samples': 9193536, 'steps': 47882, 'loss/train': 1.2184077501296997} -11/07/2021 03:59:25 - INFO - __main__ - Step 47884: {'lr': 0.00039050767686263035, 'samples': 9193728, 'steps': 47883, 'loss/train': 1.4414434432983398} -11/07/2021 03:59:25 - INFO - __main__ - Step 47885: {'lr': 0.0003905032875358725, 'samples': 9193920, 'steps': 47884, 'loss/train': 1.474022626876831} -11/07/2021 03:59:26 - INFO - __main__ - Step 47886: {'lr': 0.00039049889814580597, 'samples': 9194112, 'steps': 47885, 'loss/train': 1.4804164171218872} -11/07/2021 03:59:26 - INFO - __main__ - Step 47887: {'lr': 0.00039049450869243276, 'samples': 9194304, 'steps': 47886, 'loss/train': 0.8207853436470032} -11/07/2021 03:59:27 - INFO - __main__ - Step 47888: {'lr': 0.00039049011917575494, 'samples': 9194496, 'steps': 47887, 'loss/train': 1.946252465248108} -11/07/2021 03:59:27 - INFO - __main__ - Step 47889: {'lr': 0.00039048572959577446, 'samples': 9194688, 'steps': 47888, 'loss/train': 1.5656707286834717} -11/07/2021 03:59:28 - INFO - __main__ - Step 47890: {'lr': 0.0003904813399524932, 'samples': 9194880, 'steps': 47889, 'loss/train': 1.0549839735031128} -11/07/2021 03:59:28 - INFO - __main__ - Step 47891: {'lr': 0.0003904769502459133, 'samples': 9195072, 'steps': 47890, 'loss/train': 0.9227809906005859} -11/07/2021 03:59:28 - INFO - __main__ - Step 47892: {'lr': 0.0003904725604760366, 'samples': 9195264, 'steps': 47891, 'loss/train': 1.466859221458435} -11/07/2021 03:59:29 - INFO - __main__ - Step 47893: {'lr': 0.0003904681706428652, 'samples': 9195456, 'steps': 47892, 'loss/train': 1.8413870334625244} -11/07/2021 03:59:30 - INFO - __main__ - Step 47894: {'lr': 0.000390463780746401, 'samples': 9195648, 'steps': 47893, 'loss/train': 0.5830784440040588} -11/07/2021 03:59:30 - INFO - __main__ - Step 47895: {'lr': 0.00039045939078664595, 'samples': 9195840, 'steps': 47894, 'loss/train': 1.316049575805664} -11/07/2021 03:59:30 - INFO - __main__ - Step 47896: {'lr': 0.0003904550007636021, 'samples': 9196032, 'steps': 47895, 'loss/train': 0.8721176385879517} -11/07/2021 03:59:31 - INFO - __main__ - Step 47897: {'lr': 0.00039045061067727126, 'samples': 9196224, 'steps': 47896, 'loss/train': 1.7862621545791626} -11/07/2021 03:59:31 - INFO - __main__ - Step 47898: {'lr': 0.0003904462205276557, 'samples': 9196416, 'steps': 47897, 'loss/train': 1.522489070892334} -11/07/2021 03:59:32 - INFO - __main__ - Step 47899: {'lr': 0.0003904418303147572, 'samples': 9196608, 'steps': 47898, 'loss/train': 1.3559387922286987} -11/07/2021 03:59:33 - INFO - __main__ - Step 47900: {'lr': 0.0003904374400385777, 'samples': 9196800, 'steps': 47899, 'loss/train': 1.9666988849639893} -11/07/2021 03:59:33 - INFO - __main__ - Step 47901: {'lr': 0.0003904330496991194, 'samples': 9196992, 'steps': 47900, 'loss/train': 1.569732427597046} -11/07/2021 03:59:33 - INFO - __main__ - Step 47902: {'lr': 0.00039042865929638404, 'samples': 9197184, 'steps': 47901, 'loss/train': 1.6634944677352905} -11/07/2021 03:59:34 - INFO - __main__ - Step 47903: {'lr': 0.00039042426883037376, 'samples': 9197376, 'steps': 47902, 'loss/train': 1.6189223527908325} -11/07/2021 03:59:35 - INFO - __main__ - Step 47904: {'lr': 0.00039041987830109036, 'samples': 9197568, 'steps': 47903, 'loss/train': 1.027011752128601} -11/07/2021 03:59:35 - INFO - __main__ - Step 47905: {'lr': 0.000390415487708536, 'samples': 9197760, 'steps': 47904, 'loss/train': 1.4380768537521362} -11/07/2021 03:59:35 - INFO - __main__ - Step 47906: {'lr': 0.0003904110970527126, 'samples': 9197952, 'steps': 47905, 'loss/train': 1.5336869955062866} -11/07/2021 03:59:36 - INFO - __main__ - Step 47907: {'lr': 0.00039040670633362206, 'samples': 9198144, 'steps': 47906, 'loss/train': 1.5007959604263306} -11/07/2021 03:59:36 - INFO - __main__ - Step 47908: {'lr': 0.00039040231555126647, 'samples': 9198336, 'steps': 47907, 'loss/train': 1.2818505764007568} -11/07/2021 03:59:37 - INFO - __main__ - Step 47909: {'lr': 0.0003903979247056478, 'samples': 9198528, 'steps': 47908, 'loss/train': 1.2131530046463013} -11/07/2021 03:59:37 - INFO - __main__ - Step 47910: {'lr': 0.00039039353379676796, 'samples': 9198720, 'steps': 47909, 'loss/train': 1.4607211351394653} -11/07/2021 03:59:38 - INFO - __main__ - Step 47911: {'lr': 0.0003903891428246289, 'samples': 9198912, 'steps': 47910, 'loss/train': 1.980078101158142} -11/07/2021 03:59:38 - INFO - __main__ - Step 47912: {'lr': 0.0003903847517892328, 'samples': 9199104, 'steps': 47911, 'loss/train': 1.5750683546066284} -11/07/2021 03:59:38 - INFO - __main__ - Step 47913: {'lr': 0.00039038036069058137, 'samples': 9199296, 'steps': 47912, 'loss/train': 1.5380631685256958} -11/07/2021 03:59:39 - INFO - __main__ - Step 47914: {'lr': 0.0003903759695286768, 'samples': 9199488, 'steps': 47913, 'loss/train': 1.278486728668213} -11/07/2021 03:59:40 - INFO - __main__ - Step 47915: {'lr': 0.0003903715783035209, 'samples': 9199680, 'steps': 47914, 'loss/train': 0.8846134543418884} -11/07/2021 03:59:40 - INFO - __main__ - Step 47916: {'lr': 0.00039036718701511577, 'samples': 9199872, 'steps': 47915, 'loss/train': 1.2928320169448853} -11/07/2021 03:59:41 - INFO - __main__ - Step 47917: {'lr': 0.00039036279566346334, 'samples': 9200064, 'steps': 47916, 'loss/train': 1.5142719745635986} -11/07/2021 03:59:41 - INFO - __main__ - Step 47918: {'lr': 0.0003903584042485656, 'samples': 9200256, 'steps': 47917, 'loss/train': 0.7032201290130615} -11/07/2021 03:59:42 - INFO - __main__ - Step 47919: {'lr': 0.0003903540127704246, 'samples': 9200448, 'steps': 47918, 'loss/train': 1.6926442384719849} -11/07/2021 03:59:42 - INFO - __main__ - Step 47920: {'lr': 0.0003903496212290422, 'samples': 9200640, 'steps': 47919, 'loss/train': 0.8472903370857239} -11/07/2021 03:59:43 - INFO - __main__ - Step 47921: {'lr': 0.00039034522962442045, 'samples': 9200832, 'steps': 47920, 'loss/train': 0.6675543189048767} -11/07/2021 03:59:43 - INFO - __main__ - Step 47922: {'lr': 0.0003903408379565612, 'samples': 9201024, 'steps': 47921, 'loss/train': 1.4430902004241943} -11/07/2021 03:59:43 - INFO - __main__ - Step 47923: {'lr': 0.0003903364462254666, 'samples': 9201216, 'steps': 47922, 'loss/train': 1.4382398128509521} -11/07/2021 03:59:44 - INFO - __main__ - Step 47924: {'lr': 0.0003903320544311386, 'samples': 9201408, 'steps': 47923, 'loss/train': 1.2611238956451416} -11/07/2021 03:59:45 - INFO - __main__ - Step 47925: {'lr': 0.0003903276625735791, 'samples': 9201600, 'steps': 47924, 'loss/train': 1.5550249814987183} -11/07/2021 03:59:45 - INFO - __main__ - Step 47926: {'lr': 0.00039032327065279015, 'samples': 9201792, 'steps': 47925, 'loss/train': 0.6004175543785095} -11/07/2021 03:59:45 - INFO - __main__ - Step 47927: {'lr': 0.0003903188786687737, 'samples': 9201984, 'steps': 47926, 'loss/train': 1.0430054664611816} -11/07/2021 03:59:46 - INFO - __main__ - Step 47928: {'lr': 0.0003903144866215317, 'samples': 9202176, 'steps': 47927, 'loss/train': 1.3700852394104004} -11/07/2021 03:59:47 - INFO - __main__ - Step 47929: {'lr': 0.0003903100945110661, 'samples': 9202368, 'steps': 47928, 'loss/train': 1.3961900472640991} -11/07/2021 03:59:47 - INFO - __main__ - Step 47930: {'lr': 0.00039030570233737903, 'samples': 9202560, 'steps': 47929, 'loss/train': 1.1518902778625488} -11/07/2021 03:59:48 - INFO - __main__ - Step 47931: {'lr': 0.0003903013101004724, 'samples': 9202752, 'steps': 47930, 'loss/train': 1.6772443056106567} -11/07/2021 03:59:48 - INFO - __main__ - Step 47932: {'lr': 0.00039029691780034814, 'samples': 9202944, 'steps': 47931, 'loss/train': 1.384472370147705} -11/07/2021 03:59:48 - INFO - __main__ - Step 47933: {'lr': 0.00039029252543700823, 'samples': 9203136, 'steps': 47932, 'loss/train': 1.481557846069336} -11/07/2021 03:59:49 - INFO - __main__ - Step 47934: {'lr': 0.0003902881330104546, 'samples': 9203328, 'steps': 47933, 'loss/train': 1.4954843521118164} -11/07/2021 03:59:50 - INFO - __main__ - Step 47935: {'lr': 0.00039028374052068937, 'samples': 9203520, 'steps': 47934, 'loss/train': 1.54979407787323} -11/07/2021 03:59:50 - INFO - __main__ - Step 47936: {'lr': 0.0003902793479677145, 'samples': 9203712, 'steps': 47935, 'loss/train': 1.6774086952209473} -11/07/2021 03:59:50 - INFO - __main__ - Step 47937: {'lr': 0.00039027495535153185, 'samples': 9203904, 'steps': 47936, 'loss/train': 1.4777233600616455} -11/07/2021 03:59:51 - INFO - __main__ - Step 47938: {'lr': 0.0003902705626721435, 'samples': 9204096, 'steps': 47937, 'loss/train': 0.9641197323799133} -11/07/2021 03:59:51 - INFO - __main__ - Step 47939: {'lr': 0.00039026616992955145, 'samples': 9204288, 'steps': 47938, 'loss/train': 1.1526705026626587} -11/07/2021 03:59:52 - INFO - __main__ - Step 47940: {'lr': 0.0003902617771237575, 'samples': 9204480, 'steps': 47939, 'loss/train': 1.3181544542312622} -11/07/2021 03:59:52 - INFO - __main__ - Step 47941: {'lr': 0.0003902573842547639, 'samples': 9204672, 'steps': 47940, 'loss/train': 1.266067385673523} -11/07/2021 03:59:53 - INFO - __main__ - Step 47942: {'lr': 0.00039025299132257243, 'samples': 9204864, 'steps': 47941, 'loss/train': 1.1862119436264038} -11/07/2021 03:59:53 - INFO - __main__ - Step 47943: {'lr': 0.00039024859832718505, 'samples': 9205056, 'steps': 47942, 'loss/train': 1.8826212882995605} -11/07/2021 03:59:54 - INFO - __main__ - Step 47944: {'lr': 0.0003902442052686039, 'samples': 9205248, 'steps': 47943, 'loss/train': 1.5753989219665527} -11/07/2021 03:59:55 - INFO - __main__ - Step 47945: {'lr': 0.00039023981214683087, 'samples': 9205440, 'steps': 47944, 'loss/train': 1.1622357368469238} -11/07/2021 03:59:55 - INFO - __main__ - Step 47946: {'lr': 0.0003902354189618679, 'samples': 9205632, 'steps': 47945, 'loss/train': 1.7712570428848267} -11/07/2021 03:59:55 - INFO - __main__ - Step 47947: {'lr': 0.00039023102571371707, 'samples': 9205824, 'steps': 47946, 'loss/train': 1.6194078922271729} -11/07/2021 03:59:56 - INFO - __main__ - Step 47948: {'lr': 0.0003902266324023803, 'samples': 9206016, 'steps': 47947, 'loss/train': 1.4775843620300293} -11/07/2021 03:59:56 - INFO - __main__ - Step 47949: {'lr': 0.00039022223902785954, 'samples': 9206208, 'steps': 47948, 'loss/train': 1.5144954919815063} -11/07/2021 03:59:57 - INFO - __main__ - Step 47950: {'lr': 0.0003902178455901568, 'samples': 9206400, 'steps': 47949, 'loss/train': 1.2559685707092285} -11/07/2021 03:59:57 - INFO - __main__ - Step 47951: {'lr': 0.00039021345208927404, 'samples': 9206592, 'steps': 47950, 'loss/train': 1.4207682609558105} -11/07/2021 03:59:58 - INFO - __main__ - Step 47952: {'lr': 0.0003902090585252133, 'samples': 9206784, 'steps': 47951, 'loss/train': 1.2095712423324585} -11/07/2021 03:59:58 - INFO - __main__ - Step 47953: {'lr': 0.0003902046648979766, 'samples': 9206976, 'steps': 47952, 'loss/train': 1.166861891746521} -11/07/2021 03:59:59 - INFO - __main__ - Step 47954: {'lr': 0.00039020027120756573, 'samples': 9207168, 'steps': 47953, 'loss/train': 0.9656014442443848} -11/07/2021 03:59:59 - INFO - __main__ - Step 47955: {'lr': 0.00039019587745398276, 'samples': 9207360, 'steps': 47954, 'loss/train': 1.032138466835022} -11/07/2021 04:00:00 - INFO - __main__ - Step 47956: {'lr': 0.0003901914836372298, 'samples': 9207552, 'steps': 47955, 'loss/train': 1.3611185550689697} -11/07/2021 04:00:00 - INFO - __main__ - Step 47957: {'lr': 0.00039018708975730864, 'samples': 9207744, 'steps': 47956, 'loss/train': 1.2215360403060913} -11/07/2021 04:00:01 - INFO - __main__ - Step 47958: {'lr': 0.0003901826958142214, 'samples': 9207936, 'steps': 47957, 'loss/train': 1.4965671300888062} -11/07/2021 04:00:01 - INFO - __main__ - Step 47959: {'lr': 0.0003901783018079699, 'samples': 9208128, 'steps': 47958, 'loss/train': 1.5038868188858032} -11/07/2021 04:00:02 - INFO - __main__ - Step 47960: {'lr': 0.0003901739077385563, 'samples': 9208320, 'steps': 47959, 'loss/train': 1.7007519006729126} -11/07/2021 04:00:02 - INFO - __main__ - Step 47961: {'lr': 0.0003901695136059825, 'samples': 9208512, 'steps': 47960, 'loss/train': 1.1992660760879517} -11/07/2021 04:00:03 - INFO - __main__ - Step 47962: {'lr': 0.00039016511941025045, 'samples': 9208704, 'steps': 47961, 'loss/train': 2.0137312412261963} -11/07/2021 04:00:03 - INFO - __main__ - Step 47963: {'lr': 0.0003901607251513622, 'samples': 9208896, 'steps': 47962, 'loss/train': 1.7977275848388672} -11/07/2021 04:00:03 - INFO - __main__ - Step 47964: {'lr': 0.0003901563308293197, 'samples': 9209088, 'steps': 47963, 'loss/train': 1.5365867614746094} -11/07/2021 04:00:04 - INFO - __main__ - Step 47965: {'lr': 0.0003901519364441248, 'samples': 9209280, 'steps': 47964, 'loss/train': 1.5069364309310913} -11/07/2021 04:00:05 - INFO - __main__ - Step 47966: {'lr': 0.0003901475419957797, 'samples': 9209472, 'steps': 47965, 'loss/train': 1.3223764896392822} -11/07/2021 04:00:05 - INFO - __main__ - Step 47967: {'lr': 0.0003901431474842863, 'samples': 9209664, 'steps': 47966, 'loss/train': 1.5235975980758667} -11/07/2021 04:00:05 - INFO - __main__ - Step 47968: {'lr': 0.0003901387529096465, 'samples': 9209856, 'steps': 47967, 'loss/train': 1.5078519582748413} -11/07/2021 04:00:06 - INFO - __main__ - Step 47969: {'lr': 0.0003901343582718624, 'samples': 9210048, 'steps': 47968, 'loss/train': 1.3114722967147827} -11/07/2021 04:00:06 - INFO - __main__ - Step 47970: {'lr': 0.0003901299635709359, 'samples': 9210240, 'steps': 47969, 'loss/train': 1.4865241050720215} -11/07/2021 04:00:07 - INFO - __main__ - Step 47971: {'lr': 0.00039012556880686897, 'samples': 9210432, 'steps': 47970, 'loss/train': 0.869248628616333} -11/07/2021 04:00:08 - INFO - __main__ - Step 47972: {'lr': 0.00039012117397966363, 'samples': 9210624, 'steps': 47971, 'loss/train': 1.566467046737671} -11/07/2021 04:00:08 - INFO - __main__ - Step 47973: {'lr': 0.00039011677908932184, 'samples': 9210816, 'steps': 47972, 'loss/train': 1.6380442380905151} -11/07/2021 04:00:08 - INFO - __main__ - Step 47974: {'lr': 0.00039011238413584566, 'samples': 9211008, 'steps': 47973, 'loss/train': 2.1799044609069824} -11/07/2021 04:00:09 - INFO - __main__ - Step 47975: {'lr': 0.0003901079891192369, 'samples': 9211200, 'steps': 47974, 'loss/train': 0.16520646214485168} -11/07/2021 04:00:10 - INFO - __main__ - Step 47976: {'lr': 0.00039010359403949776, 'samples': 9211392, 'steps': 47975, 'loss/train': 1.1269757747650146} -11/07/2021 04:00:10 - INFO - __main__ - Step 47977: {'lr': 0.00039009919889663005, 'samples': 9211584, 'steps': 47976, 'loss/train': 2.0871849060058594} -11/07/2021 04:00:10 - INFO - __main__ - Step 47978: {'lr': 0.00039009480369063575, 'samples': 9211776, 'steps': 47977, 'loss/train': 1.1506580114364624} -11/07/2021 04:00:11 - INFO - __main__ - Step 47979: {'lr': 0.000390090408421517, 'samples': 9211968, 'steps': 47978, 'loss/train': 1.7109673023223877} -11/07/2021 04:00:11 - INFO - __main__ - Step 47980: {'lr': 0.0003900860130892756, 'samples': 9212160, 'steps': 47979, 'loss/train': 1.2497364282608032} -11/07/2021 04:00:12 - INFO - __main__ - Step 47981: {'lr': 0.0003900816176939136, 'samples': 9212352, 'steps': 47980, 'loss/train': 1.489717960357666} -11/07/2021 04:00:12 - INFO - __main__ - Step 47982: {'lr': 0.000390077222235433, 'samples': 9212544, 'steps': 47981, 'loss/train': 1.4342354536056519} -11/07/2021 04:00:13 - INFO - __main__ - Step 47983: {'lr': 0.0003900728267138357, 'samples': 9212736, 'steps': 47982, 'loss/train': 1.5929369926452637} -11/07/2021 04:00:13 - INFO - __main__ - Step 47984: {'lr': 0.0003900684311291238, 'samples': 9212928, 'steps': 47983, 'loss/train': 0.9831579327583313} -11/07/2021 04:00:14 - INFO - __main__ - Step 47985: {'lr': 0.0003900640354812992, 'samples': 9213120, 'steps': 47984, 'loss/train': 1.508144736289978} -11/07/2021 04:00:15 - INFO - __main__ - Step 47986: {'lr': 0.000390059639770364, 'samples': 9213312, 'steps': 47985, 'loss/train': 1.419266700744629} -11/07/2021 04:00:15 - INFO - __main__ - Step 47987: {'lr': 0.0003900552439963201, 'samples': 9213504, 'steps': 47986, 'loss/train': 1.4877800941467285} -11/07/2021 04:00:15 - INFO - __main__ - Step 47988: {'lr': 0.0003900508481591694, 'samples': 9213696, 'steps': 47987, 'loss/train': 1.4193735122680664} -11/07/2021 04:00:16 - INFO - __main__ - Step 47989: {'lr': 0.00039004645225891387, 'samples': 9213888, 'steps': 47988, 'loss/train': 1.3641928434371948} -11/07/2021 04:00:16 - INFO - __main__ - Step 47990: {'lr': 0.0003900420562955557, 'samples': 9214080, 'steps': 47989, 'loss/train': 1.297823429107666} -11/07/2021 04:00:16 - INFO - __main__ - Step 47991: {'lr': 0.0003900376602690966, 'samples': 9214272, 'steps': 47990, 'loss/train': 1.5094558000564575} -11/07/2021 04:00:17 - INFO - __main__ - Step 47992: {'lr': 0.0003900332641795388, 'samples': 9214464, 'steps': 47991, 'loss/train': 1.933498740196228} -11/07/2021 04:00:18 - INFO - __main__ - Step 47993: {'lr': 0.0003900288680268842, 'samples': 9214656, 'steps': 47992, 'loss/train': 1.278651237487793} -11/07/2021 04:00:18 - INFO - __main__ - Step 47994: {'lr': 0.00039002447181113464, 'samples': 9214848, 'steps': 47993, 'loss/train': 2.1139328479766846} -11/07/2021 04:00:18 - INFO - __main__ - Step 47995: {'lr': 0.0003900200755322923, 'samples': 9215040, 'steps': 47994, 'loss/train': 1.141119360923767} -11/07/2021 04:00:19 - INFO - __main__ - Step 47996: {'lr': 0.0003900156791903591, 'samples': 9215232, 'steps': 47995, 'loss/train': 1.348052740097046} -11/07/2021 04:00:20 - INFO - __main__ - Step 47997: {'lr': 0.0003900112827853369, 'samples': 9215424, 'steps': 47996, 'loss/train': 1.3135474920272827} -11/07/2021 04:00:20 - INFO - __main__ - Step 47998: {'lr': 0.0003900068863172278, 'samples': 9215616, 'steps': 47997, 'loss/train': 1.4085980653762817} -11/07/2021 04:00:21 - INFO - __main__ - Step 47999: {'lr': 0.0003900024897860338, 'samples': 9215808, 'steps': 47998, 'loss/train': 1.8113974332809448} -11/07/2021 04:00:21 - INFO - __main__ - Step 48000: {'lr': 0.00038999809319175684, 'samples': 9216000, 'steps': 47999, 'loss/train': 0.4227254092693329} -11/07/2021 04:00:21 - INFO - __main__ - Step 48001: {'lr': 0.0003899936965343989, 'samples': 9216192, 'steps': 48000, 'loss/train': 1.8167829513549805} -11/07/2021 04:00:22 - INFO - __main__ - Step 48002: {'lr': 0.00038998929981396194, 'samples': 9216384, 'steps': 48001, 'loss/train': 1.4759230613708496} -11/07/2021 04:00:23 - INFO - __main__ - Step 48003: {'lr': 0.0003899849030304479, 'samples': 9216576, 'steps': 48002, 'loss/train': 2.544011116027832} -11/07/2021 04:00:23 - INFO - __main__ - Step 48004: {'lr': 0.0003899805061838589, 'samples': 9216768, 'steps': 48003, 'loss/train': 1.7079887390136719} -11/07/2021 04:00:24 - INFO - __main__ - Step 48005: {'lr': 0.0003899761092741968, 'samples': 9216960, 'steps': 48004, 'loss/train': 1.6452378034591675} -11/07/2021 04:00:24 - INFO - __main__ - Step 48006: {'lr': 0.00038997171230146366, 'samples': 9217152, 'steps': 48005, 'loss/train': 1.3807014226913452} -11/07/2021 04:00:24 - INFO - __main__ - Step 48007: {'lr': 0.0003899673152656614, 'samples': 9217344, 'steps': 48006, 'loss/train': 1.7523833513259888} -11/07/2021 04:00:25 - INFO - __main__ - Step 48008: {'lr': 0.0003899629181667921, 'samples': 9217536, 'steps': 48007, 'loss/train': 1.784700632095337} -11/07/2021 04:00:26 - INFO - __main__ - Step 48009: {'lr': 0.0003899585210048576, 'samples': 9217728, 'steps': 48008, 'loss/train': 1.3834120035171509} -11/07/2021 04:00:26 - INFO - __main__ - Step 48010: {'lr': 0.0003899541237798599, 'samples': 9217920, 'steps': 48009, 'loss/train': 1.6663899421691895} -11/07/2021 04:00:26 - INFO - __main__ - Step 48011: {'lr': 0.0003899497264918012, 'samples': 9218112, 'steps': 48010, 'loss/train': 1.1437512636184692} -11/07/2021 04:00:27 - INFO - __main__ - Step 48012: {'lr': 0.00038994532914068313, 'samples': 9218304, 'steps': 48011, 'loss/train': 1.5247350931167603} -11/07/2021 04:00:28 - INFO - __main__ - Step 48013: {'lr': 0.00038994093172650804, 'samples': 9218496, 'steps': 48012, 'loss/train': 1.5147181749343872} -11/07/2021 04:00:28 - INFO - __main__ - Step 48014: {'lr': 0.00038993653424927754, 'samples': 9218688, 'steps': 48013, 'loss/train': 1.5079004764556885} -11/07/2021 04:00:29 - INFO - __main__ - Step 48015: {'lr': 0.00038993213670899385, 'samples': 9218880, 'steps': 48014, 'loss/train': 1.1028234958648682} -11/07/2021 04:00:29 - INFO - __main__ - Step 48016: {'lr': 0.000389927739105659, 'samples': 9219072, 'steps': 48015, 'loss/train': 1.5839699506759644} -11/07/2021 04:00:29 - INFO - __main__ - Step 48017: {'lr': 0.0003899233414392748, 'samples': 9219264, 'steps': 48016, 'loss/train': 1.3747262954711914} -11/07/2021 04:00:30 - INFO - __main__ - Step 48018: {'lr': 0.0003899189437098433, 'samples': 9219456, 'steps': 48017, 'loss/train': 1.2862333059310913} -11/07/2021 04:00:31 - INFO - __main__ - Step 48019: {'lr': 0.00038991454591736643, 'samples': 9219648, 'steps': 48018, 'loss/train': 1.1262879371643066} -11/07/2021 04:00:31 - INFO - __main__ - Step 48020: {'lr': 0.00038991014806184635, 'samples': 9219840, 'steps': 48019, 'loss/train': 1.2946993112564087} -11/07/2021 04:00:31 - INFO - __main__ - Step 48021: {'lr': 0.0003899057501432848, 'samples': 9220032, 'steps': 48020, 'loss/train': 1.6199647188186646} -11/07/2021 04:00:32 - INFO - __main__ - Step 48022: {'lr': 0.0003899013521616839, 'samples': 9220224, 'steps': 48021, 'loss/train': 1.3253999948501587} -11/07/2021 04:00:33 - INFO - __main__ - Step 48023: {'lr': 0.0003898969541170456, 'samples': 9220416, 'steps': 48022, 'loss/train': 1.4175102710723877} -11/07/2021 04:00:33 - INFO - __main__ - Step 48024: {'lr': 0.0003898925560093719, 'samples': 9220608, 'steps': 48023, 'loss/train': 1.3709696531295776} -11/07/2021 04:00:33 - INFO - __main__ - Step 48025: {'lr': 0.00038988815783866485, 'samples': 9220800, 'steps': 48024, 'loss/train': 1.568740725517273} -11/07/2021 04:00:34 - INFO - __main__ - Step 48026: {'lr': 0.00038988375960492626, 'samples': 9220992, 'steps': 48025, 'loss/train': 1.8158372640609741} -11/07/2021 04:00:34 - INFO - __main__ - Step 48027: {'lr': 0.0003898793613081583, 'samples': 9221184, 'steps': 48026, 'loss/train': 1.3739103078842163} -11/07/2021 04:00:36 - INFO - __main__ - Step 48028: {'lr': 0.0003898749629483628, 'samples': 9221376, 'steps': 48027, 'loss/train': 2.0244140625} -11/07/2021 04:00:36 - INFO - __main__ - Step 48029: {'lr': 0.00038987056452554177, 'samples': 9221568, 'steps': 48028, 'loss/train': 1.6520586013793945} -11/07/2021 04:00:36 - INFO - __main__ - Step 48030: {'lr': 0.0003898661660396973, 'samples': 9221760, 'steps': 48029, 'loss/train': 1.8628299236297607} -11/07/2021 04:00:37 - INFO - __main__ - Step 48031: {'lr': 0.00038986176749083117, 'samples': 9221952, 'steps': 48030, 'loss/train': 0.3103807270526886} -11/07/2021 04:00:37 - INFO - __main__ - Step 48032: {'lr': 0.0003898573688789456, 'samples': 9222144, 'steps': 48031, 'loss/train': 0.3190688192844391} -11/07/2021 04:00:38 - INFO - __main__ - Step 48033: {'lr': 0.0003898529702040424, 'samples': 9222336, 'steps': 48032, 'loss/train': 1.669013261795044} -11/07/2021 04:00:38 - INFO - __main__ - Step 48034: {'lr': 0.00038984857146612365, 'samples': 9222528, 'steps': 48033, 'loss/train': 1.5042675733566284} -11/07/2021 04:00:39 - INFO - __main__ - Step 48035: {'lr': 0.00038984417266519126, 'samples': 9222720, 'steps': 48034, 'loss/train': 1.2486090660095215} -11/07/2021 04:00:39 - INFO - __main__ - Step 48036: {'lr': 0.00038983977380124726, 'samples': 9222912, 'steps': 48035, 'loss/train': 1.455985426902771} -11/07/2021 04:00:39 - INFO - __main__ - Step 48037: {'lr': 0.0003898353748742936, 'samples': 9223104, 'steps': 48036, 'loss/train': 1.2599023580551147} -11/07/2021 04:00:40 - INFO - __main__ - Step 48038: {'lr': 0.00038983097588433225, 'samples': 9223296, 'steps': 48037, 'loss/train': 1.5512021780014038} -11/07/2021 04:00:41 - INFO - __main__ - Step 48039: {'lr': 0.00038982657683136524, 'samples': 9223488, 'steps': 48038, 'loss/train': 1.6784405708312988} -11/07/2021 04:00:41 - INFO - __main__ - Step 48040: {'lr': 0.00038982217771539466, 'samples': 9223680, 'steps': 48039, 'loss/train': 1.306701898574829} -11/07/2021 04:00:42 - INFO - __main__ - Step 48041: {'lr': 0.0003898177785364222, 'samples': 9223872, 'steps': 48040, 'loss/train': 1.0747727155685425} -11/07/2021 04:00:42 - INFO - __main__ - Step 48042: {'lr': 0.00038981337929445004, 'samples': 9224064, 'steps': 48041, 'loss/train': 1.4584308862686157} -11/07/2021 04:00:42 - INFO - __main__ - Step 48043: {'lr': 0.0003898089799894802, 'samples': 9224256, 'steps': 48042, 'loss/train': 1.5404750108718872} -11/07/2021 04:00:43 - INFO - __main__ - Step 48044: {'lr': 0.0003898045806215145, 'samples': 9224448, 'steps': 48043, 'loss/train': 1.6170690059661865} -11/07/2021 04:00:44 - INFO - __main__ - Step 48045: {'lr': 0.00038980018119055506, 'samples': 9224640, 'steps': 48044, 'loss/train': 1.2645432949066162} -11/07/2021 04:00:44 - INFO - __main__ - Step 48046: {'lr': 0.00038979578169660384, 'samples': 9224832, 'steps': 48045, 'loss/train': 1.5899505615234375} -11/07/2021 04:00:44 - INFO - __main__ - Step 48047: {'lr': 0.0003897913821396628, 'samples': 9225024, 'steps': 48046, 'loss/train': 1.07871675491333} -11/07/2021 04:00:45 - INFO - __main__ - Step 48048: {'lr': 0.0003897869825197339, 'samples': 9225216, 'steps': 48047, 'loss/train': 2.3908605575561523} -11/07/2021 04:00:46 - INFO - __main__ - Step 48049: {'lr': 0.0003897825828368191, 'samples': 9225408, 'steps': 48048, 'loss/train': 1.2328208684921265} -11/07/2021 04:00:46 - INFO - __main__ - Step 48050: {'lr': 0.0003897781830909204, 'samples': 9225600, 'steps': 48049, 'loss/train': 1.1049468517303467} -11/07/2021 04:00:46 - INFO - __main__ - Step 48051: {'lr': 0.00038977378328203987, 'samples': 9225792, 'steps': 48050, 'loss/train': 1.367971658706665} -11/07/2021 04:00:47 - INFO - __main__ - Step 48052: {'lr': 0.0003897693834101794, 'samples': 9225984, 'steps': 48051, 'loss/train': 1.1159980297088623} -11/07/2021 04:00:47 - INFO - __main__ - Step 48053: {'lr': 0.00038976498347534106, 'samples': 9226176, 'steps': 48052, 'loss/train': 1.4800593852996826} -11/07/2021 04:00:48 - INFO - __main__ - Step 48054: {'lr': 0.0003897605834775267, 'samples': 9226368, 'steps': 48053, 'loss/train': 1.5713735818862915} -11/07/2021 04:00:49 - INFO - __main__ - Step 48055: {'lr': 0.00038975618341673845, 'samples': 9226560, 'steps': 48054, 'loss/train': 1.028491735458374} -11/07/2021 04:00:49 - INFO - __main__ - Step 48056: {'lr': 0.0003897517832929782, 'samples': 9226752, 'steps': 48055, 'loss/train': 1.6298503875732422} -11/07/2021 04:00:49 - INFO - __main__ - Step 48057: {'lr': 0.00038974738310624797, 'samples': 9226944, 'steps': 48056, 'loss/train': 1.0520175695419312} -11/07/2021 04:00:50 - INFO - __main__ - Step 48058: {'lr': 0.00038974298285654967, 'samples': 9227136, 'steps': 48057, 'loss/train': 1.0178232192993164} -11/07/2021 04:00:51 - INFO - __main__ - Step 48059: {'lr': 0.0003897385825438854, 'samples': 9227328, 'steps': 48058, 'loss/train': 1.4590984582901} -11/07/2021 04:00:51 - INFO - __main__ - Step 48060: {'lr': 0.0003897341821682571, 'samples': 9227520, 'steps': 48059, 'loss/train': 0.2315509021282196} -11/07/2021 04:00:51 - INFO - __main__ - Step 48061: {'lr': 0.0003897297817296667, 'samples': 9227712, 'steps': 48060, 'loss/train': 1.2649005651474} -11/07/2021 04:00:52 - INFO - __main__ - Step 48062: {'lr': 0.00038972538122811613, 'samples': 9227904, 'steps': 48061, 'loss/train': 1.64288330078125} -11/07/2021 04:00:52 - INFO - __main__ - Step 48063: {'lr': 0.00038972098066360753, 'samples': 9228096, 'steps': 48062, 'loss/train': 1.4780681133270264} -11/07/2021 04:00:52 - INFO - __main__ - Step 48064: {'lr': 0.0003897165800361427, 'samples': 9228288, 'steps': 48063, 'loss/train': 1.5908677577972412} -11/07/2021 04:00:53 - INFO - __main__ - Step 48065: {'lr': 0.0003897121793457239, 'samples': 9228480, 'steps': 48064, 'loss/train': 1.5628256797790527} -11/07/2021 04:00:54 - INFO - __main__ - Step 48066: {'lr': 0.0003897077785923529, 'samples': 9228672, 'steps': 48065, 'loss/train': 1.6030704975128174} -11/07/2021 04:00:54 - INFO - __main__ - Step 48067: {'lr': 0.0003897033777760318, 'samples': 9228864, 'steps': 48066, 'loss/train': 1.1855614185333252} -11/07/2021 04:00:55 - INFO - __main__ - Step 48068: {'lr': 0.0003896989768967624, 'samples': 9229056, 'steps': 48067, 'loss/train': 1.5664584636688232} -11/07/2021 04:00:55 - INFO - __main__ - Step 48069: {'lr': 0.0003896945759545468, 'samples': 9229248, 'steps': 48068, 'loss/train': 1.6907851696014404} -11/07/2021 04:00:56 - INFO - __main__ - Step 48070: {'lr': 0.000389690174949387, 'samples': 9229440, 'steps': 48069, 'loss/train': 1.2275843620300293} -11/07/2021 04:00:56 - INFO - __main__ - Step 48071: {'lr': 0.00038968577388128503, 'samples': 9229632, 'steps': 48070, 'loss/train': 1.7831544876098633} -11/07/2021 04:00:57 - INFO - __main__ - Step 48072: {'lr': 0.00038968137275024274, 'samples': 9229824, 'steps': 48071, 'loss/train': 1.374072551727295} -11/07/2021 04:00:57 - INFO - __main__ - Step 48073: {'lr': 0.0003896769715562622, 'samples': 9230016, 'steps': 48072, 'loss/train': 1.4499943256378174} -11/07/2021 04:00:57 - INFO - __main__ - Step 48074: {'lr': 0.0003896725702993453, 'samples': 9230208, 'steps': 48073, 'loss/train': 0.9299537539482117} -11/07/2021 04:00:58 - INFO - __main__ - Step 48075: {'lr': 0.0003896681689794942, 'samples': 9230400, 'steps': 48074, 'loss/train': 1.2336264848709106} -11/07/2021 04:00:59 - INFO - __main__ - Step 48076: {'lr': 0.00038966376759671075, 'samples': 9230592, 'steps': 48075, 'loss/train': 1.3669625520706177} -11/07/2021 04:00:59 - INFO - __main__ - Step 48077: {'lr': 0.00038965936615099694, 'samples': 9230784, 'steps': 48076, 'loss/train': 1.556752324104309} -11/07/2021 04:00:59 - INFO - __main__ - Step 48078: {'lr': 0.0003896549646423548, 'samples': 9230976, 'steps': 48077, 'loss/train': 1.269991159439087} -11/07/2021 04:01:00 - INFO - __main__ - Step 48079: {'lr': 0.0003896505630707863, 'samples': 9231168, 'steps': 48078, 'loss/train': 1.0601564645767212} -11/07/2021 04:01:01 - INFO - __main__ - Step 48080: {'lr': 0.00038964616143629337, 'samples': 9231360, 'steps': 48079, 'loss/train': 1.5609855651855469} -11/07/2021 04:01:01 - INFO - __main__ - Step 48081: {'lr': 0.00038964175973887807, 'samples': 9231552, 'steps': 48080, 'loss/train': 1.0855125188827515} -11/07/2021 04:01:02 - INFO - __main__ - Step 48082: {'lr': 0.0003896373579785423, 'samples': 9231744, 'steps': 48081, 'loss/train': 1.7724723815917969} -11/07/2021 04:01:02 - INFO - __main__ - Step 48083: {'lr': 0.00038963295615528803, 'samples': 9231936, 'steps': 48082, 'loss/train': 1.3519500494003296} -11/07/2021 04:01:02 - INFO - __main__ - Step 48084: {'lr': 0.00038962855426911746, 'samples': 9232128, 'steps': 48083, 'loss/train': 1.6795637607574463} -11/07/2021 04:01:03 - INFO - __main__ - Step 48085: {'lr': 0.00038962415232003233, 'samples': 9232320, 'steps': 48084, 'loss/train': 1.6219850778579712} -11/07/2021 04:01:04 - INFO - __main__ - Step 48086: {'lr': 0.00038961975030803474, 'samples': 9232512, 'steps': 48085, 'loss/train': 1.5682246685028076} -11/07/2021 04:01:04 - INFO - __main__ - Step 48087: {'lr': 0.00038961534823312664, 'samples': 9232704, 'steps': 48086, 'loss/train': 1.5759390592575073} -11/07/2021 04:01:04 - INFO - __main__ - Step 48088: {'lr': 0.00038961094609531, 'samples': 9232896, 'steps': 48087, 'loss/train': 1.3574557304382324} -11/07/2021 04:01:05 - INFO - __main__ - Step 48089: {'lr': 0.00038960654389458684, 'samples': 9233088, 'steps': 48088, 'loss/train': 1.263695478439331} -11/07/2021 04:01:05 - INFO - __main__ - Step 48090: {'lr': 0.0003896021416309591, 'samples': 9233280, 'steps': 48089, 'loss/train': 1.3953235149383545} -11/07/2021 04:01:06 - INFO - __main__ - Step 48091: {'lr': 0.0003895977393044288, 'samples': 9233472, 'steps': 48090, 'loss/train': 1.786818504333496} -11/07/2021 04:01:06 - INFO - __main__ - Step 48092: {'lr': 0.00038959333691499794, 'samples': 9233664, 'steps': 48091, 'loss/train': 1.076110601425171} -11/07/2021 04:01:07 - INFO - __main__ - Step 48093: {'lr': 0.00038958893446266844, 'samples': 9233856, 'steps': 48092, 'loss/train': 1.581133246421814} -11/07/2021 04:01:07 - INFO - __main__ - Step 48094: {'lr': 0.00038958453194744237, 'samples': 9234048, 'steps': 48093, 'loss/train': 1.5100988149642944} -11/07/2021 04:01:07 - INFO - __main__ - Step 48095: {'lr': 0.0003895801293693216, 'samples': 9234240, 'steps': 48094, 'loss/train': 1.3519607782363892} -11/07/2021 04:01:09 - INFO - __main__ - Step 48096: {'lr': 0.0003895757267283082, 'samples': 9234432, 'steps': 48095, 'loss/train': 1.5387576818466187} -11/07/2021 04:01:09 - INFO - __main__ - Step 48097: {'lr': 0.0003895713240244042, 'samples': 9234624, 'steps': 48096, 'loss/train': 1.3814644813537598} -11/07/2021 04:01:09 - INFO - __main__ - Step 48098: {'lr': 0.0003895669212576114, 'samples': 9234816, 'steps': 48097, 'loss/train': 1.592847228050232} -11/07/2021 04:01:10 - INFO - __main__ - Step 48099: {'lr': 0.000389562518427932, 'samples': 9235008, 'steps': 48098, 'loss/train': 1.7075380086898804} -11/07/2021 04:01:10 - INFO - __main__ - Step 48100: {'lr': 0.00038955811553536787, 'samples': 9235200, 'steps': 48099, 'loss/train': 1.761032223701477} -11/07/2021 04:01:11 - INFO - __main__ - Step 48101: {'lr': 0.00038955371257992096, 'samples': 9235392, 'steps': 48100, 'loss/train': 2.054033041000366} -11/07/2021 04:01:11 - INFO - __main__ - Step 48102: {'lr': 0.0003895493095615933, 'samples': 9235584, 'steps': 48101, 'loss/train': 1.3840248584747314} -11/07/2021 04:01:12 - INFO - __main__ - Step 48103: {'lr': 0.00038954490648038687, 'samples': 9235776, 'steps': 48102, 'loss/train': 1.024058222770691} -11/07/2021 04:01:12 - INFO - __main__ - Step 48104: {'lr': 0.0003895405033363037, 'samples': 9235968, 'steps': 48103, 'loss/train': 1.359765648841858} -11/07/2021 04:01:12 - INFO - __main__ - Step 48105: {'lr': 0.0003895361001293457, 'samples': 9236160, 'steps': 48104, 'loss/train': 1.476563811302185} -11/07/2021 04:01:13 - INFO - __main__ - Step 48106: {'lr': 0.0003895316968595149, 'samples': 9236352, 'steps': 48105, 'loss/train': 1.8598228693008423} -11/07/2021 04:01:14 - INFO - __main__ - Step 48107: {'lr': 0.0003895272935268133, 'samples': 9236544, 'steps': 48106, 'loss/train': 1.3268775939941406} -11/07/2021 04:01:14 - INFO - __main__ - Step 48108: {'lr': 0.0003895228901312428, 'samples': 9236736, 'steps': 48107, 'loss/train': 0.6876649856567383} -11/07/2021 04:01:15 - INFO - __main__ - Step 48109: {'lr': 0.0003895184866728054, 'samples': 9236928, 'steps': 48108, 'loss/train': 1.5355066061019897} -11/07/2021 04:01:15 - INFO - __main__ - Step 48110: {'lr': 0.0003895140831515033, 'samples': 9237120, 'steps': 48109, 'loss/train': 1.507046103477478} -11/07/2021 04:01:15 - INFO - __main__ - Step 48111: {'lr': 0.0003895096795673381, 'samples': 9237312, 'steps': 48110, 'loss/train': 1.1604622602462769} -11/07/2021 04:01:16 - INFO - __main__ - Step 48112: {'lr': 0.0003895052759203121, 'samples': 9237504, 'steps': 48111, 'loss/train': 1.9194079637527466} -11/07/2021 04:01:17 - INFO - __main__ - Step 48113: {'lr': 0.0003895008722104272, 'samples': 9237696, 'steps': 48112, 'loss/train': 1.3934123516082764} -11/07/2021 04:01:17 - INFO - __main__ - Step 48114: {'lr': 0.00038949646843768526, 'samples': 9237888, 'steps': 48113, 'loss/train': 1.328235387802124} -11/07/2021 04:01:17 - INFO - __main__ - Step 48115: {'lr': 0.00038949206460208845, 'samples': 9238080, 'steps': 48114, 'loss/train': 1.8984450101852417} -11/07/2021 04:01:18 - INFO - __main__ - Step 48116: {'lr': 0.0003894876607036386, 'samples': 9238272, 'steps': 48115, 'loss/train': 1.4652715921401978} -11/07/2021 04:01:18 - INFO - __main__ - Step 48117: {'lr': 0.0003894832567423379, 'samples': 9238464, 'steps': 48116, 'loss/train': 1.687768578529358} -11/07/2021 04:01:19 - INFO - __main__ - Step 48118: {'lr': 0.00038947885271818807, 'samples': 9238656, 'steps': 48117, 'loss/train': 1.3348737955093384} -11/07/2021 04:01:20 - INFO - __main__ - Step 48119: {'lr': 0.0003894744486311912, 'samples': 9238848, 'steps': 48118, 'loss/train': 0.9331466555595398} -11/07/2021 04:01:20 - INFO - __main__ - Step 48120: {'lr': 0.00038947004448134937, 'samples': 9239040, 'steps': 48119, 'loss/train': 1.088590145111084} -11/07/2021 04:01:20 - INFO - __main__ - Step 48121: {'lr': 0.0003894656402686645, 'samples': 9239232, 'steps': 48120, 'loss/train': 2.1469006538391113} -11/07/2021 04:01:21 - INFO - __main__ - Step 48122: {'lr': 0.00038946123599313846, 'samples': 9239424, 'steps': 48121, 'loss/train': 1.62726628780365} -11/07/2021 04:01:22 - INFO - __main__ - Step 48123: {'lr': 0.0003894568316547734, 'samples': 9239616, 'steps': 48122, 'loss/train': 2.0312588214874268} -11/07/2021 04:01:22 - INFO - __main__ - Step 48124: {'lr': 0.00038945242725357127, 'samples': 9239808, 'steps': 48123, 'loss/train': 1.563032627105713} -11/07/2021 04:01:22 - INFO - __main__ - Step 48125: {'lr': 0.000389448022789534, 'samples': 9240000, 'steps': 48124, 'loss/train': 1.9691152572631836} -11/07/2021 04:01:23 - INFO - __main__ - Step 48126: {'lr': 0.0003894436182626636, 'samples': 9240192, 'steps': 48125, 'loss/train': 1.8409271240234375} -11/07/2021 04:01:23 - INFO - __main__ - Step 48127: {'lr': 0.00038943921367296213, 'samples': 9240384, 'steps': 48126, 'loss/train': 1.4550058841705322} -11/07/2021 04:01:24 - INFO - __main__ - Step 48128: {'lr': 0.00038943480902043146, 'samples': 9240576, 'steps': 48127, 'loss/train': 1.4334383010864258} -11/07/2021 04:01:24 - INFO - __main__ - Step 48129: {'lr': 0.0003894304043050736, 'samples': 9240768, 'steps': 48128, 'loss/train': 1.6067302227020264} -11/07/2021 04:01:25 - INFO - __main__ - Step 48130: {'lr': 0.0003894259995268905, 'samples': 9240960, 'steps': 48129, 'loss/train': 1.6146119832992554} -11/07/2021 04:01:25 - INFO - __main__ - Step 48131: {'lr': 0.00038942159468588423, 'samples': 9241152, 'steps': 48130, 'loss/train': 1.4710017442703247} -11/07/2021 04:01:25 - INFO - __main__ - Step 48132: {'lr': 0.00038941718978205674, 'samples': 9241344, 'steps': 48131, 'loss/train': 1.373228669166565} -11/07/2021 04:01:27 - INFO - __main__ - Step 48133: {'lr': 0.0003894127848154101, 'samples': 9241536, 'steps': 48132, 'loss/train': 1.3340827226638794} -11/07/2021 04:01:27 - INFO - __main__ - Step 48134: {'lr': 0.0003894083797859461, 'samples': 9241728, 'steps': 48133, 'loss/train': 1.859207034111023} -11/07/2021 04:01:27 - INFO - __main__ - Step 48135: {'lr': 0.00038940397469366695, 'samples': 9241920, 'steps': 48134, 'loss/train': 1.445658564567566} -11/07/2021 04:01:28 - INFO - __main__ - Step 48136: {'lr': 0.0003893995695385744, 'samples': 9242112, 'steps': 48135, 'loss/train': 1.6205159425735474} -11/07/2021 04:01:28 - INFO - __main__ - Step 48137: {'lr': 0.0003893951643206706, 'samples': 9242304, 'steps': 48136, 'loss/train': 0.8118087649345398} -11/07/2021 04:01:28 - INFO - __main__ - Step 48138: {'lr': 0.00038939075903995744, 'samples': 9242496, 'steps': 48137, 'loss/train': 1.5155673027038574} -11/07/2021 04:01:29 - INFO - __main__ - Step 48139: {'lr': 0.000389386353696437, 'samples': 9242688, 'steps': 48138, 'loss/train': 1.2779062986373901} -11/07/2021 04:01:30 - INFO - __main__ - Step 48140: {'lr': 0.0003893819482901113, 'samples': 9242880, 'steps': 48139, 'loss/train': 1.4969934225082397} -11/07/2021 04:01:30 - INFO - __main__ - Step 48141: {'lr': 0.0003893775428209822, 'samples': 9243072, 'steps': 48140, 'loss/train': 1.910718321800232} -11/07/2021 04:01:30 - INFO - __main__ - Step 48142: {'lr': 0.00038937313728905164, 'samples': 9243264, 'steps': 48141, 'loss/train': 1.4000948667526245} -11/07/2021 04:01:31 - INFO - __main__ - Step 48143: {'lr': 0.0003893687316943218, 'samples': 9243456, 'steps': 48142, 'loss/train': 1.5593124628067017} -11/07/2021 04:01:32 - INFO - __main__ - Step 48144: {'lr': 0.0003893643260367945, 'samples': 9243648, 'steps': 48143, 'loss/train': 2.035222053527832} -11/07/2021 04:01:32 - INFO - __main__ - Step 48145: {'lr': 0.00038935992031647183, 'samples': 9243840, 'steps': 48144, 'loss/train': 1.6396360397338867} -11/07/2021 04:01:33 - INFO - __main__ - Step 48146: {'lr': 0.00038935551453335573, 'samples': 9244032, 'steps': 48145, 'loss/train': 1.7988249063491821} -11/07/2021 04:01:33 - INFO - __main__ - Step 48147: {'lr': 0.00038935110868744817, 'samples': 9244224, 'steps': 48146, 'loss/train': 1.5400888919830322} -11/07/2021 04:01:33 - INFO - __main__ - Step 48148: {'lr': 0.0003893467027787511, 'samples': 9244416, 'steps': 48147, 'loss/train': 1.4044010639190674} -11/07/2021 04:01:34 - INFO - __main__ - Step 48149: {'lr': 0.00038934229680726663, 'samples': 9244608, 'steps': 48148, 'loss/train': 1.3595432043075562} -11/07/2021 04:01:35 - INFO - __main__ - Step 48150: {'lr': 0.0003893378907729966, 'samples': 9244800, 'steps': 48149, 'loss/train': 1.5146124362945557} -11/07/2021 04:01:35 - INFO - __main__ - Step 48151: {'lr': 0.0003893334846759431, 'samples': 9244992, 'steps': 48150, 'loss/train': 1.3512797355651855} -11/07/2021 04:01:35 - INFO - __main__ - Step 48152: {'lr': 0.0003893290785161081, 'samples': 9245184, 'steps': 48151, 'loss/train': 1.6466460227966309} -11/07/2021 04:01:36 - INFO - __main__ - Step 48153: {'lr': 0.00038932467229349353, 'samples': 9245376, 'steps': 48152, 'loss/train': 1.788167119026184} -11/07/2021 04:01:37 - INFO - __main__ - Step 48154: {'lr': 0.0003893202660081014, 'samples': 9245568, 'steps': 48153, 'loss/train': 1.78120756149292} -11/07/2021 04:01:37 - INFO - __main__ - Step 48155: {'lr': 0.00038931585965993384, 'samples': 9245760, 'steps': 48154, 'loss/train': 1.456383228302002} -11/07/2021 04:01:38 - INFO - __main__ - Step 48156: {'lr': 0.0003893114532489926, 'samples': 9245952, 'steps': 48155, 'loss/train': 0.7910884022712708} -11/07/2021 04:01:38 - INFO - __main__ - Step 48157: {'lr': 0.00038930704677527975, 'samples': 9246144, 'steps': 48156, 'loss/train': 1.9671176671981812} -11/07/2021 04:01:38 - INFO - __main__ - Step 48158: {'lr': 0.00038930264023879737, 'samples': 9246336, 'steps': 48157, 'loss/train': 1.5886300802230835} -11/07/2021 04:01:39 - INFO - __main__ - Step 48159: {'lr': 0.0003892982336395473, 'samples': 9246528, 'steps': 48158, 'loss/train': 1.5728018283843994} -11/07/2021 04:01:40 - INFO - __main__ - Step 48160: {'lr': 0.00038929382697753157, 'samples': 9246720, 'steps': 48159, 'loss/train': 1.4440854787826538} -11/07/2021 04:01:40 - INFO - __main__ - Step 48161: {'lr': 0.00038928942025275227, 'samples': 9246912, 'steps': 48160, 'loss/train': 1.386595606803894} -11/07/2021 04:01:41 - INFO - __main__ - Step 48162: {'lr': 0.00038928501346521127, 'samples': 9247104, 'steps': 48161, 'loss/train': 1.5824897289276123} -11/07/2021 04:01:41 - INFO - __main__ - Step 48163: {'lr': 0.0003892806066149106, 'samples': 9247296, 'steps': 48162, 'loss/train': 1.7923336029052734} -11/07/2021 04:01:41 - INFO - __main__ - Step 48164: {'lr': 0.00038927619970185225, 'samples': 9247488, 'steps': 48163, 'loss/train': 1.387700080871582} -11/07/2021 04:01:43 - INFO - __main__ - Step 48165: {'lr': 0.0003892717927260382, 'samples': 9247680, 'steps': 48164, 'loss/train': 1.330069661140442} -11/07/2021 04:01:43 - INFO - __main__ - Step 48166: {'lr': 0.00038926738568747035, 'samples': 9247872, 'steps': 48165, 'loss/train': 1.217962384223938} -11/07/2021 04:01:43 - INFO - __main__ - Step 48167: {'lr': 0.0003892629785861509, 'samples': 9248064, 'steps': 48166, 'loss/train': 1.3875772953033447} -11/07/2021 04:01:44 - INFO - __main__ - Step 48168: {'lr': 0.00038925857142208155, 'samples': 9248256, 'steps': 48167, 'loss/train': 1.591727614402771} -11/07/2021 04:01:44 - INFO - __main__ - Step 48169: {'lr': 0.0003892541641952645, 'samples': 9248448, 'steps': 48168, 'loss/train': 2.152301788330078} -11/07/2021 04:01:46 - INFO - __main__ - Step 48170: {'lr': 0.00038924975690570173, 'samples': 9248640, 'steps': 48169, 'loss/train': 0.714447021484375} -11/07/2021 04:01:46 - INFO - __main__ - Step 48171: {'lr': 0.0003892453495533951, 'samples': 9248832, 'steps': 48170, 'loss/train': 1.6348806619644165} -11/07/2021 04:01:47 - INFO - __main__ - Step 48172: {'lr': 0.0003892409421383467, 'samples': 9249024, 'steps': 48171, 'loss/train': 1.3700920343399048} -11/07/2021 04:01:47 - INFO - __main__ - Step 48173: {'lr': 0.0003892365346605584, 'samples': 9249216, 'steps': 48172, 'loss/train': 1.094175100326538} -11/07/2021 04:01:47 - INFO - __main__ - Step 48174: {'lr': 0.0003892321271200324, 'samples': 9249408, 'steps': 48173, 'loss/train': 1.1373343467712402} -11/07/2021 04:01:48 - INFO - __main__ - Step 48175: {'lr': 0.0003892277195167705, 'samples': 9249600, 'steps': 48174, 'loss/train': 0.7871014475822449} -11/07/2021 04:01:48 - INFO - __main__ - Step 48176: {'lr': 0.00038922331185077465, 'samples': 9249792, 'steps': 48175, 'loss/train': 0.7428754568099976} -11/07/2021 04:01:49 - INFO - __main__ - Step 48177: {'lr': 0.000389218904122047, 'samples': 9249984, 'steps': 48176, 'loss/train': 1.4595086574554443} -11/07/2021 04:01:49 - INFO - __main__ - Step 48178: {'lr': 0.00038921449633058945, 'samples': 9250176, 'steps': 48177, 'loss/train': 1.8247631788253784} -11/07/2021 04:01:50 - INFO - __main__ - Step 48179: {'lr': 0.00038921008847640407, 'samples': 9250368, 'steps': 48178, 'loss/train': 1.262622594833374} -11/07/2021 04:01:50 - INFO - __main__ - Step 48180: {'lr': 0.0003892056805594926, 'samples': 9250560, 'steps': 48179, 'loss/train': 1.541310429573059} -11/07/2021 04:01:50 - INFO - __main__ - Step 48181: {'lr': 0.0003892012725798574, 'samples': 9250752, 'steps': 48180, 'loss/train': 1.705743432044983} -11/07/2021 04:01:51 - INFO - __main__ - Step 48182: {'lr': 0.00038919686453750015, 'samples': 9250944, 'steps': 48181, 'loss/train': 1.821557641029358} -11/07/2021 04:01:52 - INFO - __main__ - Step 48183: {'lr': 0.0003891924564324229, 'samples': 9251136, 'steps': 48182, 'loss/train': 1.426300287246704} -11/07/2021 04:01:52 - INFO - __main__ - Step 48184: {'lr': 0.0003891880482646277, 'samples': 9251328, 'steps': 48183, 'loss/train': 1.5814155340194702} -11/07/2021 04:01:52 - INFO - __main__ - Step 48185: {'lr': 0.00038918364003411656, 'samples': 9251520, 'steps': 48184, 'loss/train': 1.4798948764801025} -11/07/2021 04:01:53 - INFO - __main__ - Step 48186: {'lr': 0.0003891792317408914, 'samples': 9251712, 'steps': 48185, 'loss/train': 1.9678324460983276} -11/07/2021 04:01:54 - INFO - __main__ - Step 48187: {'lr': 0.00038917482338495424, 'samples': 9251904, 'steps': 48186, 'loss/train': 1.6393036842346191} -11/07/2021 04:01:54 - INFO - __main__ - Step 48188: {'lr': 0.000389170414966307, 'samples': 9252096, 'steps': 48187, 'loss/train': 1.6283665895462036} -11/07/2021 04:01:55 - INFO - __main__ - Step 48189: {'lr': 0.0003891660064849518, 'samples': 9252288, 'steps': 48188, 'loss/train': 0.8630964756011963} -11/07/2021 04:01:55 - INFO - __main__ - Step 48190: {'lr': 0.00038916159794089044, 'samples': 9252480, 'steps': 48189, 'loss/train': 1.1445237398147583} -11/07/2021 04:01:55 - INFO - __main__ - Step 48191: {'lr': 0.00038915718933412515, 'samples': 9252672, 'steps': 48190, 'loss/train': 1.79466712474823} -11/07/2021 04:01:56 - INFO - __main__ - Step 48192: {'lr': 0.0003891527806646576, 'samples': 9252864, 'steps': 48191, 'loss/train': 1.5653927326202393} -11/07/2021 04:01:57 - INFO - __main__ - Step 48193: {'lr': 0.0003891483719324901, 'samples': 9253056, 'steps': 48192, 'loss/train': 1.4417861700057983} -11/07/2021 04:01:57 - INFO - __main__ - Step 48194: {'lr': 0.00038914396313762445, 'samples': 9253248, 'steps': 48193, 'loss/train': 1.647060751914978} -11/07/2021 04:01:57 - INFO - __main__ - Step 48195: {'lr': 0.00038913955428006265, 'samples': 9253440, 'steps': 48194, 'loss/train': 1.4309707880020142} -11/07/2021 04:01:58 - INFO - __main__ - Step 48196: {'lr': 0.00038913514535980675, 'samples': 9253632, 'steps': 48195, 'loss/train': 1.375997543334961} -11/07/2021 04:01:59 - INFO - __main__ - Step 48197: {'lr': 0.0003891307363768587, 'samples': 9253824, 'steps': 48196, 'loss/train': 0.729505717754364} -11/07/2021 04:01:59 - INFO - __main__ - Step 48198: {'lr': 0.00038912632733122045, 'samples': 9254016, 'steps': 48197, 'loss/train': 1.4610792398452759} -11/07/2021 04:01:59 - INFO - __main__ - Step 48199: {'lr': 0.000389121918222894, 'samples': 9254208, 'steps': 48198, 'loss/train': 1.446216344833374} -11/07/2021 04:02:00 - INFO - __main__ - Step 48200: {'lr': 0.0003891175090518814, 'samples': 9254400, 'steps': 48199, 'loss/train': 1.6533331871032715} -11/07/2021 04:02:00 - INFO - __main__ - Step 48201: {'lr': 0.00038911309981818466, 'samples': 9254592, 'steps': 48200, 'loss/train': 1.6140072345733643} -11/07/2021 04:02:01 - INFO - __main__ - Step 48202: {'lr': 0.00038910869052180563, 'samples': 9254784, 'steps': 48201, 'loss/train': 1.157281756401062} -11/07/2021 04:02:02 - INFO - __main__ - Step 48203: {'lr': 0.00038910428116274644, 'samples': 9254976, 'steps': 48202, 'loss/train': 1.405438780784607} -11/07/2021 04:02:02 - INFO - __main__ - Step 48204: {'lr': 0.0003890998717410089, 'samples': 9255168, 'steps': 48203, 'loss/train': 1.6671035289764404} -11/07/2021 04:02:02 - INFO - __main__ - Step 48205: {'lr': 0.0003890954622565952, 'samples': 9255360, 'steps': 48204, 'loss/train': 1.69551682472229} -11/07/2021 04:02:03 - INFO - __main__ - Step 48206: {'lr': 0.00038909105270950716, 'samples': 9255552, 'steps': 48205, 'loss/train': 1.541272521018982} -11/07/2021 04:02:03 - INFO - __main__ - Step 48207: {'lr': 0.0003890866430997468, 'samples': 9255744, 'steps': 48206, 'loss/train': 1.7470780611038208} -11/07/2021 04:02:04 - INFO - __main__ - Step 48208: {'lr': 0.0003890822334273163, 'samples': 9255936, 'steps': 48207, 'loss/train': 1.031080722808838} -11/07/2021 04:02:04 - INFO - __main__ - Step 48209: {'lr': 0.0003890778236922174, 'samples': 9256128, 'steps': 48208, 'loss/train': 1.8261090517044067} -11/07/2021 04:02:05 - INFO - __main__ - Step 48210: {'lr': 0.00038907341389445217, 'samples': 9256320, 'steps': 48209, 'loss/train': 1.4540414810180664} -11/07/2021 04:02:05 - INFO - __main__ - Step 48211: {'lr': 0.0003890690040340226, 'samples': 9256512, 'steps': 48210, 'loss/train': 0.7340781688690186} -11/07/2021 04:02:05 - INFO - __main__ - Step 48212: {'lr': 0.00038906459411093075, 'samples': 9256704, 'steps': 48211, 'loss/train': 0.9523065686225891} -11/07/2021 04:02:07 - INFO - __main__ - Step 48213: {'lr': 0.0003890601841251785, 'samples': 9256896, 'steps': 48212, 'loss/train': 1.6918346881866455} -11/07/2021 04:02:07 - INFO - __main__ - Step 48214: {'lr': 0.0003890557740767678, 'samples': 9257088, 'steps': 48213, 'loss/train': 1.09598708152771} -11/07/2021 04:02:07 - INFO - __main__ - Step 48215: {'lr': 0.00038905136396570085, 'samples': 9257280, 'steps': 48214, 'loss/train': 1.8478615283966064} -11/07/2021 04:02:08 - INFO - __main__ - Step 48216: {'lr': 0.0003890469537919794, 'samples': 9257472, 'steps': 48215, 'loss/train': 0.5915213227272034} -11/07/2021 04:02:08 - INFO - __main__ - Step 48217: {'lr': 0.0003890425435556055, 'samples': 9257664, 'steps': 48216, 'loss/train': 2.091214418411255} -11/07/2021 04:02:09 - INFO - __main__ - Step 48218: {'lr': 0.0003890381332565813, 'samples': 9257856, 'steps': 48217, 'loss/train': 1.7031760215759277} -11/07/2021 04:02:09 - INFO - __main__ - Step 48219: {'lr': 0.00038903372289490865, 'samples': 9258048, 'steps': 48218, 'loss/train': 1.9759994745254517} -11/07/2021 04:02:10 - INFO - __main__ - Step 48220: {'lr': 0.0003890293124705895, 'samples': 9258240, 'steps': 48219, 'loss/train': 1.4671889543533325} -11/07/2021 04:02:10 - INFO - __main__ - Step 48221: {'lr': 0.0003890249019836259, 'samples': 9258432, 'steps': 48220, 'loss/train': 1.2330702543258667} -11/07/2021 04:02:10 - INFO - __main__ - Step 48222: {'lr': 0.0003890204914340198, 'samples': 9258624, 'steps': 48221, 'loss/train': 1.453384280204773} -11/07/2021 04:02:12 - INFO - __main__ - Step 48223: {'lr': 0.00038901608082177327, 'samples': 9258816, 'steps': 48222, 'loss/train': 1.6290801763534546} -11/07/2021 04:02:12 - INFO - __main__ - Step 48224: {'lr': 0.0003890116701468882, 'samples': 9259008, 'steps': 48223, 'loss/train': 1.69619882106781} -11/07/2021 04:02:12 - INFO - __main__ - Step 48225: {'lr': 0.0003890072594093666, 'samples': 9259200, 'steps': 48224, 'loss/train': 1.2480615377426147} -11/07/2021 04:02:13 - INFO - __main__ - Step 48226: {'lr': 0.00038900284860921046, 'samples': 9259392, 'steps': 48225, 'loss/train': 0.24857133626937866} -11/07/2021 04:02:13 - INFO - __main__ - Step 48227: {'lr': 0.00038899843774642184, 'samples': 9259584, 'steps': 48226, 'loss/train': 1.8875969648361206} -11/07/2021 04:02:13 - INFO - __main__ - Step 48228: {'lr': 0.00038899402682100265, 'samples': 9259776, 'steps': 48227, 'loss/train': 1.4447287321090698} -11/07/2021 04:02:14 - INFO - __main__ - Step 48229: {'lr': 0.0003889896158329549, 'samples': 9259968, 'steps': 48228, 'loss/train': 1.9886767864227295} -11/07/2021 04:02:15 - INFO - __main__ - Step 48230: {'lr': 0.00038898520478228055, 'samples': 9260160, 'steps': 48229, 'loss/train': 1.613850474357605} -11/07/2021 04:02:15 - INFO - __main__ - Step 48231: {'lr': 0.00038898079366898164, 'samples': 9260352, 'steps': 48230, 'loss/train': 1.478806495666504} -11/07/2021 04:02:15 - INFO - __main__ - Step 48232: {'lr': 0.0003889763824930601, 'samples': 9260544, 'steps': 48231, 'loss/train': 1.3042471408843994} -11/07/2021 04:02:16 - INFO - __main__ - Step 48233: {'lr': 0.00038897197125451795, 'samples': 9260736, 'steps': 48232, 'loss/train': 1.3413423299789429} -11/07/2021 04:02:17 - INFO - __main__ - Step 48234: {'lr': 0.0003889675599533572, 'samples': 9260928, 'steps': 48233, 'loss/train': 1.5150249004364014} -11/07/2021 04:02:17 - INFO - __main__ - Step 48235: {'lr': 0.0003889631485895798, 'samples': 9261120, 'steps': 48234, 'loss/train': 1.4947305917739868} -11/07/2021 04:02:17 - INFO - __main__ - Step 48236: {'lr': 0.00038895873716318776, 'samples': 9261312, 'steps': 48235, 'loss/train': 1.218025803565979} -11/07/2021 04:02:18 - INFO - __main__ - Step 48237: {'lr': 0.000388954325674183, 'samples': 9261504, 'steps': 48236, 'loss/train': 1.2372782230377197} -11/07/2021 04:02:18 - INFO - __main__ - Step 48238: {'lr': 0.00038894991412256766, 'samples': 9261696, 'steps': 48237, 'loss/train': 1.2564854621887207} -11/07/2021 04:02:19 - INFO - __main__ - Step 48239: {'lr': 0.00038894550250834355, 'samples': 9261888, 'steps': 48238, 'loss/train': 1.5338630676269531} -11/07/2021 04:02:20 - INFO - __main__ - Step 48240: {'lr': 0.00038894109083151274, 'samples': 9262080, 'steps': 48239, 'loss/train': 1.4853929281234741} -11/07/2021 04:02:20 - INFO - __main__ - Step 48241: {'lr': 0.0003889366790920773, 'samples': 9262272, 'steps': 48240, 'loss/train': 1.1592860221862793} -11/07/2021 04:02:20 - INFO - __main__ - Step 48242: {'lr': 0.00038893226729003904, 'samples': 9262464, 'steps': 48241, 'loss/train': 2.0898427963256836} -11/07/2021 04:02:21 - INFO - __main__ - Step 48243: {'lr': 0.0003889278554254001, 'samples': 9262656, 'steps': 48242, 'loss/train': 1.4382511377334595} -11/07/2021 04:02:22 - INFO - __main__ - Step 48244: {'lr': 0.00038892344349816246, 'samples': 9262848, 'steps': 48243, 'loss/train': 1.4409617185592651} -11/07/2021 04:02:22 - INFO - __main__ - Step 48245: {'lr': 0.00038891903150832795, 'samples': 9263040, 'steps': 48244, 'loss/train': 1.440793752670288} -11/07/2021 04:02:22 - INFO - __main__ - Step 48246: {'lr': 0.00038891461945589866, 'samples': 9263232, 'steps': 48245, 'loss/train': 1.4871621131896973} -11/07/2021 04:02:23 - INFO - __main__ - Step 48247: {'lr': 0.0003889102073408767, 'samples': 9263424, 'steps': 48246, 'loss/train': 2.115586996078491} -11/07/2021 04:02:23 - INFO - __main__ - Step 48248: {'lr': 0.0003889057951632639, 'samples': 9263616, 'steps': 48247, 'loss/train': 1.8211729526519775} -11/07/2021 04:02:23 - INFO - __main__ - Step 48249: {'lr': 0.0003889013829230623, 'samples': 9263808, 'steps': 48248, 'loss/train': 1.6548411846160889} -11/07/2021 04:02:24 - INFO - __main__ - Step 48250: {'lr': 0.00038889697062027384, 'samples': 9264000, 'steps': 48249, 'loss/train': 1.5534456968307495} -11/07/2021 04:02:25 - INFO - __main__ - Step 48251: {'lr': 0.00038889255825490053, 'samples': 9264192, 'steps': 48250, 'loss/train': 1.0798821449279785} -11/07/2021 04:02:25 - INFO - __main__ - Step 48252: {'lr': 0.0003888881458269444, 'samples': 9264384, 'steps': 48251, 'loss/train': 0.9305204153060913} -11/07/2021 04:02:26 - INFO - __main__ - Step 48253: {'lr': 0.00038888373333640746, 'samples': 9264576, 'steps': 48252, 'loss/train': 1.3799680471420288} -11/07/2021 04:02:26 - INFO - __main__ - Step 48254: {'lr': 0.00038887932078329165, 'samples': 9264768, 'steps': 48253, 'loss/train': 1.4742240905761719} -11/07/2021 04:02:27 - INFO - __main__ - Step 48255: {'lr': 0.00038887490816759895, 'samples': 9264960, 'steps': 48254, 'loss/train': 1.489135980606079} -11/07/2021 04:02:27 - INFO - __main__ - Step 48256: {'lr': 0.00038887049548933135, 'samples': 9265152, 'steps': 48255, 'loss/train': 1.4327009916305542} -11/07/2021 04:02:28 - INFO - __main__ - Step 48257: {'lr': 0.0003888660827484908, 'samples': 9265344, 'steps': 48256, 'loss/train': 1.4369255304336548} -11/07/2021 04:02:28 - INFO - __main__ - Step 48258: {'lr': 0.00038886166994507945, 'samples': 9265536, 'steps': 48257, 'loss/train': 1.502833604812622} -11/07/2021 04:02:28 - INFO - __main__ - Step 48259: {'lr': 0.00038885725707909905, 'samples': 9265728, 'steps': 48258, 'loss/train': 0.3147200047969818} -11/07/2021 04:02:29 - INFO - __main__ - Step 48260: {'lr': 0.0003888528441505518, 'samples': 9265920, 'steps': 48259, 'loss/train': 1.8659920692443848} -11/07/2021 04:02:30 - INFO - __main__ - Step 48261: {'lr': 0.00038884843115943955, 'samples': 9266112, 'steps': 48260, 'loss/train': 0.5704777836799622} -11/07/2021 04:02:30 - INFO - __main__ - Step 48262: {'lr': 0.00038884401810576434, 'samples': 9266304, 'steps': 48261, 'loss/train': 1.202111005783081} -11/07/2021 04:02:30 - INFO - __main__ - Step 48263: {'lr': 0.0003888396049895282, 'samples': 9266496, 'steps': 48262, 'loss/train': 1.4878652095794678} -11/07/2021 04:02:31 - INFO - __main__ - Step 48264: {'lr': 0.000388835191810733, 'samples': 9266688, 'steps': 48263, 'loss/train': 1.6896651983261108} -11/07/2021 04:02:32 - INFO - __main__ - Step 48265: {'lr': 0.0003888307785693809, 'samples': 9266880, 'steps': 48264, 'loss/train': 1.4856317043304443} -11/07/2021 04:02:32 - INFO - __main__ - Step 48266: {'lr': 0.0003888263652654738, 'samples': 9267072, 'steps': 48265, 'loss/train': 1.5039575099945068} -11/07/2021 04:02:33 - INFO - __main__ - Step 48267: {'lr': 0.0003888219518990136, 'samples': 9267264, 'steps': 48266, 'loss/train': 1.9758280515670776} -11/07/2021 04:02:33 - INFO - __main__ - Step 48268: {'lr': 0.0003888175384700024, 'samples': 9267456, 'steps': 48267, 'loss/train': 1.226232647895813} -11/07/2021 04:02:33 - INFO - __main__ - Step 48269: {'lr': 0.0003888131249784421, 'samples': 9267648, 'steps': 48268, 'loss/train': 1.7522835731506348} -11/07/2021 04:02:34 - INFO - __main__ - Step 48270: {'lr': 0.00038880871142433484, 'samples': 9267840, 'steps': 48269, 'loss/train': 0.9955446124076843} -11/07/2021 04:02:35 - INFO - __main__ - Step 48271: {'lr': 0.0003888042978076825, 'samples': 9268032, 'steps': 48270, 'loss/train': 1.7882648706436157} -11/07/2021 04:02:35 - INFO - __main__ - Step 48272: {'lr': 0.00038879988412848706, 'samples': 9268224, 'steps': 48271, 'loss/train': 1.4117809534072876} -11/07/2021 04:02:35 - INFO - __main__ - Step 48273: {'lr': 0.00038879547038675054, 'samples': 9268416, 'steps': 48272, 'loss/train': 1.4808791875839233} -11/07/2021 04:02:36 - INFO - __main__ - Step 48274: {'lr': 0.0003887910565824749, 'samples': 9268608, 'steps': 48273, 'loss/train': 0.9658954739570618} -11/07/2021 04:02:36 - INFO - __main__ - Step 48275: {'lr': 0.0003887866427156622, 'samples': 9268800, 'steps': 48274, 'loss/train': 1.368213415145874} -11/07/2021 04:02:37 - INFO - __main__ - Step 48276: {'lr': 0.00038878222878631444, 'samples': 9268992, 'steps': 48275, 'loss/train': 1.7484121322631836} -11/07/2021 04:02:37 - INFO - __main__ - Step 48277: {'lr': 0.0003887778147944334, 'samples': 9269184, 'steps': 48276, 'loss/train': 1.3552138805389404} -11/07/2021 04:02:38 - INFO - __main__ - Step 48278: {'lr': 0.0003887734007400213, 'samples': 9269376, 'steps': 48277, 'loss/train': 1.819169044494629} -11/07/2021 04:02:38 - INFO - __main__ - Step 48279: {'lr': 0.00038876898662308, 'samples': 9269568, 'steps': 48278, 'loss/train': 1.8303667306900024} -11/07/2021 04:02:39 - INFO - __main__ - Step 48280: {'lr': 0.00038876457244361166, 'samples': 9269760, 'steps': 48279, 'loss/train': 1.3897451162338257} -11/07/2021 04:02:40 - INFO - __main__ - Step 48281: {'lr': 0.000388760158201618, 'samples': 9269952, 'steps': 48280, 'loss/train': 1.4322813749313354} -11/07/2021 04:02:40 - INFO - __main__ - Step 48282: {'lr': 0.0003887557438971012, 'samples': 9270144, 'steps': 48281, 'loss/train': 1.7044888734817505} -11/07/2021 04:02:40 - INFO - __main__ - Step 48283: {'lr': 0.0003887513295300632, 'samples': 9270336, 'steps': 48282, 'loss/train': 1.4639825820922852} -11/07/2021 04:02:41 - INFO - __main__ - Step 48284: {'lr': 0.00038874691510050604, 'samples': 9270528, 'steps': 48283, 'loss/train': 1.6526075601577759} -11/07/2021 04:02:41 - INFO - __main__ - Step 48285: {'lr': 0.00038874250060843163, 'samples': 9270720, 'steps': 48284, 'loss/train': 1.1600265502929688} -11/07/2021 04:02:42 - INFO - __main__ - Step 48286: {'lr': 0.00038873808605384197, 'samples': 9270912, 'steps': 48285, 'loss/train': 1.3651691675186157} -11/07/2021 04:02:42 - INFO - __main__ - Step 48287: {'lr': 0.0003887336714367391, 'samples': 9271104, 'steps': 48286, 'loss/train': 1.148716688156128} -11/07/2021 04:02:43 - INFO - __main__ - Step 48288: {'lr': 0.00038872925675712493, 'samples': 9271296, 'steps': 48287, 'loss/train': 1.4003381729125977} -11/07/2021 04:02:43 - INFO - __main__ - Step 48289: {'lr': 0.0003887248420150016, 'samples': 9271488, 'steps': 48288, 'loss/train': 1.4225640296936035} -11/07/2021 04:02:43 - INFO - __main__ - Step 48290: {'lr': 0.00038872042721037087, 'samples': 9271680, 'steps': 48289, 'loss/train': 1.2903283834457397} -11/07/2021 04:02:45 - INFO - __main__ - Step 48291: {'lr': 0.00038871601234323494, 'samples': 9271872, 'steps': 48290, 'loss/train': 0.3443036377429962} -11/07/2021 04:02:45 - INFO - __main__ - Step 48292: {'lr': 0.00038871159741359567, 'samples': 9272064, 'steps': 48291, 'loss/train': 1.823111891746521} -11/07/2021 04:02:45 - INFO - __main__ - Step 48293: {'lr': 0.0003887071824214551, 'samples': 9272256, 'steps': 48292, 'loss/train': 1.5963959693908691} -11/07/2021 04:02:46 - INFO - __main__ - Step 48294: {'lr': 0.0003887027673668152, 'samples': 9272448, 'steps': 48293, 'loss/train': 1.734969139099121} -11/07/2021 04:02:46 - INFO - __main__ - Step 48295: {'lr': 0.0003886983522496781, 'samples': 9272640, 'steps': 48294, 'loss/train': 1.4370068311691284} -11/07/2021 04:02:47 - INFO - __main__ - Step 48296: {'lr': 0.00038869393707004554, 'samples': 9272832, 'steps': 48295, 'loss/train': 1.698050618171692} -11/07/2021 04:02:47 - INFO - __main__ - Step 48297: {'lr': 0.00038868952182791964, 'samples': 9273024, 'steps': 48296, 'loss/train': 1.2806745767593384} -11/07/2021 04:02:48 - INFO - __main__ - Step 48298: {'lr': 0.0003886851065233024, 'samples': 9273216, 'steps': 48297, 'loss/train': 1.7508585453033447} -11/07/2021 04:02:48 - INFO - __main__ - Step 48299: {'lr': 0.0003886806911561958, 'samples': 9273408, 'steps': 48298, 'loss/train': 1.9955202341079712} -11/07/2021 04:02:48 - INFO - __main__ - Step 48300: {'lr': 0.0003886762757266018, 'samples': 9273600, 'steps': 48299, 'loss/train': 1.306843876838684} -11/07/2021 04:02:50 - INFO - __main__ - Step 48301: {'lr': 0.0003886718602345224, 'samples': 9273792, 'steps': 48300, 'loss/train': 1.6101634502410889} -11/07/2021 04:02:50 - INFO - __main__ - Step 48302: {'lr': 0.0003886674446799596, 'samples': 9273984, 'steps': 48301, 'loss/train': 1.5550583600997925} -11/07/2021 04:02:50 - INFO - __main__ - Step 48303: {'lr': 0.00038866302906291546, 'samples': 9274176, 'steps': 48302, 'loss/train': 1.1555699110031128} -11/07/2021 04:02:51 - INFO - __main__ - Step 48304: {'lr': 0.0003886586133833918, 'samples': 9274368, 'steps': 48303, 'loss/train': 1.4424365758895874} -11/07/2021 04:02:51 - INFO - __main__ - Step 48305: {'lr': 0.00038865419764139077, 'samples': 9274560, 'steps': 48304, 'loss/train': 0.8644227385520935} -11/07/2021 04:02:51 - INFO - __main__ - Step 48306: {'lr': 0.00038864978183691425, 'samples': 9274752, 'steps': 48305, 'loss/train': 0.1560346931219101} -11/07/2021 04:02:52 - INFO - __main__ - Step 48307: {'lr': 0.00038864536596996437, 'samples': 9274944, 'steps': 48306, 'loss/train': 1.4520589113235474} -11/07/2021 04:02:53 - INFO - __main__ - Step 48308: {'lr': 0.0003886409500405429, 'samples': 9275136, 'steps': 48307, 'loss/train': 1.5580068826675415} -11/07/2021 04:02:53 - INFO - __main__ - Step 48309: {'lr': 0.00038863653404865207, 'samples': 9275328, 'steps': 48308, 'loss/train': 1.8992919921875} -11/07/2021 04:02:53 - INFO - __main__ - Step 48310: {'lr': 0.0003886321179942937, 'samples': 9275520, 'steps': 48309, 'loss/train': 1.8710448741912842} -11/07/2021 04:02:54 - INFO - __main__ - Step 48311: {'lr': 0.0003886277018774699, 'samples': 9275712, 'steps': 48310, 'loss/train': 1.650238037109375} -11/07/2021 04:02:55 - INFO - __main__ - Step 48312: {'lr': 0.0003886232856981825, 'samples': 9275904, 'steps': 48311, 'loss/train': 1.7266851663589478} -11/07/2021 04:02:55 - INFO - __main__ - Step 48313: {'lr': 0.00038861886945643363, 'samples': 9276096, 'steps': 48312, 'loss/train': 0.19809167087078094} -11/07/2021 04:02:55 - INFO - __main__ - Step 48314: {'lr': 0.00038861445315222523, 'samples': 9276288, 'steps': 48313, 'loss/train': 2.008556365966797} -11/07/2021 04:02:56 - INFO - __main__ - Step 48315: {'lr': 0.00038861003678555936, 'samples': 9276480, 'steps': 48314, 'loss/train': 1.3083784580230713} -11/07/2021 04:02:56 - INFO - __main__ - Step 48316: {'lr': 0.00038860562035643786, 'samples': 9276672, 'steps': 48315, 'loss/train': 1.8233020305633545} -11/07/2021 04:02:57 - INFO - __main__ - Step 48317: {'lr': 0.00038860120386486285, 'samples': 9276864, 'steps': 48316, 'loss/train': 1.6587094068527222} -11/07/2021 04:02:58 - INFO - __main__ - Step 48318: {'lr': 0.00038859678731083627, 'samples': 9277056, 'steps': 48317, 'loss/train': 1.7899813652038574} -11/07/2021 04:02:58 - INFO - __main__ - Step 48319: {'lr': 0.0003885923706943601, 'samples': 9277248, 'steps': 48318, 'loss/train': 1.2071336507797241} -11/07/2021 04:02:58 - INFO - __main__ - Step 48320: {'lr': 0.00038858795401543634, 'samples': 9277440, 'steps': 48319, 'loss/train': 1.0648425817489624} -11/07/2021 04:02:59 - INFO - __main__ - Step 48321: {'lr': 0.000388583537274067, 'samples': 9277632, 'steps': 48320, 'loss/train': 1.409128189086914} -11/07/2021 04:03:00 - INFO - __main__ - Step 48322: {'lr': 0.0003885791204702541, 'samples': 9277824, 'steps': 48321, 'loss/train': 1.2754244804382324} -11/07/2021 04:03:00 - INFO - __main__ - Step 48323: {'lr': 0.0003885747036039995, 'samples': 9278016, 'steps': 48322, 'loss/train': 1.552413821220398} -11/07/2021 04:03:00 - INFO - __main__ - Step 48324: {'lr': 0.0003885702866753054, 'samples': 9278208, 'steps': 48323, 'loss/train': 1.6152557134628296} -11/07/2021 04:03:01 - INFO - __main__ - Step 48325: {'lr': 0.00038856586968417353, 'samples': 9278400, 'steps': 48324, 'loss/train': 1.4518879652023315} -11/07/2021 04:03:01 - INFO - __main__ - Step 48326: {'lr': 0.00038856145263060606, 'samples': 9278592, 'steps': 48325, 'loss/train': 1.1021263599395752} -11/07/2021 04:03:02 - INFO - __main__ - Step 48327: {'lr': 0.00038855703551460497, 'samples': 9278784, 'steps': 48326, 'loss/train': 1.3933674097061157} -11/07/2021 04:03:02 - INFO - __main__ - Step 48328: {'lr': 0.00038855261833617216, 'samples': 9278976, 'steps': 48327, 'loss/train': 1.8830376863479614} -11/07/2021 04:03:03 - INFO - __main__ - Step 48329: {'lr': 0.00038854820109530974, 'samples': 9279168, 'steps': 48328, 'loss/train': 1.5740693807601929} -11/07/2021 04:03:03 - INFO - __main__ - Step 48330: {'lr': 0.00038854378379201966, 'samples': 9279360, 'steps': 48329, 'loss/train': 1.3352789878845215} -11/07/2021 04:03:04 - INFO - __main__ - Step 48331: {'lr': 0.0003885393664263038, 'samples': 9279552, 'steps': 48330, 'loss/train': 1.5021089315414429} -11/07/2021 04:03:05 - INFO - __main__ - Step 48332: {'lr': 0.00038853494899816434, 'samples': 9279744, 'steps': 48331, 'loss/train': 1.460158348083496} -11/07/2021 04:03:05 - INFO - __main__ - Step 48333: {'lr': 0.0003885305315076031, 'samples': 9279936, 'steps': 48332, 'loss/train': 1.4276036024093628} -11/07/2021 04:03:05 - INFO - __main__ - Step 48334: {'lr': 0.0003885261139546221, 'samples': 9280128, 'steps': 48333, 'loss/train': 1.0807746648788452} -11/07/2021 04:03:06 - INFO - __main__ - Step 48335: {'lr': 0.00038852169633922344, 'samples': 9280320, 'steps': 48334, 'loss/train': 1.3793299198150635} -11/07/2021 04:03:06 - INFO - __main__ - Step 48336: {'lr': 0.00038851727866140906, 'samples': 9280512, 'steps': 48335, 'loss/train': 1.3977899551391602} -11/07/2021 04:03:08 - INFO - __main__ - Step 48337: {'lr': 0.00038851286092118095, 'samples': 9280704, 'steps': 48336, 'loss/train': 1.2920801639556885} -11/07/2021 04:03:08 - INFO - __main__ - Step 48338: {'lr': 0.0003885084431185411, 'samples': 9280896, 'steps': 48337, 'loss/train': 1.3549143075942993} -11/07/2021 04:03:08 - INFO - __main__ - Step 48339: {'lr': 0.0003885040252534913, 'samples': 9281088, 'steps': 48338, 'loss/train': 2.4132800102233887} -11/07/2021 04:03:09 - INFO - __main__ - Step 48340: {'lr': 0.00038849960732603386, 'samples': 9281280, 'steps': 48339, 'loss/train': 2.2466821670532227} -11/07/2021 04:03:09 - INFO - __main__ - Step 48341: {'lr': 0.00038849518933617064, 'samples': 9281472, 'steps': 48340, 'loss/train': 1.1273099184036255} -11/07/2021 04:03:09 - INFO - __main__ - Step 48342: {'lr': 0.0003884907712839036, 'samples': 9281664, 'steps': 48341, 'loss/train': 1.5950285196304321} -11/07/2021 04:03:10 - INFO - __main__ - Step 48343: {'lr': 0.00038848635316923475, 'samples': 9281856, 'steps': 48342, 'loss/train': 1.6004289388656616} -11/07/2021 04:03:11 - INFO - __main__ - Step 48344: {'lr': 0.0003884819349921661, 'samples': 9282048, 'steps': 48343, 'loss/train': 1.8100656270980835} -11/07/2021 04:03:11 - INFO - __main__ - Step 48345: {'lr': 0.0003884775167526996, 'samples': 9282240, 'steps': 48344, 'loss/train': 1.493229627609253} -11/07/2021 04:03:11 - INFO - __main__ - Step 48346: {'lr': 0.0003884730984508373, 'samples': 9282432, 'steps': 48345, 'loss/train': 1.6365907192230225} -11/07/2021 04:03:12 - INFO - __main__ - Step 48347: {'lr': 0.0003884686800865812, 'samples': 9282624, 'steps': 48346, 'loss/train': 1.643216609954834} -11/07/2021 04:03:13 - INFO - __main__ - Step 48348: {'lr': 0.0003884642616599331, 'samples': 9282816, 'steps': 48347, 'loss/train': 1.2912529706954956} -11/07/2021 04:03:13 - INFO - __main__ - Step 48349: {'lr': 0.00038845984317089526, 'samples': 9283008, 'steps': 48348, 'loss/train': 1.9691541194915771} -11/07/2021 04:03:14 - INFO - __main__ - Step 48350: {'lr': 0.00038845542461946953, 'samples': 9283200, 'steps': 48349, 'loss/train': 1.8574779033660889} -11/07/2021 04:03:14 - INFO - __main__ - Step 48351: {'lr': 0.00038845100600565794, 'samples': 9283392, 'steps': 48350, 'loss/train': 1.6028879880905151} -11/07/2021 04:03:14 - INFO - __main__ - Step 48352: {'lr': 0.00038844658732946244, 'samples': 9283584, 'steps': 48351, 'loss/train': 1.471935510635376} -11/07/2021 04:03:15 - INFO - __main__ - Step 48353: {'lr': 0.000388442168590885, 'samples': 9283776, 'steps': 48352, 'loss/train': 1.7875932455062866} -11/07/2021 04:03:16 - INFO - __main__ - Step 48354: {'lr': 0.00038843774978992773, 'samples': 9283968, 'steps': 48353, 'loss/train': 1.2040324211120605} -11/07/2021 04:03:16 - INFO - __main__ - Step 48355: {'lr': 0.0003884333309265925, 'samples': 9284160, 'steps': 48354, 'loss/train': 2.1289470195770264} -11/07/2021 04:03:16 - INFO - __main__ - Step 48356: {'lr': 0.00038842891200088135, 'samples': 9284352, 'steps': 48355, 'loss/train': 1.300454020500183} -11/07/2021 04:03:17 - INFO - __main__ - Step 48357: {'lr': 0.0003884244930127963, 'samples': 9284544, 'steps': 48356, 'loss/train': 1.789948582649231} -11/07/2021 04:03:17 - INFO - __main__ - Step 48358: {'lr': 0.0003884200739623393, 'samples': 9284736, 'steps': 48357, 'loss/train': 1.8772468566894531} -11/07/2021 04:03:18 - INFO - __main__ - Step 48359: {'lr': 0.00038841565484951237, 'samples': 9284928, 'steps': 48358, 'loss/train': 1.9208248853683472} -11/07/2021 04:03:19 - INFO - __main__ - Step 48360: {'lr': 0.0003884112356743175, 'samples': 9285120, 'steps': 48359, 'loss/train': 1.1249557733535767} -11/07/2021 04:03:19 - INFO - __main__ - Step 48361: {'lr': 0.0003884068164367566, 'samples': 9285312, 'steps': 48360, 'loss/train': 1.8961440324783325} -11/07/2021 04:03:19 - INFO - __main__ - Step 48362: {'lr': 0.00038840239713683165, 'samples': 9285504, 'steps': 48361, 'loss/train': 1.3289682865142822} -11/07/2021 04:03:20 - INFO - __main__ - Step 48363: {'lr': 0.0003883979777745449, 'samples': 9285696, 'steps': 48362, 'loss/train': 1.716339111328125} -11/07/2021 04:03:20 - INFO - __main__ - Step 48364: {'lr': 0.00038839355834989806, 'samples': 9285888, 'steps': 48363, 'loss/train': 1.509454369544983} -11/07/2021 04:03:21 - INFO - __main__ - Step 48365: {'lr': 0.0003883891388628932, 'samples': 9286080, 'steps': 48364, 'loss/train': 1.4280014038085938} -11/07/2021 04:03:21 - INFO - __main__ - Step 48366: {'lr': 0.0003883847193135323, 'samples': 9286272, 'steps': 48365, 'loss/train': 1.377169132232666} -11/07/2021 04:03:22 - INFO - __main__ - Step 48367: {'lr': 0.0003883802997018174, 'samples': 9286464, 'steps': 48366, 'loss/train': 0.9458029270172119} -11/07/2021 04:03:22 - INFO - __main__ - Step 48368: {'lr': 0.00038837588002775054, 'samples': 9286656, 'steps': 48367, 'loss/train': 1.3015624284744263} -11/07/2021 04:03:22 - INFO - __main__ - Step 48369: {'lr': 0.0003883714602913336, 'samples': 9286848, 'steps': 48368, 'loss/train': 1.306085467338562} -11/07/2021 04:03:23 - INFO - __main__ - Step 48370: {'lr': 0.00038836704049256864, 'samples': 9287040, 'steps': 48369, 'loss/train': 1.64092218875885} -11/07/2021 04:03:24 - INFO - __main__ - Step 48371: {'lr': 0.0003883626206314577, 'samples': 9287232, 'steps': 48370, 'loss/train': 1.1958248615264893} -11/07/2021 04:03:24 - INFO - __main__ - Step 48372: {'lr': 0.0003883582007080025, 'samples': 9287424, 'steps': 48371, 'loss/train': 1.6516435146331787} -11/07/2021 04:03:25 - INFO - __main__ - Step 48373: {'lr': 0.0003883537807222054, 'samples': 9287616, 'steps': 48372, 'loss/train': 5.795014381408691} -11/07/2021 04:03:25 - INFO - __main__ - Step 48374: {'lr': 0.0003883493606740681, 'samples': 9287808, 'steps': 48373, 'loss/train': 1.2726349830627441} -11/07/2021 04:03:26 - INFO - __main__ - Step 48375: {'lr': 0.0003883449405635928, 'samples': 9288000, 'steps': 48374, 'loss/train': 1.3027281761169434} -11/07/2021 04:03:26 - INFO - __main__ - Step 48376: {'lr': 0.0003883405203907814, 'samples': 9288192, 'steps': 48375, 'loss/train': 1.632309079170227} -11/07/2021 04:03:27 - INFO - __main__ - Step 48377: {'lr': 0.0003883361001556359, 'samples': 9288384, 'steps': 48376, 'loss/train': 1.4304492473602295} -11/07/2021 04:03:27 - INFO - __main__ - Step 48378: {'lr': 0.0003883316798581582, 'samples': 9288576, 'steps': 48377, 'loss/train': 1.9488767385482788} -11/07/2021 04:03:27 - INFO - __main__ - Step 48379: {'lr': 0.0003883272594983505, 'samples': 9288768, 'steps': 48378, 'loss/train': 1.4861701726913452} -11/07/2021 04:03:28 - INFO - __main__ - Step 48380: {'lr': 0.00038832283907621457, 'samples': 9288960, 'steps': 48379, 'loss/train': 1.530775547027588} -11/07/2021 04:03:29 - INFO - __main__ - Step 48381: {'lr': 0.00038831841859175253, 'samples': 9289152, 'steps': 48380, 'loss/train': 1.578474998474121} -11/07/2021 04:03:29 - INFO - __main__ - Step 48382: {'lr': 0.0003883139980449664, 'samples': 9289344, 'steps': 48381, 'loss/train': 1.6181931495666504} -11/07/2021 04:03:29 - INFO - __main__ - Step 48383: {'lr': 0.00038830957743585807, 'samples': 9289536, 'steps': 48382, 'loss/train': 1.1623398065567017} -11/07/2021 04:03:30 - INFO - __main__ - Step 48384: {'lr': 0.0003883051567644296, 'samples': 9289728, 'steps': 48383, 'loss/train': 1.6592649221420288} -11/07/2021 04:03:31 - INFO - __main__ - Step 48385: {'lr': 0.00038830073603068297, 'samples': 9289920, 'steps': 48384, 'loss/train': 1.9188312292099} -11/07/2021 04:03:31 - INFO - __main__ - Step 48386: {'lr': 0.00038829631523462003, 'samples': 9290112, 'steps': 48385, 'loss/train': 1.1328415870666504} -11/07/2021 04:03:32 - INFO - __main__ - Step 48387: {'lr': 0.000388291894376243, 'samples': 9290304, 'steps': 48386, 'loss/train': 0.8931834101676941} -11/07/2021 04:03:32 - INFO - __main__ - Step 48388: {'lr': 0.0003882874734555538, 'samples': 9290496, 'steps': 48387, 'loss/train': 0.7181499600410461} -11/07/2021 04:03:32 - INFO - __main__ - Step 48389: {'lr': 0.00038828305247255447, 'samples': 9290688, 'steps': 48388, 'loss/train': 1.7743628025054932} -11/07/2021 04:03:33 - INFO - __main__ - Step 48390: {'lr': 0.00038827863142724685, 'samples': 9290880, 'steps': 48389, 'loss/train': 1.139664888381958} -11/07/2021 04:03:34 - INFO - __main__ - Step 48391: {'lr': 0.00038827421031963294, 'samples': 9291072, 'steps': 48390, 'loss/train': 1.466491937637329} -11/07/2021 04:03:34 - INFO - __main__ - Step 48392: {'lr': 0.0003882697891497149, 'samples': 9291264, 'steps': 48391, 'loss/train': 0.5570085048675537} -11/07/2021 04:03:35 - INFO - __main__ - Step 48393: {'lr': 0.00038826536791749454, 'samples': 9291456, 'steps': 48392, 'loss/train': 1.432281494140625} -11/07/2021 04:03:35 - INFO - __main__ - Step 48394: {'lr': 0.00038826094662297404, 'samples': 9291648, 'steps': 48393, 'loss/train': 1.030002474784851} -11/07/2021 04:03:35 - INFO - __main__ - Step 48395: {'lr': 0.0003882565252661553, 'samples': 9291840, 'steps': 48394, 'loss/train': 1.17636239528656} -11/07/2021 04:03:36 - INFO - __main__ - Step 48396: {'lr': 0.00038825210384704024, 'samples': 9292032, 'steps': 48395, 'loss/train': 1.313944935798645} -11/07/2021 04:03:37 - INFO - __main__ - Step 48397: {'lr': 0.0003882476823656309, 'samples': 9292224, 'steps': 48396, 'loss/train': 1.5488330125808716} -11/07/2021 04:03:37 - INFO - __main__ - Step 48398: {'lr': 0.00038824326082192935, 'samples': 9292416, 'steps': 48397, 'loss/train': 1.6451550722122192} -11/07/2021 04:03:37 - INFO - __main__ - Step 48399: {'lr': 0.0003882388392159375, 'samples': 9292608, 'steps': 48398, 'loss/train': 1.3582696914672852} -11/07/2021 04:03:38 - INFO - __main__ - Step 48400: {'lr': 0.0003882344175476573, 'samples': 9292800, 'steps': 48399, 'loss/train': 1.2250689268112183} -11/07/2021 04:03:39 - INFO - __main__ - Step 48401: {'lr': 0.00038822999581709087, 'samples': 9292992, 'steps': 48400, 'loss/train': 1.4877376556396484} -11/07/2021 04:03:39 - INFO - __main__ - Step 48402: {'lr': 0.0003882255740242401, 'samples': 9293184, 'steps': 48401, 'loss/train': 1.5930143594741821} -11/07/2021 04:03:39 - INFO - __main__ - Step 48403: {'lr': 0.0003882211521691071, 'samples': 9293376, 'steps': 48402, 'loss/train': 1.1649909019470215} -11/07/2021 04:03:40 - INFO - __main__ - Step 48404: {'lr': 0.0003882167302516937, 'samples': 9293568, 'steps': 48403, 'loss/train': 1.1903587579727173} -11/07/2021 04:03:40 - INFO - __main__ - Step 48405: {'lr': 0.000388212308272002, 'samples': 9293760, 'steps': 48404, 'loss/train': 1.2432438135147095} -11/07/2021 04:03:41 - INFO - __main__ - Step 48406: {'lr': 0.00038820788623003397, 'samples': 9293952, 'steps': 48405, 'loss/train': 1.5587519407272339} -11/07/2021 04:03:41 - INFO - __main__ - Step 48407: {'lr': 0.00038820346412579156, 'samples': 9294144, 'steps': 48406, 'loss/train': 1.460087776184082} -11/07/2021 04:03:42 - INFO - __main__ - Step 48408: {'lr': 0.0003881990419592768, 'samples': 9294336, 'steps': 48407, 'loss/train': 1.2280032634735107} -11/07/2021 04:03:42 - INFO - __main__ - Step 48409: {'lr': 0.00038819461973049177, 'samples': 9294528, 'steps': 48408, 'loss/train': 1.981165885925293} -11/07/2021 04:03:43 - INFO - __main__ - Step 48410: {'lr': 0.00038819019743943834, 'samples': 9294720, 'steps': 48409, 'loss/train': 1.597578763961792} -11/07/2021 04:03:44 - INFO - __main__ - Step 48411: {'lr': 0.00038818577508611854, 'samples': 9294912, 'steps': 48410, 'loss/train': 1.4958175420761108} -11/07/2021 04:03:44 - INFO - __main__ - Step 48412: {'lr': 0.00038818135267053435, 'samples': 9295104, 'steps': 48411, 'loss/train': 1.221787691116333} -11/07/2021 04:03:44 - INFO - __main__ - Step 48413: {'lr': 0.00038817693019268775, 'samples': 9295296, 'steps': 48412, 'loss/train': 1.3178467750549316} -11/07/2021 04:03:45 - INFO - __main__ - Step 48414: {'lr': 0.0003881725076525808, 'samples': 9295488, 'steps': 48413, 'loss/train': 1.1740386486053467} -11/07/2021 04:03:45 - INFO - __main__ - Step 48415: {'lr': 0.0003881680850502154, 'samples': 9295680, 'steps': 48414, 'loss/train': 1.349912405014038} -11/07/2021 04:03:46 - INFO - __main__ - Step 48416: {'lr': 0.00038816366238559366, 'samples': 9295872, 'steps': 48415, 'loss/train': 1.637817621231079} -11/07/2021 04:03:47 - INFO - __main__ - Step 48417: {'lr': 0.00038815923965871747, 'samples': 9296064, 'steps': 48416, 'loss/train': 1.4408929347991943} -11/07/2021 04:03:47 - INFO - __main__ - Step 48418: {'lr': 0.00038815481686958883, 'samples': 9296256, 'steps': 48417, 'loss/train': 1.164324164390564} -11/07/2021 04:03:47 - INFO - __main__ - Step 48419: {'lr': 0.0003881503940182098, 'samples': 9296448, 'steps': 48418, 'loss/train': 1.32057785987854} -11/07/2021 04:03:48 - INFO - __main__ - Step 48420: {'lr': 0.0003881459711045823, 'samples': 9296640, 'steps': 48419, 'loss/train': 1.1111409664154053} -11/07/2021 04:03:48 - INFO - __main__ - Step 48421: {'lr': 0.0003881415481287084, 'samples': 9296832, 'steps': 48420, 'loss/train': 1.074395775794983} -11/07/2021 04:03:49 - INFO - __main__ - Step 48422: {'lr': 0.00038813712509058995, 'samples': 9297024, 'steps': 48421, 'loss/train': 1.415626883506775} -11/07/2021 04:03:49 - INFO - __main__ - Step 48423: {'lr': 0.0003881327019902292, 'samples': 9297216, 'steps': 48422, 'loss/train': 1.8866455554962158} -11/07/2021 04:03:50 - INFO - __main__ - Step 48424: {'lr': 0.00038812827882762793, 'samples': 9297408, 'steps': 48423, 'loss/train': 1.7330360412597656} -11/07/2021 04:03:50 - INFO - __main__ - Step 48425: {'lr': 0.00038812385560278815, 'samples': 9297600, 'steps': 48424, 'loss/train': 1.602062702178955} -11/07/2021 04:03:50 - INFO - __main__ - Step 48426: {'lr': 0.0003881194323157119, 'samples': 9297792, 'steps': 48425, 'loss/train': 1.510677695274353} -11/07/2021 04:03:51 - INFO - __main__ - Step 48427: {'lr': 0.00038811500896640116, 'samples': 9297984, 'steps': 48426, 'loss/train': 1.292872428894043} -11/07/2021 04:03:52 - INFO - __main__ - Step 48428: {'lr': 0.0003881105855548579, 'samples': 9298176, 'steps': 48427, 'loss/train': 1.6281934976577759} -11/07/2021 04:03:52 - INFO - __main__ - Step 48429: {'lr': 0.00038810616208108416, 'samples': 9298368, 'steps': 48428, 'loss/train': 1.389033555984497} -11/07/2021 04:03:52 - INFO - __main__ - Step 48430: {'lr': 0.00038810173854508204, 'samples': 9298560, 'steps': 48429, 'loss/train': 1.1105941534042358} -11/07/2021 04:03:53 - INFO - __main__ - Step 48431: {'lr': 0.0003880973149468533, 'samples': 9298752, 'steps': 48430, 'loss/train': 1.383050799369812} -11/07/2021 04:03:54 - INFO - __main__ - Step 48432: {'lr': 0.00038809289128640003, 'samples': 9298944, 'steps': 48431, 'loss/train': 1.530485987663269} -11/07/2021 04:03:54 - INFO - __main__ - Step 48433: {'lr': 0.00038808846756372426, 'samples': 9299136, 'steps': 48432, 'loss/train': 1.4259238243103027} -11/07/2021 04:03:54 - INFO - __main__ - Step 48434: {'lr': 0.0003880840437788279, 'samples': 9299328, 'steps': 48433, 'loss/train': 1.7784948348999023} -11/07/2021 04:03:55 - INFO - __main__ - Step 48435: {'lr': 0.00038807961993171306, 'samples': 9299520, 'steps': 48434, 'loss/train': 1.703410267829895} -11/07/2021 04:03:55 - INFO - __main__ - Step 48436: {'lr': 0.00038807519602238174, 'samples': 9299712, 'steps': 48435, 'loss/train': 1.0404880046844482} -11/07/2021 04:03:56 - INFO - __main__ - Step 48437: {'lr': 0.00038807077205083577, 'samples': 9299904, 'steps': 48436, 'loss/train': 1.5217667818069458} -11/07/2021 04:03:56 - INFO - __main__ - Step 48438: {'lr': 0.0003880663480170772, 'samples': 9300096, 'steps': 48437, 'loss/train': 1.5590276718139648} -11/07/2021 04:03:57 - INFO - __main__ - Step 48439: {'lr': 0.00038806192392110817, 'samples': 9300288, 'steps': 48438, 'loss/train': 1.4246101379394531} -11/07/2021 04:03:57 - INFO - __main__ - Step 48440: {'lr': 0.0003880574997629305, 'samples': 9300480, 'steps': 48439, 'loss/train': 1.5377458333969116} -11/07/2021 04:03:58 - INFO - __main__ - Step 48441: {'lr': 0.0003880530755425462, 'samples': 9300672, 'steps': 48440, 'loss/train': 1.6214735507965088} -11/07/2021 04:03:58 - INFO - __main__ - Step 48442: {'lr': 0.0003880486512599574, 'samples': 9300864, 'steps': 48441, 'loss/train': 0.9166438579559326} -11/07/2021 04:03:59 - INFO - __main__ - Step 48443: {'lr': 0.00038804422691516606, 'samples': 9301056, 'steps': 48442, 'loss/train': 1.3133119344711304} -11/07/2021 04:03:59 - INFO - __main__ - Step 48444: {'lr': 0.0003880398025081741, 'samples': 9301248, 'steps': 48443, 'loss/train': 1.359276533126831} -11/07/2021 04:04:00 - INFO - __main__ - Step 48445: {'lr': 0.0003880353780389834, 'samples': 9301440, 'steps': 48444, 'loss/train': 0.9887827634811401} -11/07/2021 04:04:00 - INFO - __main__ - Step 48446: {'lr': 0.0003880309535075962, 'samples': 9301632, 'steps': 48445, 'loss/train': 1.2172267436981201} -11/07/2021 04:04:01 - INFO - __main__ - Step 48447: {'lr': 0.00038802652891401434, 'samples': 9301824, 'steps': 48446, 'loss/train': 2.194840669631958} -11/07/2021 04:04:01 - INFO - __main__ - Step 48448: {'lr': 0.0003880221042582399, 'samples': 9302016, 'steps': 48447, 'loss/train': 1.3867621421813965} -11/07/2021 04:04:02 - INFO - __main__ - Step 48449: {'lr': 0.0003880176795402748, 'samples': 9302208, 'steps': 48448, 'loss/train': 1.2776654958724976} -11/07/2021 04:04:02 - INFO - __main__ - Step 48450: {'lr': 0.00038801325476012113, 'samples': 9302400, 'steps': 48449, 'loss/train': 1.5412228107452393} -11/07/2021 04:04:02 - INFO - __main__ - Step 48451: {'lr': 0.00038800882991778073, 'samples': 9302592, 'steps': 48450, 'loss/train': 1.4281809329986572} -11/07/2021 04:04:03 - INFO - __main__ - Step 48452: {'lr': 0.00038800440501325574, 'samples': 9302784, 'steps': 48451, 'loss/train': 1.0717188119888306} -11/07/2021 04:04:04 - INFO - __main__ - Step 48453: {'lr': 0.000387999980046548, 'samples': 9302976, 'steps': 48452, 'loss/train': 1.6209484338760376} -11/07/2021 04:04:04 - INFO - __main__ - Step 48454: {'lr': 0.0003879955550176597, 'samples': 9303168, 'steps': 48453, 'loss/train': 2.196815252304077} -11/07/2021 04:04:05 - INFO - __main__ - Step 48455: {'lr': 0.00038799112992659267, 'samples': 9303360, 'steps': 48454, 'loss/train': 1.5383121967315674} -11/07/2021 04:04:05 - INFO - __main__ - Step 48456: {'lr': 0.00038798670477334894, 'samples': 9303552, 'steps': 48455, 'loss/train': 1.4590588808059692} -11/07/2021 04:04:05 - INFO - __main__ - Step 48457: {'lr': 0.00038798227955793066, 'samples': 9303744, 'steps': 48456, 'loss/train': 1.6237387657165527} -11/07/2021 04:04:06 - INFO - __main__ - Step 48458: {'lr': 0.0003879778542803396, 'samples': 9303936, 'steps': 48457, 'loss/train': 1.506496787071228} -11/07/2021 04:04:07 - INFO - __main__ - Step 48459: {'lr': 0.00038797342894057783, 'samples': 9304128, 'steps': 48458, 'loss/train': 0.8236624002456665} -11/07/2021 04:04:07 - INFO - __main__ - Step 48460: {'lr': 0.0003879690035386474, 'samples': 9304320, 'steps': 48459, 'loss/train': 1.6890909671783447} -11/07/2021 04:04:07 - INFO - __main__ - Step 48461: {'lr': 0.0003879645780745503, 'samples': 9304512, 'steps': 48460, 'loss/train': 1.3325366973876953} -11/07/2021 04:04:08 - INFO - __main__ - Step 48462: {'lr': 0.0003879601525482884, 'samples': 9304704, 'steps': 48461, 'loss/train': 1.5774303674697876} -11/07/2021 04:04:09 - INFO - __main__ - Step 48463: {'lr': 0.00038795572695986394, 'samples': 9304896, 'steps': 48462, 'loss/train': 1.639383316040039} -11/07/2021 04:04:09 - INFO - __main__ - Step 48464: {'lr': 0.00038795130130927857, 'samples': 9305088, 'steps': 48463, 'loss/train': 1.8844096660614014} -11/07/2021 04:04:09 - INFO - __main__ - Step 48465: {'lr': 0.0003879468755965346, 'samples': 9305280, 'steps': 48464, 'loss/train': 1.598170518875122} -11/07/2021 04:04:10 - INFO - __main__ - Step 48466: {'lr': 0.00038794244982163383, 'samples': 9305472, 'steps': 48465, 'loss/train': 1.6323853731155396} -11/07/2021 04:04:10 - INFO - __main__ - Step 48467: {'lr': 0.0003879380239845783, 'samples': 9305664, 'steps': 48466, 'loss/train': 0.7035285830497742} -11/07/2021 04:04:11 - INFO - __main__ - Step 48468: {'lr': 0.0003879335980853701, 'samples': 9305856, 'steps': 48467, 'loss/train': 1.063156008720398} -11/07/2021 04:04:12 - INFO - __main__ - Step 48469: {'lr': 0.00038792917212401114, 'samples': 9306048, 'steps': 48468, 'loss/train': 1.3900890350341797} -11/07/2021 04:04:12 - INFO - __main__ - Step 48470: {'lr': 0.0003879247461005034, 'samples': 9306240, 'steps': 48469, 'loss/train': 1.5695993900299072} -11/07/2021 04:04:12 - INFO - __main__ - Step 48471: {'lr': 0.0003879203200148489, 'samples': 9306432, 'steps': 48470, 'loss/train': 0.6920669674873352} -11/07/2021 04:04:13 - INFO - __main__ - Step 48472: {'lr': 0.0003879158938670496, 'samples': 9306624, 'steps': 48471, 'loss/train': 1.632412314414978} -11/07/2021 04:04:14 - INFO - __main__ - Step 48473: {'lr': 0.0003879114676571076, 'samples': 9306816, 'steps': 48472, 'loss/train': 1.1928110122680664} -11/07/2021 04:04:14 - INFO - __main__ - Step 48474: {'lr': 0.00038790704138502475, 'samples': 9307008, 'steps': 48473, 'loss/train': 1.233225703239441} -11/07/2021 04:04:14 - INFO - __main__ - Step 48475: {'lr': 0.0003879026150508032, 'samples': 9307200, 'steps': 48474, 'loss/train': 1.964782476425171} -11/07/2021 04:04:15 - INFO - __main__ - Step 48476: {'lr': 0.00038789818865444473, 'samples': 9307392, 'steps': 48475, 'loss/train': 2.022186040878296} -11/07/2021 04:04:15 - INFO - __main__ - Step 48477: {'lr': 0.0003878937621959516, 'samples': 9307584, 'steps': 48476, 'loss/train': 1.3771586418151855} -11/07/2021 04:04:16 - INFO - __main__ - Step 48478: {'lr': 0.0003878893356753256, 'samples': 9307776, 'steps': 48477, 'loss/train': 1.628832221031189} -11/07/2021 04:04:16 - INFO - __main__ - Step 48479: {'lr': 0.0003878849090925688, 'samples': 9307968, 'steps': 48478, 'loss/train': 1.2131322622299194} -11/07/2021 04:04:17 - INFO - __main__ - Step 48480: {'lr': 0.00038788048244768316, 'samples': 9308160, 'steps': 48479, 'loss/train': 1.4445890188217163} -11/07/2021 04:04:17 - INFO - __main__ - Step 48481: {'lr': 0.00038787605574067076, 'samples': 9308352, 'steps': 48480, 'loss/train': 1.3065617084503174} -11/07/2021 04:04:18 - INFO - __main__ - Step 48482: {'lr': 0.0003878716289715335, 'samples': 9308544, 'steps': 48481, 'loss/train': 1.4773340225219727} -11/07/2021 04:04:18 - INFO - __main__ - Step 48483: {'lr': 0.0003878672021402734, 'samples': 9308736, 'steps': 48482, 'loss/train': 1.5814417600631714} -11/07/2021 04:04:19 - INFO - __main__ - Step 48484: {'lr': 0.00038786277524689245, 'samples': 9308928, 'steps': 48483, 'loss/train': 1.6066398620605469} -11/07/2021 04:04:19 - INFO - __main__ - Step 48485: {'lr': 0.0003878583482913927, 'samples': 9309120, 'steps': 48484, 'loss/train': 1.5111255645751953} -11/07/2021 04:04:20 - INFO - __main__ - Step 48486: {'lr': 0.00038785392127377603, 'samples': 9309312, 'steps': 48485, 'loss/train': 1.7543655633926392} -11/07/2021 04:04:20 - INFO - __main__ - Step 48487: {'lr': 0.0003878494941940447, 'samples': 9309504, 'steps': 48486, 'loss/train': 1.267889380455017} -11/07/2021 04:04:20 - INFO - __main__ - Step 48488: {'lr': 0.0003878450670522004, 'samples': 9309696, 'steps': 48487, 'loss/train': 1.1851766109466553} -11/07/2021 04:04:21 - INFO - __main__ - Step 48489: {'lr': 0.00038784063984824516, 'samples': 9309888, 'steps': 48488, 'loss/train': 1.4379669427871704} -11/07/2021 04:04:22 - INFO - __main__ - Step 48490: {'lr': 0.00038783621258218115, 'samples': 9310080, 'steps': 48489, 'loss/train': 1.6245023012161255} -11/07/2021 04:04:22 - INFO - __main__ - Step 48491: {'lr': 0.00038783178525401025, 'samples': 9310272, 'steps': 48490, 'loss/train': 1.602535367012024} -11/07/2021 04:04:22 - INFO - __main__ - Step 48492: {'lr': 0.00038782735786373445, 'samples': 9310464, 'steps': 48491, 'loss/train': 1.8196521997451782} -11/07/2021 04:04:23 - INFO - __main__ - Step 48493: {'lr': 0.00038782293041135583, 'samples': 9310656, 'steps': 48492, 'loss/train': 1.6887304782867432} -11/07/2021 04:04:24 - INFO - __main__ - Step 48494: {'lr': 0.0003878185028968763, 'samples': 9310848, 'steps': 48493, 'loss/train': 1.529370665550232} -11/07/2021 04:04:24 - INFO - __main__ - Step 48495: {'lr': 0.00038781407532029785, 'samples': 9311040, 'steps': 48494, 'loss/train': 1.4546703100204468} -11/07/2021 04:04:25 - INFO - __main__ - Step 48496: {'lr': 0.0003878096476816225, 'samples': 9311232, 'steps': 48495, 'loss/train': 1.2742546796798706} -11/07/2021 04:04:25 - INFO - __main__ - Step 48497: {'lr': 0.0003878052199808523, 'samples': 9311424, 'steps': 48496, 'loss/train': 1.48627769947052} -11/07/2021 04:04:25 - INFO - __main__ - Step 48498: {'lr': 0.0003878007922179891, 'samples': 9311616, 'steps': 48497, 'loss/train': 1.6182938814163208} -11/07/2021 04:04:26 - INFO - __main__ - Step 48499: {'lr': 0.0003877963643930351, 'samples': 9311808, 'steps': 48498, 'loss/train': 1.3741947412490845} -11/07/2021 04:04:27 - INFO - __main__ - Step 48500: {'lr': 0.00038779193650599213, 'samples': 9312000, 'steps': 48499, 'loss/train': 1.2534310817718506} -11/07/2021 04:04:27 - INFO - __main__ - Step 48501: {'lr': 0.0003877875085568622, 'samples': 9312192, 'steps': 48500, 'loss/train': 1.628035306930542} -11/07/2021 04:04:27 - INFO - __main__ - Step 48502: {'lr': 0.0003877830805456474, 'samples': 9312384, 'steps': 48501, 'loss/train': 1.7516915798187256} -11/07/2021 04:04:28 - INFO - __main__ - Step 48503: {'lr': 0.00038777865247234967, 'samples': 9312576, 'steps': 48502, 'loss/train': 1.5887657403945923} -11/07/2021 04:04:28 - INFO - __main__ - Step 48504: {'lr': 0.00038777422433697106, 'samples': 9312768, 'steps': 48503, 'loss/train': 1.4785151481628418} -11/07/2021 04:04:29 - INFO - __main__ - Step 48505: {'lr': 0.00038776979613951347, 'samples': 9312960, 'steps': 48504, 'loss/train': 1.5877552032470703} -11/07/2021 04:04:29 - INFO - __main__ - Step 48506: {'lr': 0.00038776536787997885, 'samples': 9313152, 'steps': 48505, 'loss/train': 1.8600739240646362} -11/07/2021 04:04:30 - INFO - __main__ - Step 48507: {'lr': 0.0003877609395583693, 'samples': 9313344, 'steps': 48506, 'loss/train': 1.3988336324691772} -11/07/2021 04:04:30 - INFO - __main__ - Step 48508: {'lr': 0.0003877565111746869, 'samples': 9313536, 'steps': 48507, 'loss/train': 1.3312302827835083} -11/07/2021 04:04:31 - INFO - __main__ - Step 48509: {'lr': 0.00038775208272893346, 'samples': 9313728, 'steps': 48508, 'loss/train': 1.4225656986236572} -11/07/2021 04:04:32 - INFO - __main__ - Step 48510: {'lr': 0.0003877476542211111, 'samples': 9313920, 'steps': 48509, 'loss/train': 1.4918937683105469} -11/07/2021 04:04:33 - INFO - __main__ - Step 48511: {'lr': 0.0003877432256512218, 'samples': 9314112, 'steps': 48510, 'loss/train': 1.3282244205474854} -11/07/2021 04:04:33 - INFO - __main__ - Step 48512: {'lr': 0.00038773879701926747, 'samples': 9314304, 'steps': 48511, 'loss/train': 1.7111784219741821} -11/07/2021 04:04:33 - INFO - __main__ - Step 48513: {'lr': 0.0003877343683252501, 'samples': 9314496, 'steps': 48512, 'loss/train': 1.8285577297210693} -11/07/2021 04:04:34 - INFO - __main__ - Step 48514: {'lr': 0.00038772993956917183, 'samples': 9314688, 'steps': 48513, 'loss/train': 1.6901429891586304} -11/07/2021 04:04:34 - INFO - __main__ - Step 48515: {'lr': 0.00038772551075103457, 'samples': 9314880, 'steps': 48514, 'loss/train': 2.77165150642395} -11/07/2021 04:04:34 - INFO - __main__ - Step 48516: {'lr': 0.00038772108187084034, 'samples': 9315072, 'steps': 48515, 'loss/train': 2.760432004928589} -11/07/2021 04:04:35 - INFO - __main__ - Step 48517: {'lr': 0.00038771665292859116, 'samples': 9315264, 'steps': 48516, 'loss/train': 1.6580708026885986} -11/07/2021 04:04:36 - INFO - __main__ - Step 48518: {'lr': 0.00038771222392428885, 'samples': 9315456, 'steps': 48517, 'loss/train': 1.2777594327926636} -11/07/2021 04:04:36 - INFO - __main__ - Step 48519: {'lr': 0.0003877077948579356, 'samples': 9315648, 'steps': 48518, 'loss/train': 1.2819809913635254} -11/07/2021 04:04:36 - INFO - __main__ - Step 48520: {'lr': 0.00038770336572953334, 'samples': 9315840, 'steps': 48519, 'loss/train': 1.8734691143035889} -11/07/2021 04:04:37 - INFO - __main__ - Step 48521: {'lr': 0.00038769893653908404, 'samples': 9316032, 'steps': 48520, 'loss/train': 1.5955742597579956} -11/07/2021 04:04:38 - INFO - __main__ - Step 48522: {'lr': 0.0003876945072865898, 'samples': 9316224, 'steps': 48521, 'loss/train': 1.3457098007202148} -11/07/2021 04:04:38 - INFO - __main__ - Step 48523: {'lr': 0.0003876900779720525, 'samples': 9316416, 'steps': 48522, 'loss/train': 1.5795559883117676} -11/07/2021 04:04:39 - INFO - __main__ - Step 48524: {'lr': 0.0003876856485954742, 'samples': 9316608, 'steps': 48523, 'loss/train': 1.3283982276916504} -11/07/2021 04:04:39 - INFO - __main__ - Step 48525: {'lr': 0.00038768121915685685, 'samples': 9316800, 'steps': 48524, 'loss/train': 1.6154831647872925} -11/07/2021 04:04:39 - INFO - __main__ - Step 48526: {'lr': 0.00038767678965620245, 'samples': 9316992, 'steps': 48525, 'loss/train': 1.2984143495559692} -11/07/2021 04:04:40 - INFO - __main__ - Step 48527: {'lr': 0.00038767236009351304, 'samples': 9317184, 'steps': 48526, 'loss/train': 1.514677882194519} -11/07/2021 04:04:41 - INFO - __main__ - Step 48528: {'lr': 0.00038766793046879057, 'samples': 9317376, 'steps': 48527, 'loss/train': 0.9569680094718933} -11/07/2021 04:04:41 - INFO - __main__ - Step 48529: {'lr': 0.000387663500782037, 'samples': 9317568, 'steps': 48528, 'loss/train': 1.884013295173645} -11/07/2021 04:04:41 - INFO - __main__ - Step 48530: {'lr': 0.00038765907103325447, 'samples': 9317760, 'steps': 48529, 'loss/train': 1.5891244411468506} -11/07/2021 04:04:42 - INFO - __main__ - Step 48531: {'lr': 0.00038765464122244485, 'samples': 9317952, 'steps': 48530, 'loss/train': 1.4183497428894043} -11/07/2021 04:04:42 - INFO - __main__ - Step 48532: {'lr': 0.0003876502113496102, 'samples': 9318144, 'steps': 48531, 'loss/train': 1.2370476722717285} -11/07/2021 04:04:43 - INFO - __main__ - Step 48533: {'lr': 0.00038764578141475245, 'samples': 9318336, 'steps': 48532, 'loss/train': 1.615739345550537} -11/07/2021 04:04:43 - INFO - __main__ - Step 48534: {'lr': 0.0003876413514178736, 'samples': 9318528, 'steps': 48533, 'loss/train': 1.2059228420257568} -11/07/2021 04:04:44 - INFO - __main__ - Step 48535: {'lr': 0.0003876369213589758, 'samples': 9318720, 'steps': 48534, 'loss/train': 1.2580654621124268} -11/07/2021 04:04:44 - INFO - __main__ - Step 48536: {'lr': 0.0003876324912380608, 'samples': 9318912, 'steps': 48535, 'loss/train': 1.6176378726959229} -11/07/2021 04:04:44 - INFO - __main__ - Step 48537: {'lr': 0.00038762806105513084, 'samples': 9319104, 'steps': 48536, 'loss/train': 1.6030935049057007} -11/07/2021 04:04:45 - INFO - __main__ - Step 48538: {'lr': 0.0003876236308101877, 'samples': 9319296, 'steps': 48537, 'loss/train': 1.8924974203109741} -11/07/2021 04:04:46 - INFO - __main__ - Step 48539: {'lr': 0.0003876192005032335, 'samples': 9319488, 'steps': 48538, 'loss/train': 0.9740433692932129} -11/07/2021 04:04:46 - INFO - __main__ - Step 48540: {'lr': 0.00038761477013427026, 'samples': 9319680, 'steps': 48539, 'loss/train': 1.4934413433074951} -11/07/2021 04:04:47 - INFO - __main__ - Step 48541: {'lr': 0.00038761033970329987, 'samples': 9319872, 'steps': 48540, 'loss/train': 1.0842349529266357} -11/07/2021 04:04:47 - INFO - __main__ - Step 48542: {'lr': 0.00038760590921032445, 'samples': 9320064, 'steps': 48541, 'loss/train': 1.3521828651428223} -11/07/2021 04:04:48 - INFO - __main__ - Step 48543: {'lr': 0.0003876014786553459, 'samples': 9320256, 'steps': 48542, 'loss/train': 1.6854872703552246} -11/07/2021 04:04:48 - INFO - __main__ - Step 48544: {'lr': 0.00038759704803836625, 'samples': 9320448, 'steps': 48543, 'loss/train': 1.2868236303329468} -11/07/2021 04:04:49 - INFO - __main__ - Step 48545: {'lr': 0.00038759261735938743, 'samples': 9320640, 'steps': 48544, 'loss/train': 1.4686287641525269} -11/07/2021 04:04:49 - INFO - __main__ - Step 48546: {'lr': 0.00038758818661841155, 'samples': 9320832, 'steps': 48545, 'loss/train': 1.323473572731018} -11/07/2021 04:04:49 - INFO - __main__ - Step 48547: {'lr': 0.0003875837558154406, 'samples': 9321024, 'steps': 48546, 'loss/train': 1.3346006870269775} -11/07/2021 04:04:50 - INFO - __main__ - Step 48548: {'lr': 0.0003875793249504765, 'samples': 9321216, 'steps': 48547, 'loss/train': 1.331971526145935} -11/07/2021 04:04:51 - INFO - __main__ - Step 48549: {'lr': 0.00038757489402352124, 'samples': 9321408, 'steps': 48548, 'loss/train': 2.03489089012146} -11/07/2021 04:04:51 - INFO - __main__ - Step 48550: {'lr': 0.0003875704630345769, 'samples': 9321600, 'steps': 48549, 'loss/train': 1.404166579246521} -11/07/2021 04:04:51 - INFO - __main__ - Step 48551: {'lr': 0.00038756603198364544, 'samples': 9321792, 'steps': 48550, 'loss/train': 1.6891363859176636} -11/07/2021 04:04:52 - INFO - __main__ - Step 48552: {'lr': 0.0003875616008707288, 'samples': 9321984, 'steps': 48551, 'loss/train': 1.9975979328155518} -11/07/2021 04:04:53 - INFO - __main__ - Step 48553: {'lr': 0.00038755716969582913, 'samples': 9322176, 'steps': 48552, 'loss/train': 1.307058572769165} -11/07/2021 04:04:53 - INFO - __main__ - Step 48554: {'lr': 0.0003875527384589482, 'samples': 9322368, 'steps': 48553, 'loss/train': 1.2819502353668213} -11/07/2021 04:04:54 - INFO - __main__ - Step 48555: {'lr': 0.00038754830716008815, 'samples': 9322560, 'steps': 48554, 'loss/train': 1.1141554117202759} -11/07/2021 04:04:54 - INFO - __main__ - Step 48556: {'lr': 0.000387543875799251, 'samples': 9322752, 'steps': 48555, 'loss/train': 1.530539631843567} -11/07/2021 04:04:54 - INFO - __main__ - Step 48557: {'lr': 0.0003875394443764387, 'samples': 9322944, 'steps': 48556, 'loss/train': 2.102464199066162} -11/07/2021 04:04:55 - INFO - __main__ - Step 48558: {'lr': 0.00038753501289165324, 'samples': 9323136, 'steps': 48557, 'loss/train': 1.6528323888778687} -11/07/2021 04:04:56 - INFO - __main__ - Step 48559: {'lr': 0.0003875305813448966, 'samples': 9323328, 'steps': 48558, 'loss/train': 1.4500070810317993} -11/07/2021 04:04:56 - INFO - __main__ - Step 48560: {'lr': 0.00038752614973617085, 'samples': 9323520, 'steps': 48559, 'loss/train': 1.2675766944885254} -11/07/2021 04:04:56 - INFO - __main__ - Step 48561: {'lr': 0.0003875217180654779, 'samples': 9323712, 'steps': 48560, 'loss/train': 0.9635229706764221} -11/07/2021 04:04:57 - INFO - __main__ - Step 48562: {'lr': 0.00038751728633281974, 'samples': 9323904, 'steps': 48561, 'loss/train': 1.6561272144317627} -11/07/2021 04:04:57 - INFO - __main__ - Step 48563: {'lr': 0.00038751285453819846, 'samples': 9324096, 'steps': 48562, 'loss/train': 1.4693461656570435} -11/07/2021 04:04:59 - INFO - __main__ - Step 48564: {'lr': 0.000387508422681616, 'samples': 9324288, 'steps': 48563, 'loss/train': 1.416921854019165} -11/07/2021 04:04:59 - INFO - __main__ - Step 48565: {'lr': 0.0003875039907630744, 'samples': 9324480, 'steps': 48564, 'loss/train': 1.456447720527649} -11/07/2021 04:04:59 - INFO - __main__ - Step 48566: {'lr': 0.0003874995587825756, 'samples': 9324672, 'steps': 48565, 'loss/train': 1.5661808252334595} -11/07/2021 04:05:00 - INFO - __main__ - Step 48567: {'lr': 0.00038749512674012167, 'samples': 9324864, 'steps': 48566, 'loss/train': 1.9703129529953003} -11/07/2021 04:05:00 - INFO - __main__ - Step 48568: {'lr': 0.0003874906946357145, 'samples': 9325056, 'steps': 48567, 'loss/train': 1.4652469158172607} -11/07/2021 04:05:01 - INFO - __main__ - Step 48569: {'lr': 0.00038748626246935613, 'samples': 9325248, 'steps': 48568, 'loss/train': 1.4368247985839844} -11/07/2021 04:05:01 - INFO - __main__ - Step 48570: {'lr': 0.0003874818302410486, 'samples': 9325440, 'steps': 48569, 'loss/train': 0.7973642349243164} -11/07/2021 04:05:02 - INFO - __main__ - Step 48571: {'lr': 0.00038747739795079396, 'samples': 9325632, 'steps': 48570, 'loss/train': 1.7440383434295654} -11/07/2021 04:05:02 - INFO - __main__ - Step 48572: {'lr': 0.000387472965598594, 'samples': 9325824, 'steps': 48571, 'loss/train': 1.2948087453842163} -11/07/2021 04:05:03 - INFO - __main__ - Step 48573: {'lr': 0.0003874685331844509, 'samples': 9326016, 'steps': 48572, 'loss/train': 1.4181630611419678} -11/07/2021 04:05:03 - INFO - __main__ - Step 48574: {'lr': 0.0003874641007083666, 'samples': 9326208, 'steps': 48573, 'loss/train': 1.457755208015442} -11/07/2021 04:05:05 - INFO - __main__ - Step 48575: {'lr': 0.00038745966817034305, 'samples': 9326400, 'steps': 48574, 'loss/train': 1.319076418876648} -11/07/2021 04:05:05 - INFO - __main__ - Step 48576: {'lr': 0.0003874552355703823, 'samples': 9326592, 'steps': 48575, 'loss/train': 0.9433940052986145} -11/07/2021 04:05:05 - INFO - __main__ - Step 48577: {'lr': 0.00038745080290848635, 'samples': 9326784, 'steps': 48576, 'loss/train': 1.485592246055603} -11/07/2021 04:05:06 - INFO - __main__ - Step 48578: {'lr': 0.0003874463701846573, 'samples': 9326976, 'steps': 48577, 'loss/train': 0.6104253530502319} -11/07/2021 04:05:06 - INFO - __main__ - Step 48579: {'lr': 0.0003874419373988969, 'samples': 9327168, 'steps': 48578, 'loss/train': 1.7105915546417236} -11/07/2021 04:05:06 - INFO - __main__ - Step 48580: {'lr': 0.0003874375045512073, 'samples': 9327360, 'steps': 48579, 'loss/train': 1.3981499671936035} -11/07/2021 04:05:07 - INFO - __main__ - Step 48581: {'lr': 0.0003874330716415905, 'samples': 9327552, 'steps': 48580, 'loss/train': 1.525861382484436} -11/07/2021 04:05:08 - INFO - __main__ - Step 48582: {'lr': 0.00038742863867004853, 'samples': 9327744, 'steps': 48581, 'loss/train': 1.4717320203781128} -11/07/2021 04:05:08 - INFO - __main__ - Step 48583: {'lr': 0.0003874242056365833, 'samples': 9327936, 'steps': 48582, 'loss/train': 1.9312816858291626} -11/07/2021 04:05:08 - INFO - __main__ - Step 48584: {'lr': 0.0003874197725411969, 'samples': 9328128, 'steps': 48583, 'loss/train': 0.9575197100639343} -11/07/2021 04:05:09 - INFO - __main__ - Step 48585: {'lr': 0.00038741533938389117, 'samples': 9328320, 'steps': 48584, 'loss/train': 1.4876394271850586} -11/07/2021 04:05:10 - INFO - __main__ - Step 48586: {'lr': 0.00038741090616466824, 'samples': 9328512, 'steps': 48585, 'loss/train': 1.5372319221496582} -11/07/2021 04:05:10 - INFO - __main__ - Step 48587: {'lr': 0.0003874064728835301, 'samples': 9328704, 'steps': 48586, 'loss/train': 1.9714494943618774} -11/07/2021 04:05:10 - INFO - __main__ - Step 48588: {'lr': 0.0003874020395404787, 'samples': 9328896, 'steps': 48587, 'loss/train': 1.817679524421692} -11/07/2021 04:05:11 - INFO - __main__ - Step 48589: {'lr': 0.00038739760613551606, 'samples': 9329088, 'steps': 48588, 'loss/train': 1.5934373140335083} -11/07/2021 04:05:11 - INFO - __main__ - Step 48590: {'lr': 0.0003873931726686442, 'samples': 9329280, 'steps': 48589, 'loss/train': 1.5713540315628052} -11/07/2021 04:05:12 - INFO - __main__ - Step 48591: {'lr': 0.0003873887391398651, 'samples': 9329472, 'steps': 48590, 'loss/train': 1.4419883489608765} -11/07/2021 04:05:13 - INFO - __main__ - Step 48592: {'lr': 0.0003873843055491807, 'samples': 9329664, 'steps': 48591, 'loss/train': 1.312111496925354} -11/07/2021 04:05:13 - INFO - __main__ - Step 48593: {'lr': 0.00038737987189659315, 'samples': 9329856, 'steps': 48592, 'loss/train': 1.7823280096054077} -11/07/2021 04:05:13 - INFO - __main__ - Step 48594: {'lr': 0.00038737543818210423, 'samples': 9330048, 'steps': 48593, 'loss/train': 1.4560304880142212} -11/07/2021 04:05:14 - INFO - __main__ - Step 48595: {'lr': 0.00038737100440571615, 'samples': 9330240, 'steps': 48594, 'loss/train': 1.3260122537612915} -11/07/2021 04:05:15 - INFO - __main__ - Step 48596: {'lr': 0.00038736657056743075, 'samples': 9330432, 'steps': 48595, 'loss/train': 1.53359854221344} -11/07/2021 04:05:15 - INFO - __main__ - Step 48597: {'lr': 0.0003873621366672502, 'samples': 9330624, 'steps': 48596, 'loss/train': 1.49400794506073} -11/07/2021 04:05:15 - INFO - __main__ - Step 48598: {'lr': 0.0003873577027051763, 'samples': 9330816, 'steps': 48597, 'loss/train': 1.5908323526382446} -11/07/2021 04:05:16 - INFO - __main__ - Step 48599: {'lr': 0.0003873532686812111, 'samples': 9331008, 'steps': 48598, 'loss/train': 1.642113447189331} -11/07/2021 04:05:16 - INFO - __main__ - Step 48600: {'lr': 0.0003873488345953567, 'samples': 9331200, 'steps': 48599, 'loss/train': 1.4471324682235718} -11/07/2021 04:05:17 - INFO - __main__ - Step 48601: {'lr': 0.00038734440044761503, 'samples': 9331392, 'steps': 48600, 'loss/train': 0.10087435692548752} -11/07/2021 04:05:17 - INFO - __main__ - Step 48602: {'lr': 0.0003873399662379881, 'samples': 9331584, 'steps': 48601, 'loss/train': 1.194433569908142} -11/07/2021 04:05:18 - INFO - __main__ - Step 48603: {'lr': 0.00038733553196647786, 'samples': 9331776, 'steps': 48602, 'loss/train': 1.6700736284255981} -11/07/2021 04:05:18 - INFO - __main__ - Step 48604: {'lr': 0.00038733109763308644, 'samples': 9331968, 'steps': 48603, 'loss/train': 1.0045156478881836} -11/07/2021 04:05:18 - INFO - __main__ - Step 48605: {'lr': 0.0003873266632378157, 'samples': 9332160, 'steps': 48604, 'loss/train': 1.76278555393219} -11/07/2021 04:05:19 - INFO - __main__ - Step 48606: {'lr': 0.00038732222878066764, 'samples': 9332352, 'steps': 48605, 'loss/train': 1.3059808015823364} -11/07/2021 04:05:20 - INFO - __main__ - Step 48607: {'lr': 0.0003873177942616444, 'samples': 9332544, 'steps': 48606, 'loss/train': 1.3572828769683838} -11/07/2021 04:05:20 - INFO - __main__ - Step 48608: {'lr': 0.0003873133596807478, 'samples': 9332736, 'steps': 48607, 'loss/train': 1.509686827659607} -11/07/2021 04:05:21 - INFO - __main__ - Step 48609: {'lr': 0.00038730892503797986, 'samples': 9332928, 'steps': 48608, 'loss/train': 1.3287807703018188} -11/07/2021 04:05:21 - INFO - __main__ - Step 48610: {'lr': 0.00038730449033334277, 'samples': 9333120, 'steps': 48609, 'loss/train': 1.5132238864898682} -11/07/2021 04:05:21 - INFO - __main__ - Step 48611: {'lr': 0.00038730005556683833, 'samples': 9333312, 'steps': 48610, 'loss/train': 1.4505895376205444} -11/07/2021 04:05:22 - INFO - __main__ - Step 48612: {'lr': 0.00038729562073846856, 'samples': 9333504, 'steps': 48611, 'loss/train': 1.8530577421188354} -11/07/2021 04:05:23 - INFO - __main__ - Step 48613: {'lr': 0.00038729118584823557, 'samples': 9333696, 'steps': 48612, 'loss/train': 1.5153831243515015} -11/07/2021 04:05:23 - INFO - __main__ - Step 48614: {'lr': 0.0003872867508961413, 'samples': 9333888, 'steps': 48613, 'loss/train': 1.310623288154602} -11/07/2021 04:05:23 - INFO - __main__ - Step 48615: {'lr': 0.00038728231588218767, 'samples': 9334080, 'steps': 48614, 'loss/train': 1.5036399364471436} -11/07/2021 04:05:24 - INFO - __main__ - Step 48616: {'lr': 0.00038727788080637684, 'samples': 9334272, 'steps': 48615, 'loss/train': 1.897681713104248} -11/07/2021 04:05:25 - INFO - __main__ - Step 48617: {'lr': 0.00038727344566871064, 'samples': 9334464, 'steps': 48616, 'loss/train': 2.2115097045898438} -11/07/2021 04:05:25 - INFO - __main__ - Step 48618: {'lr': 0.00038726901046919114, 'samples': 9334656, 'steps': 48617, 'loss/train': 1.8675711154937744} -11/07/2021 04:05:26 - INFO - __main__ - Step 48619: {'lr': 0.00038726457520782046, 'samples': 9334848, 'steps': 48618, 'loss/train': 1.9020841121673584} -11/07/2021 04:05:26 - INFO - __main__ - Step 48620: {'lr': 0.00038726013988460027, 'samples': 9335040, 'steps': 48619, 'loss/train': 1.3993057012557983} -11/07/2021 04:05:26 - INFO - __main__ - Step 48621: {'lr': 0.00038725570449953296, 'samples': 9335232, 'steps': 48620, 'loss/train': 0.7827754020690918} -11/07/2021 04:05:27 - INFO - __main__ - Step 48622: {'lr': 0.0003872512690526203, 'samples': 9335424, 'steps': 48621, 'loss/train': 1.1186741590499878} -11/07/2021 04:05:28 - INFO - __main__ - Step 48623: {'lr': 0.0003872468335438643, 'samples': 9335616, 'steps': 48622, 'loss/train': 1.4439775943756104} -11/07/2021 04:05:28 - INFO - __main__ - Step 48624: {'lr': 0.000387242397973267, 'samples': 9335808, 'steps': 48623, 'loss/train': 1.7906427383422852} -11/07/2021 04:05:28 - INFO - __main__ - Step 48625: {'lr': 0.0003872379623408304, 'samples': 9336000, 'steps': 48624, 'loss/train': 1.492393970489502} -11/07/2021 04:05:29 - INFO - __main__ - Step 48626: {'lr': 0.0003872335266465565, 'samples': 9336192, 'steps': 48625, 'loss/train': 1.3923840522766113} -11/07/2021 04:05:30 - INFO - __main__ - Step 48627: {'lr': 0.00038722909089044735, 'samples': 9336384, 'steps': 48626, 'loss/train': 1.0367521047592163} -11/07/2021 04:05:30 - INFO - __main__ - Step 48628: {'lr': 0.0003872246550725048, 'samples': 9336576, 'steps': 48627, 'loss/train': 1.5686945915222168} -11/07/2021 04:05:30 - INFO - __main__ - Step 48629: {'lr': 0.000387220219192731, 'samples': 9336768, 'steps': 48628, 'loss/train': 1.4293190240859985} -11/07/2021 04:05:31 - INFO - __main__ - Step 48630: {'lr': 0.00038721578325112785, 'samples': 9336960, 'steps': 48629, 'loss/train': 2.342914342880249} -11/07/2021 04:05:31 - INFO - __main__ - Step 48631: {'lr': 0.00038721134724769733, 'samples': 9337152, 'steps': 48630, 'loss/train': 1.2137004137039185} -11/07/2021 04:05:32 - INFO - __main__ - Step 48632: {'lr': 0.00038720691118244164, 'samples': 9337344, 'steps': 48631, 'loss/train': 1.630367398262024} -11/07/2021 04:05:32 - INFO - __main__ - Step 48633: {'lr': 0.00038720247505536257, 'samples': 9337536, 'steps': 48632, 'loss/train': 1.723755955696106} -11/07/2021 04:05:33 - INFO - __main__ - Step 48634: {'lr': 0.0003871980388664621, 'samples': 9337728, 'steps': 48633, 'loss/train': 1.821600317955017} -11/07/2021 04:05:33 - INFO - __main__ - Step 48635: {'lr': 0.00038719360261574233, 'samples': 9337920, 'steps': 48634, 'loss/train': 1.6551693677902222} -11/07/2021 04:05:34 - INFO - __main__ - Step 48636: {'lr': 0.00038718916630320533, 'samples': 9338112, 'steps': 48635, 'loss/train': 1.846117615699768} -11/07/2021 04:05:34 - INFO - __main__ - Step 48637: {'lr': 0.0003871847299288529, 'samples': 9338304, 'steps': 48636, 'loss/train': 1.1855734586715698} -11/07/2021 04:05:35 - INFO - __main__ - Step 48638: {'lr': 0.00038718029349268723, 'samples': 9338496, 'steps': 48637, 'loss/train': 1.9610881805419922} -11/07/2021 04:05:35 - INFO - __main__ - Step 48639: {'lr': 0.00038717585699471024, 'samples': 9338688, 'steps': 48638, 'loss/train': 1.5299619436264038} -11/07/2021 04:05:36 - INFO - __main__ - Step 48640: {'lr': 0.0003871714204349239, 'samples': 9338880, 'steps': 48639, 'loss/train': 1.39769446849823} -11/07/2021 04:05:36 - INFO - __main__ - Step 48641: {'lr': 0.00038716698381333027, 'samples': 9339072, 'steps': 48640, 'loss/train': 1.4764127731323242} -11/07/2021 04:05:36 - INFO - __main__ - Step 48642: {'lr': 0.0003871625471299313, 'samples': 9339264, 'steps': 48641, 'loss/train': 1.362342357635498} -11/07/2021 04:05:37 - INFO - __main__ - Step 48643: {'lr': 0.00038715811038472894, 'samples': 9339456, 'steps': 48642, 'loss/train': 1.7338573932647705} -11/07/2021 04:05:38 - INFO - __main__ - Step 48644: {'lr': 0.0003871536735777252, 'samples': 9339648, 'steps': 48643, 'loss/train': 1.346001386642456} -11/07/2021 04:05:38 - INFO - __main__ - Step 48645: {'lr': 0.0003871492367089223, 'samples': 9339840, 'steps': 48644, 'loss/train': 1.7608494758605957} -11/07/2021 04:05:38 - INFO - __main__ - Step 48646: {'lr': 0.000387144799778322, 'samples': 9340032, 'steps': 48645, 'loss/train': 1.3227531909942627} -11/07/2021 04:05:39 - INFO - __main__ - Step 48647: {'lr': 0.00038714036278592636, 'samples': 9340224, 'steps': 48646, 'loss/train': 1.2336411476135254} -11/07/2021 04:05:40 - INFO - __main__ - Step 48648: {'lr': 0.0003871359257317374, 'samples': 9340416, 'steps': 48647, 'loss/train': 1.5839163064956665} -11/07/2021 04:05:40 - INFO - __main__ - Step 48649: {'lr': 0.0003871314886157571, 'samples': 9340608, 'steps': 48648, 'loss/train': 1.714418649673462} -11/07/2021 04:05:40 - INFO - __main__ - Step 48650: {'lr': 0.0003871270514379874, 'samples': 9340800, 'steps': 48649, 'loss/train': 0.7539232969284058} -11/07/2021 04:05:41 - INFO - __main__ - Step 48651: {'lr': 0.00038712261419843056, 'samples': 9340992, 'steps': 48650, 'loss/train': 1.4385876655578613} -11/07/2021 04:05:41 - INFO - __main__ - Step 48652: {'lr': 0.00038711817689708817, 'samples': 9341184, 'steps': 48651, 'loss/train': 1.1543158292770386} -11/07/2021 04:05:42 - INFO - __main__ - Step 48653: {'lr': 0.00038711373953396257, 'samples': 9341376, 'steps': 48652, 'loss/train': 1.554872751235962} -11/07/2021 04:05:43 - INFO - __main__ - Step 48654: {'lr': 0.0003871093021090556, 'samples': 9341568, 'steps': 48653, 'loss/train': 0.905467689037323} -11/07/2021 04:05:43 - INFO - __main__ - Step 48655: {'lr': 0.0003871048646223693, 'samples': 9341760, 'steps': 48654, 'loss/train': 1.8039259910583496} -11/07/2021 04:05:43 - INFO - __main__ - Step 48656: {'lr': 0.00038710042707390557, 'samples': 9341952, 'steps': 48655, 'loss/train': 1.3409221172332764} -11/07/2021 04:05:44 - INFO - __main__ - Step 48657: {'lr': 0.00038709598946366666, 'samples': 9342144, 'steps': 48656, 'loss/train': 0.9013664722442627} -11/07/2021 04:05:44 - INFO - __main__ - Step 48658: {'lr': 0.00038709155179165436, 'samples': 9342336, 'steps': 48657, 'loss/train': 1.5325487852096558} -11/07/2021 04:05:45 - INFO - __main__ - Step 48659: {'lr': 0.00038708711405787067, 'samples': 9342528, 'steps': 48658, 'loss/train': 1.698494553565979} -11/07/2021 04:05:45 - INFO - __main__ - Step 48660: {'lr': 0.0003870826762623177, 'samples': 9342720, 'steps': 48659, 'loss/train': 1.3557522296905518} -11/07/2021 04:05:46 - INFO - __main__ - Step 48661: {'lr': 0.00038707823840499736, 'samples': 9342912, 'steps': 48660, 'loss/train': 1.452558159828186} -11/07/2021 04:05:46 - INFO - __main__ - Step 48662: {'lr': 0.0003870738004859117, 'samples': 9343104, 'steps': 48661, 'loss/train': 1.7299939393997192} -11/07/2021 04:05:47 - INFO - __main__ - Step 48663: {'lr': 0.0003870693625050626, 'samples': 9343296, 'steps': 48662, 'loss/train': 1.2825325727462769} -11/07/2021 04:05:47 - INFO - __main__ - Step 48664: {'lr': 0.00038706492446245234, 'samples': 9343488, 'steps': 48663, 'loss/train': 1.4849152565002441} -11/07/2021 04:05:48 - INFO - __main__ - Step 48665: {'lr': 0.00038706048635808266, 'samples': 9343680, 'steps': 48664, 'loss/train': 1.9088115692138672} -11/07/2021 04:05:48 - INFO - __main__ - Step 48666: {'lr': 0.0003870560481919556, 'samples': 9343872, 'steps': 48665, 'loss/train': 1.2525205612182617} -11/07/2021 04:05:49 - INFO - __main__ - Step 48667: {'lr': 0.00038705160996407325, 'samples': 9344064, 'steps': 48666, 'loss/train': 1.3481857776641846} -11/07/2021 04:05:49 - INFO - __main__ - Step 48668: {'lr': 0.00038704717167443753, 'samples': 9344256, 'steps': 48667, 'loss/train': 1.5626063346862793} -11/07/2021 04:05:49 - INFO - __main__ - Step 48669: {'lr': 0.0003870427333230505, 'samples': 9344448, 'steps': 48668, 'loss/train': 1.2384713888168335} -11/07/2021 04:05:50 - INFO - __main__ - Step 48670: {'lr': 0.00038703829490991407, 'samples': 9344640, 'steps': 48669, 'loss/train': 1.6280044317245483} -11/07/2021 04:05:51 - INFO - __main__ - Step 48671: {'lr': 0.0003870338564350303, 'samples': 9344832, 'steps': 48670, 'loss/train': 1.4496784210205078} -11/07/2021 04:05:51 - INFO - __main__ - Step 48672: {'lr': 0.0003870294178984013, 'samples': 9345024, 'steps': 48671, 'loss/train': 1.2935545444488525} -11/07/2021 04:05:51 - INFO - __main__ - Step 48673: {'lr': 0.0003870249793000289, 'samples': 9345216, 'steps': 48672, 'loss/train': 1.9649289846420288} -11/07/2021 04:05:52 - INFO - __main__ - Step 48674: {'lr': 0.0003870205406399151, 'samples': 9345408, 'steps': 48673, 'loss/train': 1.470001459121704} -11/07/2021 04:05:53 - INFO - __main__ - Step 48675: {'lr': 0.000387016101918062, 'samples': 9345600, 'steps': 48674, 'loss/train': 1.6249600648880005} -11/07/2021 04:05:53 - INFO - __main__ - Step 48676: {'lr': 0.0003870116631344716, 'samples': 9345792, 'steps': 48675, 'loss/train': 1.3065425157546997} -11/07/2021 04:05:53 - INFO - __main__ - Step 48677: {'lr': 0.0003870072242891458, 'samples': 9345984, 'steps': 48676, 'loss/train': 2.1314406394958496} -11/07/2021 04:05:54 - INFO - __main__ - Step 48678: {'lr': 0.0003870027853820867, 'samples': 9346176, 'steps': 48677, 'loss/train': 1.4698635339736938} -11/07/2021 04:05:54 - INFO - __main__ - Step 48679: {'lr': 0.0003869983464132962, 'samples': 9346368, 'steps': 48678, 'loss/train': 1.4177656173706055} -11/07/2021 04:05:55 - INFO - __main__ - Step 48680: {'lr': 0.0003869939073827764, 'samples': 9346560, 'steps': 48679, 'loss/train': 1.283326506614685} -11/07/2021 04:05:55 - INFO - __main__ - Step 48681: {'lr': 0.00038698946829052926, 'samples': 9346752, 'steps': 48680, 'loss/train': 0.9898263812065125} -11/07/2021 04:05:56 - INFO - __main__ - Step 48682: {'lr': 0.00038698502913655673, 'samples': 9346944, 'steps': 48681, 'loss/train': 1.7014774084091187} -11/07/2021 04:05:56 - INFO - __main__ - Step 48683: {'lr': 0.00038698058992086095, 'samples': 9347136, 'steps': 48682, 'loss/train': 1.427775263786316} -11/07/2021 04:05:57 - INFO - __main__ - Step 48684: {'lr': 0.0003869761506434438, 'samples': 9347328, 'steps': 48683, 'loss/train': 1.2640846967697144} -11/07/2021 04:05:58 - INFO - __main__ - Step 48685: {'lr': 0.0003869717113043073, 'samples': 9347520, 'steps': 48684, 'loss/train': 1.5891711711883545} -11/07/2021 04:05:58 - INFO - __main__ - Step 48686: {'lr': 0.00038696727190345347, 'samples': 9347712, 'steps': 48685, 'loss/train': 1.3345023393630981} -11/07/2021 04:05:58 - INFO - __main__ - Step 48687: {'lr': 0.00038696283244088426, 'samples': 9347904, 'steps': 48686, 'loss/train': 1.5201863050460815} -11/07/2021 04:05:59 - INFO - __main__ - Step 48688: {'lr': 0.0003869583929166017, 'samples': 9348096, 'steps': 48687, 'loss/train': 1.3590421676635742} -11/07/2021 04:05:59 - INFO - __main__ - Step 48689: {'lr': 0.0003869539533306079, 'samples': 9348288, 'steps': 48688, 'loss/train': 1.1935977935791016} -11/07/2021 04:06:00 - INFO - __main__ - Step 48690: {'lr': 0.00038694951368290463, 'samples': 9348480, 'steps': 48689, 'loss/train': 1.6029000282287598} -11/07/2021 04:06:00 - INFO - __main__ - Step 48691: {'lr': 0.0003869450739734941, 'samples': 9348672, 'steps': 48690, 'loss/train': 1.3300920724868774} -11/07/2021 04:06:01 - INFO - __main__ - Step 48692: {'lr': 0.00038694063420237823, 'samples': 9348864, 'steps': 48691, 'loss/train': 0.9210855960845947} -11/07/2021 04:06:01 - INFO - __main__ - Step 48693: {'lr': 0.00038693619436955907, 'samples': 9349056, 'steps': 48692, 'loss/train': 1.2502361536026} -11/07/2021 04:06:01 - INFO - __main__ - Step 48694: {'lr': 0.0003869317544750385, 'samples': 9349248, 'steps': 48693, 'loss/train': 1.711861252784729} -11/07/2021 04:06:02 - INFO - __main__ - Step 48695: {'lr': 0.0003869273145188186, 'samples': 9349440, 'steps': 48694, 'loss/train': 1.7460613250732422} -11/07/2021 04:06:03 - INFO - __main__ - Step 48696: {'lr': 0.00038692287450090143, 'samples': 9349632, 'steps': 48695, 'loss/train': 1.3120661973953247} -11/07/2021 04:06:03 - INFO - __main__ - Step 48697: {'lr': 0.0003869184344212888, 'samples': 9349824, 'steps': 48696, 'loss/train': 1.6759048700332642} -11/07/2021 04:06:03 - INFO - __main__ - Step 48698: {'lr': 0.00038691399427998296, 'samples': 9350016, 'steps': 48697, 'loss/train': 1.2368032932281494} -11/07/2021 04:06:04 - INFO - __main__ - Step 48699: {'lr': 0.0003869095540769858, 'samples': 9350208, 'steps': 48698, 'loss/train': 1.4147051572799683} -11/07/2021 04:06:04 - INFO - __main__ - Step 48700: {'lr': 0.0003869051138122992, 'samples': 9350400, 'steps': 48699, 'loss/train': 1.457667350769043} -11/07/2021 04:06:05 - INFO - __main__ - Step 48701: {'lr': 0.0003869006734859253, 'samples': 9350592, 'steps': 48700, 'loss/train': 1.5897791385650635} -11/07/2021 04:06:06 - INFO - __main__ - Step 48702: {'lr': 0.00038689623309786617, 'samples': 9350784, 'steps': 48701, 'loss/train': 1.6684839725494385} -11/07/2021 04:06:06 - INFO - __main__ - Step 48703: {'lr': 0.00038689179264812356, 'samples': 9350976, 'steps': 48702, 'loss/train': 1.1511362791061401} -11/07/2021 04:06:06 - INFO - __main__ - Step 48704: {'lr': 0.00038688735213669967, 'samples': 9351168, 'steps': 48703, 'loss/train': 1.2333346605300903} -11/07/2021 04:06:07 - INFO - __main__ - Step 48705: {'lr': 0.00038688291156359654, 'samples': 9351360, 'steps': 48704, 'loss/train': 1.3094733953475952} -11/07/2021 04:06:08 - INFO - __main__ - Step 48706: {'lr': 0.000386878470928816, 'samples': 9351552, 'steps': 48705, 'loss/train': 1.6706844568252563} -11/07/2021 04:06:09 - INFO - __main__ - Step 48707: {'lr': 0.0003868740302323601, 'samples': 9351744, 'steps': 48706, 'loss/train': 1.051388144493103} -11/07/2021 04:06:09 - INFO - __main__ - Step 48708: {'lr': 0.00038686958947423096, 'samples': 9351936, 'steps': 48707, 'loss/train': 1.7953312397003174} -11/07/2021 04:06:10 - INFO - __main__ - Step 48709: {'lr': 0.00038686514865443047, 'samples': 9352128, 'steps': 48708, 'loss/train': 1.4169048070907593} -11/07/2021 04:06:10 - INFO - __main__ - Step 48710: {'lr': 0.00038686070777296057, 'samples': 9352320, 'steps': 48709, 'loss/train': 1.9127233028411865} -11/07/2021 04:06:10 - INFO - __main__ - Step 48711: {'lr': 0.00038685626682982347, 'samples': 9352512, 'steps': 48710, 'loss/train': 1.7541173696517944} -11/07/2021 04:06:11 - INFO - __main__ - Step 48712: {'lr': 0.000386851825825021, 'samples': 9352704, 'steps': 48711, 'loss/train': 1.7800002098083496} -11/07/2021 04:06:12 - INFO - __main__ - Step 48713: {'lr': 0.0003868473847585552, 'samples': 9352896, 'steps': 48712, 'loss/train': 0.9547432065010071} -11/07/2021 04:06:12 - INFO - __main__ - Step 48714: {'lr': 0.00038684294363042806, 'samples': 9353088, 'steps': 48713, 'loss/train': 1.3911314010620117} -11/07/2021 04:06:12 - INFO - __main__ - Step 48715: {'lr': 0.00038683850244064164, 'samples': 9353280, 'steps': 48714, 'loss/train': 1.717429280281067} -11/07/2021 04:06:13 - INFO - __main__ - Step 48716: {'lr': 0.0003868340611891978, 'samples': 9353472, 'steps': 48715, 'loss/train': 0.7260299324989319} -11/07/2021 04:06:13 - INFO - __main__ - Step 48717: {'lr': 0.0003868296198760988, 'samples': 9353664, 'steps': 48716, 'loss/train': 1.784231185913086} -11/07/2021 04:06:14 - INFO - __main__ - Step 48718: {'lr': 0.00038682517850134634, 'samples': 9353856, 'steps': 48717, 'loss/train': 1.1612917184829712} -11/07/2021 04:06:14 - INFO - __main__ - Step 48719: {'lr': 0.0003868207370649427, 'samples': 9354048, 'steps': 48718, 'loss/train': 1.3193871974945068} -11/07/2021 04:06:15 - INFO - __main__ - Step 48720: {'lr': 0.0003868162955668897, 'samples': 9354240, 'steps': 48719, 'loss/train': 1.63193678855896} -11/07/2021 04:06:15 - INFO - __main__ - Step 48721: {'lr': 0.0003868118540071894, 'samples': 9354432, 'steps': 48720, 'loss/train': 1.3199032545089722} -11/07/2021 04:06:16 - INFO - __main__ - Step 48722: {'lr': 0.0003868074123858437, 'samples': 9354624, 'steps': 48721, 'loss/train': 1.2110531330108643} -11/07/2021 04:06:17 - INFO - __main__ - Step 48723: {'lr': 0.0003868029707028548, 'samples': 9354816, 'steps': 48722, 'loss/train': 1.7190054655075073} -11/07/2021 04:06:17 - INFO - __main__ - Step 48724: {'lr': 0.00038679852895822454, 'samples': 9355008, 'steps': 48723, 'loss/train': 1.5598641633987427} -11/07/2021 04:06:17 - INFO - __main__ - Step 48725: {'lr': 0.000386794087151955, 'samples': 9355200, 'steps': 48724, 'loss/train': 1.8229436874389648} -11/07/2021 04:06:18 - INFO - __main__ - Step 48726: {'lr': 0.00038678964528404816, 'samples': 9355392, 'steps': 48725, 'loss/train': 1.6857901811599731} -11/07/2021 04:06:18 - INFO - __main__ - Step 48727: {'lr': 0.000386785203354506, 'samples': 9355584, 'steps': 48726, 'loss/train': 1.457085132598877} -11/07/2021 04:06:18 - INFO - __main__ - Step 48728: {'lr': 0.0003867807613633305, 'samples': 9355776, 'steps': 48727, 'loss/train': 1.4536830186843872} -11/07/2021 04:06:19 - INFO - __main__ - Step 48729: {'lr': 0.0003867763193105237, 'samples': 9355968, 'steps': 48728, 'loss/train': 1.7361259460449219} -11/07/2021 04:06:20 - INFO - __main__ - Step 48730: {'lr': 0.00038677187719608763, 'samples': 9356160, 'steps': 48729, 'loss/train': 1.7625551223754883} -11/07/2021 04:06:20 - INFO - __main__ - Step 48731: {'lr': 0.00038676743502002434, 'samples': 9356352, 'steps': 48730, 'loss/train': 1.319649338722229} -11/07/2021 04:06:20 - INFO - __main__ - Step 48732: {'lr': 0.0003867629927823357, 'samples': 9356544, 'steps': 48731, 'loss/train': 1.083548665046692} -11/07/2021 04:06:21 - INFO - __main__ - Step 48733: {'lr': 0.0003867585504830237, 'samples': 9356736, 'steps': 48732, 'loss/train': 1.518478512763977} -11/07/2021 04:06:22 - INFO - __main__ - Step 48734: {'lr': 0.00038675410812209044, 'samples': 9356928, 'steps': 48733, 'loss/train': 1.7668431997299194} -11/07/2021 04:06:22 - INFO - __main__ - Step 48735: {'lr': 0.0003867496656995379, 'samples': 9357120, 'steps': 48734, 'loss/train': 1.438031554222107} -11/07/2021 04:06:22 - INFO - __main__ - Step 48736: {'lr': 0.0003867452232153681, 'samples': 9357312, 'steps': 48735, 'loss/train': 1.722999095916748} -11/07/2021 04:06:23 - INFO - __main__ - Step 48737: {'lr': 0.00038674078066958296, 'samples': 9357504, 'steps': 48736, 'loss/train': 1.2756949663162231} -11/07/2021 04:06:23 - INFO - __main__ - Step 48738: {'lr': 0.0003867363380621846, 'samples': 9357696, 'steps': 48737, 'loss/train': 0.6910433173179626} -11/07/2021 04:06:24 - INFO - __main__ - Step 48739: {'lr': 0.0003867318953931749, 'samples': 9357888, 'steps': 48738, 'loss/train': 1.8019530773162842} -11/07/2021 04:06:25 - INFO - __main__ - Step 48740: {'lr': 0.00038672745266255594, 'samples': 9358080, 'steps': 48739, 'loss/train': 1.5454462766647339} -11/07/2021 04:06:25 - INFO - __main__ - Step 48741: {'lr': 0.0003867230098703297, 'samples': 9358272, 'steps': 48740, 'loss/train': 1.5047858953475952} -11/07/2021 04:06:25 - INFO - __main__ - Step 48742: {'lr': 0.00038671856701649813, 'samples': 9358464, 'steps': 48741, 'loss/train': 1.7610464096069336} -11/07/2021 04:06:26 - INFO - __main__ - Step 48743: {'lr': 0.0003867141241010633, 'samples': 9358656, 'steps': 48742, 'loss/train': 1.0106375217437744} -11/07/2021 04:06:27 - INFO - __main__ - Step 48744: {'lr': 0.00038670968112402724, 'samples': 9358848, 'steps': 48743, 'loss/train': 2.2555599212646484} -11/07/2021 04:06:27 - INFO - __main__ - Step 48745: {'lr': 0.00038670523808539194, 'samples': 9359040, 'steps': 48744, 'loss/train': 1.3200651407241821} -11/07/2021 04:06:27 - INFO - __main__ - Step 48746: {'lr': 0.0003867007949851593, 'samples': 9359232, 'steps': 48745, 'loss/train': 1.2698509693145752} -11/07/2021 04:06:28 - INFO - __main__ - Step 48747: {'lr': 0.0003866963518233314, 'samples': 9359424, 'steps': 48746, 'loss/train': 1.5615946054458618} -11/07/2021 04:06:28 - INFO - __main__ - Step 48748: {'lr': 0.00038669190859991025, 'samples': 9359616, 'steps': 48747, 'loss/train': 1.2709089517593384} -11/07/2021 04:06:29 - INFO - __main__ - Step 48749: {'lr': 0.00038668746531489787, 'samples': 9359808, 'steps': 48748, 'loss/train': 1.6371272802352905} -11/07/2021 04:06:29 - INFO - __main__ - Step 48750: {'lr': 0.0003866830219682962, 'samples': 9360000, 'steps': 48749, 'loss/train': 1.6976897716522217} -11/07/2021 04:06:30 - INFO - __main__ - Step 48751: {'lr': 0.00038667857856010727, 'samples': 9360192, 'steps': 48750, 'loss/train': 1.5372999906539917} -11/07/2021 04:06:30 - INFO - __main__ - Step 48752: {'lr': 0.00038667413509033306, 'samples': 9360384, 'steps': 48751, 'loss/train': 1.2858636379241943} -11/07/2021 04:06:30 - INFO - __main__ - Step 48753: {'lr': 0.0003866696915589756, 'samples': 9360576, 'steps': 48752, 'loss/train': 1.4410368204116821} -11/07/2021 04:06:32 - INFO - __main__ - Step 48754: {'lr': 0.0003866652479660369, 'samples': 9360768, 'steps': 48753, 'loss/train': 1.517182469367981} -11/07/2021 04:06:32 - INFO - __main__ - Step 48755: {'lr': 0.00038666080431151896, 'samples': 9360960, 'steps': 48754, 'loss/train': 1.2897025346755981} -11/07/2021 04:06:32 - INFO - __main__ - Step 48756: {'lr': 0.00038665636059542367, 'samples': 9361152, 'steps': 48755, 'loss/train': 1.6465325355529785} -11/07/2021 04:06:33 - INFO - __main__ - Step 48757: {'lr': 0.00038665191681775323, 'samples': 9361344, 'steps': 48756, 'loss/train': 1.4895535707473755} -11/07/2021 04:06:33 - INFO - __main__ - Step 48758: {'lr': 0.00038664747297850955, 'samples': 9361536, 'steps': 48757, 'loss/train': 1.6872446537017822} -11/07/2021 04:06:34 - INFO - __main__ - Step 48759: {'lr': 0.00038664302907769456, 'samples': 9361728, 'steps': 48758, 'loss/train': 1.286729335784912} -11/07/2021 04:06:34 - INFO - __main__ - Step 48760: {'lr': 0.00038663858511531034, 'samples': 9361920, 'steps': 48759, 'loss/train': 1.6060450077056885} -11/07/2021 04:06:35 - INFO - __main__ - Step 48761: {'lr': 0.000386634141091359, 'samples': 9362112, 'steps': 48760, 'loss/train': 1.1402372121810913} -11/07/2021 04:06:35 - INFO - __main__ - Step 48762: {'lr': 0.0003866296970058423, 'samples': 9362304, 'steps': 48761, 'loss/train': 1.502384901046753} -11/07/2021 04:06:35 - INFO - __main__ - Step 48763: {'lr': 0.0003866252528587624, 'samples': 9362496, 'steps': 48762, 'loss/train': 1.5161304473876953} -11/07/2021 04:06:37 - INFO - __main__ - Step 48764: {'lr': 0.00038662080865012127, 'samples': 9362688, 'steps': 48763, 'loss/train': 1.6916911602020264} -11/07/2021 04:06:37 - INFO - __main__ - Step 48765: {'lr': 0.00038661636437992093, 'samples': 9362880, 'steps': 48764, 'loss/train': 1.4508171081542969} -11/07/2021 04:06:37 - INFO - __main__ - Step 48766: {'lr': 0.0003866119200481634, 'samples': 9363072, 'steps': 48765, 'loss/train': 1.3959133625030518} -11/07/2021 04:06:38 - INFO - __main__ - Step 48767: {'lr': 0.00038660747565485054, 'samples': 9363264, 'steps': 48766, 'loss/train': 1.5454134941101074} -11/07/2021 04:06:38 - INFO - __main__ - Step 48768: {'lr': 0.0003866030311999845, 'samples': 9363456, 'steps': 48767, 'loss/train': 1.689577579498291} -11/07/2021 04:06:39 - INFO - __main__ - Step 48769: {'lr': 0.0003865985866835673, 'samples': 9363648, 'steps': 48768, 'loss/train': 1.476892113685608} -11/07/2021 04:06:39 - INFO - __main__ - Step 48770: {'lr': 0.00038659414210560087, 'samples': 9363840, 'steps': 48769, 'loss/train': 1.6476308107376099} -11/07/2021 04:06:40 - INFO - __main__ - Step 48771: {'lr': 0.00038658969746608717, 'samples': 9364032, 'steps': 48770, 'loss/train': 1.1548690795898438} -11/07/2021 04:06:40 - INFO - __main__ - Step 48772: {'lr': 0.0003865852527650283, 'samples': 9364224, 'steps': 48771, 'loss/train': 0.3828035891056061} -11/07/2021 04:06:40 - INFO - __main__ - Step 48773: {'lr': 0.0003865808080024262, 'samples': 9364416, 'steps': 48772, 'loss/train': 1.2640275955200195} -11/07/2021 04:06:41 - INFO - __main__ - Step 48774: {'lr': 0.00038657636317828293, 'samples': 9364608, 'steps': 48773, 'loss/train': 1.4242490530014038} -11/07/2021 04:06:42 - INFO - __main__ - Step 48775: {'lr': 0.00038657191829260043, 'samples': 9364800, 'steps': 48774, 'loss/train': 1.7121540307998657} -11/07/2021 04:06:42 - INFO - __main__ - Step 48776: {'lr': 0.00038656747334538073, 'samples': 9364992, 'steps': 48775, 'loss/train': 1.2917346954345703} -11/07/2021 04:06:42 - INFO - __main__ - Step 48777: {'lr': 0.00038656302833662583, 'samples': 9365184, 'steps': 48776, 'loss/train': 2.1382129192352295} -11/07/2021 04:06:43 - INFO - __main__ - Step 48778: {'lr': 0.00038655858326633774, 'samples': 9365376, 'steps': 48777, 'loss/train': 1.293482780456543} -11/07/2021 04:06:43 - INFO - __main__ - Step 48779: {'lr': 0.0003865541381345185, 'samples': 9365568, 'steps': 48778, 'loss/train': 0.16194438934326172} -11/07/2021 04:06:45 - INFO - __main__ - Step 48780: {'lr': 0.00038654969294117, 'samples': 9365760, 'steps': 48779, 'loss/train': 0.9568668007850647} -11/07/2021 04:06:45 - INFO - __main__ - Step 48781: {'lr': 0.0003865452476862944, 'samples': 9365952, 'steps': 48780, 'loss/train': 1.5685209035873413} -11/07/2021 04:06:45 - INFO - __main__ - Step 48782: {'lr': 0.0003865408023698935, 'samples': 9366144, 'steps': 48781, 'loss/train': 1.5595369338989258} -11/07/2021 04:06:46 - INFO - __main__ - Step 48783: {'lr': 0.00038653635699196956, 'samples': 9366336, 'steps': 48782, 'loss/train': 1.7438932657241821} -11/07/2021 04:06:46 - INFO - __main__ - Step 48784: {'lr': 0.0003865319115525244, 'samples': 9366528, 'steps': 48783, 'loss/train': 1.029396414756775} -11/07/2021 04:06:46 - INFO - __main__ - Step 48785: {'lr': 0.00038652746605156, 'samples': 9366720, 'steps': 48784, 'loss/train': 1.8966786861419678} -11/07/2021 04:06:47 - INFO - __main__ - Step 48786: {'lr': 0.0003865230204890785, 'samples': 9366912, 'steps': 48785, 'loss/train': 1.8196535110473633} -11/07/2021 04:06:48 - INFO - __main__ - Step 48787: {'lr': 0.0003865185748650818, 'samples': 9367104, 'steps': 48786, 'loss/train': 1.0815938711166382} -11/07/2021 04:06:48 - INFO - __main__ - Step 48788: {'lr': 0.00038651412917957195, 'samples': 9367296, 'steps': 48787, 'loss/train': 1.6344361305236816} -11/07/2021 04:06:48 - INFO - __main__ - Step 48789: {'lr': 0.000386509683432551, 'samples': 9367488, 'steps': 48788, 'loss/train': 1.7716069221496582} -11/07/2021 04:06:49 - INFO - __main__ - Step 48790: {'lr': 0.0003865052376240208, 'samples': 9367680, 'steps': 48789, 'loss/train': 1.2671294212341309} -11/07/2021 04:06:50 - INFO - __main__ - Step 48791: {'lr': 0.00038650079175398346, 'samples': 9367872, 'steps': 48790, 'loss/train': 1.7354562282562256} -11/07/2021 04:06:50 - INFO - __main__ - Step 48792: {'lr': 0.00038649634582244095, 'samples': 9368064, 'steps': 48791, 'loss/train': 1.3500326871871948} -11/07/2021 04:06:50 - INFO - __main__ - Step 48793: {'lr': 0.0003864918998293954, 'samples': 9368256, 'steps': 48792, 'loss/train': 1.6196799278259277} -11/07/2021 04:06:51 - INFO - __main__ - Step 48794: {'lr': 0.0003864874537748486, 'samples': 9368448, 'steps': 48793, 'loss/train': 1.5681240558624268} -11/07/2021 04:06:51 - INFO - __main__ - Step 48795: {'lr': 0.00038648300765880276, 'samples': 9368640, 'steps': 48794, 'loss/train': 1.248744249343872} -11/07/2021 04:06:52 - INFO - __main__ - Step 48796: {'lr': 0.0003864785614812597, 'samples': 9368832, 'steps': 48795, 'loss/train': 1.4846022129058838} -11/07/2021 04:06:53 - INFO - __main__ - Step 48797: {'lr': 0.00038647411524222146, 'samples': 9369024, 'steps': 48796, 'loss/train': 1.6658082008361816} -11/07/2021 04:06:53 - INFO - __main__ - Step 48798: {'lr': 0.00038646966894169014, 'samples': 9369216, 'steps': 48797, 'loss/train': 1.4880821704864502} -11/07/2021 04:06:53 - INFO - __main__ - Step 48799: {'lr': 0.00038646522257966776, 'samples': 9369408, 'steps': 48798, 'loss/train': 1.0046395063400269} -11/07/2021 04:06:54 - INFO - __main__ - Step 48800: {'lr': 0.0003864607761561562, 'samples': 9369600, 'steps': 48799, 'loss/train': 1.652105689048767} -11/07/2021 04:06:56 - INFO - __main__ - Step 48801: {'lr': 0.00038645632967115753, 'samples': 9369792, 'steps': 48800, 'loss/train': 1.5499067306518555} -11/07/2021 04:06:56 - INFO - __main__ - Step 48802: {'lr': 0.0003864518831246737, 'samples': 9369984, 'steps': 48801, 'loss/train': 1.5321955680847168} -11/07/2021 04:06:56 - INFO - __main__ - Step 48803: {'lr': 0.00038644743651670684, 'samples': 9370176, 'steps': 48802, 'loss/train': 1.5658891201019287} -11/07/2021 04:06:57 - INFO - __main__ - Step 48804: {'lr': 0.00038644298984725876, 'samples': 9370368, 'steps': 48803, 'loss/train': 1.4779611825942993} -11/07/2021 04:06:57 - INFO - __main__ - Step 48805: {'lr': 0.00038643854311633166, 'samples': 9370560, 'steps': 48804, 'loss/train': 1.4240643978118896} -11/07/2021 04:06:57 - INFO - __main__ - Step 48806: {'lr': 0.0003864340963239275, 'samples': 9370752, 'steps': 48805, 'loss/train': 1.3121813535690308} -11/07/2021 04:06:58 - INFO - __main__ - Step 48807: {'lr': 0.00038642964947004815, 'samples': 9370944, 'steps': 48806, 'loss/train': 0.7261683344841003} -11/07/2021 04:06:59 - INFO - __main__ - Step 48808: {'lr': 0.0003864252025546957, 'samples': 9371136, 'steps': 48807, 'loss/train': 0.8198906183242798} -11/07/2021 04:06:59 - INFO - __main__ - Step 48809: {'lr': 0.00038642075557787225, 'samples': 9371328, 'steps': 48808, 'loss/train': 1.670855164527893} -11/07/2021 04:07:00 - INFO - __main__ - Step 48810: {'lr': 0.0003864163085395797, 'samples': 9371520, 'steps': 48809, 'loss/train': 1.4442169666290283} -11/07/2021 04:07:00 - INFO - __main__ - Step 48811: {'lr': 0.00038641186143982, 'samples': 9371712, 'steps': 48810, 'loss/train': 1.5569305419921875} -11/07/2021 04:07:00 - INFO - __main__ - Step 48812: {'lr': 0.0003864074142785952, 'samples': 9371904, 'steps': 48811, 'loss/train': 1.8886054754257202} -11/07/2021 04:07:01 - INFO - __main__ - Step 48813: {'lr': 0.0003864029670559074, 'samples': 9372096, 'steps': 48812, 'loss/train': 0.931264340877533} -11/07/2021 04:07:02 - INFO - __main__ - Step 48814: {'lr': 0.0003863985197717585, 'samples': 9372288, 'steps': 48813, 'loss/train': 0.7957919239997864} -11/07/2021 04:07:02 - INFO - __main__ - Step 48815: {'lr': 0.0003863940724261505, 'samples': 9372480, 'steps': 48814, 'loss/train': 1.1304203271865845} -11/07/2021 04:07:02 - INFO - __main__ - Step 48816: {'lr': 0.0003863896250190855, 'samples': 9372672, 'steps': 48815, 'loss/train': 1.3601429462432861} -11/07/2021 04:07:03 - INFO - __main__ - Step 48817: {'lr': 0.00038638517755056534, 'samples': 9372864, 'steps': 48816, 'loss/train': 1.6283661127090454} -11/07/2021 04:07:03 - INFO - __main__ - Step 48818: {'lr': 0.00038638073002059223, 'samples': 9373056, 'steps': 48817, 'loss/train': 1.3443467617034912} -11/07/2021 04:07:04 - INFO - __main__ - Step 48819: {'lr': 0.000386376282429168, 'samples': 9373248, 'steps': 48818, 'loss/train': 0.7243291139602661} -11/07/2021 04:07:04 - INFO - __main__ - Step 48820: {'lr': 0.0003863718347762948, 'samples': 9373440, 'steps': 48819, 'loss/train': 1.125797152519226} -11/07/2021 04:07:05 - INFO - __main__ - Step 48821: {'lr': 0.0003863673870619744, 'samples': 9373632, 'steps': 48820, 'loss/train': 1.2432880401611328} -11/07/2021 04:07:05 - INFO - __main__ - Step 48822: {'lr': 0.00038636293928620915, 'samples': 9373824, 'steps': 48821, 'loss/train': 1.2100565433502197} -11/07/2021 04:07:05 - INFO - __main__ - Step 48823: {'lr': 0.0003863584914490007, 'samples': 9374016, 'steps': 48822, 'loss/train': 1.6470533609390259} -11/07/2021 04:07:07 - INFO - __main__ - Step 48824: {'lr': 0.0003863540435503513, 'samples': 9374208, 'steps': 48823, 'loss/train': 0.5824220180511475} -11/07/2021 04:07:07 - INFO - __main__ - Step 48825: {'lr': 0.0003863495955902629, 'samples': 9374400, 'steps': 48824, 'loss/train': 1.147403597831726} -11/07/2021 04:07:08 - INFO - __main__ - Step 48826: {'lr': 0.00038634514756873746, 'samples': 9374592, 'steps': 48825, 'loss/train': 1.6314716339111328} -11/07/2021 04:07:08 - INFO - __main__ - Step 48827: {'lr': 0.000386340699485777, 'samples': 9374784, 'steps': 48826, 'loss/train': 0.47161123156547546} -11/07/2021 04:07:08 - INFO - __main__ - Step 48828: {'lr': 0.0003863362513413835, 'samples': 9374976, 'steps': 48827, 'loss/train': 1.3701505661010742} -11/07/2021 04:07:09 - INFO - __main__ - Step 48829: {'lr': 0.00038633180313555894, 'samples': 9375168, 'steps': 48828, 'loss/train': 0.1184760332107544} -11/07/2021 04:07:10 - INFO - __main__ - Step 48830: {'lr': 0.0003863273548683054, 'samples': 9375360, 'steps': 48829, 'loss/train': 1.616905927658081} -11/07/2021 04:07:10 - INFO - __main__ - Step 48831: {'lr': 0.0003863229065396249, 'samples': 9375552, 'steps': 48830, 'loss/train': 1.8326122760772705} -11/07/2021 04:07:10 - INFO - __main__ - Step 48832: {'lr': 0.0003863184581495194, 'samples': 9375744, 'steps': 48831, 'loss/train': 1.295698642730713} -11/07/2021 04:07:11 - INFO - __main__ - Step 48833: {'lr': 0.0003863140096979909, 'samples': 9375936, 'steps': 48832, 'loss/train': 1.1749823093414307} -11/07/2021 04:07:12 - INFO - __main__ - Step 48834: {'lr': 0.00038630956118504146, 'samples': 9376128, 'steps': 48833, 'loss/train': 1.8343381881713867} -11/07/2021 04:07:12 - INFO - __main__ - Step 48835: {'lr': 0.00038630511261067294, 'samples': 9376320, 'steps': 48834, 'loss/train': 1.4257701635360718} -11/07/2021 04:07:13 - INFO - __main__ - Step 48836: {'lr': 0.0003863006639748875, 'samples': 9376512, 'steps': 48835, 'loss/train': 1.5344891548156738} -11/07/2021 04:07:13 - INFO - __main__ - Step 48837: {'lr': 0.000386296215277687, 'samples': 9376704, 'steps': 48836, 'loss/train': 0.5804466605186462} -11/07/2021 04:07:13 - INFO - __main__ - Step 48838: {'lr': 0.0003862917665190736, 'samples': 9376896, 'steps': 48837, 'loss/train': 1.2600109577178955} -11/07/2021 04:07:14 - INFO - __main__ - Step 48839: {'lr': 0.0003862873176990492, 'samples': 9377088, 'steps': 48838, 'loss/train': 1.8333112001419067} -11/07/2021 04:07:15 - INFO - __main__ - Step 48840: {'lr': 0.00038628286881761594, 'samples': 9377280, 'steps': 48839, 'loss/train': 1.3519837856292725} -11/07/2021 04:07:15 - INFO - __main__ - Step 48841: {'lr': 0.0003862784198747756, 'samples': 9377472, 'steps': 48840, 'loss/train': 0.9140884280204773} -11/07/2021 04:07:15 - INFO - __main__ - Step 48842: {'lr': 0.0003862739708705304, 'samples': 9377664, 'steps': 48841, 'loss/train': 1.6649800539016724} -11/07/2021 04:07:16 - INFO - __main__ - Step 48843: {'lr': 0.0003862695218048822, 'samples': 9377856, 'steps': 48842, 'loss/train': 1.3832347393035889} -11/07/2021 04:07:16 - INFO - __main__ - Step 48844: {'lr': 0.000386265072677833, 'samples': 9378048, 'steps': 48843, 'loss/train': 1.4973256587982178} -11/07/2021 04:07:17 - INFO - __main__ - Step 48845: {'lr': 0.00038626062348938494, 'samples': 9378240, 'steps': 48844, 'loss/train': 1.8129611015319824} -11/07/2021 04:07:18 - INFO - __main__ - Step 48846: {'lr': 0.00038625617423954, 'samples': 9378432, 'steps': 48845, 'loss/train': 1.4013532400131226} -11/07/2021 04:07:18 - INFO - __main__ - Step 48847: {'lr': 0.00038625172492829995, 'samples': 9378624, 'steps': 48846, 'loss/train': 1.7761856317520142} -11/07/2021 04:07:18 - INFO - __main__ - Step 48848: {'lr': 0.00038624727555566714, 'samples': 9378816, 'steps': 48847, 'loss/train': 2.2022461891174316} -11/07/2021 04:07:19 - INFO - __main__ - Step 48849: {'lr': 0.0003862428261216433, 'samples': 9379008, 'steps': 48848, 'loss/train': 1.5194182395935059} -11/07/2021 04:07:20 - INFO - __main__ - Step 48850: {'lr': 0.00038623837662623065, 'samples': 9379200, 'steps': 48849, 'loss/train': 1.8473443984985352} -11/07/2021 04:07:20 - INFO - __main__ - Step 48851: {'lr': 0.000386233927069431, 'samples': 9379392, 'steps': 48850, 'loss/train': 1.5626877546310425} -11/07/2021 04:07:20 - INFO - __main__ - Step 48852: {'lr': 0.0003862294774512465, 'samples': 9379584, 'steps': 48851, 'loss/train': 1.4937726259231567} -11/07/2021 04:07:21 - INFO - __main__ - Step 48853: {'lr': 0.00038622502777167913, 'samples': 9379776, 'steps': 48852, 'loss/train': 1.0545097589492798} -11/07/2021 04:07:21 - INFO - __main__ - Step 48854: {'lr': 0.00038622057803073075, 'samples': 9379968, 'steps': 48853, 'loss/train': 1.2151628732681274} -11/07/2021 04:07:21 - INFO - __main__ - Step 48855: {'lr': 0.0003862161282284036, 'samples': 9380160, 'steps': 48854, 'loss/train': 1.763312816619873} -11/07/2021 04:07:22 - INFO - __main__ - Step 48856: {'lr': 0.00038621167836469945, 'samples': 9380352, 'steps': 48855, 'loss/train': 1.5793697834014893} -11/07/2021 04:07:23 - INFO - __main__ - Step 48857: {'lr': 0.0003862072284396205, 'samples': 9380544, 'steps': 48856, 'loss/train': 1.4016894102096558} -11/07/2021 04:07:23 - INFO - __main__ - Step 48858: {'lr': 0.00038620277845316867, 'samples': 9380736, 'steps': 48857, 'loss/train': 1.4486711025238037} -11/07/2021 04:07:23 - INFO - __main__ - Step 48859: {'lr': 0.00038619832840534586, 'samples': 9380928, 'steps': 48858, 'loss/train': 0.8741102814674377} -11/07/2021 04:07:24 - INFO - __main__ - Step 48860: {'lr': 0.0003861938782961544, 'samples': 9381120, 'steps': 48859, 'loss/train': 1.3810038566589355} -11/07/2021 04:07:25 - INFO - __main__ - Step 48861: {'lr': 0.0003861894281255959, 'samples': 9381312, 'steps': 48860, 'loss/train': 1.1368257999420166} -11/07/2021 04:07:25 - INFO - __main__ - Step 48862: {'lr': 0.0003861849778936726, 'samples': 9381504, 'steps': 48861, 'loss/train': 1.2794278860092163} -11/07/2021 04:07:26 - INFO - __main__ - Step 48863: {'lr': 0.00038618052760038647, 'samples': 9381696, 'steps': 48862, 'loss/train': 1.540213942527771} -11/07/2021 04:07:26 - INFO - __main__ - Step 48864: {'lr': 0.00038617607724573944, 'samples': 9381888, 'steps': 48863, 'loss/train': 1.45363187789917} -11/07/2021 04:07:26 - INFO - __main__ - Step 48865: {'lr': 0.0003861716268297336, 'samples': 9382080, 'steps': 48864, 'loss/train': 0.20641732215881348} -11/07/2021 04:07:27 - INFO - __main__ - Step 48866: {'lr': 0.000386167176352371, 'samples': 9382272, 'steps': 48865, 'loss/train': 2.019467830657959} -11/07/2021 04:07:28 - INFO - __main__ - Step 48867: {'lr': 0.00038616272581365354, 'samples': 9382464, 'steps': 48866, 'loss/train': 1.715158462524414} -11/07/2021 04:07:28 - INFO - __main__ - Step 48868: {'lr': 0.00038615827521358315, 'samples': 9382656, 'steps': 48867, 'loss/train': 1.4227601289749146} -11/07/2021 04:07:28 - INFO - __main__ - Step 48869: {'lr': 0.00038615382455216204, 'samples': 9382848, 'steps': 48868, 'loss/train': 3.3128716945648193} -11/07/2021 04:07:29 - INFO - __main__ - Step 48870: {'lr': 0.0003861493738293921, 'samples': 9383040, 'steps': 48869, 'loss/train': 1.4049416780471802} -11/07/2021 04:07:30 - INFO - __main__ - Step 48871: {'lr': 0.0003861449230452753, 'samples': 9383232, 'steps': 48870, 'loss/train': 1.6238514184951782} -11/07/2021 04:07:30 - INFO - __main__ - Step 48872: {'lr': 0.00038614047219981374, 'samples': 9383424, 'steps': 48871, 'loss/train': 1.6514708995819092} -11/07/2021 04:07:31 - INFO - __main__ - Step 48873: {'lr': 0.0003861360212930094, 'samples': 9383616, 'steps': 48872, 'loss/train': 1.457114338874817} -11/07/2021 04:07:31 - INFO - __main__ - Step 48874: {'lr': 0.0003861315703248643, 'samples': 9383808, 'steps': 48873, 'loss/train': 2.123868703842163} -11/07/2021 04:07:31 - INFO - __main__ - Step 48875: {'lr': 0.0003861271192953804, 'samples': 9384000, 'steps': 48874, 'loss/train': 1.9054794311523438} -11/07/2021 04:07:32 - INFO - __main__ - Step 48876: {'lr': 0.00038612266820455964, 'samples': 9384192, 'steps': 48875, 'loss/train': 1.4032111167907715} -11/07/2021 04:07:33 - INFO - __main__ - Step 48877: {'lr': 0.0003861182170524041, 'samples': 9384384, 'steps': 48876, 'loss/train': 1.3080118894577026} -11/07/2021 04:07:33 - INFO - __main__ - Step 48878: {'lr': 0.0003861137658389159, 'samples': 9384576, 'steps': 48877, 'loss/train': 1.5100162029266357} -11/07/2021 04:07:33 - INFO - __main__ - Step 48879: {'lr': 0.0003861093145640969, 'samples': 9384768, 'steps': 48878, 'loss/train': 1.6183574199676514} -11/07/2021 04:07:34 - INFO - __main__ - Step 48880: {'lr': 0.00038610486322794915, 'samples': 9384960, 'steps': 48879, 'loss/train': 1.8066436052322388} -11/07/2021 04:07:34 - INFO - __main__ - Step 48881: {'lr': 0.0003861004118304746, 'samples': 9385152, 'steps': 48880, 'loss/train': 1.4952269792556763} -11/07/2021 04:07:35 - INFO - __main__ - Step 48882: {'lr': 0.0003860959603716754, 'samples': 9385344, 'steps': 48881, 'loss/train': 0.9843176603317261} -11/07/2021 04:07:35 - INFO - __main__ - Step 48883: {'lr': 0.00038609150885155337, 'samples': 9385536, 'steps': 48882, 'loss/train': 1.4871866703033447} -11/07/2021 04:07:36 - INFO - __main__ - Step 48884: {'lr': 0.0003860870572701106, 'samples': 9385728, 'steps': 48883, 'loss/train': 1.55475914478302} -11/07/2021 04:07:36 - INFO - __main__ - Step 48885: {'lr': 0.0003860826056273492, 'samples': 9385920, 'steps': 48884, 'loss/train': 1.460806131362915} -11/07/2021 04:07:36 - INFO - __main__ - Step 48886: {'lr': 0.0003860781539232709, 'samples': 9386112, 'steps': 48885, 'loss/train': 5.611880302429199} -11/07/2021 04:07:38 - INFO - __main__ - Step 48887: {'lr': 0.0003860737021578781, 'samples': 9386304, 'steps': 48886, 'loss/train': 1.2217185497283936} -11/07/2021 04:07:38 - INFO - __main__ - Step 48888: {'lr': 0.00038606925033117246, 'samples': 9386496, 'steps': 48887, 'loss/train': 1.5372991561889648} -11/07/2021 04:07:38 - INFO - __main__ - Step 48889: {'lr': 0.00038606479844315614, 'samples': 9386688, 'steps': 48888, 'loss/train': 1.4254859685897827} -11/07/2021 04:07:39 - INFO - __main__ - Step 48890: {'lr': 0.00038606034649383116, 'samples': 9386880, 'steps': 48889, 'loss/train': 1.2352256774902344} -11/07/2021 04:07:39 - INFO - __main__ - Step 48891: {'lr': 0.0003860558944831994, 'samples': 9387072, 'steps': 48890, 'loss/train': 0.6035268902778625} -11/07/2021 04:07:39 - INFO - __main__ - Step 48892: {'lr': 0.000386051442411263, 'samples': 9387264, 'steps': 48891, 'loss/train': 1.3484644889831543} -11/07/2021 04:07:41 - INFO - __main__ - Step 48893: {'lr': 0.00038604699027802394, 'samples': 9387456, 'steps': 48892, 'loss/train': 1.492655634880066} -11/07/2021 04:07:41 - INFO - __main__ - Step 48894: {'lr': 0.0003860425380834842, 'samples': 9387648, 'steps': 48893, 'loss/train': 1.4083945751190186} -11/07/2021 04:07:41 - INFO - __main__ - Step 48895: {'lr': 0.0003860380858276458, 'samples': 9387840, 'steps': 48894, 'loss/train': 0.21939469873905182} -11/07/2021 04:07:42 - INFO - __main__ - Step 48896: {'lr': 0.0003860336335105107, 'samples': 9388032, 'steps': 48895, 'loss/train': 1.3290843963623047} -11/07/2021 04:07:42 - INFO - __main__ - Step 48897: {'lr': 0.000386029181132081, 'samples': 9388224, 'steps': 48896, 'loss/train': 1.3532027006149292} -11/07/2021 04:07:43 - INFO - __main__ - Step 48898: {'lr': 0.0003860247286923586, 'samples': 9388416, 'steps': 48897, 'loss/train': 1.551863193511963} -11/07/2021 04:07:43 - INFO - __main__ - Step 48899: {'lr': 0.0003860202761913455, 'samples': 9388608, 'steps': 48898, 'loss/train': 1.5765019655227661} -11/07/2021 04:07:44 - INFO - __main__ - Step 48900: {'lr': 0.00038601582362904384, 'samples': 9388800, 'steps': 48899, 'loss/train': 1.5646566152572632} -11/07/2021 04:07:44 - INFO - __main__ - Step 48901: {'lr': 0.0003860113710054556, 'samples': 9388992, 'steps': 48900, 'loss/train': 1.491734266281128} -11/07/2021 04:07:44 - INFO - __main__ - Step 48902: {'lr': 0.00038600691832058265, 'samples': 9389184, 'steps': 48901, 'loss/train': 1.0709919929504395} -11/07/2021 04:07:46 - INFO - __main__ - Step 48903: {'lr': 0.0003860024655744271, 'samples': 9389376, 'steps': 48902, 'loss/train': 0.95680832862854} -11/07/2021 04:07:46 - INFO - __main__ - Step 48904: {'lr': 0.000385998012766991, 'samples': 9389568, 'steps': 48903, 'loss/train': 1.5748766660690308} -11/07/2021 04:07:46 - INFO - __main__ - Step 48905: {'lr': 0.0003859935598982762, 'samples': 9389760, 'steps': 48904, 'loss/train': 1.882698893547058} -11/07/2021 04:07:47 - INFO - __main__ - Step 48906: {'lr': 0.0003859891069682848, 'samples': 9389952, 'steps': 48905, 'loss/train': 1.5582358837127686} -11/07/2021 04:07:47 - INFO - __main__ - Step 48907: {'lr': 0.0003859846539770189, 'samples': 9390144, 'steps': 48906, 'loss/train': 0.37549105286598206} -11/07/2021 04:07:48 - INFO - __main__ - Step 48908: {'lr': 0.0003859802009244804, 'samples': 9390336, 'steps': 48907, 'loss/train': 1.8381954431533813} -11/07/2021 04:07:49 - INFO - __main__ - Step 48909: {'lr': 0.00038597574781067123, 'samples': 9390528, 'steps': 48908, 'loss/train': 1.480832815170288} -11/07/2021 04:07:49 - INFO - __main__ - Step 48910: {'lr': 0.0003859712946355936, 'samples': 9390720, 'steps': 48909, 'loss/train': 0.8164600133895874} -11/07/2021 04:07:49 - INFO - __main__ - Step 48911: {'lr': 0.0003859668413992493, 'samples': 9390912, 'steps': 48910, 'loss/train': 1.281607985496521} -11/07/2021 04:07:50 - INFO - __main__ - Step 48912: {'lr': 0.0003859623881016404, 'samples': 9391104, 'steps': 48911, 'loss/train': 1.6252738237380981} -11/07/2021 04:07:50 - INFO - __main__ - Step 48913: {'lr': 0.000385957934742769, 'samples': 9391296, 'steps': 48912, 'loss/train': 1.3718078136444092} -11/07/2021 04:07:51 - INFO - __main__ - Step 48914: {'lr': 0.0003859534813226372, 'samples': 9391488, 'steps': 48913, 'loss/train': 1.0985984802246094} -11/07/2021 04:07:51 - INFO - __main__ - Step 48915: {'lr': 0.00038594902784124663, 'samples': 9391680, 'steps': 48914, 'loss/train': 1.525246500968933} -11/07/2021 04:07:52 - INFO - __main__ - Step 48916: {'lr': 0.00038594457429859966, 'samples': 9391872, 'steps': 48915, 'loss/train': 1.7037945985794067} -11/07/2021 04:07:52 - INFO - __main__ - Step 48917: {'lr': 0.00038594012069469814, 'samples': 9392064, 'steps': 48916, 'loss/train': 1.8779573440551758} -11/07/2021 04:07:52 - INFO - __main__ - Step 48918: {'lr': 0.0003859356670295441, 'samples': 9392256, 'steps': 48917, 'loss/train': 1.5259239673614502} -11/07/2021 04:07:54 - INFO - __main__ - Step 48919: {'lr': 0.00038593121330313953, 'samples': 9392448, 'steps': 48918, 'loss/train': 1.8216310739517212} -11/07/2021 04:07:54 - INFO - __main__ - Step 48920: {'lr': 0.0003859267595154865, 'samples': 9392640, 'steps': 48919, 'loss/train': 1.6950819492340088} -11/07/2021 04:07:54 - INFO - __main__ - Step 48921: {'lr': 0.0003859223056665869, 'samples': 9392832, 'steps': 48920, 'loss/train': 2.4829678535461426} -11/07/2021 04:07:55 - INFO - __main__ - Step 48922: {'lr': 0.00038591785175644283, 'samples': 9393024, 'steps': 48921, 'loss/train': 1.4854564666748047} -11/07/2021 04:07:55 - INFO - __main__ - Step 48923: {'lr': 0.0003859133977850563, 'samples': 9393216, 'steps': 48922, 'loss/train': 1.3652397394180298} -11/07/2021 04:07:56 - INFO - __main__ - Step 48924: {'lr': 0.00038590894375242925, 'samples': 9393408, 'steps': 48923, 'loss/train': 1.6962120532989502} -11/07/2021 04:07:56 - INFO - __main__ - Step 48925: {'lr': 0.0003859044896585637, 'samples': 9393600, 'steps': 48924, 'loss/train': 1.3781741857528687} -11/07/2021 04:07:57 - INFO - __main__ - Step 48926: {'lr': 0.00038590003550346177, 'samples': 9393792, 'steps': 48925, 'loss/train': 1.7190457582473755} -11/07/2021 04:07:57 - INFO - __main__ - Step 48927: {'lr': 0.0003858955812871254, 'samples': 9393984, 'steps': 48926, 'loss/train': 1.9883801937103271} -11/07/2021 04:07:57 - INFO - __main__ - Step 48928: {'lr': 0.0003858911270095565, 'samples': 9394176, 'steps': 48927, 'loss/train': 1.4579230546951294} -11/07/2021 04:07:59 - INFO - __main__ - Step 48929: {'lr': 0.00038588667267075715, 'samples': 9394368, 'steps': 48928, 'loss/train': 1.4992196559906006} -11/07/2021 04:07:59 - INFO - __main__ - Step 48930: {'lr': 0.0003858822182707294, 'samples': 9394560, 'steps': 48929, 'loss/train': 1.516557216644287} -11/07/2021 04:07:59 - INFO - __main__ - Step 48931: {'lr': 0.00038587776380947516, 'samples': 9394752, 'steps': 48930, 'loss/train': 1.510056495666504} -11/07/2021 04:08:00 - INFO - __main__ - Step 48932: {'lr': 0.0003858733092869966, 'samples': 9394944, 'steps': 48931, 'loss/train': 1.8778561353683472} -11/07/2021 04:08:00 - INFO - __main__ - Step 48933: {'lr': 0.00038586885470329554, 'samples': 9395136, 'steps': 48932, 'loss/train': 1.3887089490890503} -11/07/2021 04:08:00 - INFO - __main__ - Step 48934: {'lr': 0.0003858644000583741, 'samples': 9395328, 'steps': 48933, 'loss/train': 1.4813086986541748} -11/07/2021 04:08:01 - INFO - __main__ - Step 48935: {'lr': 0.0003858599453522342, 'samples': 9395520, 'steps': 48934, 'loss/train': 1.7310360670089722} -11/07/2021 04:08:02 - INFO - __main__ - Step 48936: {'lr': 0.000385855490584878, 'samples': 9395712, 'steps': 48935, 'loss/train': 1.3012902736663818} -11/07/2021 04:08:02 - INFO - __main__ - Step 48937: {'lr': 0.0003858510357563074, 'samples': 9395904, 'steps': 48936, 'loss/train': 1.43248450756073} -11/07/2021 04:08:02 - INFO - __main__ - Step 48938: {'lr': 0.00038584658086652433, 'samples': 9396096, 'steps': 48937, 'loss/train': 1.7660819292068481} -11/07/2021 04:08:03 - INFO - __main__ - Step 48939: {'lr': 0.00038584212591553105, 'samples': 9396288, 'steps': 48938, 'loss/train': 1.2785720825195312} -11/07/2021 04:08:04 - INFO - __main__ - Step 48940: {'lr': 0.00038583767090332924, 'samples': 9396480, 'steps': 48939, 'loss/train': 1.5622167587280273} -11/07/2021 04:08:04 - INFO - __main__ - Step 48941: {'lr': 0.00038583321582992113, 'samples': 9396672, 'steps': 48940, 'loss/train': 1.2461129426956177} -11/07/2021 04:08:04 - INFO - __main__ - Step 48942: {'lr': 0.0003858287606953087, 'samples': 9396864, 'steps': 48941, 'loss/train': 1.3549952507019043} -11/07/2021 04:08:05 - INFO - __main__ - Step 48943: {'lr': 0.00038582430549949386, 'samples': 9397056, 'steps': 48942, 'loss/train': 1.319166660308838} -11/07/2021 04:08:05 - INFO - __main__ - Step 48944: {'lr': 0.00038581985024247877, 'samples': 9397248, 'steps': 48943, 'loss/train': 1.4726316928863525} -11/07/2021 04:08:06 - INFO - __main__ - Step 48945: {'lr': 0.0003858153949242653, 'samples': 9397440, 'steps': 48944, 'loss/train': 1.5756710767745972} -11/07/2021 04:08:07 - INFO - __main__ - Step 48946: {'lr': 0.00038581093954485554, 'samples': 9397632, 'steps': 48945, 'loss/train': 1.4263874292373657} -11/07/2021 04:08:07 - INFO - __main__ - Step 48947: {'lr': 0.00038580648410425146, 'samples': 9397824, 'steps': 48946, 'loss/train': 1.4357798099517822} -11/07/2021 04:08:07 - INFO - __main__ - Step 48948: {'lr': 0.00038580202860245507, 'samples': 9398016, 'steps': 48947, 'loss/train': 1.2987250089645386} -11/07/2021 04:08:08 - INFO - __main__ - Step 48949: {'lr': 0.00038579757303946826, 'samples': 9398208, 'steps': 48948, 'loss/train': 1.1880955696105957} -11/07/2021 04:08:09 - INFO - __main__ - Step 48950: {'lr': 0.0003857931174152933, 'samples': 9398400, 'steps': 48949, 'loss/train': 1.6143276691436768} -11/07/2021 04:08:09 - INFO - __main__ - Step 48951: {'lr': 0.000385788661729932, 'samples': 9398592, 'steps': 48950, 'loss/train': 1.5052846670150757} -11/07/2021 04:08:09 - INFO - __main__ - Step 48952: {'lr': 0.0003857842059833865, 'samples': 9398784, 'steps': 48951, 'loss/train': 1.6773607730865479} -11/07/2021 04:08:10 - INFO - __main__ - Step 48953: {'lr': 0.0003857797501756587, 'samples': 9398976, 'steps': 48952, 'loss/train': 1.5313549041748047} -11/07/2021 04:08:10 - INFO - __main__ - Step 48954: {'lr': 0.0003857752943067506, 'samples': 9399168, 'steps': 48953, 'loss/train': 1.5578811168670654} -11/07/2021 04:08:12 - INFO - __main__ - Step 48955: {'lr': 0.0003857708383766643, 'samples': 9399360, 'steps': 48954, 'loss/train': 1.220923662185669} -11/07/2021 04:08:12 - INFO - __main__ - Step 48956: {'lr': 0.00038576638238540167, 'samples': 9399552, 'steps': 48955, 'loss/train': 1.686860203742981} -11/07/2021 04:08:12 - INFO - __main__ - Step 48957: {'lr': 0.00038576192633296485, 'samples': 9399744, 'steps': 48956, 'loss/train': 1.7237331867218018} -11/07/2021 04:08:13 - INFO - __main__ - Step 48958: {'lr': 0.00038575747021935583, 'samples': 9399936, 'steps': 48957, 'loss/train': 1.772165060043335} -11/07/2021 04:08:13 - INFO - __main__ - Step 48959: {'lr': 0.0003857530140445765, 'samples': 9400128, 'steps': 48958, 'loss/train': 1.250779151916504} -11/07/2021 04:08:13 - INFO - __main__ - Step 48960: {'lr': 0.00038574855780862903, 'samples': 9400320, 'steps': 48959, 'loss/train': 1.3282482624053955} -11/07/2021 04:08:14 - INFO - __main__ - Step 48961: {'lr': 0.0003857441015115154, 'samples': 9400512, 'steps': 48960, 'loss/train': 1.4221696853637695} -11/07/2021 04:08:15 - INFO - __main__ - Step 48962: {'lr': 0.00038573964515323754, 'samples': 9400704, 'steps': 48961, 'loss/train': 1.850115418434143} -11/07/2021 04:08:15 - INFO - __main__ - Step 48963: {'lr': 0.0003857351887337974, 'samples': 9400896, 'steps': 48962, 'loss/train': 1.2149375677108765} -11/07/2021 04:08:15 - INFO - __main__ - Step 48964: {'lr': 0.00038573073225319724, 'samples': 9401088, 'steps': 48963, 'loss/train': 1.45426607131958} -11/07/2021 04:08:16 - INFO - __main__ - Step 48965: {'lr': 0.00038572627571143873, 'samples': 9401280, 'steps': 48964, 'loss/train': 1.7876821756362915} -11/07/2021 04:08:17 - INFO - __main__ - Step 48966: {'lr': 0.0003857218191085242, 'samples': 9401472, 'steps': 48965, 'loss/train': 1.346888542175293} -11/07/2021 04:08:17 - INFO - __main__ - Step 48967: {'lr': 0.0003857173624444554, 'samples': 9401664, 'steps': 48966, 'loss/train': 0.31117236614227295} -11/07/2021 04:08:18 - INFO - __main__ - Step 48968: {'lr': 0.00038571290571923455, 'samples': 9401856, 'steps': 48967, 'loss/train': 0.902428150177002} -11/07/2021 04:08:18 - INFO - __main__ - Step 48969: {'lr': 0.0003857084489328635, 'samples': 9402048, 'steps': 48968, 'loss/train': 1.6733211278915405} -11/07/2021 04:08:18 - INFO - __main__ - Step 48970: {'lr': 0.00038570399208534437, 'samples': 9402240, 'steps': 48969, 'loss/train': 1.519181489944458} -11/07/2021 04:08:19 - INFO - __main__ - Step 48971: {'lr': 0.000385699535176679, 'samples': 9402432, 'steps': 48970, 'loss/train': 1.7384952306747437} -11/07/2021 04:08:20 - INFO - __main__ - Step 48972: {'lr': 0.00038569507820686956, 'samples': 9402624, 'steps': 48971, 'loss/train': 1.4874610900878906} -11/07/2021 04:08:20 - INFO - __main__ - Step 48973: {'lr': 0.000385690621175918, 'samples': 9402816, 'steps': 48972, 'loss/train': 1.9224824905395508} -11/07/2021 04:08:20 - INFO - __main__ - Step 48974: {'lr': 0.0003856861640838265, 'samples': 9403008, 'steps': 48973, 'loss/train': 2.112514019012451} -11/07/2021 04:08:21 - INFO - __main__ - Step 48975: {'lr': 0.00038568170693059677, 'samples': 9403200, 'steps': 48974, 'loss/train': 1.4942660331726074} -11/07/2021 04:08:22 - INFO - __main__ - Step 48976: {'lr': 0.000385677249716231, 'samples': 9403392, 'steps': 48975, 'loss/train': 1.478994369506836} -11/07/2021 04:08:22 - INFO - __main__ - Step 48977: {'lr': 0.0003856727924407311, 'samples': 9403584, 'steps': 48976, 'loss/train': 1.1730769872665405} -11/07/2021 04:08:22 - INFO - __main__ - Step 48978: {'lr': 0.0003856683351040992, 'samples': 9403776, 'steps': 48977, 'loss/train': 1.257746696472168} -11/07/2021 04:08:23 - INFO - __main__ - Step 48979: {'lr': 0.00038566387770633715, 'samples': 9403968, 'steps': 48978, 'loss/train': 1.9970284700393677} -11/07/2021 04:08:23 - INFO - __main__ - Step 48980: {'lr': 0.00038565942024744703, 'samples': 9404160, 'steps': 48979, 'loss/train': 1.560881495475769} -11/07/2021 04:08:24 - INFO - __main__ - Step 48981: {'lr': 0.000385654962727431, 'samples': 9404352, 'steps': 48980, 'loss/train': 1.696020483970642} -11/07/2021 04:08:25 - INFO - __main__ - Step 48982: {'lr': 0.00038565050514629087, 'samples': 9404544, 'steps': 48981, 'loss/train': 1.3196929693222046} -11/07/2021 04:08:25 - INFO - __main__ - Step 48983: {'lr': 0.0003856460475040288, 'samples': 9404736, 'steps': 48982, 'loss/train': 1.0660433769226074} -11/07/2021 04:08:25 - INFO - __main__ - Step 48984: {'lr': 0.00038564158980064657, 'samples': 9404928, 'steps': 48983, 'loss/train': 1.5505517721176147} -11/07/2021 04:08:26 - INFO - __main__ - Step 48985: {'lr': 0.0003856371320361464, 'samples': 9405120, 'steps': 48984, 'loss/train': 1.1489191055297852} -11/07/2021 04:08:27 - INFO - __main__ - Step 48986: {'lr': 0.00038563267421053024, 'samples': 9405312, 'steps': 48985, 'loss/train': 1.3692070245742798} -11/07/2021 04:08:27 - INFO - __main__ - Step 48987: {'lr': 0.0003856282163238001, 'samples': 9405504, 'steps': 48986, 'loss/train': 1.6641390323638916} -11/07/2021 04:08:27 - INFO - __main__ - Step 48988: {'lr': 0.000385623758375958, 'samples': 9405696, 'steps': 48987, 'loss/train': 1.8186664581298828} -11/07/2021 04:08:28 - INFO - __main__ - Step 48989: {'lr': 0.0003856193003670058, 'samples': 9405888, 'steps': 48988, 'loss/train': 0.9343728423118591} -11/07/2021 04:08:28 - INFO - __main__ - Step 48990: {'lr': 0.0003856148422969458, 'samples': 9406080, 'steps': 48989, 'loss/train': 1.5853612422943115} -11/07/2021 04:08:29 - INFO - __main__ - Step 48991: {'lr': 0.0003856103841657797, 'samples': 9406272, 'steps': 48990, 'loss/train': 1.4318612813949585} -11/07/2021 04:08:29 - INFO - __main__ - Step 48992: {'lr': 0.00038560592597350975, 'samples': 9406464, 'steps': 48991, 'loss/train': 1.2812211513519287} -11/07/2021 04:08:30 - INFO - __main__ - Step 48993: {'lr': 0.0003856014677201378, 'samples': 9406656, 'steps': 48992, 'loss/train': 1.5667595863342285} -11/07/2021 04:08:30 - INFO - __main__ - Step 48994: {'lr': 0.000385597009405666, 'samples': 9406848, 'steps': 48993, 'loss/train': 1.3088542222976685} -11/07/2021 04:08:30 - INFO - __main__ - Step 48995: {'lr': 0.0003855925510300962, 'samples': 9407040, 'steps': 48994, 'loss/train': 1.3461893796920776} -11/07/2021 04:08:31 - INFO - __main__ - Step 48996: {'lr': 0.0003855880925934305, 'samples': 9407232, 'steps': 48995, 'loss/train': 1.308261513710022} -11/07/2021 04:08:32 - INFO - __main__ - Step 48997: {'lr': 0.000385583634095671, 'samples': 9407424, 'steps': 48996, 'loss/train': 1.569661259651184} -11/07/2021 04:08:32 - INFO - __main__ - Step 48998: {'lr': 0.00038557917553681944, 'samples': 9407616, 'steps': 48997, 'loss/train': 1.5256402492523193} -11/07/2021 04:08:32 - INFO - __main__ - Step 48999: {'lr': 0.00038557471691687804, 'samples': 9407808, 'steps': 48998, 'loss/train': 1.4784225225448608} -11/07/2021 04:08:33 - INFO - __main__ - Step 49000: {'lr': 0.0003855702582358489, 'samples': 9408000, 'steps': 48999, 'loss/train': 1.7442666292190552} -11/07/2021 04:08:33 - INFO - __main__ - Step 49001: {'lr': 0.00038556579949373384, 'samples': 9408192, 'steps': 49000, 'loss/train': 1.5192310810089111} -11/07/2021 04:08:34 - INFO - __main__ - Step 49002: {'lr': 0.00038556134069053484, 'samples': 9408384, 'steps': 49001, 'loss/train': 0.9820490479469299} -11/07/2021 04:08:34 - INFO - __main__ - Step 49003: {'lr': 0.00038555688182625406, 'samples': 9408576, 'steps': 49002, 'loss/train': 1.5996290445327759} -11/07/2021 04:08:35 - INFO - __main__ - Step 49004: {'lr': 0.0003855524229008934, 'samples': 9408768, 'steps': 49003, 'loss/train': 0.8507100939750671} -11/07/2021 04:08:35 - INFO - __main__ - Step 49005: {'lr': 0.0003855479639144549, 'samples': 9408960, 'steps': 49004, 'loss/train': 1.7345751523971558} -11/07/2021 04:08:35 - INFO - __main__ - Step 49006: {'lr': 0.0003855435048669406, 'samples': 9409152, 'steps': 49005, 'loss/train': 1.1710102558135986} -11/07/2021 04:08:37 - INFO - __main__ - Step 49007: {'lr': 0.0003855390457583525, 'samples': 9409344, 'steps': 49006, 'loss/train': 1.5970712900161743} -11/07/2021 04:08:37 - INFO - __main__ - Step 49008: {'lr': 0.0003855345865886926, 'samples': 9409536, 'steps': 49007, 'loss/train': 2.054039239883423} -11/07/2021 04:08:37 - INFO - __main__ - Step 49009: {'lr': 0.0003855301273579629, 'samples': 9409728, 'steps': 49008, 'loss/train': 4.088986396789551} -11/07/2021 04:08:38 - INFO - __main__ - Step 49010: {'lr': 0.0003855256680661654, 'samples': 9409920, 'steps': 49009, 'loss/train': 1.3908464908599854} -11/07/2021 04:08:38 - INFO - __main__ - Step 49011: {'lr': 0.00038552120871330217, 'samples': 9410112, 'steps': 49010, 'loss/train': 1.4406582117080688} -11/07/2021 04:08:38 - INFO - __main__ - Step 49012: {'lr': 0.0003855167492993751, 'samples': 9410304, 'steps': 49011, 'loss/train': 1.5320438146591187} -11/07/2021 04:08:39 - INFO - __main__ - Step 49013: {'lr': 0.00038551228982438635, 'samples': 9410496, 'steps': 49012, 'loss/train': 1.4877569675445557} -11/07/2021 04:08:40 - INFO - __main__ - Step 49014: {'lr': 0.00038550783028833786, 'samples': 9410688, 'steps': 49013, 'loss/train': 1.3163621425628662} -11/07/2021 04:08:40 - INFO - __main__ - Step 49015: {'lr': 0.00038550337069123155, 'samples': 9410880, 'steps': 49014, 'loss/train': 1.7298897504806519} -11/07/2021 04:08:41 - INFO - __main__ - Step 49016: {'lr': 0.00038549891103306953, 'samples': 9411072, 'steps': 49015, 'loss/train': 1.3940982818603516} -11/07/2021 04:08:41 - INFO - __main__ - Step 49017: {'lr': 0.00038549445131385386, 'samples': 9411264, 'steps': 49016, 'loss/train': 1.5628517866134644} -11/07/2021 04:08:42 - INFO - __main__ - Step 49018: {'lr': 0.00038548999153358645, 'samples': 9411456, 'steps': 49017, 'loss/train': 1.1688588857650757} -11/07/2021 04:08:42 - INFO - __main__ - Step 49019: {'lr': 0.0003854855316922693, 'samples': 9411648, 'steps': 49018, 'loss/train': 1.7715271711349487} -11/07/2021 04:08:43 - INFO - __main__ - Step 49020: {'lr': 0.0003854810717899045, 'samples': 9411840, 'steps': 49019, 'loss/train': 1.3426858186721802} -11/07/2021 04:08:43 - INFO - __main__ - Step 49021: {'lr': 0.0003854766118264941, 'samples': 9412032, 'steps': 49020, 'loss/train': 1.2353349924087524} -11/07/2021 04:08:43 - INFO - __main__ - Step 49022: {'lr': 0.0003854721518020399, 'samples': 9412224, 'steps': 49021, 'loss/train': 0.7917335033416748} -11/07/2021 04:08:44 - INFO - __main__ - Step 49023: {'lr': 0.00038546769171654403, 'samples': 9412416, 'steps': 49022, 'loss/train': 2.011986255645752} -11/07/2021 04:08:45 - INFO - __main__ - Step 49024: {'lr': 0.00038546323157000856, 'samples': 9412608, 'steps': 49023, 'loss/train': 1.5429515838623047} -11/07/2021 04:08:45 - INFO - __main__ - Step 49025: {'lr': 0.00038545877136243544, 'samples': 9412800, 'steps': 49024, 'loss/train': 1.461340308189392} -11/07/2021 04:08:46 - INFO - __main__ - Step 49026: {'lr': 0.00038545431109382667, 'samples': 9412992, 'steps': 49025, 'loss/train': 1.071258544921875} -11/07/2021 04:08:46 - INFO - __main__ - Step 49027: {'lr': 0.0003854498507641843, 'samples': 9413184, 'steps': 49026, 'loss/train': 2.099436044692993} -11/07/2021 04:08:46 - INFO - __main__ - Step 49028: {'lr': 0.00038544539037351037, 'samples': 9413376, 'steps': 49027, 'loss/train': 1.1202818155288696} -11/07/2021 04:08:47 - INFO - __main__ - Step 49029: {'lr': 0.0003854409299218068, 'samples': 9413568, 'steps': 49028, 'loss/train': 1.7763105630874634} -11/07/2021 04:08:48 - INFO - __main__ - Step 49030: {'lr': 0.00038543646940907564, 'samples': 9413760, 'steps': 49029, 'loss/train': 5.898472309112549} -11/07/2021 04:08:48 - INFO - __main__ - Step 49031: {'lr': 0.0003854320088353188, 'samples': 9413952, 'steps': 49030, 'loss/train': 1.3018929958343506} -11/07/2021 04:08:48 - INFO - __main__ - Step 49032: {'lr': 0.0003854275482005385, 'samples': 9414144, 'steps': 49031, 'loss/train': 1.8933767080307007} -11/07/2021 04:08:49 - INFO - __main__ - Step 49033: {'lr': 0.0003854230875047366, 'samples': 9414336, 'steps': 49032, 'loss/train': 1.587097406387329} -11/07/2021 04:08:49 - INFO - __main__ - Step 49034: {'lr': 0.0003854186267479151, 'samples': 9414528, 'steps': 49033, 'loss/train': 1.6172665357589722} -11/07/2021 04:08:51 - INFO - __main__ - Step 49035: {'lr': 0.00038541416593007615, 'samples': 9414720, 'steps': 49034, 'loss/train': 1.136541724205017} -11/07/2021 04:08:51 - INFO - __main__ - Step 49036: {'lr': 0.00038540970505122164, 'samples': 9414912, 'steps': 49035, 'loss/train': 1.8691534996032715} -11/07/2021 04:08:51 - INFO - __main__ - Step 49037: {'lr': 0.0003854052441113536, 'samples': 9415104, 'steps': 49036, 'loss/train': 1.267198085784912} -11/07/2021 04:08:52 - INFO - __main__ - Step 49038: {'lr': 0.00038540078311047397, 'samples': 9415296, 'steps': 49037, 'loss/train': 1.221850872039795} -11/07/2021 04:08:52 - INFO - __main__ - Step 49039: {'lr': 0.0003853963220485849, 'samples': 9415488, 'steps': 49038, 'loss/train': 1.516257882118225} -11/07/2021 04:08:52 - INFO - __main__ - Step 49040: {'lr': 0.00038539186092568833, 'samples': 9415680, 'steps': 49039, 'loss/train': 1.5481401681900024} -11/07/2021 04:08:53 - INFO - __main__ - Step 49041: {'lr': 0.00038538739974178633, 'samples': 9415872, 'steps': 49040, 'loss/train': 1.4090861082077026} -11/07/2021 04:08:54 - INFO - __main__ - Step 49042: {'lr': 0.00038538293849688077, 'samples': 9416064, 'steps': 49041, 'loss/train': 1.515071153640747} -11/07/2021 04:08:54 - INFO - __main__ - Step 49043: {'lr': 0.0003853784771909739, 'samples': 9416256, 'steps': 49042, 'loss/train': 1.0329222679138184} -11/07/2021 04:08:54 - INFO - __main__ - Step 49044: {'lr': 0.0003853740158240674, 'samples': 9416448, 'steps': 49043, 'loss/train': 1.4012494087219238} -11/07/2021 04:08:55 - INFO - __main__ - Step 49045: {'lr': 0.0003853695543961635, 'samples': 9416640, 'steps': 49044, 'loss/train': 2.0041351318359375} -11/07/2021 04:08:56 - INFO - __main__ - Step 49046: {'lr': 0.00038536509290726417, 'samples': 9416832, 'steps': 49045, 'loss/train': 1.7326302528381348} -11/07/2021 04:08:56 - INFO - __main__ - Step 49047: {'lr': 0.00038536063135737145, 'samples': 9417024, 'steps': 49046, 'loss/train': 1.3995091915130615} -11/07/2021 04:08:56 - INFO - __main__ - Step 49048: {'lr': 0.0003853561697464874, 'samples': 9417216, 'steps': 49047, 'loss/train': 1.129688024520874} -11/07/2021 04:08:57 - INFO - __main__ - Step 49049: {'lr': 0.0003853517080746138, 'samples': 9417408, 'steps': 49048, 'loss/train': 1.1902576684951782} -11/07/2021 04:08:57 - INFO - __main__ - Step 49050: {'lr': 0.00038534724634175285, 'samples': 9417600, 'steps': 49049, 'loss/train': 1.5384318828582764} -11/07/2021 04:08:58 - INFO - __main__ - Step 49051: {'lr': 0.0003853427845479065, 'samples': 9417792, 'steps': 49050, 'loss/train': 1.6219627857208252} -11/07/2021 04:08:59 - INFO - __main__ - Step 49052: {'lr': 0.0003853383226930768, 'samples': 9417984, 'steps': 49051, 'loss/train': 0.9121947288513184} -11/07/2021 04:08:59 - INFO - __main__ - Step 49053: {'lr': 0.00038533386077726573, 'samples': 9418176, 'steps': 49052, 'loss/train': 0.8772579431533813} -11/07/2021 04:08:59 - INFO - __main__ - Step 49054: {'lr': 0.00038532939880047535, 'samples': 9418368, 'steps': 49053, 'loss/train': 1.5285707712173462} -11/07/2021 04:09:00 - INFO - __main__ - Step 49055: {'lr': 0.00038532493676270765, 'samples': 9418560, 'steps': 49054, 'loss/train': 0.7943586707115173} -11/07/2021 04:09:00 - INFO - __main__ - Step 49056: {'lr': 0.0003853204746639646, 'samples': 9418752, 'steps': 49055, 'loss/train': 1.632174015045166} -11/07/2021 04:09:01 - INFO - __main__ - Step 49057: {'lr': 0.0003853160125042482, 'samples': 9418944, 'steps': 49056, 'loss/train': 1.5486323833465576} -11/07/2021 04:09:01 - INFO - __main__ - Step 49058: {'lr': 0.00038531155028356047, 'samples': 9419136, 'steps': 49057, 'loss/train': 1.500724196434021} -11/07/2021 04:09:02 - INFO - __main__ - Step 49059: {'lr': 0.0003853070880019035, 'samples': 9419328, 'steps': 49058, 'loss/train': 1.1665802001953125} -11/07/2021 04:09:02 - INFO - __main__ - Step 49060: {'lr': 0.0003853026256592792, 'samples': 9419520, 'steps': 49059, 'loss/train': 1.3292691707611084} -11/07/2021 04:09:02 - INFO - __main__ - Step 49061: {'lr': 0.0003852981632556897, 'samples': 9419712, 'steps': 49060, 'loss/train': 1.4833451509475708} -11/07/2021 04:09:03 - INFO - __main__ - Step 49062: {'lr': 0.0003852937007911369, 'samples': 9419904, 'steps': 49061, 'loss/train': 1.846569299697876} -11/07/2021 04:09:04 - INFO - __main__ - Step 49063: {'lr': 0.00038528923826562287, 'samples': 9420096, 'steps': 49062, 'loss/train': 1.3322322368621826} -11/07/2021 04:09:04 - INFO - __main__ - Step 49064: {'lr': 0.00038528477567914955, 'samples': 9420288, 'steps': 49063, 'loss/train': 1.1554535627365112} -11/07/2021 04:09:04 - INFO - __main__ - Step 49065: {'lr': 0.000385280313031719, 'samples': 9420480, 'steps': 49064, 'loss/train': 1.8195546865463257} -11/07/2021 04:09:05 - INFO - __main__ - Step 49066: {'lr': 0.00038527585032333326, 'samples': 9420672, 'steps': 49065, 'loss/train': 1.331484317779541} -11/07/2021 04:09:06 - INFO - __main__ - Step 49067: {'lr': 0.00038527138755399423, 'samples': 9420864, 'steps': 49066, 'loss/train': 1.426199197769165} -11/07/2021 04:09:06 - INFO - __main__ - Step 49068: {'lr': 0.00038526692472370407, 'samples': 9421056, 'steps': 49067, 'loss/train': 1.358767032623291} -11/07/2021 04:09:07 - INFO - __main__ - Step 49069: {'lr': 0.0003852624618324647, 'samples': 9421248, 'steps': 49068, 'loss/train': 1.6837997436523438} -11/07/2021 04:09:07 - INFO - __main__ - Step 49070: {'lr': 0.0003852579988802782, 'samples': 9421440, 'steps': 49069, 'loss/train': 2.1985177993774414} -11/07/2021 04:09:07 - INFO - __main__ - Step 49071: {'lr': 0.00038525353586714645, 'samples': 9421632, 'steps': 49070, 'loss/train': 1.5465973615646362} -11/07/2021 04:09:08 - INFO - __main__ - Step 49072: {'lr': 0.0003852490727930716, 'samples': 9421824, 'steps': 49071, 'loss/train': 1.1003345251083374} -11/07/2021 04:09:09 - INFO - __main__ - Step 49073: {'lr': 0.00038524460965805557, 'samples': 9422016, 'steps': 49072, 'loss/train': 1.042018175125122} -11/07/2021 04:09:09 - INFO - __main__ - Step 49074: {'lr': 0.00038524014646210044, 'samples': 9422208, 'steps': 49073, 'loss/train': 1.722677230834961} -11/07/2021 04:09:09 - INFO - __main__ - Step 49075: {'lr': 0.00038523568320520817, 'samples': 9422400, 'steps': 49074, 'loss/train': 1.2833806276321411} -11/07/2021 04:09:10 - INFO - __main__ - Step 49076: {'lr': 0.0003852312198873808, 'samples': 9422592, 'steps': 49075, 'loss/train': 1.5856560468673706} -11/07/2021 04:09:11 - INFO - __main__ - Step 49077: {'lr': 0.0003852267565086203, 'samples': 9422784, 'steps': 49076, 'loss/train': 1.6125866174697876} -11/07/2021 04:09:11 - INFO - __main__ - Step 49078: {'lr': 0.0003852222930689288, 'samples': 9422976, 'steps': 49077, 'loss/train': 1.5924015045166016} -11/07/2021 04:09:11 - INFO - __main__ - Step 49079: {'lr': 0.00038521782956830807, 'samples': 9423168, 'steps': 49078, 'loss/train': 1.728890299797058} -11/07/2021 04:09:12 - INFO - __main__ - Step 49080: {'lr': 0.00038521336600676035, 'samples': 9423360, 'steps': 49079, 'loss/train': 1.4587135314941406} -11/07/2021 04:09:12 - INFO - __main__ - Step 49081: {'lr': 0.00038520890238428763, 'samples': 9423552, 'steps': 49080, 'loss/train': 1.463641881942749} -11/07/2021 04:09:13 - INFO - __main__ - Step 49082: {'lr': 0.00038520443870089185, 'samples': 9423744, 'steps': 49081, 'loss/train': 1.0472511053085327} -11/07/2021 04:09:13 - INFO - __main__ - Step 49083: {'lr': 0.00038519997495657497, 'samples': 9423936, 'steps': 49082, 'loss/train': 1.4112025499343872} -11/07/2021 04:09:14 - INFO - __main__ - Step 49084: {'lr': 0.0003851955111513391, 'samples': 9424128, 'steps': 49083, 'loss/train': 0.6797143816947937} -11/07/2021 04:09:14 - INFO - __main__ - Step 49085: {'lr': 0.0003851910472851862, 'samples': 9424320, 'steps': 49084, 'loss/train': 1.422843098640442} -11/07/2021 04:09:14 - INFO - __main__ - Step 49086: {'lr': 0.0003851865833581183, 'samples': 9424512, 'steps': 49085, 'loss/train': 1.7759983539581299} -11/07/2021 04:09:15 - INFO - __main__ - Step 49087: {'lr': 0.0003851821193701375, 'samples': 9424704, 'steps': 49086, 'loss/train': 1.171252727508545} -11/07/2021 04:09:16 - INFO - __main__ - Step 49088: {'lr': 0.0003851776553212456, 'samples': 9424896, 'steps': 49087, 'loss/train': 0.863366425037384} -11/07/2021 04:09:16 - INFO - __main__ - Step 49089: {'lr': 0.0003851731912114448, 'samples': 9425088, 'steps': 49088, 'loss/train': 1.486554741859436} -11/07/2021 04:09:17 - INFO - __main__ - Step 49090: {'lr': 0.00038516872704073704, 'samples': 9425280, 'steps': 49089, 'loss/train': 1.8933355808258057} -11/07/2021 04:09:17 - INFO - __main__ - Step 49091: {'lr': 0.0003851642628091243, 'samples': 9425472, 'steps': 49090, 'loss/train': 1.3501158952713013} -11/07/2021 04:09:18 - INFO - __main__ - Step 49092: {'lr': 0.0003851597985166087, 'samples': 9425664, 'steps': 49091, 'loss/train': 1.405320167541504} -11/07/2021 04:09:18 - INFO - __main__ - Step 49093: {'lr': 0.0003851553341631921, 'samples': 9425856, 'steps': 49092, 'loss/train': 1.4765554666519165} -11/07/2021 04:09:19 - INFO - __main__ - Step 49094: {'lr': 0.0003851508697488766, 'samples': 9426048, 'steps': 49093, 'loss/train': 1.0383342504501343} -11/07/2021 04:09:19 - INFO - __main__ - Step 49095: {'lr': 0.0003851464052736643, 'samples': 9426240, 'steps': 49094, 'loss/train': 0.8753216862678528} -11/07/2021 04:09:19 - INFO - __main__ - Step 49096: {'lr': 0.00038514194073755706, 'samples': 9426432, 'steps': 49095, 'loss/train': 1.3852145671844482} -11/07/2021 04:09:20 - INFO - __main__ - Step 49097: {'lr': 0.00038513747614055696, 'samples': 9426624, 'steps': 49096, 'loss/train': 1.2463265657424927} -11/07/2021 04:09:21 - INFO - __main__ - Step 49098: {'lr': 0.0003851330114826659, 'samples': 9426816, 'steps': 49097, 'loss/train': 1.6080673933029175} -11/07/2021 04:09:21 - INFO - __main__ - Step 49099: {'lr': 0.0003851285467638861, 'samples': 9427008, 'steps': 49098, 'loss/train': 1.8316123485565186} -11/07/2021 04:09:21 - INFO - __main__ - Step 49100: {'lr': 0.00038512408198421936, 'samples': 9427200, 'steps': 49099, 'loss/train': 1.3645503520965576} -11/07/2021 04:09:22 - INFO - __main__ - Step 49101: {'lr': 0.0003851196171436679, 'samples': 9427392, 'steps': 49100, 'loss/train': 1.1806963682174683} -11/07/2021 04:09:23 - INFO - __main__ - Step 49102: {'lr': 0.0003851151522422336, 'samples': 9427584, 'steps': 49101, 'loss/train': 0.46137189865112305} -11/07/2021 04:09:23 - INFO - __main__ - Step 49103: {'lr': 0.0003851106872799185, 'samples': 9427776, 'steps': 49102, 'loss/train': 1.374953269958496} -11/07/2021 04:09:23 - INFO - __main__ - Step 49104: {'lr': 0.00038510622225672455, 'samples': 9427968, 'steps': 49103, 'loss/train': 1.1852757930755615} -11/07/2021 04:09:24 - INFO - __main__ - Step 49105: {'lr': 0.0003851017571726539, 'samples': 9428160, 'steps': 49104, 'loss/train': 0.906430184841156} -11/07/2021 04:09:24 - INFO - __main__ - Step 49106: {'lr': 0.00038509729202770843, 'samples': 9428352, 'steps': 49105, 'loss/train': 1.8787739276885986} -11/07/2021 04:09:24 - INFO - __main__ - Step 49107: {'lr': 0.00038509282682189016, 'samples': 9428544, 'steps': 49106, 'loss/train': 1.4721879959106445} -11/07/2021 04:09:26 - INFO - __main__ - Step 49108: {'lr': 0.0003850883615552012, 'samples': 9428736, 'steps': 49107, 'loss/train': 1.5572868585586548} -11/07/2021 04:09:26 - INFO - __main__ - Step 49109: {'lr': 0.0003850838962276436, 'samples': 9428928, 'steps': 49108, 'loss/train': 1.6854112148284912} -11/07/2021 04:09:26 - INFO - __main__ - Step 49110: {'lr': 0.0003850794308392192, 'samples': 9429120, 'steps': 49109, 'loss/train': 1.3845703601837158} -11/07/2021 04:09:27 - INFO - __main__ - Step 49111: {'lr': 0.00038507496538993006, 'samples': 9429312, 'steps': 49110, 'loss/train': 1.334354281425476} -11/07/2021 04:09:27 - INFO - __main__ - Step 49112: {'lr': 0.00038507049987977825, 'samples': 9429504, 'steps': 49111, 'loss/train': 1.1155405044555664} -11/07/2021 04:09:28 - INFO - __main__ - Step 49113: {'lr': 0.0003850660343087657, 'samples': 9429696, 'steps': 49112, 'loss/train': 0.5999600291252136} -11/07/2021 04:09:28 - INFO - __main__ - Step 49114: {'lr': 0.0003850615686768946, 'samples': 9429888, 'steps': 49113, 'loss/train': 1.5678521394729614} -11/07/2021 04:09:29 - INFO - __main__ - Step 49115: {'lr': 0.00038505710298416683, 'samples': 9430080, 'steps': 49114, 'loss/train': 1.5501654148101807} -11/07/2021 04:09:29 - INFO - __main__ - Step 49116: {'lr': 0.00038505263723058437, 'samples': 9430272, 'steps': 49115, 'loss/train': 0.7990596890449524} -11/07/2021 04:09:29 - INFO - __main__ - Step 49117: {'lr': 0.0003850481714161492, 'samples': 9430464, 'steps': 49116, 'loss/train': 1.1202987432479858} -11/07/2021 04:09:30 - INFO - __main__ - Step 49118: {'lr': 0.00038504370554086353, 'samples': 9430656, 'steps': 49117, 'loss/train': 1.5684027671813965} -11/07/2021 04:09:31 - INFO - __main__ - Step 49119: {'lr': 0.0003850392396047292, 'samples': 9430848, 'steps': 49118, 'loss/train': 1.6090108156204224} -11/07/2021 04:09:31 - INFO - __main__ - Step 49120: {'lr': 0.0003850347736077483, 'samples': 9431040, 'steps': 49119, 'loss/train': 1.100080132484436} -11/07/2021 04:09:31 - INFO - __main__ - Step 49121: {'lr': 0.0003850303075499227, 'samples': 9431232, 'steps': 49120, 'loss/train': 1.6162917613983154} -11/07/2021 04:09:32 - INFO - __main__ - Step 49122: {'lr': 0.0003850258414312547, 'samples': 9431424, 'steps': 49121, 'loss/train': 1.0960960388183594} -11/07/2021 04:09:33 - INFO - __main__ - Step 49123: {'lr': 0.000385021375251746, 'samples': 9431616, 'steps': 49122, 'loss/train': 1.4721559286117554} -11/07/2021 04:09:33 - INFO - __main__ - Step 49124: {'lr': 0.00038501690901139883, 'samples': 9431808, 'steps': 49123, 'loss/train': 0.6333041787147522} -11/07/2021 04:09:34 - INFO - __main__ - Step 49125: {'lr': 0.0003850124427102151, 'samples': 9432000, 'steps': 49124, 'loss/train': 2.3519115447998047} -11/07/2021 04:09:34 - INFO - __main__ - Step 49126: {'lr': 0.0003850079763481968, 'samples': 9432192, 'steps': 49125, 'loss/train': 1.4221237897872925} -11/07/2021 04:09:34 - INFO - __main__ - Step 49127: {'lr': 0.0003850035099253461, 'samples': 9432384, 'steps': 49126, 'loss/train': 5.797683238983154} -11/07/2021 04:09:35 - INFO - __main__ - Step 49128: {'lr': 0.00038499904344166483, 'samples': 9432576, 'steps': 49127, 'loss/train': 0.7352468967437744} -11/07/2021 04:09:36 - INFO - __main__ - Step 49129: {'lr': 0.0003849945768971551, 'samples': 9432768, 'steps': 49128, 'loss/train': 1.9143232107162476} -11/07/2021 04:09:36 - INFO - __main__ - Step 49130: {'lr': 0.0003849901102918189, 'samples': 9432960, 'steps': 49129, 'loss/train': 1.6455557346343994} -11/07/2021 04:09:36 - INFO - __main__ - Step 49131: {'lr': 0.00038498564362565826, 'samples': 9433152, 'steps': 49130, 'loss/train': 1.6137969493865967} -11/07/2021 04:09:37 - INFO - __main__ - Step 49132: {'lr': 0.0003849811768986751, 'samples': 9433344, 'steps': 49131, 'loss/train': 1.4530037641525269} -11/07/2021 04:09:37 - INFO - __main__ - Step 49133: {'lr': 0.0003849767101108715, 'samples': 9433536, 'steps': 49132, 'loss/train': 1.8602375984191895} -11/07/2021 04:09:38 - INFO - __main__ - Step 49134: {'lr': 0.0003849722432622495, 'samples': 9433728, 'steps': 49133, 'loss/train': 1.441968321800232} -11/07/2021 04:09:39 - INFO - __main__ - Step 49135: {'lr': 0.0003849677763528111, 'samples': 9433920, 'steps': 49134, 'loss/train': 1.8222562074661255} -11/07/2021 04:09:39 - INFO - __main__ - Step 49136: {'lr': 0.0003849633093825583, 'samples': 9434112, 'steps': 49135, 'loss/train': 1.0792269706726074} -11/07/2021 04:09:39 - INFO - __main__ - Step 49137: {'lr': 0.00038495884235149316, 'samples': 9434304, 'steps': 49136, 'loss/train': 1.2116094827651978} -11/07/2021 04:09:40 - INFO - __main__ - Step 49138: {'lr': 0.0003849543752596176, 'samples': 9434496, 'steps': 49137, 'loss/train': 1.5266435146331787} -11/07/2021 04:09:41 - INFO - __main__ - Step 49139: {'lr': 0.00038494990810693366, 'samples': 9434688, 'steps': 49138, 'loss/train': 1.8355218172073364} -11/07/2021 04:09:41 - INFO - __main__ - Step 49140: {'lr': 0.0003849454408934434, 'samples': 9434880, 'steps': 49139, 'loss/train': 1.7328380346298218} -11/07/2021 04:09:41 - INFO - __main__ - Step 49141: {'lr': 0.0003849409736191488, 'samples': 9435072, 'steps': 49140, 'loss/train': 1.72958505153656} -11/07/2021 04:09:42 - INFO - __main__ - Step 49142: {'lr': 0.00038493650628405196, 'samples': 9435264, 'steps': 49141, 'loss/train': 1.4418506622314453} -11/07/2021 04:09:42 - INFO - __main__ - Step 49143: {'lr': 0.0003849320388881547, 'samples': 9435456, 'steps': 49142, 'loss/train': 1.5139061212539673} -11/07/2021 04:09:43 - INFO - __main__ - Step 49144: {'lr': 0.0003849275714314592, 'samples': 9435648, 'steps': 49143, 'loss/train': 1.3376448154449463} -11/07/2021 04:09:43 - INFO - __main__ - Step 49145: {'lr': 0.0003849231039139674, 'samples': 9435840, 'steps': 49144, 'loss/train': 1.3212387561798096} -11/07/2021 04:09:44 - INFO - __main__ - Step 49146: {'lr': 0.00038491863633568135, 'samples': 9436032, 'steps': 49145, 'loss/train': 1.1440930366516113} -11/07/2021 04:09:44 - INFO - __main__ - Step 49147: {'lr': 0.000384914168696603, 'samples': 9436224, 'steps': 49146, 'loss/train': 1.305210828781128} -11/07/2021 04:09:45 - INFO - __main__ - Step 49148: {'lr': 0.0003849097009967344, 'samples': 9436416, 'steps': 49147, 'loss/train': 1.2001196146011353} -11/07/2021 04:09:46 - INFO - __main__ - Step 49149: {'lr': 0.0003849052332360777, 'samples': 9436608, 'steps': 49148, 'loss/train': 1.4368815422058105} -11/07/2021 04:09:46 - INFO - __main__ - Step 49150: {'lr': 0.0003849007654146347, 'samples': 9436800, 'steps': 49149, 'loss/train': 1.491844654083252} -11/07/2021 04:09:46 - INFO - __main__ - Step 49151: {'lr': 0.0003848962975324074, 'samples': 9436992, 'steps': 49150, 'loss/train': 1.9037903547286987} -11/07/2021 04:09:47 - INFO - __main__ - Step 49152: {'lr': 0.00038489182958939804, 'samples': 9437184, 'steps': 49151, 'loss/train': 1.6102936267852783} -11/07/2021 04:09:47 - INFO - __main__ - Step 49153: {'lr': 0.00038488736158560845, 'samples': 9437376, 'steps': 49152, 'loss/train': 1.3841238021850586} -11/07/2021 04:09:47 - INFO - __main__ - Step 49154: {'lr': 0.00038488289352104065, 'samples': 9437568, 'steps': 49153, 'loss/train': 1.4052152633666992} -11/07/2021 04:09:48 - INFO - __main__ - Step 49155: {'lr': 0.0003848784253956968, 'samples': 9437760, 'steps': 49154, 'loss/train': 1.306625485420227} -11/07/2021 04:09:49 - INFO - __main__ - Step 49156: {'lr': 0.00038487395720957884, 'samples': 9437952, 'steps': 49155, 'loss/train': 1.4390147924423218} -11/07/2021 04:09:49 - INFO - __main__ - Step 49157: {'lr': 0.0003848694889626886, 'samples': 9438144, 'steps': 49156, 'loss/train': 1.962949275970459} -11/07/2021 04:09:49 - INFO - __main__ - Step 49158: {'lr': 0.0003848650206550284, 'samples': 9438336, 'steps': 49157, 'loss/train': 0.8605524897575378} -11/07/2021 04:09:50 - INFO - __main__ - Step 49159: {'lr': 0.0003848605522866, 'samples': 9438528, 'steps': 49158, 'loss/train': 0.9240766167640686} -11/07/2021 04:09:51 - INFO - __main__ - Step 49160: {'lr': 0.00038485608385740555, 'samples': 9438720, 'steps': 49159, 'loss/train': 1.4867128133773804} -11/07/2021 04:09:51 - INFO - __main__ - Step 49161: {'lr': 0.00038485161536744707, 'samples': 9438912, 'steps': 49160, 'loss/train': 1.9888595342636108} -11/07/2021 04:09:52 - INFO - __main__ - Step 49162: {'lr': 0.0003848471468167265, 'samples': 9439104, 'steps': 49161, 'loss/train': 1.83589768409729} -11/07/2021 04:09:52 - INFO - __main__ - Step 49163: {'lr': 0.00038484267820524586, 'samples': 9439296, 'steps': 49162, 'loss/train': 1.7949270009994507} -11/07/2021 04:09:52 - INFO - __main__ - Step 49164: {'lr': 0.00038483820953300724, 'samples': 9439488, 'steps': 49163, 'loss/train': 1.58258855342865} -11/07/2021 04:09:53 - INFO - __main__ - Step 49165: {'lr': 0.00038483374080001254, 'samples': 9439680, 'steps': 49164, 'loss/train': 1.699041485786438} -11/07/2021 04:09:54 - INFO - __main__ - Step 49166: {'lr': 0.00038482927200626386, 'samples': 9439872, 'steps': 49165, 'loss/train': 1.4731369018554688} -11/07/2021 04:09:54 - INFO - __main__ - Step 49167: {'lr': 0.0003848248031517633, 'samples': 9440064, 'steps': 49166, 'loss/train': 1.3327513933181763} -11/07/2021 04:09:54 - INFO - __main__ - Step 49168: {'lr': 0.00038482033423651256, 'samples': 9440256, 'steps': 49167, 'loss/train': 1.5444903373718262} -11/07/2021 04:09:55 - INFO - __main__ - Step 49169: {'lr': 0.00038481586526051406, 'samples': 9440448, 'steps': 49168, 'loss/train': 1.2590073347091675} -11/07/2021 04:09:56 - INFO - __main__ - Step 49170: {'lr': 0.0003848113962237695, 'samples': 9440640, 'steps': 49169, 'loss/train': 1.7843161821365356} -11/07/2021 04:09:56 - INFO - __main__ - Step 49171: {'lr': 0.00038480692712628104, 'samples': 9440832, 'steps': 49170, 'loss/train': 1.728171467781067} -11/07/2021 04:09:57 - INFO - __main__ - Step 49172: {'lr': 0.0003848024579680506, 'samples': 9441024, 'steps': 49171, 'loss/train': 1.5877866744995117} -11/07/2021 04:09:57 - INFO - __main__ - Step 49173: {'lr': 0.00038479798874908026, 'samples': 9441216, 'steps': 49172, 'loss/train': 1.536706566810608} -11/07/2021 04:09:57 - INFO - __main__ - Step 49174: {'lr': 0.00038479351946937206, 'samples': 9441408, 'steps': 49173, 'loss/train': 1.5378828048706055} -11/07/2021 04:09:58 - INFO - __main__ - Step 49175: {'lr': 0.000384789050128928, 'samples': 9441600, 'steps': 49174, 'loss/train': 1.402969479560852} -11/07/2021 04:09:59 - INFO - __main__ - Step 49176: {'lr': 0.0003847845807277501, 'samples': 9441792, 'steps': 49175, 'loss/train': 1.3299713134765625} -11/07/2021 04:09:59 - INFO - __main__ - Step 49177: {'lr': 0.0003847801112658403, 'samples': 9441984, 'steps': 49176, 'loss/train': 1.167944312095642} -11/07/2021 04:09:59 - INFO - __main__ - Step 49178: {'lr': 0.0003847756417432007, 'samples': 9442176, 'steps': 49177, 'loss/train': 1.6673598289489746} -11/07/2021 04:10:00 - INFO - __main__ - Step 49179: {'lr': 0.00038477117215983316, 'samples': 9442368, 'steps': 49178, 'loss/train': 1.6264417171478271} -11/07/2021 04:10:01 - INFO - __main__ - Step 49180: {'lr': 0.0003847667025157399, 'samples': 9442560, 'steps': 49179, 'loss/train': 1.0405162572860718} -11/07/2021 04:10:01 - INFO - __main__ - Step 49181: {'lr': 0.0003847622328109228, 'samples': 9442752, 'steps': 49180, 'loss/train': 1.2665191888809204} -11/07/2021 04:10:01 - INFO - __main__ - Step 49182: {'lr': 0.000384757763045384, 'samples': 9442944, 'steps': 49181, 'loss/train': 1.2967607975006104} -11/07/2021 04:10:02 - INFO - __main__ - Step 49183: {'lr': 0.0003847532932191254, 'samples': 9443136, 'steps': 49182, 'loss/train': 1.3285562992095947} -11/07/2021 04:10:02 - INFO - __main__ - Step 49184: {'lr': 0.000384748823332149, 'samples': 9443328, 'steps': 49183, 'loss/train': 1.5022859573364258} -11/07/2021 04:10:03 - INFO - __main__ - Step 49185: {'lr': 0.0003847443533844569, 'samples': 9443520, 'steps': 49184, 'loss/train': 2.1024880409240723} -11/07/2021 04:10:04 - INFO - __main__ - Step 49186: {'lr': 0.000384739883376051, 'samples': 9443712, 'steps': 49185, 'loss/train': 1.6192253828048706} -11/07/2021 04:10:04 - INFO - __main__ - Step 49187: {'lr': 0.0003847354133069335, 'samples': 9443904, 'steps': 49186, 'loss/train': 1.399524450302124} -11/07/2021 04:10:04 - INFO - __main__ - Step 49188: {'lr': 0.0003847309431771062, 'samples': 9444096, 'steps': 49187, 'loss/train': 1.550622582435608} -11/07/2021 04:10:05 - INFO - __main__ - Step 49189: {'lr': 0.00038472647298657135, 'samples': 9444288, 'steps': 49188, 'loss/train': 1.5158143043518066} -11/07/2021 04:10:05 - INFO - __main__ - Step 49190: {'lr': 0.0003847220027353308, 'samples': 9444480, 'steps': 49189, 'loss/train': 1.0012966394424438} -11/07/2021 04:10:07 - INFO - __main__ - Step 49191: {'lr': 0.0003847175324233865, 'samples': 9444672, 'steps': 49190, 'loss/train': 1.4463376998901367} -11/07/2021 04:10:07 - INFO - __main__ - Step 49192: {'lr': 0.00038471306205074054, 'samples': 9444864, 'steps': 49191, 'loss/train': 1.320358157157898} -11/07/2021 04:10:07 - INFO - __main__ - Step 49193: {'lr': 0.00038470859161739504, 'samples': 9445056, 'steps': 49192, 'loss/train': 1.2056214809417725} -11/07/2021 04:10:08 - INFO - __main__ - Step 49194: {'lr': 0.00038470412112335184, 'samples': 9445248, 'steps': 49193, 'loss/train': 1.3874770402908325} -11/07/2021 04:10:08 - INFO - __main__ - Step 49195: {'lr': 0.0003846996505686131, 'samples': 9445440, 'steps': 49194, 'loss/train': 1.157554268836975} -11/07/2021 04:10:09 - INFO - __main__ - Step 49196: {'lr': 0.00038469517995318083, 'samples': 9445632, 'steps': 49195, 'loss/train': 1.8665660619735718} -11/07/2021 04:10:09 - INFO - __main__ - Step 49197: {'lr': 0.000384690709277057, 'samples': 9445824, 'steps': 49196, 'loss/train': 1.7280787229537964} -11/07/2021 04:10:10 - INFO - __main__ - Step 49198: {'lr': 0.0003846862385402435, 'samples': 9446016, 'steps': 49197, 'loss/train': 0.7833828330039978} -11/07/2021 04:10:10 - INFO - __main__ - Step 49199: {'lr': 0.00038468176774274253, 'samples': 9446208, 'steps': 49198, 'loss/train': 1.6302024126052856} -11/07/2021 04:10:10 - INFO - __main__ - Step 49200: {'lr': 0.000384677296884556, 'samples': 9446400, 'steps': 49199, 'loss/train': 1.3116899728775024} -11/07/2021 04:10:11 - INFO - __main__ - Step 49201: {'lr': 0.000384672825965686, 'samples': 9446592, 'steps': 49200, 'loss/train': 1.413428783416748} -11/07/2021 04:10:12 - INFO - __main__ - Step 49202: {'lr': 0.0003846683549861344, 'samples': 9446784, 'steps': 49201, 'loss/train': 1.2374444007873535} -11/07/2021 04:10:12 - INFO - __main__ - Step 49203: {'lr': 0.00038466388394590344, 'samples': 9446976, 'steps': 49202, 'loss/train': 1.4004100561141968} -11/07/2021 04:10:12 - INFO - __main__ - Step 49204: {'lr': 0.00038465941284499493, 'samples': 9447168, 'steps': 49203, 'loss/train': 1.2180466651916504} -11/07/2021 04:10:13 - INFO - __main__ - Step 49205: {'lr': 0.00038465494168341105, 'samples': 9447360, 'steps': 49204, 'loss/train': 1.7740188837051392} -11/07/2021 04:10:14 - INFO - __main__ - Step 49206: {'lr': 0.00038465047046115365, 'samples': 9447552, 'steps': 49205, 'loss/train': 0.7401227951049805} -11/07/2021 04:10:14 - INFO - __main__ - Step 49207: {'lr': 0.00038464599917822483, 'samples': 9447744, 'steps': 49206, 'loss/train': 1.6348817348480225} -11/07/2021 04:10:15 - INFO - __main__ - Step 49208: {'lr': 0.00038464152783462667, 'samples': 9447936, 'steps': 49207, 'loss/train': 1.5200368165969849} -11/07/2021 04:10:15 - INFO - __main__ - Step 49209: {'lr': 0.0003846370564303611, 'samples': 9448128, 'steps': 49208, 'loss/train': 1.825721263885498} -11/07/2021 04:10:15 - INFO - __main__ - Step 49210: {'lr': 0.00038463258496543014, 'samples': 9448320, 'steps': 49209, 'loss/train': 1.2741966247558594} -11/07/2021 04:10:16 - INFO - __main__ - Step 49211: {'lr': 0.0003846281134398358, 'samples': 9448512, 'steps': 49210, 'loss/train': 1.2416861057281494} -11/07/2021 04:10:17 - INFO - __main__ - Step 49212: {'lr': 0.0003846236418535801, 'samples': 9448704, 'steps': 49211, 'loss/train': 1.73604154586792} -11/07/2021 04:10:17 - INFO - __main__ - Step 49213: {'lr': 0.00038461917020666506, 'samples': 9448896, 'steps': 49212, 'loss/train': 2.193845272064209} -11/07/2021 04:10:17 - INFO - __main__ - Step 49214: {'lr': 0.0003846146984990927, 'samples': 9449088, 'steps': 49213, 'loss/train': 1.6842647790908813} -11/07/2021 04:10:18 - INFO - __main__ - Step 49215: {'lr': 0.00038461022673086506, 'samples': 9449280, 'steps': 49214, 'loss/train': 1.3088513612747192} -11/07/2021 04:10:19 - INFO - __main__ - Step 49216: {'lr': 0.0003846057549019841, 'samples': 9449472, 'steps': 49215, 'loss/train': 1.2411233186721802} -11/07/2021 04:10:19 - INFO - __main__ - Step 49217: {'lr': 0.0003846012830124519, 'samples': 9449664, 'steps': 49216, 'loss/train': 1.495794653892517} -11/07/2021 04:10:19 - INFO - __main__ - Step 49218: {'lr': 0.0003845968110622704, 'samples': 9449856, 'steps': 49217, 'loss/train': 1.6284512281417847} -11/07/2021 04:10:20 - INFO - __main__ - Step 49219: {'lr': 0.0003845923390514417, 'samples': 9450048, 'steps': 49218, 'loss/train': 1.5216821432113647} -11/07/2021 04:10:20 - INFO - __main__ - Step 49220: {'lr': 0.0003845878669799677, 'samples': 9450240, 'steps': 49219, 'loss/train': 1.9224973917007446} -11/07/2021 04:10:21 - INFO - __main__ - Step 49221: {'lr': 0.00038458339484785057, 'samples': 9450432, 'steps': 49220, 'loss/train': 1.6108232736587524} -11/07/2021 04:10:22 - INFO - __main__ - Step 49222: {'lr': 0.00038457892265509214, 'samples': 9450624, 'steps': 49221, 'loss/train': 1.7062171697616577} -11/07/2021 04:10:22 - INFO - __main__ - Step 49223: {'lr': 0.00038457445040169467, 'samples': 9450816, 'steps': 49222, 'loss/train': 0.9867490530014038} -11/07/2021 04:10:22 - INFO - __main__ - Step 49224: {'lr': 0.00038456997808765993, 'samples': 9451008, 'steps': 49223, 'loss/train': 1.5299254655838013} -11/07/2021 04:10:23 - INFO - __main__ - Step 49225: {'lr': 0.00038456550571299, 'samples': 9451200, 'steps': 49224, 'loss/train': 1.4590548276901245} -11/07/2021 04:10:23 - INFO - __main__ - Step 49226: {'lr': 0.000384561033277687, 'samples': 9451392, 'steps': 49225, 'loss/train': 0.8083837628364563} -11/07/2021 04:10:24 - INFO - __main__ - Step 49227: {'lr': 0.00038455656078175283, 'samples': 9451584, 'steps': 49226, 'loss/train': 1.7535966634750366} -11/07/2021 04:10:25 - INFO - __main__ - Step 49228: {'lr': 0.0003845520882251895, 'samples': 9451776, 'steps': 49227, 'loss/train': 1.3637335300445557} -11/07/2021 04:10:25 - INFO - __main__ - Step 49229: {'lr': 0.00038454761560799915, 'samples': 9451968, 'steps': 49228, 'loss/train': 1.4770692586898804} -11/07/2021 04:10:25 - INFO - __main__ - Step 49230: {'lr': 0.0003845431429301838, 'samples': 9452160, 'steps': 49229, 'loss/train': 2.0705811977386475} -11/07/2021 04:10:26 - INFO - __main__ - Step 49231: {'lr': 0.0003845386701917453, 'samples': 9452352, 'steps': 49230, 'loss/train': 1.1304152011871338} -11/07/2021 04:10:27 - INFO - __main__ - Step 49232: {'lr': 0.0003845341973926857, 'samples': 9452544, 'steps': 49231, 'loss/train': 1.4169456958770752} -11/07/2021 04:10:27 - INFO - __main__ - Step 49233: {'lr': 0.0003845297245330071, 'samples': 9452736, 'steps': 49232, 'loss/train': 1.4708280563354492} -11/07/2021 04:10:27 - INFO - __main__ - Step 49234: {'lr': 0.0003845252516127115, 'samples': 9452928, 'steps': 49233, 'loss/train': 1.5530120134353638} -11/07/2021 04:10:28 - INFO - __main__ - Step 49235: {'lr': 0.0003845207786318009, 'samples': 9453120, 'steps': 49234, 'loss/train': 2.7697346210479736} -11/07/2021 04:10:28 - INFO - __main__ - Step 49236: {'lr': 0.0003845163055902773, 'samples': 9453312, 'steps': 49235, 'loss/train': 1.5223881006240845} -11/07/2021 04:10:28 - INFO - __main__ - Step 49237: {'lr': 0.0003845118324881428, 'samples': 9453504, 'steps': 49236, 'loss/train': 1.5188398361206055} -11/07/2021 04:10:29 - INFO - __main__ - Step 49238: {'lr': 0.00038450735932539927, 'samples': 9453696, 'steps': 49237, 'loss/train': 1.7778433561325073} -11/07/2021 04:10:30 - INFO - __main__ - Step 49239: {'lr': 0.0003845028861020488, 'samples': 9453888, 'steps': 49238, 'loss/train': 1.739320993423462} -11/07/2021 04:10:30 - INFO - __main__ - Step 49240: {'lr': 0.0003844984128180934, 'samples': 9454080, 'steps': 49239, 'loss/train': 1.4633797407150269} -11/07/2021 04:10:30 - INFO - __main__ - Step 49241: {'lr': 0.00038449393947353507, 'samples': 9454272, 'steps': 49240, 'loss/train': 1.2488583326339722} -11/07/2021 04:10:31 - INFO - __main__ - Step 49242: {'lr': 0.00038448946606837585, 'samples': 9454464, 'steps': 49241, 'loss/train': 1.33491051197052} -11/07/2021 04:10:32 - INFO - __main__ - Step 49243: {'lr': 0.00038448499260261787, 'samples': 9454656, 'steps': 49242, 'loss/train': 3.0733556747436523} -11/07/2021 04:10:32 - INFO - __main__ - Step 49244: {'lr': 0.0003844805190762629, 'samples': 9454848, 'steps': 49243, 'loss/train': 1.5128308534622192} -11/07/2021 04:10:32 - INFO - __main__ - Step 49245: {'lr': 0.00038447604548931313, 'samples': 9455040, 'steps': 49244, 'loss/train': 1.3653062582015991} -11/07/2021 04:10:33 - INFO - __main__ - Step 49246: {'lr': 0.0003844715718417705, 'samples': 9455232, 'steps': 49245, 'loss/train': 1.8834713697433472} -11/07/2021 04:10:33 - INFO - __main__ - Step 49247: {'lr': 0.0003844670981336371, 'samples': 9455424, 'steps': 49246, 'loss/train': 1.5269482135772705} -11/07/2021 04:10:34 - INFO - __main__ - Step 49248: {'lr': 0.000384462624364915, 'samples': 9455616, 'steps': 49247, 'loss/train': 1.0469377040863037} -11/07/2021 04:10:34 - INFO - __main__ - Step 49249: {'lr': 0.00038445815053560596, 'samples': 9455808, 'steps': 49248, 'loss/train': 1.388178825378418} -11/07/2021 04:10:35 - INFO - __main__ - Step 49250: {'lr': 0.00038445367664571216, 'samples': 9456000, 'steps': 49249, 'loss/train': 1.3149610757827759} -11/07/2021 04:10:35 - INFO - __main__ - Step 49251: {'lr': 0.00038444920269523563, 'samples': 9456192, 'steps': 49250, 'loss/train': 1.2185102701187134} -11/07/2021 04:10:36 - INFO - __main__ - Step 49252: {'lr': 0.0003844447286841783, 'samples': 9456384, 'steps': 49251, 'loss/train': 1.2820465564727783} -11/07/2021 04:10:37 - INFO - __main__ - Step 49253: {'lr': 0.0003844402546125424, 'samples': 9456576, 'steps': 49252, 'loss/train': 1.7159557342529297} -11/07/2021 04:10:37 - INFO - __main__ - Step 49254: {'lr': 0.00038443578048032975, 'samples': 9456768, 'steps': 49253, 'loss/train': 1.5664453506469727} -11/07/2021 04:10:37 - INFO - __main__ - Step 49255: {'lr': 0.0003844313062875423, 'samples': 9456960, 'steps': 49254, 'loss/train': 0.8009182214736938} -11/07/2021 04:10:38 - INFO - __main__ - Step 49256: {'lr': 0.00038442683203418227, 'samples': 9457152, 'steps': 49255, 'loss/train': 1.176375389099121} -11/07/2021 04:10:38 - INFO - __main__ - Step 49257: {'lr': 0.0003844223577202516, 'samples': 9457344, 'steps': 49256, 'loss/train': 0.899752140045166} -11/07/2021 04:10:39 - INFO - __main__ - Step 49258: {'lr': 0.00038441788334575225, 'samples': 9457536, 'steps': 49257, 'loss/train': 1.9049264192581177} -11/07/2021 04:10:39 - INFO - __main__ - Step 49259: {'lr': 0.0003844134089106863, 'samples': 9457728, 'steps': 49258, 'loss/train': 1.2303478717803955} -11/07/2021 04:10:40 - INFO - __main__ - Step 49260: {'lr': 0.00038440893441505573, 'samples': 9457920, 'steps': 49259, 'loss/train': 1.3818678855895996} -11/07/2021 04:10:40 - INFO - __main__ - Step 49261: {'lr': 0.0003844044598588625, 'samples': 9458112, 'steps': 49260, 'loss/train': 1.93372642993927} -11/07/2021 04:10:40 - INFO - __main__ - Step 49262: {'lr': 0.0003843999852421088, 'samples': 9458304, 'steps': 49261, 'loss/train': 1.7044050693511963} -11/07/2021 04:10:41 - INFO - __main__ - Step 49263: {'lr': 0.0003843955105647965, 'samples': 9458496, 'steps': 49262, 'loss/train': 1.1875362396240234} -11/07/2021 04:10:42 - INFO - __main__ - Step 49264: {'lr': 0.0003843910358269277, 'samples': 9458688, 'steps': 49263, 'loss/train': 1.5284796953201294} -11/07/2021 04:10:42 - INFO - __main__ - Step 49265: {'lr': 0.0003843865610285043, 'samples': 9458880, 'steps': 49264, 'loss/train': 1.6451259851455688} -11/07/2021 04:10:42 - INFO - __main__ - Step 49266: {'lr': 0.0003843820861695284, 'samples': 9459072, 'steps': 49265, 'loss/train': 1.1807126998901367} -11/07/2021 04:10:43 - INFO - __main__ - Step 49267: {'lr': 0.00038437761125000204, 'samples': 9459264, 'steps': 49266, 'loss/train': 2.00026273727417} -11/07/2021 04:10:44 - INFO - __main__ - Step 49268: {'lr': 0.00038437313626992723, 'samples': 9459456, 'steps': 49267, 'loss/train': 0.694304347038269} -11/07/2021 04:10:44 - INFO - __main__ - Step 49269: {'lr': 0.0003843686612293059, 'samples': 9459648, 'steps': 49268, 'loss/train': 1.9365851879119873} -11/07/2021 04:10:45 - INFO - __main__ - Step 49270: {'lr': 0.0003843641861281402, 'samples': 9459840, 'steps': 49269, 'loss/train': 1.5159986019134521} -11/07/2021 04:10:45 - INFO - __main__ - Step 49271: {'lr': 0.00038435971096643196, 'samples': 9460032, 'steps': 49270, 'loss/train': 1.4350037574768066} -11/07/2021 04:10:45 - INFO - __main__ - Step 49272: {'lr': 0.00038435523574418336, 'samples': 9460224, 'steps': 49271, 'loss/train': 1.6132951974868774} -11/07/2021 04:10:46 - INFO - __main__ - Step 49273: {'lr': 0.0003843507604613964, 'samples': 9460416, 'steps': 49272, 'loss/train': 1.7995132207870483} -11/07/2021 04:10:47 - INFO - __main__ - Step 49274: {'lr': 0.00038434628511807296, 'samples': 9460608, 'steps': 49273, 'loss/train': 1.0257656574249268} -11/07/2021 04:10:47 - INFO - __main__ - Step 49275: {'lr': 0.00038434180971421523, 'samples': 9460800, 'steps': 49274, 'loss/train': 1.4039250612258911} -11/07/2021 04:10:47 - INFO - __main__ - Step 49276: {'lr': 0.0003843373342498251, 'samples': 9460992, 'steps': 49275, 'loss/train': 1.385812520980835} -11/07/2021 04:10:48 - INFO - __main__ - Step 49277: {'lr': 0.00038433285872490475, 'samples': 9461184, 'steps': 49276, 'loss/train': 1.634580135345459} -11/07/2021 04:10:48 - INFO - __main__ - Step 49278: {'lr': 0.000384328383139456, 'samples': 9461376, 'steps': 49277, 'loss/train': 1.0532727241516113} -11/07/2021 04:10:49 - INFO - __main__ - Step 49279: {'lr': 0.000384323907493481, 'samples': 9461568, 'steps': 49278, 'loss/train': 1.9170868396759033} -11/07/2021 04:10:49 - INFO - __main__ - Step 49280: {'lr': 0.0003843194317869817, 'samples': 9461760, 'steps': 49279, 'loss/train': 1.1617804765701294} -11/07/2021 04:10:50 - INFO - __main__ - Step 49281: {'lr': 0.0003843149560199601, 'samples': 9461952, 'steps': 49280, 'loss/train': 1.3052281141281128} -11/07/2021 04:10:50 - INFO - __main__ - Step 49282: {'lr': 0.0003843104801924183, 'samples': 9462144, 'steps': 49281, 'loss/train': 1.4169832468032837} -11/07/2021 04:10:51 - INFO - __main__ - Step 49283: {'lr': 0.00038430600430435825, 'samples': 9462336, 'steps': 49282, 'loss/train': 1.314243197441101} -11/07/2021 04:10:52 - INFO - __main__ - Step 49284: {'lr': 0.000384301528355782, 'samples': 9462528, 'steps': 49283, 'loss/train': 1.324676275253296} -11/07/2021 04:10:52 - INFO - __main__ - Step 49285: {'lr': 0.00038429705234669157, 'samples': 9462720, 'steps': 49284, 'loss/train': 1.4951428174972534} -11/07/2021 04:10:52 - INFO - __main__ - Step 49286: {'lr': 0.00038429257627708893, 'samples': 9462912, 'steps': 49285, 'loss/train': 1.447383999824524} -11/07/2021 04:10:53 - INFO - __main__ - Step 49287: {'lr': 0.00038428810014697615, 'samples': 9463104, 'steps': 49286, 'loss/train': 1.6952389478683472} -11/07/2021 04:10:53 - INFO - __main__ - Step 49288: {'lr': 0.00038428362395635514, 'samples': 9463296, 'steps': 49287, 'loss/train': 1.4429686069488525} -11/07/2021 04:10:54 - INFO - __main__ - Step 49289: {'lr': 0.0003842791477052281, 'samples': 9463488, 'steps': 49288, 'loss/train': 1.15886390209198} -11/07/2021 04:10:54 - INFO - __main__ - Step 49290: {'lr': 0.00038427467139359696, 'samples': 9463680, 'steps': 49289, 'loss/train': 1.347989559173584} -11/07/2021 04:10:55 - INFO - __main__ - Step 49291: {'lr': 0.00038427019502146364, 'samples': 9463872, 'steps': 49290, 'loss/train': 1.9227449893951416} -11/07/2021 04:10:55 - INFO - __main__ - Step 49292: {'lr': 0.0003842657185888303, 'samples': 9464064, 'steps': 49291, 'loss/train': 0.09805437177419662} -11/07/2021 04:10:56 - INFO - __main__ - Step 49293: {'lr': 0.00038426124209569885, 'samples': 9464256, 'steps': 49292, 'loss/train': 1.6097315549850464} -11/07/2021 04:10:57 - INFO - __main__ - Step 49294: {'lr': 0.00038425676554207133, 'samples': 9464448, 'steps': 49293, 'loss/train': 1.3904743194580078} -11/07/2021 04:10:57 - INFO - __main__ - Step 49295: {'lr': 0.0003842522889279499, 'samples': 9464640, 'steps': 49294, 'loss/train': 1.4921461343765259} -11/07/2021 04:10:57 - INFO - __main__ - Step 49296: {'lr': 0.00038424781225333636, 'samples': 9464832, 'steps': 49295, 'loss/train': 1.443150281906128} -11/07/2021 04:10:58 - INFO - __main__ - Step 49297: {'lr': 0.0003842433355182329, 'samples': 9465024, 'steps': 49296, 'loss/train': 1.2435979843139648} -11/07/2021 04:10:58 - INFO - __main__ - Step 49298: {'lr': 0.0003842388587226414, 'samples': 9465216, 'steps': 49297, 'loss/train': 1.4616177082061768} -11/07/2021 04:10:59 - INFO - __main__ - Step 49299: {'lr': 0.000384234381866564, 'samples': 9465408, 'steps': 49298, 'loss/train': 1.6488696336746216} -11/07/2021 04:10:59 - INFO - __main__ - Step 49300: {'lr': 0.00038422990495000267, 'samples': 9465600, 'steps': 49299, 'loss/train': 1.6438243389129639} -11/07/2021 04:11:00 - INFO - __main__ - Step 49301: {'lr': 0.00038422542797295935, 'samples': 9465792, 'steps': 49300, 'loss/train': 1.4698615074157715} -11/07/2021 04:11:00 - INFO - __main__ - Step 49302: {'lr': 0.0003842209509354362, 'samples': 9465984, 'steps': 49301, 'loss/train': 1.4135884046554565} -11/07/2021 04:11:00 - INFO - __main__ - Step 49303: {'lr': 0.00038421647383743505, 'samples': 9466176, 'steps': 49302, 'loss/train': 1.5925277471542358} -11/07/2021 04:11:01 - INFO - __main__ - Step 49304: {'lr': 0.00038421199667895814, 'samples': 9466368, 'steps': 49303, 'loss/train': 1.4623899459838867} -11/07/2021 04:11:02 - INFO - __main__ - Step 49305: {'lr': 0.0003842075194600073, 'samples': 9466560, 'steps': 49304, 'loss/train': 1.2562298774719238} -11/07/2021 04:11:02 - INFO - __main__ - Step 49306: {'lr': 0.00038420304218058466, 'samples': 9466752, 'steps': 49305, 'loss/train': 1.2742486000061035} -11/07/2021 04:11:03 - INFO - __main__ - Step 49307: {'lr': 0.00038419856484069216, 'samples': 9466944, 'steps': 49306, 'loss/train': 1.4497098922729492} -11/07/2021 04:11:03 - INFO - __main__ - Step 49308: {'lr': 0.0003841940874403319, 'samples': 9467136, 'steps': 49307, 'loss/train': 1.211452603340149} -11/07/2021 04:11:03 - INFO - __main__ - Step 49309: {'lr': 0.0003841896099795058, 'samples': 9467328, 'steps': 49308, 'loss/train': 1.1877186298370361} -11/07/2021 04:11:04 - INFO - __main__ - Step 49310: {'lr': 0.00038418513245821605, 'samples': 9467520, 'steps': 49309, 'loss/train': 1.3652452230453491} -11/07/2021 04:11:05 - INFO - __main__ - Step 49311: {'lr': 0.0003841806548764645, 'samples': 9467712, 'steps': 49310, 'loss/train': 1.6228737831115723} -11/07/2021 04:11:05 - INFO - __main__ - Step 49312: {'lr': 0.0003841761772342531, 'samples': 9467904, 'steps': 49311, 'loss/train': 2.3533477783203125} -11/07/2021 04:11:05 - INFO - __main__ - Step 49313: {'lr': 0.0003841716995315841, 'samples': 9468096, 'steps': 49312, 'loss/train': 1.301640272140503} -11/07/2021 04:11:06 - INFO - __main__ - Step 49314: {'lr': 0.00038416722176845943, 'samples': 9468288, 'steps': 49313, 'loss/train': 1.537453055381775} -11/07/2021 04:11:07 - INFO - __main__ - Step 49315: {'lr': 0.000384162743944881, 'samples': 9468480, 'steps': 49314, 'loss/train': 1.6197184324264526} -11/07/2021 04:11:07 - INFO - __main__ - Step 49316: {'lr': 0.0003841582660608509, 'samples': 9468672, 'steps': 49315, 'loss/train': 1.285697102546692} -11/07/2021 04:11:07 - INFO - __main__ - Step 49317: {'lr': 0.00038415378811637124, 'samples': 9468864, 'steps': 49316, 'loss/train': 1.6587913036346436} -11/07/2021 04:11:08 - INFO - __main__ - Step 49318: {'lr': 0.00038414931011144393, 'samples': 9469056, 'steps': 49317, 'loss/train': 1.7063889503479004} -11/07/2021 04:11:08 - INFO - __main__ - Step 49319: {'lr': 0.000384144832046071, 'samples': 9469248, 'steps': 49318, 'loss/train': 1.5879881381988525} -11/07/2021 04:11:10 - INFO - __main__ - Step 49320: {'lr': 0.0003841403539202545, 'samples': 9469440, 'steps': 49319, 'loss/train': 2.182030439376831} -11/07/2021 04:11:10 - INFO - __main__ - Step 49321: {'lr': 0.00038413587573399635, 'samples': 9469632, 'steps': 49320, 'loss/train': 1.5305895805358887} -11/07/2021 04:11:10 - INFO - __main__ - Step 49322: {'lr': 0.0003841313974872986, 'samples': 9469824, 'steps': 49321, 'loss/train': 1.6020350456237793} -11/07/2021 04:11:11 - INFO - __main__ - Step 49323: {'lr': 0.00038412691918016345, 'samples': 9470016, 'steps': 49322, 'loss/train': 0.9629158973693848} -11/07/2021 04:11:11 - INFO - __main__ - Step 49324: {'lr': 0.00038412244081259273, 'samples': 9470208, 'steps': 49323, 'loss/train': 1.748894214630127} -11/07/2021 04:11:11 - INFO - __main__ - Step 49325: {'lr': 0.00038411796238458853, 'samples': 9470400, 'steps': 49324, 'loss/train': 2.147814989089966} -11/07/2021 04:11:12 - INFO - __main__ - Step 49326: {'lr': 0.00038411348389615286, 'samples': 9470592, 'steps': 49325, 'loss/train': 2.2232298851013184} -11/07/2021 04:11:13 - INFO - __main__ - Step 49327: {'lr': 0.00038410900534728765, 'samples': 9470784, 'steps': 49326, 'loss/train': 1.5854507684707642} -11/07/2021 04:11:13 - INFO - __main__ - Step 49328: {'lr': 0.000384104526737995, 'samples': 9470976, 'steps': 49327, 'loss/train': 1.6244455575942993} -11/07/2021 04:11:13 - INFO - __main__ - Step 49329: {'lr': 0.0003841000480682769, 'samples': 9471168, 'steps': 49328, 'loss/train': 1.4646588563919067} -11/07/2021 04:11:14 - INFO - __main__ - Step 49330: {'lr': 0.0003840955693381355, 'samples': 9471360, 'steps': 49329, 'loss/train': 1.893558382987976} -11/07/2021 04:11:15 - INFO - __main__ - Step 49331: {'lr': 0.0003840910905475726, 'samples': 9471552, 'steps': 49330, 'loss/train': 1.3998960256576538} -11/07/2021 04:11:15 - INFO - __main__ - Step 49332: {'lr': 0.0003840866116965904, 'samples': 9471744, 'steps': 49331, 'loss/train': 1.8675849437713623} -11/07/2021 04:11:15 - INFO - __main__ - Step 49333: {'lr': 0.00038408213278519083, 'samples': 9471936, 'steps': 49332, 'loss/train': 1.5504200458526611} -11/07/2021 04:11:16 - INFO - __main__ - Step 49334: {'lr': 0.0003840776538133759, 'samples': 9472128, 'steps': 49333, 'loss/train': 1.301131248474121} -11/07/2021 04:11:16 - INFO - __main__ - Step 49335: {'lr': 0.00038407317478114764, 'samples': 9472320, 'steps': 49334, 'loss/train': 1.5315876007080078} -11/07/2021 04:11:17 - INFO - __main__ - Step 49336: {'lr': 0.00038406869568850805, 'samples': 9472512, 'steps': 49335, 'loss/train': 0.8331318497657776} -11/07/2021 04:11:18 - INFO - __main__ - Step 49337: {'lr': 0.00038406421653545926, 'samples': 9472704, 'steps': 49336, 'loss/train': 1.8083441257476807} -11/07/2021 04:11:18 - INFO - __main__ - Step 49338: {'lr': 0.00038405973732200317, 'samples': 9472896, 'steps': 49337, 'loss/train': 1.7773988246917725} -11/07/2021 04:11:18 - INFO - __main__ - Step 49339: {'lr': 0.0003840552580481418, 'samples': 9473088, 'steps': 49338, 'loss/train': 1.477247714996338} -11/07/2021 04:11:19 - INFO - __main__ - Step 49340: {'lr': 0.00038405077871387716, 'samples': 9473280, 'steps': 49339, 'loss/train': 1.6360654830932617} -11/07/2021 04:11:19 - INFO - __main__ - Step 49341: {'lr': 0.00038404629931921137, 'samples': 9473472, 'steps': 49340, 'loss/train': 5.7670135498046875} -11/07/2021 04:11:20 - INFO - __main__ - Step 49342: {'lr': 0.0003840418198641463, 'samples': 9473664, 'steps': 49341, 'loss/train': 1.1676645278930664} -11/07/2021 04:11:20 - INFO - __main__ - Step 49343: {'lr': 0.0003840373403486842, 'samples': 9473856, 'steps': 49342, 'loss/train': 1.524045467376709} -11/07/2021 04:11:21 - INFO - __main__ - Step 49344: {'lr': 0.0003840328607728269, 'samples': 9474048, 'steps': 49343, 'loss/train': 1.4302656650543213} -11/07/2021 04:11:21 - INFO - __main__ - Step 49345: {'lr': 0.0003840283811365764, 'samples': 9474240, 'steps': 49344, 'loss/train': 1.4958720207214355} -11/07/2021 04:11:21 - INFO - __main__ - Step 49346: {'lr': 0.00038402390143993484, 'samples': 9474432, 'steps': 49345, 'loss/train': 1.3384087085723877} -11/07/2021 04:11:23 - INFO - __main__ - Step 49347: {'lr': 0.0003840194216829042, 'samples': 9474624, 'steps': 49346, 'loss/train': 1.161323070526123} -11/07/2021 04:11:23 - INFO - __main__ - Step 49348: {'lr': 0.00038401494186548633, 'samples': 9474816, 'steps': 49347, 'loss/train': 1.4390065670013428} -11/07/2021 04:11:23 - INFO - __main__ - Step 49349: {'lr': 0.0003840104619876835, 'samples': 9475008, 'steps': 49348, 'loss/train': 1.1753920316696167} -11/07/2021 04:11:24 - INFO - __main__ - Step 49350: {'lr': 0.0003840059820494976, 'samples': 9475200, 'steps': 49349, 'loss/train': 1.6433159112930298} -11/07/2021 04:11:24 - INFO - __main__ - Step 49351: {'lr': 0.00038400150205093075, 'samples': 9475392, 'steps': 49350, 'loss/train': 1.245421290397644} -11/07/2021 04:11:24 - INFO - __main__ - Step 49352: {'lr': 0.00038399702199198486, 'samples': 9475584, 'steps': 49351, 'loss/train': 0.9821666479110718} -11/07/2021 04:11:25 - INFO - __main__ - Step 49353: {'lr': 0.00038399254187266186, 'samples': 9475776, 'steps': 49352, 'loss/train': 1.5022464990615845} -11/07/2021 04:11:26 - INFO - __main__ - Step 49354: {'lr': 0.000383988061692964, 'samples': 9475968, 'steps': 49353, 'loss/train': 1.3901777267456055} -11/07/2021 04:11:26 - INFO - __main__ - Step 49355: {'lr': 0.0003839835814528931, 'samples': 9476160, 'steps': 49354, 'loss/train': 1.644857406616211} -11/07/2021 04:11:26 - INFO - __main__ - Step 49356: {'lr': 0.0003839791011524514, 'samples': 9476352, 'steps': 49355, 'loss/train': 1.5316932201385498} -11/07/2021 04:11:27 - INFO - __main__ - Step 49357: {'lr': 0.0003839746207916407, 'samples': 9476544, 'steps': 49356, 'loss/train': 1.4775909185409546} -11/07/2021 04:11:28 - INFO - __main__ - Step 49358: {'lr': 0.0003839701403704631, 'samples': 9476736, 'steps': 49357, 'loss/train': 1.4452733993530273} -11/07/2021 04:11:28 - INFO - __main__ - Step 49359: {'lr': 0.00038396565988892063, 'samples': 9476928, 'steps': 49358, 'loss/train': 0.7642771601676941} -11/07/2021 04:11:28 - INFO - __main__ - Step 49360: {'lr': 0.00038396117934701537, 'samples': 9477120, 'steps': 49359, 'loss/train': 1.2526742219924927} -11/07/2021 04:11:29 - INFO - __main__ - Step 49361: {'lr': 0.00038395669874474915, 'samples': 9477312, 'steps': 49360, 'loss/train': 1.5693467855453491} -11/07/2021 04:11:29 - INFO - __main__ - Step 49362: {'lr': 0.00038395221808212415, 'samples': 9477504, 'steps': 49361, 'loss/train': 1.4363118410110474} -11/07/2021 04:11:30 - INFO - __main__ - Step 49363: {'lr': 0.0003839477373591423, 'samples': 9477696, 'steps': 49362, 'loss/train': 1.6547024250030518} -11/07/2021 04:11:31 - INFO - __main__ - Step 49364: {'lr': 0.0003839432565758059, 'samples': 9477888, 'steps': 49363, 'loss/train': 1.3071367740631104} -11/07/2021 04:11:31 - INFO - __main__ - Step 49365: {'lr': 0.0003839387757321165, 'samples': 9478080, 'steps': 49364, 'loss/train': 1.572064995765686} -11/07/2021 04:11:31 - INFO - __main__ - Step 49366: {'lr': 0.0003839342948280764, 'samples': 9478272, 'steps': 49365, 'loss/train': 1.5092639923095703} -11/07/2021 04:11:32 - INFO - __main__ - Step 49367: {'lr': 0.00038392981386368763, 'samples': 9478464, 'steps': 49366, 'loss/train': 1.7656980752944946} -11/07/2021 04:11:33 - INFO - __main__ - Step 49368: {'lr': 0.0003839253328389521, 'samples': 9478656, 'steps': 49367, 'loss/train': 1.7381960153579712} -11/07/2021 04:11:33 - INFO - __main__ - Step 49369: {'lr': 0.00038392085175387186, 'samples': 9478848, 'steps': 49368, 'loss/train': 1.2247587442398071} -11/07/2021 04:11:33 - INFO - __main__ - Step 49370: {'lr': 0.000383916370608449, 'samples': 9479040, 'steps': 49369, 'loss/train': 1.2737410068511963} -11/07/2021 04:11:34 - INFO - __main__ - Step 49371: {'lr': 0.0003839118894026855, 'samples': 9479232, 'steps': 49370, 'loss/train': 1.4327012300491333} -11/07/2021 04:11:34 - INFO - __main__ - Step 49372: {'lr': 0.0003839074081365833, 'samples': 9479424, 'steps': 49371, 'loss/train': 1.0670971870422363} -11/07/2021 04:11:35 - INFO - __main__ - Step 49373: {'lr': 0.0003839029268101446, 'samples': 9479616, 'steps': 49372, 'loss/train': 1.4543306827545166} -11/07/2021 04:11:36 - INFO - __main__ - Step 49374: {'lr': 0.00038389844542337123, 'samples': 9479808, 'steps': 49373, 'loss/train': 1.070849895477295} -11/07/2021 04:11:36 - INFO - __main__ - Step 49375: {'lr': 0.0003838939639762653, 'samples': 9480000, 'steps': 49374, 'loss/train': 1.360690951347351} -11/07/2021 04:11:36 - INFO - __main__ - Step 49376: {'lr': 0.00038388948246882883, 'samples': 9480192, 'steps': 49375, 'loss/train': 1.9821124076843262} -11/07/2021 04:11:37 - INFO - __main__ - Step 49377: {'lr': 0.0003838850009010638, 'samples': 9480384, 'steps': 49376, 'loss/train': 1.5155435800552368} -11/07/2021 04:11:38 - INFO - __main__ - Step 49378: {'lr': 0.0003838805192729723, 'samples': 9480576, 'steps': 49377, 'loss/train': 1.7489532232284546} -11/07/2021 04:11:38 - INFO - __main__ - Step 49379: {'lr': 0.00038387603758455624, 'samples': 9480768, 'steps': 49378, 'loss/train': 1.4840288162231445} -11/07/2021 04:11:38 - INFO - __main__ - Step 49380: {'lr': 0.00038387155583581773, 'samples': 9480960, 'steps': 49379, 'loss/train': 1.4947314262390137} -11/07/2021 04:11:39 - INFO - __main__ - Step 49381: {'lr': 0.00038386707402675877, 'samples': 9481152, 'steps': 49380, 'loss/train': 1.3950653076171875} -11/07/2021 04:11:39 - INFO - __main__ - Step 49382: {'lr': 0.00038386259215738135, 'samples': 9481344, 'steps': 49381, 'loss/train': 1.6808557510375977} -11/07/2021 04:11:40 - INFO - __main__ - Step 49383: {'lr': 0.0003838581102276876, 'samples': 9481536, 'steps': 49382, 'loss/train': 1.1713740825653076} -11/07/2021 04:11:40 - INFO - __main__ - Step 49384: {'lr': 0.00038385362823767935, 'samples': 9481728, 'steps': 49383, 'loss/train': 1.228548526763916} -11/07/2021 04:11:41 - INFO - __main__ - Step 49385: {'lr': 0.00038384914618735873, 'samples': 9481920, 'steps': 49384, 'loss/train': 1.4046412706375122} -11/07/2021 04:11:41 - INFO - __main__ - Step 49386: {'lr': 0.0003838446640767278, 'samples': 9482112, 'steps': 49385, 'loss/train': 1.7546875476837158} -11/07/2021 04:11:41 - INFO - __main__ - Step 49387: {'lr': 0.00038384018190578843, 'samples': 9482304, 'steps': 49386, 'loss/train': 1.4690765142440796} -11/07/2021 04:11:42 - INFO - __main__ - Step 49388: {'lr': 0.0003838356996745429, 'samples': 9482496, 'steps': 49387, 'loss/train': 0.9885172843933105} -11/07/2021 04:11:43 - INFO - __main__ - Step 49389: {'lr': 0.00038383121738299296, 'samples': 9482688, 'steps': 49388, 'loss/train': 1.657820463180542} -11/07/2021 04:11:43 - INFO - __main__ - Step 49390: {'lr': 0.00038382673503114075, 'samples': 9482880, 'steps': 49389, 'loss/train': 1.3290120363235474} -11/07/2021 04:11:44 - INFO - __main__ - Step 49391: {'lr': 0.0003838222526189883, 'samples': 9483072, 'steps': 49390, 'loss/train': 1.2781789302825928} -11/07/2021 04:11:44 - INFO - __main__ - Step 49392: {'lr': 0.0003838177701465376, 'samples': 9483264, 'steps': 49391, 'loss/train': 1.478083848953247} -11/07/2021 04:11:44 - INFO - __main__ - Step 49393: {'lr': 0.00038381328761379063, 'samples': 9483456, 'steps': 49392, 'loss/train': 2.3239057064056396} -11/07/2021 04:11:46 - INFO - __main__ - Step 49394: {'lr': 0.0003838088050207496, 'samples': 9483648, 'steps': 49393, 'loss/train': 1.419954776763916} -11/07/2021 04:11:46 - INFO - __main__ - Step 49395: {'lr': 0.00038380432236741625, 'samples': 9483840, 'steps': 49394, 'loss/train': 1.784666657447815} -11/07/2021 04:11:46 - INFO - __main__ - Step 49396: {'lr': 0.0003837998396537927, 'samples': 9484032, 'steps': 49395, 'loss/train': 0.4355214238166809} -11/07/2021 04:11:47 - INFO - __main__ - Step 49397: {'lr': 0.0003837953568798811, 'samples': 9484224, 'steps': 49396, 'loss/train': 1.6687462329864502} -11/07/2021 04:11:47 - INFO - __main__ - Step 49398: {'lr': 0.00038379087404568333, 'samples': 9484416, 'steps': 49397, 'loss/train': 1.2138727903366089} -11/07/2021 04:11:48 - INFO - __main__ - Step 49399: {'lr': 0.00038378639115120154, 'samples': 9484608, 'steps': 49398, 'loss/train': 1.3672698736190796} -11/07/2021 04:11:48 - INFO - __main__ - Step 49400: {'lr': 0.0003837819081964377, 'samples': 9484800, 'steps': 49399, 'loss/train': 1.1022813320159912} -11/07/2021 04:11:49 - INFO - __main__ - Step 49401: {'lr': 0.0003837774251813936, 'samples': 9484992, 'steps': 49400, 'loss/train': 1.3086178302764893} -11/07/2021 04:11:49 - INFO - __main__ - Step 49402: {'lr': 0.0003837729421060716, 'samples': 9485184, 'steps': 49401, 'loss/train': 1.7074296474456787} -11/07/2021 04:11:49 - INFO - __main__ - Step 49403: {'lr': 0.00038376845897047354, 'samples': 9485376, 'steps': 49402, 'loss/train': 0.9208493828773499} -11/07/2021 04:11:50 - INFO - __main__ - Step 49404: {'lr': 0.00038376397577460144, 'samples': 9485568, 'steps': 49403, 'loss/train': 1.593536376953125} -11/07/2021 04:11:51 - INFO - __main__ - Step 49405: {'lr': 0.00038375949251845745, 'samples': 9485760, 'steps': 49404, 'loss/train': 1.5746198892593384} -11/07/2021 04:11:51 - INFO - __main__ - Step 49406: {'lr': 0.0003837550092020434, 'samples': 9485952, 'steps': 49405, 'loss/train': 1.6538019180297852} -11/07/2021 04:11:52 - INFO - __main__ - Step 49407: {'lr': 0.0003837505258253615, 'samples': 9486144, 'steps': 49406, 'loss/train': 1.4615103006362915} -11/07/2021 04:11:52 - INFO - __main__ - Step 49408: {'lr': 0.0003837460423884136, 'samples': 9486336, 'steps': 49407, 'loss/train': 1.2624928951263428} -11/07/2021 04:11:53 - INFO - __main__ - Step 49409: {'lr': 0.00038374155889120176, 'samples': 9486528, 'steps': 49408, 'loss/train': 1.5209566354751587} -11/07/2021 04:11:53 - INFO - __main__ - Step 49410: {'lr': 0.0003837370753337281, 'samples': 9486720, 'steps': 49409, 'loss/train': 1.5793596506118774} -11/07/2021 04:11:54 - INFO - __main__ - Step 49411: {'lr': 0.00038373259171599463, 'samples': 9486912, 'steps': 49410, 'loss/train': 1.3892780542373657} -11/07/2021 04:11:54 - INFO - __main__ - Step 49412: {'lr': 0.0003837281080380033, 'samples': 9487104, 'steps': 49411, 'loss/train': 1.6055463552474976} -11/07/2021 04:11:54 - INFO - __main__ - Step 49413: {'lr': 0.00038372362429975603, 'samples': 9487296, 'steps': 49412, 'loss/train': 1.5732831954956055} -11/07/2021 04:11:55 - INFO - __main__ - Step 49414: {'lr': 0.0003837191405012551, 'samples': 9487488, 'steps': 49413, 'loss/train': 1.428322434425354} -11/07/2021 04:11:56 - INFO - __main__ - Step 49415: {'lr': 0.00038371465664250226, 'samples': 9487680, 'steps': 49414, 'loss/train': 1.847044825553894} -11/07/2021 04:11:56 - INFO - __main__ - Step 49416: {'lr': 0.0003837101727234997, 'samples': 9487872, 'steps': 49415, 'loss/train': 1.5304168462753296} -11/07/2021 04:11:56 - INFO - __main__ - Step 49417: {'lr': 0.0003837056887442495, 'samples': 9488064, 'steps': 49416, 'loss/train': 1.2969977855682373} -11/07/2021 04:11:57 - INFO - __main__ - Step 49418: {'lr': 0.00038370120470475355, 'samples': 9488256, 'steps': 49417, 'loss/train': 1.2422821521759033} -11/07/2021 04:11:58 - INFO - __main__ - Step 49419: {'lr': 0.0003836967206050138, 'samples': 9488448, 'steps': 49418, 'loss/train': 1.557572841644287} -11/07/2021 04:11:58 - INFO - __main__ - Step 49420: {'lr': 0.0003836922364450325, 'samples': 9488640, 'steps': 49419, 'loss/train': 1.4618909358978271} -11/07/2021 04:11:58 - INFO - __main__ - Step 49421: {'lr': 0.0003836877522248114, 'samples': 9488832, 'steps': 49420, 'loss/train': 3.2358062267303467} -11/07/2021 04:11:59 - INFO - __main__ - Step 49422: {'lr': 0.0003836832679443527, 'samples': 9489024, 'steps': 49421, 'loss/train': 1.930889368057251} -11/07/2021 04:11:59 - INFO - __main__ - Step 49423: {'lr': 0.00038367878360365845, 'samples': 9489216, 'steps': 49422, 'loss/train': 1.6684209108352661} -11/07/2021 04:12:00 - INFO - __main__ - Step 49424: {'lr': 0.00038367429920273054, 'samples': 9489408, 'steps': 49423, 'loss/train': 1.5331238508224487} -11/07/2021 04:12:01 - INFO - __main__ - Step 49425: {'lr': 0.00038366981474157114, 'samples': 9489600, 'steps': 49424, 'loss/train': 1.2940645217895508} -11/07/2021 04:12:01 - INFO - __main__ - Step 49426: {'lr': 0.00038366533022018214, 'samples': 9489792, 'steps': 49425, 'loss/train': 1.228728175163269} -11/07/2021 04:12:01 - INFO - __main__ - Step 49427: {'lr': 0.0003836608456385655, 'samples': 9489984, 'steps': 49426, 'loss/train': 2.0489604473114014} -11/07/2021 04:12:02 - INFO - __main__ - Step 49428: {'lr': 0.00038365636099672347, 'samples': 9490176, 'steps': 49427, 'loss/train': 0.9330426454544067} -11/07/2021 04:12:02 - INFO - __main__ - Step 49429: {'lr': 0.0003836518762946579, 'samples': 9490368, 'steps': 49428, 'loss/train': 1.604009747505188} -11/07/2021 04:12:03 - INFO - __main__ - Step 49430: {'lr': 0.0003836473915323709, 'samples': 9490560, 'steps': 49429, 'loss/train': 1.3320634365081787} -11/07/2021 04:12:03 - INFO - __main__ - Step 49431: {'lr': 0.0003836429067098645, 'samples': 9490752, 'steps': 49430, 'loss/train': 2.4549779891967773} -11/07/2021 04:12:04 - INFO - __main__ - Step 49432: {'lr': 0.0003836384218271405, 'samples': 9490944, 'steps': 49431, 'loss/train': 1.0012286901474} -11/07/2021 04:12:04 - INFO - __main__ - Step 49433: {'lr': 0.00038363393688420116, 'samples': 9491136, 'steps': 49432, 'loss/train': 1.3346449136734009} -11/07/2021 04:12:05 - INFO - __main__ - Step 49434: {'lr': 0.0003836294518810485, 'samples': 9491328, 'steps': 49433, 'loss/train': 1.3577319383621216} -11/07/2021 04:12:05 - INFO - __main__ - Step 49435: {'lr': 0.00038362496681768434, 'samples': 9491520, 'steps': 49434, 'loss/train': 1.2545278072357178} -11/07/2021 04:12:06 - INFO - __main__ - Step 49436: {'lr': 0.0003836204816941109, 'samples': 9491712, 'steps': 49435, 'loss/train': 1.6246488094329834} -11/07/2021 04:12:06 - INFO - __main__ - Step 49437: {'lr': 0.0003836159965103301, 'samples': 9491904, 'steps': 49436, 'loss/train': 1.687782883644104} -11/07/2021 04:12:07 - INFO - __main__ - Step 49438: {'lr': 0.0003836115112663441, 'samples': 9492096, 'steps': 49437, 'loss/train': 1.801659345626831} -11/07/2021 04:12:07 - INFO - __main__ - Step 49439: {'lr': 0.0003836070259621548, 'samples': 9492288, 'steps': 49438, 'loss/train': 1.387070655822754} -11/07/2021 04:12:08 - INFO - __main__ - Step 49440: {'lr': 0.0003836025405977641, 'samples': 9492480, 'steps': 49439, 'loss/train': 1.3248119354248047} -11/07/2021 04:12:08 - INFO - __main__ - Step 49441: {'lr': 0.00038359805517317427, 'samples': 9492672, 'steps': 49440, 'loss/train': 1.3795644044876099} -11/07/2021 04:12:09 - INFO - __main__ - Step 49442: {'lr': 0.00038359356968838723, 'samples': 9492864, 'steps': 49441, 'loss/train': 1.2761085033416748} -11/07/2021 04:12:09 - INFO - __main__ - Step 49443: {'lr': 0.00038358908414340485, 'samples': 9493056, 'steps': 49442, 'loss/train': 1.6001322269439697} -11/07/2021 04:12:09 - INFO - __main__ - Step 49444: {'lr': 0.0003835845985382294, 'samples': 9493248, 'steps': 49443, 'loss/train': 1.4786072969436646} -11/07/2021 04:12:10 - INFO - __main__ - Step 49445: {'lr': 0.00038358011287286287, 'samples': 9493440, 'steps': 49444, 'loss/train': 0.9966360330581665} -11/07/2021 04:12:11 - INFO - __main__ - Step 49446: {'lr': 0.0003835756271473071, 'samples': 9493632, 'steps': 49445, 'loss/train': 1.651698112487793} -11/07/2021 04:12:11 - INFO - __main__ - Step 49447: {'lr': 0.0003835711413615642, 'samples': 9493824, 'steps': 49446, 'loss/train': 1.3871666193008423} -11/07/2021 04:12:11 - INFO - __main__ - Step 49448: {'lr': 0.0003835666555156362, 'samples': 9494016, 'steps': 49447, 'loss/train': 1.2935926914215088} -11/07/2021 04:12:12 - INFO - __main__ - Step 49449: {'lr': 0.00038356216960952515, 'samples': 9494208, 'steps': 49448, 'loss/train': 1.6006450653076172} -11/07/2021 04:12:13 - INFO - __main__ - Step 49450: {'lr': 0.0003835576836432331, 'samples': 9494400, 'steps': 49449, 'loss/train': 0.46942609548568726} -11/07/2021 04:12:13 - INFO - __main__ - Step 49451: {'lr': 0.000383553197616762, 'samples': 9494592, 'steps': 49450, 'loss/train': 1.724548101425171} -11/07/2021 04:12:14 - INFO - __main__ - Step 49452: {'lr': 0.00038354871153011385, 'samples': 9494784, 'steps': 49451, 'loss/train': 1.2632355690002441} -11/07/2021 04:12:14 - INFO - __main__ - Step 49453: {'lr': 0.0003835442253832907, 'samples': 9494976, 'steps': 49452, 'loss/train': 1.3236713409423828} -11/07/2021 04:12:14 - INFO - __main__ - Step 49454: {'lr': 0.00038353973917629457, 'samples': 9495168, 'steps': 49453, 'loss/train': 1.5322283506393433} -11/07/2021 04:12:15 - INFO - __main__ - Step 49455: {'lr': 0.0003835352529091275, 'samples': 9495360, 'steps': 49454, 'loss/train': 1.0614477396011353} -11/07/2021 04:12:16 - INFO - __main__ - Step 49456: {'lr': 0.0003835307665817915, 'samples': 9495552, 'steps': 49455, 'loss/train': 1.7836710214614868} -11/07/2021 04:12:16 - INFO - __main__ - Step 49457: {'lr': 0.0003835262801942887, 'samples': 9495744, 'steps': 49456, 'loss/train': 0.15671800076961517} -11/07/2021 04:12:17 - INFO - __main__ - Step 49458: {'lr': 0.000383521793746621, 'samples': 9495936, 'steps': 49457, 'loss/train': 1.6529656648635864} -11/07/2021 04:12:17 - INFO - __main__ - Step 49459: {'lr': 0.00038351730723879034, 'samples': 9496128, 'steps': 49458, 'loss/train': 1.468443751335144} -11/07/2021 04:12:17 - INFO - __main__ - Step 49460: {'lr': 0.0003835128206707989, 'samples': 9496320, 'steps': 49459, 'loss/train': 1.6167665719985962} -11/07/2021 04:12:18 - INFO - __main__ - Step 49461: {'lr': 0.00038350833404264865, 'samples': 9496512, 'steps': 49460, 'loss/train': 1.1963554620742798} -11/07/2021 04:12:19 - INFO - __main__ - Step 49462: {'lr': 0.0003835038473543416, 'samples': 9496704, 'steps': 49461, 'loss/train': 1.8096206188201904} -11/07/2021 04:12:19 - INFO - __main__ - Step 49463: {'lr': 0.0003834993606058798, 'samples': 9496896, 'steps': 49462, 'loss/train': 1.7199034690856934} -11/07/2021 04:12:19 - INFO - __main__ - Step 49464: {'lr': 0.00038349487379726513, 'samples': 9497088, 'steps': 49463, 'loss/train': 1.3855326175689697} -11/07/2021 04:12:20 - INFO - __main__ - Step 49465: {'lr': 0.0003834903869284999, 'samples': 9497280, 'steps': 49464, 'loss/train': 1.2433205842971802} -11/07/2021 04:12:21 - INFO - __main__ - Step 49466: {'lr': 0.00038348589999958585, 'samples': 9497472, 'steps': 49465, 'loss/train': 1.5063279867172241} -11/07/2021 04:12:21 - INFO - __main__ - Step 49467: {'lr': 0.00038348141301052505, 'samples': 9497664, 'steps': 49466, 'loss/train': 1.8365730047225952} -11/07/2021 04:12:21 - INFO - __main__ - Step 49468: {'lr': 0.00038347692596131977, 'samples': 9497856, 'steps': 49467, 'loss/train': 1.5028265714645386} -11/07/2021 04:12:22 - INFO - __main__ - Step 49469: {'lr': 0.0003834724388519717, 'samples': 9498048, 'steps': 49468, 'loss/train': 1.3604669570922852} -11/07/2021 04:12:22 - INFO - __main__ - Step 49470: {'lr': 0.00038346795168248306, 'samples': 9498240, 'steps': 49469, 'loss/train': 1.525028944015503} -11/07/2021 04:12:23 - INFO - __main__ - Step 49471: {'lr': 0.00038346346445285585, 'samples': 9498432, 'steps': 49470, 'loss/train': 1.1660608053207397} -11/07/2021 04:12:24 - INFO - __main__ - Step 49472: {'lr': 0.0003834589771630921, 'samples': 9498624, 'steps': 49471, 'loss/train': 1.2024121284484863} -11/07/2021 04:12:24 - INFO - __main__ - Step 49473: {'lr': 0.0003834544898131936, 'samples': 9498816, 'steps': 49472, 'loss/train': 1.4175405502319336} -11/07/2021 04:12:25 - INFO - __main__ - Step 49474: {'lr': 0.00038345000240316276, 'samples': 9499008, 'steps': 49473, 'loss/train': 1.046689748764038} -11/07/2021 04:12:25 - INFO - __main__ - Step 49475: {'lr': 0.00038344551493300135, 'samples': 9499200, 'steps': 49474, 'loss/train': 1.3881487846374512} -11/07/2021 04:12:26 - INFO - __main__ - Step 49476: {'lr': 0.00038344102740271144, 'samples': 9499392, 'steps': 49475, 'loss/train': 1.2882369756698608} -11/07/2021 04:12:26 - INFO - __main__ - Step 49477: {'lr': 0.00038343653981229504, 'samples': 9499584, 'steps': 49476, 'loss/train': 1.7036164999008179} -11/07/2021 04:12:27 - INFO - __main__ - Step 49478: {'lr': 0.00038343205216175426, 'samples': 9499776, 'steps': 49477, 'loss/train': 0.9137195348739624} -11/07/2021 04:12:27 - INFO - __main__ - Step 49479: {'lr': 0.000383427564451091, 'samples': 9499968, 'steps': 49478, 'loss/train': 1.1925657987594604} -11/07/2021 04:12:27 - INFO - __main__ - Step 49480: {'lr': 0.00038342307668030737, 'samples': 9500160, 'steps': 49479, 'loss/train': 1.835159182548523} -11/07/2021 04:12:28 - INFO - __main__ - Step 49481: {'lr': 0.0003834185888494053, 'samples': 9500352, 'steps': 49480, 'loss/train': 1.017730951309204} -11/07/2021 04:12:29 - INFO - __main__ - Step 49482: {'lr': 0.00038341410095838694, 'samples': 9500544, 'steps': 49481, 'loss/train': 1.4684760570526123} -11/07/2021 04:12:29 - INFO - __main__ - Step 49483: {'lr': 0.0003834096130072542, 'samples': 9500736, 'steps': 49482, 'loss/train': 1.460621953010559} -11/07/2021 04:12:29 - INFO - __main__ - Step 49484: {'lr': 0.00038340512499600917, 'samples': 9500928, 'steps': 49483, 'loss/train': 0.677061915397644} -11/07/2021 04:12:30 - INFO - __main__ - Step 49485: {'lr': 0.00038340063692465386, 'samples': 9501120, 'steps': 49484, 'loss/train': 0.8293577432632446} -11/07/2021 04:12:30 - INFO - __main__ - Step 49486: {'lr': 0.00038339614879319027, 'samples': 9501312, 'steps': 49485, 'loss/train': 1.5253651142120361} -11/07/2021 04:12:31 - INFO - __main__ - Step 49487: {'lr': 0.00038339166060162046, 'samples': 9501504, 'steps': 49486, 'loss/train': 1.2394787073135376} -11/07/2021 04:12:31 - INFO - __main__ - Step 49488: {'lr': 0.00038338717234994633, 'samples': 9501696, 'steps': 49487, 'loss/train': 0.6876512765884399} -11/07/2021 04:12:32 - INFO - __main__ - Step 49489: {'lr': 0.0003833826840381701, 'samples': 9501888, 'steps': 49488, 'loss/train': 1.709553599357605} -11/07/2021 04:12:32 - INFO - __main__ - Step 49490: {'lr': 0.00038337819566629363, 'samples': 9502080, 'steps': 49489, 'loss/train': 2.0343925952911377} -11/07/2021 04:12:33 - INFO - __main__ - Step 49491: {'lr': 0.000383373707234319, 'samples': 9502272, 'steps': 49490, 'loss/train': 1.097631573677063} -11/07/2021 04:12:34 - INFO - __main__ - Step 49492: {'lr': 0.0003833692187422483, 'samples': 9502464, 'steps': 49491, 'loss/train': 1.8399280309677124} -11/07/2021 04:12:34 - INFO - __main__ - Step 49493: {'lr': 0.0003833647301900835, 'samples': 9502656, 'steps': 49492, 'loss/train': 1.6749378442764282} -11/07/2021 04:12:34 - INFO - __main__ - Step 49494: {'lr': 0.00038336024157782655, 'samples': 9502848, 'steps': 49493, 'loss/train': 1.6002864837646484} -11/07/2021 04:12:35 - INFO - __main__ - Step 49495: {'lr': 0.00038335575290547954, 'samples': 9503040, 'steps': 49494, 'loss/train': 1.5806015729904175} -11/07/2021 04:12:35 - INFO - __main__ - Step 49496: {'lr': 0.0003833512641730445, 'samples': 9503232, 'steps': 49495, 'loss/train': 0.9982802867889404} -11/07/2021 04:12:36 - INFO - __main__ - Step 49497: {'lr': 0.0003833467753805234, 'samples': 9503424, 'steps': 49496, 'loss/train': 1.2644473314285278} -11/07/2021 04:12:36 - INFO - __main__ - Step 49498: {'lr': 0.00038334228652791837, 'samples': 9503616, 'steps': 49497, 'loss/train': 1.4780821800231934} -11/07/2021 04:12:37 - INFO - __main__ - Step 49499: {'lr': 0.00038333779761523133, 'samples': 9503808, 'steps': 49498, 'loss/train': 1.47004234790802} -11/07/2021 04:12:37 - INFO - __main__ - Step 49500: {'lr': 0.0003833333086424643, 'samples': 9504000, 'steps': 49499, 'loss/train': 1.6942075490951538} -11/07/2021 04:12:38 - INFO - __main__ - Step 49501: {'lr': 0.00038332881960961943, 'samples': 9504192, 'steps': 49500, 'loss/train': 1.52151620388031} -11/07/2021 04:12:38 - INFO - __main__ - Step 49502: {'lr': 0.0003833243305166986, 'samples': 9504384, 'steps': 49501, 'loss/train': 1.5208748579025269} -11/07/2021 04:12:39 - INFO - __main__ - Step 49503: {'lr': 0.00038331984136370377, 'samples': 9504576, 'steps': 49502, 'loss/train': 1.6068562269210815} -11/07/2021 04:12:39 - INFO - __main__ - Step 49504: {'lr': 0.0003833153521506372, 'samples': 9504768, 'steps': 49503, 'loss/train': 1.0254100561141968} -11/07/2021 04:12:40 - INFO - __main__ - Step 49505: {'lr': 0.00038331086287750083, 'samples': 9504960, 'steps': 49504, 'loss/train': 1.1298511028289795} -11/07/2021 04:12:40 - INFO - __main__ - Step 49506: {'lr': 0.0003833063735442966, 'samples': 9505152, 'steps': 49505, 'loss/train': 1.3094515800476074} -11/07/2021 04:12:41 - INFO - __main__ - Step 49507: {'lr': 0.0003833018841510265, 'samples': 9505344, 'steps': 49506, 'loss/train': 1.68741774559021} -11/07/2021 04:12:41 - INFO - __main__ - Step 49508: {'lr': 0.00038329739469769277, 'samples': 9505536, 'steps': 49507, 'loss/train': 1.2099201679229736} -11/07/2021 04:12:42 - INFO - __main__ - Step 49509: {'lr': 0.0003832929051842972, 'samples': 9505728, 'steps': 49508, 'loss/train': 1.4359480142593384} -11/07/2021 04:12:42 - INFO - __main__ - Step 49510: {'lr': 0.0003832884156108418, 'samples': 9505920, 'steps': 49509, 'loss/train': 1.4834827184677124} -11/07/2021 04:12:42 - INFO - __main__ - Step 49511: {'lr': 0.0003832839259773289, 'samples': 9506112, 'steps': 49510, 'loss/train': 1.4688080549240112} -11/07/2021 04:12:43 - INFO - __main__ - Step 49512: {'lr': 0.00038327943628376025, 'samples': 9506304, 'steps': 49511, 'loss/train': 1.4338685274124146} -11/07/2021 04:12:44 - INFO - __main__ - Step 49513: {'lr': 0.00038327494653013787, 'samples': 9506496, 'steps': 49512, 'loss/train': 1.4766474962234497} -11/07/2021 04:12:44 - INFO - __main__ - Step 49514: {'lr': 0.00038327045671646386, 'samples': 9506688, 'steps': 49513, 'loss/train': 1.6842774152755737} -11/07/2021 04:12:45 - INFO - __main__ - Step 49515: {'lr': 0.00038326596684274035, 'samples': 9506880, 'steps': 49514, 'loss/train': 2.441283702850342} -11/07/2021 04:12:45 - INFO - __main__ - Step 49516: {'lr': 0.00038326147690896916, 'samples': 9507072, 'steps': 49515, 'loss/train': 1.7583577632904053} -11/07/2021 04:12:45 - INFO - __main__ - Step 49517: {'lr': 0.00038325698691515247, 'samples': 9507264, 'steps': 49516, 'loss/train': 1.6572788953781128} -11/07/2021 04:12:46 - INFO - __main__ - Step 49518: {'lr': 0.00038325249686129223, 'samples': 9507456, 'steps': 49517, 'loss/train': 1.929858684539795} -11/07/2021 04:12:47 - INFO - __main__ - Step 49519: {'lr': 0.0003832480067473904, 'samples': 9507648, 'steps': 49518, 'loss/train': 1.293485164642334} -11/07/2021 04:12:47 - INFO - __main__ - Step 49520: {'lr': 0.0003832435165734491, 'samples': 9507840, 'steps': 49519, 'loss/train': 1.440374493598938} -11/07/2021 04:12:47 - INFO - __main__ - Step 49521: {'lr': 0.0003832390263394704, 'samples': 9508032, 'steps': 49520, 'loss/train': 1.3797657489776611} -11/07/2021 04:12:48 - INFO - __main__ - Step 49522: {'lr': 0.0003832345360454561, 'samples': 9508224, 'steps': 49521, 'loss/train': 1.4090845584869385} -11/07/2021 04:12:49 - INFO - __main__ - Step 49523: {'lr': 0.00038323004569140853, 'samples': 9508416, 'steps': 49522, 'loss/train': 1.6031702756881714} -11/07/2021 04:12:49 - INFO - __main__ - Step 49524: {'lr': 0.0003832255552773295, 'samples': 9508608, 'steps': 49523, 'loss/train': 0.7252176403999329} -11/07/2021 04:12:50 - INFO - __main__ - Step 49525: {'lr': 0.00038322106480322105, 'samples': 9508800, 'steps': 49524, 'loss/train': 1.2934327125549316} -11/07/2021 04:12:50 - INFO - __main__ - Step 49526: {'lr': 0.00038321657426908527, 'samples': 9508992, 'steps': 49525, 'loss/train': 1.1309657096862793} -11/07/2021 04:12:50 - INFO - __main__ - Step 49527: {'lr': 0.0003832120836749242, 'samples': 9509184, 'steps': 49526, 'loss/train': 0.998445987701416} -11/07/2021 04:12:51 - INFO - __main__ - Step 49528: {'lr': 0.0003832075930207398, 'samples': 9509376, 'steps': 49527, 'loss/train': 1.4018816947937012} -11/07/2021 04:12:52 - INFO - __main__ - Step 49529: {'lr': 0.0003832031023065341, 'samples': 9509568, 'steps': 49528, 'loss/train': 1.630361557006836} -11/07/2021 04:12:52 - INFO - __main__ - Step 49530: {'lr': 0.0003831986115323092, 'samples': 9509760, 'steps': 49529, 'loss/train': 0.6628460884094238} -11/07/2021 04:12:52 - INFO - __main__ - Step 49531: {'lr': 0.00038319412069806694, 'samples': 9509952, 'steps': 49530, 'loss/train': 1.198029637336731} -11/07/2021 04:12:53 - INFO - __main__ - Step 49532: {'lr': 0.00038318962980380956, 'samples': 9510144, 'steps': 49531, 'loss/train': 1.4488250017166138} -11/07/2021 04:12:53 - INFO - __main__ - Step 49533: {'lr': 0.0003831851388495389, 'samples': 9510336, 'steps': 49532, 'loss/train': 1.459463119506836} -11/07/2021 04:12:54 - INFO - __main__ - Step 49534: {'lr': 0.0003831806478352572, 'samples': 9510528, 'steps': 49533, 'loss/train': 1.526487112045288} -11/07/2021 04:12:55 - INFO - __main__ - Step 49535: {'lr': 0.00038317615676096623, 'samples': 9510720, 'steps': 49534, 'loss/train': 1.530272126197815} -11/07/2021 04:12:55 - INFO - __main__ - Step 49536: {'lr': 0.00038317166562666817, 'samples': 9510912, 'steps': 49535, 'loss/train': 1.554976224899292} -11/07/2021 04:12:55 - INFO - __main__ - Step 49537: {'lr': 0.00038316717443236505, 'samples': 9511104, 'steps': 49536, 'loss/train': 1.4371247291564941} -11/07/2021 04:12:56 - INFO - __main__ - Step 49538: {'lr': 0.0003831626831780588, 'samples': 9511296, 'steps': 49537, 'loss/train': 1.523795485496521} -11/07/2021 04:12:57 - INFO - __main__ - Step 49539: {'lr': 0.0003831581918637516, 'samples': 9511488, 'steps': 49538, 'loss/train': 1.5631895065307617} -11/07/2021 04:12:57 - INFO - __main__ - Step 49540: {'lr': 0.0003831537004894453, 'samples': 9511680, 'steps': 49539, 'loss/train': 1.807240605354309} -11/07/2021 04:12:57 - INFO - __main__ - Step 49541: {'lr': 0.000383149209055142, 'samples': 9511872, 'steps': 49540, 'loss/train': 1.528426170349121} -11/07/2021 04:12:58 - INFO - __main__ - Step 49542: {'lr': 0.00038314471756084373, 'samples': 9512064, 'steps': 49541, 'loss/train': 1.4981565475463867} -11/07/2021 04:12:58 - INFO - __main__ - Step 49543: {'lr': 0.0003831402260065525, 'samples': 9512256, 'steps': 49542, 'loss/train': 1.3794786930084229} -11/07/2021 04:12:59 - INFO - __main__ - Step 49544: {'lr': 0.00038313573439227035, 'samples': 9512448, 'steps': 49543, 'loss/train': 1.2986475229263306} -11/07/2021 04:13:00 - INFO - __main__ - Step 49545: {'lr': 0.0003831312427179993, 'samples': 9512640, 'steps': 49544, 'loss/train': 1.5060278177261353} -11/07/2021 04:13:00 - INFO - __main__ - Step 49546: {'lr': 0.00038312675098374136, 'samples': 9512832, 'steps': 49545, 'loss/train': 1.2425042390823364} -11/07/2021 04:13:00 - INFO - __main__ - Step 49547: {'lr': 0.0003831222591894985, 'samples': 9513024, 'steps': 49546, 'loss/train': 1.5853462219238281} -11/07/2021 04:13:01 - INFO - __main__ - Step 49548: {'lr': 0.0003831177673352729, 'samples': 9513216, 'steps': 49547, 'loss/train': 1.7374829053878784} -11/07/2021 04:13:01 - INFO - __main__ - Step 49549: {'lr': 0.00038311327542106646, 'samples': 9513408, 'steps': 49548, 'loss/train': 1.6388118267059326} -11/07/2021 04:13:03 - INFO - __main__ - Step 49550: {'lr': 0.00038310878344688116, 'samples': 9513600, 'steps': 49549, 'loss/train': 0.2743910551071167} -11/07/2021 04:13:03 - INFO - __main__ - Step 49551: {'lr': 0.0003831042914127192, 'samples': 9513792, 'steps': 49550, 'loss/train': 1.3564828634262085} -11/07/2021 04:13:03 - INFO - __main__ - Step 49552: {'lr': 0.00038309979931858243, 'samples': 9513984, 'steps': 49551, 'loss/train': 2.0853230953216553} -11/07/2021 04:13:04 - INFO - __main__ - Step 49553: {'lr': 0.00038309530716447297, 'samples': 9514176, 'steps': 49552, 'loss/train': 1.543075680732727} -11/07/2021 04:13:04 - INFO - __main__ - Step 49554: {'lr': 0.00038309081495039275, 'samples': 9514368, 'steps': 49553, 'loss/train': 0.3885495364665985} -11/07/2021 04:13:05 - INFO - __main__ - Step 49555: {'lr': 0.00038308632267634396, 'samples': 9514560, 'steps': 49554, 'loss/train': 0.8817199468612671} -11/07/2021 04:13:05 - INFO - __main__ - Step 49556: {'lr': 0.00038308183034232844, 'samples': 9514752, 'steps': 49555, 'loss/train': 1.533594012260437} -11/07/2021 04:13:06 - INFO - __main__ - Step 49557: {'lr': 0.0003830773379483484, 'samples': 9514944, 'steps': 49556, 'loss/train': 1.54350745677948} -11/07/2021 04:13:06 - INFO - __main__ - Step 49558: {'lr': 0.0003830728454944057, 'samples': 9515136, 'steps': 49557, 'loss/train': 1.152811050415039} -11/07/2021 04:13:06 - INFO - __main__ - Step 49559: {'lr': 0.00038306835298050255, 'samples': 9515328, 'steps': 49558, 'loss/train': 1.62739896774292} -11/07/2021 04:13:07 - INFO - __main__ - Step 49560: {'lr': 0.0003830638604066407, 'samples': 9515520, 'steps': 49559, 'loss/train': 1.3035004138946533} -11/07/2021 04:13:08 - INFO - __main__ - Step 49561: {'lr': 0.00038305936777282233, 'samples': 9515712, 'steps': 49560, 'loss/train': 1.7126566171646118} -11/07/2021 04:13:08 - INFO - __main__ - Step 49562: {'lr': 0.00038305487507904956, 'samples': 9515904, 'steps': 49561, 'loss/train': 1.2861318588256836} -11/07/2021 04:13:08 - INFO - __main__ - Step 49563: {'lr': 0.0003830503823253243, 'samples': 9516096, 'steps': 49562, 'loss/train': 1.5957990884780884} -11/07/2021 04:13:09 - INFO - __main__ - Step 49564: {'lr': 0.0003830458895116485, 'samples': 9516288, 'steps': 49563, 'loss/train': 1.307597041130066} -11/07/2021 04:13:09 - INFO - __main__ - Step 49565: {'lr': 0.0003830413966380243, 'samples': 9516480, 'steps': 49564, 'loss/train': 1.5037707090377808} -11/07/2021 04:13:10 - INFO - __main__ - Step 49566: {'lr': 0.00038303690370445384, 'samples': 9516672, 'steps': 49565, 'loss/train': 0.9930906295776367} -11/07/2021 04:13:10 - INFO - __main__ - Step 49567: {'lr': 0.00038303241071093884, 'samples': 9516864, 'steps': 49566, 'loss/train': 1.5315903425216675} -11/07/2021 04:13:11 - INFO - __main__ - Step 49568: {'lr': 0.00038302791765748156, 'samples': 9517056, 'steps': 49567, 'loss/train': 1.6297444105148315} -11/07/2021 04:13:11 - INFO - __main__ - Step 49569: {'lr': 0.0003830234245440839, 'samples': 9517248, 'steps': 49568, 'loss/train': 1.4744263887405396} -11/07/2021 04:13:12 - INFO - __main__ - Step 49570: {'lr': 0.000383018931370748, 'samples': 9517440, 'steps': 49569, 'loss/train': 1.4099575281143188} -11/07/2021 04:13:13 - INFO - __main__ - Step 49571: {'lr': 0.00038301443813747583, 'samples': 9517632, 'steps': 49570, 'loss/train': 1.4269685745239258} -11/07/2021 04:13:13 - INFO - __main__ - Step 49572: {'lr': 0.00038300994484426936, 'samples': 9517824, 'steps': 49571, 'loss/train': 1.3018014430999756} -11/07/2021 04:13:13 - INFO - __main__ - Step 49573: {'lr': 0.0003830054514911307, 'samples': 9518016, 'steps': 49572, 'loss/train': 1.1602410078048706} -11/07/2021 04:13:14 - INFO - __main__ - Step 49574: {'lr': 0.0003830009580780618, 'samples': 9518208, 'steps': 49573, 'loss/train': 1.6300928592681885} -11/07/2021 04:13:14 - INFO - __main__ - Step 49575: {'lr': 0.00038299646460506474, 'samples': 9518400, 'steps': 49574, 'loss/train': 1.4427337646484375} -11/07/2021 04:13:15 - INFO - __main__ - Step 49576: {'lr': 0.0003829919710721415, 'samples': 9518592, 'steps': 49575, 'loss/train': 1.8379251956939697} -11/07/2021 04:13:16 - INFO - __main__ - Step 49577: {'lr': 0.0003829874774792941, 'samples': 9518784, 'steps': 49576, 'loss/train': 1.6046229600906372} -11/07/2021 04:13:16 - INFO - __main__ - Step 49578: {'lr': 0.00038298298382652467, 'samples': 9518976, 'steps': 49577, 'loss/train': 1.7580783367156982} -11/07/2021 04:13:16 - INFO - __main__ - Step 49579: {'lr': 0.00038297849011383517, 'samples': 9519168, 'steps': 49578, 'loss/train': 1.5407004356384277} -11/07/2021 04:13:17 - INFO - __main__ - Step 49580: {'lr': 0.0003829739963412276, 'samples': 9519360, 'steps': 49579, 'loss/train': 0.37775328755378723} -11/07/2021 04:13:18 - INFO - __main__ - Step 49581: {'lr': 0.000382969502508704, 'samples': 9519552, 'steps': 49580, 'loss/train': 1.6808826923370361} -11/07/2021 04:13:18 - INFO - __main__ - Step 49582: {'lr': 0.0003829650086162663, 'samples': 9519744, 'steps': 49581, 'loss/train': 1.637237310409546} -11/07/2021 04:13:18 - INFO - __main__ - Step 49583: {'lr': 0.0003829605146639167, 'samples': 9519936, 'steps': 49582, 'loss/train': 1.4391934871673584} -11/07/2021 04:13:19 - INFO - __main__ - Step 49584: {'lr': 0.00038295602065165714, 'samples': 9520128, 'steps': 49583, 'loss/train': 1.8345682621002197} -11/07/2021 04:13:19 - INFO - __main__ - Step 49585: {'lr': 0.0003829515265794896, 'samples': 9520320, 'steps': 49584, 'loss/train': 1.8743866682052612} -11/07/2021 04:13:20 - INFO - __main__ - Step 49586: {'lr': 0.00038294703244741625, 'samples': 9520512, 'steps': 49585, 'loss/train': 1.6653952598571777} -11/07/2021 04:13:20 - INFO - __main__ - Step 49587: {'lr': 0.000382942538255439, 'samples': 9520704, 'steps': 49586, 'loss/train': 1.7852160930633545} -11/07/2021 04:13:21 - INFO - __main__ - Step 49588: {'lr': 0.0003829380440035598, 'samples': 9520896, 'steps': 49587, 'loss/train': 1.1733639240264893} -11/07/2021 04:13:21 - INFO - __main__ - Step 49589: {'lr': 0.0003829335496917808, 'samples': 9521088, 'steps': 49588, 'loss/train': 0.9976392388343811} -11/07/2021 04:13:21 - INFO - __main__ - Step 49590: {'lr': 0.000382929055320104, 'samples': 9521280, 'steps': 49589, 'loss/train': 1.4055172204971313} -11/07/2021 04:13:22 - INFO - __main__ - Step 49591: {'lr': 0.0003829245608885315, 'samples': 9521472, 'steps': 49590, 'loss/train': 1.155929446220398} -11/07/2021 04:13:23 - INFO - __main__ - Step 49592: {'lr': 0.0003829200663970652, 'samples': 9521664, 'steps': 49591, 'loss/train': 2.5761666297912598} -11/07/2021 04:13:23 - INFO - __main__ - Step 49593: {'lr': 0.00038291557184570713, 'samples': 9521856, 'steps': 49592, 'loss/train': 1.8351387977600098} -11/07/2021 04:13:23 - INFO - __main__ - Step 49594: {'lr': 0.0003829110772344594, 'samples': 9522048, 'steps': 49593, 'loss/train': 1.4460923671722412} -11/07/2021 04:13:24 - INFO - __main__ - Step 49595: {'lr': 0.000382906582563324, 'samples': 9522240, 'steps': 49594, 'loss/train': 1.391068935394287} -11/07/2021 04:13:25 - INFO - __main__ - Step 49596: {'lr': 0.00038290208783230286, 'samples': 9522432, 'steps': 49595, 'loss/train': 1.0812073945999146} -11/07/2021 04:13:25 - INFO - __main__ - Step 49597: {'lr': 0.00038289759304139815, 'samples': 9522624, 'steps': 49596, 'loss/train': 1.5305726528167725} -11/07/2021 04:13:25 - INFO - __main__ - Step 49598: {'lr': 0.0003828930981906118, 'samples': 9522816, 'steps': 49597, 'loss/train': 1.4933536052703857} -11/07/2021 04:13:26 - INFO - __main__ - Step 49599: {'lr': 0.000382888603279946, 'samples': 9523008, 'steps': 49598, 'loss/train': 0.9710624814033508} -11/07/2021 04:13:26 - INFO - __main__ - Step 49600: {'lr': 0.00038288410830940246, 'samples': 9523200, 'steps': 49599, 'loss/train': 1.8931074142456055} -11/07/2021 04:13:27 - INFO - __main__ - Step 49601: {'lr': 0.00038287961327898346, 'samples': 9523392, 'steps': 49600, 'loss/train': 0.9926786422729492} -11/07/2021 04:13:28 - INFO - __main__ - Step 49602: {'lr': 0.000382875118188691, 'samples': 9523584, 'steps': 49601, 'loss/train': 1.5702821016311646} -11/07/2021 04:13:28 - INFO - __main__ - Step 49603: {'lr': 0.000382870623038527, 'samples': 9523776, 'steps': 49602, 'loss/train': 1.3586236238479614} -11/07/2021 04:13:28 - INFO - __main__ - Step 49604: {'lr': 0.0003828661278284936, 'samples': 9523968, 'steps': 49603, 'loss/train': 1.2675609588623047} -11/07/2021 04:13:29 - INFO - __main__ - Step 49605: {'lr': 0.00038286163255859276, 'samples': 9524160, 'steps': 49604, 'loss/train': 1.3705264329910278} -11/07/2021 04:13:30 - INFO - __main__ - Step 49606: {'lr': 0.0003828571372288265, 'samples': 9524352, 'steps': 49605, 'loss/train': 1.6547865867614746} -11/07/2021 04:13:30 - INFO - __main__ - Step 49607: {'lr': 0.00038285264183919696, 'samples': 9524544, 'steps': 49606, 'loss/train': 1.2476061582565308} -11/07/2021 04:13:30 - INFO - __main__ - Step 49608: {'lr': 0.00038284814638970594, 'samples': 9524736, 'steps': 49607, 'loss/train': 1.2930322885513306} -11/07/2021 04:13:31 - INFO - __main__ - Step 49609: {'lr': 0.00038284365088035564, 'samples': 9524928, 'steps': 49608, 'loss/train': 1.6116275787353516} -11/07/2021 04:13:31 - INFO - __main__ - Step 49610: {'lr': 0.00038283915531114806, 'samples': 9525120, 'steps': 49609, 'loss/train': 1.7082544565200806} -11/07/2021 04:13:32 - INFO - __main__ - Step 49611: {'lr': 0.0003828346596820852, 'samples': 9525312, 'steps': 49610, 'loss/train': 1.5115309953689575} -11/07/2021 04:13:32 - INFO - __main__ - Step 49612: {'lr': 0.00038283016399316905, 'samples': 9525504, 'steps': 49611, 'loss/train': 1.3873403072357178} -11/07/2021 04:13:33 - INFO - __main__ - Step 49613: {'lr': 0.00038282566824440176, 'samples': 9525696, 'steps': 49612, 'loss/train': 1.6959043741226196} -11/07/2021 04:13:33 - INFO - __main__ - Step 49614: {'lr': 0.0003828211724357852, 'samples': 9525888, 'steps': 49613, 'loss/train': 5.5632734298706055} -11/07/2021 04:13:33 - INFO - __main__ - Step 49615: {'lr': 0.00038281667656732144, 'samples': 9526080, 'steps': 49614, 'loss/train': 1.538751482963562} -11/07/2021 04:13:34 - INFO - __main__ - Step 49616: {'lr': 0.0003828121806390126, 'samples': 9526272, 'steps': 49615, 'loss/train': 1.3263506889343262} -11/07/2021 04:13:35 - INFO - __main__ - Step 49617: {'lr': 0.0003828076846508606, 'samples': 9526464, 'steps': 49616, 'loss/train': 1.384452223777771} -11/07/2021 04:13:35 - INFO - __main__ - Step 49618: {'lr': 0.00038280318860286756, 'samples': 9526656, 'steps': 49617, 'loss/train': 1.475805640220642} -11/07/2021 04:13:36 - INFO - __main__ - Step 49619: {'lr': 0.0003827986924950354, 'samples': 9526848, 'steps': 49618, 'loss/train': 1.462049961090088} -11/07/2021 04:13:36 - INFO - __main__ - Step 49620: {'lr': 0.0003827941963273663, 'samples': 9527040, 'steps': 49619, 'loss/train': 1.3185629844665527} -11/07/2021 04:13:36 - INFO - __main__ - Step 49621: {'lr': 0.00038278970009986206, 'samples': 9527232, 'steps': 49620, 'loss/train': 1.1094467639923096} -11/07/2021 04:13:37 - INFO - __main__ - Step 49622: {'lr': 0.0003827852038125249, 'samples': 9527424, 'steps': 49621, 'loss/train': 1.55144202709198} -11/07/2021 04:13:38 - INFO - __main__ - Step 49623: {'lr': 0.00038278070746535674, 'samples': 9527616, 'steps': 49622, 'loss/train': 1.518005132675171} -11/07/2021 04:13:38 - INFO - __main__ - Step 49624: {'lr': 0.0003827762110583597, 'samples': 9527808, 'steps': 49623, 'loss/train': 1.5901243686676025} -11/07/2021 04:13:38 - INFO - __main__ - Step 49625: {'lr': 0.0003827717145915357, 'samples': 9528000, 'steps': 49624, 'loss/train': 1.5442684888839722} -11/07/2021 04:13:39 - INFO - __main__ - Step 49626: {'lr': 0.0003827672180648868, 'samples': 9528192, 'steps': 49625, 'loss/train': 1.7559553384780884} -11/07/2021 04:13:40 - INFO - __main__ - Step 49627: {'lr': 0.0003827627214784151, 'samples': 9528384, 'steps': 49626, 'loss/train': 1.4572389125823975} -11/07/2021 04:13:40 - INFO - __main__ - Step 49628: {'lr': 0.0003827582248321225, 'samples': 9528576, 'steps': 49627, 'loss/train': 1.6016181707382202} -11/07/2021 04:13:41 - INFO - __main__ - Step 49629: {'lr': 0.0003827537281260111, 'samples': 9528768, 'steps': 49628, 'loss/train': 1.3121598958969116} -11/07/2021 04:13:41 - INFO - __main__ - Step 49630: {'lr': 0.00038274923136008294, 'samples': 9528960, 'steps': 49629, 'loss/train': 1.4197397232055664} -11/07/2021 04:13:41 - INFO - __main__ - Step 49631: {'lr': 0.00038274473453434, 'samples': 9529152, 'steps': 49630, 'loss/train': 1.2599914073944092} -11/07/2021 04:13:42 - INFO - __main__ - Step 49632: {'lr': 0.0003827402376487844, 'samples': 9529344, 'steps': 49631, 'loss/train': 1.630716323852539} -11/07/2021 04:13:43 - INFO - __main__ - Step 49633: {'lr': 0.0003827357407034181, 'samples': 9529536, 'steps': 49632, 'loss/train': 1.7098501920700073} -11/07/2021 04:13:43 - INFO - __main__ - Step 49634: {'lr': 0.00038273124369824304, 'samples': 9529728, 'steps': 49633, 'loss/train': 1.7722996473312378} -11/07/2021 04:13:43 - INFO - __main__ - Step 49635: {'lr': 0.00038272674663326136, 'samples': 9529920, 'steps': 49634, 'loss/train': 1.3559863567352295} -11/07/2021 04:13:44 - INFO - __main__ - Step 49636: {'lr': 0.000382722249508475, 'samples': 9530112, 'steps': 49635, 'loss/train': 1.5778757333755493} -11/07/2021 04:13:44 - INFO - __main__ - Step 49637: {'lr': 0.00038271775232388616, 'samples': 9530304, 'steps': 49636, 'loss/train': 1.48716402053833} -11/07/2021 04:13:45 - INFO - __main__ - Step 49638: {'lr': 0.00038271325507949666, 'samples': 9530496, 'steps': 49637, 'loss/train': 1.8214058876037598} -11/07/2021 04:13:45 - INFO - __main__ - Step 49639: {'lr': 0.00038270875777530864, 'samples': 9530688, 'steps': 49638, 'loss/train': 1.3735169172286987} -11/07/2021 04:13:46 - INFO - __main__ - Step 49640: {'lr': 0.0003827042604113241, 'samples': 9530880, 'steps': 49639, 'loss/train': 1.2777843475341797} -11/07/2021 04:13:46 - INFO - __main__ - Step 49641: {'lr': 0.0003826997629875451, 'samples': 9531072, 'steps': 49640, 'loss/train': 1.8156064748764038} -11/07/2021 04:13:46 - INFO - __main__ - Step 49642: {'lr': 0.0003826952655039736, 'samples': 9531264, 'steps': 49641, 'loss/train': 1.287994384765625} -11/07/2021 04:13:48 - INFO - __main__ - Step 49643: {'lr': 0.0003826907679606117, 'samples': 9531456, 'steps': 49642, 'loss/train': 1.5666861534118652} -11/07/2021 04:13:48 - INFO - __main__ - Step 49644: {'lr': 0.00038268627035746133, 'samples': 9531648, 'steps': 49643, 'loss/train': 1.2110158205032349} -11/07/2021 04:13:48 - INFO - __main__ - Step 49645: {'lr': 0.00038268177269452463, 'samples': 9531840, 'steps': 49644, 'loss/train': 1.4190071821212769} -11/07/2021 04:13:49 - INFO - __main__ - Step 49646: {'lr': 0.0003826772749718036, 'samples': 9532032, 'steps': 49645, 'loss/train': 1.5874351263046265} -11/07/2021 04:13:49 - INFO - __main__ - Step 49647: {'lr': 0.00038267277718930014, 'samples': 9532224, 'steps': 49646, 'loss/train': 1.654268503189087} -11/07/2021 04:13:49 - INFO - __main__ - Step 49648: {'lr': 0.0003826682793470164, 'samples': 9532416, 'steps': 49647, 'loss/train': 0.908328652381897} -11/07/2021 04:13:50 - INFO - __main__ - Step 49649: {'lr': 0.0003826637814449544, 'samples': 9532608, 'steps': 49648, 'loss/train': 1.3017082214355469} -11/07/2021 04:13:51 - INFO - __main__ - Step 49650: {'lr': 0.00038265928348311614, 'samples': 9532800, 'steps': 49649, 'loss/train': 1.3552396297454834} -11/07/2021 04:13:51 - INFO - __main__ - Step 49651: {'lr': 0.0003826547854615037, 'samples': 9532992, 'steps': 49650, 'loss/train': 1.3476513624191284} -11/07/2021 04:13:51 - INFO - __main__ - Step 49652: {'lr': 0.000382650287380119, 'samples': 9533184, 'steps': 49651, 'loss/train': 0.6778313517570496} -11/07/2021 04:13:52 - INFO - __main__ - Step 49653: {'lr': 0.00038264578923896415, 'samples': 9533376, 'steps': 49652, 'loss/train': 1.587056279182434} -11/07/2021 04:13:53 - INFO - __main__ - Step 49654: {'lr': 0.00038264129103804113, 'samples': 9533568, 'steps': 49653, 'loss/train': 1.9432332515716553} -11/07/2021 04:13:53 - INFO - __main__ - Step 49655: {'lr': 0.00038263679277735196, 'samples': 9533760, 'steps': 49654, 'loss/train': 1.1152772903442383} -11/07/2021 04:13:54 - INFO - __main__ - Step 49656: {'lr': 0.0003826322944568988, 'samples': 9533952, 'steps': 49655, 'loss/train': 0.20244891941547394} -11/07/2021 04:13:54 - INFO - __main__ - Step 49657: {'lr': 0.00038262779607668354, 'samples': 9534144, 'steps': 49656, 'loss/train': 1.5896071195602417} -11/07/2021 04:13:55 - INFO - __main__ - Step 49658: {'lr': 0.0003826232976367082, 'samples': 9534336, 'steps': 49657, 'loss/train': 1.1312906742095947} -11/07/2021 04:13:55 - INFO - __main__ - Step 49659: {'lr': 0.0003826187991369749, 'samples': 9534528, 'steps': 49658, 'loss/train': 1.2865389585494995} -11/07/2021 04:13:56 - INFO - __main__ - Step 49660: {'lr': 0.00038261430057748557, 'samples': 9534720, 'steps': 49659, 'loss/train': 1.4453037977218628} -11/07/2021 04:13:56 - INFO - __main__ - Step 49661: {'lr': 0.0003826098019582423, 'samples': 9534912, 'steps': 49660, 'loss/train': 1.836003065109253} -11/07/2021 04:13:57 - INFO - __main__ - Step 49662: {'lr': 0.00038260530327924715, 'samples': 9535104, 'steps': 49661, 'loss/train': 1.378966212272644} -11/07/2021 04:13:57 - INFO - __main__ - Step 49663: {'lr': 0.00038260080454050207, 'samples': 9535296, 'steps': 49662, 'loss/train': 1.3185806274414062} -11/07/2021 04:13:58 - INFO - __main__ - Step 49664: {'lr': 0.00038259630574200904, 'samples': 9535488, 'steps': 49663, 'loss/train': 1.0712865591049194} -11/07/2021 04:13:58 - INFO - __main__ - Step 49665: {'lr': 0.0003825918068837702, 'samples': 9535680, 'steps': 49664, 'loss/train': 1.7213788032531738} -11/07/2021 04:13:59 - INFO - __main__ - Step 49666: {'lr': 0.00038258730796578757, 'samples': 9535872, 'steps': 49665, 'loss/train': 0.6380241513252258} -11/07/2021 04:13:59 - INFO - __main__ - Step 49667: {'lr': 0.0003825828089880631, 'samples': 9536064, 'steps': 49666, 'loss/train': 1.4698467254638672} -11/07/2021 04:13:59 - INFO - __main__ - Step 49668: {'lr': 0.00038257830995059894, 'samples': 9536256, 'steps': 49667, 'loss/train': 1.3259644508361816} -11/07/2021 04:14:00 - INFO - __main__ - Step 49669: {'lr': 0.00038257381085339694, 'samples': 9536448, 'steps': 49668, 'loss/train': 1.43675696849823} -11/07/2021 04:14:01 - INFO - __main__ - Step 49670: {'lr': 0.00038256931169645925, 'samples': 9536640, 'steps': 49669, 'loss/train': 1.3211148977279663} -11/07/2021 04:14:01 - INFO - __main__ - Step 49671: {'lr': 0.00038256481247978793, 'samples': 9536832, 'steps': 49670, 'loss/train': 1.5604088306427002} -11/07/2021 04:14:01 - INFO - __main__ - Step 49672: {'lr': 0.00038256031320338494, 'samples': 9537024, 'steps': 49671, 'loss/train': 1.1204627752304077} -11/07/2021 04:14:02 - INFO - __main__ - Step 49673: {'lr': 0.0003825558138672523, 'samples': 9537216, 'steps': 49672, 'loss/train': 1.0878816843032837} -11/07/2021 04:14:03 - INFO - __main__ - Step 49674: {'lr': 0.00038255131447139203, 'samples': 9537408, 'steps': 49673, 'loss/train': 1.3592828512191772} -11/07/2021 04:14:03 - INFO - __main__ - Step 49675: {'lr': 0.00038254681501580625, 'samples': 9537600, 'steps': 49674, 'loss/train': 1.5508614778518677} -11/07/2021 04:14:03 - INFO - __main__ - Step 49676: {'lr': 0.00038254231550049686, 'samples': 9537792, 'steps': 49675, 'loss/train': 1.5368692874908447} -11/07/2021 04:14:04 - INFO - __main__ - Step 49677: {'lr': 0.00038253781592546593, 'samples': 9537984, 'steps': 49676, 'loss/train': 1.016180396080017} -11/07/2021 04:14:04 - INFO - __main__ - Step 49678: {'lr': 0.0003825333162907155, 'samples': 9538176, 'steps': 49677, 'loss/train': 1.0984134674072266} -11/07/2021 04:14:05 - INFO - __main__ - Step 49679: {'lr': 0.0003825288165962477, 'samples': 9538368, 'steps': 49678, 'loss/train': 1.4270671606063843} -11/07/2021 04:14:06 - INFO - __main__ - Step 49680: {'lr': 0.0003825243168420644, 'samples': 9538560, 'steps': 49679, 'loss/train': 1.6393283605575562} -11/07/2021 04:14:06 - INFO - __main__ - Step 49681: {'lr': 0.00038251981702816767, 'samples': 9538752, 'steps': 49680, 'loss/train': 1.3077753782272339} -11/07/2021 04:14:06 - INFO - __main__ - Step 49682: {'lr': 0.00038251531715455955, 'samples': 9538944, 'steps': 49681, 'loss/train': 1.278901219367981} -11/07/2021 04:14:07 - INFO - __main__ - Step 49683: {'lr': 0.00038251081722124214, 'samples': 9539136, 'steps': 49682, 'loss/train': 1.7971502542495728} -11/07/2021 04:14:08 - INFO - __main__ - Step 49684: {'lr': 0.0003825063172282174, 'samples': 9539328, 'steps': 49683, 'loss/train': 1.0549887418746948} -11/07/2021 04:14:08 - INFO - __main__ - Step 49685: {'lr': 0.00038250181717548726, 'samples': 9539520, 'steps': 49684, 'loss/train': 1.6527125835418701} -11/07/2021 04:14:08 - INFO - __main__ - Step 49686: {'lr': 0.0003824973170630539, 'samples': 9539712, 'steps': 49685, 'loss/train': 1.698177456855774} -11/07/2021 04:14:09 - INFO - __main__ - Step 49687: {'lr': 0.0003824928168909193, 'samples': 9539904, 'steps': 49686, 'loss/train': 1.2676993608474731} -11/07/2021 04:14:09 - INFO - __main__ - Step 49688: {'lr': 0.00038248831665908546, 'samples': 9540096, 'steps': 49687, 'loss/train': 1.2248433828353882} -11/07/2021 04:14:10 - INFO - __main__ - Step 49689: {'lr': 0.0003824838163675545, 'samples': 9540288, 'steps': 49688, 'loss/train': 1.0999497175216675} -11/07/2021 04:14:10 - INFO - __main__ - Step 49690: {'lr': 0.0003824793160163283, 'samples': 9540480, 'steps': 49689, 'loss/train': 1.3124828338623047} -11/07/2021 04:14:11 - INFO - __main__ - Step 49691: {'lr': 0.000382474815605409, 'samples': 9540672, 'steps': 49690, 'loss/train': 1.3977371454238892} -11/07/2021 04:14:11 - INFO - __main__ - Step 49692: {'lr': 0.00038247031513479856, 'samples': 9540864, 'steps': 49691, 'loss/train': 2.3644144535064697} -11/07/2021 04:14:12 - INFO - __main__ - Step 49693: {'lr': 0.0003824658146044991, 'samples': 9541056, 'steps': 49692, 'loss/train': 1.680859088897705} -11/07/2021 04:14:13 - INFO - __main__ - Step 49694: {'lr': 0.0003824613140145125, 'samples': 9541248, 'steps': 49693, 'loss/train': 1.5952850580215454} -11/07/2021 04:14:13 - INFO - __main__ - Step 49695: {'lr': 0.00038245681336484096, 'samples': 9541440, 'steps': 49694, 'loss/train': 1.8383580446243286} -11/07/2021 04:14:13 - INFO - __main__ - Step 49696: {'lr': 0.00038245231265548633, 'samples': 9541632, 'steps': 49695, 'loss/train': 0.7911908030509949} -11/07/2021 04:14:14 - INFO - __main__ - Step 49697: {'lr': 0.0003824478118864508, 'samples': 9541824, 'steps': 49696, 'loss/train': 1.490234375} -11/07/2021 04:14:14 - INFO - __main__ - Step 49698: {'lr': 0.0003824433110577363, 'samples': 9542016, 'steps': 49697, 'loss/train': 0.9387646317481995} -11/07/2021 04:14:15 - INFO - __main__ - Step 49699: {'lr': 0.0003824388101693449, 'samples': 9542208, 'steps': 49698, 'loss/train': 1.9955414533615112} -11/07/2021 04:14:15 - INFO - __main__ - Step 49700: {'lr': 0.00038243430922127865, 'samples': 9542400, 'steps': 49699, 'loss/train': 1.8206192255020142} -11/07/2021 04:14:16 - INFO - __main__ - Step 49701: {'lr': 0.00038242980821353954, 'samples': 9542592, 'steps': 49700, 'loss/train': 1.4436894655227661} -11/07/2021 04:14:16 - INFO - __main__ - Step 49702: {'lr': 0.00038242530714612953, 'samples': 9542784, 'steps': 49701, 'loss/train': 1.7632184028625488} -11/07/2021 04:14:16 - INFO - __main__ - Step 49703: {'lr': 0.00038242080601905083, 'samples': 9542976, 'steps': 49702, 'loss/train': 1.850001573562622} -11/07/2021 04:14:18 - INFO - __main__ - Step 49704: {'lr': 0.0003824163048323053, 'samples': 9543168, 'steps': 49703, 'loss/train': 1.4575488567352295} -11/07/2021 04:14:18 - INFO - __main__ - Step 49705: {'lr': 0.000382411803585895, 'samples': 9543360, 'steps': 49704, 'loss/train': 0.9507234692573547} -11/07/2021 04:14:18 - INFO - __main__ - Step 49706: {'lr': 0.000382407302279822, 'samples': 9543552, 'steps': 49705, 'loss/train': 0.6334741115570068} -11/07/2021 04:14:19 - INFO - __main__ - Step 49707: {'lr': 0.0003824028009140883, 'samples': 9543744, 'steps': 49706, 'loss/train': 1.6214922666549683} -11/07/2021 04:14:19 - INFO - __main__ - Step 49708: {'lr': 0.000382398299488696, 'samples': 9543936, 'steps': 49707, 'loss/train': 1.3992692232131958} -11/07/2021 04:14:20 - INFO - __main__ - Step 49709: {'lr': 0.000382393798003647, 'samples': 9544128, 'steps': 49708, 'loss/train': 1.5029001235961914} -11/07/2021 04:14:20 - INFO - __main__ - Step 49710: {'lr': 0.00038238929645894345, 'samples': 9544320, 'steps': 49709, 'loss/train': 1.2773594856262207} -11/07/2021 04:14:21 - INFO - __main__ - Step 49711: {'lr': 0.00038238479485458725, 'samples': 9544512, 'steps': 49710, 'loss/train': 1.6366949081420898} -11/07/2021 04:14:21 - INFO - __main__ - Step 49712: {'lr': 0.0003823802931905806, 'samples': 9544704, 'steps': 49711, 'loss/train': 1.3928391933441162} -11/07/2021 04:14:21 - INFO - __main__ - Step 49713: {'lr': 0.0003823757914669254, 'samples': 9544896, 'steps': 49712, 'loss/train': 0.8958503603935242} -11/07/2021 04:14:22 - INFO - __main__ - Step 49714: {'lr': 0.00038237128968362366, 'samples': 9545088, 'steps': 49713, 'loss/train': 1.345287561416626} -11/07/2021 04:14:23 - INFO - __main__ - Step 49715: {'lr': 0.0003823667878406776, 'samples': 9545280, 'steps': 49714, 'loss/train': 1.3177357912063599} -11/07/2021 04:14:23 - INFO - __main__ - Step 49716: {'lr': 0.000382362285938089, 'samples': 9545472, 'steps': 49715, 'loss/train': 1.5471429824829102} -11/07/2021 04:14:23 - INFO - __main__ - Step 49717: {'lr': 0.00038235778397586, 'samples': 9545664, 'steps': 49716, 'loss/train': 1.2901102304458618} -11/07/2021 04:14:24 - INFO - __main__ - Step 49718: {'lr': 0.00038235328195399253, 'samples': 9545856, 'steps': 49717, 'loss/train': 1.408123254776001} -11/07/2021 04:14:25 - INFO - __main__ - Step 49719: {'lr': 0.0003823487798724888, 'samples': 9546048, 'steps': 49718, 'loss/train': 0.8959937691688538} -11/07/2021 04:14:25 - INFO - __main__ - Step 49720: {'lr': 0.00038234427773135084, 'samples': 9546240, 'steps': 49719, 'loss/train': 1.272355556488037} -11/07/2021 04:14:26 - INFO - __main__ - Step 49721: {'lr': 0.00038233977553058055, 'samples': 9546432, 'steps': 49720, 'loss/train': 1.237605333328247} -11/07/2021 04:14:26 - INFO - __main__ - Step 49722: {'lr': 0.0003823352732701799, 'samples': 9546624, 'steps': 49721, 'loss/train': 2.2506821155548096} -11/07/2021 04:14:27 - INFO - __main__ - Step 49723: {'lr': 0.0003823307709501511, 'samples': 9546816, 'steps': 49722, 'loss/train': 1.407764196395874} -11/07/2021 04:14:28 - INFO - __main__ - Step 49724: {'lr': 0.0003823262685704961, 'samples': 9547008, 'steps': 49723, 'loss/train': 0.09105194360017776} -11/07/2021 04:14:28 - INFO - __main__ - Step 49725: {'lr': 0.00038232176613121687, 'samples': 9547200, 'steps': 49724, 'loss/train': 1.2535902261734009} -11/07/2021 04:14:28 - INFO - __main__ - Step 49726: {'lr': 0.00038231726363231554, 'samples': 9547392, 'steps': 49725, 'loss/train': 0.0777641236782074} -11/07/2021 04:14:29 - INFO - __main__ - Step 49727: {'lr': 0.0003823127610737941, 'samples': 9547584, 'steps': 49726, 'loss/train': 0.7437136173248291} -11/07/2021 04:14:29 - INFO - __main__ - Step 49728: {'lr': 0.00038230825845565454, 'samples': 9547776, 'steps': 49727, 'loss/train': 1.60201895236969} -11/07/2021 04:14:30 - INFO - __main__ - Step 49729: {'lr': 0.00038230375577789894, 'samples': 9547968, 'steps': 49728, 'loss/train': 1.3844270706176758} -11/07/2021 04:14:30 - INFO - __main__ - Step 49730: {'lr': 0.0003822992530405293, 'samples': 9548160, 'steps': 49729, 'loss/train': 1.0805037021636963} -11/07/2021 04:14:31 - INFO - __main__ - Step 49731: {'lr': 0.00038229475024354766, 'samples': 9548352, 'steps': 49730, 'loss/train': 0.09550980478525162} -11/07/2021 04:14:31 - INFO - __main__ - Step 49732: {'lr': 0.00038229024738695605, 'samples': 9548544, 'steps': 49731, 'loss/train': 1.4066355228424072} -11/07/2021 04:14:32 - INFO - __main__ - Step 49733: {'lr': 0.0003822857444707565, 'samples': 9548736, 'steps': 49732, 'loss/train': 0.9648271203041077} -11/07/2021 04:14:32 - INFO - __main__ - Step 49734: {'lr': 0.00038228124149495104, 'samples': 9548928, 'steps': 49733, 'loss/train': 0.6856678128242493} -11/07/2021 04:14:33 - INFO - __main__ - Step 49735: {'lr': 0.0003822767384595417, 'samples': 9549120, 'steps': 49734, 'loss/train': 1.0965052843093872} -11/07/2021 04:14:33 - INFO - __main__ - Step 49736: {'lr': 0.0003822722353645305, 'samples': 9549312, 'steps': 49735, 'loss/train': 1.3487507104873657} -11/07/2021 04:14:34 - INFO - __main__ - Step 49737: {'lr': 0.00038226773220991937, 'samples': 9549504, 'steps': 49736, 'loss/train': 1.2100340127944946} -11/07/2021 04:14:34 - INFO - __main__ - Step 49738: {'lr': 0.0003822632289957105, 'samples': 9549696, 'steps': 49737, 'loss/train': 1.3853355646133423} -11/07/2021 04:14:34 - INFO - __main__ - Step 49739: {'lr': 0.000382258725721906, 'samples': 9549888, 'steps': 49738, 'loss/train': 1.366625189781189} -11/07/2021 04:14:35 - INFO - __main__ - Step 49740: {'lr': 0.0003822542223885076, 'samples': 9550080, 'steps': 49739, 'loss/train': 2.083750009536743} -11/07/2021 04:14:36 - INFO - __main__ - Step 49741: {'lr': 0.0003822497189955175, 'samples': 9550272, 'steps': 49740, 'loss/train': 1.1018315553665161} -11/07/2021 04:14:36 - INFO - __main__ - Step 49742: {'lr': 0.0003822452155429378, 'samples': 9550464, 'steps': 49741, 'loss/train': 1.5830544233322144} -11/07/2021 04:14:36 - INFO - __main__ - Step 49743: {'lr': 0.0003822407120307704, 'samples': 9550656, 'steps': 49742, 'loss/train': 1.3785125017166138} -11/07/2021 04:14:37 - INFO - __main__ - Step 49744: {'lr': 0.0003822362084590174, 'samples': 9550848, 'steps': 49743, 'loss/train': 0.9274885654449463} -11/07/2021 04:14:38 - INFO - __main__ - Step 49745: {'lr': 0.0003822317048276808, 'samples': 9551040, 'steps': 49744, 'loss/train': 1.155612587928772} -11/07/2021 04:14:38 - INFO - __main__ - Step 49746: {'lr': 0.0003822272011367626, 'samples': 9551232, 'steps': 49745, 'loss/train': 1.5381557941436768} -11/07/2021 04:14:39 - INFO - __main__ - Step 49747: {'lr': 0.0003822226973862649, 'samples': 9551424, 'steps': 49746, 'loss/train': 1.1861746311187744} -11/07/2021 04:14:39 - INFO - __main__ - Step 49748: {'lr': 0.00038221819357618967, 'samples': 9551616, 'steps': 49747, 'loss/train': 1.2957367897033691} -11/07/2021 04:14:39 - INFO - __main__ - Step 49749: {'lr': 0.0003822136897065389, 'samples': 9551808, 'steps': 49748, 'loss/train': 1.6322989463806152} -11/07/2021 04:14:40 - INFO - __main__ - Step 49750: {'lr': 0.0003822091857773148, 'samples': 9552000, 'steps': 49749, 'loss/train': 1.41116464138031} -11/07/2021 04:14:41 - INFO - __main__ - Step 49751: {'lr': 0.00038220468178851917, 'samples': 9552192, 'steps': 49750, 'loss/train': 1.1397852897644043} -11/07/2021 04:14:41 - INFO - __main__ - Step 49752: {'lr': 0.00038220017774015427, 'samples': 9552384, 'steps': 49751, 'loss/train': 1.9566864967346191} -11/07/2021 04:14:41 - INFO - __main__ - Step 49753: {'lr': 0.00038219567363222183, 'samples': 9552576, 'steps': 49752, 'loss/train': 1.3994569778442383} -11/07/2021 04:14:42 - INFO - __main__ - Step 49754: {'lr': 0.00038219116946472425, 'samples': 9552768, 'steps': 49753, 'loss/train': 1.2265424728393555} -11/07/2021 04:14:43 - INFO - __main__ - Step 49755: {'lr': 0.0003821866652376633, 'samples': 9552960, 'steps': 49754, 'loss/train': 1.6414146423339844} -11/07/2021 04:14:43 - INFO - __main__ - Step 49756: {'lr': 0.0003821821609510411, 'samples': 9553152, 'steps': 49755, 'loss/train': 1.7572424411773682} -11/07/2021 04:14:44 - INFO - __main__ - Step 49757: {'lr': 0.0003821776566048596, 'samples': 9553344, 'steps': 49756, 'loss/train': 1.6133787631988525} -11/07/2021 04:14:44 - INFO - __main__ - Step 49758: {'lr': 0.0003821731521991209, 'samples': 9553536, 'steps': 49757, 'loss/train': 0.19680075347423553} -11/07/2021 04:14:44 - INFO - __main__ - Step 49759: {'lr': 0.00038216864773382703, 'samples': 9553728, 'steps': 49758, 'loss/train': 1.293948769569397} -11/07/2021 04:14:46 - INFO - __main__ - Step 49760: {'lr': 0.00038216414320898004, 'samples': 9553920, 'steps': 49759, 'loss/train': 1.4094274044036865} -11/07/2021 04:14:46 - INFO - __main__ - Step 49761: {'lr': 0.0003821596386245819, 'samples': 9554112, 'steps': 49760, 'loss/train': 1.4295532703399658} -11/07/2021 04:14:46 - INFO - __main__ - Step 49762: {'lr': 0.00038215513398063465, 'samples': 9554304, 'steps': 49761, 'loss/train': 1.2866480350494385} -11/07/2021 04:14:47 - INFO - __main__ - Step 49763: {'lr': 0.00038215062927714037, 'samples': 9554496, 'steps': 49762, 'loss/train': 1.7364535331726074} -11/07/2021 04:14:47 - INFO - __main__ - Step 49764: {'lr': 0.000382146124514101, 'samples': 9554688, 'steps': 49763, 'loss/train': 1.5931779146194458} -11/07/2021 04:14:48 - INFO - __main__ - Step 49765: {'lr': 0.00038214161969151865, 'samples': 9554880, 'steps': 49764, 'loss/train': 1.1106199026107788} -11/07/2021 04:14:48 - INFO - __main__ - Step 49766: {'lr': 0.0003821371148093954, 'samples': 9555072, 'steps': 49765, 'loss/train': 1.1809937953948975} -11/07/2021 04:14:49 - INFO - __main__ - Step 49767: {'lr': 0.0003821326098677331, 'samples': 9555264, 'steps': 49766, 'loss/train': 1.4365804195404053} -11/07/2021 04:14:49 - INFO - __main__ - Step 49768: {'lr': 0.00038212810486653394, 'samples': 9555456, 'steps': 49767, 'loss/train': 1.1563007831573486} -11/07/2021 04:14:49 - INFO - __main__ - Step 49769: {'lr': 0.0003821235998057999, 'samples': 9555648, 'steps': 49768, 'loss/train': 1.485763430595398} -11/07/2021 04:14:50 - INFO - __main__ - Step 49770: {'lr': 0.00038211909468553295, 'samples': 9555840, 'steps': 49769, 'loss/train': 1.531764030456543} -11/07/2021 04:14:51 - INFO - __main__ - Step 49771: {'lr': 0.00038211458950573526, 'samples': 9556032, 'steps': 49770, 'loss/train': 1.1895573139190674} -11/07/2021 04:14:51 - INFO - __main__ - Step 49772: {'lr': 0.0003821100842664087, 'samples': 9556224, 'steps': 49771, 'loss/train': 1.6334819793701172} -11/07/2021 04:14:51 - INFO - __main__ - Step 49773: {'lr': 0.00038210557896755536, 'samples': 9556416, 'steps': 49772, 'loss/train': 1.3276512622833252} -11/07/2021 04:14:52 - INFO - __main__ - Step 49774: {'lr': 0.0003821010736091774, 'samples': 9556608, 'steps': 49773, 'loss/train': 1.833406686782837} -11/07/2021 04:14:52 - INFO - __main__ - Step 49775: {'lr': 0.00038209656819127664, 'samples': 9556800, 'steps': 49774, 'loss/train': 1.2205287218093872} -11/07/2021 04:14:53 - INFO - __main__ - Step 49776: {'lr': 0.0003820920627138552, 'samples': 9556992, 'steps': 49775, 'loss/train': 1.4490100145339966} -11/07/2021 04:14:54 - INFO - __main__ - Step 49777: {'lr': 0.00038208755717691515, 'samples': 9557184, 'steps': 49776, 'loss/train': 1.194211483001709} -11/07/2021 04:14:54 - INFO - __main__ - Step 49778: {'lr': 0.00038208305158045846, 'samples': 9557376, 'steps': 49777, 'loss/train': 1.0601788759231567} -11/07/2021 04:14:54 - INFO - __main__ - Step 49779: {'lr': 0.0003820785459244872, 'samples': 9557568, 'steps': 49778, 'loss/train': 1.5217045545578003} -11/07/2021 04:14:55 - INFO - __main__ - Step 49780: {'lr': 0.00038207404020900343, 'samples': 9557760, 'steps': 49779, 'loss/train': 1.3851622343063354} -11/07/2021 04:14:56 - INFO - __main__ - Step 49781: {'lr': 0.0003820695344340091, 'samples': 9557952, 'steps': 49780, 'loss/train': 0.9521015882492065} -11/07/2021 04:14:56 - INFO - __main__ - Step 49782: {'lr': 0.00038206502859950624, 'samples': 9558144, 'steps': 49781, 'loss/train': 0.9233091473579407} -11/07/2021 04:14:56 - INFO - __main__ - Step 49783: {'lr': 0.000382060522705497, 'samples': 9558336, 'steps': 49782, 'loss/train': 1.2780437469482422} -11/07/2021 04:14:57 - INFO - __main__ - Step 49784: {'lr': 0.0003820560167519832, 'samples': 9558528, 'steps': 49783, 'loss/train': 1.763771891593933} -11/07/2021 04:14:57 - INFO - __main__ - Step 49785: {'lr': 0.000382051510738967, 'samples': 9558720, 'steps': 49784, 'loss/train': 1.419110655784607} -11/07/2021 04:14:58 - INFO - __main__ - Step 49786: {'lr': 0.0003820470046664506, 'samples': 9558912, 'steps': 49785, 'loss/train': 1.7713582515716553} -11/07/2021 04:14:58 - INFO - __main__ - Step 49787: {'lr': 0.0003820424985344357, 'samples': 9559104, 'steps': 49786, 'loss/train': 1.8338513374328613} -11/07/2021 04:14:59 - INFO - __main__ - Step 49788: {'lr': 0.0003820379923429246, 'samples': 9559296, 'steps': 49787, 'loss/train': 1.5551120042800903} -11/07/2021 04:14:59 - INFO - __main__ - Step 49789: {'lr': 0.00038203348609191915, 'samples': 9559488, 'steps': 49788, 'loss/train': 1.0834661722183228} -11/07/2021 04:15:00 - INFO - __main__ - Step 49790: {'lr': 0.00038202897978142144, 'samples': 9559680, 'steps': 49789, 'loss/train': 1.7385804653167725} -11/07/2021 04:15:01 - INFO - __main__ - Step 49791: {'lr': 0.00038202447341143355, 'samples': 9559872, 'steps': 49790, 'loss/train': 1.4318112134933472} -11/07/2021 04:15:01 - INFO - __main__ - Step 49792: {'lr': 0.0003820199669819574, 'samples': 9560064, 'steps': 49791, 'loss/train': 0.9425163269042969} -11/07/2021 04:15:01 - INFO - __main__ - Step 49793: {'lr': 0.00038201546049299517, 'samples': 9560256, 'steps': 49792, 'loss/train': 1.0969769954681396} -11/07/2021 04:15:02 - INFO - __main__ - Step 49794: {'lr': 0.00038201095394454874, 'samples': 9560448, 'steps': 49793, 'loss/train': 1.5377111434936523} -11/07/2021 04:15:02 - INFO - __main__ - Step 49795: {'lr': 0.0003820064473366203, 'samples': 9560640, 'steps': 49794, 'loss/train': 1.321353793144226} -11/07/2021 04:15:03 - INFO - __main__ - Step 49796: {'lr': 0.00038200194066921166, 'samples': 9560832, 'steps': 49795, 'loss/train': 1.2820968627929688} -11/07/2021 04:15:03 - INFO - __main__ - Step 49797: {'lr': 0.00038199743394232513, 'samples': 9561024, 'steps': 49796, 'loss/train': 1.299493670463562} -11/07/2021 04:15:04 - INFO - __main__ - Step 49798: {'lr': 0.0003819929271559625, 'samples': 9561216, 'steps': 49797, 'loss/train': 1.5363938808441162} -11/07/2021 04:15:04 - INFO - __main__ - Step 49799: {'lr': 0.00038198842031012594, 'samples': 9561408, 'steps': 49798, 'loss/train': 1.254093050956726} -11/07/2021 04:15:04 - INFO - __main__ - Step 49800: {'lr': 0.00038198391340481735, 'samples': 9561600, 'steps': 49799, 'loss/train': 1.1182819604873657} -11/07/2021 04:15:05 - INFO - __main__ - Step 49801: {'lr': 0.0003819794064400389, 'samples': 9561792, 'steps': 49800, 'loss/train': 1.2071176767349243} -11/07/2021 04:15:06 - INFO - __main__ - Step 49802: {'lr': 0.00038197489941579264, 'samples': 9561984, 'steps': 49801, 'loss/train': 1.5347254276275635} -11/07/2021 04:15:06 - INFO - __main__ - Step 49803: {'lr': 0.00038197039233208043, 'samples': 9562176, 'steps': 49802, 'loss/train': 1.8398714065551758} -11/07/2021 04:15:06 - INFO - __main__ - Step 49804: {'lr': 0.0003819658851889044, 'samples': 9562368, 'steps': 49803, 'loss/train': 1.399654507637024} -11/07/2021 04:15:07 - INFO - __main__ - Step 49805: {'lr': 0.00038196137798626663, 'samples': 9562560, 'steps': 49804, 'loss/train': 0.5613115429878235} -11/07/2021 04:15:08 - INFO - __main__ - Step 49806: {'lr': 0.00038195687072416906, 'samples': 9562752, 'steps': 49805, 'loss/train': 1.5593262910842896} -11/07/2021 04:15:08 - INFO - __main__ - Step 49807: {'lr': 0.00038195236340261374, 'samples': 9562944, 'steps': 49806, 'loss/train': 1.1653640270233154} -11/07/2021 04:15:08 - INFO - __main__ - Step 49808: {'lr': 0.0003819478560216029, 'samples': 9563136, 'steps': 49807, 'loss/train': 1.3279402256011963} -11/07/2021 04:15:09 - INFO - __main__ - Step 49809: {'lr': 0.00038194334858113817, 'samples': 9563328, 'steps': 49808, 'loss/train': 1.3673834800720215} -11/07/2021 04:15:09 - INFO - __main__ - Step 49810: {'lr': 0.0003819388410812219, 'samples': 9563520, 'steps': 49809, 'loss/train': 1.2251176834106445} -11/07/2021 04:15:10 - INFO - __main__ - Step 49811: {'lr': 0.00038193433352185597, 'samples': 9563712, 'steps': 49810, 'loss/train': 2.7023043632507324} -11/07/2021 04:15:11 - INFO - __main__ - Step 49812: {'lr': 0.0003819298259030425, 'samples': 9563904, 'steps': 49811, 'loss/train': 1.3174453973770142} -11/07/2021 04:15:11 - INFO - __main__ - Step 49813: {'lr': 0.00038192531822478347, 'samples': 9564096, 'steps': 49812, 'loss/train': 1.591962456703186} -11/07/2021 04:15:11 - INFO - __main__ - Step 49814: {'lr': 0.000381920810487081, 'samples': 9564288, 'steps': 49813, 'loss/train': 1.6464207172393799} -11/07/2021 04:15:12 - INFO - __main__ - Step 49815: {'lr': 0.0003819163026899369, 'samples': 9564480, 'steps': 49814, 'loss/train': 1.0955125093460083} -11/07/2021 04:15:13 - INFO - __main__ - Step 49816: {'lr': 0.00038191179483335346, 'samples': 9564672, 'steps': 49815, 'loss/train': 1.1044607162475586} -11/07/2021 04:15:13 - INFO - __main__ - Step 49817: {'lr': 0.0003819072869173326, 'samples': 9564864, 'steps': 49816, 'loss/train': 0.9763187766075134} -11/07/2021 04:15:13 - INFO - __main__ - Step 49818: {'lr': 0.0003819027789418764, 'samples': 9565056, 'steps': 49817, 'loss/train': 1.5007073879241943} -11/07/2021 04:15:14 - INFO - __main__ - Step 49819: {'lr': 0.0003818982709069867, 'samples': 9565248, 'steps': 49818, 'loss/train': 1.4065707921981812} -11/07/2021 04:15:14 - INFO - __main__ - Step 49820: {'lr': 0.00038189376281266575, 'samples': 9565440, 'steps': 49819, 'loss/train': 1.1974198818206787} -11/07/2021 04:15:14 - INFO - __main__ - Step 49821: {'lr': 0.00038188925465891554, 'samples': 9565632, 'steps': 49820, 'loss/train': 1.432716727256775} -11/07/2021 04:15:15 - INFO - __main__ - Step 49822: {'lr': 0.000381884746445738, 'samples': 9565824, 'steps': 49821, 'loss/train': 1.4346973896026611} -11/07/2021 04:15:16 - INFO - __main__ - Step 49823: {'lr': 0.0003818802381731353, 'samples': 9566016, 'steps': 49822, 'loss/train': 1.4307574033737183} -11/07/2021 04:15:16 - INFO - __main__ - Step 49824: {'lr': 0.00038187572984110937, 'samples': 9566208, 'steps': 49823, 'loss/train': 1.0929710865020752} -11/07/2021 04:15:16 - INFO - __main__ - Step 49825: {'lr': 0.00038187122144966225, 'samples': 9566400, 'steps': 49824, 'loss/train': 1.65118408203125} -11/07/2021 04:15:17 - INFO - __main__ - Step 49826: {'lr': 0.000381866712998796, 'samples': 9566592, 'steps': 49825, 'loss/train': 1.4581557512283325} -11/07/2021 04:15:18 - INFO - __main__ - Step 49827: {'lr': 0.0003818622044885126, 'samples': 9566784, 'steps': 49826, 'loss/train': 1.3367974758148193} -11/07/2021 04:15:18 - INFO - __main__ - Step 49828: {'lr': 0.00038185769591881426, 'samples': 9566976, 'steps': 49827, 'loss/train': 2.494285821914673} -11/07/2021 04:15:19 - INFO - __main__ - Step 49829: {'lr': 0.00038185318728970277, 'samples': 9567168, 'steps': 49828, 'loss/train': 1.6039881706237793} -11/07/2021 04:15:19 - INFO - __main__ - Step 49830: {'lr': 0.00038184867860118036, 'samples': 9567360, 'steps': 49829, 'loss/train': 1.405824899673462} -11/07/2021 04:15:19 - INFO - __main__ - Step 49831: {'lr': 0.0003818441698532488, 'samples': 9567552, 'steps': 49830, 'loss/train': 1.1581023931503296} -11/07/2021 04:15:21 - INFO - __main__ - Step 49832: {'lr': 0.00038183966104591037, 'samples': 9567744, 'steps': 49831, 'loss/train': 1.0995320081710815} -11/07/2021 04:15:21 - INFO - __main__ - Step 49833: {'lr': 0.0003818351521791671, 'samples': 9567936, 'steps': 49832, 'loss/train': 1.6082440614700317} -11/07/2021 04:15:21 - INFO - __main__ - Step 49834: {'lr': 0.0003818306432530209, 'samples': 9568128, 'steps': 49833, 'loss/train': 1.2923341989517212} -11/07/2021 04:15:22 - INFO - __main__ - Step 49835: {'lr': 0.0003818261342674738, 'samples': 9568320, 'steps': 49834, 'loss/train': 0.09563875943422318} -11/07/2021 04:15:22 - INFO - __main__ - Step 49836: {'lr': 0.00038182162522252795, 'samples': 9568512, 'steps': 49835, 'loss/train': 1.1273518800735474} -11/07/2021 04:15:23 - INFO - __main__ - Step 49837: {'lr': 0.0003818171161181853, 'samples': 9568704, 'steps': 49836, 'loss/train': 1.4690061807632446} -11/07/2021 04:15:23 - INFO - __main__ - Step 49838: {'lr': 0.00038181260695444784, 'samples': 9568896, 'steps': 49837, 'loss/train': 1.4633288383483887} -11/07/2021 04:15:24 - INFO - __main__ - Step 49839: {'lr': 0.00038180809773131764, 'samples': 9569088, 'steps': 49838, 'loss/train': 1.6124905347824097} -11/07/2021 04:15:24 - INFO - __main__ - Step 49840: {'lr': 0.0003818035884487968, 'samples': 9569280, 'steps': 49839, 'loss/train': 1.2007817029953003} -11/07/2021 04:15:24 - INFO - __main__ - Step 49841: {'lr': 0.0003817990791068873, 'samples': 9569472, 'steps': 49840, 'loss/train': 1.1484363079071045} -11/07/2021 04:15:25 - INFO - __main__ - Step 49842: {'lr': 0.00038179456970559116, 'samples': 9569664, 'steps': 49841, 'loss/train': 1.6722135543823242} -11/07/2021 04:15:26 - INFO - __main__ - Step 49843: {'lr': 0.0003817900602449104, 'samples': 9569856, 'steps': 49842, 'loss/train': 1.3057899475097656} -11/07/2021 04:15:26 - INFO - __main__ - Step 49844: {'lr': 0.0003817855507248471, 'samples': 9570048, 'steps': 49843, 'loss/train': 0.6849073767662048} -11/07/2021 04:15:26 - INFO - __main__ - Step 49845: {'lr': 0.00038178104114540326, 'samples': 9570240, 'steps': 49844, 'loss/train': 1.0210819244384766} -11/07/2021 04:15:27 - INFO - __main__ - Step 49846: {'lr': 0.0003817765315065809, 'samples': 9570432, 'steps': 49845, 'loss/train': 1.4170243740081787} -11/07/2021 04:15:28 - INFO - __main__ - Step 49847: {'lr': 0.000381772021808382, 'samples': 9570624, 'steps': 49846, 'loss/train': 1.5046032667160034} -11/07/2021 04:15:28 - INFO - __main__ - Step 49848: {'lr': 0.00038176751205080885, 'samples': 9570816, 'steps': 49847, 'loss/train': 1.5529192686080933} -11/07/2021 04:15:28 - INFO - __main__ - Step 49849: {'lr': 0.00038176300223386313, 'samples': 9571008, 'steps': 49848, 'loss/train': 1.2158565521240234} -11/07/2021 04:15:29 - INFO - __main__ - Step 49850: {'lr': 0.00038175849235754704, 'samples': 9571200, 'steps': 49849, 'loss/train': 1.4324151277542114} -11/07/2021 04:15:29 - INFO - __main__ - Step 49851: {'lr': 0.00038175398242186264, 'samples': 9571392, 'steps': 49850, 'loss/train': 1.5142985582351685} -11/07/2021 04:15:30 - INFO - __main__ - Step 49852: {'lr': 0.00038174947242681194, 'samples': 9571584, 'steps': 49851, 'loss/train': 1.4615650177001953} -11/07/2021 04:15:31 - INFO - __main__ - Step 49853: {'lr': 0.000381744962372397, 'samples': 9571776, 'steps': 49852, 'loss/train': 1.3350597620010376} -11/07/2021 04:15:31 - INFO - __main__ - Step 49854: {'lr': 0.00038174045225861976, 'samples': 9571968, 'steps': 49853, 'loss/train': 1.1813478469848633} -11/07/2021 04:15:31 - INFO - __main__ - Step 49855: {'lr': 0.00038173594208548234, 'samples': 9572160, 'steps': 49854, 'loss/train': 1.561554193496704} -11/07/2021 04:15:32 - INFO - __main__ - Step 49856: {'lr': 0.00038173143185298665, 'samples': 9572352, 'steps': 49855, 'loss/train': 0.08423556387424469} -11/07/2021 04:15:32 - INFO - __main__ - Step 49857: {'lr': 0.00038172692156113484, 'samples': 9572544, 'steps': 49856, 'loss/train': 1.0528861284255981} -11/07/2021 04:15:33 - INFO - __main__ - Step 49858: {'lr': 0.000381722411209929, 'samples': 9572736, 'steps': 49857, 'loss/train': 0.5608619451522827} -11/07/2021 04:15:33 - INFO - __main__ - Step 49859: {'lr': 0.00038171790079937097, 'samples': 9572928, 'steps': 49858, 'loss/train': 1.4621555805206299} -11/07/2021 04:15:34 - INFO - __main__ - Step 49860: {'lr': 0.000381713390329463, 'samples': 9573120, 'steps': 49859, 'loss/train': 1.6315885782241821} -11/07/2021 04:15:34 - INFO - __main__ - Step 49861: {'lr': 0.00038170887980020683, 'samples': 9573312, 'steps': 49860, 'loss/train': 1.1106321811676025} -11/07/2021 04:15:34 - INFO - __main__ - Step 49862: {'lr': 0.0003817043692116049, 'samples': 9573504, 'steps': 49861, 'loss/train': 1.6139997243881226} -11/07/2021 04:15:36 - INFO - __main__ - Step 49863: {'lr': 0.00038169985856365885, 'samples': 9573696, 'steps': 49862, 'loss/train': 1.5891435146331787} -11/07/2021 04:15:36 - INFO - __main__ - Step 49864: {'lr': 0.00038169534785637097, 'samples': 9573888, 'steps': 49863, 'loss/train': 1.7982343435287476} -11/07/2021 04:15:36 - INFO - __main__ - Step 49865: {'lr': 0.00038169083708974313, 'samples': 9574080, 'steps': 49864, 'loss/train': 1.48331618309021} -11/07/2021 04:15:37 - INFO - __main__ - Step 49866: {'lr': 0.0003816863262637774, 'samples': 9574272, 'steps': 49865, 'loss/train': 1.1913880109786987} -11/07/2021 04:15:37 - INFO - __main__ - Step 49867: {'lr': 0.0003816818153784759, 'samples': 9574464, 'steps': 49866, 'loss/train': 0.8057406544685364} -11/07/2021 04:15:38 - INFO - __main__ - Step 49868: {'lr': 0.00038167730443384063, 'samples': 9574656, 'steps': 49867, 'loss/train': 1.673979640007019} -11/07/2021 04:15:38 - INFO - __main__ - Step 49869: {'lr': 0.0003816727934298736, 'samples': 9574848, 'steps': 49868, 'loss/train': 1.4075284004211426} -11/07/2021 04:15:39 - INFO - __main__ - Step 49870: {'lr': 0.0003816682823665768, 'samples': 9575040, 'steps': 49869, 'loss/train': 1.7056241035461426} -11/07/2021 04:15:39 - INFO - __main__ - Step 49871: {'lr': 0.0003816637712439523, 'samples': 9575232, 'steps': 49870, 'loss/train': 1.5761786699295044} -11/07/2021 04:15:39 - INFO - __main__ - Step 49872: {'lr': 0.0003816592600620021, 'samples': 9575424, 'steps': 49871, 'loss/train': 1.599300742149353} -11/07/2021 04:15:40 - INFO - __main__ - Step 49873: {'lr': 0.0003816547488207284, 'samples': 9575616, 'steps': 49872, 'loss/train': 1.250908613204956} -11/07/2021 04:15:41 - INFO - __main__ - Step 49874: {'lr': 0.00038165023752013294, 'samples': 9575808, 'steps': 49873, 'loss/train': 1.2514135837554932} -11/07/2021 04:15:41 - INFO - __main__ - Step 49875: {'lr': 0.00038164572616021807, 'samples': 9576000, 'steps': 49874, 'loss/train': 1.779987096786499} -11/07/2021 04:15:41 - INFO - __main__ - Step 49876: {'lr': 0.0003816412147409856, 'samples': 9576192, 'steps': 49875, 'loss/train': 1.3635135889053345} -11/07/2021 04:15:42 - INFO - __main__ - Step 49877: {'lr': 0.0003816367032624376, 'samples': 9576384, 'steps': 49876, 'loss/train': 1.3634365797042847} -11/07/2021 04:15:43 - INFO - __main__ - Step 49878: {'lr': 0.0003816321917245761, 'samples': 9576576, 'steps': 49877, 'loss/train': 1.286026120185852} -11/07/2021 04:15:44 - INFO - __main__ - Step 49879: {'lr': 0.00038162768012740323, 'samples': 9576768, 'steps': 49878, 'loss/train': 1.2849881649017334} -11/07/2021 04:15:44 - INFO - __main__ - Step 49880: {'lr': 0.00038162316847092096, 'samples': 9576960, 'steps': 49879, 'loss/train': 1.0298362970352173} -11/07/2021 04:15:45 - INFO - __main__ - Step 49881: {'lr': 0.0003816186567551313, 'samples': 9577152, 'steps': 49880, 'loss/train': 0.4664343297481537} -11/07/2021 04:15:45 - INFO - __main__ - Step 49882: {'lr': 0.0003816141449800364, 'samples': 9577344, 'steps': 49881, 'loss/train': 1.3210618495941162} -11/07/2021 04:15:46 - INFO - __main__ - Step 49883: {'lr': 0.00038160963314563806, 'samples': 9577536, 'steps': 49882, 'loss/train': 1.3121057748794556} -11/07/2021 04:15:46 - INFO - __main__ - Step 49884: {'lr': 0.00038160512125193853, 'samples': 9577728, 'steps': 49883, 'loss/train': 1.4728535413742065} -11/07/2021 04:15:47 - INFO - __main__ - Step 49885: {'lr': 0.0003816006092989397, 'samples': 9577920, 'steps': 49884, 'loss/train': 1.027085542678833} -11/07/2021 04:15:47 - INFO - __main__ - Step 49886: {'lr': 0.0003815960972866437, 'samples': 9578112, 'steps': 49885, 'loss/train': 0.914968729019165} -11/07/2021 04:15:47 - INFO - __main__ - Step 49887: {'lr': 0.00038159158521505255, 'samples': 9578304, 'steps': 49886, 'loss/train': 1.4157140254974365} -11/07/2021 04:15:48 - INFO - __main__ - Step 49888: {'lr': 0.0003815870730841683, 'samples': 9578496, 'steps': 49887, 'loss/train': 1.4689892530441284} -11/07/2021 04:15:49 - INFO - __main__ - Step 49889: {'lr': 0.00038158256089399287, 'samples': 9578688, 'steps': 49888, 'loss/train': 1.092774748802185} -11/07/2021 04:15:49 - INFO - __main__ - Step 49890: {'lr': 0.0003815780486445284, 'samples': 9578880, 'steps': 49889, 'loss/train': 1.4610096216201782} -11/07/2021 04:15:49 - INFO - __main__ - Step 49891: {'lr': 0.00038157353633577686, 'samples': 9579072, 'steps': 49890, 'loss/train': 1.5496063232421875} -11/07/2021 04:15:50 - INFO - __main__ - Step 49892: {'lr': 0.0003815690239677403, 'samples': 9579264, 'steps': 49891, 'loss/train': 0.18603570759296417} -11/07/2021 04:15:51 - INFO - __main__ - Step 49893: {'lr': 0.00038156451154042084, 'samples': 9579456, 'steps': 49892, 'loss/train': 1.3252862691879272} -11/07/2021 04:15:51 - INFO - __main__ - Step 49894: {'lr': 0.0003815599990538203, 'samples': 9579648, 'steps': 49893, 'loss/train': 1.69198739528656} -11/07/2021 04:15:52 - INFO - __main__ - Step 49895: {'lr': 0.00038155548650794103, 'samples': 9579840, 'steps': 49894, 'loss/train': 1.2539637088775635} -11/07/2021 04:15:52 - INFO - __main__ - Step 49896: {'lr': 0.00038155097390278484, 'samples': 9580032, 'steps': 49895, 'loss/train': 1.6797884702682495} -11/07/2021 04:15:52 - INFO - __main__ - Step 49897: {'lr': 0.0003815464612383538, 'samples': 9580224, 'steps': 49896, 'loss/train': 1.6274105310440063} -11/07/2021 04:15:53 - INFO - __main__ - Step 49898: {'lr': 0.0003815419485146499, 'samples': 9580416, 'steps': 49897, 'loss/train': 1.5162203311920166} -11/07/2021 04:15:54 - INFO - __main__ - Step 49899: {'lr': 0.0003815374357316753, 'samples': 9580608, 'steps': 49898, 'loss/train': 1.5220880508422852} -11/07/2021 04:15:54 - INFO - __main__ - Step 49900: {'lr': 0.0003815329228894319, 'samples': 9580800, 'steps': 49899, 'loss/train': 1.3859000205993652} -11/07/2021 04:15:54 - INFO - __main__ - Step 49901: {'lr': 0.0003815284099879218, 'samples': 9580992, 'steps': 49900, 'loss/train': 1.3224958181381226} -11/07/2021 04:15:55 - INFO - __main__ - Step 49902: {'lr': 0.00038152389702714705, 'samples': 9581184, 'steps': 49901, 'loss/train': 1.0632014274597168} -11/07/2021 04:15:56 - INFO - __main__ - Step 49903: {'lr': 0.0003815193840071097, 'samples': 9581376, 'steps': 49902, 'loss/train': 1.4790116548538208} -11/07/2021 04:15:56 - INFO - __main__ - Step 49904: {'lr': 0.0003815148709278117, 'samples': 9581568, 'steps': 49903, 'loss/train': 1.837923526763916} -11/07/2021 04:15:56 - INFO - __main__ - Step 49905: {'lr': 0.00038151035778925514, 'samples': 9581760, 'steps': 49904, 'loss/train': 1.3551061153411865} -11/07/2021 04:15:57 - INFO - __main__ - Step 49906: {'lr': 0.000381505844591442, 'samples': 9581952, 'steps': 49905, 'loss/train': 1.1105365753173828} -11/07/2021 04:15:57 - INFO - __main__ - Step 49907: {'lr': 0.0003815013313343744, 'samples': 9582144, 'steps': 49906, 'loss/train': 1.5107008218765259} -11/07/2021 04:15:58 - INFO - __main__ - Step 49908: {'lr': 0.0003814968180180544, 'samples': 9582336, 'steps': 49907, 'loss/train': 1.464564323425293} -11/07/2021 04:15:59 - INFO - __main__ - Step 49909: {'lr': 0.00038149230464248386, 'samples': 9582528, 'steps': 49908, 'loss/train': 1.664136528968811} -11/07/2021 04:15:59 - INFO - __main__ - Step 49910: {'lr': 0.000381487791207665, 'samples': 9582720, 'steps': 49909, 'loss/train': 1.5816500186920166} -11/07/2021 04:15:59 - INFO - __main__ - Step 49911: {'lr': 0.0003814832777135997, 'samples': 9582912, 'steps': 49910, 'loss/train': 1.1990145444869995} -11/07/2021 04:16:00 - INFO - __main__ - Step 49912: {'lr': 0.00038147876416029004, 'samples': 9583104, 'steps': 49911, 'loss/train': 1.7254343032836914} -11/07/2021 04:16:00 - INFO - __main__ - Step 49913: {'lr': 0.0003814742505477381, 'samples': 9583296, 'steps': 49912, 'loss/train': 1.4630495309829712} -11/07/2021 04:16:01 - INFO - __main__ - Step 49914: {'lr': 0.0003814697368759459, 'samples': 9583488, 'steps': 49913, 'loss/train': 1.644455075263977} -11/07/2021 04:16:01 - INFO - __main__ - Step 49915: {'lr': 0.0003814652231449155, 'samples': 9583680, 'steps': 49914, 'loss/train': 1.118870735168457} -11/07/2021 04:16:02 - INFO - __main__ - Step 49916: {'lr': 0.0003814607093546489, 'samples': 9583872, 'steps': 49915, 'loss/train': 1.2629168033599854} -11/07/2021 04:16:02 - INFO - __main__ - Step 49917: {'lr': 0.0003814561955051481, 'samples': 9584064, 'steps': 49916, 'loss/train': 1.5991111993789673} -11/07/2021 04:16:02 - INFO - __main__ - Step 49918: {'lr': 0.00038145168159641515, 'samples': 9584256, 'steps': 49917, 'loss/train': 1.3697715997695923} -11/07/2021 04:16:03 - INFO - __main__ - Step 49919: {'lr': 0.0003814471676284521, 'samples': 9584448, 'steps': 49918, 'loss/train': 1.385772705078125} -11/07/2021 04:16:04 - INFO - __main__ - Step 49920: {'lr': 0.00038144265360126107, 'samples': 9584640, 'steps': 49919, 'loss/train': 1.071580410003662} -11/07/2021 04:16:04 - INFO - __main__ - Step 49921: {'lr': 0.00038143813951484396, 'samples': 9584832, 'steps': 49920, 'loss/train': 1.748077392578125} -11/07/2021 04:16:05 - INFO - __main__ - Step 49922: {'lr': 0.0003814336253692028, 'samples': 9585024, 'steps': 49921, 'loss/train': 0.9060306549072266} -11/07/2021 04:16:05 - INFO - __main__ - Step 49923: {'lr': 0.0003814291111643397, 'samples': 9585216, 'steps': 49922, 'loss/train': 1.5653313398361206} -11/07/2021 04:16:06 - INFO - __main__ - Step 49924: {'lr': 0.00038142459690025665, 'samples': 9585408, 'steps': 49923, 'loss/train': 1.4163196086883545} -11/07/2021 04:16:06 - INFO - __main__ - Step 49925: {'lr': 0.0003814200825769558, 'samples': 9585600, 'steps': 49924, 'loss/train': 1.6841281652450562} -11/07/2021 04:16:07 - INFO - __main__ - Step 49926: {'lr': 0.000381415568194439, 'samples': 9585792, 'steps': 49925, 'loss/train': 1.4563446044921875} -11/07/2021 04:16:07 - INFO - __main__ - Step 49927: {'lr': 0.00038141105375270846, 'samples': 9585984, 'steps': 49926, 'loss/train': 1.2546554803848267} -11/07/2021 04:16:07 - INFO - __main__ - Step 49928: {'lr': 0.00038140653925176606, 'samples': 9586176, 'steps': 49927, 'loss/train': 1.588482141494751} -11/07/2021 04:16:08 - INFO - __main__ - Step 49929: {'lr': 0.0003814020246916139, 'samples': 9586368, 'steps': 49928, 'loss/train': 0.6331830620765686} -11/07/2021 04:16:09 - INFO - __main__ - Step 49930: {'lr': 0.000381397510072254, 'samples': 9586560, 'steps': 49929, 'loss/train': 0.9107598662376404} -11/07/2021 04:16:09 - INFO - __main__ - Step 49931: {'lr': 0.0003813929953936884, 'samples': 9586752, 'steps': 49930, 'loss/train': 1.4552175998687744} -11/07/2021 04:16:09 - INFO - __main__ - Step 49932: {'lr': 0.00038138848065591923, 'samples': 9586944, 'steps': 49931, 'loss/train': 1.0978375673294067} -11/07/2021 04:16:10 - INFO - __main__ - Step 49933: {'lr': 0.00038138396585894843, 'samples': 9587136, 'steps': 49932, 'loss/train': 1.5072349309921265} -11/07/2021 04:16:11 - INFO - __main__ - Step 49934: {'lr': 0.0003813794510027779, 'samples': 9587328, 'steps': 49933, 'loss/train': 1.138684868812561} -11/07/2021 04:16:11 - INFO - __main__ - Step 49935: {'lr': 0.00038137493608741, 'samples': 9587520, 'steps': 49934, 'loss/train': 1.2428410053253174} -11/07/2021 04:16:12 - INFO - __main__ - Step 49936: {'lr': 0.0003813704211128465, 'samples': 9587712, 'steps': 49935, 'loss/train': 0.08512834459543228} -11/07/2021 04:16:12 - INFO - __main__ - Step 49937: {'lr': 0.0003813659060790895, 'samples': 9587904, 'steps': 49936, 'loss/train': 1.707636833190918} -11/07/2021 04:16:12 - INFO - __main__ - Step 49938: {'lr': 0.00038136139098614107, 'samples': 9588096, 'steps': 49937, 'loss/train': 1.393393874168396} -11/07/2021 04:16:13 - INFO - __main__ - Step 49939: {'lr': 0.00038135687583400326, 'samples': 9588288, 'steps': 49938, 'loss/train': 1.4983201026916504} -11/07/2021 04:16:14 - INFO - __main__ - Step 49940: {'lr': 0.000381352360622678, 'samples': 9588480, 'steps': 49939, 'loss/train': 1.282761812210083} -11/07/2021 04:16:14 - INFO - __main__ - Step 49941: {'lr': 0.00038134784535216737, 'samples': 9588672, 'steps': 49940, 'loss/train': 1.4226652383804321} -11/07/2021 04:16:14 - INFO - __main__ - Step 49942: {'lr': 0.0003813433300224735, 'samples': 9588864, 'steps': 49941, 'loss/train': 1.063042163848877} -11/07/2021 04:16:15 - INFO - __main__ - Step 49943: {'lr': 0.0003813388146335983, 'samples': 9589056, 'steps': 49942, 'loss/train': 1.04142427444458} -11/07/2021 04:16:16 - INFO - __main__ - Step 49944: {'lr': 0.00038133429918554395, 'samples': 9589248, 'steps': 49943, 'loss/train': 1.3146531581878662} -11/07/2021 04:16:16 - INFO - __main__ - Step 49945: {'lr': 0.00038132978367831226, 'samples': 9589440, 'steps': 49944, 'loss/train': 1.3345072269439697} -11/07/2021 04:16:17 - INFO - __main__ - Step 49946: {'lr': 0.00038132526811190547, 'samples': 9589632, 'steps': 49945, 'loss/train': 1.4192546606063843} -11/07/2021 04:16:17 - INFO - __main__ - Step 49947: {'lr': 0.00038132075248632557, 'samples': 9589824, 'steps': 49946, 'loss/train': 1.4883534908294678} -11/07/2021 04:16:17 - INFO - __main__ - Step 49948: {'lr': 0.0003813162368015745, 'samples': 9590016, 'steps': 49947, 'loss/train': 1.16780424118042} -11/07/2021 04:16:18 - INFO - __main__ - Step 49949: {'lr': 0.00038131172105765446, 'samples': 9590208, 'steps': 49948, 'loss/train': 1.5168664455413818} -11/07/2021 04:16:19 - INFO - __main__ - Step 49950: {'lr': 0.0003813072052545673, 'samples': 9590400, 'steps': 49949, 'loss/train': 1.0772747993469238} -11/07/2021 04:16:19 - INFO - __main__ - Step 49951: {'lr': 0.00038130268939231513, 'samples': 9590592, 'steps': 49950, 'loss/train': 1.8183636665344238} -11/07/2021 04:16:19 - INFO - __main__ - Step 49952: {'lr': 0.0003812981734709, 'samples': 9590784, 'steps': 49951, 'loss/train': 0.702171266078949} -11/07/2021 04:16:20 - INFO - __main__ - Step 49953: {'lr': 0.00038129365749032395, 'samples': 9590976, 'steps': 49952, 'loss/train': 1.9576735496520996} -11/07/2021 04:16:21 - INFO - __main__ - Step 49954: {'lr': 0.000381289141450589, 'samples': 9591168, 'steps': 49953, 'loss/train': 2.3979005813598633} -11/07/2021 04:16:21 - INFO - __main__ - Step 49955: {'lr': 0.00038128462535169715, 'samples': 9591360, 'steps': 49954, 'loss/train': 1.3407514095306396} -11/07/2021 04:16:21 - INFO - __main__ - Step 49956: {'lr': 0.00038128010919365066, 'samples': 9591552, 'steps': 49955, 'loss/train': 1.8588253259658813} -11/07/2021 04:16:22 - INFO - __main__ - Step 49957: {'lr': 0.0003812755929764512, 'samples': 9591744, 'steps': 49956, 'loss/train': 1.5412076711654663} -11/07/2021 04:16:22 - INFO - __main__ - Step 49958: {'lr': 0.000381271076700101, 'samples': 9591936, 'steps': 49957, 'loss/train': 1.4377400875091553} -11/07/2021 04:16:23 - INFO - __main__ - Step 49959: {'lr': 0.00038126656036460206, 'samples': 9592128, 'steps': 49958, 'loss/train': 1.0640348196029663} -11/07/2021 04:16:23 - INFO - __main__ - Step 49960: {'lr': 0.0003812620439699565, 'samples': 9592320, 'steps': 49959, 'loss/train': 1.584822177886963} -11/07/2021 04:16:24 - INFO - __main__ - Step 49961: {'lr': 0.00038125752751616625, 'samples': 9592512, 'steps': 49960, 'loss/train': 1.4965132474899292} -11/07/2021 04:16:24 - INFO - __main__ - Step 49962: {'lr': 0.00038125301100323344, 'samples': 9592704, 'steps': 49961, 'loss/train': 1.340742826461792} -11/07/2021 04:16:24 - INFO - __main__ - Step 49963: {'lr': 0.00038124849443116, 'samples': 9592896, 'steps': 49962, 'loss/train': 1.480609655380249} -11/07/2021 04:16:26 - INFO - __main__ - Step 49964: {'lr': 0.000381243977799948, 'samples': 9593088, 'steps': 49963, 'loss/train': 1.2617064714431763} -11/07/2021 04:16:26 - INFO - __main__ - Step 49965: {'lr': 0.0003812394611095995, 'samples': 9593280, 'steps': 49964, 'loss/train': 1.535764217376709} -11/07/2021 04:16:26 - INFO - __main__ - Step 49966: {'lr': 0.0003812349443601165, 'samples': 9593472, 'steps': 49965, 'loss/train': 1.6400853395462036} -11/07/2021 04:16:27 - INFO - __main__ - Step 49967: {'lr': 0.0003812304275515012, 'samples': 9593664, 'steps': 49966, 'loss/train': 1.1503257751464844} -11/07/2021 04:16:27 - INFO - __main__ - Step 49968: {'lr': 0.00038122591068375536, 'samples': 9593856, 'steps': 49967, 'loss/train': 1.3187167644500732} -11/07/2021 04:16:27 - INFO - __main__ - Step 49969: {'lr': 0.00038122139375688116, 'samples': 9594048, 'steps': 49968, 'loss/train': 1.1606495380401611} -11/07/2021 04:16:29 - INFO - __main__ - Step 49970: {'lr': 0.0003812168767708807, 'samples': 9594240, 'steps': 49969, 'loss/train': 0.9344202280044556} -11/07/2021 04:16:29 - INFO - __main__ - Step 49971: {'lr': 0.0003812123597257559, 'samples': 9594432, 'steps': 49970, 'loss/train': 1.361876368522644} -11/07/2021 04:16:29 - INFO - __main__ - Step 49972: {'lr': 0.00038120784262150875, 'samples': 9594624, 'steps': 49971, 'loss/train': 1.2185523509979248} -11/07/2021 04:16:30 - INFO - __main__ - Step 49973: {'lr': 0.0003812033254581414, 'samples': 9594816, 'steps': 49972, 'loss/train': 0.9987174272537231} -11/07/2021 04:16:30 - INFO - __main__ - Step 49974: {'lr': 0.0003811988082356559, 'samples': 9595008, 'steps': 49973, 'loss/train': 1.5329139232635498} -11/07/2021 04:16:31 - INFO - __main__ - Step 49975: {'lr': 0.0003811942909540542, 'samples': 9595200, 'steps': 49974, 'loss/train': 1.565413475036621} -11/07/2021 04:16:31 - INFO - __main__ - Step 49976: {'lr': 0.0003811897736133385, 'samples': 9595392, 'steps': 49975, 'loss/train': 1.2943179607391357} -11/07/2021 04:16:32 - INFO - __main__ - Step 49977: {'lr': 0.0003811852562135106, 'samples': 9595584, 'steps': 49976, 'loss/train': 1.1904795169830322} -11/07/2021 04:16:32 - INFO - __main__ - Step 49978: {'lr': 0.0003811807387545727, 'samples': 9595776, 'steps': 49977, 'loss/train': 1.2342473268508911} -11/07/2021 04:16:32 - INFO - __main__ - Step 49979: {'lr': 0.0003811762212365267, 'samples': 9595968, 'steps': 49978, 'loss/train': 1.3623075485229492} -11/07/2021 04:16:33 - INFO - __main__ - Step 49980: {'lr': 0.0003811717036593748, 'samples': 9596160, 'steps': 49979, 'loss/train': 0.9780320525169373} -11/07/2021 04:16:34 - INFO - __main__ - Step 49981: {'lr': 0.00038116718602311896, 'samples': 9596352, 'steps': 49980, 'loss/train': 1.3779079914093018} -11/07/2021 04:16:34 - INFO - __main__ - Step 49982: {'lr': 0.00038116266832776113, 'samples': 9596544, 'steps': 49981, 'loss/train': 0.8242561221122742} -11/07/2021 04:16:34 - INFO - __main__ - Step 49983: {'lr': 0.0003811581505733035, 'samples': 9596736, 'steps': 49982, 'loss/train': 1.616904616355896} -11/07/2021 04:16:35 - INFO - __main__ - Step 49984: {'lr': 0.000381153632759748, 'samples': 9596928, 'steps': 49983, 'loss/train': 1.6792519092559814} -11/07/2021 04:16:36 - INFO - __main__ - Step 49985: {'lr': 0.0003811491148870967, 'samples': 9597120, 'steps': 49984, 'loss/train': 1.758325457572937} -11/07/2021 04:16:36 - INFO - __main__ - Step 49986: {'lr': 0.0003811445969553516, 'samples': 9597312, 'steps': 49985, 'loss/train': 1.5427839756011963} -11/07/2021 04:16:37 - INFO - __main__ - Step 49987: {'lr': 0.00038114007896451486, 'samples': 9597504, 'steps': 49986, 'loss/train': 1.2429639101028442} -11/07/2021 04:16:37 - INFO - __main__ - Step 49988: {'lr': 0.0003811355609145883, 'samples': 9597696, 'steps': 49987, 'loss/train': 1.6669725179672241} -11/07/2021 04:16:37 - INFO - __main__ - Step 49989: {'lr': 0.0003811310428055742, 'samples': 9597888, 'steps': 49988, 'loss/train': 2.0266692638397217} -11/07/2021 04:16:38 - INFO - __main__ - Step 49990: {'lr': 0.00038112652463747444, 'samples': 9598080, 'steps': 49989, 'loss/train': 1.3608561754226685} -11/07/2021 04:16:39 - INFO - __main__ - Step 49991: {'lr': 0.00038112200641029104, 'samples': 9598272, 'steps': 49990, 'loss/train': 1.6590118408203125} -11/07/2021 04:16:39 - INFO - __main__ - Step 49992: {'lr': 0.00038111748812402616, 'samples': 9598464, 'steps': 49991, 'loss/train': 0.44961920380592346} -11/07/2021 04:16:39 - INFO - __main__ - Step 49993: {'lr': 0.0003811129697786817, 'samples': 9598656, 'steps': 49992, 'loss/train': 1.4356154203414917} -11/07/2021 04:16:40 - INFO - __main__ - Step 49994: {'lr': 0.00038110845137425976, 'samples': 9598848, 'steps': 49993, 'loss/train': 1.4192280769348145} -11/07/2021 04:16:41 - INFO - __main__ - Step 49995: {'lr': 0.0003811039329107624, 'samples': 9599040, 'steps': 49994, 'loss/train': 0.9220527410507202} -11/07/2021 04:16:42 - INFO - __main__ - Step 49996: {'lr': 0.00038109941438819165, 'samples': 9599232, 'steps': 49995, 'loss/train': 5.768974304199219} -11/07/2021 04:16:42 - INFO - __main__ - Step 49997: {'lr': 0.00038109489580654955, 'samples': 9599424, 'steps': 49996, 'loss/train': 1.6446173191070557} -11/07/2021 04:16:42 - INFO - __main__ - Step 49998: {'lr': 0.00038109037716583806, 'samples': 9599616, 'steps': 49997, 'loss/train': 1.6709755659103394} -11/07/2021 04:16:43 - INFO - __main__ - Step 49999: {'lr': 0.0003810858584660593, 'samples': 9599808, 'steps': 49998, 'loss/train': 1.74168062210083} -11/07/2021 04:16:43 - INFO - __main__ - Step 50000: {'lr': 0.0003810813397072152, 'samples': 9600000, 'steps': 49999, 'loss/train': 1.699582576751709} -11/07/2021 04:16:43 - INFO - __main__ - Step 50001: {'lr': 0.00038107682088930797, 'samples': 9600192, 'steps': 50000, 'loss/train': 1.4355201721191406} -11/07/2021 04:16:44 - INFO - __main__ - Step 50002: {'lr': 0.00038107230201233944, 'samples': 9600384, 'steps': 50001, 'loss/train': 1.7963310480117798} -11/07/2021 04:16:45 - INFO - __main__ - Step 50003: {'lr': 0.00038106778307631187, 'samples': 9600576, 'steps': 50002, 'loss/train': 1.7608848810195923} -11/07/2021 04:16:45 - INFO - __main__ - Step 50004: {'lr': 0.0003810632640812271, 'samples': 9600768, 'steps': 50003, 'loss/train': 1.6591436862945557} -11/07/2021 04:16:45 - INFO - __main__ - Step 50005: {'lr': 0.00038105874502708726, 'samples': 9600960, 'steps': 50004, 'loss/train': 1.6088366508483887} -11/07/2021 04:16:46 - INFO - __main__ - Step 50006: {'lr': 0.0003810542259138944, 'samples': 9601152, 'steps': 50005, 'loss/train': 1.5151917934417725} -11/07/2021 04:16:47 - INFO - __main__ - Step 50007: {'lr': 0.0003810497067416505, 'samples': 9601344, 'steps': 50006, 'loss/train': 1.273219347000122} -11/07/2021 04:16:47 - INFO - __main__ - Step 50008: {'lr': 0.0003810451875103576, 'samples': 9601536, 'steps': 50007, 'loss/train': 1.481964349746704} -11/07/2021 04:16:47 - INFO - __main__ - Step 50009: {'lr': 0.0003810406682200178, 'samples': 9601728, 'steps': 50008, 'loss/train': 1.6708675622940063} -11/07/2021 04:16:48 - INFO - __main__ - Step 50010: {'lr': 0.0003810361488706331, 'samples': 9601920, 'steps': 50009, 'loss/train': 1.252386212348938} -11/07/2021 04:16:48 - INFO - __main__ - Step 50011: {'lr': 0.0003810316294622056, 'samples': 9602112, 'steps': 50010, 'loss/train': 1.366594672203064} -11/07/2021 04:16:49 - INFO - __main__ - Step 50012: {'lr': 0.0003810271099947371, 'samples': 9602304, 'steps': 50011, 'loss/train': 1.3563555479049683} -11/07/2021 04:16:50 - INFO - __main__ - Step 50013: {'lr': 0.00038102259046822993, 'samples': 9602496, 'steps': 50012, 'loss/train': 1.6523642539978027} -11/07/2021 04:16:50 - INFO - __main__ - Step 50014: {'lr': 0.00038101807088268595, 'samples': 9602688, 'steps': 50013, 'loss/train': 1.2176542282104492} -11/07/2021 04:16:50 - INFO - __main__ - Step 50015: {'lr': 0.00038101355123810733, 'samples': 9602880, 'steps': 50014, 'loss/train': 1.590633511543274} -11/07/2021 04:16:51 - INFO - __main__ - Step 50016: {'lr': 0.00038100903153449596, 'samples': 9603072, 'steps': 50015, 'loss/train': 1.1036028861999512} -11/07/2021 04:16:52 - INFO - __main__ - Step 50017: {'lr': 0.00038100451177185395, 'samples': 9603264, 'steps': 50016, 'loss/train': 1.8031105995178223} -11/07/2021 04:16:52 - INFO - __main__ - Step 50018: {'lr': 0.0003809999919501833, 'samples': 9603456, 'steps': 50017, 'loss/train': 1.193867564201355} -11/07/2021 04:16:52 - INFO - __main__ - Step 50019: {'lr': 0.00038099547206948617, 'samples': 9603648, 'steps': 50018, 'loss/train': 1.4448760747909546} -11/07/2021 04:16:53 - INFO - __main__ - Step 50020: {'lr': 0.0003809909521297644, 'samples': 9603840, 'steps': 50019, 'loss/train': 1.6645346879959106} -11/07/2021 04:16:53 - INFO - __main__ - Step 50021: {'lr': 0.00038098643213102014, 'samples': 9604032, 'steps': 50020, 'loss/train': 1.0006576776504517} -11/07/2021 04:16:54 - INFO - __main__ - Step 50022: {'lr': 0.0003809819120732554, 'samples': 9604224, 'steps': 50021, 'loss/train': 1.2743947505950928} -11/07/2021 04:16:55 - INFO - __main__ - Step 50023: {'lr': 0.00038097739195647233, 'samples': 9604416, 'steps': 50022, 'loss/train': 1.3045101165771484} -11/07/2021 04:16:55 - INFO - __main__ - Step 50024: {'lr': 0.0003809728717806728, 'samples': 9604608, 'steps': 50023, 'loss/train': 0.8881009221076965} -11/07/2021 04:16:55 - INFO - __main__ - Step 50025: {'lr': 0.00038096835154585897, 'samples': 9604800, 'steps': 50024, 'loss/train': 0.4098493754863739} -11/07/2021 04:16:56 - INFO - __main__ - Step 50026: {'lr': 0.0003809638312520327, 'samples': 9604992, 'steps': 50025, 'loss/train': 1.20095956325531} -11/07/2021 04:16:57 - INFO - __main__ - Step 50027: {'lr': 0.0003809593108991962, 'samples': 9605184, 'steps': 50026, 'loss/train': 1.4733937978744507} -11/07/2021 04:16:57 - INFO - __main__ - Step 50028: {'lr': 0.0003809547904873515, 'samples': 9605376, 'steps': 50027, 'loss/train': 1.335333228111267} -11/07/2021 04:16:58 - INFO - __main__ - Step 50029: {'lr': 0.0003809502700165006, 'samples': 9605568, 'steps': 50028, 'loss/train': 1.0062395334243774} -11/07/2021 04:16:58 - INFO - __main__ - Step 50030: {'lr': 0.00038094574948664554, 'samples': 9605760, 'steps': 50029, 'loss/train': 0.22823107242584229} -11/07/2021 04:16:59 - INFO - __main__ - Step 50031: {'lr': 0.00038094122889778824, 'samples': 9605952, 'steps': 50030, 'loss/train': 1.204109787940979} -11/07/2021 04:17:00 - INFO - __main__ - Step 50032: {'lr': 0.000380936708249931, 'samples': 9606144, 'steps': 50031, 'loss/train': 0.7152600884437561} -11/07/2021 04:17:00 - INFO - __main__ - Step 50033: {'lr': 0.0003809321875430756, 'samples': 9606336, 'steps': 50032, 'loss/train': 1.490403175354004} -11/07/2021 04:17:00 - INFO - __main__ - Step 50034: {'lr': 0.0003809276667772241, 'samples': 9606528, 'steps': 50033, 'loss/train': 1.2764545679092407} -11/07/2021 04:17:01 - INFO - __main__ - Step 50035: {'lr': 0.00038092314595237873, 'samples': 9606720, 'steps': 50034, 'loss/train': 1.7428356409072876} -11/07/2021 04:17:01 - INFO - __main__ - Step 50036: {'lr': 0.0003809186250685414, 'samples': 9606912, 'steps': 50035, 'loss/train': 1.3986958265304565} -11/07/2021 04:17:02 - INFO - __main__ - Step 50037: {'lr': 0.0003809141041257141, 'samples': 9607104, 'steps': 50036, 'loss/train': 1.1598021984100342} -11/07/2021 04:17:02 - INFO - __main__ - Step 50038: {'lr': 0.000380909583123899, 'samples': 9607296, 'steps': 50037, 'loss/train': 1.2968944311141968} -11/07/2021 04:17:03 - INFO - __main__ - Step 50039: {'lr': 0.00038090506206309805, 'samples': 9607488, 'steps': 50038, 'loss/train': 1.6650761365890503} -11/07/2021 04:17:03 - INFO - __main__ - Step 50040: {'lr': 0.00038090054094331324, 'samples': 9607680, 'steps': 50039, 'loss/train': 1.1097683906555176} -11/07/2021 04:17:03 - INFO - __main__ - Step 50041: {'lr': 0.0003808960197645467, 'samples': 9607872, 'steps': 50040, 'loss/train': 1.4362438917160034} -11/07/2021 04:17:05 - INFO - __main__ - Step 50042: {'lr': 0.00038089149852680036, 'samples': 9608064, 'steps': 50041, 'loss/train': 1.7006573677062988} -11/07/2021 04:17:05 - INFO - __main__ - Step 50043: {'lr': 0.00038088697723007647, 'samples': 9608256, 'steps': 50042, 'loss/train': 1.070981740951538} -11/07/2021 04:17:05 - INFO - __main__ - Step 50044: {'lr': 0.00038088245587437685, 'samples': 9608448, 'steps': 50043, 'loss/train': 1.192070722579956} -11/07/2021 04:17:06 - INFO - __main__ - Step 50045: {'lr': 0.00038087793445970363, 'samples': 9608640, 'steps': 50044, 'loss/train': 1.2683120965957642} -11/07/2021 04:17:06 - INFO - __main__ - Step 50046: {'lr': 0.0003808734129860588, 'samples': 9608832, 'steps': 50045, 'loss/train': 1.0339076519012451} -11/07/2021 04:17:06 - INFO - __main__ - Step 50047: {'lr': 0.0003808688914534445, 'samples': 9609024, 'steps': 50046, 'loss/train': 1.137500286102295} -11/07/2021 04:17:07 - INFO - __main__ - Step 50048: {'lr': 0.00038086436986186267, 'samples': 9609216, 'steps': 50047, 'loss/train': 1.3772196769714355} -11/07/2021 04:17:08 - INFO - __main__ - Step 50049: {'lr': 0.00038085984821131536, 'samples': 9609408, 'steps': 50048, 'loss/train': 1.4623816013336182} -11/07/2021 04:17:08 - INFO - __main__ - Step 50050: {'lr': 0.00038085532650180464, 'samples': 9609600, 'steps': 50049, 'loss/train': 0.5126489996910095} -11/07/2021 04:17:09 - INFO - __main__ - Step 50051: {'lr': 0.0003808508047333325, 'samples': 9609792, 'steps': 50050, 'loss/train': 0.09533369541168213} -11/07/2021 04:17:09 - INFO - __main__ - Step 50052: {'lr': 0.000380846282905901, 'samples': 9609984, 'steps': 50051, 'loss/train': 1.4151746034622192} -11/07/2021 04:17:10 - INFO - __main__ - Step 50053: {'lr': 0.0003808417610195122, 'samples': 9610176, 'steps': 50052, 'loss/train': 1.6462810039520264} -11/07/2021 04:17:10 - INFO - __main__ - Step 50054: {'lr': 0.0003808372390741681, 'samples': 9610368, 'steps': 50053, 'loss/train': 1.304959774017334} -11/07/2021 04:17:11 - INFO - __main__ - Step 50055: {'lr': 0.0003808327170698708, 'samples': 9610560, 'steps': 50054, 'loss/train': 1.4613430500030518} -11/07/2021 04:17:11 - INFO - __main__ - Step 50056: {'lr': 0.0003808281950066223, 'samples': 9610752, 'steps': 50055, 'loss/train': 1.3599810600280762} -11/07/2021 04:17:11 - INFO - __main__ - Step 50057: {'lr': 0.0003808236728844246, 'samples': 9610944, 'steps': 50056, 'loss/train': 0.9918197989463806} -11/07/2021 04:17:12 - INFO - __main__ - Step 50058: {'lr': 0.0003808191507032798, 'samples': 9611136, 'steps': 50057, 'loss/train': 1.5752508640289307} -11/07/2021 04:17:13 - INFO - __main__ - Step 50059: {'lr': 0.00038081462846318984, 'samples': 9611328, 'steps': 50058, 'loss/train': 1.5404647588729858} -11/07/2021 04:17:13 - INFO - __main__ - Step 50060: {'lr': 0.000380810106164157, 'samples': 9611520, 'steps': 50059, 'loss/train': 1.406663179397583} -11/07/2021 04:17:13 - INFO - __main__ - Step 50061: {'lr': 0.000380805583806183, 'samples': 9611712, 'steps': 50060, 'loss/train': 1.639754056930542} -11/07/2021 04:17:14 - INFO - __main__ - Step 50062: {'lr': 0.00038080106138927, 'samples': 9611904, 'steps': 50061, 'loss/train': 1.8533631563186646} -11/07/2021 04:17:15 - INFO - __main__ - Step 50063: {'lr': 0.00038079653891342016, 'samples': 9612096, 'steps': 50062, 'loss/train': 1.365235686302185} -11/07/2021 04:17:15 - INFO - __main__ - Step 50064: {'lr': 0.0003807920163786353, 'samples': 9612288, 'steps': 50063, 'loss/train': 1.032162070274353} -11/07/2021 04:17:15 - INFO - __main__ - Step 50065: {'lr': 0.00038078749378491763, 'samples': 9612480, 'steps': 50064, 'loss/train': 1.5522141456604004} -11/07/2021 04:17:16 - INFO - __main__ - Step 50066: {'lr': 0.00038078297113226925, 'samples': 9612672, 'steps': 50065, 'loss/train': 0.29551154375076294} -11/07/2021 04:17:16 - INFO - __main__ - Step 50067: {'lr': 0.00038077844842069193, 'samples': 9612864, 'steps': 50066, 'loss/train': 1.5626736879348755} -11/07/2021 04:17:17 - INFO - __main__ - Step 50068: {'lr': 0.00038077392565018784, 'samples': 9613056, 'steps': 50067, 'loss/train': 1.2820627689361572} -11/07/2021 04:17:18 - INFO - __main__ - Step 50069: {'lr': 0.0003807694028207591, 'samples': 9613248, 'steps': 50068, 'loss/train': 1.2960739135742188} -11/07/2021 04:17:18 - INFO - __main__ - Step 50070: {'lr': 0.0003807648799324077, 'samples': 9613440, 'steps': 50069, 'loss/train': 1.5695760250091553} -11/07/2021 04:17:18 - INFO - __main__ - Step 50071: {'lr': 0.0003807603569851357, 'samples': 9613632, 'steps': 50070, 'loss/train': 1.5570412874221802} -11/07/2021 04:17:19 - INFO - __main__ - Step 50072: {'lr': 0.0003807558339789451, 'samples': 9613824, 'steps': 50071, 'loss/train': 1.4880906343460083} -11/07/2021 04:17:20 - INFO - __main__ - Step 50073: {'lr': 0.00038075131091383783, 'samples': 9614016, 'steps': 50072, 'loss/train': 1.4011688232421875} -11/07/2021 04:17:20 - INFO - __main__ - Step 50074: {'lr': 0.0003807467877898161, 'samples': 9614208, 'steps': 50073, 'loss/train': 1.616499662399292} -11/07/2021 04:17:20 - INFO - __main__ - Step 50075: {'lr': 0.00038074226460688186, 'samples': 9614400, 'steps': 50074, 'loss/train': 1.4088376760482788} -11/07/2021 04:17:21 - INFO - __main__ - Step 50076: {'lr': 0.0003807377413650372, 'samples': 9614592, 'steps': 50075, 'loss/train': 1.7282475233078003} -11/07/2021 04:17:21 - INFO - __main__ - Step 50077: {'lr': 0.0003807332180642842, 'samples': 9614784, 'steps': 50076, 'loss/train': 1.5338096618652344} -11/07/2021 04:17:22 - INFO - __main__ - Step 50078: {'lr': 0.00038072869470462465, 'samples': 9614976, 'steps': 50077, 'loss/train': 1.6608787775039673} -11/07/2021 04:17:23 - INFO - __main__ - Step 50079: {'lr': 0.00038072417128606095, 'samples': 9615168, 'steps': 50078, 'loss/train': 0.6714621186256409} -11/07/2021 04:17:23 - INFO - __main__ - Step 50080: {'lr': 0.00038071964780859486, 'samples': 9615360, 'steps': 50079, 'loss/train': 1.2888237237930298} -11/07/2021 04:17:23 - INFO - __main__ - Step 50081: {'lr': 0.0003807151242722285, 'samples': 9615552, 'steps': 50080, 'loss/train': 1.4392421245574951} -11/07/2021 04:17:24 - INFO - __main__ - Step 50082: {'lr': 0.00038071060067696393, 'samples': 9615744, 'steps': 50081, 'loss/train': 1.5196335315704346} -11/07/2021 04:17:25 - INFO - __main__ - Step 50083: {'lr': 0.00038070607702280325, 'samples': 9615936, 'steps': 50082, 'loss/train': 1.734366774559021} -11/07/2021 04:17:25 - INFO - __main__ - Step 50084: {'lr': 0.00038070155330974844, 'samples': 9616128, 'steps': 50083, 'loss/train': 1.2994858026504517} -11/07/2021 04:17:25 - INFO - __main__ - Step 50085: {'lr': 0.0003806970295378014, 'samples': 9616320, 'steps': 50084, 'loss/train': 1.5340774059295654} -11/07/2021 04:17:26 - INFO - __main__ - Step 50086: {'lr': 0.00038069250570696433, 'samples': 9616512, 'steps': 50085, 'loss/train': 1.9248086214065552} -11/07/2021 04:17:26 - INFO - __main__ - Step 50087: {'lr': 0.00038068798181723927, 'samples': 9616704, 'steps': 50086, 'loss/train': 1.6424987316131592} -11/07/2021 04:17:27 - INFO - __main__ - Step 50088: {'lr': 0.00038068345786862825, 'samples': 9616896, 'steps': 50087, 'loss/train': 0.971694827079773} -11/07/2021 04:17:28 - INFO - __main__ - Step 50089: {'lr': 0.0003806789338611333, 'samples': 9617088, 'steps': 50088, 'loss/train': 0.5746945142745972} -11/07/2021 04:17:28 - INFO - __main__ - Step 50090: {'lr': 0.00038067440979475635, 'samples': 9617280, 'steps': 50089, 'loss/train': 1.6796151399612427} -11/07/2021 04:17:28 - INFO - __main__ - Step 50091: {'lr': 0.0003806698856694996, 'samples': 9617472, 'steps': 50090, 'loss/train': 1.5130348205566406} -11/07/2021 04:17:29 - INFO - __main__ - Step 50092: {'lr': 0.00038066536148536495, 'samples': 9617664, 'steps': 50091, 'loss/train': 1.341958999633789} -11/07/2021 04:17:30 - INFO - __main__ - Step 50093: {'lr': 0.00038066083724235455, 'samples': 9617856, 'steps': 50092, 'loss/train': 1.1158323287963867} -11/07/2021 04:17:30 - INFO - __main__ - Step 50094: {'lr': 0.00038065631294047035, 'samples': 9618048, 'steps': 50093, 'loss/train': 1.3453494310379028} -11/07/2021 04:17:30 - INFO - __main__ - Step 50095: {'lr': 0.0003806517885797145, 'samples': 9618240, 'steps': 50094, 'loss/train': 1.2856875658035278} -11/07/2021 04:17:31 - INFO - __main__ - Step 50096: {'lr': 0.0003806472641600889, 'samples': 9618432, 'steps': 50095, 'loss/train': 1.086360216140747} -11/07/2021 04:17:31 - INFO - __main__ - Step 50097: {'lr': 0.00038064273968159575, 'samples': 9618624, 'steps': 50096, 'loss/train': 1.6092201471328735} -11/07/2021 04:17:33 - INFO - __main__ - Step 50098: {'lr': 0.00038063821514423694, 'samples': 9618816, 'steps': 50097, 'loss/train': 1.7410180568695068} -11/07/2021 04:17:33 - INFO - __main__ - Step 50099: {'lr': 0.00038063369054801456, 'samples': 9619008, 'steps': 50098, 'loss/train': 1.2810670137405396} -11/07/2021 04:17:33 - INFO - __main__ - Step 50100: {'lr': 0.00038062916589293064, 'samples': 9619200, 'steps': 50099, 'loss/train': 0.9716135859489441} -11/07/2021 04:17:34 - INFO - __main__ - Step 50101: {'lr': 0.0003806246411789872, 'samples': 9619392, 'steps': 50100, 'loss/train': 1.5850729942321777} -11/07/2021 04:17:34 - INFO - __main__ - Step 50102: {'lr': 0.00038062011640618636, 'samples': 9619584, 'steps': 50101, 'loss/train': 1.6093177795410156} -11/07/2021 04:17:35 - INFO - __main__ - Step 50103: {'lr': 0.00038061559157453014, 'samples': 9619776, 'steps': 50102, 'loss/train': 0.5811560153961182} -11/07/2021 04:17:35 - INFO - __main__ - Step 50104: {'lr': 0.00038061106668402055, 'samples': 9619968, 'steps': 50103, 'loss/train': 1.1450581550598145} -11/07/2021 04:17:36 - INFO - __main__ - Step 50105: {'lr': 0.0003806065417346596, 'samples': 9620160, 'steps': 50104, 'loss/train': 1.740180253982544} -11/07/2021 04:17:36 - INFO - __main__ - Step 50106: {'lr': 0.00038060201672644934, 'samples': 9620352, 'steps': 50105, 'loss/train': 1.3290950059890747} -11/07/2021 04:17:36 - INFO - __main__ - Step 50107: {'lr': 0.00038059749165939184, 'samples': 9620544, 'steps': 50106, 'loss/train': 1.5256736278533936} -11/07/2021 04:17:37 - INFO - __main__ - Step 50108: {'lr': 0.00038059296653348917, 'samples': 9620736, 'steps': 50107, 'loss/train': 1.0681893825531006} -11/07/2021 04:17:38 - INFO - __main__ - Step 50109: {'lr': 0.00038058844134874326, 'samples': 9620928, 'steps': 50108, 'loss/train': 1.5296568870544434} -11/07/2021 04:17:38 - INFO - __main__ - Step 50110: {'lr': 0.0003805839161051563, 'samples': 9621120, 'steps': 50109, 'loss/train': 1.5743610858917236} -11/07/2021 04:17:38 - INFO - __main__ - Step 50111: {'lr': 0.00038057939080273016, 'samples': 9621312, 'steps': 50110, 'loss/train': 1.1973341703414917} -11/07/2021 04:17:39 - INFO - __main__ - Step 50112: {'lr': 0.00038057486544146703, 'samples': 9621504, 'steps': 50111, 'loss/train': 1.5013760328292847} -11/07/2021 04:17:40 - INFO - __main__ - Step 50113: {'lr': 0.0003805703400213688, 'samples': 9621696, 'steps': 50112, 'loss/train': 1.4528602361679077} -11/07/2021 04:17:40 - INFO - __main__ - Step 50114: {'lr': 0.0003805658145424376, 'samples': 9621888, 'steps': 50113, 'loss/train': 1.760488748550415} -11/07/2021 04:17:40 - INFO - __main__ - Step 50115: {'lr': 0.00038056128900467546, 'samples': 9622080, 'steps': 50114, 'loss/train': 1.398864984512329} -11/07/2021 04:17:41 - INFO - __main__ - Step 50116: {'lr': 0.00038055676340808446, 'samples': 9622272, 'steps': 50115, 'loss/train': 1.3213566541671753} -11/07/2021 04:17:41 - INFO - __main__ - Step 50117: {'lr': 0.00038055223775266666, 'samples': 9622464, 'steps': 50116, 'loss/train': 1.8905999660491943} -11/07/2021 04:17:42 - INFO - __main__ - Step 50118: {'lr': 0.0003805477120384239, 'samples': 9622656, 'steps': 50117, 'loss/train': 1.3616106510162354} -11/07/2021 04:17:43 - INFO - __main__ - Step 50119: {'lr': 0.00038054318626535845, 'samples': 9622848, 'steps': 50118, 'loss/train': 1.5988349914550781} -11/07/2021 04:17:43 - INFO - __main__ - Step 50120: {'lr': 0.00038053866043347216, 'samples': 9623040, 'steps': 50119, 'loss/train': 1.7721415758132935} -11/07/2021 04:17:43 - INFO - __main__ - Step 50121: {'lr': 0.00038053413454276725, 'samples': 9623232, 'steps': 50120, 'loss/train': 1.3219261169433594} -11/07/2021 04:17:44 - INFO - __main__ - Step 50122: {'lr': 0.00038052960859324557, 'samples': 9623424, 'steps': 50121, 'loss/train': 1.76235830783844} -11/07/2021 04:17:44 - INFO - __main__ - Step 50123: {'lr': 0.0003805250825849094, 'samples': 9623616, 'steps': 50122, 'loss/train': 1.686732530593872} -11/07/2021 04:17:45 - INFO - __main__ - Step 50124: {'lr': 0.0003805205565177606, 'samples': 9623808, 'steps': 50123, 'loss/train': 1.3251734972000122} -11/07/2021 04:17:45 - INFO - __main__ - Step 50125: {'lr': 0.0003805160303918013, 'samples': 9624000, 'steps': 50124, 'loss/train': 1.3244572877883911} -11/07/2021 04:17:46 - INFO - __main__ - Step 50126: {'lr': 0.0003805115042070333, 'samples': 9624192, 'steps': 50125, 'loss/train': 1.2289057970046997} -11/07/2021 04:17:46 - INFO - __main__ - Step 50127: {'lr': 0.000380506977963459, 'samples': 9624384, 'steps': 50126, 'loss/train': 1.5427542924880981} -11/07/2021 04:17:46 - INFO - __main__ - Step 50128: {'lr': 0.00038050245166108024, 'samples': 9624576, 'steps': 50127, 'loss/train': 1.2708112001419067} -11/07/2021 04:17:47 - INFO - __main__ - Step 50129: {'lr': 0.000380497925299899, 'samples': 9624768, 'steps': 50128, 'loss/train': 1.509828805923462} -11/07/2021 04:17:48 - INFO - __main__ - Step 50130: {'lr': 0.0003804933988799175, 'samples': 9624960, 'steps': 50129, 'loss/train': 1.2576930522918701} -11/07/2021 04:17:48 - INFO - __main__ - Step 50131: {'lr': 0.0003804888724011377, 'samples': 9625152, 'steps': 50130, 'loss/train': 1.5663971900939941} -11/07/2021 04:17:48 - INFO - __main__ - Step 50132: {'lr': 0.00038048434586356164, 'samples': 9625344, 'steps': 50131, 'loss/train': 1.1456104516983032} -11/07/2021 04:17:49 - INFO - __main__ - Step 50133: {'lr': 0.0003804798192671912, 'samples': 9625536, 'steps': 50132, 'loss/train': 1.7524334192276} -11/07/2021 04:17:50 - INFO - __main__ - Step 50134: {'lr': 0.00038047529261202876, 'samples': 9625728, 'steps': 50133, 'loss/train': 1.5693469047546387} -11/07/2021 04:17:50 - INFO - __main__ - Step 50135: {'lr': 0.0003804707658980761, 'samples': 9625920, 'steps': 50134, 'loss/train': 1.1924694776535034} -11/07/2021 04:17:51 - INFO - __main__ - Step 50136: {'lr': 0.0003804662391253352, 'samples': 9626112, 'steps': 50135, 'loss/train': 1.474402666091919} -11/07/2021 04:17:51 - INFO - __main__ - Step 50137: {'lr': 0.00038046171229380837, 'samples': 9626304, 'steps': 50136, 'loss/train': 1.3929524421691895} -11/07/2021 04:17:51 - INFO - __main__ - Step 50138: {'lr': 0.0003804571854034975, 'samples': 9626496, 'steps': 50137, 'loss/train': 0.9163033366203308} -11/07/2021 04:17:52 - INFO - __main__ - Step 50139: {'lr': 0.0003804526584544046, 'samples': 9626688, 'steps': 50138, 'loss/train': 1.1019681692123413} -11/07/2021 04:17:53 - INFO - __main__ - Step 50140: {'lr': 0.0003804481314465317, 'samples': 9626880, 'steps': 50139, 'loss/train': 1.2081000804901123} -11/07/2021 04:17:53 - INFO - __main__ - Step 50141: {'lr': 0.0003804436043798809, 'samples': 9627072, 'steps': 50140, 'loss/train': 1.5302804708480835} -11/07/2021 04:17:53 - INFO - __main__ - Step 50142: {'lr': 0.00038043907725445424, 'samples': 9627264, 'steps': 50141, 'loss/train': 1.393977403640747} -11/07/2021 04:17:54 - INFO - __main__ - Step 50143: {'lr': 0.00038043455007025375, 'samples': 9627456, 'steps': 50142, 'loss/train': 1.6601444482803345} -11/07/2021 04:17:55 - INFO - __main__ - Step 50144: {'lr': 0.00038043002282728153, 'samples': 9627648, 'steps': 50143, 'loss/train': 1.873679757118225} -11/07/2021 04:17:55 - INFO - __main__ - Step 50145: {'lr': 0.00038042549552553954, 'samples': 9627840, 'steps': 50144, 'loss/train': 1.777874231338501} -11/07/2021 04:17:56 - INFO - __main__ - Step 50146: {'lr': 0.00038042096816502967, 'samples': 9628032, 'steps': 50145, 'loss/train': 1.4701316356658936} -11/07/2021 04:17:56 - INFO - __main__ - Step 50147: {'lr': 0.0003804164407457543, 'samples': 9628224, 'steps': 50146, 'loss/train': 1.5121428966522217} -11/07/2021 04:17:56 - INFO - __main__ - Step 50148: {'lr': 0.0003804119132677152, 'samples': 9628416, 'steps': 50147, 'loss/train': 1.4496904611587524} -11/07/2021 04:17:57 - INFO - __main__ - Step 50149: {'lr': 0.0003804073857309145, 'samples': 9628608, 'steps': 50148, 'loss/train': 2.126142740249634} -11/07/2021 04:17:58 - INFO - __main__ - Step 50150: {'lr': 0.00038040285813535434, 'samples': 9628800, 'steps': 50149, 'loss/train': 1.5035032033920288} -11/07/2021 04:17:58 - INFO - __main__ - Step 50151: {'lr': 0.0003803983304810367, 'samples': 9628992, 'steps': 50150, 'loss/train': 0.773347795009613} -11/07/2021 04:17:58 - INFO - __main__ - Step 50152: {'lr': 0.0003803938027679634, 'samples': 9629184, 'steps': 50151, 'loss/train': 0.7962072491645813} -11/07/2021 04:17:59 - INFO - __main__ - Step 50153: {'lr': 0.0003803892749961368, 'samples': 9629376, 'steps': 50152, 'loss/train': 1.6893115043640137} -11/07/2021 04:18:00 - INFO - __main__ - Step 50154: {'lr': 0.0003803847471655587, 'samples': 9629568, 'steps': 50153, 'loss/train': 1.2985191345214844} -11/07/2021 04:18:00 - INFO - __main__ - Step 50155: {'lr': 0.00038038021927623133, 'samples': 9629760, 'steps': 50154, 'loss/train': 2.1850473880767822} -11/07/2021 04:18:00 - INFO - __main__ - Step 50156: {'lr': 0.00038037569132815663, 'samples': 9629952, 'steps': 50155, 'loss/train': 1.6614058017730713} -11/07/2021 04:18:01 - INFO - __main__ - Step 50157: {'lr': 0.0003803711633213367, 'samples': 9630144, 'steps': 50156, 'loss/train': 0.8183517456054688} -11/07/2021 04:18:01 - INFO - __main__ - Step 50158: {'lr': 0.0003803666352557735, 'samples': 9630336, 'steps': 50157, 'loss/train': 1.7416718006134033} -11/07/2021 04:18:02 - INFO - __main__ - Step 50159: {'lr': 0.0003803621071314691, 'samples': 9630528, 'steps': 50158, 'loss/train': 1.6603349447250366} -11/07/2021 04:18:03 - INFO - __main__ - Step 50160: {'lr': 0.0003803575789484255, 'samples': 9630720, 'steps': 50159, 'loss/train': 1.5331896543502808} -11/07/2021 04:18:03 - INFO - __main__ - Step 50161: {'lr': 0.0003803530507066448, 'samples': 9630912, 'steps': 50160, 'loss/train': 1.3435156345367432} -11/07/2021 04:18:03 - INFO - __main__ - Step 50162: {'lr': 0.00038034852240612907, 'samples': 9631104, 'steps': 50161, 'loss/train': 1.4418418407440186} -11/07/2021 04:18:04 - INFO - __main__ - Step 50163: {'lr': 0.00038034399404688024, 'samples': 9631296, 'steps': 50162, 'loss/train': 0.3798968195915222} -11/07/2021 04:18:04 - INFO - __main__ - Step 50164: {'lr': 0.00038033946562890055, 'samples': 9631488, 'steps': 50163, 'loss/train': 0.9605880975723267} -11/07/2021 04:18:05 - INFO - __main__ - Step 50165: {'lr': 0.0003803349371521918, 'samples': 9631680, 'steps': 50164, 'loss/train': 1.5995622873306274} -11/07/2021 04:18:06 - INFO - __main__ - Step 50166: {'lr': 0.00038033040861675617, 'samples': 9631872, 'steps': 50165, 'loss/train': 1.0809211730957031} -11/07/2021 04:18:06 - INFO - __main__ - Step 50167: {'lr': 0.0003803258800225956, 'samples': 9632064, 'steps': 50166, 'loss/train': 0.08810996264219284} -11/07/2021 04:18:06 - INFO - __main__ - Step 50168: {'lr': 0.0003803213513697123, 'samples': 9632256, 'steps': 50167, 'loss/train': 1.607441782951355} -11/07/2021 04:18:07 - INFO - __main__ - Step 50169: {'lr': 0.0003803168226581082, 'samples': 9632448, 'steps': 50168, 'loss/train': 1.309495210647583} -11/07/2021 04:18:08 - INFO - __main__ - Step 50170: {'lr': 0.00038031229388778526, 'samples': 9632640, 'steps': 50169, 'loss/train': 1.2352304458618164} -11/07/2021 04:18:08 - INFO - __main__ - Step 50171: {'lr': 0.00038030776505874577, 'samples': 9632832, 'steps': 50170, 'loss/train': 1.6889320611953735} -11/07/2021 04:18:09 - INFO - __main__ - Step 50172: {'lr': 0.0003803032361709915, 'samples': 9633024, 'steps': 50171, 'loss/train': 1.7311201095581055} -11/07/2021 04:18:09 - INFO - __main__ - Step 50173: {'lr': 0.00038029870722452455, 'samples': 9633216, 'steps': 50172, 'loss/train': 1.1639690399169922} -11/07/2021 04:18:09 - INFO - __main__ - Step 50174: {'lr': 0.0003802941782193471, 'samples': 9633408, 'steps': 50173, 'loss/train': 0.15695008635520935} -11/07/2021 04:18:10 - INFO - __main__ - Step 50175: {'lr': 0.00038028964915546107, 'samples': 9633600, 'steps': 50174, 'loss/train': 1.5289998054504395} -11/07/2021 04:18:11 - INFO - __main__ - Step 50176: {'lr': 0.00038028512003286853, 'samples': 9633792, 'steps': 50175, 'loss/train': 1.2912172079086304} -11/07/2021 04:18:11 - INFO - __main__ - Step 50177: {'lr': 0.00038028059085157165, 'samples': 9633984, 'steps': 50176, 'loss/train': 1.3492580652236938} -11/07/2021 04:18:11 - INFO - __main__ - Step 50178: {'lr': 0.0003802760616115722, 'samples': 9634176, 'steps': 50177, 'loss/train': 1.8885968923568726} -11/07/2021 04:18:12 - INFO - __main__ - Step 50179: {'lr': 0.0003802715323128724, 'samples': 9634368, 'steps': 50178, 'loss/train': 1.1622658967971802} -11/07/2021 04:18:13 - INFO - __main__ - Step 50180: {'lr': 0.00038026700295547424, 'samples': 9634560, 'steps': 50179, 'loss/train': 1.4751503467559814} -11/07/2021 04:18:13 - INFO - __main__ - Step 50181: {'lr': 0.0003802624735393798, 'samples': 9634752, 'steps': 50180, 'loss/train': 1.3558752536773682} -11/07/2021 04:18:14 - INFO - __main__ - Step 50182: {'lr': 0.00038025794406459115, 'samples': 9634944, 'steps': 50181, 'loss/train': 1.3577591180801392} -11/07/2021 04:18:14 - INFO - __main__ - Step 50183: {'lr': 0.00038025341453111017, 'samples': 9635136, 'steps': 50182, 'loss/train': 1.314875841140747} -11/07/2021 04:18:14 - INFO - __main__ - Step 50184: {'lr': 0.0003802488849389391, 'samples': 9635328, 'steps': 50183, 'loss/train': 0.12867824733257294} -11/07/2021 04:18:15 - INFO - __main__ - Step 50185: {'lr': 0.0003802443552880799, 'samples': 9635520, 'steps': 50184, 'loss/train': 1.5836074352264404} -11/07/2021 04:18:16 - INFO - __main__ - Step 50186: {'lr': 0.00038023982557853456, 'samples': 9635712, 'steps': 50185, 'loss/train': 1.537987470626831} -11/07/2021 04:18:16 - INFO - __main__ - Step 50187: {'lr': 0.00038023529581030516, 'samples': 9635904, 'steps': 50186, 'loss/train': 1.3645615577697754} -11/07/2021 04:18:16 - INFO - __main__ - Step 50188: {'lr': 0.00038023076598339375, 'samples': 9636096, 'steps': 50187, 'loss/train': 1.2964589595794678} -11/07/2021 04:18:17 - INFO - __main__ - Step 50189: {'lr': 0.0003802262360978024, 'samples': 9636288, 'steps': 50188, 'loss/train': 4.468301296234131} -11/07/2021 04:18:18 - INFO - __main__ - Step 50190: {'lr': 0.00038022170615353314, 'samples': 9636480, 'steps': 50189, 'loss/train': 0.9755254983901978} -11/07/2021 04:18:18 - INFO - __main__ - Step 50191: {'lr': 0.00038021717615058795, 'samples': 9636672, 'steps': 50190, 'loss/train': 1.2911059856414795} -11/07/2021 04:18:18 - INFO - __main__ - Step 50192: {'lr': 0.00038021264608896884, 'samples': 9636864, 'steps': 50191, 'loss/train': 1.4070249795913696} -11/07/2021 04:18:19 - INFO - __main__ - Step 50193: {'lr': 0.000380208115968678, 'samples': 9637056, 'steps': 50192, 'loss/train': 1.7199753522872925} -11/07/2021 04:18:19 - INFO - __main__ - Step 50194: {'lr': 0.00038020358578971737, 'samples': 9637248, 'steps': 50193, 'loss/train': 0.8250120878219604} -11/07/2021 04:18:19 - INFO - __main__ - Step 50195: {'lr': 0.000380199055552089, 'samples': 9637440, 'steps': 50194, 'loss/train': 1.2280455827713013} -11/07/2021 04:18:21 - INFO - __main__ - Step 50196: {'lr': 0.000380194525255795, 'samples': 9637632, 'steps': 50195, 'loss/train': 0.7293029427528381} -11/07/2021 04:18:21 - INFO - __main__ - Step 50197: {'lr': 0.0003801899949008373, 'samples': 9637824, 'steps': 50196, 'loss/train': 1.4373277425765991} -11/07/2021 04:18:21 - INFO - __main__ - Step 50198: {'lr': 0.000380185464487218, 'samples': 9638016, 'steps': 50197, 'loss/train': 1.2845509052276611} -11/07/2021 04:18:22 - INFO - __main__ - Step 50199: {'lr': 0.00038018093401493916, 'samples': 9638208, 'steps': 50198, 'loss/train': 1.3581730127334595} -11/07/2021 04:18:22 - INFO - __main__ - Step 50200: {'lr': 0.00038017640348400286, 'samples': 9638400, 'steps': 50199, 'loss/train': 1.4440293312072754} -11/07/2021 04:18:23 - INFO - __main__ - Step 50201: {'lr': 0.000380171872894411, 'samples': 9638592, 'steps': 50200, 'loss/train': 1.8245569467544556} -11/07/2021 04:18:24 - INFO - __main__ - Step 50202: {'lr': 0.00038016734224616565, 'samples': 9638784, 'steps': 50201, 'loss/train': 1.4053648710250854} -11/07/2021 04:18:24 - INFO - __main__ - Step 50203: {'lr': 0.000380162811539269, 'samples': 9638976, 'steps': 50202, 'loss/train': 1.519346833229065} -11/07/2021 04:18:24 - INFO - __main__ - Step 50204: {'lr': 0.0003801582807737229, 'samples': 9639168, 'steps': 50203, 'loss/train': 0.9944263100624084} -11/07/2021 04:18:25 - INFO - __main__ - Step 50205: {'lr': 0.00038015374994952966, 'samples': 9639360, 'steps': 50204, 'loss/train': 1.582240343093872} -11/07/2021 04:18:25 - INFO - __main__ - Step 50206: {'lr': 0.0003801492190666911, 'samples': 9639552, 'steps': 50205, 'loss/train': 1.3527615070343018} -11/07/2021 04:18:26 - INFO - __main__ - Step 50207: {'lr': 0.00038014468812520917, 'samples': 9639744, 'steps': 50206, 'loss/train': 1.7546110153198242} -11/07/2021 04:18:26 - INFO - __main__ - Step 50208: {'lr': 0.00038014015712508617, 'samples': 9639936, 'steps': 50207, 'loss/train': 1.6559122800827026} -11/07/2021 04:18:27 - INFO - __main__ - Step 50209: {'lr': 0.000380135626066324, 'samples': 9640128, 'steps': 50208, 'loss/train': 1.6707357168197632} -11/07/2021 04:18:27 - INFO - __main__ - Step 50210: {'lr': 0.00038013109494892467, 'samples': 9640320, 'steps': 50209, 'loss/train': 1.460334062576294} -11/07/2021 04:18:27 - INFO - __main__ - Step 50211: {'lr': 0.00038012656377289035, 'samples': 9640512, 'steps': 50210, 'loss/train': 1.4711841344833374} -11/07/2021 04:18:29 - INFO - __main__ - Step 50212: {'lr': 0.000380122032538223, 'samples': 9640704, 'steps': 50211, 'loss/train': 1.8600960969924927} -11/07/2021 04:18:29 - INFO - __main__ - Step 50213: {'lr': 0.0003801175012449246, 'samples': 9640896, 'steps': 50212, 'loss/train': 1.8999093770980835} -11/07/2021 04:18:29 - INFO - __main__ - Step 50214: {'lr': 0.0003801129698929974, 'samples': 9641088, 'steps': 50213, 'loss/train': 1.8671318292617798} -11/07/2021 04:18:30 - INFO - __main__ - Step 50215: {'lr': 0.00038010843848244316, 'samples': 9641280, 'steps': 50214, 'loss/train': 1.1005767583847046} -11/07/2021 04:18:30 - INFO - __main__ - Step 50216: {'lr': 0.00038010390701326415, 'samples': 9641472, 'steps': 50215, 'loss/train': 1.3407621383666992} -11/07/2021 04:18:31 - INFO - __main__ - Step 50217: {'lr': 0.00038009937548546223, 'samples': 9641664, 'steps': 50216, 'loss/train': 1.4449464082717896} -11/07/2021 04:18:31 - INFO - __main__ - Step 50218: {'lr': 0.0003800948438990397, 'samples': 9641856, 'steps': 50217, 'loss/train': 0.5882311463356018} -11/07/2021 04:18:32 - INFO - __main__ - Step 50219: {'lr': 0.0003800903122539983, 'samples': 9642048, 'steps': 50218, 'loss/train': 1.342165470123291} -11/07/2021 04:18:32 - INFO - __main__ - Step 50220: {'lr': 0.00038008578055034024, 'samples': 9642240, 'steps': 50219, 'loss/train': 1.6090655326843262} -11/07/2021 04:18:32 - INFO - __main__ - Step 50221: {'lr': 0.0003800812487880676, 'samples': 9642432, 'steps': 50220, 'loss/train': 2.008596658706665} -11/07/2021 04:18:33 - INFO - __main__ - Step 50222: {'lr': 0.00038007671696718226, 'samples': 9642624, 'steps': 50221, 'loss/train': 1.2963448762893677} -11/07/2021 04:18:34 - INFO - __main__ - Step 50223: {'lr': 0.0003800721850876864, 'samples': 9642816, 'steps': 50222, 'loss/train': 1.3931059837341309} -11/07/2021 04:18:34 - INFO - __main__ - Step 50224: {'lr': 0.00038006765314958205, 'samples': 9643008, 'steps': 50223, 'loss/train': 1.0996228456497192} -11/07/2021 04:18:34 - INFO - __main__ - Step 50225: {'lr': 0.00038006312115287125, 'samples': 9643200, 'steps': 50224, 'loss/train': 0.7568684220314026} -11/07/2021 04:18:35 - INFO - __main__ - Step 50226: {'lr': 0.00038005858909755596, 'samples': 9643392, 'steps': 50225, 'loss/train': 1.444982647895813} -11/07/2021 04:18:36 - INFO - __main__ - Step 50227: {'lr': 0.00038005405698363824, 'samples': 9643584, 'steps': 50226, 'loss/train': 1.4651623964309692} -11/07/2021 04:18:36 - INFO - __main__ - Step 50228: {'lr': 0.0003800495248111202, 'samples': 9643776, 'steps': 50227, 'loss/train': 0.8650681376457214} -11/07/2021 04:18:36 - INFO - __main__ - Step 50229: {'lr': 0.00038004499258000393, 'samples': 9643968, 'steps': 50228, 'loss/train': 2.6625075340270996} -11/07/2021 04:18:37 - INFO - __main__ - Step 50230: {'lr': 0.0003800404602902913, 'samples': 9644160, 'steps': 50229, 'loss/train': 1.6091790199279785} -11/07/2021 04:18:37 - INFO - __main__ - Step 50231: {'lr': 0.0003800359279419845, 'samples': 9644352, 'steps': 50230, 'loss/train': 1.3057498931884766} -11/07/2021 04:18:38 - INFO - __main__ - Step 50232: {'lr': 0.0003800313955350855, 'samples': 9644544, 'steps': 50231, 'loss/train': 0.8586352467536926} -11/07/2021 04:18:38 - INFO - __main__ - Step 50233: {'lr': 0.0003800268630695963, 'samples': 9644736, 'steps': 50232, 'loss/train': 1.289310097694397} -11/07/2021 04:18:39 - INFO - __main__ - Step 50234: {'lr': 0.00038002233054551906, 'samples': 9644928, 'steps': 50233, 'loss/train': 1.217408537864685} -11/07/2021 04:18:39 - INFO - __main__ - Step 50235: {'lr': 0.00038001779796285575, 'samples': 9645120, 'steps': 50234, 'loss/train': 1.2559170722961426} -11/07/2021 04:18:40 - INFO - __main__ - Step 50236: {'lr': 0.0003800132653216084, 'samples': 9645312, 'steps': 50235, 'loss/train': 1.3718836307525635} -11/07/2021 04:18:41 - INFO - __main__ - Step 50237: {'lr': 0.00038000873262177914, 'samples': 9645504, 'steps': 50236, 'loss/train': 1.396490454673767} -11/07/2021 04:18:41 - INFO - __main__ - Step 50238: {'lr': 0.00038000419986336997, 'samples': 9645696, 'steps': 50237, 'loss/train': 1.6394122838974} -11/07/2021 04:18:41 - INFO - __main__ - Step 50239: {'lr': 0.0003799996670463828, 'samples': 9645888, 'steps': 50238, 'loss/train': 1.2472902536392212} -11/07/2021 04:18:42 - INFO - __main__ - Step 50240: {'lr': 0.0003799951341708199, 'samples': 9646080, 'steps': 50239, 'loss/train': 1.4720319509506226} -11/07/2021 04:18:42 - INFO - __main__ - Step 50241: {'lr': 0.0003799906012366832, 'samples': 9646272, 'steps': 50240, 'loss/train': 0.07744947820901871} -11/07/2021 04:18:43 - INFO - __main__ - Step 50242: {'lr': 0.0003799860682439746, 'samples': 9646464, 'steps': 50241, 'loss/train': 1.135290503501892} -11/07/2021 04:18:43 - INFO - __main__ - Step 50243: {'lr': 0.0003799815351926964, 'samples': 9646656, 'steps': 50242, 'loss/train': 2.1058695316314697} -11/07/2021 04:18:44 - INFO - __main__ - Step 50244: {'lr': 0.0003799770020828505, 'samples': 9646848, 'steps': 50243, 'loss/train': 1.246898889541626} -11/07/2021 04:18:44 - INFO - __main__ - Step 50245: {'lr': 0.000379972468914439, 'samples': 9647040, 'steps': 50244, 'loss/train': 1.1737421751022339} -11/07/2021 04:18:45 - INFO - __main__ - Step 50246: {'lr': 0.0003799679356874639, 'samples': 9647232, 'steps': 50245, 'loss/train': 1.6934196949005127} -11/07/2021 04:18:45 - INFO - __main__ - Step 50247: {'lr': 0.0003799634024019272, 'samples': 9647424, 'steps': 50246, 'loss/train': 1.6743232011795044} -11/07/2021 04:18:46 - INFO - __main__ - Step 50248: {'lr': 0.0003799588690578311, 'samples': 9647616, 'steps': 50247, 'loss/train': 5.710962772369385} -11/07/2021 04:18:46 - INFO - __main__ - Step 50249: {'lr': 0.0003799543356551773, 'samples': 9647808, 'steps': 50248, 'loss/train': 1.0744068622589111} -11/07/2021 04:18:47 - INFO - __main__ - Step 50250: {'lr': 0.00037994980219396835, 'samples': 9648000, 'steps': 50249, 'loss/train': 1.2862998247146606} -11/07/2021 04:18:47 - INFO - __main__ - Step 50251: {'lr': 0.00037994526867420595, 'samples': 9648192, 'steps': 50250, 'loss/train': 1.4021929502487183} -11/07/2021 04:18:47 - INFO - __main__ - Step 50252: {'lr': 0.0003799407350958922, 'samples': 9648384, 'steps': 50251, 'loss/train': 1.3082607984542847} -11/07/2021 04:18:48 - INFO - __main__ - Step 50253: {'lr': 0.00037993620145902914, 'samples': 9648576, 'steps': 50252, 'loss/train': 0.08240436017513275} -11/07/2021 04:18:49 - INFO - __main__ - Step 50254: {'lr': 0.00037993166776361883, 'samples': 9648768, 'steps': 50253, 'loss/train': 1.5516008138656616} -11/07/2021 04:18:49 - INFO - __main__ - Step 50255: {'lr': 0.0003799271340096633, 'samples': 9648960, 'steps': 50254, 'loss/train': 1.3444350957870483} -11/07/2021 04:18:49 - INFO - __main__ - Step 50256: {'lr': 0.00037992260019716463, 'samples': 9649152, 'steps': 50255, 'loss/train': 1.1952298879623413} -11/07/2021 04:18:50 - INFO - __main__ - Step 50257: {'lr': 0.00037991806632612485, 'samples': 9649344, 'steps': 50256, 'loss/train': 1.0896855592727661} -11/07/2021 04:18:51 - INFO - __main__ - Step 50258: {'lr': 0.000379913532396546, 'samples': 9649536, 'steps': 50257, 'loss/train': 1.1467939615249634} -11/07/2021 04:18:51 - INFO - __main__ - Step 50259: {'lr': 0.0003799089984084302, 'samples': 9649728, 'steps': 50258, 'loss/train': 1.575662612915039} -11/07/2021 04:18:51 - INFO - __main__ - Step 50260: {'lr': 0.00037990446436177925, 'samples': 9649920, 'steps': 50259, 'loss/train': 1.17159104347229} -11/07/2021 04:18:52 - INFO - __main__ - Step 50261: {'lr': 0.0003798999302565954, 'samples': 9650112, 'steps': 50260, 'loss/train': 1.5639235973358154} -11/07/2021 04:18:52 - INFO - __main__ - Step 50262: {'lr': 0.0003798953960928807, 'samples': 9650304, 'steps': 50261, 'loss/train': 1.9105384349822998} -11/07/2021 04:18:54 - INFO - __main__ - Step 50263: {'lr': 0.0003798908618706371, 'samples': 9650496, 'steps': 50262, 'loss/train': 1.8271366357803345} -11/07/2021 04:18:54 - INFO - __main__ - Step 50264: {'lr': 0.0003798863275898667, 'samples': 9650688, 'steps': 50263, 'loss/train': 1.162956953048706} -11/07/2021 04:18:54 - INFO - __main__ - Step 50265: {'lr': 0.00037988179325057156, 'samples': 9650880, 'steps': 50264, 'loss/train': 1.6414152383804321} -11/07/2021 04:18:55 - INFO - __main__ - Step 50266: {'lr': 0.0003798772588527536, 'samples': 9651072, 'steps': 50265, 'loss/train': 1.4641472101211548} -11/07/2021 04:18:55 - INFO - __main__ - Step 50267: {'lr': 0.000379872724396415, 'samples': 9651264, 'steps': 50266, 'loss/train': 0.9950963258743286} -11/07/2021 04:18:55 - INFO - __main__ - Step 50268: {'lr': 0.00037986818988155775, 'samples': 9651456, 'steps': 50267, 'loss/train': 1.4459974765777588} -11/07/2021 04:18:57 - INFO - __main__ - Step 50269: {'lr': 0.0003798636553081839, 'samples': 9651648, 'steps': 50268, 'loss/train': 1.2771360874176025} -11/07/2021 04:18:57 - INFO - __main__ - Step 50270: {'lr': 0.0003798591206762955, 'samples': 9651840, 'steps': 50269, 'loss/train': 1.2188576459884644} -11/07/2021 04:18:57 - INFO - __main__ - Step 50271: {'lr': 0.0003798545859858945, 'samples': 9652032, 'steps': 50270, 'loss/train': 1.3124229907989502} -11/07/2021 04:18:58 - INFO - __main__ - Step 50272: {'lr': 0.0003798500512369832, 'samples': 9652224, 'steps': 50271, 'loss/train': 1.11708402633667} -11/07/2021 04:18:58 - INFO - __main__ - Step 50273: {'lr': 0.00037984551642956336, 'samples': 9652416, 'steps': 50272, 'loss/train': 1.3915640115737915} -11/07/2021 04:18:59 - INFO - __main__ - Step 50274: {'lr': 0.0003798409815636371, 'samples': 9652608, 'steps': 50273, 'loss/train': 1.2666629552841187} -11/07/2021 04:18:59 - INFO - __main__ - Step 50275: {'lr': 0.00037983644663920656, 'samples': 9652800, 'steps': 50274, 'loss/train': 1.1245124340057373} -11/07/2021 04:19:00 - INFO - __main__ - Step 50276: {'lr': 0.0003798319116562737, 'samples': 9652992, 'steps': 50275, 'loss/train': 1.2249014377593994} -11/07/2021 04:19:00 - INFO - __main__ - Step 50277: {'lr': 0.00037982737661484056, 'samples': 9653184, 'steps': 50276, 'loss/train': 1.4194586277008057} -11/07/2021 04:19:01 - INFO - __main__ - Step 50278: {'lr': 0.00037982284151490933, 'samples': 9653376, 'steps': 50277, 'loss/train': 0.9645190834999084} -11/07/2021 04:19:02 - INFO - __main__ - Step 50279: {'lr': 0.00037981830635648177, 'samples': 9653568, 'steps': 50278, 'loss/train': 1.2584521770477295} -11/07/2021 04:19:02 - INFO - __main__ - Step 50280: {'lr': 0.0003798137711395602, 'samples': 9653760, 'steps': 50279, 'loss/train': 1.2484103441238403} -11/07/2021 04:19:02 - INFO - __main__ - Step 50281: {'lr': 0.00037980923586414646, 'samples': 9653952, 'steps': 50280, 'loss/train': 1.3946747779846191} -11/07/2021 04:19:03 - INFO - __main__ - Step 50282: {'lr': 0.0003798047005302427, 'samples': 9654144, 'steps': 50281, 'loss/train': 1.743774175643921} -11/07/2021 04:19:03 - INFO - __main__ - Step 50283: {'lr': 0.000379800165137851, 'samples': 9654336, 'steps': 50282, 'loss/train': 1.0040243864059448} -11/07/2021 04:19:04 - INFO - __main__ - Step 50284: {'lr': 0.00037979562968697324, 'samples': 9654528, 'steps': 50283, 'loss/train': 1.5647839307785034} -11/07/2021 04:19:04 - INFO - __main__ - Step 50285: {'lr': 0.0003797910941776117, 'samples': 9654720, 'steps': 50284, 'loss/train': 0.07238461077213287} -11/07/2021 04:19:05 - INFO - __main__ - Step 50286: {'lr': 0.00037978655860976826, 'samples': 9654912, 'steps': 50285, 'loss/train': 1.6101865768432617} -11/07/2021 04:19:05 - INFO - __main__ - Step 50287: {'lr': 0.00037978202298344496, 'samples': 9655104, 'steps': 50286, 'loss/train': 1.595892310142517} -11/07/2021 04:19:05 - INFO - __main__ - Step 50288: {'lr': 0.0003797774872986439, 'samples': 9655296, 'steps': 50287, 'loss/train': 1.5872743129730225} -11/07/2021 04:19:06 - INFO - __main__ - Step 50289: {'lr': 0.00037977295155536706, 'samples': 9655488, 'steps': 50288, 'loss/train': 1.563896894454956} -11/07/2021 04:19:07 - INFO - __main__ - Step 50290: {'lr': 0.00037976841575361665, 'samples': 9655680, 'steps': 50289, 'loss/train': 1.583510398864746} -11/07/2021 04:19:07 - INFO - __main__ - Step 50291: {'lr': 0.00037976387989339445, 'samples': 9655872, 'steps': 50290, 'loss/train': 1.1028339862823486} -11/07/2021 04:19:07 - INFO - __main__ - Step 50292: {'lr': 0.0003797593439747028, 'samples': 9656064, 'steps': 50291, 'loss/train': 1.603823184967041} -11/07/2021 04:19:08 - INFO - __main__ - Step 50293: {'lr': 0.0003797548079975435, 'samples': 9656256, 'steps': 50292, 'loss/train': 1.4887603521347046} -11/07/2021 04:19:08 - INFO - __main__ - Step 50294: {'lr': 0.0003797502719619187, 'samples': 9656448, 'steps': 50293, 'loss/train': 1.4273159503936768} -11/07/2021 04:19:09 - INFO - __main__ - Step 50295: {'lr': 0.0003797457358678304, 'samples': 9656640, 'steps': 50294, 'loss/train': 1.3308401107788086} -11/07/2021 04:19:10 - INFO - __main__ - Step 50296: {'lr': 0.0003797411997152807, 'samples': 9656832, 'steps': 50295, 'loss/train': 0.9965770244598389} -11/07/2021 04:19:10 - INFO - __main__ - Step 50297: {'lr': 0.0003797366635042716, 'samples': 9657024, 'steps': 50296, 'loss/train': 1.4599796533584595} -11/07/2021 04:19:10 - INFO - __main__ - Step 50298: {'lr': 0.0003797321272348052, 'samples': 9657216, 'steps': 50297, 'loss/train': 1.2639737129211426} -11/07/2021 04:19:11 - INFO - __main__ - Step 50299: {'lr': 0.00037972759090688354, 'samples': 9657408, 'steps': 50298, 'loss/train': 1.2504427433013916} -11/07/2021 04:19:12 - INFO - __main__ - Step 50300: {'lr': 0.0003797230545205086, 'samples': 9657600, 'steps': 50299, 'loss/train': 1.3856931924819946} -11/07/2021 04:19:12 - INFO - __main__ - Step 50301: {'lr': 0.00037971851807568237, 'samples': 9657792, 'steps': 50300, 'loss/train': 1.50432288646698} -11/07/2021 04:19:12 - INFO - __main__ - Step 50302: {'lr': 0.000379713981572407, 'samples': 9657984, 'steps': 50301, 'loss/train': 1.360334873199463} -11/07/2021 04:19:13 - INFO - __main__ - Step 50303: {'lr': 0.0003797094450106846, 'samples': 9658176, 'steps': 50302, 'loss/train': 1.5017192363739014} -11/07/2021 04:19:13 - INFO - __main__ - Step 50304: {'lr': 0.00037970490839051707, 'samples': 9658368, 'steps': 50303, 'loss/train': 1.1480355262756348} -11/07/2021 04:19:14 - INFO - __main__ - Step 50305: {'lr': 0.00037970037171190655, 'samples': 9658560, 'steps': 50304, 'loss/train': 1.4229942560195923} -11/07/2021 04:19:15 - INFO - __main__ - Step 50306: {'lr': 0.000379695834974855, 'samples': 9658752, 'steps': 50305, 'loss/train': 0.122550368309021} -11/07/2021 04:19:15 - INFO - __main__ - Step 50307: {'lr': 0.0003796912981793645, 'samples': 9658944, 'steps': 50306, 'loss/train': 1.2545815706253052} -11/07/2021 04:19:15 - INFO - __main__ - Step 50308: {'lr': 0.0003796867613254371, 'samples': 9659136, 'steps': 50307, 'loss/train': 1.4521191120147705} -11/07/2021 04:19:16 - INFO - __main__ - Step 50309: {'lr': 0.0003796822244130749, 'samples': 9659328, 'steps': 50308, 'loss/train': 1.373075246810913} -11/07/2021 04:19:17 - INFO - __main__ - Step 50310: {'lr': 0.00037967768744227984, 'samples': 9659520, 'steps': 50309, 'loss/train': 1.7056126594543457} -11/07/2021 04:19:17 - INFO - __main__ - Step 50311: {'lr': 0.000379673150413054, 'samples': 9659712, 'steps': 50310, 'loss/train': 1.5011404752731323} -11/07/2021 04:19:17 - INFO - __main__ - Step 50312: {'lr': 0.00037966861332539947, 'samples': 9659904, 'steps': 50311, 'loss/train': 1.3286014795303345} -11/07/2021 04:19:18 - INFO - __main__ - Step 50313: {'lr': 0.0003796640761793183, 'samples': 9660096, 'steps': 50312, 'loss/train': 1.5061498880386353} -11/07/2021 04:19:18 - INFO - __main__ - Step 50314: {'lr': 0.00037965953897481244, 'samples': 9660288, 'steps': 50313, 'loss/train': 1.6554516553878784} -11/07/2021 04:19:19 - INFO - __main__ - Step 50315: {'lr': 0.00037965500171188406, 'samples': 9660480, 'steps': 50314, 'loss/train': 1.2993578910827637} -11/07/2021 04:19:19 - INFO - __main__ - Step 50316: {'lr': 0.00037965046439053507, 'samples': 9660672, 'steps': 50315, 'loss/train': 0.6360580325126648} -11/07/2021 04:19:20 - INFO - __main__ - Step 50317: {'lr': 0.00037964592701076753, 'samples': 9660864, 'steps': 50316, 'loss/train': 1.4160159826278687} -11/07/2021 04:19:20 - INFO - __main__ - Step 50318: {'lr': 0.00037964138957258367, 'samples': 9661056, 'steps': 50317, 'loss/train': 0.6304948925971985} -11/07/2021 04:19:20 - INFO - __main__ - Step 50319: {'lr': 0.0003796368520759854, 'samples': 9661248, 'steps': 50318, 'loss/train': 1.1022051572799683} -11/07/2021 04:19:22 - INFO - __main__ - Step 50320: {'lr': 0.00037963231452097467, 'samples': 9661440, 'steps': 50319, 'loss/train': 1.4201772212982178} -11/07/2021 04:19:22 - INFO - __main__ - Step 50321: {'lr': 0.00037962777690755365, 'samples': 9661632, 'steps': 50320, 'loss/train': 1.3736419677734375} -11/07/2021 04:19:22 - INFO - __main__ - Step 50322: {'lr': 0.00037962323923572427, 'samples': 9661824, 'steps': 50321, 'loss/train': 1.2573219537734985} -11/07/2021 04:19:23 - INFO - __main__ - Step 50323: {'lr': 0.0003796187015054888, 'samples': 9662016, 'steps': 50322, 'loss/train': 1.9343341588974} -11/07/2021 04:19:23 - INFO - __main__ - Step 50324: {'lr': 0.00037961416371684907, 'samples': 9662208, 'steps': 50323, 'loss/train': 0.29651209712028503} -11/07/2021 04:19:24 - INFO - __main__ - Step 50325: {'lr': 0.0003796096258698073, 'samples': 9662400, 'steps': 50324, 'loss/train': 1.1519948244094849} -11/07/2021 04:19:24 - INFO - __main__ - Step 50326: {'lr': 0.0003796050879643653, 'samples': 9662592, 'steps': 50325, 'loss/train': 1.5263431072235107} -11/07/2021 04:19:25 - INFO - __main__ - Step 50327: {'lr': 0.0003796005500005253, 'samples': 9662784, 'steps': 50326, 'loss/train': 1.3878707885742188} -11/07/2021 04:19:25 - INFO - __main__ - Step 50328: {'lr': 0.0003795960119782893, 'samples': 9662976, 'steps': 50327, 'loss/train': 0.9455971121788025} -11/07/2021 04:19:25 - INFO - __main__ - Step 50329: {'lr': 0.0003795914738976594, 'samples': 9663168, 'steps': 50328, 'loss/train': 1.1657785177230835} -11/07/2021 04:19:26 - INFO - __main__ - Step 50330: {'lr': 0.00037958693575863747, 'samples': 9663360, 'steps': 50329, 'loss/train': 1.1909018754959106} -11/07/2021 04:19:27 - INFO - __main__ - Step 50331: {'lr': 0.0003795823975612257, 'samples': 9663552, 'steps': 50330, 'loss/train': 1.3688995838165283} -11/07/2021 04:19:27 - INFO - __main__ - Step 50332: {'lr': 0.0003795778593054261, 'samples': 9663744, 'steps': 50331, 'loss/train': 1.1265391111373901} -11/07/2021 04:19:28 - INFO - __main__ - Step 50333: {'lr': 0.00037957332099124066, 'samples': 9663936, 'steps': 50332, 'loss/train': 1.5496602058410645} -11/07/2021 04:19:28 - INFO - __main__ - Step 50334: {'lr': 0.00037956878261867163, 'samples': 9664128, 'steps': 50333, 'loss/train': 1.4843788146972656} -11/07/2021 04:19:29 - INFO - __main__ - Step 50335: {'lr': 0.0003795642441877208, 'samples': 9664320, 'steps': 50334, 'loss/train': 1.6729861497879028} -11/07/2021 04:19:29 - INFO - __main__ - Step 50336: {'lr': 0.0003795597056983903, 'samples': 9664512, 'steps': 50335, 'loss/train': 1.5528745651245117} -11/07/2021 04:19:30 - INFO - __main__ - Step 50337: {'lr': 0.0003795551671506823, 'samples': 9664704, 'steps': 50336, 'loss/train': 1.9175281524658203} -11/07/2021 04:19:30 - INFO - __main__ - Step 50338: {'lr': 0.0003795506285445987, 'samples': 9664896, 'steps': 50337, 'loss/train': 1.3358761072158813} -11/07/2021 04:19:30 - INFO - __main__ - Step 50339: {'lr': 0.0003795460898801415, 'samples': 9665088, 'steps': 50338, 'loss/train': 1.4042829275131226} -11/07/2021 04:19:31 - INFO - __main__ - Step 50340: {'lr': 0.00037954155115731294, 'samples': 9665280, 'steps': 50339, 'loss/train': 1.368674635887146} -11/07/2021 04:19:32 - INFO - __main__ - Step 50341: {'lr': 0.0003795370123761149, 'samples': 9665472, 'steps': 50340, 'loss/train': 1.57216215133667} -11/07/2021 04:19:32 - INFO - __main__ - Step 50342: {'lr': 0.00037953247353654946, 'samples': 9665664, 'steps': 50341, 'loss/train': 1.0828821659088135} -11/07/2021 04:19:32 - INFO - __main__ - Step 50343: {'lr': 0.00037952793463861867, 'samples': 9665856, 'steps': 50342, 'loss/train': 1.0894135236740112} -11/07/2021 04:19:33 - INFO - __main__ - Step 50344: {'lr': 0.0003795233956823246, 'samples': 9666048, 'steps': 50343, 'loss/train': 1.427432894706726} -11/07/2021 04:19:34 - INFO - __main__ - Step 50345: {'lr': 0.0003795188566676694, 'samples': 9666240, 'steps': 50344, 'loss/train': 1.0008103847503662} -11/07/2021 04:19:35 - INFO - __main__ - Step 50346: {'lr': 0.00037951431759465496, 'samples': 9666432, 'steps': 50345, 'loss/train': 1.2678896188735962} -11/07/2021 04:19:35 - INFO - __main__ - Step 50347: {'lr': 0.0003795097784632833, 'samples': 9666624, 'steps': 50346, 'loss/train': 1.6455512046813965} -11/07/2021 04:19:35 - INFO - __main__ - Step 50348: {'lr': 0.00037950523927355657, 'samples': 9666816, 'steps': 50347, 'loss/train': 1.758359670639038} -11/07/2021 04:19:36 - INFO - __main__ - Step 50349: {'lr': 0.0003795007000254768, 'samples': 9667008, 'steps': 50348, 'loss/train': 1.6530606746673584} -11/07/2021 04:19:36 - INFO - __main__ - Step 50350: {'lr': 0.00037949616071904593, 'samples': 9667200, 'steps': 50349, 'loss/train': 5.764377593994141} -11/07/2021 04:19:36 - INFO - __main__ - Step 50351: {'lr': 0.0003794916213542662, 'samples': 9667392, 'steps': 50350, 'loss/train': 1.215613842010498} -11/07/2021 04:19:37 - INFO - __main__ - Step 50352: {'lr': 0.00037948708193113947, 'samples': 9667584, 'steps': 50351, 'loss/train': 0.9372159838676453} -11/07/2021 04:19:38 - INFO - __main__ - Step 50353: {'lr': 0.00037948254244966786, 'samples': 9667776, 'steps': 50352, 'loss/train': 1.5439207553863525} -11/07/2021 04:19:38 - INFO - __main__ - Step 50354: {'lr': 0.00037947800290985344, 'samples': 9667968, 'steps': 50353, 'loss/train': 1.3743999004364014} -11/07/2021 04:19:38 - INFO - __main__ - Step 50355: {'lr': 0.00037947346331169816, 'samples': 9668160, 'steps': 50354, 'loss/train': 1.4863427877426147} -11/07/2021 04:19:39 - INFO - __main__ - Step 50356: {'lr': 0.00037946892365520423, 'samples': 9668352, 'steps': 50355, 'loss/train': 1.680455207824707} -11/07/2021 04:19:40 - INFO - __main__ - Step 50357: {'lr': 0.00037946438394037356, 'samples': 9668544, 'steps': 50356, 'loss/train': 1.0879682302474976} -11/07/2021 04:19:40 - INFO - __main__ - Step 50358: {'lr': 0.00037945984416720826, 'samples': 9668736, 'steps': 50357, 'loss/train': 1.3697302341461182} -11/07/2021 04:19:41 - INFO - __main__ - Step 50359: {'lr': 0.0003794553043357104, 'samples': 9668928, 'steps': 50358, 'loss/train': 1.5519213676452637} -11/07/2021 04:19:41 - INFO - __main__ - Step 50360: {'lr': 0.0003794507644458819, 'samples': 9669120, 'steps': 50359, 'loss/train': 1.4177567958831787} -11/07/2021 04:19:41 - INFO - __main__ - Step 50361: {'lr': 0.00037944622449772485, 'samples': 9669312, 'steps': 50360, 'loss/train': 1.1745578050613403} -11/07/2021 04:19:42 - INFO - __main__ - Step 50362: {'lr': 0.0003794416844912414, 'samples': 9669504, 'steps': 50361, 'loss/train': 1.5298815965652466} -11/07/2021 04:19:43 - INFO - __main__ - Step 50363: {'lr': 0.0003794371444264335, 'samples': 9669696, 'steps': 50362, 'loss/train': 1.569003939628601} -11/07/2021 04:19:43 - INFO - __main__ - Step 50364: {'lr': 0.00037943260430330317, 'samples': 9669888, 'steps': 50363, 'loss/train': 1.3630812168121338} -11/07/2021 04:19:44 - INFO - __main__ - Step 50365: {'lr': 0.00037942806412185254, 'samples': 9670080, 'steps': 50364, 'loss/train': 1.5234861373901367} -11/07/2021 04:19:44 - INFO - __main__ - Step 50366: {'lr': 0.0003794235238820837, 'samples': 9670272, 'steps': 50365, 'loss/train': 1.5544954538345337} -11/07/2021 04:19:44 - INFO - __main__ - Step 50367: {'lr': 0.0003794189835839985, 'samples': 9670464, 'steps': 50366, 'loss/train': 1.484514832496643} -11/07/2021 04:19:45 - INFO - __main__ - Step 50368: {'lr': 0.0003794144432275992, 'samples': 9670656, 'steps': 50367, 'loss/train': 0.7086828947067261} -11/07/2021 04:19:46 - INFO - __main__ - Step 50369: {'lr': 0.0003794099028128877, 'samples': 9670848, 'steps': 50368, 'loss/train': 1.7169569730758667} -11/07/2021 04:19:46 - INFO - __main__ - Step 50370: {'lr': 0.0003794053623398661, 'samples': 9671040, 'steps': 50369, 'loss/train': 1.511048436164856} -11/07/2021 04:19:46 - INFO - __main__ - Step 50371: {'lr': 0.00037940082180853643, 'samples': 9671232, 'steps': 50370, 'loss/train': 1.7683322429656982} -11/07/2021 04:19:47 - INFO - __main__ - Step 50372: {'lr': 0.0003793962812189008, 'samples': 9671424, 'steps': 50371, 'loss/train': 1.5911660194396973} -11/07/2021 04:19:48 - INFO - __main__ - Step 50373: {'lr': 0.00037939174057096114, 'samples': 9671616, 'steps': 50372, 'loss/train': 1.3682141304016113} -11/07/2021 04:19:48 - INFO - __main__ - Step 50374: {'lr': 0.0003793871998647196, 'samples': 9671808, 'steps': 50373, 'loss/train': 1.1681374311447144} -11/07/2021 04:19:49 - INFO - __main__ - Step 50375: {'lr': 0.00037938265910017813, 'samples': 9672000, 'steps': 50374, 'loss/train': 1.4625418186187744} -11/07/2021 04:19:49 - INFO - __main__ - Step 50376: {'lr': 0.0003793781182773388, 'samples': 9672192, 'steps': 50375, 'loss/train': 1.2847131490707397} -11/07/2021 04:19:49 - INFO - __main__ - Step 50377: {'lr': 0.00037937357739620383, 'samples': 9672384, 'steps': 50376, 'loss/train': 1.396962285041809} -11/07/2021 04:19:50 - INFO - __main__ - Step 50378: {'lr': 0.000379369036456775, 'samples': 9672576, 'steps': 50377, 'loss/train': 1.40147066116333} -11/07/2021 04:19:51 - INFO - __main__ - Step 50379: {'lr': 0.00037936449545905457, 'samples': 9672768, 'steps': 50378, 'loss/train': 1.1427726745605469} -11/07/2021 04:19:51 - INFO - __main__ - Step 50380: {'lr': 0.0003793599544030444, 'samples': 9672960, 'steps': 50379, 'loss/train': 0.7213249802589417} -11/07/2021 04:19:51 - INFO - __main__ - Step 50381: {'lr': 0.00037935541328874665, 'samples': 9673152, 'steps': 50380, 'loss/train': 0.06385089457035065} -11/07/2021 04:19:52 - INFO - __main__ - Step 50382: {'lr': 0.0003793508721161634, 'samples': 9673344, 'steps': 50381, 'loss/train': 1.3770196437835693} -11/07/2021 04:19:53 - INFO - __main__ - Step 50383: {'lr': 0.00037934633088529656, 'samples': 9673536, 'steps': 50382, 'loss/train': 1.456033706665039} -11/07/2021 04:19:53 - INFO - __main__ - Step 50384: {'lr': 0.00037934178959614834, 'samples': 9673728, 'steps': 50383, 'loss/train': 0.8930547833442688} -11/07/2021 04:19:54 - INFO - __main__ - Step 50385: {'lr': 0.00037933724824872067, 'samples': 9673920, 'steps': 50384, 'loss/train': 1.4878311157226562} -11/07/2021 04:19:54 - INFO - __main__ - Step 50386: {'lr': 0.00037933270684301567, 'samples': 9674112, 'steps': 50385, 'loss/train': 1.4187685251235962} -11/07/2021 04:19:54 - INFO - __main__ - Step 50387: {'lr': 0.00037932816537903535, 'samples': 9674304, 'steps': 50386, 'loss/train': 1.256471037864685} -11/07/2021 04:19:55 - INFO - __main__ - Step 50388: {'lr': 0.0003793236238567817, 'samples': 9674496, 'steps': 50387, 'loss/train': 1.0572724342346191} -11/07/2021 04:19:56 - INFO - __main__ - Step 50389: {'lr': 0.00037931908227625686, 'samples': 9674688, 'steps': 50388, 'loss/train': 1.6994491815567017} -11/07/2021 04:19:56 - INFO - __main__ - Step 50390: {'lr': 0.0003793145406374628, 'samples': 9674880, 'steps': 50389, 'loss/train': 1.6414024829864502} -11/07/2021 04:19:57 - INFO - __main__ - Step 50391: {'lr': 0.0003793099989404016, 'samples': 9675072, 'steps': 50390, 'loss/train': 0.18833202123641968} -11/07/2021 04:19:57 - INFO - __main__ - Step 50392: {'lr': 0.00037930545718507536, 'samples': 9675264, 'steps': 50391, 'loss/train': 1.4667836427688599} -11/07/2021 04:19:58 - INFO - __main__ - Step 50393: {'lr': 0.000379300915371486, 'samples': 9675456, 'steps': 50392, 'loss/train': 1.5009870529174805} -11/07/2021 04:19:58 - INFO - __main__ - Step 50394: {'lr': 0.00037929637349963573, 'samples': 9675648, 'steps': 50393, 'loss/train': 1.3425657749176025} -11/07/2021 04:19:59 - INFO - __main__ - Step 50395: {'lr': 0.00037929183156952653, 'samples': 9675840, 'steps': 50394, 'loss/train': 1.0846537351608276} -11/07/2021 04:19:59 - INFO - __main__ - Step 50396: {'lr': 0.00037928728958116034, 'samples': 9676032, 'steps': 50395, 'loss/train': 1.7205784320831299} -11/07/2021 04:19:59 - INFO - __main__ - Step 50397: {'lr': 0.0003792827475345393, 'samples': 9676224, 'steps': 50396, 'loss/train': 2.1761927604675293} -11/07/2021 04:20:00 - INFO - __main__ - Step 50398: {'lr': 0.00037927820542966545, 'samples': 9676416, 'steps': 50397, 'loss/train': 1.4321573972702026} -11/07/2021 04:20:01 - INFO - __main__ - Step 50399: {'lr': 0.0003792736632665409, 'samples': 9676608, 'steps': 50398, 'loss/train': 1.4543241262435913} -11/07/2021 04:20:01 - INFO - __main__ - Step 50400: {'lr': 0.0003792691210451676, 'samples': 9676800, 'steps': 50399, 'loss/train': 1.7749804258346558} -11/07/2021 04:20:01 - INFO - __main__ - Step 50401: {'lr': 0.0003792645787655476, 'samples': 9676992, 'steps': 50400, 'loss/train': 1.9975613355636597} -11/07/2021 04:20:02 - INFO - __main__ - Step 50402: {'lr': 0.000379260036427683, 'samples': 9677184, 'steps': 50401, 'loss/train': 2.0390677452087402} -11/07/2021 04:20:03 - INFO - __main__ - Step 50403: {'lr': 0.0003792554940315758, 'samples': 9677376, 'steps': 50402, 'loss/train': 0.8864619731903076} -11/07/2021 04:20:03 - INFO - __main__ - Step 50404: {'lr': 0.00037925095157722807, 'samples': 9677568, 'steps': 50403, 'loss/train': 0.966880738735199} -11/07/2021 04:20:03 - INFO - __main__ - Step 50405: {'lr': 0.0003792464090646419, 'samples': 9677760, 'steps': 50404, 'loss/train': 1.2450422048568726} -11/07/2021 04:20:04 - INFO - __main__ - Step 50406: {'lr': 0.00037924186649381924, 'samples': 9677952, 'steps': 50405, 'loss/train': 1.5221196413040161} -11/07/2021 04:20:04 - INFO - __main__ - Step 50407: {'lr': 0.00037923732386476225, 'samples': 9678144, 'steps': 50406, 'loss/train': 0.800771951675415} -11/07/2021 04:20:05 - INFO - __main__ - Step 50408: {'lr': 0.0003792327811774728, 'samples': 9678336, 'steps': 50407, 'loss/train': 1.0960415601730347} -11/07/2021 04:20:05 - INFO - __main__ - Step 50409: {'lr': 0.00037922823843195317, 'samples': 9678528, 'steps': 50408, 'loss/train': 0.9421395659446716} -11/07/2021 04:20:06 - INFO - __main__ - Step 50410: {'lr': 0.00037922369562820525, 'samples': 9678720, 'steps': 50409, 'loss/train': 1.4728403091430664} -11/07/2021 04:20:06 - INFO - __main__ - Step 50411: {'lr': 0.00037921915276623106, 'samples': 9678912, 'steps': 50410, 'loss/train': 1.227642297744751} -11/07/2021 04:20:07 - INFO - __main__ - Step 50412: {'lr': 0.00037921460984603284, 'samples': 9679104, 'steps': 50411, 'loss/train': 1.0253260135650635} -11/07/2021 04:20:08 - INFO - __main__ - Step 50413: {'lr': 0.0003792100668676125, 'samples': 9679296, 'steps': 50412, 'loss/train': 1.12844717502594} -11/07/2021 04:20:08 - INFO - __main__ - Step 50414: {'lr': 0.000379205523830972, 'samples': 9679488, 'steps': 50413, 'loss/train': 1.1844233274459839} -11/07/2021 04:20:08 - INFO - __main__ - Step 50415: {'lr': 0.0003792009807361135, 'samples': 9679680, 'steps': 50414, 'loss/train': 1.5617855787277222} -11/07/2021 04:20:09 - INFO - __main__ - Step 50416: {'lr': 0.00037919643758303913, 'samples': 9679872, 'steps': 50415, 'loss/train': 1.4274672269821167} -11/07/2021 04:20:09 - INFO - __main__ - Step 50417: {'lr': 0.0003791918943717507, 'samples': 9680064, 'steps': 50416, 'loss/train': 1.6753476858139038} -11/07/2021 04:20:09 - INFO - __main__ - Step 50418: {'lr': 0.0003791873511022505, 'samples': 9680256, 'steps': 50417, 'loss/train': 1.258516550064087} -11/07/2021 04:20:10 - INFO - __main__ - Step 50419: {'lr': 0.0003791828077745405, 'samples': 9680448, 'steps': 50418, 'loss/train': 1.3263862133026123} -11/07/2021 04:20:11 - INFO - __main__ - Step 50420: {'lr': 0.00037917826438862263, 'samples': 9680640, 'steps': 50419, 'loss/train': 1.6234769821166992} -11/07/2021 04:20:11 - INFO - __main__ - Step 50421: {'lr': 0.0003791737209444991, 'samples': 9680832, 'steps': 50420, 'loss/train': 1.2203651666641235} -11/07/2021 04:20:11 - INFO - __main__ - Step 50422: {'lr': 0.00037916917744217185, 'samples': 9681024, 'steps': 50421, 'loss/train': 1.0994569063186646} -11/07/2021 04:20:12 - INFO - __main__ - Step 50423: {'lr': 0.0003791646338816429, 'samples': 9681216, 'steps': 50422, 'loss/train': 1.255558967590332} -11/07/2021 04:20:13 - INFO - __main__ - Step 50424: {'lr': 0.0003791600902629144, 'samples': 9681408, 'steps': 50423, 'loss/train': 1.5016043186187744} -11/07/2021 04:20:13 - INFO - __main__ - Step 50425: {'lr': 0.0003791555465859884, 'samples': 9681600, 'steps': 50424, 'loss/train': 1.4460242986679077} -11/07/2021 04:20:14 - INFO - __main__ - Step 50426: {'lr': 0.0003791510028508669, 'samples': 9681792, 'steps': 50425, 'loss/train': 0.0705665796995163} -11/07/2021 04:20:14 - INFO - __main__ - Step 50427: {'lr': 0.0003791464590575519, 'samples': 9681984, 'steps': 50426, 'loss/train': 1.5198925733566284} -11/07/2021 04:20:14 - INFO - __main__ - Step 50428: {'lr': 0.0003791419152060455, 'samples': 9682176, 'steps': 50427, 'loss/train': 1.438368558883667} -11/07/2021 04:20:15 - INFO - __main__ - Step 50429: {'lr': 0.00037913737129634977, 'samples': 9682368, 'steps': 50428, 'loss/train': 1.4559372663497925} -11/07/2021 04:20:16 - INFO - __main__ - Step 50430: {'lr': 0.00037913282732846676, 'samples': 9682560, 'steps': 50429, 'loss/train': 1.1034575700759888} -11/07/2021 04:20:16 - INFO - __main__ - Step 50431: {'lr': 0.0003791282833023985, 'samples': 9682752, 'steps': 50430, 'loss/train': 0.6443070769309998} -11/07/2021 04:20:16 - INFO - __main__ - Step 50432: {'lr': 0.0003791237392181469, 'samples': 9682944, 'steps': 50431, 'loss/train': 1.4389891624450684} -11/07/2021 04:20:17 - INFO - __main__ - Step 50433: {'lr': 0.0003791191950757143, 'samples': 9683136, 'steps': 50432, 'loss/train': 1.4601596593856812} -11/07/2021 04:20:18 - INFO - __main__ - Step 50434: {'lr': 0.0003791146508751025, 'samples': 9683328, 'steps': 50433, 'loss/train': 1.0389693975448608} -11/07/2021 04:20:18 - INFO - __main__ - Step 50435: {'lr': 0.00037911010661631364, 'samples': 9683520, 'steps': 50434, 'loss/train': 1.6238583326339722} -11/07/2021 04:20:18 - INFO - __main__ - Step 50436: {'lr': 0.0003791055622993498, 'samples': 9683712, 'steps': 50435, 'loss/train': 1.509716510772705} -11/07/2021 04:20:19 - INFO - __main__ - Step 50437: {'lr': 0.0003791010179242129, 'samples': 9683904, 'steps': 50436, 'loss/train': 1.1959272623062134} -11/07/2021 04:20:19 - INFO - __main__ - Step 50438: {'lr': 0.0003790964734909051, 'samples': 9684096, 'steps': 50437, 'loss/train': 1.2539235353469849} -11/07/2021 04:20:20 - INFO - __main__ - Step 50439: {'lr': 0.00037909192899942846, 'samples': 9684288, 'steps': 50438, 'loss/train': 1.107391357421875} -11/07/2021 04:20:21 - INFO - __main__ - Step 50440: {'lr': 0.00037908738444978495, 'samples': 9684480, 'steps': 50439, 'loss/train': 1.3870924711227417} -11/07/2021 04:20:21 - INFO - __main__ - Step 50441: {'lr': 0.00037908283984197666, 'samples': 9684672, 'steps': 50440, 'loss/train': 1.7239774465560913} -11/07/2021 04:20:21 - INFO - __main__ - Step 50442: {'lr': 0.0003790782951760057, 'samples': 9684864, 'steps': 50441, 'loss/train': 1.4376455545425415} -11/07/2021 04:20:22 - INFO - __main__ - Step 50443: {'lr': 0.000379073750451874, 'samples': 9685056, 'steps': 50442, 'loss/train': 1.0883122682571411} -11/07/2021 04:20:23 - INFO - __main__ - Step 50444: {'lr': 0.00037906920566958363, 'samples': 9685248, 'steps': 50443, 'loss/train': 1.358377456665039} -11/07/2021 04:20:23 - INFO - __main__ - Step 50445: {'lr': 0.0003790646608291367, 'samples': 9685440, 'steps': 50444, 'loss/train': 1.310596227645874} -11/07/2021 04:20:23 - INFO - __main__ - Step 50446: {'lr': 0.00037906011593053527, 'samples': 9685632, 'steps': 50445, 'loss/train': 1.6248341798782349} -11/07/2021 04:20:24 - INFO - __main__ - Step 50447: {'lr': 0.00037905557097378127, 'samples': 9685824, 'steps': 50446, 'loss/train': 1.4741896390914917} -11/07/2021 04:20:24 - INFO - __main__ - Step 50448: {'lr': 0.00037905102595887685, 'samples': 9686016, 'steps': 50447, 'loss/train': 1.413648247718811} -11/07/2021 04:20:25 - INFO - __main__ - Step 50449: {'lr': 0.00037904648088582407, 'samples': 9686208, 'steps': 50448, 'loss/train': 1.1509143114089966} -11/07/2021 04:20:25 - INFO - __main__ - Step 50450: {'lr': 0.0003790419357546249, 'samples': 9686400, 'steps': 50449, 'loss/train': 1.2753708362579346} -11/07/2021 04:20:26 - INFO - __main__ - Step 50451: {'lr': 0.0003790373905652814, 'samples': 9686592, 'steps': 50450, 'loss/train': 1.6979026794433594} -11/07/2021 04:20:26 - INFO - __main__ - Step 50452: {'lr': 0.0003790328453177957, 'samples': 9686784, 'steps': 50451, 'loss/train': 1.5667774677276611} -11/07/2021 04:20:26 - INFO - __main__ - Step 50453: {'lr': 0.0003790283000121697, 'samples': 9686976, 'steps': 50452, 'loss/train': 1.496895670890808} -11/07/2021 04:20:27 - INFO - __main__ - Step 50454: {'lr': 0.0003790237546484056, 'samples': 9687168, 'steps': 50453, 'loss/train': 1.5901826620101929} -11/07/2021 04:20:28 - INFO - __main__ - Step 50455: {'lr': 0.00037901920922650534, 'samples': 9687360, 'steps': 50454, 'loss/train': 1.4874805212020874} -11/07/2021 04:20:28 - INFO - __main__ - Step 50456: {'lr': 0.0003790146637464711, 'samples': 9687552, 'steps': 50455, 'loss/train': 1.5322622060775757} -11/07/2021 04:20:28 - INFO - __main__ - Step 50457: {'lr': 0.0003790101182083048, 'samples': 9687744, 'steps': 50456, 'loss/train': 2.1499805450439453} -11/07/2021 04:20:29 - INFO - __main__ - Step 50458: {'lr': 0.0003790055726120085, 'samples': 9687936, 'steps': 50457, 'loss/train': 1.5269300937652588} -11/07/2021 04:20:29 - INFO - __main__ - Step 50459: {'lr': 0.0003790010269575844, 'samples': 9688128, 'steps': 50458, 'loss/train': 0.9556301236152649} -11/07/2021 04:20:31 - INFO - __main__ - Step 50460: {'lr': 0.00037899648124503426, 'samples': 9688320, 'steps': 50459, 'loss/train': 1.2562488317489624} -11/07/2021 04:20:31 - INFO - __main__ - Step 50461: {'lr': 0.0003789919354743604, 'samples': 9688512, 'steps': 50460, 'loss/train': 1.3984532356262207} -11/07/2021 04:20:31 - INFO - __main__ - Step 50462: {'lr': 0.00037898738964556474, 'samples': 9688704, 'steps': 50461, 'loss/train': 1.095470905303955} -11/07/2021 04:20:32 - INFO - __main__ - Step 50463: {'lr': 0.0003789828437586494, 'samples': 9688896, 'steps': 50462, 'loss/train': 0.21125854551792145} -11/07/2021 04:20:32 - INFO - __main__ - Step 50464: {'lr': 0.0003789782978136163, 'samples': 9689088, 'steps': 50463, 'loss/train': 1.7625631093978882} -11/07/2021 04:20:33 - INFO - __main__ - Step 50465: {'lr': 0.0003789737518104676, 'samples': 9689280, 'steps': 50464, 'loss/train': 1.1391310691833496} -11/07/2021 04:20:34 - INFO - __main__ - Step 50466: {'lr': 0.0003789692057492053, 'samples': 9689472, 'steps': 50465, 'loss/train': 0.7298038005828857} -11/07/2021 04:20:34 - INFO - __main__ - Step 50467: {'lr': 0.0003789646596298315, 'samples': 9689664, 'steps': 50466, 'loss/train': 0.6776963472366333} -11/07/2021 04:20:34 - INFO - __main__ - Step 50468: {'lr': 0.0003789601134523482, 'samples': 9689856, 'steps': 50467, 'loss/train': 1.4561177492141724} -11/07/2021 04:20:35 - INFO - __main__ - Step 50469: {'lr': 0.0003789555672167575, 'samples': 9690048, 'steps': 50468, 'loss/train': 1.309482455253601} -11/07/2021 04:20:36 - INFO - __main__ - Step 50470: {'lr': 0.00037895102092306134, 'samples': 9690240, 'steps': 50469, 'loss/train': 1.7961630821228027} -11/07/2021 04:20:36 - INFO - __main__ - Step 50471: {'lr': 0.00037894647457126186, 'samples': 9690432, 'steps': 50470, 'loss/train': 1.5374242067337036} -11/07/2021 04:20:36 - INFO - __main__ - Step 50472: {'lr': 0.00037894192816136107, 'samples': 9690624, 'steps': 50471, 'loss/train': 1.2444005012512207} -11/07/2021 04:20:37 - INFO - __main__ - Step 50473: {'lr': 0.00037893738169336114, 'samples': 9690816, 'steps': 50472, 'loss/train': 1.5550144910812378} -11/07/2021 04:20:37 - INFO - __main__ - Step 50474: {'lr': 0.00037893283516726397, 'samples': 9691008, 'steps': 50473, 'loss/train': 1.3162457942962646} -11/07/2021 04:20:38 - INFO - __main__ - Step 50475: {'lr': 0.0003789282885830716, 'samples': 9691200, 'steps': 50474, 'loss/train': 2.113288164138794} -11/07/2021 04:20:38 - INFO - __main__ - Step 50476: {'lr': 0.0003789237419407862, 'samples': 9691392, 'steps': 50475, 'loss/train': 1.8515410423278809} -11/07/2021 04:20:39 - INFO - __main__ - Step 50477: {'lr': 0.00037891919524040964, 'samples': 9691584, 'steps': 50476, 'loss/train': 1.5828161239624023} -11/07/2021 04:20:39 - INFO - __main__ - Step 50478: {'lr': 0.0003789146484819442, 'samples': 9691776, 'steps': 50477, 'loss/train': 0.8145389556884766} -11/07/2021 04:20:40 - INFO - __main__ - Step 50479: {'lr': 0.00037891010166539175, 'samples': 9691968, 'steps': 50478, 'loss/train': 1.2109582424163818} -11/07/2021 04:20:41 - INFO - __main__ - Step 50480: {'lr': 0.00037890555479075437, 'samples': 9692160, 'steps': 50479, 'loss/train': 1.516937255859375} -11/07/2021 04:20:42 - INFO - __main__ - Step 50481: {'lr': 0.0003789010078580342, 'samples': 9692352, 'steps': 50480, 'loss/train': 1.3102186918258667} -11/07/2021 04:20:42 - INFO - __main__ - Step 50482: {'lr': 0.00037889646086723325, 'samples': 9692544, 'steps': 50481, 'loss/train': 1.1893430948257446} -11/07/2021 04:20:42 - INFO - __main__ - Step 50483: {'lr': 0.0003788919138183534, 'samples': 9692736, 'steps': 50482, 'loss/train': 1.4249972105026245} -11/07/2021 04:20:43 - INFO - __main__ - Step 50484: {'lr': 0.000378887366711397, 'samples': 9692928, 'steps': 50483, 'loss/train': 1.0710270404815674} -11/07/2021 04:20:43 - INFO - __main__ - Step 50485: {'lr': 0.0003788828195463658, 'samples': 9693120, 'steps': 50484, 'loss/train': 0.8438765406608582} -11/07/2021 04:20:44 - INFO - __main__ - Step 50486: {'lr': 0.0003788782723232621, 'samples': 9693312, 'steps': 50485, 'loss/train': 1.1044734716415405} -11/07/2021 04:20:44 - INFO - __main__ - Step 50487: {'lr': 0.00037887372504208784, 'samples': 9693504, 'steps': 50486, 'loss/train': 0.1660122126340866} -11/07/2021 04:20:45 - INFO - __main__ - Step 50488: {'lr': 0.000378869177702845, 'samples': 9693696, 'steps': 50487, 'loss/train': 1.5479238033294678} -11/07/2021 04:20:45 - INFO - __main__ - Step 50489: {'lr': 0.00037886463030553576, 'samples': 9693888, 'steps': 50488, 'loss/train': 0.8453708291053772} -11/07/2021 04:20:45 - INFO - __main__ - Step 50490: {'lr': 0.0003788600828501621, 'samples': 9694080, 'steps': 50489, 'loss/train': 1.5299060344696045} -11/07/2021 04:20:47 - INFO - __main__ - Step 50491: {'lr': 0.000378855535336726, 'samples': 9694272, 'steps': 50490, 'loss/train': 1.4592078924179077} -11/07/2021 04:20:47 - INFO - __main__ - Step 50492: {'lr': 0.00037885098776522966, 'samples': 9694464, 'steps': 50491, 'loss/train': 1.3624205589294434} -11/07/2021 04:20:47 - INFO - __main__ - Step 50493: {'lr': 0.00037884644013567504, 'samples': 9694656, 'steps': 50492, 'loss/train': 1.2569674253463745} -11/07/2021 04:20:48 - INFO - __main__ - Step 50494: {'lr': 0.0003788418924480642, 'samples': 9694848, 'steps': 50493, 'loss/train': 1.4081571102142334} -11/07/2021 04:20:48 - INFO - __main__ - Step 50495: {'lr': 0.00037883734470239914, 'samples': 9695040, 'steps': 50494, 'loss/train': 0.1726246476173401} -11/07/2021 04:20:49 - INFO - __main__ - Step 50496: {'lr': 0.00037883279689868203, 'samples': 9695232, 'steps': 50495, 'loss/train': 1.0943998098373413} -11/07/2021 04:20:49 - INFO - __main__ - Step 50497: {'lr': 0.00037882824903691484, 'samples': 9695424, 'steps': 50496, 'loss/train': 1.4701080322265625} -11/07/2021 04:20:50 - INFO - __main__ - Step 50498: {'lr': 0.00037882370111709963, 'samples': 9695616, 'steps': 50497, 'loss/train': 1.3461015224456787} -11/07/2021 04:20:50 - INFO - __main__ - Step 50499: {'lr': 0.00037881915313923845, 'samples': 9695808, 'steps': 50498, 'loss/train': 1.5255160331726074} -11/07/2021 04:20:50 - INFO - __main__ - Step 50500: {'lr': 0.0003788146051033333, 'samples': 9696000, 'steps': 50499, 'loss/train': 1.5375534296035767} -11/07/2021 04:20:51 - INFO - __main__ - Step 50501: {'lr': 0.0003788100570093863, 'samples': 9696192, 'steps': 50500, 'loss/train': 1.058691143989563} -11/07/2021 04:20:52 - INFO - __main__ - Step 50502: {'lr': 0.0003788055088573995, 'samples': 9696384, 'steps': 50501, 'loss/train': 1.8498750925064087} -11/07/2021 04:20:52 - INFO - __main__ - Step 50503: {'lr': 0.0003788009606473749, 'samples': 9696576, 'steps': 50502, 'loss/train': 1.3221867084503174} -11/07/2021 04:20:52 - INFO - __main__ - Step 50504: {'lr': 0.0003787964123793146, 'samples': 9696768, 'steps': 50503, 'loss/train': 1.1646900177001953} -11/07/2021 04:20:53 - INFO - __main__ - Step 50505: {'lr': 0.0003787918640532206, 'samples': 9696960, 'steps': 50504, 'loss/train': 1.4190033674240112} -11/07/2021 04:20:54 - INFO - __main__ - Step 50506: {'lr': 0.000378787315669095, 'samples': 9697152, 'steps': 50505, 'loss/train': 1.230149507522583} -11/07/2021 04:20:54 - INFO - __main__ - Step 50507: {'lr': 0.00037878276722693984, 'samples': 9697344, 'steps': 50506, 'loss/train': 1.09401273727417} -11/07/2021 04:20:55 - INFO - __main__ - Step 50508: {'lr': 0.00037877821872675705, 'samples': 9697536, 'steps': 50507, 'loss/train': 1.4707863330841064} -11/07/2021 04:20:55 - INFO - __main__ - Step 50509: {'lr': 0.00037877367016854886, 'samples': 9697728, 'steps': 50508, 'loss/train': 1.4535642862319946} -11/07/2021 04:20:55 - INFO - __main__ - Step 50510: {'lr': 0.00037876912155231725, 'samples': 9697920, 'steps': 50509, 'loss/train': 1.3505984544754028} -11/07/2021 04:20:56 - INFO - __main__ - Step 50511: {'lr': 0.0003787645728780642, 'samples': 9698112, 'steps': 50510, 'loss/train': 1.0581302642822266} -11/07/2021 04:20:57 - INFO - __main__ - Step 50512: {'lr': 0.0003787600241457918, 'samples': 9698304, 'steps': 50511, 'loss/train': 1.6496787071228027} -11/07/2021 04:20:57 - INFO - __main__ - Step 50513: {'lr': 0.0003787554753555022, 'samples': 9698496, 'steps': 50512, 'loss/train': 1.4941242933273315} -11/07/2021 04:20:57 - INFO - __main__ - Step 50514: {'lr': 0.00037875092650719737, 'samples': 9698688, 'steps': 50513, 'loss/train': 1.7991743087768555} -11/07/2021 04:20:58 - INFO - __main__ - Step 50515: {'lr': 0.0003787463776008794, 'samples': 9698880, 'steps': 50514, 'loss/train': 1.6457631587982178} -11/07/2021 04:20:58 - INFO - __main__ - Step 50516: {'lr': 0.00037874182863655015, 'samples': 9699072, 'steps': 50515, 'loss/train': 3.9654839038848877} -11/07/2021 04:20:59 - INFO - __main__ - Step 50517: {'lr': 0.00037873727961421197, 'samples': 9699264, 'steps': 50516, 'loss/train': 1.1913834810256958} -11/07/2021 04:21:00 - INFO - __main__ - Step 50518: {'lr': 0.00037873273053386664, 'samples': 9699456, 'steps': 50517, 'loss/train': 1.2977443933486938} -11/07/2021 04:21:00 - INFO - __main__ - Step 50519: {'lr': 0.00037872818139551633, 'samples': 9699648, 'steps': 50518, 'loss/train': 0.13847365975379944} -11/07/2021 04:21:01 - INFO - __main__ - Step 50520: {'lr': 0.0003787236321991632, 'samples': 9699840, 'steps': 50519, 'loss/train': 1.0413885116577148} -11/07/2021 04:21:01 - INFO - __main__ - Step 50521: {'lr': 0.0003787190829448092, 'samples': 9700032, 'steps': 50520, 'loss/train': 0.9799793362617493} -11/07/2021 04:21:01 - INFO - __main__ - Step 50522: {'lr': 0.00037871453363245625, 'samples': 9700224, 'steps': 50521, 'loss/train': 1.574615716934204} -11/07/2021 04:21:02 - INFO - __main__ - Step 50523: {'lr': 0.0003787099842621066, 'samples': 9700416, 'steps': 50522, 'loss/train': 1.5450891256332397} -11/07/2021 04:21:03 - INFO - __main__ - Step 50524: {'lr': 0.0003787054348337621, 'samples': 9700608, 'steps': 50523, 'loss/train': 1.689807653427124} -11/07/2021 04:21:03 - INFO - __main__ - Step 50525: {'lr': 0.000378700885347425, 'samples': 9700800, 'steps': 50524, 'loss/train': 1.999502182006836} -11/07/2021 04:21:03 - INFO - __main__ - Step 50526: {'lr': 0.0003786963358030973, 'samples': 9700992, 'steps': 50525, 'loss/train': 1.3054684400558472} -11/07/2021 04:21:04 - INFO - __main__ - Step 50527: {'lr': 0.000378691786200781, 'samples': 9701184, 'steps': 50526, 'loss/train': 1.6954087018966675} -11/07/2021 04:21:05 - INFO - __main__ - Step 50528: {'lr': 0.0003786872365404781, 'samples': 9701376, 'steps': 50527, 'loss/train': 1.4089579582214355} -11/07/2021 04:21:05 - INFO - __main__ - Step 50529: {'lr': 0.00037868268682219073, 'samples': 9701568, 'steps': 50528, 'loss/train': 1.2623209953308105} -11/07/2021 04:21:05 - INFO - __main__ - Step 50530: {'lr': 0.000378678137045921, 'samples': 9701760, 'steps': 50529, 'loss/train': 1.2020975351333618} -11/07/2021 04:21:06 - INFO - __main__ - Step 50531: {'lr': 0.0003786735872116709, 'samples': 9701952, 'steps': 50530, 'loss/train': 1.2616205215454102} -11/07/2021 04:21:06 - INFO - __main__ - Step 50532: {'lr': 0.00037866903731944234, 'samples': 9702144, 'steps': 50531, 'loss/train': 1.9756957292556763} -11/07/2021 04:21:07 - INFO - __main__ - Step 50533: {'lr': 0.0003786644873692376, 'samples': 9702336, 'steps': 50532, 'loss/train': 1.620253562927246} -11/07/2021 04:21:08 - INFO - __main__ - Step 50534: {'lr': 0.0003786599373610586, 'samples': 9702528, 'steps': 50533, 'loss/train': 1.2405271530151367} -11/07/2021 04:21:08 - INFO - __main__ - Step 50535: {'lr': 0.00037865538729490745, 'samples': 9702720, 'steps': 50534, 'loss/train': 1.2175302505493164} -11/07/2021 04:21:08 - INFO - __main__ - Step 50536: {'lr': 0.00037865083717078605, 'samples': 9702912, 'steps': 50535, 'loss/train': 1.144630789756775} -11/07/2021 04:21:09 - INFO - __main__ - Step 50537: {'lr': 0.00037864628698869676, 'samples': 9703104, 'steps': 50536, 'loss/train': 1.092538833618164} -11/07/2021 04:21:10 - INFO - __main__ - Step 50538: {'lr': 0.0003786417367486413, 'samples': 9703296, 'steps': 50537, 'loss/train': 1.1753264665603638} -11/07/2021 04:21:10 - INFO - __main__ - Step 50539: {'lr': 0.00037863718645062184, 'samples': 9703488, 'steps': 50538, 'loss/train': 1.6783736944198608} -11/07/2021 04:21:10 - INFO - __main__ - Step 50540: {'lr': 0.00037863263609464056, 'samples': 9703680, 'steps': 50539, 'loss/train': 1.5667228698730469} -11/07/2021 04:21:11 - INFO - __main__ - Step 50541: {'lr': 0.00037862808568069935, 'samples': 9703872, 'steps': 50540, 'loss/train': 1.5426188707351685} -11/07/2021 04:21:11 - INFO - __main__ - Step 50542: {'lr': 0.00037862353520880026, 'samples': 9704064, 'steps': 50541, 'loss/train': 1.5579650402069092} -11/07/2021 04:21:12 - INFO - __main__ - Step 50543: {'lr': 0.0003786189846789454, 'samples': 9704256, 'steps': 50542, 'loss/train': 1.1260631084442139} -11/07/2021 04:21:12 - INFO - __main__ - Step 50544: {'lr': 0.00037861443409113683, 'samples': 9704448, 'steps': 50543, 'loss/train': 1.2102491855621338} -11/07/2021 04:21:13 - INFO - __main__ - Step 50545: {'lr': 0.0003786098834453766, 'samples': 9704640, 'steps': 50544, 'loss/train': 1.4704492092132568} -11/07/2021 04:21:13 - INFO - __main__ - Step 50546: {'lr': 0.00037860533274166675, 'samples': 9704832, 'steps': 50545, 'loss/train': 1.130420446395874} -11/07/2021 04:21:13 - INFO - __main__ - Step 50547: {'lr': 0.0003786007819800094, 'samples': 9705024, 'steps': 50546, 'loss/train': 1.5193778276443481} -11/07/2021 04:21:14 - INFO - __main__ - Step 50548: {'lr': 0.00037859623116040633, 'samples': 9705216, 'steps': 50547, 'loss/train': 1.3470855951309204} -11/07/2021 04:21:15 - INFO - __main__ - Step 50549: {'lr': 0.00037859168028285984, 'samples': 9705408, 'steps': 50548, 'loss/train': 1.4055453538894653} -11/07/2021 04:21:15 - INFO - __main__ - Step 50550: {'lr': 0.000378587129347372, 'samples': 9705600, 'steps': 50549, 'loss/train': 1.0417683124542236} -11/07/2021 04:21:16 - INFO - __main__ - Step 50551: {'lr': 0.00037858257835394473, 'samples': 9705792, 'steps': 50550, 'loss/train': 1.7074761390686035} -11/07/2021 04:21:16 - INFO - __main__ - Step 50552: {'lr': 0.0003785780273025802, 'samples': 9705984, 'steps': 50551, 'loss/train': 1.2066880464553833} -11/07/2021 04:21:17 - INFO - __main__ - Step 50553: {'lr': 0.00037857347619328033, 'samples': 9706176, 'steps': 50552, 'loss/train': 1.751990556716919} -11/07/2021 04:21:17 - INFO - __main__ - Step 50554: {'lr': 0.0003785689250260472, 'samples': 9706368, 'steps': 50553, 'loss/train': 1.3436176776885986} -11/07/2021 04:21:18 - INFO - __main__ - Step 50555: {'lr': 0.00037856437380088295, 'samples': 9706560, 'steps': 50554, 'loss/train': 1.865929365158081} -11/07/2021 04:21:18 - INFO - __main__ - Step 50556: {'lr': 0.0003785598225177896, 'samples': 9706752, 'steps': 50555, 'loss/train': 1.5532974004745483} -11/07/2021 04:21:18 - INFO - __main__ - Step 50557: {'lr': 0.0003785552711767691, 'samples': 9706944, 'steps': 50556, 'loss/train': 1.744436502456665} -11/07/2021 04:21:19 - INFO - __main__ - Step 50558: {'lr': 0.0003785507197778236, 'samples': 9707136, 'steps': 50557, 'loss/train': 1.4375718832015991} -11/07/2021 04:21:20 - INFO - __main__ - Step 50559: {'lr': 0.0003785461683209552, 'samples': 9707328, 'steps': 50558, 'loss/train': 1.1379846334457397} -11/07/2021 04:21:20 - INFO - __main__ - Step 50560: {'lr': 0.00037854161680616586, 'samples': 9707520, 'steps': 50559, 'loss/train': 1.375577688217163} -11/07/2021 04:21:21 - INFO - __main__ - Step 50561: {'lr': 0.00037853706523345766, 'samples': 9707712, 'steps': 50560, 'loss/train': 1.7637293338775635} -11/07/2021 04:21:21 - INFO - __main__ - Step 50562: {'lr': 0.0003785325136028326, 'samples': 9707904, 'steps': 50561, 'loss/train': 1.5140193700790405} -11/07/2021 04:21:21 - INFO - __main__ - Step 50563: {'lr': 0.0003785279619142927, 'samples': 9708096, 'steps': 50562, 'loss/train': 1.4685074090957642} -11/07/2021 04:21:22 - INFO - __main__ - Step 50564: {'lr': 0.0003785234101678402, 'samples': 9708288, 'steps': 50563, 'loss/train': 1.5050429105758667} -11/07/2021 04:21:23 - INFO - __main__ - Step 50565: {'lr': 0.000378518858363477, 'samples': 9708480, 'steps': 50564, 'loss/train': 1.1843069791793823} -11/07/2021 04:21:23 - INFO - __main__ - Step 50566: {'lr': 0.00037851430650120516, 'samples': 9708672, 'steps': 50565, 'loss/train': 1.375612497329712} -11/07/2021 04:21:23 - INFO - __main__ - Step 50567: {'lr': 0.00037850975458102686, 'samples': 9708864, 'steps': 50566, 'loss/train': 1.0893933773040771} -11/07/2021 04:21:24 - INFO - __main__ - Step 50568: {'lr': 0.000378505202602944, 'samples': 9709056, 'steps': 50567, 'loss/train': 1.0624316930770874} -11/07/2021 04:21:25 - INFO - __main__ - Step 50569: {'lr': 0.0003785006505669586, 'samples': 9709248, 'steps': 50568, 'loss/train': 1.5698699951171875} -11/07/2021 04:21:25 - INFO - __main__ - Step 50570: {'lr': 0.0003784960984730728, 'samples': 9709440, 'steps': 50569, 'loss/train': 1.3673588037490845} -11/07/2021 04:21:25 - INFO - __main__ - Step 50571: {'lr': 0.00037849154632128867, 'samples': 9709632, 'steps': 50570, 'loss/train': 1.5583531856536865} -11/07/2021 04:21:26 - INFO - __main__ - Step 50572: {'lr': 0.0003784869941116082, 'samples': 9709824, 'steps': 50571, 'loss/train': 1.3499821424484253} -11/07/2021 04:21:26 - INFO - __main__ - Step 50573: {'lr': 0.00037848244184403356, 'samples': 9710016, 'steps': 50572, 'loss/train': 1.1018770933151245} -11/07/2021 04:21:27 - INFO - __main__ - Step 50574: {'lr': 0.0003784778895185667, 'samples': 9710208, 'steps': 50573, 'loss/train': 1.6546837091445923} -11/07/2021 04:21:27 - INFO - __main__ - Step 50575: {'lr': 0.00037847333713520966, 'samples': 9710400, 'steps': 50574, 'loss/train': 2.1528480052948} -11/07/2021 04:21:28 - INFO - __main__ - Step 50576: {'lr': 0.0003784687846939645, 'samples': 9710592, 'steps': 50575, 'loss/train': 1.3178619146347046} -11/07/2021 04:21:28 - INFO - __main__ - Step 50577: {'lr': 0.00037846423219483325, 'samples': 9710784, 'steps': 50576, 'loss/train': 1.562099814414978} -11/07/2021 04:21:29 - INFO - __main__ - Step 50578: {'lr': 0.00037845967963781807, 'samples': 9710976, 'steps': 50577, 'loss/train': 1.1327686309814453} -11/07/2021 04:21:29 - INFO - __main__ - Step 50579: {'lr': 0.00037845512702292097, 'samples': 9711168, 'steps': 50578, 'loss/train': 1.1399965286254883} -11/07/2021 04:21:30 - INFO - __main__ - Step 50580: {'lr': 0.00037845057435014384, 'samples': 9711360, 'steps': 50579, 'loss/train': 1.2374995946884155} -11/07/2021 04:21:30 - INFO - __main__ - Step 50581: {'lr': 0.000378446021619489, 'samples': 9711552, 'steps': 50580, 'loss/train': 1.163236379623413} -11/07/2021 04:21:31 - INFO - __main__ - Step 50582: {'lr': 0.0003784414688309583, 'samples': 9711744, 'steps': 50581, 'loss/train': 0.9576605558395386} -11/07/2021 04:21:31 - INFO - __main__ - Step 50583: {'lr': 0.0003784369159845539, 'samples': 9711936, 'steps': 50582, 'loss/train': 1.6346780061721802} -11/07/2021 04:21:31 - INFO - __main__ - Step 50584: {'lr': 0.00037843236308027776, 'samples': 9712128, 'steps': 50583, 'loss/train': 1.5481826066970825} -11/07/2021 04:21:32 - INFO - __main__ - Step 50585: {'lr': 0.000378427810118132, 'samples': 9712320, 'steps': 50584, 'loss/train': 1.5417025089263916} -11/07/2021 04:21:33 - INFO - __main__ - Step 50586: {'lr': 0.0003784232570981186, 'samples': 9712512, 'steps': 50585, 'loss/train': 1.3001868724822998} -11/07/2021 04:21:33 - INFO - __main__ - Step 50587: {'lr': 0.0003784187040202398, 'samples': 9712704, 'steps': 50586, 'loss/train': 1.3041154146194458} -11/07/2021 04:21:33 - INFO - __main__ - Step 50588: {'lr': 0.0003784141508844974, 'samples': 9712896, 'steps': 50587, 'loss/train': 1.7065526247024536} -11/07/2021 04:21:34 - INFO - __main__ - Step 50589: {'lr': 0.00037840959769089354, 'samples': 9713088, 'steps': 50588, 'loss/train': 1.3818120956420898} -11/07/2021 04:21:35 - INFO - __main__ - Step 50590: {'lr': 0.00037840504443943033, 'samples': 9713280, 'steps': 50589, 'loss/train': 1.0090471506118774} -11/07/2021 04:21:35 - INFO - __main__ - Step 50591: {'lr': 0.00037840049113010976, 'samples': 9713472, 'steps': 50590, 'loss/train': 1.7250033617019653} -11/07/2021 04:21:35 - INFO - __main__ - Step 50592: {'lr': 0.000378395937762934, 'samples': 9713664, 'steps': 50591, 'loss/train': 1.4000662565231323} -11/07/2021 04:21:36 - INFO - __main__ - Step 50593: {'lr': 0.000378391384337905, 'samples': 9713856, 'steps': 50592, 'loss/train': 1.5273271799087524} -11/07/2021 04:21:36 - INFO - __main__ - Step 50594: {'lr': 0.00037838683085502473, 'samples': 9714048, 'steps': 50593, 'loss/train': 0.9857616424560547} -11/07/2021 04:21:37 - INFO - __main__ - Step 50595: {'lr': 0.0003783822773142954, 'samples': 9714240, 'steps': 50594, 'loss/train': 1.7231225967407227} -11/07/2021 04:21:37 - INFO - __main__ - Step 50596: {'lr': 0.00037837772371571897, 'samples': 9714432, 'steps': 50595, 'loss/train': 1.5911321640014648} -11/07/2021 04:21:38 - INFO - __main__ - Step 50597: {'lr': 0.0003783731700592975, 'samples': 9714624, 'steps': 50596, 'loss/train': 1.0957367420196533} -11/07/2021 04:21:38 - INFO - __main__ - Step 50598: {'lr': 0.0003783686163450332, 'samples': 9714816, 'steps': 50597, 'loss/train': 1.6767088174819946} -11/07/2021 04:21:38 - INFO - __main__ - Step 50599: {'lr': 0.0003783640625729278, 'samples': 9715008, 'steps': 50598, 'loss/train': 1.8420186042785645} -11/07/2021 04:21:40 - INFO - __main__ - Step 50600: {'lr': 0.00037835950874298365, 'samples': 9715200, 'steps': 50599, 'loss/train': 1.783567190170288} -11/07/2021 04:21:40 - INFO - __main__ - Step 50601: {'lr': 0.0003783549548552027, 'samples': 9715392, 'steps': 50600, 'loss/train': 1.1593835353851318} -11/07/2021 04:21:40 - INFO - __main__ - Step 50602: {'lr': 0.00037835040090958684, 'samples': 9715584, 'steps': 50601, 'loss/train': 1.4136946201324463} -11/07/2021 04:21:41 - INFO - __main__ - Step 50603: {'lr': 0.0003783458469061384, 'samples': 9715776, 'steps': 50602, 'loss/train': 1.1507467031478882} -11/07/2021 04:21:41 - INFO - __main__ - Step 50604: {'lr': 0.0003783412928448593, 'samples': 9715968, 'steps': 50603, 'loss/train': 1.043258786201477} -11/07/2021 04:21:42 - INFO - __main__ - Step 50605: {'lr': 0.00037833673872575153, 'samples': 9716160, 'steps': 50604, 'loss/train': 1.5505529642105103} -11/07/2021 04:21:42 - INFO - __main__ - Step 50606: {'lr': 0.00037833218454881725, 'samples': 9716352, 'steps': 50605, 'loss/train': 1.3890246152877808} -11/07/2021 04:21:43 - INFO - __main__ - Step 50607: {'lr': 0.0003783276303140584, 'samples': 9716544, 'steps': 50606, 'loss/train': 1.0809133052825928} -11/07/2021 04:21:43 - INFO - __main__ - Step 50608: {'lr': 0.0003783230760214772, 'samples': 9716736, 'steps': 50607, 'loss/train': 1.2744044065475464} -11/07/2021 04:21:43 - INFO - __main__ - Step 50609: {'lr': 0.00037831852167107563, 'samples': 9716928, 'steps': 50608, 'loss/train': 0.9171972870826721} -11/07/2021 04:21:44 - INFO - __main__ - Step 50610: {'lr': 0.0003783139672628556, 'samples': 9717120, 'steps': 50609, 'loss/train': 1.0866856575012207} -11/07/2021 04:21:45 - INFO - __main__ - Step 50611: {'lr': 0.0003783094127968193, 'samples': 9717312, 'steps': 50610, 'loss/train': 0.7773082852363586} -11/07/2021 04:21:45 - INFO - __main__ - Step 50612: {'lr': 0.0003783048582729688, 'samples': 9717504, 'steps': 50611, 'loss/train': 1.7726795673370361} -11/07/2021 04:21:46 - INFO - __main__ - Step 50613: {'lr': 0.0003783003036913061, 'samples': 9717696, 'steps': 50612, 'loss/train': 1.2064554691314697} -11/07/2021 04:21:46 - INFO - __main__ - Step 50614: {'lr': 0.0003782957490518332, 'samples': 9717888, 'steps': 50613, 'loss/train': 1.362608551979065} -11/07/2021 04:21:47 - INFO - __main__ - Step 50615: {'lr': 0.00037829119435455226, 'samples': 9718080, 'steps': 50614, 'loss/train': 1.2910335063934326} -11/07/2021 04:21:47 - INFO - __main__ - Step 50616: {'lr': 0.00037828663959946527, 'samples': 9718272, 'steps': 50615, 'loss/train': 1.0467013120651245} -11/07/2021 04:21:48 - INFO - __main__ - Step 50617: {'lr': 0.0003782820847865743, 'samples': 9718464, 'steps': 50616, 'loss/train': 1.650442361831665} -11/07/2021 04:21:48 - INFO - __main__ - Step 50618: {'lr': 0.0003782775299158815, 'samples': 9718656, 'steps': 50617, 'loss/train': 0.8560373783111572} -11/07/2021 04:21:48 - INFO - __main__ - Step 50619: {'lr': 0.0003782729749873887, 'samples': 9718848, 'steps': 50618, 'loss/train': 1.4592068195343018} -11/07/2021 04:21:49 - INFO - __main__ - Step 50620: {'lr': 0.0003782684200010981, 'samples': 9719040, 'steps': 50619, 'loss/train': 1.7602537870407104} -11/07/2021 04:21:50 - INFO - __main__ - Step 50621: {'lr': 0.0003782638649570118, 'samples': 9719232, 'steps': 50620, 'loss/train': 1.3714299201965332} -11/07/2021 04:21:50 - INFO - __main__ - Step 50622: {'lr': 0.00037825930985513177, 'samples': 9719424, 'steps': 50621, 'loss/train': 1.1895204782485962} -11/07/2021 04:21:50 - INFO - __main__ - Step 50623: {'lr': 0.00037825475469546, 'samples': 9719616, 'steps': 50622, 'loss/train': 1.2780832052230835} -11/07/2021 04:21:51 - INFO - __main__ - Step 50624: {'lr': 0.00037825019947799863, 'samples': 9719808, 'steps': 50623, 'loss/train': 1.401994228363037} -11/07/2021 04:21:52 - INFO - __main__ - Step 50625: {'lr': 0.0003782456442027498, 'samples': 9720000, 'steps': 50624, 'loss/train': 2.208725929260254} -11/07/2021 04:21:52 - INFO - __main__ - Step 50626: {'lr': 0.0003782410888697153, 'samples': 9720192, 'steps': 50625, 'loss/train': 2.153963088989258} -11/07/2021 04:21:52 - INFO - __main__ - Step 50627: {'lr': 0.00037823653347889745, 'samples': 9720384, 'steps': 50626, 'loss/train': 0.7837381958961487} -11/07/2021 04:21:53 - INFO - __main__ - Step 50628: {'lr': 0.0003782319780302982, 'samples': 9720576, 'steps': 50627, 'loss/train': 1.6824977397918701} -11/07/2021 04:21:53 - INFO - __main__ - Step 50629: {'lr': 0.00037822742252391963, 'samples': 9720768, 'steps': 50628, 'loss/train': 1.5285260677337646} -11/07/2021 04:21:54 - INFO - __main__ - Step 50630: {'lr': 0.0003782228669597637, 'samples': 9720960, 'steps': 50629, 'loss/train': 0.8713791966438293} -11/07/2021 04:21:54 - INFO - __main__ - Step 50631: {'lr': 0.00037821831133783246, 'samples': 9721152, 'steps': 50630, 'loss/train': 1.676653265953064} -11/07/2021 04:21:55 - INFO - __main__ - Step 50632: {'lr': 0.00037821375565812816, 'samples': 9721344, 'steps': 50631, 'loss/train': 1.2008812427520752} -11/07/2021 04:21:55 - INFO - __main__ - Step 50633: {'lr': 0.00037820919992065263, 'samples': 9721536, 'steps': 50632, 'loss/train': 1.4452593326568604} -11/07/2021 04:21:55 - INFO - __main__ - Step 50634: {'lr': 0.00037820464412540805, 'samples': 9721728, 'steps': 50633, 'loss/train': 1.4773658514022827} -11/07/2021 04:21:56 - INFO - __main__ - Step 50635: {'lr': 0.0003782000882723965, 'samples': 9721920, 'steps': 50634, 'loss/train': 1.4276493787765503} -11/07/2021 04:21:57 - INFO - __main__ - Step 50636: {'lr': 0.00037819553236161985, 'samples': 9722112, 'steps': 50635, 'loss/train': 1.3189899921417236} -11/07/2021 04:21:57 - INFO - __main__ - Step 50637: {'lr': 0.0003781909763930803, 'samples': 9722304, 'steps': 50636, 'loss/train': 1.030458927154541} -11/07/2021 04:21:57 - INFO - __main__ - Step 50638: {'lr': 0.00037818642036677993, 'samples': 9722496, 'steps': 50637, 'loss/train': 1.0234310626983643} -11/07/2021 04:21:58 - INFO - __main__ - Step 50639: {'lr': 0.00037818186428272064, 'samples': 9722688, 'steps': 50638, 'loss/train': 1.3208693265914917} -11/07/2021 04:21:59 - INFO - __main__ - Step 50640: {'lr': 0.00037817730814090466, 'samples': 9722880, 'steps': 50639, 'loss/train': 1.2710895538330078} -11/07/2021 04:21:59 - INFO - __main__ - Step 50641: {'lr': 0.000378172751941334, 'samples': 9723072, 'steps': 50640, 'loss/train': 1.9764162302017212} -11/07/2021 04:22:00 - INFO - __main__ - Step 50642: {'lr': 0.0003781681956840106, 'samples': 9723264, 'steps': 50641, 'loss/train': 1.6260383129119873} -11/07/2021 04:22:00 - INFO - __main__ - Step 50643: {'lr': 0.0003781636393689366, 'samples': 9723456, 'steps': 50642, 'loss/train': 1.8933266401290894} -11/07/2021 04:22:00 - INFO - __main__ - Step 50644: {'lr': 0.0003781590829961141, 'samples': 9723648, 'steps': 50643, 'loss/train': 1.2901744842529297} -11/07/2021 04:22:01 - INFO - __main__ - Step 50645: {'lr': 0.000378154526565545, 'samples': 9723840, 'steps': 50644, 'loss/train': 1.571274757385254} -11/07/2021 04:22:02 - INFO - __main__ - Step 50646: {'lr': 0.00037814997007723153, 'samples': 9724032, 'steps': 50645, 'loss/train': 1.4527223110198975} -11/07/2021 04:22:02 - INFO - __main__ - Step 50647: {'lr': 0.0003781454135311756, 'samples': 9724224, 'steps': 50646, 'loss/train': 1.5039423704147339} -11/07/2021 04:22:02 - INFO - __main__ - Step 50648: {'lr': 0.0003781408569273794, 'samples': 9724416, 'steps': 50647, 'loss/train': 0.5214137434959412} -11/07/2021 04:22:03 - INFO - __main__ - Step 50649: {'lr': 0.0003781363002658448, 'samples': 9724608, 'steps': 50648, 'loss/train': 1.3853232860565186} -11/07/2021 04:22:03 - INFO - __main__ - Step 50650: {'lr': 0.000378131743546574, 'samples': 9724800, 'steps': 50649, 'loss/train': 1.7496758699417114} -11/07/2021 04:22:04 - INFO - __main__ - Step 50651: {'lr': 0.000378127186769569, 'samples': 9724992, 'steps': 50650, 'loss/train': 1.6479120254516602} -11/07/2021 04:22:05 - INFO - __main__ - Step 50652: {'lr': 0.00037812262993483194, 'samples': 9725184, 'steps': 50651, 'loss/train': 1.4466067552566528} -11/07/2021 04:22:05 - INFO - __main__ - Step 50653: {'lr': 0.0003781180730423648, 'samples': 9725376, 'steps': 50652, 'loss/train': 1.361926555633545} -11/07/2021 04:22:05 - INFO - __main__ - Step 50654: {'lr': 0.00037811351609216956, 'samples': 9725568, 'steps': 50653, 'loss/train': 1.057162880897522} -11/07/2021 04:22:06 - INFO - __main__ - Step 50655: {'lr': 0.00037810895908424837, 'samples': 9725760, 'steps': 50654, 'loss/train': 1.5812091827392578} -11/07/2021 04:22:07 - INFO - __main__ - Step 50656: {'lr': 0.0003781044020186033, 'samples': 9725952, 'steps': 50655, 'loss/train': 1.335661768913269} -11/07/2021 04:22:07 - INFO - __main__ - Step 50657: {'lr': 0.0003780998448952363, 'samples': 9726144, 'steps': 50656, 'loss/train': 1.419960856437683} -11/07/2021 04:22:07 - INFO - __main__ - Step 50658: {'lr': 0.0003780952877141495, 'samples': 9726336, 'steps': 50657, 'loss/train': 0.1022462397813797} -11/07/2021 04:22:08 - INFO - __main__ - Step 50659: {'lr': 0.0003780907304753449, 'samples': 9726528, 'steps': 50658, 'loss/train': 1.390694260597229} -11/07/2021 04:22:08 - INFO - __main__ - Step 50660: {'lr': 0.0003780861731788247, 'samples': 9726720, 'steps': 50659, 'loss/train': 1.6995733976364136} -11/07/2021 04:22:09 - INFO - __main__ - Step 50661: {'lr': 0.0003780816158245908, 'samples': 9726912, 'steps': 50660, 'loss/train': 1.3688750267028809} -11/07/2021 04:22:09 - INFO - __main__ - Step 50662: {'lr': 0.0003780770584126453, 'samples': 9727104, 'steps': 50661, 'loss/train': 1.521982192993164} -11/07/2021 04:22:10 - INFO - __main__ - Step 50663: {'lr': 0.0003780725009429903, 'samples': 9727296, 'steps': 50662, 'loss/train': 1.281760334968567} -11/07/2021 04:22:10 - INFO - __main__ - Step 50664: {'lr': 0.00037806794341562773, 'samples': 9727488, 'steps': 50663, 'loss/train': 0.08871020376682281} -11/07/2021 04:22:11 - INFO - __main__ - Step 50665: {'lr': 0.00037806338583055976, 'samples': 9727680, 'steps': 50664, 'loss/train': 1.4168148040771484} -11/07/2021 04:22:12 - INFO - __main__ - Step 50666: {'lr': 0.0003780588281877884, 'samples': 9727872, 'steps': 50665, 'loss/train': 1.6245907545089722} -11/07/2021 04:22:12 - INFO - __main__ - Step 50667: {'lr': 0.00037805427048731566, 'samples': 9728064, 'steps': 50666, 'loss/train': 1.5741922855377197} -11/07/2021 04:22:12 - INFO - __main__ - Step 50668: {'lr': 0.0003780497127291437, 'samples': 9728256, 'steps': 50667, 'loss/train': 1.537471055984497} -11/07/2021 04:22:13 - INFO - __main__ - Step 50669: {'lr': 0.0003780451549132745, 'samples': 9728448, 'steps': 50668, 'loss/train': 1.3848398923873901} -11/07/2021 04:22:13 - INFO - __main__ - Step 50670: {'lr': 0.00037804059703971016, 'samples': 9728640, 'steps': 50669, 'loss/train': 1.594283938407898} -11/07/2021 04:22:14 - INFO - __main__ - Step 50671: {'lr': 0.00037803603910845264, 'samples': 9728832, 'steps': 50670, 'loss/train': 0.884373664855957} -11/07/2021 04:22:14 - INFO - __main__ - Step 50672: {'lr': 0.00037803148111950407, 'samples': 9729024, 'steps': 50671, 'loss/train': 0.6188684701919556} -11/07/2021 04:22:15 - INFO - __main__ - Step 50673: {'lr': 0.0003780269230728665, 'samples': 9729216, 'steps': 50672, 'loss/train': 1.2383602857589722} -11/07/2021 04:22:15 - INFO - __main__ - Step 50674: {'lr': 0.000378022364968542, 'samples': 9729408, 'steps': 50673, 'loss/train': 1.4449785947799683} -11/07/2021 04:22:15 - INFO - __main__ - Step 50675: {'lr': 0.00037801780680653263, 'samples': 9729600, 'steps': 50674, 'loss/train': 1.3962541818618774} -11/07/2021 04:22:16 - INFO - __main__ - Step 50676: {'lr': 0.0003780132485868403, 'samples': 9729792, 'steps': 50675, 'loss/train': 1.3470677137374878} -11/07/2021 04:22:17 - INFO - __main__ - Step 50677: {'lr': 0.0003780086903094673, 'samples': 9729984, 'steps': 50676, 'loss/train': 1.3629646301269531} -11/07/2021 04:22:17 - INFO - __main__ - Step 50678: {'lr': 0.0003780041319744154, 'samples': 9730176, 'steps': 50677, 'loss/train': 1.3893108367919922} -11/07/2021 04:22:17 - INFO - __main__ - Step 50679: {'lr': 0.00037799957358168693, 'samples': 9730368, 'steps': 50678, 'loss/train': 1.2100180387496948} -11/07/2021 04:22:18 - INFO - __main__ - Step 50680: {'lr': 0.0003779950151312838, 'samples': 9730560, 'steps': 50679, 'loss/train': 1.3467028141021729} -11/07/2021 04:22:19 - INFO - __main__ - Step 50681: {'lr': 0.0003779904566232081, 'samples': 9730752, 'steps': 50680, 'loss/train': 1.2199546098709106} -11/07/2021 04:22:19 - INFO - __main__ - Step 50682: {'lr': 0.0003779858980574619, 'samples': 9730944, 'steps': 50681, 'loss/train': 1.311398983001709} -11/07/2021 04:22:20 - INFO - __main__ - Step 50683: {'lr': 0.0003779813394340472, 'samples': 9731136, 'steps': 50682, 'loss/train': 1.609716534614563} -11/07/2021 04:22:20 - INFO - __main__ - Step 50684: {'lr': 0.0003779767807529661, 'samples': 9731328, 'steps': 50683, 'loss/train': 1.0118694305419922} -11/07/2021 04:22:20 - INFO - __main__ - Step 50685: {'lr': 0.0003779722220142206, 'samples': 9731520, 'steps': 50684, 'loss/train': 1.3198235034942627} -11/07/2021 04:22:21 - INFO - __main__ - Step 50686: {'lr': 0.00037796766321781286, 'samples': 9731712, 'steps': 50685, 'loss/train': 1.7070567607879639} -11/07/2021 04:22:22 - INFO - __main__ - Step 50687: {'lr': 0.00037796310436374474, 'samples': 9731904, 'steps': 50686, 'loss/train': 3.05145525932312} -11/07/2021 04:22:22 - INFO - __main__ - Step 50688: {'lr': 0.0003779585454520186, 'samples': 9732096, 'steps': 50687, 'loss/train': 1.5338678359985352} -11/07/2021 04:22:22 - INFO - __main__ - Step 50689: {'lr': 0.0003779539864826362, 'samples': 9732288, 'steps': 50688, 'loss/train': 1.711365818977356} -11/07/2021 04:22:23 - INFO - __main__ - Step 50690: {'lr': 0.0003779494274555997, 'samples': 9732480, 'steps': 50689, 'loss/train': 1.7390422821044922} -11/07/2021 04:22:24 - INFO - __main__ - Step 50691: {'lr': 0.0003779448683709111, 'samples': 9732672, 'steps': 50690, 'loss/train': 1.5304346084594727} -11/07/2021 04:22:24 - INFO - __main__ - Step 50692: {'lr': 0.0003779403092285727, 'samples': 9732864, 'steps': 50691, 'loss/train': 1.2473922967910767} -11/07/2021 04:22:24 - INFO - __main__ - Step 50693: {'lr': 0.00037793575002858625, 'samples': 9733056, 'steps': 50692, 'loss/train': 1.4359720945358276} -11/07/2021 04:22:25 - INFO - __main__ - Step 50694: {'lr': 0.00037793119077095396, 'samples': 9733248, 'steps': 50693, 'loss/train': 1.259575605392456} -11/07/2021 04:22:25 - INFO - __main__ - Step 50695: {'lr': 0.00037792663145567784, 'samples': 9733440, 'steps': 50694, 'loss/train': 1.3352851867675781} -11/07/2021 04:22:26 - INFO - __main__ - Step 50696: {'lr': 0.00037792207208275995, 'samples': 9733632, 'steps': 50695, 'loss/train': 2.020500659942627} -11/07/2021 04:22:27 - INFO - __main__ - Step 50697: {'lr': 0.0003779175126522023, 'samples': 9733824, 'steps': 50696, 'loss/train': 1.638195514678955} -11/07/2021 04:22:27 - INFO - __main__ - Step 50698: {'lr': 0.0003779129531640071, 'samples': 9734016, 'steps': 50697, 'loss/train': 1.8014445304870605} -11/07/2021 04:22:27 - INFO - __main__ - Step 50699: {'lr': 0.0003779083936181762, 'samples': 9734208, 'steps': 50698, 'loss/train': 1.3109745979309082} -11/07/2021 04:22:28 - INFO - __main__ - Step 50700: {'lr': 0.0003779038340147118, 'samples': 9734400, 'steps': 50699, 'loss/train': 1.7507801055908203} -11/07/2021 04:22:29 - INFO - __main__ - Step 50701: {'lr': 0.0003778992743536159, 'samples': 9734592, 'steps': 50700, 'loss/train': 1.6560417413711548} -11/07/2021 04:22:29 - INFO - __main__ - Step 50702: {'lr': 0.0003778947146348906, 'samples': 9734784, 'steps': 50701, 'loss/train': 1.7197080850601196} -11/07/2021 04:22:29 - INFO - __main__ - Step 50703: {'lr': 0.00037789015485853786, 'samples': 9734976, 'steps': 50702, 'loss/train': 1.6700061559677124} -11/07/2021 04:22:30 - INFO - __main__ - Step 50704: {'lr': 0.0003778855950245598, 'samples': 9735168, 'steps': 50703, 'loss/train': 1.8428999185562134} -11/07/2021 04:22:30 - INFO - __main__ - Step 50705: {'lr': 0.00037788103513295844, 'samples': 9735360, 'steps': 50704, 'loss/train': 1.0536830425262451} -11/07/2021 04:22:31 - INFO - __main__ - Step 50706: {'lr': 0.00037787647518373586, 'samples': 9735552, 'steps': 50705, 'loss/train': 1.2545115947723389} -11/07/2021 04:22:31 - INFO - __main__ - Step 50707: {'lr': 0.0003778719151768941, 'samples': 9735744, 'steps': 50706, 'loss/train': 1.4495525360107422} -11/07/2021 04:22:32 - INFO - __main__ - Step 50708: {'lr': 0.0003778673551124353, 'samples': 9735936, 'steps': 50707, 'loss/train': 0.7083872556686401} -11/07/2021 04:22:32 - INFO - __main__ - Step 50709: {'lr': 0.0003778627949903615, 'samples': 9736128, 'steps': 50708, 'loss/train': 1.3951613903045654} -11/07/2021 04:22:33 - INFO - __main__ - Step 50710: {'lr': 0.00037785823481067455, 'samples': 9736320, 'steps': 50709, 'loss/train': 1.2276339530944824} -11/07/2021 04:22:33 - INFO - __main__ - Step 50711: {'lr': 0.0003778536745733767, 'samples': 9736512, 'steps': 50710, 'loss/train': 1.5364985466003418} -11/07/2021 04:22:34 - INFO - __main__ - Step 50712: {'lr': 0.00037784911427846997, 'samples': 9736704, 'steps': 50711, 'loss/train': 0.06656911224126816} -11/07/2021 04:22:34 - INFO - __main__ - Step 50713: {'lr': 0.0003778445539259564, 'samples': 9736896, 'steps': 50712, 'loss/train': 1.4633636474609375} -11/07/2021 04:22:35 - INFO - __main__ - Step 50714: {'lr': 0.000377839993515838, 'samples': 9737088, 'steps': 50713, 'loss/train': 1.334006667137146} -11/07/2021 04:22:35 - INFO - __main__ - Step 50715: {'lr': 0.000377835433048117, 'samples': 9737280, 'steps': 50714, 'loss/train': 1.427729606628418} -11/07/2021 04:22:35 - INFO - __main__ - Step 50716: {'lr': 0.00037783087252279523, 'samples': 9737472, 'steps': 50715, 'loss/train': 1.0502132177352905} -11/07/2021 04:22:36 - INFO - __main__ - Step 50717: {'lr': 0.0003778263119398748, 'samples': 9737664, 'steps': 50716, 'loss/train': 1.142493486404419} -11/07/2021 04:22:37 - INFO - __main__ - Step 50718: {'lr': 0.00037782175129935793, 'samples': 9737856, 'steps': 50717, 'loss/train': 1.661091923713684} -11/07/2021 04:22:37 - INFO - __main__ - Step 50719: {'lr': 0.0003778171906012464, 'samples': 9738048, 'steps': 50718, 'loss/train': 1.5472112894058228} -11/07/2021 04:22:37 - INFO - __main__ - Step 50720: {'lr': 0.0003778126298455425, 'samples': 9738240, 'steps': 50719, 'loss/train': 0.9596140384674072} -11/07/2021 04:22:38 - INFO - __main__ - Step 50721: {'lr': 0.0003778080690322483, 'samples': 9738432, 'steps': 50720, 'loss/train': 1.7238438129425049} -11/07/2021 04:22:39 - INFO - __main__ - Step 50722: {'lr': 0.0003778035081613656, 'samples': 9738624, 'steps': 50721, 'loss/train': 0.9496026635169983} -11/07/2021 04:22:39 - INFO - __main__ - Step 50723: {'lr': 0.00037779894723289666, 'samples': 9738816, 'steps': 50722, 'loss/train': 0.970390260219574} -11/07/2021 04:22:39 - INFO - __main__ - Step 50724: {'lr': 0.00037779438624684346, 'samples': 9739008, 'steps': 50723, 'loss/train': 1.4665848016738892} -11/07/2021 04:22:40 - INFO - __main__ - Step 50725: {'lr': 0.00037778982520320813, 'samples': 9739200, 'steps': 50724, 'loss/train': 1.033931851387024} -11/07/2021 04:22:40 - INFO - __main__ - Step 50726: {'lr': 0.00037778526410199266, 'samples': 9739392, 'steps': 50725, 'loss/train': 1.2364975214004517} -11/07/2021 04:22:41 - INFO - __main__ - Step 50727: {'lr': 0.0003777807029431992, 'samples': 9739584, 'steps': 50726, 'loss/train': 0.11913690716028214} -11/07/2021 04:22:42 - INFO - __main__ - Step 50728: {'lr': 0.0003777761417268296, 'samples': 9739776, 'steps': 50727, 'loss/train': 1.2327946424484253} -11/07/2021 04:22:42 - INFO - __main__ - Step 50729: {'lr': 0.00037777158045288606, 'samples': 9739968, 'steps': 50728, 'loss/train': 1.6647366285324097} -11/07/2021 04:22:42 - INFO - __main__ - Step 50730: {'lr': 0.00037776701912137066, 'samples': 9740160, 'steps': 50729, 'loss/train': 1.1865135431289673} -11/07/2021 04:22:43 - INFO - __main__ - Step 50731: {'lr': 0.00037776245773228547, 'samples': 9740352, 'steps': 50730, 'loss/train': 0.562919020652771} -11/07/2021 04:22:43 - INFO - __main__ - Step 50732: {'lr': 0.0003777578962856324, 'samples': 9740544, 'steps': 50731, 'loss/train': 1.2084091901779175} -11/07/2021 04:22:44 - INFO - __main__ - Step 50733: {'lr': 0.0003777533347814136, 'samples': 9740736, 'steps': 50732, 'loss/train': 1.3344764709472656} -11/07/2021 04:22:44 - INFO - __main__ - Step 50734: {'lr': 0.0003777487732196312, 'samples': 9740928, 'steps': 50733, 'loss/train': 1.5014675855636597} -11/07/2021 04:22:45 - INFO - __main__ - Step 50735: {'lr': 0.00037774421160028705, 'samples': 9741120, 'steps': 50734, 'loss/train': 1.603287935256958} -11/07/2021 04:22:45 - INFO - __main__ - Step 50736: {'lr': 0.0003777396499233834, 'samples': 9741312, 'steps': 50735, 'loss/train': 2.493743658065796} -11/07/2021 04:22:45 - INFO - __main__ - Step 50737: {'lr': 0.00037773508818892223, 'samples': 9741504, 'steps': 50736, 'loss/train': 1.6289881467819214} -11/07/2021 04:22:46 - INFO - __main__ - Step 50738: {'lr': 0.0003777305263969056, 'samples': 9741696, 'steps': 50737, 'loss/train': 1.4261382818222046} -11/07/2021 04:22:47 - INFO - __main__ - Step 50739: {'lr': 0.00037772596454733554, 'samples': 9741888, 'steps': 50738, 'loss/train': 1.0800403356552124} -11/07/2021 04:22:47 - INFO - __main__ - Step 50740: {'lr': 0.00037772140264021416, 'samples': 9742080, 'steps': 50739, 'loss/train': 1.165719747543335} -11/07/2021 04:22:47 - INFO - __main__ - Step 50741: {'lr': 0.00037771684067554345, 'samples': 9742272, 'steps': 50740, 'loss/train': 1.4455782175064087} -11/07/2021 04:22:48 - INFO - __main__ - Step 50742: {'lr': 0.0003777122786533255, 'samples': 9742464, 'steps': 50741, 'loss/train': 1.5963486433029175} -11/07/2021 04:22:49 - INFO - __main__ - Step 50743: {'lr': 0.0003777077165735625, 'samples': 9742656, 'steps': 50742, 'loss/train': 1.311700463294983} -11/07/2021 04:22:49 - INFO - __main__ - Step 50744: {'lr': 0.0003777031544362562, 'samples': 9742848, 'steps': 50743, 'loss/train': 1.2413666248321533} -11/07/2021 04:22:50 - INFO - __main__ - Step 50745: {'lr': 0.0003776985922414089, 'samples': 9743040, 'steps': 50744, 'loss/train': 1.693814754486084} -11/07/2021 04:22:50 - INFO - __main__ - Step 50746: {'lr': 0.0003776940299890226, 'samples': 9743232, 'steps': 50745, 'loss/train': 1.498221516609192} -11/07/2021 04:22:50 - INFO - __main__ - Step 50747: {'lr': 0.0003776894676790993, 'samples': 9743424, 'steps': 50746, 'loss/train': 0.10506287217140198} -11/07/2021 04:22:51 - INFO - __main__ - Step 50748: {'lr': 0.0003776849053116411, 'samples': 9743616, 'steps': 50747, 'loss/train': 1.1215659379959106} -11/07/2021 04:22:52 - INFO - __main__ - Step 50749: {'lr': 0.00037768034288665015, 'samples': 9743808, 'steps': 50748, 'loss/train': 1.410152554512024} -11/07/2021 04:22:52 - INFO - __main__ - Step 50750: {'lr': 0.0003776757804041283, 'samples': 9744000, 'steps': 50749, 'loss/train': 1.4149744510650635} -11/07/2021 04:22:52 - INFO - __main__ - Step 50751: {'lr': 0.00037767121786407774, 'samples': 9744192, 'steps': 50750, 'loss/train': 1.5454553365707397} -11/07/2021 04:22:53 - INFO - __main__ - Step 50752: {'lr': 0.00037766665526650054, 'samples': 9744384, 'steps': 50751, 'loss/train': 1.801805019378662} -11/07/2021 04:22:54 - INFO - __main__ - Step 50753: {'lr': 0.0003776620926113986, 'samples': 9744576, 'steps': 50752, 'loss/train': 1.524074912071228} -11/07/2021 04:22:54 - INFO - __main__ - Step 50754: {'lr': 0.0003776575298987742, 'samples': 9744768, 'steps': 50753, 'loss/train': 1.9182108640670776} -11/07/2021 04:22:54 - INFO - __main__ - Step 50755: {'lr': 0.00037765296712862927, 'samples': 9744960, 'steps': 50754, 'loss/train': 1.1489320993423462} -11/07/2021 04:22:55 - INFO - __main__ - Step 50756: {'lr': 0.00037764840430096593, 'samples': 9745152, 'steps': 50755, 'loss/train': 0.532424807548523} -11/07/2021 04:22:55 - INFO - __main__ - Step 50757: {'lr': 0.0003776438414157861, 'samples': 9745344, 'steps': 50756, 'loss/train': 1.3537510633468628} -11/07/2021 04:22:56 - INFO - __main__ - Step 50758: {'lr': 0.00037763927847309195, 'samples': 9745536, 'steps': 50757, 'loss/train': 0.9443285465240479} -11/07/2021 04:22:57 - INFO - __main__ - Step 50759: {'lr': 0.00037763471547288554, 'samples': 9745728, 'steps': 50758, 'loss/train': 1.5967708826065063} -11/07/2021 04:22:57 - INFO - __main__ - Step 50760: {'lr': 0.00037763015241516887, 'samples': 9745920, 'steps': 50759, 'loss/train': 1.276456356048584} -11/07/2021 04:22:57 - INFO - __main__ - Step 50761: {'lr': 0.00037762558929994394, 'samples': 9746112, 'steps': 50760, 'loss/train': 1.8176703453063965} -11/07/2021 04:22:58 - INFO - __main__ - Step 50762: {'lr': 0.00037762102612721305, 'samples': 9746304, 'steps': 50761, 'loss/train': 0.9380192160606384} -11/07/2021 04:22:59 - INFO - __main__ - Step 50763: {'lr': 0.00037761646289697796, 'samples': 9746496, 'steps': 50762, 'loss/train': 1.3880196809768677} -11/07/2021 04:22:59 - INFO - __main__ - Step 50764: {'lr': 0.0003776118996092409, 'samples': 9746688, 'steps': 50763, 'loss/train': 1.337918758392334} -11/07/2021 04:22:59 - INFO - __main__ - Step 50765: {'lr': 0.00037760733626400396, 'samples': 9746880, 'steps': 50764, 'loss/train': 1.2872546911239624} -11/07/2021 04:23:00 - INFO - __main__ - Step 50766: {'lr': 0.00037760277286126906, 'samples': 9747072, 'steps': 50765, 'loss/train': 1.5700017213821411} -11/07/2021 04:23:00 - INFO - __main__ - Step 50767: {'lr': 0.00037759820940103827, 'samples': 9747264, 'steps': 50766, 'loss/train': 1.6338597536087036} -11/07/2021 04:23:00 - INFO - __main__ - Step 50768: {'lr': 0.0003775936458833138, 'samples': 9747456, 'steps': 50767, 'loss/train': 0.943385124206543} -11/07/2021 04:23:01 - INFO - __main__ - Step 50769: {'lr': 0.00037758908230809757, 'samples': 9747648, 'steps': 50768, 'loss/train': 1.0664221048355103} -11/07/2021 04:23:02 - INFO - __main__ - Step 50770: {'lr': 0.0003775845186753917, 'samples': 9747840, 'steps': 50769, 'loss/train': 1.719895362854004} -11/07/2021 04:23:02 - INFO - __main__ - Step 50771: {'lr': 0.00037757995498519814, 'samples': 9748032, 'steps': 50770, 'loss/train': 1.3944305181503296} -11/07/2021 04:23:02 - INFO - __main__ - Step 50772: {'lr': 0.00037757539123751906, 'samples': 9748224, 'steps': 50771, 'loss/train': 1.4768362045288086} -11/07/2021 04:23:03 - INFO - __main__ - Step 50773: {'lr': 0.00037757082743235644, 'samples': 9748416, 'steps': 50772, 'loss/train': 1.4655301570892334} -11/07/2021 04:23:04 - INFO - __main__ - Step 50774: {'lr': 0.00037756626356971236, 'samples': 9748608, 'steps': 50773, 'loss/train': 0.987450897693634} -11/07/2021 04:23:04 - INFO - __main__ - Step 50775: {'lr': 0.00037756169964958897, 'samples': 9748800, 'steps': 50774, 'loss/train': 1.2702594995498657} -11/07/2021 04:23:04 - INFO - __main__ - Step 50776: {'lr': 0.00037755713567198823, 'samples': 9748992, 'steps': 50775, 'loss/train': 1.52090585231781} -11/07/2021 04:23:05 - INFO - __main__ - Step 50777: {'lr': 0.00037755257163691214, 'samples': 9749184, 'steps': 50776, 'loss/train': 1.83846116065979} -11/07/2021 04:23:05 - INFO - __main__ - Step 50778: {'lr': 0.00037754800754436293, 'samples': 9749376, 'steps': 50777, 'loss/train': 1.0825878381729126} -11/07/2021 04:23:06 - INFO - __main__ - Step 50779: {'lr': 0.0003775434433943425, 'samples': 9749568, 'steps': 50778, 'loss/train': 1.220787763595581} -11/07/2021 04:23:06 - INFO - __main__ - Step 50780: {'lr': 0.00037753887918685295, 'samples': 9749760, 'steps': 50779, 'loss/train': 1.7025530338287354} -11/07/2021 04:23:07 - INFO - __main__ - Step 50781: {'lr': 0.0003775343149218964, 'samples': 9749952, 'steps': 50780, 'loss/train': 1.3414987325668335} -11/07/2021 04:23:07 - INFO - __main__ - Step 50782: {'lr': 0.0003775297505994748, 'samples': 9750144, 'steps': 50781, 'loss/train': 1.3007538318634033} -11/07/2021 04:23:07 - INFO - __main__ - Step 50783: {'lr': 0.0003775251862195903, 'samples': 9750336, 'steps': 50782, 'loss/train': 1.2600034475326538} -11/07/2021 04:23:09 - INFO - __main__ - Step 50784: {'lr': 0.0003775206217822449, 'samples': 9750528, 'steps': 50783, 'loss/train': 1.5636194944381714} -11/07/2021 04:23:09 - INFO - __main__ - Step 50785: {'lr': 0.00037751605728744063, 'samples': 9750720, 'steps': 50784, 'loss/train': 1.5546804666519165} -11/07/2021 04:23:09 - INFO - __main__ - Step 50786: {'lr': 0.0003775114927351797, 'samples': 9750912, 'steps': 50785, 'loss/train': 1.2205405235290527} -11/07/2021 04:23:10 - INFO - __main__ - Step 50787: {'lr': 0.00037750692812546396, 'samples': 9751104, 'steps': 50786, 'loss/train': 1.3504419326782227} -11/07/2021 04:23:10 - INFO - __main__ - Step 50788: {'lr': 0.00037750236345829557, 'samples': 9751296, 'steps': 50787, 'loss/train': 1.6261910200119019} -11/07/2021 04:23:11 - INFO - __main__ - Step 50789: {'lr': 0.0003774977987336767, 'samples': 9751488, 'steps': 50788, 'loss/train': 1.0199942588806152} -11/07/2021 04:23:11 - INFO - __main__ - Step 50790: {'lr': 0.0003774932339516092, 'samples': 9751680, 'steps': 50789, 'loss/train': 1.037049651145935} -11/07/2021 04:23:12 - INFO - __main__ - Step 50791: {'lr': 0.00037748866911209525, 'samples': 9751872, 'steps': 50790, 'loss/train': 1.5314488410949707} -11/07/2021 04:23:12 - INFO - __main__ - Step 50792: {'lr': 0.00037748410421513677, 'samples': 9752064, 'steps': 50791, 'loss/train': 0.8069332838058472} -11/07/2021 04:23:12 - INFO - __main__ - Step 50793: {'lr': 0.000377479539260736, 'samples': 9752256, 'steps': 50792, 'loss/train': 1.3279070854187012} -11/07/2021 04:23:13 - INFO - __main__ - Step 50794: {'lr': 0.0003774749742488949, 'samples': 9752448, 'steps': 50793, 'loss/train': 1.1581848859786987} -11/07/2021 04:23:14 - INFO - __main__ - Step 50795: {'lr': 0.0003774704091796156, 'samples': 9752640, 'steps': 50794, 'loss/train': 1.2445685863494873} -11/07/2021 04:23:14 - INFO - __main__ - Step 50796: {'lr': 0.00037746584405290006, 'samples': 9752832, 'steps': 50795, 'loss/train': 1.3859024047851562} -11/07/2021 04:23:14 - INFO - __main__ - Step 50797: {'lr': 0.00037746127886875035, 'samples': 9753024, 'steps': 50796, 'loss/train': 1.5053210258483887} -11/07/2021 04:23:15 - INFO - __main__ - Step 50798: {'lr': 0.0003774567136271686, 'samples': 9753216, 'steps': 50797, 'loss/train': 1.9043644666671753} -11/07/2021 04:23:16 - INFO - __main__ - Step 50799: {'lr': 0.0003774521483281568, 'samples': 9753408, 'steps': 50798, 'loss/train': 1.689976692199707} -11/07/2021 04:23:16 - INFO - __main__ - Step 50800: {'lr': 0.00037744758297171706, 'samples': 9753600, 'steps': 50799, 'loss/train': 1.27703058719635} -11/07/2021 04:23:17 - INFO - __main__ - Step 50801: {'lr': 0.00037744301755785137, 'samples': 9753792, 'steps': 50800, 'loss/train': 1.5397943258285522} -11/07/2021 04:23:17 - INFO - __main__ - Step 50802: {'lr': 0.0003774384520865618, 'samples': 9753984, 'steps': 50801, 'loss/train': 1.4204710721969604} -11/07/2021 04:23:17 - INFO - __main__ - Step 50803: {'lr': 0.0003774338865578505, 'samples': 9754176, 'steps': 50802, 'loss/train': 1.2714866399765015} -11/07/2021 04:23:18 - INFO - __main__ - Step 50804: {'lr': 0.00037742932097171945, 'samples': 9754368, 'steps': 50803, 'loss/train': 1.2413955926895142} -11/07/2021 04:23:19 - INFO - __main__ - Step 50805: {'lr': 0.0003774247553281707, 'samples': 9754560, 'steps': 50804, 'loss/train': 1.5885212421417236} -11/07/2021 04:23:19 - INFO - __main__ - Step 50806: {'lr': 0.00037742018962720625, 'samples': 9754752, 'steps': 50805, 'loss/train': 1.8339276313781738} -11/07/2021 04:23:19 - INFO - __main__ - Step 50807: {'lr': 0.0003774156238688282, 'samples': 9754944, 'steps': 50806, 'loss/train': 1.2531362771987915} -11/07/2021 04:23:20 - INFO - __main__ - Step 50808: {'lr': 0.00037741105805303874, 'samples': 9755136, 'steps': 50807, 'loss/train': 1.233770489692688} -11/07/2021 04:23:21 - INFO - __main__ - Step 50809: {'lr': 0.0003774064921798399, 'samples': 9755328, 'steps': 50808, 'loss/train': 1.383651614189148} -11/07/2021 04:23:21 - INFO - __main__ - Step 50810: {'lr': 0.00037740192624923354, 'samples': 9755520, 'steps': 50809, 'loss/train': 1.0668141841888428} -11/07/2021 04:23:22 - INFO - __main__ - Step 50811: {'lr': 0.00037739736026122186, 'samples': 9755712, 'steps': 50810, 'loss/train': 1.4635947942733765} -11/07/2021 04:23:22 - INFO - __main__ - Step 50812: {'lr': 0.00037739279421580683, 'samples': 9755904, 'steps': 50811, 'loss/train': 1.1940083503723145} -11/07/2021 04:23:22 - INFO - __main__ - Step 50813: {'lr': 0.00037738822811299067, 'samples': 9756096, 'steps': 50812, 'loss/train': 1.7556402683258057} -11/07/2021 04:23:23 - INFO - __main__ - Step 50814: {'lr': 0.00037738366195277527, 'samples': 9756288, 'steps': 50813, 'loss/train': 1.406965970993042} -11/07/2021 04:23:24 - INFO - __main__ - Step 50815: {'lr': 0.0003773790957351628, 'samples': 9756480, 'steps': 50814, 'loss/train': 1.1583935022354126} -11/07/2021 04:23:24 - INFO - __main__ - Step 50816: {'lr': 0.00037737452946015533, 'samples': 9756672, 'steps': 50815, 'loss/train': 1.148431420326233} -11/07/2021 04:23:24 - INFO - __main__ - Step 50817: {'lr': 0.0003773699631277548, 'samples': 9756864, 'steps': 50816, 'loss/train': 1.3440370559692383} -11/07/2021 04:23:25 - INFO - __main__ - Step 50818: {'lr': 0.00037736539673796334, 'samples': 9757056, 'steps': 50817, 'loss/train': 1.1187483072280884} -11/07/2021 04:23:26 - INFO - __main__ - Step 50819: {'lr': 0.00037736083029078294, 'samples': 9757248, 'steps': 50818, 'loss/train': 1.1490564346313477} -11/07/2021 04:23:27 - INFO - __main__ - Step 50820: {'lr': 0.00037735626378621577, 'samples': 9757440, 'steps': 50819, 'loss/train': 1.4225025177001953} -11/07/2021 04:23:27 - INFO - __main__ - Step 50821: {'lr': 0.00037735169722426384, 'samples': 9757632, 'steps': 50820, 'loss/train': 5.91687536239624} -11/07/2021 04:23:27 - INFO - __main__ - Step 50822: {'lr': 0.0003773471306049292, 'samples': 9757824, 'steps': 50821, 'loss/train': 5.8392863273620605} -11/07/2021 04:23:28 - INFO - __main__ - Step 50823: {'lr': 0.00037734256392821393, 'samples': 9758016, 'steps': 50822, 'loss/train': 0.9705638289451599} -11/07/2021 04:23:28 - INFO - __main__ - Step 50824: {'lr': 0.00037733799719411997, 'samples': 9758208, 'steps': 50823, 'loss/train': 1.161920428276062} -11/07/2021 04:23:28 - INFO - __main__ - Step 50825: {'lr': 0.00037733343040264954, 'samples': 9758400, 'steps': 50824, 'loss/train': 2.0557708740234375} -11/07/2021 04:23:29 - INFO - __main__ - Step 50826: {'lr': 0.00037732886355380465, 'samples': 9758592, 'steps': 50825, 'loss/train': 1.666393518447876} -11/07/2021 04:23:30 - INFO - __main__ - Step 50827: {'lr': 0.00037732429664758725, 'samples': 9758784, 'steps': 50826, 'loss/train': 1.5360578298568726} -11/07/2021 04:23:30 - INFO - __main__ - Step 50828: {'lr': 0.0003773197296839996, 'samples': 9758976, 'steps': 50827, 'loss/train': 1.7051162719726562} -11/07/2021 04:23:30 - INFO - __main__ - Step 50829: {'lr': 0.00037731516266304355, 'samples': 9759168, 'steps': 50828, 'loss/train': 1.089630365371704} -11/07/2021 04:23:31 - INFO - __main__ - Step 50830: {'lr': 0.00037731059558472136, 'samples': 9759360, 'steps': 50829, 'loss/train': 1.4240920543670654} -11/07/2021 04:23:32 - INFO - __main__ - Step 50831: {'lr': 0.00037730602844903495, 'samples': 9759552, 'steps': 50830, 'loss/train': 1.5600533485412598} -11/07/2021 04:23:32 - INFO - __main__ - Step 50832: {'lr': 0.00037730146125598634, 'samples': 9759744, 'steps': 50831, 'loss/train': 1.3985621929168701} -11/07/2021 04:23:32 - INFO - __main__ - Step 50833: {'lr': 0.0003772968940055777, 'samples': 9759936, 'steps': 50832, 'loss/train': 1.2548178434371948} -11/07/2021 04:23:33 - INFO - __main__ - Step 50834: {'lr': 0.000377292326697811, 'samples': 9760128, 'steps': 50833, 'loss/train': 0.6145873665809631} -11/07/2021 04:23:33 - INFO - __main__ - Step 50835: {'lr': 0.00037728775933268844, 'samples': 9760320, 'steps': 50834, 'loss/train': 1.3260642290115356} -11/07/2021 04:23:34 - INFO - __main__ - Step 50836: {'lr': 0.0003772831919102119, 'samples': 9760512, 'steps': 50835, 'loss/train': 1.3751753568649292} -11/07/2021 04:23:35 - INFO - __main__ - Step 50837: {'lr': 0.00037727862443038353, 'samples': 9760704, 'steps': 50836, 'loss/train': 1.3612593412399292} -11/07/2021 04:23:35 - INFO - __main__ - Step 50838: {'lr': 0.00037727405689320535, 'samples': 9760896, 'steps': 50837, 'loss/train': 1.3940775394439697} -11/07/2021 04:23:35 - INFO - __main__ - Step 50839: {'lr': 0.00037726948929867955, 'samples': 9761088, 'steps': 50838, 'loss/train': 1.1814788579940796} -11/07/2021 04:23:36 - INFO - __main__ - Step 50840: {'lr': 0.00037726492164680796, 'samples': 9761280, 'steps': 50839, 'loss/train': 0.9084142446517944} -11/07/2021 04:23:37 - INFO - __main__ - Step 50841: {'lr': 0.00037726035393759286, 'samples': 9761472, 'steps': 50840, 'loss/train': 1.009061574935913} -11/07/2021 04:23:37 - INFO - __main__ - Step 50842: {'lr': 0.00037725578617103605, 'samples': 9761664, 'steps': 50841, 'loss/train': 1.5422435998916626} -11/07/2021 04:23:38 - INFO - __main__ - Step 50843: {'lr': 0.00037725121834713995, 'samples': 9761856, 'steps': 50842, 'loss/train': 0.6560593247413635} -11/07/2021 04:23:38 - INFO - __main__ - Step 50844: {'lr': 0.0003772466504659063, 'samples': 9762048, 'steps': 50843, 'loss/train': 1.5334835052490234} -11/07/2021 04:23:38 - INFO - __main__ - Step 50845: {'lr': 0.00037724208252733725, 'samples': 9762240, 'steps': 50844, 'loss/train': 1.6152210235595703} -11/07/2021 04:23:39 - INFO - __main__ - Step 50846: {'lr': 0.000377237514531435, 'samples': 9762432, 'steps': 50845, 'loss/train': 0.46458733081817627} -11/07/2021 04:23:40 - INFO - __main__ - Step 50847: {'lr': 0.0003772329464782014, 'samples': 9762624, 'steps': 50846, 'loss/train': 0.9685691595077515} -11/07/2021 04:23:40 - INFO - __main__ - Step 50848: {'lr': 0.00037722837836763856, 'samples': 9762816, 'steps': 50847, 'loss/train': 1.5266244411468506} -11/07/2021 04:23:40 - INFO - __main__ - Step 50849: {'lr': 0.0003772238101997486, 'samples': 9763008, 'steps': 50848, 'loss/train': 1.5096989870071411} -11/07/2021 04:23:41 - INFO - __main__ - Step 50850: {'lr': 0.0003772192419745336, 'samples': 9763200, 'steps': 50849, 'loss/train': 1.3950402736663818} -11/07/2021 04:23:41 - INFO - __main__ - Step 50851: {'lr': 0.0003772146736919956, 'samples': 9763392, 'steps': 50850, 'loss/train': 1.409664511680603} -11/07/2021 04:23:42 - INFO - __main__ - Step 50852: {'lr': 0.0003772101053521366, 'samples': 9763584, 'steps': 50851, 'loss/train': 0.7390536665916443} -11/07/2021 04:23:43 - INFO - __main__ - Step 50853: {'lr': 0.0003772055369549586, 'samples': 9763776, 'steps': 50852, 'loss/train': 1.3061412572860718} -11/07/2021 04:23:43 - INFO - __main__ - Step 50854: {'lr': 0.0003772009685004638, 'samples': 9763968, 'steps': 50853, 'loss/train': 1.6045711040496826} -11/07/2021 04:23:43 - INFO - __main__ - Step 50855: {'lr': 0.0003771963999886543, 'samples': 9764160, 'steps': 50854, 'loss/train': 1.455470323562622} -11/07/2021 04:23:44 - INFO - __main__ - Step 50856: {'lr': 0.000377191831419532, 'samples': 9764352, 'steps': 50855, 'loss/train': 1.2654258012771606} -11/07/2021 04:23:45 - INFO - __main__ - Step 50857: {'lr': 0.000377187262793099, 'samples': 9764544, 'steps': 50856, 'loss/train': 0.07830142974853516} -11/07/2021 04:23:45 - INFO - __main__ - Step 50858: {'lr': 0.0003771826941093574, 'samples': 9764736, 'steps': 50857, 'loss/train': 1.545218586921692} -11/07/2021 04:23:45 - INFO - __main__ - Step 50859: {'lr': 0.0003771781253683092, 'samples': 9764928, 'steps': 50858, 'loss/train': 1.5167969465255737} -11/07/2021 04:23:46 - INFO - __main__ - Step 50860: {'lr': 0.00037717355656995653, 'samples': 9765120, 'steps': 50859, 'loss/train': 0.9585990309715271} -11/07/2021 04:23:46 - INFO - __main__ - Step 50861: {'lr': 0.0003771689877143015, 'samples': 9765312, 'steps': 50860, 'loss/train': 0.734885573387146} -11/07/2021 04:23:47 - INFO - __main__ - Step 50862: {'lr': 0.000377164418801346, 'samples': 9765504, 'steps': 50861, 'loss/train': 1.4071004390716553} -11/07/2021 04:23:47 - INFO - __main__ - Step 50863: {'lr': 0.0003771598498310922, 'samples': 9765696, 'steps': 50862, 'loss/train': 1.0230638980865479} -11/07/2021 04:23:48 - INFO - __main__ - Step 50864: {'lr': 0.0003771552808035421, 'samples': 9765888, 'steps': 50863, 'loss/train': 1.6071019172668457} -11/07/2021 04:23:48 - INFO - __main__ - Step 50865: {'lr': 0.0003771507117186978, 'samples': 9766080, 'steps': 50864, 'loss/train': 1.5947484970092773} -11/07/2021 04:23:49 - INFO - __main__ - Step 50866: {'lr': 0.0003771461425765614, 'samples': 9766272, 'steps': 50865, 'loss/train': 1.2703443765640259} -11/07/2021 04:23:50 - INFO - __main__ - Step 50867: {'lr': 0.00037714157337713483, 'samples': 9766464, 'steps': 50866, 'loss/train': 1.5110069513320923} -11/07/2021 04:23:50 - INFO - __main__ - Step 50868: {'lr': 0.0003771370041204203, 'samples': 9766656, 'steps': 50867, 'loss/train': 1.8053284883499146} -11/07/2021 04:23:50 - INFO - __main__ - Step 50869: {'lr': 0.0003771324348064198, 'samples': 9766848, 'steps': 50868, 'loss/train': 1.1192725896835327} -11/07/2021 04:23:51 - INFO - __main__ - Step 50870: {'lr': 0.00037712786543513534, 'samples': 9767040, 'steps': 50869, 'loss/train': 1.066977858543396} -11/07/2021 04:23:51 - INFO - __main__ - Step 50871: {'lr': 0.000377123296006569, 'samples': 9767232, 'steps': 50870, 'loss/train': 1.4052960872650146} -11/07/2021 04:23:52 - INFO - __main__ - Step 50872: {'lr': 0.000377118726520723, 'samples': 9767424, 'steps': 50871, 'loss/train': 1.4068541526794434} -11/07/2021 04:23:52 - INFO - __main__ - Step 50873: {'lr': 0.0003771141569775991, 'samples': 9767616, 'steps': 50872, 'loss/train': 1.9116144180297852} -11/07/2021 04:23:53 - INFO - __main__ - Step 50874: {'lr': 0.0003771095873771996, 'samples': 9767808, 'steps': 50873, 'loss/train': 1.5371664762496948} -11/07/2021 04:23:53 - INFO - __main__ - Step 50875: {'lr': 0.0003771050177195265, 'samples': 9768000, 'steps': 50874, 'loss/train': 1.178216814994812} -11/07/2021 04:23:53 - INFO - __main__ - Step 50876: {'lr': 0.0003771004480045818, 'samples': 9768192, 'steps': 50875, 'loss/train': 1.0844007730484009} -11/07/2021 04:23:54 - INFO - __main__ - Step 50877: {'lr': 0.00037709587823236767, 'samples': 9768384, 'steps': 50876, 'loss/train': 1.0935975313186646} -11/07/2021 04:23:55 - INFO - __main__ - Step 50878: {'lr': 0.00037709130840288605, 'samples': 9768576, 'steps': 50877, 'loss/train': 1.5046992301940918} -11/07/2021 04:23:56 - INFO - __main__ - Step 50879: {'lr': 0.00037708673851613903, 'samples': 9768768, 'steps': 50878, 'loss/train': 1.512107014656067} -11/07/2021 04:23:56 - INFO - __main__ - Step 50880: {'lr': 0.00037708216857212863, 'samples': 9768960, 'steps': 50879, 'loss/train': 1.4767941236495972} -11/07/2021 04:23:56 - INFO - __main__ - Step 50881: {'lr': 0.0003770775985708571, 'samples': 9769152, 'steps': 50880, 'loss/train': 1.2471498250961304} -11/07/2021 04:23:57 - INFO - __main__ - Step 50882: {'lr': 0.0003770730285123263, 'samples': 9769344, 'steps': 50881, 'loss/train': 1.632147192955017} -11/07/2021 04:23:58 - INFO - __main__ - Step 50883: {'lr': 0.0003770684583965384, 'samples': 9769536, 'steps': 50882, 'loss/train': 0.994832456111908} -11/07/2021 04:23:58 - INFO - __main__ - Step 50884: {'lr': 0.0003770638882234953, 'samples': 9769728, 'steps': 50883, 'loss/train': 1.422627568244934} -11/07/2021 04:23:58 - INFO - __main__ - Step 50885: {'lr': 0.0003770593179931993, 'samples': 9769920, 'steps': 50884, 'loss/train': 1.1419776678085327} -11/07/2021 04:23:59 - INFO - __main__ - Step 50886: {'lr': 0.00037705474770565215, 'samples': 9770112, 'steps': 50885, 'loss/train': 1.7810052633285522} -11/07/2021 04:23:59 - INFO - __main__ - Step 50887: {'lr': 0.00037705017736085623, 'samples': 9770304, 'steps': 50886, 'loss/train': 1.781874179840088} -11/07/2021 04:23:59 - INFO - __main__ - Step 50888: {'lr': 0.00037704560695881346, 'samples': 9770496, 'steps': 50887, 'loss/train': 1.0416572093963623} -11/07/2021 04:24:01 - INFO - __main__ - Step 50889: {'lr': 0.0003770410364995259, 'samples': 9770688, 'steps': 50888, 'loss/train': 1.0607938766479492} -11/07/2021 04:24:01 - INFO - __main__ - Step 50890: {'lr': 0.00037703646598299554, 'samples': 9770880, 'steps': 50889, 'loss/train': 1.4012714624404907} -11/07/2021 04:24:02 - INFO - __main__ - Step 50891: {'lr': 0.00037703189540922463, 'samples': 9771072, 'steps': 50890, 'loss/train': 1.1869800090789795} -11/07/2021 04:24:02 - INFO - __main__ - Step 50892: {'lr': 0.000377027324778215, 'samples': 9771264, 'steps': 50891, 'loss/train': 1.6377372741699219} -11/07/2021 04:24:02 - INFO - __main__ - Step 50893: {'lr': 0.0003770227540899689, 'samples': 9771456, 'steps': 50892, 'loss/train': 1.1716175079345703} -11/07/2021 04:24:03 - INFO - __main__ - Step 50894: {'lr': 0.0003770181833444882, 'samples': 9771648, 'steps': 50893, 'loss/train': 0.227674663066864} -11/07/2021 04:24:04 - INFO - __main__ - Step 50895: {'lr': 0.0003770136125417751, 'samples': 9771840, 'steps': 50894, 'loss/train': 1.4408305883407593} -11/07/2021 04:24:04 - INFO - __main__ - Step 50896: {'lr': 0.0003770090416818317, 'samples': 9772032, 'steps': 50895, 'loss/train': 1.4755432605743408} -11/07/2021 04:24:05 - INFO - __main__ - Step 50897: {'lr': 0.00037700447076465996, 'samples': 9772224, 'steps': 50896, 'loss/train': 1.4067610502243042} -11/07/2021 04:24:05 - INFO - __main__ - Step 50898: {'lr': 0.0003769998997902619, 'samples': 9772416, 'steps': 50897, 'loss/train': 1.731428623199463} -11/07/2021 04:24:05 - INFO - __main__ - Step 50899: {'lr': 0.00037699532875863976, 'samples': 9772608, 'steps': 50898, 'loss/train': 1.5574582815170288} -11/07/2021 04:24:06 - INFO - __main__ - Step 50900: {'lr': 0.0003769907576697954, 'samples': 9772800, 'steps': 50899, 'loss/train': 1.311132550239563} -11/07/2021 04:24:07 - INFO - __main__ - Step 50901: {'lr': 0.000376986186523731, 'samples': 9772992, 'steps': 50900, 'loss/train': 1.404496192932129} -11/07/2021 04:24:07 - INFO - __main__ - Step 50902: {'lr': 0.0003769816153204485, 'samples': 9773184, 'steps': 50901, 'loss/train': 1.2235862016677856} -11/07/2021 04:24:07 - INFO - __main__ - Step 50903: {'lr': 0.00037697704405995015, 'samples': 9773376, 'steps': 50902, 'loss/train': 1.45487642288208} -11/07/2021 04:24:08 - INFO - __main__ - Step 50904: {'lr': 0.0003769724727422379, 'samples': 9773568, 'steps': 50903, 'loss/train': 1.3382630348205566} -11/07/2021 04:24:09 - INFO - __main__ - Step 50905: {'lr': 0.0003769679013673137, 'samples': 9773760, 'steps': 50904, 'loss/train': 1.6522085666656494} -11/07/2021 04:24:09 - INFO - __main__ - Step 50906: {'lr': 0.00037696332993517983, 'samples': 9773952, 'steps': 50905, 'loss/train': 1.360925316810608} -11/07/2021 04:24:09 - INFO - __main__ - Step 50907: {'lr': 0.0003769587584458382, 'samples': 9774144, 'steps': 50906, 'loss/train': 1.3342199325561523} -11/07/2021 04:24:10 - INFO - __main__ - Step 50908: {'lr': 0.00037695418689929095, 'samples': 9774336, 'steps': 50907, 'loss/train': 1.4487676620483398} -11/07/2021 04:24:10 - INFO - __main__ - Step 50909: {'lr': 0.00037694961529554006, 'samples': 9774528, 'steps': 50908, 'loss/train': 1.2917283773422241} -11/07/2021 04:24:11 - INFO - __main__ - Step 50910: {'lr': 0.0003769450436345877, 'samples': 9774720, 'steps': 50909, 'loss/train': 1.2469871044158936} -11/07/2021 04:24:11 - INFO - __main__ - Step 50911: {'lr': 0.00037694047191643576, 'samples': 9774912, 'steps': 50910, 'loss/train': 0.7166115045547485} -11/07/2021 04:24:12 - INFO - __main__ - Step 50912: {'lr': 0.00037693590014108646, 'samples': 9775104, 'steps': 50911, 'loss/train': 1.480364203453064} -11/07/2021 04:24:12 - INFO - __main__ - Step 50913: {'lr': 0.0003769313283085418, 'samples': 9775296, 'steps': 50912, 'loss/train': 1.0824471712112427} -11/07/2021 04:24:12 - INFO - __main__ - Step 50914: {'lr': 0.0003769267564188038, 'samples': 9775488, 'steps': 50913, 'loss/train': 1.4203639030456543} -11/07/2021 04:24:13 - INFO - __main__ - Step 50915: {'lr': 0.0003769221844718746, 'samples': 9775680, 'steps': 50914, 'loss/train': 1.8766120672225952} -11/07/2021 04:24:14 - INFO - __main__ - Step 50916: {'lr': 0.00037691761246775625, 'samples': 9775872, 'steps': 50915, 'loss/train': 1.2549500465393066} -11/07/2021 04:24:14 - INFO - __main__ - Step 50917: {'lr': 0.00037691304040645074, 'samples': 9776064, 'steps': 50916, 'loss/train': 1.245263695716858} -11/07/2021 04:24:15 - INFO - __main__ - Step 50918: {'lr': 0.00037690846828796024, 'samples': 9776256, 'steps': 50917, 'loss/train': 1.5781947374343872} -11/07/2021 04:24:15 - INFO - __main__ - Step 50919: {'lr': 0.00037690389611228664, 'samples': 9776448, 'steps': 50918, 'loss/train': 1.6627144813537598} -11/07/2021 04:24:16 - INFO - __main__ - Step 50920: {'lr': 0.00037689932387943216, 'samples': 9776640, 'steps': 50919, 'loss/train': 1.681615948677063} -11/07/2021 04:24:16 - INFO - __main__ - Step 50921: {'lr': 0.0003768947515893988, 'samples': 9776832, 'steps': 50920, 'loss/train': 2.0066945552825928} -11/07/2021 04:24:17 - INFO - __main__ - Step 50922: {'lr': 0.0003768901792421886, 'samples': 9777024, 'steps': 50921, 'loss/train': 1.188463568687439} -11/07/2021 04:24:17 - INFO - __main__ - Step 50923: {'lr': 0.0003768856068378036, 'samples': 9777216, 'steps': 50922, 'loss/train': 1.2847148180007935} -11/07/2021 04:24:17 - INFO - __main__ - Step 50924: {'lr': 0.000376881034376246, 'samples': 9777408, 'steps': 50923, 'loss/train': 1.717268943786621} -11/07/2021 04:24:18 - INFO - __main__ - Step 50925: {'lr': 0.0003768764618575178, 'samples': 9777600, 'steps': 50924, 'loss/train': 1.064644694328308} -11/07/2021 04:24:19 - INFO - __main__ - Step 50926: {'lr': 0.00037687188928162087, 'samples': 9777792, 'steps': 50925, 'loss/train': 1.1622135639190674} -11/07/2021 04:24:19 - INFO - __main__ - Step 50927: {'lr': 0.00037686731664855755, 'samples': 9777984, 'steps': 50926, 'loss/train': 1.6185857057571411} -11/07/2021 04:24:19 - INFO - __main__ - Step 50928: {'lr': 0.0003768627439583297, 'samples': 9778176, 'steps': 50927, 'loss/train': 1.2021294832229614} -11/07/2021 04:24:20 - INFO - __main__ - Step 50929: {'lr': 0.00037685817121093946, 'samples': 9778368, 'steps': 50928, 'loss/train': 1.309601068496704} -11/07/2021 04:24:21 - INFO - __main__ - Step 50930: {'lr': 0.000376853598406389, 'samples': 9778560, 'steps': 50929, 'loss/train': 0.9625622630119324} -11/07/2021 04:24:21 - INFO - __main__ - Step 50931: {'lr': 0.00037684902554468015, 'samples': 9778752, 'steps': 50930, 'loss/train': 1.2327609062194824} -11/07/2021 04:24:22 - INFO - __main__ - Step 50932: {'lr': 0.0003768444526258151, 'samples': 9778944, 'steps': 50931, 'loss/train': 1.4789179563522339} -11/07/2021 04:24:22 - INFO - __main__ - Step 50933: {'lr': 0.0003768398796497959, 'samples': 9779136, 'steps': 50932, 'loss/train': 1.0722277164459229} -11/07/2021 04:24:22 - INFO - __main__ - Step 50934: {'lr': 0.00037683530661662457, 'samples': 9779328, 'steps': 50933, 'loss/train': 1.4856834411621094} -11/07/2021 04:24:23 - INFO - __main__ - Step 50935: {'lr': 0.00037683073352630327, 'samples': 9779520, 'steps': 50934, 'loss/train': 1.6969283819198608} -11/07/2021 04:24:24 - INFO - __main__ - Step 50936: {'lr': 0.000376826160378834, 'samples': 9779712, 'steps': 50935, 'loss/train': 1.0604041814804077} -11/07/2021 04:24:24 - INFO - __main__ - Step 50937: {'lr': 0.0003768215871742188, 'samples': 9779904, 'steps': 50936, 'loss/train': 1.147591471672058} -11/07/2021 04:24:24 - INFO - __main__ - Step 50938: {'lr': 0.00037681701391245983, 'samples': 9780096, 'steps': 50937, 'loss/train': 0.8042525053024292} -11/07/2021 04:24:25 - INFO - __main__ - Step 50939: {'lr': 0.0003768124405935589, 'samples': 9780288, 'steps': 50938, 'loss/train': 1.5059691667556763} -11/07/2021 04:24:25 - INFO - __main__ - Step 50940: {'lr': 0.00037680786721751834, 'samples': 9780480, 'steps': 50939, 'loss/train': 1.6961679458618164} -11/07/2021 04:24:26 - INFO - __main__ - Step 50941: {'lr': 0.0003768032937843401, 'samples': 9780672, 'steps': 50940, 'loss/train': 1.6141343116760254} -11/07/2021 04:24:26 - INFO - __main__ - Step 50942: {'lr': 0.00037679872029402627, 'samples': 9780864, 'steps': 50941, 'loss/train': 1.6517798900604248} -11/07/2021 04:24:27 - INFO - __main__ - Step 50943: {'lr': 0.0003767941467465789, 'samples': 9781056, 'steps': 50942, 'loss/train': 2.1457533836364746} -11/07/2021 04:24:27 - INFO - __main__ - Step 50944: {'lr': 0.000376789573142, 'samples': 9781248, 'steps': 50943, 'loss/train': 1.5147534608840942} -11/07/2021 04:24:28 - INFO - __main__ - Step 50945: {'lr': 0.0003767849994802918, 'samples': 9781440, 'steps': 50944, 'loss/train': 1.5164519548416138} -11/07/2021 04:24:29 - INFO - __main__ - Step 50946: {'lr': 0.0003767804257614561, 'samples': 9781632, 'steps': 50945, 'loss/train': 1.181636095046997} -11/07/2021 04:24:29 - INFO - __main__ - Step 50947: {'lr': 0.00037677585198549516, 'samples': 9781824, 'steps': 50946, 'loss/train': 1.5399096012115479} -11/07/2021 04:24:29 - INFO - __main__ - Step 50948: {'lr': 0.00037677127815241086, 'samples': 9782016, 'steps': 50947, 'loss/train': 1.3078244924545288} -11/07/2021 04:24:30 - INFO - __main__ - Step 50949: {'lr': 0.00037676670426220547, 'samples': 9782208, 'steps': 50948, 'loss/train': 1.358941912651062} -11/07/2021 04:24:30 - INFO - __main__ - Step 50950: {'lr': 0.00037676213031488095, 'samples': 9782400, 'steps': 50949, 'loss/train': 1.3406785726547241} -11/07/2021 04:24:31 - INFO - __main__ - Step 50951: {'lr': 0.0003767575563104394, 'samples': 9782592, 'steps': 50950, 'loss/train': 1.4531294107437134} -11/07/2021 04:24:31 - INFO - __main__ - Step 50952: {'lr': 0.00037675298224888287, 'samples': 9782784, 'steps': 50951, 'loss/train': 1.345122218132019} -11/07/2021 04:24:32 - INFO - __main__ - Step 50953: {'lr': 0.0003767484081302133, 'samples': 9782976, 'steps': 50952, 'loss/train': 1.617568850517273} -11/07/2021 04:24:32 - INFO - __main__ - Step 50954: {'lr': 0.000376743833954433, 'samples': 9783168, 'steps': 50953, 'loss/train': 1.5393524169921875} -11/07/2021 04:24:33 - INFO - __main__ - Step 50955: {'lr': 0.00037673925972154376, 'samples': 9783360, 'steps': 50954, 'loss/train': 1.5331530570983887} -11/07/2021 04:24:34 - INFO - __main__ - Step 50956: {'lr': 0.00037673468543154777, 'samples': 9783552, 'steps': 50955, 'loss/train': 0.05478181689977646} -11/07/2021 04:24:34 - INFO - __main__ - Step 50957: {'lr': 0.0003767301110844472, 'samples': 9783744, 'steps': 50956, 'loss/train': 1.8871591091156006} -11/07/2021 04:24:34 - INFO - __main__ - Step 50958: {'lr': 0.0003767255366802439, 'samples': 9783936, 'steps': 50957, 'loss/train': 1.2720681428909302} -11/07/2021 04:24:35 - INFO - __main__ - Step 50959: {'lr': 0.00037672096221894004, 'samples': 9784128, 'steps': 50958, 'loss/train': 1.5616569519042969} -11/07/2021 04:24:35 - INFO - __main__ - Step 50960: {'lr': 0.0003767163877005376, 'samples': 9784320, 'steps': 50959, 'loss/train': 1.6533688306808472} -11/07/2021 04:24:36 - INFO - __main__ - Step 50961: {'lr': 0.0003767118131250388, 'samples': 9784512, 'steps': 50960, 'loss/train': 2.0300369262695312} -11/07/2021 04:24:36 - INFO - __main__ - Step 50962: {'lr': 0.00037670723849244557, 'samples': 9784704, 'steps': 50961, 'loss/train': 1.1564273834228516} -11/07/2021 04:24:37 - INFO - __main__ - Step 50963: {'lr': 0.0003767026638027601, 'samples': 9784896, 'steps': 50962, 'loss/train': 1.2109038829803467} -11/07/2021 04:24:37 - INFO - __main__ - Step 50964: {'lr': 0.00037669808905598434, 'samples': 9785088, 'steps': 50963, 'loss/train': 2.1062874794006348} -11/07/2021 04:24:37 - INFO - __main__ - Step 50965: {'lr': 0.0003766935142521203, 'samples': 9785280, 'steps': 50964, 'loss/train': 1.395483136177063} -11/07/2021 04:24:38 - INFO - __main__ - Step 50966: {'lr': 0.00037668893939117023, 'samples': 9785472, 'steps': 50965, 'loss/train': 1.069337010383606} -11/07/2021 04:24:39 - INFO - __main__ - Step 50967: {'lr': 0.000376684364473136, 'samples': 9785664, 'steps': 50966, 'loss/train': 1.7145888805389404} -11/07/2021 04:24:39 - INFO - __main__ - Step 50968: {'lr': 0.00037667978949801974, 'samples': 9785856, 'steps': 50967, 'loss/train': 1.388250470161438} -11/07/2021 04:24:39 - INFO - __main__ - Step 50969: {'lr': 0.00037667521446582355, 'samples': 9786048, 'steps': 50968, 'loss/train': 1.8198034763336182} -11/07/2021 04:24:40 - INFO - __main__ - Step 50970: {'lr': 0.00037667063937654944, 'samples': 9786240, 'steps': 50969, 'loss/train': 1.6997214555740356} -11/07/2021 04:24:41 - INFO - __main__ - Step 50971: {'lr': 0.00037666606423019956, 'samples': 9786432, 'steps': 50970, 'loss/train': 1.4291136264801025} -11/07/2021 04:24:41 - INFO - __main__ - Step 50972: {'lr': 0.00037666148902677576, 'samples': 9786624, 'steps': 50971, 'loss/train': 1.5241873264312744} -11/07/2021 04:24:42 - INFO - __main__ - Step 50973: {'lr': 0.0003766569137662804, 'samples': 9786816, 'steps': 50972, 'loss/train': 1.5081205368041992} -11/07/2021 04:24:42 - INFO - __main__ - Step 50974: {'lr': 0.00037665233844871534, 'samples': 9787008, 'steps': 50973, 'loss/train': 1.5813207626342773} -11/07/2021 04:24:42 - INFO - __main__ - Step 50975: {'lr': 0.0003766477630740827, 'samples': 9787200, 'steps': 50974, 'loss/train': 0.9070396423339844} -11/07/2021 04:24:43 - INFO - __main__ - Step 50976: {'lr': 0.00037664318764238445, 'samples': 9787392, 'steps': 50975, 'loss/train': 0.4607886075973511} -11/07/2021 04:24:44 - INFO - __main__ - Step 50977: {'lr': 0.0003766386121536228, 'samples': 9787584, 'steps': 50976, 'loss/train': 3.141408681869507} -11/07/2021 04:24:44 - INFO - __main__ - Step 50978: {'lr': 0.00037663403660779984, 'samples': 9787776, 'steps': 50977, 'loss/train': 1.2351731061935425} -11/07/2021 04:24:44 - INFO - __main__ - Step 50979: {'lr': 0.00037662946100491736, 'samples': 9787968, 'steps': 50978, 'loss/train': 1.4202797412872314} -11/07/2021 04:24:45 - INFO - __main__ - Step 50980: {'lr': 0.00037662488534497766, 'samples': 9788160, 'steps': 50979, 'loss/train': 0.7293932437896729} -11/07/2021 04:24:45 - INFO - __main__ - Step 50981: {'lr': 0.0003766203096279828, 'samples': 9788352, 'steps': 50980, 'loss/train': 2.311060667037964} -11/07/2021 04:24:46 - INFO - __main__ - Step 50982: {'lr': 0.00037661573385393477, 'samples': 9788544, 'steps': 50981, 'loss/train': 1.1850734949111938} -11/07/2021 04:24:47 - INFO - __main__ - Step 50983: {'lr': 0.0003766111580228356, 'samples': 9788736, 'steps': 50982, 'loss/train': 1.104164719581604} -11/07/2021 04:24:47 - INFO - __main__ - Step 50984: {'lr': 0.00037660658213468744, 'samples': 9788928, 'steps': 50983, 'loss/train': 1.3133814334869385} -11/07/2021 04:24:47 - INFO - __main__ - Step 50985: {'lr': 0.00037660200618949225, 'samples': 9789120, 'steps': 50984, 'loss/train': 1.201141357421875} -11/07/2021 04:24:48 - INFO - __main__ - Step 50986: {'lr': 0.0003765974301872522, 'samples': 9789312, 'steps': 50985, 'loss/train': 1.0673134326934814} -11/07/2021 04:24:49 - INFO - __main__ - Step 50987: {'lr': 0.0003765928541279693, 'samples': 9789504, 'steps': 50986, 'loss/train': 1.4994068145751953} -11/07/2021 04:24:49 - INFO - __main__ - Step 50988: {'lr': 0.0003765882780116455, 'samples': 9789696, 'steps': 50987, 'loss/train': 0.5558611750602722} -11/07/2021 04:24:49 - INFO - __main__ - Step 50989: {'lr': 0.0003765837018382831, 'samples': 9789888, 'steps': 50988, 'loss/train': 1.6570909023284912} -11/07/2021 04:24:50 - INFO - __main__ - Step 50990: {'lr': 0.0003765791256078841, 'samples': 9790080, 'steps': 50989, 'loss/train': 1.2512147426605225} -11/07/2021 04:24:50 - INFO - __main__ - Step 50991: {'lr': 0.00037657454932045036, 'samples': 9790272, 'steps': 50990, 'loss/train': 0.9478741884231567} -11/07/2021 04:24:51 - INFO - __main__ - Step 50992: {'lr': 0.00037656997297598417, 'samples': 9790464, 'steps': 50991, 'loss/train': 1.110074520111084} -11/07/2021 04:24:51 - INFO - __main__ - Step 50993: {'lr': 0.0003765653965744874, 'samples': 9790656, 'steps': 50992, 'loss/train': 1.4602985382080078} -11/07/2021 04:24:52 - INFO - __main__ - Step 50994: {'lr': 0.00037656082011596224, 'samples': 9790848, 'steps': 50993, 'loss/train': 1.0839636325836182} -11/07/2021 04:24:52 - INFO - __main__ - Step 50995: {'lr': 0.00037655624360041084, 'samples': 9791040, 'steps': 50994, 'loss/train': 0.879666805267334} -11/07/2021 04:24:52 - INFO - __main__ - Step 50996: {'lr': 0.00037655166702783507, 'samples': 9791232, 'steps': 50995, 'loss/train': 1.4642044305801392} -11/07/2021 04:24:54 - INFO - __main__ - Step 50997: {'lr': 0.0003765470903982371, 'samples': 9791424, 'steps': 50996, 'loss/train': 1.9917117357254028} -11/07/2021 04:24:54 - INFO - __main__ - Step 50998: {'lr': 0.0003765425137116189, 'samples': 9791616, 'steps': 50997, 'loss/train': 1.369557499885559} -11/07/2021 04:24:54 - INFO - __main__ - Step 50999: {'lr': 0.00037653793696798267, 'samples': 9791808, 'steps': 50998, 'loss/train': 1.602256178855896} -11/07/2021 04:24:55 - INFO - __main__ - Step 51000: {'lr': 0.0003765333601673303, 'samples': 9792000, 'steps': 50999, 'loss/train': 1.2036160230636597} -11/07/2021 04:24:55 - INFO - __main__ - Step 51001: {'lr': 0.0003765287833096641, 'samples': 9792192, 'steps': 51000, 'loss/train': 1.0194517374038696} -11/07/2021 04:24:56 - INFO - __main__ - Step 51002: {'lr': 0.00037652420639498583, 'samples': 9792384, 'steps': 51001, 'loss/train': 0.9271731376647949} -11/07/2021 04:24:56 - INFO - __main__ - Step 51003: {'lr': 0.00037651962942329784, 'samples': 9792576, 'steps': 51002, 'loss/train': 1.1674859523773193} -11/07/2021 04:24:57 - INFO - __main__ - Step 51004: {'lr': 0.0003765150523946019, 'samples': 9792768, 'steps': 51003, 'loss/train': 1.4975206851959229} -11/07/2021 04:24:57 - INFO - __main__ - Step 51005: {'lr': 0.00037651047530890035, 'samples': 9792960, 'steps': 51004, 'loss/train': 1.5388249158859253} -11/07/2021 04:24:57 - INFO - __main__ - Step 51006: {'lr': 0.0003765058981661952, 'samples': 9793152, 'steps': 51005, 'loss/train': 1.3791348934173584} -11/07/2021 04:24:58 - INFO - __main__ - Step 51007: {'lr': 0.0003765013209664883, 'samples': 9793344, 'steps': 51006, 'loss/train': 1.4319292306900024} -11/07/2021 04:24:59 - INFO - __main__ - Step 51008: {'lr': 0.00037649674370978195, 'samples': 9793536, 'steps': 51007, 'loss/train': 0.7983530759811401} -11/07/2021 04:24:59 - INFO - __main__ - Step 51009: {'lr': 0.000376492166396078, 'samples': 9793728, 'steps': 51008, 'loss/train': 1.3422341346740723} -11/07/2021 04:24:59 - INFO - __main__ - Step 51010: {'lr': 0.0003764875890253787, 'samples': 9793920, 'steps': 51009, 'loss/train': 1.3380659818649292} -11/07/2021 04:25:00 - INFO - __main__ - Step 51011: {'lr': 0.0003764830115976861, 'samples': 9794112, 'steps': 51010, 'loss/train': 2.4802086353302} -11/07/2021 04:25:00 - INFO - __main__ - Step 51012: {'lr': 0.00037647843411300213, 'samples': 9794304, 'steps': 51011, 'loss/train': 0.9203962087631226} -11/07/2021 04:25:01 - INFO - __main__ - Step 51013: {'lr': 0.00037647385657132895, 'samples': 9794496, 'steps': 51012, 'loss/train': 1.365518569946289} -11/07/2021 04:25:02 - INFO - __main__ - Step 51014: {'lr': 0.0003764692789726686, 'samples': 9794688, 'steps': 51013, 'loss/train': 0.8856534957885742} -11/07/2021 04:25:02 - INFO - __main__ - Step 51015: {'lr': 0.00037646470131702314, 'samples': 9794880, 'steps': 51014, 'loss/train': 1.6138612031936646} -11/07/2021 04:25:02 - INFO - __main__ - Step 51016: {'lr': 0.00037646012360439463, 'samples': 9795072, 'steps': 51015, 'loss/train': 1.444564700126648} -11/07/2021 04:25:03 - INFO - __main__ - Step 51017: {'lr': 0.0003764555458347851, 'samples': 9795264, 'steps': 51016, 'loss/train': 1.4704002141952515} -11/07/2021 04:25:04 - INFO - __main__ - Step 51018: {'lr': 0.00037645096800819684, 'samples': 9795456, 'steps': 51017, 'loss/train': 1.9046685695648193} -11/07/2021 04:25:04 - INFO - __main__ - Step 51019: {'lr': 0.00037644639012463155, 'samples': 9795648, 'steps': 51018, 'loss/train': 1.228771448135376} -11/07/2021 04:25:04 - INFO - __main__ - Step 51020: {'lr': 0.00037644181218409156, 'samples': 9795840, 'steps': 51019, 'loss/train': 1.7821251153945923} -11/07/2021 04:25:05 - INFO - __main__ - Step 51021: {'lr': 0.0003764372341865788, 'samples': 9796032, 'steps': 51020, 'loss/train': 1.356489658355713} -11/07/2021 04:25:05 - INFO - __main__ - Step 51022: {'lr': 0.00037643265613209533, 'samples': 9796224, 'steps': 51021, 'loss/train': 1.0176609754562378} -11/07/2021 04:25:06 - INFO - __main__ - Step 51023: {'lr': 0.00037642807802064327, 'samples': 9796416, 'steps': 51022, 'loss/train': 1.3684649467468262} -11/07/2021 04:25:07 - INFO - __main__ - Step 51024: {'lr': 0.00037642349985222474, 'samples': 9796608, 'steps': 51023, 'loss/train': 1.8060178756713867} -11/07/2021 04:25:07 - INFO - __main__ - Step 51025: {'lr': 0.0003764189216268417, 'samples': 9796800, 'steps': 51024, 'loss/train': 1.5317825078964233} -11/07/2021 04:25:07 - INFO - __main__ - Step 51026: {'lr': 0.0003764143433444962, 'samples': 9796992, 'steps': 51025, 'loss/train': 1.35077702999115} -11/07/2021 04:25:08 - INFO - __main__ - Step 51027: {'lr': 0.00037640976500519035, 'samples': 9797184, 'steps': 51026, 'loss/train': 2.0202128887176514} -11/07/2021 04:25:09 - INFO - __main__ - Step 51028: {'lr': 0.0003764051866089262, 'samples': 9797376, 'steps': 51027, 'loss/train': 1.3916025161743164} -11/07/2021 04:25:09 - INFO - __main__ - Step 51029: {'lr': 0.00037640060815570585, 'samples': 9797568, 'steps': 51028, 'loss/train': 1.1106539964675903} -11/07/2021 04:25:09 - INFO - __main__ - Step 51030: {'lr': 0.0003763960296455314, 'samples': 9797760, 'steps': 51029, 'loss/train': 1.4245356321334839} -11/07/2021 04:25:10 - INFO - __main__ - Step 51031: {'lr': 0.0003763914510784048, 'samples': 9797952, 'steps': 51030, 'loss/train': 1.5696529150009155} -11/07/2021 04:25:10 - INFO - __main__ - Step 51032: {'lr': 0.00037638687245432817, 'samples': 9798144, 'steps': 51031, 'loss/train': 1.0840160846710205} -11/07/2021 04:25:11 - INFO - __main__ - Step 51033: {'lr': 0.00037638229377330356, 'samples': 9798336, 'steps': 51032, 'loss/train': 1.2295622825622559} -11/07/2021 04:25:12 - INFO - __main__ - Step 51034: {'lr': 0.00037637771503533303, 'samples': 9798528, 'steps': 51033, 'loss/train': 1.0383323431015015} -11/07/2021 04:25:12 - INFO - __main__ - Step 51035: {'lr': 0.00037637313624041863, 'samples': 9798720, 'steps': 51034, 'loss/train': 1.4757288694381714} -11/07/2021 04:25:12 - INFO - __main__ - Step 51036: {'lr': 0.00037636855738856247, 'samples': 9798912, 'steps': 51035, 'loss/train': 1.072751522064209} -11/07/2021 04:25:13 - INFO - __main__ - Step 51037: {'lr': 0.00037636397847976656, 'samples': 9799104, 'steps': 51036, 'loss/train': 1.022415041923523} -11/07/2021 04:25:14 - INFO - __main__ - Step 51038: {'lr': 0.00037635939951403307, 'samples': 9799296, 'steps': 51037, 'loss/train': 1.2919124364852905} -11/07/2021 04:25:14 - INFO - __main__ - Step 51039: {'lr': 0.00037635482049136395, 'samples': 9799488, 'steps': 51038, 'loss/train': 2.3762500286102295} -11/07/2021 04:25:14 - INFO - __main__ - Step 51040: {'lr': 0.0003763502414117612, 'samples': 9799680, 'steps': 51039, 'loss/train': 1.3238046169281006} -11/07/2021 04:25:15 - INFO - __main__ - Step 51041: {'lr': 0.0003763456622752271, 'samples': 9799872, 'steps': 51040, 'loss/train': 1.8432047367095947} -11/07/2021 04:25:15 - INFO - __main__ - Step 51042: {'lr': 0.0003763410830817635, 'samples': 9800064, 'steps': 51041, 'loss/train': 1.0838677883148193} -11/07/2021 04:25:15 - INFO - __main__ - Step 51043: {'lr': 0.00037633650383137263, 'samples': 9800256, 'steps': 51042, 'loss/train': 0.8608529567718506} -11/07/2021 04:25:16 - INFO - __main__ - Step 51044: {'lr': 0.0003763319245240565, 'samples': 9800448, 'steps': 51043, 'loss/train': 1.2664395570755005} -11/07/2021 04:25:17 - INFO - __main__ - Step 51045: {'lr': 0.00037632734515981715, 'samples': 9800640, 'steps': 51044, 'loss/train': 1.5198123455047607} -11/07/2021 04:25:17 - INFO - __main__ - Step 51046: {'lr': 0.00037632276573865657, 'samples': 9800832, 'steps': 51045, 'loss/train': 2.2718794345855713} -11/07/2021 04:25:18 - INFO - __main__ - Step 51047: {'lr': 0.00037631818626057695, 'samples': 9801024, 'steps': 51046, 'loss/train': 1.485799789428711} -11/07/2021 04:25:18 - INFO - __main__ - Step 51048: {'lr': 0.0003763136067255803, 'samples': 9801216, 'steps': 51047, 'loss/train': 1.0966688394546509} -11/07/2021 04:25:19 - INFO - __main__ - Step 51049: {'lr': 0.00037630902713366865, 'samples': 9801408, 'steps': 51048, 'loss/train': 1.274632215499878} -11/07/2021 04:25:19 - INFO - __main__ - Step 51050: {'lr': 0.00037630444748484415, 'samples': 9801600, 'steps': 51049, 'loss/train': 1.422975778579712} -11/07/2021 04:25:20 - INFO - __main__ - Step 51051: {'lr': 0.00037629986777910885, 'samples': 9801792, 'steps': 51050, 'loss/train': 1.4993656873703003} -11/07/2021 04:25:20 - INFO - __main__ - Step 51052: {'lr': 0.00037629528801646475, 'samples': 9801984, 'steps': 51051, 'loss/train': 1.592901349067688} -11/07/2021 04:25:20 - INFO - __main__ - Step 51053: {'lr': 0.0003762907081969139, 'samples': 9802176, 'steps': 51052, 'loss/train': 1.0042757987976074} -11/07/2021 04:25:21 - INFO - __main__ - Step 51054: {'lr': 0.00037628612832045846, 'samples': 9802368, 'steps': 51053, 'loss/train': 1.1692345142364502} -11/07/2021 04:25:22 - INFO - __main__ - Step 51055: {'lr': 0.0003762815483871004, 'samples': 9802560, 'steps': 51054, 'loss/train': 0.5680693984031677} -11/07/2021 04:25:22 - INFO - __main__ - Step 51056: {'lr': 0.00037627696839684176, 'samples': 9802752, 'steps': 51055, 'loss/train': 1.7787619829177856} -11/07/2021 04:25:22 - INFO - __main__ - Step 51057: {'lr': 0.0003762723883496848, 'samples': 9802944, 'steps': 51056, 'loss/train': 1.5501517057418823} -11/07/2021 04:25:23 - INFO - __main__ - Step 51058: {'lr': 0.00037626780824563145, 'samples': 9803136, 'steps': 51057, 'loss/train': 1.1457315683364868} -11/07/2021 04:25:24 - INFO - __main__ - Step 51059: {'lr': 0.0003762632280846837, 'samples': 9803328, 'steps': 51058, 'loss/train': 1.0320316553115845} -11/07/2021 04:25:24 - INFO - __main__ - Step 51060: {'lr': 0.00037625864786684364, 'samples': 9803520, 'steps': 51059, 'loss/train': 1.1877084970474243} -11/07/2021 04:25:25 - INFO - __main__ - Step 51061: {'lr': 0.00037625406759211346, 'samples': 9803712, 'steps': 51060, 'loss/train': 1.035565733909607} -11/07/2021 04:25:25 - INFO - __main__ - Step 51062: {'lr': 0.00037624948726049513, 'samples': 9803904, 'steps': 51061, 'loss/train': 1.4257559776306152} -11/07/2021 04:25:25 - INFO - __main__ - Step 51063: {'lr': 0.0003762449068719907, 'samples': 9804096, 'steps': 51062, 'loss/train': 1.0471153259277344} -11/07/2021 04:25:26 - INFO - __main__ - Step 51064: {'lr': 0.00037624032642660234, 'samples': 9804288, 'steps': 51063, 'loss/train': 1.2665207386016846} -11/07/2021 04:25:27 - INFO - __main__ - Step 51065: {'lr': 0.00037623574592433195, 'samples': 9804480, 'steps': 51064, 'loss/train': 1.2061656713485718} -11/07/2021 04:25:27 - INFO - __main__ - Step 51066: {'lr': 0.00037623116536518176, 'samples': 9804672, 'steps': 51065, 'loss/train': 0.8431649804115295} -11/07/2021 04:25:27 - INFO - __main__ - Step 51067: {'lr': 0.00037622658474915373, 'samples': 9804864, 'steps': 51066, 'loss/train': 1.7555702924728394} -11/07/2021 04:25:28 - INFO - __main__ - Step 51068: {'lr': 0.0003762220040762499, 'samples': 9805056, 'steps': 51067, 'loss/train': 1.3444541692733765} -11/07/2021 04:25:29 - INFO - __main__ - Step 51069: {'lr': 0.0003762174233464724, 'samples': 9805248, 'steps': 51068, 'loss/train': 1.6199666261672974} -11/07/2021 04:25:29 - INFO - __main__ - Step 51070: {'lr': 0.00037621284255982324, 'samples': 9805440, 'steps': 51069, 'loss/train': 1.1775859594345093} -11/07/2021 04:25:30 - INFO - __main__ - Step 51071: {'lr': 0.0003762082617163046, 'samples': 9805632, 'steps': 51070, 'loss/train': 1.2825325727462769} -11/07/2021 04:25:30 - INFO - __main__ - Step 51072: {'lr': 0.0003762036808159185, 'samples': 9805824, 'steps': 51071, 'loss/train': 1.4918760061264038} -11/07/2021 04:25:30 - INFO - __main__ - Step 51073: {'lr': 0.0003761990998586669, 'samples': 9806016, 'steps': 51072, 'loss/train': 1.979184627532959} -11/07/2021 04:25:31 - INFO - __main__ - Step 51074: {'lr': 0.0003761945188445519, 'samples': 9806208, 'steps': 51073, 'loss/train': 1.551345944404602} -11/07/2021 04:25:32 - INFO - __main__ - Step 51075: {'lr': 0.00037618993777357567, 'samples': 9806400, 'steps': 51074, 'loss/train': 1.4490280151367188} -11/07/2021 04:25:32 - INFO - __main__ - Step 51076: {'lr': 0.00037618535664574014, 'samples': 9806592, 'steps': 51075, 'loss/train': 1.307779312133789} -11/07/2021 04:25:32 - INFO - __main__ - Step 51077: {'lr': 0.0003761807754610475, 'samples': 9806784, 'steps': 51076, 'loss/train': 1.5131794214248657} -11/07/2021 04:25:33 - INFO - __main__ - Step 51078: {'lr': 0.0003761761942194997, 'samples': 9806976, 'steps': 51077, 'loss/train': 1.1490602493286133} -11/07/2021 04:25:34 - INFO - __main__ - Step 51079: {'lr': 0.00037617161292109887, 'samples': 9807168, 'steps': 51078, 'loss/train': 1.1951687335968018} -11/07/2021 04:25:34 - INFO - __main__ - Step 51080: {'lr': 0.0003761670315658471, 'samples': 9807360, 'steps': 51079, 'loss/train': 1.4678398370742798} -11/07/2021 04:25:34 - INFO - __main__ - Step 51081: {'lr': 0.0003761624501537463, 'samples': 9807552, 'steps': 51080, 'loss/train': 1.7070611715316772} -11/07/2021 04:25:35 - INFO - __main__ - Step 51082: {'lr': 0.00037615786868479875, 'samples': 9807744, 'steps': 51081, 'loss/train': 1.6293083429336548} -11/07/2021 04:25:35 - INFO - __main__ - Step 51083: {'lr': 0.0003761532871590063, 'samples': 9807936, 'steps': 51082, 'loss/train': 2.0467350482940674} -11/07/2021 04:25:36 - INFO - __main__ - Step 51084: {'lr': 0.0003761487055763713, 'samples': 9808128, 'steps': 51083, 'loss/train': 1.0840213298797607} -11/07/2021 04:25:37 - INFO - __main__ - Step 51085: {'lr': 0.0003761441239368955, 'samples': 9808320, 'steps': 51084, 'loss/train': 1.654410481452942} -11/07/2021 04:25:37 - INFO - __main__ - Step 51086: {'lr': 0.0003761395422405811, 'samples': 9808512, 'steps': 51085, 'loss/train': 1.5213103294372559} -11/07/2021 04:25:37 - INFO - __main__ - Step 51087: {'lr': 0.00037613496048743023, 'samples': 9808704, 'steps': 51086, 'loss/train': 2.194960832595825} -11/07/2021 04:25:38 - INFO - __main__ - Step 51088: {'lr': 0.00037613037867744494, 'samples': 9808896, 'steps': 51087, 'loss/train': 1.4452787637710571} -11/07/2021 04:25:39 - INFO - __main__ - Step 51089: {'lr': 0.00037612579681062713, 'samples': 9809088, 'steps': 51088, 'loss/train': 2.0537967681884766} -11/07/2021 04:25:39 - INFO - __main__ - Step 51090: {'lr': 0.000376121214886979, 'samples': 9809280, 'steps': 51089, 'loss/train': 1.2467275857925415} -11/07/2021 04:25:39 - INFO - __main__ - Step 51091: {'lr': 0.00037611663290650267, 'samples': 9809472, 'steps': 51090, 'loss/train': 1.3502446413040161} -11/07/2021 04:25:40 - INFO - __main__ - Step 51092: {'lr': 0.0003761120508692001, 'samples': 9809664, 'steps': 51091, 'loss/train': 1.2698564529418945} -11/07/2021 04:25:40 - INFO - __main__ - Step 51093: {'lr': 0.00037610746877507343, 'samples': 9809856, 'steps': 51092, 'loss/train': 1.6742361783981323} -11/07/2021 04:25:41 - INFO - __main__ - Step 51094: {'lr': 0.0003761028866241246, 'samples': 9810048, 'steps': 51093, 'loss/train': 1.6833693981170654} -11/07/2021 04:25:41 - INFO - __main__ - Step 51095: {'lr': 0.00037609830441635573, 'samples': 9810240, 'steps': 51094, 'loss/train': 1.6488521099090576} -11/07/2021 04:25:42 - INFO - __main__ - Step 51096: {'lr': 0.00037609372215176897, 'samples': 9810432, 'steps': 51095, 'loss/train': 1.3324769735336304} -11/07/2021 04:25:42 - INFO - __main__ - Step 51097: {'lr': 0.0003760891398303663, 'samples': 9810624, 'steps': 51096, 'loss/train': 1.8812788724899292} -11/07/2021 04:25:42 - INFO - __main__ - Step 51098: {'lr': 0.0003760845574521499, 'samples': 9810816, 'steps': 51097, 'loss/train': 1.2763627767562866} -11/07/2021 04:25:43 - INFO - __main__ - Step 51099: {'lr': 0.00037607997501712165, 'samples': 9811008, 'steps': 51098, 'loss/train': 1.563471794128418} -11/07/2021 04:25:44 - INFO - __main__ - Step 51100: {'lr': 0.0003760753925252838, 'samples': 9811200, 'steps': 51099, 'loss/train': 0.26753655076026917} -11/07/2021 04:25:44 - INFO - __main__ - Step 51101: {'lr': 0.0003760708099766382, 'samples': 9811392, 'steps': 51100, 'loss/train': 2.09893798828125} -11/07/2021 04:25:45 - INFO - __main__ - Step 51102: {'lr': 0.00037606622737118713, 'samples': 9811584, 'steps': 51101, 'loss/train': 1.1198339462280273} -11/07/2021 04:25:45 - INFO - __main__ - Step 51103: {'lr': 0.00037606164470893247, 'samples': 9811776, 'steps': 51102, 'loss/train': 1.3035331964492798} -11/07/2021 04:25:45 - INFO - __main__ - Step 51104: {'lr': 0.00037605706198987646, 'samples': 9811968, 'steps': 51103, 'loss/train': 0.9974083304405212} -11/07/2021 04:25:46 - INFO - __main__ - Step 51105: {'lr': 0.0003760524792140211, 'samples': 9812160, 'steps': 51104, 'loss/train': 1.4258350133895874} -11/07/2021 04:25:47 - INFO - __main__ - Step 51106: {'lr': 0.0003760478963813684, 'samples': 9812352, 'steps': 51105, 'loss/train': 1.657906413078308} -11/07/2021 04:25:47 - INFO - __main__ - Step 51107: {'lr': 0.00037604331349192047, 'samples': 9812544, 'steps': 51106, 'loss/train': 1.748923659324646} -11/07/2021 04:25:47 - INFO - __main__ - Step 51108: {'lr': 0.00037603873054567927, 'samples': 9812736, 'steps': 51107, 'loss/train': 1.3222150802612305} -11/07/2021 04:25:48 - INFO - __main__ - Step 51109: {'lr': 0.00037603414754264707, 'samples': 9812928, 'steps': 51108, 'loss/train': 1.42711341381073} -11/07/2021 04:25:49 - INFO - __main__ - Step 51110: {'lr': 0.00037602956448282577, 'samples': 9813120, 'steps': 51109, 'loss/train': 1.2570126056671143} -11/07/2021 04:25:49 - INFO - __main__ - Step 51111: {'lr': 0.00037602498136621754, 'samples': 9813312, 'steps': 51110, 'loss/train': 1.5092865228652954} -11/07/2021 04:25:50 - INFO - __main__ - Step 51112: {'lr': 0.00037602039819282444, 'samples': 9813504, 'steps': 51111, 'loss/train': 1.6016576290130615} -11/07/2021 04:25:50 - INFO - __main__ - Step 51113: {'lr': 0.00037601581496264847, 'samples': 9813696, 'steps': 51112, 'loss/train': 1.3010882139205933} -11/07/2021 04:25:50 - INFO - __main__ - Step 51114: {'lr': 0.0003760112316756917, 'samples': 9813888, 'steps': 51113, 'loss/train': 1.7741448879241943} -11/07/2021 04:25:51 - INFO - __main__ - Step 51115: {'lr': 0.0003760066483319562, 'samples': 9814080, 'steps': 51114, 'loss/train': 0.8605861067771912} -11/07/2021 04:25:52 - INFO - __main__ - Step 51116: {'lr': 0.000376002064931444, 'samples': 9814272, 'steps': 51115, 'loss/train': 1.5896106958389282} -11/07/2021 04:25:52 - INFO - __main__ - Step 51117: {'lr': 0.00037599748147415724, 'samples': 9814464, 'steps': 51116, 'loss/train': 1.5450607538223267} -11/07/2021 04:25:52 - INFO - __main__ - Step 51118: {'lr': 0.000375992897960098, 'samples': 9814656, 'steps': 51117, 'loss/train': 1.7376378774642944} -11/07/2021 04:25:53 - INFO - __main__ - Step 51119: {'lr': 0.0003759883143892683, 'samples': 9814848, 'steps': 51118, 'loss/train': 2.2202067375183105} -11/07/2021 04:25:53 - INFO - __main__ - Step 51120: {'lr': 0.00037598373076167023, 'samples': 9815040, 'steps': 51119, 'loss/train': 1.8037248849868774} -11/07/2021 04:25:54 - INFO - __main__ - Step 51121: {'lr': 0.0003759791470773058, 'samples': 9815232, 'steps': 51120, 'loss/train': 1.4552325010299683} -11/07/2021 04:25:54 - INFO - __main__ - Step 51122: {'lr': 0.0003759745633361771, 'samples': 9815424, 'steps': 51121, 'loss/train': 1.3235969543457031} -11/07/2021 04:25:55 - INFO - __main__ - Step 51123: {'lr': 0.0003759699795382863, 'samples': 9815616, 'steps': 51122, 'loss/train': 1.767889142036438} -11/07/2021 04:25:55 - INFO - __main__ - Step 51124: {'lr': 0.00037596539568363524, 'samples': 9815808, 'steps': 51123, 'loss/train': 1.190832257270813} -11/07/2021 04:25:56 - INFO - __main__ - Step 51125: {'lr': 0.0003759608117722262, 'samples': 9816000, 'steps': 51124, 'loss/train': 1.942044734954834} -11/07/2021 04:25:57 - INFO - __main__ - Step 51126: {'lr': 0.00037595622780406114, 'samples': 9816192, 'steps': 51125, 'loss/train': 1.6755667924880981} -11/07/2021 04:25:57 - INFO - __main__ - Step 51127: {'lr': 0.0003759516437791421, 'samples': 9816384, 'steps': 51126, 'loss/train': 5.812788963317871} -11/07/2021 04:25:57 - INFO - __main__ - Step 51128: {'lr': 0.0003759470596974712, 'samples': 9816576, 'steps': 51127, 'loss/train': 1.7180052995681763} -11/07/2021 04:25:58 - INFO - __main__ - Step 51129: {'lr': 0.0003759424755590505, 'samples': 9816768, 'steps': 51128, 'loss/train': 1.8356326818466187} -11/07/2021 04:25:58 - INFO - __main__ - Step 51130: {'lr': 0.0003759378913638822, 'samples': 9816960, 'steps': 51129, 'loss/train': 1.433469295501709} -11/07/2021 04:25:58 - INFO - __main__ - Step 51131: {'lr': 0.0003759333071119681, 'samples': 9817152, 'steps': 51130, 'loss/train': 1.8264704942703247} -11/07/2021 04:26:00 - INFO - __main__ - Step 51132: {'lr': 0.0003759287228033104, 'samples': 9817344, 'steps': 51131, 'loss/train': 1.4732524156570435} -11/07/2021 04:26:00 - INFO - __main__ - Step 51133: {'lr': 0.0003759241384379112, 'samples': 9817536, 'steps': 51132, 'loss/train': 1.5256009101867676} -11/07/2021 04:26:01 - INFO - __main__ - Step 51134: {'lr': 0.0003759195540157725, 'samples': 9817728, 'steps': 51133, 'loss/train': 5.581474304199219} -11/07/2021 04:26:01 - INFO - __main__ - Step 51135: {'lr': 0.00037591496953689644, 'samples': 9817920, 'steps': 51134, 'loss/train': 5.611433982849121} -11/07/2021 04:26:01 - INFO - __main__ - Step 51136: {'lr': 0.00037591038500128495, 'samples': 9818112, 'steps': 51135, 'loss/train': 1.5781525373458862} -11/07/2021 04:26:02 - INFO - __main__ - Step 51137: {'lr': 0.00037590580040894024, 'samples': 9818304, 'steps': 51136, 'loss/train': 1.3154970407485962} -11/07/2021 04:26:03 - INFO - __main__ - Step 51138: {'lr': 0.0003759012157598643, 'samples': 9818496, 'steps': 51137, 'loss/train': 1.8281892538070679} -11/07/2021 04:26:03 - INFO - __main__ - Step 51139: {'lr': 0.00037589663105405924, 'samples': 9818688, 'steps': 51138, 'loss/train': 1.3921667337417603} -11/07/2021 04:26:03 - INFO - __main__ - Step 51140: {'lr': 0.00037589204629152705, 'samples': 9818880, 'steps': 51139, 'loss/train': 1.0147649049758911} -11/07/2021 04:26:04 - INFO - __main__ - Step 51141: {'lr': 0.00037588746147226994, 'samples': 9819072, 'steps': 51140, 'loss/train': 1.3558980226516724} -11/07/2021 04:26:04 - INFO - __main__ - Step 51142: {'lr': 0.00037588287659628977, 'samples': 9819264, 'steps': 51141, 'loss/train': 1.4923806190490723} -11/07/2021 04:26:05 - INFO - __main__ - Step 51143: {'lr': 0.0003758782916635888, 'samples': 9819456, 'steps': 51142, 'loss/train': 1.5209615230560303} -11/07/2021 04:26:05 - INFO - __main__ - Step 51144: {'lr': 0.000375873706674169, 'samples': 9819648, 'steps': 51143, 'loss/train': 1.5310009717941284} -11/07/2021 04:26:06 - INFO - __main__ - Step 51145: {'lr': 0.0003758691216280324, 'samples': 9819840, 'steps': 51144, 'loss/train': 1.2682783603668213} -11/07/2021 04:26:06 - INFO - __main__ - Step 51146: {'lr': 0.00037586453652518117, 'samples': 9820032, 'steps': 51145, 'loss/train': 1.249147891998291} -11/07/2021 04:26:06 - INFO - __main__ - Step 51147: {'lr': 0.00037585995136561734, 'samples': 9820224, 'steps': 51146, 'loss/train': 1.5766587257385254} -11/07/2021 04:26:07 - INFO - __main__ - Step 51148: {'lr': 0.0003758553661493429, 'samples': 9820416, 'steps': 51147, 'loss/train': 1.3657782077789307} -11/07/2021 04:26:08 - INFO - __main__ - Step 51149: {'lr': 0.00037585078087635994, 'samples': 9820608, 'steps': 51148, 'loss/train': 1.239439845085144} -11/07/2021 04:26:08 - INFO - __main__ - Step 51150: {'lr': 0.00037584619554667065, 'samples': 9820800, 'steps': 51149, 'loss/train': 1.6626681089401245} -11/07/2021 04:26:09 - INFO - __main__ - Step 51151: {'lr': 0.000375841610160277, 'samples': 9820992, 'steps': 51150, 'loss/train': 1.2145030498504639} -11/07/2021 04:26:09 - INFO - __main__ - Step 51152: {'lr': 0.00037583702471718106, 'samples': 9821184, 'steps': 51151, 'loss/train': 1.277573823928833} -11/07/2021 04:26:09 - INFO - __main__ - Step 51153: {'lr': 0.00037583243921738484, 'samples': 9821376, 'steps': 51152, 'loss/train': 1.323180079460144} -11/07/2021 04:26:10 - INFO - __main__ - Step 51154: {'lr': 0.0003758278536608905, 'samples': 9821568, 'steps': 51153, 'loss/train': 1.5218793153762817} -11/07/2021 04:26:11 - INFO - __main__ - Step 51155: {'lr': 0.00037582326804770004, 'samples': 9821760, 'steps': 51154, 'loss/train': 1.1672931909561157} -11/07/2021 04:26:11 - INFO - __main__ - Step 51156: {'lr': 0.0003758186823778156, 'samples': 9821952, 'steps': 51155, 'loss/train': 1.6178406476974487} -11/07/2021 04:26:11 - INFO - __main__ - Step 51157: {'lr': 0.0003758140966512392, 'samples': 9822144, 'steps': 51156, 'loss/train': 1.4110069274902344} -11/07/2021 04:26:12 - INFO - __main__ - Step 51158: {'lr': 0.0003758095108679729, 'samples': 9822336, 'steps': 51157, 'loss/train': 1.5689750909805298} -11/07/2021 04:26:13 - INFO - __main__ - Step 51159: {'lr': 0.0003758049250280188, 'samples': 9822528, 'steps': 51158, 'loss/train': 1.546869158744812} -11/07/2021 04:26:13 - INFO - __main__ - Step 51160: {'lr': 0.0003758003391313789, 'samples': 9822720, 'steps': 51159, 'loss/train': 1.3399982452392578} -11/07/2021 04:26:13 - INFO - __main__ - Step 51161: {'lr': 0.00037579575317805525, 'samples': 9822912, 'steps': 51160, 'loss/train': 1.4853978157043457} -11/07/2021 04:26:14 - INFO - __main__ - Step 51162: {'lr': 0.00037579116716805007, 'samples': 9823104, 'steps': 51161, 'loss/train': 1.910470962524414} -11/07/2021 04:26:14 - INFO - __main__ - Step 51163: {'lr': 0.00037578658110136535, 'samples': 9823296, 'steps': 51162, 'loss/train': 1.8178781270980835} -11/07/2021 04:26:15 - INFO - __main__ - Step 51164: {'lr': 0.00037578199497800304, 'samples': 9823488, 'steps': 51163, 'loss/train': 1.254246711730957} -11/07/2021 04:26:16 - INFO - __main__ - Step 51165: {'lr': 0.0003757774087979654, 'samples': 9823680, 'steps': 51164, 'loss/train': 1.3284828662872314} -11/07/2021 04:26:16 - INFO - __main__ - Step 51166: {'lr': 0.0003757728225612543, 'samples': 9823872, 'steps': 51165, 'loss/train': 1.1570911407470703} -11/07/2021 04:26:16 - INFO - __main__ - Step 51167: {'lr': 0.00037576823626787203, 'samples': 9824064, 'steps': 51166, 'loss/train': 1.0579010248184204} -11/07/2021 04:26:17 - INFO - __main__ - Step 51168: {'lr': 0.00037576364991782045, 'samples': 9824256, 'steps': 51167, 'loss/train': 1.2708224058151245} -11/07/2021 04:26:18 - INFO - __main__ - Step 51169: {'lr': 0.00037575906351110174, 'samples': 9824448, 'steps': 51168, 'loss/train': 1.0911803245544434} -11/07/2021 04:26:18 - INFO - __main__ - Step 51170: {'lr': 0.0003757544770477179, 'samples': 9824640, 'steps': 51169, 'loss/train': 1.6708488464355469} -11/07/2021 04:26:18 - INFO - __main__ - Step 51171: {'lr': 0.00037574989052767106, 'samples': 9824832, 'steps': 51170, 'loss/train': 1.4156115055084229} -11/07/2021 04:26:19 - INFO - __main__ - Step 51172: {'lr': 0.0003757453039509633, 'samples': 9825024, 'steps': 51171, 'loss/train': 1.4718499183654785} -11/07/2021 04:26:19 - INFO - __main__ - Step 51173: {'lr': 0.0003757407173175966, 'samples': 9825216, 'steps': 51172, 'loss/train': 1.422802448272705} -11/07/2021 04:26:20 - INFO - __main__ - Step 51174: {'lr': 0.00037573613062757304, 'samples': 9825408, 'steps': 51173, 'loss/train': 1.4421409368515015} -11/07/2021 04:26:20 - INFO - __main__ - Step 51175: {'lr': 0.00037573154388089483, 'samples': 9825600, 'steps': 51174, 'loss/train': 1.019473910331726} -11/07/2021 04:26:21 - INFO - __main__ - Step 51176: {'lr': 0.00037572695707756385, 'samples': 9825792, 'steps': 51175, 'loss/train': 1.5388219356536865} -11/07/2021 04:26:21 - INFO - __main__ - Step 51177: {'lr': 0.0003757223702175822, 'samples': 9825984, 'steps': 51176, 'loss/train': 1.487369179725647} -11/07/2021 04:26:22 - INFO - __main__ - Step 51178: {'lr': 0.00037571778330095206, 'samples': 9826176, 'steps': 51177, 'loss/train': 0.8048746585845947} -11/07/2021 04:26:22 - INFO - __main__ - Step 51179: {'lr': 0.00037571319632767543, 'samples': 9826368, 'steps': 51178, 'loss/train': 1.4266879558563232} -11/07/2021 04:26:23 - INFO - __main__ - Step 51180: {'lr': 0.0003757086092977544, 'samples': 9826560, 'steps': 51179, 'loss/train': 1.2909984588623047} -11/07/2021 04:26:23 - INFO - __main__ - Step 51181: {'lr': 0.00037570402221119093, 'samples': 9826752, 'steps': 51180, 'loss/train': 1.4604463577270508} -11/07/2021 04:26:24 - INFO - __main__ - Step 51182: {'lr': 0.0003756994350679872, 'samples': 9826944, 'steps': 51181, 'loss/train': 1.4334055185317993} -11/07/2021 04:26:24 - INFO - __main__ - Step 51183: {'lr': 0.00037569484786814525, 'samples': 9827136, 'steps': 51182, 'loss/train': 1.5371993780136108} -11/07/2021 04:26:24 - INFO - __main__ - Step 51184: {'lr': 0.0003756902606116671, 'samples': 9827328, 'steps': 51183, 'loss/train': 1.7246803045272827} -11/07/2021 04:26:26 - INFO - __main__ - Step 51185: {'lr': 0.00037568567329855483, 'samples': 9827520, 'steps': 51184, 'loss/train': 1.031441330909729} -11/07/2021 04:26:26 - INFO - __main__ - Step 51186: {'lr': 0.00037568108592881067, 'samples': 9827712, 'steps': 51185, 'loss/train': 0.8346840739250183} -11/07/2021 04:26:26 - INFO - __main__ - Step 51187: {'lr': 0.00037567649850243646, 'samples': 9827904, 'steps': 51186, 'loss/train': 1.7006884813308716} -11/07/2021 04:26:27 - INFO - __main__ - Step 51188: {'lr': 0.00037567191101943437, 'samples': 9828096, 'steps': 51187, 'loss/train': 1.8177293539047241} -11/07/2021 04:26:27 - INFO - __main__ - Step 51189: {'lr': 0.00037566732347980647, 'samples': 9828288, 'steps': 51188, 'loss/train': 1.2582699060440063} -11/07/2021 04:26:28 - INFO - __main__ - Step 51190: {'lr': 0.0003756627358835548, 'samples': 9828480, 'steps': 51189, 'loss/train': 1.6479040384292603} -11/07/2021 04:26:28 - INFO - __main__ - Step 51191: {'lr': 0.00037565814823068143, 'samples': 9828672, 'steps': 51190, 'loss/train': 1.7629849910736084} -11/07/2021 04:26:29 - INFO - __main__ - Step 51192: {'lr': 0.0003756535605211885, 'samples': 9828864, 'steps': 51191, 'loss/train': 0.8963702917098999} -11/07/2021 04:26:29 - INFO - __main__ - Step 51193: {'lr': 0.000375648972755078, 'samples': 9829056, 'steps': 51192, 'loss/train': 1.5291481018066406} -11/07/2021 04:26:29 - INFO - __main__ - Step 51194: {'lr': 0.00037564438493235195, 'samples': 9829248, 'steps': 51193, 'loss/train': 1.6048918962478638} -11/07/2021 04:26:31 - INFO - __main__ - Step 51195: {'lr': 0.0003756397970530125, 'samples': 9829440, 'steps': 51194, 'loss/train': 1.336006999015808} -11/07/2021 04:26:31 - INFO - __main__ - Step 51196: {'lr': 0.00037563520911706175, 'samples': 9829632, 'steps': 51195, 'loss/train': 1.1494961977005005} -11/07/2021 04:26:32 - INFO - __main__ - Step 51197: {'lr': 0.0003756306211245016, 'samples': 9829824, 'steps': 51196, 'loss/train': 1.3077516555786133} -11/07/2021 04:26:32 - INFO - __main__ - Step 51198: {'lr': 0.0003756260330753343, 'samples': 9830016, 'steps': 51197, 'loss/train': 1.2972228527069092} -11/07/2021 04:26:32 - INFO - __main__ - Step 51199: {'lr': 0.00037562144496956193, 'samples': 9830208, 'steps': 51198, 'loss/train': 0.075208380818367} -11/07/2021 04:26:33 - INFO - __main__ - Step 51200: {'lr': 0.0003756168568071864, 'samples': 9830400, 'steps': 51199, 'loss/train': 1.175175666809082} -11/07/2021 04:26:34 - INFO - __main__ - Step 51201: {'lr': 0.0003756122685882098, 'samples': 9830592, 'steps': 51200, 'loss/train': 1.2902253866195679} -11/07/2021 04:26:34 - INFO - __main__ - Step 51202: {'lr': 0.00037560768031263427, 'samples': 9830784, 'steps': 51201, 'loss/train': 1.6287318468093872} -11/07/2021 04:26:34 - INFO - __main__ - Step 51203: {'lr': 0.0003756030919804619, 'samples': 9830976, 'steps': 51202, 'loss/train': 1.1665724515914917} -11/07/2021 04:26:35 - INFO - __main__ - Step 51204: {'lr': 0.00037559850359169465, 'samples': 9831168, 'steps': 51203, 'loss/train': 1.0926939249038696} -11/07/2021 04:26:35 - INFO - __main__ - Step 51205: {'lr': 0.0003755939151463347, 'samples': 9831360, 'steps': 51204, 'loss/train': 1.5217796564102173} -11/07/2021 04:26:36 - INFO - __main__ - Step 51206: {'lr': 0.0003755893266443842, 'samples': 9831552, 'steps': 51205, 'loss/train': 1.3197687864303589} -11/07/2021 04:26:37 - INFO - __main__ - Step 51207: {'lr': 0.0003755847380858449, 'samples': 9831744, 'steps': 51206, 'loss/train': 1.1206849813461304} -11/07/2021 04:26:37 - INFO - __main__ - Step 51208: {'lr': 0.0003755801494707191, 'samples': 9831936, 'steps': 51207, 'loss/train': 1.1840324401855469} -11/07/2021 04:26:37 - INFO - __main__ - Step 51209: {'lr': 0.00037557556079900886, 'samples': 9832128, 'steps': 51208, 'loss/train': 1.5369545221328735} -11/07/2021 04:26:38 - INFO - __main__ - Step 51210: {'lr': 0.0003755709720707161, 'samples': 9832320, 'steps': 51209, 'loss/train': 1.1344716548919678} -11/07/2021 04:26:39 - INFO - __main__ - Step 51211: {'lr': 0.00037556638328584314, 'samples': 9832512, 'steps': 51210, 'loss/train': 1.7113068103790283} -11/07/2021 04:26:39 - INFO - __main__ - Step 51212: {'lr': 0.0003755617944443919, 'samples': 9832704, 'steps': 51211, 'loss/train': 1.5996965169906616} -11/07/2021 04:26:39 - INFO - __main__ - Step 51213: {'lr': 0.00037555720554636443, 'samples': 9832896, 'steps': 51212, 'loss/train': 1.3318369388580322} -11/07/2021 04:26:40 - INFO - __main__ - Step 51214: {'lr': 0.00037555261659176275, 'samples': 9833088, 'steps': 51213, 'loss/train': 1.6860949993133545} -11/07/2021 04:26:40 - INFO - __main__ - Step 51215: {'lr': 0.00037554802758058903, 'samples': 9833280, 'steps': 51214, 'loss/train': 1.3410645723342896} -11/07/2021 04:26:41 - INFO - __main__ - Step 51216: {'lr': 0.0003755434385128453, 'samples': 9833472, 'steps': 51215, 'loss/train': 1.4011985063552856} -11/07/2021 04:26:41 - INFO - __main__ - Step 51217: {'lr': 0.00037553884938853365, 'samples': 9833664, 'steps': 51216, 'loss/train': 1.1416559219360352} -11/07/2021 04:26:42 - INFO - __main__ - Step 51218: {'lr': 0.0003755342602076561, 'samples': 9833856, 'steps': 51217, 'loss/train': 1.0293290615081787} -11/07/2021 04:26:42 - INFO - __main__ - Step 51219: {'lr': 0.0003755296709702148, 'samples': 9834048, 'steps': 51218, 'loss/train': 1.7509585618972778} -11/07/2021 04:26:42 - INFO - __main__ - Step 51220: {'lr': 0.0003755250816762118, 'samples': 9834240, 'steps': 51219, 'loss/train': 1.5241022109985352} -11/07/2021 04:26:44 - INFO - __main__ - Step 51221: {'lr': 0.00037552049232564906, 'samples': 9834432, 'steps': 51220, 'loss/train': 1.921941876411438} -11/07/2021 04:26:44 - INFO - __main__ - Step 51222: {'lr': 0.0003755159029185288, 'samples': 9834624, 'steps': 51221, 'loss/train': 1.2071889638900757} -11/07/2021 04:26:44 - INFO - __main__ - Step 51223: {'lr': 0.0003755113134548529, 'samples': 9834816, 'steps': 51222, 'loss/train': 1.339905858039856} -11/07/2021 04:26:45 - INFO - __main__ - Step 51224: {'lr': 0.00037550672393462357, 'samples': 9835008, 'steps': 51223, 'loss/train': 1.5776480436325073} -11/07/2021 04:26:45 - INFO - __main__ - Step 51225: {'lr': 0.0003755021343578429, 'samples': 9835200, 'steps': 51224, 'loss/train': 1.6987099647521973} -11/07/2021 04:26:46 - INFO - __main__ - Step 51226: {'lr': 0.0003754975447245129, 'samples': 9835392, 'steps': 51225, 'loss/train': 1.362648844718933} -11/07/2021 04:26:46 - INFO - __main__ - Step 51227: {'lr': 0.00037549295503463563, 'samples': 9835584, 'steps': 51226, 'loss/train': 1.7931948900222778} -11/07/2021 04:26:47 - INFO - __main__ - Step 51228: {'lr': 0.0003754883652882132, 'samples': 9835776, 'steps': 51227, 'loss/train': 1.7281259298324585} -11/07/2021 04:26:47 - INFO - __main__ - Step 51229: {'lr': 0.00037548377548524755, 'samples': 9835968, 'steps': 51228, 'loss/train': 1.7389373779296875} -11/07/2021 04:26:47 - INFO - __main__ - Step 51230: {'lr': 0.0003754791856257409, 'samples': 9836160, 'steps': 51229, 'loss/train': 1.3119885921478271} -11/07/2021 04:26:48 - INFO - __main__ - Step 51231: {'lr': 0.00037547459570969527, 'samples': 9836352, 'steps': 51230, 'loss/train': 1.4407776594161987} -11/07/2021 04:26:49 - INFO - __main__ - Step 51232: {'lr': 0.0003754700057371127, 'samples': 9836544, 'steps': 51231, 'loss/train': 1.476395606994629} -11/07/2021 04:26:49 - INFO - __main__ - Step 51233: {'lr': 0.0003754654157079954, 'samples': 9836736, 'steps': 51232, 'loss/train': 1.6063034534454346} -11/07/2021 04:26:49 - INFO - __main__ - Step 51234: {'lr': 0.00037546082562234516, 'samples': 9836928, 'steps': 51233, 'loss/train': 1.552552580833435} -11/07/2021 04:26:50 - INFO - __main__ - Step 51235: {'lr': 0.00037545623548016426, 'samples': 9837120, 'steps': 51234, 'loss/train': 1.502600073814392} -11/07/2021 04:26:51 - INFO - __main__ - Step 51236: {'lr': 0.00037545164528145474, 'samples': 9837312, 'steps': 51235, 'loss/train': 1.330193281173706} -11/07/2021 04:26:51 - INFO - __main__ - Step 51237: {'lr': 0.00037544705502621866, 'samples': 9837504, 'steps': 51236, 'loss/train': 1.2627513408660889} -11/07/2021 04:26:52 - INFO - __main__ - Step 51238: {'lr': 0.000375442464714458, 'samples': 9837696, 'steps': 51237, 'loss/train': 2.0160419940948486} -11/07/2021 04:26:52 - INFO - __main__ - Step 51239: {'lr': 0.000375437874346175, 'samples': 9837888, 'steps': 51238, 'loss/train': 1.600635051727295} -11/07/2021 04:26:52 - INFO - __main__ - Step 51240: {'lr': 0.0003754332839213716, 'samples': 9838080, 'steps': 51239, 'loss/train': 1.4182648658752441} -11/07/2021 04:26:53 - INFO - __main__ - Step 51241: {'lr': 0.00037542869344004987, 'samples': 9838272, 'steps': 51240, 'loss/train': 1.7461457252502441} -11/07/2021 04:26:54 - INFO - __main__ - Step 51242: {'lr': 0.0003754241029022119, 'samples': 9838464, 'steps': 51241, 'loss/train': 1.2371352910995483} -11/07/2021 04:26:54 - INFO - __main__ - Step 51243: {'lr': 0.00037541951230785975, 'samples': 9838656, 'steps': 51242, 'loss/train': 1.3465973138809204} -11/07/2021 04:26:54 - INFO - __main__ - Step 51244: {'lr': 0.00037541492165699554, 'samples': 9838848, 'steps': 51243, 'loss/train': 1.5332742929458618} -11/07/2021 04:26:55 - INFO - __main__ - Step 51245: {'lr': 0.0003754103309496213, 'samples': 9839040, 'steps': 51244, 'loss/train': 1.625928521156311} -11/07/2021 04:26:55 - INFO - __main__ - Step 51246: {'lr': 0.00037540574018573913, 'samples': 9839232, 'steps': 51245, 'loss/train': 1.4563348293304443} -11/07/2021 04:26:56 - INFO - __main__ - Step 51247: {'lr': 0.00037540114936535107, 'samples': 9839424, 'steps': 51246, 'loss/train': 0.9256128668785095} -11/07/2021 04:26:56 - INFO - __main__ - Step 51248: {'lr': 0.0003753965584884591, 'samples': 9839616, 'steps': 51247, 'loss/train': 1.4945613145828247} -11/07/2021 04:26:57 - INFO - __main__ - Step 51249: {'lr': 0.00037539196755506546, 'samples': 9839808, 'steps': 51248, 'loss/train': 1.4203832149505615} -11/07/2021 04:26:57 - INFO - __main__ - Step 51250: {'lr': 0.0003753873765651721, 'samples': 9840000, 'steps': 51249, 'loss/train': 1.7863932847976685} -11/07/2021 04:26:57 - INFO - __main__ - Step 51251: {'lr': 0.0003753827855187811, 'samples': 9840192, 'steps': 51250, 'loss/train': 1.2520095109939575} -11/07/2021 04:26:59 - INFO - __main__ - Step 51252: {'lr': 0.00037537819441589457, 'samples': 9840384, 'steps': 51251, 'loss/train': 1.857222318649292} -11/07/2021 04:26:59 - INFO - __main__ - Step 51253: {'lr': 0.0003753736032565146, 'samples': 9840576, 'steps': 51252, 'loss/train': 1.4762943983078003} -11/07/2021 04:26:59 - INFO - __main__ - Step 51254: {'lr': 0.0003753690120406432, 'samples': 9840768, 'steps': 51253, 'loss/train': 1.2805707454681396} -11/07/2021 04:27:00 - INFO - __main__ - Step 51255: {'lr': 0.00037536442076828235, 'samples': 9840960, 'steps': 51254, 'loss/train': 1.5488632917404175} -11/07/2021 04:27:00 - INFO - __main__ - Step 51256: {'lr': 0.00037535982943943437, 'samples': 9841152, 'steps': 51255, 'loss/train': 1.2295396327972412} -11/07/2021 04:27:00 - INFO - __main__ - Step 51257: {'lr': 0.0003753552380541011, 'samples': 9841344, 'steps': 51256, 'loss/train': 1.6443824768066406} -11/07/2021 04:27:02 - INFO - __main__ - Step 51258: {'lr': 0.00037535064661228476, 'samples': 9841536, 'steps': 51257, 'loss/train': 1.77608060836792} -11/07/2021 04:27:02 - INFO - __main__ - Step 51259: {'lr': 0.00037534605511398736, 'samples': 9841728, 'steps': 51258, 'loss/train': 1.365010380744934} -11/07/2021 04:27:02 - INFO - __main__ - Step 51260: {'lr': 0.0003753414635592109, 'samples': 9841920, 'steps': 51259, 'loss/train': 1.306699514389038} -11/07/2021 04:27:03 - INFO - __main__ - Step 51261: {'lr': 0.0003753368719479575, 'samples': 9842112, 'steps': 51260, 'loss/train': 1.4501153230667114} -11/07/2021 04:27:03 - INFO - __main__ - Step 51262: {'lr': 0.00037533228028022923, 'samples': 9842304, 'steps': 51261, 'loss/train': 0.8957582116127014} -11/07/2021 04:27:04 - INFO - __main__ - Step 51263: {'lr': 0.0003753276885560283, 'samples': 9842496, 'steps': 51262, 'loss/train': 1.4621988534927368} -11/07/2021 04:27:04 - INFO - __main__ - Step 51264: {'lr': 0.0003753230967753566, 'samples': 9842688, 'steps': 51263, 'loss/train': 1.0747171640396118} -11/07/2021 04:27:05 - INFO - __main__ - Step 51265: {'lr': 0.00037531850493821616, 'samples': 9842880, 'steps': 51264, 'loss/train': 1.7383825778961182} -11/07/2021 04:27:05 - INFO - __main__ - Step 51266: {'lr': 0.00037531391304460916, 'samples': 9843072, 'steps': 51265, 'loss/train': 1.8504222631454468} -11/07/2021 04:27:05 - INFO - __main__ - Step 51267: {'lr': 0.00037530932109453767, 'samples': 9843264, 'steps': 51266, 'loss/train': 0.8919113874435425} -11/07/2021 04:27:06 - INFO - __main__ - Step 51268: {'lr': 0.00037530472908800375, 'samples': 9843456, 'steps': 51267, 'loss/train': 1.6534337997436523} -11/07/2021 04:27:07 - INFO - __main__ - Step 51269: {'lr': 0.0003753001370250094, 'samples': 9843648, 'steps': 51268, 'loss/train': 1.3912287950515747} -11/07/2021 04:27:07 - INFO - __main__ - Step 51270: {'lr': 0.00037529554490555686, 'samples': 9843840, 'steps': 51269, 'loss/train': 1.5490639209747314} -11/07/2021 04:27:07 - INFO - __main__ - Step 51271: {'lr': 0.00037529095272964796, 'samples': 9844032, 'steps': 51270, 'loss/train': 0.9925702810287476} -11/07/2021 04:27:08 - INFO - __main__ - Step 51272: {'lr': 0.0003752863604972849, 'samples': 9844224, 'steps': 51271, 'loss/train': 1.397322177886963} -11/07/2021 04:27:09 - INFO - __main__ - Step 51273: {'lr': 0.00037528176820846975, 'samples': 9844416, 'steps': 51272, 'loss/train': 1.414917230606079} -11/07/2021 04:27:09 - INFO - __main__ - Step 51274: {'lr': 0.00037527717586320457, 'samples': 9844608, 'steps': 51273, 'loss/train': 1.25178062915802} -11/07/2021 04:27:10 - INFO - __main__ - Step 51275: {'lr': 0.00037527258346149153, 'samples': 9844800, 'steps': 51274, 'loss/train': 1.7030956745147705} -11/07/2021 04:27:10 - INFO - __main__ - Step 51276: {'lr': 0.0003752679910033325, 'samples': 9844992, 'steps': 51275, 'loss/train': 1.7786269187927246} -11/07/2021 04:27:10 - INFO - __main__ - Step 51277: {'lr': 0.00037526339848872956, 'samples': 9845184, 'steps': 51276, 'loss/train': 1.3212450742721558} -11/07/2021 04:27:11 - INFO - __main__ - Step 51278: {'lr': 0.000375258805917685, 'samples': 9845376, 'steps': 51277, 'loss/train': 1.3959523439407349} -11/07/2021 04:27:12 - INFO - __main__ - Step 51279: {'lr': 0.0003752542132902007, 'samples': 9845568, 'steps': 51278, 'loss/train': 1.5075372457504272} -11/07/2021 04:27:12 - INFO - __main__ - Step 51280: {'lr': 0.00037524962060627885, 'samples': 9845760, 'steps': 51279, 'loss/train': 1.4516735076904297} -11/07/2021 04:27:12 - INFO - __main__ - Step 51281: {'lr': 0.0003752450278659214, 'samples': 9845952, 'steps': 51280, 'loss/train': 1.4751049280166626} -11/07/2021 04:27:13 - INFO - __main__ - Step 51282: {'lr': 0.00037524043506913045, 'samples': 9846144, 'steps': 51281, 'loss/train': 1.726582646369934} -11/07/2021 04:27:13 - INFO - __main__ - Step 51283: {'lr': 0.0003752358422159081, 'samples': 9846336, 'steps': 51282, 'loss/train': 1.9660826921463013} -11/07/2021 04:27:14 - INFO - __main__ - Step 51284: {'lr': 0.0003752312493062564, 'samples': 9846528, 'steps': 51283, 'loss/train': 1.5405163764953613} -11/07/2021 04:27:14 - INFO - __main__ - Step 51285: {'lr': 0.0003752266563401775, 'samples': 9846720, 'steps': 51284, 'loss/train': 1.2178876399993896} -11/07/2021 04:27:15 - INFO - __main__ - Step 51286: {'lr': 0.00037522206331767335, 'samples': 9846912, 'steps': 51285, 'loss/train': 1.6081781387329102} -11/07/2021 04:27:15 - INFO - __main__ - Step 51287: {'lr': 0.00037521747023874606, 'samples': 9847104, 'steps': 51286, 'loss/train': 1.0516690015792847} -11/07/2021 04:27:15 - INFO - __main__ - Step 51288: {'lr': 0.0003752128771033978, 'samples': 9847296, 'steps': 51287, 'loss/train': 1.0194778442382812} -11/07/2021 04:27:17 - INFO - __main__ - Step 51289: {'lr': 0.0003752082839116304, 'samples': 9847488, 'steps': 51288, 'loss/train': 1.3066163063049316} -11/07/2021 04:27:17 - INFO - __main__ - Step 51290: {'lr': 0.0003752036906634462, 'samples': 9847680, 'steps': 51289, 'loss/train': 1.0381736755371094} -11/07/2021 04:27:17 - INFO - __main__ - Step 51291: {'lr': 0.0003751990973588471, 'samples': 9847872, 'steps': 51290, 'loss/train': 2.442082166671753} -11/07/2021 04:27:18 - INFO - __main__ - Step 51292: {'lr': 0.0003751945039978353, 'samples': 9848064, 'steps': 51291, 'loss/train': 1.7478818893432617} -11/07/2021 04:27:18 - INFO - __main__ - Step 51293: {'lr': 0.00037518991058041267, 'samples': 9848256, 'steps': 51292, 'loss/train': 1.6824642419815063} -11/07/2021 04:27:20 - INFO - __main__ - Step 51294: {'lr': 0.00037518531710658144, 'samples': 9848448, 'steps': 51293, 'loss/train': 1.36592435836792} -11/07/2021 04:27:20 - INFO - __main__ - Step 51295: {'lr': 0.0003751807235763437, 'samples': 9848640, 'steps': 51294, 'loss/train': 1.5273423194885254} -11/07/2021 04:27:21 - INFO - __main__ - Step 51296: {'lr': 0.00037517612998970136, 'samples': 9848832, 'steps': 51295, 'loss/train': 1.6209473609924316} -11/07/2021 04:27:21 - INFO - __main__ - Step 51297: {'lr': 0.00037517153634665664, 'samples': 9849024, 'steps': 51296, 'loss/train': 1.7631850242614746} -11/07/2021 04:27:21 - INFO - __main__ - Step 51298: {'lr': 0.0003751669426472115, 'samples': 9849216, 'steps': 51297, 'loss/train': 1.006211280822754} -11/07/2021 04:27:22 - INFO - __main__ - Step 51299: {'lr': 0.0003751623488913681, 'samples': 9849408, 'steps': 51298, 'loss/train': 1.5204555988311768} -11/07/2021 04:27:22 - INFO - __main__ - Step 51300: {'lr': 0.00037515775507912855, 'samples': 9849600, 'steps': 51299, 'loss/train': 1.7774275541305542} -11/07/2021 04:27:23 - INFO - __main__ - Step 51301: {'lr': 0.0003751531612104948, 'samples': 9849792, 'steps': 51300, 'loss/train': 0.8453087210655212} -11/07/2021 04:27:24 - INFO - __main__ - Step 51302: {'lr': 0.00037514856728546893, 'samples': 9849984, 'steps': 51301, 'loss/train': 1.785905122756958} -11/07/2021 04:27:24 - INFO - __main__ - Step 51303: {'lr': 0.00037514397330405306, 'samples': 9850176, 'steps': 51302, 'loss/train': 1.390616536140442} -11/07/2021 04:27:24 - INFO - __main__ - Step 51304: {'lr': 0.00037513937926624924, 'samples': 9850368, 'steps': 51303, 'loss/train': 1.6205112934112549} -11/07/2021 04:27:25 - INFO - __main__ - Step 51305: {'lr': 0.0003751347851720596, 'samples': 9850560, 'steps': 51304, 'loss/train': 1.3488975763320923} -11/07/2021 04:27:25 - INFO - __main__ - Step 51306: {'lr': 0.00037513019102148606, 'samples': 9850752, 'steps': 51305, 'loss/train': 1.1012285947799683} -11/07/2021 04:27:26 - INFO - __main__ - Step 51307: {'lr': 0.0003751255968145309, 'samples': 9850944, 'steps': 51306, 'loss/train': 1.2730046510696411} -11/07/2021 04:27:26 - INFO - __main__ - Step 51308: {'lr': 0.00037512100255119603, 'samples': 9851136, 'steps': 51307, 'loss/train': 1.618487000465393} -11/07/2021 04:27:27 - INFO - __main__ - Step 51309: {'lr': 0.0003751164082314835, 'samples': 9851328, 'steps': 51308, 'loss/train': 1.5488232374191284} -11/07/2021 04:27:27 - INFO - __main__ - Step 51310: {'lr': 0.00037511181385539553, 'samples': 9851520, 'steps': 51309, 'loss/train': 0.549214243888855} -11/07/2021 04:27:28 - INFO - __main__ - Step 51311: {'lr': 0.00037510721942293415, 'samples': 9851712, 'steps': 51310, 'loss/train': 1.7520240545272827} -11/07/2021 04:27:28 - INFO - __main__ - Step 51312: {'lr': 0.0003751026249341013, 'samples': 9851904, 'steps': 51311, 'loss/train': 1.4599018096923828} -11/07/2021 04:27:29 - INFO - __main__ - Step 51313: {'lr': 0.0003750980303888991, 'samples': 9852096, 'steps': 51312, 'loss/train': 1.903134822845459} -11/07/2021 04:27:29 - INFO - __main__ - Step 51314: {'lr': 0.0003750934357873298, 'samples': 9852288, 'steps': 51313, 'loss/train': 1.5627148151397705} -11/07/2021 04:27:30 - INFO - __main__ - Step 51315: {'lr': 0.00037508884112939523, 'samples': 9852480, 'steps': 51314, 'loss/train': 1.7844643592834473} -11/07/2021 04:27:30 - INFO - __main__ - Step 51316: {'lr': 0.0003750842464150975, 'samples': 9852672, 'steps': 51315, 'loss/train': 1.4671173095703125} -11/07/2021 04:27:30 - INFO - __main__ - Step 51317: {'lr': 0.0003750796516444389, 'samples': 9852864, 'steps': 51316, 'loss/train': 1.6843032836914062} -11/07/2021 04:27:31 - INFO - __main__ - Step 51318: {'lr': 0.0003750750568174212, 'samples': 9853056, 'steps': 51317, 'loss/train': 1.5260761976242065} -11/07/2021 04:27:32 - INFO - __main__ - Step 51319: {'lr': 0.00037507046193404665, 'samples': 9853248, 'steps': 51318, 'loss/train': 1.6331720352172852} -11/07/2021 04:27:32 - INFO - __main__ - Step 51320: {'lr': 0.0003750658669943173, 'samples': 9853440, 'steps': 51319, 'loss/train': 1.2930999994277954} -11/07/2021 04:27:32 - INFO - __main__ - Step 51321: {'lr': 0.00037506127199823523, 'samples': 9853632, 'steps': 51320, 'loss/train': 0.9876997470855713} -11/07/2021 04:27:33 - INFO - __main__ - Step 51322: {'lr': 0.00037505667694580244, 'samples': 9853824, 'steps': 51321, 'loss/train': 1.3453137874603271} -11/07/2021 04:27:34 - INFO - __main__ - Step 51323: {'lr': 0.000375052081837021, 'samples': 9854016, 'steps': 51322, 'loss/train': 2.2082297801971436} -11/07/2021 04:27:34 - INFO - __main__ - Step 51324: {'lr': 0.0003750474866718931, 'samples': 9854208, 'steps': 51323, 'loss/train': 0.22028931975364685} -11/07/2021 04:27:35 - INFO - __main__ - Step 51325: {'lr': 0.0003750428914504207, 'samples': 9854400, 'steps': 51324, 'loss/train': 1.3859983682632446} -11/07/2021 04:27:35 - INFO - __main__ - Step 51326: {'lr': 0.0003750382961726059, 'samples': 9854592, 'steps': 51325, 'loss/train': 2.015860080718994} -11/07/2021 04:27:35 - INFO - __main__ - Step 51327: {'lr': 0.0003750337008384508, 'samples': 9854784, 'steps': 51326, 'loss/train': 1.8525826930999756} -11/07/2021 04:27:36 - INFO - __main__ - Step 51328: {'lr': 0.0003750291054479574, 'samples': 9854976, 'steps': 51327, 'loss/train': 1.1386030912399292} -11/07/2021 04:27:37 - INFO - __main__ - Step 51329: {'lr': 0.0003750245100011278, 'samples': 9855168, 'steps': 51328, 'loss/train': 1.5202986001968384} -11/07/2021 04:27:37 - INFO - __main__ - Step 51330: {'lr': 0.00037501991449796415, 'samples': 9855360, 'steps': 51329, 'loss/train': 0.1436721235513687} -11/07/2021 04:27:37 - INFO - __main__ - Step 51331: {'lr': 0.0003750153189384684, 'samples': 9855552, 'steps': 51330, 'loss/train': 1.4653372764587402} -11/07/2021 04:27:38 - INFO - __main__ - Step 51332: {'lr': 0.00037501072332264267, 'samples': 9855744, 'steps': 51331, 'loss/train': 1.437253713607788} -11/07/2021 04:27:38 - INFO - __main__ - Step 51333: {'lr': 0.0003750061276504891, 'samples': 9855936, 'steps': 51332, 'loss/train': 1.316138505935669} -11/07/2021 04:27:39 - INFO - __main__ - Step 51334: {'lr': 0.0003750015319220097, 'samples': 9856128, 'steps': 51333, 'loss/train': 1.7797185182571411} -11/07/2021 04:27:39 - INFO - __main__ - Step 51335: {'lr': 0.0003749969361372065, 'samples': 9856320, 'steps': 51334, 'loss/train': 1.5513956546783447} -11/07/2021 04:27:40 - INFO - __main__ - Step 51336: {'lr': 0.0003749923402960816, 'samples': 9856512, 'steps': 51335, 'loss/train': 1.8163543939590454} -11/07/2021 04:27:40 - INFO - __main__ - Step 51337: {'lr': 0.00037498774439863704, 'samples': 9856704, 'steps': 51336, 'loss/train': 1.3807144165039062} -11/07/2021 04:27:41 - INFO - __main__ - Step 51338: {'lr': 0.000374983148444875, 'samples': 9856896, 'steps': 51337, 'loss/train': 1.6411243677139282} -11/07/2021 04:27:41 - INFO - __main__ - Step 51339: {'lr': 0.00037497855243479744, 'samples': 9857088, 'steps': 51338, 'loss/train': 1.4071072340011597} -11/07/2021 04:27:42 - INFO - __main__ - Step 51340: {'lr': 0.0003749739563684065, 'samples': 9857280, 'steps': 51339, 'loss/train': 0.8938208818435669} -11/07/2021 04:27:42 - INFO - __main__ - Step 51341: {'lr': 0.00037496936024570426, 'samples': 9857472, 'steps': 51340, 'loss/train': 1.4135487079620361} -11/07/2021 04:27:43 - INFO - __main__ - Step 51342: {'lr': 0.0003749647640666927, 'samples': 9857664, 'steps': 51341, 'loss/train': 0.7178032398223877} -11/07/2021 04:27:43 - INFO - __main__ - Step 51343: {'lr': 0.000374960167831374, 'samples': 9857856, 'steps': 51342, 'loss/train': 1.3337452411651611} -11/07/2021 04:27:44 - INFO - __main__ - Step 51344: {'lr': 0.00037495557153975016, 'samples': 9858048, 'steps': 51343, 'loss/train': 1.2852369546890259} -11/07/2021 04:27:44 - INFO - __main__ - Step 51345: {'lr': 0.0003749509751918232, 'samples': 9858240, 'steps': 51344, 'loss/train': 1.4947065114974976} -11/07/2021 04:27:45 - INFO - __main__ - Step 51346: {'lr': 0.0003749463787875953, 'samples': 9858432, 'steps': 51345, 'loss/train': 1.188281774520874} -11/07/2021 04:27:45 - INFO - __main__ - Step 51347: {'lr': 0.00037494178232706847, 'samples': 9858624, 'steps': 51346, 'loss/train': 1.556554913520813} -11/07/2021 04:27:45 - INFO - __main__ - Step 51348: {'lr': 0.00037493718581024484, 'samples': 9858816, 'steps': 51347, 'loss/train': 1.08109450340271} -11/07/2021 04:27:46 - INFO - __main__ - Step 51349: {'lr': 0.0003749325892371264, 'samples': 9859008, 'steps': 51348, 'loss/train': 1.705818772315979} -11/07/2021 04:27:47 - INFO - __main__ - Step 51350: {'lr': 0.0003749279926077153, 'samples': 9859200, 'steps': 51349, 'loss/train': 1.6825324296951294} -11/07/2021 04:27:47 - INFO - __main__ - Step 51351: {'lr': 0.0003749233959220136, 'samples': 9859392, 'steps': 51350, 'loss/train': 1.872248649597168} -11/07/2021 04:27:47 - INFO - __main__ - Step 51352: {'lr': 0.00037491879918002323, 'samples': 9859584, 'steps': 51351, 'loss/train': 1.6915991306304932} -11/07/2021 04:27:48 - INFO - __main__ - Step 51353: {'lr': 0.0003749142023817465, 'samples': 9859776, 'steps': 51352, 'loss/train': 1.0961235761642456} -11/07/2021 04:27:48 - INFO - __main__ - Step 51354: {'lr': 0.00037490960552718534, 'samples': 9859968, 'steps': 51353, 'loss/train': 1.577583909034729} -11/07/2021 04:27:49 - INFO - __main__ - Step 51355: {'lr': 0.00037490500861634183, 'samples': 9860160, 'steps': 51354, 'loss/train': 1.4419667720794678} -11/07/2021 04:27:50 - INFO - __main__ - Step 51356: {'lr': 0.00037490041164921803, 'samples': 9860352, 'steps': 51355, 'loss/train': 1.8501923084259033} -11/07/2021 04:27:50 - INFO - __main__ - Step 51357: {'lr': 0.000374895814625816, 'samples': 9860544, 'steps': 51356, 'loss/train': 1.4689220190048218} -11/07/2021 04:27:50 - INFO - __main__ - Step 51358: {'lr': 0.00037489121754613787, 'samples': 9860736, 'steps': 51357, 'loss/train': 1.227744698524475} -11/07/2021 04:27:51 - INFO - __main__ - Step 51359: {'lr': 0.00037488662041018574, 'samples': 9860928, 'steps': 51358, 'loss/train': 1.2650045156478882} -11/07/2021 04:27:52 - INFO - __main__ - Step 51360: {'lr': 0.00037488202321796156, 'samples': 9861120, 'steps': 51359, 'loss/train': 1.6581660509109497} -11/07/2021 04:27:52 - INFO - __main__ - Step 51361: {'lr': 0.0003748774259694675, 'samples': 9861312, 'steps': 51360, 'loss/train': 1.516729474067688} -11/07/2021 04:27:52 - INFO - __main__ - Step 51362: {'lr': 0.00037487282866470565, 'samples': 9861504, 'steps': 51361, 'loss/train': 1.3707294464111328} -11/07/2021 04:27:53 - INFO - __main__ - Step 51363: {'lr': 0.00037486823130367786, 'samples': 9861696, 'steps': 51362, 'loss/train': 1.912338137626648} -11/07/2021 04:27:53 - INFO - __main__ - Step 51364: {'lr': 0.0003748636338863865, 'samples': 9861888, 'steps': 51363, 'loss/train': 1.4236916303634644} -11/07/2021 04:27:54 - INFO - __main__ - Step 51365: {'lr': 0.0003748590364128335, 'samples': 9862080, 'steps': 51364, 'loss/train': 1.3337184190750122} -11/07/2021 04:27:54 - INFO - __main__ - Step 51366: {'lr': 0.00037485443888302095, 'samples': 9862272, 'steps': 51365, 'loss/train': 1.347653865814209} -11/07/2021 04:27:55 - INFO - __main__ - Step 51367: {'lr': 0.00037484984129695096, 'samples': 9862464, 'steps': 51366, 'loss/train': 1.1018328666687012} -11/07/2021 04:27:55 - INFO - __main__ - Step 51368: {'lr': 0.00037484524365462545, 'samples': 9862656, 'steps': 51367, 'loss/train': 2.0757765769958496} -11/07/2021 04:27:55 - INFO - __main__ - Step 51369: {'lr': 0.0003748406459560466, 'samples': 9862848, 'steps': 51368, 'loss/train': 1.8313307762145996} -11/07/2021 04:27:56 - INFO - __main__ - Step 51370: {'lr': 0.0003748360482012166, 'samples': 9863040, 'steps': 51369, 'loss/train': 1.4531660079956055} -11/07/2021 04:27:57 - INFO - __main__ - Step 51371: {'lr': 0.00037483145039013735, 'samples': 9863232, 'steps': 51370, 'loss/train': 1.2641748189926147} -11/07/2021 04:27:57 - INFO - __main__ - Step 51372: {'lr': 0.0003748268525228109, 'samples': 9863424, 'steps': 51371, 'loss/train': 1.3420898914337158} -11/07/2021 04:27:58 - INFO - __main__ - Step 51373: {'lr': 0.00037482225459923945, 'samples': 9863616, 'steps': 51372, 'loss/train': 1.6101536750793457} -11/07/2021 04:27:58 - INFO - __main__ - Step 51374: {'lr': 0.00037481765661942506, 'samples': 9863808, 'steps': 51373, 'loss/train': 0.9312657117843628} -11/07/2021 04:27:59 - INFO - __main__ - Step 51375: {'lr': 0.0003748130585833697, 'samples': 9864000, 'steps': 51374, 'loss/train': 1.268650770187378} -11/07/2021 04:27:59 - INFO - __main__ - Step 51376: {'lr': 0.0003748084604910755, 'samples': 9864192, 'steps': 51375, 'loss/train': 1.219296932220459} -11/07/2021 04:28:00 - INFO - __main__ - Step 51377: {'lr': 0.0003748038623425446, 'samples': 9864384, 'steps': 51376, 'loss/train': 1.5603306293487549} -11/07/2021 04:28:00 - INFO - __main__ - Step 51378: {'lr': 0.00037479926413777896, 'samples': 9864576, 'steps': 51377, 'loss/train': 1.482375144958496} -11/07/2021 04:28:00 - INFO - __main__ - Step 51379: {'lr': 0.0003747946658767807, 'samples': 9864768, 'steps': 51378, 'loss/train': 0.4298912286758423} -11/07/2021 04:28:01 - INFO - __main__ - Step 51380: {'lr': 0.0003747900675595519, 'samples': 9864960, 'steps': 51379, 'loss/train': 1.7146047353744507} -11/07/2021 04:28:02 - INFO - __main__ - Step 51381: {'lr': 0.00037478546918609464, 'samples': 9865152, 'steps': 51380, 'loss/train': 2.189980983734131} -11/07/2021 04:28:02 - INFO - __main__ - Step 51382: {'lr': 0.00037478087075641095, 'samples': 9865344, 'steps': 51381, 'loss/train': 1.391196846961975} -11/07/2021 04:28:02 - INFO - __main__ - Step 51383: {'lr': 0.00037477627227050286, 'samples': 9865536, 'steps': 51382, 'loss/train': 1.5402201414108276} -11/07/2021 04:28:03 - INFO - __main__ - Step 51384: {'lr': 0.0003747716737283726, 'samples': 9865728, 'steps': 51383, 'loss/train': 2.444733142852783} -11/07/2021 04:28:03 - INFO - __main__ - Step 51385: {'lr': 0.00037476707513002213, 'samples': 9865920, 'steps': 51384, 'loss/train': 1.5121098756790161} -11/07/2021 04:28:04 - INFO - __main__ - Step 51386: {'lr': 0.0003747624764754535, 'samples': 9866112, 'steps': 51385, 'loss/train': 1.090367078781128} -11/07/2021 04:28:04 - INFO - __main__ - Step 51387: {'lr': 0.00037475787776466887, 'samples': 9866304, 'steps': 51386, 'loss/train': 1.01362943649292} -11/07/2021 04:28:05 - INFO - __main__ - Step 51388: {'lr': 0.00037475327899767026, 'samples': 9866496, 'steps': 51387, 'loss/train': 1.2422531843185425} -11/07/2021 04:28:05 - INFO - __main__ - Step 51389: {'lr': 0.0003747486801744597, 'samples': 9866688, 'steps': 51388, 'loss/train': 2.2478537559509277} -11/07/2021 04:28:06 - INFO - __main__ - Step 51390: {'lr': 0.0003747440812950393, 'samples': 9866880, 'steps': 51389, 'loss/train': 1.2774142026901245} -11/07/2021 04:28:06 - INFO - __main__ - Step 51391: {'lr': 0.0003747394823594112, 'samples': 9867072, 'steps': 51390, 'loss/train': 1.6010338068008423} -11/07/2021 04:28:07 - INFO - __main__ - Step 51392: {'lr': 0.00037473488336757743, 'samples': 9867264, 'steps': 51391, 'loss/train': 2.4366376399993896} -11/07/2021 04:28:07 - INFO - __main__ - Step 51393: {'lr': 0.00037473028431954006, 'samples': 9867456, 'steps': 51392, 'loss/train': 1.157906174659729} -11/07/2021 04:28:08 - INFO - __main__ - Step 51394: {'lr': 0.00037472568521530107, 'samples': 9867648, 'steps': 51393, 'loss/train': 1.1847411394119263} -11/07/2021 04:28:08 - INFO - __main__ - Step 51395: {'lr': 0.0003747210860548627, 'samples': 9867840, 'steps': 51394, 'loss/train': 0.23853078484535217} -11/07/2021 04:28:09 - INFO - __main__ - Step 51396: {'lr': 0.00037471648683822683, 'samples': 9868032, 'steps': 51395, 'loss/train': 1.126974105834961} -11/07/2021 04:28:09 - INFO - __main__ - Step 51397: {'lr': 0.0003747118875653957, 'samples': 9868224, 'steps': 51396, 'loss/train': 1.9312546253204346} -11/07/2021 04:28:10 - INFO - __main__ - Step 51398: {'lr': 0.00037470728823637135, 'samples': 9868416, 'steps': 51397, 'loss/train': 1.4620530605316162} -11/07/2021 04:28:10 - INFO - __main__ - Step 51399: {'lr': 0.0003747026888511558, 'samples': 9868608, 'steps': 51398, 'loss/train': 1.5368403196334839} -11/07/2021 04:28:10 - INFO - __main__ - Step 51400: {'lr': 0.00037469808940975106, 'samples': 9868800, 'steps': 51399, 'loss/train': 1.1409534215927124} -11/07/2021 04:28:11 - INFO - __main__ - Step 51401: {'lr': 0.00037469348991215934, 'samples': 9868992, 'steps': 51400, 'loss/train': 1.626787543296814} -11/07/2021 04:28:12 - INFO - __main__ - Step 51402: {'lr': 0.00037468889035838264, 'samples': 9869184, 'steps': 51401, 'loss/train': 1.4606435298919678} -11/07/2021 04:28:12 - INFO - __main__ - Step 51403: {'lr': 0.0003746842907484231, 'samples': 9869376, 'steps': 51402, 'loss/train': 3.1921544075012207} -11/07/2021 04:28:12 - INFO - __main__ - Step 51404: {'lr': 0.0003746796910822827, 'samples': 9869568, 'steps': 51403, 'loss/train': 1.2902007102966309} -11/07/2021 04:28:13 - INFO - __main__ - Step 51405: {'lr': 0.0003746750913599636, 'samples': 9869760, 'steps': 51404, 'loss/train': 0.8975526690483093} -11/07/2021 04:28:13 - INFO - __main__ - Step 51406: {'lr': 0.00037467049158146777, 'samples': 9869952, 'steps': 51405, 'loss/train': 1.7837495803833008} -11/07/2021 04:28:14 - INFO - __main__ - Step 51407: {'lr': 0.00037466589174679733, 'samples': 9870144, 'steps': 51406, 'loss/train': 1.249118685722351} -11/07/2021 04:28:14 - INFO - __main__ - Step 51408: {'lr': 0.0003746612918559544, 'samples': 9870336, 'steps': 51407, 'loss/train': 1.4978562593460083} -11/07/2021 04:28:15 - INFO - __main__ - Step 51409: {'lr': 0.00037465669190894107, 'samples': 9870528, 'steps': 51408, 'loss/train': 1.2435975074768066} -11/07/2021 04:28:15 - INFO - __main__ - Step 51410: {'lr': 0.00037465209190575927, 'samples': 9870720, 'steps': 51409, 'loss/train': 1.4231942892074585} -11/07/2021 04:28:16 - INFO - __main__ - Step 51411: {'lr': 0.00037464749184641123, 'samples': 9870912, 'steps': 51410, 'loss/train': 1.044649362564087} -11/07/2021 04:28:17 - INFO - __main__ - Step 51412: {'lr': 0.0003746428917308989, 'samples': 9871104, 'steps': 51411, 'loss/train': 1.5776267051696777} -11/07/2021 04:28:17 - INFO - __main__ - Step 51413: {'lr': 0.0003746382915592244, 'samples': 9871296, 'steps': 51412, 'loss/train': 1.2381223440170288} -11/07/2021 04:28:17 - INFO - __main__ - Step 51414: {'lr': 0.0003746336913313898, 'samples': 9871488, 'steps': 51413, 'loss/train': 1.206687569618225} -11/07/2021 04:28:18 - INFO - __main__ - Step 51415: {'lr': 0.0003746290910473973, 'samples': 9871680, 'steps': 51414, 'loss/train': 1.6536258459091187} -11/07/2021 04:28:18 - INFO - __main__ - Step 51416: {'lr': 0.00037462449070724876, 'samples': 9871872, 'steps': 51415, 'loss/train': 1.7118861675262451} -11/07/2021 04:28:19 - INFO - __main__ - Step 51417: {'lr': 0.00037461989031094636, 'samples': 9872064, 'steps': 51416, 'loss/train': 1.6540234088897705} -11/07/2021 04:28:20 - INFO - __main__ - Step 51418: {'lr': 0.00037461528985849215, 'samples': 9872256, 'steps': 51417, 'loss/train': 1.264769196510315} -11/07/2021 04:28:20 - INFO - __main__ - Step 51419: {'lr': 0.0003746106893498882, 'samples': 9872448, 'steps': 51418, 'loss/train': 1.1097873449325562} -11/07/2021 04:28:20 - INFO - __main__ - Step 51420: {'lr': 0.00037460608878513656, 'samples': 9872640, 'steps': 51419, 'loss/train': 1.7027997970581055} -11/07/2021 04:28:21 - INFO - __main__ - Step 51421: {'lr': 0.00037460148816423946, 'samples': 9872832, 'steps': 51420, 'loss/train': 1.830729365348816} -11/07/2021 04:28:21 - INFO - __main__ - Step 51422: {'lr': 0.0003745968874871988, 'samples': 9873024, 'steps': 51421, 'loss/train': 1.856423020362854} -11/07/2021 04:28:21 - INFO - __main__ - Step 51423: {'lr': 0.00037459228675401667, 'samples': 9873216, 'steps': 51422, 'loss/train': 0.4582367539405823} -11/07/2021 04:28:22 - INFO - __main__ - Step 51424: {'lr': 0.00037458768596469516, 'samples': 9873408, 'steps': 51423, 'loss/train': 1.4918971061706543} -11/07/2021 04:28:23 - INFO - __main__ - Step 51425: {'lr': 0.0003745830851192364, 'samples': 9873600, 'steps': 51424, 'loss/train': 1.3095556497573853} -11/07/2021 04:28:23 - INFO - __main__ - Step 51426: {'lr': 0.00037457848421764247, 'samples': 9873792, 'steps': 51425, 'loss/train': 1.410119652748108} -11/07/2021 04:28:23 - INFO - __main__ - Step 51427: {'lr': 0.0003745738832599153, 'samples': 9873984, 'steps': 51426, 'loss/train': 1.9977155923843384} -11/07/2021 04:28:24 - INFO - __main__ - Step 51428: {'lr': 0.0003745692822460572, 'samples': 9874176, 'steps': 51427, 'loss/train': 1.139614224433899} -11/07/2021 04:28:25 - INFO - __main__ - Step 51429: {'lr': 0.00037456468117607, 'samples': 9874368, 'steps': 51428, 'loss/train': 1.6224833726882935} -11/07/2021 04:28:26 - INFO - __main__ - Step 51430: {'lr': 0.0003745600800499559, 'samples': 9874560, 'steps': 51429, 'loss/train': 1.3608607053756714} -11/07/2021 04:28:26 - INFO - __main__ - Step 51431: {'lr': 0.0003745554788677169, 'samples': 9874752, 'steps': 51430, 'loss/train': 1.467066764831543} -11/07/2021 04:28:26 - INFO - __main__ - Step 51432: {'lr': 0.0003745508776293551, 'samples': 9874944, 'steps': 51431, 'loss/train': 1.8557852506637573} -11/07/2021 04:28:27 - INFO - __main__ - Step 51433: {'lr': 0.0003745462763348727, 'samples': 9875136, 'steps': 51432, 'loss/train': 1.9213792085647583} -11/07/2021 04:28:27 - INFO - __main__ - Step 51434: {'lr': 0.00037454167498427165, 'samples': 9875328, 'steps': 51433, 'loss/train': 1.5387630462646484} -11/07/2021 04:28:28 - INFO - __main__ - Step 51435: {'lr': 0.0003745370735775541, 'samples': 9875520, 'steps': 51434, 'loss/train': 1.3750271797180176} -11/07/2021 04:28:28 - INFO - __main__ - Step 51436: {'lr': 0.00037453247211472195, 'samples': 9875712, 'steps': 51435, 'loss/train': 2.651184320449829} -11/07/2021 04:28:29 - INFO - __main__ - Step 51437: {'lr': 0.0003745278705957774, 'samples': 9875904, 'steps': 51436, 'loss/train': 1.0046931505203247} -11/07/2021 04:28:29 - INFO - __main__ - Step 51438: {'lr': 0.00037452326902072256, 'samples': 9876096, 'steps': 51437, 'loss/train': 1.501657485961914} -11/07/2021 04:28:30 - INFO - __main__ - Step 51439: {'lr': 0.0003745186673895594, 'samples': 9876288, 'steps': 51438, 'loss/train': 1.5010449886322021} -11/07/2021 04:28:31 - INFO - __main__ - Step 51440: {'lr': 0.0003745140657022901, 'samples': 9876480, 'steps': 51439, 'loss/train': 1.5103965997695923} -11/07/2021 04:28:31 - INFO - __main__ - Step 51441: {'lr': 0.0003745094639589167, 'samples': 9876672, 'steps': 51440, 'loss/train': 1.458385705947876} -11/07/2021 04:28:31 - INFO - __main__ - Step 51442: {'lr': 0.00037450486215944123, 'samples': 9876864, 'steps': 51441, 'loss/train': 1.954463005065918} -11/07/2021 04:28:32 - INFO - __main__ - Step 51443: {'lr': 0.0003745002603038658, 'samples': 9877056, 'steps': 51442, 'loss/train': 1.5138039588928223} -11/07/2021 04:28:32 - INFO - __main__ - Step 51444: {'lr': 0.00037449565839219246, 'samples': 9877248, 'steps': 51443, 'loss/train': 0.8293909430503845} -11/07/2021 04:28:33 - INFO - __main__ - Step 51445: {'lr': 0.0003744910564244233, 'samples': 9877440, 'steps': 51444, 'loss/train': 0.7137060761451721} -11/07/2021 04:28:33 - INFO - __main__ - Step 51446: {'lr': 0.0003744864544005604, 'samples': 9877632, 'steps': 51445, 'loss/train': 1.6284750699996948} -11/07/2021 04:28:34 - INFO - __main__ - Step 51447: {'lr': 0.0003744818523206058, 'samples': 9877824, 'steps': 51446, 'loss/train': 1.0235060453414917} -11/07/2021 04:28:34 - INFO - __main__ - Step 51448: {'lr': 0.00037447725018456167, 'samples': 9878016, 'steps': 51447, 'loss/train': 1.4038679599761963} -11/07/2021 04:28:34 - INFO - __main__ - Step 51449: {'lr': 0.00037447264799243, 'samples': 9878208, 'steps': 51448, 'loss/train': 1.4147348403930664} -11/07/2021 04:28:35 - INFO - __main__ - Step 51450: {'lr': 0.00037446804574421276, 'samples': 9878400, 'steps': 51449, 'loss/train': 1.1394082307815552} -11/07/2021 04:28:36 - INFO - __main__ - Step 51451: {'lr': 0.00037446344343991224, 'samples': 9878592, 'steps': 51450, 'loss/train': 1.2706471681594849} -11/07/2021 04:28:36 - INFO - __main__ - Step 51452: {'lr': 0.0003744588410795304, 'samples': 9878784, 'steps': 51451, 'loss/train': 1.8876612186431885} -11/07/2021 04:28:37 - INFO - __main__ - Step 51453: {'lr': 0.00037445423866306926, 'samples': 9878976, 'steps': 51452, 'loss/train': 1.4991883039474487} -11/07/2021 04:28:37 - INFO - __main__ - Step 51454: {'lr': 0.00037444963619053103, 'samples': 9879168, 'steps': 51453, 'loss/train': 1.1963261365890503} -11/07/2021 04:28:37 - INFO - __main__ - Step 51455: {'lr': 0.00037444503366191776, 'samples': 9879360, 'steps': 51454, 'loss/train': 1.015403389930725} -11/07/2021 04:28:38 - INFO - __main__ - Step 51456: {'lr': 0.00037444043107723134, 'samples': 9879552, 'steps': 51455, 'loss/train': 1.8410333395004272} -11/07/2021 04:28:39 - INFO - __main__ - Step 51457: {'lr': 0.0003744358284364741, 'samples': 9879744, 'steps': 51456, 'loss/train': 1.4342031478881836} -11/07/2021 04:28:39 - INFO - __main__ - Step 51458: {'lr': 0.00037443122573964794, 'samples': 9879936, 'steps': 51457, 'loss/train': 1.4363067150115967} -11/07/2021 04:28:39 - INFO - __main__ - Step 51459: {'lr': 0.000374426622986755, 'samples': 9880128, 'steps': 51458, 'loss/train': 1.6961021423339844} -11/07/2021 04:28:40 - INFO - __main__ - Step 51460: {'lr': 0.0003744220201777974, 'samples': 9880320, 'steps': 51459, 'loss/train': 1.4590411186218262} -11/07/2021 04:28:41 - INFO - __main__ - Step 51461: {'lr': 0.0003744174173127771, 'samples': 9880512, 'steps': 51460, 'loss/train': 1.4540116786956787} -11/07/2021 04:28:41 - INFO - __main__ - Step 51462: {'lr': 0.00037441281439169624, 'samples': 9880704, 'steps': 51461, 'loss/train': 1.4658534526824951} -11/07/2021 04:28:41 - INFO - __main__ - Step 51463: {'lr': 0.0003744082114145568, 'samples': 9880896, 'steps': 51462, 'loss/train': 1.1046414375305176} -11/07/2021 04:28:42 - INFO - __main__ - Step 51464: {'lr': 0.00037440360838136106, 'samples': 9881088, 'steps': 51463, 'loss/train': 1.3326470851898193} -11/07/2021 04:28:42 - INFO - __main__ - Step 51465: {'lr': 0.0003743990052921109, 'samples': 9881280, 'steps': 51464, 'loss/train': 1.2350364923477173} -11/07/2021 04:28:43 - INFO - __main__ - Step 51466: {'lr': 0.00037439440214680854, 'samples': 9881472, 'steps': 51465, 'loss/train': 1.0318598747253418} -11/07/2021 04:28:44 - INFO - __main__ - Step 51467: {'lr': 0.00037438979894545595, 'samples': 9881664, 'steps': 51466, 'loss/train': 1.6322429180145264} -11/07/2021 04:28:44 - INFO - __main__ - Step 51468: {'lr': 0.0003743851956880553, 'samples': 9881856, 'steps': 51467, 'loss/train': 1.3701001405715942} -11/07/2021 04:28:44 - INFO - __main__ - Step 51469: {'lr': 0.00037438059237460846, 'samples': 9882048, 'steps': 51468, 'loss/train': 1.480985164642334} -11/07/2021 04:28:45 - INFO - __main__ - Step 51470: {'lr': 0.0003743759890051177, 'samples': 9882240, 'steps': 51469, 'loss/train': 1.0128283500671387} -11/07/2021 04:28:46 - INFO - __main__ - Step 51471: {'lr': 0.00037437138557958505, 'samples': 9882432, 'steps': 51470, 'loss/train': 1.2985695600509644} -11/07/2021 04:28:46 - INFO - __main__ - Step 51472: {'lr': 0.0003743667820980126, 'samples': 9882624, 'steps': 51471, 'loss/train': 1.4783293008804321} -11/07/2021 04:28:46 - INFO - __main__ - Step 51473: {'lr': 0.0003743621785604024, 'samples': 9882816, 'steps': 51472, 'loss/train': 1.547150731086731} -11/07/2021 04:28:47 - INFO - __main__ - Step 51474: {'lr': 0.00037435757496675646, 'samples': 9883008, 'steps': 51473, 'loss/train': 1.023967981338501} -11/07/2021 04:28:47 - INFO - __main__ - Step 51475: {'lr': 0.000374352971317077, 'samples': 9883200, 'steps': 51474, 'loss/train': 1.2801886796951294} -11/07/2021 04:28:48 - INFO - __main__ - Step 51476: {'lr': 0.0003743483676113659, 'samples': 9883392, 'steps': 51475, 'loss/train': 1.77716064453125} -11/07/2021 04:28:48 - INFO - __main__ - Step 51477: {'lr': 0.00037434376384962544, 'samples': 9883584, 'steps': 51476, 'loss/train': 1.5756834745407104} -11/07/2021 04:28:49 - INFO - __main__ - Step 51478: {'lr': 0.00037433916003185757, 'samples': 9883776, 'steps': 51477, 'loss/train': 1.6418976783752441} -11/07/2021 04:28:49 - INFO - __main__ - Step 51479: {'lr': 0.0003743345561580644, 'samples': 9883968, 'steps': 51478, 'loss/train': 1.2006781101226807} -11/07/2021 04:28:49 - INFO - __main__ - Step 51480: {'lr': 0.0003743299522282479, 'samples': 9884160, 'steps': 51479, 'loss/train': 1.4376378059387207} -11/07/2021 04:28:51 - INFO - __main__ - Step 51481: {'lr': 0.0003743253482424104, 'samples': 9884352, 'steps': 51480, 'loss/train': 1.3342554569244385} -11/07/2021 04:28:51 - INFO - __main__ - Step 51482: {'lr': 0.00037432074420055376, 'samples': 9884544, 'steps': 51481, 'loss/train': 1.9823734760284424} -11/07/2021 04:28:51 - INFO - __main__ - Step 51483: {'lr': 0.00037431614010268013, 'samples': 9884736, 'steps': 51482, 'loss/train': 1.7683123350143433} -11/07/2021 04:28:52 - INFO - __main__ - Step 51484: {'lr': 0.0003743115359487915, 'samples': 9884928, 'steps': 51483, 'loss/train': 1.566193699836731} -11/07/2021 04:28:52 - INFO - __main__ - Step 51485: {'lr': 0.00037430693173889, 'samples': 9885120, 'steps': 51484, 'loss/train': 1.6051998138427734} -11/07/2021 04:28:53 - INFO - __main__ - Step 51486: {'lr': 0.00037430232747297774, 'samples': 9885312, 'steps': 51485, 'loss/train': 1.6360217332839966} -11/07/2021 04:28:53 - INFO - __main__ - Step 51487: {'lr': 0.00037429772315105683, 'samples': 9885504, 'steps': 51486, 'loss/train': 1.1560131311416626} -11/07/2021 04:28:54 - INFO - __main__ - Step 51488: {'lr': 0.0003742931187731293, 'samples': 9885696, 'steps': 51487, 'loss/train': 0.9204044938087463} -11/07/2021 04:28:54 - INFO - __main__ - Step 51489: {'lr': 0.00037428851433919707, 'samples': 9885888, 'steps': 51488, 'loss/train': 1.2909021377563477} -11/07/2021 04:28:54 - INFO - __main__ - Step 51490: {'lr': 0.0003742839098492625, 'samples': 9886080, 'steps': 51489, 'loss/train': 1.2641663551330566} -11/07/2021 04:28:55 - INFO - __main__ - Step 51491: {'lr': 0.0003742793053033274, 'samples': 9886272, 'steps': 51490, 'loss/train': 1.4978505373001099} -11/07/2021 04:28:56 - INFO - __main__ - Step 51492: {'lr': 0.000374274700701394, 'samples': 9886464, 'steps': 51491, 'loss/train': 1.688596487045288} -11/07/2021 04:28:56 - INFO - __main__ - Step 51493: {'lr': 0.00037427009604346437, 'samples': 9886656, 'steps': 51492, 'loss/train': 1.7720634937286377} -11/07/2021 04:28:57 - INFO - __main__ - Step 51494: {'lr': 0.0003742654913295405, 'samples': 9886848, 'steps': 51493, 'loss/train': 1.5528498888015747} -11/07/2021 04:28:57 - INFO - __main__ - Step 51495: {'lr': 0.0003742608865596246, 'samples': 9887040, 'steps': 51494, 'loss/train': 1.5911250114440918} -11/07/2021 04:28:57 - INFO - __main__ - Step 51496: {'lr': 0.0003742562817337186, 'samples': 9887232, 'steps': 51495, 'loss/train': 1.3602335453033447} -11/07/2021 04:28:58 - INFO - __main__ - Step 51497: {'lr': 0.0003742516768518247, 'samples': 9887424, 'steps': 51496, 'loss/train': 1.474177598953247} -11/07/2021 04:28:59 - INFO - __main__ - Step 51498: {'lr': 0.0003742470719139448, 'samples': 9887616, 'steps': 51497, 'loss/train': 1.5765888690948486} -11/07/2021 04:28:59 - INFO - __main__ - Step 51499: {'lr': 0.0003742424669200811, 'samples': 9887808, 'steps': 51498, 'loss/train': 1.1993672847747803} -11/07/2021 04:28:59 - INFO - __main__ - Step 51500: {'lr': 0.00037423786187023574, 'samples': 9888000, 'steps': 51499, 'loss/train': 0.9676117300987244} -11/07/2021 04:29:00 - INFO - __main__ - Step 51501: {'lr': 0.00037423325676441064, 'samples': 9888192, 'steps': 51500, 'loss/train': 0.9103842973709106} -11/07/2021 04:29:01 - INFO - __main__ - Step 51502: {'lr': 0.0003742286516026081, 'samples': 9888384, 'steps': 51501, 'loss/train': 1.3378478288650513} -11/07/2021 04:29:01 - INFO - __main__ - Step 51503: {'lr': 0.0003742240463848299, 'samples': 9888576, 'steps': 51502, 'loss/train': 1.6188141107559204} -11/07/2021 04:29:01 - INFO - __main__ - Step 51504: {'lr': 0.0003742194411110783, 'samples': 9888768, 'steps': 51503, 'loss/train': 1.5715343952178955} -11/07/2021 04:29:02 - INFO - __main__ - Step 51505: {'lr': 0.00037421483578135536, 'samples': 9888960, 'steps': 51504, 'loss/train': 1.6032418012619019} -11/07/2021 04:29:02 - INFO - __main__ - Step 51506: {'lr': 0.0003742102303956631, 'samples': 9889152, 'steps': 51505, 'loss/train': 1.5006656646728516} -11/07/2021 04:29:03 - INFO - __main__ - Step 51507: {'lr': 0.0003742056249540036, 'samples': 9889344, 'steps': 51506, 'loss/train': 1.2101598978042603} -11/07/2021 04:29:03 - INFO - __main__ - Step 51508: {'lr': 0.00037420101945637906, 'samples': 9889536, 'steps': 51507, 'loss/train': 1.6999436616897583} -11/07/2021 04:29:04 - INFO - __main__ - Step 51509: {'lr': 0.00037419641390279136, 'samples': 9889728, 'steps': 51508, 'loss/train': 0.9679996967315674} -11/07/2021 04:29:04 - INFO - __main__ - Step 51510: {'lr': 0.00037419180829324273, 'samples': 9889920, 'steps': 51509, 'loss/train': 1.518884539604187} -11/07/2021 04:29:04 - INFO - __main__ - Step 51511: {'lr': 0.0003741872026277351, 'samples': 9890112, 'steps': 51510, 'loss/train': 1.2138888835906982} -11/07/2021 04:29:05 - INFO - __main__ - Step 51512: {'lr': 0.00037418259690627075, 'samples': 9890304, 'steps': 51511, 'loss/train': 2.737327814102173} -11/07/2021 04:29:06 - INFO - __main__ - Step 51513: {'lr': 0.0003741779911288516, 'samples': 9890496, 'steps': 51512, 'loss/train': 1.3141067028045654} -11/07/2021 04:29:06 - INFO - __main__ - Step 51514: {'lr': 0.0003741733852954797, 'samples': 9890688, 'steps': 51513, 'loss/train': 1.173534631729126} -11/07/2021 04:29:07 - INFO - __main__ - Step 51515: {'lr': 0.00037416877940615737, 'samples': 9890880, 'steps': 51514, 'loss/train': 1.575916051864624} -11/07/2021 04:29:07 - INFO - __main__ - Step 51516: {'lr': 0.00037416417346088635, 'samples': 9891072, 'steps': 51515, 'loss/train': 1.3990917205810547} -11/07/2021 04:29:07 - INFO - __main__ - Step 51517: {'lr': 0.0003741595674596688, 'samples': 9891264, 'steps': 51516, 'loss/train': 2.040133237838745} -11/07/2021 04:29:08 - INFO - __main__ - Step 51518: {'lr': 0.000374154961402507, 'samples': 9891456, 'steps': 51517, 'loss/train': 1.1698777675628662} -11/07/2021 04:29:09 - INFO - __main__ - Step 51519: {'lr': 0.00037415035528940284, 'samples': 9891648, 'steps': 51518, 'loss/train': 1.1059638261795044} -11/07/2021 04:29:09 - INFO - __main__ - Step 51520: {'lr': 0.00037414574912035845, 'samples': 9891840, 'steps': 51519, 'loss/train': 1.148276448249817} -11/07/2021 04:29:09 - INFO - __main__ - Step 51521: {'lr': 0.0003741411428953759, 'samples': 9892032, 'steps': 51520, 'loss/train': 1.3834562301635742} -11/07/2021 04:29:10 - INFO - __main__ - Step 51522: {'lr': 0.00037413653661445736, 'samples': 9892224, 'steps': 51521, 'loss/train': 1.5016969442367554} -11/07/2021 04:29:11 - INFO - __main__ - Step 51523: {'lr': 0.00037413193027760466, 'samples': 9892416, 'steps': 51522, 'loss/train': 1.725628137588501} -11/07/2021 04:29:11 - INFO - __main__ - Step 51524: {'lr': 0.00037412732388482015, 'samples': 9892608, 'steps': 51523, 'loss/train': 0.6794720888137817} -11/07/2021 04:29:12 - INFO - __main__ - Step 51525: {'lr': 0.0003741227174361057, 'samples': 9892800, 'steps': 51524, 'loss/train': 0.9042429327964783} -11/07/2021 04:29:12 - INFO - __main__ - Step 51526: {'lr': 0.00037411811093146345, 'samples': 9892992, 'steps': 51525, 'loss/train': 1.3141316175460815} -11/07/2021 04:29:12 - INFO - __main__ - Step 51527: {'lr': 0.0003741135043708956, 'samples': 9893184, 'steps': 51526, 'loss/train': 1.630672574043274} -11/07/2021 04:29:13 - INFO - __main__ - Step 51528: {'lr': 0.000374108897754404, 'samples': 9893376, 'steps': 51527, 'loss/train': 1.5166720151901245} -11/07/2021 04:29:14 - INFO - __main__ - Step 51529: {'lr': 0.00037410429108199097, 'samples': 9893568, 'steps': 51528, 'loss/train': 1.4905604124069214} -11/07/2021 04:29:14 - INFO - __main__ - Step 51530: {'lr': 0.0003740996843536584, 'samples': 9893760, 'steps': 51529, 'loss/train': 1.3705830574035645} -11/07/2021 04:29:14 - INFO - __main__ - Step 51531: {'lr': 0.00037409507756940843, 'samples': 9893952, 'steps': 51530, 'loss/train': 1.4777553081512451} -11/07/2021 04:29:15 - INFO - __main__ - Step 51532: {'lr': 0.00037409047072924307, 'samples': 9894144, 'steps': 51531, 'loss/train': 1.2640812397003174} -11/07/2021 04:29:15 - INFO - __main__ - Step 51533: {'lr': 0.0003740858638331646, 'samples': 9894336, 'steps': 51532, 'loss/train': 0.8791767358779907} -11/07/2021 04:29:16 - INFO - __main__ - Step 51534: {'lr': 0.0003740812568811748, 'samples': 9894528, 'steps': 51533, 'loss/train': 1.3411303758621216} -11/07/2021 04:29:17 - INFO - __main__ - Step 51535: {'lr': 0.000374076649873276, 'samples': 9894720, 'steps': 51534, 'loss/train': 1.0225270986557007} -11/07/2021 04:29:17 - INFO - __main__ - Step 51536: {'lr': 0.00037407204280947014, 'samples': 9894912, 'steps': 51535, 'loss/train': 1.6323903799057007} -11/07/2021 04:29:17 - INFO - __main__ - Step 51537: {'lr': 0.0003740674356897593, 'samples': 9895104, 'steps': 51536, 'loss/train': 0.9552247524261475} -11/07/2021 04:29:18 - INFO - __main__ - Step 51538: {'lr': 0.0003740628285141457, 'samples': 9895296, 'steps': 51537, 'loss/train': 1.5924347639083862} -11/07/2021 04:29:19 - INFO - __main__ - Step 51539: {'lr': 0.00037405822128263125, 'samples': 9895488, 'steps': 51538, 'loss/train': 0.8937223553657532} -11/07/2021 04:29:19 - INFO - __main__ - Step 51540: {'lr': 0.000374053613995218, 'samples': 9895680, 'steps': 51539, 'loss/train': 1.7730861902236938} -11/07/2021 04:29:19 - INFO - __main__ - Step 51541: {'lr': 0.0003740490066519082, 'samples': 9895872, 'steps': 51540, 'loss/train': 5.167013645172119} -11/07/2021 04:29:20 - INFO - __main__ - Step 51542: {'lr': 0.0003740443992527038, 'samples': 9896064, 'steps': 51541, 'loss/train': 1.4915814399719238} -11/07/2021 04:29:20 - INFO - __main__ - Step 51543: {'lr': 0.00037403979179760687, 'samples': 9896256, 'steps': 51542, 'loss/train': 1.727198600769043} -11/07/2021 04:29:20 - INFO - __main__ - Step 51544: {'lr': 0.0003740351842866196, 'samples': 9896448, 'steps': 51543, 'loss/train': 1.2733923196792603} -11/07/2021 04:29:21 - INFO - __main__ - Step 51545: {'lr': 0.0003740305767197439, 'samples': 9896640, 'steps': 51544, 'loss/train': 1.4166321754455566} -11/07/2021 04:29:22 - INFO - __main__ - Step 51546: {'lr': 0.0003740259690969821, 'samples': 9896832, 'steps': 51545, 'loss/train': 1.5141226053237915} -11/07/2021 04:29:22 - INFO - __main__ - Step 51547: {'lr': 0.00037402136141833595, 'samples': 9897024, 'steps': 51546, 'loss/train': 1.39847993850708} -11/07/2021 04:29:22 - INFO - __main__ - Step 51548: {'lr': 0.0003740167536838077, 'samples': 9897216, 'steps': 51547, 'loss/train': 1.4686611890792847} -11/07/2021 04:29:23 - INFO - __main__ - Step 51549: {'lr': 0.0003740121458933995, 'samples': 9897408, 'steps': 51548, 'loss/train': 2.0743227005004883} -11/07/2021 04:29:24 - INFO - __main__ - Step 51550: {'lr': 0.0003740075380471133, 'samples': 9897600, 'steps': 51549, 'loss/train': 1.748748540878296} -11/07/2021 04:29:24 - INFO - __main__ - Step 51551: {'lr': 0.0003740029301449512, 'samples': 9897792, 'steps': 51550, 'loss/train': 1.677230715751648} -11/07/2021 04:29:25 - INFO - __main__ - Step 51552: {'lr': 0.0003739983221869153, 'samples': 9897984, 'steps': 51551, 'loss/train': 0.8572708368301392} -11/07/2021 04:29:25 - INFO - __main__ - Step 51553: {'lr': 0.00037399371417300766, 'samples': 9898176, 'steps': 51552, 'loss/train': 1.0359253883361816} -11/07/2021 04:29:25 - INFO - __main__ - Step 51554: {'lr': 0.00037398910610323034, 'samples': 9898368, 'steps': 51553, 'loss/train': 0.7630068063735962} -11/07/2021 04:29:26 - INFO - __main__ - Step 51555: {'lr': 0.0003739844979775855, 'samples': 9898560, 'steps': 51554, 'loss/train': 5.784372806549072} -11/07/2021 04:29:27 - INFO - __main__ - Step 51556: {'lr': 0.0003739798897960752, 'samples': 9898752, 'steps': 51555, 'loss/train': 2.1621899604797363} -11/07/2021 04:29:27 - INFO - __main__ - Step 51557: {'lr': 0.00037397528155870134, 'samples': 9898944, 'steps': 51556, 'loss/train': 1.7338827848434448} -11/07/2021 04:29:27 - INFO - __main__ - Step 51558: {'lr': 0.00037397067326546616, 'samples': 9899136, 'steps': 51557, 'loss/train': 1.0028150081634521} -11/07/2021 04:29:28 - INFO - __main__ - Step 51559: {'lr': 0.0003739660649163718, 'samples': 9899328, 'steps': 51558, 'loss/train': 1.5446821451187134} -11/07/2021 04:29:28 - INFO - __main__ - Step 51560: {'lr': 0.0003739614565114202, 'samples': 9899520, 'steps': 51559, 'loss/train': 1.6628481149673462} -11/07/2021 04:29:29 - INFO - __main__ - Step 51561: {'lr': 0.00037395684805061345, 'samples': 9899712, 'steps': 51560, 'loss/train': 1.4018369913101196} -11/07/2021 04:29:30 - INFO - __main__ - Step 51562: {'lr': 0.00037395223953395375, 'samples': 9899904, 'steps': 51561, 'loss/train': 1.3891258239746094} -11/07/2021 04:29:30 - INFO - __main__ - Step 51563: {'lr': 0.000373947630961443, 'samples': 9900096, 'steps': 51562, 'loss/train': 1.5041695833206177} -11/07/2021 04:29:30 - INFO - __main__ - Step 51564: {'lr': 0.00037394302233308336, 'samples': 9900288, 'steps': 51563, 'loss/train': 1.408871054649353} -11/07/2021 04:29:31 - INFO - __main__ - Step 51565: {'lr': 0.0003739384136488769, 'samples': 9900480, 'steps': 51564, 'loss/train': 1.5967864990234375} -11/07/2021 04:29:32 - INFO - __main__ - Step 51566: {'lr': 0.00037393380490882575, 'samples': 9900672, 'steps': 51565, 'loss/train': 1.0944602489471436} -11/07/2021 04:29:32 - INFO - __main__ - Step 51567: {'lr': 0.0003739291961129319, 'samples': 9900864, 'steps': 51566, 'loss/train': 1.4621555805206299} -11/07/2021 04:29:32 - INFO - __main__ - Step 51568: {'lr': 0.0003739245872611975, 'samples': 9901056, 'steps': 51567, 'loss/train': 1.713440179824829} -11/07/2021 04:29:33 - INFO - __main__ - Step 51569: {'lr': 0.0003739199783536246, 'samples': 9901248, 'steps': 51568, 'loss/train': 1.344717025756836} -11/07/2021 04:29:33 - INFO - __main__ - Step 51570: {'lr': 0.0003739153693902152, 'samples': 9901440, 'steps': 51569, 'loss/train': 1.5534286499023438} -11/07/2021 04:29:34 - INFO - __main__ - Step 51571: {'lr': 0.0003739107603709715, 'samples': 9901632, 'steps': 51570, 'loss/train': 1.600929856300354} -11/07/2021 04:29:35 - INFO - __main__ - Step 51572: {'lr': 0.00037390615129589554, 'samples': 9901824, 'steps': 51571, 'loss/train': 1.3709287643432617} -11/07/2021 04:29:35 - INFO - __main__ - Step 51573: {'lr': 0.00037390154216498933, 'samples': 9902016, 'steps': 51572, 'loss/train': 1.6646630764007568} -11/07/2021 04:29:35 - INFO - __main__ - Step 51574: {'lr': 0.000373896932978255, 'samples': 9902208, 'steps': 51573, 'loss/train': 0.6080346703529358} -11/07/2021 04:29:36 - INFO - __main__ - Step 51575: {'lr': 0.00037389232373569463, 'samples': 9902400, 'steps': 51574, 'loss/train': 1.31934654712677} -11/07/2021 04:29:37 - INFO - __main__ - Step 51576: {'lr': 0.0003738877144373104, 'samples': 9902592, 'steps': 51575, 'loss/train': 1.0798628330230713} -11/07/2021 04:29:37 - INFO - __main__ - Step 51577: {'lr': 0.0003738831050831042, 'samples': 9902784, 'steps': 51576, 'loss/train': 1.7884399890899658} -11/07/2021 04:29:37 - INFO - __main__ - Step 51578: {'lr': 0.0003738784956730781, 'samples': 9902976, 'steps': 51577, 'loss/train': 1.9427136182785034} -11/07/2021 04:29:38 - INFO - __main__ - Step 51579: {'lr': 0.0003738738862072343, 'samples': 9903168, 'steps': 51578, 'loss/train': 1.6550885438919067} -11/07/2021 04:29:38 - INFO - __main__ - Step 51580: {'lr': 0.00037386927668557493, 'samples': 9903360, 'steps': 51579, 'loss/train': 1.5623819828033447} -11/07/2021 04:29:38 - INFO - __main__ - Step 51581: {'lr': 0.0003738646671081019, 'samples': 9903552, 'steps': 51580, 'loss/train': 1.5108397006988525} -11/07/2021 04:29:39 - INFO - __main__ - Step 51582: {'lr': 0.00037386005747481744, 'samples': 9903744, 'steps': 51581, 'loss/train': 1.5365359783172607} -11/07/2021 04:29:40 - INFO - __main__ - Step 51583: {'lr': 0.00037385544778572346, 'samples': 9903936, 'steps': 51582, 'loss/train': 1.7460014820098877} -11/07/2021 04:29:40 - INFO - __main__ - Step 51584: {'lr': 0.00037385083804082213, 'samples': 9904128, 'steps': 51583, 'loss/train': 1.2553999423980713} -11/07/2021 04:29:40 - INFO - __main__ - Step 51585: {'lr': 0.00037384622824011555, 'samples': 9904320, 'steps': 51584, 'loss/train': 0.9383065104484558} -11/07/2021 04:29:41 - INFO - __main__ - Step 51586: {'lr': 0.00037384161838360574, 'samples': 9904512, 'steps': 51585, 'loss/train': 1.4494212865829468} -11/07/2021 04:29:42 - INFO - __main__ - Step 51587: {'lr': 0.00037383700847129487, 'samples': 9904704, 'steps': 51586, 'loss/train': 1.7529298067092896} -11/07/2021 04:29:42 - INFO - __main__ - Step 51588: {'lr': 0.0003738323985031849, 'samples': 9904896, 'steps': 51587, 'loss/train': 1.9423640966415405} -11/07/2021 04:29:43 - INFO - __main__ - Step 51589: {'lr': 0.000373827788479278, 'samples': 9905088, 'steps': 51588, 'loss/train': 1.507910132408142} -11/07/2021 04:29:43 - INFO - __main__ - Step 51590: {'lr': 0.0003738231783995762, 'samples': 9905280, 'steps': 51589, 'loss/train': 1.803034782409668} -11/07/2021 04:29:43 - INFO - __main__ - Step 51591: {'lr': 0.00037381856826408156, 'samples': 9905472, 'steps': 51590, 'loss/train': 1.5332369804382324} -11/07/2021 04:29:45 - INFO - __main__ - Step 51592: {'lr': 0.00037381395807279625, 'samples': 9905664, 'steps': 51591, 'loss/train': 0.134771466255188} -11/07/2021 04:29:45 - INFO - __main__ - Step 51593: {'lr': 0.0003738093478257222, 'samples': 9905856, 'steps': 51592, 'loss/train': 1.1799582242965698} -11/07/2021 04:29:45 - INFO - __main__ - Step 51594: {'lr': 0.0003738047375228616, 'samples': 9906048, 'steps': 51593, 'loss/train': 1.308282732963562} -11/07/2021 04:29:46 - INFO - __main__ - Step 51595: {'lr': 0.00037380012716421647, 'samples': 9906240, 'steps': 51594, 'loss/train': 1.6689704656600952} -11/07/2021 04:29:46 - INFO - __main__ - Step 51596: {'lr': 0.00037379551674978896, 'samples': 9906432, 'steps': 51595, 'loss/train': 1.452520728111267} -11/07/2021 04:29:47 - INFO - __main__ - Step 51597: {'lr': 0.0003737909062795811, 'samples': 9906624, 'steps': 51596, 'loss/train': 1.5214353799819946} -11/07/2021 04:29:47 - INFO - __main__ - Step 51598: {'lr': 0.00037378629575359493, 'samples': 9906816, 'steps': 51597, 'loss/train': 2.1359145641326904} -11/07/2021 04:29:48 - INFO - __main__ - Step 51599: {'lr': 0.0003737816851718326, 'samples': 9907008, 'steps': 51598, 'loss/train': 1.743646502494812} -11/07/2021 04:29:48 - INFO - __main__ - Step 51600: {'lr': 0.0003737770745342961, 'samples': 9907200, 'steps': 51599, 'loss/train': 1.3906631469726562} -11/07/2021 04:29:48 - INFO - __main__ - Step 51601: {'lr': 0.0003737724638409876, 'samples': 9907392, 'steps': 51600, 'loss/train': 1.3511393070220947} -11/07/2021 04:29:49 - INFO - __main__ - Step 51602: {'lr': 0.00037376785309190913, 'samples': 9907584, 'steps': 51601, 'loss/train': 1.3243608474731445} -11/07/2021 04:29:50 - INFO - __main__ - Step 51603: {'lr': 0.0003737632422870628, 'samples': 9907776, 'steps': 51602, 'loss/train': 1.7266608476638794} -11/07/2021 04:29:50 - INFO - __main__ - Step 51604: {'lr': 0.00037375863142645064, 'samples': 9907968, 'steps': 51603, 'loss/train': 1.8057512044906616} -11/07/2021 04:29:50 - INFO - __main__ - Step 51605: {'lr': 0.00037375402051007477, 'samples': 9908160, 'steps': 51604, 'loss/train': 0.5424093008041382} -11/07/2021 04:29:51 - INFO - __main__ - Step 51606: {'lr': 0.00037374940953793724, 'samples': 9908352, 'steps': 51605, 'loss/train': 1.5453418493270874} -11/07/2021 04:29:51 - INFO - __main__ - Step 51607: {'lr': 0.00037374479851004006, 'samples': 9908544, 'steps': 51606, 'loss/train': 1.4249101877212524} -11/07/2021 04:29:52 - INFO - __main__ - Step 51608: {'lr': 0.0003737401874263855, 'samples': 9908736, 'steps': 51607, 'loss/train': 1.4591652154922485} -11/07/2021 04:29:53 - INFO - __main__ - Step 51609: {'lr': 0.0003737355762869755, 'samples': 9908928, 'steps': 51608, 'loss/train': 1.513169765472412} -11/07/2021 04:29:53 - INFO - __main__ - Step 51610: {'lr': 0.0003737309650918121, 'samples': 9909120, 'steps': 51609, 'loss/train': 1.3394849300384521} -11/07/2021 04:29:53 - INFO - __main__ - Step 51611: {'lr': 0.0003737263538408975, 'samples': 9909312, 'steps': 51610, 'loss/train': 1.6213732957839966} -11/07/2021 04:29:54 - INFO - __main__ - Step 51612: {'lr': 0.0003737217425342336, 'samples': 9909504, 'steps': 51611, 'loss/train': 1.1712919473648071} -11/07/2021 04:29:55 - INFO - __main__ - Step 51613: {'lr': 0.0003737171311718227, 'samples': 9909696, 'steps': 51612, 'loss/train': 0.9208439588546753} -11/07/2021 04:29:55 - INFO - __main__ - Step 51614: {'lr': 0.0003737125197536667, 'samples': 9909888, 'steps': 51613, 'loss/train': 1.4358117580413818} -11/07/2021 04:29:55 - INFO - __main__ - Step 51615: {'lr': 0.0003737079082797678, 'samples': 9910080, 'steps': 51614, 'loss/train': 1.3692514896392822} -11/07/2021 04:29:56 - INFO - __main__ - Step 51616: {'lr': 0.000373703296750128, 'samples': 9910272, 'steps': 51615, 'loss/train': 1.4786714315414429} -11/07/2021 04:29:56 - INFO - __main__ - Step 51617: {'lr': 0.0003736986851647495, 'samples': 9910464, 'steps': 51616, 'loss/train': 1.227534294128418} -11/07/2021 04:29:57 - INFO - __main__ - Step 51618: {'lr': 0.00037369407352363417, 'samples': 9910656, 'steps': 51617, 'loss/train': 1.4258657693862915} -11/07/2021 04:29:57 - INFO - __main__ - Step 51619: {'lr': 0.0003736894618267842, 'samples': 9910848, 'steps': 51618, 'loss/train': 1.7483607530593872} -11/07/2021 04:29:58 - INFO - __main__ - Step 51620: {'lr': 0.0003736848500742017, 'samples': 9911040, 'steps': 51619, 'loss/train': 1.0665727853775024} -11/07/2021 04:29:58 - INFO - __main__ - Step 51621: {'lr': 0.0003736802382658887, 'samples': 9911232, 'steps': 51620, 'loss/train': 1.5844364166259766} -11/07/2021 04:29:58 - INFO - __main__ - Step 51622: {'lr': 0.00037367562640184735, 'samples': 9911424, 'steps': 51621, 'loss/train': 1.685865044593811} -11/07/2021 04:29:59 - INFO - __main__ - Step 51623: {'lr': 0.0003736710144820796, 'samples': 9911616, 'steps': 51622, 'loss/train': 2.9197614192962646} -11/07/2021 04:30:00 - INFO - __main__ - Step 51624: {'lr': 0.00037366640250658767, 'samples': 9911808, 'steps': 51623, 'loss/train': 1.7044905424118042} -11/07/2021 04:30:00 - INFO - __main__ - Step 51625: {'lr': 0.00037366179047537354, 'samples': 9912000, 'steps': 51624, 'loss/train': 1.2015422582626343} -11/07/2021 04:30:01 - INFO - __main__ - Step 51626: {'lr': 0.0003736571783884393, 'samples': 9912192, 'steps': 51625, 'loss/train': 1.9773355722427368} -11/07/2021 04:30:01 - INFO - __main__ - Step 51627: {'lr': 0.00037365256624578695, 'samples': 9912384, 'steps': 51626, 'loss/train': 1.3225902318954468} -11/07/2021 04:30:02 - INFO - __main__ - Step 51628: {'lr': 0.0003736479540474188, 'samples': 9912576, 'steps': 51627, 'loss/train': 0.1793370544910431} -11/07/2021 04:30:02 - INFO - __main__ - Step 51629: {'lr': 0.00037364334179333674, 'samples': 9912768, 'steps': 51628, 'loss/train': 1.239203929901123} -11/07/2021 04:30:03 - INFO - __main__ - Step 51630: {'lr': 0.00037363872948354294, 'samples': 9912960, 'steps': 51629, 'loss/train': 1.4803258180618286} -11/07/2021 04:30:03 - INFO - __main__ - Step 51631: {'lr': 0.00037363411711803935, 'samples': 9913152, 'steps': 51630, 'loss/train': 1.6821731328964233} -11/07/2021 04:30:03 - INFO - __main__ - Step 51632: {'lr': 0.0003736295046968282, 'samples': 9913344, 'steps': 51631, 'loss/train': 1.213153600692749} -11/07/2021 04:30:04 - INFO - __main__ - Step 51633: {'lr': 0.0003736248922199115, 'samples': 9913536, 'steps': 51632, 'loss/train': 1.9221079349517822} -11/07/2021 04:30:05 - INFO - __main__ - Step 51634: {'lr': 0.0003736202796872913, 'samples': 9913728, 'steps': 51633, 'loss/train': 1.223962426185608} -11/07/2021 04:30:05 - INFO - __main__ - Step 51635: {'lr': 0.00037361566709896964, 'samples': 9913920, 'steps': 51634, 'loss/train': 1.9123646020889282} -11/07/2021 04:30:05 - INFO - __main__ - Step 51636: {'lr': 0.00037361105445494884, 'samples': 9914112, 'steps': 51635, 'loss/train': 1.6113739013671875} -11/07/2021 04:30:06 - INFO - __main__ - Step 51637: {'lr': 0.0003736064417552307, 'samples': 9914304, 'steps': 51636, 'loss/train': 1.8846906423568726} -11/07/2021 04:30:06 - INFO - __main__ - Step 51638: {'lr': 0.0003736018289998174, 'samples': 9914496, 'steps': 51637, 'loss/train': 2.0408263206481934} -11/07/2021 04:30:07 - INFO - __main__ - Step 51639: {'lr': 0.00037359721618871107, 'samples': 9914688, 'steps': 51638, 'loss/train': 0.6913129091262817} -11/07/2021 04:30:07 - INFO - __main__ - Step 51640: {'lr': 0.0003735926033219137, 'samples': 9914880, 'steps': 51639, 'loss/train': 1.5510092973709106} -11/07/2021 04:30:08 - INFO - __main__ - Step 51641: {'lr': 0.00037358799039942744, 'samples': 9915072, 'steps': 51640, 'loss/train': 1.5725252628326416} -11/07/2021 04:30:08 - INFO - __main__ - Step 51642: {'lr': 0.00037358337742125433, 'samples': 9915264, 'steps': 51641, 'loss/train': 1.0196442604064941} -11/07/2021 04:30:08 - INFO - __main__ - Step 51643: {'lr': 0.0003735787643873965, 'samples': 9915456, 'steps': 51642, 'loss/train': 0.9055829048156738} -11/07/2021 04:30:10 - INFO - __main__ - Step 51644: {'lr': 0.00037357415129785586, 'samples': 9915648, 'steps': 51643, 'loss/train': 0.6788956522941589} -11/07/2021 04:30:10 - INFO - __main__ - Step 51645: {'lr': 0.00037356953815263473, 'samples': 9915840, 'steps': 51644, 'loss/train': 1.7450796365737915} -11/07/2021 04:30:10 - INFO - __main__ - Step 51646: {'lr': 0.00037356492495173505, 'samples': 9916032, 'steps': 51645, 'loss/train': 1.5990597009658813} -11/07/2021 04:30:11 - INFO - __main__ - Step 51647: {'lr': 0.00037356031169515894, 'samples': 9916224, 'steps': 51646, 'loss/train': 1.8649356365203857} -11/07/2021 04:30:11 - INFO - __main__ - Step 51648: {'lr': 0.0003735556983829084, 'samples': 9916416, 'steps': 51647, 'loss/train': 2.3101606369018555} -11/07/2021 04:30:12 - INFO - __main__ - Step 51649: {'lr': 0.00037355108501498557, 'samples': 9916608, 'steps': 51648, 'loss/train': 0.7279643416404724} -11/07/2021 04:30:12 - INFO - __main__ - Step 51650: {'lr': 0.0003735464715913926, 'samples': 9916800, 'steps': 51649, 'loss/train': 1.4655834436416626} -11/07/2021 04:30:13 - INFO - __main__ - Step 51651: {'lr': 0.00037354185811213145, 'samples': 9916992, 'steps': 51650, 'loss/train': 1.3757160902023315} -11/07/2021 04:30:13 - INFO - __main__ - Step 51652: {'lr': 0.0003735372445772042, 'samples': 9917184, 'steps': 51651, 'loss/train': 1.4900068044662476} -11/07/2021 04:30:13 - INFO - __main__ - Step 51653: {'lr': 0.00037353263098661304, 'samples': 9917376, 'steps': 51652, 'loss/train': 1.225886583328247} -11/07/2021 04:30:15 - INFO - __main__ - Step 51654: {'lr': 0.00037352801734036, 'samples': 9917568, 'steps': 51653, 'loss/train': 1.6471189260482788} -11/07/2021 04:30:15 - INFO - __main__ - Step 51655: {'lr': 0.00037352340363844706, 'samples': 9917760, 'steps': 51654, 'loss/train': 1.3263717889785767} -11/07/2021 04:30:15 - INFO - __main__ - Step 51656: {'lr': 0.00037351878988087646, 'samples': 9917952, 'steps': 51655, 'loss/train': 1.8218783140182495} -11/07/2021 04:30:16 - INFO - __main__ - Step 51657: {'lr': 0.0003735141760676501, 'samples': 9918144, 'steps': 51656, 'loss/train': 1.5391809940338135} -11/07/2021 04:30:16 - INFO - __main__ - Step 51658: {'lr': 0.0003735095621987703, 'samples': 9918336, 'steps': 51657, 'loss/train': 1.4478362798690796} -11/07/2021 04:30:17 - INFO - __main__ - Step 51659: {'lr': 0.00037350494827423884, 'samples': 9918528, 'steps': 51658, 'loss/train': 1.8777034282684326} -11/07/2021 04:30:17 - INFO - __main__ - Step 51660: {'lr': 0.00037350033429405806, 'samples': 9918720, 'steps': 51659, 'loss/train': 1.7261641025543213} -11/07/2021 04:30:18 - INFO - __main__ - Step 51661: {'lr': 0.0003734957202582299, 'samples': 9918912, 'steps': 51660, 'loss/train': 1.31928551197052} -11/07/2021 04:30:18 - INFO - __main__ - Step 51662: {'lr': 0.00037349110616675653, 'samples': 9919104, 'steps': 51661, 'loss/train': 1.650587558746338} -11/07/2021 04:30:18 - INFO - __main__ - Step 51663: {'lr': 0.0003734864920196399, 'samples': 9919296, 'steps': 51662, 'loss/train': 1.3911428451538086} -11/07/2021 04:30:19 - INFO - __main__ - Step 51664: {'lr': 0.0003734818778168823, 'samples': 9919488, 'steps': 51663, 'loss/train': 1.6656628847122192} -11/07/2021 04:30:20 - INFO - __main__ - Step 51665: {'lr': 0.0003734772635584855, 'samples': 9919680, 'steps': 51664, 'loss/train': 1.6247785091400146} -11/07/2021 04:30:20 - INFO - __main__ - Step 51666: {'lr': 0.0003734726492444518, 'samples': 9919872, 'steps': 51665, 'loss/train': 1.460745930671692} -11/07/2021 04:30:20 - INFO - __main__ - Step 51667: {'lr': 0.00037346803487478325, 'samples': 9920064, 'steps': 51666, 'loss/train': 1.350220799446106} -11/07/2021 04:30:21 - INFO - __main__ - Step 51668: {'lr': 0.0003734634204494819, 'samples': 9920256, 'steps': 51667, 'loss/train': 1.5722851753234863} -11/07/2021 04:30:21 - INFO - __main__ - Step 51669: {'lr': 0.0003734588059685499, 'samples': 9920448, 'steps': 51668, 'loss/train': 1.341074824333191} -11/07/2021 04:30:22 - INFO - __main__ - Step 51670: {'lr': 0.0003734541914319892, 'samples': 9920640, 'steps': 51669, 'loss/train': 2.1882638931274414} -11/07/2021 04:30:22 - INFO - __main__ - Step 51671: {'lr': 0.0003734495768398019, 'samples': 9920832, 'steps': 51670, 'loss/train': 1.5213651657104492} -11/07/2021 04:30:23 - INFO - __main__ - Step 51672: {'lr': 0.00037344496219199016, 'samples': 9921024, 'steps': 51671, 'loss/train': 1.61359703540802} -11/07/2021 04:30:23 - INFO - __main__ - Step 51673: {'lr': 0.0003734403474885561, 'samples': 9921216, 'steps': 51672, 'loss/train': 1.300546646118164} -11/07/2021 04:30:24 - INFO - __main__ - Step 51674: {'lr': 0.00037343573272950167, 'samples': 9921408, 'steps': 51673, 'loss/train': 1.4245498180389404} -11/07/2021 04:30:25 - INFO - __main__ - Step 51675: {'lr': 0.00037343111791482897, 'samples': 9921600, 'steps': 51674, 'loss/train': 1.6947277784347534} -11/07/2021 04:30:25 - INFO - __main__ - Step 51676: {'lr': 0.0003734265030445401, 'samples': 9921792, 'steps': 51675, 'loss/train': 1.4293681383132935} -11/07/2021 04:30:25 - INFO - __main__ - Step 51677: {'lr': 0.0003734218881186372, 'samples': 9921984, 'steps': 51676, 'loss/train': 1.6062393188476562} -11/07/2021 04:30:26 - INFO - __main__ - Step 51678: {'lr': 0.00037341727313712237, 'samples': 9922176, 'steps': 51677, 'loss/train': 1.2721912860870361} -11/07/2021 04:30:26 - INFO - __main__ - Step 51679: {'lr': 0.0003734126580999975, 'samples': 9922368, 'steps': 51678, 'loss/train': 1.5690890550613403} -11/07/2021 04:30:27 - INFO - __main__ - Step 51680: {'lr': 0.0003734080430072649, 'samples': 9922560, 'steps': 51679, 'loss/train': 1.523789882659912} -11/07/2021 04:30:27 - INFO - __main__ - Step 51681: {'lr': 0.0003734034278589265, 'samples': 9922752, 'steps': 51680, 'loss/train': 1.4328149557113647} -11/07/2021 04:30:28 - INFO - __main__ - Step 51682: {'lr': 0.0003733988126549843, 'samples': 9922944, 'steps': 51681, 'loss/train': 1.4673817157745361} -11/07/2021 04:30:28 - INFO - __main__ - Step 51683: {'lr': 0.0003733941973954407, 'samples': 9923136, 'steps': 51682, 'loss/train': 1.2372491359710693} -11/07/2021 04:30:28 - INFO - __main__ - Step 51684: {'lr': 0.00037338958208029744, 'samples': 9923328, 'steps': 51683, 'loss/train': 1.281899333000183} -11/07/2021 04:30:30 - INFO - __main__ - Step 51685: {'lr': 0.0003733849667095568, 'samples': 9923520, 'steps': 51684, 'loss/train': 1.811161756515503} -11/07/2021 04:30:30 - INFO - __main__ - Step 51686: {'lr': 0.00037338035128322075, 'samples': 9923712, 'steps': 51685, 'loss/train': 1.7999763488769531} -11/07/2021 04:30:30 - INFO - __main__ - Step 51687: {'lr': 0.00037337573580129143, 'samples': 9923904, 'steps': 51686, 'loss/train': 0.15734606981277466} -11/07/2021 04:30:31 - INFO - __main__ - Step 51688: {'lr': 0.0003733711202637709, 'samples': 9924096, 'steps': 51687, 'loss/train': 2.9371252059936523} -11/07/2021 04:30:31 - INFO - __main__ - Step 51689: {'lr': 0.00037336650467066125, 'samples': 9924288, 'steps': 51688, 'loss/train': 1.6733360290527344} -11/07/2021 04:30:31 - INFO - __main__ - Step 51690: {'lr': 0.0003733618890219646, 'samples': 9924480, 'steps': 51689, 'loss/train': 1.1849936246871948} -11/07/2021 04:30:33 - INFO - __main__ - Step 51691: {'lr': 0.000373357273317683, 'samples': 9924672, 'steps': 51690, 'loss/train': 5.7699737548828125} -11/07/2021 04:30:33 - INFO - __main__ - Step 51692: {'lr': 0.00037335265755781844, 'samples': 9924864, 'steps': 51691, 'loss/train': 1.5762732028961182} -11/07/2021 04:30:33 - INFO - __main__ - Step 51693: {'lr': 0.00037334804174237314, 'samples': 9925056, 'steps': 51692, 'loss/train': 0.768830418586731} -11/07/2021 04:30:34 - INFO - __main__ - Step 51694: {'lr': 0.0003733434258713491, 'samples': 9925248, 'steps': 51693, 'loss/train': 1.4546159505844116} -11/07/2021 04:30:34 - INFO - __main__ - Step 51695: {'lr': 0.00037333880994474834, 'samples': 9925440, 'steps': 51694, 'loss/train': 0.9135294556617737} -11/07/2021 04:30:35 - INFO - __main__ - Step 51696: {'lr': 0.00037333419396257307, 'samples': 9925632, 'steps': 51695, 'loss/train': 1.7703784704208374} -11/07/2021 04:30:36 - INFO - __main__ - Step 51697: {'lr': 0.00037332957792482534, 'samples': 9925824, 'steps': 51696, 'loss/train': 1.1710397005081177} -11/07/2021 04:30:36 - INFO - __main__ - Step 51698: {'lr': 0.0003733249618315072, 'samples': 9926016, 'steps': 51697, 'loss/train': 1.419105052947998} -11/07/2021 04:30:36 - INFO - __main__ - Step 51699: {'lr': 0.0003733203456826207, 'samples': 9926208, 'steps': 51698, 'loss/train': 1.4877972602844238} -11/07/2021 04:30:37 - INFO - __main__ - Step 51700: {'lr': 0.000373315729478168, 'samples': 9926400, 'steps': 51699, 'loss/train': 1.1597901582717896} -11/07/2021 04:30:37 - INFO - __main__ - Step 51701: {'lr': 0.0003733111132181511, 'samples': 9926592, 'steps': 51700, 'loss/train': 1.6634995937347412} -11/07/2021 04:30:38 - INFO - __main__ - Step 51702: {'lr': 0.0003733064969025721, 'samples': 9926784, 'steps': 51701, 'loss/train': 1.2895931005477905} -11/07/2021 04:30:38 - INFO - __main__ - Step 51703: {'lr': 0.00037330188053143323, 'samples': 9926976, 'steps': 51702, 'loss/train': 1.1735255718231201} -11/07/2021 04:30:39 - INFO - __main__ - Step 51704: {'lr': 0.0003732972641047363, 'samples': 9927168, 'steps': 51703, 'loss/train': 1.7416150569915771} -11/07/2021 04:30:39 - INFO - __main__ - Step 51705: {'lr': 0.0003732926476224835, 'samples': 9927360, 'steps': 51704, 'loss/train': 1.1643649339675903} -11/07/2021 04:30:39 - INFO - __main__ - Step 51706: {'lr': 0.00037328803108467704, 'samples': 9927552, 'steps': 51705, 'loss/train': 1.7630983591079712} -11/07/2021 04:30:41 - INFO - __main__ - Step 51707: {'lr': 0.0003732834144913188, 'samples': 9927744, 'steps': 51706, 'loss/train': 1.2046449184417725} -11/07/2021 04:30:41 - INFO - __main__ - Step 51708: {'lr': 0.00037327879784241095, 'samples': 9927936, 'steps': 51707, 'loss/train': 1.187599778175354} -11/07/2021 04:30:41 - INFO - __main__ - Step 51709: {'lr': 0.00037327418113795565, 'samples': 9928128, 'steps': 51708, 'loss/train': 1.437038779258728} -11/07/2021 04:30:42 - INFO - __main__ - Step 51710: {'lr': 0.0003732695643779549, 'samples': 9928320, 'steps': 51709, 'loss/train': 1.5829737186431885} -11/07/2021 04:30:42 - INFO - __main__ - Step 51711: {'lr': 0.0003732649475624108, 'samples': 9928512, 'steps': 51710, 'loss/train': 1.6034432649612427} -11/07/2021 04:30:43 - INFO - __main__ - Step 51712: {'lr': 0.0003732603306913254, 'samples': 9928704, 'steps': 51711, 'loss/train': 1.2415457963943481} -11/07/2021 04:30:44 - INFO - __main__ - Step 51713: {'lr': 0.00037325571376470074, 'samples': 9928896, 'steps': 51712, 'loss/train': 1.7289055585861206} -11/07/2021 04:30:44 - INFO - __main__ - Step 51714: {'lr': 0.00037325109678253897, 'samples': 9929088, 'steps': 51713, 'loss/train': 1.754821538925171} -11/07/2021 04:30:45 - INFO - __main__ - Step 51715: {'lr': 0.0003732464797448422, 'samples': 9929280, 'steps': 51714, 'loss/train': 1.5865949392318726} -11/07/2021 04:30:45 - INFO - __main__ - Step 51716: {'lr': 0.0003732418626516125, 'samples': 9929472, 'steps': 51715, 'loss/train': 1.9165054559707642} -11/07/2021 04:30:47 - INFO - __main__ - Step 51717: {'lr': 0.0003732372455028519, 'samples': 9929664, 'steps': 51716, 'loss/train': 0.8452095985412598} -11/07/2021 04:30:47 - INFO - __main__ - Step 51718: {'lr': 0.00037323262829856246, 'samples': 9929856, 'steps': 51717, 'loss/train': 1.0609043836593628} -11/07/2021 04:30:47 - INFO - __main__ - Step 51719: {'lr': 0.00037322801103874633, 'samples': 9930048, 'steps': 51718, 'loss/train': 2.9352524280548096} -11/07/2021 04:30:48 - INFO - __main__ - Step 51720: {'lr': 0.00037322339372340555, 'samples': 9930240, 'steps': 51719, 'loss/train': 1.8885968923568726} -11/07/2021 04:30:48 - INFO - __main__ - Step 51721: {'lr': 0.0003732187763525421, 'samples': 9930432, 'steps': 51720, 'loss/train': 1.7703211307525635} -11/07/2021 04:30:48 - INFO - __main__ - Step 51722: {'lr': 0.00037321415892615833, 'samples': 9930624, 'steps': 51721, 'loss/train': 0.9961236715316772} -11/07/2021 04:30:49 - INFO - __main__ - Step 51723: {'lr': 0.0003732095414442561, 'samples': 9930816, 'steps': 51722, 'loss/train': 1.6001304388046265} -11/07/2021 04:30:50 - INFO - __main__ - Step 51724: {'lr': 0.00037320492390683756, 'samples': 9931008, 'steps': 51723, 'loss/train': 1.4640626907348633} -11/07/2021 04:30:50 - INFO - __main__ - Step 51725: {'lr': 0.00037320030631390476, 'samples': 9931200, 'steps': 51724, 'loss/train': 1.0389316082000732} -11/07/2021 04:30:51 - INFO - __main__ - Step 51726: {'lr': 0.00037319568866545983, 'samples': 9931392, 'steps': 51725, 'loss/train': 0.3944765627384186} -11/07/2021 04:30:51 - INFO - __main__ - Step 51727: {'lr': 0.00037319107096150483, 'samples': 9931584, 'steps': 51726, 'loss/train': 1.802032470703125} -11/07/2021 04:30:51 - INFO - __main__ - Step 51728: {'lr': 0.00037318645320204183, 'samples': 9931776, 'steps': 51727, 'loss/train': 1.6470043659210205} -11/07/2021 04:30:52 - INFO - __main__ - Step 51729: {'lr': 0.0003731818353870729, 'samples': 9931968, 'steps': 51728, 'loss/train': 1.5274968147277832} -11/07/2021 04:30:53 - INFO - __main__ - Step 51730: {'lr': 0.00037317721751660014, 'samples': 9932160, 'steps': 51729, 'loss/train': 1.6125394105911255} -11/07/2021 04:30:53 - INFO - __main__ - Step 51731: {'lr': 0.00037317259959062564, 'samples': 9932352, 'steps': 51730, 'loss/train': 1.8147977590560913} -11/07/2021 04:30:53 - INFO - __main__ - Step 51732: {'lr': 0.0003731679816091514, 'samples': 9932544, 'steps': 51731, 'loss/train': 1.1446830034255981} -11/07/2021 04:30:54 - INFO - __main__ - Step 51733: {'lr': 0.00037316336357217966, 'samples': 9932736, 'steps': 51732, 'loss/train': 1.0742896795272827} -11/07/2021 04:30:55 - INFO - __main__ - Step 51734: {'lr': 0.0003731587454797124, 'samples': 9932928, 'steps': 51733, 'loss/train': 1.5206941366195679} -11/07/2021 04:30:55 - INFO - __main__ - Step 51735: {'lr': 0.0003731541273317517, 'samples': 9933120, 'steps': 51734, 'loss/train': 1.9338865280151367} -11/07/2021 04:30:55 - INFO - __main__ - Step 51736: {'lr': 0.0003731495091282996, 'samples': 9933312, 'steps': 51735, 'loss/train': 1.4734269380569458} -11/07/2021 04:30:56 - INFO - __main__ - Step 51737: {'lr': 0.0003731448908693583, 'samples': 9933504, 'steps': 51736, 'loss/train': 1.5363223552703857} -11/07/2021 04:30:56 - INFO - __main__ - Step 51738: {'lr': 0.0003731402725549298, 'samples': 9933696, 'steps': 51737, 'loss/train': 1.4811780452728271} -11/07/2021 04:30:57 - INFO - __main__ - Step 51739: {'lr': 0.0003731356541850162, 'samples': 9933888, 'steps': 51738, 'loss/train': 3.218954086303711} -11/07/2021 04:30:58 - INFO - __main__ - Step 51740: {'lr': 0.0003731310357596195, 'samples': 9934080, 'steps': 51739, 'loss/train': 1.2267725467681885} -11/07/2021 04:30:58 - INFO - __main__ - Step 51741: {'lr': 0.0003731264172787419, 'samples': 9934272, 'steps': 51740, 'loss/train': 1.9757555723190308} -11/07/2021 04:30:58 - INFO - __main__ - Step 51742: {'lr': 0.0003731217987423854, 'samples': 9934464, 'steps': 51741, 'loss/train': 1.652662754058838} -11/07/2021 04:30:59 - INFO - __main__ - Step 51743: {'lr': 0.00037311718015055215, 'samples': 9934656, 'steps': 51742, 'loss/train': 1.73580002784729} -11/07/2021 04:30:59 - INFO - __main__ - Step 51744: {'lr': 0.0003731125615032442, 'samples': 9934848, 'steps': 51743, 'loss/train': 1.3464809656143188} -11/07/2021 04:31:00 - INFO - __main__ - Step 51745: {'lr': 0.0003731079428004637, 'samples': 9935040, 'steps': 51744, 'loss/train': 1.7845275402069092} -11/07/2021 04:31:00 - INFO - __main__ - Step 51746: {'lr': 0.00037310332404221256, 'samples': 9935232, 'steps': 51745, 'loss/train': 2.0145421028137207} -11/07/2021 04:31:01 - INFO - __main__ - Step 51747: {'lr': 0.000373098705228493, 'samples': 9935424, 'steps': 51746, 'loss/train': 1.3998632431030273} -11/07/2021 04:31:01 - INFO - __main__ - Step 51748: {'lr': 0.00037309408635930705, 'samples': 9935616, 'steps': 51747, 'loss/train': 1.2065773010253906} -11/07/2021 04:31:01 - INFO - __main__ - Step 51749: {'lr': 0.0003730894674346568, 'samples': 9935808, 'steps': 51748, 'loss/train': 1.1705305576324463} -11/07/2021 04:31:02 - INFO - __main__ - Step 51750: {'lr': 0.00037308484845454434, 'samples': 9936000, 'steps': 51749, 'loss/train': 1.5436286926269531} -11/07/2021 04:31:03 - INFO - __main__ - Step 51751: {'lr': 0.0003730802294189718, 'samples': 9936192, 'steps': 51750, 'loss/train': 1.499884843826294} -11/07/2021 04:31:03 - INFO - __main__ - Step 51752: {'lr': 0.00037307561032794113, 'samples': 9936384, 'steps': 51751, 'loss/train': 1.10182785987854} -11/07/2021 04:31:03 - INFO - __main__ - Step 51753: {'lr': 0.0003730709911814545, 'samples': 9936576, 'steps': 51752, 'loss/train': 1.6749976873397827} -11/07/2021 04:31:04 - INFO - __main__ - Step 51754: {'lr': 0.000373066371979514, 'samples': 9936768, 'steps': 51753, 'loss/train': 1.492154598236084} -11/07/2021 04:31:05 - INFO - __main__ - Step 51755: {'lr': 0.00037306175272212166, 'samples': 9936960, 'steps': 51754, 'loss/train': 1.5916110277175903} -11/07/2021 04:31:05 - INFO - __main__ - Step 51756: {'lr': 0.0003730571334092796, 'samples': 9937152, 'steps': 51755, 'loss/train': 1.5051785707473755} -11/07/2021 04:31:05 - INFO - __main__ - Step 51757: {'lr': 0.00037305251404099, 'samples': 9937344, 'steps': 51756, 'loss/train': 1.2896778583526611} -11/07/2021 04:31:06 - INFO - __main__ - Step 51758: {'lr': 0.00037304789461725473, 'samples': 9937536, 'steps': 51757, 'loss/train': 1.5637562274932861} -11/07/2021 04:31:06 - INFO - __main__ - Step 51759: {'lr': 0.000373043275138076, 'samples': 9937728, 'steps': 51758, 'loss/train': 1.2381839752197266} -11/07/2021 04:31:07 - INFO - __main__ - Step 51760: {'lr': 0.00037303865560345587, 'samples': 9937920, 'steps': 51759, 'loss/train': 1.8927297592163086} -11/07/2021 04:31:08 - INFO - __main__ - Step 51761: {'lr': 0.00037303403601339643, 'samples': 9938112, 'steps': 51760, 'loss/train': 1.7042573690414429} -11/07/2021 04:31:08 - INFO - __main__ - Step 51762: {'lr': 0.0003730294163678997, 'samples': 9938304, 'steps': 51761, 'loss/train': 1.8782144784927368} -11/07/2021 04:31:08 - INFO - __main__ - Step 51763: {'lr': 0.00037302479666696787, 'samples': 9938496, 'steps': 51762, 'loss/train': 1.4256799221038818} -11/07/2021 04:31:09 - INFO - __main__ - Step 51764: {'lr': 0.000373020176910603, 'samples': 9938688, 'steps': 51763, 'loss/train': 0.7905405759811401} -11/07/2021 04:31:09 - INFO - __main__ - Step 51765: {'lr': 0.00037301555709880706, 'samples': 9938880, 'steps': 51764, 'loss/train': 1.828656554222107} -11/07/2021 04:31:10 - INFO - __main__ - Step 51766: {'lr': 0.00037301093723158223, 'samples': 9939072, 'steps': 51765, 'loss/train': 0.8808240294456482} -11/07/2021 04:31:10 - INFO - __main__ - Step 51767: {'lr': 0.0003730063173089306, 'samples': 9939264, 'steps': 51766, 'loss/train': 0.9141917824745178} -11/07/2021 04:31:11 - INFO - __main__ - Step 51768: {'lr': 0.0003730016973308542, 'samples': 9939456, 'steps': 51767, 'loss/train': 1.409717082977295} -11/07/2021 04:31:11 - INFO - __main__ - Step 51769: {'lr': 0.0003729970772973551, 'samples': 9939648, 'steps': 51768, 'loss/train': 1.1435794830322266} -11/07/2021 04:31:11 - INFO - __main__ - Step 51770: {'lr': 0.00037299245720843544, 'samples': 9939840, 'steps': 51769, 'loss/train': 1.2731410264968872} -11/07/2021 04:31:12 - INFO - __main__ - Step 51771: {'lr': 0.0003729878370640973, 'samples': 9940032, 'steps': 51770, 'loss/train': 0.7276386618614197} -11/07/2021 04:31:13 - INFO - __main__ - Step 51772: {'lr': 0.0003729832168643428, 'samples': 9940224, 'steps': 51771, 'loss/train': 1.9008690118789673} -11/07/2021 04:31:13 - INFO - __main__ - Step 51773: {'lr': 0.00037297859660917384, 'samples': 9940416, 'steps': 51772, 'loss/train': 1.7732874155044556} -11/07/2021 04:31:14 - INFO - __main__ - Step 51774: {'lr': 0.00037297397629859266, 'samples': 9940608, 'steps': 51773, 'loss/train': 1.7407798767089844} -11/07/2021 04:31:14 - INFO - __main__ - Step 51775: {'lr': 0.0003729693559326013, 'samples': 9940800, 'steps': 51774, 'loss/train': 2.1384971141815186} -11/07/2021 04:31:15 - INFO - __main__ - Step 51776: {'lr': 0.00037296473551120185, 'samples': 9940992, 'steps': 51775, 'loss/train': 1.0660651922225952} -11/07/2021 04:31:16 - INFO - __main__ - Step 51777: {'lr': 0.00037296011503439643, 'samples': 9941184, 'steps': 51776, 'loss/train': 1.4928719997406006} -11/07/2021 04:31:16 - INFO - __main__ - Step 51778: {'lr': 0.00037295549450218704, 'samples': 9941376, 'steps': 51777, 'loss/train': 0.5091902017593384} -11/07/2021 04:31:17 - INFO - __main__ - Step 51779: {'lr': 0.0003729508739145758, 'samples': 9941568, 'steps': 51778, 'loss/train': 1.3106775283813477} -11/07/2021 04:31:17 - INFO - __main__ - Step 51780: {'lr': 0.0003729462532715648, 'samples': 9941760, 'steps': 51779, 'loss/train': 1.698462963104248} -11/07/2021 04:31:17 - INFO - __main__ - Step 51781: {'lr': 0.0003729416325731561, 'samples': 9941952, 'steps': 51780, 'loss/train': 1.79434335231781} -11/07/2021 04:31:18 - INFO - __main__ - Step 51782: {'lr': 0.0003729370118193518, 'samples': 9942144, 'steps': 51781, 'loss/train': 1.734641671180725} -11/07/2021 04:31:19 - INFO - __main__ - Step 51783: {'lr': 0.00037293239101015397, 'samples': 9942336, 'steps': 51782, 'loss/train': 1.9667565822601318} -11/07/2021 04:31:19 - INFO - __main__ - Step 51784: {'lr': 0.0003729277701455648, 'samples': 9942528, 'steps': 51783, 'loss/train': 1.8873034715652466} -11/07/2021 04:31:19 - INFO - __main__ - Step 51785: {'lr': 0.00037292314922558615, 'samples': 9942720, 'steps': 51784, 'loss/train': 0.9962705373764038} -11/07/2021 04:31:20 - INFO - __main__ - Step 51786: {'lr': 0.0003729185282502203, 'samples': 9942912, 'steps': 51785, 'loss/train': 1.6829118728637695} -11/07/2021 04:31:20 - INFO - __main__ - Step 51787: {'lr': 0.00037291390721946914, 'samples': 9943104, 'steps': 51786, 'loss/train': 1.8479154109954834} -11/07/2021 04:31:21 - INFO - __main__ - Step 51788: {'lr': 0.00037290928613333495, 'samples': 9943296, 'steps': 51787, 'loss/train': 1.1238924264907837} -11/07/2021 04:31:22 - INFO - __main__ - Step 51789: {'lr': 0.00037290466499181977, 'samples': 9943488, 'steps': 51788, 'loss/train': 1.8052947521209717} -11/07/2021 04:31:22 - INFO - __main__ - Step 51790: {'lr': 0.0003729000437949256, 'samples': 9943680, 'steps': 51789, 'loss/train': 5.505935192108154} -11/07/2021 04:31:22 - INFO - __main__ - Step 51791: {'lr': 0.0003728954225426546, 'samples': 9943872, 'steps': 51790, 'loss/train': 5.436152935028076} -11/07/2021 04:31:23 - INFO - __main__ - Step 51792: {'lr': 0.00037289080123500886, 'samples': 9944064, 'steps': 51791, 'loss/train': 1.7828023433685303} -11/07/2021 04:31:23 - INFO - __main__ - Step 51793: {'lr': 0.0003728861798719903, 'samples': 9944256, 'steps': 51792, 'loss/train': 1.127197504043579} -11/07/2021 04:31:24 - INFO - __main__ - Step 51794: {'lr': 0.00037288155845360116, 'samples': 9944448, 'steps': 51793, 'loss/train': 1.2389522790908813} -11/07/2021 04:31:25 - INFO - __main__ - Step 51795: {'lr': 0.00037287693697984355, 'samples': 9944640, 'steps': 51794, 'loss/train': 1.238544225692749} -11/07/2021 04:31:25 - INFO - __main__ - Step 51796: {'lr': 0.0003728723154507195, 'samples': 9944832, 'steps': 51795, 'loss/train': 1.530659556388855} -11/07/2021 04:31:25 - INFO - __main__ - Step 51797: {'lr': 0.000372867693866231, 'samples': 9945024, 'steps': 51796, 'loss/train': 0.9943727254867554} -11/07/2021 04:31:26 - INFO - __main__ - Step 51798: {'lr': 0.0003728630722263803, 'samples': 9945216, 'steps': 51797, 'loss/train': 1.7220540046691895} -11/07/2021 04:31:27 - INFO - __main__ - Step 51799: {'lr': 0.0003728584505311693, 'samples': 9945408, 'steps': 51798, 'loss/train': 1.9942365884780884} -11/07/2021 04:31:27 - INFO - __main__ - Step 51800: {'lr': 0.0003728538287806002, 'samples': 9945600, 'steps': 51799, 'loss/train': 1.9418936967849731} -11/07/2021 04:31:27 - INFO - __main__ - Step 51801: {'lr': 0.00037284920697467505, 'samples': 9945792, 'steps': 51800, 'loss/train': 1.168082356452942} -11/07/2021 04:31:28 - INFO - __main__ - Step 51802: {'lr': 0.00037284458511339604, 'samples': 9945984, 'steps': 51801, 'loss/train': 1.4020640850067139} -11/07/2021 04:31:28 - INFO - __main__ - Step 51803: {'lr': 0.00037283996319676505, 'samples': 9946176, 'steps': 51802, 'loss/train': 1.0403871536254883} -11/07/2021 04:31:29 - INFO - __main__ - Step 51804: {'lr': 0.0003728353412247843, 'samples': 9946368, 'steps': 51803, 'loss/train': 1.0290791988372803} -11/07/2021 04:31:29 - INFO - __main__ - Step 51805: {'lr': 0.0003728307191974558, 'samples': 9946560, 'steps': 51804, 'loss/train': 1.4733210802078247} -11/07/2021 04:31:30 - INFO - __main__ - Step 51806: {'lr': 0.00037282609711478175, 'samples': 9946752, 'steps': 51805, 'loss/train': 1.1654385328292847} -11/07/2021 04:31:30 - INFO - __main__ - Step 51807: {'lr': 0.00037282147497676415, 'samples': 9946944, 'steps': 51806, 'loss/train': 1.5371730327606201} -11/07/2021 04:31:30 - INFO - __main__ - Step 51808: {'lr': 0.000372816852783405, 'samples': 9947136, 'steps': 51807, 'loss/train': 1.8102275133132935} -11/07/2021 04:31:31 - INFO - __main__ - Step 51809: {'lr': 0.0003728122305347066, 'samples': 9947328, 'steps': 51808, 'loss/train': 1.6196417808532715} -11/07/2021 04:31:33 - INFO - __main__ - Step 51810: {'lr': 0.00037280760823067086, 'samples': 9947520, 'steps': 51809, 'loss/train': 1.4983396530151367} -11/07/2021 04:31:33 - INFO - __main__ - Step 51811: {'lr': 0.00037280298587129984, 'samples': 9947712, 'steps': 51810, 'loss/train': 1.291886329650879} -11/07/2021 04:31:33 - INFO - __main__ - Step 51812: {'lr': 0.0003727983634565958, 'samples': 9947904, 'steps': 51811, 'loss/train': 2.8370022773742676} -11/07/2021 04:31:34 - INFO - __main__ - Step 51813: {'lr': 0.0003727937409865606, 'samples': 9948096, 'steps': 51812, 'loss/train': 2.879993438720703} -11/07/2021 04:31:34 - INFO - __main__ - Step 51814: {'lr': 0.0003727891184611965, 'samples': 9948288, 'steps': 51813, 'loss/train': 1.6335194110870361} -11/07/2021 04:31:34 - INFO - __main__ - Step 51815: {'lr': 0.0003727844958805055, 'samples': 9948480, 'steps': 51814, 'loss/train': 1.2594209909439087} -11/07/2021 04:31:35 - INFO - __main__ - Step 51816: {'lr': 0.0003727798732444897, 'samples': 9948672, 'steps': 51815, 'loss/train': 1.3646434545516968} -11/07/2021 04:31:36 - INFO - __main__ - Step 51817: {'lr': 0.00037277525055315114, 'samples': 9948864, 'steps': 51816, 'loss/train': 1.7088550329208374} -11/07/2021 04:31:36 - INFO - __main__ - Step 51818: {'lr': 0.0003727706278064921, 'samples': 9949056, 'steps': 51817, 'loss/train': 1.1961368322372437} -11/07/2021 04:31:36 - INFO - __main__ - Step 51819: {'lr': 0.00037276600500451434, 'samples': 9949248, 'steps': 51818, 'loss/train': 0.8588838577270508} -11/07/2021 04:31:37 - INFO - __main__ - Step 51820: {'lr': 0.00037276138214722016, 'samples': 9949440, 'steps': 51819, 'loss/train': 1.0528807640075684} -11/07/2021 04:31:38 - INFO - __main__ - Step 51821: {'lr': 0.0003727567592346116, 'samples': 9949632, 'steps': 51820, 'loss/train': 1.587601900100708} -11/07/2021 04:31:38 - INFO - __main__ - Step 51822: {'lr': 0.00037275213626669076, 'samples': 9949824, 'steps': 51821, 'loss/train': 1.6551111936569214} -11/07/2021 04:31:39 - INFO - __main__ - Step 51823: {'lr': 0.00037274751324345966, 'samples': 9950016, 'steps': 51822, 'loss/train': 1.622349739074707} -11/07/2021 04:31:39 - INFO - __main__ - Step 51824: {'lr': 0.0003727428901649205, 'samples': 9950208, 'steps': 51823, 'loss/train': 2.177377939224243} -11/07/2021 04:31:39 - INFO - __main__ - Step 51825: {'lr': 0.00037273826703107527, 'samples': 9950400, 'steps': 51824, 'loss/train': 1.2760615348815918} -11/07/2021 04:31:40 - INFO - __main__ - Step 51826: {'lr': 0.000372733643841926, 'samples': 9950592, 'steps': 51825, 'loss/train': 1.5299488306045532} -11/07/2021 04:31:41 - INFO - __main__ - Step 51827: {'lr': 0.00037272902059747487, 'samples': 9950784, 'steps': 51826, 'loss/train': 1.2025662660598755} -11/07/2021 04:31:41 - INFO - __main__ - Step 51828: {'lr': 0.00037272439729772397, 'samples': 9950976, 'steps': 51827, 'loss/train': 1.5960502624511719} -11/07/2021 04:31:41 - INFO - __main__ - Step 51829: {'lr': 0.00037271977394267534, 'samples': 9951168, 'steps': 51828, 'loss/train': 1.3377803564071655} -11/07/2021 04:31:42 - INFO - __main__ - Step 51830: {'lr': 0.0003727151505323311, 'samples': 9951360, 'steps': 51829, 'loss/train': 0.9705298542976379} -11/07/2021 04:31:43 - INFO - __main__ - Step 51831: {'lr': 0.0003727105270666933, 'samples': 9951552, 'steps': 51830, 'loss/train': 1.0445075035095215} -11/07/2021 04:31:43 - INFO - __main__ - Step 51832: {'lr': 0.00037270590354576396, 'samples': 9951744, 'steps': 51831, 'loss/train': 1.5251946449279785} -11/07/2021 04:31:43 - INFO - __main__ - Step 51833: {'lr': 0.0003727012799695453, 'samples': 9951936, 'steps': 51832, 'loss/train': 1.1685718297958374} -11/07/2021 04:31:44 - INFO - __main__ - Step 51834: {'lr': 0.0003726966563380393, 'samples': 9952128, 'steps': 51833, 'loss/train': 1.306240200996399} -11/07/2021 04:31:44 - INFO - __main__ - Step 51835: {'lr': 0.00037269203265124807, 'samples': 9952320, 'steps': 51834, 'loss/train': 1.5331083536148071} -11/07/2021 04:31:45 - INFO - __main__ - Step 51836: {'lr': 0.00037268740890917374, 'samples': 9952512, 'steps': 51835, 'loss/train': 1.4534672498703003} -11/07/2021 04:31:46 - INFO - __main__ - Step 51837: {'lr': 0.0003726827851118183, 'samples': 9952704, 'steps': 51836, 'loss/train': 1.3268409967422485} -11/07/2021 04:31:46 - INFO - __main__ - Step 51838: {'lr': 0.00037267816125918394, 'samples': 9952896, 'steps': 51837, 'loss/train': 1.8532732725143433} -11/07/2021 04:31:46 - INFO - __main__ - Step 51839: {'lr': 0.00037267353735127276, 'samples': 9953088, 'steps': 51838, 'loss/train': 1.5745549201965332} -11/07/2021 04:31:47 - INFO - __main__ - Step 51840: {'lr': 0.00037266891338808667, 'samples': 9953280, 'steps': 51839, 'loss/train': 1.067560076713562} -11/07/2021 04:31:47 - INFO - __main__ - Step 51841: {'lr': 0.00037266428936962785, 'samples': 9953472, 'steps': 51840, 'loss/train': 1.5043675899505615} -11/07/2021 04:31:48 - INFO - __main__ - Step 51842: {'lr': 0.00037265966529589846, 'samples': 9953664, 'steps': 51841, 'loss/train': 1.3698827028274536} -11/07/2021 04:31:48 - INFO - __main__ - Step 51843: {'lr': 0.0003726550411669005, 'samples': 9953856, 'steps': 51842, 'loss/train': 0.9738919734954834} -11/07/2021 04:31:49 - INFO - __main__ - Step 51844: {'lr': 0.000372650416982636, 'samples': 9954048, 'steps': 51843, 'loss/train': 2.3924238681793213} -11/07/2021 04:31:49 - INFO - __main__ - Step 51845: {'lr': 0.0003726457927431073, 'samples': 9954240, 'steps': 51844, 'loss/train': 1.8212895393371582} -11/07/2021 04:31:50 - INFO - __main__ - Step 51846: {'lr': 0.0003726411684483161, 'samples': 9954432, 'steps': 51845, 'loss/train': 1.4313552379608154} -11/07/2021 04:31:50 - INFO - __main__ - Step 51847: {'lr': 0.0003726365440982648, 'samples': 9954624, 'steps': 51846, 'loss/train': 1.6480627059936523} -11/07/2021 04:31:51 - INFO - __main__ - Step 51848: {'lr': 0.00037263191969295537, 'samples': 9954816, 'steps': 51847, 'loss/train': 1.3523963689804077} -11/07/2021 04:31:51 - INFO - __main__ - Step 51849: {'lr': 0.0003726272952323898, 'samples': 9955008, 'steps': 51848, 'loss/train': 1.597180962562561} -11/07/2021 04:31:51 - INFO - __main__ - Step 51850: {'lr': 0.0003726226707165703, 'samples': 9955200, 'steps': 51849, 'loss/train': 1.6327004432678223} -11/07/2021 04:31:52 - INFO - __main__ - Step 51851: {'lr': 0.000372618046145499, 'samples': 9955392, 'steps': 51850, 'loss/train': 1.4291988611221313} -11/07/2021 04:31:53 - INFO - __main__ - Step 51852: {'lr': 0.0003726134215191778, 'samples': 9955584, 'steps': 51851, 'loss/train': 1.3706315755844116} -11/07/2021 04:31:53 - INFO - __main__ - Step 51853: {'lr': 0.0003726087968376089, 'samples': 9955776, 'steps': 51852, 'loss/train': 1.2131381034851074} -11/07/2021 04:31:54 - INFO - __main__ - Step 51854: {'lr': 0.0003726041721007944, 'samples': 9955968, 'steps': 51853, 'loss/train': 5.908267498016357} -11/07/2021 04:31:54 - INFO - __main__ - Step 51855: {'lr': 0.0003725995473087363, 'samples': 9956160, 'steps': 51854, 'loss/train': 1.3329787254333496} -11/07/2021 04:31:54 - INFO - __main__ - Step 51856: {'lr': 0.0003725949224614368, 'samples': 9956352, 'steps': 51855, 'loss/train': 1.276503562927246} -11/07/2021 04:31:55 - INFO - __main__ - Step 51857: {'lr': 0.00037259029755889783, 'samples': 9956544, 'steps': 51856, 'loss/train': 0.7896950244903564} -11/07/2021 04:31:56 - INFO - __main__ - Step 51858: {'lr': 0.00037258567260112165, 'samples': 9956736, 'steps': 51857, 'loss/train': 0.9399859309196472} -11/07/2021 04:31:56 - INFO - __main__ - Step 51859: {'lr': 0.00037258104758811024, 'samples': 9956928, 'steps': 51858, 'loss/train': 1.4322720766067505} -11/07/2021 04:31:56 - INFO - __main__ - Step 51860: {'lr': 0.00037257642251986567, 'samples': 9957120, 'steps': 51859, 'loss/train': 2.2745914459228516} -11/07/2021 04:31:57 - INFO - __main__ - Step 51861: {'lr': 0.00037257179739639006, 'samples': 9957312, 'steps': 51860, 'loss/train': 1.4123642444610596} -11/07/2021 04:31:57 - INFO - __main__ - Step 51862: {'lr': 0.00037256717221768556, 'samples': 9957504, 'steps': 51861, 'loss/train': 1.6009799242019653} -11/07/2021 04:31:58 - INFO - __main__ - Step 51863: {'lr': 0.0003725625469837541, 'samples': 9957696, 'steps': 51862, 'loss/train': 1.8816026449203491} -11/07/2021 04:31:58 - INFO - __main__ - Step 51864: {'lr': 0.00037255792169459785, 'samples': 9957888, 'steps': 51863, 'loss/train': 1.9500659704208374} -11/07/2021 04:31:59 - INFO - __main__ - Step 51865: {'lr': 0.00037255329635021896, 'samples': 9958080, 'steps': 51864, 'loss/train': 1.6771234273910522} -11/07/2021 04:31:59 - INFO - __main__ - Step 51866: {'lr': 0.0003725486709506194, 'samples': 9958272, 'steps': 51865, 'loss/train': 1.736471176147461} -11/07/2021 04:31:59 - INFO - __main__ - Step 51867: {'lr': 0.0003725440454958013, 'samples': 9958464, 'steps': 51866, 'loss/train': 1.9499398469924927} -11/07/2021 04:32:00 - INFO - __main__ - Step 51868: {'lr': 0.0003725394199857667, 'samples': 9958656, 'steps': 51867, 'loss/train': 1.7287940979003906} -11/07/2021 04:32:01 - INFO - __main__ - Step 51869: {'lr': 0.0003725347944205178, 'samples': 9958848, 'steps': 51868, 'loss/train': 1.9378396272659302} -11/07/2021 04:32:01 - INFO - __main__ - Step 51870: {'lr': 0.0003725301688000566, 'samples': 9959040, 'steps': 51869, 'loss/train': 2.1761879920959473} -11/07/2021 04:32:02 - INFO - __main__ - Step 51871: {'lr': 0.0003725255431243852, 'samples': 9959232, 'steps': 51870, 'loss/train': 1.4214507341384888} -11/07/2021 04:32:02 - INFO - __main__ - Step 51872: {'lr': 0.00037252091739350566, 'samples': 9959424, 'steps': 51871, 'loss/train': 1.181527853012085} -11/07/2021 04:32:03 - INFO - __main__ - Step 51873: {'lr': 0.0003725162916074201, 'samples': 9959616, 'steps': 51872, 'loss/train': 1.4796147346496582} -11/07/2021 04:32:03 - INFO - __main__ - Step 51874: {'lr': 0.0003725116657661306, 'samples': 9959808, 'steps': 51873, 'loss/train': 1.6419570446014404} -11/07/2021 04:32:04 - INFO - __main__ - Step 51875: {'lr': 0.00037250703986963917, 'samples': 9960000, 'steps': 51874, 'loss/train': 1.7105646133422852} -11/07/2021 04:32:04 - INFO - __main__ - Step 51876: {'lr': 0.000372502413917948, 'samples': 9960192, 'steps': 51875, 'loss/train': 1.1473350524902344} -11/07/2021 04:32:04 - INFO - __main__ - Step 51877: {'lr': 0.00037249778791105916, 'samples': 9960384, 'steps': 51876, 'loss/train': 1.1271415948867798} -11/07/2021 04:32:06 - INFO - __main__ - Step 51878: {'lr': 0.0003724931618489747, 'samples': 9960576, 'steps': 51877, 'loss/train': 1.3002792596817017} -11/07/2021 04:32:06 - INFO - __main__ - Step 51879: {'lr': 0.0003724885357316967, 'samples': 9960768, 'steps': 51878, 'loss/train': 1.4516825675964355} -11/07/2021 04:32:06 - INFO - __main__ - Step 51880: {'lr': 0.00037248390955922726, 'samples': 9960960, 'steps': 51879, 'loss/train': 1.018768072128296} -11/07/2021 04:32:07 - INFO - __main__ - Step 51881: {'lr': 0.00037247928333156844, 'samples': 9961152, 'steps': 51880, 'loss/train': 1.8426998853683472} -11/07/2021 04:32:07 - INFO - __main__ - Step 51882: {'lr': 0.0003724746570487223, 'samples': 9961344, 'steps': 51881, 'loss/train': 1.809626817703247} -11/07/2021 04:32:07 - INFO - __main__ - Step 51883: {'lr': 0.00037247003071069106, 'samples': 9961536, 'steps': 51882, 'loss/train': 1.4476546049118042} -11/07/2021 04:32:08 - INFO - __main__ - Step 51884: {'lr': 0.0003724654043174767, 'samples': 9961728, 'steps': 51883, 'loss/train': 1.1984243392944336} -11/07/2021 04:32:09 - INFO - __main__ - Step 51885: {'lr': 0.0003724607778690813, 'samples': 9961920, 'steps': 51884, 'loss/train': 1.2851240634918213} -11/07/2021 04:32:09 - INFO - __main__ - Step 51886: {'lr': 0.00037245615136550695, 'samples': 9962112, 'steps': 51885, 'loss/train': 1.0749436616897583} -11/07/2021 04:32:09 - INFO - __main__ - Step 51887: {'lr': 0.00037245152480675577, 'samples': 9962304, 'steps': 51886, 'loss/train': 1.9282810688018799} -11/07/2021 04:32:10 - INFO - __main__ - Step 51888: {'lr': 0.0003724468981928298, 'samples': 9962496, 'steps': 51887, 'loss/train': 1.6814134120941162} -11/07/2021 04:32:10 - INFO - __main__ - Step 51889: {'lr': 0.00037244227152373113, 'samples': 9962688, 'steps': 51888, 'loss/train': 1.3974967002868652} -11/07/2021 04:32:11 - INFO - __main__ - Step 51890: {'lr': 0.0003724376447994619, 'samples': 9962880, 'steps': 51889, 'loss/train': 1.7117220163345337} -11/07/2021 04:32:12 - INFO - __main__ - Step 51891: {'lr': 0.00037243301802002414, 'samples': 9963072, 'steps': 51890, 'loss/train': 1.6015797853469849} -11/07/2021 04:32:12 - INFO - __main__ - Step 51892: {'lr': 0.00037242839118542, 'samples': 9963264, 'steps': 51891, 'loss/train': 1.636836051940918} -11/07/2021 04:32:12 - INFO - __main__ - Step 51893: {'lr': 0.00037242376429565143, 'samples': 9963456, 'steps': 51892, 'loss/train': 1.7007267475128174} -11/07/2021 04:32:13 - INFO - __main__ - Step 51894: {'lr': 0.0003724191373507206, 'samples': 9963648, 'steps': 51893, 'loss/train': 0.9272041916847229} -11/07/2021 04:32:14 - INFO - __main__ - Step 51895: {'lr': 0.00037241451035062965, 'samples': 9963840, 'steps': 51894, 'loss/train': 1.2658214569091797} -11/07/2021 04:32:14 - INFO - __main__ - Step 51896: {'lr': 0.0003724098832953806, 'samples': 9964032, 'steps': 51895, 'loss/train': 1.257627248764038} -11/07/2021 04:32:14 - INFO - __main__ - Step 51897: {'lr': 0.00037240525618497555, 'samples': 9964224, 'steps': 51896, 'loss/train': 1.2878658771514893} -11/07/2021 04:32:15 - INFO - __main__ - Step 51898: {'lr': 0.00037240062901941663, 'samples': 9964416, 'steps': 51897, 'loss/train': 1.421335220336914} -11/07/2021 04:32:15 - INFO - __main__ - Step 51899: {'lr': 0.0003723960017987058, 'samples': 9964608, 'steps': 51898, 'loss/train': 1.9077128171920776} -11/07/2021 04:32:16 - INFO - __main__ - Step 51900: {'lr': 0.00037239137452284527, 'samples': 9964800, 'steps': 51899, 'loss/train': 1.497809648513794} -11/07/2021 04:32:16 - INFO - __main__ - Step 51901: {'lr': 0.0003723867471918371, 'samples': 9964992, 'steps': 51900, 'loss/train': 1.8138912916183472} -11/07/2021 04:32:17 - INFO - __main__ - Step 51902: {'lr': 0.00037238211980568326, 'samples': 9965184, 'steps': 51901, 'loss/train': 0.4053778350353241} -11/07/2021 04:32:17 - INFO - __main__ - Step 51903: {'lr': 0.00037237749236438593, 'samples': 9965376, 'steps': 51902, 'loss/train': 1.2938474416732788} -11/07/2021 04:32:18 - INFO - __main__ - Step 51904: {'lr': 0.0003723728648679472, 'samples': 9965568, 'steps': 51903, 'loss/train': 1.5468488931655884} -11/07/2021 04:32:18 - INFO - __main__ - Step 51905: {'lr': 0.0003723682373163693, 'samples': 9965760, 'steps': 51904, 'loss/train': 1.8980106115341187} -11/07/2021 04:32:19 - INFO - __main__ - Step 51906: {'lr': 0.0003723636097096539, 'samples': 9965952, 'steps': 51905, 'loss/train': 1.3081457614898682} -11/07/2021 04:32:19 - INFO - __main__ - Step 51907: {'lr': 0.00037235898204780347, 'samples': 9966144, 'steps': 51906, 'loss/train': 1.562143325805664} -11/07/2021 04:32:20 - INFO - __main__ - Step 51908: {'lr': 0.00037235435433082004, 'samples': 9966336, 'steps': 51907, 'loss/train': 1.954079270362854} -11/07/2021 04:32:20 - INFO - __main__ - Step 51909: {'lr': 0.0003723497265587055, 'samples': 9966528, 'steps': 51908, 'loss/train': 0.8910297751426697} -11/07/2021 04:32:21 - INFO - __main__ - Step 51910: {'lr': 0.0003723450987314622, 'samples': 9966720, 'steps': 51909, 'loss/train': 1.4652249813079834} -11/07/2021 04:32:21 - INFO - __main__ - Step 51911: {'lr': 0.00037234047084909195, 'samples': 9966912, 'steps': 51910, 'loss/train': 1.4521297216415405} -11/07/2021 04:32:22 - INFO - __main__ - Step 51912: {'lr': 0.0003723358429115971, 'samples': 9967104, 'steps': 51911, 'loss/train': 1.370575189590454} -11/07/2021 04:32:22 - INFO - __main__ - Step 51913: {'lr': 0.00037233121491897953, 'samples': 9967296, 'steps': 51912, 'loss/train': 0.8230983018875122} -11/07/2021 04:32:22 - INFO - __main__ - Step 51914: {'lr': 0.00037232658687124135, 'samples': 9967488, 'steps': 51913, 'loss/train': 1.110690951347351} -11/07/2021 04:32:23 - INFO - __main__ - Step 51915: {'lr': 0.00037232195876838484, 'samples': 9967680, 'steps': 51914, 'loss/train': 1.117390513420105} -11/07/2021 04:32:24 - INFO - __main__ - Step 51916: {'lr': 0.00037231733061041176, 'samples': 9967872, 'steps': 51915, 'loss/train': 1.2352626323699951} -11/07/2021 04:32:24 - INFO - __main__ - Step 51917: {'lr': 0.0003723127023973245, 'samples': 9968064, 'steps': 51916, 'loss/train': 1.2384299039840698} -11/07/2021 04:32:24 - INFO - __main__ - Step 51918: {'lr': 0.00037230807412912505, 'samples': 9968256, 'steps': 51917, 'loss/train': 1.602675437927246} -11/07/2021 04:32:25 - INFO - __main__ - Step 51919: {'lr': 0.00037230344580581543, 'samples': 9968448, 'steps': 51918, 'loss/train': 1.3293837308883667} -11/07/2021 04:32:26 - INFO - __main__ - Step 51920: {'lr': 0.00037229881742739776, 'samples': 9968640, 'steps': 51919, 'loss/train': 1.4339882135391235} -11/07/2021 04:32:26 - INFO - __main__ - Step 51921: {'lr': 0.0003722941889938741, 'samples': 9968832, 'steps': 51920, 'loss/train': 1.3232321739196777} -11/07/2021 04:32:26 - INFO - __main__ - Step 51922: {'lr': 0.0003722895605052466, 'samples': 9969024, 'steps': 51921, 'loss/train': 1.449321985244751} -11/07/2021 04:32:27 - INFO - __main__ - Step 51923: {'lr': 0.0003722849319615173, 'samples': 9969216, 'steps': 51922, 'loss/train': 1.5120227336883545} -11/07/2021 04:32:27 - INFO - __main__ - Step 51924: {'lr': 0.0003722803033626883, 'samples': 9969408, 'steps': 51923, 'loss/train': 1.466483235359192} -11/07/2021 04:32:28 - INFO - __main__ - Step 51925: {'lr': 0.0003722756747087617, 'samples': 9969600, 'steps': 51924, 'loss/train': 1.7208658456802368} -11/07/2021 04:32:29 - INFO - __main__ - Step 51926: {'lr': 0.0003722710459997395, 'samples': 9969792, 'steps': 51925, 'loss/train': 1.3644756078720093} -11/07/2021 04:32:29 - INFO - __main__ - Step 51927: {'lr': 0.00037226641723562393, 'samples': 9969984, 'steps': 51926, 'loss/train': 1.3063249588012695} -11/07/2021 04:32:29 - INFO - __main__ - Step 51928: {'lr': 0.000372261788416417, 'samples': 9970176, 'steps': 51927, 'loss/train': 1.3560901880264282} -11/07/2021 04:32:30 - INFO - __main__ - Step 51929: {'lr': 0.00037225715954212075, 'samples': 9970368, 'steps': 51928, 'loss/train': 1.6959338188171387} -11/07/2021 04:32:30 - INFO - __main__ - Step 51930: {'lr': 0.00037225253061273734, 'samples': 9970560, 'steps': 51929, 'loss/train': 1.0584107637405396} -11/07/2021 04:32:31 - INFO - __main__ - Step 51931: {'lr': 0.0003722479016282688, 'samples': 9970752, 'steps': 51930, 'loss/train': 1.3664273023605347} -11/07/2021 04:32:31 - INFO - __main__ - Step 51932: {'lr': 0.00037224327258871724, 'samples': 9970944, 'steps': 51931, 'loss/train': 1.2679414749145508} -11/07/2021 04:32:32 - INFO - __main__ - Step 51933: {'lr': 0.00037223864349408484, 'samples': 9971136, 'steps': 51932, 'loss/train': 1.3450313806533813} -11/07/2021 04:32:32 - INFO - __main__ - Step 51934: {'lr': 0.0003722340143443735, 'samples': 9971328, 'steps': 51933, 'loss/train': 1.2071459293365479} -11/07/2021 04:32:32 - INFO - __main__ - Step 51935: {'lr': 0.0003722293851395854, 'samples': 9971520, 'steps': 51934, 'loss/train': 1.6511484384536743} -11/07/2021 04:32:33 - INFO - __main__ - Step 51936: {'lr': 0.00037222475587972263, 'samples': 9971712, 'steps': 51935, 'loss/train': 1.1503103971481323} -11/07/2021 04:32:34 - INFO - __main__ - Step 51937: {'lr': 0.00037222012656478733, 'samples': 9971904, 'steps': 51936, 'loss/train': 1.4829190969467163} -11/07/2021 04:32:34 - INFO - __main__ - Step 51938: {'lr': 0.00037221549719478145, 'samples': 9972096, 'steps': 51937, 'loss/train': 1.1945439577102661} -11/07/2021 04:32:34 - INFO - __main__ - Step 51939: {'lr': 0.0003722108677697072, 'samples': 9972288, 'steps': 51938, 'loss/train': 1.6184502840042114} -11/07/2021 04:32:35 - INFO - __main__ - Step 51940: {'lr': 0.00037220623828956655, 'samples': 9972480, 'steps': 51939, 'loss/train': 1.6197539567947388} -11/07/2021 04:32:36 - INFO - __main__ - Step 51941: {'lr': 0.00037220160875436176, 'samples': 9972672, 'steps': 51940, 'loss/train': 1.4190608263015747} -11/07/2021 04:32:37 - INFO - __main__ - Step 51942: {'lr': 0.0003721969791640948, 'samples': 9972864, 'steps': 51941, 'loss/train': 1.4613615274429321} -11/07/2021 04:32:37 - INFO - __main__ - Step 51943: {'lr': 0.0003721923495187677, 'samples': 9973056, 'steps': 51942, 'loss/train': 1.7495886087417603} -11/07/2021 04:32:38 - INFO - __main__ - Step 51944: {'lr': 0.00037218771981838264, 'samples': 9973248, 'steps': 51943, 'loss/train': 1.5991290807724} -11/07/2021 04:32:38 - INFO - __main__ - Step 51945: {'lr': 0.0003721830900629416, 'samples': 9973440, 'steps': 51944, 'loss/train': 1.4240131378173828} -11/07/2021 04:32:38 - INFO - __main__ - Step 51946: {'lr': 0.00037217846025244686, 'samples': 9973632, 'steps': 51945, 'loss/train': 1.5212458372116089} -11/07/2021 04:32:39 - INFO - __main__ - Step 51947: {'lr': 0.0003721738303869004, 'samples': 9973824, 'steps': 51946, 'loss/train': 4.068519592285156} -11/07/2021 04:32:40 - INFO - __main__ - Step 51948: {'lr': 0.0003721692004663042, 'samples': 9974016, 'steps': 51947, 'loss/train': 4.253776550292969} -11/07/2021 04:32:40 - INFO - __main__ - Step 51949: {'lr': 0.0003721645704906605, 'samples': 9974208, 'steps': 51948, 'loss/train': 1.685030221939087} -11/07/2021 04:32:40 - INFO - __main__ - Step 51950: {'lr': 0.0003721599404599713, 'samples': 9974400, 'steps': 51949, 'loss/train': 0.7306886911392212} -11/07/2021 04:32:41 - INFO - __main__ - Step 51951: {'lr': 0.0003721553103742388, 'samples': 9974592, 'steps': 51950, 'loss/train': 1.0275191068649292} -11/07/2021 04:32:41 - INFO - __main__ - Step 51952: {'lr': 0.00037215068023346495, 'samples': 9974784, 'steps': 51951, 'loss/train': 1.06412935256958} -11/07/2021 04:32:43 - INFO - __main__ - Step 51953: {'lr': 0.0003721460500376518, 'samples': 9974976, 'steps': 51952, 'loss/train': 1.450171709060669} -11/07/2021 04:32:43 - INFO - __main__ - Step 51954: {'lr': 0.00037214141978680166, 'samples': 9975168, 'steps': 51953, 'loss/train': 2.867142915725708} -11/07/2021 04:32:44 - INFO - __main__ - Step 51955: {'lr': 0.00037213678948091637, 'samples': 9975360, 'steps': 51954, 'loss/train': 2.8771166801452637} -11/07/2021 04:32:44 - INFO - __main__ - Step 51956: {'lr': 0.0003721321591199982, 'samples': 9975552, 'steps': 51955, 'loss/train': 2.8488717079162598} -11/07/2021 04:32:44 - INFO - __main__ - Step 51957: {'lr': 0.00037212752870404917, 'samples': 9975744, 'steps': 51956, 'loss/train': 1.3689314126968384} -11/07/2021 04:32:45 - INFO - __main__ - Step 51958: {'lr': 0.0003721228982330713, 'samples': 9975936, 'steps': 51957, 'loss/train': 1.8371143341064453} -11/07/2021 04:32:45 - INFO - __main__ - Step 51959: {'lr': 0.0003721182677070668, 'samples': 9976128, 'steps': 51958, 'loss/train': 0.7011808753013611} -11/07/2021 04:32:46 - INFO - __main__ - Step 51960: {'lr': 0.00037211363712603767, 'samples': 9976320, 'steps': 51959, 'loss/train': 1.4102351665496826} -11/07/2021 04:32:47 - INFO - __main__ - Step 51961: {'lr': 0.00037210900648998604, 'samples': 9976512, 'steps': 51960, 'loss/train': 1.3600716590881348} -11/07/2021 04:32:47 - INFO - __main__ - Step 51962: {'lr': 0.0003721043757989139, 'samples': 9976704, 'steps': 51961, 'loss/train': 1.119926929473877} -11/07/2021 04:32:47 - INFO - __main__ - Step 51963: {'lr': 0.0003720997450528235, 'samples': 9976896, 'steps': 51962, 'loss/train': 1.2507145404815674} -11/07/2021 04:32:48 - INFO - __main__ - Step 51964: {'lr': 0.0003720951142517168, 'samples': 9977088, 'steps': 51963, 'loss/train': 1.713240623474121} -11/07/2021 04:32:48 - INFO - __main__ - Step 51965: {'lr': 0.0003720904833955959, 'samples': 9977280, 'steps': 51964, 'loss/train': 2.1338562965393066} -11/07/2021 04:32:49 - INFO - __main__ - Step 51966: {'lr': 0.000372085852484463, 'samples': 9977472, 'steps': 51965, 'loss/train': 2.168433904647827} -11/07/2021 04:32:50 - INFO - __main__ - Step 51967: {'lr': 0.00037208122151832004, 'samples': 9977664, 'steps': 51966, 'loss/train': 1.1912193298339844} -11/07/2021 04:32:50 - INFO - __main__ - Step 51968: {'lr': 0.0003720765904971691, 'samples': 9977856, 'steps': 51967, 'loss/train': 2.077446699142456} -11/07/2021 04:32:50 - INFO - __main__ - Step 51969: {'lr': 0.0003720719594210124, 'samples': 9978048, 'steps': 51968, 'loss/train': 1.4788835048675537} -11/07/2021 04:32:51 - INFO - __main__ - Step 51970: {'lr': 0.00037206732828985197, 'samples': 9978240, 'steps': 51969, 'loss/train': 0.874961793422699} -11/07/2021 04:32:52 - INFO - __main__ - Step 51971: {'lr': 0.00037206269710368987, 'samples': 9978432, 'steps': 51970, 'loss/train': 1.4377036094665527} -11/07/2021 04:32:52 - INFO - __main__ - Step 51972: {'lr': 0.0003720580658625282, 'samples': 9978624, 'steps': 51971, 'loss/train': 1.9104055166244507} -11/07/2021 04:32:52 - INFO - __main__ - Step 51973: {'lr': 0.00037205343456636907, 'samples': 9978816, 'steps': 51972, 'loss/train': 1.0862919092178345} -11/07/2021 04:32:53 - INFO - __main__ - Step 51974: {'lr': 0.0003720488032152145, 'samples': 9979008, 'steps': 51973, 'loss/train': 1.4456400871276855} -11/07/2021 04:32:53 - INFO - __main__ - Step 51975: {'lr': 0.0003720441718090667, 'samples': 9979200, 'steps': 51974, 'loss/train': 1.407605528831482} -11/07/2021 04:32:55 - INFO - __main__ - Step 51976: {'lr': 0.0003720395403479276, 'samples': 9979392, 'steps': 51975, 'loss/train': 1.2332403659820557} -11/07/2021 04:32:56 - INFO - __main__ - Step 51977: {'lr': 0.00037203490883179935, 'samples': 9979584, 'steps': 51976, 'loss/train': 1.1306183338165283} -11/07/2021 04:32:56 - INFO - __main__ - Step 51978: {'lr': 0.0003720302772606841, 'samples': 9979776, 'steps': 51977, 'loss/train': 1.499109148979187} -11/07/2021 04:32:56 - INFO - __main__ - Step 51979: {'lr': 0.00037202564563458394, 'samples': 9979968, 'steps': 51978, 'loss/train': 1.4061548709869385} -11/07/2021 04:32:57 - INFO - __main__ - Step 51980: {'lr': 0.00037202101395350084, 'samples': 9980160, 'steps': 51979, 'loss/train': 1.3858675956726074} -11/07/2021 04:32:57 - INFO - __main__ - Step 51981: {'lr': 0.0003720163822174369, 'samples': 9980352, 'steps': 51980, 'loss/train': 1.4802196025848389} -11/07/2021 04:32:57 - INFO - __main__ - Step 51982: {'lr': 0.0003720117504263944, 'samples': 9980544, 'steps': 51981, 'loss/train': 1.8351459503173828} -11/07/2021 04:32:58 - INFO - __main__ - Step 51983: {'lr': 0.0003720071185803752, 'samples': 9980736, 'steps': 51982, 'loss/train': 1.2026005983352661} -11/07/2021 04:32:59 - INFO - __main__ - Step 51984: {'lr': 0.00037200248667938155, 'samples': 9980928, 'steps': 51983, 'loss/train': 1.4524941444396973} -11/07/2021 04:32:59 - INFO - __main__ - Step 51985: {'lr': 0.00037199785472341536, 'samples': 9981120, 'steps': 51984, 'loss/train': 1.9673750400543213} -11/07/2021 04:32:59 - INFO - __main__ - Step 51986: {'lr': 0.00037199322271247887, 'samples': 9981312, 'steps': 51985, 'loss/train': 1.7801264524459839} -11/07/2021 04:33:00 - INFO - __main__ - Step 51987: {'lr': 0.00037198859064657415, 'samples': 9981504, 'steps': 51986, 'loss/train': 0.8017715215682983} -11/07/2021 04:33:00 - INFO - __main__ - Step 51988: {'lr': 0.0003719839585257032, 'samples': 9981696, 'steps': 51987, 'loss/train': 1.621757984161377} -11/07/2021 04:33:01 - INFO - __main__ - Step 51989: {'lr': 0.0003719793263498681, 'samples': 9981888, 'steps': 51988, 'loss/train': 1.4853129386901855} -11/07/2021 04:33:02 - INFO - __main__ - Step 51990: {'lr': 0.00037197469411907115, 'samples': 9982080, 'steps': 51989, 'loss/train': 1.7996766567230225} -11/07/2021 04:33:02 - INFO - __main__ - Step 51991: {'lr': 0.0003719700618333142, 'samples': 9982272, 'steps': 51990, 'loss/train': 1.4016635417938232} -11/07/2021 04:33:02 - INFO - __main__ - Step 51992: {'lr': 0.0003719654294925994, 'samples': 9982464, 'steps': 51991, 'loss/train': 1.3064631223678589} -11/07/2021 04:33:03 - INFO - __main__ - Step 51993: {'lr': 0.00037196079709692894, 'samples': 9982656, 'steps': 51992, 'loss/train': 1.7431122064590454} -11/07/2021 04:33:04 - INFO - __main__ - Step 51994: {'lr': 0.0003719561646463048, 'samples': 9982848, 'steps': 51993, 'loss/train': 1.6113237142562866} -11/07/2021 04:33:04 - INFO - __main__ - Step 51995: {'lr': 0.00037195153214072903, 'samples': 9983040, 'steps': 51994, 'loss/train': 1.4810059070587158} -11/07/2021 04:33:04 - INFO - __main__ - Step 51996: {'lr': 0.0003719468995802038, 'samples': 9983232, 'steps': 51995, 'loss/train': 1.485140085220337} -11/07/2021 04:33:05 - INFO - __main__ - Step 51997: {'lr': 0.0003719422669647312, 'samples': 9983424, 'steps': 51996, 'loss/train': 1.5733298063278198} -11/07/2021 04:33:05 - INFO - __main__ - Step 51998: {'lr': 0.0003719376342943133, 'samples': 9983616, 'steps': 51997, 'loss/train': 1.1706762313842773} -11/07/2021 04:33:06 - INFO - __main__ - Step 51999: {'lr': 0.00037193300156895223, 'samples': 9983808, 'steps': 51998, 'loss/train': 1.4785041809082031} -11/07/2021 04:33:06 - INFO - __main__ - Step 52000: {'lr': 0.00037192836878864995, 'samples': 9984000, 'steps': 51999, 'loss/train': 1.6460516452789307} -11/07/2021 04:33:07 - INFO - __main__ - Step 52001: {'lr': 0.00037192373595340864, 'samples': 9984192, 'steps': 52000, 'loss/train': 1.6769099235534668} -11/07/2021 04:33:07 - INFO - __main__ - Step 52002: {'lr': 0.0003719191030632304, 'samples': 9984384, 'steps': 52001, 'loss/train': 1.7142972946166992} -11/07/2021 04:33:07 - INFO - __main__ - Step 52003: {'lr': 0.0003719144701181173, 'samples': 9984576, 'steps': 52002, 'loss/train': 1.564306616783142} -11/07/2021 04:33:08 - INFO - __main__ - Step 52004: {'lr': 0.0003719098371180714, 'samples': 9984768, 'steps': 52003, 'loss/train': 1.6705996990203857} -11/07/2021 04:33:09 - INFO - __main__ - Step 52005: {'lr': 0.00037190520406309483, 'samples': 9984960, 'steps': 52004, 'loss/train': 1.523310899734497} -11/07/2021 04:33:09 - INFO - __main__ - Step 52006: {'lr': 0.00037190057095318966, 'samples': 9985152, 'steps': 52005, 'loss/train': 1.764891505241394} -11/07/2021 04:33:10 - INFO - __main__ - Step 52007: {'lr': 0.00037189593778835794, 'samples': 9985344, 'steps': 52006, 'loss/train': 0.8343120217323303} -11/07/2021 04:33:10 - INFO - __main__ - Step 52008: {'lr': 0.0003718913045686018, 'samples': 9985536, 'steps': 52007, 'loss/train': 0.5164644122123718} -11/07/2021 04:33:10 - INFO - __main__ - Step 52009: {'lr': 0.0003718866712939233, 'samples': 9985728, 'steps': 52008, 'loss/train': 1.4166632890701294} -11/07/2021 04:33:11 - INFO - __main__ - Step 52010: {'lr': 0.00037188203796432464, 'samples': 9985920, 'steps': 52009, 'loss/train': 0.5160446166992188} -11/07/2021 04:33:12 - INFO - __main__ - Step 52011: {'lr': 0.00037187740457980776, 'samples': 9986112, 'steps': 52010, 'loss/train': 1.352651596069336} -11/07/2021 04:33:12 - INFO - __main__ - Step 52012: {'lr': 0.0003718727711403748, 'samples': 9986304, 'steps': 52011, 'loss/train': 1.4476298093795776} -11/07/2021 04:33:12 - INFO - __main__ - Step 52013: {'lr': 0.00037186813764602785, 'samples': 9986496, 'steps': 52012, 'loss/train': 0.8069983720779419} -11/07/2021 04:33:13 - INFO - __main__ - Step 52014: {'lr': 0.00037186350409676894, 'samples': 9986688, 'steps': 52013, 'loss/train': 1.9650357961654663} -11/07/2021 04:33:14 - INFO - __main__ - Step 52015: {'lr': 0.00037185887049260023, 'samples': 9986880, 'steps': 52014, 'loss/train': 1.585021734237671} -11/07/2021 04:33:14 - INFO - __main__ - Step 52016: {'lr': 0.0003718542368335239, 'samples': 9987072, 'steps': 52015, 'loss/train': 1.3363664150238037} -11/07/2021 04:33:14 - INFO - __main__ - Step 52017: {'lr': 0.0003718496031195419, 'samples': 9987264, 'steps': 52016, 'loss/train': 1.2658580541610718} -11/07/2021 04:33:15 - INFO - __main__ - Step 52018: {'lr': 0.00037184496935065625, 'samples': 9987456, 'steps': 52017, 'loss/train': 1.2854598760604858} -11/07/2021 04:33:15 - INFO - __main__ - Step 52019: {'lr': 0.0003718403355268692, 'samples': 9987648, 'steps': 52018, 'loss/train': 1.6694667339324951} -11/07/2021 04:33:16 - INFO - __main__ - Step 52020: {'lr': 0.0003718357016481828, 'samples': 9987840, 'steps': 52019, 'loss/train': 1.105134129524231} -11/07/2021 04:33:16 - INFO - __main__ - Step 52021: {'lr': 0.00037183106771459905, 'samples': 9988032, 'steps': 52020, 'loss/train': 1.6343470811843872} -11/07/2021 04:33:17 - INFO - __main__ - Step 52022: {'lr': 0.00037182643372612014, 'samples': 9988224, 'steps': 52021, 'loss/train': 1.064949631690979} -11/07/2021 04:33:17 - INFO - __main__ - Step 52023: {'lr': 0.00037182179968274807, 'samples': 9988416, 'steps': 52022, 'loss/train': 1.6126441955566406} -11/07/2021 04:33:18 - INFO - __main__ - Step 52024: {'lr': 0.00037181716558448507, 'samples': 9988608, 'steps': 52023, 'loss/train': 1.5883631706237793} -11/07/2021 04:33:19 - INFO - __main__ - Step 52025: {'lr': 0.0003718125314313331, 'samples': 9988800, 'steps': 52024, 'loss/train': 1.135672688484192} -11/07/2021 04:33:19 - INFO - __main__ - Step 52026: {'lr': 0.0003718078972232943, 'samples': 9988992, 'steps': 52025, 'loss/train': 1.3619341850280762} -11/07/2021 04:33:19 - INFO - __main__ - Step 52027: {'lr': 0.0003718032629603707, 'samples': 9989184, 'steps': 52026, 'loss/train': 1.456044316291809} -11/07/2021 04:33:20 - INFO - __main__ - Step 52028: {'lr': 0.00037179862864256444, 'samples': 9989376, 'steps': 52027, 'loss/train': 1.5300452709197998} -11/07/2021 04:33:20 - INFO - __main__ - Step 52029: {'lr': 0.00037179399426987757, 'samples': 9989568, 'steps': 52028, 'loss/train': 1.679802656173706} -11/07/2021 04:33:21 - INFO - __main__ - Step 52030: {'lr': 0.0003717893598423122, 'samples': 9989760, 'steps': 52029, 'loss/train': 1.2130610942840576} -11/07/2021 04:33:21 - INFO - __main__ - Step 52031: {'lr': 0.0003717847253598705, 'samples': 9989952, 'steps': 52030, 'loss/train': 1.6011747121810913} -11/07/2021 04:33:22 - INFO - __main__ - Step 52032: {'lr': 0.0003717800908225544, 'samples': 9990144, 'steps': 52031, 'loss/train': 0.8002707958221436} -11/07/2021 04:33:22 - INFO - __main__ - Step 52033: {'lr': 0.0003717754562303661, 'samples': 9990336, 'steps': 52032, 'loss/train': 1.558195948600769} -11/07/2021 04:33:22 - INFO - __main__ - Step 52034: {'lr': 0.00037177082158330773, 'samples': 9990528, 'steps': 52033, 'loss/train': 1.7184574604034424} -11/07/2021 04:33:23 - INFO - __main__ - Step 52035: {'lr': 0.0003717661868813812, 'samples': 9990720, 'steps': 52034, 'loss/train': 1.2530268430709839} -11/07/2021 04:33:24 - INFO - __main__ - Step 52036: {'lr': 0.00037176155212458875, 'samples': 9990912, 'steps': 52035, 'loss/train': 1.1753389835357666} -11/07/2021 04:33:24 - INFO - __main__ - Step 52037: {'lr': 0.0003717569173129324, 'samples': 9991104, 'steps': 52036, 'loss/train': 1.2855608463287354} -11/07/2021 04:33:25 - INFO - __main__ - Step 52038: {'lr': 0.0003717522824464143, 'samples': 9991296, 'steps': 52037, 'loss/train': 1.7887563705444336} -11/07/2021 04:33:25 - INFO - __main__ - Step 52039: {'lr': 0.0003717476475250365, 'samples': 9991488, 'steps': 52038, 'loss/train': 1.3528296947479248} -11/07/2021 04:33:25 - INFO - __main__ - Step 52040: {'lr': 0.0003717430125488011, 'samples': 9991680, 'steps': 52039, 'loss/train': 1.8824183940887451} -11/07/2021 04:33:26 - INFO - __main__ - Step 52041: {'lr': 0.0003717383775177101, 'samples': 9991872, 'steps': 52040, 'loss/train': 1.8882192373275757} -11/07/2021 04:33:27 - INFO - __main__ - Step 52042: {'lr': 0.0003717337424317657, 'samples': 9992064, 'steps': 52041, 'loss/train': 1.4328219890594482} -11/07/2021 04:33:27 - INFO - __main__ - Step 52043: {'lr': 0.00037172910729097006, 'samples': 9992256, 'steps': 52042, 'loss/train': 1.5730630159378052} -11/07/2021 04:33:28 - INFO - __main__ - Step 52044: {'lr': 0.000371724472095325, 'samples': 9992448, 'steps': 52043, 'loss/train': 1.2859323024749756} -11/07/2021 04:33:28 - INFO - __main__ - Step 52045: {'lr': 0.00037171983684483286, 'samples': 9992640, 'steps': 52044, 'loss/train': 1.8064703941345215} -11/07/2021 04:33:29 - INFO - __main__ - Step 52046: {'lr': 0.00037171520153949565, 'samples': 9992832, 'steps': 52045, 'loss/train': 1.1901495456695557} -11/07/2021 04:33:29 - INFO - __main__ - Step 52047: {'lr': 0.00037171056617931543, 'samples': 9993024, 'steps': 52046, 'loss/train': 1.4095689058303833} -11/07/2021 04:33:30 - INFO - __main__ - Step 52048: {'lr': 0.00037170593076429426, 'samples': 9993216, 'steps': 52047, 'loss/train': 1.3955882787704468} -11/07/2021 04:33:30 - INFO - __main__ - Step 52049: {'lr': 0.00037170129529443436, 'samples': 9993408, 'steps': 52048, 'loss/train': 1.4494365453720093} -11/07/2021 04:33:30 - INFO - __main__ - Step 52050: {'lr': 0.0003716966597697377, 'samples': 9993600, 'steps': 52049, 'loss/train': 1.5685220956802368} -11/07/2021 04:33:31 - INFO - __main__ - Step 52051: {'lr': 0.0003716920241902064, 'samples': 9993792, 'steps': 52050, 'loss/train': 1.1115155220031738} -11/07/2021 04:33:32 - INFO - __main__ - Step 52052: {'lr': 0.0003716873885558425, 'samples': 9993984, 'steps': 52051, 'loss/train': 1.441890835762024} -11/07/2021 04:33:32 - INFO - __main__ - Step 52053: {'lr': 0.0003716827528666482, 'samples': 9994176, 'steps': 52052, 'loss/train': 1.656650424003601} -11/07/2021 04:33:32 - INFO - __main__ - Step 52054: {'lr': 0.0003716781171226255, 'samples': 9994368, 'steps': 52053, 'loss/train': 1.5867408514022827} -11/07/2021 04:33:33 - INFO - __main__ - Step 52055: {'lr': 0.00037167348132377656, 'samples': 9994560, 'steps': 52054, 'loss/train': 1.499980092048645} -11/07/2021 04:33:34 - INFO - __main__ - Step 52056: {'lr': 0.0003716688454701034, 'samples': 9994752, 'steps': 52055, 'loss/train': 1.607343316078186} -11/07/2021 04:33:34 - INFO - __main__ - Step 52057: {'lr': 0.00037166420956160815, 'samples': 9994944, 'steps': 52056, 'loss/train': 0.8065264821052551} -11/07/2021 04:33:34 - INFO - __main__ - Step 52058: {'lr': 0.0003716595735982928, 'samples': 9995136, 'steps': 52057, 'loss/train': 1.3024451732635498} -11/07/2021 04:33:35 - INFO - __main__ - Step 52059: {'lr': 0.0003716549375801597, 'samples': 9995328, 'steps': 52058, 'loss/train': 2.1499733924865723} -11/07/2021 04:33:35 - INFO - __main__ - Step 52060: {'lr': 0.0003716503015072106, 'samples': 9995520, 'steps': 52059, 'loss/train': 1.2450579404830933} -11/07/2021 04:33:36 - INFO - __main__ - Step 52061: {'lr': 0.00037164566537944776, 'samples': 9995712, 'steps': 52060, 'loss/train': 2.1072373390197754} -11/07/2021 04:33:37 - INFO - __main__ - Step 52062: {'lr': 0.00037164102919687335, 'samples': 9995904, 'steps': 52061, 'loss/train': 1.5504851341247559} -11/07/2021 04:33:37 - INFO - __main__ - Step 52063: {'lr': 0.00037163639295948933, 'samples': 9996096, 'steps': 52062, 'loss/train': 1.3318660259246826} -11/07/2021 04:33:37 - INFO - __main__ - Step 52064: {'lr': 0.0003716317566672978, 'samples': 9996288, 'steps': 52063, 'loss/train': 1.722896933555603} -11/07/2021 04:33:38 - INFO - __main__ - Step 52065: {'lr': 0.00037162712032030095, 'samples': 9996480, 'steps': 52064, 'loss/train': 1.8784534931182861} -11/07/2021 04:33:38 - INFO - __main__ - Step 52066: {'lr': 0.00037162248391850076, 'samples': 9996672, 'steps': 52065, 'loss/train': 1.5277537107467651} -11/07/2021 04:33:39 - INFO - __main__ - Step 52067: {'lr': 0.0003716178474618993, 'samples': 9996864, 'steps': 52066, 'loss/train': 1.6308097839355469} -11/07/2021 04:33:39 - INFO - __main__ - Step 52068: {'lr': 0.0003716132109504988, 'samples': 9997056, 'steps': 52067, 'loss/train': 1.5583269596099854} -11/07/2021 04:33:40 - INFO - __main__ - Step 52069: {'lr': 0.0003716085743843012, 'samples': 9997248, 'steps': 52068, 'loss/train': 0.9065039157867432} -11/07/2021 04:33:40 - INFO - __main__ - Step 52070: {'lr': 0.0003716039377633087, 'samples': 9997440, 'steps': 52069, 'loss/train': 1.153981328010559} -11/07/2021 04:33:41 - INFO - __main__ - Step 52071: {'lr': 0.00037159930108752326, 'samples': 9997632, 'steps': 52070, 'loss/train': 1.4276835918426514} -11/07/2021 04:33:42 - INFO - __main__ - Step 52072: {'lr': 0.0003715946643569471, 'samples': 9997824, 'steps': 52071, 'loss/train': 1.7018718719482422} -11/07/2021 04:33:42 - INFO - __main__ - Step 52073: {'lr': 0.0003715900275715823, 'samples': 9998016, 'steps': 52072, 'loss/train': 1.0280437469482422} -11/07/2021 04:33:42 - INFO - __main__ - Step 52074: {'lr': 0.0003715853907314309, 'samples': 9998208, 'steps': 52073, 'loss/train': 0.7347991466522217} -11/07/2021 04:33:43 - INFO - __main__ - Step 52075: {'lr': 0.0003715807538364949, 'samples': 9998400, 'steps': 52074, 'loss/train': 1.3218401670455933} -11/07/2021 04:33:43 - INFO - __main__ - Step 52076: {'lr': 0.00037157611688677666, 'samples': 9998592, 'steps': 52075, 'loss/train': 1.8234870433807373} -11/07/2021 04:33:44 - INFO - __main__ - Step 52077: {'lr': 0.000371571479882278, 'samples': 9998784, 'steps': 52076, 'loss/train': 0.9849280118942261} -11/07/2021 04:33:44 - INFO - __main__ - Step 52078: {'lr': 0.00037156684282300105, 'samples': 9998976, 'steps': 52077, 'loss/train': 1.448745846748352} -11/07/2021 04:33:45 - INFO - __main__ - Step 52079: {'lr': 0.00037156220570894806, 'samples': 9999168, 'steps': 52078, 'loss/train': 1.3544305562973022} -11/07/2021 04:33:45 - INFO - __main__ - Step 52080: {'lr': 0.00037155756854012097, 'samples': 9999360, 'steps': 52079, 'loss/train': 1.0842026472091675} -11/07/2021 04:33:46 - INFO - __main__ - Step 52081: {'lr': 0.000371552931316522, 'samples': 9999552, 'steps': 52080, 'loss/train': 0.9628018736839294} -11/07/2021 04:33:47 - INFO - __main__ - Step 52082: {'lr': 0.00037154829403815307, 'samples': 9999744, 'steps': 52081, 'loss/train': 1.5966683626174927} -11/07/2021 04:33:47 - INFO - __main__ - Step 52083: {'lr': 0.0003715436567050163, 'samples': 9999936, 'steps': 52082, 'loss/train': 1.1053435802459717} -11/07/2021 04:33:47 - INFO - __main__ - Step 52084: {'lr': 0.0003715390193171139, 'samples': 10000128, 'steps': 52083, 'loss/train': 2.0694639682769775} -11/07/2021 04:33:48 - INFO - __main__ - Step 52085: {'lr': 0.0003715343818744479, 'samples': 10000320, 'steps': 52084, 'loss/train': 1.1751145124435425} -11/07/2021 04:33:48 - INFO - __main__ - Step 52086: {'lr': 0.0003715297443770203, 'samples': 10000512, 'steps': 52085, 'loss/train': 1.136919379234314} -11/07/2021 04:33:49 - INFO - __main__ - Step 52087: {'lr': 0.0003715251068248334, 'samples': 10000704, 'steps': 52086, 'loss/train': 1.6594806909561157} -11/07/2021 04:33:50 - INFO - __main__ - Step 52088: {'lr': 0.00037152046921788906, 'samples': 10000896, 'steps': 52087, 'loss/train': 0.5346752405166626} -11/07/2021 04:33:50 - INFO - __main__ - Step 52089: {'lr': 0.00037151583155618957, 'samples': 10001088, 'steps': 52088, 'loss/train': 1.593422770500183} -11/07/2021 04:33:50 - INFO - __main__ - Step 52090: {'lr': 0.00037151119383973684, 'samples': 10001280, 'steps': 52089, 'loss/train': 1.4512618780136108} -11/07/2021 04:33:51 - INFO - __main__ - Step 52091: {'lr': 0.0003715065560685331, 'samples': 10001472, 'steps': 52090, 'loss/train': 5.8047614097595215} -11/07/2021 04:33:51 - INFO - __main__ - Step 52092: {'lr': 0.00037150191824258027, 'samples': 10001664, 'steps': 52091, 'loss/train': 1.467519998550415} -11/07/2021 04:33:52 - INFO - __main__ - Step 52093: {'lr': 0.00037149728036188067, 'samples': 10001856, 'steps': 52092, 'loss/train': 1.4725695848464966} -11/07/2021 04:33:52 - INFO - __main__ - Step 52094: {'lr': 0.0003714926424264363, 'samples': 10002048, 'steps': 52093, 'loss/train': 1.010266661643982} -11/07/2021 04:33:53 - INFO - __main__ - Step 52095: {'lr': 0.00037148800443624906, 'samples': 10002240, 'steps': 52094, 'loss/train': 1.4820456504821777} -11/07/2021 04:33:53 - INFO - __main__ - Step 52096: {'lr': 0.0003714833663913213, 'samples': 10002432, 'steps': 52095, 'loss/train': 1.5023173093795776} -11/07/2021 04:33:53 - INFO - __main__ - Step 52097: {'lr': 0.00037147872829165497, 'samples': 10002624, 'steps': 52096, 'loss/train': 1.4011294841766357} -11/07/2021 04:33:54 - INFO - __main__ - Step 52098: {'lr': 0.00037147409013725226, 'samples': 10002816, 'steps': 52097, 'loss/train': 1.8304104804992676} -11/07/2021 04:33:55 - INFO - __main__ - Step 52099: {'lr': 0.00037146945192811513, 'samples': 10003008, 'steps': 52098, 'loss/train': 1.5196019411087036} -11/07/2021 04:33:55 - INFO - __main__ - Step 52100: {'lr': 0.00037146481366424585, 'samples': 10003200, 'steps': 52099, 'loss/train': 1.5309158563613892} -11/07/2021 04:33:56 - INFO - __main__ - Step 52101: {'lr': 0.0003714601753456463, 'samples': 10003392, 'steps': 52100, 'loss/train': 1.7246387004852295} -11/07/2021 04:33:56 - INFO - __main__ - Step 52102: {'lr': 0.0003714555369723187, 'samples': 10003584, 'steps': 52101, 'loss/train': 1.4665919542312622} -11/07/2021 04:33:56 - INFO - __main__ - Step 52103: {'lr': 0.00037145089854426504, 'samples': 10003776, 'steps': 52102, 'loss/train': 1.6272002458572388} -11/07/2021 04:33:57 - INFO - __main__ - Step 52104: {'lr': 0.0003714462600614876, 'samples': 10003968, 'steps': 52103, 'loss/train': 1.3589495420455933} -11/07/2021 04:33:58 - INFO - __main__ - Step 52105: {'lr': 0.0003714416215239883, 'samples': 10004160, 'steps': 52104, 'loss/train': 1.5083616971969604} -11/07/2021 04:33:58 - INFO - __main__ - Step 52106: {'lr': 0.00037143698293176923, 'samples': 10004352, 'steps': 52105, 'loss/train': 1.0739424228668213} -11/07/2021 04:33:58 - INFO - __main__ - Step 52107: {'lr': 0.0003714323442848326, 'samples': 10004544, 'steps': 52106, 'loss/train': 1.4502241611480713} -11/07/2021 04:33:59 - INFO - __main__ - Step 52108: {'lr': 0.0003714277055831804, 'samples': 10004736, 'steps': 52107, 'loss/train': 1.6501597166061401} -11/07/2021 04:34:00 - INFO - __main__ - Step 52109: {'lr': 0.00037142306682681476, 'samples': 10004928, 'steps': 52108, 'loss/train': 1.2590582370758057} -11/07/2021 04:34:00 - INFO - __main__ - Step 52110: {'lr': 0.00037141842801573775, 'samples': 10005120, 'steps': 52109, 'loss/train': 1.1598715782165527} -11/07/2021 04:34:00 - INFO - __main__ - Step 52111: {'lr': 0.00037141378914995146, 'samples': 10005312, 'steps': 52110, 'loss/train': 1.8247171640396118} -11/07/2021 04:34:01 - INFO - __main__ - Step 52112: {'lr': 0.000371409150229458, 'samples': 10005504, 'steps': 52111, 'loss/train': 1.4721322059631348} -11/07/2021 04:34:01 - INFO - __main__ - Step 52113: {'lr': 0.00037140451125425945, 'samples': 10005696, 'steps': 52112, 'loss/train': 1.5720247030258179} -11/07/2021 04:34:02 - INFO - __main__ - Step 52114: {'lr': 0.0003713998722243579, 'samples': 10005888, 'steps': 52113, 'loss/train': 1.7562553882598877} -11/07/2021 04:34:02 - INFO - __main__ - Step 52115: {'lr': 0.00037139523313975544, 'samples': 10006080, 'steps': 52114, 'loss/train': 1.492295742034912} -11/07/2021 04:34:03 - INFO - __main__ - Step 52116: {'lr': 0.00037139059400045416, 'samples': 10006272, 'steps': 52115, 'loss/train': 1.6417118310928345} -11/07/2021 04:34:03 - INFO - __main__ - Step 52117: {'lr': 0.00037138595480645613, 'samples': 10006464, 'steps': 52116, 'loss/train': 1.6110855340957642} -11/07/2021 04:34:03 - INFO - __main__ - Step 52118: {'lr': 0.0003713813155577635, 'samples': 10006656, 'steps': 52117, 'loss/train': 1.171640396118164} -11/07/2021 04:34:05 - INFO - __main__ - Step 52119: {'lr': 0.0003713766762543783, 'samples': 10006848, 'steps': 52118, 'loss/train': 1.4638890027999878} -11/07/2021 04:34:05 - INFO - __main__ - Step 52120: {'lr': 0.0003713720368963027, 'samples': 10007040, 'steps': 52119, 'loss/train': 1.145456075668335} -11/07/2021 04:34:05 - INFO - __main__ - Step 52121: {'lr': 0.0003713673974835387, 'samples': 10007232, 'steps': 52120, 'loss/train': 1.0905083417892456} -11/07/2021 04:34:06 - INFO - __main__ - Step 52122: {'lr': 0.0003713627580160884, 'samples': 10007424, 'steps': 52121, 'loss/train': 1.7812553644180298} -11/07/2021 04:34:06 - INFO - __main__ - Step 52123: {'lr': 0.0003713581184939539, 'samples': 10007616, 'steps': 52122, 'loss/train': 1.7905954122543335} -11/07/2021 04:34:07 - INFO - __main__ - Step 52124: {'lr': 0.00037135347891713733, 'samples': 10007808, 'steps': 52123, 'loss/train': 0.9739303588867188} -11/07/2021 04:34:07 - INFO - __main__ - Step 52125: {'lr': 0.00037134883928564074, 'samples': 10008000, 'steps': 52124, 'loss/train': 2.040052890777588} -11/07/2021 04:34:08 - INFO - __main__ - Step 52126: {'lr': 0.00037134419959946626, 'samples': 10008192, 'steps': 52125, 'loss/train': 1.1834639310836792} -11/07/2021 04:34:08 - INFO - __main__ - Step 52127: {'lr': 0.00037133955985861595, 'samples': 10008384, 'steps': 52126, 'loss/train': 1.6054444313049316} -11/07/2021 04:34:08 - INFO - __main__ - Step 52128: {'lr': 0.00037133492006309187, 'samples': 10008576, 'steps': 52127, 'loss/train': 0.986207127571106} -11/07/2021 04:34:09 - INFO - __main__ - Step 52129: {'lr': 0.00037133028021289625, 'samples': 10008768, 'steps': 52128, 'loss/train': 2.1998698711395264} -11/07/2021 04:34:10 - INFO - __main__ - Step 52130: {'lr': 0.000371325640308031, 'samples': 10008960, 'steps': 52129, 'loss/train': 1.144845724105835} -11/07/2021 04:34:10 - INFO - __main__ - Step 52131: {'lr': 0.0003713210003484982, 'samples': 10009152, 'steps': 52130, 'loss/train': 1.2223379611968994} -11/07/2021 04:34:10 - INFO - __main__ - Step 52132: {'lr': 0.00037131636033430017, 'samples': 10009344, 'steps': 52131, 'loss/train': 1.4668699502944946} -11/07/2021 04:34:11 - INFO - __main__ - Step 52133: {'lr': 0.0003713117202654388, 'samples': 10009536, 'steps': 52132, 'loss/train': 1.0695420503616333} -11/07/2021 04:34:12 - INFO - __main__ - Step 52134: {'lr': 0.0003713070801419163, 'samples': 10009728, 'steps': 52133, 'loss/train': 1.5132064819335938} -11/07/2021 04:34:12 - INFO - __main__ - Step 52135: {'lr': 0.00037130243996373466, 'samples': 10009920, 'steps': 52134, 'loss/train': 1.7165154218673706} -11/07/2021 04:34:13 - INFO - __main__ - Step 52136: {'lr': 0.00037129779973089596, 'samples': 10010112, 'steps': 52135, 'loss/train': 1.2871824502944946} -11/07/2021 04:34:13 - INFO - __main__ - Step 52137: {'lr': 0.0003712931594434024, 'samples': 10010304, 'steps': 52136, 'loss/train': 1.0461310148239136} -11/07/2021 04:34:13 - INFO - __main__ - Step 52138: {'lr': 0.000371288519101256, 'samples': 10010496, 'steps': 52137, 'loss/train': 1.2248376607894897} -11/07/2021 04:34:14 - INFO - __main__ - Step 52139: {'lr': 0.00037128387870445883, 'samples': 10010688, 'steps': 52138, 'loss/train': 1.1509482860565186} -11/07/2021 04:34:15 - INFO - __main__ - Step 52140: {'lr': 0.00037127923825301315, 'samples': 10010880, 'steps': 52139, 'loss/train': 1.6599177122116089} -11/07/2021 04:34:15 - INFO - __main__ - Step 52141: {'lr': 0.0003712745977469208, 'samples': 10011072, 'steps': 52140, 'loss/train': 2.065338134765625} -11/07/2021 04:34:15 - INFO - __main__ - Step 52142: {'lr': 0.000371269957186184, 'samples': 10011264, 'steps': 52141, 'loss/train': 1.4618128538131714} -11/07/2021 04:34:16 - INFO - __main__ - Step 52143: {'lr': 0.0003712653165708048, 'samples': 10011456, 'steps': 52142, 'loss/train': 0.9149712324142456} -11/07/2021 04:34:16 - INFO - __main__ - Step 52144: {'lr': 0.00037126067590078537, 'samples': 10011648, 'steps': 52143, 'loss/train': 1.1253894567489624} -11/07/2021 04:34:17 - INFO - __main__ - Step 52145: {'lr': 0.00037125603517612773, 'samples': 10011840, 'steps': 52144, 'loss/train': 2.2957513332366943} -11/07/2021 04:34:17 - INFO - __main__ - Step 52146: {'lr': 0.00037125139439683405, 'samples': 10012032, 'steps': 52145, 'loss/train': 1.360108494758606} -11/07/2021 04:34:18 - INFO - __main__ - Step 52147: {'lr': 0.00037124675356290635, 'samples': 10012224, 'steps': 52146, 'loss/train': 1.1610556840896606} -11/07/2021 04:34:18 - INFO - __main__ - Step 52148: {'lr': 0.00037124211267434667, 'samples': 10012416, 'steps': 52147, 'loss/train': 1.3958730697631836} -11/07/2021 04:34:18 - INFO - __main__ - Step 52149: {'lr': 0.0003712374717311572, 'samples': 10012608, 'steps': 52148, 'loss/train': 1.436025619506836} -11/07/2021 04:34:20 - INFO - __main__ - Step 52150: {'lr': 0.00037123283073333996, 'samples': 10012800, 'steps': 52149, 'loss/train': 0.7066998481750488} -11/07/2021 04:34:20 - INFO - __main__ - Step 52151: {'lr': 0.0003712281896808971, 'samples': 10012992, 'steps': 52150, 'loss/train': 1.125436782836914} -11/07/2021 04:34:20 - INFO - __main__ - Step 52152: {'lr': 0.0003712235485738307, 'samples': 10013184, 'steps': 52151, 'loss/train': 1.9018964767456055} -11/07/2021 04:34:21 - INFO - __main__ - Step 52153: {'lr': 0.0003712189074121428, 'samples': 10013376, 'steps': 52152, 'loss/train': 1.6347655057907104} -11/07/2021 04:34:21 - INFO - __main__ - Step 52154: {'lr': 0.0003712142661958356, 'samples': 10013568, 'steps': 52153, 'loss/train': 1.5352139472961426} -11/07/2021 04:34:22 - INFO - __main__ - Step 52155: {'lr': 0.0003712096249249111, 'samples': 10013760, 'steps': 52154, 'loss/train': 1.4936988353729248} -11/07/2021 04:34:22 - INFO - __main__ - Step 52156: {'lr': 0.00037120498359937136, 'samples': 10013952, 'steps': 52155, 'loss/train': 2.040149450302124} -11/07/2021 04:34:23 - INFO - __main__ - Step 52157: {'lr': 0.0003712003422192186, 'samples': 10014144, 'steps': 52156, 'loss/train': 1.3096764087677002} -11/07/2021 04:34:23 - INFO - __main__ - Step 52158: {'lr': 0.00037119570078445477, 'samples': 10014336, 'steps': 52157, 'loss/train': 1.6156455278396606} -11/07/2021 04:34:23 - INFO - __main__ - Step 52159: {'lr': 0.00037119105929508207, 'samples': 10014528, 'steps': 52158, 'loss/train': 1.2151671648025513} -11/07/2021 04:34:24 - INFO - __main__ - Step 52160: {'lr': 0.0003711864177511025, 'samples': 10014720, 'steps': 52159, 'loss/train': 1.809687614440918} -11/07/2021 04:34:25 - INFO - __main__ - Step 52161: {'lr': 0.0003711817761525183, 'samples': 10014912, 'steps': 52160, 'loss/train': 1.2535426616668701} -11/07/2021 04:34:25 - INFO - __main__ - Step 52162: {'lr': 0.00037117713449933136, 'samples': 10015104, 'steps': 52161, 'loss/train': 1.4790703058242798} -11/07/2021 04:34:25 - INFO - __main__ - Step 52163: {'lr': 0.0003711724927915439, 'samples': 10015296, 'steps': 52162, 'loss/train': 1.4326823949813843} -11/07/2021 04:34:26 - INFO - __main__ - Step 52164: {'lr': 0.000371167851029158, 'samples': 10015488, 'steps': 52163, 'loss/train': 1.416654109954834} -11/07/2021 04:34:26 - INFO - __main__ - Step 52165: {'lr': 0.0003711632092121757, 'samples': 10015680, 'steps': 52164, 'loss/train': 1.4773273468017578} -11/07/2021 04:34:27 - INFO - __main__ - Step 52166: {'lr': 0.00037115856734059916, 'samples': 10015872, 'steps': 52165, 'loss/train': 0.7316718101501465} -11/07/2021 04:34:27 - INFO - __main__ - Step 52167: {'lr': 0.0003711539254144305, 'samples': 10016064, 'steps': 52166, 'loss/train': 0.7960385084152222} -11/07/2021 04:34:28 - INFO - __main__ - Step 52168: {'lr': 0.0003711492834336717, 'samples': 10016256, 'steps': 52167, 'loss/train': 1.4833855628967285} -11/07/2021 04:34:28 - INFO - __main__ - Step 52169: {'lr': 0.00037114464139832487, 'samples': 10016448, 'steps': 52168, 'loss/train': 1.1186985969543457} -11/07/2021 04:34:28 - INFO - __main__ - Step 52170: {'lr': 0.00037113999930839215, 'samples': 10016640, 'steps': 52169, 'loss/train': 1.6359552145004272} -11/07/2021 04:34:29 - INFO - __main__ - Step 52171: {'lr': 0.00037113535716387565, 'samples': 10016832, 'steps': 52170, 'loss/train': 0.7417372465133667} -11/07/2021 04:34:30 - INFO - __main__ - Step 52172: {'lr': 0.00037113071496477733, 'samples': 10017024, 'steps': 52171, 'loss/train': 1.2818551063537598} -11/07/2021 04:34:30 - INFO - __main__ - Step 52173: {'lr': 0.0003711260727110995, 'samples': 10017216, 'steps': 52172, 'loss/train': 1.242611050605774} -11/07/2021 04:34:30 - INFO - __main__ - Step 52174: {'lr': 0.0003711214304028441, 'samples': 10017408, 'steps': 52173, 'loss/train': 1.686108946800232} -11/07/2021 04:34:31 - INFO - __main__ - Step 52175: {'lr': 0.00037111678804001324, 'samples': 10017600, 'steps': 52174, 'loss/train': 0.7480536103248596} -11/07/2021 04:34:32 - INFO - __main__ - Step 52176: {'lr': 0.00037111214562260896, 'samples': 10017792, 'steps': 52175, 'loss/train': 1.652687907218933} -11/07/2021 04:34:32 - INFO - __main__ - Step 52177: {'lr': 0.0003711075031506335, 'samples': 10017984, 'steps': 52176, 'loss/train': 1.6718931198120117} -11/07/2021 04:34:33 - INFO - __main__ - Step 52178: {'lr': 0.0003711028606240888, 'samples': 10018176, 'steps': 52177, 'loss/train': 1.234239101409912} -11/07/2021 04:34:33 - INFO - __main__ - Step 52179: {'lr': 0.00037109821804297706, 'samples': 10018368, 'steps': 52178, 'loss/train': 0.9123637676239014} -11/07/2021 04:34:33 - INFO - __main__ - Step 52180: {'lr': 0.00037109357540730033, 'samples': 10018560, 'steps': 52179, 'loss/train': 0.998516321182251} -11/07/2021 04:34:34 - INFO - __main__ - Step 52181: {'lr': 0.00037108893271706075, 'samples': 10018752, 'steps': 52180, 'loss/train': 1.4245970249176025} -11/07/2021 04:34:35 - INFO - __main__ - Step 52182: {'lr': 0.0003710842899722603, 'samples': 10018944, 'steps': 52181, 'loss/train': 0.6998801231384277} -11/07/2021 04:34:35 - INFO - __main__ - Step 52183: {'lr': 0.00037107964717290117, 'samples': 10019136, 'steps': 52182, 'loss/train': 1.276153326034546} -11/07/2021 04:34:35 - INFO - __main__ - Step 52184: {'lr': 0.0003710750043189854, 'samples': 10019328, 'steps': 52183, 'loss/train': 1.2006757259368896} -11/07/2021 04:34:36 - INFO - __main__ - Step 52185: {'lr': 0.0003710703614105151, 'samples': 10019520, 'steps': 52184, 'loss/train': 0.8838239908218384} -11/07/2021 04:34:37 - INFO - __main__ - Step 52186: {'lr': 0.0003710657184474924, 'samples': 10019712, 'steps': 52185, 'loss/train': 1.9587353467941284} -11/07/2021 04:34:37 - INFO - __main__ - Step 52187: {'lr': 0.00037106107542991937, 'samples': 10019904, 'steps': 52186, 'loss/train': 1.2354145050048828} -11/07/2021 04:34:37 - INFO - __main__ - Step 52188: {'lr': 0.00037105643235779803, 'samples': 10020096, 'steps': 52187, 'loss/train': 1.402997374534607} -11/07/2021 04:34:38 - INFO - __main__ - Step 52189: {'lr': 0.0003710517892311305, 'samples': 10020288, 'steps': 52188, 'loss/train': 1.4153070449829102} -11/07/2021 04:34:38 - INFO - __main__ - Step 52190: {'lr': 0.00037104714604991896, 'samples': 10020480, 'steps': 52189, 'loss/train': 1.4302728176116943} -11/07/2021 04:34:38 - INFO - __main__ - Step 52191: {'lr': 0.0003710425028141654, 'samples': 10020672, 'steps': 52190, 'loss/train': 1.6049634218215942} -11/07/2021 04:34:40 - INFO - __main__ - Step 52192: {'lr': 0.000371037859523872, 'samples': 10020864, 'steps': 52191, 'loss/train': 1.017406702041626} -11/07/2021 04:34:40 - INFO - __main__ - Step 52193: {'lr': 0.00037103321617904076, 'samples': 10021056, 'steps': 52192, 'loss/train': 1.6501271724700928} -11/07/2021 04:34:40 - INFO - __main__ - Step 52194: {'lr': 0.00037102857277967387, 'samples': 10021248, 'steps': 52193, 'loss/train': 1.695813775062561} -11/07/2021 04:34:41 - INFO - __main__ - Step 52195: {'lr': 0.0003710239293257734, 'samples': 10021440, 'steps': 52194, 'loss/train': 1.6397981643676758} -11/07/2021 04:34:41 - INFO - __main__ - Step 52196: {'lr': 0.00037101928581734136, 'samples': 10021632, 'steps': 52195, 'loss/train': 1.3900978565216064} -11/07/2021 04:34:42 - INFO - __main__ - Step 52197: {'lr': 0.00037101464225437986, 'samples': 10021824, 'steps': 52196, 'loss/train': 1.402624249458313} -11/07/2021 04:34:42 - INFO - __main__ - Step 52198: {'lr': 0.0003710099986368911, 'samples': 10022016, 'steps': 52197, 'loss/train': 1.3117009401321411} -11/07/2021 04:34:43 - INFO - __main__ - Step 52199: {'lr': 0.0003710053549648771, 'samples': 10022208, 'steps': 52198, 'loss/train': 1.4527676105499268} -11/07/2021 04:34:43 - INFO - __main__ - Step 52200: {'lr': 0.00037100071123833994, 'samples': 10022400, 'steps': 52199, 'loss/train': 1.0785988569259644} -11/07/2021 04:34:43 - INFO - __main__ - Step 52201: {'lr': 0.0003709960674572817, 'samples': 10022592, 'steps': 52200, 'loss/train': 1.6540666818618774} -11/07/2021 04:34:45 - INFO - __main__ - Step 52202: {'lr': 0.00037099142362170454, 'samples': 10022784, 'steps': 52201, 'loss/train': 1.695608377456665} -11/07/2021 04:34:45 - INFO - __main__ - Step 52203: {'lr': 0.0003709867797316105, 'samples': 10022976, 'steps': 52202, 'loss/train': 1.1415761709213257} -11/07/2021 04:34:46 - INFO - __main__ - Step 52204: {'lr': 0.0003709821357870016, 'samples': 10023168, 'steps': 52203, 'loss/train': 0.9897325038909912} -11/07/2021 04:34:46 - INFO - __main__ - Step 52205: {'lr': 0.0003709774917878802, 'samples': 10023360, 'steps': 52204, 'loss/train': 1.4016780853271484} -11/07/2021 04:34:46 - INFO - __main__ - Step 52206: {'lr': 0.00037097284773424805, 'samples': 10023552, 'steps': 52205, 'loss/train': 0.12023314088582993} -11/07/2021 04:34:47 - INFO - __main__ - Step 52207: {'lr': 0.0003709682036261075, 'samples': 10023744, 'steps': 52206, 'loss/train': 1.1758884191513062} -11/07/2021 04:34:48 - INFO - __main__ - Step 52208: {'lr': 0.00037096355946346045, 'samples': 10023936, 'steps': 52207, 'loss/train': 1.5671637058258057} -11/07/2021 04:34:48 - INFO - __main__ - Step 52209: {'lr': 0.00037095891524630914, 'samples': 10024128, 'steps': 52208, 'loss/train': 1.3916738033294678} -11/07/2021 04:34:48 - INFO - __main__ - Step 52210: {'lr': 0.00037095427097465564, 'samples': 10024320, 'steps': 52209, 'loss/train': 0.7325248122215271} -11/07/2021 04:34:49 - INFO - __main__ - Step 52211: {'lr': 0.00037094962664850194, 'samples': 10024512, 'steps': 52210, 'loss/train': 1.4294133186340332} -11/07/2021 04:34:50 - INFO - __main__ - Step 52212: {'lr': 0.00037094498226785023, 'samples': 10024704, 'steps': 52211, 'loss/train': 0.8006132245063782} -11/07/2021 04:34:50 - INFO - __main__ - Step 52213: {'lr': 0.00037094033783270256, 'samples': 10024896, 'steps': 52212, 'loss/train': 1.655676007270813} -11/07/2021 04:34:50 - INFO - __main__ - Step 52214: {'lr': 0.0003709356933430611, 'samples': 10025088, 'steps': 52213, 'loss/train': 1.8293867111206055} -11/07/2021 04:34:51 - INFO - __main__ - Step 52215: {'lr': 0.00037093104879892786, 'samples': 10025280, 'steps': 52214, 'loss/train': 1.439482569694519} -11/07/2021 04:34:51 - INFO - __main__ - Step 52216: {'lr': 0.000370926404200305, 'samples': 10025472, 'steps': 52215, 'loss/train': 0.9110205769538879} -11/07/2021 04:34:52 - INFO - __main__ - Step 52217: {'lr': 0.0003709217595471945, 'samples': 10025664, 'steps': 52216, 'loss/train': 1.7956041097640991} -11/07/2021 04:34:53 - INFO - __main__ - Step 52218: {'lr': 0.0003709171148395985, 'samples': 10025856, 'steps': 52217, 'loss/train': 1.5604493618011475} -11/07/2021 04:34:53 - INFO - __main__ - Step 52219: {'lr': 0.00037091247007751916, 'samples': 10026048, 'steps': 52218, 'loss/train': 1.6892719268798828} -11/07/2021 04:34:53 - INFO - __main__ - Step 52220: {'lr': 0.0003709078252609585, 'samples': 10026240, 'steps': 52219, 'loss/train': 1.3288346529006958} -11/07/2021 04:34:54 - INFO - __main__ - Step 52221: {'lr': 0.0003709031803899187, 'samples': 10026432, 'steps': 52220, 'loss/train': 1.9864845275878906} -11/07/2021 04:34:54 - INFO - __main__ - Step 52222: {'lr': 0.0003708985354644017, 'samples': 10026624, 'steps': 52221, 'loss/train': 1.2254571914672852} -11/07/2021 04:34:55 - INFO - __main__ - Step 52223: {'lr': 0.00037089389048440975, 'samples': 10026816, 'steps': 52222, 'loss/train': 1.5201977491378784} -11/07/2021 04:34:55 - INFO - __main__ - Step 52224: {'lr': 0.0003708892454499448, 'samples': 10027008, 'steps': 52223, 'loss/train': 2.122084856033325} -11/07/2021 04:34:56 - INFO - __main__ - Step 52225: {'lr': 0.00037088460036100915, 'samples': 10027200, 'steps': 52224, 'loss/train': 2.207977771759033} -11/07/2021 04:34:56 - INFO - __main__ - Step 52226: {'lr': 0.0003708799552176046, 'samples': 10027392, 'steps': 52225, 'loss/train': 1.3794692754745483} -11/07/2021 04:34:56 - INFO - __main__ - Step 52227: {'lr': 0.0003708753100197336, 'samples': 10027584, 'steps': 52226, 'loss/train': 1.742241382598877} -11/07/2021 04:34:57 - INFO - __main__ - Step 52228: {'lr': 0.00037087066476739795, 'samples': 10027776, 'steps': 52227, 'loss/train': 1.3941805362701416} -11/07/2021 04:34:58 - INFO - __main__ - Step 52229: {'lr': 0.0003708660194605998, 'samples': 10027968, 'steps': 52228, 'loss/train': 1.2187187671661377} -11/07/2021 04:34:58 - INFO - __main__ - Step 52230: {'lr': 0.0003708613740993414, 'samples': 10028160, 'steps': 52229, 'loss/train': 1.5902061462402344} -11/07/2021 04:34:59 - INFO - __main__ - Step 52231: {'lr': 0.00037085672868362464, 'samples': 10028352, 'steps': 52230, 'loss/train': 1.5531061887741089} -11/07/2021 04:34:59 - INFO - __main__ - Step 52232: {'lr': 0.0003708520832134518, 'samples': 10028544, 'steps': 52231, 'loss/train': 2.109830141067505} -11/07/2021 04:35:00 - INFO - __main__ - Step 52233: {'lr': 0.00037084743768882474, 'samples': 10028736, 'steps': 52232, 'loss/train': 1.4185560941696167} -11/07/2021 04:35:00 - INFO - __main__ - Step 52234: {'lr': 0.00037084279210974577, 'samples': 10028928, 'steps': 52233, 'loss/train': 1.798834204673767} -11/07/2021 04:35:01 - INFO - __main__ - Step 52235: {'lr': 0.00037083814647621686, 'samples': 10029120, 'steps': 52234, 'loss/train': 2.322261333465576} -11/07/2021 04:35:01 - INFO - __main__ - Step 52236: {'lr': 0.0003708335007882402, 'samples': 10029312, 'steps': 52235, 'loss/train': 1.1212799549102783} -11/07/2021 04:35:01 - INFO - __main__ - Step 52237: {'lr': 0.00037082885504581775, 'samples': 10029504, 'steps': 52236, 'loss/train': 0.9621900320053101} -11/07/2021 04:35:02 - INFO - __main__ - Step 52238: {'lr': 0.0003708242092489518, 'samples': 10029696, 'steps': 52237, 'loss/train': 1.47548508644104} -11/07/2021 04:35:03 - INFO - __main__ - Step 52239: {'lr': 0.0003708195633976442, 'samples': 10029888, 'steps': 52238, 'loss/train': 0.9711529612541199} -11/07/2021 04:35:03 - INFO - __main__ - Step 52240: {'lr': 0.0003708149174918972, 'samples': 10030080, 'steps': 52239, 'loss/train': 1.5734766721725464} -11/07/2021 04:35:03 - INFO - __main__ - Step 52241: {'lr': 0.000370810271531713, 'samples': 10030272, 'steps': 52240, 'loss/train': 1.292687177658081} -11/07/2021 04:35:04 - INFO - __main__ - Step 52242: {'lr': 0.0003708056255170934, 'samples': 10030464, 'steps': 52241, 'loss/train': 1.3701890707015991} -11/07/2021 04:35:04 - INFO - __main__ - Step 52243: {'lr': 0.0003708009794480407, 'samples': 10030656, 'steps': 52242, 'loss/train': 1.7831813097000122} -11/07/2021 04:35:05 - INFO - __main__ - Step 52244: {'lr': 0.0003707963333245569, 'samples': 10030848, 'steps': 52243, 'loss/train': 1.6027790307998657} -11/07/2021 04:35:05 - INFO - __main__ - Step 52245: {'lr': 0.0003707916871466442, 'samples': 10031040, 'steps': 52244, 'loss/train': 1.0570629835128784} -11/07/2021 04:35:06 - INFO - __main__ - Step 52246: {'lr': 0.0003707870409143046, 'samples': 10031232, 'steps': 52245, 'loss/train': 1.3571195602416992} -11/07/2021 04:35:06 - INFO - __main__ - Step 52247: {'lr': 0.00037078239462754023, 'samples': 10031424, 'steps': 52246, 'loss/train': 1.5466933250427246} -11/07/2021 04:35:06 - INFO - __main__ - Step 52248: {'lr': 0.0003707777482863532, 'samples': 10031616, 'steps': 52247, 'loss/train': 1.3029929399490356} -11/07/2021 04:35:07 - INFO - __main__ - Step 52249: {'lr': 0.00037077310189074554, 'samples': 10031808, 'steps': 52248, 'loss/train': 1.5803481340408325} -11/07/2021 04:35:08 - INFO - __main__ - Step 52250: {'lr': 0.0003707684554407194, 'samples': 10032000, 'steps': 52249, 'loss/train': 1.0084435939788818} -11/07/2021 04:35:08 - INFO - __main__ - Step 52251: {'lr': 0.0003707638089362769, 'samples': 10032192, 'steps': 52250, 'loss/train': 1.7735447883605957} -11/07/2021 04:35:08 - INFO - __main__ - Step 52252: {'lr': 0.00037075916237742, 'samples': 10032384, 'steps': 52251, 'loss/train': 1.7647929191589355} -11/07/2021 04:35:09 - INFO - __main__ - Step 52253: {'lr': 0.00037075451576415095, 'samples': 10032576, 'steps': 52252, 'loss/train': 2.0002384185791016} -11/07/2021 04:35:10 - INFO - __main__ - Step 52254: {'lr': 0.00037074986909647173, 'samples': 10032768, 'steps': 52253, 'loss/train': 1.2115262746810913} -11/07/2021 04:35:10 - INFO - __main__ - Step 52255: {'lr': 0.00037074522237438455, 'samples': 10032960, 'steps': 52254, 'loss/train': 1.3711144924163818} -11/07/2021 04:35:11 - INFO - __main__ - Step 52256: {'lr': 0.0003707405755978914, 'samples': 10033152, 'steps': 52255, 'loss/train': 1.4815617799758911} -11/07/2021 04:35:11 - INFO - __main__ - Step 52257: {'lr': 0.00037073592876699443, 'samples': 10033344, 'steps': 52256, 'loss/train': 1.395278811454773} -11/07/2021 04:35:11 - INFO - __main__ - Step 52258: {'lr': 0.0003707312818816956, 'samples': 10033536, 'steps': 52257, 'loss/train': 1.6057864427566528} -11/07/2021 04:35:12 - INFO - __main__ - Step 52259: {'lr': 0.00037072663494199724, 'samples': 10033728, 'steps': 52258, 'loss/train': 1.6924219131469727} -11/07/2021 04:35:13 - INFO - __main__ - Step 52260: {'lr': 0.0003707219879479013, 'samples': 10033920, 'steps': 52259, 'loss/train': 0.9788321852684021} -11/07/2021 04:35:13 - INFO - __main__ - Step 52261: {'lr': 0.0003707173408994099, 'samples': 10034112, 'steps': 52260, 'loss/train': 1.6294881105422974} -11/07/2021 04:35:13 - INFO - __main__ - Step 52262: {'lr': 0.0003707126937965251, 'samples': 10034304, 'steps': 52261, 'loss/train': 1.7520924806594849} -11/07/2021 04:35:14 - INFO - __main__ - Step 52263: {'lr': 0.0003707080466392491, 'samples': 10034496, 'steps': 52262, 'loss/train': 1.4391309022903442} -11/07/2021 04:35:15 - INFO - __main__ - Step 52264: {'lr': 0.0003707033994275838, 'samples': 10034688, 'steps': 52263, 'loss/train': 1.4674715995788574} -11/07/2021 04:35:15 - INFO - __main__ - Step 52265: {'lr': 0.0003706987521615315, 'samples': 10034880, 'steps': 52264, 'loss/train': 1.7465715408325195} -11/07/2021 04:35:15 - INFO - __main__ - Step 52266: {'lr': 0.0003706941048410941, 'samples': 10035072, 'steps': 52265, 'loss/train': 1.4335037469863892} -11/07/2021 04:35:16 - INFO - __main__ - Step 52267: {'lr': 0.0003706894574662739, 'samples': 10035264, 'steps': 52266, 'loss/train': 1.3291215896606445} -11/07/2021 04:35:16 - INFO - __main__ - Step 52268: {'lr': 0.0003706848100370729, 'samples': 10035456, 'steps': 52267, 'loss/train': 1.7214386463165283} -11/07/2021 04:35:17 - INFO - __main__ - Step 52269: {'lr': 0.00037068016255349315, 'samples': 10035648, 'steps': 52268, 'loss/train': 0.7420121431350708} -11/07/2021 04:35:17 - INFO - __main__ - Step 52270: {'lr': 0.0003706755150155368, 'samples': 10035840, 'steps': 52269, 'loss/train': 1.389876127243042} -11/07/2021 04:35:18 - INFO - __main__ - Step 52271: {'lr': 0.0003706708674232059, 'samples': 10036032, 'steps': 52270, 'loss/train': 1.0616005659103394} -11/07/2021 04:35:18 - INFO - __main__ - Step 52272: {'lr': 0.0003706662197765025, 'samples': 10036224, 'steps': 52271, 'loss/train': 1.2601686716079712} -11/07/2021 04:35:19 - INFO - __main__ - Step 52273: {'lr': 0.00037066157207542885, 'samples': 10036416, 'steps': 52272, 'loss/train': 1.566015362739563} -11/07/2021 04:35:19 - INFO - __main__ - Step 52274: {'lr': 0.00037065692431998695, 'samples': 10036608, 'steps': 52273, 'loss/train': 1.3770115375518799} -11/07/2021 04:35:20 - INFO - __main__ - Step 52275: {'lr': 0.00037065227651017897, 'samples': 10036800, 'steps': 52274, 'loss/train': 1.5455814599990845} -11/07/2021 04:35:20 - INFO - __main__ - Step 52276: {'lr': 0.0003706476286460068, 'samples': 10036992, 'steps': 52275, 'loss/train': 1.2364351749420166} -11/07/2021 04:35:21 - INFO - __main__ - Step 52277: {'lr': 0.0003706429807274728, 'samples': 10037184, 'steps': 52276, 'loss/train': 1.5304927825927734} -11/07/2021 04:35:21 - INFO - __main__ - Step 52278: {'lr': 0.0003706383327545788, 'samples': 10037376, 'steps': 52277, 'loss/train': 1.2667349576950073} -11/07/2021 04:35:21 - INFO - __main__ - Step 52279: {'lr': 0.0003706336847273271, 'samples': 10037568, 'steps': 52278, 'loss/train': 1.5852817296981812} -11/07/2021 04:35:22 - INFO - __main__ - Step 52280: {'lr': 0.00037062903664571975, 'samples': 10037760, 'steps': 52279, 'loss/train': 1.7066222429275513} -11/07/2021 04:35:23 - INFO - __main__ - Step 52281: {'lr': 0.00037062438850975877, 'samples': 10037952, 'steps': 52280, 'loss/train': 1.5558053255081177} -11/07/2021 04:35:23 - INFO - __main__ - Step 52282: {'lr': 0.00037061974031944635, 'samples': 10038144, 'steps': 52281, 'loss/train': 1.5429325103759766} -11/07/2021 04:35:23 - INFO - __main__ - Step 52283: {'lr': 0.0003706150920747845, 'samples': 10038336, 'steps': 52282, 'loss/train': 1.3963603973388672} -11/07/2021 04:35:24 - INFO - __main__ - Step 52284: {'lr': 0.00037061044377577535, 'samples': 10038528, 'steps': 52283, 'loss/train': 1.558125376701355} -11/07/2021 04:35:25 - INFO - __main__ - Step 52285: {'lr': 0.00037060579542242094, 'samples': 10038720, 'steps': 52284, 'loss/train': 1.5957164764404297} -11/07/2021 04:35:25 - INFO - __main__ - Step 52286: {'lr': 0.00037060114701472355, 'samples': 10038912, 'steps': 52285, 'loss/train': 1.7144229412078857} -11/07/2021 04:35:25 - INFO - __main__ - Step 52287: {'lr': 0.00037059649855268503, 'samples': 10039104, 'steps': 52286, 'loss/train': 1.2599412202835083} -11/07/2021 04:35:26 - INFO - __main__ - Step 52288: {'lr': 0.0003705918500363077, 'samples': 10039296, 'steps': 52287, 'loss/train': 1.2666865587234497} -11/07/2021 04:35:26 - INFO - __main__ - Step 52289: {'lr': 0.0003705872014655934, 'samples': 10039488, 'steps': 52288, 'loss/train': 1.5479722023010254} -11/07/2021 04:35:27 - INFO - __main__ - Step 52290: {'lr': 0.0003705825528405445, 'samples': 10039680, 'steps': 52289, 'loss/train': 1.3783215284347534} -11/07/2021 04:35:27 - INFO - __main__ - Step 52291: {'lr': 0.0003705779041611629, 'samples': 10039872, 'steps': 52290, 'loss/train': 1.649381160736084} -11/07/2021 04:35:28 - INFO - __main__ - Step 52292: {'lr': 0.00037057325542745075, 'samples': 10040064, 'steps': 52291, 'loss/train': 1.252488374710083} -11/07/2021 04:35:28 - INFO - __main__ - Step 52293: {'lr': 0.00037056860663941014, 'samples': 10040256, 'steps': 52292, 'loss/train': 1.1404080390930176} -11/07/2021 04:35:29 - INFO - __main__ - Step 52294: {'lr': 0.0003705639577970432, 'samples': 10040448, 'steps': 52293, 'loss/train': 1.6178735494613647} -11/07/2021 04:35:29 - INFO - __main__ - Step 52295: {'lr': 0.00037055930890035203, 'samples': 10040640, 'steps': 52294, 'loss/train': 1.131771206855774} -11/07/2021 04:35:30 - INFO - __main__ - Step 52296: {'lr': 0.00037055465994933866, 'samples': 10040832, 'steps': 52295, 'loss/train': 1.2351644039154053} -11/07/2021 04:35:30 - INFO - __main__ - Step 52297: {'lr': 0.00037055001094400523, 'samples': 10041024, 'steps': 52296, 'loss/train': 1.5820939540863037} -11/07/2021 04:35:31 - INFO - __main__ - Step 52298: {'lr': 0.0003705453618843538, 'samples': 10041216, 'steps': 52297, 'loss/train': 1.3582496643066406} -11/07/2021 04:35:31 - INFO - __main__ - Step 52299: {'lr': 0.00037054071277038654, 'samples': 10041408, 'steps': 52298, 'loss/train': 1.574306607246399} -11/07/2021 04:35:31 - INFO - __main__ - Step 52300: {'lr': 0.00037053606360210544, 'samples': 10041600, 'steps': 52299, 'loss/train': 1.3616039752960205} -11/07/2021 04:35:32 - INFO - __main__ - Step 52301: {'lr': 0.00037053141437951264, 'samples': 10041792, 'steps': 52300, 'loss/train': 1.6979727745056152} -11/07/2021 04:35:33 - INFO - __main__ - Step 52302: {'lr': 0.00037052676510261043, 'samples': 10041984, 'steps': 52301, 'loss/train': 1.4811590909957886} -11/07/2021 04:35:33 - INFO - __main__ - Step 52303: {'lr': 0.00037052211577140047, 'samples': 10042176, 'steps': 52302, 'loss/train': 1.540258765220642} -11/07/2021 04:35:33 - INFO - __main__ - Step 52304: {'lr': 0.00037051746638588526, 'samples': 10042368, 'steps': 52303, 'loss/train': 2.055814504623413} -11/07/2021 04:35:34 - INFO - __main__ - Step 52305: {'lr': 0.00037051281694606666, 'samples': 10042560, 'steps': 52304, 'loss/train': 1.7825428247451782} -11/07/2021 04:35:35 - INFO - __main__ - Step 52306: {'lr': 0.00037050816745194686, 'samples': 10042752, 'steps': 52305, 'loss/train': 1.316963791847229} -11/07/2021 04:35:36 - INFO - __main__ - Step 52307: {'lr': 0.00037050351790352795, 'samples': 10042944, 'steps': 52306, 'loss/train': 0.2811761200428009} -11/07/2021 04:35:36 - INFO - __main__ - Step 52308: {'lr': 0.00037049886830081203, 'samples': 10043136, 'steps': 52307, 'loss/train': 2.200223207473755} -11/07/2021 04:35:36 - INFO - __main__ - Step 52309: {'lr': 0.00037049421864380116, 'samples': 10043328, 'steps': 52308, 'loss/train': 1.544974684715271} -11/07/2021 04:35:37 - INFO - __main__ - Step 52310: {'lr': 0.00037048956893249746, 'samples': 10043520, 'steps': 52309, 'loss/train': 1.5108259916305542} -11/07/2021 04:35:37 - INFO - __main__ - Step 52311: {'lr': 0.00037048491916690304, 'samples': 10043712, 'steps': 52310, 'loss/train': 1.7455787658691406} -11/07/2021 04:35:38 - INFO - __main__ - Step 52312: {'lr': 0.00037048026934701997, 'samples': 10043904, 'steps': 52311, 'loss/train': 0.5629734992980957} -11/07/2021 04:35:38 - INFO - __main__ - Step 52313: {'lr': 0.0003704756194728503, 'samples': 10044096, 'steps': 52312, 'loss/train': 2.0434930324554443} -11/07/2021 04:35:39 - INFO - __main__ - Step 52314: {'lr': 0.0003704709695443962, 'samples': 10044288, 'steps': 52313, 'loss/train': 1.4854761362075806} -11/07/2021 04:35:39 - INFO - __main__ - Step 52315: {'lr': 0.00037046631956165975, 'samples': 10044480, 'steps': 52314, 'loss/train': 1.2033756971359253} -11/07/2021 04:35:40 - INFO - __main__ - Step 52316: {'lr': 0.00037046166952464307, 'samples': 10044672, 'steps': 52315, 'loss/train': 1.3256874084472656} -11/07/2021 04:35:41 - INFO - __main__ - Step 52317: {'lr': 0.00037045701943334814, 'samples': 10044864, 'steps': 52316, 'loss/train': 2.1899333000183105} -11/07/2021 04:35:41 - INFO - __main__ - Step 52318: {'lr': 0.0003704523692877772, 'samples': 10045056, 'steps': 52317, 'loss/train': 0.2942962050437927} -11/07/2021 04:35:41 - INFO - __main__ - Step 52319: {'lr': 0.00037044771908793225, 'samples': 10045248, 'steps': 52318, 'loss/train': 1.5847573280334473} -11/07/2021 04:35:42 - INFO - __main__ - Step 52320: {'lr': 0.0003704430688338154, 'samples': 10045440, 'steps': 52319, 'loss/train': 1.1405531167984009} -11/07/2021 04:35:42 - INFO - __main__ - Step 52321: {'lr': 0.0003704384185254288, 'samples': 10045632, 'steps': 52320, 'loss/train': 1.4911326169967651} -11/07/2021 04:35:43 - INFO - __main__ - Step 52322: {'lr': 0.00037043376816277453, 'samples': 10045824, 'steps': 52321, 'loss/train': 1.1727687120437622} -11/07/2021 04:35:44 - INFO - __main__ - Step 52323: {'lr': 0.00037042911774585465, 'samples': 10046016, 'steps': 52322, 'loss/train': 5.766360759735107} -11/07/2021 04:35:44 - INFO - __main__ - Step 52324: {'lr': 0.0003704244672746712, 'samples': 10046208, 'steps': 52323, 'loss/train': 1.3843739032745361} -11/07/2021 04:35:44 - INFO - __main__ - Step 52325: {'lr': 0.00037041981674922644, 'samples': 10046400, 'steps': 52324, 'loss/train': 1.3703349828720093} -11/07/2021 04:35:45 - INFO - __main__ - Step 52326: {'lr': 0.00037041516616952223, 'samples': 10046592, 'steps': 52325, 'loss/train': 1.5113415718078613} -11/07/2021 04:35:45 - INFO - __main__ - Step 52327: {'lr': 0.0003704105155355609, 'samples': 10046784, 'steps': 52326, 'loss/train': 1.5702812671661377} -11/07/2021 04:35:46 - INFO - __main__ - Step 52328: {'lr': 0.0003704058648473445, 'samples': 10046976, 'steps': 52327, 'loss/train': 1.2943845987319946} -11/07/2021 04:35:46 - INFO - __main__ - Step 52329: {'lr': 0.000370401214104875, 'samples': 10047168, 'steps': 52328, 'loss/train': 1.3867039680480957} -11/07/2021 04:35:47 - INFO - __main__ - Step 52330: {'lr': 0.0003703965633081546, 'samples': 10047360, 'steps': 52329, 'loss/train': 1.4289169311523438} -11/07/2021 04:35:47 - INFO - __main__ - Step 52331: {'lr': 0.00037039191245718536, 'samples': 10047552, 'steps': 52330, 'loss/train': 1.3633909225463867} -11/07/2021 04:35:47 - INFO - __main__ - Step 52332: {'lr': 0.00037038726155196934, 'samples': 10047744, 'steps': 52331, 'loss/train': 1.0888973474502563} -11/07/2021 04:35:48 - INFO - __main__ - Step 52333: {'lr': 0.00037038261059250873, 'samples': 10047936, 'steps': 52332, 'loss/train': 1.523136854171753} -11/07/2021 04:35:49 - INFO - __main__ - Step 52334: {'lr': 0.0003703779595788056, 'samples': 10048128, 'steps': 52333, 'loss/train': 1.490991234779358} -11/07/2021 04:35:49 - INFO - __main__ - Step 52335: {'lr': 0.00037037330851086194, 'samples': 10048320, 'steps': 52334, 'loss/train': 1.7871202230453491} -11/07/2021 04:35:49 - INFO - __main__ - Step 52336: {'lr': 0.00037036865738868, 'samples': 10048512, 'steps': 52335, 'loss/train': 1.5942060947418213} -11/07/2021 04:35:50 - INFO - __main__ - Step 52337: {'lr': 0.00037036400621226175, 'samples': 10048704, 'steps': 52336, 'loss/train': 1.4056665897369385} -11/07/2021 04:35:51 - INFO - __main__ - Step 52338: {'lr': 0.00037035935498160933, 'samples': 10048896, 'steps': 52337, 'loss/train': 1.394268274307251} -11/07/2021 04:35:51 - INFO - __main__ - Step 52339: {'lr': 0.00037035470369672484, 'samples': 10049088, 'steps': 52338, 'loss/train': 1.4369909763336182} -11/07/2021 04:35:51 - INFO - __main__ - Step 52340: {'lr': 0.0003703500523576104, 'samples': 10049280, 'steps': 52339, 'loss/train': 1.4380542039871216} -11/07/2021 04:35:52 - INFO - __main__ - Step 52341: {'lr': 0.0003703454009642681, 'samples': 10049472, 'steps': 52340, 'loss/train': 0.6161519289016724} -11/07/2021 04:35:52 - INFO - __main__ - Step 52342: {'lr': 0.0003703407495167, 'samples': 10049664, 'steps': 52341, 'loss/train': 1.1656584739685059} -11/07/2021 04:35:53 - INFO - __main__ - Step 52343: {'lr': 0.0003703360980149082, 'samples': 10049856, 'steps': 52342, 'loss/train': 1.527284860610962} -11/07/2021 04:35:54 - INFO - __main__ - Step 52344: {'lr': 0.00037033144645889487, 'samples': 10050048, 'steps': 52343, 'loss/train': 0.4405560791492462} -11/07/2021 04:35:54 - INFO - __main__ - Step 52345: {'lr': 0.000370326794848662, 'samples': 10050240, 'steps': 52344, 'loss/train': 1.3896318674087524} -11/07/2021 04:35:54 - INFO - __main__ - Step 52346: {'lr': 0.00037032214318421174, 'samples': 10050432, 'steps': 52345, 'loss/train': 1.2713168859481812} -11/07/2021 04:35:55 - INFO - __main__ - Step 52347: {'lr': 0.00037031749146554616, 'samples': 10050624, 'steps': 52346, 'loss/train': 1.679565668106079} -11/07/2021 04:35:56 - INFO - __main__ - Step 52348: {'lr': 0.00037031283969266737, 'samples': 10050816, 'steps': 52347, 'loss/train': 1.7118709087371826} -11/07/2021 04:35:56 - INFO - __main__ - Step 52349: {'lr': 0.0003703081878655775, 'samples': 10051008, 'steps': 52348, 'loss/train': 1.497228980064392} -11/07/2021 04:35:56 - INFO - __main__ - Step 52350: {'lr': 0.00037030353598427866, 'samples': 10051200, 'steps': 52349, 'loss/train': 1.8344635963439941} -11/07/2021 04:35:57 - INFO - __main__ - Step 52351: {'lr': 0.0003702988840487728, 'samples': 10051392, 'steps': 52350, 'loss/train': 1.1844738721847534} -11/07/2021 04:35:57 - INFO - __main__ - Step 52352: {'lr': 0.0003702942320590622, 'samples': 10051584, 'steps': 52351, 'loss/train': 1.0559014081954956} -11/07/2021 04:35:58 - INFO - __main__ - Step 52353: {'lr': 0.00037028958001514886, 'samples': 10051776, 'steps': 52352, 'loss/train': 1.5483312606811523} -11/07/2021 04:35:58 - INFO - __main__ - Step 52354: {'lr': 0.00037028492791703484, 'samples': 10051968, 'steps': 52353, 'loss/train': 5.4565935134887695} -11/07/2021 04:35:59 - INFO - __main__ - Step 52355: {'lr': 0.0003702802757647223, 'samples': 10052160, 'steps': 52354, 'loss/train': 1.3493404388427734} -11/07/2021 04:35:59 - INFO - __main__ - Step 52356: {'lr': 0.0003702756235582134, 'samples': 10052352, 'steps': 52355, 'loss/train': 1.788238525390625} -11/07/2021 04:36:00 - INFO - __main__ - Step 52357: {'lr': 0.00037027097129751016, 'samples': 10052544, 'steps': 52356, 'loss/train': 1.8171045780181885} -11/07/2021 04:36:00 - INFO - __main__ - Step 52358: {'lr': 0.0003702663189826146, 'samples': 10052736, 'steps': 52357, 'loss/train': 1.5824415683746338} -11/07/2021 04:36:01 - INFO - __main__ - Step 52359: {'lr': 0.0003702616666135289, 'samples': 10052928, 'steps': 52358, 'loss/train': 1.1794646978378296} -11/07/2021 04:36:01 - INFO - __main__ - Step 52360: {'lr': 0.0003702570141902552, 'samples': 10053120, 'steps': 52359, 'loss/train': 1.9084322452545166} -11/07/2021 04:36:01 - INFO - __main__ - Step 52361: {'lr': 0.00037025236171279546, 'samples': 10053312, 'steps': 52360, 'loss/train': 1.4402989149093628} -11/07/2021 04:36:02 - INFO - __main__ - Step 52362: {'lr': 0.000370247709181152, 'samples': 10053504, 'steps': 52361, 'loss/train': 1.2373167276382446} -11/07/2021 04:36:02 - INFO - __main__ - Step 52363: {'lr': 0.00037024305659532665, 'samples': 10053696, 'steps': 52362, 'loss/train': 1.5906411409378052} -11/07/2021 04:36:03 - INFO - __main__ - Step 52364: {'lr': 0.00037023840395532167, 'samples': 10053888, 'steps': 52363, 'loss/train': 1.3774484395980835} -11/07/2021 04:36:04 - INFO - __main__ - Step 52365: {'lr': 0.0003702337512611391, 'samples': 10054080, 'steps': 52364, 'loss/train': 1.7504037618637085} -11/07/2021 04:36:04 - INFO - __main__ - Step 52366: {'lr': 0.00037022909851278107, 'samples': 10054272, 'steps': 52365, 'loss/train': 1.125939965248108} -11/07/2021 04:36:04 - INFO - __main__ - Step 52367: {'lr': 0.0003702244457102497, 'samples': 10054464, 'steps': 52366, 'loss/train': 1.6031582355499268} -11/07/2021 04:36:05 - INFO - __main__ - Step 52368: {'lr': 0.000370219792853547, 'samples': 10054656, 'steps': 52367, 'loss/train': 2.110670566558838} -11/07/2021 04:36:06 - INFO - __main__ - Step 52369: {'lr': 0.0003702151399426752, 'samples': 10054848, 'steps': 52368, 'loss/train': 0.9725801348686218} -11/07/2021 04:36:06 - INFO - __main__ - Step 52370: {'lr': 0.0003702104869776362, 'samples': 10055040, 'steps': 52369, 'loss/train': 1.8233392238616943} -11/07/2021 04:36:06 - INFO - __main__ - Step 52371: {'lr': 0.0003702058339584323, 'samples': 10055232, 'steps': 52370, 'loss/train': 1.6103260517120361} -11/07/2021 04:36:07 - INFO - __main__ - Step 52372: {'lr': 0.00037020118088506546, 'samples': 10055424, 'steps': 52371, 'loss/train': 1.3690156936645508} -11/07/2021 04:36:07 - INFO - __main__ - Step 52373: {'lr': 0.0003701965277575378, 'samples': 10055616, 'steps': 52372, 'loss/train': 1.5724278688430786} -11/07/2021 04:36:08 - INFO - __main__ - Step 52374: {'lr': 0.0003701918745758515, 'samples': 10055808, 'steps': 52373, 'loss/train': 1.6084142923355103} -11/07/2021 04:36:08 - INFO - __main__ - Step 52375: {'lr': 0.00037018722134000856, 'samples': 10056000, 'steps': 52374, 'loss/train': 1.272934913635254} -11/07/2021 04:36:09 - INFO - __main__ - Step 52376: {'lr': 0.00037018256805001115, 'samples': 10056192, 'steps': 52375, 'loss/train': 1.0911200046539307} -11/07/2021 04:36:09 - INFO - __main__ - Step 52377: {'lr': 0.00037017791470586126, 'samples': 10056384, 'steps': 52376, 'loss/train': 1.0611250400543213} -11/07/2021 04:36:09 - INFO - __main__ - Step 52378: {'lr': 0.0003701732613075611, 'samples': 10056576, 'steps': 52377, 'loss/train': 1.5138376951217651} -11/07/2021 04:36:11 - INFO - __main__ - Step 52379: {'lr': 0.00037016860785511274, 'samples': 10056768, 'steps': 52378, 'loss/train': 1.3715938329696655} -11/07/2021 04:36:11 - INFO - __main__ - Step 52380: {'lr': 0.00037016395434851825, 'samples': 10056960, 'steps': 52379, 'loss/train': 2.1460390090942383} -11/07/2021 04:36:11 - INFO - __main__ - Step 52381: {'lr': 0.0003701593007877797, 'samples': 10057152, 'steps': 52380, 'loss/train': 1.119550347328186} -11/07/2021 04:36:12 - INFO - __main__ - Step 52382: {'lr': 0.00037015464717289924, 'samples': 10057344, 'steps': 52381, 'loss/train': 0.9674318432807922} -11/07/2021 04:36:12 - INFO - __main__ - Step 52383: {'lr': 0.000370149993503879, 'samples': 10057536, 'steps': 52382, 'loss/train': 1.636091709136963} -11/07/2021 04:36:13 - INFO - __main__ - Step 52384: {'lr': 0.000370145339780721, 'samples': 10057728, 'steps': 52383, 'loss/train': 1.5504209995269775} -11/07/2021 04:36:13 - INFO - __main__ - Step 52385: {'lr': 0.0003701406860034273, 'samples': 10057920, 'steps': 52384, 'loss/train': 1.3792790174484253} -11/07/2021 04:36:14 - INFO - __main__ - Step 52386: {'lr': 0.0003701360321720001, 'samples': 10058112, 'steps': 52385, 'loss/train': 1.3007304668426514} -11/07/2021 04:36:14 - INFO - __main__ - Step 52387: {'lr': 0.0003701313782864415, 'samples': 10058304, 'steps': 52386, 'loss/train': 1.4700512886047363} -11/07/2021 04:36:14 - INFO - __main__ - Step 52388: {'lr': 0.0003701267243467535, 'samples': 10058496, 'steps': 52387, 'loss/train': 1.9685583114624023} -11/07/2021 04:36:15 - INFO - __main__ - Step 52389: {'lr': 0.00037012207035293834, 'samples': 10058688, 'steps': 52388, 'loss/train': 1.2751091718673706} -11/07/2021 04:36:16 - INFO - __main__ - Step 52390: {'lr': 0.00037011741630499796, 'samples': 10058880, 'steps': 52389, 'loss/train': 1.6515552997589111} -11/07/2021 04:36:16 - INFO - __main__ - Step 52391: {'lr': 0.00037011276220293447, 'samples': 10059072, 'steps': 52390, 'loss/train': 1.0018212795257568} -11/07/2021 04:36:16 - INFO - __main__ - Step 52392: {'lr': 0.0003701081080467501, 'samples': 10059264, 'steps': 52391, 'loss/train': 1.524664044380188} -11/07/2021 04:36:17 - INFO - __main__ - Step 52393: {'lr': 0.0003701034538364468, 'samples': 10059456, 'steps': 52392, 'loss/train': 1.8944721221923828} -11/07/2021 04:36:17 - INFO - __main__ - Step 52394: {'lr': 0.0003700987995720269, 'samples': 10059648, 'steps': 52393, 'loss/train': 0.9276136159896851} -11/07/2021 04:36:18 - INFO - __main__ - Step 52395: {'lr': 0.0003700941452534922, 'samples': 10059840, 'steps': 52394, 'loss/train': 1.7017980813980103} -11/07/2021 04:36:19 - INFO - __main__ - Step 52396: {'lr': 0.0003700894908808449, 'samples': 10060032, 'steps': 52395, 'loss/train': 1.5161792039871216} -11/07/2021 04:36:19 - INFO - __main__ - Step 52397: {'lr': 0.0003700848364540872, 'samples': 10060224, 'steps': 52396, 'loss/train': 1.536611557006836} -11/07/2021 04:36:19 - INFO - __main__ - Step 52398: {'lr': 0.0003700801819732211, 'samples': 10060416, 'steps': 52397, 'loss/train': 1.2143956422805786} -11/07/2021 04:36:20 - INFO - __main__ - Step 52399: {'lr': 0.0003700755274382487, 'samples': 10060608, 'steps': 52398, 'loss/train': 1.8598138093948364} -11/07/2021 04:36:21 - INFO - __main__ - Step 52400: {'lr': 0.0003700708728491722, 'samples': 10060800, 'steps': 52399, 'loss/train': 1.3368159532546997} -11/07/2021 04:36:21 - INFO - __main__ - Step 52401: {'lr': 0.0003700662182059936, 'samples': 10060992, 'steps': 52400, 'loss/train': 1.0483607053756714} -11/07/2021 04:36:21 - INFO - __main__ - Step 52402: {'lr': 0.0003700615635087149, 'samples': 10061184, 'steps': 52401, 'loss/train': 1.4616649150848389} -11/07/2021 04:36:22 - INFO - __main__ - Step 52403: {'lr': 0.00037005690875733843, 'samples': 10061376, 'steps': 52402, 'loss/train': 1.5702778100967407} -11/07/2021 04:36:22 - INFO - __main__ - Step 52404: {'lr': 0.00037005225395186616, 'samples': 10061568, 'steps': 52403, 'loss/train': 1.7624890804290771} -11/07/2021 04:36:23 - INFO - __main__ - Step 52405: {'lr': 0.00037004759909230016, 'samples': 10061760, 'steps': 52404, 'loss/train': 1.0354856252670288} -11/07/2021 04:36:24 - INFO - __main__ - Step 52406: {'lr': 0.0003700429441786426, 'samples': 10061952, 'steps': 52405, 'loss/train': 1.3917793035507202} -11/07/2021 04:36:24 - INFO - __main__ - Step 52407: {'lr': 0.0003700382892108955, 'samples': 10062144, 'steps': 52406, 'loss/train': 1.4974435567855835} -11/07/2021 04:36:24 - INFO - __main__ - Step 52408: {'lr': 0.000370033634189061, 'samples': 10062336, 'steps': 52407, 'loss/train': 1.3563601970672607} -11/07/2021 04:36:25 - INFO - __main__ - Step 52409: {'lr': 0.00037002897911314126, 'samples': 10062528, 'steps': 52408, 'loss/train': 1.632383108139038} -11/07/2021 04:36:26 - INFO - __main__ - Step 52410: {'lr': 0.0003700243239831382, 'samples': 10062720, 'steps': 52409, 'loss/train': 1.2046328783035278} -11/07/2021 04:36:26 - INFO - __main__ - Step 52411: {'lr': 0.00037001966879905414, 'samples': 10062912, 'steps': 52410, 'loss/train': 1.6029366254806519} -11/07/2021 04:36:26 - INFO - __main__ - Step 52412: {'lr': 0.00037001501356089103, 'samples': 10063104, 'steps': 52411, 'loss/train': 1.5252598524093628} -11/07/2021 04:36:27 - INFO - __main__ - Step 52413: {'lr': 0.00037001035826865096, 'samples': 10063296, 'steps': 52412, 'loss/train': 1.8335431814193726} -11/07/2021 04:36:27 - INFO - __main__ - Step 52414: {'lr': 0.00037000570292233613, 'samples': 10063488, 'steps': 52413, 'loss/train': 1.4575445652008057} -11/07/2021 04:36:28 - INFO - __main__ - Step 52415: {'lr': 0.00037000104752194857, 'samples': 10063680, 'steps': 52414, 'loss/train': 1.302187204360962} -11/07/2021 04:36:28 - INFO - __main__ - Step 52416: {'lr': 0.0003699963920674905, 'samples': 10063872, 'steps': 52415, 'loss/train': 1.4415488243103027} -11/07/2021 04:36:29 - INFO - __main__ - Step 52417: {'lr': 0.00036999173655896374, 'samples': 10064064, 'steps': 52416, 'loss/train': 1.3341501951217651} -11/07/2021 04:36:29 - INFO - __main__ - Step 52418: {'lr': 0.00036998708099637064, 'samples': 10064256, 'steps': 52417, 'loss/train': 1.7092583179473877} -11/07/2021 04:36:30 - INFO - __main__ - Step 52419: {'lr': 0.00036998242537971315, 'samples': 10064448, 'steps': 52418, 'loss/train': 1.554855227470398} -11/07/2021 04:36:31 - INFO - __main__ - Step 52420: {'lr': 0.00036997776970899344, 'samples': 10064640, 'steps': 52419, 'loss/train': 1.633256196975708} -11/07/2021 04:36:31 - INFO - __main__ - Step 52421: {'lr': 0.0003699731139842136, 'samples': 10064832, 'steps': 52420, 'loss/train': 1.1283069849014282} -11/07/2021 04:36:31 - INFO - __main__ - Step 52422: {'lr': 0.0003699684582053758, 'samples': 10065024, 'steps': 52421, 'loss/train': 0.8390668630599976} -11/07/2021 04:36:32 - INFO - __main__ - Step 52423: {'lr': 0.00036996380237248205, 'samples': 10065216, 'steps': 52422, 'loss/train': 1.277381181716919} -11/07/2021 04:36:32 - INFO - __main__ - Step 52424: {'lr': 0.0003699591464855344, 'samples': 10065408, 'steps': 52423, 'loss/train': 1.3982897996902466} -11/07/2021 04:36:32 - INFO - __main__ - Step 52425: {'lr': 0.00036995449054453503, 'samples': 10065600, 'steps': 52424, 'loss/train': 1.5712449550628662} -11/07/2021 04:36:33 - INFO - __main__ - Step 52426: {'lr': 0.00036994983454948605, 'samples': 10065792, 'steps': 52425, 'loss/train': 1.5282293558120728} -11/07/2021 04:36:34 - INFO - __main__ - Step 52427: {'lr': 0.0003699451785003895, 'samples': 10065984, 'steps': 52426, 'loss/train': 1.2385307550430298} -11/07/2021 04:36:34 - INFO - __main__ - Step 52428: {'lr': 0.0003699405223972475, 'samples': 10066176, 'steps': 52427, 'loss/train': 0.7437629103660583} -11/07/2021 04:36:34 - INFO - __main__ - Step 52429: {'lr': 0.0003699358662400622, 'samples': 10066368, 'steps': 52428, 'loss/train': 1.2149325609207153} -11/07/2021 04:36:35 - INFO - __main__ - Step 52430: {'lr': 0.00036993121002883557, 'samples': 10066560, 'steps': 52429, 'loss/train': 1.6896101236343384} -11/07/2021 04:36:36 - INFO - __main__ - Step 52431: {'lr': 0.0003699265537635698, 'samples': 10066752, 'steps': 52430, 'loss/train': 2.1384401321411133} -11/07/2021 04:36:36 - INFO - __main__ - Step 52432: {'lr': 0.000369921897444267, 'samples': 10066944, 'steps': 52431, 'loss/train': 1.595112681388855} -11/07/2021 04:36:37 - INFO - __main__ - Step 52433: {'lr': 0.00036991724107092927, 'samples': 10067136, 'steps': 52432, 'loss/train': 1.4829649925231934} -11/07/2021 04:36:37 - INFO - __main__ - Step 52434: {'lr': 0.00036991258464355863, 'samples': 10067328, 'steps': 52433, 'loss/train': 2.3356728553771973} -11/07/2021 04:36:37 - INFO - __main__ - Step 52435: {'lr': 0.00036990792816215726, 'samples': 10067520, 'steps': 52434, 'loss/train': 1.679817795753479} -11/07/2021 04:36:38 - INFO - __main__ - Step 52436: {'lr': 0.0003699032716267273, 'samples': 10067712, 'steps': 52435, 'loss/train': 1.3072232007980347} -11/07/2021 04:36:39 - INFO - __main__ - Step 52437: {'lr': 0.00036989861503727064, 'samples': 10067904, 'steps': 52436, 'loss/train': 1.4434219598770142} -11/07/2021 04:36:39 - INFO - __main__ - Step 52438: {'lr': 0.0003698939583937896, 'samples': 10068096, 'steps': 52437, 'loss/train': 1.5289331674575806} -11/07/2021 04:36:39 - INFO - __main__ - Step 52439: {'lr': 0.0003698893016962861, 'samples': 10068288, 'steps': 52438, 'loss/train': 1.2497870922088623} -11/07/2021 04:36:40 - INFO - __main__ - Step 52440: {'lr': 0.00036988464494476243, 'samples': 10068480, 'steps': 52439, 'loss/train': 1.7348291873931885} -11/07/2021 04:36:41 - INFO - __main__ - Step 52441: {'lr': 0.0003698799881392205, 'samples': 10068672, 'steps': 52440, 'loss/train': 1.2171458005905151} -11/07/2021 04:36:41 - INFO - __main__ - Step 52442: {'lr': 0.00036987533127966253, 'samples': 10068864, 'steps': 52441, 'loss/train': 1.4699468612670898} -11/07/2021 04:36:41 - INFO - __main__ - Step 52443: {'lr': 0.0003698706743660907, 'samples': 10069056, 'steps': 52442, 'loss/train': 1.6238996982574463} -11/07/2021 04:36:42 - INFO - __main__ - Step 52444: {'lr': 0.0003698660173985069, 'samples': 10069248, 'steps': 52443, 'loss/train': 1.011279821395874} -11/07/2021 04:36:42 - INFO - __main__ - Step 52445: {'lr': 0.0003698613603769133, 'samples': 10069440, 'steps': 52444, 'loss/train': 1.3448474407196045} -11/07/2021 04:36:43 - INFO - __main__ - Step 52446: {'lr': 0.00036985670330131205, 'samples': 10069632, 'steps': 52445, 'loss/train': 1.0529274940490723} -11/07/2021 04:36:43 - INFO - __main__ - Step 52447: {'lr': 0.0003698520461717052, 'samples': 10069824, 'steps': 52446, 'loss/train': 1.2374534606933594} -11/07/2021 04:36:44 - INFO - __main__ - Step 52448: {'lr': 0.0003698473889880949, 'samples': 10070016, 'steps': 52447, 'loss/train': 1.584261178970337} -11/07/2021 04:36:44 - INFO - __main__ - Step 52449: {'lr': 0.0003698427317504832, 'samples': 10070208, 'steps': 52448, 'loss/train': 1.6233322620391846} -11/07/2021 04:36:44 - INFO - __main__ - Step 52450: {'lr': 0.00036983807445887217, 'samples': 10070400, 'steps': 52449, 'loss/train': 0.7425636053085327} -11/07/2021 04:36:45 - INFO - __main__ - Step 52451: {'lr': 0.00036983341711326403, 'samples': 10070592, 'steps': 52450, 'loss/train': 1.4514048099517822} -11/07/2021 04:36:46 - INFO - __main__ - Step 52452: {'lr': 0.00036982875971366074, 'samples': 10070784, 'steps': 52451, 'loss/train': 1.2515755891799927} -11/07/2021 04:36:46 - INFO - __main__ - Step 52453: {'lr': 0.00036982410226006445, 'samples': 10070976, 'steps': 52452, 'loss/train': 1.7804089784622192} -11/07/2021 04:36:47 - INFO - __main__ - Step 52454: {'lr': 0.0003698194447524773, 'samples': 10071168, 'steps': 52453, 'loss/train': 1.7630228996276855} -11/07/2021 04:36:47 - INFO - __main__ - Step 52455: {'lr': 0.0003698147871909014, 'samples': 10071360, 'steps': 52454, 'loss/train': 1.496080756187439} -11/07/2021 04:36:48 - INFO - __main__ - Step 52456: {'lr': 0.0003698101295753388, 'samples': 10071552, 'steps': 52455, 'loss/train': 0.8906934261322021} -11/07/2021 04:36:48 - INFO - __main__ - Step 52457: {'lr': 0.00036980547190579153, 'samples': 10071744, 'steps': 52456, 'loss/train': 1.3202104568481445} -11/07/2021 04:36:49 - INFO - __main__ - Step 52458: {'lr': 0.0003698008141822618, 'samples': 10071936, 'steps': 52457, 'loss/train': 1.3986629247665405} -11/07/2021 04:36:49 - INFO - __main__ - Step 52459: {'lr': 0.00036979615640475165, 'samples': 10072128, 'steps': 52458, 'loss/train': 1.3181469440460205} -11/07/2021 04:36:49 - INFO - __main__ - Step 52460: {'lr': 0.0003697914985732632, 'samples': 10072320, 'steps': 52459, 'loss/train': 1.538682460784912} -11/07/2021 04:36:50 - INFO - __main__ - Step 52461: {'lr': 0.0003697868406877986, 'samples': 10072512, 'steps': 52460, 'loss/train': 1.3042988777160645} -11/07/2021 04:36:51 - INFO - __main__ - Step 52462: {'lr': 0.00036978218274835993, 'samples': 10072704, 'steps': 52461, 'loss/train': 1.4915683269500732} -11/07/2021 04:36:51 - INFO - __main__ - Step 52463: {'lr': 0.0003697775247549492, 'samples': 10072896, 'steps': 52462, 'loss/train': 1.5328110456466675} -11/07/2021 04:36:51 - INFO - __main__ - Step 52464: {'lr': 0.00036977286670756854, 'samples': 10073088, 'steps': 52463, 'loss/train': 1.7254937887191772} -11/07/2021 04:36:52 - INFO - __main__ - Step 52465: {'lr': 0.00036976820860622005, 'samples': 10073280, 'steps': 52464, 'loss/train': 1.226966142654419} -11/07/2021 04:36:52 - INFO - __main__ - Step 52466: {'lr': 0.00036976355045090594, 'samples': 10073472, 'steps': 52465, 'loss/train': 2.6069347858428955} -11/07/2021 04:36:53 - INFO - __main__ - Step 52467: {'lr': 0.00036975889224162816, 'samples': 10073664, 'steps': 52466, 'loss/train': 1.3844895362854004} -11/07/2021 04:36:53 - INFO - __main__ - Step 52468: {'lr': 0.000369754233978389, 'samples': 10073856, 'steps': 52467, 'loss/train': 1.1404250860214233} -11/07/2021 04:36:54 - INFO - __main__ - Step 52469: {'lr': 0.00036974957566119027, 'samples': 10074048, 'steps': 52468, 'loss/train': 1.866579532623291} -11/07/2021 04:36:54 - INFO - __main__ - Step 52470: {'lr': 0.00036974491729003427, 'samples': 10074240, 'steps': 52469, 'loss/train': 1.5345561504364014} -11/07/2021 04:36:54 - INFO - __main__ - Step 52471: {'lr': 0.00036974025886492306, 'samples': 10074432, 'steps': 52470, 'loss/train': 1.763494849205017} -11/07/2021 04:36:56 - INFO - __main__ - Step 52472: {'lr': 0.00036973560038585876, 'samples': 10074624, 'steps': 52471, 'loss/train': 1.8525594472885132} -11/07/2021 04:36:56 - INFO - __main__ - Step 52473: {'lr': 0.0003697309418528435, 'samples': 10074816, 'steps': 52472, 'loss/train': 1.4374958276748657} -11/07/2021 04:36:56 - INFO - __main__ - Step 52474: {'lr': 0.0003697262832658792, 'samples': 10075008, 'steps': 52473, 'loss/train': 1.283557415008545} -11/07/2021 04:36:57 - INFO - __main__ - Step 52475: {'lr': 0.00036972162462496817, 'samples': 10075200, 'steps': 52474, 'loss/train': 1.6452559232711792} -11/07/2021 04:36:57 - INFO - __main__ - Step 52476: {'lr': 0.0003697169659301124, 'samples': 10075392, 'steps': 52475, 'loss/train': 1.243672490119934} -11/07/2021 04:36:58 - INFO - __main__ - Step 52477: {'lr': 0.000369712307181314, 'samples': 10075584, 'steps': 52476, 'loss/train': 1.765824317932129} -11/07/2021 04:36:58 - INFO - __main__ - Step 52478: {'lr': 0.00036970764837857505, 'samples': 10075776, 'steps': 52477, 'loss/train': 0.7308313250541687} -11/07/2021 04:36:59 - INFO - __main__ - Step 52479: {'lr': 0.0003697029895218978, 'samples': 10075968, 'steps': 52478, 'loss/train': 1.3887279033660889} -11/07/2021 04:36:59 - INFO - __main__ - Step 52480: {'lr': 0.0003696983306112842, 'samples': 10076160, 'steps': 52479, 'loss/train': 1.4204062223434448} -11/07/2021 04:36:59 - INFO - __main__ - Step 52481: {'lr': 0.00036969367164673626, 'samples': 10076352, 'steps': 52480, 'loss/train': 1.1525694131851196} -11/07/2021 04:37:00 - INFO - __main__ - Step 52482: {'lr': 0.0003696890126282563, 'samples': 10076544, 'steps': 52481, 'loss/train': 1.8334134817123413} -11/07/2021 04:37:01 - INFO - __main__ - Step 52483: {'lr': 0.0003696843535558463, 'samples': 10076736, 'steps': 52482, 'loss/train': 1.369024634361267} -11/07/2021 04:37:01 - INFO - __main__ - Step 52484: {'lr': 0.0003696796944295084, 'samples': 10076928, 'steps': 52483, 'loss/train': 1.4560978412628174} -11/07/2021 04:37:01 - INFO - __main__ - Step 52485: {'lr': 0.00036967503524924463, 'samples': 10077120, 'steps': 52484, 'loss/train': 1.6482877731323242} -11/07/2021 04:37:02 - INFO - __main__ - Step 52486: {'lr': 0.00036967037601505715, 'samples': 10077312, 'steps': 52485, 'loss/train': 1.0509904623031616} -11/07/2021 04:37:03 - INFO - __main__ - Step 52487: {'lr': 0.000369665716726948, 'samples': 10077504, 'steps': 52486, 'loss/train': 1.792357325553894} -11/07/2021 04:37:03 - INFO - __main__ - Step 52488: {'lr': 0.0003696610573849194, 'samples': 10077696, 'steps': 52487, 'loss/train': 1.3979697227478027} -11/07/2021 04:37:04 - INFO - __main__ - Step 52489: {'lr': 0.0003696563979889733, 'samples': 10077888, 'steps': 52488, 'loss/train': 1.4037448167800903} -11/07/2021 04:37:04 - INFO - __main__ - Step 52490: {'lr': 0.00036965173853911195, 'samples': 10078080, 'steps': 52489, 'loss/train': 1.6520057916641235} -11/07/2021 04:37:04 - INFO - __main__ - Step 52491: {'lr': 0.0003696470790353373, 'samples': 10078272, 'steps': 52490, 'loss/train': 1.4462602138519287} -11/07/2021 04:37:05 - INFO - __main__ - Step 52492: {'lr': 0.0003696424194776516, 'samples': 10078464, 'steps': 52491, 'loss/train': 1.744876742362976} -11/07/2021 04:37:06 - INFO - __main__ - Step 52493: {'lr': 0.0003696377598660569, 'samples': 10078656, 'steps': 52492, 'loss/train': 1.4057873487472534} -11/07/2021 04:37:06 - INFO - __main__ - Step 52494: {'lr': 0.0003696331002005551, 'samples': 10078848, 'steps': 52493, 'loss/train': 1.3740580081939697} -11/07/2021 04:37:06 - INFO - __main__ - Step 52495: {'lr': 0.00036962844048114856, 'samples': 10079040, 'steps': 52494, 'loss/train': 0.8017370700836182} -11/07/2021 04:37:07 - INFO - __main__ - Step 52496: {'lr': 0.0003696237807078393, 'samples': 10079232, 'steps': 52495, 'loss/train': 1.0897456407546997} -11/07/2021 04:37:08 - INFO - __main__ - Step 52497: {'lr': 0.00036961912088062947, 'samples': 10079424, 'steps': 52496, 'loss/train': 1.2632558345794678} -11/07/2021 04:37:08 - INFO - __main__ - Step 52498: {'lr': 0.00036961446099952104, 'samples': 10079616, 'steps': 52497, 'loss/train': 1.6042799949645996} -11/07/2021 04:37:09 - INFO - __main__ - Step 52499: {'lr': 0.0003696098010645162, 'samples': 10079808, 'steps': 52498, 'loss/train': 1.7075955867767334} -11/07/2021 04:37:09 - INFO - __main__ - Step 52500: {'lr': 0.00036960514107561707, 'samples': 10080000, 'steps': 52499, 'loss/train': 1.529590368270874} -11/07/2021 04:37:09 - INFO - __main__ - Step 52501: {'lr': 0.00036960048103282564, 'samples': 10080192, 'steps': 52500, 'loss/train': 1.487412452697754} -11/07/2021 04:37:10 - INFO - __main__ - Step 52502: {'lr': 0.00036959582093614406, 'samples': 10080384, 'steps': 52501, 'loss/train': 0.9780846834182739} -11/07/2021 04:37:11 - INFO - __main__ - Step 52503: {'lr': 0.00036959116078557453, 'samples': 10080576, 'steps': 52502, 'loss/train': 1.3496427536010742} -11/07/2021 04:37:11 - INFO - __main__ - Step 52504: {'lr': 0.000369586500581119, 'samples': 10080768, 'steps': 52503, 'loss/train': 1.612030029296875} -11/07/2021 04:37:11 - INFO - __main__ - Step 52505: {'lr': 0.00036958184032277974, 'samples': 10080960, 'steps': 52504, 'loss/train': 1.4903218746185303} -11/07/2021 04:37:12 - INFO - __main__ - Step 52506: {'lr': 0.0003695771800105586, 'samples': 10081152, 'steps': 52505, 'loss/train': 1.9057798385620117} -11/07/2021 04:37:12 - INFO - __main__ - Step 52507: {'lr': 0.0003695725196444579, 'samples': 10081344, 'steps': 52506, 'loss/train': 1.758776307106018} -11/07/2021 04:37:13 - INFO - __main__ - Step 52508: {'lr': 0.0003695678592244797, 'samples': 10081536, 'steps': 52507, 'loss/train': 1.4301761388778687} -11/07/2021 04:37:13 - INFO - __main__ - Step 52509: {'lr': 0.00036956319875062604, 'samples': 10081728, 'steps': 52508, 'loss/train': 1.5318809747695923} -11/07/2021 04:37:14 - INFO - __main__ - Step 52510: {'lr': 0.0003695585382228991, 'samples': 10081920, 'steps': 52509, 'loss/train': 1.4332736730575562} -11/07/2021 04:37:14 - INFO - __main__ - Step 52511: {'lr': 0.0003695538776413009, 'samples': 10082112, 'steps': 52510, 'loss/train': 1.3565497398376465} -11/07/2021 04:37:14 - INFO - __main__ - Step 52512: {'lr': 0.0003695492170058335, 'samples': 10082304, 'steps': 52511, 'loss/train': 1.397042989730835} -11/07/2021 04:37:16 - INFO - __main__ - Step 52513: {'lr': 0.0003695445563164991, 'samples': 10082496, 'steps': 52512, 'loss/train': 1.3915115594863892} -11/07/2021 04:37:16 - INFO - __main__ - Step 52514: {'lr': 0.00036953989557329976, 'samples': 10082688, 'steps': 52513, 'loss/train': 1.6850425004959106} -11/07/2021 04:37:16 - INFO - __main__ - Step 52515: {'lr': 0.0003695352347762376, 'samples': 10082880, 'steps': 52514, 'loss/train': 1.2292646169662476} -11/07/2021 04:37:17 - INFO - __main__ - Step 52516: {'lr': 0.00036953057392531474, 'samples': 10083072, 'steps': 52515, 'loss/train': 1.9233672618865967} -11/07/2021 04:37:17 - INFO - __main__ - Step 52517: {'lr': 0.00036952591302053325, 'samples': 10083264, 'steps': 52516, 'loss/train': 1.7152197360992432} -11/07/2021 04:37:18 - INFO - __main__ - Step 52518: {'lr': 0.00036952125206189516, 'samples': 10083456, 'steps': 52517, 'loss/train': 1.3954459428787231} -11/07/2021 04:37:18 - INFO - __main__ - Step 52519: {'lr': 0.00036951659104940274, 'samples': 10083648, 'steps': 52518, 'loss/train': 1.5164927244186401} -11/07/2021 04:37:19 - INFO - __main__ - Step 52520: {'lr': 0.0003695119299830579, 'samples': 10083840, 'steps': 52519, 'loss/train': 0.9250338077545166} -11/07/2021 04:37:19 - INFO - __main__ - Step 52521: {'lr': 0.0003695072688628628, 'samples': 10084032, 'steps': 52520, 'loss/train': 1.6769369840621948} -11/07/2021 04:37:19 - INFO - __main__ - Step 52522: {'lr': 0.00036950260768881963, 'samples': 10084224, 'steps': 52521, 'loss/train': 1.140705943107605} -11/07/2021 04:37:20 - INFO - __main__ - Step 52523: {'lr': 0.00036949794646093045, 'samples': 10084416, 'steps': 52522, 'loss/train': 1.746580958366394} -11/07/2021 04:37:21 - INFO - __main__ - Step 52524: {'lr': 0.00036949328517919735, 'samples': 10084608, 'steps': 52523, 'loss/train': 1.4720600843429565} -11/07/2021 04:37:21 - INFO - __main__ - Step 52525: {'lr': 0.0003694886238436224, 'samples': 10084800, 'steps': 52524, 'loss/train': 1.255598545074463} -11/07/2021 04:37:22 - INFO - __main__ - Step 52526: {'lr': 0.0003694839624542077, 'samples': 10084992, 'steps': 52525, 'loss/train': 1.5190978050231934} -11/07/2021 04:37:22 - INFO - __main__ - Step 52527: {'lr': 0.0003694793010109553, 'samples': 10085184, 'steps': 52526, 'loss/train': 1.9542680978775024} -11/07/2021 04:37:23 - INFO - __main__ - Step 52528: {'lr': 0.00036947463951386743, 'samples': 10085376, 'steps': 52527, 'loss/train': 1.2795751094818115} -11/07/2021 04:37:23 - INFO - __main__ - Step 52529: {'lr': 0.0003694699779629461, 'samples': 10085568, 'steps': 52528, 'loss/train': 0.9457770586013794} -11/07/2021 04:37:24 - INFO - __main__ - Step 52530: {'lr': 0.0003694653163581936, 'samples': 10085760, 'steps': 52529, 'loss/train': 1.4678503274917603} -11/07/2021 04:37:24 - INFO - __main__ - Step 52531: {'lr': 0.0003694606546996117, 'samples': 10085952, 'steps': 52530, 'loss/train': 1.4220609664916992} -11/07/2021 04:37:24 - INFO - __main__ - Step 52532: {'lr': 0.0003694559929872028, 'samples': 10086144, 'steps': 52531, 'loss/train': 0.9893736243247986} -11/07/2021 04:37:26 - INFO - __main__ - Step 52533: {'lr': 0.00036945133122096875, 'samples': 10086336, 'steps': 52532, 'loss/train': 0.9789683222770691} -11/07/2021 04:37:26 - INFO - __main__ - Step 52534: {'lr': 0.0003694466694009118, 'samples': 10086528, 'steps': 52533, 'loss/train': 1.138243317604065} -11/07/2021 04:37:26 - INFO - __main__ - Step 52535: {'lr': 0.00036944200752703405, 'samples': 10086720, 'steps': 52534, 'loss/train': 1.3803220987319946} -11/07/2021 04:37:27 - INFO - __main__ - Step 52536: {'lr': 0.0003694373455993376, 'samples': 10086912, 'steps': 52535, 'loss/train': 1.5448083877563477} -11/07/2021 04:37:27 - INFO - __main__ - Step 52537: {'lr': 0.0003694326836178245, 'samples': 10087104, 'steps': 52536, 'loss/train': 1.1240888833999634} -11/07/2021 04:37:28 - INFO - __main__ - Step 52538: {'lr': 0.0003694280215824969, 'samples': 10087296, 'steps': 52537, 'loss/train': 2.725187301635742} -11/07/2021 04:37:29 - INFO - __main__ - Step 52539: {'lr': 0.0003694233594933568, 'samples': 10087488, 'steps': 52538, 'loss/train': 1.2964894771575928} -11/07/2021 04:37:29 - INFO - __main__ - Step 52540: {'lr': 0.00036941869735040647, 'samples': 10087680, 'steps': 52539, 'loss/train': 0.9070099592208862} -11/07/2021 04:37:29 - INFO - __main__ - Step 52541: {'lr': 0.0003694140351536479, 'samples': 10087872, 'steps': 52540, 'loss/train': 1.3074787855148315} -11/07/2021 04:37:30 - INFO - __main__ - Step 52542: {'lr': 0.00036940937290308315, 'samples': 10088064, 'steps': 52541, 'loss/train': 1.516692042350769} -11/07/2021 04:37:30 - INFO - __main__ - Step 52543: {'lr': 0.0003694047105987144, 'samples': 10088256, 'steps': 52542, 'loss/train': 0.9241036772727966} -11/07/2021 04:37:31 - INFO - __main__ - Step 52544: {'lr': 0.00036940004824054376, 'samples': 10088448, 'steps': 52543, 'loss/train': 1.690172791481018} -11/07/2021 04:37:31 - INFO - __main__ - Step 52545: {'lr': 0.0003693953858285733, 'samples': 10088640, 'steps': 52544, 'loss/train': 1.2397607564926147} -11/07/2021 04:37:32 - INFO - __main__ - Step 52546: {'lr': 0.0003693907233628051, 'samples': 10088832, 'steps': 52545, 'loss/train': 0.42579424381256104} -11/07/2021 04:37:32 - INFO - __main__ - Step 52547: {'lr': 0.00036938606084324123, 'samples': 10089024, 'steps': 52546, 'loss/train': 1.5375990867614746} -11/07/2021 04:37:32 - INFO - __main__ - Step 52548: {'lr': 0.00036938139826988393, 'samples': 10089216, 'steps': 52547, 'loss/train': 1.901663064956665} -11/07/2021 04:37:34 - INFO - __main__ - Step 52549: {'lr': 0.0003693767356427352, 'samples': 10089408, 'steps': 52548, 'loss/train': 1.3865082263946533} -11/07/2021 04:37:34 - INFO - __main__ - Step 52550: {'lr': 0.00036937207296179717, 'samples': 10089600, 'steps': 52549, 'loss/train': 1.1753380298614502} -11/07/2021 04:37:34 - INFO - __main__ - Step 52551: {'lr': 0.0003693674102270719, 'samples': 10089792, 'steps': 52550, 'loss/train': 1.980668306350708} -11/07/2021 04:37:35 - INFO - __main__ - Step 52552: {'lr': 0.0003693627474385615, 'samples': 10089984, 'steps': 52551, 'loss/train': 1.3791366815567017} -11/07/2021 04:37:35 - INFO - __main__ - Step 52553: {'lr': 0.00036935808459626806, 'samples': 10090176, 'steps': 52552, 'loss/train': 1.610526442527771} -11/07/2021 04:37:36 - INFO - __main__ - Step 52554: {'lr': 0.00036935342170019375, 'samples': 10090368, 'steps': 52553, 'loss/train': 1.6922630071640015} -11/07/2021 04:37:37 - INFO - __main__ - Step 52555: {'lr': 0.00036934875875034063, 'samples': 10090560, 'steps': 52554, 'loss/train': 1.4130017757415771} -11/07/2021 04:37:37 - INFO - __main__ - Step 52556: {'lr': 0.0003693440957467108, 'samples': 10090752, 'steps': 52555, 'loss/train': 1.6270310878753662} -11/07/2021 04:37:38 - INFO - __main__ - Step 52557: {'lr': 0.00036933943268930636, 'samples': 10090944, 'steps': 52556, 'loss/train': 1.6018462181091309} -11/07/2021 04:37:38 - INFO - __main__ - Step 52558: {'lr': 0.00036933476957812944, 'samples': 10091136, 'steps': 52557, 'loss/train': 1.3814212083816528} -11/07/2021 04:37:39 - INFO - __main__ - Step 52559: {'lr': 0.0003693301064131821, 'samples': 10091328, 'steps': 52558, 'loss/train': 0.15778601169586182} -11/07/2021 04:37:39 - INFO - __main__ - Step 52560: {'lr': 0.0003693254431944664, 'samples': 10091520, 'steps': 52559, 'loss/train': 1.6924690008163452} -11/07/2021 04:37:40 - INFO - __main__ - Step 52561: {'lr': 0.00036932077992198455, 'samples': 10091712, 'steps': 52560, 'loss/train': 1.5354642868041992} -11/07/2021 04:37:40 - INFO - __main__ - Step 52562: {'lr': 0.0003693161165957386, 'samples': 10091904, 'steps': 52561, 'loss/train': 0.11148352921009064} -11/07/2021 04:37:40 - INFO - __main__ - Step 52563: {'lr': 0.0003693114532157306, 'samples': 10092096, 'steps': 52562, 'loss/train': 0.8067753911018372} -11/07/2021 04:37:41 - INFO - __main__ - Step 52564: {'lr': 0.00036930678978196283, 'samples': 10092288, 'steps': 52563, 'loss/train': 1.5785139799118042} -11/07/2021 04:37:42 - INFO - __main__ - Step 52565: {'lr': 0.00036930212629443716, 'samples': 10092480, 'steps': 52564, 'loss/train': 1.1247729063034058} -11/07/2021 04:37:42 - INFO - __main__ - Step 52566: {'lr': 0.00036929746275315577, 'samples': 10092672, 'steps': 52565, 'loss/train': 1.0086208581924438} -11/07/2021 04:37:43 - INFO - __main__ - Step 52567: {'lr': 0.0003692927991581208, 'samples': 10092864, 'steps': 52566, 'loss/train': 0.7568204998970032} -11/07/2021 04:37:43 - INFO - __main__ - Step 52568: {'lr': 0.0003692881355093344, 'samples': 10093056, 'steps': 52567, 'loss/train': 1.6512137651443481} -11/07/2021 04:37:43 - INFO - __main__ - Step 52569: {'lr': 0.00036928347180679847, 'samples': 10093248, 'steps': 52568, 'loss/train': 0.9752391576766968} -11/07/2021 04:37:44 - INFO - __main__ - Step 52570: {'lr': 0.0003692788080505154, 'samples': 10093440, 'steps': 52569, 'loss/train': 1.4460619688034058} -11/07/2021 04:37:45 - INFO - __main__ - Step 52571: {'lr': 0.0003692741442404871, 'samples': 10093632, 'steps': 52570, 'loss/train': 1.1609233617782593} -11/07/2021 04:37:45 - INFO - __main__ - Step 52572: {'lr': 0.0003692694803767157, 'samples': 10093824, 'steps': 52571, 'loss/train': 1.4413496255874634} -11/07/2021 04:37:45 - INFO - __main__ - Step 52573: {'lr': 0.0003692648164592033, 'samples': 10094016, 'steps': 52572, 'loss/train': 1.7335922718048096} -11/07/2021 04:37:46 - INFO - __main__ - Step 52574: {'lr': 0.00036926015248795195, 'samples': 10094208, 'steps': 52573, 'loss/train': 1.4201934337615967} -11/07/2021 04:37:47 - INFO - __main__ - Step 52575: {'lr': 0.0003692554884629639, 'samples': 10094400, 'steps': 52574, 'loss/train': 1.4277849197387695} -11/07/2021 04:37:47 - INFO - __main__ - Step 52576: {'lr': 0.00036925082438424116, 'samples': 10094592, 'steps': 52575, 'loss/train': 0.9422187209129333} -11/07/2021 04:37:47 - INFO - __main__ - Step 52577: {'lr': 0.00036924616025178585, 'samples': 10094784, 'steps': 52576, 'loss/train': 1.1624577045440674} -11/07/2021 04:37:48 - INFO - __main__ - Step 52578: {'lr': 0.0003692414960656, 'samples': 10094976, 'steps': 52577, 'loss/train': 1.2759878635406494} -11/07/2021 04:37:48 - INFO - __main__ - Step 52579: {'lr': 0.00036923683182568586, 'samples': 10095168, 'steps': 52578, 'loss/train': 1.250462532043457} -11/07/2021 04:37:48 - INFO - __main__ - Step 52580: {'lr': 0.00036923216753204536, 'samples': 10095360, 'steps': 52579, 'loss/train': 1.490509033203125} -11/07/2021 04:37:49 - INFO - __main__ - Step 52581: {'lr': 0.00036922750318468074, 'samples': 10095552, 'steps': 52580, 'loss/train': 1.3488402366638184} -11/07/2021 04:37:50 - INFO - __main__ - Step 52582: {'lr': 0.00036922283878359396, 'samples': 10095744, 'steps': 52581, 'loss/train': 1.675639033317566} -11/07/2021 04:37:50 - INFO - __main__ - Step 52583: {'lr': 0.0003692181743287873, 'samples': 10095936, 'steps': 52582, 'loss/train': 1.3151415586471558} -11/07/2021 04:37:50 - INFO - __main__ - Step 52584: {'lr': 0.0003692135098202628, 'samples': 10096128, 'steps': 52583, 'loss/train': 1.478013515472412} -11/07/2021 04:37:51 - INFO - __main__ - Step 52585: {'lr': 0.0003692088452580225, 'samples': 10096320, 'steps': 52584, 'loss/train': 1.319058895111084} -11/07/2021 04:37:52 - INFO - __main__ - Step 52586: {'lr': 0.00036920418064206845, 'samples': 10096512, 'steps': 52585, 'loss/train': 1.2535852193832397} -11/07/2021 04:37:52 - INFO - __main__ - Step 52587: {'lr': 0.0003691995159724029, 'samples': 10096704, 'steps': 52586, 'loss/train': 1.552321195602417} -11/07/2021 04:37:52 - INFO - __main__ - Step 52588: {'lr': 0.00036919485124902785, 'samples': 10096896, 'steps': 52587, 'loss/train': 1.5046734809875488} -11/07/2021 04:37:53 - INFO - __main__ - Step 52589: {'lr': 0.00036919018647194545, 'samples': 10097088, 'steps': 52588, 'loss/train': 1.6909958124160767} -11/07/2021 04:37:53 - INFO - __main__ - Step 52590: {'lr': 0.0003691855216411578, 'samples': 10097280, 'steps': 52589, 'loss/train': 1.3594661951065063} -11/07/2021 04:37:54 - INFO - __main__ - Step 52591: {'lr': 0.00036918085675666706, 'samples': 10097472, 'steps': 52590, 'loss/train': 1.430137276649475} -11/07/2021 04:37:55 - INFO - __main__ - Step 52592: {'lr': 0.00036917619181847525, 'samples': 10097664, 'steps': 52591, 'loss/train': 1.3334394693374634} -11/07/2021 04:37:55 - INFO - __main__ - Step 52593: {'lr': 0.00036917152682658437, 'samples': 10097856, 'steps': 52592, 'loss/train': 1.7569663524627686} -11/07/2021 04:37:55 - INFO - __main__ - Step 52594: {'lr': 0.0003691668617809968, 'samples': 10098048, 'steps': 52593, 'loss/train': 1.6426643133163452} -11/07/2021 04:37:56 - INFO - __main__ - Step 52595: {'lr': 0.00036916219668171435, 'samples': 10098240, 'steps': 52594, 'loss/train': 1.2272065877914429} -11/07/2021 04:37:57 - INFO - __main__ - Step 52596: {'lr': 0.0003691575315287393, 'samples': 10098432, 'steps': 52595, 'loss/train': 0.9954767823219299} -11/07/2021 04:37:57 - INFO - __main__ - Step 52597: {'lr': 0.00036915286632207374, 'samples': 10098624, 'steps': 52596, 'loss/train': 1.4305698871612549} -11/07/2021 04:37:57 - INFO - __main__ - Step 52598: {'lr': 0.0003691482010617197, 'samples': 10098816, 'steps': 52597, 'loss/train': 1.2820786237716675} -11/07/2021 04:37:58 - INFO - __main__ - Step 52599: {'lr': 0.00036914353574767935, 'samples': 10099008, 'steps': 52598, 'loss/train': 0.8896142244338989} -11/07/2021 04:37:58 - INFO - __main__ - Step 52600: {'lr': 0.0003691388703799547, 'samples': 10099200, 'steps': 52599, 'loss/train': 1.439296841621399} -11/07/2021 04:37:59 - INFO - __main__ - Step 52601: {'lr': 0.00036913420495854793, 'samples': 10099392, 'steps': 52600, 'loss/train': 1.7042537927627563} -11/07/2021 04:37:59 - INFO - __main__ - Step 52602: {'lr': 0.00036912953948346115, 'samples': 10099584, 'steps': 52601, 'loss/train': 1.6592191457748413} -11/07/2021 04:38:00 - INFO - __main__ - Step 52603: {'lr': 0.00036912487395469645, 'samples': 10099776, 'steps': 52602, 'loss/train': 1.6329528093338013} -11/07/2021 04:38:00 - INFO - __main__ - Step 52604: {'lr': 0.0003691202083722559, 'samples': 10099968, 'steps': 52603, 'loss/train': 1.626839518547058} -11/07/2021 04:38:01 - INFO - __main__ - Step 52605: {'lr': 0.0003691155427361416, 'samples': 10100160, 'steps': 52604, 'loss/train': 1.8369107246398926} -11/07/2021 04:38:01 - INFO - __main__ - Step 52606: {'lr': 0.0003691108770463557, 'samples': 10100352, 'steps': 52605, 'loss/train': 1.1976712942123413} -11/07/2021 04:38:02 - INFO - __main__ - Step 52607: {'lr': 0.00036910621130290027, 'samples': 10100544, 'steps': 52606, 'loss/train': 1.3801106214523315} -11/07/2021 04:38:02 - INFO - __main__ - Step 52608: {'lr': 0.0003691015455057775, 'samples': 10100736, 'steps': 52607, 'loss/train': 0.8249280452728271} -11/07/2021 04:38:03 - INFO - __main__ - Step 52609: {'lr': 0.0003690968796549893, 'samples': 10100928, 'steps': 52608, 'loss/train': 1.2240235805511475} -11/07/2021 04:38:03 - INFO - __main__ - Step 52610: {'lr': 0.0003690922137505379, 'samples': 10101120, 'steps': 52609, 'loss/train': 0.8298952579498291} -11/07/2021 04:38:03 - INFO - __main__ - Step 52611: {'lr': 0.00036908754779242545, 'samples': 10101312, 'steps': 52610, 'loss/train': 0.6339261531829834} -11/07/2021 04:38:04 - INFO - __main__ - Step 52612: {'lr': 0.00036908288178065393, 'samples': 10101504, 'steps': 52611, 'loss/train': 1.789779782295227} -11/07/2021 04:38:05 - INFO - __main__ - Step 52613: {'lr': 0.00036907821571522553, 'samples': 10101696, 'steps': 52612, 'loss/train': 1.3123681545257568} -11/07/2021 04:38:05 - INFO - __main__ - Step 52614: {'lr': 0.0003690735495961423, 'samples': 10101888, 'steps': 52613, 'loss/train': 1.3512696027755737} -11/07/2021 04:38:05 - INFO - __main__ - Step 52615: {'lr': 0.0003690688834234064, 'samples': 10102080, 'steps': 52614, 'loss/train': 0.40644317865371704} -11/07/2021 04:38:06 - INFO - __main__ - Step 52616: {'lr': 0.0003690642171970198, 'samples': 10102272, 'steps': 52615, 'loss/train': 1.7856353521347046} -11/07/2021 04:38:07 - INFO - __main__ - Step 52617: {'lr': 0.0003690595509169848, 'samples': 10102464, 'steps': 52616, 'loss/train': 1.9296809434890747} -11/07/2021 04:38:07 - INFO - __main__ - Step 52618: {'lr': 0.00036905488458330337, 'samples': 10102656, 'steps': 52617, 'loss/train': 1.402385950088501} -11/07/2021 04:38:07 - INFO - __main__ - Step 52619: {'lr': 0.00036905021819597767, 'samples': 10102848, 'steps': 52618, 'loss/train': 1.3527421951293945} -11/07/2021 04:38:08 - INFO - __main__ - Step 52620: {'lr': 0.00036904555175500977, 'samples': 10103040, 'steps': 52619, 'loss/train': 1.1639877557754517} -11/07/2021 04:38:08 - INFO - __main__ - Step 52621: {'lr': 0.00036904088526040177, 'samples': 10103232, 'steps': 52620, 'loss/train': 1.4407010078430176} -11/07/2021 04:38:09 - INFO - __main__ - Step 52622: {'lr': 0.00036903621871215575, 'samples': 10103424, 'steps': 52621, 'loss/train': 1.1555688381195068} -11/07/2021 04:38:10 - INFO - __main__ - Step 52623: {'lr': 0.0003690315521102739, 'samples': 10103616, 'steps': 52622, 'loss/train': 1.330957293510437} -11/07/2021 04:38:10 - INFO - __main__ - Step 52624: {'lr': 0.0003690268854547583, 'samples': 10103808, 'steps': 52623, 'loss/train': 1.6458876132965088} -11/07/2021 04:38:10 - INFO - __main__ - Step 52625: {'lr': 0.00036902221874561097, 'samples': 10104000, 'steps': 52624, 'loss/train': 1.416123867034912} -11/07/2021 04:38:11 - INFO - __main__ - Step 52626: {'lr': 0.00036901755198283403, 'samples': 10104192, 'steps': 52625, 'loss/train': 1.401869773864746} -11/07/2021 04:38:12 - INFO - __main__ - Step 52627: {'lr': 0.0003690128851664297, 'samples': 10104384, 'steps': 52626, 'loss/train': 1.1351631879806519} -11/07/2021 04:38:12 - INFO - __main__ - Step 52628: {'lr': 0.0003690082182964, 'samples': 10104576, 'steps': 52627, 'loss/train': 1.4857701063156128} -11/07/2021 04:38:12 - INFO - __main__ - Step 52629: {'lr': 0.00036900355137274696, 'samples': 10104768, 'steps': 52628, 'loss/train': 0.9550331234931946} -11/07/2021 04:38:13 - INFO - __main__ - Step 52630: {'lr': 0.00036899888439547276, 'samples': 10104960, 'steps': 52629, 'loss/train': 1.4199917316436768} -11/07/2021 04:38:13 - INFO - __main__ - Step 52631: {'lr': 0.00036899421736457955, 'samples': 10105152, 'steps': 52630, 'loss/train': 1.479548454284668} -11/07/2021 04:38:14 - INFO - __main__ - Step 52632: {'lr': 0.00036898955028006936, 'samples': 10105344, 'steps': 52631, 'loss/train': 1.6742368936538696} -11/07/2021 04:38:14 - INFO - __main__ - Step 52633: {'lr': 0.0003689848831419443, 'samples': 10105536, 'steps': 52632, 'loss/train': 1.5146318674087524} -11/07/2021 04:38:15 - INFO - __main__ - Step 52634: {'lr': 0.0003689802159502065, 'samples': 10105728, 'steps': 52633, 'loss/train': 1.5963118076324463} -11/07/2021 04:38:15 - INFO - __main__ - Step 52635: {'lr': 0.00036897554870485804, 'samples': 10105920, 'steps': 52634, 'loss/train': 1.5557894706726074} -11/07/2021 04:38:15 - INFO - __main__ - Step 52636: {'lr': 0.000368970881405901, 'samples': 10106112, 'steps': 52635, 'loss/train': 1.2636913061141968} -11/07/2021 04:38:16 - INFO - __main__ - Step 52637: {'lr': 0.0003689662140533376, 'samples': 10106304, 'steps': 52636, 'loss/train': 1.3850836753845215} -11/07/2021 04:38:17 - INFO - __main__ - Step 52638: {'lr': 0.00036896154664716987, 'samples': 10106496, 'steps': 52637, 'loss/train': 1.4937160015106201} -11/07/2021 04:38:17 - INFO - __main__ - Step 52639: {'lr': 0.00036895687918739984, 'samples': 10106688, 'steps': 52638, 'loss/train': 1.4627037048339844} -11/07/2021 04:38:17 - INFO - __main__ - Step 52640: {'lr': 0.0003689522116740296, 'samples': 10106880, 'steps': 52639, 'loss/train': 1.375765323638916} -11/07/2021 04:38:18 - INFO - __main__ - Step 52641: {'lr': 0.0003689475441070615, 'samples': 10107072, 'steps': 52640, 'loss/train': 0.9709281921386719} -11/07/2021 04:38:19 - INFO - __main__ - Step 52642: {'lr': 0.0003689428764864974, 'samples': 10107264, 'steps': 52641, 'loss/train': 1.6289591789245605} -11/07/2021 04:38:19 - INFO - __main__ - Step 52643: {'lr': 0.0003689382088123394, 'samples': 10107456, 'steps': 52642, 'loss/train': 1.2757549285888672} -11/07/2021 04:38:20 - INFO - __main__ - Step 52644: {'lr': 0.0003689335410845898, 'samples': 10107648, 'steps': 52643, 'loss/train': 1.6775438785552979} -11/07/2021 04:38:20 - INFO - __main__ - Step 52645: {'lr': 0.00036892887330325054, 'samples': 10107840, 'steps': 52644, 'loss/train': 1.077232837677002} -11/07/2021 04:38:20 - INFO - __main__ - Step 52646: {'lr': 0.00036892420546832375, 'samples': 10108032, 'steps': 52645, 'loss/train': 0.8511205911636353} -11/07/2021 04:38:21 - INFO - __main__ - Step 52647: {'lr': 0.0003689195375798115, 'samples': 10108224, 'steps': 52646, 'loss/train': 1.0628376007080078} -11/07/2021 04:38:22 - INFO - __main__ - Step 52648: {'lr': 0.00036891486963771603, 'samples': 10108416, 'steps': 52647, 'loss/train': 1.3356902599334717} -11/07/2021 04:38:22 - INFO - __main__ - Step 52649: {'lr': 0.00036891020164203924, 'samples': 10108608, 'steps': 52648, 'loss/train': 1.426182508468628} -11/07/2021 04:38:22 - INFO - __main__ - Step 52650: {'lr': 0.00036890553359278345, 'samples': 10108800, 'steps': 52649, 'loss/train': 0.993011474609375} -11/07/2021 04:38:23 - INFO - __main__ - Step 52651: {'lr': 0.0003689008654899507, 'samples': 10108992, 'steps': 52650, 'loss/train': 1.282455563545227} -11/07/2021 04:38:23 - INFO - __main__ - Step 52652: {'lr': 0.00036889619733354297, 'samples': 10109184, 'steps': 52651, 'loss/train': 1.4460147619247437} -11/07/2021 04:38:24 - INFO - __main__ - Step 52653: {'lr': 0.0003688915291235625, 'samples': 10109376, 'steps': 52652, 'loss/train': 1.548343539237976} -11/07/2021 04:38:24 - INFO - __main__ - Step 52654: {'lr': 0.0003688868608600113, 'samples': 10109568, 'steps': 52653, 'loss/train': 1.2227991819381714} -11/07/2021 04:38:25 - INFO - __main__ - Step 52655: {'lr': 0.00036888219254289147, 'samples': 10109760, 'steps': 52654, 'loss/train': 1.3856556415557861} -11/07/2021 04:38:25 - INFO - __main__ - Step 52656: {'lr': 0.0003688775241722052, 'samples': 10109952, 'steps': 52655, 'loss/train': 1.3090105056762695} -11/07/2021 04:38:25 - INFO - __main__ - Step 52657: {'lr': 0.0003688728557479546, 'samples': 10110144, 'steps': 52656, 'loss/train': 1.471129298210144} -11/07/2021 04:38:27 - INFO - __main__ - Step 52658: {'lr': 0.00036886818727014173, 'samples': 10110336, 'steps': 52657, 'loss/train': 1.2394299507141113} -11/07/2021 04:38:27 - INFO - __main__ - Step 52659: {'lr': 0.0003688635187387686, 'samples': 10110528, 'steps': 52658, 'loss/train': 1.114780068397522} -11/07/2021 04:38:27 - INFO - __main__ - Step 52660: {'lr': 0.0003688588501538375, 'samples': 10110720, 'steps': 52659, 'loss/train': 1.5244759321212769} -11/07/2021 04:38:28 - INFO - __main__ - Step 52661: {'lr': 0.00036885418151535033, 'samples': 10110912, 'steps': 52660, 'loss/train': 1.6582838296890259} -11/07/2021 04:38:28 - INFO - __main__ - Step 52662: {'lr': 0.00036884951282330935, 'samples': 10111104, 'steps': 52661, 'loss/train': 1.3638769388198853} -11/07/2021 04:38:28 - INFO - __main__ - Step 52663: {'lr': 0.00036884484407771664, 'samples': 10111296, 'steps': 52662, 'loss/train': 1.2208144664764404} -11/07/2021 04:38:29 - INFO - __main__ - Step 52664: {'lr': 0.00036884017527857426, 'samples': 10111488, 'steps': 52663, 'loss/train': 1.3330110311508179} -11/07/2021 04:38:30 - INFO - __main__ - Step 52665: {'lr': 0.0003688355064258844, 'samples': 10111680, 'steps': 52664, 'loss/train': 0.10926000028848648} -11/07/2021 04:38:30 - INFO - __main__ - Step 52666: {'lr': 0.00036883083751964896, 'samples': 10111872, 'steps': 52665, 'loss/train': 1.4924814701080322} -11/07/2021 04:38:30 - INFO - __main__ - Step 52667: {'lr': 0.00036882616855987027, 'samples': 10112064, 'steps': 52666, 'loss/train': 1.1043123006820679} -11/07/2021 04:38:31 - INFO - __main__ - Step 52668: {'lr': 0.0003688214995465503, 'samples': 10112256, 'steps': 52667, 'loss/train': 1.3527469635009766} -11/07/2021 04:38:32 - INFO - __main__ - Step 52669: {'lr': 0.00036881683047969115, 'samples': 10112448, 'steps': 52668, 'loss/train': 1.0695163011550903} -11/07/2021 04:38:32 - INFO - __main__ - Step 52670: {'lr': 0.00036881216135929506, 'samples': 10112640, 'steps': 52669, 'loss/train': 1.1192641258239746} -11/07/2021 04:38:33 - INFO - __main__ - Step 52671: {'lr': 0.0003688074921853641, 'samples': 10112832, 'steps': 52670, 'loss/train': 1.308417797088623} -11/07/2021 04:38:33 - INFO - __main__ - Step 52672: {'lr': 0.0003688028229579002, 'samples': 10113024, 'steps': 52671, 'loss/train': 1.0733835697174072} -11/07/2021 04:38:33 - INFO - __main__ - Step 52673: {'lr': 0.0003687981536769056, 'samples': 10113216, 'steps': 52672, 'loss/train': 1.4950209856033325} -11/07/2021 04:38:34 - INFO - __main__ - Step 52674: {'lr': 0.00036879348434238235, 'samples': 10113408, 'steps': 52673, 'loss/train': 1.5509028434753418} -11/07/2021 04:38:35 - INFO - __main__ - Step 52675: {'lr': 0.00036878881495433264, 'samples': 10113600, 'steps': 52674, 'loss/train': 1.8097690343856812} -11/07/2021 04:38:35 - INFO - __main__ - Step 52676: {'lr': 0.0003687841455127585, 'samples': 10113792, 'steps': 52675, 'loss/train': 1.6956031322479248} -11/07/2021 04:38:35 - INFO - __main__ - Step 52677: {'lr': 0.0003687794760176621, 'samples': 10113984, 'steps': 52676, 'loss/train': 1.7950348854064941} -11/07/2021 04:38:36 - INFO - __main__ - Step 52678: {'lr': 0.0003687748064690455, 'samples': 10114176, 'steps': 52677, 'loss/train': 1.0014179944992065} -11/07/2021 04:38:37 - INFO - __main__ - Step 52679: {'lr': 0.0003687701368669108, 'samples': 10114368, 'steps': 52678, 'loss/train': 1.463243842124939} -11/07/2021 04:38:37 - INFO - __main__ - Step 52680: {'lr': 0.0003687654672112601, 'samples': 10114560, 'steps': 52679, 'loss/train': 1.2007852792739868} -11/07/2021 04:38:37 - INFO - __main__ - Step 52681: {'lr': 0.00036876079750209544, 'samples': 10114752, 'steps': 52680, 'loss/train': 1.4676156044006348} -11/07/2021 04:38:38 - INFO - __main__ - Step 52682: {'lr': 0.00036875612773941906, 'samples': 10114944, 'steps': 52681, 'loss/train': 1.2182501554489136} -11/07/2021 04:38:38 - INFO - __main__ - Step 52683: {'lr': 0.00036875145792323303, 'samples': 10115136, 'steps': 52682, 'loss/train': 1.168044090270996} -11/07/2021 04:38:39 - INFO - __main__ - Step 52684: {'lr': 0.0003687467880535394, 'samples': 10115328, 'steps': 52683, 'loss/train': 1.3582491874694824} -11/07/2021 04:38:40 - INFO - __main__ - Step 52685: {'lr': 0.00036874211813034034, 'samples': 10115520, 'steps': 52684, 'loss/train': 1.5834335088729858} -11/07/2021 04:38:40 - INFO - __main__ - Step 52686: {'lr': 0.00036873744815363785, 'samples': 10115712, 'steps': 52685, 'loss/train': 1.6150399446487427} -11/07/2021 04:38:40 - INFO - __main__ - Step 52687: {'lr': 0.0003687327781234341, 'samples': 10115904, 'steps': 52686, 'loss/train': 1.1509486436843872} -11/07/2021 04:38:41 - INFO - __main__ - Step 52688: {'lr': 0.0003687281080397312, 'samples': 10116096, 'steps': 52687, 'loss/train': 1.3488634824752808} -11/07/2021 04:38:42 - INFO - __main__ - Step 52689: {'lr': 0.0003687234379025313, 'samples': 10116288, 'steps': 52688, 'loss/train': 1.3734240531921387} -11/07/2021 04:38:42 - INFO - __main__ - Step 52690: {'lr': 0.00036871876771183635, 'samples': 10116480, 'steps': 52689, 'loss/train': 1.438968300819397} -11/07/2021 04:38:42 - INFO - __main__ - Step 52691: {'lr': 0.0003687140974676486, 'samples': 10116672, 'steps': 52690, 'loss/train': 1.4034918546676636} -11/07/2021 04:38:43 - INFO - __main__ - Step 52692: {'lr': 0.0003687094271699702, 'samples': 10116864, 'steps': 52691, 'loss/train': 0.7095943093299866} -11/07/2021 04:38:43 - INFO - __main__ - Step 52693: {'lr': 0.00036870475681880313, 'samples': 10117056, 'steps': 52692, 'loss/train': 1.2739990949630737} -11/07/2021 04:38:44 - INFO - __main__ - Step 52694: {'lr': 0.00036870008641414945, 'samples': 10117248, 'steps': 52693, 'loss/train': 1.3993279933929443} -11/07/2021 04:38:44 - INFO - __main__ - Step 52695: {'lr': 0.0003686954159560114, 'samples': 10117440, 'steps': 52694, 'loss/train': 0.857010543346405} -11/07/2021 04:38:45 - INFO - __main__ - Step 52696: {'lr': 0.00036869074544439097, 'samples': 10117632, 'steps': 52695, 'loss/train': 1.7480690479278564} -11/07/2021 04:38:45 - INFO - __main__ - Step 52697: {'lr': 0.00036868607487929034, 'samples': 10117824, 'steps': 52696, 'loss/train': 1.7123708724975586} -11/07/2021 04:38:45 - INFO - __main__ - Step 52698: {'lr': 0.00036868140426071165, 'samples': 10118016, 'steps': 52697, 'loss/train': 0.7053462266921997} -11/07/2021 04:38:46 - INFO - __main__ - Step 52699: {'lr': 0.00036867673358865696, 'samples': 10118208, 'steps': 52698, 'loss/train': 1.1842609643936157} -11/07/2021 04:38:47 - INFO - __main__ - Step 52700: {'lr': 0.0003686720628631283, 'samples': 10118400, 'steps': 52699, 'loss/train': 1.9817100763320923} -11/07/2021 04:38:47 - INFO - __main__ - Step 52701: {'lr': 0.0003686673920841278, 'samples': 10118592, 'steps': 52700, 'loss/train': 1.0959868431091309} -11/07/2021 04:38:47 - INFO - __main__ - Step 52702: {'lr': 0.0003686627212516577, 'samples': 10118784, 'steps': 52701, 'loss/train': 1.3468350172042847} -11/07/2021 04:38:48 - INFO - __main__ - Step 52703: {'lr': 0.0003686580503657199, 'samples': 10118976, 'steps': 52702, 'loss/train': 0.9252719879150391} -11/07/2021 04:38:49 - INFO - __main__ - Step 52704: {'lr': 0.00036865337942631674, 'samples': 10119168, 'steps': 52703, 'loss/train': 1.5211286544799805} -11/07/2021 04:38:49 - INFO - __main__ - Step 52705: {'lr': 0.00036864870843345015, 'samples': 10119360, 'steps': 52704, 'loss/train': 1.3844294548034668} -11/07/2021 04:38:50 - INFO - __main__ - Step 52706: {'lr': 0.00036864403738712226, 'samples': 10119552, 'steps': 52705, 'loss/train': 1.3543879985809326} -11/07/2021 04:38:50 - INFO - __main__ - Step 52707: {'lr': 0.00036863936628733524, 'samples': 10119744, 'steps': 52706, 'loss/train': 1.4449284076690674} -11/07/2021 04:38:50 - INFO - __main__ - Step 52708: {'lr': 0.0003686346951340911, 'samples': 10119936, 'steps': 52707, 'loss/train': 1.6860452890396118} -11/07/2021 04:38:51 - INFO - __main__ - Step 52709: {'lr': 0.000368630023927392, 'samples': 10120128, 'steps': 52708, 'loss/train': 1.3681421279907227} -11/07/2021 04:38:52 - INFO - __main__ - Step 52710: {'lr': 0.00036862535266724006, 'samples': 10120320, 'steps': 52709, 'loss/train': 1.2561464309692383} -11/07/2021 04:38:52 - INFO - __main__ - Step 52711: {'lr': 0.0003686206813536374, 'samples': 10120512, 'steps': 52710, 'loss/train': 1.1494148969650269} -11/07/2021 04:38:52 - INFO - __main__ - Step 52712: {'lr': 0.0003686160099865861, 'samples': 10120704, 'steps': 52711, 'loss/train': 1.4577538967132568} -11/07/2021 04:38:53 - INFO - __main__ - Step 52713: {'lr': 0.00036861133856608817, 'samples': 10120896, 'steps': 52712, 'loss/train': 0.9733343124389648} -11/07/2021 04:38:53 - INFO - __main__ - Step 52714: {'lr': 0.0003686066670921459, 'samples': 10121088, 'steps': 52713, 'loss/train': 1.50171959400177} -11/07/2021 04:38:54 - INFO - __main__ - Step 52715: {'lr': 0.00036860199556476125, 'samples': 10121280, 'steps': 52714, 'loss/train': 1.476938247680664} -11/07/2021 04:38:54 - INFO - __main__ - Step 52716: {'lr': 0.0003685973239839364, 'samples': 10121472, 'steps': 52715, 'loss/train': 1.5557302236557007} -11/07/2021 04:38:55 - INFO - __main__ - Step 52717: {'lr': 0.0003685926523496733, 'samples': 10121664, 'steps': 52716, 'loss/train': 1.514423131942749} -11/07/2021 04:38:55 - INFO - __main__ - Step 52718: {'lr': 0.0003685879806619743, 'samples': 10121856, 'steps': 52717, 'loss/train': 1.328827142715454} -11/07/2021 04:38:56 - INFO - __main__ - Step 52719: {'lr': 0.0003685833089208414, 'samples': 10122048, 'steps': 52718, 'loss/train': 1.6780064105987549} -11/07/2021 04:38:57 - INFO - __main__ - Step 52720: {'lr': 0.00036857863712627664, 'samples': 10122240, 'steps': 52719, 'loss/train': 0.09408082067966461} -11/07/2021 04:38:57 - INFO - __main__ - Step 52721: {'lr': 0.0003685739652782822, 'samples': 10122432, 'steps': 52720, 'loss/train': 1.4401472806930542} -11/07/2021 04:38:57 - INFO - __main__ - Step 52722: {'lr': 0.00036856929337686015, 'samples': 10122624, 'steps': 52721, 'loss/train': 1.3808116912841797} -11/07/2021 04:38:58 - INFO - __main__ - Step 52723: {'lr': 0.0003685646214220126, 'samples': 10122816, 'steps': 52722, 'loss/train': 0.9897241592407227} -11/07/2021 04:38:58 - INFO - __main__ - Step 52724: {'lr': 0.00036855994941374165, 'samples': 10123008, 'steps': 52723, 'loss/train': 1.315622091293335} -11/07/2021 04:38:59 - INFO - __main__ - Step 52725: {'lr': 0.0003685552773520495, 'samples': 10123200, 'steps': 52724, 'loss/train': 1.044396162033081} -11/07/2021 04:38:59 - INFO - __main__ - Step 52726: {'lr': 0.0003685506052369381, 'samples': 10123392, 'steps': 52725, 'loss/train': 1.548998236656189} -11/07/2021 04:39:00 - INFO - __main__ - Step 52727: {'lr': 0.00036854593306840955, 'samples': 10123584, 'steps': 52726, 'loss/train': 1.4104607105255127} -11/07/2021 04:39:00 - INFO - __main__ - Step 52728: {'lr': 0.0003685412608464661, 'samples': 10123776, 'steps': 52727, 'loss/train': 1.6745527982711792} -11/07/2021 04:39:00 - INFO - __main__ - Step 52729: {'lr': 0.00036853658857110986, 'samples': 10123968, 'steps': 52728, 'loss/train': 1.0913670063018799} -11/07/2021 04:39:01 - INFO - __main__ - Step 52730: {'lr': 0.0003685319162423428, 'samples': 10124160, 'steps': 52729, 'loss/train': 0.8038442730903625} -11/07/2021 04:39:02 - INFO - __main__ - Step 52731: {'lr': 0.0003685272438601671, 'samples': 10124352, 'steps': 52730, 'loss/train': 1.4698398113250732} -11/07/2021 04:39:02 - INFO - __main__ - Step 52732: {'lr': 0.0003685225714245848, 'samples': 10124544, 'steps': 52731, 'loss/train': 1.162439227104187} -11/07/2021 04:39:03 - INFO - __main__ - Step 52733: {'lr': 0.0003685178989355981, 'samples': 10124736, 'steps': 52732, 'loss/train': 1.3873324394226074} -11/07/2021 04:39:03 - INFO - __main__ - Step 52734: {'lr': 0.00036851322639320903, 'samples': 10124928, 'steps': 52733, 'loss/train': 1.532759666442871} -11/07/2021 04:39:04 - INFO - __main__ - Step 52735: {'lr': 0.00036850855379741984, 'samples': 10125120, 'steps': 52734, 'loss/train': 1.61179780960083} -11/07/2021 04:39:04 - INFO - __main__ - Step 52736: {'lr': 0.0003685038811482324, 'samples': 10125312, 'steps': 52735, 'loss/train': 1.3504177331924438} -11/07/2021 04:39:05 - INFO - __main__ - Step 52737: {'lr': 0.00036849920844564903, 'samples': 10125504, 'steps': 52736, 'loss/train': 1.3645915985107422} -11/07/2021 04:39:05 - INFO - __main__ - Step 52738: {'lr': 0.00036849453568967174, 'samples': 10125696, 'steps': 52737, 'loss/train': 1.734371304512024} -11/07/2021 04:39:05 - INFO - __main__ - Step 52739: {'lr': 0.0003684898628803026, 'samples': 10125888, 'steps': 52738, 'loss/train': 1.2029647827148438} -11/07/2021 04:39:06 - INFO - __main__ - Step 52740: {'lr': 0.00036848519001754374, 'samples': 10126080, 'steps': 52739, 'loss/train': 1.7320870161056519} -11/07/2021 04:39:07 - INFO - __main__ - Step 52741: {'lr': 0.0003684805171013973, 'samples': 10126272, 'steps': 52740, 'loss/train': 1.3814479112625122} -11/07/2021 04:39:07 - INFO - __main__ - Step 52742: {'lr': 0.00036847584413186537, 'samples': 10126464, 'steps': 52741, 'loss/train': 0.9930067658424377} -11/07/2021 04:39:07 - INFO - __main__ - Step 52743: {'lr': 0.0003684711711089501, 'samples': 10126656, 'steps': 52742, 'loss/train': 1.5547336339950562} -11/07/2021 04:39:08 - INFO - __main__ - Step 52744: {'lr': 0.00036846649803265344, 'samples': 10126848, 'steps': 52743, 'loss/train': 1.307753086090088} -11/07/2021 04:39:10 - INFO - __main__ - Step 52745: {'lr': 0.0003684618249029776, 'samples': 10127040, 'steps': 52744, 'loss/train': 1.7585844993591309} -11/07/2021 04:39:10 - INFO - __main__ - Step 52746: {'lr': 0.0003684571517199248, 'samples': 10127232, 'steps': 52745, 'loss/train': 1.3824597597122192} -11/07/2021 04:39:10 - INFO - __main__ - Step 52747: {'lr': 0.000368452478483497, 'samples': 10127424, 'steps': 52746, 'loss/train': 1.4839593172073364} -11/07/2021 04:39:11 - INFO - __main__ - Step 52748: {'lr': 0.0003684478051936964, 'samples': 10127616, 'steps': 52747, 'loss/train': 1.148180603981018} -11/07/2021 04:39:11 - INFO - __main__ - Step 52749: {'lr': 0.0003684431318505249, 'samples': 10127808, 'steps': 52748, 'loss/train': 1.2352585792541504} -11/07/2021 04:39:11 - INFO - __main__ - Step 52750: {'lr': 0.0003684384584539848, 'samples': 10128000, 'steps': 52749, 'loss/train': 1.4004900455474854} -11/07/2021 04:39:12 - INFO - __main__ - Step 52751: {'lr': 0.0003684337850040782, 'samples': 10128192, 'steps': 52750, 'loss/train': 1.7843750715255737} -11/07/2021 04:39:12 - INFO - __main__ - Step 52752: {'lr': 0.00036842911150080716, 'samples': 10128384, 'steps': 52751, 'loss/train': 1.7915418148040771} -11/07/2021 04:39:13 - INFO - __main__ - Step 52753: {'lr': 0.0003684244379441738, 'samples': 10128576, 'steps': 52752, 'loss/train': 0.08706151694059372} -11/07/2021 04:39:14 - INFO - __main__ - Step 52754: {'lr': 0.00036841976433418024, 'samples': 10128768, 'steps': 52753, 'loss/train': 1.140884280204773} -11/07/2021 04:39:14 - INFO - __main__ - Step 52755: {'lr': 0.0003684150906708285, 'samples': 10128960, 'steps': 52754, 'loss/train': 1.865882396697998} -11/07/2021 04:39:14 - INFO - __main__ - Step 52756: {'lr': 0.00036841041695412076, 'samples': 10129152, 'steps': 52755, 'loss/train': 1.543358564376831} -11/07/2021 04:39:15 - INFO - __main__ - Step 52757: {'lr': 0.00036840574318405914, 'samples': 10129344, 'steps': 52756, 'loss/train': 2.6298458576202393} -11/07/2021 04:39:16 - INFO - __main__ - Step 52758: {'lr': 0.00036840106936064567, 'samples': 10129536, 'steps': 52757, 'loss/train': 1.492418646812439} -11/07/2021 04:39:16 - INFO - __main__ - Step 52759: {'lr': 0.0003683963954838826, 'samples': 10129728, 'steps': 52758, 'loss/train': 1.6637871265411377} -11/07/2021 04:39:16 - INFO - __main__ - Step 52760: {'lr': 0.00036839172155377184, 'samples': 10129920, 'steps': 52759, 'loss/train': 0.6908199787139893} -11/07/2021 04:39:17 - INFO - __main__ - Step 52761: {'lr': 0.0003683870475703156, 'samples': 10130112, 'steps': 52760, 'loss/train': 1.5701454877853394} -11/07/2021 04:39:17 - INFO - __main__ - Step 52762: {'lr': 0.000368382373533516, 'samples': 10130304, 'steps': 52761, 'loss/train': 1.6280708312988281} -11/07/2021 04:39:18 - INFO - __main__ - Step 52763: {'lr': 0.0003683776994433752, 'samples': 10130496, 'steps': 52762, 'loss/train': 1.4984570741653442} -11/07/2021 04:39:18 - INFO - __main__ - Step 52764: {'lr': 0.0003683730252998951, 'samples': 10130688, 'steps': 52763, 'loss/train': 1.3527424335479736} -11/07/2021 04:39:19 - INFO - __main__ - Step 52765: {'lr': 0.00036836835110307803, 'samples': 10130880, 'steps': 52764, 'loss/train': 1.1018459796905518} -11/07/2021 04:39:19 - INFO - __main__ - Step 52766: {'lr': 0.00036836367685292605, 'samples': 10131072, 'steps': 52765, 'loss/train': 1.0537971258163452} -11/07/2021 04:39:19 - INFO - __main__ - Step 52767: {'lr': 0.00036835900254944114, 'samples': 10131264, 'steps': 52766, 'loss/train': 1.1499534845352173} -11/07/2021 04:39:20 - INFO - __main__ - Step 52768: {'lr': 0.0003683543281926255, 'samples': 10131456, 'steps': 52767, 'loss/train': 2.200810670852661} -11/07/2021 04:39:21 - INFO - __main__ - Step 52769: {'lr': 0.0003683496537824813, 'samples': 10131648, 'steps': 52768, 'loss/train': 3.037747621536255} -11/07/2021 04:39:21 - INFO - __main__ - Step 52770: {'lr': 0.0003683449793190105, 'samples': 10131840, 'steps': 52769, 'loss/train': 1.3351248502731323} -11/07/2021 04:39:22 - INFO - __main__ - Step 52771: {'lr': 0.0003683403048022153, 'samples': 10132032, 'steps': 52770, 'loss/train': 1.5194337368011475} -11/07/2021 04:39:22 - INFO - __main__ - Step 52772: {'lr': 0.0003683356302320978, 'samples': 10132224, 'steps': 52771, 'loss/train': 1.1175599098205566} -11/07/2021 04:39:22 - INFO - __main__ - Step 52773: {'lr': 0.00036833095560866007, 'samples': 10132416, 'steps': 52772, 'loss/train': 1.6043848991394043} -11/07/2021 04:39:23 - INFO - __main__ - Step 52774: {'lr': 0.00036832628093190424, 'samples': 10132608, 'steps': 52773, 'loss/train': 1.1120038032531738} -11/07/2021 04:39:24 - INFO - __main__ - Step 52775: {'lr': 0.0003683216062018324, 'samples': 10132800, 'steps': 52774, 'loss/train': 1.2036117315292358} -11/07/2021 04:39:24 - INFO - __main__ - Step 52776: {'lr': 0.0003683169314184467, 'samples': 10132992, 'steps': 52775, 'loss/train': 1.5896140336990356} -11/07/2021 04:39:24 - INFO - __main__ - Step 52777: {'lr': 0.00036831225658174915, 'samples': 10133184, 'steps': 52776, 'loss/train': 1.4444432258605957} -11/07/2021 04:39:25 - INFO - __main__ - Step 52778: {'lr': 0.000368307581691742, 'samples': 10133376, 'steps': 52777, 'loss/train': 1.8758273124694824} -11/07/2021 04:39:26 - INFO - __main__ - Step 52779: {'lr': 0.0003683029067484273, 'samples': 10133568, 'steps': 52778, 'loss/train': 1.510718822479248} -11/07/2021 04:39:26 - INFO - __main__ - Step 52780: {'lr': 0.0003682982317518071, 'samples': 10133760, 'steps': 52779, 'loss/train': 1.6195272207260132} -11/07/2021 04:39:27 - INFO - __main__ - Step 52781: {'lr': 0.00036829355670188355, 'samples': 10133952, 'steps': 52780, 'loss/train': 1.4773942232131958} -11/07/2021 04:39:27 - INFO - __main__ - Step 52782: {'lr': 0.0003682888815986587, 'samples': 10134144, 'steps': 52781, 'loss/train': 1.7710773944854736} -11/07/2021 04:39:27 - INFO - __main__ - Step 52783: {'lr': 0.00036828420644213474, 'samples': 10134336, 'steps': 52782, 'loss/train': 1.5674437284469604} -11/07/2021 04:39:28 - INFO - __main__ - Step 52784: {'lr': 0.00036827953123231373, 'samples': 10134528, 'steps': 52783, 'loss/train': 1.591394305229187} -11/07/2021 04:39:29 - INFO - __main__ - Step 52785: {'lr': 0.00036827485596919773, 'samples': 10134720, 'steps': 52784, 'loss/train': 1.6549326181411743} -11/07/2021 04:39:29 - INFO - __main__ - Step 52786: {'lr': 0.00036827018065278903, 'samples': 10134912, 'steps': 52785, 'loss/train': 1.7973638772964478} -11/07/2021 04:39:29 - INFO - __main__ - Step 52787: {'lr': 0.00036826550528308956, 'samples': 10135104, 'steps': 52786, 'loss/train': 1.8353632688522339} -11/07/2021 04:39:30 - INFO - __main__ - Step 52788: {'lr': 0.00036826082986010145, 'samples': 10135296, 'steps': 52787, 'loss/train': 1.3484896421432495} -11/07/2021 04:39:31 - INFO - __main__ - Step 52789: {'lr': 0.00036825615438382687, 'samples': 10135488, 'steps': 52788, 'loss/train': 1.712052345275879} -11/07/2021 04:39:31 - INFO - __main__ - Step 52790: {'lr': 0.00036825147885426786, 'samples': 10135680, 'steps': 52789, 'loss/train': 1.2510075569152832} -11/07/2021 04:39:31 - INFO - __main__ - Step 52791: {'lr': 0.00036824680327142656, 'samples': 10135872, 'steps': 52790, 'loss/train': 1.3238176107406616} -11/07/2021 04:39:32 - INFO - __main__ - Step 52792: {'lr': 0.0003682421276353051, 'samples': 10136064, 'steps': 52791, 'loss/train': 1.807876467704773} -11/07/2021 04:39:32 - INFO - __main__ - Step 52793: {'lr': 0.0003682374519459056, 'samples': 10136256, 'steps': 52792, 'loss/train': 1.330115556716919} -11/07/2021 04:39:33 - INFO - __main__ - Step 52794: {'lr': 0.00036823277620323, 'samples': 10136448, 'steps': 52793, 'loss/train': 1.3857930898666382} -11/07/2021 04:39:33 - INFO - __main__ - Step 52795: {'lr': 0.00036822810040728065, 'samples': 10136640, 'steps': 52794, 'loss/train': 1.3801594972610474} -11/07/2021 04:39:34 - INFO - __main__ - Step 52796: {'lr': 0.00036822342455805954, 'samples': 10136832, 'steps': 52795, 'loss/train': 1.4747073650360107} -11/07/2021 04:39:34 - INFO - __main__ - Step 52797: {'lr': 0.0003682187486555687, 'samples': 10137024, 'steps': 52796, 'loss/train': 1.7067310810089111} -11/07/2021 04:39:34 - INFO - __main__ - Step 52798: {'lr': 0.0003682140726998104, 'samples': 10137216, 'steps': 52797, 'loss/train': 1.6776131391525269} -11/07/2021 04:39:35 - INFO - __main__ - Step 52799: {'lr': 0.0003682093966907867, 'samples': 10137408, 'steps': 52798, 'loss/train': 1.3789921998977661} -11/07/2021 04:39:36 - INFO - __main__ - Step 52800: {'lr': 0.00036820472062849954, 'samples': 10137600, 'steps': 52799, 'loss/train': 2.107645034790039} -11/07/2021 04:39:36 - INFO - __main__ - Step 52801: {'lr': 0.0003682000445129512, 'samples': 10137792, 'steps': 52800, 'loss/train': 1.6758891344070435} -11/07/2021 04:39:36 - INFO - __main__ - Step 52802: {'lr': 0.00036819536834414374, 'samples': 10137984, 'steps': 52801, 'loss/train': 1.5608279705047607} -11/07/2021 04:39:37 - INFO - __main__ - Step 52803: {'lr': 0.00036819069212207933, 'samples': 10138176, 'steps': 52802, 'loss/train': 1.8600659370422363} -11/07/2021 04:39:38 - INFO - __main__ - Step 52804: {'lr': 0.00036818601584675994, 'samples': 10138368, 'steps': 52803, 'loss/train': 1.3875086307525635} -11/07/2021 04:39:38 - INFO - __main__ - Step 52805: {'lr': 0.0003681813395181878, 'samples': 10138560, 'steps': 52804, 'loss/train': 1.279493808746338} -11/07/2021 04:39:39 - INFO - __main__ - Step 52806: {'lr': 0.000368176663136365, 'samples': 10138752, 'steps': 52805, 'loss/train': 1.4216787815093994} -11/07/2021 04:39:39 - INFO - __main__ - Step 52807: {'lr': 0.00036817198670129357, 'samples': 10138944, 'steps': 52806, 'loss/train': 1.4187105894088745} -11/07/2021 04:39:39 - INFO - __main__ - Step 52808: {'lr': 0.00036816731021297567, 'samples': 10139136, 'steps': 52807, 'loss/train': 1.3704214096069336} -11/07/2021 04:39:40 - INFO - __main__ - Step 52809: {'lr': 0.0003681626336714134, 'samples': 10139328, 'steps': 52808, 'loss/train': 1.5069106817245483} -11/07/2021 04:39:41 - INFO - __main__ - Step 52810: {'lr': 0.00036815795707660886, 'samples': 10139520, 'steps': 52809, 'loss/train': 1.245521903038025} -11/07/2021 04:39:41 - INFO - __main__ - Step 52811: {'lr': 0.00036815328042856424, 'samples': 10139712, 'steps': 52810, 'loss/train': 1.384450078010559} -11/07/2021 04:39:42 - INFO - __main__ - Step 52812: {'lr': 0.0003681486037272815, 'samples': 10139904, 'steps': 52811, 'loss/train': 1.499172568321228} -11/07/2021 04:39:42 - INFO - __main__ - Step 52813: {'lr': 0.0003681439269727629, 'samples': 10140096, 'steps': 52812, 'loss/train': 2.122101068496704} -11/07/2021 04:39:42 - INFO - __main__ - Step 52814: {'lr': 0.00036813925016501036, 'samples': 10140288, 'steps': 52813, 'loss/train': 0.27971822023391724} -11/07/2021 04:39:43 - INFO - __main__ - Step 52815: {'lr': 0.00036813457330402616, 'samples': 10140480, 'steps': 52814, 'loss/train': 0.21748846769332886} -11/07/2021 04:39:44 - INFO - __main__ - Step 52816: {'lr': 0.0003681298963898124, 'samples': 10140672, 'steps': 52815, 'loss/train': 1.3669146299362183} -11/07/2021 04:39:44 - INFO - __main__ - Step 52817: {'lr': 0.000368125219422371, 'samples': 10140864, 'steps': 52816, 'loss/train': 1.6275256872177124} -11/07/2021 04:39:44 - INFO - __main__ - Step 52818: {'lr': 0.00036812054240170427, 'samples': 10141056, 'steps': 52817, 'loss/train': 1.4270051717758179} -11/07/2021 04:39:45 - INFO - __main__ - Step 52819: {'lr': 0.00036811586532781425, 'samples': 10141248, 'steps': 52818, 'loss/train': 1.4802923202514648} -11/07/2021 04:39:46 - INFO - __main__ - Step 52820: {'lr': 0.0003681111882007031, 'samples': 10141440, 'steps': 52819, 'loss/train': 1.1163501739501953} -11/07/2021 04:39:46 - INFO - __main__ - Step 52821: {'lr': 0.0003681065110203728, 'samples': 10141632, 'steps': 52820, 'loss/train': 1.1054524183273315} -11/07/2021 04:39:47 - INFO - __main__ - Step 52822: {'lr': 0.0003681018337868255, 'samples': 10141824, 'steps': 52821, 'loss/train': 1.3694102764129639} -11/07/2021 04:39:47 - INFO - __main__ - Step 52823: {'lr': 0.00036809715650006335, 'samples': 10142016, 'steps': 52822, 'loss/train': 1.2319449186325073} -11/07/2021 04:39:47 - INFO - __main__ - Step 52824: {'lr': 0.0003680924791600885, 'samples': 10142208, 'steps': 52823, 'loss/train': 2.1207361221313477} -11/07/2021 04:39:49 - INFO - __main__ - Step 52825: {'lr': 0.000368087801766903, 'samples': 10142400, 'steps': 52824, 'loss/train': 1.6262270212173462} -11/07/2021 04:39:49 - INFO - __main__ - Step 52826: {'lr': 0.0003680831243205089, 'samples': 10142592, 'steps': 52825, 'loss/train': 1.576689600944519} -11/07/2021 04:39:49 - INFO - __main__ - Step 52827: {'lr': 0.00036807844682090843, 'samples': 10142784, 'steps': 52826, 'loss/train': 1.8751413822174072} -11/07/2021 04:39:50 - INFO - __main__ - Step 52828: {'lr': 0.0003680737692681036, 'samples': 10142976, 'steps': 52827, 'loss/train': 0.7473287582397461} -11/07/2021 04:39:50 - INFO - __main__ - Step 52829: {'lr': 0.0003680690916620966, 'samples': 10143168, 'steps': 52828, 'loss/train': 2.2561402320861816} -11/07/2021 04:39:50 - INFO - __main__ - Step 52830: {'lr': 0.00036806441400288935, 'samples': 10143360, 'steps': 52829, 'loss/train': 1.2570043802261353} -11/07/2021 04:39:52 - INFO - __main__ - Step 52831: {'lr': 0.00036805973629048416, 'samples': 10143552, 'steps': 52830, 'loss/train': 0.8068132400512695} -11/07/2021 04:39:52 - INFO - __main__ - Step 52832: {'lr': 0.0003680550585248831, 'samples': 10143744, 'steps': 52831, 'loss/train': 1.494175910949707} -11/07/2021 04:39:52 - INFO - __main__ - Step 52833: {'lr': 0.0003680503807060883, 'samples': 10143936, 'steps': 52832, 'loss/train': 0.6244137287139893} -11/07/2021 04:39:53 - INFO - __main__ - Step 52834: {'lr': 0.0003680457028341018, 'samples': 10144128, 'steps': 52833, 'loss/train': 1.396943211555481} -11/07/2021 04:39:53 - INFO - __main__ - Step 52835: {'lr': 0.00036804102490892567, 'samples': 10144320, 'steps': 52834, 'loss/train': 0.6147857904434204} -11/07/2021 04:39:53 - INFO - __main__ - Step 52836: {'lr': 0.0003680363469305621, 'samples': 10144512, 'steps': 52835, 'loss/train': 1.2490501403808594} -11/07/2021 04:39:55 - INFO - __main__ - Step 52837: {'lr': 0.00036803166889901316, 'samples': 10144704, 'steps': 52836, 'loss/train': 1.5557249784469604} -11/07/2021 04:39:55 - INFO - __main__ - Step 52838: {'lr': 0.000368026990814281, 'samples': 10144896, 'steps': 52837, 'loss/train': 1.5296154022216797} -11/07/2021 04:39:55 - INFO - __main__ - Step 52839: {'lr': 0.00036802231267636773, 'samples': 10145088, 'steps': 52838, 'loss/train': 1.4874796867370605} -11/07/2021 04:39:56 - INFO - __main__ - Step 52840: {'lr': 0.0003680176344852754, 'samples': 10145280, 'steps': 52839, 'loss/train': 1.9834364652633667} -11/07/2021 04:39:56 - INFO - __main__ - Step 52841: {'lr': 0.00036801295624100616, 'samples': 10145472, 'steps': 52840, 'loss/train': 1.5413490533828735} -11/07/2021 04:39:56 - INFO - __main__ - Step 52842: {'lr': 0.00036800827794356206, 'samples': 10145664, 'steps': 52841, 'loss/train': 0.3478671908378601} -11/07/2021 04:39:57 - INFO - __main__ - Step 52843: {'lr': 0.0003680035995929453, 'samples': 10145856, 'steps': 52842, 'loss/train': 1.8136168718338013} -11/07/2021 04:39:58 - INFO - __main__ - Step 52844: {'lr': 0.00036799892118915785, 'samples': 10146048, 'steps': 52843, 'loss/train': 1.2765828371047974} -11/07/2021 04:39:58 - INFO - __main__ - Step 52845: {'lr': 0.0003679942427322019, 'samples': 10146240, 'steps': 52844, 'loss/train': 1.1193867921829224} -11/07/2021 04:39:58 - INFO - __main__ - Step 52846: {'lr': 0.00036798956422207975, 'samples': 10146432, 'steps': 52845, 'loss/train': 1.0044621229171753} -11/07/2021 04:39:59 - INFO - __main__ - Step 52847: {'lr': 0.0003679848856587932, 'samples': 10146624, 'steps': 52846, 'loss/train': 1.0877169370651245} -11/07/2021 04:40:00 - INFO - __main__ - Step 52848: {'lr': 0.0003679802070423445, 'samples': 10146816, 'steps': 52847, 'loss/train': 1.8449225425720215} -11/07/2021 04:40:00 - INFO - __main__ - Step 52849: {'lr': 0.0003679755283727357, 'samples': 10147008, 'steps': 52848, 'loss/train': 1.5287681818008423} -11/07/2021 04:40:01 - INFO - __main__ - Step 52850: {'lr': 0.0003679708496499689, 'samples': 10147200, 'steps': 52849, 'loss/train': 0.08660674095153809} -11/07/2021 04:40:01 - INFO - __main__ - Step 52851: {'lr': 0.0003679661708740463, 'samples': 10147392, 'steps': 52850, 'loss/train': 1.3134608268737793} -11/07/2021 04:40:01 - INFO - __main__ - Step 52852: {'lr': 0.00036796149204497, 'samples': 10147584, 'steps': 52851, 'loss/train': 1.192000150680542} -11/07/2021 04:40:02 - INFO - __main__ - Step 52853: {'lr': 0.0003679568131627421, 'samples': 10147776, 'steps': 52852, 'loss/train': 1.604162573814392} -11/07/2021 04:40:03 - INFO - __main__ - Step 52854: {'lr': 0.0003679521342273647, 'samples': 10147968, 'steps': 52853, 'loss/train': 1.0740938186645508} -11/07/2021 04:40:03 - INFO - __main__ - Step 52855: {'lr': 0.00036794745523883977, 'samples': 10148160, 'steps': 52854, 'loss/train': 1.07406485080719} -11/07/2021 04:40:03 - INFO - __main__ - Step 52856: {'lr': 0.0003679427761971696, 'samples': 10148352, 'steps': 52855, 'loss/train': 1.535104751586914} -11/07/2021 04:40:04 - INFO - __main__ - Step 52857: {'lr': 0.0003679380971023562, 'samples': 10148544, 'steps': 52856, 'loss/train': 1.2201820611953735} -11/07/2021 04:40:05 - INFO - __main__ - Step 52858: {'lr': 0.00036793341795440175, 'samples': 10148736, 'steps': 52857, 'loss/train': 0.13308845460414886} -11/07/2021 04:40:05 - INFO - __main__ - Step 52859: {'lr': 0.00036792873875330837, 'samples': 10148928, 'steps': 52858, 'loss/train': 1.3101484775543213} -11/07/2021 04:40:05 - INFO - __main__ - Step 52860: {'lr': 0.000367924059499078, 'samples': 10149120, 'steps': 52859, 'loss/train': 1.8716589212417603} -11/07/2021 04:40:06 - INFO - __main__ - Step 52861: {'lr': 0.000367919380191713, 'samples': 10149312, 'steps': 52860, 'loss/train': 1.605707049369812} -11/07/2021 04:40:06 - INFO - __main__ - Step 52862: {'lr': 0.0003679147008312153, 'samples': 10149504, 'steps': 52861, 'loss/train': 1.4423457384109497} -11/07/2021 04:40:07 - INFO - __main__ - Step 52863: {'lr': 0.000367910021417587, 'samples': 10149696, 'steps': 52862, 'loss/train': 1.2574059963226318} -11/07/2021 04:40:08 - INFO - __main__ - Step 52864: {'lr': 0.0003679053419508303, 'samples': 10149888, 'steps': 52863, 'loss/train': 1.2672683000564575} -11/07/2021 04:40:08 - INFO - __main__ - Step 52865: {'lr': 0.0003679006624309472, 'samples': 10150080, 'steps': 52864, 'loss/train': 1.4139201641082764} -11/07/2021 04:40:08 - INFO - __main__ - Step 52866: {'lr': 0.00036789598285794003, 'samples': 10150272, 'steps': 52865, 'loss/train': 1.1911715269088745} -11/07/2021 04:40:09 - INFO - __main__ - Step 52867: {'lr': 0.0003678913032318107, 'samples': 10150464, 'steps': 52866, 'loss/train': 1.4001514911651611} -11/07/2021 04:40:10 - INFO - __main__ - Step 52868: {'lr': 0.0003678866235525613, 'samples': 10150656, 'steps': 52867, 'loss/train': 1.3431363105773926} -11/07/2021 04:40:10 - INFO - __main__ - Step 52869: {'lr': 0.00036788194382019406, 'samples': 10150848, 'steps': 52868, 'loss/train': 1.4878185987472534} -11/07/2021 04:40:10 - INFO - __main__ - Step 52870: {'lr': 0.000367877264034711, 'samples': 10151040, 'steps': 52869, 'loss/train': 1.5815105438232422} -11/07/2021 04:40:11 - INFO - __main__ - Step 52871: {'lr': 0.0003678725841961144, 'samples': 10151232, 'steps': 52870, 'loss/train': 1.1997718811035156} -11/07/2021 04:40:11 - INFO - __main__ - Step 52872: {'lr': 0.00036786790430440606, 'samples': 10151424, 'steps': 52871, 'loss/train': 1.1991007328033447} -11/07/2021 04:40:12 - INFO - __main__ - Step 52873: {'lr': 0.0003678632243595883, 'samples': 10151616, 'steps': 52872, 'loss/train': 1.9988185167312622} -11/07/2021 04:40:12 - INFO - __main__ - Step 52874: {'lr': 0.0003678585443616632, 'samples': 10151808, 'steps': 52873, 'loss/train': 1.3749264478683472} -11/07/2021 04:40:13 - INFO - __main__ - Step 52875: {'lr': 0.0003678538643106329, 'samples': 10152000, 'steps': 52874, 'loss/train': 1.6679110527038574} -11/07/2021 04:40:13 - INFO - __main__ - Step 52876: {'lr': 0.0003678491842064995, 'samples': 10152192, 'steps': 52875, 'loss/train': 1.896567702293396} -11/07/2021 04:40:13 - INFO - __main__ - Step 52877: {'lr': 0.00036784450404926493, 'samples': 10152384, 'steps': 52876, 'loss/train': 1.790103554725647} -11/07/2021 04:40:14 - INFO - __main__ - Step 52878: {'lr': 0.00036783982383893155, 'samples': 10152576, 'steps': 52877, 'loss/train': 1.5069408416748047} -11/07/2021 04:40:15 - INFO - __main__ - Step 52879: {'lr': 0.0003678351435755014, 'samples': 10152768, 'steps': 52878, 'loss/train': 1.5018293857574463} -11/07/2021 04:40:15 - INFO - __main__ - Step 52880: {'lr': 0.0003678304632589764, 'samples': 10152960, 'steps': 52879, 'loss/train': 1.562927484512329} -11/07/2021 04:40:15 - INFO - __main__ - Step 52881: {'lr': 0.00036782578288935893, 'samples': 10153152, 'steps': 52880, 'loss/train': 1.2411366701126099} -11/07/2021 04:40:16 - INFO - __main__ - Step 52882: {'lr': 0.000367821102466651, 'samples': 10153344, 'steps': 52881, 'loss/train': 1.8379011154174805} -11/07/2021 04:40:16 - INFO - __main__ - Step 52883: {'lr': 0.0003678164219908546, 'samples': 10153536, 'steps': 52882, 'loss/train': 1.386399269104004} -11/07/2021 04:40:17 - INFO - __main__ - Step 52884: {'lr': 0.00036781174146197207, 'samples': 10153728, 'steps': 52883, 'loss/train': 1.314054012298584} -11/07/2021 04:40:17 - INFO - __main__ - Step 52885: {'lr': 0.00036780706088000524, 'samples': 10153920, 'steps': 52884, 'loss/train': 1.4697747230529785} -11/07/2021 04:40:18 - INFO - __main__ - Step 52886: {'lr': 0.0003678023802449564, 'samples': 10154112, 'steps': 52885, 'loss/train': 1.603981614112854} -11/07/2021 04:40:18 - INFO - __main__ - Step 52887: {'lr': 0.0003677976995568277, 'samples': 10154304, 'steps': 52886, 'loss/train': 3.247936487197876} -11/07/2021 04:40:19 - INFO - __main__ - Step 52888: {'lr': 0.00036779301881562115, 'samples': 10154496, 'steps': 52887, 'loss/train': 1.4492740631103516} -11/07/2021 04:40:20 - INFO - __main__ - Step 52889: {'lr': 0.00036778833802133886, 'samples': 10154688, 'steps': 52888, 'loss/train': 1.2354487180709839} -11/07/2021 04:40:20 - INFO - __main__ - Step 52890: {'lr': 0.000367783657173983, 'samples': 10154880, 'steps': 52889, 'loss/train': 1.3675084114074707} -11/07/2021 04:40:20 - INFO - __main__ - Step 52891: {'lr': 0.0003677789762735556, 'samples': 10155072, 'steps': 52890, 'loss/train': 1.591147541999817} -11/07/2021 04:40:21 - INFO - __main__ - Step 52892: {'lr': 0.0003677742953200588, 'samples': 10155264, 'steps': 52891, 'loss/train': 1.391609787940979} -11/07/2021 04:40:21 - INFO - __main__ - Step 52893: {'lr': 0.0003677696143134948, 'samples': 10155456, 'steps': 52892, 'loss/train': 1.3725422620773315} -11/07/2021 04:40:22 - INFO - __main__ - Step 52894: {'lr': 0.00036776493325386554, 'samples': 10155648, 'steps': 52893, 'loss/train': 1.142369031906128} -11/07/2021 04:40:22 - INFO - __main__ - Step 52895: {'lr': 0.00036776025214117325, 'samples': 10155840, 'steps': 52894, 'loss/train': 1.3131283521652222} -11/07/2021 04:40:23 - INFO - __main__ - Step 52896: {'lr': 0.00036775557097542, 'samples': 10156032, 'steps': 52895, 'loss/train': 1.5847556591033936} -11/07/2021 04:40:23 - INFO - __main__ - Step 52897: {'lr': 0.00036775088975660793, 'samples': 10156224, 'steps': 52896, 'loss/train': 0.18475568294525146} -11/07/2021 04:40:23 - INFO - __main__ - Step 52898: {'lr': 0.0003677462084847391, 'samples': 10156416, 'steps': 52897, 'loss/train': 1.4460605382919312} -11/07/2021 04:40:24 - INFO - __main__ - Step 52899: {'lr': 0.0003677415271598157, 'samples': 10156608, 'steps': 52898, 'loss/train': 1.1791458129882812} -11/07/2021 04:40:25 - INFO - __main__ - Step 52900: {'lr': 0.00036773684578183976, 'samples': 10156800, 'steps': 52899, 'loss/train': 1.582863450050354} -11/07/2021 04:40:25 - INFO - __main__ - Step 52901: {'lr': 0.00036773216435081335, 'samples': 10156992, 'steps': 52900, 'loss/train': 1.208898901939392} -11/07/2021 04:40:25 - INFO - __main__ - Step 52902: {'lr': 0.00036772748286673866, 'samples': 10157184, 'steps': 52901, 'loss/train': 1.6890238523483276} -11/07/2021 04:40:26 - INFO - __main__ - Step 52903: {'lr': 0.00036772280132961786, 'samples': 10157376, 'steps': 52902, 'loss/train': 0.6045779585838318} -11/07/2021 04:40:27 - INFO - __main__ - Step 52904: {'lr': 0.0003677181197394529, 'samples': 10157568, 'steps': 52903, 'loss/train': 1.7396961450576782} -11/07/2021 04:40:27 - INFO - __main__ - Step 52905: {'lr': 0.000367713438096246, 'samples': 10157760, 'steps': 52904, 'loss/train': 1.5900174379348755} -11/07/2021 04:40:28 - INFO - __main__ - Step 52906: {'lr': 0.00036770875639999923, 'samples': 10157952, 'steps': 52905, 'loss/train': 5.787691593170166} -11/07/2021 04:40:28 - INFO - __main__ - Step 52907: {'lr': 0.0003677040746507148, 'samples': 10158144, 'steps': 52906, 'loss/train': 1.204666018486023} -11/07/2021 04:40:28 - INFO - __main__ - Step 52908: {'lr': 0.00036769939284839463, 'samples': 10158336, 'steps': 52907, 'loss/train': 1.6088929176330566} -11/07/2021 04:40:29 - INFO - __main__ - Step 52909: {'lr': 0.000367694710993041, 'samples': 10158528, 'steps': 52908, 'loss/train': 1.2527908086776733} -11/07/2021 04:40:30 - INFO - __main__ - Step 52910: {'lr': 0.00036769002908465585, 'samples': 10158720, 'steps': 52909, 'loss/train': 1.308556318283081} -11/07/2021 04:40:30 - INFO - __main__ - Step 52911: {'lr': 0.0003676853471232415, 'samples': 10158912, 'steps': 52910, 'loss/train': 1.3853533267974854} -11/07/2021 04:40:31 - INFO - __main__ - Step 52912: {'lr': 0.00036768066510879985, 'samples': 10159104, 'steps': 52911, 'loss/train': 1.427247405052185} -11/07/2021 04:40:31 - INFO - __main__ - Step 52913: {'lr': 0.0003676759830413332, 'samples': 10159296, 'steps': 52912, 'loss/train': 1.8365446329116821} -11/07/2021 04:40:31 - INFO - __main__ - Step 52914: {'lr': 0.0003676713009208435, 'samples': 10159488, 'steps': 52913, 'loss/train': 1.6054060459136963} -11/07/2021 04:40:32 - INFO - __main__ - Step 52915: {'lr': 0.000367666618747333, 'samples': 10159680, 'steps': 52914, 'loss/train': 1.307416319847107} -11/07/2021 04:40:33 - INFO - __main__ - Step 52916: {'lr': 0.0003676619365208036, 'samples': 10159872, 'steps': 52915, 'loss/train': 1.5037816762924194} -11/07/2021 04:40:33 - INFO - __main__ - Step 52917: {'lr': 0.0003676572542412576, 'samples': 10160064, 'steps': 52916, 'loss/train': 1.2301470041275024} -11/07/2021 04:40:34 - INFO - __main__ - Step 52918: {'lr': 0.00036765257190869715, 'samples': 10160256, 'steps': 52917, 'loss/train': 1.2114273309707642} -11/07/2021 04:40:34 - INFO - __main__ - Step 52919: {'lr': 0.0003676478895231242, 'samples': 10160448, 'steps': 52918, 'loss/train': 1.2205685377120972} -11/07/2021 04:40:34 - INFO - __main__ - Step 52920: {'lr': 0.00036764320708454094, 'samples': 10160640, 'steps': 52919, 'loss/train': 0.9563878178596497} -11/07/2021 04:40:35 - INFO - __main__ - Step 52921: {'lr': 0.0003676385245929494, 'samples': 10160832, 'steps': 52920, 'loss/train': 1.5602089166641235} -11/07/2021 04:40:36 - INFO - __main__ - Step 52922: {'lr': 0.00036763384204835186, 'samples': 10161024, 'steps': 52921, 'loss/train': 1.5643709897994995} -11/07/2021 04:40:36 - INFO - __main__ - Step 52923: {'lr': 0.0003676291594507503, 'samples': 10161216, 'steps': 52922, 'loss/train': 1.4799211025238037} -11/07/2021 04:40:36 - INFO - __main__ - Step 52924: {'lr': 0.0003676244768001468, 'samples': 10161408, 'steps': 52923, 'loss/train': 1.402815341949463} -11/07/2021 04:40:37 - INFO - __main__ - Step 52925: {'lr': 0.00036761979409654353, 'samples': 10161600, 'steps': 52924, 'loss/train': 1.6642074584960938} -11/07/2021 04:40:38 - INFO - __main__ - Step 52926: {'lr': 0.0003676151113399427, 'samples': 10161792, 'steps': 52925, 'loss/train': 1.6063995361328125} -11/07/2021 04:40:38 - INFO - __main__ - Step 52927: {'lr': 0.0003676104285303463, 'samples': 10161984, 'steps': 52926, 'loss/train': 1.527408480644226} -11/07/2021 04:40:39 - INFO - __main__ - Step 52928: {'lr': 0.00036760574566775634, 'samples': 10162176, 'steps': 52927, 'loss/train': 1.8549025058746338} -11/07/2021 04:40:39 - INFO - __main__ - Step 52929: {'lr': 0.0003676010627521751, 'samples': 10162368, 'steps': 52928, 'loss/train': 0.8605169653892517} -11/07/2021 04:40:39 - INFO - __main__ - Step 52930: {'lr': 0.00036759637978360467, 'samples': 10162560, 'steps': 52929, 'loss/train': 1.3480849266052246} -11/07/2021 04:40:40 - INFO - __main__ - Step 52931: {'lr': 0.00036759169676204705, 'samples': 10162752, 'steps': 52930, 'loss/train': 3.5450997352600098} -11/07/2021 04:40:41 - INFO - __main__ - Step 52932: {'lr': 0.0003675870136875045, 'samples': 10162944, 'steps': 52931, 'loss/train': 1.152413010597229} -11/07/2021 04:40:41 - INFO - __main__ - Step 52933: {'lr': 0.00036758233055997905, 'samples': 10163136, 'steps': 52932, 'loss/train': 1.3054156303405762} -11/07/2021 04:40:42 - INFO - __main__ - Step 52934: {'lr': 0.0003675776473794728, 'samples': 10163328, 'steps': 52933, 'loss/train': 1.5548264980316162} -11/07/2021 04:40:42 - INFO - __main__ - Step 52935: {'lr': 0.00036757296414598786, 'samples': 10163520, 'steps': 52934, 'loss/train': 1.5610015392303467} -11/07/2021 04:40:42 - INFO - __main__ - Step 52936: {'lr': 0.00036756828085952637, 'samples': 10163712, 'steps': 52935, 'loss/train': 3.2426817417144775} -11/07/2021 04:40:43 - INFO - __main__ - Step 52937: {'lr': 0.0003675635975200904, 'samples': 10163904, 'steps': 52936, 'loss/train': 1.5200356245040894} -11/07/2021 04:40:44 - INFO - __main__ - Step 52938: {'lr': 0.0003675589141276821, 'samples': 10164096, 'steps': 52937, 'loss/train': 1.821755051612854} -11/07/2021 04:40:44 - INFO - __main__ - Step 52939: {'lr': 0.0003675542306823036, 'samples': 10164288, 'steps': 52938, 'loss/train': 1.5270503759384155} -11/07/2021 04:40:44 - INFO - __main__ - Step 52940: {'lr': 0.000367549547183957, 'samples': 10164480, 'steps': 52939, 'loss/train': 1.5565789937973022} -11/07/2021 04:40:45 - INFO - __main__ - Step 52941: {'lr': 0.0003675448636326443, 'samples': 10164672, 'steps': 52940, 'loss/train': 1.1866822242736816} -11/07/2021 04:40:46 - INFO - __main__ - Step 52942: {'lr': 0.0003675401800283678, 'samples': 10164864, 'steps': 52941, 'loss/train': 1.5489954948425293} -11/07/2021 04:40:46 - INFO - __main__ - Step 52943: {'lr': 0.0003675354963711294, 'samples': 10165056, 'steps': 52942, 'loss/train': 1.4503802061080933} -11/07/2021 04:40:47 - INFO - __main__ - Step 52944: {'lr': 0.00036753081266093136, 'samples': 10165248, 'steps': 52943, 'loss/train': 1.572939395904541} -11/07/2021 04:40:47 - INFO - __main__ - Step 52945: {'lr': 0.00036752612889777577, 'samples': 10165440, 'steps': 52944, 'loss/train': 1.523209810256958} -11/07/2021 04:40:47 - INFO - __main__ - Step 52946: {'lr': 0.0003675214450816647, 'samples': 10165632, 'steps': 52945, 'loss/train': 1.3453178405761719} -11/07/2021 04:40:48 - INFO - __main__ - Step 52947: {'lr': 0.00036751676121260035, 'samples': 10165824, 'steps': 52946, 'loss/train': 1.3668791055679321} -11/07/2021 04:40:49 - INFO - __main__ - Step 52948: {'lr': 0.00036751207729058465, 'samples': 10166016, 'steps': 52947, 'loss/train': 1.5065885782241821} -11/07/2021 04:40:49 - INFO - __main__ - Step 52949: {'lr': 0.00036750739331561986, 'samples': 10166208, 'steps': 52948, 'loss/train': 1.566748023033142} -11/07/2021 04:40:49 - INFO - __main__ - Step 52950: {'lr': 0.0003675027092877081, 'samples': 10166400, 'steps': 52949, 'loss/train': 1.1874886751174927} -11/07/2021 04:40:50 - INFO - __main__ - Step 52951: {'lr': 0.0003674980252068514, 'samples': 10166592, 'steps': 52950, 'loss/train': 0.9539691209793091} -11/07/2021 04:40:51 - INFO - __main__ - Step 52952: {'lr': 0.0003674933410730519, 'samples': 10166784, 'steps': 52951, 'loss/train': 1.2791460752487183} -11/07/2021 04:40:51 - INFO - __main__ - Step 52953: {'lr': 0.00036748865688631175, 'samples': 10166976, 'steps': 52952, 'loss/train': 1.7817262411117554} -11/07/2021 04:40:51 - INFO - __main__ - Step 52954: {'lr': 0.000367483972646633, 'samples': 10167168, 'steps': 52953, 'loss/train': 1.161556363105774} -11/07/2021 04:40:52 - INFO - __main__ - Step 52955: {'lr': 0.00036747928835401773, 'samples': 10167360, 'steps': 52954, 'loss/train': 0.9506720304489136} -11/07/2021 04:40:52 - INFO - __main__ - Step 52956: {'lr': 0.00036747460400846815, 'samples': 10167552, 'steps': 52955, 'loss/train': 1.0091511011123657} -11/07/2021 04:40:53 - INFO - __main__ - Step 52957: {'lr': 0.00036746991960998635, 'samples': 10167744, 'steps': 52956, 'loss/train': 1.3968636989593506} -11/07/2021 04:40:53 - INFO - __main__ - Step 52958: {'lr': 0.00036746523515857434, 'samples': 10167936, 'steps': 52957, 'loss/train': 1.1523995399475098} -11/07/2021 04:40:54 - INFO - __main__ - Step 52959: {'lr': 0.00036746055065423435, 'samples': 10168128, 'steps': 52958, 'loss/train': 1.3701913356781006} -11/07/2021 04:40:54 - INFO - __main__ - Step 52960: {'lr': 0.0003674558660969685, 'samples': 10168320, 'steps': 52959, 'loss/train': 1.5888440608978271} -11/07/2021 04:40:55 - INFO - __main__ - Step 52961: {'lr': 0.0003674511814867788, 'samples': 10168512, 'steps': 52960, 'loss/train': 1.3518424034118652} -11/07/2021 04:40:56 - INFO - __main__ - Step 52962: {'lr': 0.00036744649682366744, 'samples': 10168704, 'steps': 52961, 'loss/train': 1.3583984375} -11/07/2021 04:40:56 - INFO - __main__ - Step 52963: {'lr': 0.0003674418121076365, 'samples': 10168896, 'steps': 52962, 'loss/train': 1.5291193723678589} -11/07/2021 04:40:57 - INFO - __main__ - Step 52964: {'lr': 0.00036743712733868807, 'samples': 10169088, 'steps': 52963, 'loss/train': 1.021351933479309} -11/07/2021 04:40:57 - INFO - __main__ - Step 52965: {'lr': 0.00036743244251682424, 'samples': 10169280, 'steps': 52964, 'loss/train': 1.406258225440979} -11/07/2021 04:40:57 - INFO - __main__ - Step 52966: {'lr': 0.00036742775764204717, 'samples': 10169472, 'steps': 52965, 'loss/train': 0.17799949645996094} -11/07/2021 04:40:58 - INFO - __main__ - Step 52967: {'lr': 0.000367423072714359, 'samples': 10169664, 'steps': 52966, 'loss/train': 1.4866503477096558} -11/07/2021 04:40:59 - INFO - __main__ - Step 52968: {'lr': 0.00036741838773376187, 'samples': 10169856, 'steps': 52967, 'loss/train': 0.9869881272315979} -11/07/2021 04:40:59 - INFO - __main__ - Step 52969: {'lr': 0.00036741370270025776, 'samples': 10170048, 'steps': 52968, 'loss/train': 1.5774484872817993} -11/07/2021 04:40:59 - INFO - __main__ - Step 52970: {'lr': 0.0003674090176138488, 'samples': 10170240, 'steps': 52969, 'loss/train': 1.9227925539016724} -11/07/2021 04:41:00 - INFO - __main__ - Step 52971: {'lr': 0.0003674043324745372, 'samples': 10170432, 'steps': 52970, 'loss/train': 1.5562046766281128} -11/07/2021 04:41:00 - INFO - __main__ - Step 52972: {'lr': 0.000367399647282325, 'samples': 10170624, 'steps': 52971, 'loss/train': 1.7658380270004272} -11/07/2021 04:41:01 - INFO - __main__ - Step 52973: {'lr': 0.0003673949620372143, 'samples': 10170816, 'steps': 52972, 'loss/train': 1.072238802909851} -11/07/2021 04:41:02 - INFO - __main__ - Step 52974: {'lr': 0.0003673902767392074, 'samples': 10171008, 'steps': 52973, 'loss/train': 1.7072405815124512} -11/07/2021 04:41:02 - INFO - __main__ - Step 52975: {'lr': 0.00036738559138830613, 'samples': 10171200, 'steps': 52974, 'loss/train': 0.4392591416835785} -11/07/2021 04:41:02 - INFO - __main__ - Step 52976: {'lr': 0.0003673809059845127, 'samples': 10171392, 'steps': 52975, 'loss/train': 1.2999823093414307} -11/07/2021 04:41:03 - INFO - __main__ - Step 52977: {'lr': 0.00036737622052782933, 'samples': 10171584, 'steps': 52976, 'loss/train': 1.0242704153060913} -11/07/2021 04:41:04 - INFO - __main__ - Step 52978: {'lr': 0.000367371535018258, 'samples': 10171776, 'steps': 52977, 'loss/train': 0.625713586807251} -11/07/2021 04:41:04 - INFO - __main__ - Step 52979: {'lr': 0.00036736684945580083, 'samples': 10171968, 'steps': 52978, 'loss/train': 1.398547649383545} -11/07/2021 04:41:04 - INFO - __main__ - Step 52980: {'lr': 0.00036736216384046, 'samples': 10172160, 'steps': 52979, 'loss/train': 0.5298481583595276} -11/07/2021 04:41:05 - INFO - __main__ - Step 52981: {'lr': 0.00036735747817223766, 'samples': 10172352, 'steps': 52980, 'loss/train': 1.3302054405212402} -11/07/2021 04:41:05 - INFO - __main__ - Step 52982: {'lr': 0.00036735279245113573, 'samples': 10172544, 'steps': 52981, 'loss/train': 1.6523569822311401} -11/07/2021 04:41:06 - INFO - __main__ - Step 52983: {'lr': 0.0003673481066771565, 'samples': 10172736, 'steps': 52982, 'loss/train': 0.9141687154769897} -11/07/2021 04:41:07 - INFO - __main__ - Step 52984: {'lr': 0.00036734342085030205, 'samples': 10172928, 'steps': 52983, 'loss/train': 1.2575457096099854} -11/07/2021 04:41:07 - INFO - __main__ - Step 52985: {'lr': 0.0003673387349705744, 'samples': 10173120, 'steps': 52984, 'loss/train': 0.15876692533493042} -11/07/2021 04:41:07 - INFO - __main__ - Step 52986: {'lr': 0.00036733404903797575, 'samples': 10173312, 'steps': 52985, 'loss/train': 1.4802007675170898} -11/07/2021 04:41:08 - INFO - __main__ - Step 52987: {'lr': 0.00036732936305250826, 'samples': 10173504, 'steps': 52986, 'loss/train': 0.9805260300636292} -11/07/2021 04:41:09 - INFO - __main__ - Step 52988: {'lr': 0.00036732467701417387, 'samples': 10173696, 'steps': 52987, 'loss/train': 1.862620234489441} -11/07/2021 04:41:10 - INFO - __main__ - Step 52989: {'lr': 0.00036731999092297487, 'samples': 10173888, 'steps': 52988, 'loss/train': 1.2013376951217651} -11/07/2021 04:41:10 - INFO - __main__ - Step 52990: {'lr': 0.0003673153047789132, 'samples': 10174080, 'steps': 52989, 'loss/train': 0.9784761667251587} -11/07/2021 04:41:10 - INFO - __main__ - Step 52991: {'lr': 0.0003673106185819911, 'samples': 10174272, 'steps': 52990, 'loss/train': 1.5166722536087036} -11/07/2021 04:41:11 - INFO - __main__ - Step 52992: {'lr': 0.00036730593233221074, 'samples': 10174464, 'steps': 52991, 'loss/train': 1.002928376197815} -11/07/2021 04:41:11 - INFO - __main__ - Step 52993: {'lr': 0.000367301246029574, 'samples': 10174656, 'steps': 52992, 'loss/train': 0.31574416160583496} -11/07/2021 04:41:12 - INFO - __main__ - Step 52994: {'lr': 0.00036729655967408326, 'samples': 10174848, 'steps': 52993, 'loss/train': 0.4325564205646515} -11/07/2021 04:41:13 - INFO - __main__ - Step 52995: {'lr': 0.00036729187326574043, 'samples': 10175040, 'steps': 52994, 'loss/train': 1.2070051431655884} -11/07/2021 04:41:13 - INFO - __main__ - Step 52996: {'lr': 0.00036728718680454763, 'samples': 10175232, 'steps': 52995, 'loss/train': 1.5072743892669678} -11/07/2021 04:41:13 - INFO - __main__ - Step 52997: {'lr': 0.0003672825002905071, 'samples': 10175424, 'steps': 52996, 'loss/train': 1.7143254280090332} -11/07/2021 04:41:14 - INFO - __main__ - Step 52998: {'lr': 0.0003672778137236209, 'samples': 10175616, 'steps': 52997, 'loss/train': 1.6909080743789673} -11/07/2021 04:41:15 - INFO - __main__ - Step 52999: {'lr': 0.0003672731271038911, 'samples': 10175808, 'steps': 52998, 'loss/train': 1.1389824151992798} -11/07/2021 04:41:15 - INFO - __main__ - Step 53000: {'lr': 0.0003672684404313199, 'samples': 10176000, 'steps': 52999, 'loss/train': 2.1818671226501465} -11/07/2021 04:41:15 - INFO - __main__ - Step 53001: {'lr': 0.00036726375370590926, 'samples': 10176192, 'steps': 53000, 'loss/train': 1.1636219024658203} -11/07/2021 04:41:16 - INFO - __main__ - Step 53002: {'lr': 0.0003672590669276614, 'samples': 10176384, 'steps': 53001, 'loss/train': 1.425121784210205} -11/07/2021 04:41:16 - INFO - __main__ - Step 53003: {'lr': 0.0003672543800965784, 'samples': 10176576, 'steps': 53002, 'loss/train': 1.5879302024841309} -11/07/2021 04:41:17 - INFO - __main__ - Step 53004: {'lr': 0.00036724969321266245, 'samples': 10176768, 'steps': 53003, 'loss/train': 1.3570855855941772} -11/07/2021 04:41:17 - INFO - __main__ - Step 53005: {'lr': 0.0003672450062759156, 'samples': 10176960, 'steps': 53004, 'loss/train': 1.5459725856781006} -11/07/2021 04:41:18 - INFO - __main__ - Step 53006: {'lr': 0.00036724031928633995, 'samples': 10177152, 'steps': 53005, 'loss/train': 1.6546989679336548} -11/07/2021 04:41:18 - INFO - __main__ - Step 53007: {'lr': 0.00036723563224393753, 'samples': 10177344, 'steps': 53006, 'loss/train': 1.8153413534164429} -11/07/2021 04:41:18 - INFO - __main__ - Step 53008: {'lr': 0.0003672309451487106, 'samples': 10177536, 'steps': 53007, 'loss/train': 1.5242239236831665} -11/07/2021 04:41:20 - INFO - __main__ - Step 53009: {'lr': 0.0003672262580006612, 'samples': 10177728, 'steps': 53008, 'loss/train': 1.094207763671875} -11/07/2021 04:41:20 - INFO - __main__ - Step 53010: {'lr': 0.00036722157079979153, 'samples': 10177920, 'steps': 53009, 'loss/train': 1.5206443071365356} -11/07/2021 04:41:21 - INFO - __main__ - Step 53011: {'lr': 0.0003672168835461036, 'samples': 10178112, 'steps': 53010, 'loss/train': 1.6117490530014038} -11/07/2021 04:41:21 - INFO - __main__ - Step 53012: {'lr': 0.00036721219623959956, 'samples': 10178304, 'steps': 53011, 'loss/train': 0.5125022530555725} -11/07/2021 04:41:21 - INFO - __main__ - Step 53013: {'lr': 0.00036720750888028143, 'samples': 10178496, 'steps': 53012, 'loss/train': 0.4820607602596283} -11/07/2021 04:41:22 - INFO - __main__ - Step 53014: {'lr': 0.0003672028214681515, 'samples': 10178688, 'steps': 53013, 'loss/train': 0.36183875799179077} -11/07/2021 04:41:23 - INFO - __main__ - Step 53015: {'lr': 0.00036719813400321174, 'samples': 10178880, 'steps': 53014, 'loss/train': 1.2964993715286255} -11/07/2021 04:41:23 - INFO - __main__ - Step 53016: {'lr': 0.0003671934464854643, 'samples': 10179072, 'steps': 53015, 'loss/train': 1.4271796941757202} -11/07/2021 04:41:23 - INFO - __main__ - Step 53017: {'lr': 0.00036718875891491134, 'samples': 10179264, 'steps': 53016, 'loss/train': 1.3503791093826294} -11/07/2021 04:41:24 - INFO - __main__ - Step 53018: {'lr': 0.0003671840712915549, 'samples': 10179456, 'steps': 53017, 'loss/train': 1.1013667583465576} -11/07/2021 04:41:25 - INFO - __main__ - Step 53019: {'lr': 0.0003671793836153972, 'samples': 10179648, 'steps': 53018, 'loss/train': 1.2425892353057861} -11/07/2021 04:41:25 - INFO - __main__ - Step 53020: {'lr': 0.00036717469588644017, 'samples': 10179840, 'steps': 53019, 'loss/train': 1.2072207927703857} -11/07/2021 04:41:25 - INFO - __main__ - Step 53021: {'lr': 0.000367170008104686, 'samples': 10180032, 'steps': 53020, 'loss/train': 1.719152808189392} -11/07/2021 04:41:26 - INFO - __main__ - Step 53022: {'lr': 0.000367165320270137, 'samples': 10180224, 'steps': 53021, 'loss/train': 1.2317638397216797} -11/07/2021 04:41:26 - INFO - __main__ - Step 53023: {'lr': 0.000367160632382795, 'samples': 10180416, 'steps': 53022, 'loss/train': 0.9830251932144165} -11/07/2021 04:41:27 - INFO - __main__ - Step 53024: {'lr': 0.00036715594444266224, 'samples': 10180608, 'steps': 53023, 'loss/train': 0.9751511216163635} -11/07/2021 04:41:27 - INFO - __main__ - Step 53025: {'lr': 0.0003671512564497408, 'samples': 10180800, 'steps': 53024, 'loss/train': 0.847625195980072} -11/07/2021 04:41:28 - INFO - __main__ - Step 53026: {'lr': 0.0003671465684040328, 'samples': 10180992, 'steps': 53025, 'loss/train': 0.9451130032539368} -11/07/2021 04:41:28 - INFO - __main__ - Step 53027: {'lr': 0.00036714188030554046, 'samples': 10181184, 'steps': 53026, 'loss/train': 1.130821704864502} -11/07/2021 04:41:28 - INFO - __main__ - Step 53028: {'lr': 0.00036713719215426577, 'samples': 10181376, 'steps': 53027, 'loss/train': 1.5467818975448608} -11/07/2021 04:41:29 - INFO - __main__ - Step 53029: {'lr': 0.0003671325039502108, 'samples': 10181568, 'steps': 53028, 'loss/train': 1.7766822576522827} -11/07/2021 04:41:30 - INFO - __main__ - Step 53030: {'lr': 0.0003671278156933778, 'samples': 10181760, 'steps': 53029, 'loss/train': 1.1858930587768555} -11/07/2021 04:41:30 - INFO - __main__ - Step 53031: {'lr': 0.00036712312738376875, 'samples': 10181952, 'steps': 53030, 'loss/train': 1.2770707607269287} -11/07/2021 04:41:30 - INFO - __main__ - Step 53032: {'lr': 0.00036711843902138586, 'samples': 10182144, 'steps': 53031, 'loss/train': 1.662916660308838} -11/07/2021 04:41:31 - INFO - __main__ - Step 53033: {'lr': 0.0003671137506062312, 'samples': 10182336, 'steps': 53032, 'loss/train': 1.1410259008407593} -11/07/2021 04:41:32 - INFO - __main__ - Step 53034: {'lr': 0.000367109062138307, 'samples': 10182528, 'steps': 53033, 'loss/train': 1.4344712495803833} -11/07/2021 04:41:32 - INFO - __main__ - Step 53035: {'lr': 0.00036710437361761513, 'samples': 10182720, 'steps': 53034, 'loss/train': 0.7155401110649109} -11/07/2021 04:41:33 - INFO - __main__ - Step 53036: {'lr': 0.00036709968504415786, 'samples': 10182912, 'steps': 53035, 'loss/train': 1.6942758560180664} -11/07/2021 04:41:33 - INFO - __main__ - Step 53037: {'lr': 0.00036709499641793725, 'samples': 10183104, 'steps': 53036, 'loss/train': 1.1712610721588135} -11/07/2021 04:41:33 - INFO - __main__ - Step 53038: {'lr': 0.00036709030773895545, 'samples': 10183296, 'steps': 53037, 'loss/train': 1.5960693359375} -11/07/2021 04:41:35 - INFO - __main__ - Step 53039: {'lr': 0.0003670856190072146, 'samples': 10183488, 'steps': 53038, 'loss/train': 0.23049531877040863} -11/07/2021 04:41:35 - INFO - __main__ - Step 53040: {'lr': 0.00036708093022271677, 'samples': 10183680, 'steps': 53039, 'loss/train': 1.8371566534042358} -11/07/2021 04:41:35 - INFO - __main__ - Step 53041: {'lr': 0.0003670762413854641, 'samples': 10183872, 'steps': 53040, 'loss/train': 1.4111393690109253} -11/07/2021 04:41:36 - INFO - __main__ - Step 53042: {'lr': 0.0003670715524954587, 'samples': 10184064, 'steps': 53041, 'loss/train': 1.3444184064865112} -11/07/2021 04:41:36 - INFO - __main__ - Step 53043: {'lr': 0.0003670668635527026, 'samples': 10184256, 'steps': 53042, 'loss/train': 1.6000396013259888} -11/07/2021 04:41:37 - INFO - __main__ - Step 53044: {'lr': 0.00036706217455719805, 'samples': 10184448, 'steps': 53043, 'loss/train': 1.6131395101547241} -11/07/2021 04:41:37 - INFO - __main__ - Step 53045: {'lr': 0.000367057485508947, 'samples': 10184640, 'steps': 53044, 'loss/train': 1.2647408246994019} -11/07/2021 04:41:38 - INFO - __main__ - Step 53046: {'lr': 0.0003670527964079517, 'samples': 10184832, 'steps': 53045, 'loss/train': 1.4808870553970337} -11/07/2021 04:41:38 - INFO - __main__ - Step 53047: {'lr': 0.0003670481072542142, 'samples': 10185024, 'steps': 53046, 'loss/train': 1.9649957418441772} -11/07/2021 04:41:38 - INFO - __main__ - Step 53048: {'lr': 0.0003670434180477367, 'samples': 10185216, 'steps': 53047, 'loss/train': 0.874976396560669} -11/07/2021 04:41:39 - INFO - __main__ - Step 53049: {'lr': 0.00036703872878852115, 'samples': 10185408, 'steps': 53048, 'loss/train': 1.363416314125061} -11/07/2021 04:41:40 - INFO - __main__ - Step 53050: {'lr': 0.00036703403947656977, 'samples': 10185600, 'steps': 53049, 'loss/train': 1.3838443756103516} -11/07/2021 04:41:40 - INFO - __main__ - Step 53051: {'lr': 0.0003670293501118847, 'samples': 10185792, 'steps': 53050, 'loss/train': 1.5967652797698975} -11/07/2021 04:41:41 - INFO - __main__ - Step 53052: {'lr': 0.00036702466069446797, 'samples': 10185984, 'steps': 53051, 'loss/train': 1.5647650957107544} -11/07/2021 04:41:41 - INFO - __main__ - Step 53053: {'lr': 0.00036701997122432173, 'samples': 10186176, 'steps': 53052, 'loss/train': 1.5553793907165527} -11/07/2021 04:41:42 - INFO - __main__ - Step 53054: {'lr': 0.00036701528170144813, 'samples': 10186368, 'steps': 53053, 'loss/train': 2.1166625022888184} -11/07/2021 04:41:42 - INFO - __main__ - Step 53055: {'lr': 0.0003670105921258493, 'samples': 10186560, 'steps': 53054, 'loss/train': 1.009533166885376} -11/07/2021 04:41:43 - INFO - __main__ - Step 53056: {'lr': 0.0003670059024975272, 'samples': 10186752, 'steps': 53055, 'loss/train': 1.0486948490142822} -11/07/2021 04:41:43 - INFO - __main__ - Step 53057: {'lr': 0.00036700121281648415, 'samples': 10186944, 'steps': 53056, 'loss/train': 1.3450143337249756} -11/07/2021 04:41:43 - INFO - __main__ - Step 53058: {'lr': 0.000366996523082722, 'samples': 10187136, 'steps': 53057, 'loss/train': 1.5745469331741333} -11/07/2021 04:41:44 - INFO - __main__ - Step 53059: {'lr': 0.00036699183329624315, 'samples': 10187328, 'steps': 53058, 'loss/train': 0.5636777877807617} -11/07/2021 04:41:45 - INFO - __main__ - Step 53060: {'lr': 0.00036698714345704956, 'samples': 10187520, 'steps': 53059, 'loss/train': 1.2411562204360962} -11/07/2021 04:41:45 - INFO - __main__ - Step 53061: {'lr': 0.00036698245356514336, 'samples': 10187712, 'steps': 53060, 'loss/train': 1.4474177360534668} -11/07/2021 04:41:45 - INFO - __main__ - Step 53062: {'lr': 0.0003669777636205267, 'samples': 10187904, 'steps': 53061, 'loss/train': 1.518201470375061} -11/07/2021 04:41:46 - INFO - __main__ - Step 53063: {'lr': 0.00036697307362320165, 'samples': 10188096, 'steps': 53062, 'loss/train': 1.5803409814834595} -11/07/2021 04:41:46 - INFO - __main__ - Step 53064: {'lr': 0.0003669683835731703, 'samples': 10188288, 'steps': 53063, 'loss/train': 1.2509534358978271} -11/07/2021 04:41:47 - INFO - __main__ - Step 53065: {'lr': 0.00036696369347043477, 'samples': 10188480, 'steps': 53064, 'loss/train': 1.2445851564407349} -11/07/2021 04:41:48 - INFO - __main__ - Step 53066: {'lr': 0.00036695900331499735, 'samples': 10188672, 'steps': 53065, 'loss/train': 0.7373975515365601} -11/07/2021 04:41:48 - INFO - __main__ - Step 53067: {'lr': 0.0003669543131068599, 'samples': 10188864, 'steps': 53066, 'loss/train': 1.220491886138916} -11/07/2021 04:41:48 - INFO - __main__ - Step 53068: {'lr': 0.0003669496228460247, 'samples': 10189056, 'steps': 53067, 'loss/train': 1.3528779745101929} -11/07/2021 04:41:49 - INFO - __main__ - Step 53069: {'lr': 0.00036694493253249373, 'samples': 10189248, 'steps': 53068, 'loss/train': 0.6026855707168579} -11/07/2021 04:41:50 - INFO - __main__ - Step 53070: {'lr': 0.0003669402421662692, 'samples': 10189440, 'steps': 53069, 'loss/train': 1.7145239114761353} -11/07/2021 04:41:50 - INFO - __main__ - Step 53071: {'lr': 0.0003669355517473532, 'samples': 10189632, 'steps': 53070, 'loss/train': 2.2936959266662598} -11/07/2021 04:41:50 - INFO - __main__ - Step 53072: {'lr': 0.0003669308612757479, 'samples': 10189824, 'steps': 53071, 'loss/train': 1.1821892261505127} -11/07/2021 04:41:51 - INFO - __main__ - Step 53073: {'lr': 0.0003669261707514553, 'samples': 10190016, 'steps': 53072, 'loss/train': 1.20310640335083} -11/07/2021 04:41:51 - INFO - __main__ - Step 53074: {'lr': 0.0003669214801744776, 'samples': 10190208, 'steps': 53073, 'loss/train': 1.389641284942627} -11/07/2021 04:41:52 - INFO - __main__ - Step 53075: {'lr': 0.0003669167895448169, 'samples': 10190400, 'steps': 53074, 'loss/train': 1.560219645500183} -11/07/2021 04:41:52 - INFO - __main__ - Step 53076: {'lr': 0.0003669120988624752, 'samples': 10190592, 'steps': 53075, 'loss/train': 1.284456729888916} -11/07/2021 04:41:53 - INFO - __main__ - Step 53077: {'lr': 0.0003669074081274548, 'samples': 10190784, 'steps': 53076, 'loss/train': 1.1114064455032349} -11/07/2021 04:41:53 - INFO - __main__ - Step 53078: {'lr': 0.0003669027173397577, 'samples': 10190976, 'steps': 53077, 'loss/train': 1.3795138597488403} -11/07/2021 04:41:54 - INFO - __main__ - Step 53079: {'lr': 0.00036689802649938607, 'samples': 10191168, 'steps': 53078, 'loss/train': 1.1561951637268066} -11/07/2021 04:41:54 - INFO - __main__ - Step 53080: {'lr': 0.00036689333560634195, 'samples': 10191360, 'steps': 53079, 'loss/train': 1.5332540273666382} -11/07/2021 04:41:55 - INFO - __main__ - Step 53081: {'lr': 0.00036688864466062756, 'samples': 10191552, 'steps': 53080, 'loss/train': 1.370802402496338} -11/07/2021 04:41:55 - INFO - __main__ - Step 53082: {'lr': 0.0003668839536622449, 'samples': 10191744, 'steps': 53081, 'loss/train': 1.1882829666137695} -11/07/2021 04:41:56 - INFO - __main__ - Step 53083: {'lr': 0.0003668792626111962, 'samples': 10191936, 'steps': 53082, 'loss/train': 1.2191630601882935} -11/07/2021 04:41:56 - INFO - __main__ - Step 53084: {'lr': 0.0003668745715074834, 'samples': 10192128, 'steps': 53083, 'loss/train': 1.7221304178237915} -11/07/2021 04:41:57 - INFO - __main__ - Step 53085: {'lr': 0.00036686988035110877, 'samples': 10192320, 'steps': 53084, 'loss/train': 1.3087737560272217} -11/07/2021 04:41:57 - INFO - __main__ - Step 53086: {'lr': 0.0003668651891420744, 'samples': 10192512, 'steps': 53085, 'loss/train': 1.5288056135177612} -11/07/2021 04:41:58 - INFO - __main__ - Step 53087: {'lr': 0.0003668604978803823, 'samples': 10192704, 'steps': 53086, 'loss/train': 1.5008461475372314} -11/07/2021 04:41:58 - INFO - __main__ - Step 53088: {'lr': 0.0003668558065660348, 'samples': 10192896, 'steps': 53087, 'loss/train': 1.3333481550216675} -11/07/2021 04:41:58 - INFO - __main__ - Step 53089: {'lr': 0.0003668511151990338, 'samples': 10193088, 'steps': 53088, 'loss/train': 1.4734662771224976} -11/07/2021 04:41:59 - INFO - __main__ - Step 53090: {'lr': 0.0003668464237793815, 'samples': 10193280, 'steps': 53089, 'loss/train': 1.0968613624572754} -11/07/2021 04:42:00 - INFO - __main__ - Step 53091: {'lr': 0.00036684173230707996, 'samples': 10193472, 'steps': 53090, 'loss/train': 1.2754640579223633} -11/07/2021 04:42:00 - INFO - __main__ - Step 53092: {'lr': 0.00036683704078213137, 'samples': 10193664, 'steps': 53091, 'loss/train': 1.2075488567352295} -11/07/2021 04:42:00 - INFO - __main__ - Step 53093: {'lr': 0.00036683234920453783, 'samples': 10193856, 'steps': 53092, 'loss/train': 1.518633246421814} -11/07/2021 04:42:01 - INFO - __main__ - Step 53094: {'lr': 0.0003668276575743014, 'samples': 10194048, 'steps': 53093, 'loss/train': 1.2452999353408813} -11/07/2021 04:42:01 - INFO - __main__ - Step 53095: {'lr': 0.0003668229658914243, 'samples': 10194240, 'steps': 53094, 'loss/train': 1.1099741458892822} -11/07/2021 04:42:02 - INFO - __main__ - Step 53096: {'lr': 0.0003668182741559085, 'samples': 10194432, 'steps': 53095, 'loss/train': 1.2349625825881958} -11/07/2021 04:42:03 - INFO - __main__ - Step 53097: {'lr': 0.00036681358236775625, 'samples': 10194624, 'steps': 53096, 'loss/train': 1.0939483642578125} -11/07/2021 04:42:03 - INFO - __main__ - Step 53098: {'lr': 0.00036680889052696954, 'samples': 10194816, 'steps': 53097, 'loss/train': 1.4480918645858765} -11/07/2021 04:42:03 - INFO - __main__ - Step 53099: {'lr': 0.00036680419863355056, 'samples': 10195008, 'steps': 53098, 'loss/train': 0.1520826816558838} -11/07/2021 04:42:04 - INFO - __main__ - Step 53100: {'lr': 0.0003667995066875014, 'samples': 10195200, 'steps': 53099, 'loss/train': 1.2088161706924438} -11/07/2021 04:42:05 - INFO - __main__ - Step 53101: {'lr': 0.00036679481468882425, 'samples': 10195392, 'steps': 53100, 'loss/train': 1.375238299369812} -11/07/2021 04:42:05 - INFO - __main__ - Step 53102: {'lr': 0.00036679012263752115, 'samples': 10195584, 'steps': 53101, 'loss/train': 1.405340552330017} -11/07/2021 04:42:05 - INFO - __main__ - Step 53103: {'lr': 0.00036678543053359413, 'samples': 10195776, 'steps': 53102, 'loss/train': 1.8700934648513794} -11/07/2021 04:42:06 - INFO - __main__ - Step 53104: {'lr': 0.0003667807383770455, 'samples': 10195968, 'steps': 53103, 'loss/train': 1.4020655155181885} -11/07/2021 04:42:06 - INFO - __main__ - Step 53105: {'lr': 0.00036677604616787717, 'samples': 10196160, 'steps': 53104, 'loss/train': 1.789962887763977} -11/07/2021 04:42:07 - INFO - __main__ - Step 53106: {'lr': 0.00036677135390609145, 'samples': 10196352, 'steps': 53105, 'loss/train': 1.2877886295318604} -11/07/2021 04:42:07 - INFO - __main__ - Step 53107: {'lr': 0.0003667666615916903, 'samples': 10196544, 'steps': 53106, 'loss/train': 1.5096367597579956} -11/07/2021 04:42:08 - INFO - __main__ - Step 53108: {'lr': 0.00036676196922467595, 'samples': 10196736, 'steps': 53107, 'loss/train': 1.4057319164276123} -11/07/2021 04:42:08 - INFO - __main__ - Step 53109: {'lr': 0.00036675727680505045, 'samples': 10196928, 'steps': 53108, 'loss/train': 1.3050413131713867} -11/07/2021 04:42:08 - INFO - __main__ - Step 53110: {'lr': 0.0003667525843328159, 'samples': 10197120, 'steps': 53109, 'loss/train': 1.1219984292984009} -11/07/2021 04:42:09 - INFO - __main__ - Step 53111: {'lr': 0.0003667478918079744, 'samples': 10197312, 'steps': 53110, 'loss/train': 1.7990424633026123} -11/07/2021 04:42:10 - INFO - __main__ - Step 53112: {'lr': 0.0003667431992305281, 'samples': 10197504, 'steps': 53111, 'loss/train': 1.388959527015686} -11/07/2021 04:42:10 - INFO - __main__ - Step 53113: {'lr': 0.0003667385066004792, 'samples': 10197696, 'steps': 53112, 'loss/train': 1.0651360750198364} -11/07/2021 04:42:11 - INFO - __main__ - Step 53114: {'lr': 0.0003667338139178297, 'samples': 10197888, 'steps': 53113, 'loss/train': 0.6847978830337524} -11/07/2021 04:42:11 - INFO - __main__ - Step 53115: {'lr': 0.0003667291211825817, 'samples': 10198080, 'steps': 53114, 'loss/train': 1.4442719221115112} -11/07/2021 04:42:12 - INFO - __main__ - Step 53116: {'lr': 0.0003667244283947374, 'samples': 10198272, 'steps': 53115, 'loss/train': 1.5201616287231445} -11/07/2021 04:42:12 - INFO - __main__ - Step 53117: {'lr': 0.0003667197355542989, 'samples': 10198464, 'steps': 53116, 'loss/train': 1.1403840780258179} -11/07/2021 04:42:13 - INFO - __main__ - Step 53118: {'lr': 0.0003667150426612682, 'samples': 10198656, 'steps': 53117, 'loss/train': 1.546968698501587} -11/07/2021 04:42:13 - INFO - __main__ - Step 53119: {'lr': 0.0003667103497156475, 'samples': 10198848, 'steps': 53118, 'loss/train': 1.7902982234954834} -11/07/2021 04:42:13 - INFO - __main__ - Step 53120: {'lr': 0.00036670565671743905, 'samples': 10199040, 'steps': 53119, 'loss/train': 1.352241039276123} -11/07/2021 04:42:14 - INFO - __main__ - Step 53121: {'lr': 0.0003667009636666447, 'samples': 10199232, 'steps': 53120, 'loss/train': 1.0399212837219238} -11/07/2021 04:42:15 - INFO - __main__ - Step 53122: {'lr': 0.00036669627056326685, 'samples': 10199424, 'steps': 53121, 'loss/train': 1.4006602764129639} -11/07/2021 04:42:15 - INFO - __main__ - Step 53123: {'lr': 0.0003666915774073073, 'samples': 10199616, 'steps': 53122, 'loss/train': 1.2680741548538208} -11/07/2021 04:42:16 - INFO - __main__ - Step 53124: {'lr': 0.00036668688419876837, 'samples': 10199808, 'steps': 53123, 'loss/train': 1.5843561887741089} -11/07/2021 04:42:16 - INFO - __main__ - Step 53125: {'lr': 0.0003666821909376522, 'samples': 10200000, 'steps': 53124, 'loss/train': 1.2021772861480713} -11/07/2021 04:42:16 - INFO - __main__ - Step 53126: {'lr': 0.00036667749762396074, 'samples': 10200192, 'steps': 53125, 'loss/train': 1.378400444984436} -11/07/2021 04:42:17 - INFO - __main__ - Step 53127: {'lr': 0.0003666728042576962, 'samples': 10200384, 'steps': 53126, 'loss/train': 0.9234182238578796} -11/07/2021 04:42:18 - INFO - __main__ - Step 53128: {'lr': 0.0003666681108388608, 'samples': 10200576, 'steps': 53127, 'loss/train': 1.4577910900115967} -11/07/2021 04:42:18 - INFO - __main__ - Step 53129: {'lr': 0.0003666634173674565, 'samples': 10200768, 'steps': 53128, 'loss/train': 1.1644287109375} -11/07/2021 04:42:18 - INFO - __main__ - Step 53130: {'lr': 0.00036665872384348543, 'samples': 10200960, 'steps': 53129, 'loss/train': 2.0268161296844482} -11/07/2021 04:42:19 - INFO - __main__ - Step 53131: {'lr': 0.00036665403026694976, 'samples': 10201152, 'steps': 53130, 'loss/train': 1.7038955688476562} -11/07/2021 04:42:19 - INFO - __main__ - Step 53132: {'lr': 0.0003666493366378516, 'samples': 10201344, 'steps': 53131, 'loss/train': 2.0351192951202393} -11/07/2021 04:42:20 - INFO - __main__ - Step 53133: {'lr': 0.00036664464295619296, 'samples': 10201536, 'steps': 53132, 'loss/train': 1.5343565940856934} -11/07/2021 04:42:20 - INFO - __main__ - Step 53134: {'lr': 0.0003666399492219762, 'samples': 10201728, 'steps': 53133, 'loss/train': 1.140608549118042} -11/07/2021 04:42:21 - INFO - __main__ - Step 53135: {'lr': 0.0003666352554352032, 'samples': 10201920, 'steps': 53134, 'loss/train': 1.3192079067230225} -11/07/2021 04:42:21 - INFO - __main__ - Step 53136: {'lr': 0.00036663056159587614, 'samples': 10202112, 'steps': 53135, 'loss/train': 0.8051148653030396} -11/07/2021 04:42:22 - INFO - __main__ - Step 53137: {'lr': 0.0003666258677039971, 'samples': 10202304, 'steps': 53136, 'loss/train': 1.203921914100647} -11/07/2021 04:42:23 - INFO - __main__ - Step 53138: {'lr': 0.00036662117375956834, 'samples': 10202496, 'steps': 53137, 'loss/train': 1.6183037757873535} -11/07/2021 04:42:23 - INFO - __main__ - Step 53139: {'lr': 0.00036661647976259185, 'samples': 10202688, 'steps': 53138, 'loss/train': 1.3904577493667603} -11/07/2021 04:42:23 - INFO - __main__ - Step 53140: {'lr': 0.0003666117857130698, 'samples': 10202880, 'steps': 53139, 'loss/train': 1.312795639038086} -11/07/2021 04:42:24 - INFO - __main__ - Step 53141: {'lr': 0.00036660709161100423, 'samples': 10203072, 'steps': 53140, 'loss/train': 1.4761615991592407} -11/07/2021 04:42:24 - INFO - __main__ - Step 53142: {'lr': 0.0003666023974563973, 'samples': 10203264, 'steps': 53141, 'loss/train': 1.2925437688827515} -11/07/2021 04:42:25 - INFO - __main__ - Step 53143: {'lr': 0.0003665977032492511, 'samples': 10203456, 'steps': 53142, 'loss/train': 1.2739945650100708} -11/07/2021 04:42:26 - INFO - __main__ - Step 53144: {'lr': 0.00036659300898956784, 'samples': 10203648, 'steps': 53143, 'loss/train': 1.3361073732376099} -11/07/2021 04:42:26 - INFO - __main__ - Step 53145: {'lr': 0.0003665883146773496, 'samples': 10203840, 'steps': 53144, 'loss/train': 1.0176421403884888} -11/07/2021 04:42:26 - INFO - __main__ - Step 53146: {'lr': 0.0003665836203125984, 'samples': 10204032, 'steps': 53145, 'loss/train': 1.5041325092315674} -11/07/2021 04:42:27 - INFO - __main__ - Step 53147: {'lr': 0.0003665789258953164, 'samples': 10204224, 'steps': 53146, 'loss/train': 1.6452785730361938} -11/07/2021 04:42:27 - INFO - __main__ - Step 53148: {'lr': 0.00036657423142550576, 'samples': 10204416, 'steps': 53147, 'loss/train': 1.0984362363815308} -11/07/2021 04:42:28 - INFO - __main__ - Step 53149: {'lr': 0.00036656953690316865, 'samples': 10204608, 'steps': 53148, 'loss/train': 1.234283208847046} -11/07/2021 04:42:29 - INFO - __main__ - Step 53150: {'lr': 0.000366564842328307, 'samples': 10204800, 'steps': 53149, 'loss/train': 0.9838631749153137} -11/07/2021 04:42:29 - INFO - __main__ - Step 53151: {'lr': 0.0003665601477009231, 'samples': 10204992, 'steps': 53150, 'loss/train': 1.545081615447998} -11/07/2021 04:42:29 - INFO - __main__ - Step 53152: {'lr': 0.00036655545302101894, 'samples': 10205184, 'steps': 53151, 'loss/train': 1.600849986076355} -11/07/2021 04:42:30 - INFO - __main__ - Step 53153: {'lr': 0.00036655075828859673, 'samples': 10205376, 'steps': 53152, 'loss/train': 1.3004236221313477} -11/07/2021 04:42:31 - INFO - __main__ - Step 53154: {'lr': 0.0003665460635036585, 'samples': 10205568, 'steps': 53153, 'loss/train': 1.072939395904541} -11/07/2021 04:42:31 - INFO - __main__ - Step 53155: {'lr': 0.00036654136866620646, 'samples': 10205760, 'steps': 53154, 'loss/train': 1.4235090017318726} -11/07/2021 04:42:31 - INFO - __main__ - Step 53156: {'lr': 0.0003665366737762427, 'samples': 10205952, 'steps': 53155, 'loss/train': 1.2102850675582886} -11/07/2021 04:42:32 - INFO - __main__ - Step 53157: {'lr': 0.0003665319788337692, 'samples': 10206144, 'steps': 53156, 'loss/train': 1.6960684061050415} -11/07/2021 04:42:32 - INFO - __main__ - Step 53158: {'lr': 0.0003665272838387883, 'samples': 10206336, 'steps': 53157, 'loss/train': 1.5066572427749634} -11/07/2021 04:42:33 - INFO - __main__ - Step 53159: {'lr': 0.00036652258879130194, 'samples': 10206528, 'steps': 53158, 'loss/train': 1.4323980808258057} -11/07/2021 04:42:33 - INFO - __main__ - Step 53160: {'lr': 0.0003665178936913123, 'samples': 10206720, 'steps': 53159, 'loss/train': 1.448259711265564} -11/07/2021 04:42:34 - INFO - __main__ - Step 53161: {'lr': 0.0003665131985388215, 'samples': 10206912, 'steps': 53160, 'loss/train': 1.64296555519104} -11/07/2021 04:42:34 - INFO - __main__ - Step 53162: {'lr': 0.00036650850333383174, 'samples': 10207104, 'steps': 53161, 'loss/train': 1.4066882133483887} -11/07/2021 04:42:34 - INFO - __main__ - Step 53163: {'lr': 0.000366503808076345, 'samples': 10207296, 'steps': 53162, 'loss/train': 1.3050343990325928} -11/07/2021 04:42:35 - INFO - __main__ - Step 53164: {'lr': 0.00036649911276636336, 'samples': 10207488, 'steps': 53163, 'loss/train': 1.0233391523361206} -11/07/2021 04:42:36 - INFO - __main__ - Step 53165: {'lr': 0.0003664944174038891, 'samples': 10207680, 'steps': 53164, 'loss/train': 1.230887770652771} -11/07/2021 04:42:36 - INFO - __main__ - Step 53166: {'lr': 0.0003664897219889242, 'samples': 10207872, 'steps': 53165, 'loss/train': 1.853659987449646} -11/07/2021 04:42:36 - INFO - __main__ - Step 53167: {'lr': 0.0003664850265214709, 'samples': 10208064, 'steps': 53166, 'loss/train': 1.800600528717041} -11/07/2021 04:42:37 - INFO - __main__ - Step 53168: {'lr': 0.00036648033100153117, 'samples': 10208256, 'steps': 53167, 'loss/train': 1.7309788465499878} -11/07/2021 04:42:38 - INFO - __main__ - Step 53169: {'lr': 0.0003664756354291073, 'samples': 10208448, 'steps': 53168, 'loss/train': 1.5815919637680054} -11/07/2021 04:42:38 - INFO - __main__ - Step 53170: {'lr': 0.0003664709398042012, 'samples': 10208640, 'steps': 53169, 'loss/train': 1.2343692779541016} -11/07/2021 04:42:39 - INFO - __main__ - Step 53171: {'lr': 0.00036646624412681514, 'samples': 10208832, 'steps': 53170, 'loss/train': 1.4695652723312378} -11/07/2021 04:42:39 - INFO - __main__ - Step 53172: {'lr': 0.0003664615483969511, 'samples': 10209024, 'steps': 53171, 'loss/train': 1.4880211353302002} -11/07/2021 04:42:39 - INFO - __main__ - Step 53173: {'lr': 0.0003664568526146114, 'samples': 10209216, 'steps': 53172, 'loss/train': 1.166122555732727} -11/07/2021 04:42:40 - INFO - __main__ - Step 53174: {'lr': 0.000366452156779798, 'samples': 10209408, 'steps': 53173, 'loss/train': 1.0564590692520142} -11/07/2021 04:42:41 - INFO - __main__ - Step 53175: {'lr': 0.000366447460892513, 'samples': 10209600, 'steps': 53174, 'loss/train': 1.40821373462677} -11/07/2021 04:42:41 - INFO - __main__ - Step 53176: {'lr': 0.0003664427649527587, 'samples': 10209792, 'steps': 53175, 'loss/train': 1.0120983123779297} -11/07/2021 04:42:42 - INFO - __main__ - Step 53177: {'lr': 0.000366438068960537, 'samples': 10209984, 'steps': 53176, 'loss/train': 1.0967178344726562} -11/07/2021 04:42:42 - INFO - __main__ - Step 53178: {'lr': 0.0003664333729158501, 'samples': 10210176, 'steps': 53177, 'loss/train': 1.3859779834747314} -11/07/2021 04:42:43 - INFO - __main__ - Step 53179: {'lr': 0.0003664286768187002, 'samples': 10210368, 'steps': 53178, 'loss/train': 1.549895167350769} -11/07/2021 04:42:43 - INFO - __main__ - Step 53180: {'lr': 0.0003664239806690892, 'samples': 10210560, 'steps': 53179, 'loss/train': 1.21084463596344} -11/07/2021 04:42:44 - INFO - __main__ - Step 53181: {'lr': 0.00036641928446701943, 'samples': 10210752, 'steps': 53180, 'loss/train': 1.6016613245010376} -11/07/2021 04:42:44 - INFO - __main__ - Step 53182: {'lr': 0.00036641458821249295, 'samples': 10210944, 'steps': 53181, 'loss/train': 0.8361701965332031} -11/07/2021 04:42:44 - INFO - __main__ - Step 53183: {'lr': 0.00036640989190551184, 'samples': 10211136, 'steps': 53182, 'loss/train': 1.4793580770492554} -11/07/2021 04:42:45 - INFO - __main__ - Step 53184: {'lr': 0.00036640519554607823, 'samples': 10211328, 'steps': 53183, 'loss/train': 0.36974507570266724} -11/07/2021 04:42:46 - INFO - __main__ - Step 53185: {'lr': 0.00036640049913419417, 'samples': 10211520, 'steps': 53184, 'loss/train': 1.7542303800582886} -11/07/2021 04:42:46 - INFO - __main__ - Step 53186: {'lr': 0.00036639580266986183, 'samples': 10211712, 'steps': 53185, 'loss/train': 1.954509973526001} -11/07/2021 04:42:46 - INFO - __main__ - Step 53187: {'lr': 0.00036639110615308343, 'samples': 10211904, 'steps': 53186, 'loss/train': 1.5697658061981201} -11/07/2021 04:42:47 - INFO - __main__ - Step 53188: {'lr': 0.0003663864095838609, 'samples': 10212096, 'steps': 53187, 'loss/train': 1.2949846982955933} -11/07/2021 04:42:48 - INFO - __main__ - Step 53189: {'lr': 0.0003663817129621966, 'samples': 10212288, 'steps': 53188, 'loss/train': 1.4699655771255493} -11/07/2021 04:42:48 - INFO - __main__ - Step 53190: {'lr': 0.0003663770162880924, 'samples': 10212480, 'steps': 53189, 'loss/train': 1.5642396211624146} -11/07/2021 04:42:48 - INFO - __main__ - Step 53191: {'lr': 0.00036637231956155046, 'samples': 10212672, 'steps': 53190, 'loss/train': 0.9616280794143677} -11/07/2021 04:42:49 - INFO - __main__ - Step 53192: {'lr': 0.000366367622782573, 'samples': 10212864, 'steps': 53191, 'loss/train': 1.5829464197158813} -11/07/2021 04:42:49 - INFO - __main__ - Step 53193: {'lr': 0.0003663629259511621, 'samples': 10213056, 'steps': 53192, 'loss/train': 1.0942155122756958} -11/07/2021 04:42:50 - INFO - __main__ - Step 53194: {'lr': 0.00036635822906731986, 'samples': 10213248, 'steps': 53193, 'loss/train': 0.8965877294540405} -11/07/2021 04:42:50 - INFO - __main__ - Step 53195: {'lr': 0.0003663535321310484, 'samples': 10213440, 'steps': 53194, 'loss/train': 1.493140697479248} -11/07/2021 04:42:51 - INFO - __main__ - Step 53196: {'lr': 0.00036634883514234987, 'samples': 10213632, 'steps': 53195, 'loss/train': 1.5236399173736572} -11/07/2021 04:42:51 - INFO - __main__ - Step 53197: {'lr': 0.00036634413810122626, 'samples': 10213824, 'steps': 53196, 'loss/train': 1.4427578449249268} -11/07/2021 04:42:51 - INFO - __main__ - Step 53198: {'lr': 0.0003663394410076798, 'samples': 10214016, 'steps': 53197, 'loss/train': 1.128544807434082} -11/07/2021 04:42:52 - INFO - __main__ - Step 53199: {'lr': 0.00036633474386171263, 'samples': 10214208, 'steps': 53198, 'loss/train': 1.072456955909729} -11/07/2021 04:42:53 - INFO - __main__ - Step 53200: {'lr': 0.00036633004666332674, 'samples': 10214400, 'steps': 53199, 'loss/train': 1.6818119287490845} -11/07/2021 04:42:54 - INFO - __main__ - Step 53201: {'lr': 0.0003663253494125244, 'samples': 10214592, 'steps': 53200, 'loss/train': 1.135022521018982} -11/07/2021 04:42:54 - INFO - __main__ - Step 53202: {'lr': 0.0003663206521093076, 'samples': 10214784, 'steps': 53201, 'loss/train': 2.0167996883392334} -11/07/2021 04:42:54 - INFO - __main__ - Step 53203: {'lr': 0.00036631595475367855, 'samples': 10214976, 'steps': 53202, 'loss/train': 1.3336080312728882} -11/07/2021 04:42:55 - INFO - __main__ - Step 53204: {'lr': 0.0003663112573456393, 'samples': 10215168, 'steps': 53203, 'loss/train': 1.409445881843567} -11/07/2021 04:42:56 - INFO - __main__ - Step 53205: {'lr': 0.00036630655988519203, 'samples': 10215360, 'steps': 53204, 'loss/train': 0.08970138430595398} -11/07/2021 04:42:56 - INFO - __main__ - Step 53206: {'lr': 0.00036630186237233877, 'samples': 10215552, 'steps': 53205, 'loss/train': 1.392133116722107} -11/07/2021 04:42:56 - INFO - __main__ - Step 53207: {'lr': 0.00036629716480708174, 'samples': 10215744, 'steps': 53206, 'loss/train': 1.4997931718826294} -11/07/2021 04:42:57 - INFO - __main__ - Step 53208: {'lr': 0.00036629246718942294, 'samples': 10215936, 'steps': 53207, 'loss/train': 1.5354804992675781} -11/07/2021 04:42:57 - INFO - __main__ - Step 53209: {'lr': 0.0003662877695193646, 'samples': 10216128, 'steps': 53208, 'loss/train': 1.1489993333816528} -11/07/2021 04:42:58 - INFO - __main__ - Step 53210: {'lr': 0.00036628307179690877, 'samples': 10216320, 'steps': 53209, 'loss/train': 1.0780820846557617} -11/07/2021 04:42:58 - INFO - __main__ - Step 53211: {'lr': 0.0003662783740220576, 'samples': 10216512, 'steps': 53210, 'loss/train': 1.525235652923584} -11/07/2021 04:42:59 - INFO - __main__ - Step 53212: {'lr': 0.00036627367619481316, 'samples': 10216704, 'steps': 53211, 'loss/train': 1.4894222021102905} -11/07/2021 04:42:59 - INFO - __main__ - Step 53213: {'lr': 0.00036626897831517756, 'samples': 10216896, 'steps': 53212, 'loss/train': 0.07788790017366409} -11/07/2021 04:43:00 - INFO - __main__ - Step 53214: {'lr': 0.000366264280383153, 'samples': 10217088, 'steps': 53213, 'loss/train': 2.0759551525115967} -11/07/2021 04:43:01 - INFO - __main__ - Step 53215: {'lr': 0.00036625958239874156, 'samples': 10217280, 'steps': 53214, 'loss/train': 1.3804129362106323} -11/07/2021 04:43:01 - INFO - __main__ - Step 53216: {'lr': 0.0003662548843619454, 'samples': 10217472, 'steps': 53215, 'loss/train': 1.3251698017120361} -11/07/2021 04:43:01 - INFO - __main__ - Step 53217: {'lr': 0.00036625018627276646, 'samples': 10217664, 'steps': 53216, 'loss/train': 1.5707327127456665} -11/07/2021 04:43:02 - INFO - __main__ - Step 53218: {'lr': 0.0003662454881312071, 'samples': 10217856, 'steps': 53217, 'loss/train': 1.3364756107330322} -11/07/2021 04:43:02 - INFO - __main__ - Step 53219: {'lr': 0.0003662407899372692, 'samples': 10218048, 'steps': 53218, 'loss/train': 1.5194370746612549} -11/07/2021 04:43:04 - INFO - __main__ - Step 53220: {'lr': 0.000366236091690955, 'samples': 10218240, 'steps': 53219, 'loss/train': 1.5489014387130737} -11/07/2021 04:43:04 - INFO - __main__ - Step 53221: {'lr': 0.00036623139339226664, 'samples': 10218432, 'steps': 53220, 'loss/train': 1.1221784353256226} -11/07/2021 04:43:04 - INFO - __main__ - Step 53222: {'lr': 0.00036622669504120627, 'samples': 10218624, 'steps': 53221, 'loss/train': 1.5648833513259888} -11/07/2021 04:43:05 - INFO - __main__ - Step 53223: {'lr': 0.0003662219966377759, 'samples': 10218816, 'steps': 53222, 'loss/train': 1.6098930835723877} -11/07/2021 04:43:05 - INFO - __main__ - Step 53224: {'lr': 0.0003662172981819777, 'samples': 10219008, 'steps': 53223, 'loss/train': 1.4301648139953613} -11/07/2021 04:43:05 - INFO - __main__ - Step 53225: {'lr': 0.00036621259967381374, 'samples': 10219200, 'steps': 53224, 'loss/train': 1.5039647817611694} -11/07/2021 04:43:06 - INFO - __main__ - Step 53226: {'lr': 0.0003662079011132862, 'samples': 10219392, 'steps': 53225, 'loss/train': 1.1975923776626587} -11/07/2021 04:43:07 - INFO - __main__ - Step 53227: {'lr': 0.0003662032025003972, 'samples': 10219584, 'steps': 53226, 'loss/train': 1.125380516052246} -11/07/2021 04:43:07 - INFO - __main__ - Step 53228: {'lr': 0.0003661985038351488, 'samples': 10219776, 'steps': 53227, 'loss/train': 1.6176185607910156} -11/07/2021 04:43:07 - INFO - __main__ - Step 53229: {'lr': 0.0003661938051175432, 'samples': 10219968, 'steps': 53228, 'loss/train': 1.3787031173706055} -11/07/2021 04:43:08 - INFO - __main__ - Step 53230: {'lr': 0.0003661891063475824, 'samples': 10220160, 'steps': 53229, 'loss/train': 1.0745278596878052} -11/07/2021 04:43:09 - INFO - __main__ - Step 53231: {'lr': 0.0003661844075252686, 'samples': 10220352, 'steps': 53230, 'loss/train': 1.470468282699585} -11/07/2021 04:43:09 - INFO - __main__ - Step 53232: {'lr': 0.0003661797086506039, 'samples': 10220544, 'steps': 53231, 'loss/train': 1.6155319213867188} -11/07/2021 04:43:10 - INFO - __main__ - Step 53233: {'lr': 0.0003661750097235904, 'samples': 10220736, 'steps': 53232, 'loss/train': 1.4225972890853882} -11/07/2021 04:43:10 - INFO - __main__ - Step 53234: {'lr': 0.00036617031074423023, 'samples': 10220928, 'steps': 53233, 'loss/train': 1.4886188507080078} -11/07/2021 04:43:10 - INFO - __main__ - Step 53235: {'lr': 0.00036616561171252547, 'samples': 10221120, 'steps': 53234, 'loss/train': 1.8060020208358765} -11/07/2021 04:43:11 - INFO - __main__ - Step 53236: {'lr': 0.0003661609126284784, 'samples': 10221312, 'steps': 53235, 'loss/train': 1.5143846273422241} -11/07/2021 04:43:12 - INFO - __main__ - Step 53237: {'lr': 0.00036615621349209094, 'samples': 10221504, 'steps': 53236, 'loss/train': 0.9544692635536194} -11/07/2021 04:43:12 - INFO - __main__ - Step 53238: {'lr': 0.00036615151430336536, 'samples': 10221696, 'steps': 53237, 'loss/train': 1.2647370100021362} -11/07/2021 04:43:12 - INFO - __main__ - Step 53239: {'lr': 0.0003661468150623036, 'samples': 10221888, 'steps': 53238, 'loss/train': 1.6468429565429688} -11/07/2021 04:43:13 - INFO - __main__ - Step 53240: {'lr': 0.0003661421157689079, 'samples': 10222080, 'steps': 53239, 'loss/train': 0.07004977762699127} -11/07/2021 04:43:14 - INFO - __main__ - Step 53241: {'lr': 0.00036613741642318033, 'samples': 10222272, 'steps': 53240, 'loss/train': 1.4579503536224365} -11/07/2021 04:43:14 - INFO - __main__ - Step 53242: {'lr': 0.00036613271702512306, 'samples': 10222464, 'steps': 53241, 'loss/train': 1.2062925100326538} -11/07/2021 04:43:15 - INFO - __main__ - Step 53243: {'lr': 0.00036612801757473823, 'samples': 10222656, 'steps': 53242, 'loss/train': 1.461490511894226} -11/07/2021 04:43:15 - INFO - __main__ - Step 53244: {'lr': 0.00036612331807202785, 'samples': 10222848, 'steps': 53243, 'loss/train': 1.7669768333435059} -11/07/2021 04:43:15 - INFO - __main__ - Step 53245: {'lr': 0.00036611861851699415, 'samples': 10223040, 'steps': 53244, 'loss/train': 1.256188988685608} -11/07/2021 04:43:16 - INFO - __main__ - Step 53246: {'lr': 0.00036611391890963913, 'samples': 10223232, 'steps': 53245, 'loss/train': 1.417641520500183} -11/07/2021 04:43:17 - INFO - __main__ - Step 53247: {'lr': 0.000366109219249965, 'samples': 10223424, 'steps': 53246, 'loss/train': 1.5248044729232788} -11/07/2021 04:43:17 - INFO - __main__ - Step 53248: {'lr': 0.00036610451953797386, 'samples': 10223616, 'steps': 53247, 'loss/train': 1.5818085670471191} -11/07/2021 04:43:17 - INFO - __main__ - Step 53249: {'lr': 0.0003660998197736677, 'samples': 10223808, 'steps': 53248, 'loss/train': 1.3921006917953491} -11/07/2021 04:43:18 - INFO - __main__ - Step 53250: {'lr': 0.00036609511995704894, 'samples': 10224000, 'steps': 53249, 'loss/train': 1.4409935474395752} -11/07/2021 04:43:19 - INFO - __main__ - Step 53251: {'lr': 0.0003660904200881194, 'samples': 10224192, 'steps': 53250, 'loss/train': 1.338744044303894} -11/07/2021 04:43:19 - INFO - __main__ - Step 53252: {'lr': 0.00036608572016688136, 'samples': 10224384, 'steps': 53251, 'loss/train': 1.491830825805664} -11/07/2021 04:43:19 - INFO - __main__ - Step 53253: {'lr': 0.00036608102019333684, 'samples': 10224576, 'steps': 53252, 'loss/train': 1.646281361579895} -11/07/2021 04:43:20 - INFO - __main__ - Step 53254: {'lr': 0.00036607632016748796, 'samples': 10224768, 'steps': 53253, 'loss/train': 1.2800869941711426} -11/07/2021 04:43:20 - INFO - __main__ - Step 53255: {'lr': 0.00036607162008933696, 'samples': 10224960, 'steps': 53254, 'loss/train': 1.4255291223526} -11/07/2021 04:43:21 - INFO - __main__ - Step 53256: {'lr': 0.00036606691995888594, 'samples': 10225152, 'steps': 53255, 'loss/train': 1.3554235696792603} -11/07/2021 04:43:21 - INFO - __main__ - Step 53257: {'lr': 0.00036606221977613686, 'samples': 10225344, 'steps': 53256, 'loss/train': 1.6191420555114746} -11/07/2021 04:43:22 - INFO - __main__ - Step 53258: {'lr': 0.0003660575195410919, 'samples': 10225536, 'steps': 53257, 'loss/train': 1.1593029499053955} -11/07/2021 04:43:22 - INFO - __main__ - Step 53259: {'lr': 0.0003660528192537533, 'samples': 10225728, 'steps': 53258, 'loss/train': 1.086011528968811} -11/07/2021 04:43:22 - INFO - __main__ - Step 53260: {'lr': 0.00036604811891412296, 'samples': 10225920, 'steps': 53259, 'loss/train': 1.4210145473480225} -11/07/2021 04:43:24 - INFO - __main__ - Step 53261: {'lr': 0.00036604341852220325, 'samples': 10226112, 'steps': 53260, 'loss/train': 1.5465900897979736} -11/07/2021 04:43:24 - INFO - __main__ - Step 53262: {'lr': 0.00036603871807799616, 'samples': 10226304, 'steps': 53261, 'loss/train': 1.6001391410827637} -11/07/2021 04:43:24 - INFO - __main__ - Step 53263: {'lr': 0.0003660340175815038, 'samples': 10226496, 'steps': 53262, 'loss/train': 1.5498238801956177} -11/07/2021 04:43:25 - INFO - __main__ - Step 53264: {'lr': 0.0003660293170327283, 'samples': 10226688, 'steps': 53263, 'loss/train': 1.7648087739944458} -11/07/2021 04:43:25 - INFO - __main__ - Step 53265: {'lr': 0.0003660246164316717, 'samples': 10226880, 'steps': 53264, 'loss/train': 1.5192945003509521} -11/07/2021 04:43:26 - INFO - __main__ - Step 53266: {'lr': 0.00036601991577833634, 'samples': 10227072, 'steps': 53265, 'loss/train': 1.386931300163269} -11/07/2021 04:43:26 - INFO - __main__ - Step 53267: {'lr': 0.00036601521507272414, 'samples': 10227264, 'steps': 53266, 'loss/train': 1.0379760265350342} -11/07/2021 04:43:27 - INFO - __main__ - Step 53268: {'lr': 0.00036601051431483725, 'samples': 10227456, 'steps': 53267, 'loss/train': 1.528818130493164} -11/07/2021 04:43:27 - INFO - __main__ - Step 53269: {'lr': 0.0003660058135046778, 'samples': 10227648, 'steps': 53268, 'loss/train': 1.4720981121063232} -11/07/2021 04:43:27 - INFO - __main__ - Step 53270: {'lr': 0.000366001112642248, 'samples': 10227840, 'steps': 53269, 'loss/train': 1.534490942955017} -11/07/2021 04:43:28 - INFO - __main__ - Step 53271: {'lr': 0.00036599641172754984, 'samples': 10228032, 'steps': 53270, 'loss/train': 1.5040323734283447} -11/07/2021 04:43:29 - INFO - __main__ - Step 53272: {'lr': 0.0003659917107605854, 'samples': 10228224, 'steps': 53271, 'loss/train': 1.1398561000823975} -11/07/2021 04:43:29 - INFO - __main__ - Step 53273: {'lr': 0.000365987009741357, 'samples': 10228416, 'steps': 53272, 'loss/train': 0.8920938968658447} -11/07/2021 04:43:29 - INFO - __main__ - Step 53274: {'lr': 0.0003659823086698666, 'samples': 10228608, 'steps': 53273, 'loss/train': 1.3302233219146729} -11/07/2021 04:43:30 - INFO - __main__ - Step 53275: {'lr': 0.0003659776075461164, 'samples': 10228800, 'steps': 53274, 'loss/train': 1.2213811874389648} -11/07/2021 04:43:31 - INFO - __main__ - Step 53276: {'lr': 0.0003659729063701084, 'samples': 10228992, 'steps': 53275, 'loss/train': 1.399293303489685} -11/07/2021 04:43:31 - INFO - __main__ - Step 53277: {'lr': 0.00036596820514184485, 'samples': 10229184, 'steps': 53276, 'loss/train': 1.7406283617019653} -11/07/2021 04:43:32 - INFO - __main__ - Step 53278: {'lr': 0.00036596350386132784, 'samples': 10229376, 'steps': 53277, 'loss/train': 1.2684037685394287} -11/07/2021 04:43:32 - INFO - __main__ - Step 53279: {'lr': 0.0003659588025285594, 'samples': 10229568, 'steps': 53278, 'loss/train': 1.9442917108535767} -11/07/2021 04:43:32 - INFO - __main__ - Step 53280: {'lr': 0.0003659541011435418, 'samples': 10229760, 'steps': 53279, 'loss/train': 1.444143295288086} -11/07/2021 04:43:33 - INFO - __main__ - Step 53281: {'lr': 0.00036594939970627704, 'samples': 10229952, 'steps': 53280, 'loss/train': 1.5801076889038086} -11/07/2021 04:43:34 - INFO - __main__ - Step 53282: {'lr': 0.0003659446982167672, 'samples': 10230144, 'steps': 53281, 'loss/train': 1.7955842018127441} -11/07/2021 04:43:34 - INFO - __main__ - Step 53283: {'lr': 0.00036593999667501457, 'samples': 10230336, 'steps': 53282, 'loss/train': 1.5097438097000122} -11/07/2021 04:43:34 - INFO - __main__ - Step 53284: {'lr': 0.0003659352950810211, 'samples': 10230528, 'steps': 53283, 'loss/train': 1.2218964099884033} -11/07/2021 04:43:35 - INFO - __main__ - Step 53285: {'lr': 0.00036593059343478904, 'samples': 10230720, 'steps': 53284, 'loss/train': 1.3489710092544556} -11/07/2021 04:43:36 - INFO - __main__ - Step 53286: {'lr': 0.0003659258917363204, 'samples': 10230912, 'steps': 53285, 'loss/train': 1.256871223449707} -11/07/2021 04:43:36 - INFO - __main__ - Step 53287: {'lr': 0.0003659211899856173, 'samples': 10231104, 'steps': 53286, 'loss/train': 1.3437983989715576} -11/07/2021 04:43:36 - INFO - __main__ - Step 53288: {'lr': 0.0003659164881826819, 'samples': 10231296, 'steps': 53287, 'loss/train': 1.0385193824768066} -11/07/2021 04:43:37 - INFO - __main__ - Step 53289: {'lr': 0.00036591178632751635, 'samples': 10231488, 'steps': 53288, 'loss/train': 1.3750908374786377} -11/07/2021 04:43:37 - INFO - __main__ - Step 53290: {'lr': 0.00036590708442012275, 'samples': 10231680, 'steps': 53289, 'loss/train': 1.4072775840759277} -11/07/2021 04:43:38 - INFO - __main__ - Step 53291: {'lr': 0.0003659023824605033, 'samples': 10231872, 'steps': 53290, 'loss/train': 1.370407223701477} -11/07/2021 04:43:38 - INFO - __main__ - Step 53292: {'lr': 0.0003658976804486599, 'samples': 10232064, 'steps': 53291, 'loss/train': 1.3309603929519653} -11/07/2021 04:43:39 - INFO - __main__ - Step 53293: {'lr': 0.0003658929783845948, 'samples': 10232256, 'steps': 53292, 'loss/train': 1.2490254640579224} -11/07/2021 04:43:39 - INFO - __main__ - Step 53294: {'lr': 0.0003658882762683101, 'samples': 10232448, 'steps': 53293, 'loss/train': 1.263980507850647} -11/07/2021 04:43:39 - INFO - __main__ - Step 53295: {'lr': 0.000365883574099808, 'samples': 10232640, 'steps': 53294, 'loss/train': 1.3692395687103271} -11/07/2021 04:43:40 - INFO - __main__ - Step 53296: {'lr': 0.00036587887187909045, 'samples': 10232832, 'steps': 53295, 'loss/train': 1.2554272413253784} -11/07/2021 04:43:41 - INFO - __main__ - Step 53297: {'lr': 0.0003658741696061598, 'samples': 10233024, 'steps': 53296, 'loss/train': 1.6472340822219849} -11/07/2021 04:43:41 - INFO - __main__ - Step 53298: {'lr': 0.0003658694672810179, 'samples': 10233216, 'steps': 53297, 'loss/train': 1.2174272537231445} -11/07/2021 04:43:41 - INFO - __main__ - Step 53299: {'lr': 0.00036586476490366713, 'samples': 10233408, 'steps': 53298, 'loss/train': 0.06238739192485809} -11/07/2021 04:43:42 - INFO - __main__ - Step 53300: {'lr': 0.0003658600624741094, 'samples': 10233600, 'steps': 53299, 'loss/train': 1.3266628980636597} -11/07/2021 04:43:42 - INFO - __main__ - Step 53301: {'lr': 0.00036585535999234697, 'samples': 10233792, 'steps': 53300, 'loss/train': 1.4299750328063965} -11/07/2021 04:43:44 - INFO - __main__ - Step 53302: {'lr': 0.0003658506574583819, 'samples': 10233984, 'steps': 53301, 'loss/train': 1.2797915935516357} -11/07/2021 04:43:44 - INFO - __main__ - Step 53303: {'lr': 0.0003658459548722163, 'samples': 10234176, 'steps': 53302, 'loss/train': 1.6376073360443115} -11/07/2021 04:43:44 - INFO - __main__ - Step 53304: {'lr': 0.00036584125223385224, 'samples': 10234368, 'steps': 53303, 'loss/train': 1.6182200908660889} -11/07/2021 04:43:45 - INFO - __main__ - Step 53305: {'lr': 0.0003658365495432919, 'samples': 10234560, 'steps': 53304, 'loss/train': 1.4072526693344116} -11/07/2021 04:43:45 - INFO - __main__ - Step 53306: {'lr': 0.0003658318468005375, 'samples': 10234752, 'steps': 53305, 'loss/train': 1.190161943435669} -11/07/2021 04:43:46 - INFO - __main__ - Step 53307: {'lr': 0.000365827144005591, 'samples': 10234944, 'steps': 53306, 'loss/train': 1.2810604572296143} -11/07/2021 04:43:46 - INFO - __main__ - Step 53308: {'lr': 0.0003658224411584545, 'samples': 10235136, 'steps': 53307, 'loss/train': 1.5987610816955566} -11/07/2021 04:43:47 - INFO - __main__ - Step 53309: {'lr': 0.0003658177382591303, 'samples': 10235328, 'steps': 53308, 'loss/train': 1.5264441967010498} -11/07/2021 04:43:47 - INFO - __main__ - Step 53310: {'lr': 0.0003658130353076204, 'samples': 10235520, 'steps': 53309, 'loss/train': 1.1257977485656738} -11/07/2021 04:43:47 - INFO - __main__ - Step 53311: {'lr': 0.00036580833230392696, 'samples': 10235712, 'steps': 53310, 'loss/train': 1.4543594121932983} -11/07/2021 04:43:48 - INFO - __main__ - Step 53312: {'lr': 0.00036580362924805204, 'samples': 10235904, 'steps': 53311, 'loss/train': 1.5833771228790283} -11/07/2021 04:43:49 - INFO - __main__ - Step 53313: {'lr': 0.0003657989261399978, 'samples': 10236096, 'steps': 53312, 'loss/train': 1.826405644416809} -11/07/2021 04:43:49 - INFO - __main__ - Step 53314: {'lr': 0.0003657942229797663, 'samples': 10236288, 'steps': 53313, 'loss/train': 1.50407075881958} -11/07/2021 04:43:49 - INFO - __main__ - Step 53315: {'lr': 0.00036578951976735973, 'samples': 10236480, 'steps': 53314, 'loss/train': 1.4628835916519165} -11/07/2021 04:43:50 - INFO - __main__ - Step 53316: {'lr': 0.00036578481650278023, 'samples': 10236672, 'steps': 53315, 'loss/train': 1.3163783550262451} -11/07/2021 04:43:51 - INFO - __main__ - Step 53317: {'lr': 0.0003657801131860299, 'samples': 10236864, 'steps': 53316, 'loss/train': 1.312928557395935} -11/07/2021 04:43:51 - INFO - __main__ - Step 53318: {'lr': 0.0003657754098171108, 'samples': 10237056, 'steps': 53317, 'loss/train': 1.446033239364624} -11/07/2021 04:43:51 - INFO - __main__ - Step 53319: {'lr': 0.0003657707063960251, 'samples': 10237248, 'steps': 53318, 'loss/train': 1.3465927839279175} -11/07/2021 04:43:52 - INFO - __main__ - Step 53320: {'lr': 0.00036576600292277477, 'samples': 10237440, 'steps': 53319, 'loss/train': 1.060685634613037} -11/07/2021 04:43:52 - INFO - __main__ - Step 53321: {'lr': 0.0003657612993973622, 'samples': 10237632, 'steps': 53320, 'loss/train': 1.0209652185440063} -11/07/2021 04:43:53 - INFO - __main__ - Step 53322: {'lr': 0.00036575659581978935, 'samples': 10237824, 'steps': 53321, 'loss/train': 1.5221610069274902} -11/07/2021 04:43:53 - INFO - __main__ - Step 53323: {'lr': 0.0003657518921900583, 'samples': 10238016, 'steps': 53322, 'loss/train': 1.7708724737167358} -11/07/2021 04:43:54 - INFO - __main__ - Step 53324: {'lr': 0.0003657471885081714, 'samples': 10238208, 'steps': 53323, 'loss/train': 1.097522258758545} -11/07/2021 04:43:54 - INFO - __main__ - Step 53325: {'lr': 0.0003657424847741305, 'samples': 10238400, 'steps': 53324, 'loss/train': 1.5267057418823242} -11/07/2021 04:43:55 - INFO - __main__ - Step 53326: {'lr': 0.0003657377809879378, 'samples': 10238592, 'steps': 53325, 'loss/train': 1.7962665557861328} -11/07/2021 04:43:55 - INFO - __main__ - Step 53327: {'lr': 0.0003657330771495955, 'samples': 10238784, 'steps': 53326, 'loss/train': 1.2069767713546753} -11/07/2021 04:43:56 - INFO - __main__ - Step 53328: {'lr': 0.0003657283732591056, 'samples': 10238976, 'steps': 53327, 'loss/train': 1.2866443395614624} -11/07/2021 04:43:56 - INFO - __main__ - Step 53329: {'lr': 0.00036572366931647034, 'samples': 10239168, 'steps': 53328, 'loss/train': 1.5319390296936035} -11/07/2021 04:43:57 - INFO - __main__ - Step 53330: {'lr': 0.0003657189653216918, 'samples': 10239360, 'steps': 53329, 'loss/train': 0.8240731954574585} -11/07/2021 04:43:57 - INFO - __main__ - Step 53331: {'lr': 0.000365714261274772, 'samples': 10239552, 'steps': 53330, 'loss/train': 1.9161169528961182} -11/07/2021 04:43:57 - INFO - __main__ - Step 53332: {'lr': 0.00036570955717571315, 'samples': 10239744, 'steps': 53331, 'loss/train': 1.3911247253417969} -11/07/2021 04:43:58 - INFO - __main__ - Step 53333: {'lr': 0.0003657048530245174, 'samples': 10239936, 'steps': 53332, 'loss/train': 1.295586347579956} -11/07/2021 04:43:59 - INFO - __main__ - Step 53334: {'lr': 0.0003657001488211868, 'samples': 10240128, 'steps': 53333, 'loss/train': 0.737235426902771} -11/07/2021 04:43:59 - INFO - __main__ - Step 53335: {'lr': 0.00036569544456572346, 'samples': 10240320, 'steps': 53334, 'loss/train': 1.0752605199813843} -11/07/2021 04:44:00 - INFO - __main__ - Step 53336: {'lr': 0.0003656907402581296, 'samples': 10240512, 'steps': 53335, 'loss/train': 1.7795945405960083} -11/07/2021 04:44:00 - INFO - __main__ - Step 53337: {'lr': 0.00036568603589840734, 'samples': 10240704, 'steps': 53336, 'loss/train': 1.2930161952972412} -11/07/2021 04:44:01 - INFO - __main__ - Step 53338: {'lr': 0.00036568133148655855, 'samples': 10240896, 'steps': 53337, 'loss/train': 1.6007355451583862} -11/07/2021 04:44:01 - INFO - __main__ - Step 53339: {'lr': 0.0003656766270225857, 'samples': 10241088, 'steps': 53338, 'loss/train': 1.1706973314285278} -11/07/2021 04:44:02 - INFO - __main__ - Step 53340: {'lr': 0.00036567192250649066, 'samples': 10241280, 'steps': 53339, 'loss/train': 1.1047382354736328} -11/07/2021 04:44:02 - INFO - __main__ - Step 53341: {'lr': 0.0003656672179382757, 'samples': 10241472, 'steps': 53340, 'loss/train': 1.2220205068588257} -11/07/2021 04:44:02 - INFO - __main__ - Step 53342: {'lr': 0.00036566251331794284, 'samples': 10241664, 'steps': 53341, 'loss/train': 1.6235361099243164} -11/07/2021 04:44:03 - INFO - __main__ - Step 53343: {'lr': 0.00036565780864549423, 'samples': 10241856, 'steps': 53342, 'loss/train': 1.4334454536437988} -11/07/2021 04:44:04 - INFO - __main__ - Step 53344: {'lr': 0.00036565310392093204, 'samples': 10242048, 'steps': 53343, 'loss/train': 1.7549564838409424} -11/07/2021 04:44:04 - INFO - __main__ - Step 53345: {'lr': 0.0003656483991442583, 'samples': 10242240, 'steps': 53344, 'loss/train': 1.4066451787948608} -11/07/2021 04:44:04 - INFO - __main__ - Step 53346: {'lr': 0.0003656436943154752, 'samples': 10242432, 'steps': 53345, 'loss/train': 0.18494181334972382} -11/07/2021 04:44:05 - INFO - __main__ - Step 53347: {'lr': 0.0003656389894345848, 'samples': 10242624, 'steps': 53346, 'loss/train': 2.0516510009765625} -11/07/2021 04:44:06 - INFO - __main__ - Step 53348: {'lr': 0.0003656342845015893, 'samples': 10242816, 'steps': 53347, 'loss/train': 1.5392905473709106} -11/07/2021 04:44:06 - INFO - __main__ - Step 53349: {'lr': 0.00036562957951649075, 'samples': 10243008, 'steps': 53348, 'loss/train': 1.7591869831085205} -11/07/2021 04:44:06 - INFO - __main__ - Step 53350: {'lr': 0.00036562487447929133, 'samples': 10243200, 'steps': 53349, 'loss/train': 1.567441463470459} -11/07/2021 04:44:07 - INFO - __main__ - Step 53351: {'lr': 0.0003656201693899931, 'samples': 10243392, 'steps': 53350, 'loss/train': 1.250799298286438} -11/07/2021 04:44:07 - INFO - __main__ - Step 53352: {'lr': 0.0003656154642485982, 'samples': 10243584, 'steps': 53351, 'loss/train': 1.1381863355636597} -11/07/2021 04:44:08 - INFO - __main__ - Step 53353: {'lr': 0.00036561075905510874, 'samples': 10243776, 'steps': 53352, 'loss/train': 1.5367908477783203} -11/07/2021 04:44:09 - INFO - __main__ - Step 53354: {'lr': 0.00036560605380952686, 'samples': 10243968, 'steps': 53353, 'loss/train': 1.4778127670288086} -11/07/2021 04:44:09 - INFO - __main__ - Step 53355: {'lr': 0.00036560134851185475, 'samples': 10244160, 'steps': 53354, 'loss/train': 1.3822078704833984} -11/07/2021 04:44:09 - INFO - __main__ - Step 53356: {'lr': 0.00036559664316209437, 'samples': 10244352, 'steps': 53355, 'loss/train': 0.31846997141838074} -11/07/2021 04:44:10 - INFO - __main__ - Step 53357: {'lr': 0.00036559193776024794, 'samples': 10244544, 'steps': 53356, 'loss/train': 1.2317649126052856} -11/07/2021 04:44:11 - INFO - __main__ - Step 53358: {'lr': 0.00036558723230631764, 'samples': 10244736, 'steps': 53357, 'loss/train': 1.395480751991272} -11/07/2021 04:44:11 - INFO - __main__ - Step 53359: {'lr': 0.00036558252680030546, 'samples': 10244928, 'steps': 53358, 'loss/train': 1.1462469100952148} -11/07/2021 04:44:11 - INFO - __main__ - Step 53360: {'lr': 0.0003655778212422135, 'samples': 10245120, 'steps': 53359, 'loss/train': 1.554935097694397} -11/07/2021 04:44:12 - INFO - __main__ - Step 53361: {'lr': 0.0003655731156320441, 'samples': 10245312, 'steps': 53360, 'loss/train': 0.32667481899261475} -11/07/2021 04:44:12 - INFO - __main__ - Step 53362: {'lr': 0.00036556840996979914, 'samples': 10245504, 'steps': 53361, 'loss/train': 1.145167350769043} -11/07/2021 04:44:13 - INFO - __main__ - Step 53363: {'lr': 0.0003655637042554809, 'samples': 10245696, 'steps': 53362, 'loss/train': 1.7694740295410156} -11/07/2021 04:44:13 - INFO - __main__ - Step 53364: {'lr': 0.0003655589984890914, 'samples': 10245888, 'steps': 53363, 'loss/train': 0.7376524209976196} -11/07/2021 04:44:14 - INFO - __main__ - Step 53365: {'lr': 0.00036555429267063277, 'samples': 10246080, 'steps': 53364, 'loss/train': 1.1962106227874756} -11/07/2021 04:44:14 - INFO - __main__ - Step 53366: {'lr': 0.0003655495868001072, 'samples': 10246272, 'steps': 53365, 'loss/train': 1.0792287588119507} -11/07/2021 04:44:14 - INFO - __main__ - Step 53367: {'lr': 0.00036554488087751674, 'samples': 10246464, 'steps': 53366, 'loss/train': 1.6274288892745972} -11/07/2021 04:44:16 - INFO - __main__ - Step 53368: {'lr': 0.00036554017490286354, 'samples': 10246656, 'steps': 53367, 'loss/train': 1.4863463640213013} -11/07/2021 04:44:16 - INFO - __main__ - Step 53369: {'lr': 0.0003655354688761498, 'samples': 10246848, 'steps': 53368, 'loss/train': 1.4312962293624878} -11/07/2021 04:44:16 - INFO - __main__ - Step 53370: {'lr': 0.00036553076279737743, 'samples': 10247040, 'steps': 53369, 'loss/train': 2.0777783393859863} -11/07/2021 04:44:17 - INFO - __main__ - Step 53371: {'lr': 0.0003655260566665488, 'samples': 10247232, 'steps': 53370, 'loss/train': 1.3745750188827515} -11/07/2021 04:44:17 - INFO - __main__ - Step 53372: {'lr': 0.0003655213504836659, 'samples': 10247424, 'steps': 53371, 'loss/train': 1.7350544929504395} -11/07/2021 04:44:17 - INFO - __main__ - Step 53373: {'lr': 0.00036551664424873084, 'samples': 10247616, 'steps': 53372, 'loss/train': 1.1542366743087769} -11/07/2021 04:44:18 - INFO - __main__ - Step 53374: {'lr': 0.00036551193796174577, 'samples': 10247808, 'steps': 53373, 'loss/train': 1.0817580223083496} -11/07/2021 04:44:19 - INFO - __main__ - Step 53375: {'lr': 0.0003655072316227127, 'samples': 10248000, 'steps': 53374, 'loss/train': 1.3213239908218384} -11/07/2021 04:44:19 - INFO - __main__ - Step 53376: {'lr': 0.000365502525231634, 'samples': 10248192, 'steps': 53375, 'loss/train': 1.5007151365280151} -11/07/2021 04:44:19 - INFO - __main__ - Step 53377: {'lr': 0.00036549781878851155, 'samples': 10248384, 'steps': 53376, 'loss/train': 1.3726071119308472} -11/07/2021 04:44:20 - INFO - __main__ - Step 53378: {'lr': 0.0003654931122933476, 'samples': 10248576, 'steps': 53377, 'loss/train': 0.986018180847168} -11/07/2021 04:44:21 - INFO - __main__ - Step 53379: {'lr': 0.0003654884057461443, 'samples': 10248768, 'steps': 53378, 'loss/train': 1.1477071046829224} -11/07/2021 04:44:21 - INFO - __main__ - Step 53380: {'lr': 0.0003654836991469036, 'samples': 10248960, 'steps': 53379, 'loss/train': 1.3435907363891602} -11/07/2021 04:44:21 - INFO - __main__ - Step 53381: {'lr': 0.00036547899249562776, 'samples': 10249152, 'steps': 53380, 'loss/train': 1.4615086317062378} -11/07/2021 04:44:22 - INFO - __main__ - Step 53382: {'lr': 0.00036547428579231886, 'samples': 10249344, 'steps': 53381, 'loss/train': 1.4760574102401733} -11/07/2021 04:44:22 - INFO - __main__ - Step 53383: {'lr': 0.000365469579036979, 'samples': 10249536, 'steps': 53382, 'loss/train': 1.1706430912017822} -11/07/2021 04:44:23 - INFO - __main__ - Step 53384: {'lr': 0.00036546487222961045, 'samples': 10249728, 'steps': 53383, 'loss/train': 1.2544550895690918} -11/07/2021 04:44:24 - INFO - __main__ - Step 53385: {'lr': 0.0003654601653702151, 'samples': 10249920, 'steps': 53384, 'loss/train': 1.4860308170318604} -11/07/2021 04:44:24 - INFO - __main__ - Step 53386: {'lr': 0.0003654554584587952, 'samples': 10250112, 'steps': 53385, 'loss/train': 1.3248411417007446} -11/07/2021 04:44:24 - INFO - __main__ - Step 53387: {'lr': 0.0003654507514953529, 'samples': 10250304, 'steps': 53386, 'loss/train': 1.7449822425842285} -11/07/2021 04:44:25 - INFO - __main__ - Step 53388: {'lr': 0.0003654460444798902, 'samples': 10250496, 'steps': 53387, 'loss/train': 1.3748877048492432} -11/07/2021 04:44:26 - INFO - __main__ - Step 53389: {'lr': 0.00036544133741240936, 'samples': 10250688, 'steps': 53388, 'loss/train': 1.5594673156738281} -11/07/2021 04:44:26 - INFO - __main__ - Step 53390: {'lr': 0.0003654366302929124, 'samples': 10250880, 'steps': 53389, 'loss/train': 1.599009394645691} -11/07/2021 04:44:26 - INFO - __main__ - Step 53391: {'lr': 0.0003654319231214015, 'samples': 10251072, 'steps': 53390, 'loss/train': 1.4899357557296753} -11/07/2021 04:44:27 - INFO - __main__ - Step 53392: {'lr': 0.00036542721589787877, 'samples': 10251264, 'steps': 53391, 'loss/train': 1.1830111742019653} -11/07/2021 04:44:27 - INFO - __main__ - Step 53393: {'lr': 0.0003654225086223463, 'samples': 10251456, 'steps': 53392, 'loss/train': 2.0893449783325195} -11/07/2021 04:44:28 - INFO - __main__ - Step 53394: {'lr': 0.00036541780129480616, 'samples': 10251648, 'steps': 53393, 'loss/train': 1.5052937269210815} -11/07/2021 04:44:28 - INFO - __main__ - Step 53395: {'lr': 0.00036541309391526064, 'samples': 10251840, 'steps': 53394, 'loss/train': 0.8931623697280884} -11/07/2021 04:44:29 - INFO - __main__ - Step 53396: {'lr': 0.0003654083864837117, 'samples': 10252032, 'steps': 53395, 'loss/train': 1.2950444221496582} -11/07/2021 04:44:29 - INFO - __main__ - Step 53397: {'lr': 0.0003654036790001616, 'samples': 10252224, 'steps': 53396, 'loss/train': 1.530462622642517} -11/07/2021 04:44:29 - INFO - __main__ - Step 53398: {'lr': 0.00036539897146461227, 'samples': 10252416, 'steps': 53397, 'loss/train': 1.3619475364685059} -11/07/2021 04:44:30 - INFO - __main__ - Step 53399: {'lr': 0.000365394263877066, 'samples': 10252608, 'steps': 53398, 'loss/train': 1.2248635292053223} -11/07/2021 04:44:31 - INFO - __main__ - Step 53400: {'lr': 0.0003653895562375248, 'samples': 10252800, 'steps': 53399, 'loss/train': 1.672544002532959} -11/07/2021 04:44:31 - INFO - __main__ - Step 53401: {'lr': 0.0003653848485459909, 'samples': 10252992, 'steps': 53400, 'loss/train': 1.9200359582901} -11/07/2021 04:44:31 - INFO - __main__ - Step 53402: {'lr': 0.0003653801408024664, 'samples': 10253184, 'steps': 53401, 'loss/train': 1.3319880962371826} -11/07/2021 04:44:32 - INFO - __main__ - Step 53403: {'lr': 0.00036537543300695335, 'samples': 10253376, 'steps': 53402, 'loss/train': 1.3862860202789307} -11/07/2021 04:44:33 - INFO - __main__ - Step 53404: {'lr': 0.0003653707251594539, 'samples': 10253568, 'steps': 53403, 'loss/train': 0.7829197645187378} -11/07/2021 04:44:33 - INFO - __main__ - Step 53405: {'lr': 0.0003653660172599702, 'samples': 10253760, 'steps': 53404, 'loss/train': 1.0968180894851685} -11/07/2021 04:44:34 - INFO - __main__ - Step 53406: {'lr': 0.00036536130930850435, 'samples': 10253952, 'steps': 53405, 'loss/train': 1.2832274436950684} -11/07/2021 04:44:34 - INFO - __main__ - Step 53407: {'lr': 0.0003653566013050585, 'samples': 10254144, 'steps': 53406, 'loss/train': 1.0513582229614258} -11/07/2021 04:44:34 - INFO - __main__ - Step 53408: {'lr': 0.0003653518932496347, 'samples': 10254336, 'steps': 53407, 'loss/train': 1.6917462348937988} -11/07/2021 04:44:35 - INFO - __main__ - Step 53409: {'lr': 0.00036534718514223517, 'samples': 10254528, 'steps': 53408, 'loss/train': 1.126509428024292} -11/07/2021 04:44:36 - INFO - __main__ - Step 53410: {'lr': 0.00036534247698286195, 'samples': 10254720, 'steps': 53409, 'loss/train': 1.294304609298706} -11/07/2021 04:44:36 - INFO - __main__ - Step 53411: {'lr': 0.0003653377687715171, 'samples': 10254912, 'steps': 53410, 'loss/train': 1.2954366207122803} -11/07/2021 04:44:36 - INFO - __main__ - Step 53412: {'lr': 0.00036533306050820296, 'samples': 10255104, 'steps': 53411, 'loss/train': 1.6132702827453613} -11/07/2021 04:44:37 - INFO - __main__ - Step 53413: {'lr': 0.00036532835219292147, 'samples': 10255296, 'steps': 53412, 'loss/train': 1.3538674116134644} -11/07/2021 04:44:37 - INFO - __main__ - Step 53414: {'lr': 0.0003653236438256748, 'samples': 10255488, 'steps': 53413, 'loss/train': 1.5556293725967407} -11/07/2021 04:44:38 - INFO - __main__ - Step 53415: {'lr': 0.0003653189354064652, 'samples': 10255680, 'steps': 53414, 'loss/train': 1.6456143856048584} -11/07/2021 04:44:38 - INFO - __main__ - Step 53416: {'lr': 0.0003653142269352945, 'samples': 10255872, 'steps': 53415, 'loss/train': 1.5403021574020386} -11/07/2021 04:44:39 - INFO - __main__ - Step 53417: {'lr': 0.00036530951841216505, 'samples': 10256064, 'steps': 53416, 'loss/train': 1.4491617679595947} -11/07/2021 04:44:39 - INFO - __main__ - Step 53418: {'lr': 0.00036530480983707885, 'samples': 10256256, 'steps': 53417, 'loss/train': 1.2381377220153809} -11/07/2021 04:44:39 - INFO - __main__ - Step 53419: {'lr': 0.0003653001012100382, 'samples': 10256448, 'steps': 53418, 'loss/train': 1.6028646230697632} -11/07/2021 04:44:41 - INFO - __main__ - Step 53420: {'lr': 0.00036529539253104507, 'samples': 10256640, 'steps': 53419, 'loss/train': 1.0861432552337646} -11/07/2021 04:44:41 - INFO - __main__ - Step 53421: {'lr': 0.00036529068380010155, 'samples': 10256832, 'steps': 53420, 'loss/train': 1.8178462982177734} -11/07/2021 04:44:41 - INFO - __main__ - Step 53422: {'lr': 0.00036528597501720984, 'samples': 10257024, 'steps': 53421, 'loss/train': 0.979706346988678} -11/07/2021 04:44:42 - INFO - __main__ - Step 53423: {'lr': 0.00036528126618237206, 'samples': 10257216, 'steps': 53422, 'loss/train': 1.5682344436645508} -11/07/2021 04:44:42 - INFO - __main__ - Step 53424: {'lr': 0.00036527655729559036, 'samples': 10257408, 'steps': 53423, 'loss/train': 1.6208622455596924} -11/07/2021 04:44:43 - INFO - __main__ - Step 53425: {'lr': 0.0003652718483568668, 'samples': 10257600, 'steps': 53424, 'loss/train': 1.4337201118469238} -11/07/2021 04:44:43 - INFO - __main__ - Step 53426: {'lr': 0.00036526713936620354, 'samples': 10257792, 'steps': 53425, 'loss/train': 1.003976821899414} -11/07/2021 04:44:44 - INFO - __main__ - Step 53427: {'lr': 0.00036526243032360264, 'samples': 10257984, 'steps': 53426, 'loss/train': 1.253382682800293} -11/07/2021 04:44:44 - INFO - __main__ - Step 53428: {'lr': 0.0003652577212290663, 'samples': 10258176, 'steps': 53427, 'loss/train': 1.2909741401672363} -11/07/2021 04:44:44 - INFO - __main__ - Step 53429: {'lr': 0.0003652530120825966, 'samples': 10258368, 'steps': 53428, 'loss/train': 1.1331803798675537} -11/07/2021 04:44:45 - INFO - __main__ - Step 53430: {'lr': 0.0003652483028841956, 'samples': 10258560, 'steps': 53429, 'loss/train': 1.1578407287597656} -11/07/2021 04:44:46 - INFO - __main__ - Step 53431: {'lr': 0.0003652435936338656, 'samples': 10258752, 'steps': 53430, 'loss/train': 1.2707332372665405} -11/07/2021 04:44:46 - INFO - __main__ - Step 53432: {'lr': 0.00036523888433160864, 'samples': 10258944, 'steps': 53431, 'loss/train': 0.9340760111808777} -11/07/2021 04:44:46 - INFO - __main__ - Step 53433: {'lr': 0.00036523417497742673, 'samples': 10259136, 'steps': 53432, 'loss/train': 1.292786717414856} -11/07/2021 04:44:47 - INFO - __main__ - Step 53434: {'lr': 0.00036522946557132206, 'samples': 10259328, 'steps': 53433, 'loss/train': 1.3662357330322266} -11/07/2021 04:44:48 - INFO - __main__ - Step 53435: {'lr': 0.00036522475611329685, 'samples': 10259520, 'steps': 53434, 'loss/train': 1.433696985244751} -11/07/2021 04:44:48 - INFO - __main__ - Step 53436: {'lr': 0.00036522004660335304, 'samples': 10259712, 'steps': 53435, 'loss/train': 1.3966200351715088} -11/07/2021 04:44:49 - INFO - __main__ - Step 53437: {'lr': 0.000365215337041493, 'samples': 10259904, 'steps': 53436, 'loss/train': 1.2878247499465942} -11/07/2021 04:44:49 - INFO - __main__ - Step 53438: {'lr': 0.00036521062742771865, 'samples': 10260096, 'steps': 53437, 'loss/train': 0.956116795539856} -11/07/2021 04:44:49 - INFO - __main__ - Step 53439: {'lr': 0.0003652059177620322, 'samples': 10260288, 'steps': 53438, 'loss/train': 0.9694187641143799} -11/07/2021 04:44:50 - INFO - __main__ - Step 53440: {'lr': 0.00036520120804443563, 'samples': 10260480, 'steps': 53439, 'loss/train': 0.9357909560203552} -11/07/2021 04:44:51 - INFO - __main__ - Step 53441: {'lr': 0.00036519649827493117, 'samples': 10260672, 'steps': 53440, 'loss/train': 1.8616234064102173} -11/07/2021 04:44:51 - INFO - __main__ - Step 53442: {'lr': 0.000365191788453521, 'samples': 10260864, 'steps': 53441, 'loss/train': 1.3704938888549805} -11/07/2021 04:44:51 - INFO - __main__ - Step 53443: {'lr': 0.0003651870785802072, 'samples': 10261056, 'steps': 53442, 'loss/train': 0.5557447075843811} -11/07/2021 04:44:52 - INFO - __main__ - Step 53444: {'lr': 0.00036518236865499187, 'samples': 10261248, 'steps': 53443, 'loss/train': 1.4378814697265625} -11/07/2021 04:44:53 - INFO - __main__ - Step 53445: {'lr': 0.0003651776586778772, 'samples': 10261440, 'steps': 53444, 'loss/train': 1.5799425840377808} -11/07/2021 04:44:53 - INFO - __main__ - Step 53446: {'lr': 0.00036517294864886517, 'samples': 10261632, 'steps': 53445, 'loss/train': 2.1427876949310303} -11/07/2021 04:44:53 - INFO - __main__ - Step 53447: {'lr': 0.00036516823856795806, 'samples': 10261824, 'steps': 53446, 'loss/train': 0.9222480654716492} -11/07/2021 04:44:54 - INFO - __main__ - Step 53448: {'lr': 0.0003651635284351579, 'samples': 10262016, 'steps': 53447, 'loss/train': 1.2064964771270752} -11/07/2021 04:44:54 - INFO - __main__ - Step 53449: {'lr': 0.00036515881825046676, 'samples': 10262208, 'steps': 53448, 'loss/train': 1.5260143280029297} -11/07/2021 04:44:55 - INFO - __main__ - Step 53450: {'lr': 0.00036515410801388686, 'samples': 10262400, 'steps': 53449, 'loss/train': 1.222004771232605} -11/07/2021 04:44:55 - INFO - __main__ - Step 53451: {'lr': 0.0003651493977254204, 'samples': 10262592, 'steps': 53450, 'loss/train': 1.1987919807434082} -11/07/2021 04:44:56 - INFO - __main__ - Step 53452: {'lr': 0.0003651446873850693, 'samples': 10262784, 'steps': 53451, 'loss/train': 1.5520845651626587} -11/07/2021 04:44:56 - INFO - __main__ - Step 53453: {'lr': 0.0003651399769928358, 'samples': 10262976, 'steps': 53452, 'loss/train': 1.459889531135559} -11/07/2021 04:44:57 - INFO - __main__ - Step 53454: {'lr': 0.000365135266548722, 'samples': 10263168, 'steps': 53453, 'loss/train': 1.5366923809051514} -11/07/2021 04:44:58 - INFO - __main__ - Step 53455: {'lr': 0.00036513055605273, 'samples': 10263360, 'steps': 53454, 'loss/train': 3.485288143157959} -11/07/2021 04:44:58 - INFO - __main__ - Step 53456: {'lr': 0.0003651258455048619, 'samples': 10263552, 'steps': 53455, 'loss/train': 1.5448509454727173} -11/07/2021 04:44:58 - INFO - __main__ - Step 53457: {'lr': 0.00036512113490512, 'samples': 10263744, 'steps': 53456, 'loss/train': 1.5369842052459717} -11/07/2021 04:44:59 - INFO - __main__ - Step 53458: {'lr': 0.00036511642425350626, 'samples': 10263936, 'steps': 53457, 'loss/train': 1.3163940906524658} -11/07/2021 04:44:59 - INFO - __main__ - Step 53459: {'lr': 0.00036511171355002283, 'samples': 10264128, 'steps': 53458, 'loss/train': 1.2179282903671265} -11/07/2021 04:45:00 - INFO - __main__ - Step 53460: {'lr': 0.0003651070027946718, 'samples': 10264320, 'steps': 53459, 'loss/train': 1.1904709339141846} -11/07/2021 04:45:01 - INFO - __main__ - Step 53461: {'lr': 0.0003651022919874554, 'samples': 10264512, 'steps': 53460, 'loss/train': 1.4106436967849731} -11/07/2021 04:45:01 - INFO - __main__ - Step 53462: {'lr': 0.0003650975811283756, 'samples': 10264704, 'steps': 53461, 'loss/train': 1.307440996170044} -11/07/2021 04:45:01 - INFO - __main__ - Step 53463: {'lr': 0.00036509287021743465, 'samples': 10264896, 'steps': 53462, 'loss/train': 0.7371805906295776} -11/07/2021 04:45:02 - INFO - __main__ - Step 53464: {'lr': 0.00036508815925463456, 'samples': 10265088, 'steps': 53463, 'loss/train': 0.8744301199913025} -11/07/2021 04:45:02 - INFO - __main__ - Step 53465: {'lr': 0.0003650834482399776, 'samples': 10265280, 'steps': 53464, 'loss/train': 1.3795242309570312} -11/07/2021 04:45:03 - INFO - __main__ - Step 53466: {'lr': 0.00036507873717346584, 'samples': 10265472, 'steps': 53465, 'loss/train': 1.2720105648040771} -11/07/2021 04:45:03 - INFO - __main__ - Step 53467: {'lr': 0.00036507402605510134, 'samples': 10265664, 'steps': 53466, 'loss/train': 1.4956802129745483} -11/07/2021 04:45:04 - INFO - __main__ - Step 53468: {'lr': 0.00036506931488488627, 'samples': 10265856, 'steps': 53467, 'loss/train': 1.259634017944336} -11/07/2021 04:45:04 - INFO - __main__ - Step 53469: {'lr': 0.0003650646036628227, 'samples': 10266048, 'steps': 53468, 'loss/train': 1.3439853191375732} -11/07/2021 04:45:04 - INFO - __main__ - Step 53470: {'lr': 0.0003650598923889128, 'samples': 10266240, 'steps': 53469, 'loss/train': 1.5502805709838867} -11/07/2021 04:45:06 - INFO - __main__ - Step 53471: {'lr': 0.0003650551810631587, 'samples': 10266432, 'steps': 53470, 'loss/train': 1.3919814825057983} -11/07/2021 04:45:06 - INFO - __main__ - Step 53472: {'lr': 0.00036505046968556253, 'samples': 10266624, 'steps': 53471, 'loss/train': 1.6537296772003174} -11/07/2021 04:45:06 - INFO - __main__ - Step 53473: {'lr': 0.0003650457582561264, 'samples': 10266816, 'steps': 53472, 'loss/train': 4.414062023162842} -11/07/2021 04:45:07 - INFO - __main__ - Step 53474: {'lr': 0.0003650410467748524, 'samples': 10267008, 'steps': 53473, 'loss/train': 1.4036349058151245} -11/07/2021 04:45:07 - INFO - __main__ - Step 53475: {'lr': 0.0003650363352417427, 'samples': 10267200, 'steps': 53474, 'loss/train': 1.817798376083374} -11/07/2021 04:45:07 - INFO - __main__ - Step 53476: {'lr': 0.00036503162365679936, 'samples': 10267392, 'steps': 53475, 'loss/train': 1.4261497259140015} -11/07/2021 04:45:08 - INFO - __main__ - Step 53477: {'lr': 0.00036502691202002456, 'samples': 10267584, 'steps': 53476, 'loss/train': 1.447472095489502} -11/07/2021 04:45:09 - INFO - __main__ - Step 53478: {'lr': 0.00036502220033142045, 'samples': 10267776, 'steps': 53477, 'loss/train': 1.4116909503936768} -11/07/2021 04:45:09 - INFO - __main__ - Step 53479: {'lr': 0.0003650174885909891, 'samples': 10267968, 'steps': 53478, 'loss/train': 1.485318899154663} -11/07/2021 04:45:10 - INFO - __main__ - Step 53480: {'lr': 0.0003650127767987326, 'samples': 10268160, 'steps': 53479, 'loss/train': 1.534500002861023} -11/07/2021 04:45:10 - INFO - __main__ - Step 53481: {'lr': 0.00036500806495465315, 'samples': 10268352, 'steps': 53480, 'loss/train': 1.147910475730896} -11/07/2021 04:45:11 - INFO - __main__ - Step 53482: {'lr': 0.0003650033530587529, 'samples': 10268544, 'steps': 53481, 'loss/train': 1.1712579727172852} -11/07/2021 04:45:11 - INFO - __main__ - Step 53483: {'lr': 0.00036499864111103384, 'samples': 10268736, 'steps': 53482, 'loss/train': 1.265006184577942} -11/07/2021 04:45:12 - INFO - __main__ - Step 53484: {'lr': 0.00036499392911149817, 'samples': 10268928, 'steps': 53483, 'loss/train': 1.2264678478240967} -11/07/2021 04:45:12 - INFO - __main__ - Step 53485: {'lr': 0.00036498921706014804, 'samples': 10269120, 'steps': 53484, 'loss/train': 1.565567135810852} -11/07/2021 04:45:12 - INFO - __main__ - Step 53486: {'lr': 0.00036498450495698557, 'samples': 10269312, 'steps': 53485, 'loss/train': 1.284726858139038} -11/07/2021 04:45:13 - INFO - __main__ - Step 53487: {'lr': 0.00036497979280201276, 'samples': 10269504, 'steps': 53486, 'loss/train': 1.3235887289047241} -11/07/2021 04:45:14 - INFO - __main__ - Step 53488: {'lr': 0.0003649750805952319, 'samples': 10269696, 'steps': 53487, 'loss/train': 1.6617445945739746} -11/07/2021 04:45:14 - INFO - __main__ - Step 53489: {'lr': 0.000364970368336645, 'samples': 10269888, 'steps': 53488, 'loss/train': 1.4836846590042114} -11/07/2021 04:45:14 - INFO - __main__ - Step 53490: {'lr': 0.0003649656560262542, 'samples': 10270080, 'steps': 53489, 'loss/train': 1.16900634765625} -11/07/2021 04:45:15 - INFO - __main__ - Step 53491: {'lr': 0.00036496094366406166, 'samples': 10270272, 'steps': 53490, 'loss/train': 1.4340850114822388} -11/07/2021 04:45:16 - INFO - __main__ - Step 53492: {'lr': 0.0003649562312500696, 'samples': 10270464, 'steps': 53491, 'loss/train': 1.9902280569076538} -11/07/2021 04:45:16 - INFO - __main__ - Step 53493: {'lr': 0.00036495151878427994, 'samples': 10270656, 'steps': 53492, 'loss/train': 0.06550008803606033} -11/07/2021 04:45:17 - INFO - __main__ - Step 53494: {'lr': 0.00036494680626669495, 'samples': 10270848, 'steps': 53493, 'loss/train': 1.1288018226623535} -11/07/2021 04:45:17 - INFO - __main__ - Step 53495: {'lr': 0.00036494209369731666, 'samples': 10271040, 'steps': 53494, 'loss/train': 1.6085138320922852} -11/07/2021 04:45:17 - INFO - __main__ - Step 53496: {'lr': 0.0003649373810761473, 'samples': 10271232, 'steps': 53495, 'loss/train': 1.1278513669967651} -11/07/2021 04:45:18 - INFO - __main__ - Step 53497: {'lr': 0.00036493266840318886, 'samples': 10271424, 'steps': 53496, 'loss/train': 1.226789951324463} -11/07/2021 04:45:19 - INFO - __main__ - Step 53498: {'lr': 0.0003649279556784436, 'samples': 10271616, 'steps': 53497, 'loss/train': 1.1760696172714233} -11/07/2021 04:45:19 - INFO - __main__ - Step 53499: {'lr': 0.0003649232429019135, 'samples': 10271808, 'steps': 53498, 'loss/train': 1.5847797393798828} -11/07/2021 04:45:19 - INFO - __main__ - Step 53500: {'lr': 0.0003649185300736008, 'samples': 10272000, 'steps': 53499, 'loss/train': 1.463171124458313} -11/07/2021 04:45:20 - INFO - __main__ - Step 53501: {'lr': 0.0003649138171935076, 'samples': 10272192, 'steps': 53500, 'loss/train': 1.2854593992233276} -11/07/2021 04:45:21 - INFO - __main__ - Step 53502: {'lr': 0.0003649091042616359, 'samples': 10272384, 'steps': 53501, 'loss/train': 1.0506432056427002} -11/07/2021 04:45:21 - INFO - __main__ - Step 53503: {'lr': 0.000364904391277988, 'samples': 10272576, 'steps': 53502, 'loss/train': 0.06548427045345306} -11/07/2021 04:45:22 - INFO - __main__ - Step 53504: {'lr': 0.00036489967824256597, 'samples': 10272768, 'steps': 53503, 'loss/train': 1.4971596002578735} -11/07/2021 04:45:22 - INFO - __main__ - Step 53505: {'lr': 0.000364894965155372, 'samples': 10272960, 'steps': 53504, 'loss/train': 5.800402641296387} -11/07/2021 04:45:22 - INFO - __main__ - Step 53506: {'lr': 0.000364890252016408, 'samples': 10273152, 'steps': 53505, 'loss/train': 1.3495075702667236} -11/07/2021 04:45:23 - INFO - __main__ - Step 53507: {'lr': 0.0003648855388256763, 'samples': 10273344, 'steps': 53506, 'loss/train': 1.5951036214828491} -11/07/2021 04:45:24 - INFO - __main__ - Step 53508: {'lr': 0.0003648808255831789, 'samples': 10273536, 'steps': 53507, 'loss/train': 1.4750956296920776} -11/07/2021 04:45:24 - INFO - __main__ - Step 53509: {'lr': 0.00036487611228891805, 'samples': 10273728, 'steps': 53508, 'loss/train': 1.296762466430664} -11/07/2021 04:45:25 - INFO - __main__ - Step 53510: {'lr': 0.00036487139894289566, 'samples': 10273920, 'steps': 53509, 'loss/train': 1.7952351570129395} -11/07/2021 04:45:25 - INFO - __main__ - Step 53511: {'lr': 0.0003648666855451141, 'samples': 10274112, 'steps': 53510, 'loss/train': 1.3936107158660889} -11/07/2021 04:45:25 - INFO - __main__ - Step 53512: {'lr': 0.0003648619720955754, 'samples': 10274304, 'steps': 53511, 'loss/train': 1.4741666316986084} -11/07/2021 04:45:27 - INFO - __main__ - Step 53513: {'lr': 0.00036485725859428163, 'samples': 10274496, 'steps': 53512, 'loss/train': 0.07048851251602173} -11/07/2021 04:45:27 - INFO - __main__ - Step 53514: {'lr': 0.00036485254504123495, 'samples': 10274688, 'steps': 53513, 'loss/train': 0.936514139175415} -11/07/2021 04:45:27 - INFO - __main__ - Step 53515: {'lr': 0.00036484783143643745, 'samples': 10274880, 'steps': 53514, 'loss/train': 1.230549693107605} -11/07/2021 04:45:28 - INFO - __main__ - Step 53516: {'lr': 0.0003648431177798913, 'samples': 10275072, 'steps': 53515, 'loss/train': 1.5734517574310303} -11/07/2021 04:45:28 - INFO - __main__ - Step 53517: {'lr': 0.00036483840407159864, 'samples': 10275264, 'steps': 53516, 'loss/train': 1.1997522115707397} -11/07/2021 04:45:29 - INFO - __main__ - Step 53518: {'lr': 0.0003648336903115616, 'samples': 10275456, 'steps': 53517, 'loss/train': 1.3396321535110474} -11/07/2021 04:45:29 - INFO - __main__ - Step 53519: {'lr': 0.0003648289764997823, 'samples': 10275648, 'steps': 53518, 'loss/train': 1.186674952507019} -11/07/2021 04:45:30 - INFO - __main__ - Step 53520: {'lr': 0.00036482426263626265, 'samples': 10275840, 'steps': 53519, 'loss/train': 1.2877269983291626} -11/07/2021 04:45:30 - INFO - __main__ - Step 53521: {'lr': 0.0003648195487210051, 'samples': 10276032, 'steps': 53520, 'loss/train': 0.8472537398338318} -11/07/2021 04:45:30 - INFO - __main__ - Step 53522: {'lr': 0.0003648148347540116, 'samples': 10276224, 'steps': 53521, 'loss/train': 1.4158985614776611} -11/07/2021 04:45:31 - INFO - __main__ - Step 53523: {'lr': 0.0003648101207352843, 'samples': 10276416, 'steps': 53522, 'loss/train': 1.3949472904205322} -11/07/2021 04:45:32 - INFO - __main__ - Step 53524: {'lr': 0.00036480540666482535, 'samples': 10276608, 'steps': 53523, 'loss/train': 1.6620945930480957} -11/07/2021 04:45:32 - INFO - __main__ - Step 53525: {'lr': 0.00036480069254263693, 'samples': 10276800, 'steps': 53524, 'loss/train': 1.4589643478393555} -11/07/2021 04:45:32 - INFO - __main__ - Step 53526: {'lr': 0.000364795978368721, 'samples': 10276992, 'steps': 53525, 'loss/train': 1.1077258586883545} -11/07/2021 04:45:33 - INFO - __main__ - Step 53527: {'lr': 0.0003647912641430798, 'samples': 10277184, 'steps': 53526, 'loss/train': 1.6570274829864502} -11/07/2021 04:45:34 - INFO - __main__ - Step 53528: {'lr': 0.0003647865498657154, 'samples': 10277376, 'steps': 53527, 'loss/train': 1.724677324295044} -11/07/2021 04:45:34 - INFO - __main__ - Step 53529: {'lr': 0.0003647818355366299, 'samples': 10277568, 'steps': 53528, 'loss/train': 0.858352541923523} -11/07/2021 04:45:35 - INFO - __main__ - Step 53530: {'lr': 0.00036477712115582555, 'samples': 10277760, 'steps': 53529, 'loss/train': 1.4554532766342163} -11/07/2021 04:45:35 - INFO - __main__ - Step 53531: {'lr': 0.0003647724067233044, 'samples': 10277952, 'steps': 53530, 'loss/train': 1.0617146492004395} -11/07/2021 04:45:35 - INFO - __main__ - Step 53532: {'lr': 0.00036476769223906864, 'samples': 10278144, 'steps': 53531, 'loss/train': 0.09869363158941269} -11/07/2021 04:45:36 - INFO - __main__ - Step 53533: {'lr': 0.0003647629777031202, 'samples': 10278336, 'steps': 53532, 'loss/train': 1.4492369890213013} -11/07/2021 04:45:37 - INFO - __main__ - Step 53534: {'lr': 0.0003647582631154614, 'samples': 10278528, 'steps': 53533, 'loss/train': 1.1524577140808105} -11/07/2021 04:45:37 - INFO - __main__ - Step 53535: {'lr': 0.00036475354847609434, 'samples': 10278720, 'steps': 53534, 'loss/train': 1.536961555480957} -11/07/2021 04:45:37 - INFO - __main__ - Step 53536: {'lr': 0.000364748833785021, 'samples': 10278912, 'steps': 53535, 'loss/train': 1.051010012626648} -11/07/2021 04:45:38 - INFO - __main__ - Step 53537: {'lr': 0.0003647441190422437, 'samples': 10279104, 'steps': 53536, 'loss/train': 1.30070161819458} -11/07/2021 04:45:38 - INFO - __main__ - Step 53538: {'lr': 0.00036473940424776443, 'samples': 10279296, 'steps': 53537, 'loss/train': 1.432908535003662} -11/07/2021 04:45:39 - INFO - __main__ - Step 53539: {'lr': 0.0003647346894015853, 'samples': 10279488, 'steps': 53538, 'loss/train': 1.2249596118927002} -11/07/2021 04:45:39 - INFO - __main__ - Step 53540: {'lr': 0.0003647299745037085, 'samples': 10279680, 'steps': 53539, 'loss/train': 1.7161222696304321} -11/07/2021 04:45:40 - INFO - __main__ - Step 53541: {'lr': 0.00036472525955413626, 'samples': 10279872, 'steps': 53540, 'loss/train': 1.095268964767456} -11/07/2021 04:45:40 - INFO - __main__ - Step 53542: {'lr': 0.00036472054455287053, 'samples': 10280064, 'steps': 53541, 'loss/train': 1.3333752155303955} -11/07/2021 04:45:40 - INFO - __main__ - Step 53543: {'lr': 0.00036471582949991347, 'samples': 10280256, 'steps': 53542, 'loss/train': 1.6389453411102295} -11/07/2021 04:45:42 - INFO - __main__ - Step 53544: {'lr': 0.0003647111143952672, 'samples': 10280448, 'steps': 53543, 'loss/train': 1.4052221775054932} -11/07/2021 04:45:42 - INFO - __main__ - Step 53545: {'lr': 0.0003647063992389339, 'samples': 10280640, 'steps': 53544, 'loss/train': 1.2893710136413574} -11/07/2021 04:45:42 - INFO - __main__ - Step 53546: {'lr': 0.00036470168403091567, 'samples': 10280832, 'steps': 53545, 'loss/train': 1.4591162204742432} -11/07/2021 04:45:43 - INFO - __main__ - Step 53547: {'lr': 0.00036469696877121464, 'samples': 10281024, 'steps': 53546, 'loss/train': 1.500877022743225} -11/07/2021 04:45:43 - INFO - __main__ - Step 53548: {'lr': 0.000364692253459833, 'samples': 10281216, 'steps': 53547, 'loss/train': 1.5913686752319336} -11/07/2021 04:45:44 - INFO - __main__ - Step 53549: {'lr': 0.0003646875380967727, 'samples': 10281408, 'steps': 53548, 'loss/train': 1.3998956680297852} -11/07/2021 04:45:45 - INFO - __main__ - Step 53550: {'lr': 0.00036468282268203595, 'samples': 10281600, 'steps': 53549, 'loss/train': 1.3212279081344604} -11/07/2021 04:45:45 - INFO - __main__ - Step 53551: {'lr': 0.0003646781072156249, 'samples': 10281792, 'steps': 53550, 'loss/train': 0.31877216696739197} -11/07/2021 04:45:45 - INFO - __main__ - Step 53552: {'lr': 0.00036467339169754173, 'samples': 10281984, 'steps': 53551, 'loss/train': 1.8028637170791626} -11/07/2021 04:45:46 - INFO - __main__ - Step 53553: {'lr': 0.0003646686761277884, 'samples': 10282176, 'steps': 53552, 'loss/train': 1.836937665939331} -11/07/2021 04:45:46 - INFO - __main__ - Step 53554: {'lr': 0.00036466396050636725, 'samples': 10282368, 'steps': 53553, 'loss/train': 2.672879457473755} -11/07/2021 04:45:47 - INFO - __main__ - Step 53555: {'lr': 0.0003646592448332802, 'samples': 10282560, 'steps': 53554, 'loss/train': 1.848436951637268} -11/07/2021 04:45:48 - INFO - __main__ - Step 53556: {'lr': 0.00036465452910852946, 'samples': 10282752, 'steps': 53555, 'loss/train': 1.1363451480865479} -11/07/2021 04:45:48 - INFO - __main__ - Step 53557: {'lr': 0.00036464981333211724, 'samples': 10282944, 'steps': 53556, 'loss/train': 0.9401386976242065} -11/07/2021 04:45:48 - INFO - __main__ - Step 53558: {'lr': 0.0003646450975040455, 'samples': 10283136, 'steps': 53557, 'loss/train': 1.7269724607467651} -11/07/2021 04:45:49 - INFO - __main__ - Step 53559: {'lr': 0.00036464038162431657, 'samples': 10283328, 'steps': 53558, 'loss/train': 1.0810272693634033} -11/07/2021 04:45:50 - INFO - __main__ - Step 53560: {'lr': 0.00036463566569293235, 'samples': 10283520, 'steps': 53559, 'loss/train': 1.4755587577819824} -11/07/2021 04:45:50 - INFO - __main__ - Step 53561: {'lr': 0.0003646309497098951, 'samples': 10283712, 'steps': 53560, 'loss/train': 1.209079623222351} -11/07/2021 04:45:50 - INFO - __main__ - Step 53562: {'lr': 0.00036462623367520684, 'samples': 10283904, 'steps': 53561, 'loss/train': 1.545916199684143} -11/07/2021 04:45:51 - INFO - __main__ - Step 53563: {'lr': 0.00036462151758886985, 'samples': 10284096, 'steps': 53562, 'loss/train': 1.3853113651275635} -11/07/2021 04:45:51 - INFO - __main__ - Step 53564: {'lr': 0.0003646168014508861, 'samples': 10284288, 'steps': 53563, 'loss/train': 1.524139404296875} -11/07/2021 04:45:52 - INFO - __main__ - Step 53565: {'lr': 0.00036461208526125785, 'samples': 10284480, 'steps': 53564, 'loss/train': 1.2327629327774048} -11/07/2021 04:45:53 - INFO - __main__ - Step 53566: {'lr': 0.0003646073690199872, 'samples': 10284672, 'steps': 53565, 'loss/train': 1.8953274488449097} -11/07/2021 04:45:53 - INFO - __main__ - Step 53567: {'lr': 0.00036460265272707617, 'samples': 10284864, 'steps': 53566, 'loss/train': 1.569270372390747} -11/07/2021 04:45:53 - INFO - __main__ - Step 53568: {'lr': 0.000364597936382527, 'samples': 10285056, 'steps': 53567, 'loss/train': 1.6651109457015991} -11/07/2021 04:45:54 - INFO - __main__ - Step 53569: {'lr': 0.0003645932199863417, 'samples': 10285248, 'steps': 53568, 'loss/train': 0.5657076239585876} -11/07/2021 04:45:54 - INFO - __main__ - Step 53570: {'lr': 0.00036458850353852246, 'samples': 10285440, 'steps': 53569, 'loss/train': 1.2051150798797607} -11/07/2021 04:45:55 - INFO - __main__ - Step 53571: {'lr': 0.0003645837870390715, 'samples': 10285632, 'steps': 53570, 'loss/train': 1.6608856916427612} -11/07/2021 04:45:55 - INFO - __main__ - Step 53572: {'lr': 0.00036457907048799084, 'samples': 10285824, 'steps': 53571, 'loss/train': 1.7461100816726685} -11/07/2021 04:45:56 - INFO - __main__ - Step 53573: {'lr': 0.00036457435388528257, 'samples': 10286016, 'steps': 53572, 'loss/train': 1.378989338874817} -11/07/2021 04:45:56 - INFO - __main__ - Step 53574: {'lr': 0.0003645696372309488, 'samples': 10286208, 'steps': 53573, 'loss/train': 1.4414912462234497} -11/07/2021 04:45:57 - INFO - __main__ - Step 53575: {'lr': 0.00036456492052499185, 'samples': 10286400, 'steps': 53574, 'loss/train': 1.825268030166626} -11/07/2021 04:45:58 - INFO - __main__ - Step 53576: {'lr': 0.00036456020376741363, 'samples': 10286592, 'steps': 53575, 'loss/train': 1.3124676942825317} -11/07/2021 04:45:58 - INFO - __main__ - Step 53577: {'lr': 0.0003645554869582164, 'samples': 10286784, 'steps': 53576, 'loss/train': 1.6099679470062256} -11/07/2021 04:45:58 - INFO - __main__ - Step 53578: {'lr': 0.0003645507700974022, 'samples': 10286976, 'steps': 53577, 'loss/train': 1.296777606010437} -11/07/2021 04:45:59 - INFO - __main__ - Step 53579: {'lr': 0.00036454605318497323, 'samples': 10287168, 'steps': 53578, 'loss/train': 1.4289377927780151} -11/07/2021 04:45:59 - INFO - __main__ - Step 53580: {'lr': 0.00036454133622093154, 'samples': 10287360, 'steps': 53579, 'loss/train': 1.4092215299606323} -11/07/2021 04:46:00 - INFO - __main__ - Step 53581: {'lr': 0.00036453661920527933, 'samples': 10287552, 'steps': 53580, 'loss/train': 1.2635722160339355} -11/07/2021 04:46:00 - INFO - __main__ - Step 53582: {'lr': 0.0003645319021380186, 'samples': 10287744, 'steps': 53581, 'loss/train': 0.8141332268714905} -11/07/2021 04:46:01 - INFO - __main__ - Step 53583: {'lr': 0.00036452718501915165, 'samples': 10287936, 'steps': 53582, 'loss/train': 1.2602858543395996} -11/07/2021 04:46:01 - INFO - __main__ - Step 53584: {'lr': 0.00036452246784868047, 'samples': 10288128, 'steps': 53583, 'loss/train': 1.5883314609527588} -11/07/2021 04:46:01 - INFO - __main__ - Step 53585: {'lr': 0.0003645177506266072, 'samples': 10288320, 'steps': 53584, 'loss/train': 1.6093188524246216} -11/07/2021 04:46:03 - INFO - __main__ - Step 53586: {'lr': 0.0003645130333529342, 'samples': 10288512, 'steps': 53585, 'loss/train': 5.9109697341918945} -11/07/2021 04:46:03 - INFO - __main__ - Step 53587: {'lr': 0.0003645083160276632, 'samples': 10288704, 'steps': 53586, 'loss/train': 1.1899070739746094} -11/07/2021 04:46:03 - INFO - __main__ - Step 53588: {'lr': 0.0003645035986507966, 'samples': 10288896, 'steps': 53587, 'loss/train': 1.0773814916610718} -11/07/2021 04:46:04 - INFO - __main__ - Step 53589: {'lr': 0.00036449888122233636, 'samples': 10289088, 'steps': 53588, 'loss/train': 1.2378230094909668} -11/07/2021 04:46:04 - INFO - __main__ - Step 53590: {'lr': 0.00036449416374228474, 'samples': 10289280, 'steps': 53589, 'loss/train': 1.4816677570343018} -11/07/2021 04:46:04 - INFO - __main__ - Step 53591: {'lr': 0.00036448944621064386, 'samples': 10289472, 'steps': 53590, 'loss/train': 1.2232826948165894} -11/07/2021 04:46:05 - INFO - __main__ - Step 53592: {'lr': 0.00036448472862741577, 'samples': 10289664, 'steps': 53591, 'loss/train': 1.4840363264083862} -11/07/2021 04:46:06 - INFO - __main__ - Step 53593: {'lr': 0.0003644800109926026, 'samples': 10289856, 'steps': 53592, 'loss/train': 1.1795276403427124} -11/07/2021 04:46:06 - INFO - __main__ - Step 53594: {'lr': 0.00036447529330620653, 'samples': 10290048, 'steps': 53593, 'loss/train': 1.5766221284866333} -11/07/2021 04:46:07 - INFO - __main__ - Step 53595: {'lr': 0.0003644705755682296, 'samples': 10290240, 'steps': 53594, 'loss/train': 1.8372597694396973} -11/07/2021 04:46:07 - INFO - __main__ - Step 53596: {'lr': 0.00036446585777867406, 'samples': 10290432, 'steps': 53595, 'loss/train': 1.5694047212600708} -11/07/2021 04:46:08 - INFO - __main__ - Step 53597: {'lr': 0.0003644611399375419, 'samples': 10290624, 'steps': 53596, 'loss/train': 1.432969570159912} -11/07/2021 04:46:08 - INFO - __main__ - Step 53598: {'lr': 0.0003644564220448354, 'samples': 10290816, 'steps': 53597, 'loss/train': 1.5193006992340088} -11/07/2021 04:46:09 - INFO - __main__ - Step 53599: {'lr': 0.0003644517041005566, 'samples': 10291008, 'steps': 53598, 'loss/train': 1.0880459547042847} -11/07/2021 04:46:09 - INFO - __main__ - Step 53600: {'lr': 0.0003644469861047076, 'samples': 10291200, 'steps': 53599, 'loss/train': 1.2695410251617432} -11/07/2021 04:46:09 - INFO - __main__ - Step 53601: {'lr': 0.0003644422680572906, 'samples': 10291392, 'steps': 53600, 'loss/train': 1.6431523561477661} -11/07/2021 04:46:10 - INFO - __main__ - Step 53602: {'lr': 0.00036443754995830763, 'samples': 10291584, 'steps': 53601, 'loss/train': 1.2466450929641724} -11/07/2021 04:46:11 - INFO - __main__ - Step 53603: {'lr': 0.0003644328318077609, 'samples': 10291776, 'steps': 53602, 'loss/train': 0.5655657649040222} -11/07/2021 04:46:11 - INFO - __main__ - Step 53604: {'lr': 0.0003644281136056524, 'samples': 10291968, 'steps': 53603, 'loss/train': 1.275779366493225} -11/07/2021 04:46:11 - INFO - __main__ - Step 53605: {'lr': 0.00036442339535198444, 'samples': 10292160, 'steps': 53604, 'loss/train': 1.2544212341308594} -11/07/2021 04:46:12 - INFO - __main__ - Step 53606: {'lr': 0.00036441867704675913, 'samples': 10292352, 'steps': 53605, 'loss/train': 1.4334867000579834} -11/07/2021 04:46:13 - INFO - __main__ - Step 53607: {'lr': 0.00036441395868997843, 'samples': 10292544, 'steps': 53606, 'loss/train': 0.7503970265388489} -11/07/2021 04:46:13 - INFO - __main__ - Step 53608: {'lr': 0.00036440924028164457, 'samples': 10292736, 'steps': 53607, 'loss/train': 1.4109858274459839} -11/07/2021 04:46:13 - INFO - __main__ - Step 53609: {'lr': 0.0003644045218217597, 'samples': 10292928, 'steps': 53608, 'loss/train': 0.9213677644729614} -11/07/2021 04:46:14 - INFO - __main__ - Step 53610: {'lr': 0.000364399803310326, 'samples': 10293120, 'steps': 53609, 'loss/train': 1.2618991136550903} -11/07/2021 04:46:14 - INFO - __main__ - Step 53611: {'lr': 0.0003643950847473453, 'samples': 10293312, 'steps': 53610, 'loss/train': 1.7567811012268066} -11/07/2021 04:46:15 - INFO - __main__ - Step 53612: {'lr': 0.0003643903661328201, 'samples': 10293504, 'steps': 53611, 'loss/train': 1.2855720520019531} -11/07/2021 04:46:16 - INFO - __main__ - Step 53613: {'lr': 0.0003643856474667524, 'samples': 10293696, 'steps': 53612, 'loss/train': 2.0284533500671387} -11/07/2021 04:46:16 - INFO - __main__ - Step 53614: {'lr': 0.0003643809287491442, 'samples': 10293888, 'steps': 53613, 'loss/train': 2.2099084854125977} -11/07/2021 04:46:16 - INFO - __main__ - Step 53615: {'lr': 0.00036437620997999777, 'samples': 10294080, 'steps': 53614, 'loss/train': 0.9690789580345154} -11/07/2021 04:46:17 - INFO - __main__ - Step 53616: {'lr': 0.0003643714911593151, 'samples': 10294272, 'steps': 53615, 'loss/train': 1.2599529027938843} -11/07/2021 04:46:18 - INFO - __main__ - Step 53617: {'lr': 0.00036436677228709845, 'samples': 10294464, 'steps': 53616, 'loss/train': 1.177477240562439} -11/07/2021 04:46:18 - INFO - __main__ - Step 53618: {'lr': 0.00036436205336334995, 'samples': 10294656, 'steps': 53617, 'loss/train': 1.4854182004928589} -11/07/2021 04:46:18 - INFO - __main__ - Step 53619: {'lr': 0.0003643573343880716, 'samples': 10294848, 'steps': 53618, 'loss/train': 1.0214343070983887} -11/07/2021 04:46:19 - INFO - __main__ - Step 53620: {'lr': 0.00036435261536126566, 'samples': 10295040, 'steps': 53619, 'loss/train': 1.2438859939575195} -11/07/2021 04:46:19 - INFO - __main__ - Step 53621: {'lr': 0.0003643478962829342, 'samples': 10295232, 'steps': 53620, 'loss/train': 1.707126498222351} -11/07/2021 04:46:20 - INFO - __main__ - Step 53622: {'lr': 0.0003643431771530793, 'samples': 10295424, 'steps': 53621, 'loss/train': 1.0260186195373535} -11/07/2021 04:46:20 - INFO - __main__ - Step 53623: {'lr': 0.0003643384579717031, 'samples': 10295616, 'steps': 53622, 'loss/train': 1.2955429553985596} -11/07/2021 04:46:21 - INFO - __main__ - Step 53624: {'lr': 0.0003643337387388078, 'samples': 10295808, 'steps': 53623, 'loss/train': 1.1433353424072266} -11/07/2021 04:46:21 - INFO - __main__ - Step 53625: {'lr': 0.00036432901945439544, 'samples': 10296000, 'steps': 53624, 'loss/train': 1.1356937885284424} -11/07/2021 04:46:22 - INFO - __main__ - Step 53626: {'lr': 0.0003643243001184683, 'samples': 10296192, 'steps': 53625, 'loss/train': 1.1286875009536743} -11/07/2021 04:46:23 - INFO - __main__ - Step 53627: {'lr': 0.00036431958073102825, 'samples': 10296384, 'steps': 53626, 'loss/train': 1.6646336317062378} -11/07/2021 04:46:23 - INFO - __main__ - Step 53628: {'lr': 0.00036431486129207767, 'samples': 10296576, 'steps': 53627, 'loss/train': 1.510939598083496} -11/07/2021 04:46:23 - INFO - __main__ - Step 53629: {'lr': 0.00036431014180161853, 'samples': 10296768, 'steps': 53628, 'loss/train': 1.5132286548614502} -11/07/2021 04:46:24 - INFO - __main__ - Step 53630: {'lr': 0.000364305422259653, 'samples': 10296960, 'steps': 53629, 'loss/train': 1.8390154838562012} -11/07/2021 04:46:24 - INFO - __main__ - Step 53631: {'lr': 0.0003643007026661832, 'samples': 10297152, 'steps': 53630, 'loss/train': 1.5268847942352295} -11/07/2021 04:46:24 - INFO - __main__ - Step 53632: {'lr': 0.0003642959830212113, 'samples': 10297344, 'steps': 53631, 'loss/train': 0.9875638484954834} -11/07/2021 04:46:26 - INFO - __main__ - Step 53633: {'lr': 0.0003642912633247394, 'samples': 10297536, 'steps': 53632, 'loss/train': 1.898142695426941} -11/07/2021 04:46:26 - INFO - __main__ - Step 53634: {'lr': 0.0003642865435767696, 'samples': 10297728, 'steps': 53633, 'loss/train': 2.0873570442199707} -11/07/2021 04:46:26 - INFO - __main__ - Step 53635: {'lr': 0.00036428182377730407, 'samples': 10297920, 'steps': 53634, 'loss/train': 1.409475564956665} -11/07/2021 04:46:27 - INFO - __main__ - Step 53636: {'lr': 0.00036427710392634483, 'samples': 10298112, 'steps': 53635, 'loss/train': 1.2655452489852905} -11/07/2021 04:46:27 - INFO - __main__ - Step 53637: {'lr': 0.0003642723840238942, 'samples': 10298304, 'steps': 53636, 'loss/train': 1.5383204221725464} -11/07/2021 04:46:28 - INFO - __main__ - Step 53638: {'lr': 0.0003642676640699542, 'samples': 10298496, 'steps': 53637, 'loss/train': 1.6451209783554077} -11/07/2021 04:46:28 - INFO - __main__ - Step 53639: {'lr': 0.0003642629440645269, 'samples': 10298688, 'steps': 53638, 'loss/train': 1.602700114250183} -11/07/2021 04:46:29 - INFO - __main__ - Step 53640: {'lr': 0.00036425822400761444, 'samples': 10298880, 'steps': 53639, 'loss/train': 1.311402440071106} -11/07/2021 04:46:29 - INFO - __main__ - Step 53641: {'lr': 0.000364253503899219, 'samples': 10299072, 'steps': 53640, 'loss/train': 1.4763884544372559} -11/07/2021 04:46:29 - INFO - __main__ - Step 53642: {'lr': 0.00036424878373934275, 'samples': 10299264, 'steps': 53641, 'loss/train': 1.4716440439224243} -11/07/2021 04:46:30 - INFO - __main__ - Step 53643: {'lr': 0.0003642440635279877, 'samples': 10299456, 'steps': 53642, 'loss/train': 1.5461177825927734} -11/07/2021 04:46:31 - INFO - __main__ - Step 53644: {'lr': 0.0003642393432651561, 'samples': 10299648, 'steps': 53643, 'loss/train': 1.2750368118286133} -11/07/2021 04:46:31 - INFO - __main__ - Step 53645: {'lr': 0.00036423462295085, 'samples': 10299840, 'steps': 53644, 'loss/train': 2.0808663368225098} -11/07/2021 04:46:31 - INFO - __main__ - Step 53646: {'lr': 0.00036422990258507155, 'samples': 10300032, 'steps': 53645, 'loss/train': 1.3094879388809204} -11/07/2021 04:46:32 - INFO - __main__ - Step 53647: {'lr': 0.00036422518216782285, 'samples': 10300224, 'steps': 53646, 'loss/train': 1.192118525505066} -11/07/2021 04:46:33 - INFO - __main__ - Step 53648: {'lr': 0.00036422046169910604, 'samples': 10300416, 'steps': 53647, 'loss/train': 1.42933189868927} -11/07/2021 04:46:33 - INFO - __main__ - Step 53649: {'lr': 0.00036421574117892323, 'samples': 10300608, 'steps': 53648, 'loss/train': 0.10659755021333694} -11/07/2021 04:46:34 - INFO - __main__ - Step 53650: {'lr': 0.0003642110206072766, 'samples': 10300800, 'steps': 53649, 'loss/train': 1.4478704929351807} -11/07/2021 04:46:34 - INFO - __main__ - Step 53651: {'lr': 0.0003642062999841682, 'samples': 10300992, 'steps': 53650, 'loss/train': 1.446449637413025} -11/07/2021 04:46:34 - INFO - __main__ - Step 53652: {'lr': 0.00036420157930960027, 'samples': 10301184, 'steps': 53651, 'loss/train': 1.577466368675232} -11/07/2021 04:46:36 - INFO - __main__ - Step 53653: {'lr': 0.00036419685858357485, 'samples': 10301376, 'steps': 53652, 'loss/train': 1.2220356464385986} -11/07/2021 04:46:36 - INFO - __main__ - Step 53654: {'lr': 0.0003641921378060941, 'samples': 10301568, 'steps': 53653, 'loss/train': 0.8797346949577332} -11/07/2021 04:46:36 - INFO - __main__ - Step 53655: {'lr': 0.00036418741697716013, 'samples': 10301760, 'steps': 53654, 'loss/train': 1.463127851486206} -11/07/2021 04:46:37 - INFO - __main__ - Step 53656: {'lr': 0.00036418269609677506, 'samples': 10301952, 'steps': 53655, 'loss/train': 1.4317694902420044} -11/07/2021 04:46:37 - INFO - __main__ - Step 53657: {'lr': 0.000364177975164941, 'samples': 10302144, 'steps': 53656, 'loss/train': 1.1459680795669556} -11/07/2021 04:46:38 - INFO - __main__ - Step 53658: {'lr': 0.0003641732541816601, 'samples': 10302336, 'steps': 53657, 'loss/train': 1.4241100549697876} -11/07/2021 04:46:38 - INFO - __main__ - Step 53659: {'lr': 0.0003641685331469346, 'samples': 10302528, 'steps': 53658, 'loss/train': 1.5625414848327637} -11/07/2021 04:46:39 - INFO - __main__ - Step 53660: {'lr': 0.0003641638120607665, 'samples': 10302720, 'steps': 53659, 'loss/train': 1.0930854082107544} -11/07/2021 04:46:39 - INFO - __main__ - Step 53661: {'lr': 0.00036415909092315786, 'samples': 10302912, 'steps': 53660, 'loss/train': 1.5359793901443481} -11/07/2021 04:46:39 - INFO - __main__ - Step 53662: {'lr': 0.00036415436973411095, 'samples': 10303104, 'steps': 53661, 'loss/train': 1.6880676746368408} -11/07/2021 04:46:40 - INFO - __main__ - Step 53663: {'lr': 0.0003641496484936278, 'samples': 10303296, 'steps': 53662, 'loss/train': 1.3289389610290527} -11/07/2021 04:46:41 - INFO - __main__ - Step 53664: {'lr': 0.0003641449272017106, 'samples': 10303488, 'steps': 53663, 'loss/train': 1.5129036903381348} -11/07/2021 04:46:41 - INFO - __main__ - Step 53665: {'lr': 0.00036414020585836144, 'samples': 10303680, 'steps': 53664, 'loss/train': 1.5871593952178955} -11/07/2021 04:46:41 - INFO - __main__ - Step 53666: {'lr': 0.00036413548446358255, 'samples': 10303872, 'steps': 53665, 'loss/train': 1.5378220081329346} -11/07/2021 04:46:42 - INFO - __main__ - Step 53667: {'lr': 0.0003641307630173759, 'samples': 10304064, 'steps': 53666, 'loss/train': 1.207553744316101} -11/07/2021 04:46:43 - INFO - __main__ - Step 53668: {'lr': 0.0003641260415197437, 'samples': 10304256, 'steps': 53667, 'loss/train': 0.4405873119831085} -11/07/2021 04:46:43 - INFO - __main__ - Step 53669: {'lr': 0.0003641213199706881, 'samples': 10304448, 'steps': 53668, 'loss/train': 1.459364414215088} -11/07/2021 04:46:43 - INFO - __main__ - Step 53670: {'lr': 0.0003641165983702111, 'samples': 10304640, 'steps': 53669, 'loss/train': 1.4419173002243042} -11/07/2021 04:46:44 - INFO - __main__ - Step 53671: {'lr': 0.000364111876718315, 'samples': 10304832, 'steps': 53670, 'loss/train': 1.442563533782959} -11/07/2021 04:46:44 - INFO - __main__ - Step 53672: {'lr': 0.0003641071550150019, 'samples': 10305024, 'steps': 53671, 'loss/train': 1.708547592163086} -11/07/2021 04:46:45 - INFO - __main__ - Step 53673: {'lr': 0.00036410243326027373, 'samples': 10305216, 'steps': 53672, 'loss/train': 1.2650524377822876} -11/07/2021 04:46:46 - INFO - __main__ - Step 53674: {'lr': 0.0003640977114541328, 'samples': 10305408, 'steps': 53673, 'loss/train': 1.3750654458999634} -11/07/2021 04:46:46 - INFO - __main__ - Step 53675: {'lr': 0.0003640929895965813, 'samples': 10305600, 'steps': 53674, 'loss/train': 1.3330191373825073} -11/07/2021 04:46:46 - INFO - __main__ - Step 53676: {'lr': 0.0003640882676876212, 'samples': 10305792, 'steps': 53675, 'loss/train': 1.2945555448532104} -11/07/2021 04:46:47 - INFO - __main__ - Step 53677: {'lr': 0.0003640835457272547, 'samples': 10305984, 'steps': 53676, 'loss/train': 0.9961517453193665} -11/07/2021 04:46:47 - INFO - __main__ - Step 53678: {'lr': 0.00036407882371548394, 'samples': 10306176, 'steps': 53677, 'loss/train': 1.57715904712677} -11/07/2021 04:46:48 - INFO - __main__ - Step 53679: {'lr': 0.00036407410165231096, 'samples': 10306368, 'steps': 53678, 'loss/train': 1.3340072631835938} -11/07/2021 04:46:48 - INFO - __main__ - Step 53680: {'lr': 0.000364069379537738, 'samples': 10306560, 'steps': 53679, 'loss/train': 1.40402352809906} -11/07/2021 04:46:49 - INFO - __main__ - Step 53681: {'lr': 0.0003640646573717671, 'samples': 10306752, 'steps': 53680, 'loss/train': 1.870320200920105} -11/07/2021 04:46:49 - INFO - __main__ - Step 53682: {'lr': 0.00036405993515440044, 'samples': 10306944, 'steps': 53681, 'loss/train': 1.4479228258132935} -11/07/2021 04:46:49 - INFO - __main__ - Step 53683: {'lr': 0.0003640552128856401, 'samples': 10307136, 'steps': 53682, 'loss/train': 1.7776511907577515} -11/07/2021 04:46:50 - INFO - __main__ - Step 53684: {'lr': 0.00036405049056548834, 'samples': 10307328, 'steps': 53683, 'loss/train': 1.0751904249191284} -11/07/2021 04:46:51 - INFO - __main__ - Step 53685: {'lr': 0.0003640457681939471, 'samples': 10307520, 'steps': 53684, 'loss/train': 1.1244386434555054} -11/07/2021 04:46:51 - INFO - __main__ - Step 53686: {'lr': 0.0003640410457710186, 'samples': 10307712, 'steps': 53685, 'loss/train': 1.837347149848938} -11/07/2021 04:46:51 - INFO - __main__ - Step 53687: {'lr': 0.000364036323296705, 'samples': 10307904, 'steps': 53686, 'loss/train': 1.4676305055618286} -11/07/2021 04:46:52 - INFO - __main__ - Step 53688: {'lr': 0.0003640316007710084, 'samples': 10308096, 'steps': 53687, 'loss/train': 1.7935171127319336} -11/07/2021 04:46:53 - INFO - __main__ - Step 53689: {'lr': 0.0003640268781939309, 'samples': 10308288, 'steps': 53688, 'loss/train': 0.6592240333557129} -11/07/2021 04:46:53 - INFO - __main__ - Step 53690: {'lr': 0.0003640221555654747, 'samples': 10308480, 'steps': 53689, 'loss/train': 1.243087887763977} -11/07/2021 04:46:53 - INFO - __main__ - Step 53691: {'lr': 0.0003640174328856418, 'samples': 10308672, 'steps': 53690, 'loss/train': 1.3240450620651245} -11/07/2021 04:46:54 - INFO - __main__ - Step 53692: {'lr': 0.0003640127101544344, 'samples': 10308864, 'steps': 53691, 'loss/train': 1.3351621627807617} -11/07/2021 04:46:54 - INFO - __main__ - Step 53693: {'lr': 0.00036400798737185465, 'samples': 10309056, 'steps': 53692, 'loss/train': 1.294119954109192} -11/07/2021 04:46:55 - INFO - __main__ - Step 53694: {'lr': 0.0003640032645379047, 'samples': 10309248, 'steps': 53693, 'loss/train': 1.5483777523040771} -11/07/2021 04:46:56 - INFO - __main__ - Step 53695: {'lr': 0.0003639985416525866, 'samples': 10309440, 'steps': 53694, 'loss/train': 1.6617079973220825} -11/07/2021 04:46:56 - INFO - __main__ - Step 53696: {'lr': 0.00036399381871590254, 'samples': 10309632, 'steps': 53695, 'loss/train': 1.4084619283676147} -11/07/2021 04:46:56 - INFO - __main__ - Step 53697: {'lr': 0.0003639890957278546, 'samples': 10309824, 'steps': 53696, 'loss/train': 0.486763060092926} -11/07/2021 04:46:57 - INFO - __main__ - Step 53698: {'lr': 0.0003639843726884449, 'samples': 10310016, 'steps': 53697, 'loss/train': 0.8962081670761108} -11/07/2021 04:46:58 - INFO - __main__ - Step 53699: {'lr': 0.0003639796495976757, 'samples': 10310208, 'steps': 53698, 'loss/train': 1.4068572521209717} -11/07/2021 04:46:58 - INFO - __main__ - Step 53700: {'lr': 0.000363974926455549, 'samples': 10310400, 'steps': 53699, 'loss/train': 1.7828649282455444} -11/07/2021 04:46:58 - INFO - __main__ - Step 53701: {'lr': 0.0003639702032620669, 'samples': 10310592, 'steps': 53700, 'loss/train': 1.5869852304458618} -11/07/2021 04:46:59 - INFO - __main__ - Step 53702: {'lr': 0.00036396548001723164, 'samples': 10310784, 'steps': 53701, 'loss/train': 1.3004422187805176} -11/07/2021 04:46:59 - INFO - __main__ - Step 53703: {'lr': 0.00036396075672104523, 'samples': 10310976, 'steps': 53702, 'loss/train': 0.5950105786323547} -11/07/2021 04:47:00 - INFO - __main__ - Step 53704: {'lr': 0.00036395603337350987, 'samples': 10311168, 'steps': 53703, 'loss/train': 1.9966845512390137} -11/07/2021 04:47:01 - INFO - __main__ - Step 53705: {'lr': 0.0003639513099746277, 'samples': 10311360, 'steps': 53704, 'loss/train': 1.6448525190353394} -11/07/2021 04:47:01 - INFO - __main__ - Step 53706: {'lr': 0.0003639465865244008, 'samples': 10311552, 'steps': 53705, 'loss/train': 1.3442103862762451} -11/07/2021 04:47:01 - INFO - __main__ - Step 53707: {'lr': 0.0003639418630228314, 'samples': 10311744, 'steps': 53706, 'loss/train': 1.686835765838623} -11/07/2021 04:47:02 - INFO - __main__ - Step 53708: {'lr': 0.00036393713946992156, 'samples': 10311936, 'steps': 53707, 'loss/train': 1.5133798122406006} -11/07/2021 04:47:02 - INFO - __main__ - Step 53709: {'lr': 0.0003639324158656733, 'samples': 10312128, 'steps': 53708, 'loss/train': 1.7039297819137573} -11/07/2021 04:47:03 - INFO - __main__ - Step 53710: {'lr': 0.00036392769221008895, 'samples': 10312320, 'steps': 53709, 'loss/train': 1.2365678548812866} -11/07/2021 04:47:03 - INFO - __main__ - Step 53711: {'lr': 0.0003639229685031705, 'samples': 10312512, 'steps': 53710, 'loss/train': 1.77914559841156} -11/07/2021 04:47:04 - INFO - __main__ - Step 53712: {'lr': 0.0003639182447449201, 'samples': 10312704, 'steps': 53711, 'loss/train': 1.595699429512024} -11/07/2021 04:47:04 - INFO - __main__ - Step 53713: {'lr': 0.00036391352093533995, 'samples': 10312896, 'steps': 53712, 'loss/train': 1.299613118171692} -11/07/2021 04:47:04 - INFO - __main__ - Step 53714: {'lr': 0.0003639087970744321, 'samples': 10313088, 'steps': 53713, 'loss/train': 1.5028570890426636} -11/07/2021 04:47:05 - INFO - __main__ - Step 53715: {'lr': 0.00036390407316219865, 'samples': 10313280, 'steps': 53714, 'loss/train': 1.6350452899932861} -11/07/2021 04:47:06 - INFO - __main__ - Step 53716: {'lr': 0.0003638993491986419, 'samples': 10313472, 'steps': 53715, 'loss/train': 1.6072763204574585} -11/07/2021 04:47:06 - INFO - __main__ - Step 53717: {'lr': 0.0003638946251837637, 'samples': 10313664, 'steps': 53716, 'loss/train': 0.8431642651557922} -11/07/2021 04:47:07 - INFO - __main__ - Step 53718: {'lr': 0.0003638899011175664, 'samples': 10313856, 'steps': 53717, 'loss/train': 1.6525471210479736} -11/07/2021 04:47:07 - INFO - __main__ - Step 53719: {'lr': 0.00036388517700005214, 'samples': 10314048, 'steps': 53718, 'loss/train': 1.4922749996185303} -11/07/2021 04:47:08 - INFO - __main__ - Step 53720: {'lr': 0.00036388045283122295, 'samples': 10314240, 'steps': 53719, 'loss/train': 1.281136393547058} -11/07/2021 04:47:08 - INFO - __main__ - Step 53721: {'lr': 0.00036387572861108097, 'samples': 10314432, 'steps': 53720, 'loss/train': 1.217883825302124} -11/07/2021 04:47:09 - INFO - __main__ - Step 53722: {'lr': 0.0003638710043396283, 'samples': 10314624, 'steps': 53721, 'loss/train': 1.5383968353271484} -11/07/2021 04:47:09 - INFO - __main__ - Step 53723: {'lr': 0.0003638662800168672, 'samples': 10314816, 'steps': 53722, 'loss/train': 1.8818771839141846} -11/07/2021 04:47:09 - INFO - __main__ - Step 53724: {'lr': 0.00036386155564279967, 'samples': 10315008, 'steps': 53723, 'loss/train': 2.0879263877868652} -11/07/2021 04:47:10 - INFO - __main__ - Step 53725: {'lr': 0.00036385683121742786, 'samples': 10315200, 'steps': 53724, 'loss/train': 1.3340603113174438} -11/07/2021 04:47:11 - INFO - __main__ - Step 53726: {'lr': 0.00036385210674075394, 'samples': 10315392, 'steps': 53725, 'loss/train': 0.9048414826393127} -11/07/2021 04:47:11 - INFO - __main__ - Step 53727: {'lr': 0.00036384738221278, 'samples': 10315584, 'steps': 53726, 'loss/train': 1.2589433193206787} -11/07/2021 04:47:11 - INFO - __main__ - Step 53728: {'lr': 0.0003638426576335082, 'samples': 10315776, 'steps': 53727, 'loss/train': 1.4779775142669678} -11/07/2021 04:47:12 - INFO - __main__ - Step 53729: {'lr': 0.00036383793300294063, 'samples': 10315968, 'steps': 53728, 'loss/train': 1.1890757083892822} -11/07/2021 04:47:13 - INFO - __main__ - Step 53730: {'lr': 0.00036383320832107945, 'samples': 10316160, 'steps': 53729, 'loss/train': 0.902030885219574} -11/07/2021 04:47:13 - INFO - __main__ - Step 53731: {'lr': 0.0003638284835879268, 'samples': 10316352, 'steps': 53730, 'loss/train': 1.5771640539169312} -11/07/2021 04:47:14 - INFO - __main__ - Step 53732: {'lr': 0.0003638237588034848, 'samples': 10316544, 'steps': 53731, 'loss/train': 1.7153632640838623} -11/07/2021 04:47:14 - INFO - __main__ - Step 53733: {'lr': 0.00036381903396775556, 'samples': 10316736, 'steps': 53732, 'loss/train': 1.4391967058181763} -11/07/2021 04:47:14 - INFO - __main__ - Step 53734: {'lr': 0.00036381430908074126, 'samples': 10316928, 'steps': 53733, 'loss/train': 0.6550378799438477} -11/07/2021 04:47:15 - INFO - __main__ - Step 53735: {'lr': 0.00036380958414244393, 'samples': 10317120, 'steps': 53734, 'loss/train': 1.7250784635543823} -11/07/2021 04:47:16 - INFO - __main__ - Step 53736: {'lr': 0.0003638048591528658, 'samples': 10317312, 'steps': 53735, 'loss/train': 1.365229606628418} -11/07/2021 04:47:16 - INFO - __main__ - Step 53737: {'lr': 0.0003638001341120089, 'samples': 10317504, 'steps': 53736, 'loss/train': 1.5920060873031616} -11/07/2021 04:47:16 - INFO - __main__ - Step 53738: {'lr': 0.00036379540901987546, 'samples': 10317696, 'steps': 53737, 'loss/train': 1.2214041948318481} -11/07/2021 04:47:17 - INFO - __main__ - Step 53739: {'lr': 0.0003637906838764675, 'samples': 10317888, 'steps': 53738, 'loss/train': 1.0287377834320068} -11/07/2021 04:47:18 - INFO - __main__ - Step 53740: {'lr': 0.00036378595868178737, 'samples': 10318080, 'steps': 53739, 'loss/train': 0.5260177254676819} -11/07/2021 04:47:18 - INFO - __main__ - Step 53741: {'lr': 0.00036378123343583694, 'samples': 10318272, 'steps': 53740, 'loss/train': 4.54772424697876} -11/07/2021 04:47:18 - INFO - __main__ - Step 53742: {'lr': 0.0003637765081386184, 'samples': 10318464, 'steps': 53741, 'loss/train': 1.2605921030044556} -11/07/2021 04:47:19 - INFO - __main__ - Step 53743: {'lr': 0.000363771782790134, 'samples': 10318656, 'steps': 53742, 'loss/train': 1.553490400314331} -11/07/2021 04:47:19 - INFO - __main__ - Step 53744: {'lr': 0.0003637670573903857, 'samples': 10318848, 'steps': 53743, 'loss/train': 1.5717657804489136} -11/07/2021 04:47:20 - INFO - __main__ - Step 53745: {'lr': 0.0003637623319393758, 'samples': 10319040, 'steps': 53744, 'loss/train': 1.5152475833892822} -11/07/2021 04:47:21 - INFO - __main__ - Step 53746: {'lr': 0.0003637576064371063, 'samples': 10319232, 'steps': 53745, 'loss/train': 1.27506685256958} -11/07/2021 04:47:21 - INFO - __main__ - Step 53747: {'lr': 0.0003637528808835794, 'samples': 10319424, 'steps': 53746, 'loss/train': 1.5017693042755127} -11/07/2021 04:47:21 - INFO - __main__ - Step 53748: {'lr': 0.00036374815527879725, 'samples': 10319616, 'steps': 53747, 'loss/train': 0.9367703795433044} -11/07/2021 04:47:22 - INFO - __main__ - Step 53749: {'lr': 0.0003637434296227619, 'samples': 10319808, 'steps': 53748, 'loss/train': 1.4065848588943481} -11/07/2021 04:47:22 - INFO - __main__ - Step 53750: {'lr': 0.0003637387039154755, 'samples': 10320000, 'steps': 53749, 'loss/train': 1.6673144102096558} -11/07/2021 04:47:23 - INFO - __main__ - Step 53751: {'lr': 0.0003637339781569402, 'samples': 10320192, 'steps': 53750, 'loss/train': 1.3397016525268555} -11/07/2021 04:47:23 - INFO - __main__ - Step 53752: {'lr': 0.0003637292523471581, 'samples': 10320384, 'steps': 53751, 'loss/train': 1.1209821701049805} -11/07/2021 04:47:24 - INFO - __main__ - Step 53753: {'lr': 0.0003637245264861314, 'samples': 10320576, 'steps': 53752, 'loss/train': 1.556083083152771} -11/07/2021 04:47:24 - INFO - __main__ - Step 53754: {'lr': 0.0003637198005738622, 'samples': 10320768, 'steps': 53753, 'loss/train': 1.0590068101882935} -11/07/2021 04:47:24 - INFO - __main__ - Step 53755: {'lr': 0.0003637150746103526, 'samples': 10320960, 'steps': 53754, 'loss/train': 1.3447222709655762} -11/07/2021 04:47:26 - INFO - __main__ - Step 53756: {'lr': 0.0003637103485956047, 'samples': 10321152, 'steps': 53755, 'loss/train': 1.2610257863998413} -11/07/2021 04:47:26 - INFO - __main__ - Step 53757: {'lr': 0.0003637056225296207, 'samples': 10321344, 'steps': 53756, 'loss/train': 1.4213162660598755} -11/07/2021 04:47:26 - INFO - __main__ - Step 53758: {'lr': 0.00036370089641240264, 'samples': 10321536, 'steps': 53757, 'loss/train': 1.2108180522918701} -11/07/2021 04:47:27 - INFO - __main__ - Step 53759: {'lr': 0.0003636961702439527, 'samples': 10321728, 'steps': 53758, 'loss/train': 2.09029483795166} -11/07/2021 04:47:27 - INFO - __main__ - Step 53760: {'lr': 0.0003636914440242732, 'samples': 10321920, 'steps': 53759, 'loss/train': 0.6936137080192566} -11/07/2021 04:47:28 - INFO - __main__ - Step 53761: {'lr': 0.00036368671775336597, 'samples': 10322112, 'steps': 53760, 'loss/train': 5.76736307144165} -11/07/2021 04:47:28 - INFO - __main__ - Step 53762: {'lr': 0.00036368199143123326, 'samples': 10322304, 'steps': 53761, 'loss/train': 0.5955904126167297} -11/07/2021 04:47:29 - INFO - __main__ - Step 53763: {'lr': 0.0003636772650578772, 'samples': 10322496, 'steps': 53762, 'loss/train': 1.3145180940628052} -11/07/2021 04:47:29 - INFO - __main__ - Step 53764: {'lr': 0.0003636725386332999, 'samples': 10322688, 'steps': 53763, 'loss/train': 1.5261660814285278} -11/07/2021 04:47:30 - INFO - __main__ - Step 53765: {'lr': 0.00036366781215750355, 'samples': 10322880, 'steps': 53764, 'loss/train': 1.5784448385238647} -11/07/2021 04:47:31 - INFO - __main__ - Step 53766: {'lr': 0.0003636630856304902, 'samples': 10323072, 'steps': 53765, 'loss/train': 1.6527149677276611} -11/07/2021 04:47:31 - INFO - __main__ - Step 53767: {'lr': 0.0003636583590522621, 'samples': 10323264, 'steps': 53766, 'loss/train': 1.1597646474838257} -11/07/2021 04:47:31 - INFO - __main__ - Step 53768: {'lr': 0.00036365363242282117, 'samples': 10323456, 'steps': 53767, 'loss/train': 1.369114637374878} -11/07/2021 04:47:32 - INFO - __main__ - Step 53769: {'lr': 0.00036364890574216974, 'samples': 10323648, 'steps': 53768, 'loss/train': 1.6082525253295898} -11/07/2021 04:47:32 - INFO - __main__ - Step 53770: {'lr': 0.0003636441790103098, 'samples': 10323840, 'steps': 53769, 'loss/train': 1.1371461153030396} -11/07/2021 04:47:32 - INFO - __main__ - Step 53771: {'lr': 0.00036363945222724363, 'samples': 10324032, 'steps': 53770, 'loss/train': 1.4053053855895996} -11/07/2021 04:47:33 - INFO - __main__ - Step 53772: {'lr': 0.0003636347253929733, 'samples': 10324224, 'steps': 53771, 'loss/train': 1.359999179840088} -11/07/2021 04:47:34 - INFO - __main__ - Step 53773: {'lr': 0.0003636299985075008, 'samples': 10324416, 'steps': 53772, 'loss/train': 0.18141159415245056} -11/07/2021 04:47:34 - INFO - __main__ - Step 53774: {'lr': 0.00036362527157082845, 'samples': 10324608, 'steps': 53773, 'loss/train': 1.189090371131897} -11/07/2021 04:47:34 - INFO - __main__ - Step 53775: {'lr': 0.00036362054458295836, 'samples': 10324800, 'steps': 53774, 'loss/train': 1.1098508834838867} -11/07/2021 04:47:35 - INFO - __main__ - Step 53776: {'lr': 0.0003636158175438925, 'samples': 10324992, 'steps': 53775, 'loss/train': 1.6424130201339722} -11/07/2021 04:47:36 - INFO - __main__ - Step 53777: {'lr': 0.00036361109045363315, 'samples': 10325184, 'steps': 53776, 'loss/train': 1.2648173570632935} -11/07/2021 04:47:36 - INFO - __main__ - Step 53778: {'lr': 0.0003636063633121824, 'samples': 10325376, 'steps': 53777, 'loss/train': 1.6093236207962036} -11/07/2021 04:47:36 - INFO - __main__ - Step 53779: {'lr': 0.0003636016361195423, 'samples': 10325568, 'steps': 53778, 'loss/train': 1.2295337915420532} -11/07/2021 04:47:37 - INFO - __main__ - Step 53780: {'lr': 0.0003635969088757152, 'samples': 10325760, 'steps': 53779, 'loss/train': 1.4420655965805054} -11/07/2021 04:47:37 - INFO - __main__ - Step 53781: {'lr': 0.000363592181580703, 'samples': 10325952, 'steps': 53780, 'loss/train': 1.3411906957626343} -11/07/2021 04:47:38 - INFO - __main__ - Step 53782: {'lr': 0.00036358745423450793, 'samples': 10326144, 'steps': 53781, 'loss/train': 1.7579644918441772} -11/07/2021 04:47:38 - INFO - __main__ - Step 53783: {'lr': 0.00036358272683713214, 'samples': 10326336, 'steps': 53782, 'loss/train': 1.5507636070251465} -11/07/2021 04:47:39 - INFO - __main__ - Step 53784: {'lr': 0.00036357799938857766, 'samples': 10326528, 'steps': 53783, 'loss/train': 1.4037292003631592} -11/07/2021 04:47:39 - INFO - __main__ - Step 53785: {'lr': 0.0003635732718888467, 'samples': 10326720, 'steps': 53784, 'loss/train': 1.7858861684799194} -11/07/2021 04:47:39 - INFO - __main__ - Step 53786: {'lr': 0.0003635685443379414, 'samples': 10326912, 'steps': 53785, 'loss/train': 1.620208501815796} -11/07/2021 04:47:41 - INFO - __main__ - Step 53787: {'lr': 0.0003635638167358639, 'samples': 10327104, 'steps': 53786, 'loss/train': 1.504921793937683} -11/07/2021 04:47:41 - INFO - __main__ - Step 53788: {'lr': 0.00036355908908261624, 'samples': 10327296, 'steps': 53787, 'loss/train': 1.457025170326233} -11/07/2021 04:47:41 - INFO - __main__ - Step 53789: {'lr': 0.0003635543613782006, 'samples': 10327488, 'steps': 53788, 'loss/train': 1.4828907251358032} -11/07/2021 04:47:42 - INFO - __main__ - Step 53790: {'lr': 0.0003635496336226192, 'samples': 10327680, 'steps': 53789, 'loss/train': 1.8180770874023438} -11/07/2021 04:47:42 - INFO - __main__ - Step 53791: {'lr': 0.00036354490581587396, 'samples': 10327872, 'steps': 53790, 'loss/train': 1.270146131515503} -11/07/2021 04:47:43 - INFO - __main__ - Step 53792: {'lr': 0.0003635401779579672, 'samples': 10328064, 'steps': 53791, 'loss/train': 1.7751363515853882} -11/07/2021 04:47:43 - INFO - __main__ - Step 53793: {'lr': 0.000363535450048901, 'samples': 10328256, 'steps': 53792, 'loss/train': 1.0968623161315918} -11/07/2021 04:47:44 - INFO - __main__ - Step 53794: {'lr': 0.00036353072208867746, 'samples': 10328448, 'steps': 53793, 'loss/train': 1.5342804193496704} -11/07/2021 04:47:44 - INFO - __main__ - Step 53795: {'lr': 0.00036352599407729873, 'samples': 10328640, 'steps': 53794, 'loss/train': 2.254974126815796} -11/07/2021 04:47:44 - INFO - __main__ - Step 53796: {'lr': 0.00036352126601476697, 'samples': 10328832, 'steps': 53795, 'loss/train': 0.7802295088768005} -11/07/2021 04:47:46 - INFO - __main__ - Step 53797: {'lr': 0.0003635165379010842, 'samples': 10329024, 'steps': 53796, 'loss/train': 1.4556673765182495} -11/07/2021 04:47:46 - INFO - __main__ - Step 53798: {'lr': 0.0003635118097362528, 'samples': 10329216, 'steps': 53797, 'loss/train': 1.4433975219726562} -11/07/2021 04:47:46 - INFO - __main__ - Step 53799: {'lr': 0.0003635070815202746, 'samples': 10329408, 'steps': 53798, 'loss/train': 1.3020963668823242} -11/07/2021 04:47:47 - INFO - __main__ - Step 53800: {'lr': 0.0003635023532531518, 'samples': 10329600, 'steps': 53799, 'loss/train': 1.1585911512374878} -11/07/2021 04:47:47 - INFO - __main__ - Step 53801: {'lr': 0.00036349762493488667, 'samples': 10329792, 'steps': 53800, 'loss/train': 1.520574927330017} -11/07/2021 04:47:48 - INFO - __main__ - Step 53802: {'lr': 0.0003634928965654813, 'samples': 10329984, 'steps': 53801, 'loss/train': 1.0751932859420776} -11/07/2021 04:47:48 - INFO - __main__ - Step 53803: {'lr': 0.0003634881681449377, 'samples': 10330176, 'steps': 53802, 'loss/train': 1.605992317199707} -11/07/2021 04:47:49 - INFO - __main__ - Step 53804: {'lr': 0.00036348343967325814, 'samples': 10330368, 'steps': 53803, 'loss/train': 1.3527597188949585} -11/07/2021 04:47:49 - INFO - __main__ - Step 53805: {'lr': 0.00036347871115044466, 'samples': 10330560, 'steps': 53804, 'loss/train': 1.6451653242111206} -11/07/2021 04:47:49 - INFO - __main__ - Step 53806: {'lr': 0.0003634739825764995, 'samples': 10330752, 'steps': 53805, 'loss/train': 1.4473252296447754} -11/07/2021 04:47:50 - INFO - __main__ - Step 53807: {'lr': 0.00036346925395142467, 'samples': 10330944, 'steps': 53806, 'loss/train': 1.5503804683685303} -11/07/2021 04:47:51 - INFO - __main__ - Step 53808: {'lr': 0.00036346452527522233, 'samples': 10331136, 'steps': 53807, 'loss/train': 0.5679416656494141} -11/07/2021 04:47:51 - INFO - __main__ - Step 53809: {'lr': 0.0003634597965478946, 'samples': 10331328, 'steps': 53808, 'loss/train': 1.4964993000030518} -11/07/2021 04:47:51 - INFO - __main__ - Step 53810: {'lr': 0.00036345506776944364, 'samples': 10331520, 'steps': 53809, 'loss/train': 1.9264088869094849} -11/07/2021 04:47:52 - INFO - __main__ - Step 53811: {'lr': 0.00036345033893987164, 'samples': 10331712, 'steps': 53810, 'loss/train': 1.2241166830062866} -11/07/2021 04:47:53 - INFO - __main__ - Step 53812: {'lr': 0.00036344561005918064, 'samples': 10331904, 'steps': 53811, 'loss/train': 1.086397409439087} -11/07/2021 04:47:53 - INFO - __main__ - Step 53813: {'lr': 0.00036344088112737276, 'samples': 10332096, 'steps': 53812, 'loss/train': 1.5006593465805054} -11/07/2021 04:47:53 - INFO - __main__ - Step 53814: {'lr': 0.0003634361521444502, 'samples': 10332288, 'steps': 53813, 'loss/train': 1.4294464588165283} -11/07/2021 04:47:54 - INFO - __main__ - Step 53815: {'lr': 0.00036343142311041503, 'samples': 10332480, 'steps': 53814, 'loss/train': 1.3686741590499878} -11/07/2021 04:47:54 - INFO - __main__ - Step 53816: {'lr': 0.00036342669402526946, 'samples': 10332672, 'steps': 53815, 'loss/train': 1.4084200859069824} -11/07/2021 04:47:55 - INFO - __main__ - Step 53817: {'lr': 0.0003634219648890156, 'samples': 10332864, 'steps': 53816, 'loss/train': 1.3252638578414917} -11/07/2021 04:47:55 - INFO - __main__ - Step 53818: {'lr': 0.00036341723570165545, 'samples': 10333056, 'steps': 53817, 'loss/train': 1.0600765943527222} -11/07/2021 04:47:56 - INFO - __main__ - Step 53819: {'lr': 0.0003634125064631913, 'samples': 10333248, 'steps': 53818, 'loss/train': 1.2755149602890015} -11/07/2021 04:47:56 - INFO - __main__ - Step 53820: {'lr': 0.0003634077771736252, 'samples': 10333440, 'steps': 53819, 'loss/train': 1.4315431118011475} -11/07/2021 04:47:57 - INFO - __main__ - Step 53821: {'lr': 0.00036340304783295937, 'samples': 10333632, 'steps': 53820, 'loss/train': 1.654606819152832} -11/07/2021 04:47:57 - INFO - __main__ - Step 53822: {'lr': 0.0003633983184411958, 'samples': 10333824, 'steps': 53821, 'loss/train': 1.3569787740707397} -11/07/2021 04:47:58 - INFO - __main__ - Step 53823: {'lr': 0.00036339358899833675, 'samples': 10334016, 'steps': 53822, 'loss/train': 1.6146955490112305} -11/07/2021 04:47:59 - INFO - __main__ - Step 53824: {'lr': 0.00036338885950438425, 'samples': 10334208, 'steps': 53823, 'loss/train': 1.7868359088897705} -11/07/2021 04:47:59 - INFO - __main__ - Step 53825: {'lr': 0.00036338412995934056, 'samples': 10334400, 'steps': 53824, 'loss/train': 1.8714745044708252} -11/07/2021 04:47:59 - INFO - __main__ - Step 53826: {'lr': 0.00036337940036320764, 'samples': 10334592, 'steps': 53825, 'loss/train': 1.0929986238479614} -11/07/2021 04:48:00 - INFO - __main__ - Step 53827: {'lr': 0.0003633746707159877, 'samples': 10334784, 'steps': 53826, 'loss/train': 1.3598603010177612} -11/07/2021 04:48:01 - INFO - __main__ - Step 53828: {'lr': 0.00036336994101768304, 'samples': 10334976, 'steps': 53827, 'loss/train': 0.10197296738624573} -11/07/2021 04:48:01 - INFO - __main__ - Step 53829: {'lr': 0.00036336521126829554, 'samples': 10335168, 'steps': 53828, 'loss/train': 0.9619058966636658} -11/07/2021 04:48:01 - INFO - __main__ - Step 53830: {'lr': 0.00036336048146782743, 'samples': 10335360, 'steps': 53829, 'loss/train': 1.5208972692489624} -11/07/2021 04:48:02 - INFO - __main__ - Step 53831: {'lr': 0.00036335575161628076, 'samples': 10335552, 'steps': 53830, 'loss/train': 1.1052848100662231} -11/07/2021 04:48:02 - INFO - __main__ - Step 53832: {'lr': 0.0003633510217136578, 'samples': 10335744, 'steps': 53831, 'loss/train': 1.211521029472351} -11/07/2021 04:48:02 - INFO - __main__ - Step 53833: {'lr': 0.0003633462917599606, 'samples': 10335936, 'steps': 53832, 'loss/train': 1.2743152379989624} -11/07/2021 04:48:04 - INFO - __main__ - Step 53834: {'lr': 0.0003633415617551914, 'samples': 10336128, 'steps': 53833, 'loss/train': 1.2937463521957397} -11/07/2021 04:48:04 - INFO - __main__ - Step 53835: {'lr': 0.0003633368316993521, 'samples': 10336320, 'steps': 53834, 'loss/train': 1.0048315525054932} -11/07/2021 04:48:04 - INFO - __main__ - Step 53836: {'lr': 0.0003633321015924451, 'samples': 10336512, 'steps': 53835, 'loss/train': 1.6738377809524536} -11/07/2021 04:48:05 - INFO - __main__ - Step 53837: {'lr': 0.0003633273714344723, 'samples': 10336704, 'steps': 53836, 'loss/train': 1.8290668725967407} -11/07/2021 04:48:05 - INFO - __main__ - Step 53838: {'lr': 0.00036332264122543594, 'samples': 10336896, 'steps': 53837, 'loss/train': 1.311269998550415} -11/07/2021 04:48:06 - INFO - __main__ - Step 53839: {'lr': 0.00036331791096533815, 'samples': 10337088, 'steps': 53838, 'loss/train': 1.4427428245544434} -11/07/2021 04:48:06 - INFO - __main__ - Step 53840: {'lr': 0.0003633131806541811, 'samples': 10337280, 'steps': 53839, 'loss/train': 1.5543686151504517} -11/07/2021 04:48:07 - INFO - __main__ - Step 53841: {'lr': 0.000363308450291967, 'samples': 10337472, 'steps': 53840, 'loss/train': 1.4297562837600708} -11/07/2021 04:48:07 - INFO - __main__ - Step 53842: {'lr': 0.0003633037198786977, 'samples': 10337664, 'steps': 53841, 'loss/train': 1.35160493850708} -11/07/2021 04:48:07 - INFO - __main__ - Step 53843: {'lr': 0.0003632989894143755, 'samples': 10337856, 'steps': 53842, 'loss/train': 1.9040676355361938} -11/07/2021 04:48:09 - INFO - __main__ - Step 53844: {'lr': 0.0003632942588990025, 'samples': 10338048, 'steps': 53843, 'loss/train': 0.9160776734352112} -11/07/2021 04:48:09 - INFO - __main__ - Step 53845: {'lr': 0.00036328952833258096, 'samples': 10338240, 'steps': 53844, 'loss/train': 1.2757924795150757} -11/07/2021 04:48:09 - INFO - __main__ - Step 53846: {'lr': 0.0003632847977151128, 'samples': 10338432, 'steps': 53845, 'loss/train': 1.3739603757858276} -11/07/2021 04:48:10 - INFO - __main__ - Step 53847: {'lr': 0.0003632800670466003, 'samples': 10338624, 'steps': 53846, 'loss/train': 2.090402126312256} -11/07/2021 04:48:10 - INFO - __main__ - Step 53848: {'lr': 0.0003632753363270456, 'samples': 10338816, 'steps': 53847, 'loss/train': 1.2552708387374878} -11/07/2021 04:48:11 - INFO - __main__ - Step 53849: {'lr': 0.00036327060555645075, 'samples': 10339008, 'steps': 53848, 'loss/train': 2.2328643798828125} -11/07/2021 04:48:11 - INFO - __main__ - Step 53850: {'lr': 0.0003632658747348179, 'samples': 10339200, 'steps': 53849, 'loss/train': 1.481790542602539} -11/07/2021 04:48:12 - INFO - __main__ - Step 53851: {'lr': 0.0003632611438621492, 'samples': 10339392, 'steps': 53850, 'loss/train': 1.4229248762130737} -11/07/2021 04:48:12 - INFO - __main__ - Step 53852: {'lr': 0.00036325641293844674, 'samples': 10339584, 'steps': 53851, 'loss/train': 1.4889165163040161} -11/07/2021 04:48:13 - INFO - __main__ - Step 53853: {'lr': 0.0003632516819637127, 'samples': 10339776, 'steps': 53852, 'loss/train': 1.4895575046539307} -11/07/2021 04:48:14 - INFO - __main__ - Step 53854: {'lr': 0.0003632469509379492, 'samples': 10339968, 'steps': 53853, 'loss/train': 1.564021110534668} -11/07/2021 04:48:14 - INFO - __main__ - Step 53855: {'lr': 0.00036324221986115847, 'samples': 10340160, 'steps': 53854, 'loss/train': 1.301256775856018} -11/07/2021 04:48:14 - INFO - __main__ - Step 53856: {'lr': 0.00036323748873334246, 'samples': 10340352, 'steps': 53855, 'loss/train': 1.5127121210098267} -11/07/2021 04:48:15 - INFO - __main__ - Step 53857: {'lr': 0.00036323275755450335, 'samples': 10340544, 'steps': 53856, 'loss/train': 1.2701239585876465} -11/07/2021 04:48:15 - INFO - __main__ - Step 53858: {'lr': 0.00036322802632464336, 'samples': 10340736, 'steps': 53857, 'loss/train': 1.4404006004333496} -11/07/2021 04:48:16 - INFO - __main__ - Step 53859: {'lr': 0.00036322329504376457, 'samples': 10340928, 'steps': 53858, 'loss/train': 1.1640100479125977} -11/07/2021 04:48:16 - INFO - __main__ - Step 53860: {'lr': 0.0003632185637118691, 'samples': 10341120, 'steps': 53859, 'loss/train': 3.0354626178741455} -11/07/2021 04:48:17 - INFO - __main__ - Step 53861: {'lr': 0.0003632138323289591, 'samples': 10341312, 'steps': 53860, 'loss/train': 1.0776021480560303} -11/07/2021 04:48:17 - INFO - __main__ - Step 53862: {'lr': 0.00036320910089503665, 'samples': 10341504, 'steps': 53861, 'loss/train': 1.5987331867218018} -11/07/2021 04:48:17 - INFO - __main__ - Step 53863: {'lr': 0.00036320436941010396, 'samples': 10341696, 'steps': 53862, 'loss/train': 1.5577402114868164} -11/07/2021 04:48:19 - INFO - __main__ - Step 53864: {'lr': 0.00036319963787416313, 'samples': 10341888, 'steps': 53863, 'loss/train': 1.2340596914291382} -11/07/2021 04:48:19 - INFO - __main__ - Step 53865: {'lr': 0.0003631949062872163, 'samples': 10342080, 'steps': 53864, 'loss/train': 1.2378990650177002} -11/07/2021 04:48:19 - INFO - __main__ - Step 53866: {'lr': 0.0003631901746492656, 'samples': 10342272, 'steps': 53865, 'loss/train': 0.44143298268318176} -11/07/2021 04:48:20 - INFO - __main__ - Step 53867: {'lr': 0.0003631854429603131, 'samples': 10342464, 'steps': 53866, 'loss/train': 1.5051151514053345} -11/07/2021 04:48:20 - INFO - __main__ - Step 53868: {'lr': 0.00036318071122036104, 'samples': 10342656, 'steps': 53867, 'loss/train': 1.5813905000686646} -11/07/2021 04:48:20 - INFO - __main__ - Step 53869: {'lr': 0.0003631759794294115, 'samples': 10342848, 'steps': 53868, 'loss/train': 0.08255495876073837} -11/07/2021 04:48:21 - INFO - __main__ - Step 53870: {'lr': 0.00036317124758746656, 'samples': 10343040, 'steps': 53869, 'loss/train': 1.330836296081543} -11/07/2021 04:48:22 - INFO - __main__ - Step 53871: {'lr': 0.0003631665156945284, 'samples': 10343232, 'steps': 53870, 'loss/train': 1.091623306274414} -11/07/2021 04:48:22 - INFO - __main__ - Step 53872: {'lr': 0.0003631617837505992, 'samples': 10343424, 'steps': 53871, 'loss/train': 1.3825600147247314} -11/07/2021 04:48:22 - INFO - __main__ - Step 53873: {'lr': 0.00036315705175568103, 'samples': 10343616, 'steps': 53872, 'loss/train': 1.1355825662612915} -11/07/2021 04:48:23 - INFO - __main__ - Step 53874: {'lr': 0.000363152319709776, 'samples': 10343808, 'steps': 53873, 'loss/train': 1.1304973363876343} -11/07/2021 04:48:24 - INFO - __main__ - Step 53875: {'lr': 0.00036314758761288643, 'samples': 10344000, 'steps': 53874, 'loss/train': 1.3253768682479858} -11/07/2021 04:48:24 - INFO - __main__ - Step 53876: {'lr': 0.00036314285546501415, 'samples': 10344192, 'steps': 53875, 'loss/train': 1.359163522720337} -11/07/2021 04:48:24 - INFO - __main__ - Step 53877: {'lr': 0.0003631381232661615, 'samples': 10344384, 'steps': 53876, 'loss/train': 1.0204049348831177} -11/07/2021 04:48:25 - INFO - __main__ - Step 53878: {'lr': 0.0003631333910163305, 'samples': 10344576, 'steps': 53877, 'loss/train': 1.375170111656189} -11/07/2021 04:48:25 - INFO - __main__ - Step 53879: {'lr': 0.0003631286587155234, 'samples': 10344768, 'steps': 53878, 'loss/train': 1.1854912042617798} -11/07/2021 04:48:26 - INFO - __main__ - Step 53880: {'lr': 0.00036312392636374225, 'samples': 10344960, 'steps': 53879, 'loss/train': 1.249647855758667} -11/07/2021 04:48:26 - INFO - __main__ - Step 53881: {'lr': 0.00036311919396098927, 'samples': 10345152, 'steps': 53880, 'loss/train': 1.4819236993789673} -11/07/2021 04:48:27 - INFO - __main__ - Step 53882: {'lr': 0.0003631144615072665, 'samples': 10345344, 'steps': 53881, 'loss/train': 1.2886788845062256} -11/07/2021 04:48:27 - INFO - __main__ - Step 53883: {'lr': 0.000363109729002576, 'samples': 10345536, 'steps': 53882, 'loss/train': 1.022611379623413} -11/07/2021 04:48:28 - INFO - __main__ - Step 53884: {'lr': 0.0003631049964469201, 'samples': 10345728, 'steps': 53883, 'loss/train': 0.9048346877098083} -11/07/2021 04:48:29 - INFO - __main__ - Step 53885: {'lr': 0.0003631002638403008, 'samples': 10345920, 'steps': 53884, 'loss/train': 1.0623703002929688} -11/07/2021 04:48:29 - INFO - __main__ - Step 53886: {'lr': 0.0003630955311827202, 'samples': 10346112, 'steps': 53885, 'loss/train': 1.9823561906814575} -11/07/2021 04:48:29 - INFO - __main__ - Step 53887: {'lr': 0.0003630907984741806, 'samples': 10346304, 'steps': 53886, 'loss/train': 1.3129116296768188} -11/07/2021 04:48:30 - INFO - __main__ - Step 53888: {'lr': 0.00036308606571468406, 'samples': 10346496, 'steps': 53887, 'loss/train': 1.1289273500442505} -11/07/2021 04:48:30 - INFO - __main__ - Step 53889: {'lr': 0.00036308133290423257, 'samples': 10346688, 'steps': 53888, 'loss/train': 1.3464230298995972} -11/07/2021 04:48:31 - INFO - __main__ - Step 53890: {'lr': 0.00036307660004282846, 'samples': 10346880, 'steps': 53889, 'loss/train': 2.4567363262176514} -11/07/2021 04:48:31 - INFO - __main__ - Step 53891: {'lr': 0.0003630718671304737, 'samples': 10347072, 'steps': 53890, 'loss/train': 2.03482985496521} -11/07/2021 04:48:32 - INFO - __main__ - Step 53892: {'lr': 0.0003630671341671705, 'samples': 10347264, 'steps': 53891, 'loss/train': 1.603682518005371} -11/07/2021 04:48:32 - INFO - __main__ - Step 53893: {'lr': 0.0003630624011529211, 'samples': 10347456, 'steps': 53892, 'loss/train': 1.567132592201233} -11/07/2021 04:48:33 - INFO - __main__ - Step 53894: {'lr': 0.00036305766808772746, 'samples': 10347648, 'steps': 53893, 'loss/train': 1.824984073638916} -11/07/2021 04:48:34 - INFO - __main__ - Step 53895: {'lr': 0.0003630529349715918, 'samples': 10347840, 'steps': 53894, 'loss/train': 1.2993921041488647} -11/07/2021 04:48:34 - INFO - __main__ - Step 53896: {'lr': 0.0003630482018045163, 'samples': 10348032, 'steps': 53895, 'loss/train': 1.4212656021118164} -11/07/2021 04:48:34 - INFO - __main__ - Step 53897: {'lr': 0.0003630434685865029, 'samples': 10348224, 'steps': 53896, 'loss/train': 1.712717890739441} -11/07/2021 04:48:35 - INFO - __main__ - Step 53898: {'lr': 0.0003630387353175539, 'samples': 10348416, 'steps': 53897, 'loss/train': 1.80906081199646} -11/07/2021 04:48:35 - INFO - __main__ - Step 53899: {'lr': 0.0003630340019976713, 'samples': 10348608, 'steps': 53898, 'loss/train': 1.4683196544647217} -11/07/2021 04:48:35 - INFO - __main__ - Step 53900: {'lr': 0.0003630292686268575, 'samples': 10348800, 'steps': 53899, 'loss/train': 1.5854510068893433} -11/07/2021 04:48:36 - INFO - __main__ - Step 53901: {'lr': 0.00036302453520511437, 'samples': 10348992, 'steps': 53900, 'loss/train': 1.466431736946106} -11/07/2021 04:48:37 - INFO - __main__ - Step 53902: {'lr': 0.0003630198017324441, 'samples': 10349184, 'steps': 53901, 'loss/train': 1.3616070747375488} -11/07/2021 04:48:37 - INFO - __main__ - Step 53903: {'lr': 0.0003630150682088489, 'samples': 10349376, 'steps': 53902, 'loss/train': 1.537035346031189} -11/07/2021 04:48:37 - INFO - __main__ - Step 53904: {'lr': 0.00036301033463433086, 'samples': 10349568, 'steps': 53903, 'loss/train': 1.1756144762039185} -11/07/2021 04:48:38 - INFO - __main__ - Step 53905: {'lr': 0.0003630056010088921, 'samples': 10349760, 'steps': 53904, 'loss/train': 1.52498459815979} -11/07/2021 04:48:39 - INFO - __main__ - Step 53906: {'lr': 0.00036300086733253466, 'samples': 10349952, 'steps': 53905, 'loss/train': 1.091630220413208} -11/07/2021 04:48:39 - INFO - __main__ - Step 53907: {'lr': 0.0003629961336052609, 'samples': 10350144, 'steps': 53906, 'loss/train': 1.2740652561187744} -11/07/2021 04:48:39 - INFO - __main__ - Step 53908: {'lr': 0.0003629913998270728, 'samples': 10350336, 'steps': 53907, 'loss/train': 1.3619333505630493} -11/07/2021 04:48:40 - INFO - __main__ - Step 53909: {'lr': 0.00036298666599797247, 'samples': 10350528, 'steps': 53908, 'loss/train': 1.5594091415405273} -11/07/2021 04:48:40 - INFO - __main__ - Step 53910: {'lr': 0.00036298193211796215, 'samples': 10350720, 'steps': 53909, 'loss/train': 1.852355718612671} -11/07/2021 04:48:41 - INFO - __main__ - Step 53911: {'lr': 0.0003629771981870439, 'samples': 10350912, 'steps': 53910, 'loss/train': 1.3001776933670044} -11/07/2021 04:48:42 - INFO - __main__ - Step 53912: {'lr': 0.0003629724642052198, 'samples': 10351104, 'steps': 53911, 'loss/train': 1.5244321823120117} -11/07/2021 04:48:42 - INFO - __main__ - Step 53913: {'lr': 0.00036296773017249214, 'samples': 10351296, 'steps': 53912, 'loss/train': 1.7219111919403076} -11/07/2021 04:48:42 - INFO - __main__ - Step 53914: {'lr': 0.0003629629960888629, 'samples': 10351488, 'steps': 53913, 'loss/train': 0.431939959526062} -11/07/2021 04:48:43 - INFO - __main__ - Step 53915: {'lr': 0.00036295826195433434, 'samples': 10351680, 'steps': 53914, 'loss/train': 1.7920550107955933} -11/07/2021 04:48:44 - INFO - __main__ - Step 53916: {'lr': 0.0003629535277689085, 'samples': 10351872, 'steps': 53915, 'loss/train': 1.7504496574401855} -11/07/2021 04:48:44 - INFO - __main__ - Step 53917: {'lr': 0.00036294879353258755, 'samples': 10352064, 'steps': 53916, 'loss/train': 1.102777361869812} -11/07/2021 04:48:45 - INFO - __main__ - Step 53918: {'lr': 0.0003629440592453736, 'samples': 10352256, 'steps': 53917, 'loss/train': 1.5030699968338013} -11/07/2021 04:48:45 - INFO - __main__ - Step 53919: {'lr': 0.0003629393249072688, 'samples': 10352448, 'steps': 53918, 'loss/train': 1.0274672508239746} -11/07/2021 04:48:45 - INFO - __main__ - Step 53920: {'lr': 0.00036293459051827526, 'samples': 10352640, 'steps': 53919, 'loss/train': 1.5233278274536133} -11/07/2021 04:48:46 - INFO - __main__ - Step 53921: {'lr': 0.0003629298560783952, 'samples': 10352832, 'steps': 53920, 'loss/train': 1.2541234493255615} -11/07/2021 04:48:47 - INFO - __main__ - Step 53922: {'lr': 0.0003629251215876307, 'samples': 10353024, 'steps': 53921, 'loss/train': 1.6004103422164917} -11/07/2021 04:48:47 - INFO - __main__ - Step 53923: {'lr': 0.0003629203870459838, 'samples': 10353216, 'steps': 53922, 'loss/train': 1.385047435760498} -11/07/2021 04:48:47 - INFO - __main__ - Step 53924: {'lr': 0.00036291565245345677, 'samples': 10353408, 'steps': 53923, 'loss/train': 1.3251805305480957} -11/07/2021 04:48:48 - INFO - __main__ - Step 53925: {'lr': 0.0003629109178100516, 'samples': 10353600, 'steps': 53924, 'loss/train': 1.2210359573364258} -11/07/2021 04:48:48 - INFO - __main__ - Step 53926: {'lr': 0.0003629061831157706, 'samples': 10353792, 'steps': 53925, 'loss/train': 0.8227512836456299} -11/07/2021 04:48:49 - INFO - __main__ - Step 53927: {'lr': 0.00036290144837061586, 'samples': 10353984, 'steps': 53926, 'loss/train': 1.217120885848999} -11/07/2021 04:48:50 - INFO - __main__ - Step 53928: {'lr': 0.00036289671357458937, 'samples': 10354176, 'steps': 53927, 'loss/train': 0.7737321257591248} -11/07/2021 04:48:50 - INFO - __main__ - Step 53929: {'lr': 0.00036289197872769346, 'samples': 10354368, 'steps': 53928, 'loss/train': 1.5767134428024292} -11/07/2021 04:48:50 - INFO - __main__ - Step 53930: {'lr': 0.0003628872438299301, 'samples': 10354560, 'steps': 53929, 'loss/train': 1.3147779703140259} -11/07/2021 04:48:51 - INFO - __main__ - Step 53931: {'lr': 0.0003628825088813015, 'samples': 10354752, 'steps': 53930, 'loss/train': 0.9428694248199463} -11/07/2021 04:48:52 - INFO - __main__ - Step 53932: {'lr': 0.00036287777388180977, 'samples': 10354944, 'steps': 53931, 'loss/train': 1.4914923906326294} -11/07/2021 04:48:52 - INFO - __main__ - Step 53933: {'lr': 0.00036287303883145703, 'samples': 10355136, 'steps': 53932, 'loss/train': 1.3886076211929321} -11/07/2021 04:48:52 - INFO - __main__ - Step 53934: {'lr': 0.00036286830373024546, 'samples': 10355328, 'steps': 53933, 'loss/train': 1.3711997270584106} -11/07/2021 04:48:53 - INFO - __main__ - Step 53935: {'lr': 0.00036286356857817727, 'samples': 10355520, 'steps': 53934, 'loss/train': 1.2949281930923462} -11/07/2021 04:48:53 - INFO - __main__ - Step 53936: {'lr': 0.0003628588333752544, 'samples': 10355712, 'steps': 53935, 'loss/train': 1.4670205116271973} -11/07/2021 04:48:54 - INFO - __main__ - Step 53937: {'lr': 0.0003628540981214791, 'samples': 10355904, 'steps': 53936, 'loss/train': 1.432778239250183} -11/07/2021 04:48:54 - INFO - __main__ - Step 53938: {'lr': 0.00036284936281685354, 'samples': 10356096, 'steps': 53937, 'loss/train': 1.5690598487854004} -11/07/2021 04:48:55 - INFO - __main__ - Step 53939: {'lr': 0.0003628446274613797, 'samples': 10356288, 'steps': 53938, 'loss/train': 1.3823480606079102} -11/07/2021 04:48:55 - INFO - __main__ - Step 53940: {'lr': 0.00036283989205505987, 'samples': 10356480, 'steps': 53939, 'loss/train': 1.4392648935317993} -11/07/2021 04:48:55 - INFO - __main__ - Step 53941: {'lr': 0.00036283515659789615, 'samples': 10356672, 'steps': 53940, 'loss/train': 1.712378978729248} -11/07/2021 04:48:56 - INFO - __main__ - Step 53942: {'lr': 0.0003628304210898906, 'samples': 10356864, 'steps': 53941, 'loss/train': 1.7036980390548706} -11/07/2021 04:48:57 - INFO - __main__ - Step 53943: {'lr': 0.00036282568553104545, 'samples': 10357056, 'steps': 53942, 'loss/train': 1.7509475946426392} -11/07/2021 04:48:57 - INFO - __main__ - Step 53944: {'lr': 0.00036282094992136273, 'samples': 10357248, 'steps': 53943, 'loss/train': 1.8214190006256104} -11/07/2021 04:48:57 - INFO - __main__ - Step 53945: {'lr': 0.00036281621426084465, 'samples': 10357440, 'steps': 53944, 'loss/train': 1.5594524145126343} -11/07/2021 04:48:58 - INFO - __main__ - Step 53946: {'lr': 0.0003628114785494934, 'samples': 10357632, 'steps': 53945, 'loss/train': 1.8242552280426025} -11/07/2021 04:48:59 - INFO - __main__ - Step 53947: {'lr': 0.00036280674278731096, 'samples': 10357824, 'steps': 53946, 'loss/train': 1.0017260313034058} -11/07/2021 04:48:59 - INFO - __main__ - Step 53948: {'lr': 0.00036280200697429957, 'samples': 10358016, 'steps': 53947, 'loss/train': 1.238772988319397} -11/07/2021 04:48:59 - INFO - __main__ - Step 53949: {'lr': 0.00036279727111046127, 'samples': 10358208, 'steps': 53948, 'loss/train': 0.9045762419700623} -11/07/2021 04:49:00 - INFO - __main__ - Step 53950: {'lr': 0.0003627925351957983, 'samples': 10358400, 'steps': 53949, 'loss/train': 1.3031666278839111} -11/07/2021 04:49:00 - INFO - __main__ - Step 53951: {'lr': 0.0003627877992303128, 'samples': 10358592, 'steps': 53950, 'loss/train': 1.427990198135376} -11/07/2021 04:49:01 - INFO - __main__ - Step 53952: {'lr': 0.0003627830632140068, 'samples': 10358784, 'steps': 53951, 'loss/train': 1.4603978395462036} -11/07/2021 04:49:01 - INFO - __main__ - Step 53953: {'lr': 0.0003627783271468825, 'samples': 10358976, 'steps': 53952, 'loss/train': 1.7184420824050903} -11/07/2021 04:49:02 - INFO - __main__ - Step 53954: {'lr': 0.0003627735910289421, 'samples': 10359168, 'steps': 53953, 'loss/train': 1.546921730041504} -11/07/2021 04:49:02 - INFO - __main__ - Step 53955: {'lr': 0.0003627688548601876, 'samples': 10359360, 'steps': 53954, 'loss/train': 1.5725740194320679} -11/07/2021 04:49:03 - INFO - __main__ - Step 53956: {'lr': 0.00036276411864062116, 'samples': 10359552, 'steps': 53955, 'loss/train': 1.5984454154968262} -11/07/2021 04:49:03 - INFO - __main__ - Step 53957: {'lr': 0.00036275938237024505, 'samples': 10359744, 'steps': 53956, 'loss/train': 1.3893181085586548} -11/07/2021 04:49:04 - INFO - __main__ - Step 53958: {'lr': 0.00036275464604906116, 'samples': 10359936, 'steps': 53957, 'loss/train': 1.3340251445770264} -11/07/2021 04:49:04 - INFO - __main__ - Step 53959: {'lr': 0.0003627499096770719, 'samples': 10360128, 'steps': 53958, 'loss/train': 0.9483999609947205} -11/07/2021 04:49:05 - INFO - __main__ - Step 53960: {'lr': 0.0003627451732542791, 'samples': 10360320, 'steps': 53959, 'loss/train': 1.4981751441955566} -11/07/2021 04:49:05 - INFO - __main__ - Step 53961: {'lr': 0.00036274043678068526, 'samples': 10360512, 'steps': 53960, 'loss/train': 1.141883373260498} -11/07/2021 04:49:05 - INFO - __main__ - Step 53962: {'lr': 0.0003627357002562923, 'samples': 10360704, 'steps': 53961, 'loss/train': 1.1795448064804077} -11/07/2021 04:49:06 - INFO - __main__ - Step 53963: {'lr': 0.0003627309636811023, 'samples': 10360896, 'steps': 53962, 'loss/train': 1.356592059135437} -11/07/2021 04:49:07 - INFO - __main__ - Step 53964: {'lr': 0.00036272622705511745, 'samples': 10361088, 'steps': 53963, 'loss/train': 0.8316559195518494} -11/07/2021 04:49:07 - INFO - __main__ - Step 53965: {'lr': 0.0003627214903783399, 'samples': 10361280, 'steps': 53964, 'loss/train': 1.6369526386260986} -11/07/2021 04:49:07 - INFO - __main__ - Step 53966: {'lr': 0.00036271675365077185, 'samples': 10361472, 'steps': 53965, 'loss/train': 1.0900590419769287} -11/07/2021 04:49:08 - INFO - __main__ - Step 53967: {'lr': 0.0003627120168724153, 'samples': 10361664, 'steps': 53966, 'loss/train': 1.1406044960021973} -11/07/2021 04:49:09 - INFO - __main__ - Step 53968: {'lr': 0.00036270728004327246, 'samples': 10361856, 'steps': 53967, 'loss/train': 1.480116367340088} -11/07/2021 04:49:09 - INFO - __main__ - Step 53969: {'lr': 0.0003627025431633455, 'samples': 10362048, 'steps': 53968, 'loss/train': 1.4173986911773682} -11/07/2021 04:49:10 - INFO - __main__ - Step 53970: {'lr': 0.00036269780623263647, 'samples': 10362240, 'steps': 53969, 'loss/train': 1.6775959730148315} -11/07/2021 04:49:10 - INFO - __main__ - Step 53971: {'lr': 0.00036269306925114765, 'samples': 10362432, 'steps': 53970, 'loss/train': 0.3500784933567047} -11/07/2021 04:49:10 - INFO - __main__ - Step 53972: {'lr': 0.000362688332218881, 'samples': 10362624, 'steps': 53971, 'loss/train': 1.574920654296875} -11/07/2021 04:49:11 - INFO - __main__ - Step 53973: {'lr': 0.0003626835951358387, 'samples': 10362816, 'steps': 53972, 'loss/train': 1.0546258687973022} -11/07/2021 04:49:12 - INFO - __main__ - Step 53974: {'lr': 0.00036267885800202296, 'samples': 10363008, 'steps': 53973, 'loss/train': 1.5321637392044067} -11/07/2021 04:49:12 - INFO - __main__ - Step 53975: {'lr': 0.00036267412081743576, 'samples': 10363200, 'steps': 53974, 'loss/train': 1.3582209348678589} -11/07/2021 04:49:12 - INFO - __main__ - Step 53976: {'lr': 0.00036266938358207944, 'samples': 10363392, 'steps': 53975, 'loss/train': 1.6329455375671387} -11/07/2021 04:49:13 - INFO - __main__ - Step 53977: {'lr': 0.0003626646462959561, 'samples': 10363584, 'steps': 53976, 'loss/train': 1.1768256425857544} -11/07/2021 04:49:14 - INFO - __main__ - Step 53978: {'lr': 0.00036265990895906767, 'samples': 10363776, 'steps': 53977, 'loss/train': 1.0313069820404053} -11/07/2021 04:49:14 - INFO - __main__ - Step 53979: {'lr': 0.0003626551715714165, 'samples': 10363968, 'steps': 53978, 'loss/train': 1.4519003629684448} -11/07/2021 04:49:14 - INFO - __main__ - Step 53980: {'lr': 0.00036265043413300456, 'samples': 10364160, 'steps': 53979, 'loss/train': 1.3776179552078247} -11/07/2021 04:49:15 - INFO - __main__ - Step 53981: {'lr': 0.0003626456966438342, 'samples': 10364352, 'steps': 53980, 'loss/train': 0.06659340113401413} -11/07/2021 04:49:15 - INFO - __main__ - Step 53982: {'lr': 0.00036264095910390736, 'samples': 10364544, 'steps': 53981, 'loss/train': 1.3852801322937012} -11/07/2021 04:49:16 - INFO - __main__ - Step 53983: {'lr': 0.0003626362215132263, 'samples': 10364736, 'steps': 53982, 'loss/train': 1.8173325061798096} -11/07/2021 04:49:16 - INFO - __main__ - Step 53984: {'lr': 0.00036263148387179303, 'samples': 10364928, 'steps': 53983, 'loss/train': 1.6196330785751343} -11/07/2021 04:49:17 - INFO - __main__ - Step 53985: {'lr': 0.0003626267461796097, 'samples': 10365120, 'steps': 53984, 'loss/train': 1.427735447883606} -11/07/2021 04:49:17 - INFO - __main__ - Step 53986: {'lr': 0.0003626220084366786, 'samples': 10365312, 'steps': 53985, 'loss/train': 0.9255143404006958} -11/07/2021 04:49:18 - INFO - __main__ - Step 53987: {'lr': 0.0003626172706430017, 'samples': 10365504, 'steps': 53986, 'loss/train': 1.3839311599731445} -11/07/2021 04:49:18 - INFO - __main__ - Step 53988: {'lr': 0.0003626125327985812, 'samples': 10365696, 'steps': 53987, 'loss/train': 1.7437059879302979} -11/07/2021 04:49:19 - INFO - __main__ - Step 53989: {'lr': 0.0003626077949034193, 'samples': 10365888, 'steps': 53988, 'loss/train': 1.4239369630813599} -11/07/2021 04:49:19 - INFO - __main__ - Step 53990: {'lr': 0.000362603056957518, 'samples': 10366080, 'steps': 53989, 'loss/train': 1.8578649759292603} -11/07/2021 04:49:20 - INFO - __main__ - Step 53991: {'lr': 0.0003625983189608795, 'samples': 10366272, 'steps': 53990, 'loss/train': 1.660885214805603} -11/07/2021 04:49:20 - INFO - __main__ - Step 53992: {'lr': 0.00036259358091350597, 'samples': 10366464, 'steps': 53991, 'loss/train': 1.3914047479629517} -11/07/2021 04:49:20 - INFO - __main__ - Step 53993: {'lr': 0.0003625888428153995, 'samples': 10366656, 'steps': 53992, 'loss/train': 1.2779313325881958} -11/07/2021 04:49:21 - INFO - __main__ - Step 53994: {'lr': 0.0003625841046665622, 'samples': 10366848, 'steps': 53993, 'loss/train': 1.4684120416641235} -11/07/2021 04:49:22 - INFO - __main__ - Step 53995: {'lr': 0.00036257936646699626, 'samples': 10367040, 'steps': 53994, 'loss/train': 1.657848834991455} -11/07/2021 04:49:22 - INFO - __main__ - Step 53996: {'lr': 0.00036257462821670387, 'samples': 10367232, 'steps': 53995, 'loss/train': 0.1811019480228424} -11/07/2021 04:49:22 - INFO - __main__ - Step 53997: {'lr': 0.00036256988991568696, 'samples': 10367424, 'steps': 53996, 'loss/train': 0.8272801637649536} -11/07/2021 04:49:23 - INFO - __main__ - Step 53998: {'lr': 0.0003625651515639479, 'samples': 10367616, 'steps': 53997, 'loss/train': 1.1919171810150146} -11/07/2021 04:49:24 - INFO - __main__ - Step 53999: {'lr': 0.00036256041316148864, 'samples': 10367808, 'steps': 53998, 'loss/train': 1.85353684425354} -11/07/2021 04:49:24 - INFO - __main__ - Step 54000: {'lr': 0.0003625556747083114, 'samples': 10368000, 'steps': 53999, 'loss/train': 1.776261568069458} -11/07/2021 04:49:25 - INFO - __main__ - Step 54001: {'lr': 0.0003625509362044183, 'samples': 10368192, 'steps': 54000, 'loss/train': 0.9551630616188049} -11/07/2021 04:49:25 - INFO - __main__ - Step 54002: {'lr': 0.00036254619764981155, 'samples': 10368384, 'steps': 54001, 'loss/train': 2.972165584564209} -11/07/2021 04:49:25 - INFO - __main__ - Step 54003: {'lr': 0.0003625414590444932, 'samples': 10368576, 'steps': 54002, 'loss/train': 1.1933668851852417} -11/07/2021 04:49:26 - INFO - __main__ - Step 54004: {'lr': 0.0003625367203884654, 'samples': 10368768, 'steps': 54003, 'loss/train': 1.2040570974349976} -11/07/2021 04:49:27 - INFO - __main__ - Step 54005: {'lr': 0.0003625319816817303, 'samples': 10368960, 'steps': 54004, 'loss/train': 1.7131401300430298} -11/07/2021 04:49:27 - INFO - __main__ - Step 54006: {'lr': 0.00036252724292429, 'samples': 10369152, 'steps': 54005, 'loss/train': 1.2289642095565796} -11/07/2021 04:49:27 - INFO - __main__ - Step 54007: {'lr': 0.00036252250411614666, 'samples': 10369344, 'steps': 54006, 'loss/train': 2.046152353286743} -11/07/2021 04:49:28 - INFO - __main__ - Step 54008: {'lr': 0.0003625177652573024, 'samples': 10369536, 'steps': 54007, 'loss/train': 1.5472607612609863} -11/07/2021 04:49:28 - INFO - __main__ - Step 54009: {'lr': 0.0003625130263477595, 'samples': 10369728, 'steps': 54008, 'loss/train': 1.8445370197296143} -11/07/2021 04:49:29 - INFO - __main__ - Step 54010: {'lr': 0.00036250828738751986, 'samples': 10369920, 'steps': 54009, 'loss/train': 1.957759976387024} -11/07/2021 04:49:29 - INFO - __main__ - Step 54011: {'lr': 0.0003625035483765857, 'samples': 10370112, 'steps': 54010, 'loss/train': 1.6986782550811768} -11/07/2021 04:49:30 - INFO - __main__ - Step 54012: {'lr': 0.00036249880931495923, 'samples': 10370304, 'steps': 54011, 'loss/train': 1.4239552021026611} -11/07/2021 04:49:30 - INFO - __main__ - Step 54013: {'lr': 0.00036249407020264246, 'samples': 10370496, 'steps': 54012, 'loss/train': 1.3341420888900757} -11/07/2021 04:49:30 - INFO - __main__ - Step 54014: {'lr': 0.00036248933103963767, 'samples': 10370688, 'steps': 54013, 'loss/train': 1.6599293947219849} -11/07/2021 04:49:31 - INFO - __main__ - Step 54015: {'lr': 0.0003624845918259469, 'samples': 10370880, 'steps': 54014, 'loss/train': 1.383053183555603} -11/07/2021 04:49:32 - INFO - __main__ - Step 54016: {'lr': 0.00036247985256157236, 'samples': 10371072, 'steps': 54015, 'loss/train': 1.2755595445632935} -11/07/2021 04:49:32 - INFO - __main__ - Step 54017: {'lr': 0.0003624751132465161, 'samples': 10371264, 'steps': 54016, 'loss/train': 1.4104011058807373} -11/07/2021 04:49:32 - INFO - __main__ - Step 54018: {'lr': 0.00036247037388078017, 'samples': 10371456, 'steps': 54017, 'loss/train': 1.340372085571289} -11/07/2021 04:49:33 - INFO - __main__ - Step 54019: {'lr': 0.00036246563446436697, 'samples': 10371648, 'steps': 54018, 'loss/train': 1.0824288129806519} -11/07/2021 04:49:34 - INFO - __main__ - Step 54020: {'lr': 0.00036246089499727843, 'samples': 10371840, 'steps': 54019, 'loss/train': 1.7775789499282837} -11/07/2021 04:49:34 - INFO - __main__ - Step 54021: {'lr': 0.0003624561554795168, 'samples': 10372032, 'steps': 54020, 'loss/train': 1.7932307720184326} -11/07/2021 04:49:35 - INFO - __main__ - Step 54022: {'lr': 0.0003624514159110841, 'samples': 10372224, 'steps': 54021, 'loss/train': 1.6062067747116089} -11/07/2021 04:49:35 - INFO - __main__ - Step 54023: {'lr': 0.0003624466762919826, 'samples': 10372416, 'steps': 54022, 'loss/train': 1.559800386428833} -11/07/2021 04:49:35 - INFO - __main__ - Step 54024: {'lr': 0.00036244193662221427, 'samples': 10372608, 'steps': 54023, 'loss/train': 1.265794038772583} -11/07/2021 04:49:36 - INFO - __main__ - Step 54025: {'lr': 0.0003624371969017814, 'samples': 10372800, 'steps': 54024, 'loss/train': 1.1560970544815063} -11/07/2021 04:49:37 - INFO - __main__ - Step 54026: {'lr': 0.000362432457130686, 'samples': 10372992, 'steps': 54025, 'loss/train': 1.1742134094238281} -11/07/2021 04:49:37 - INFO - __main__ - Step 54027: {'lr': 0.0003624277173089303, 'samples': 10373184, 'steps': 54026, 'loss/train': 1.1121913194656372} -11/07/2021 04:49:37 - INFO - __main__ - Step 54028: {'lr': 0.0003624229774365165, 'samples': 10373376, 'steps': 54027, 'loss/train': 1.2578948736190796} -11/07/2021 04:49:38 - INFO - __main__ - Step 54029: {'lr': 0.00036241823751344656, 'samples': 10373568, 'steps': 54028, 'loss/train': 1.18523371219635} -11/07/2021 04:49:38 - INFO - __main__ - Step 54030: {'lr': 0.0003624134975397227, 'samples': 10373760, 'steps': 54029, 'loss/train': 0.6954852938652039} -11/07/2021 04:49:39 - INFO - __main__ - Step 54031: {'lr': 0.0003624087575153471, 'samples': 10373952, 'steps': 54030, 'loss/train': 1.4838982820510864} -11/07/2021 04:49:39 - INFO - __main__ - Step 54032: {'lr': 0.00036240401744032174, 'samples': 10374144, 'steps': 54031, 'loss/train': 1.252082109451294} -11/07/2021 04:49:40 - INFO - __main__ - Step 54033: {'lr': 0.00036239927731464896, 'samples': 10374336, 'steps': 54032, 'loss/train': 1.4678068161010742} -11/07/2021 04:49:40 - INFO - __main__ - Step 54034: {'lr': 0.0003623945371383307, 'samples': 10374528, 'steps': 54033, 'loss/train': 1.1606920957565308} -11/07/2021 04:49:40 - INFO - __main__ - Step 54035: {'lr': 0.0003623897969113693, 'samples': 10374720, 'steps': 54034, 'loss/train': 1.449933409690857} -11/07/2021 04:49:42 - INFO - __main__ - Step 54036: {'lr': 0.00036238505663376675, 'samples': 10374912, 'steps': 54035, 'loss/train': 1.7730284929275513} -11/07/2021 04:49:42 - INFO - __main__ - Step 54037: {'lr': 0.00036238031630552527, 'samples': 10375104, 'steps': 54036, 'loss/train': 1.622470736503601} -11/07/2021 04:49:42 - INFO - __main__ - Step 54038: {'lr': 0.0003623755759266469, 'samples': 10375296, 'steps': 54037, 'loss/train': 0.9323673248291016} -11/07/2021 04:49:43 - INFO - __main__ - Step 54039: {'lr': 0.00036237083549713387, 'samples': 10375488, 'steps': 54038, 'loss/train': 1.631394386291504} -11/07/2021 04:49:43 - INFO - __main__ - Step 54040: {'lr': 0.0003623660950169882, 'samples': 10375680, 'steps': 54039, 'loss/train': 1.4027773141860962} -11/07/2021 04:49:44 - INFO - __main__ - Step 54041: {'lr': 0.00036236135448621215, 'samples': 10375872, 'steps': 54040, 'loss/train': 1.392757773399353} -11/07/2021 04:49:44 - INFO - __main__ - Step 54042: {'lr': 0.0003623566139048078, 'samples': 10376064, 'steps': 54041, 'loss/train': 0.9803919196128845} -11/07/2021 04:49:45 - INFO - __main__ - Step 54043: {'lr': 0.00036235187327277735, 'samples': 10376256, 'steps': 54042, 'loss/train': 1.434658169746399} -11/07/2021 04:49:45 - INFO - __main__ - Step 54044: {'lr': 0.0003623471325901228, 'samples': 10376448, 'steps': 54043, 'loss/train': 1.3706212043762207} -11/07/2021 04:49:45 - INFO - __main__ - Step 54045: {'lr': 0.00036234239185684643, 'samples': 10376640, 'steps': 54044, 'loss/train': 1.1884236335754395} -11/07/2021 04:49:46 - INFO - __main__ - Step 54046: {'lr': 0.00036233765107295023, 'samples': 10376832, 'steps': 54045, 'loss/train': 2.0011510848999023} -11/07/2021 04:49:47 - INFO - __main__ - Step 54047: {'lr': 0.00036233291023843653, 'samples': 10377024, 'steps': 54046, 'loss/train': 1.5218291282653809} -11/07/2021 04:49:47 - INFO - __main__ - Step 54048: {'lr': 0.00036232816935330723, 'samples': 10377216, 'steps': 54047, 'loss/train': 1.739459753036499} -11/07/2021 04:49:47 - INFO - __main__ - Step 54049: {'lr': 0.00036232342841756467, 'samples': 10377408, 'steps': 54048, 'loss/train': 1.8697669506072998} -11/07/2021 04:49:48 - INFO - __main__ - Step 54050: {'lr': 0.00036231868743121095, 'samples': 10377600, 'steps': 54049, 'loss/train': 1.3852152824401855} -11/07/2021 04:49:48 - INFO - __main__ - Step 54051: {'lr': 0.0003623139463942481, 'samples': 10377792, 'steps': 54050, 'loss/train': 4.39796257019043} -11/07/2021 04:49:49 - INFO - __main__ - Step 54052: {'lr': 0.0003623092053066783, 'samples': 10377984, 'steps': 54051, 'loss/train': 1.9474323987960815} -11/07/2021 04:49:50 - INFO - __main__ - Step 54053: {'lr': 0.0003623044641685037, 'samples': 10378176, 'steps': 54052, 'loss/train': 1.0721606016159058} -11/07/2021 04:49:50 - INFO - __main__ - Step 54054: {'lr': 0.00036229972297972644, 'samples': 10378368, 'steps': 54053, 'loss/train': 1.2265321016311646} -11/07/2021 04:49:50 - INFO - __main__ - Step 54055: {'lr': 0.00036229498174034867, 'samples': 10378560, 'steps': 54054, 'loss/train': 1.8366349935531616} -11/07/2021 04:49:51 - INFO - __main__ - Step 54056: {'lr': 0.00036229024045037264, 'samples': 10378752, 'steps': 54055, 'loss/train': 1.0183594226837158} -11/07/2021 04:49:52 - INFO - __main__ - Step 54057: {'lr': 0.00036228549910980026, 'samples': 10378944, 'steps': 54056, 'loss/train': 1.1268253326416016} -11/07/2021 04:49:52 - INFO - __main__ - Step 54058: {'lr': 0.0003622807577186337, 'samples': 10379136, 'steps': 54057, 'loss/train': 1.5386079549789429} -11/07/2021 04:49:52 - INFO - __main__ - Step 54059: {'lr': 0.0003622760162768752, 'samples': 10379328, 'steps': 54058, 'loss/train': 1.5613408088684082} -11/07/2021 04:49:53 - INFO - __main__ - Step 54060: {'lr': 0.0003622712747845269, 'samples': 10379520, 'steps': 54059, 'loss/train': 1.7073429822921753} -11/07/2021 04:49:53 - INFO - __main__ - Step 54061: {'lr': 0.0003622665332415909, 'samples': 10379712, 'steps': 54060, 'loss/train': 1.2677898406982422} -11/07/2021 04:49:54 - INFO - __main__ - Step 54062: {'lr': 0.00036226179164806926, 'samples': 10379904, 'steps': 54061, 'loss/train': 0.06435222923755646} -11/07/2021 04:49:55 - INFO - __main__ - Step 54063: {'lr': 0.00036225705000396424, 'samples': 10380096, 'steps': 54062, 'loss/train': 1.371171236038208} -11/07/2021 04:49:55 - INFO - __main__ - Step 54064: {'lr': 0.000362252308309278, 'samples': 10380288, 'steps': 54063, 'loss/train': 1.5303770303726196} -11/07/2021 04:49:55 - INFO - __main__ - Step 54065: {'lr': 0.00036224756656401245, 'samples': 10380480, 'steps': 54064, 'loss/train': 1.3622829914093018} -11/07/2021 04:49:56 - INFO - __main__ - Step 54066: {'lr': 0.0003622428247681699, 'samples': 10380672, 'steps': 54065, 'loss/train': 1.0054705142974854} -11/07/2021 04:49:56 - INFO - __main__ - Step 54067: {'lr': 0.0003622380829217526, 'samples': 10380864, 'steps': 54066, 'loss/train': 1.0937042236328125} -11/07/2021 04:49:57 - INFO - __main__ - Step 54068: {'lr': 0.00036223334102476247, 'samples': 10381056, 'steps': 54067, 'loss/train': 1.4480668306350708} -11/07/2021 04:49:57 - INFO - __main__ - Step 54069: {'lr': 0.00036222859907720167, 'samples': 10381248, 'steps': 54068, 'loss/train': 1.1883262395858765} -11/07/2021 04:49:58 - INFO - __main__ - Step 54070: {'lr': 0.00036222385707907254, 'samples': 10381440, 'steps': 54069, 'loss/train': 1.5054994821548462} -11/07/2021 04:49:58 - INFO - __main__ - Step 54071: {'lr': 0.000362219115030377, 'samples': 10381632, 'steps': 54070, 'loss/train': 1.5895830392837524} -11/07/2021 04:49:58 - INFO - __main__ - Step 54072: {'lr': 0.0003622143729311172, 'samples': 10381824, 'steps': 54071, 'loss/train': 1.5016613006591797} -11/07/2021 04:49:59 - INFO - __main__ - Step 54073: {'lr': 0.00036220963078129536, 'samples': 10382016, 'steps': 54072, 'loss/train': 1.3931150436401367} -11/07/2021 04:50:00 - INFO - __main__ - Step 54074: {'lr': 0.0003622048885809136, 'samples': 10382208, 'steps': 54073, 'loss/train': 1.243634819984436} -11/07/2021 04:50:00 - INFO - __main__ - Step 54075: {'lr': 0.0003622001463299741, 'samples': 10382400, 'steps': 54074, 'loss/train': 1.7613712549209595} -11/07/2021 04:50:00 - INFO - __main__ - Step 54076: {'lr': 0.0003621954040284789, 'samples': 10382592, 'steps': 54075, 'loss/train': 0.41087788343429565} -11/07/2021 04:50:01 - INFO - __main__ - Step 54077: {'lr': 0.00036219066167643015, 'samples': 10382784, 'steps': 54076, 'loss/train': 1.0473359823226929} -11/07/2021 04:50:02 - INFO - __main__ - Step 54078: {'lr': 0.00036218591927383, 'samples': 10382976, 'steps': 54077, 'loss/train': 1.528517723083496} -11/07/2021 04:50:02 - INFO - __main__ - Step 54079: {'lr': 0.00036218117682068076, 'samples': 10383168, 'steps': 54078, 'loss/train': 1.5811829566955566} -11/07/2021 04:50:03 - INFO - __main__ - Step 54080: {'lr': 0.0003621764343169843, 'samples': 10383360, 'steps': 54079, 'loss/train': 1.828255295753479} -11/07/2021 04:50:03 - INFO - __main__ - Step 54081: {'lr': 0.0003621716917627429, 'samples': 10383552, 'steps': 54080, 'loss/train': 1.3414658308029175} -11/07/2021 04:50:03 - INFO - __main__ - Step 54082: {'lr': 0.0003621669491579587, 'samples': 10383744, 'steps': 54081, 'loss/train': 1.5407863855361938} -11/07/2021 04:50:04 - INFO - __main__ - Step 54083: {'lr': 0.0003621622065026337, 'samples': 10383936, 'steps': 54082, 'loss/train': 1.6347789764404297} -11/07/2021 04:50:05 - INFO - __main__ - Step 54084: {'lr': 0.0003621574637967702, 'samples': 10384128, 'steps': 54083, 'loss/train': 4.492691993713379} -11/07/2021 04:50:05 - INFO - __main__ - Step 54085: {'lr': 0.00036215272104037023, 'samples': 10384320, 'steps': 54084, 'loss/train': 1.2677205801010132} -11/07/2021 04:50:05 - INFO - __main__ - Step 54086: {'lr': 0.0003621479782334361, 'samples': 10384512, 'steps': 54085, 'loss/train': 1.4585630893707275} -11/07/2021 04:50:06 - INFO - __main__ - Step 54087: {'lr': 0.00036214323537596974, 'samples': 10384704, 'steps': 54086, 'loss/train': 0.7516101598739624} -11/07/2021 04:50:06 - INFO - __main__ - Step 54088: {'lr': 0.0003621384924679733, 'samples': 10384896, 'steps': 54087, 'loss/train': 2.0621416568756104} -11/07/2021 04:50:07 - INFO - __main__ - Step 54089: {'lr': 0.00036213374950944913, 'samples': 10385088, 'steps': 54088, 'loss/train': 1.4169466495513916} -11/07/2021 04:50:08 - INFO - __main__ - Step 54090: {'lr': 0.0003621290065003991, 'samples': 10385280, 'steps': 54089, 'loss/train': 1.8630374670028687} -11/07/2021 04:50:08 - INFO - __main__ - Step 54091: {'lr': 0.00036212426344082554, 'samples': 10385472, 'steps': 54090, 'loss/train': 0.8615546822547913} -11/07/2021 04:50:08 - INFO - __main__ - Step 54092: {'lr': 0.0003621195203307305, 'samples': 10385664, 'steps': 54091, 'loss/train': 1.5436806678771973} -11/07/2021 04:50:09 - INFO - __main__ - Step 54093: {'lr': 0.0003621147771701161, 'samples': 10385856, 'steps': 54092, 'loss/train': 2.168379306793213} -11/07/2021 04:50:10 - INFO - __main__ - Step 54094: {'lr': 0.00036211003395898456, 'samples': 10386048, 'steps': 54093, 'loss/train': 0.6066447496414185} -11/07/2021 04:50:10 - INFO - __main__ - Step 54095: {'lr': 0.0003621052906973379, 'samples': 10386240, 'steps': 54094, 'loss/train': 1.5131169557571411} -11/07/2021 04:50:10 - INFO - __main__ - Step 54096: {'lr': 0.0003621005473851784, 'samples': 10386432, 'steps': 54095, 'loss/train': 1.8245435953140259} -11/07/2021 04:50:11 - INFO - __main__ - Step 54097: {'lr': 0.0003620958040225081, 'samples': 10386624, 'steps': 54096, 'loss/train': 1.176207184791565} -11/07/2021 04:50:11 - INFO - __main__ - Step 54098: {'lr': 0.0003620910606093292, 'samples': 10386816, 'steps': 54097, 'loss/train': 1.4618706703186035} -11/07/2021 04:50:12 - INFO - __main__ - Step 54099: {'lr': 0.0003620863171456437, 'samples': 10387008, 'steps': 54098, 'loss/train': 1.1126728057861328} -11/07/2021 04:50:12 - INFO - __main__ - Step 54100: {'lr': 0.0003620815736314539, 'samples': 10387200, 'steps': 54099, 'loss/train': 1.6649500131607056} -11/07/2021 04:50:13 - INFO - __main__ - Step 54101: {'lr': 0.0003620768300667618, 'samples': 10387392, 'steps': 54100, 'loss/train': 1.5151457786560059} -11/07/2021 04:50:13 - INFO - __main__ - Step 54102: {'lr': 0.00036207208645156977, 'samples': 10387584, 'steps': 54101, 'loss/train': 1.6389533281326294} -11/07/2021 04:50:13 - INFO - __main__ - Step 54103: {'lr': 0.00036206734278587964, 'samples': 10387776, 'steps': 54102, 'loss/train': 1.6350964307785034} -11/07/2021 04:50:15 - INFO - __main__ - Step 54104: {'lr': 0.0003620625990696937, 'samples': 10387968, 'steps': 54103, 'loss/train': 1.5984524488449097} -11/07/2021 04:50:15 - INFO - __main__ - Step 54105: {'lr': 0.00036205785530301417, 'samples': 10388160, 'steps': 54104, 'loss/train': 1.4757647514343262} -11/07/2021 04:50:15 - INFO - __main__ - Step 54106: {'lr': 0.00036205311148584306, 'samples': 10388352, 'steps': 54105, 'loss/train': 1.5447732210159302} -11/07/2021 04:50:16 - INFO - __main__ - Step 54107: {'lr': 0.00036204836761818255, 'samples': 10388544, 'steps': 54106, 'loss/train': 1.7922970056533813} -11/07/2021 04:50:16 - INFO - __main__ - Step 54108: {'lr': 0.00036204362370003475, 'samples': 10388736, 'steps': 54107, 'loss/train': 1.2513302564620972} -11/07/2021 04:50:17 - INFO - __main__ - Step 54109: {'lr': 0.00036203887973140184, 'samples': 10388928, 'steps': 54108, 'loss/train': 2.252163887023926} -11/07/2021 04:50:17 - INFO - __main__ - Step 54110: {'lr': 0.000362034135712286, 'samples': 10389120, 'steps': 54109, 'loss/train': 1.445444107055664} -11/07/2021 04:50:18 - INFO - __main__ - Step 54111: {'lr': 0.00036202939164268924, 'samples': 10389312, 'steps': 54110, 'loss/train': 1.8695931434631348} -11/07/2021 04:50:18 - INFO - __main__ - Step 54112: {'lr': 0.0003620246475226138, 'samples': 10389504, 'steps': 54111, 'loss/train': 1.2193603515625} -11/07/2021 04:50:18 - INFO - __main__ - Step 54113: {'lr': 0.0003620199033520617, 'samples': 10389696, 'steps': 54112, 'loss/train': 0.8813428282737732} -11/07/2021 04:50:19 - INFO - __main__ - Step 54114: {'lr': 0.0003620151591310352, 'samples': 10389888, 'steps': 54113, 'loss/train': 1.7636504173278809} -11/07/2021 04:50:20 - INFO - __main__ - Step 54115: {'lr': 0.0003620104148595364, 'samples': 10390080, 'steps': 54114, 'loss/train': 1.3986188173294067} -11/07/2021 04:50:20 - INFO - __main__ - Step 54116: {'lr': 0.00036200567053756746, 'samples': 10390272, 'steps': 54115, 'loss/train': 1.3709259033203125} -11/07/2021 04:50:20 - INFO - __main__ - Step 54117: {'lr': 0.0003620009261651305, 'samples': 10390464, 'steps': 54116, 'loss/train': 1.6733927726745605} -11/07/2021 04:50:21 - INFO - __main__ - Step 54118: {'lr': 0.0003619961817422276, 'samples': 10390656, 'steps': 54117, 'loss/train': 1.5279405117034912} -11/07/2021 04:50:21 - INFO - __main__ - Step 54119: {'lr': 0.00036199143726886097, 'samples': 10390848, 'steps': 54118, 'loss/train': 1.7747327089309692} -11/07/2021 04:50:22 - INFO - __main__ - Step 54120: {'lr': 0.00036198669274503274, 'samples': 10391040, 'steps': 54119, 'loss/train': 1.4915437698364258} -11/07/2021 04:50:22 - INFO - __main__ - Step 54121: {'lr': 0.00036198194817074503, 'samples': 10391232, 'steps': 54120, 'loss/train': 1.5646147727966309} -11/07/2021 04:50:23 - INFO - __main__ - Step 54122: {'lr': 0.00036197720354599997, 'samples': 10391424, 'steps': 54121, 'loss/train': 1.1594526767730713} -11/07/2021 04:50:23 - INFO - __main__ - Step 54123: {'lr': 0.0003619724588707997, 'samples': 10391616, 'steps': 54122, 'loss/train': 1.6819772720336914} -11/07/2021 04:50:23 - INFO - __main__ - Step 54124: {'lr': 0.00036196771414514643, 'samples': 10391808, 'steps': 54123, 'loss/train': 1.259159803390503} -11/07/2021 04:50:25 - INFO - __main__ - Step 54125: {'lr': 0.0003619629693690422, 'samples': 10392000, 'steps': 54124, 'loss/train': 1.4479601383209229} -11/07/2021 04:50:25 - INFO - __main__ - Step 54126: {'lr': 0.00036195822454248916, 'samples': 10392192, 'steps': 54125, 'loss/train': 1.284369945526123} -11/07/2021 04:50:25 - INFO - __main__ - Step 54127: {'lr': 0.00036195347966548955, 'samples': 10392384, 'steps': 54126, 'loss/train': 5.417552471160889} -11/07/2021 04:50:26 - INFO - __main__ - Step 54128: {'lr': 0.0003619487347380454, 'samples': 10392576, 'steps': 54127, 'loss/train': 1.50994873046875} -11/07/2021 04:50:26 - INFO - __main__ - Step 54129: {'lr': 0.00036194398976015875, 'samples': 10392768, 'steps': 54128, 'loss/train': 2.001593589782715} -11/07/2021 04:50:27 - INFO - __main__ - Step 54130: {'lr': 0.00036193924473183205, 'samples': 10392960, 'steps': 54129, 'loss/train': 1.5888789892196655} -11/07/2021 04:50:28 - INFO - __main__ - Step 54131: {'lr': 0.00036193449965306714, 'samples': 10393152, 'steps': 54130, 'loss/train': 1.8174561262130737} -11/07/2021 04:50:28 - INFO - __main__ - Step 54132: {'lr': 0.0003619297545238663, 'samples': 10393344, 'steps': 54131, 'loss/train': 1.3752504587173462} -11/07/2021 04:50:28 - INFO - __main__ - Step 54133: {'lr': 0.00036192500934423163, 'samples': 10393536, 'steps': 54132, 'loss/train': 1.7326428890228271} -11/07/2021 04:50:29 - INFO - __main__ - Step 54134: {'lr': 0.0003619202641141652, 'samples': 10393728, 'steps': 54133, 'loss/train': 1.702778935432434} -11/07/2021 04:50:29 - INFO - __main__ - Step 54135: {'lr': 0.00036191551883366937, 'samples': 10393920, 'steps': 54134, 'loss/train': 1.3861414194107056} -11/07/2021 04:50:30 - INFO - __main__ - Step 54136: {'lr': 0.000361910773502746, 'samples': 10394112, 'steps': 54135, 'loss/train': 1.3360629081726074} -11/07/2021 04:50:31 - INFO - __main__ - Step 54137: {'lr': 0.00036190602812139757, 'samples': 10394304, 'steps': 54136, 'loss/train': 1.3992722034454346} -11/07/2021 04:50:31 - INFO - __main__ - Step 54138: {'lr': 0.00036190128268962586, 'samples': 10394496, 'steps': 54137, 'loss/train': 1.0293000936508179} -11/07/2021 04:50:31 - INFO - __main__ - Step 54139: {'lr': 0.00036189653720743317, 'samples': 10394688, 'steps': 54138, 'loss/train': 0.8107431530952454} -11/07/2021 04:50:32 - INFO - __main__ - Step 54140: {'lr': 0.0003618917916748216, 'samples': 10394880, 'steps': 54139, 'loss/train': 1.5401232242584229} -11/07/2021 04:50:33 - INFO - __main__ - Step 54141: {'lr': 0.00036188704609179333, 'samples': 10395072, 'steps': 54140, 'loss/train': 1.5690703392028809} -11/07/2021 04:50:33 - INFO - __main__ - Step 54142: {'lr': 0.00036188230045835053, 'samples': 10395264, 'steps': 54141, 'loss/train': 1.303375482559204} -11/07/2021 04:50:33 - INFO - __main__ - Step 54143: {'lr': 0.00036187755477449525, 'samples': 10395456, 'steps': 54142, 'loss/train': 0.09238816797733307} -11/07/2021 04:50:34 - INFO - __main__ - Step 54144: {'lr': 0.00036187280904022973, 'samples': 10395648, 'steps': 54143, 'loss/train': 1.3750076293945312} -11/07/2021 04:50:34 - INFO - __main__ - Step 54145: {'lr': 0.000361868063255556, 'samples': 10395840, 'steps': 54144, 'loss/train': 1.9195276498794556} -11/07/2021 04:50:35 - INFO - __main__ - Step 54146: {'lr': 0.00036186331742047627, 'samples': 10396032, 'steps': 54145, 'loss/train': 1.367439866065979} -11/07/2021 04:50:36 - INFO - __main__ - Step 54147: {'lr': 0.0003618585715349926, 'samples': 10396224, 'steps': 54146, 'loss/train': 1.5602264404296875} -11/07/2021 04:50:36 - INFO - __main__ - Step 54148: {'lr': 0.00036185382559910723, 'samples': 10396416, 'steps': 54147, 'loss/train': 1.2956527471542358} -11/07/2021 04:50:36 - INFO - __main__ - Step 54149: {'lr': 0.0003618490796128222, 'samples': 10396608, 'steps': 54148, 'loss/train': 1.2464632987976074} -11/07/2021 04:50:37 - INFO - __main__ - Step 54150: {'lr': 0.0003618443335761398, 'samples': 10396800, 'steps': 54149, 'loss/train': 1.4042271375656128} -11/07/2021 04:50:38 - INFO - __main__ - Step 54151: {'lr': 0.00036183958748906204, 'samples': 10396992, 'steps': 54150, 'loss/train': 1.5905922651290894} -11/07/2021 04:50:38 - INFO - __main__ - Step 54152: {'lr': 0.00036183484135159105, 'samples': 10397184, 'steps': 54151, 'loss/train': 1.538983702659607} -11/07/2021 04:50:38 - INFO - __main__ - Step 54153: {'lr': 0.000361830095163729, 'samples': 10397376, 'steps': 54152, 'loss/train': 1.7917529344558716} -11/07/2021 04:50:39 - INFO - __main__ - Step 54154: {'lr': 0.000361825348925478, 'samples': 10397568, 'steps': 54153, 'loss/train': 1.845569133758545} -11/07/2021 04:50:39 - INFO - __main__ - Step 54155: {'lr': 0.0003618206026368403, 'samples': 10397760, 'steps': 54154, 'loss/train': 1.2024149894714355} -11/07/2021 04:50:40 - INFO - __main__ - Step 54156: {'lr': 0.00036181585629781795, 'samples': 10397952, 'steps': 54155, 'loss/train': 1.522216558456421} -11/07/2021 04:50:40 - INFO - __main__ - Step 54157: {'lr': 0.0003618111099084131, 'samples': 10398144, 'steps': 54156, 'loss/train': 1.477552056312561} -11/07/2021 04:50:41 - INFO - __main__ - Step 54158: {'lr': 0.00036180636346862786, 'samples': 10398336, 'steps': 54157, 'loss/train': 1.573291301727295} -11/07/2021 04:50:41 - INFO - __main__ - Step 54159: {'lr': 0.0003618016169784645, 'samples': 10398528, 'steps': 54158, 'loss/train': 1.4481648206710815} -11/07/2021 04:50:42 - INFO - __main__ - Step 54160: {'lr': 0.0003617968704379249, 'samples': 10398720, 'steps': 54159, 'loss/train': 1.1955894231796265} -11/07/2021 04:50:42 - INFO - __main__ - Step 54161: {'lr': 0.0003617921238470114, 'samples': 10398912, 'steps': 54160, 'loss/train': 1.571686863899231} -11/07/2021 04:50:43 - INFO - __main__ - Step 54162: {'lr': 0.00036178737720572615, 'samples': 10399104, 'steps': 54161, 'loss/train': 0.8738097548484802} -11/07/2021 04:50:43 - INFO - __main__ - Step 54163: {'lr': 0.0003617826305140712, 'samples': 10399296, 'steps': 54162, 'loss/train': 0.8634712100028992} -11/07/2021 04:50:43 - INFO - __main__ - Step 54164: {'lr': 0.0003617778837720488, 'samples': 10399488, 'steps': 54163, 'loss/train': 1.8333909511566162} -11/07/2021 04:50:44 - INFO - __main__ - Step 54165: {'lr': 0.00036177313697966087, 'samples': 10399680, 'steps': 54164, 'loss/train': 1.1427308320999146} -11/07/2021 04:50:44 - INFO - __main__ - Step 54166: {'lr': 0.00036176839013690975, 'samples': 10399872, 'steps': 54165, 'loss/train': 0.8946309089660645} -11/07/2021 04:50:45 - INFO - __main__ - Step 54167: {'lr': 0.0003617636432437975, 'samples': 10400064, 'steps': 54166, 'loss/train': 2.0450594425201416} -11/07/2021 04:50:46 - INFO - __main__ - Step 54168: {'lr': 0.00036175889630032633, 'samples': 10400256, 'steps': 54167, 'loss/train': 1.6099635362625122} -11/07/2021 04:50:46 - INFO - __main__ - Step 54169: {'lr': 0.0003617541493064983, 'samples': 10400448, 'steps': 54168, 'loss/train': 3.37135648727417} -11/07/2021 04:50:46 - INFO - __main__ - Step 54170: {'lr': 0.00036174940226231555, 'samples': 10400640, 'steps': 54169, 'loss/train': 1.496845006942749} -11/07/2021 04:50:47 - INFO - __main__ - Step 54171: {'lr': 0.0003617446551677803, 'samples': 10400832, 'steps': 54170, 'loss/train': 1.6073050498962402} -11/07/2021 04:50:48 - INFO - __main__ - Step 54172: {'lr': 0.0003617399080228946, 'samples': 10401024, 'steps': 54171, 'loss/train': 1.785964012145996} -11/07/2021 04:50:48 - INFO - __main__ - Step 54173: {'lr': 0.0003617351608276606, 'samples': 10401216, 'steps': 54172, 'loss/train': 1.5745853185653687} -11/07/2021 04:50:48 - INFO - __main__ - Step 54174: {'lr': 0.00036173041358208047, 'samples': 10401408, 'steps': 54173, 'loss/train': 2.1846258640289307} -11/07/2021 04:50:49 - INFO - __main__ - Step 54175: {'lr': 0.0003617256662861563, 'samples': 10401600, 'steps': 54174, 'loss/train': 1.8046305179595947} -11/07/2021 04:50:49 - INFO - __main__ - Step 54176: {'lr': 0.00036172091893989033, 'samples': 10401792, 'steps': 54175, 'loss/train': 1.360886573791504} -11/07/2021 04:50:50 - INFO - __main__ - Step 54177: {'lr': 0.0003617161715432847, 'samples': 10401984, 'steps': 54176, 'loss/train': 2.502126455307007} -11/07/2021 04:50:50 - INFO - __main__ - Step 54178: {'lr': 0.0003617114240963414, 'samples': 10402176, 'steps': 54177, 'loss/train': 1.4828987121582031} -11/07/2021 04:50:51 - INFO - __main__ - Step 54179: {'lr': 0.00036170667659906263, 'samples': 10402368, 'steps': 54178, 'loss/train': 1.2660387754440308} -11/07/2021 04:50:51 - INFO - __main__ - Step 54180: {'lr': 0.0003617019290514506, 'samples': 10402560, 'steps': 54179, 'loss/train': 1.5110920667648315} -11/07/2021 04:50:51 - INFO - __main__ - Step 54181: {'lr': 0.0003616971814535074, 'samples': 10402752, 'steps': 54180, 'loss/train': 1.2024673223495483} -11/07/2021 04:50:52 - INFO - __main__ - Step 54182: {'lr': 0.0003616924338052352, 'samples': 10402944, 'steps': 54181, 'loss/train': 1.0852046012878418} -11/07/2021 04:50:53 - INFO - __main__ - Step 54183: {'lr': 0.00036168768610663605, 'samples': 10403136, 'steps': 54182, 'loss/train': 1.3982117176055908} -11/07/2021 04:50:53 - INFO - __main__ - Step 54184: {'lr': 0.0003616829383577123, 'samples': 10403328, 'steps': 54183, 'loss/train': 1.0698223114013672} -11/07/2021 04:50:54 - INFO - __main__ - Step 54185: {'lr': 0.00036167819055846575, 'samples': 10403520, 'steps': 54184, 'loss/train': 0.8570522665977478} -11/07/2021 04:50:54 - INFO - __main__ - Step 54186: {'lr': 0.0003616734427088988, 'samples': 10403712, 'steps': 54185, 'loss/train': 0.9845548868179321} -11/07/2021 04:50:55 - INFO - __main__ - Step 54187: {'lr': 0.00036166869480901354, 'samples': 10403904, 'steps': 54186, 'loss/train': 1.6993108987808228} -11/07/2021 04:50:55 - INFO - __main__ - Step 54188: {'lr': 0.0003616639468588121, 'samples': 10404096, 'steps': 54187, 'loss/train': 1.4021564722061157} -11/07/2021 04:50:56 - INFO - __main__ - Step 54189: {'lr': 0.00036165919885829654, 'samples': 10404288, 'steps': 54188, 'loss/train': 0.9608977437019348} -11/07/2021 04:50:56 - INFO - __main__ - Step 54190: {'lr': 0.0003616544508074691, 'samples': 10404480, 'steps': 54189, 'loss/train': 1.4246867895126343} -11/07/2021 04:50:56 - INFO - __main__ - Step 54191: {'lr': 0.00036164970270633195, 'samples': 10404672, 'steps': 54190, 'loss/train': 1.4522274732589722} -11/07/2021 04:50:57 - INFO - __main__ - Step 54192: {'lr': 0.0003616449545548871, 'samples': 10404864, 'steps': 54191, 'loss/train': 1.4007220268249512} -11/07/2021 04:50:58 - INFO - __main__ - Step 54193: {'lr': 0.00036164020635313677, 'samples': 10405056, 'steps': 54192, 'loss/train': 1.5226939916610718} -11/07/2021 04:50:58 - INFO - __main__ - Step 54194: {'lr': 0.0003616354581010831, 'samples': 10405248, 'steps': 54193, 'loss/train': 2.048875570297241} -11/07/2021 04:50:58 - INFO - __main__ - Step 54195: {'lr': 0.0003616307097987282, 'samples': 10405440, 'steps': 54194, 'loss/train': 1.852852702140808} -11/07/2021 04:50:59 - INFO - __main__ - Step 54196: {'lr': 0.00036162596144607425, 'samples': 10405632, 'steps': 54195, 'loss/train': 1.2445474863052368} -11/07/2021 04:50:59 - INFO - __main__ - Step 54197: {'lr': 0.00036162121304312336, 'samples': 10405824, 'steps': 54196, 'loss/train': 1.5783623456954956} -11/07/2021 04:51:00 - INFO - __main__ - Step 54198: {'lr': 0.0003616164645898776, 'samples': 10406016, 'steps': 54197, 'loss/train': 1.7226239442825317} -11/07/2021 04:51:01 - INFO - __main__ - Step 54199: {'lr': 0.0003616117160863393, 'samples': 10406208, 'steps': 54198, 'loss/train': 1.533337116241455} -11/07/2021 04:51:01 - INFO - __main__ - Step 54200: {'lr': 0.00036160696753251043, 'samples': 10406400, 'steps': 54199, 'loss/train': 0.7449395656585693} -11/07/2021 04:51:01 - INFO - __main__ - Step 54201: {'lr': 0.0003616022189283932, 'samples': 10406592, 'steps': 54200, 'loss/train': 1.16170072555542} -11/07/2021 04:51:02 - INFO - __main__ - Step 54202: {'lr': 0.00036159747027398963, 'samples': 10406784, 'steps': 54201, 'loss/train': 0.32056573033332825} -11/07/2021 04:51:03 - INFO - __main__ - Step 54203: {'lr': 0.0003615927215693021, 'samples': 10406976, 'steps': 54202, 'loss/train': 1.3610919713974} -11/07/2021 04:51:03 - INFO - __main__ - Step 54204: {'lr': 0.0003615879728143325, 'samples': 10407168, 'steps': 54203, 'loss/train': 1.335235834121704} -11/07/2021 04:51:03 - INFO - __main__ - Step 54205: {'lr': 0.00036158322400908316, 'samples': 10407360, 'steps': 54204, 'loss/train': 0.9815249443054199} -11/07/2021 04:51:04 - INFO - __main__ - Step 54206: {'lr': 0.00036157847515355614, 'samples': 10407552, 'steps': 54205, 'loss/train': 1.557557225227356} -11/07/2021 04:51:04 - INFO - __main__ - Step 54207: {'lr': 0.0003615737262477535, 'samples': 10407744, 'steps': 54206, 'loss/train': 1.1291550397872925} -11/07/2021 04:51:05 - INFO - __main__ - Step 54208: {'lr': 0.0003615689772916776, 'samples': 10407936, 'steps': 54207, 'loss/train': 1.934542179107666} -11/07/2021 04:51:05 - INFO - __main__ - Step 54209: {'lr': 0.00036156422828533035, 'samples': 10408128, 'steps': 54208, 'loss/train': 1.5808987617492676} -11/07/2021 04:51:06 - INFO - __main__ - Step 54210: {'lr': 0.000361559479228714, 'samples': 10408320, 'steps': 54209, 'loss/train': 1.5406129360198975} -11/07/2021 04:51:06 - INFO - __main__ - Step 54211: {'lr': 0.00036155473012183066, 'samples': 10408512, 'steps': 54210, 'loss/train': 1.6734875440597534} -11/07/2021 04:51:07 - INFO - __main__ - Step 54212: {'lr': 0.00036154998096468244, 'samples': 10408704, 'steps': 54211, 'loss/train': 1.8039016723632812} -11/07/2021 04:51:07 - INFO - __main__ - Step 54213: {'lr': 0.00036154523175727153, 'samples': 10408896, 'steps': 54212, 'loss/train': 1.470895528793335} -11/07/2021 04:51:08 - INFO - __main__ - Step 54214: {'lr': 0.00036154048249960015, 'samples': 10409088, 'steps': 54213, 'loss/train': 2.054375171661377} -11/07/2021 04:51:08 - INFO - __main__ - Step 54215: {'lr': 0.0003615357331916703, 'samples': 10409280, 'steps': 54214, 'loss/train': 2.149806022644043} -11/07/2021 04:51:09 - INFO - __main__ - Step 54216: {'lr': 0.0003615309838334841, 'samples': 10409472, 'steps': 54215, 'loss/train': 1.2030466794967651} -11/07/2021 04:51:09 - INFO - __main__ - Step 54217: {'lr': 0.00036152623442504386, 'samples': 10409664, 'steps': 54216, 'loss/train': 2.1831858158111572} -11/07/2021 04:51:09 - INFO - __main__ - Step 54218: {'lr': 0.0003615214849663516, 'samples': 10409856, 'steps': 54217, 'loss/train': 1.5984482765197754} -11/07/2021 04:51:10 - INFO - __main__ - Step 54219: {'lr': 0.0003615167354574094, 'samples': 10410048, 'steps': 54218, 'loss/train': 0.8072491884231567} -11/07/2021 04:51:11 - INFO - __main__ - Step 54220: {'lr': 0.0003615119858982196, 'samples': 10410240, 'steps': 54219, 'loss/train': 1.3046067953109741} -11/07/2021 04:51:11 - INFO - __main__ - Step 54221: {'lr': 0.0003615072362887841, 'samples': 10410432, 'steps': 54220, 'loss/train': 1.6609251499176025} -11/07/2021 04:51:11 - INFO - __main__ - Step 54222: {'lr': 0.0003615024866291052, 'samples': 10410624, 'steps': 54221, 'loss/train': 1.4929295778274536} -11/07/2021 04:51:12 - INFO - __main__ - Step 54223: {'lr': 0.0003614977369191851, 'samples': 10410816, 'steps': 54222, 'loss/train': 1.5850660800933838} -11/07/2021 04:51:13 - INFO - __main__ - Step 54224: {'lr': 0.00036149298715902573, 'samples': 10411008, 'steps': 54223, 'loss/train': 1.8780813217163086} -11/07/2021 04:51:13 - INFO - __main__ - Step 54225: {'lr': 0.00036148823734862934, 'samples': 10411200, 'steps': 54224, 'loss/train': 1.2997181415557861} -11/07/2021 04:51:14 - INFO - __main__ - Step 54226: {'lr': 0.00036148348748799816, 'samples': 10411392, 'steps': 54225, 'loss/train': 1.6346073150634766} -11/07/2021 04:51:14 - INFO - __main__ - Step 54227: {'lr': 0.00036147873757713417, 'samples': 10411584, 'steps': 54226, 'loss/train': 1.4231724739074707} -11/07/2021 04:51:14 - INFO - __main__ - Step 54228: {'lr': 0.0003614739876160396, 'samples': 10411776, 'steps': 54227, 'loss/train': 1.5670398473739624} -11/07/2021 04:51:15 - INFO - __main__ - Step 54229: {'lr': 0.0003614692376047165, 'samples': 10411968, 'steps': 54228, 'loss/train': 2.5385074615478516} -11/07/2021 04:51:16 - INFO - __main__ - Step 54230: {'lr': 0.00036146448754316717, 'samples': 10412160, 'steps': 54229, 'loss/train': 1.8390408754348755} -11/07/2021 04:51:16 - INFO - __main__ - Step 54231: {'lr': 0.0003614597374313937, 'samples': 10412352, 'steps': 54230, 'loss/train': 1.3580020666122437} -11/07/2021 04:51:16 - INFO - __main__ - Step 54232: {'lr': 0.00036145498726939806, 'samples': 10412544, 'steps': 54231, 'loss/train': 1.5656042098999023} -11/07/2021 04:51:17 - INFO - __main__ - Step 54233: {'lr': 0.0003614502370571826, 'samples': 10412736, 'steps': 54232, 'loss/train': 1.4175289869308472} -11/07/2021 04:51:17 - INFO - __main__ - Step 54234: {'lr': 0.00036144548679474943, 'samples': 10412928, 'steps': 54233, 'loss/train': 1.0778534412384033} -11/07/2021 04:51:18 - INFO - __main__ - Step 54235: {'lr': 0.0003614407364821005, 'samples': 10413120, 'steps': 54234, 'loss/train': 1.378931999206543} -11/07/2021 04:51:18 - INFO - __main__ - Step 54236: {'lr': 0.0003614359861192382, 'samples': 10413312, 'steps': 54235, 'loss/train': 0.9593347311019897} -11/07/2021 04:51:19 - INFO - __main__ - Step 54237: {'lr': 0.00036143123570616455, 'samples': 10413504, 'steps': 54236, 'loss/train': 1.707717776298523} -11/07/2021 04:51:19 - INFO - __main__ - Step 54238: {'lr': 0.0003614264852428817, 'samples': 10413696, 'steps': 54237, 'loss/train': 1.3806053400039673} -11/07/2021 04:51:19 - INFO - __main__ - Step 54239: {'lr': 0.0003614217347293918, 'samples': 10413888, 'steps': 54238, 'loss/train': 1.4995834827423096} -11/07/2021 04:51:20 - INFO - __main__ - Step 54240: {'lr': 0.000361416984165697, 'samples': 10414080, 'steps': 54239, 'loss/train': 1.6374309062957764} -11/07/2021 04:51:21 - INFO - __main__ - Step 54241: {'lr': 0.0003614122335517994, 'samples': 10414272, 'steps': 54240, 'loss/train': 1.4964238405227661} -11/07/2021 04:51:21 - INFO - __main__ - Step 54242: {'lr': 0.0003614074828877012, 'samples': 10414464, 'steps': 54241, 'loss/train': 2.1100287437438965} -11/07/2021 04:51:22 - INFO - __main__ - Step 54243: {'lr': 0.00036140273217340446, 'samples': 10414656, 'steps': 54242, 'loss/train': 0.5982230305671692} -11/07/2021 04:51:22 - INFO - __main__ - Step 54244: {'lr': 0.00036139798140891134, 'samples': 10414848, 'steps': 54243, 'loss/train': 1.047103762626648} -11/07/2021 04:51:23 - INFO - __main__ - Step 54245: {'lr': 0.0003613932305942241, 'samples': 10415040, 'steps': 54244, 'loss/train': 1.2297859191894531} -11/07/2021 04:51:23 - INFO - __main__ - Step 54246: {'lr': 0.00036138847972934477, 'samples': 10415232, 'steps': 54245, 'loss/train': 1.5348211526870728} -11/07/2021 04:51:24 - INFO - __main__ - Step 54247: {'lr': 0.0003613837288142755, 'samples': 10415424, 'steps': 54246, 'loss/train': 1.353988528251648} -11/07/2021 04:51:24 - INFO - __main__ - Step 54248: {'lr': 0.00036137897784901843, 'samples': 10415616, 'steps': 54247, 'loss/train': 1.3973597288131714} -11/07/2021 04:51:24 - INFO - __main__ - Step 54249: {'lr': 0.00036137422683357566, 'samples': 10415808, 'steps': 54248, 'loss/train': 1.4454056024551392} -11/07/2021 04:51:25 - INFO - __main__ - Step 54250: {'lr': 0.00036136947576794945, 'samples': 10416000, 'steps': 54249, 'loss/train': 1.7359259128570557} -11/07/2021 04:51:26 - INFO - __main__ - Step 54251: {'lr': 0.00036136472465214187, 'samples': 10416192, 'steps': 54250, 'loss/train': 1.2222212553024292} -11/07/2021 04:51:26 - INFO - __main__ - Step 54252: {'lr': 0.00036135997348615503, 'samples': 10416384, 'steps': 54251, 'loss/train': 1.7826566696166992} -11/07/2021 04:51:26 - INFO - __main__ - Step 54253: {'lr': 0.00036135522226999115, 'samples': 10416576, 'steps': 54252, 'loss/train': 1.589324951171875} -11/07/2021 04:51:27 - INFO - __main__ - Step 54254: {'lr': 0.00036135047100365223, 'samples': 10416768, 'steps': 54253, 'loss/train': 1.2796744108200073} -11/07/2021 04:51:27 - INFO - __main__ - Step 54255: {'lr': 0.00036134571968714056, 'samples': 10416960, 'steps': 54254, 'loss/train': 1.3641828298568726} -11/07/2021 04:51:28 - INFO - __main__ - Step 54256: {'lr': 0.00036134096832045825, 'samples': 10417152, 'steps': 54255, 'loss/train': 1.4050275087356567} -11/07/2021 04:51:29 - INFO - __main__ - Step 54257: {'lr': 0.0003613362169036074, 'samples': 10417344, 'steps': 54256, 'loss/train': 1.2682961225509644} -11/07/2021 04:51:29 - INFO - __main__ - Step 54258: {'lr': 0.00036133146543659026, 'samples': 10417536, 'steps': 54257, 'loss/train': 1.2486658096313477} -11/07/2021 04:51:29 - INFO - __main__ - Step 54259: {'lr': 0.00036132671391940875, 'samples': 10417728, 'steps': 54258, 'loss/train': 1.6154391765594482} -11/07/2021 04:51:30 - INFO - __main__ - Step 54260: {'lr': 0.0003613219623520652, 'samples': 10417920, 'steps': 54259, 'loss/train': 1.7659212350845337} -11/07/2021 04:51:31 - INFO - __main__ - Step 54261: {'lr': 0.00036131721073456163, 'samples': 10418112, 'steps': 54260, 'loss/train': 1.2127161026000977} -11/07/2021 04:51:31 - INFO - __main__ - Step 54262: {'lr': 0.0003613124590669003, 'samples': 10418304, 'steps': 54261, 'loss/train': 0.9236514568328857} -11/07/2021 04:51:31 - INFO - __main__ - Step 54263: {'lr': 0.0003613077073490832, 'samples': 10418496, 'steps': 54262, 'loss/train': 1.465780258178711} -11/07/2021 04:51:32 - INFO - __main__ - Step 54264: {'lr': 0.0003613029555811127, 'samples': 10418688, 'steps': 54263, 'loss/train': 1.7864091396331787} -11/07/2021 04:51:32 - INFO - __main__ - Step 54265: {'lr': 0.0003612982037629908, 'samples': 10418880, 'steps': 54264, 'loss/train': 1.5634664297103882} -11/07/2021 04:51:33 - INFO - __main__ - Step 54266: {'lr': 0.0003612934518947196, 'samples': 10419072, 'steps': 54265, 'loss/train': 1.3271775245666504} -11/07/2021 04:51:33 - INFO - __main__ - Step 54267: {'lr': 0.00036128869997630134, 'samples': 10419264, 'steps': 54266, 'loss/train': 1.2767351865768433} -11/07/2021 04:51:34 - INFO - __main__ - Step 54268: {'lr': 0.000361283948007738, 'samples': 10419456, 'steps': 54267, 'loss/train': 1.6081736087799072} -11/07/2021 04:51:34 - INFO - __main__ - Step 54269: {'lr': 0.00036127919598903186, 'samples': 10419648, 'steps': 54268, 'loss/train': 1.4866764545440674} -11/07/2021 04:51:35 - INFO - __main__ - Step 54270: {'lr': 0.00036127444392018503, 'samples': 10419840, 'steps': 54269, 'loss/train': 1.5276362895965576} -11/07/2021 04:51:35 - INFO - __main__ - Step 54271: {'lr': 0.00036126969180119977, 'samples': 10420032, 'steps': 54270, 'loss/train': 1.4294250011444092} -11/07/2021 04:51:36 - INFO - __main__ - Step 54272: {'lr': 0.000361264939632078, 'samples': 10420224, 'steps': 54271, 'loss/train': 1.4313125610351562} -11/07/2021 04:51:36 - INFO - __main__ - Step 54273: {'lr': 0.00036126018741282194, 'samples': 10420416, 'steps': 54272, 'loss/train': 1.4946861267089844} -11/07/2021 04:51:37 - INFO - __main__ - Step 54274: {'lr': 0.0003612554351434338, 'samples': 10420608, 'steps': 54273, 'loss/train': 0.9294034838676453} -11/07/2021 04:51:37 - INFO - __main__ - Step 54275: {'lr': 0.0003612506828239157, 'samples': 10420800, 'steps': 54274, 'loss/train': 1.4074270725250244} -11/07/2021 04:51:37 - INFO - __main__ - Step 54276: {'lr': 0.00036124593045426973, 'samples': 10420992, 'steps': 54275, 'loss/train': 1.4687080383300781} -11/07/2021 04:51:38 - INFO - __main__ - Step 54277: {'lr': 0.00036124117803449805, 'samples': 10421184, 'steps': 54276, 'loss/train': 1.4551621675491333} -11/07/2021 04:51:39 - INFO - __main__ - Step 54278: {'lr': 0.00036123642556460284, 'samples': 10421376, 'steps': 54277, 'loss/train': 1.1469041109085083} -11/07/2021 04:51:39 - INFO - __main__ - Step 54279: {'lr': 0.0003612316730445862, 'samples': 10421568, 'steps': 54278, 'loss/train': 1.6708741188049316} -11/07/2021 04:51:39 - INFO - __main__ - Step 54280: {'lr': 0.00036122692047445027, 'samples': 10421760, 'steps': 54279, 'loss/train': 1.777620792388916} -11/07/2021 04:51:40 - INFO - __main__ - Step 54281: {'lr': 0.00036122216785419725, 'samples': 10421952, 'steps': 54280, 'loss/train': 2.0170483589172363} -11/07/2021 04:51:41 - INFO - __main__ - Step 54282: {'lr': 0.00036121741518382915, 'samples': 10422144, 'steps': 54281, 'loss/train': 1.4133511781692505} -11/07/2021 04:51:41 - INFO - __main__ - Step 54283: {'lr': 0.00036121266246334825, 'samples': 10422336, 'steps': 54282, 'loss/train': 1.4715251922607422} -11/07/2021 04:51:42 - INFO - __main__ - Step 54284: {'lr': 0.00036120790969275667, 'samples': 10422528, 'steps': 54283, 'loss/train': 0.9404296278953552} -11/07/2021 04:51:42 - INFO - __main__ - Step 54285: {'lr': 0.0003612031568720565, 'samples': 10422720, 'steps': 54284, 'loss/train': 1.6253358125686646} -11/07/2021 04:51:42 - INFO - __main__ - Step 54286: {'lr': 0.0003611984040012499, 'samples': 10422912, 'steps': 54285, 'loss/train': 1.5697365999221802} -11/07/2021 04:51:43 - INFO - __main__ - Step 54287: {'lr': 0.000361193651080339, 'samples': 10423104, 'steps': 54286, 'loss/train': 1.9644566774368286} -11/07/2021 04:51:44 - INFO - __main__ - Step 54288: {'lr': 0.000361188898109326, 'samples': 10423296, 'steps': 54287, 'loss/train': 1.6080108880996704} -11/07/2021 04:51:44 - INFO - __main__ - Step 54289: {'lr': 0.00036118414508821295, 'samples': 10423488, 'steps': 54288, 'loss/train': 1.6078134775161743} -11/07/2021 04:51:44 - INFO - __main__ - Step 54290: {'lr': 0.0003611793920170021, 'samples': 10423680, 'steps': 54289, 'loss/train': 1.1907614469528198} -11/07/2021 04:51:45 - INFO - __main__ - Step 54291: {'lr': 0.0003611746388956955, 'samples': 10423872, 'steps': 54290, 'loss/train': 1.3729536533355713} -11/07/2021 04:51:46 - INFO - __main__ - Step 54292: {'lr': 0.00036116988572429534, 'samples': 10424064, 'steps': 54291, 'loss/train': 1.1345936059951782} -11/07/2021 04:51:46 - INFO - __main__ - Step 54293: {'lr': 0.0003611651325028037, 'samples': 10424256, 'steps': 54292, 'loss/train': 1.1989638805389404} -11/07/2021 04:51:46 - INFO - __main__ - Step 54294: {'lr': 0.0003611603792312228, 'samples': 10424448, 'steps': 54293, 'loss/train': 1.0696619749069214} -11/07/2021 04:51:47 - INFO - __main__ - Step 54295: {'lr': 0.0003611556259095547, 'samples': 10424640, 'steps': 54294, 'loss/train': 1.2648447751998901} -11/07/2021 04:51:47 - INFO - __main__ - Step 54296: {'lr': 0.00036115087253780164, 'samples': 10424832, 'steps': 54295, 'loss/train': 1.5976979732513428} -11/07/2021 04:51:48 - INFO - __main__ - Step 54297: {'lr': 0.0003611461191159657, 'samples': 10425024, 'steps': 54296, 'loss/train': 1.587814211845398} -11/07/2021 04:51:48 - INFO - __main__ - Step 54298: {'lr': 0.00036114136564404905, 'samples': 10425216, 'steps': 54297, 'loss/train': 1.583405613899231} -11/07/2021 04:51:49 - INFO - __main__ - Step 54299: {'lr': 0.0003611366121220538, 'samples': 10425408, 'steps': 54298, 'loss/train': 1.291266918182373} -11/07/2021 04:51:49 - INFO - __main__ - Step 54300: {'lr': 0.0003611318585499821, 'samples': 10425600, 'steps': 54299, 'loss/train': 1.4985302686691284} -11/07/2021 04:51:49 - INFO - __main__ - Step 54301: {'lr': 0.00036112710492783605, 'samples': 10425792, 'steps': 54300, 'loss/train': 1.4486124515533447} -11/07/2021 04:51:50 - INFO - __main__ - Step 54302: {'lr': 0.0003611223512556179, 'samples': 10425984, 'steps': 54301, 'loss/train': 1.560719609260559} -11/07/2021 04:51:51 - INFO - __main__ - Step 54303: {'lr': 0.0003611175975333297, 'samples': 10426176, 'steps': 54302, 'loss/train': 1.3340426683425903} -11/07/2021 04:51:51 - INFO - __main__ - Step 54304: {'lr': 0.0003611128437609737, 'samples': 10426368, 'steps': 54303, 'loss/train': 1.3235589265823364} -11/07/2021 04:51:51 - INFO - __main__ - Step 54305: {'lr': 0.00036110808993855195, 'samples': 10426560, 'steps': 54304, 'loss/train': 1.4664251804351807} -11/07/2021 04:51:52 - INFO - __main__ - Step 54306: {'lr': 0.0003611033360660666, 'samples': 10426752, 'steps': 54305, 'loss/train': 1.3883143663406372} -11/07/2021 04:51:52 - INFO - __main__ - Step 54307: {'lr': 0.00036109858214351977, 'samples': 10426944, 'steps': 54306, 'loss/train': 1.0334155559539795} -11/07/2021 04:51:53 - INFO - __main__ - Step 54308: {'lr': 0.0003610938281709136, 'samples': 10427136, 'steps': 54307, 'loss/train': 1.3422967195510864} -11/07/2021 04:51:54 - INFO - __main__ - Step 54309: {'lr': 0.0003610890741482503, 'samples': 10427328, 'steps': 54308, 'loss/train': 1.5439521074295044} -11/07/2021 04:51:54 - INFO - __main__ - Step 54310: {'lr': 0.000361084320075532, 'samples': 10427520, 'steps': 54309, 'loss/train': 1.237337350845337} -11/07/2021 04:51:54 - INFO - __main__ - Step 54311: {'lr': 0.00036107956595276083, 'samples': 10427712, 'steps': 54310, 'loss/train': 1.5016213655471802} -11/07/2021 04:51:55 - INFO - __main__ - Step 54312: {'lr': 0.00036107481177993897, 'samples': 10427904, 'steps': 54311, 'loss/train': 0.9651145935058594} -11/07/2021 04:51:56 - INFO - __main__ - Step 54313: {'lr': 0.0003610700575570684, 'samples': 10428096, 'steps': 54312, 'loss/train': 1.3069701194763184} -11/07/2021 04:51:56 - INFO - __main__ - Step 54314: {'lr': 0.00036106530328415136, 'samples': 10428288, 'steps': 54313, 'loss/train': 1.1593788862228394} -11/07/2021 04:51:56 - INFO - __main__ - Step 54315: {'lr': 0.0003610605489611901, 'samples': 10428480, 'steps': 54314, 'loss/train': 1.3796184062957764} -11/07/2021 04:51:57 - INFO - __main__ - Step 54316: {'lr': 0.0003610557945881866, 'samples': 10428672, 'steps': 54315, 'loss/train': 1.698350191116333} -11/07/2021 04:51:57 - INFO - __main__ - Step 54317: {'lr': 0.0003610510401651431, 'samples': 10428864, 'steps': 54316, 'loss/train': 1.696230411529541} -11/07/2021 04:51:58 - INFO - __main__ - Step 54318: {'lr': 0.00036104628569206176, 'samples': 10429056, 'steps': 54317, 'loss/train': 1.3979032039642334} -11/07/2021 04:51:58 - INFO - __main__ - Step 54319: {'lr': 0.00036104153116894465, 'samples': 10429248, 'steps': 54318, 'loss/train': 0.9612535834312439} -11/07/2021 04:51:59 - INFO - __main__ - Step 54320: {'lr': 0.00036103677659579393, 'samples': 10429440, 'steps': 54319, 'loss/train': 1.3281012773513794} -11/07/2021 04:51:59 - INFO - __main__ - Step 54321: {'lr': 0.0003610320219726118, 'samples': 10429632, 'steps': 54320, 'loss/train': 1.3183045387268066} -11/07/2021 04:52:00 - INFO - __main__ - Step 54322: {'lr': 0.00036102726729940026, 'samples': 10429824, 'steps': 54321, 'loss/train': 1.418987512588501} -11/07/2021 04:52:00 - INFO - __main__ - Step 54323: {'lr': 0.0003610225125761616, 'samples': 10430016, 'steps': 54322, 'loss/train': 1.4627366065979004} -11/07/2021 04:52:01 - INFO - __main__ - Step 54324: {'lr': 0.0003610177578028979, 'samples': 10430208, 'steps': 54323, 'loss/train': 1.9382911920547485} -11/07/2021 04:52:01 - INFO - __main__ - Step 54325: {'lr': 0.0003610130029796114, 'samples': 10430400, 'steps': 54324, 'loss/train': 1.7260798215866089} -11/07/2021 04:52:02 - INFO - __main__ - Step 54326: {'lr': 0.000361008248106304, 'samples': 10430592, 'steps': 54325, 'loss/train': 1.382545828819275} -11/07/2021 04:52:02 - INFO - __main__ - Step 54327: {'lr': 0.0003610034931829781, 'samples': 10430784, 'steps': 54326, 'loss/train': 1.1825271844863892} -11/07/2021 04:52:03 - INFO - __main__ - Step 54328: {'lr': 0.0003609987382096357, 'samples': 10430976, 'steps': 54327, 'loss/train': 2.017258882522583} -11/07/2021 04:52:03 - INFO - __main__ - Step 54329: {'lr': 0.00036099398318627896, 'samples': 10431168, 'steps': 54328, 'loss/train': 1.383423089981079} -11/07/2021 04:52:04 - INFO - __main__ - Step 54330: {'lr': 0.00036098922811291, 'samples': 10431360, 'steps': 54329, 'loss/train': 0.9380173683166504} -11/07/2021 04:52:04 - INFO - __main__ - Step 54331: {'lr': 0.00036098447298953107, 'samples': 10431552, 'steps': 54330, 'loss/train': 1.2224643230438232} -11/07/2021 04:52:04 - INFO - __main__ - Step 54332: {'lr': 0.00036097971781614435, 'samples': 10431744, 'steps': 54331, 'loss/train': 1.1786091327667236} -11/07/2021 04:52:05 - INFO - __main__ - Step 54333: {'lr': 0.0003609749625927518, 'samples': 10431936, 'steps': 54332, 'loss/train': 1.3576468229293823} -11/07/2021 04:52:06 - INFO - __main__ - Step 54334: {'lr': 0.0003609702073193556, 'samples': 10432128, 'steps': 54333, 'loss/train': 2.0165226459503174} -11/07/2021 04:52:06 - INFO - __main__ - Step 54335: {'lr': 0.000360965451995958, 'samples': 10432320, 'steps': 54334, 'loss/train': 1.2862190008163452} -11/07/2021 04:52:06 - INFO - __main__ - Step 54336: {'lr': 0.000360960696622561, 'samples': 10432512, 'steps': 54335, 'loss/train': 0.9898625612258911} -11/07/2021 04:52:07 - INFO - __main__ - Step 54337: {'lr': 0.0003609559411991669, 'samples': 10432704, 'steps': 54336, 'loss/train': 1.6091269254684448} -11/07/2021 04:52:08 - INFO - __main__ - Step 54338: {'lr': 0.00036095118572577773, 'samples': 10432896, 'steps': 54337, 'loss/train': 1.989393949508667} -11/07/2021 04:52:08 - INFO - __main__ - Step 54339: {'lr': 0.00036094643020239564, 'samples': 10433088, 'steps': 54338, 'loss/train': 0.6083117127418518} -11/07/2021 04:52:08 - INFO - __main__ - Step 54340: {'lr': 0.0003609416746290228, 'samples': 10433280, 'steps': 54339, 'loss/train': 0.7100966572761536} -11/07/2021 04:52:09 - INFO - __main__ - Step 54341: {'lr': 0.00036093691900566146, 'samples': 10433472, 'steps': 54340, 'loss/train': 1.5817288160324097} -11/07/2021 04:52:09 - INFO - __main__ - Step 54342: {'lr': 0.00036093216333231356, 'samples': 10433664, 'steps': 54341, 'loss/train': 1.5909347534179688} -11/07/2021 04:52:10 - INFO - __main__ - Step 54343: {'lr': 0.0003609274076089813, 'samples': 10433856, 'steps': 54342, 'loss/train': 1.1382523775100708} -11/07/2021 04:52:10 - INFO - __main__ - Step 54344: {'lr': 0.00036092265183566705, 'samples': 10434048, 'steps': 54343, 'loss/train': 1.5417569875717163} -11/07/2021 04:52:11 - INFO - __main__ - Step 54345: {'lr': 0.0003609178960123726, 'samples': 10434240, 'steps': 54344, 'loss/train': 1.293168544769287} -11/07/2021 04:52:11 - INFO - __main__ - Step 54346: {'lr': 0.0003609131401391003, 'samples': 10434432, 'steps': 54345, 'loss/train': 1.2680710554122925} -11/07/2021 04:52:11 - INFO - __main__ - Step 54347: {'lr': 0.00036090838421585223, 'samples': 10434624, 'steps': 54346, 'loss/train': 1.698599100112915} -11/07/2021 04:52:13 - INFO - __main__ - Step 54348: {'lr': 0.0003609036282426306, 'samples': 10434816, 'steps': 54347, 'loss/train': 1.044775366783142} -11/07/2021 04:52:13 - INFO - __main__ - Step 54349: {'lr': 0.0003608988722194375, 'samples': 10435008, 'steps': 54348, 'loss/train': 1.6415693759918213} -11/07/2021 04:52:13 - INFO - __main__ - Step 54350: {'lr': 0.000360894116146275, 'samples': 10435200, 'steps': 54349, 'loss/train': 1.753548264503479} -11/07/2021 04:52:14 - INFO - __main__ - Step 54351: {'lr': 0.0003608893600231454, 'samples': 10435392, 'steps': 54350, 'loss/train': 1.502634048461914} -11/07/2021 04:52:14 - INFO - __main__ - Step 54352: {'lr': 0.00036088460385005076, 'samples': 10435584, 'steps': 54351, 'loss/train': 1.4957200288772583} -11/07/2021 04:52:14 - INFO - __main__ - Step 54353: {'lr': 0.00036087984762699316, 'samples': 10435776, 'steps': 54352, 'loss/train': 1.4521698951721191} -11/07/2021 04:52:15 - INFO - __main__ - Step 54354: {'lr': 0.00036087509135397487, 'samples': 10435968, 'steps': 54353, 'loss/train': 1.2603263854980469} -11/07/2021 04:52:16 - INFO - __main__ - Step 54355: {'lr': 0.00036087033503099796, 'samples': 10436160, 'steps': 54354, 'loss/train': 1.5180668830871582} -11/07/2021 04:52:16 - INFO - __main__ - Step 54356: {'lr': 0.00036086557865806464, 'samples': 10436352, 'steps': 54355, 'loss/train': 1.1182160377502441} -11/07/2021 04:52:16 - INFO - __main__ - Step 54357: {'lr': 0.000360860822235177, 'samples': 10436544, 'steps': 54356, 'loss/train': 1.7119102478027344} -11/07/2021 04:52:17 - INFO - __main__ - Step 54358: {'lr': 0.0003608560657623371, 'samples': 10436736, 'steps': 54357, 'loss/train': 1.7710380554199219} -11/07/2021 04:52:18 - INFO - __main__ - Step 54359: {'lr': 0.0003608513092395472, 'samples': 10436928, 'steps': 54358, 'loss/train': 1.1594558954238892} -11/07/2021 04:52:18 - INFO - __main__ - Step 54360: {'lr': 0.00036084655266680946, 'samples': 10437120, 'steps': 54359, 'loss/train': 1.8689113855361938} -11/07/2021 04:52:19 - INFO - __main__ - Step 54361: {'lr': 0.00036084179604412594, 'samples': 10437312, 'steps': 54360, 'loss/train': 0.38729095458984375} -11/07/2021 04:52:19 - INFO - __main__ - Step 54362: {'lr': 0.00036083703937149877, 'samples': 10437504, 'steps': 54361, 'loss/train': 1.2443463802337646} -11/07/2021 04:52:19 - INFO - __main__ - Step 54363: {'lr': 0.0003608322826489302, 'samples': 10437696, 'steps': 54362, 'loss/train': 1.8838434219360352} -11/07/2021 04:52:20 - INFO - __main__ - Step 54364: {'lr': 0.00036082752587642225, 'samples': 10437888, 'steps': 54363, 'loss/train': 1.8106375932693481} -11/07/2021 04:52:21 - INFO - __main__ - Step 54365: {'lr': 0.00036082276905397714, 'samples': 10438080, 'steps': 54364, 'loss/train': 1.8011395931243896} -11/07/2021 04:52:21 - INFO - __main__ - Step 54366: {'lr': 0.0003608180121815971, 'samples': 10438272, 'steps': 54365, 'loss/train': 0.9508764147758484} -11/07/2021 04:52:21 - INFO - __main__ - Step 54367: {'lr': 0.0003608132552592841, 'samples': 10438464, 'steps': 54366, 'loss/train': 1.3006246089935303} -11/07/2021 04:52:22 - INFO - __main__ - Step 54368: {'lr': 0.0003608084982870404, 'samples': 10438656, 'steps': 54367, 'loss/train': 1.1658813953399658} -11/07/2021 04:52:22 - INFO - __main__ - Step 54369: {'lr': 0.00036080374126486804, 'samples': 10438848, 'steps': 54368, 'loss/train': 0.719493567943573} -11/07/2021 04:52:23 - INFO - __main__ - Step 54370: {'lr': 0.00036079898419276923, 'samples': 10439040, 'steps': 54369, 'loss/train': 1.668667197227478} -11/07/2021 04:52:23 - INFO - __main__ - Step 54371: {'lr': 0.0003607942270707461, 'samples': 10439232, 'steps': 54370, 'loss/train': 1.707180142402649} -11/07/2021 04:52:24 - INFO - __main__ - Step 54372: {'lr': 0.0003607894698988009, 'samples': 10439424, 'steps': 54371, 'loss/train': 1.9096475839614868} -11/07/2021 04:52:24 - INFO - __main__ - Step 54373: {'lr': 0.0003607847126769356, 'samples': 10439616, 'steps': 54372, 'loss/train': 1.17087984085083} -11/07/2021 04:52:24 - INFO - __main__ - Step 54374: {'lr': 0.0003607799554051524, 'samples': 10439808, 'steps': 54373, 'loss/train': 1.7106337547302246} -11/07/2021 04:52:25 - INFO - __main__ - Step 54375: {'lr': 0.0003607751980834535, 'samples': 10440000, 'steps': 54374, 'loss/train': 1.3186962604522705} -11/07/2021 04:52:26 - INFO - __main__ - Step 54376: {'lr': 0.00036077044071184094, 'samples': 10440192, 'steps': 54375, 'loss/train': 1.4960261583328247} -11/07/2021 04:52:26 - INFO - __main__ - Step 54377: {'lr': 0.00036076568329031694, 'samples': 10440384, 'steps': 54376, 'loss/train': 1.5511620044708252} -11/07/2021 04:52:26 - INFO - __main__ - Step 54378: {'lr': 0.0003607609258188837, 'samples': 10440576, 'steps': 54377, 'loss/train': 1.56057870388031} -11/07/2021 04:52:27 - INFO - __main__ - Step 54379: {'lr': 0.00036075616829754333, 'samples': 10440768, 'steps': 54378, 'loss/train': 1.3680694103240967} -11/07/2021 04:52:28 - INFO - __main__ - Step 54380: {'lr': 0.0003607514107262978, 'samples': 10440960, 'steps': 54379, 'loss/train': 1.5334746837615967} -11/07/2021 04:52:28 - INFO - __main__ - Step 54381: {'lr': 0.0003607466531051495, 'samples': 10441152, 'steps': 54380, 'loss/train': 0.6852833032608032} -11/07/2021 04:52:29 - INFO - __main__ - Step 54382: {'lr': 0.0003607418954341004, 'samples': 10441344, 'steps': 54381, 'loss/train': 1.2319045066833496} -11/07/2021 04:52:29 - INFO - __main__ - Step 54383: {'lr': 0.00036073713771315276, 'samples': 10441536, 'steps': 54382, 'loss/train': 1.784158706665039} -11/07/2021 04:52:29 - INFO - __main__ - Step 54384: {'lr': 0.00036073237994230863, 'samples': 10441728, 'steps': 54383, 'loss/train': 1.4005428552627563} -11/07/2021 04:52:31 - INFO - __main__ - Step 54385: {'lr': 0.0003607276221215702, 'samples': 10441920, 'steps': 54384, 'loss/train': 1.500992774963379} -11/07/2021 04:52:31 - INFO - __main__ - Step 54386: {'lr': 0.0003607228642509397, 'samples': 10442112, 'steps': 54385, 'loss/train': 1.3948326110839844} -11/07/2021 04:52:32 - INFO - __main__ - Step 54387: {'lr': 0.00036071810633041913, 'samples': 10442304, 'steps': 54386, 'loss/train': 1.016112208366394} -11/07/2021 04:52:32 - INFO - __main__ - Step 54388: {'lr': 0.0003607133483600107, 'samples': 10442496, 'steps': 54387, 'loss/train': 1.4534598588943481} -11/07/2021 04:52:32 - INFO - __main__ - Step 54389: {'lr': 0.00036070859033971646, 'samples': 10442688, 'steps': 54388, 'loss/train': 0.3873778283596039} -11/07/2021 04:52:33 - INFO - __main__ - Step 54390: {'lr': 0.00036070383226953875, 'samples': 10442880, 'steps': 54389, 'loss/train': 0.34228697419166565} -11/07/2021 04:52:34 - INFO - __main__ - Step 54391: {'lr': 0.0003606990741494795, 'samples': 10443072, 'steps': 54390, 'loss/train': 1.409023404121399} -11/07/2021 04:52:34 - INFO - __main__ - Step 54392: {'lr': 0.00036069431597954103, 'samples': 10443264, 'steps': 54391, 'loss/train': 1.137148141860962} -11/07/2021 04:52:35 - INFO - __main__ - Step 54393: {'lr': 0.0003606895577597254, 'samples': 10443456, 'steps': 54392, 'loss/train': 1.4473907947540283} -11/07/2021 04:52:35 - INFO - __main__ - Step 54394: {'lr': 0.0003606847994900347, 'samples': 10443648, 'steps': 54393, 'loss/train': 1.473389983177185} -11/07/2021 04:52:36 - INFO - __main__ - Step 54395: {'lr': 0.00036068004117047127, 'samples': 10443840, 'steps': 54394, 'loss/train': 1.6775680780410767} -11/07/2021 04:52:36 - INFO - __main__ - Step 54396: {'lr': 0.000360675282801037, 'samples': 10444032, 'steps': 54395, 'loss/train': 1.2410303354263306} -11/07/2021 04:52:37 - INFO - __main__ - Step 54397: {'lr': 0.0003606705243817342, 'samples': 10444224, 'steps': 54396, 'loss/train': 1.5199062824249268} -11/07/2021 04:52:37 - INFO - __main__ - Step 54398: {'lr': 0.00036066576591256496, 'samples': 10444416, 'steps': 54397, 'loss/train': 0.6575682163238525} -11/07/2021 04:52:37 - INFO - __main__ - Step 54399: {'lr': 0.00036066100739353145, 'samples': 10444608, 'steps': 54398, 'loss/train': 1.3232568502426147} -11/07/2021 04:52:38 - INFO - __main__ - Step 54400: {'lr': 0.0003606562488246358, 'samples': 10444800, 'steps': 54399, 'loss/train': 1.3682371377944946} -11/07/2021 04:52:39 - INFO - __main__ - Step 54401: {'lr': 0.00036065149020588015, 'samples': 10444992, 'steps': 54400, 'loss/train': 0.9206700325012207} -11/07/2021 04:52:39 - INFO - __main__ - Step 54402: {'lr': 0.00036064673153726664, 'samples': 10445184, 'steps': 54401, 'loss/train': 1.3973582983016968} -11/07/2021 04:52:39 - INFO - __main__ - Step 54403: {'lr': 0.0003606419728187974, 'samples': 10445376, 'steps': 54402, 'loss/train': 1.6272251605987549} -11/07/2021 04:52:40 - INFO - __main__ - Step 54404: {'lr': 0.00036063721405047463, 'samples': 10445568, 'steps': 54403, 'loss/train': 1.5553442239761353} -11/07/2021 04:52:40 - INFO - __main__ - Step 54405: {'lr': 0.00036063245523230037, 'samples': 10445760, 'steps': 54404, 'loss/train': 1.4646358489990234} -11/07/2021 04:52:41 - INFO - __main__ - Step 54406: {'lr': 0.0003606276963642769, 'samples': 10445952, 'steps': 54405, 'loss/train': 0.8105902075767517} -11/07/2021 04:52:42 - INFO - __main__ - Step 54407: {'lr': 0.00036062293744640637, 'samples': 10446144, 'steps': 54406, 'loss/train': 1.3325507640838623} -11/07/2021 04:52:42 - INFO - __main__ - Step 54408: {'lr': 0.0003606181784786907, 'samples': 10446336, 'steps': 54407, 'loss/train': 1.3325507640838623} -11/07/2021 04:52:42 - INFO - __main__ - Step 54409: {'lr': 0.00036061341946113225, 'samples': 10446528, 'steps': 54408, 'loss/train': 1.77774977684021} -11/07/2021 04:52:43 - INFO - __main__ - Step 54410: {'lr': 0.0003606086603937331, 'samples': 10446720, 'steps': 54409, 'loss/train': 0.8325642347335815} -11/07/2021 04:52:44 - INFO - __main__ - Step 54411: {'lr': 0.00036060390127649536, 'samples': 10446912, 'steps': 54410, 'loss/train': 1.4419652223587036} -11/07/2021 04:52:44 - INFO - __main__ - Step 54412: {'lr': 0.00036059914210942126, 'samples': 10447104, 'steps': 54411, 'loss/train': 0.8393263816833496} -11/07/2021 04:52:44 - INFO - __main__ - Step 54413: {'lr': 0.0003605943828925129, 'samples': 10447296, 'steps': 54412, 'loss/train': 1.6156970262527466} -11/07/2021 04:52:45 - INFO - __main__ - Step 54414: {'lr': 0.0003605896236257724, 'samples': 10447488, 'steps': 54413, 'loss/train': 1.5920202732086182} -11/07/2021 04:52:45 - INFO - __main__ - Step 54415: {'lr': 0.0003605848643092019, 'samples': 10447680, 'steps': 54414, 'loss/train': 1.5970395803451538} -11/07/2021 04:52:46 - INFO - __main__ - Step 54416: {'lr': 0.00036058010494280357, 'samples': 10447872, 'steps': 54415, 'loss/train': 1.5743522644042969} -11/07/2021 04:52:46 - INFO - __main__ - Step 54417: {'lr': 0.00036057534552657954, 'samples': 10448064, 'steps': 54416, 'loss/train': 0.698424756526947} -11/07/2021 04:52:47 - INFO - __main__ - Step 54418: {'lr': 0.000360570586060532, 'samples': 10448256, 'steps': 54417, 'loss/train': 0.8364660143852234} -11/07/2021 04:52:47 - INFO - __main__ - Step 54419: {'lr': 0.0003605658265446631, 'samples': 10448448, 'steps': 54418, 'loss/train': 1.6641874313354492} -11/07/2021 04:52:47 - INFO - __main__ - Step 54420: {'lr': 0.00036056106697897485, 'samples': 10448640, 'steps': 54419, 'loss/train': 1.6034648418426514} -11/07/2021 04:52:48 - INFO - __main__ - Step 54421: {'lr': 0.0003605563073634696, 'samples': 10448832, 'steps': 54420, 'loss/train': 1.2959027290344238} -11/07/2021 04:52:49 - INFO - __main__ - Step 54422: {'lr': 0.00036055154769814923, 'samples': 10449024, 'steps': 54421, 'loss/train': 1.5499179363250732} -11/07/2021 04:52:49 - INFO - __main__ - Step 54423: {'lr': 0.0003605467879830161, 'samples': 10449216, 'steps': 54422, 'loss/train': 1.3453330993652344} -11/07/2021 04:52:49 - INFO - __main__ - Step 54424: {'lr': 0.00036054202821807235, 'samples': 10449408, 'steps': 54423, 'loss/train': 0.702586829662323} -11/07/2021 04:52:50 - INFO - __main__ - Step 54425: {'lr': 0.00036053726840332004, 'samples': 10449600, 'steps': 54424, 'loss/train': 1.5528888702392578} -11/07/2021 04:52:50 - INFO - __main__ - Step 54426: {'lr': 0.00036053250853876134, 'samples': 10449792, 'steps': 54425, 'loss/train': 1.2884200811386108} -11/07/2021 04:52:51 - INFO - __main__ - Step 54427: {'lr': 0.0003605277486243984, 'samples': 10449984, 'steps': 54426, 'loss/train': 1.3678855895996094} -11/07/2021 04:52:52 - INFO - __main__ - Step 54428: {'lr': 0.0003605229886602334, 'samples': 10450176, 'steps': 54427, 'loss/train': 1.1845022439956665} -11/07/2021 04:52:52 - INFO - __main__ - Step 54429: {'lr': 0.0003605182286462683, 'samples': 10450368, 'steps': 54428, 'loss/train': 1.6093850135803223} -11/07/2021 04:52:52 - INFO - __main__ - Step 54430: {'lr': 0.00036051346858250556, 'samples': 10450560, 'steps': 54429, 'loss/train': 1.5918231010437012} -11/07/2021 04:52:53 - INFO - __main__ - Step 54431: {'lr': 0.0003605087084689471, 'samples': 10450752, 'steps': 54430, 'loss/train': 1.4565256834030151} -11/07/2021 04:52:54 - INFO - __main__ - Step 54432: {'lr': 0.0003605039483055951, 'samples': 10450944, 'steps': 54431, 'loss/train': 1.2546392679214478} -11/07/2021 04:52:54 - INFO - __main__ - Step 54433: {'lr': 0.00036049918809245173, 'samples': 10451136, 'steps': 54432, 'loss/train': 0.7608054876327515} -11/07/2021 04:52:54 - INFO - __main__ - Step 54434: {'lr': 0.00036049442782951915, 'samples': 10451328, 'steps': 54433, 'loss/train': 1.2936904430389404} -11/07/2021 04:52:55 - INFO - __main__ - Step 54435: {'lr': 0.00036048966751679945, 'samples': 10451520, 'steps': 54434, 'loss/train': 1.3748066425323486} -11/07/2021 04:52:55 - INFO - __main__ - Step 54436: {'lr': 0.0003604849071542948, 'samples': 10451712, 'steps': 54435, 'loss/train': 1.7087937593460083} -11/07/2021 04:52:56 - INFO - __main__ - Step 54437: {'lr': 0.0003604801467420074, 'samples': 10451904, 'steps': 54436, 'loss/train': 1.6028019189834595} -11/07/2021 04:52:56 - INFO - __main__ - Step 54438: {'lr': 0.00036047538627993937, 'samples': 10452096, 'steps': 54437, 'loss/train': 2.164919376373291} -11/07/2021 04:52:57 - INFO - __main__ - Step 54439: {'lr': 0.00036047062576809283, 'samples': 10452288, 'steps': 54438, 'loss/train': 1.4333831071853638} -11/07/2021 04:52:57 - INFO - __main__ - Step 54440: {'lr': 0.0003604658652064699, 'samples': 10452480, 'steps': 54439, 'loss/train': 0.7021957039833069} -11/07/2021 04:52:57 - INFO - __main__ - Step 54441: {'lr': 0.00036046110459507275, 'samples': 10452672, 'steps': 54440, 'loss/train': 1.6664040088653564} -11/07/2021 04:52:58 - INFO - __main__ - Step 54442: {'lr': 0.00036045634393390354, 'samples': 10452864, 'steps': 54441, 'loss/train': 1.2602707147598267} -11/07/2021 04:52:59 - INFO - __main__ - Step 54443: {'lr': 0.0003604515832229644, 'samples': 10453056, 'steps': 54442, 'loss/train': 0.9451863169670105} -11/07/2021 04:52:59 - INFO - __main__ - Step 54444: {'lr': 0.0003604468224622575, 'samples': 10453248, 'steps': 54443, 'loss/train': 1.4609249830245972} -11/07/2021 04:53:00 - INFO - __main__ - Step 54445: {'lr': 0.00036044206165178496, 'samples': 10453440, 'steps': 54444, 'loss/train': 1.35500168800354} -11/07/2021 04:53:00 - INFO - __main__ - Step 54446: {'lr': 0.00036043730079154897, 'samples': 10453632, 'steps': 54445, 'loss/train': 1.7862550020217896} -11/07/2021 04:53:01 - INFO - __main__ - Step 54447: {'lr': 0.00036043253988155157, 'samples': 10453824, 'steps': 54446, 'loss/train': 1.4353855848312378} -11/07/2021 04:53:01 - INFO - __main__ - Step 54448: {'lr': 0.00036042777892179503, 'samples': 10454016, 'steps': 54447, 'loss/train': 1.9089937210083008} -11/07/2021 04:53:02 - INFO - __main__ - Step 54449: {'lr': 0.0003604230179122814, 'samples': 10454208, 'steps': 54448, 'loss/train': 0.8357492685317993} -11/07/2021 04:53:02 - INFO - __main__ - Step 54450: {'lr': 0.0003604182568530128, 'samples': 10454400, 'steps': 54449, 'loss/train': 1.3180925846099854} -11/07/2021 04:53:02 - INFO - __main__ - Step 54451: {'lr': 0.0003604134957439915, 'samples': 10454592, 'steps': 54450, 'loss/train': 1.654521107673645} -11/07/2021 04:53:03 - INFO - __main__ - Step 54452: {'lr': 0.00036040873458521963, 'samples': 10454784, 'steps': 54451, 'loss/train': 1.3976401090621948} -11/07/2021 04:53:04 - INFO - __main__ - Step 54453: {'lr': 0.0003604039733766992, 'samples': 10454976, 'steps': 54452, 'loss/train': 0.8282707333564758} -11/07/2021 04:53:04 - INFO - __main__ - Step 54454: {'lr': 0.00036039921211843254, 'samples': 10455168, 'steps': 54453, 'loss/train': 1.454387903213501} -11/07/2021 04:53:04 - INFO - __main__ - Step 54455: {'lr': 0.0003603944508104216, 'samples': 10455360, 'steps': 54454, 'loss/train': 1.7368769645690918} -11/07/2021 04:53:05 - INFO - __main__ - Step 54456: {'lr': 0.0003603896894526687, 'samples': 10455552, 'steps': 54455, 'loss/train': 1.3560283184051514} -11/07/2021 04:53:06 - INFO - __main__ - Step 54457: {'lr': 0.00036038492804517586, 'samples': 10455744, 'steps': 54456, 'loss/train': 1.470711588859558} -11/07/2021 04:53:06 - INFO - __main__ - Step 54458: {'lr': 0.00036038016658794525, 'samples': 10455936, 'steps': 54457, 'loss/train': 1.2212845087051392} -11/07/2021 04:53:06 - INFO - __main__ - Step 54459: {'lr': 0.0003603754050809791, 'samples': 10456128, 'steps': 54458, 'loss/train': 0.828596830368042} -11/07/2021 04:53:07 - INFO - __main__ - Step 54460: {'lr': 0.0003603706435242795, 'samples': 10456320, 'steps': 54459, 'loss/train': 1.429358959197998} -11/07/2021 04:53:07 - INFO - __main__ - Step 54461: {'lr': 0.00036036588191784856, 'samples': 10456512, 'steps': 54460, 'loss/train': 1.4888195991516113} -11/07/2021 04:53:07 - INFO - __main__ - Step 54462: {'lr': 0.0003603611202616885, 'samples': 10456704, 'steps': 54461, 'loss/train': 1.4282782077789307} -11/07/2021 04:53:09 - INFO - __main__ - Step 54463: {'lr': 0.0003603563585558014, 'samples': 10456896, 'steps': 54462, 'loss/train': 0.9998105764389038} -11/07/2021 04:53:09 - INFO - __main__ - Step 54464: {'lr': 0.00036035159680018937, 'samples': 10457088, 'steps': 54463, 'loss/train': 1.499611258506775} -11/07/2021 04:53:09 - INFO - __main__ - Step 54465: {'lr': 0.00036034683499485467, 'samples': 10457280, 'steps': 54464, 'loss/train': 1.0547444820404053} -11/07/2021 04:53:10 - INFO - __main__ - Step 54466: {'lr': 0.0003603420731397994, 'samples': 10457472, 'steps': 54465, 'loss/train': 1.8761290311813354} -11/07/2021 04:53:10 - INFO - __main__ - Step 54467: {'lr': 0.00036033731123502567, 'samples': 10457664, 'steps': 54466, 'loss/train': 0.4542864263057709} -11/07/2021 04:53:11 - INFO - __main__ - Step 54468: {'lr': 0.00036033254928053565, 'samples': 10457856, 'steps': 54467, 'loss/train': 1.2216380834579468} -11/07/2021 04:53:11 - INFO - __main__ - Step 54469: {'lr': 0.0003603277872763315, 'samples': 10458048, 'steps': 54468, 'loss/train': 1.6646921634674072} -11/07/2021 04:53:12 - INFO - __main__ - Step 54470: {'lr': 0.0003603230252224153, 'samples': 10458240, 'steps': 54469, 'loss/train': 2.8909945487976074} -11/07/2021 04:53:12 - INFO - __main__ - Step 54471: {'lr': 0.0003603182631187893, 'samples': 10458432, 'steps': 54470, 'loss/train': 1.6032060384750366} -11/07/2021 04:53:12 - INFO - __main__ - Step 54472: {'lr': 0.00036031350096545555, 'samples': 10458624, 'steps': 54471, 'loss/train': 1.352306604385376} -11/07/2021 04:53:13 - INFO - __main__ - Step 54473: {'lr': 0.0003603087387624163, 'samples': 10458816, 'steps': 54472, 'loss/train': 1.335830569267273} -11/07/2021 04:53:14 - INFO - __main__ - Step 54474: {'lr': 0.0003603039765096736, 'samples': 10459008, 'steps': 54473, 'loss/train': 0.9098039269447327} -11/07/2021 04:53:14 - INFO - __main__ - Step 54475: {'lr': 0.00036029921420722966, 'samples': 10459200, 'steps': 54474, 'loss/train': 1.742047667503357} -11/07/2021 04:53:15 - INFO - __main__ - Step 54476: {'lr': 0.0003602944518550866, 'samples': 10459392, 'steps': 54475, 'loss/train': 1.7945836782455444} -11/07/2021 04:53:15 - INFO - __main__ - Step 54477: {'lr': 0.00036028968945324647, 'samples': 10459584, 'steps': 54476, 'loss/train': 1.4792283773422241} -11/07/2021 04:53:16 - INFO - __main__ - Step 54478: {'lr': 0.00036028492700171166, 'samples': 10459776, 'steps': 54477, 'loss/train': 1.4864531755447388} -11/07/2021 04:53:16 - INFO - __main__ - Step 54479: {'lr': 0.0003602801645004841, 'samples': 10459968, 'steps': 54478, 'loss/train': 1.3378815650939941} -11/07/2021 04:53:17 - INFO - __main__ - Step 54480: {'lr': 0.00036027540194956593, 'samples': 10460160, 'steps': 54479, 'loss/train': 1.5457781553268433} -11/07/2021 04:53:17 - INFO - __main__ - Step 54481: {'lr': 0.00036027063934895935, 'samples': 10460352, 'steps': 54480, 'loss/train': 1.1741148233413696} -11/07/2021 04:53:17 - INFO - __main__ - Step 54482: {'lr': 0.0003602658766986666, 'samples': 10460544, 'steps': 54481, 'loss/train': 0.20403732359409332} -11/07/2021 04:53:18 - INFO - __main__ - Step 54483: {'lr': 0.00036026111399868973, 'samples': 10460736, 'steps': 54482, 'loss/train': 1.2347005605697632} -11/07/2021 04:53:19 - INFO - __main__ - Step 54484: {'lr': 0.00036025635124903093, 'samples': 10460928, 'steps': 54483, 'loss/train': 1.3686023950576782} -11/07/2021 04:53:19 - INFO - __main__ - Step 54485: {'lr': 0.0003602515884496923, 'samples': 10461120, 'steps': 54484, 'loss/train': 2.0651817321777344} -11/07/2021 04:53:20 - INFO - __main__ - Step 54486: {'lr': 0.00036024682560067603, 'samples': 10461312, 'steps': 54485, 'loss/train': 1.4665913581848145} -11/07/2021 04:53:20 - INFO - __main__ - Step 54487: {'lr': 0.00036024206270198416, 'samples': 10461504, 'steps': 54486, 'loss/train': 1.2947725057601929} -11/07/2021 04:53:20 - INFO - __main__ - Step 54488: {'lr': 0.00036023729975361897, 'samples': 10461696, 'steps': 54487, 'loss/train': 1.147482991218567} -11/07/2021 04:53:21 - INFO - __main__ - Step 54489: {'lr': 0.00036023253675558257, 'samples': 10461888, 'steps': 54488, 'loss/train': 1.2997239828109741} -11/07/2021 04:53:22 - INFO - __main__ - Step 54490: {'lr': 0.0003602277737078771, 'samples': 10462080, 'steps': 54489, 'loss/train': 0.9417256712913513} -11/07/2021 04:53:22 - INFO - __main__ - Step 54491: {'lr': 0.00036022301061050467, 'samples': 10462272, 'steps': 54490, 'loss/train': 1.7079122066497803} -11/07/2021 04:53:22 - INFO - __main__ - Step 54492: {'lr': 0.00036021824746346746, 'samples': 10462464, 'steps': 54491, 'loss/train': 0.9305670261383057} -11/07/2021 04:53:23 - INFO - __main__ - Step 54493: {'lr': 0.00036021348426676754, 'samples': 10462656, 'steps': 54492, 'loss/train': 1.520282506942749} -11/07/2021 04:53:24 - INFO - __main__ - Step 54494: {'lr': 0.00036020872102040727, 'samples': 10462848, 'steps': 54493, 'loss/train': 1.3972678184509277} -11/07/2021 04:53:24 - INFO - __main__ - Step 54495: {'lr': 0.00036020395772438853, 'samples': 10463040, 'steps': 54494, 'loss/train': 1.6086684465408325} -11/07/2021 04:53:24 - INFO - __main__ - Step 54496: {'lr': 0.00036019919437871355, 'samples': 10463232, 'steps': 54495, 'loss/train': 1.4100995063781738} -11/07/2021 04:53:25 - INFO - __main__ - Step 54497: {'lr': 0.0003601944309833846, 'samples': 10463424, 'steps': 54496, 'loss/train': 1.7696830034255981} -11/07/2021 04:53:25 - INFO - __main__ - Step 54498: {'lr': 0.0003601896675384037, 'samples': 10463616, 'steps': 54497, 'loss/train': 0.6956066489219666} -11/07/2021 04:53:26 - INFO - __main__ - Step 54499: {'lr': 0.0003601849040437731, 'samples': 10463808, 'steps': 54498, 'loss/train': 1.7751015424728394} -11/07/2021 04:53:26 - INFO - __main__ - Step 54500: {'lr': 0.0003601801404994949, 'samples': 10464000, 'steps': 54499, 'loss/train': 1.4549936056137085} -11/07/2021 04:53:27 - INFO - __main__ - Step 54501: {'lr': 0.0003601753769055711, 'samples': 10464192, 'steps': 54500, 'loss/train': 1.4666833877563477} -11/07/2021 04:53:27 - INFO - __main__ - Step 54502: {'lr': 0.00036017061326200405, 'samples': 10464384, 'steps': 54501, 'loss/train': 1.3497642278671265} -11/07/2021 04:53:27 - INFO - __main__ - Step 54503: {'lr': 0.0003601658495687958, 'samples': 10464576, 'steps': 54502, 'loss/train': 1.423039197921753} -11/07/2021 04:53:29 - INFO - __main__ - Step 54504: {'lr': 0.0003601610858259485, 'samples': 10464768, 'steps': 54503, 'loss/train': 1.674121618270874} -11/07/2021 04:53:30 - INFO - __main__ - Step 54505: {'lr': 0.0003601563220334644, 'samples': 10464960, 'steps': 54504, 'loss/train': 0.5751160979270935} -11/07/2021 04:53:30 - INFO - __main__ - Step 54506: {'lr': 0.0003601515581913455, 'samples': 10465152, 'steps': 54505, 'loss/train': 0.6630145907402039} -11/07/2021 04:53:31 - INFO - __main__ - Step 54507: {'lr': 0.0003601467942995941, 'samples': 10465344, 'steps': 54506, 'loss/train': 1.765760898590088} -11/07/2021 04:53:31 - INFO - __main__ - Step 54508: {'lr': 0.00036014203035821213, 'samples': 10465536, 'steps': 54507, 'loss/train': 1.625728726387024} -11/07/2021 04:53:31 - INFO - __main__ - Step 54509: {'lr': 0.0003601372663672019, 'samples': 10465728, 'steps': 54508, 'loss/train': 1.4943439960479736} -11/07/2021 04:53:32 - INFO - __main__ - Step 54510: {'lr': 0.00036013250232656553, 'samples': 10465920, 'steps': 54509, 'loss/train': 1.8026031255722046} -11/07/2021 04:53:33 - INFO - __main__ - Step 54511: {'lr': 0.0003601277382363051, 'samples': 10466112, 'steps': 54510, 'loss/train': 1.1128720045089722} -11/07/2021 04:53:33 - INFO - __main__ - Step 54512: {'lr': 0.0003601229740964229, 'samples': 10466304, 'steps': 54511, 'loss/train': 1.4502888917922974} -11/07/2021 04:53:33 - INFO - __main__ - Step 54513: {'lr': 0.000360118209906921, 'samples': 10466496, 'steps': 54512, 'loss/train': 1.446730613708496} -11/07/2021 04:53:34 - INFO - __main__ - Step 54514: {'lr': 0.0003601134456678014, 'samples': 10466688, 'steps': 54513, 'loss/train': 1.6567314863204956} -11/07/2021 04:53:35 - INFO - __main__ - Step 54515: {'lr': 0.0003601086813790665, 'samples': 10466880, 'steps': 54514, 'loss/train': 1.2719297409057617} -11/07/2021 04:53:35 - INFO - __main__ - Step 54516: {'lr': 0.00036010391704071823, 'samples': 10467072, 'steps': 54515, 'loss/train': 1.5631134510040283} -11/07/2021 04:53:35 - INFO - __main__ - Step 54517: {'lr': 0.0003600991526527589, 'samples': 10467264, 'steps': 54516, 'loss/train': 1.6666017770767212} -11/07/2021 04:53:36 - INFO - __main__ - Step 54518: {'lr': 0.00036009438821519056, 'samples': 10467456, 'steps': 54517, 'loss/train': 1.1656901836395264} -11/07/2021 04:53:36 - INFO - __main__ - Step 54519: {'lr': 0.0003600896237280154, 'samples': 10467648, 'steps': 54518, 'loss/train': 1.5136204957962036} -11/07/2021 04:53:37 - INFO - __main__ - Step 54520: {'lr': 0.0003600848591912356, 'samples': 10467840, 'steps': 54519, 'loss/train': 2.2862720489501953} -11/07/2021 04:53:38 - INFO - __main__ - Step 54521: {'lr': 0.00036008009460485323, 'samples': 10468032, 'steps': 54520, 'loss/train': 1.4150656461715698} -11/07/2021 04:53:38 - INFO - __main__ - Step 54522: {'lr': 0.00036007532996887043, 'samples': 10468224, 'steps': 54521, 'loss/train': 1.6245402097702026} -11/07/2021 04:53:38 - INFO - __main__ - Step 54523: {'lr': 0.0003600705652832894, 'samples': 10468416, 'steps': 54522, 'loss/train': 1.3718273639678955} -11/07/2021 04:53:39 - INFO - __main__ - Step 54524: {'lr': 0.00036006580054811235, 'samples': 10468608, 'steps': 54523, 'loss/train': 0.33106160163879395} -11/07/2021 04:53:39 - INFO - __main__ - Step 54525: {'lr': 0.00036006103576334124, 'samples': 10468800, 'steps': 54524, 'loss/train': 1.3807979822158813} -11/07/2021 04:53:40 - INFO - __main__ - Step 54526: {'lr': 0.00036005627092897835, 'samples': 10468992, 'steps': 54525, 'loss/train': 1.3589504957199097} -11/07/2021 04:53:40 - INFO - __main__ - Step 54527: {'lr': 0.0003600515060450259, 'samples': 10469184, 'steps': 54526, 'loss/train': 1.1738468408584595} -11/07/2021 04:53:41 - INFO - __main__ - Step 54528: {'lr': 0.0003600467411114858, 'samples': 10469376, 'steps': 54527, 'loss/train': 1.4811841249465942} -11/07/2021 04:53:41 - INFO - __main__ - Step 54529: {'lr': 0.00036004197612836045, 'samples': 10469568, 'steps': 54528, 'loss/train': 1.2551336288452148} -11/07/2021 04:53:41 - INFO - __main__ - Step 54530: {'lr': 0.0003600372110956518, 'samples': 10469760, 'steps': 54529, 'loss/train': 1.477476954460144} -11/07/2021 04:53:42 - INFO - __main__ - Step 54531: {'lr': 0.0003600324460133621, 'samples': 10469952, 'steps': 54530, 'loss/train': 5.719179630279541} -11/07/2021 04:53:43 - INFO - __main__ - Step 54532: {'lr': 0.0003600276808814935, 'samples': 10470144, 'steps': 54531, 'loss/train': 1.3719375133514404} -11/07/2021 04:53:43 - INFO - __main__ - Step 54533: {'lr': 0.00036002291570004806, 'samples': 10470336, 'steps': 54532, 'loss/train': 0.9591979384422302} -11/07/2021 04:53:44 - INFO - __main__ - Step 54534: {'lr': 0.0003600181504690281, 'samples': 10470528, 'steps': 54533, 'loss/train': 1.4933171272277832} -11/07/2021 04:53:44 - INFO - __main__ - Step 54535: {'lr': 0.00036001338518843563, 'samples': 10470720, 'steps': 54534, 'loss/train': 1.0749701261520386} -11/07/2021 04:53:45 - INFO - __main__ - Step 54536: {'lr': 0.0003600086198582728, 'samples': 10470912, 'steps': 54535, 'loss/train': 1.3410433530807495} -11/07/2021 04:53:46 - INFO - __main__ - Step 54537: {'lr': 0.00036000385447854176, 'samples': 10471104, 'steps': 54536, 'loss/train': 1.4538391828536987} -11/07/2021 04:53:46 - INFO - __main__ - Step 54538: {'lr': 0.0003599990890492447, 'samples': 10471296, 'steps': 54537, 'loss/train': 1.852305293083191} -11/07/2021 04:53:46 - INFO - __main__ - Step 54539: {'lr': 0.00035999432357038374, 'samples': 10471488, 'steps': 54538, 'loss/train': 1.7534759044647217} -11/07/2021 04:53:47 - INFO - __main__ - Step 54540: {'lr': 0.0003599895580419611, 'samples': 10471680, 'steps': 54539, 'loss/train': 1.1182537078857422} -11/07/2021 04:53:47 - INFO - __main__ - Step 54541: {'lr': 0.0003599847924639788, 'samples': 10471872, 'steps': 54540, 'loss/train': 1.510610580444336} -11/07/2021 04:53:48 - INFO - __main__ - Step 54542: {'lr': 0.00035998002683643903, 'samples': 10472064, 'steps': 54541, 'loss/train': 0.08167430013418198} -11/07/2021 04:53:48 - INFO - __main__ - Step 54543: {'lr': 0.00035997526115934405, 'samples': 10472256, 'steps': 54542, 'loss/train': 0.7035478353500366} -11/07/2021 04:53:49 - INFO - __main__ - Step 54544: {'lr': 0.00035997049543269583, 'samples': 10472448, 'steps': 54543, 'loss/train': 1.052796721458435} -11/07/2021 04:53:49 - INFO - __main__ - Step 54545: {'lr': 0.0003599657296564966, 'samples': 10472640, 'steps': 54544, 'loss/train': 1.1861445903778076} -11/07/2021 04:53:49 - INFO - __main__ - Step 54546: {'lr': 0.00035996096383074855, 'samples': 10472832, 'steps': 54545, 'loss/train': 1.3695660829544067} -11/07/2021 04:53:50 - INFO - __main__ - Step 54547: {'lr': 0.0003599561979554538, 'samples': 10473024, 'steps': 54546, 'loss/train': 1.4467450380325317} -11/07/2021 04:53:51 - INFO - __main__ - Step 54548: {'lr': 0.0003599514320306144, 'samples': 10473216, 'steps': 54547, 'loss/train': 1.014519214630127} -11/07/2021 04:53:51 - INFO - __main__ - Step 54549: {'lr': 0.0003599466660562327, 'samples': 10473408, 'steps': 54548, 'loss/train': 1.5184181928634644} -11/07/2021 04:53:51 - INFO - __main__ - Step 54550: {'lr': 0.00035994190003231063, 'samples': 10473600, 'steps': 54549, 'loss/train': 1.8656283617019653} -11/07/2021 04:53:52 - INFO - __main__ - Step 54551: {'lr': 0.0003599371339588505, 'samples': 10473792, 'steps': 54550, 'loss/train': 1.8684369325637817} -11/07/2021 04:53:53 - INFO - __main__ - Step 54552: {'lr': 0.00035993236783585437, 'samples': 10473984, 'steps': 54551, 'loss/train': 1.1571929454803467} -11/07/2021 04:53:53 - INFO - __main__ - Step 54553: {'lr': 0.00035992760166332437, 'samples': 10474176, 'steps': 54552, 'loss/train': 1.4314864873886108} -11/07/2021 04:53:53 - INFO - __main__ - Step 54554: {'lr': 0.00035992283544126276, 'samples': 10474368, 'steps': 54553, 'loss/train': 1.5210908651351929} -11/07/2021 04:53:54 - INFO - __main__ - Step 54555: {'lr': 0.00035991806916967154, 'samples': 10474560, 'steps': 54554, 'loss/train': 1.3890198469161987} -11/07/2021 04:53:54 - INFO - __main__ - Step 54556: {'lr': 0.000359913302848553, 'samples': 10474752, 'steps': 54555, 'loss/train': 1.4590320587158203} -11/07/2021 04:53:55 - INFO - __main__ - Step 54557: {'lr': 0.0003599085364779092, 'samples': 10474944, 'steps': 54556, 'loss/train': 1.2427164316177368} -11/07/2021 04:53:55 - INFO - __main__ - Step 54558: {'lr': 0.0003599037700577423, 'samples': 10475136, 'steps': 54557, 'loss/train': 0.5811551213264465} -11/07/2021 04:53:56 - INFO - __main__ - Step 54559: {'lr': 0.0003598990035880545, 'samples': 10475328, 'steps': 54558, 'loss/train': 1.1282968521118164} -11/07/2021 04:53:56 - INFO - __main__ - Step 54560: {'lr': 0.0003598942370688479, 'samples': 10475520, 'steps': 54559, 'loss/train': 1.6033250093460083} -11/07/2021 04:53:57 - INFO - __main__ - Step 54561: {'lr': 0.0003598894705001246, 'samples': 10475712, 'steps': 54560, 'loss/train': 1.3572427034378052} -11/07/2021 04:53:58 - INFO - __main__ - Step 54562: {'lr': 0.00035988470388188684, 'samples': 10475904, 'steps': 54561, 'loss/train': 1.8462798595428467} -11/07/2021 04:53:59 - INFO - __main__ - Step 54563: {'lr': 0.0003598799372141367, 'samples': 10476096, 'steps': 54562, 'loss/train': 1.3394297361373901} -11/07/2021 04:53:59 - INFO - __main__ - Step 54564: {'lr': 0.00035987517049687633, 'samples': 10476288, 'steps': 54563, 'loss/train': 1.4395896196365356} -11/07/2021 04:53:59 - INFO - __main__ - Step 54565: {'lr': 0.0003598704037301079, 'samples': 10476480, 'steps': 54564, 'loss/train': 1.1239593029022217} -11/07/2021 04:54:00 - INFO - __main__ - Step 54566: {'lr': 0.00035986563691383364, 'samples': 10476672, 'steps': 54565, 'loss/train': 1.3218730688095093} -11/07/2021 04:54:00 - INFO - __main__ - Step 54567: {'lr': 0.0003598608700480556, 'samples': 10476864, 'steps': 54566, 'loss/train': 1.663745403289795} -11/07/2021 04:54:01 - INFO - __main__ - Step 54568: {'lr': 0.00035985610313277595, 'samples': 10477056, 'steps': 54567, 'loss/train': 1.3814071416854858} -11/07/2021 04:54:01 - INFO - __main__ - Step 54569: {'lr': 0.0003598513361679968, 'samples': 10477248, 'steps': 54568, 'loss/train': 1.009146809577942} -11/07/2021 04:54:02 - INFO - __main__ - Step 54570: {'lr': 0.00035984656915372034, 'samples': 10477440, 'steps': 54569, 'loss/train': 1.7624433040618896} -11/07/2021 04:54:02 - INFO - __main__ - Step 54571: {'lr': 0.0003598418020899487, 'samples': 10477632, 'steps': 54570, 'loss/train': 0.8357031345367432} -11/07/2021 04:54:02 - INFO - __main__ - Step 54572: {'lr': 0.0003598370349766841, 'samples': 10477824, 'steps': 54571, 'loss/train': 1.2402217388153076} -11/07/2021 04:54:04 - INFO - __main__ - Step 54573: {'lr': 0.0003598322678139285, 'samples': 10478016, 'steps': 54572, 'loss/train': 1.397077202796936} -11/07/2021 04:54:04 - INFO - __main__ - Step 54574: {'lr': 0.00035982750060168436, 'samples': 10478208, 'steps': 54573, 'loss/train': 1.3012789487838745} -11/07/2021 04:54:04 - INFO - __main__ - Step 54575: {'lr': 0.0003598227333399535, 'samples': 10478400, 'steps': 54574, 'loss/train': 1.774486780166626} -11/07/2021 04:54:05 - INFO - __main__ - Step 54576: {'lr': 0.00035981796602873825, 'samples': 10478592, 'steps': 54575, 'loss/train': 1.4299341440200806} -11/07/2021 04:54:05 - INFO - __main__ - Step 54577: {'lr': 0.00035981319866804074, 'samples': 10478784, 'steps': 54576, 'loss/train': 1.7281969785690308} -11/07/2021 04:54:05 - INFO - __main__ - Step 54578: {'lr': 0.00035980843125786306, 'samples': 10478976, 'steps': 54577, 'loss/train': 1.4509475231170654} -11/07/2021 04:54:06 - INFO - __main__ - Step 54579: {'lr': 0.0003598036637982074, 'samples': 10479168, 'steps': 54578, 'loss/train': 0.8924833536148071} -11/07/2021 04:54:07 - INFO - __main__ - Step 54580: {'lr': 0.00035979889628907593, 'samples': 10479360, 'steps': 54579, 'loss/train': 1.6304229497909546} -11/07/2021 04:54:07 - INFO - __main__ - Step 54581: {'lr': 0.0003597941287304708, 'samples': 10479552, 'steps': 54580, 'loss/train': 1.5461974143981934} -11/07/2021 04:54:07 - INFO - __main__ - Step 54582: {'lr': 0.0003597893611223941, 'samples': 10479744, 'steps': 54581, 'loss/train': 1.5604580640792847} -11/07/2021 04:54:08 - INFO - __main__ - Step 54583: {'lr': 0.00035978459346484794, 'samples': 10479936, 'steps': 54582, 'loss/train': 1.3171463012695312} -11/07/2021 04:54:10 - INFO - __main__ - Step 54584: {'lr': 0.0003597798257578346, 'samples': 10480128, 'steps': 54583, 'loss/train': 1.2966458797454834} -11/07/2021 04:54:11 - INFO - __main__ - Step 54585: {'lr': 0.0003597750580013561, 'samples': 10480320, 'steps': 54584, 'loss/train': 1.376119613647461} -11/07/2021 04:54:11 - INFO - __main__ - Step 54586: {'lr': 0.0003597702901954147, 'samples': 10480512, 'steps': 54585, 'loss/train': 1.302351713180542} -11/07/2021 04:54:11 - INFO - __main__ - Step 54587: {'lr': 0.00035976552234001256, 'samples': 10480704, 'steps': 54586, 'loss/train': 1.7879868745803833} -11/07/2021 04:54:12 - INFO - __main__ - Step 54588: {'lr': 0.00035976075443515176, 'samples': 10480896, 'steps': 54587, 'loss/train': 1.8037214279174805} -11/07/2021 04:54:12 - INFO - __main__ - Step 54589: {'lr': 0.0003597559864808344, 'samples': 10481088, 'steps': 54588, 'loss/train': 1.7866116762161255} -11/07/2021 04:54:12 - INFO - __main__ - Step 54590: {'lr': 0.0003597512184770627, 'samples': 10481280, 'steps': 54589, 'loss/train': 1.7747493982315063} -11/07/2021 04:54:13 - INFO - __main__ - Step 54591: {'lr': 0.0003597464504238388, 'samples': 10481472, 'steps': 54590, 'loss/train': 1.5926944017410278} -11/07/2021 04:54:14 - INFO - __main__ - Step 54592: {'lr': 0.00035974168232116486, 'samples': 10481664, 'steps': 54591, 'loss/train': 1.5279266834259033} -11/07/2021 04:54:14 - INFO - __main__ - Step 54593: {'lr': 0.00035973691416904297, 'samples': 10481856, 'steps': 54592, 'loss/train': 1.7045717239379883} -11/07/2021 04:54:14 - INFO - __main__ - Step 54594: {'lr': 0.0003597321459674754, 'samples': 10482048, 'steps': 54593, 'loss/train': 1.2987728118896484} -11/07/2021 04:54:15 - INFO - __main__ - Step 54595: {'lr': 0.0003597273777164641, 'samples': 10482240, 'steps': 54594, 'loss/train': 1.4758131504058838} -11/07/2021 04:54:15 - INFO - __main__ - Step 54596: {'lr': 0.00035972260941601145, 'samples': 10482432, 'steps': 54595, 'loss/train': 0.771090030670166} -11/07/2021 04:54:16 - INFO - __main__ - Step 54597: {'lr': 0.0003597178410661194, 'samples': 10482624, 'steps': 54596, 'loss/train': 1.8686833381652832} -11/07/2021 04:54:17 - INFO - __main__ - Step 54598: {'lr': 0.00035971307266679023, 'samples': 10482816, 'steps': 54597, 'loss/train': 0.07533127069473267} -11/07/2021 04:54:17 - INFO - __main__ - Step 54599: {'lr': 0.000359708304218026, 'samples': 10483008, 'steps': 54598, 'loss/train': 1.3319792747497559} -11/07/2021 04:54:17 - INFO - __main__ - Step 54600: {'lr': 0.00035970353571982897, 'samples': 10483200, 'steps': 54599, 'loss/train': 1.1695317029953003} -11/07/2021 04:54:18 - INFO - __main__ - Step 54601: {'lr': 0.0003596987671722012, 'samples': 10483392, 'steps': 54600, 'loss/train': 1.0282728672027588} -11/07/2021 04:54:19 - INFO - __main__ - Step 54602: {'lr': 0.00035969399857514484, 'samples': 10483584, 'steps': 54601, 'loss/train': 1.557262659072876} -11/07/2021 04:54:19 - INFO - __main__ - Step 54603: {'lr': 0.00035968922992866205, 'samples': 10483776, 'steps': 54602, 'loss/train': 1.3373254537582397} -11/07/2021 04:54:19 - INFO - __main__ - Step 54604: {'lr': 0.00035968446123275493, 'samples': 10483968, 'steps': 54603, 'loss/train': 1.6461188793182373} -11/07/2021 04:54:20 - INFO - __main__ - Step 54605: {'lr': 0.00035967969248742576, 'samples': 10484160, 'steps': 54604, 'loss/train': 1.3914114236831665} -11/07/2021 04:54:20 - INFO - __main__ - Step 54606: {'lr': 0.00035967492369267664, 'samples': 10484352, 'steps': 54605, 'loss/train': 1.6466848850250244} -11/07/2021 04:54:21 - INFO - __main__ - Step 54607: {'lr': 0.00035967015484850964, 'samples': 10484544, 'steps': 54606, 'loss/train': 1.8524785041809082} -11/07/2021 04:54:21 - INFO - __main__ - Step 54608: {'lr': 0.000359665385954927, 'samples': 10484736, 'steps': 54607, 'loss/train': 1.4837788343429565} -11/07/2021 04:54:22 - INFO - __main__ - Step 54609: {'lr': 0.00035966061701193073, 'samples': 10484928, 'steps': 54608, 'loss/train': 1.4896328449249268} -11/07/2021 04:54:22 - INFO - __main__ - Step 54610: {'lr': 0.00035965584801952316, 'samples': 10485120, 'steps': 54609, 'loss/train': 1.3101656436920166} -11/07/2021 04:54:23 - INFO - __main__ - Step 54611: {'lr': 0.0003596510789777064, 'samples': 10485312, 'steps': 54610, 'loss/train': 1.8135974407196045} -11/07/2021 04:54:23 - INFO - __main__ - Step 54612: {'lr': 0.0003596463098864825, 'samples': 10485504, 'steps': 54611, 'loss/train': 1.3681882619857788} -11/07/2021 04:54:24 - INFO - __main__ - Step 54613: {'lr': 0.00035964154074585365, 'samples': 10485696, 'steps': 54612, 'loss/train': 1.1502083539962769} -11/07/2021 04:54:24 - INFO - __main__ - Step 54614: {'lr': 0.00035963677155582204, 'samples': 10485888, 'steps': 54613, 'loss/train': 1.2346999645233154} -11/07/2021 04:54:25 - INFO - __main__ - Step 54615: {'lr': 0.0003596320023163898, 'samples': 10486080, 'steps': 54614, 'loss/train': 2.0042223930358887} -11/07/2021 04:54:25 - INFO - __main__ - Step 54616: {'lr': 0.000359627233027559, 'samples': 10486272, 'steps': 54615, 'loss/train': 1.206191062927246} -11/07/2021 04:54:25 - INFO - __main__ - Step 54617: {'lr': 0.0003596224636893319, 'samples': 10486464, 'steps': 54616, 'loss/train': 1.0956661701202393} -11/07/2021 04:54:26 - INFO - __main__ - Step 54618: {'lr': 0.0003596176943017107, 'samples': 10486656, 'steps': 54617, 'loss/train': 1.5135501623153687} -11/07/2021 04:54:27 - INFO - __main__ - Step 54619: {'lr': 0.0003596129248646974, 'samples': 10486848, 'steps': 54618, 'loss/train': 1.3166604042053223} -11/07/2021 04:54:27 - INFO - __main__ - Step 54620: {'lr': 0.0003596081553782942, 'samples': 10487040, 'steps': 54619, 'loss/train': 0.583804190158844} -11/07/2021 04:54:28 - INFO - __main__ - Step 54621: {'lr': 0.0003596033858425032, 'samples': 10487232, 'steps': 54620, 'loss/train': 1.8584426641464233} -11/07/2021 04:54:28 - INFO - __main__ - Step 54622: {'lr': 0.00035959861625732667, 'samples': 10487424, 'steps': 54621, 'loss/train': 1.3924795389175415} -11/07/2021 04:54:29 - INFO - __main__ - Step 54623: {'lr': 0.0003595938466227667, 'samples': 10487616, 'steps': 54622, 'loss/train': 1.4461191892623901} -11/07/2021 04:54:29 - INFO - __main__ - Step 54624: {'lr': 0.0003595890769388254, 'samples': 10487808, 'steps': 54623, 'loss/train': 1.0373965501785278} -11/07/2021 04:54:30 - INFO - __main__ - Step 54625: {'lr': 0.00035958430720550494, 'samples': 10488000, 'steps': 54624, 'loss/train': 1.4201768636703491} -11/07/2021 04:54:30 - INFO - __main__ - Step 54626: {'lr': 0.00035957953742280754, 'samples': 10488192, 'steps': 54625, 'loss/train': 1.5804579257965088} -11/07/2021 04:54:30 - INFO - __main__ - Step 54627: {'lr': 0.0003595747675907352, 'samples': 10488384, 'steps': 54626, 'loss/train': 1.476851463317871} -11/07/2021 04:54:31 - INFO - __main__ - Step 54628: {'lr': 0.0003595699977092902, 'samples': 10488576, 'steps': 54627, 'loss/train': 1.5772747993469238} -11/07/2021 04:54:32 - INFO - __main__ - Step 54629: {'lr': 0.00035956522777847474, 'samples': 10488768, 'steps': 54628, 'loss/train': 1.0126844644546509} -11/07/2021 04:54:32 - INFO - __main__ - Step 54630: {'lr': 0.00035956045779829085, 'samples': 10488960, 'steps': 54629, 'loss/train': 1.3361972570419312} -11/07/2021 04:54:33 - INFO - __main__ - Step 54631: {'lr': 0.00035955568776874057, 'samples': 10489152, 'steps': 54630, 'loss/train': 1.5533382892608643} -11/07/2021 04:54:33 - INFO - __main__ - Step 54632: {'lr': 0.0003595509176898263, 'samples': 10489344, 'steps': 54631, 'loss/train': 1.1519670486450195} -11/07/2021 04:54:33 - INFO - __main__ - Step 54633: {'lr': 0.0003595461475615501, 'samples': 10489536, 'steps': 54632, 'loss/train': 1.5794849395751953} -11/07/2021 04:54:34 - INFO - __main__ - Step 54634: {'lr': 0.00035954137738391405, 'samples': 10489728, 'steps': 54633, 'loss/train': 2.0183982849121094} -11/07/2021 04:54:35 - INFO - __main__ - Step 54635: {'lr': 0.00035953660715692037, 'samples': 10489920, 'steps': 54634, 'loss/train': 1.477344274520874} -11/07/2021 04:54:35 - INFO - __main__ - Step 54636: {'lr': 0.0003595318368805711, 'samples': 10490112, 'steps': 54635, 'loss/train': 1.7437412738800049} -11/07/2021 04:54:35 - INFO - __main__ - Step 54637: {'lr': 0.00035952706655486855, 'samples': 10490304, 'steps': 54636, 'loss/train': 1.31654691696167} -11/07/2021 04:54:36 - INFO - __main__ - Step 54638: {'lr': 0.0003595222961798148, 'samples': 10490496, 'steps': 54637, 'loss/train': 1.4689444303512573} -11/07/2021 04:54:37 - INFO - __main__ - Step 54639: {'lr': 0.000359517525755412, 'samples': 10490688, 'steps': 54638, 'loss/train': 1.7984954118728638} -11/07/2021 04:54:37 - INFO - __main__ - Step 54640: {'lr': 0.0003595127552816623, 'samples': 10490880, 'steps': 54639, 'loss/train': 0.9978362321853638} -11/07/2021 04:54:37 - INFO - __main__ - Step 54641: {'lr': 0.00035950798475856783, 'samples': 10491072, 'steps': 54640, 'loss/train': 1.6896424293518066} -11/07/2021 04:54:38 - INFO - __main__ - Step 54642: {'lr': 0.0003595032141861307, 'samples': 10491264, 'steps': 54641, 'loss/train': 1.4855388402938843} -11/07/2021 04:54:38 - INFO - __main__ - Step 54643: {'lr': 0.00035949844356435314, 'samples': 10491456, 'steps': 54642, 'loss/train': 1.5688718557357788} -11/07/2021 04:54:39 - INFO - __main__ - Step 54644: {'lr': 0.00035949367289323723, 'samples': 10491648, 'steps': 54643, 'loss/train': 1.24217689037323} -11/07/2021 04:54:40 - INFO - __main__ - Step 54645: {'lr': 0.00035948890217278525, 'samples': 10491840, 'steps': 54644, 'loss/train': 1.5060263872146606} -11/07/2021 04:54:40 - INFO - __main__ - Step 54646: {'lr': 0.0003594841314029992, 'samples': 10492032, 'steps': 54645, 'loss/train': 0.8719421029090881} -11/07/2021 04:54:40 - INFO - __main__ - Step 54647: {'lr': 0.00035947936058388134, 'samples': 10492224, 'steps': 54646, 'loss/train': 1.6886515617370605} -11/07/2021 04:54:41 - INFO - __main__ - Step 54648: {'lr': 0.00035947458971543375, 'samples': 10492416, 'steps': 54647, 'loss/train': 1.4497294425964355} -11/07/2021 04:54:42 - INFO - __main__ - Step 54649: {'lr': 0.00035946981879765854, 'samples': 10492608, 'steps': 54648, 'loss/train': 1.4971867799758911} -11/07/2021 04:54:42 - INFO - __main__ - Step 54650: {'lr': 0.000359465047830558, 'samples': 10492800, 'steps': 54649, 'loss/train': 1.4914140701293945} -11/07/2021 04:54:42 - INFO - __main__ - Step 54651: {'lr': 0.0003594602768141342, 'samples': 10492992, 'steps': 54650, 'loss/train': 1.6268728971481323} -11/07/2021 04:54:43 - INFO - __main__ - Step 54652: {'lr': 0.0003594555057483892, 'samples': 10493184, 'steps': 54651, 'loss/train': 0.7136030793190002} -11/07/2021 04:54:43 - INFO - __main__ - Step 54653: {'lr': 0.0003594507346333253, 'samples': 10493376, 'steps': 54652, 'loss/train': 1.345230221748352} -11/07/2021 04:54:44 - INFO - __main__ - Step 54654: {'lr': 0.00035944596346894456, 'samples': 10493568, 'steps': 54653, 'loss/train': 1.0661356449127197} -11/07/2021 04:54:45 - INFO - __main__ - Step 54655: {'lr': 0.00035944119225524916, 'samples': 10493760, 'steps': 54654, 'loss/train': 1.279564380645752} -11/07/2021 04:54:45 - INFO - __main__ - Step 54656: {'lr': 0.00035943642099224126, 'samples': 10493952, 'steps': 54655, 'loss/train': 1.2487595081329346} -11/07/2021 04:54:45 - INFO - __main__ - Step 54657: {'lr': 0.00035943164967992304, 'samples': 10494144, 'steps': 54656, 'loss/train': 1.5451102256774902} -11/07/2021 04:54:46 - INFO - __main__ - Step 54658: {'lr': 0.00035942687831829655, 'samples': 10494336, 'steps': 54657, 'loss/train': 1.196775197982788} -11/07/2021 04:54:47 - INFO - __main__ - Step 54659: {'lr': 0.000359422106907364, 'samples': 10494528, 'steps': 54658, 'loss/train': 1.6793714761734009} -11/07/2021 04:54:47 - INFO - __main__ - Step 54660: {'lr': 0.00035941733544712755, 'samples': 10494720, 'steps': 54659, 'loss/train': 0.9637711048126221} -11/07/2021 04:54:47 - INFO - __main__ - Step 54661: {'lr': 0.0003594125639375894, 'samples': 10494912, 'steps': 54660, 'loss/train': 1.2932835817337036} -11/07/2021 04:54:48 - INFO - __main__ - Step 54662: {'lr': 0.00035940779237875154, 'samples': 10495104, 'steps': 54661, 'loss/train': 1.0968278646469116} -11/07/2021 04:54:48 - INFO - __main__ - Step 54663: {'lr': 0.00035940302077061624, 'samples': 10495296, 'steps': 54662, 'loss/train': 1.633630394935608} -11/07/2021 04:54:48 - INFO - __main__ - Step 54664: {'lr': 0.0003593982491131857, 'samples': 10495488, 'steps': 54663, 'loss/train': 1.551399827003479} -11/07/2021 04:54:49 - INFO - __main__ - Step 54665: {'lr': 0.00035939347740646186, 'samples': 10495680, 'steps': 54664, 'loss/train': 2.6731960773468018} -11/07/2021 04:54:50 - INFO - __main__ - Step 54666: {'lr': 0.00035938870565044713, 'samples': 10495872, 'steps': 54665, 'loss/train': 1.301660180091858} -11/07/2021 04:54:50 - INFO - __main__ - Step 54667: {'lr': 0.0003593839338451435, 'samples': 10496064, 'steps': 54666, 'loss/train': 1.536627173423767} -11/07/2021 04:54:50 - INFO - __main__ - Step 54668: {'lr': 0.0003593791619905532, 'samples': 10496256, 'steps': 54667, 'loss/train': 1.3612464666366577} -11/07/2021 04:54:51 - INFO - __main__ - Step 54669: {'lr': 0.00035937439008667827, 'samples': 10496448, 'steps': 54668, 'loss/train': 1.4350947141647339} -11/07/2021 04:54:52 - INFO - __main__ - Step 54670: {'lr': 0.00035936961813352094, 'samples': 10496640, 'steps': 54669, 'loss/train': 2.1642894744873047} -11/07/2021 04:54:52 - INFO - __main__ - Step 54671: {'lr': 0.0003593648461310833, 'samples': 10496832, 'steps': 54670, 'loss/train': 1.3447295427322388} -11/07/2021 04:54:53 - INFO - __main__ - Step 54672: {'lr': 0.0003593600740793676, 'samples': 10497024, 'steps': 54671, 'loss/train': 1.5652481317520142} -11/07/2021 04:54:53 - INFO - __main__ - Step 54673: {'lr': 0.00035935530197837596, 'samples': 10497216, 'steps': 54672, 'loss/train': 1.2834434509277344} -11/07/2021 04:54:53 - INFO - __main__ - Step 54674: {'lr': 0.00035935052982811046, 'samples': 10497408, 'steps': 54673, 'loss/train': 1.7741061449050903} -11/07/2021 04:54:54 - INFO - __main__ - Step 54675: {'lr': 0.00035934575762857333, 'samples': 10497600, 'steps': 54674, 'loss/train': 1.2563782930374146} -11/07/2021 04:54:55 - INFO - __main__ - Step 54676: {'lr': 0.00035934098537976675, 'samples': 10497792, 'steps': 54675, 'loss/train': 1.5968042612075806} -11/07/2021 04:54:55 - INFO - __main__ - Step 54677: {'lr': 0.00035933621308169273, 'samples': 10497984, 'steps': 54676, 'loss/train': 1.2757591009140015} -11/07/2021 04:54:55 - INFO - __main__ - Step 54678: {'lr': 0.0003593314407343535, 'samples': 10498176, 'steps': 54677, 'loss/train': 1.7727009057998657} -11/07/2021 04:54:56 - INFO - __main__ - Step 54679: {'lr': 0.00035932666833775117, 'samples': 10498368, 'steps': 54678, 'loss/train': 1.224920630455017} -11/07/2021 04:54:57 - INFO - __main__ - Step 54680: {'lr': 0.00035932189589188803, 'samples': 10498560, 'steps': 54679, 'loss/train': 2.0108485221862793} -11/07/2021 04:54:57 - INFO - __main__ - Step 54681: {'lr': 0.00035931712339676617, 'samples': 10498752, 'steps': 54680, 'loss/train': 1.2102726697921753} -11/07/2021 04:54:57 - INFO - __main__ - Step 54682: {'lr': 0.00035931235085238754, 'samples': 10498944, 'steps': 54681, 'loss/train': 1.6900962591171265} -11/07/2021 04:54:58 - INFO - __main__ - Step 54683: {'lr': 0.0003593075782587545, 'samples': 10499136, 'steps': 54682, 'loss/train': 1.5737942457199097} -11/07/2021 04:54:58 - INFO - __main__ - Step 54684: {'lr': 0.0003593028056158692, 'samples': 10499328, 'steps': 54683, 'loss/train': 1.7900334596633911} -11/07/2021 04:54:58 - INFO - __main__ - Step 54685: {'lr': 0.0003592980329237337, 'samples': 10499520, 'steps': 54684, 'loss/train': 1.5666292905807495} -11/07/2021 04:54:59 - INFO - __main__ - Step 54686: {'lr': 0.0003592932601823502, 'samples': 10499712, 'steps': 54685, 'loss/train': 1.1327369213104248} -11/07/2021 04:55:00 - INFO - __main__ - Step 54687: {'lr': 0.0003592884873917209, 'samples': 10499904, 'steps': 54686, 'loss/train': 1.9120479822158813} -11/07/2021 04:55:00 - INFO - __main__ - Step 54688: {'lr': 0.0003592837145518479, 'samples': 10500096, 'steps': 54687, 'loss/train': 1.423751950263977} -11/07/2021 04:55:01 - INFO - __main__ - Step 54689: {'lr': 0.00035927894166273323, 'samples': 10500288, 'steps': 54688, 'loss/train': 0.8661104440689087} -11/07/2021 04:55:01 - INFO - __main__ - Step 54690: {'lr': 0.0003592741687243792, 'samples': 10500480, 'steps': 54689, 'loss/train': 1.3181918859481812} -11/07/2021 04:55:02 - INFO - __main__ - Step 54691: {'lr': 0.00035926939573678796, 'samples': 10500672, 'steps': 54690, 'loss/train': 0.8958945870399475} -11/07/2021 04:55:02 - INFO - __main__ - Step 54692: {'lr': 0.0003592646226999616, 'samples': 10500864, 'steps': 54691, 'loss/train': 1.375899076461792} -11/07/2021 04:55:02 - INFO - __main__ - Step 54693: {'lr': 0.0003592598496139023, 'samples': 10501056, 'steps': 54692, 'loss/train': 1.7506818771362305} -11/07/2021 04:55:03 - INFO - __main__ - Step 54694: {'lr': 0.0003592550764786122, 'samples': 10501248, 'steps': 54693, 'loss/train': 1.0960344076156616} -11/07/2021 04:55:03 - INFO - __main__ - Step 54695: {'lr': 0.00035925030329409343, 'samples': 10501440, 'steps': 54694, 'loss/train': 1.2517138719558716} -11/07/2021 04:55:04 - INFO - __main__ - Step 54696: {'lr': 0.0003592455300603481, 'samples': 10501632, 'steps': 54695, 'loss/train': 1.1153273582458496} -11/07/2021 04:55:05 - INFO - __main__ - Step 54697: {'lr': 0.0003592407567773785, 'samples': 10501824, 'steps': 54696, 'loss/train': 1.6166651248931885} -11/07/2021 04:55:05 - INFO - __main__ - Step 54698: {'lr': 0.0003592359834451866, 'samples': 10502016, 'steps': 54697, 'loss/train': 1.2193481922149658} -11/07/2021 04:55:05 - INFO - __main__ - Step 54699: {'lr': 0.0003592312100637748, 'samples': 10502208, 'steps': 54698, 'loss/train': 1.7973885536193848} -11/07/2021 04:55:06 - INFO - __main__ - Step 54700: {'lr': 0.00035922643663314504, 'samples': 10502400, 'steps': 54699, 'loss/train': 1.788243293762207} -11/07/2021 04:55:07 - INFO - __main__ - Step 54701: {'lr': 0.00035922166315329954, 'samples': 10502592, 'steps': 54700, 'loss/train': 1.3844908475875854} -11/07/2021 04:55:07 - INFO - __main__ - Step 54702: {'lr': 0.0003592168896242404, 'samples': 10502784, 'steps': 54701, 'loss/train': 1.2753205299377441} -11/07/2021 04:55:07 - INFO - __main__ - Step 54703: {'lr': 0.00035921211604596985, 'samples': 10502976, 'steps': 54702, 'loss/train': 1.247143030166626} -11/07/2021 04:55:08 - INFO - __main__ - Step 54704: {'lr': 0.00035920734241849, 'samples': 10503168, 'steps': 54703, 'loss/train': 1.7621675729751587} -11/07/2021 04:55:08 - INFO - __main__ - Step 54705: {'lr': 0.00035920256874180304, 'samples': 10503360, 'steps': 54704, 'loss/train': 1.524994134902954} -11/07/2021 04:55:09 - INFO - __main__ - Step 54706: {'lr': 0.00035919779501591097, 'samples': 10503552, 'steps': 54705, 'loss/train': 1.1982957124710083} -11/07/2021 04:55:09 - INFO - __main__ - Step 54707: {'lr': 0.00035919302124081613, 'samples': 10503744, 'steps': 54706, 'loss/train': 1.6131422519683838} -11/07/2021 04:55:10 - INFO - __main__ - Step 54708: {'lr': 0.0003591882474165207, 'samples': 10503936, 'steps': 54707, 'loss/train': 1.636912226676941} -11/07/2021 04:55:10 - INFO - __main__ - Step 54709: {'lr': 0.00035918347354302663, 'samples': 10504128, 'steps': 54708, 'loss/train': 1.732164740562439} -11/07/2021 04:55:10 - INFO - __main__ - Step 54710: {'lr': 0.00035917869962033615, 'samples': 10504320, 'steps': 54709, 'loss/train': 1.8825229406356812} -11/07/2021 04:55:11 - INFO - __main__ - Step 54711: {'lr': 0.00035917392564845146, 'samples': 10504512, 'steps': 54710, 'loss/train': 1.311721920967102} -11/07/2021 04:55:12 - INFO - __main__ - Step 54712: {'lr': 0.00035916915162737467, 'samples': 10504704, 'steps': 54711, 'loss/train': 1.5228288173675537} -11/07/2021 04:55:12 - INFO - __main__ - Step 54713: {'lr': 0.00035916437755710795, 'samples': 10504896, 'steps': 54712, 'loss/train': 1.5763819217681885} -11/07/2021 04:55:13 - INFO - __main__ - Step 54714: {'lr': 0.0003591596034376535, 'samples': 10505088, 'steps': 54713, 'loss/train': 1.1772390604019165} -11/07/2021 04:55:13 - INFO - __main__ - Step 54715: {'lr': 0.0003591548292690134, 'samples': 10505280, 'steps': 54714, 'loss/train': 1.0528409481048584} -11/07/2021 04:55:15 - INFO - __main__ - Step 54716: {'lr': 0.0003591500550511898, 'samples': 10505472, 'steps': 54715, 'loss/train': 1.5328580141067505} -11/07/2021 04:55:15 - INFO - __main__ - Step 54717: {'lr': 0.00035914528078418486, 'samples': 10505664, 'steps': 54716, 'loss/train': 1.5203498601913452} -11/07/2021 04:55:15 - INFO - __main__ - Step 54718: {'lr': 0.0003591405064680007, 'samples': 10505856, 'steps': 54717, 'loss/train': 1.7637076377868652} -11/07/2021 04:55:16 - INFO - __main__ - Step 54719: {'lr': 0.0003591357321026396, 'samples': 10506048, 'steps': 54718, 'loss/train': 1.7425967454910278} -11/07/2021 04:55:16 - INFO - __main__ - Step 54720: {'lr': 0.00035913095768810356, 'samples': 10506240, 'steps': 54719, 'loss/train': 1.5587249994277954} -11/07/2021 04:55:17 - INFO - __main__ - Step 54721: {'lr': 0.00035912618322439483, 'samples': 10506432, 'steps': 54720, 'loss/train': 1.2138665914535522} -11/07/2021 04:55:17 - INFO - __main__ - Step 54722: {'lr': 0.00035912140871151554, 'samples': 10506624, 'steps': 54721, 'loss/train': 0.9029083847999573} -11/07/2021 04:55:17 - INFO - __main__ - Step 54723: {'lr': 0.0003591166341494678, 'samples': 10506816, 'steps': 54722, 'loss/train': 1.1368441581726074} -11/07/2021 04:55:18 - INFO - __main__ - Step 54724: {'lr': 0.00035911185953825373, 'samples': 10507008, 'steps': 54723, 'loss/train': 2.8409199714660645} -11/07/2021 04:55:19 - INFO - __main__ - Step 54725: {'lr': 0.0003591070848778756, 'samples': 10507200, 'steps': 54724, 'loss/train': 1.2468154430389404} -11/07/2021 04:55:19 - INFO - __main__ - Step 54726: {'lr': 0.0003591023101683355, 'samples': 10507392, 'steps': 54725, 'loss/train': 1.3183799982070923} -11/07/2021 04:55:19 - INFO - __main__ - Step 54727: {'lr': 0.0003590975354096356, 'samples': 10507584, 'steps': 54726, 'loss/train': 1.333478331565857} -11/07/2021 04:55:20 - INFO - __main__ - Step 54728: {'lr': 0.000359092760601778, 'samples': 10507776, 'steps': 54727, 'loss/train': 0.8363317251205444} -11/07/2021 04:55:21 - INFO - __main__ - Step 54729: {'lr': 0.0003590879857447649, 'samples': 10507968, 'steps': 54728, 'loss/train': 1.8350917100906372} -11/07/2021 04:55:21 - INFO - __main__ - Step 54730: {'lr': 0.0003590832108385985, 'samples': 10508160, 'steps': 54729, 'loss/train': 1.5275685787200928} -11/07/2021 04:55:22 - INFO - __main__ - Step 54731: {'lr': 0.0003590784358832808, 'samples': 10508352, 'steps': 54730, 'loss/train': 1.3093987703323364} -11/07/2021 04:55:22 - INFO - __main__ - Step 54732: {'lr': 0.00035907366087881403, 'samples': 10508544, 'steps': 54731, 'loss/train': 1.8257447481155396} -11/07/2021 04:55:22 - INFO - __main__ - Step 54733: {'lr': 0.00035906888582520034, 'samples': 10508736, 'steps': 54732, 'loss/train': 2.0174505710601807} -11/07/2021 04:55:23 - INFO - __main__ - Step 54734: {'lr': 0.000359064110722442, 'samples': 10508928, 'steps': 54733, 'loss/train': 1.5022810697555542} -11/07/2021 04:55:24 - INFO - __main__ - Step 54735: {'lr': 0.00035905933557054103, 'samples': 10509120, 'steps': 54734, 'loss/train': 1.521554708480835} -11/07/2021 04:55:24 - INFO - __main__ - Step 54736: {'lr': 0.0003590545603694996, 'samples': 10509312, 'steps': 54735, 'loss/train': 0.6441707015037537} -11/07/2021 04:55:24 - INFO - __main__ - Step 54737: {'lr': 0.0003590497851193198, 'samples': 10509504, 'steps': 54736, 'loss/train': 1.5682966709136963} -11/07/2021 04:55:25 - INFO - __main__ - Step 54738: {'lr': 0.00035904500982000386, 'samples': 10509696, 'steps': 54737, 'loss/train': 1.404206395149231} -11/07/2021 04:55:25 - INFO - __main__ - Step 54739: {'lr': 0.0003590402344715539, 'samples': 10509888, 'steps': 54738, 'loss/train': 1.6242003440856934} -11/07/2021 04:55:26 - INFO - __main__ - Step 54740: {'lr': 0.00035903545907397215, 'samples': 10510080, 'steps': 54739, 'loss/train': 1.3122817277908325} -11/07/2021 04:55:26 - INFO - __main__ - Step 54741: {'lr': 0.0003590306836272608, 'samples': 10510272, 'steps': 54740, 'loss/train': 1.3039827346801758} -11/07/2021 04:55:27 - INFO - __main__ - Step 54742: {'lr': 0.0003590259081314218, 'samples': 10510464, 'steps': 54741, 'loss/train': 1.6676901578903198} -11/07/2021 04:55:27 - INFO - __main__ - Step 54743: {'lr': 0.00035902113258645733, 'samples': 10510656, 'steps': 54742, 'loss/train': 1.427638292312622} -11/07/2021 04:55:27 - INFO - __main__ - Step 54744: {'lr': 0.0003590163569923697, 'samples': 10510848, 'steps': 54743, 'loss/train': 1.2986115217208862} -11/07/2021 04:55:28 - INFO - __main__ - Step 54745: {'lr': 0.000359011581349161, 'samples': 10511040, 'steps': 54744, 'loss/train': 1.6545664072036743} -11/07/2021 04:55:29 - INFO - __main__ - Step 54746: {'lr': 0.00035900680565683333, 'samples': 10511232, 'steps': 54745, 'loss/train': 1.1662455797195435} -11/07/2021 04:55:29 - INFO - __main__ - Step 54747: {'lr': 0.00035900202991538894, 'samples': 10511424, 'steps': 54746, 'loss/train': 1.3269716501235962} -11/07/2021 04:55:29 - INFO - __main__ - Step 54748: {'lr': 0.00035899725412482985, 'samples': 10511616, 'steps': 54747, 'loss/train': 1.8401679992675781} -11/07/2021 04:55:30 - INFO - __main__ - Step 54749: {'lr': 0.00035899247828515837, 'samples': 10511808, 'steps': 54748, 'loss/train': 1.302247166633606} -11/07/2021 04:55:31 - INFO - __main__ - Step 54750: {'lr': 0.0003589877023963765, 'samples': 10512000, 'steps': 54749, 'loss/train': 1.7354470491409302} -11/07/2021 04:55:31 - INFO - __main__ - Step 54751: {'lr': 0.0003589829264584864, 'samples': 10512192, 'steps': 54750, 'loss/train': 1.776680827140808} -11/07/2021 04:55:31 - INFO - __main__ - Step 54752: {'lr': 0.00035897815047149033, 'samples': 10512384, 'steps': 54751, 'loss/train': 1.0573840141296387} -11/07/2021 04:55:32 - INFO - __main__ - Step 54753: {'lr': 0.00035897337443539036, 'samples': 10512576, 'steps': 54752, 'loss/train': 0.4910214841365814} -11/07/2021 04:55:32 - INFO - __main__ - Step 54754: {'lr': 0.0003589685983501887, 'samples': 10512768, 'steps': 54753, 'loss/train': 1.791231632232666} -11/07/2021 04:55:33 - INFO - __main__ - Step 54755: {'lr': 0.0003589638222158874, 'samples': 10512960, 'steps': 54754, 'loss/train': 1.1934956312179565} -11/07/2021 04:55:34 - INFO - __main__ - Step 54756: {'lr': 0.00035895904603248875, 'samples': 10513152, 'steps': 54755, 'loss/train': 1.5078513622283936} -11/07/2021 04:55:34 - INFO - __main__ - Step 54757: {'lr': 0.0003589542697999948, 'samples': 10513344, 'steps': 54756, 'loss/train': 1.753839135169983} -11/07/2021 04:55:34 - INFO - __main__ - Step 54758: {'lr': 0.00035894949351840784, 'samples': 10513536, 'steps': 54757, 'loss/train': 1.292758822441101} -11/07/2021 04:55:35 - INFO - __main__ - Step 54759: {'lr': 0.0003589447171877298, 'samples': 10513728, 'steps': 54758, 'loss/train': 1.2573915719985962} -11/07/2021 04:55:36 - INFO - __main__ - Step 54760: {'lr': 0.000358939940807963, 'samples': 10513920, 'steps': 54759, 'loss/train': 1.3286813497543335} -11/07/2021 04:55:36 - INFO - __main__ - Step 54761: {'lr': 0.00035893516437910956, 'samples': 10514112, 'steps': 54760, 'loss/train': 1.1425011157989502} -11/07/2021 04:55:37 - INFO - __main__ - Step 54762: {'lr': 0.00035893038790117156, 'samples': 10514304, 'steps': 54761, 'loss/train': 1.787023901939392} -11/07/2021 04:55:37 - INFO - __main__ - Step 54763: {'lr': 0.0003589256113741513, 'samples': 10514496, 'steps': 54762, 'loss/train': 1.1434789896011353} -11/07/2021 04:55:37 - INFO - __main__ - Step 54764: {'lr': 0.00035892083479805077, 'samples': 10514688, 'steps': 54763, 'loss/train': 1.3133426904678345} -11/07/2021 04:55:38 - INFO - __main__ - Step 54765: {'lr': 0.0003589160581728722, 'samples': 10514880, 'steps': 54764, 'loss/train': 1.6563326120376587} -11/07/2021 04:55:39 - INFO - __main__ - Step 54766: {'lr': 0.0003589112814986177, 'samples': 10515072, 'steps': 54765, 'loss/train': 0.22022061049938202} -11/07/2021 04:55:40 - INFO - __main__ - Step 54767: {'lr': 0.00035890650477528953, 'samples': 10515264, 'steps': 54766, 'loss/train': 1.168055534362793} -11/07/2021 04:55:40 - INFO - __main__ - Step 54768: {'lr': 0.00035890172800288965, 'samples': 10515456, 'steps': 54767, 'loss/train': 1.6907206773757935} -11/07/2021 04:55:40 - INFO - __main__ - Step 54769: {'lr': 0.0003588969511814205, 'samples': 10515648, 'steps': 54768, 'loss/train': 1.3247848749160767} -11/07/2021 04:55:41 - INFO - __main__ - Step 54770: {'lr': 0.00035889217431088396, 'samples': 10515840, 'steps': 54769, 'loss/train': 1.4610716104507446} -11/07/2021 04:55:41 - INFO - __main__ - Step 54771: {'lr': 0.00035888739739128227, 'samples': 10516032, 'steps': 54770, 'loss/train': 1.753288984298706} -11/07/2021 04:55:42 - INFO - __main__ - Step 54772: {'lr': 0.00035888262042261767, 'samples': 10516224, 'steps': 54771, 'loss/train': 1.5406216382980347} -11/07/2021 04:55:42 - INFO - __main__ - Step 54773: {'lr': 0.0003588778434048922, 'samples': 10516416, 'steps': 54772, 'loss/train': 1.367986798286438} -11/07/2021 04:55:43 - INFO - __main__ - Step 54774: {'lr': 0.0003588730663381081, 'samples': 10516608, 'steps': 54773, 'loss/train': 1.1686124801635742} -11/07/2021 04:55:43 - INFO - __main__ - Step 54775: {'lr': 0.00035886828922226737, 'samples': 10516800, 'steps': 54774, 'loss/train': 1.2851676940917969} -11/07/2021 04:55:44 - INFO - __main__ - Step 54776: {'lr': 0.00035886351205737237, 'samples': 10516992, 'steps': 54775, 'loss/train': 1.709902286529541} -11/07/2021 04:55:45 - INFO - __main__ - Step 54777: {'lr': 0.00035885873484342514, 'samples': 10517184, 'steps': 54776, 'loss/train': 0.9926208853721619} -11/07/2021 04:55:45 - INFO - __main__ - Step 54778: {'lr': 0.00035885395758042784, 'samples': 10517376, 'steps': 54777, 'loss/train': 1.3379695415496826} -11/07/2021 04:55:45 - INFO - __main__ - Step 54779: {'lr': 0.0003588491802683826, 'samples': 10517568, 'steps': 54778, 'loss/train': 1.153033971786499} -11/07/2021 04:55:46 - INFO - __main__ - Step 54780: {'lr': 0.0003588444029072916, 'samples': 10517760, 'steps': 54779, 'loss/train': 2.080644130706787} -11/07/2021 04:55:46 - INFO - __main__ - Step 54781: {'lr': 0.000358839625497157, 'samples': 10517952, 'steps': 54780, 'loss/train': 1.499314546585083} -11/07/2021 04:55:47 - INFO - __main__ - Step 54782: {'lr': 0.0003588348480379809, 'samples': 10518144, 'steps': 54781, 'loss/train': 1.6469850540161133} -11/07/2021 04:55:48 - INFO - __main__ - Step 54783: {'lr': 0.0003588300705297656, 'samples': 10518336, 'steps': 54782, 'loss/train': 1.3472864627838135} -11/07/2021 04:55:48 - INFO - __main__ - Step 54784: {'lr': 0.0003588252929725131, 'samples': 10518528, 'steps': 54783, 'loss/train': 1.4015719890594482} -11/07/2021 04:55:48 - INFO - __main__ - Step 54785: {'lr': 0.0003588205153662256, 'samples': 10518720, 'steps': 54784, 'loss/train': 1.296350359916687} -11/07/2021 04:55:49 - INFO - __main__ - Step 54786: {'lr': 0.0003588157377109052, 'samples': 10518912, 'steps': 54785, 'loss/train': 1.4564239978790283} -11/07/2021 04:55:49 - INFO - __main__ - Step 54787: {'lr': 0.0003588109600065541, 'samples': 10519104, 'steps': 54786, 'loss/train': 1.848463535308838} -11/07/2021 04:55:50 - INFO - __main__ - Step 54788: {'lr': 0.0003588061822531745, 'samples': 10519296, 'steps': 54787, 'loss/train': 1.4672874212265015} -11/07/2021 04:55:50 - INFO - __main__ - Step 54789: {'lr': 0.00035880140445076857, 'samples': 10519488, 'steps': 54788, 'loss/train': 1.2948073148727417} -11/07/2021 04:55:51 - INFO - __main__ - Step 54790: {'lr': 0.0003587966265993384, 'samples': 10519680, 'steps': 54789, 'loss/train': 1.4138782024383545} -11/07/2021 04:55:51 - INFO - __main__ - Step 54791: {'lr': 0.0003587918486988861, 'samples': 10519872, 'steps': 54790, 'loss/train': 1.0976370573043823} -11/07/2021 04:55:51 - INFO - __main__ - Step 54792: {'lr': 0.0003587870707494139, 'samples': 10520064, 'steps': 54791, 'loss/train': 1.3246370553970337} -11/07/2021 04:55:52 - INFO - __main__ - Step 54793: {'lr': 0.0003587822927509239, 'samples': 10520256, 'steps': 54792, 'loss/train': 1.5439074039459229} -11/07/2021 04:55:53 - INFO - __main__ - Step 54794: {'lr': 0.00035877751470341824, 'samples': 10520448, 'steps': 54793, 'loss/train': 1.418664813041687} -11/07/2021 04:55:53 - INFO - __main__ - Step 54795: {'lr': 0.00035877273660689916, 'samples': 10520640, 'steps': 54794, 'loss/train': 1.3769599199295044} -11/07/2021 04:55:53 - INFO - __main__ - Step 54796: {'lr': 0.0003587679584613688, 'samples': 10520832, 'steps': 54795, 'loss/train': 1.7042253017425537} -11/07/2021 04:55:54 - INFO - __main__ - Step 54797: {'lr': 0.00035876318026682925, 'samples': 10521024, 'steps': 54796, 'loss/train': 1.5919417142868042} -11/07/2021 04:55:55 - INFO - __main__ - Step 54798: {'lr': 0.0003587584020232827, 'samples': 10521216, 'steps': 54797, 'loss/train': 1.1344317197799683} -11/07/2021 04:55:55 - INFO - __main__ - Step 54799: {'lr': 0.00035875362373073125, 'samples': 10521408, 'steps': 54798, 'loss/train': 1.5724691152572632} -11/07/2021 04:55:56 - INFO - __main__ - Step 54800: {'lr': 0.00035874884538917705, 'samples': 10521600, 'steps': 54799, 'loss/train': 1.3933013677597046} -11/07/2021 04:55:56 - INFO - __main__ - Step 54801: {'lr': 0.0003587440669986224, 'samples': 10521792, 'steps': 54800, 'loss/train': 1.2266603708267212} -11/07/2021 04:55:56 - INFO - __main__ - Step 54802: {'lr': 0.00035873928855906933, 'samples': 10521984, 'steps': 54801, 'loss/train': 1.2729222774505615} -11/07/2021 04:55:58 - INFO - __main__ - Step 54803: {'lr': 0.00035873451007052, 'samples': 10522176, 'steps': 54802, 'loss/train': 1.3956317901611328} -11/07/2021 04:55:58 - INFO - __main__ - Step 54804: {'lr': 0.00035872973153297657, 'samples': 10522368, 'steps': 54803, 'loss/train': 1.8258665800094604} -11/07/2021 04:55:58 - INFO - __main__ - Step 54805: {'lr': 0.0003587249529464412, 'samples': 10522560, 'steps': 54804, 'loss/train': 1.849915623664856} -11/07/2021 04:55:59 - INFO - __main__ - Step 54806: {'lr': 0.00035872017431091605, 'samples': 10522752, 'steps': 54805, 'loss/train': 1.55470609664917} -11/07/2021 04:55:59 - INFO - __main__ - Step 54807: {'lr': 0.0003587153956264033, 'samples': 10522944, 'steps': 54806, 'loss/train': 1.1715747117996216} -11/07/2021 04:56:00 - INFO - __main__ - Step 54808: {'lr': 0.00035871061689290496, 'samples': 10523136, 'steps': 54807, 'loss/train': 2.1414685249328613} -11/07/2021 04:56:00 - INFO - __main__ - Step 54809: {'lr': 0.00035870583811042347, 'samples': 10523328, 'steps': 54808, 'loss/train': 1.671202301979065} -11/07/2021 04:56:01 - INFO - __main__ - Step 54810: {'lr': 0.0003587010592789607, 'samples': 10523520, 'steps': 54809, 'loss/train': 1.3291504383087158} -11/07/2021 04:56:01 - INFO - __main__ - Step 54811: {'lr': 0.0003586962803985189, 'samples': 10523712, 'steps': 54810, 'loss/train': 1.4139256477355957} -11/07/2021 04:56:01 - INFO - __main__ - Step 54812: {'lr': 0.00035869150146910025, 'samples': 10523904, 'steps': 54811, 'loss/train': 1.8183473348617554} -11/07/2021 04:56:02 - INFO - __main__ - Step 54813: {'lr': 0.00035868672249070684, 'samples': 10524096, 'steps': 54812, 'loss/train': 1.4273749589920044} -11/07/2021 04:56:03 - INFO - __main__ - Step 54814: {'lr': 0.00035868194346334094, 'samples': 10524288, 'steps': 54813, 'loss/train': 1.55579674243927} -11/07/2021 04:56:03 - INFO - __main__ - Step 54815: {'lr': 0.0003586771643870046, 'samples': 10524480, 'steps': 54814, 'loss/train': 1.4467002153396606} -11/07/2021 04:56:03 - INFO - __main__ - Step 54816: {'lr': 0.0003586723852617, 'samples': 10524672, 'steps': 54815, 'loss/train': 1.8852932453155518} -11/07/2021 04:56:04 - INFO - __main__ - Step 54817: {'lr': 0.00035866760608742934, 'samples': 10524864, 'steps': 54816, 'loss/train': 1.3477979898452759} -11/07/2021 04:56:04 - INFO - __main__ - Step 54818: {'lr': 0.0003586628268641947, 'samples': 10525056, 'steps': 54817, 'loss/train': 2.309300661087036} -11/07/2021 04:56:05 - INFO - __main__ - Step 54819: {'lr': 0.00035865804759199825, 'samples': 10525248, 'steps': 54818, 'loss/train': 1.7186243534088135} -11/07/2021 04:56:06 - INFO - __main__ - Step 54820: {'lr': 0.00035865326827084224, 'samples': 10525440, 'steps': 54819, 'loss/train': 1.4784338474273682} -11/07/2021 04:56:06 - INFO - __main__ - Step 54821: {'lr': 0.00035864848890072864, 'samples': 10525632, 'steps': 54820, 'loss/train': 0.2255532443523407} -11/07/2021 04:56:06 - INFO - __main__ - Step 54822: {'lr': 0.0003586437094816598, 'samples': 10525824, 'steps': 54821, 'loss/train': 1.672151803970337} -11/07/2021 04:56:07 - INFO - __main__ - Step 54823: {'lr': 0.00035863893001363776, 'samples': 10526016, 'steps': 54822, 'loss/train': 1.2856768369674683} -11/07/2021 04:56:08 - INFO - __main__ - Step 54824: {'lr': 0.0003586341504966647, 'samples': 10526208, 'steps': 54823, 'loss/train': 1.5706262588500977} -11/07/2021 04:56:08 - INFO - __main__ - Step 54825: {'lr': 0.00035862937093074273, 'samples': 10526400, 'steps': 54824, 'loss/train': 1.5209360122680664} -11/07/2021 04:56:08 - INFO - __main__ - Step 54826: {'lr': 0.000358624591315874, 'samples': 10526592, 'steps': 54825, 'loss/train': 1.3436338901519775} -11/07/2021 04:56:09 - INFO - __main__ - Step 54827: {'lr': 0.0003586198116520608, 'samples': 10526784, 'steps': 54826, 'loss/train': 1.5253491401672363} -11/07/2021 04:56:09 - INFO - __main__ - Step 54828: {'lr': 0.0003586150319393051, 'samples': 10526976, 'steps': 54827, 'loss/train': 1.2950458526611328} -11/07/2021 04:56:10 - INFO - __main__ - Step 54829: {'lr': 0.00035861025217760924, 'samples': 10527168, 'steps': 54828, 'loss/train': 1.3377083539962769} -11/07/2021 04:56:10 - INFO - __main__ - Step 54830: {'lr': 0.00035860547236697525, 'samples': 10527360, 'steps': 54829, 'loss/train': 1.8295022249221802} -11/07/2021 04:56:11 - INFO - __main__ - Step 54831: {'lr': 0.0003586006925074053, 'samples': 10527552, 'steps': 54830, 'loss/train': 1.5570582151412964} -11/07/2021 04:56:11 - INFO - __main__ - Step 54832: {'lr': 0.0003585959125989015, 'samples': 10527744, 'steps': 54831, 'loss/train': 1.6938668489456177} -11/07/2021 04:56:11 - INFO - __main__ - Step 54833: {'lr': 0.00035859113264146607, 'samples': 10527936, 'steps': 54832, 'loss/train': 1.421567440032959} -11/07/2021 04:56:12 - INFO - __main__ - Step 54834: {'lr': 0.00035858635263510117, 'samples': 10528128, 'steps': 54833, 'loss/train': 1.3689855337142944} -11/07/2021 04:56:13 - INFO - __main__ - Step 54835: {'lr': 0.00035858157257980894, 'samples': 10528320, 'steps': 54834, 'loss/train': 1.3991369009017944} -11/07/2021 04:56:13 - INFO - __main__ - Step 54836: {'lr': 0.0003585767924755916, 'samples': 10528512, 'steps': 54835, 'loss/train': 1.5207114219665527} -11/07/2021 04:56:13 - INFO - __main__ - Step 54837: {'lr': 0.0003585720123224512, 'samples': 10528704, 'steps': 54836, 'loss/train': 1.5550506114959717} -11/07/2021 04:56:14 - INFO - __main__ - Step 54838: {'lr': 0.00035856723212038987, 'samples': 10528896, 'steps': 54837, 'loss/train': 1.6766122579574585} -11/07/2021 04:56:16 - INFO - __main__ - Step 54839: {'lr': 0.0003585624518694098, 'samples': 10529088, 'steps': 54838, 'loss/train': 1.085741639137268} -11/07/2021 04:56:16 - INFO - __main__ - Step 54840: {'lr': 0.00035855767156951323, 'samples': 10529280, 'steps': 54839, 'loss/train': 1.7896482944488525} -11/07/2021 04:56:16 - INFO - __main__ - Step 54841: {'lr': 0.0003585528912207022, 'samples': 10529472, 'steps': 54840, 'loss/train': 1.8680771589279175} -11/07/2021 04:56:17 - INFO - __main__ - Step 54842: {'lr': 0.0003585481108229789, 'samples': 10529664, 'steps': 54841, 'loss/train': 1.7494255304336548} -11/07/2021 04:56:17 - INFO - __main__ - Step 54843: {'lr': 0.0003585433303763456, 'samples': 10529856, 'steps': 54842, 'loss/train': 1.7449979782104492} -11/07/2021 04:56:17 - INFO - __main__ - Step 54844: {'lr': 0.0003585385498808043, 'samples': 10530048, 'steps': 54843, 'loss/train': 1.756689190864563} -11/07/2021 04:56:18 - INFO - __main__ - Step 54845: {'lr': 0.00035853376933635717, 'samples': 10530240, 'steps': 54844, 'loss/train': 1.3483474254608154} -11/07/2021 04:56:19 - INFO - __main__ - Step 54846: {'lr': 0.0003585289887430064, 'samples': 10530432, 'steps': 54845, 'loss/train': 0.672095537185669} -11/07/2021 04:56:19 - INFO - __main__ - Step 54847: {'lr': 0.0003585242081007542, 'samples': 10530624, 'steps': 54846, 'loss/train': 1.7137326002120972} -11/07/2021 04:56:19 - INFO - __main__ - Step 54848: {'lr': 0.0003585194274096026, 'samples': 10530816, 'steps': 54847, 'loss/train': 1.1771575212478638} -11/07/2021 04:56:20 - INFO - __main__ - Step 54849: {'lr': 0.00035851464666955383, 'samples': 10531008, 'steps': 54848, 'loss/train': 1.3936138153076172} -11/07/2021 04:56:20 - INFO - __main__ - Step 54850: {'lr': 0.0003585098658806101, 'samples': 10531200, 'steps': 54849, 'loss/train': 1.1228164434432983} -11/07/2021 04:56:21 - INFO - __main__ - Step 54851: {'lr': 0.00035850508504277345, 'samples': 10531392, 'steps': 54850, 'loss/train': 1.3927152156829834} -11/07/2021 04:56:22 - INFO - __main__ - Step 54852: {'lr': 0.0003585003041560461, 'samples': 10531584, 'steps': 54851, 'loss/train': 1.5183683633804321} -11/07/2021 04:56:22 - INFO - __main__ - Step 54853: {'lr': 0.00035849552322043016, 'samples': 10531776, 'steps': 54852, 'loss/train': 1.6004995107650757} -11/07/2021 04:56:22 - INFO - __main__ - Step 54854: {'lr': 0.0003584907422359278, 'samples': 10531968, 'steps': 54853, 'loss/train': 1.502145528793335} -11/07/2021 04:56:23 - INFO - __main__ - Step 54855: {'lr': 0.00035848596120254125, 'samples': 10532160, 'steps': 54854, 'loss/train': 1.7841987609863281} -11/07/2021 04:56:24 - INFO - __main__ - Step 54856: {'lr': 0.0003584811801202726, 'samples': 10532352, 'steps': 54855, 'loss/train': 1.1733726263046265} -11/07/2021 04:56:24 - INFO - __main__ - Step 54857: {'lr': 0.00035847639898912395, 'samples': 10532544, 'steps': 54856, 'loss/train': 1.5412342548370361} -11/07/2021 04:56:25 - INFO - __main__ - Step 54858: {'lr': 0.00035847161780909746, 'samples': 10532736, 'steps': 54857, 'loss/train': 1.5491420030593872} -11/07/2021 04:56:25 - INFO - __main__ - Step 54859: {'lr': 0.0003584668365801954, 'samples': 10532928, 'steps': 54858, 'loss/train': 1.6432112455368042} -11/07/2021 04:56:25 - INFO - __main__ - Step 54860: {'lr': 0.00035846205530241985, 'samples': 10533120, 'steps': 54859, 'loss/train': 1.6675420999526978} -11/07/2021 04:56:26 - INFO - __main__ - Step 54861: {'lr': 0.00035845727397577296, 'samples': 10533312, 'steps': 54860, 'loss/train': 2.051708698272705} -11/07/2021 04:56:27 - INFO - __main__ - Step 54862: {'lr': 0.0003584524926002569, 'samples': 10533504, 'steps': 54861, 'loss/train': 2.053427219390869} -11/07/2021 04:56:27 - INFO - __main__ - Step 54863: {'lr': 0.00035844771117587396, 'samples': 10533696, 'steps': 54862, 'loss/train': 1.2147974967956543} -11/07/2021 04:56:27 - INFO - __main__ - Step 54864: {'lr': 0.0003584429297026259, 'samples': 10533888, 'steps': 54863, 'loss/train': 1.6371829509735107} -11/07/2021 04:56:28 - INFO - __main__ - Step 54865: {'lr': 0.00035843814818051537, 'samples': 10534080, 'steps': 54864, 'loss/train': 1.8123425245285034} -11/07/2021 04:56:29 - INFO - __main__ - Step 54866: {'lr': 0.0003584333666095441, 'samples': 10534272, 'steps': 54865, 'loss/train': 1.2196067571640015} -11/07/2021 04:56:29 - INFO - __main__ - Step 54867: {'lr': 0.0003584285849897145, 'samples': 10534464, 'steps': 54866, 'loss/train': 1.0219111442565918} -11/07/2021 04:56:30 - INFO - __main__ - Step 54868: {'lr': 0.00035842380332102864, 'samples': 10534656, 'steps': 54867, 'loss/train': 1.749085545539856} -11/07/2021 04:56:30 - INFO - __main__ - Step 54869: {'lr': 0.0003584190216034887, 'samples': 10534848, 'steps': 54868, 'loss/train': 1.6745190620422363} -11/07/2021 04:56:30 - INFO - __main__ - Step 54870: {'lr': 0.0003584142398370969, 'samples': 10535040, 'steps': 54869, 'loss/train': 1.1375041007995605} -11/07/2021 04:56:32 - INFO - __main__ - Step 54871: {'lr': 0.0003584094580218552, 'samples': 10535232, 'steps': 54870, 'loss/train': 1.648248314857483} -11/07/2021 04:56:32 - INFO - __main__ - Step 54872: {'lr': 0.00035840467615776584, 'samples': 10535424, 'steps': 54871, 'loss/train': 1.3192315101623535} -11/07/2021 04:56:32 - INFO - __main__ - Step 54873: {'lr': 0.0003583998942448311, 'samples': 10535616, 'steps': 54872, 'loss/train': 1.1297112703323364} -11/07/2021 04:56:33 - INFO - __main__ - Step 54874: {'lr': 0.000358395112283053, 'samples': 10535808, 'steps': 54873, 'loss/train': 0.830177903175354} -11/07/2021 04:56:33 - INFO - __main__ - Step 54875: {'lr': 0.00035839033027243374, 'samples': 10536000, 'steps': 54874, 'loss/train': 1.4521688222885132} -11/07/2021 04:56:33 - INFO - __main__ - Step 54876: {'lr': 0.0003583855482129755, 'samples': 10536192, 'steps': 54875, 'loss/train': 1.3463702201843262} -11/07/2021 04:56:34 - INFO - __main__ - Step 54877: {'lr': 0.0003583807661046804, 'samples': 10536384, 'steps': 54876, 'loss/train': 1.3776121139526367} -11/07/2021 04:56:35 - INFO - __main__ - Step 54878: {'lr': 0.0003583759839475506, 'samples': 10536576, 'steps': 54877, 'loss/train': 1.6864997148513794} -11/07/2021 04:56:35 - INFO - __main__ - Step 54879: {'lr': 0.00035837120174158824, 'samples': 10536768, 'steps': 54878, 'loss/train': 1.2307826280593872} -11/07/2021 04:56:35 - INFO - __main__ - Step 54880: {'lr': 0.00035836641948679544, 'samples': 10536960, 'steps': 54879, 'loss/train': 1.410631537437439} -11/07/2021 04:56:36 - INFO - __main__ - Step 54881: {'lr': 0.0003583616371831745, 'samples': 10537152, 'steps': 54880, 'loss/train': 1.5849672555923462} -11/07/2021 04:56:37 - INFO - __main__ - Step 54882: {'lr': 0.0003583568548307274, 'samples': 10537344, 'steps': 54881, 'loss/train': 1.581113338470459} -11/07/2021 04:56:37 - INFO - __main__ - Step 54883: {'lr': 0.0003583520724294564, 'samples': 10537536, 'steps': 54882, 'loss/train': 1.610122561454773} -11/07/2021 04:56:37 - INFO - __main__ - Step 54884: {'lr': 0.0003583472899793636, 'samples': 10537728, 'steps': 54883, 'loss/train': 1.4421613216400146} -11/07/2021 04:56:38 - INFO - __main__ - Step 54885: {'lr': 0.0003583425074804512, 'samples': 10537920, 'steps': 54884, 'loss/train': 1.5189831256866455} -11/07/2021 04:56:38 - INFO - __main__ - Step 54886: {'lr': 0.0003583377249327213, 'samples': 10538112, 'steps': 54885, 'loss/train': 1.2513885498046875} -11/07/2021 04:56:39 - INFO - __main__ - Step 54887: {'lr': 0.00035833294233617626, 'samples': 10538304, 'steps': 54886, 'loss/train': 0.901969850063324} -11/07/2021 04:56:40 - INFO - __main__ - Step 54888: {'lr': 0.0003583281596908179, 'samples': 10538496, 'steps': 54887, 'loss/train': 1.3590373992919922} -11/07/2021 04:56:40 - INFO - __main__ - Step 54889: {'lr': 0.00035832337699664865, 'samples': 10538688, 'steps': 54888, 'loss/train': 1.3569122552871704} -11/07/2021 04:56:40 - INFO - __main__ - Step 54890: {'lr': 0.0003583185942536704, 'samples': 10538880, 'steps': 54889, 'loss/train': 1.6509311199188232} -11/07/2021 04:56:41 - INFO - __main__ - Step 54891: {'lr': 0.00035831381146188556, 'samples': 10539072, 'steps': 54890, 'loss/train': 1.7270584106445312} -11/07/2021 04:56:42 - INFO - __main__ - Step 54892: {'lr': 0.00035830902862129627, 'samples': 10539264, 'steps': 54891, 'loss/train': 1.676131010055542} -11/07/2021 04:56:42 - INFO - __main__ - Step 54893: {'lr': 0.0003583042457319045, 'samples': 10539456, 'steps': 54892, 'loss/train': 1.7393121719360352} -11/07/2021 04:56:42 - INFO - __main__ - Step 54894: {'lr': 0.0003582994627937125, 'samples': 10539648, 'steps': 54893, 'loss/train': 1.097292423248291} -11/07/2021 04:56:43 - INFO - __main__ - Step 54895: {'lr': 0.00035829467980672247, 'samples': 10539840, 'steps': 54894, 'loss/train': 2.1243093013763428} -11/07/2021 04:56:43 - INFO - __main__ - Step 54896: {'lr': 0.00035828989677093656, 'samples': 10540032, 'steps': 54895, 'loss/train': 1.4508275985717773} -11/07/2021 04:56:44 - INFO - __main__ - Step 54897: {'lr': 0.00035828511368635684, 'samples': 10540224, 'steps': 54896, 'loss/train': 1.221198558807373} -11/07/2021 04:56:44 - INFO - __main__ - Step 54898: {'lr': 0.0003582803305529856, 'samples': 10540416, 'steps': 54897, 'loss/train': 1.4680225849151611} -11/07/2021 04:56:45 - INFO - __main__ - Step 54899: {'lr': 0.0003582755473708248, 'samples': 10540608, 'steps': 54898, 'loss/train': 1.4800821542739868} -11/07/2021 04:56:45 - INFO - __main__ - Step 54900: {'lr': 0.00035827076413987675, 'samples': 10540800, 'steps': 54899, 'loss/train': 0.9042848348617554} -11/07/2021 04:56:46 - INFO - __main__ - Step 54901: {'lr': 0.00035826598086014357, 'samples': 10540992, 'steps': 54900, 'loss/train': 1.3569746017456055} -11/07/2021 04:56:47 - INFO - __main__ - Step 54902: {'lr': 0.0003582611975316274, 'samples': 10541184, 'steps': 54901, 'loss/train': 1.4082578420639038} -11/07/2021 04:56:47 - INFO - __main__ - Step 54903: {'lr': 0.00035825641415433045, 'samples': 10541376, 'steps': 54902, 'loss/train': 1.1146998405456543} -11/07/2021 04:56:47 - INFO - __main__ - Step 54904: {'lr': 0.0003582516307282548, 'samples': 10541568, 'steps': 54903, 'loss/train': 1.0259791612625122} -11/07/2021 04:56:48 - INFO - __main__ - Step 54905: {'lr': 0.00035824684725340263, 'samples': 10541760, 'steps': 54904, 'loss/train': 1.6249933242797852} -11/07/2021 04:56:48 - INFO - __main__ - Step 54906: {'lr': 0.00035824206372977606, 'samples': 10541952, 'steps': 54905, 'loss/train': 1.9509371519088745} -11/07/2021 04:56:49 - INFO - __main__ - Step 54907: {'lr': 0.00035823728015737735, 'samples': 10542144, 'steps': 54906, 'loss/train': 1.9668883085250854} -11/07/2021 04:56:50 - INFO - __main__ - Step 54908: {'lr': 0.0003582324965362086, 'samples': 10542336, 'steps': 54907, 'loss/train': 1.0915250778198242} -11/07/2021 04:56:50 - INFO - __main__ - Step 54909: {'lr': 0.0003582277128662719, 'samples': 10542528, 'steps': 54908, 'loss/train': 1.6986463069915771} -11/07/2021 04:56:50 - INFO - __main__ - Step 54910: {'lr': 0.00035822292914756954, 'samples': 10542720, 'steps': 54909, 'loss/train': 1.019133448600769} -11/07/2021 04:56:51 - INFO - __main__ - Step 54911: {'lr': 0.00035821814538010356, 'samples': 10542912, 'steps': 54910, 'loss/train': 1.1962698698043823} -11/07/2021 04:56:51 - INFO - __main__ - Step 54912: {'lr': 0.00035821336156387614, 'samples': 10543104, 'steps': 54911, 'loss/train': 1.3298062086105347} -11/07/2021 04:56:52 - INFO - __main__ - Step 54913: {'lr': 0.00035820857769888943, 'samples': 10543296, 'steps': 54912, 'loss/train': 1.249089241027832} -11/07/2021 04:56:52 - INFO - __main__ - Step 54914: {'lr': 0.0003582037937851456, 'samples': 10543488, 'steps': 54913, 'loss/train': 1.4023022651672363} -11/07/2021 04:56:53 - INFO - __main__ - Step 54915: {'lr': 0.00035819900982264684, 'samples': 10543680, 'steps': 54914, 'loss/train': 1.013444423675537} -11/07/2021 04:56:53 - INFO - __main__ - Step 54916: {'lr': 0.0003581942258113953, 'samples': 10543872, 'steps': 54915, 'loss/train': 1.0797520875930786} -11/07/2021 04:56:53 - INFO - __main__ - Step 54917: {'lr': 0.00035818944175139314, 'samples': 10544064, 'steps': 54916, 'loss/train': 1.686318039894104} -11/07/2021 04:56:54 - INFO - __main__ - Step 54918: {'lr': 0.0003581846576426423, 'samples': 10544256, 'steps': 54917, 'loss/train': 1.8161580562591553} -11/07/2021 04:56:55 - INFO - __main__ - Step 54919: {'lr': 0.0003581798734851453, 'samples': 10544448, 'steps': 54918, 'loss/train': 1.405177354812622} -11/07/2021 04:56:55 - INFO - __main__ - Step 54920: {'lr': 0.00035817508927890406, 'samples': 10544640, 'steps': 54919, 'loss/train': 1.540561556816101} -11/07/2021 04:56:55 - INFO - __main__ - Step 54921: {'lr': 0.00035817030502392083, 'samples': 10544832, 'steps': 54920, 'loss/train': 1.726969599723816} -11/07/2021 04:56:56 - INFO - __main__ - Step 54922: {'lr': 0.0003581655207201977, 'samples': 10545024, 'steps': 54921, 'loss/train': 0.9665097594261169} -11/07/2021 04:56:57 - INFO - __main__ - Step 54923: {'lr': 0.00035816073636773686, 'samples': 10545216, 'steps': 54922, 'loss/train': 1.431938648223877} -11/07/2021 04:56:57 - INFO - __main__ - Step 54924: {'lr': 0.0003581559519665405, 'samples': 10545408, 'steps': 54923, 'loss/train': 1.5702717304229736} -11/07/2021 04:56:58 - INFO - __main__ - Step 54925: {'lr': 0.0003581511675166107, 'samples': 10545600, 'steps': 54924, 'loss/train': 1.6298109292984009} -11/07/2021 04:56:58 - INFO - __main__ - Step 54926: {'lr': 0.00035814638301794966, 'samples': 10545792, 'steps': 54925, 'loss/train': 1.6957331895828247} -11/07/2021 04:56:58 - INFO - __main__ - Step 54927: {'lr': 0.0003581415984705595, 'samples': 10545984, 'steps': 54926, 'loss/train': 2.11731219291687} -11/07/2021 04:56:59 - INFO - __main__ - Step 54928: {'lr': 0.0003581368138744424, 'samples': 10546176, 'steps': 54927, 'loss/train': 1.3969091176986694} -11/07/2021 04:57:00 - INFO - __main__ - Step 54929: {'lr': 0.00035813202922960056, 'samples': 10546368, 'steps': 54928, 'loss/train': 1.469664454460144} -11/07/2021 04:57:00 - INFO - __main__ - Step 54930: {'lr': 0.00035812724453603614, 'samples': 10546560, 'steps': 54929, 'loss/train': 1.673553466796875} -11/07/2021 04:57:00 - INFO - __main__ - Step 54931: {'lr': 0.00035812245979375114, 'samples': 10546752, 'steps': 54930, 'loss/train': 1.3558012247085571} -11/07/2021 04:57:01 - INFO - __main__ - Step 54932: {'lr': 0.0003581176750027479, 'samples': 10546944, 'steps': 54931, 'loss/train': 1.2782957553863525} -11/07/2021 04:57:02 - INFO - __main__ - Step 54933: {'lr': 0.00035811289016302847, 'samples': 10547136, 'steps': 54932, 'loss/train': 0.5100459456443787} -11/07/2021 04:57:02 - INFO - __main__ - Step 54934: {'lr': 0.000358108105274595, 'samples': 10547328, 'steps': 54933, 'loss/train': 1.7913730144500732} -11/07/2021 04:57:02 - INFO - __main__ - Step 54935: {'lr': 0.0003581033203374498, 'samples': 10547520, 'steps': 54934, 'loss/train': 2.0409095287323} -11/07/2021 04:57:03 - INFO - __main__ - Step 54936: {'lr': 0.0003580985353515948, 'samples': 10547712, 'steps': 54935, 'loss/train': 1.9671167135238647} -11/07/2021 04:57:03 - INFO - __main__ - Step 54937: {'lr': 0.0003580937503170324, 'samples': 10547904, 'steps': 54936, 'loss/train': 1.8756842613220215} -11/07/2021 04:57:03 - INFO - __main__ - Step 54938: {'lr': 0.00035808896523376456, 'samples': 10548096, 'steps': 54937, 'loss/train': 1.152647614479065} -11/07/2021 04:57:05 - INFO - __main__ - Step 54939: {'lr': 0.00035808418010179345, 'samples': 10548288, 'steps': 54938, 'loss/train': 1.2513864040374756} -11/07/2021 04:57:05 - INFO - __main__ - Step 54940: {'lr': 0.0003580793949211213, 'samples': 10548480, 'steps': 54939, 'loss/train': 0.8941771984100342} -11/07/2021 04:57:05 - INFO - __main__ - Step 54941: {'lr': 0.00035807460969175027, 'samples': 10548672, 'steps': 54940, 'loss/train': 1.5848958492279053} -11/07/2021 04:57:06 - INFO - __main__ - Step 54942: {'lr': 0.0003580698244136825, 'samples': 10548864, 'steps': 54941, 'loss/train': 1.5485233068466187} -11/07/2021 04:57:06 - INFO - __main__ - Step 54943: {'lr': 0.0003580650390869201, 'samples': 10549056, 'steps': 54942, 'loss/train': 1.5843173265457153} -11/07/2021 04:57:07 - INFO - __main__ - Step 54944: {'lr': 0.0003580602537114653, 'samples': 10549248, 'steps': 54943, 'loss/train': 1.5410370826721191} -11/07/2021 04:57:07 - INFO - __main__ - Step 54945: {'lr': 0.0003580554682873202, 'samples': 10549440, 'steps': 54944, 'loss/train': 1.7643157243728638} -11/07/2021 04:57:08 - INFO - __main__ - Step 54946: {'lr': 0.00035805068281448687, 'samples': 10549632, 'steps': 54945, 'loss/train': 1.6490561962127686} -11/07/2021 04:57:08 - INFO - __main__ - Step 54947: {'lr': 0.00035804589729296766, 'samples': 10549824, 'steps': 54946, 'loss/train': 1.2998273372650146} -11/07/2021 04:57:08 - INFO - __main__ - Step 54948: {'lr': 0.00035804111172276464, 'samples': 10550016, 'steps': 54947, 'loss/train': 1.4899073839187622} -11/07/2021 04:57:09 - INFO - __main__ - Step 54949: {'lr': 0.00035803632610388, 'samples': 10550208, 'steps': 54948, 'loss/train': 1.5985949039459229} -11/07/2021 04:57:10 - INFO - __main__ - Step 54950: {'lr': 0.0003580315404363158, 'samples': 10550400, 'steps': 54949, 'loss/train': 1.704199194908142} -11/07/2021 04:57:10 - INFO - __main__ - Step 54951: {'lr': 0.0003580267547200743, 'samples': 10550592, 'steps': 54950, 'loss/train': 1.5796351432800293} -11/07/2021 04:57:11 - INFO - __main__ - Step 54952: {'lr': 0.00035802196895515757, 'samples': 10550784, 'steps': 54951, 'loss/train': 1.6180907487869263} -11/07/2021 04:57:11 - INFO - __main__ - Step 54953: {'lr': 0.00035801718314156785, 'samples': 10550976, 'steps': 54952, 'loss/train': 1.3222569227218628} -11/07/2021 04:57:12 - INFO - __main__ - Step 54954: {'lr': 0.00035801239727930716, 'samples': 10551168, 'steps': 54953, 'loss/train': 1.3321624994277954} -11/07/2021 04:57:12 - INFO - __main__ - Step 54955: {'lr': 0.00035800761136837783, 'samples': 10551360, 'steps': 54954, 'loss/train': 1.2968820333480835} -11/07/2021 04:57:13 - INFO - __main__ - Step 54956: {'lr': 0.0003580028254087819, 'samples': 10551552, 'steps': 54955, 'loss/train': 1.2862237691879272} -11/07/2021 04:57:13 - INFO - __main__ - Step 54957: {'lr': 0.00035799803940052163, 'samples': 10551744, 'steps': 54956, 'loss/train': 1.720456838607788} -11/07/2021 04:57:13 - INFO - __main__ - Step 54958: {'lr': 0.00035799325334359906, 'samples': 10551936, 'steps': 54957, 'loss/train': 1.7125890254974365} -11/07/2021 04:57:14 - INFO - __main__ - Step 54959: {'lr': 0.00035798846723801635, 'samples': 10552128, 'steps': 54958, 'loss/train': 1.3855805397033691} -11/07/2021 04:57:15 - INFO - __main__ - Step 54960: {'lr': 0.0003579836810837758, 'samples': 10552320, 'steps': 54959, 'loss/train': 1.5711387395858765} -11/07/2021 04:57:15 - INFO - __main__ - Step 54961: {'lr': 0.0003579788948808794, 'samples': 10552512, 'steps': 54960, 'loss/train': 1.1467931270599365} -11/07/2021 04:57:15 - INFO - __main__ - Step 54962: {'lr': 0.0003579741086293294, 'samples': 10552704, 'steps': 54961, 'loss/train': 1.2307853698730469} -11/07/2021 04:57:16 - INFO - __main__ - Step 54963: {'lr': 0.00035796932232912793, 'samples': 10552896, 'steps': 54962, 'loss/train': 1.5768113136291504} -11/07/2021 04:57:17 - INFO - __main__ - Step 54964: {'lr': 0.00035796453598027725, 'samples': 10553088, 'steps': 54963, 'loss/train': 1.4683003425598145} -11/07/2021 04:57:17 - INFO - __main__ - Step 54965: {'lr': 0.0003579597495827793, 'samples': 10553280, 'steps': 54964, 'loss/train': 1.5094189643859863} -11/07/2021 04:57:18 - INFO - __main__ - Step 54966: {'lr': 0.0003579549631366363, 'samples': 10553472, 'steps': 54965, 'loss/train': 1.278933048248291} -11/07/2021 04:57:18 - INFO - __main__ - Step 54967: {'lr': 0.0003579501766418505, 'samples': 10553664, 'steps': 54966, 'loss/train': 0.46214476227760315} -11/07/2021 04:57:18 - INFO - __main__ - Step 54968: {'lr': 0.0003579453900984241, 'samples': 10553856, 'steps': 54967, 'loss/train': 1.4764328002929688} -11/07/2021 04:57:19 - INFO - __main__ - Step 54969: {'lr': 0.0003579406035063591, 'samples': 10554048, 'steps': 54968, 'loss/train': 1.3582720756530762} -11/07/2021 04:57:20 - INFO - __main__ - Step 54970: {'lr': 0.0003579358168656577, 'samples': 10554240, 'steps': 54969, 'loss/train': 1.1853805780410767} -11/07/2021 04:57:20 - INFO - __main__ - Step 54971: {'lr': 0.00035793103017632224, 'samples': 10554432, 'steps': 54970, 'loss/train': 1.7739368677139282} -11/07/2021 04:57:21 - INFO - __main__ - Step 54972: {'lr': 0.0003579262434383546, 'samples': 10554624, 'steps': 54971, 'loss/train': 1.290099859237671} -11/07/2021 04:57:21 - INFO - __main__ - Step 54973: {'lr': 0.0003579214566517571, 'samples': 10554816, 'steps': 54972, 'loss/train': 1.2865920066833496} -11/07/2021 04:57:22 - INFO - __main__ - Step 54974: {'lr': 0.00035791666981653184, 'samples': 10555008, 'steps': 54973, 'loss/train': 0.5530202388763428} -11/07/2021 04:57:23 - INFO - __main__ - Step 54975: {'lr': 0.00035791188293268094, 'samples': 10555200, 'steps': 54974, 'loss/train': 1.7353119850158691} -11/07/2021 04:57:23 - INFO - __main__ - Step 54976: {'lr': 0.00035790709600020667, 'samples': 10555392, 'steps': 54975, 'loss/train': 1.444684386253357} -11/07/2021 04:57:23 - INFO - __main__ - Step 54977: {'lr': 0.00035790230901911114, 'samples': 10555584, 'steps': 54976, 'loss/train': 0.6288148760795593} -11/07/2021 04:57:24 - INFO - __main__ - Step 54978: {'lr': 0.00035789752198939646, 'samples': 10555776, 'steps': 54977, 'loss/train': 0.6787629127502441} -11/07/2021 04:57:24 - INFO - __main__ - Step 54979: {'lr': 0.00035789273491106485, 'samples': 10555968, 'steps': 54978, 'loss/train': 1.2206088304519653} -11/07/2021 04:57:25 - INFO - __main__ - Step 54980: {'lr': 0.00035788794778411837, 'samples': 10556160, 'steps': 54979, 'loss/train': 0.4907543957233429} -11/07/2021 04:57:25 - INFO - __main__ - Step 54981: {'lr': 0.0003578831606085593, 'samples': 10556352, 'steps': 54980, 'loss/train': 1.2815356254577637} -11/07/2021 04:57:26 - INFO - __main__ - Step 54982: {'lr': 0.00035787837338438976, 'samples': 10556544, 'steps': 54981, 'loss/train': 0.5801774859428406} -11/07/2021 04:57:26 - INFO - __main__ - Step 54983: {'lr': 0.00035787358611161186, 'samples': 10556736, 'steps': 54982, 'loss/train': 1.256115436553955} -11/07/2021 04:57:26 - INFO - __main__ - Step 54984: {'lr': 0.0003578687987902278, 'samples': 10556928, 'steps': 54983, 'loss/train': 0.5729624032974243} -11/07/2021 04:57:28 - INFO - __main__ - Step 54985: {'lr': 0.00035786401142023975, 'samples': 10557120, 'steps': 54984, 'loss/train': 1.3811451196670532} -11/07/2021 04:57:28 - INFO - __main__ - Step 54986: {'lr': 0.00035785922400164983, 'samples': 10557312, 'steps': 54985, 'loss/train': 1.2688241004943848} -11/07/2021 04:57:28 - INFO - __main__ - Step 54987: {'lr': 0.00035785443653446017, 'samples': 10557504, 'steps': 54986, 'loss/train': 1.331153392791748} -11/07/2021 04:57:29 - INFO - __main__ - Step 54988: {'lr': 0.000357849649018673, 'samples': 10557696, 'steps': 54987, 'loss/train': 1.2635180950164795} -11/07/2021 04:57:29 - INFO - __main__ - Step 54989: {'lr': 0.0003578448614542904, 'samples': 10557888, 'steps': 54988, 'loss/train': 0.9246165752410889} -11/07/2021 04:57:30 - INFO - __main__ - Step 54990: {'lr': 0.0003578400738413146, 'samples': 10558080, 'steps': 54989, 'loss/train': 1.4906529188156128} -11/07/2021 04:57:30 - INFO - __main__ - Step 54991: {'lr': 0.00035783528617974774, 'samples': 10558272, 'steps': 54990, 'loss/train': 0.8243188261985779} -11/07/2021 04:57:31 - INFO - __main__ - Step 54992: {'lr': 0.000357830498469592, 'samples': 10558464, 'steps': 54991, 'loss/train': 1.657012939453125} -11/07/2021 04:57:31 - INFO - __main__ - Step 54993: {'lr': 0.0003578257107108494, 'samples': 10558656, 'steps': 54992, 'loss/train': 1.5241446495056152} -11/07/2021 04:57:31 - INFO - __main__ - Step 54994: {'lr': 0.0003578209229035222, 'samples': 10558848, 'steps': 54993, 'loss/train': 0.8030633926391602} -11/07/2021 04:57:32 - INFO - __main__ - Step 54995: {'lr': 0.0003578161350476127, 'samples': 10559040, 'steps': 54994, 'loss/train': 1.4325087070465088} -11/07/2021 04:57:33 - INFO - __main__ - Step 54996: {'lr': 0.00035781134714312277, 'samples': 10559232, 'steps': 54995, 'loss/train': 1.1097663640975952} -11/07/2021 04:57:33 - INFO - __main__ - Step 54997: {'lr': 0.0003578065591900548, 'samples': 10559424, 'steps': 54996, 'loss/train': 1.9446706771850586} -11/07/2021 04:57:34 - INFO - __main__ - Step 54998: {'lr': 0.0003578017711884108, 'samples': 10559616, 'steps': 54997, 'loss/train': 0.1882682591676712} -11/07/2021 04:57:34 - INFO - __main__ - Step 54999: {'lr': 0.000357796983138193, 'samples': 10559808, 'steps': 54998, 'loss/train': 1.3456265926361084} -11/07/2021 04:57:35 - INFO - __main__ - Step 55000: {'lr': 0.0003577921950394035, 'samples': 10560000, 'steps': 54999, 'loss/train': 1.5979148149490356} -11/07/2021 04:57:35 - INFO - __main__ - Step 55001: {'lr': 0.00035778740689204456, 'samples': 10560192, 'steps': 55000, 'loss/train': 1.1905561685562134} -11/07/2021 04:57:36 - INFO - __main__ - Step 55002: {'lr': 0.0003577826186961183, 'samples': 10560384, 'steps': 55001, 'loss/train': 0.9871057868003845} -11/07/2021 04:57:36 - INFO - __main__ - Step 55003: {'lr': 0.0003577778304516268, 'samples': 10560576, 'steps': 55002, 'loss/train': 1.6301368474960327} -11/07/2021 04:57:37 - INFO - __main__ - Step 55004: {'lr': 0.0003577730421585723, 'samples': 10560768, 'steps': 55003, 'loss/train': 1.747949242591858} -11/07/2021 04:57:37 - INFO - __main__ - Step 55005: {'lr': 0.00035776825381695693, 'samples': 10560960, 'steps': 55004, 'loss/train': 0.9194250702857971} -11/07/2021 04:57:38 - INFO - __main__ - Step 55006: {'lr': 0.0003577634654267828, 'samples': 10561152, 'steps': 55005, 'loss/train': 1.667545199394226} -11/07/2021 04:57:38 - INFO - __main__ - Step 55007: {'lr': 0.0003577586769880522, 'samples': 10561344, 'steps': 55006, 'loss/train': 1.3301728963851929} -11/07/2021 04:57:39 - INFO - __main__ - Step 55008: {'lr': 0.00035775388850076714, 'samples': 10561536, 'steps': 55007, 'loss/train': 1.6160812377929688} -11/07/2021 04:57:39 - INFO - __main__ - Step 55009: {'lr': 0.0003577490999649298, 'samples': 10561728, 'steps': 55008, 'loss/train': 2.0927774906158447} -11/07/2021 04:57:39 - INFO - __main__ - Step 55010: {'lr': 0.0003577443113805425, 'samples': 10561920, 'steps': 55009, 'loss/train': 1.492805004119873} -11/07/2021 04:57:40 - INFO - __main__ - Step 55011: {'lr': 0.00035773952274760723, 'samples': 10562112, 'steps': 55010, 'loss/train': 1.437565565109253} -11/07/2021 04:57:41 - INFO - __main__ - Step 55012: {'lr': 0.00035773473406612615, 'samples': 10562304, 'steps': 55011, 'loss/train': 1.6526776552200317} -11/07/2021 04:57:41 - INFO - __main__ - Step 55013: {'lr': 0.0003577299453361015, 'samples': 10562496, 'steps': 55012, 'loss/train': 1.2323278188705444} -11/07/2021 04:57:41 - INFO - __main__ - Step 55014: {'lr': 0.00035772515655753536, 'samples': 10562688, 'steps': 55013, 'loss/train': 1.0117645263671875} -11/07/2021 04:57:42 - INFO - __main__ - Step 55015: {'lr': 0.00035772036773042994, 'samples': 10562880, 'steps': 55014, 'loss/train': 1.9306058883666992} -11/07/2021 04:57:43 - INFO - __main__ - Step 55016: {'lr': 0.00035771557885478744, 'samples': 10563072, 'steps': 55015, 'loss/train': 1.0696053504943848} -11/07/2021 04:57:43 - INFO - __main__ - Step 55017: {'lr': 0.0003577107899306099, 'samples': 10563264, 'steps': 55016, 'loss/train': 1.4434189796447754} -11/07/2021 04:57:43 - INFO - __main__ - Step 55018: {'lr': 0.00035770600095789957, 'samples': 10563456, 'steps': 55017, 'loss/train': 1.374860167503357} -11/07/2021 04:57:44 - INFO - __main__ - Step 55019: {'lr': 0.0003577012119366586, 'samples': 10563648, 'steps': 55018, 'loss/train': 1.7924306392669678} -11/07/2021 04:57:44 - INFO - __main__ - Step 55020: {'lr': 0.00035769642286688903, 'samples': 10563840, 'steps': 55019, 'loss/train': 1.1546483039855957} -11/07/2021 04:57:45 - INFO - __main__ - Step 55021: {'lr': 0.00035769163374859325, 'samples': 10564032, 'steps': 55020, 'loss/train': 1.1657540798187256} -11/07/2021 04:57:45 - INFO - __main__ - Step 55022: {'lr': 0.0003576868445817732, 'samples': 10564224, 'steps': 55021, 'loss/train': 1.4878591299057007} -11/07/2021 04:57:46 - INFO - __main__ - Step 55023: {'lr': 0.0003576820553664311, 'samples': 10564416, 'steps': 55022, 'loss/train': 1.4696134328842163} -11/07/2021 04:57:46 - INFO - __main__ - Step 55024: {'lr': 0.0003576772661025691, 'samples': 10564608, 'steps': 55023, 'loss/train': 1.193994402885437} -11/07/2021 04:57:46 - INFO - __main__ - Step 55025: {'lr': 0.0003576724767901895, 'samples': 10564800, 'steps': 55024, 'loss/train': 1.5176256895065308} -11/07/2021 04:57:48 - INFO - __main__ - Step 55026: {'lr': 0.00035766768742929436, 'samples': 10564992, 'steps': 55025, 'loss/train': 1.5638397932052612} -11/07/2021 04:57:48 - INFO - __main__ - Step 55027: {'lr': 0.00035766289801988574, 'samples': 10565184, 'steps': 55026, 'loss/train': 1.2947450876235962} -11/07/2021 04:57:48 - INFO - __main__ - Step 55028: {'lr': 0.00035765810856196585, 'samples': 10565376, 'steps': 55027, 'loss/train': 1.4492391347885132} -11/07/2021 04:57:49 - INFO - __main__ - Step 55029: {'lr': 0.00035765331905553686, 'samples': 10565568, 'steps': 55028, 'loss/train': 1.794018030166626} -11/07/2021 04:57:49 - INFO - __main__ - Step 55030: {'lr': 0.000357648529500601, 'samples': 10565760, 'steps': 55029, 'loss/train': 1.7248971462249756} -11/07/2021 04:57:50 - INFO - __main__ - Step 55031: {'lr': 0.00035764373989716035, 'samples': 10565952, 'steps': 55030, 'loss/train': 0.8968067169189453} -11/07/2021 04:57:50 - INFO - __main__ - Step 55032: {'lr': 0.0003576389502452172, 'samples': 10566144, 'steps': 55031, 'loss/train': 1.6573113203048706} -11/07/2021 04:57:51 - INFO - __main__ - Step 55033: {'lr': 0.0003576341605447735, 'samples': 10566336, 'steps': 55032, 'loss/train': 1.3684130907058716} -11/07/2021 04:57:51 - INFO - __main__ - Step 55034: {'lr': 0.0003576293707958315, 'samples': 10566528, 'steps': 55033, 'loss/train': 1.1835936307907104} -11/07/2021 04:57:51 - INFO - __main__ - Step 55035: {'lr': 0.0003576245809983934, 'samples': 10566720, 'steps': 55034, 'loss/train': 1.1828055381774902} -11/07/2021 04:57:52 - INFO - __main__ - Step 55036: {'lr': 0.0003576197911524613, 'samples': 10566912, 'steps': 55035, 'loss/train': 1.211046814918518} -11/07/2021 04:57:53 - INFO - __main__ - Step 55037: {'lr': 0.0003576150012580374, 'samples': 10567104, 'steps': 55036, 'loss/train': 1.112857699394226} -11/07/2021 04:57:53 - INFO - __main__ - Step 55038: {'lr': 0.00035761021131512383, 'samples': 10567296, 'steps': 55037, 'loss/train': 1.4128081798553467} -11/07/2021 04:57:54 - INFO - __main__ - Step 55039: {'lr': 0.00035760542132372275, 'samples': 10567488, 'steps': 55038, 'loss/train': 1.4762065410614014} -11/07/2021 04:57:54 - INFO - __main__ - Step 55040: {'lr': 0.00035760063128383637, 'samples': 10567680, 'steps': 55039, 'loss/train': 1.4175198078155518} -11/07/2021 04:57:54 - INFO - __main__ - Step 55041: {'lr': 0.0003575958411954668, 'samples': 10567872, 'steps': 55040, 'loss/train': 2.396432638168335} -11/07/2021 04:57:55 - INFO - __main__ - Step 55042: {'lr': 0.00035759105105861614, 'samples': 10568064, 'steps': 55041, 'loss/train': 1.0133460760116577} -11/07/2021 04:57:56 - INFO - __main__ - Step 55043: {'lr': 0.00035758626087328664, 'samples': 10568256, 'steps': 55042, 'loss/train': 1.1450141668319702} -11/07/2021 04:57:56 - INFO - __main__ - Step 55044: {'lr': 0.00035758147063948056, 'samples': 10568448, 'steps': 55043, 'loss/train': 2.798823595046997} -11/07/2021 04:57:56 - INFO - __main__ - Step 55045: {'lr': 0.00035757668035719974, 'samples': 10568640, 'steps': 55044, 'loss/train': 1.7040687799453735} -11/07/2021 04:57:57 - INFO - __main__ - Step 55046: {'lr': 0.00035757189002644664, 'samples': 10568832, 'steps': 55045, 'loss/train': 1.5583311319351196} -11/07/2021 04:57:58 - INFO - __main__ - Step 55047: {'lr': 0.00035756709964722324, 'samples': 10569024, 'steps': 55046, 'loss/train': 1.4309717416763306} -11/07/2021 04:57:58 - INFO - __main__ - Step 55048: {'lr': 0.00035756230921953183, 'samples': 10569216, 'steps': 55047, 'loss/train': 1.5375730991363525} -11/07/2021 04:57:58 - INFO - __main__ - Step 55049: {'lr': 0.0003575575187433744, 'samples': 10569408, 'steps': 55048, 'loss/train': 1.8171958923339844} -11/07/2021 04:57:59 - INFO - __main__ - Step 55050: {'lr': 0.0003575527282187533, 'samples': 10569600, 'steps': 55049, 'loss/train': 1.4335161447525024} -11/07/2021 04:57:59 - INFO - __main__ - Step 55051: {'lr': 0.00035754793764567063, 'samples': 10569792, 'steps': 55050, 'loss/train': 1.3283638954162598} -11/07/2021 04:58:00 - INFO - __main__ - Step 55052: {'lr': 0.0003575431470241285, 'samples': 10569984, 'steps': 55051, 'loss/train': 0.7707861661911011} -11/07/2021 04:58:00 - INFO - __main__ - Step 55053: {'lr': 0.000357538356354129, 'samples': 10570176, 'steps': 55052, 'loss/train': 1.370285153388977} -11/07/2021 04:58:01 - INFO - __main__ - Step 55054: {'lr': 0.0003575335656356744, 'samples': 10570368, 'steps': 55053, 'loss/train': 1.6500614881515503} -11/07/2021 04:58:01 - INFO - __main__ - Step 55055: {'lr': 0.0003575287748687669, 'samples': 10570560, 'steps': 55054, 'loss/train': 0.6962327361106873} -11/07/2021 04:58:02 - INFO - __main__ - Step 55056: {'lr': 0.0003575239840534086, 'samples': 10570752, 'steps': 55055, 'loss/train': 1.1676795482635498} -11/07/2021 04:58:03 - INFO - __main__ - Step 55057: {'lr': 0.00035751919318960157, 'samples': 10570944, 'steps': 55056, 'loss/train': 1.1781184673309326} -11/07/2021 04:58:03 - INFO - __main__ - Step 55058: {'lr': 0.0003575144022773481, 'samples': 10571136, 'steps': 55057, 'loss/train': 1.1429388523101807} -11/07/2021 04:58:03 - INFO - __main__ - Step 55059: {'lr': 0.00035750961131665034, 'samples': 10571328, 'steps': 55058, 'loss/train': 1.7127009630203247} -11/07/2021 04:58:04 - INFO - __main__ - Step 55060: {'lr': 0.0003575048203075103, 'samples': 10571520, 'steps': 55059, 'loss/train': 1.3227245807647705} -11/07/2021 04:58:04 - INFO - __main__ - Step 55061: {'lr': 0.0003575000292499303, 'samples': 10571712, 'steps': 55060, 'loss/train': 1.6034808158874512} -11/07/2021 04:58:04 - INFO - __main__ - Step 55062: {'lr': 0.0003574952381439125, 'samples': 10571904, 'steps': 55061, 'loss/train': 0.8018674254417419} -11/07/2021 04:58:05 - INFO - __main__ - Step 55063: {'lr': 0.0003574904469894589, 'samples': 10572096, 'steps': 55062, 'loss/train': 1.1603502035140991} -11/07/2021 04:58:06 - INFO - __main__ - Step 55064: {'lr': 0.00035748565578657185, 'samples': 10572288, 'steps': 55063, 'loss/train': 1.4817630052566528} -11/07/2021 04:58:06 - INFO - __main__ - Step 55065: {'lr': 0.0003574808645352534, 'samples': 10572480, 'steps': 55064, 'loss/train': 1.4915812015533447} -11/07/2021 04:58:07 - INFO - __main__ - Step 55066: {'lr': 0.00035747607323550573, 'samples': 10572672, 'steps': 55065, 'loss/train': 0.9114412069320679} -11/07/2021 04:58:07 - INFO - __main__ - Step 55067: {'lr': 0.000357471281887331, 'samples': 10572864, 'steps': 55066, 'loss/train': 1.3542866706848145} -11/07/2021 04:58:08 - INFO - __main__ - Step 55068: {'lr': 0.0003574664904907314, 'samples': 10573056, 'steps': 55067, 'loss/train': 1.4151079654693604} -11/07/2021 04:58:08 - INFO - __main__ - Step 55069: {'lr': 0.00035746169904570896, 'samples': 10573248, 'steps': 55068, 'loss/train': 1.4811794757843018} -11/07/2021 04:58:09 - INFO - __main__ - Step 55070: {'lr': 0.000357456907552266, 'samples': 10573440, 'steps': 55069, 'loss/train': 1.2116820812225342} -11/07/2021 04:58:09 - INFO - __main__ - Step 55071: {'lr': 0.00035745211601040464, 'samples': 10573632, 'steps': 55070, 'loss/train': 2.0120761394500732} -11/07/2021 04:58:09 - INFO - __main__ - Step 55072: {'lr': 0.000357447324420127, 'samples': 10573824, 'steps': 55071, 'loss/train': 1.7886202335357666} -11/07/2021 04:58:10 - INFO - __main__ - Step 55073: {'lr': 0.00035744253278143526, 'samples': 10574016, 'steps': 55072, 'loss/train': 2.2052876949310303} -11/07/2021 04:58:11 - INFO - __main__ - Step 55074: {'lr': 0.0003574377410943315, 'samples': 10574208, 'steps': 55073, 'loss/train': 1.3213140964508057} -11/07/2021 04:58:11 - INFO - __main__ - Step 55075: {'lr': 0.00035743294935881804, 'samples': 10574400, 'steps': 55074, 'loss/train': 1.1828625202178955} -11/07/2021 04:58:11 - INFO - __main__ - Step 55076: {'lr': 0.0003574281575748969, 'samples': 10574592, 'steps': 55075, 'loss/train': 0.9429059624671936} -11/07/2021 04:58:12 - INFO - __main__ - Step 55077: {'lr': 0.0003574233657425703, 'samples': 10574784, 'steps': 55076, 'loss/train': 1.2194664478302002} -11/07/2021 04:58:13 - INFO - __main__ - Step 55078: {'lr': 0.0003574185738618404, 'samples': 10574976, 'steps': 55077, 'loss/train': 1.5214813947677612} -11/07/2021 04:58:13 - INFO - __main__ - Step 55079: {'lr': 0.00035741378193270934, 'samples': 10575168, 'steps': 55078, 'loss/train': 2.3881895542144775} -11/07/2021 04:58:14 - INFO - __main__ - Step 55080: {'lr': 0.00035740898995517933, 'samples': 10575360, 'steps': 55079, 'loss/train': 3.341811180114746} -11/07/2021 04:58:14 - INFO - __main__ - Step 55081: {'lr': 0.00035740419792925244, 'samples': 10575552, 'steps': 55080, 'loss/train': 1.680826187133789} -11/07/2021 04:58:14 - INFO - __main__ - Step 55082: {'lr': 0.0003573994058549309, 'samples': 10575744, 'steps': 55081, 'loss/train': 1.295062780380249} -11/07/2021 04:58:15 - INFO - __main__ - Step 55083: {'lr': 0.00035739461373221677, 'samples': 10575936, 'steps': 55082, 'loss/train': 1.247595191001892} -11/07/2021 04:58:16 - INFO - __main__ - Step 55084: {'lr': 0.00035738982156111233, 'samples': 10576128, 'steps': 55083, 'loss/train': 1.5760958194732666} -11/07/2021 04:58:16 - INFO - __main__ - Step 55085: {'lr': 0.0003573850293416198, 'samples': 10576320, 'steps': 55084, 'loss/train': 1.8488069772720337} -11/07/2021 04:58:16 - INFO - __main__ - Step 55086: {'lr': 0.00035738023707374114, 'samples': 10576512, 'steps': 55085, 'loss/train': 1.074326992034912} -11/07/2021 04:58:17 - INFO - __main__ - Step 55087: {'lr': 0.0003573754447574785, 'samples': 10576704, 'steps': 55086, 'loss/train': 1.8997424840927124} -11/07/2021 04:58:17 - INFO - __main__ - Step 55088: {'lr': 0.0003573706523928343, 'samples': 10576896, 'steps': 55087, 'loss/train': 1.388343334197998} -11/07/2021 04:58:18 - INFO - __main__ - Step 55089: {'lr': 0.00035736585997981046, 'samples': 10577088, 'steps': 55088, 'loss/train': 1.54605233669281} -11/07/2021 04:58:18 - INFO - __main__ - Step 55090: {'lr': 0.00035736106751840926, 'samples': 10577280, 'steps': 55089, 'loss/train': 1.278705358505249} -11/07/2021 04:58:19 - INFO - __main__ - Step 55091: {'lr': 0.00035735627500863275, 'samples': 10577472, 'steps': 55090, 'loss/train': 1.3363699913024902} -11/07/2021 04:58:19 - INFO - __main__ - Step 55092: {'lr': 0.00035735148245048326, 'samples': 10577664, 'steps': 55091, 'loss/train': 1.4652860164642334} -11/07/2021 04:58:20 - INFO - __main__ - Step 55093: {'lr': 0.0003573466898439628, 'samples': 10577856, 'steps': 55092, 'loss/train': 1.192568302154541} -11/07/2021 04:58:21 - INFO - __main__ - Step 55094: {'lr': 0.00035734189718907364, 'samples': 10578048, 'steps': 55093, 'loss/train': 1.6429756879806519} -11/07/2021 04:58:21 - INFO - __main__ - Step 55095: {'lr': 0.00035733710448581773, 'samples': 10578240, 'steps': 55094, 'loss/train': 1.6769375801086426} -11/07/2021 04:58:21 - INFO - __main__ - Step 55096: {'lr': 0.0003573323117341975, 'samples': 10578432, 'steps': 55095, 'loss/train': 1.516952395439148} -11/07/2021 04:58:22 - INFO - __main__ - Step 55097: {'lr': 0.00035732751893421494, 'samples': 10578624, 'steps': 55096, 'loss/train': 1.70482337474823} -11/07/2021 04:58:22 - INFO - __main__ - Step 55098: {'lr': 0.0003573227260858723, 'samples': 10578816, 'steps': 55097, 'loss/train': 1.5933622121810913} -11/07/2021 04:58:24 - INFO - __main__ - Step 55099: {'lr': 0.00035731793318917167, 'samples': 10579008, 'steps': 55098, 'loss/train': 1.691129207611084} -11/07/2021 04:58:24 - INFO - __main__ - Step 55100: {'lr': 0.0003573131402441152, 'samples': 10579200, 'steps': 55099, 'loss/train': 1.790935754776001} -11/07/2021 04:58:25 - INFO - __main__ - Step 55101: {'lr': 0.0003573083472507051, 'samples': 10579392, 'steps': 55100, 'loss/train': 1.7911534309387207} -11/07/2021 04:58:25 - INFO - __main__ - Step 55102: {'lr': 0.00035730355420894355, 'samples': 10579584, 'steps': 55101, 'loss/train': 1.7881889343261719} -11/07/2021 04:58:25 - INFO - __main__ - Step 55103: {'lr': 0.00035729876111883265, 'samples': 10579776, 'steps': 55102, 'loss/train': 1.4734764099121094} -11/07/2021 04:58:26 - INFO - __main__ - Step 55104: {'lr': 0.0003572939679803746, 'samples': 10579968, 'steps': 55103, 'loss/train': 1.5647242069244385} -11/07/2021 04:58:26 - INFO - __main__ - Step 55105: {'lr': 0.00035728917479357154, 'samples': 10580160, 'steps': 55104, 'loss/train': 1.3219374418258667} -11/07/2021 04:58:27 - INFO - __main__ - Step 55106: {'lr': 0.00035728438155842556, 'samples': 10580352, 'steps': 55105, 'loss/train': 1.6424331665039062} -11/07/2021 04:58:27 - INFO - __main__ - Step 55107: {'lr': 0.000357279588274939, 'samples': 10580544, 'steps': 55106, 'loss/train': 1.7871103286743164} -11/07/2021 04:58:28 - INFO - __main__ - Step 55108: {'lr': 0.00035727479494311387, 'samples': 10580736, 'steps': 55107, 'loss/train': 0.7385053634643555} -11/07/2021 04:58:28 - INFO - __main__ - Step 55109: {'lr': 0.0003572700015629524, 'samples': 10580928, 'steps': 55108, 'loss/train': 1.3223023414611816} -11/07/2021 04:58:28 - INFO - __main__ - Step 55110: {'lr': 0.0003572652081344566, 'samples': 10581120, 'steps': 55109, 'loss/train': 1.6981300115585327} -11/07/2021 04:58:30 - INFO - __main__ - Step 55111: {'lr': 0.00035726041465762885, 'samples': 10581312, 'steps': 55110, 'loss/train': 1.184633493423462} -11/07/2021 04:58:30 - INFO - __main__ - Step 55112: {'lr': 0.0003572556211324713, 'samples': 10581504, 'steps': 55111, 'loss/train': 1.4075344800949097} -11/07/2021 04:58:30 - INFO - __main__ - Step 55113: {'lr': 0.0003572508275589859, 'samples': 10581696, 'steps': 55112, 'loss/train': 1.3846694231033325} -11/07/2021 04:58:31 - INFO - __main__ - Step 55114: {'lr': 0.00035724603393717493, 'samples': 10581888, 'steps': 55113, 'loss/train': 1.4604871273040771} -11/07/2021 04:58:31 - INFO - __main__ - Step 55115: {'lr': 0.00035724124026704064, 'samples': 10582080, 'steps': 55114, 'loss/train': 1.9760327339172363} -11/07/2021 04:58:31 - INFO - __main__ - Step 55116: {'lr': 0.000357236446548585, 'samples': 10582272, 'steps': 55115, 'loss/train': 0.805184543132782} -11/07/2021 04:58:32 - INFO - __main__ - Step 55117: {'lr': 0.0003572316527818103, 'samples': 10582464, 'steps': 55116, 'loss/train': 1.3658256530761719} -11/07/2021 04:58:33 - INFO - __main__ - Step 55118: {'lr': 0.00035722685896671876, 'samples': 10582656, 'steps': 55117, 'loss/train': 1.6515177488327026} -11/07/2021 04:58:33 - INFO - __main__ - Step 55119: {'lr': 0.00035722206510331237, 'samples': 10582848, 'steps': 55118, 'loss/train': 1.3519814014434814} -11/07/2021 04:58:33 - INFO - __main__ - Step 55120: {'lr': 0.0003572172711915934, 'samples': 10583040, 'steps': 55119, 'loss/train': 1.557307243347168} -11/07/2021 04:58:34 - INFO - __main__ - Step 55121: {'lr': 0.0003572124772315639, 'samples': 10583232, 'steps': 55120, 'loss/train': 1.3858848810195923} -11/07/2021 04:58:35 - INFO - __main__ - Step 55122: {'lr': 0.0003572076832232262, 'samples': 10583424, 'steps': 55121, 'loss/train': 1.3028733730316162} -11/07/2021 04:58:35 - INFO - __main__ - Step 55123: {'lr': 0.0003572028891665823, 'samples': 10583616, 'steps': 55122, 'loss/train': 1.1942554712295532} -11/07/2021 04:58:36 - INFO - __main__ - Step 55124: {'lr': 0.00035719809506163454, 'samples': 10583808, 'steps': 55123, 'loss/train': 1.3237128257751465} -11/07/2021 04:58:36 - INFO - __main__ - Step 55125: {'lr': 0.0003571933009083849, 'samples': 10584000, 'steps': 55124, 'loss/train': 1.6525145769119263} -11/07/2021 04:58:36 - INFO - __main__ - Step 55126: {'lr': 0.00035718850670683565, 'samples': 10584192, 'steps': 55125, 'loss/train': 1.6280956268310547} -11/07/2021 04:58:37 - INFO - __main__ - Step 55127: {'lr': 0.00035718371245698887, 'samples': 10584384, 'steps': 55126, 'loss/train': 0.13471516966819763} -11/07/2021 04:58:38 - INFO - __main__ - Step 55128: {'lr': 0.0003571789181588468, 'samples': 10584576, 'steps': 55127, 'loss/train': 1.616760015487671} -11/07/2021 04:58:38 - INFO - __main__ - Step 55129: {'lr': 0.00035717412381241153, 'samples': 10584768, 'steps': 55128, 'loss/train': 1.5680081844329834} -11/07/2021 04:58:38 - INFO - __main__ - Step 55130: {'lr': 0.00035716932941768525, 'samples': 10584960, 'steps': 55129, 'loss/train': 1.6211940050125122} -11/07/2021 04:58:39 - INFO - __main__ - Step 55131: {'lr': 0.0003571645349746702, 'samples': 10585152, 'steps': 55130, 'loss/train': 1.2587850093841553} -11/07/2021 04:58:40 - INFO - __main__ - Step 55132: {'lr': 0.00035715974048336843, 'samples': 10585344, 'steps': 55131, 'loss/train': 1.1344618797302246} -11/07/2021 04:58:40 - INFO - __main__ - Step 55133: {'lr': 0.0003571549459437821, 'samples': 10585536, 'steps': 55132, 'loss/train': 1.1305006742477417} -11/07/2021 04:58:41 - INFO - __main__ - Step 55134: {'lr': 0.00035715015135591346, 'samples': 10585728, 'steps': 55133, 'loss/train': 1.698072910308838} -11/07/2021 04:58:41 - INFO - __main__ - Step 55135: {'lr': 0.0003571453567197645, 'samples': 10585920, 'steps': 55134, 'loss/train': 1.8285516500473022} -11/07/2021 04:58:41 - INFO - __main__ - Step 55136: {'lr': 0.0003571405620353376, 'samples': 10586112, 'steps': 55135, 'loss/train': 1.2474533319473267} -11/07/2021 04:58:42 - INFO - __main__ - Step 55137: {'lr': 0.00035713576730263475, 'samples': 10586304, 'steps': 55136, 'loss/train': 1.4400640726089478} -11/07/2021 04:58:43 - INFO - __main__ - Step 55138: {'lr': 0.0003571309725216582, 'samples': 10586496, 'steps': 55137, 'loss/train': 0.987962543964386} -11/07/2021 04:58:43 - INFO - __main__ - Step 55139: {'lr': 0.0003571261776924102, 'samples': 10586688, 'steps': 55138, 'loss/train': 1.189251184463501} -11/07/2021 04:58:43 - INFO - __main__ - Step 55140: {'lr': 0.00035712138281489264, 'samples': 10586880, 'steps': 55139, 'loss/train': 0.8905391693115234} -11/07/2021 04:58:44 - INFO - __main__ - Step 55141: {'lr': 0.0003571165878891079, 'samples': 10587072, 'steps': 55140, 'loss/train': 1.3201361894607544} -11/07/2021 04:58:45 - INFO - __main__ - Step 55142: {'lr': 0.00035711179291505806, 'samples': 10587264, 'steps': 55141, 'loss/train': 1.5405439138412476} -11/07/2021 04:58:45 - INFO - __main__ - Step 55143: {'lr': 0.0003571069978927453, 'samples': 10587456, 'steps': 55142, 'loss/train': 1.4250941276550293} -11/07/2021 04:58:45 - INFO - __main__ - Step 55144: {'lr': 0.00035710220282217175, 'samples': 10587648, 'steps': 55143, 'loss/train': 0.9400364756584167} -11/07/2021 04:58:46 - INFO - __main__ - Step 55145: {'lr': 0.0003570974077033397, 'samples': 10587840, 'steps': 55144, 'loss/train': 1.5619584321975708} -11/07/2021 04:58:46 - INFO - __main__ - Step 55146: {'lr': 0.00035709261253625115, 'samples': 10588032, 'steps': 55145, 'loss/train': 0.9394890666007996} -11/07/2021 04:58:47 - INFO - __main__ - Step 55147: {'lr': 0.00035708781732090835, 'samples': 10588224, 'steps': 55146, 'loss/train': 1.5081124305725098} -11/07/2021 04:58:48 - INFO - __main__ - Step 55148: {'lr': 0.00035708302205731334, 'samples': 10588416, 'steps': 55147, 'loss/train': 1.3798731565475464} -11/07/2021 04:58:48 - INFO - __main__ - Step 55149: {'lr': 0.00035707822674546847, 'samples': 10588608, 'steps': 55148, 'loss/train': 1.479280710220337} -11/07/2021 04:58:48 - INFO - __main__ - Step 55150: {'lr': 0.00035707343138537584, 'samples': 10588800, 'steps': 55149, 'loss/train': 1.2436096668243408} -11/07/2021 04:58:49 - INFO - __main__ - Step 55151: {'lr': 0.00035706863597703746, 'samples': 10588992, 'steps': 55150, 'loss/train': 1.5817415714263916} -11/07/2021 04:58:50 - INFO - __main__ - Step 55152: {'lr': 0.00035706384052045567, 'samples': 10589184, 'steps': 55151, 'loss/train': 1.42521071434021} -11/07/2021 04:58:50 - INFO - __main__ - Step 55153: {'lr': 0.0003570590450156325, 'samples': 10589376, 'steps': 55152, 'loss/train': 1.4141230583190918} -11/07/2021 04:58:51 - INFO - __main__ - Step 55154: {'lr': 0.00035705424946257027, 'samples': 10589568, 'steps': 55153, 'loss/train': 1.715566873550415} -11/07/2021 04:58:51 - INFO - __main__ - Step 55155: {'lr': 0.000357049453861271, 'samples': 10589760, 'steps': 55154, 'loss/train': 0.5692832469940186} -11/07/2021 04:58:51 - INFO - __main__ - Step 55156: {'lr': 0.00035704465821173695, 'samples': 10589952, 'steps': 55155, 'loss/train': 1.2147572040557861} -11/07/2021 04:58:52 - INFO - __main__ - Step 55157: {'lr': 0.00035703986251397015, 'samples': 10590144, 'steps': 55156, 'loss/train': 1.3184512853622437} -11/07/2021 04:58:53 - INFO - __main__ - Step 55158: {'lr': 0.00035703506676797284, 'samples': 10590336, 'steps': 55157, 'loss/train': 1.4686580896377563} -11/07/2021 04:58:53 - INFO - __main__ - Step 55159: {'lr': 0.00035703027097374717, 'samples': 10590528, 'steps': 55158, 'loss/train': 1.6541765928268433} -11/07/2021 04:58:53 - INFO - __main__ - Step 55160: {'lr': 0.00035702547513129533, 'samples': 10590720, 'steps': 55159, 'loss/train': 1.4428073167800903} -11/07/2021 04:58:54 - INFO - __main__ - Step 55161: {'lr': 0.0003570206792406195, 'samples': 10590912, 'steps': 55160, 'loss/train': 1.1663644313812256} -11/07/2021 04:58:54 - INFO - __main__ - Step 55162: {'lr': 0.0003570158833017219, 'samples': 10591104, 'steps': 55161, 'loss/train': 1.5408821105957031} -11/07/2021 04:58:55 - INFO - __main__ - Step 55163: {'lr': 0.0003570110873146044, 'samples': 10591296, 'steps': 55162, 'loss/train': 1.4008692502975464} -11/07/2021 04:58:55 - INFO - __main__ - Step 55164: {'lr': 0.0003570062912792694, 'samples': 10591488, 'steps': 55163, 'loss/train': 1.1255208253860474} -11/07/2021 04:58:56 - INFO - __main__ - Step 55165: {'lr': 0.0003570014951957191, 'samples': 10591680, 'steps': 55164, 'loss/train': 1.3669341802597046} -11/07/2021 04:58:56 - INFO - __main__ - Step 55166: {'lr': 0.00035699669906395554, 'samples': 10591872, 'steps': 55165, 'loss/train': 1.8413978815078735} -11/07/2021 04:58:57 - INFO - __main__ - Step 55167: {'lr': 0.00035699190288398093, 'samples': 10592064, 'steps': 55166, 'loss/train': 1.1969252824783325} -11/07/2021 04:58:58 - INFO - __main__ - Step 55168: {'lr': 0.0003569871066557974, 'samples': 10592256, 'steps': 55167, 'loss/train': 1.5171173810958862} -11/07/2021 04:58:59 - INFO - __main__ - Step 55169: {'lr': 0.0003569823103794071, 'samples': 10592448, 'steps': 55168, 'loss/train': 1.1714458465576172} -11/07/2021 04:58:59 - INFO - __main__ - Step 55170: {'lr': 0.0003569775140548122, 'samples': 10592640, 'steps': 55169, 'loss/train': 1.2222853899002075} -11/07/2021 04:58:59 - INFO - __main__ - Step 55171: {'lr': 0.00035697271768201494, 'samples': 10592832, 'steps': 55170, 'loss/train': 0.13801901042461395} -11/07/2021 04:59:00 - INFO - __main__ - Step 55172: {'lr': 0.0003569679212610175, 'samples': 10593024, 'steps': 55171, 'loss/train': 0.31321340799331665} -11/07/2021 04:59:00 - INFO - __main__ - Step 55173: {'lr': 0.00035696312479182186, 'samples': 10593216, 'steps': 55172, 'loss/train': 0.2924405038356781} -11/07/2021 04:59:01 - INFO - __main__ - Step 55174: {'lr': 0.0003569583282744303, 'samples': 10593408, 'steps': 55173, 'loss/train': 0.39519545435905457} -11/07/2021 04:59:02 - INFO - __main__ - Step 55175: {'lr': 0.00035695353170884494, 'samples': 10593600, 'steps': 55174, 'loss/train': 1.630731463432312} -11/07/2021 04:59:02 - INFO - __main__ - Step 55176: {'lr': 0.000356948735095068, 'samples': 10593792, 'steps': 55175, 'loss/train': 1.5511635541915894} -11/07/2021 04:59:02 - INFO - __main__ - Step 55177: {'lr': 0.0003569439384331016, 'samples': 10593984, 'steps': 55176, 'loss/train': 1.8013595342636108} -11/07/2021 04:59:03 - INFO - __main__ - Step 55178: {'lr': 0.00035693914172294796, 'samples': 10594176, 'steps': 55177, 'loss/train': 1.6304501295089722} -11/07/2021 04:59:04 - INFO - __main__ - Step 55179: {'lr': 0.0003569343449646092, 'samples': 10594368, 'steps': 55178, 'loss/train': 1.5907942056655884} -11/07/2021 04:59:04 - INFO - __main__ - Step 55180: {'lr': 0.0003569295481580874, 'samples': 10594560, 'steps': 55179, 'loss/train': 1.7025096416473389} -11/07/2021 04:59:04 - INFO - __main__ - Step 55181: {'lr': 0.0003569247513033848, 'samples': 10594752, 'steps': 55180, 'loss/train': 1.6277837753295898} -11/07/2021 04:59:05 - INFO - __main__ - Step 55182: {'lr': 0.00035691995440050364, 'samples': 10594944, 'steps': 55181, 'loss/train': 1.5280399322509766} -11/07/2021 04:59:05 - INFO - __main__ - Step 55183: {'lr': 0.0003569151574494459, 'samples': 10595136, 'steps': 55182, 'loss/train': 2.082932472229004} -11/07/2021 04:59:05 - INFO - __main__ - Step 55184: {'lr': 0.00035691036045021384, 'samples': 10595328, 'steps': 55183, 'loss/train': 1.4191107749938965} -11/07/2021 04:59:06 - INFO - __main__ - Step 55185: {'lr': 0.0003569055634028097, 'samples': 10595520, 'steps': 55184, 'loss/train': 1.123810052871704} -11/07/2021 04:59:07 - INFO - __main__ - Step 55186: {'lr': 0.00035690076630723555, 'samples': 10595712, 'steps': 55185, 'loss/train': 1.7939107418060303} -11/07/2021 04:59:07 - INFO - __main__ - Step 55187: {'lr': 0.0003568959691634935, 'samples': 10595904, 'steps': 55186, 'loss/train': 1.6975566148757935} -11/07/2021 04:59:07 - INFO - __main__ - Step 55188: {'lr': 0.0003568911719715858, 'samples': 10596096, 'steps': 55187, 'loss/train': 1.7787225246429443} -11/07/2021 04:59:08 - INFO - __main__ - Step 55189: {'lr': 0.00035688637473151464, 'samples': 10596288, 'steps': 55188, 'loss/train': 1.1431853771209717} -11/07/2021 04:59:09 - INFO - __main__ - Step 55190: {'lr': 0.0003568815774432821, 'samples': 10596480, 'steps': 55189, 'loss/train': 1.4977154731750488} -11/07/2021 04:59:10 - INFO - __main__ - Step 55191: {'lr': 0.00035687678010689033, 'samples': 10596672, 'steps': 55190, 'loss/train': 0.1889737993478775} -11/07/2021 04:59:10 - INFO - __main__ - Step 55192: {'lr': 0.00035687198272234163, 'samples': 10596864, 'steps': 55191, 'loss/train': 1.3264491558074951} -11/07/2021 04:59:10 - INFO - __main__ - Step 55193: {'lr': 0.00035686718528963804, 'samples': 10597056, 'steps': 55192, 'loss/train': 1.0734184980392456} -11/07/2021 04:59:11 - INFO - __main__ - Step 55194: {'lr': 0.00035686238780878167, 'samples': 10597248, 'steps': 55193, 'loss/train': 1.3196901082992554} -11/07/2021 04:59:12 - INFO - __main__ - Step 55195: {'lr': 0.0003568575902797748, 'samples': 10597440, 'steps': 55194, 'loss/train': 1.5095797777175903} -11/07/2021 04:59:12 - INFO - __main__ - Step 55196: {'lr': 0.0003568527927026195, 'samples': 10597632, 'steps': 55195, 'loss/train': 1.3618577718734741} -11/07/2021 04:59:12 - INFO - __main__ - Step 55197: {'lr': 0.000356847995077318, 'samples': 10597824, 'steps': 55196, 'loss/train': 1.2174633741378784} -11/07/2021 04:59:13 - INFO - __main__ - Step 55198: {'lr': 0.0003568431974038725, 'samples': 10598016, 'steps': 55197, 'loss/train': 2.0520200729370117} -11/07/2021 04:59:13 - INFO - __main__ - Step 55199: {'lr': 0.0003568383996822851, 'samples': 10598208, 'steps': 55198, 'loss/train': 1.5670710802078247} -11/07/2021 04:59:14 - INFO - __main__ - Step 55200: {'lr': 0.0003568336019125579, 'samples': 10598400, 'steps': 55199, 'loss/train': 1.8527283668518066} -11/07/2021 04:59:14 - INFO - __main__ - Step 55201: {'lr': 0.0003568288040946931, 'samples': 10598592, 'steps': 55200, 'loss/train': 1.5662264823913574} -11/07/2021 04:59:15 - INFO - __main__ - Step 55202: {'lr': 0.000356824006228693, 'samples': 10598784, 'steps': 55201, 'loss/train': 1.0995025634765625} -11/07/2021 04:59:15 - INFO - __main__ - Step 55203: {'lr': 0.0003568192083145596, 'samples': 10598976, 'steps': 55202, 'loss/train': 1.422552466392517} -11/07/2021 04:59:15 - INFO - __main__ - Step 55204: {'lr': 0.0003568144103522951, 'samples': 10599168, 'steps': 55203, 'loss/train': 1.1638541221618652} -11/07/2021 04:59:16 - INFO - __main__ - Step 55205: {'lr': 0.00035680961234190166, 'samples': 10599360, 'steps': 55204, 'loss/train': 1.671225905418396} -11/07/2021 04:59:17 - INFO - __main__ - Step 55206: {'lr': 0.00035680481428338156, 'samples': 10599552, 'steps': 55205, 'loss/train': 1.1339223384857178} -11/07/2021 04:59:17 - INFO - __main__ - Step 55207: {'lr': 0.0003568000161767368, 'samples': 10599744, 'steps': 55206, 'loss/train': 1.547345519065857} -11/07/2021 04:59:18 - INFO - __main__ - Step 55208: {'lr': 0.0003567952180219696, 'samples': 10599936, 'steps': 55207, 'loss/train': 0.9051850438117981} -11/07/2021 04:59:18 - INFO - __main__ - Step 55209: {'lr': 0.00035679041981908206, 'samples': 10600128, 'steps': 55208, 'loss/train': 1.6167963743209839} -11/07/2021 04:59:19 - INFO - __main__ - Step 55210: {'lr': 0.0003567856215680765, 'samples': 10600320, 'steps': 55209, 'loss/train': 1.4095200300216675} -11/07/2021 04:59:19 - INFO - __main__ - Step 55211: {'lr': 0.0003567808232689549, 'samples': 10600512, 'steps': 55210, 'loss/train': 1.5192729234695435} -11/07/2021 04:59:20 - INFO - __main__ - Step 55212: {'lr': 0.00035677602492171953, 'samples': 10600704, 'steps': 55211, 'loss/train': 1.4212462902069092} -11/07/2021 04:59:20 - INFO - __main__ - Step 55213: {'lr': 0.0003567712265263726, 'samples': 10600896, 'steps': 55212, 'loss/train': 1.7365148067474365} -11/07/2021 04:59:20 - INFO - __main__ - Step 55214: {'lr': 0.0003567664280829161, 'samples': 10601088, 'steps': 55213, 'loss/train': 1.2166881561279297} -11/07/2021 04:59:21 - INFO - __main__ - Step 55215: {'lr': 0.0003567616295913524, 'samples': 10601280, 'steps': 55214, 'loss/train': 1.1411106586456299} -11/07/2021 04:59:22 - INFO - __main__ - Step 55216: {'lr': 0.0003567568310516834, 'samples': 10601472, 'steps': 55215, 'loss/train': 1.3288177251815796} -11/07/2021 04:59:22 - INFO - __main__ - Step 55217: {'lr': 0.0003567520324639116, 'samples': 10601664, 'steps': 55216, 'loss/train': 1.064652442932129} -11/07/2021 04:59:22 - INFO - __main__ - Step 55218: {'lr': 0.0003567472338280389, 'samples': 10601856, 'steps': 55217, 'loss/train': 1.6468113660812378} -11/07/2021 04:59:23 - INFO - __main__ - Step 55219: {'lr': 0.00035674243514406754, 'samples': 10602048, 'steps': 55218, 'loss/train': 1.756061315536499} -11/07/2021 04:59:23 - INFO - __main__ - Step 55220: {'lr': 0.00035673763641199974, 'samples': 10602240, 'steps': 55219, 'loss/train': 1.2694787979125977} -11/07/2021 04:59:24 - INFO - __main__ - Step 55221: {'lr': 0.0003567328376318375, 'samples': 10602432, 'steps': 55220, 'loss/train': 1.4165061712265015} -11/07/2021 04:59:25 - INFO - __main__ - Step 55222: {'lr': 0.0003567280388035832, 'samples': 10602624, 'steps': 55221, 'loss/train': 0.7822771668434143} -11/07/2021 04:59:25 - INFO - __main__ - Step 55223: {'lr': 0.0003567232399272388, 'samples': 10602816, 'steps': 55222, 'loss/train': 1.3410395383834839} -11/07/2021 04:59:25 - INFO - __main__ - Step 55224: {'lr': 0.0003567184410028066, 'samples': 10603008, 'steps': 55223, 'loss/train': 1.2008610963821411} -11/07/2021 04:59:26 - INFO - __main__ - Step 55225: {'lr': 0.0003567136420302887, 'samples': 10603200, 'steps': 55224, 'loss/train': 1.2869157791137695} -11/07/2021 04:59:27 - INFO - __main__ - Step 55226: {'lr': 0.00035670884300968735, 'samples': 10603392, 'steps': 55225, 'loss/train': 1.367020606994629} -11/07/2021 04:59:27 - INFO - __main__ - Step 55227: {'lr': 0.0003567040439410046, 'samples': 10603584, 'steps': 55226, 'loss/train': 1.6534112691879272} -11/07/2021 04:59:27 - INFO - __main__ - Step 55228: {'lr': 0.0003566992448242427, 'samples': 10603776, 'steps': 55227, 'loss/train': 1.0427751541137695} -11/07/2021 04:59:28 - INFO - __main__ - Step 55229: {'lr': 0.0003566944456594036, 'samples': 10603968, 'steps': 55228, 'loss/train': 1.3932331800460815} -11/07/2021 04:59:28 - INFO - __main__ - Step 55230: {'lr': 0.00035668964644648975, 'samples': 10604160, 'steps': 55229, 'loss/train': 1.6934592723846436} -11/07/2021 04:59:28 - INFO - __main__ - Step 55231: {'lr': 0.0003566848471855032, 'samples': 10604352, 'steps': 55230, 'loss/train': 1.457594633102417} -11/07/2021 04:59:29 - INFO - __main__ - Step 55232: {'lr': 0.0003566800478764461, 'samples': 10604544, 'steps': 55231, 'loss/train': 1.8326622247695923} -11/07/2021 04:59:30 - INFO - __main__ - Step 55233: {'lr': 0.00035667524851932066, 'samples': 10604736, 'steps': 55232, 'loss/train': 1.4921889305114746} -11/07/2021 04:59:30 - INFO - __main__ - Step 55234: {'lr': 0.0003566704491141289, 'samples': 10604928, 'steps': 55233, 'loss/train': 1.7390446662902832} -11/07/2021 04:59:30 - INFO - __main__ - Step 55235: {'lr': 0.0003566656496608731, 'samples': 10605120, 'steps': 55234, 'loss/train': 1.584368109703064} -11/07/2021 04:59:31 - INFO - __main__ - Step 55236: {'lr': 0.0003566608501595554, 'samples': 10605312, 'steps': 55235, 'loss/train': 1.5843379497528076} -11/07/2021 04:59:32 - INFO - __main__ - Step 55237: {'lr': 0.000356656050610178, 'samples': 10605504, 'steps': 55236, 'loss/train': 1.2228553295135498} -11/07/2021 04:59:32 - INFO - __main__ - Step 55238: {'lr': 0.000356651251012743, 'samples': 10605696, 'steps': 55237, 'loss/train': 1.507058024406433} -11/07/2021 04:59:32 - INFO - __main__ - Step 55239: {'lr': 0.0003566464513672527, 'samples': 10605888, 'steps': 55238, 'loss/train': 1.0552634000778198} -11/07/2021 04:59:33 - INFO - __main__ - Step 55240: {'lr': 0.00035664165167370907, 'samples': 10606080, 'steps': 55239, 'loss/train': 1.8468682765960693} -11/07/2021 04:59:33 - INFO - __main__ - Step 55241: {'lr': 0.0003566368519321144, 'samples': 10606272, 'steps': 55240, 'loss/train': 0.9865829944610596} -11/07/2021 04:59:34 - INFO - __main__ - Step 55242: {'lr': 0.0003566320521424707, 'samples': 10606464, 'steps': 55241, 'loss/train': 1.405584454536438} -11/07/2021 04:59:35 - INFO - __main__ - Step 55243: {'lr': 0.0003566272523047803, 'samples': 10606656, 'steps': 55242, 'loss/train': 1.6511468887329102} -11/07/2021 04:59:35 - INFO - __main__ - Step 55244: {'lr': 0.00035662245241904533, 'samples': 10606848, 'steps': 55243, 'loss/train': 1.335024118423462} -11/07/2021 04:59:35 - INFO - __main__ - Step 55245: {'lr': 0.0003566176524852679, 'samples': 10607040, 'steps': 55244, 'loss/train': 1.1019014120101929} -11/07/2021 04:59:36 - INFO - __main__ - Step 55246: {'lr': 0.00035661285250345023, 'samples': 10607232, 'steps': 55245, 'loss/train': 1.3142695426940918} -11/07/2021 04:59:37 - INFO - __main__ - Step 55247: {'lr': 0.00035660805247359444, 'samples': 10607424, 'steps': 55246, 'loss/train': 1.6288530826568604} -11/07/2021 04:59:37 - INFO - __main__ - Step 55248: {'lr': 0.0003566032523957027, 'samples': 10607616, 'steps': 55247, 'loss/train': 1.4779716730117798} -11/07/2021 04:59:37 - INFO - __main__ - Step 55249: {'lr': 0.00035659845226977715, 'samples': 10607808, 'steps': 55248, 'loss/train': 1.170922875404358} -11/07/2021 04:59:38 - INFO - __main__ - Step 55250: {'lr': 0.00035659365209582004, 'samples': 10608000, 'steps': 55249, 'loss/train': 1.358385682106018} -11/07/2021 04:59:38 - INFO - __main__ - Step 55251: {'lr': 0.00035658885187383343, 'samples': 10608192, 'steps': 55250, 'loss/train': 1.4741021394729614} -11/07/2021 04:59:39 - INFO - __main__ - Step 55252: {'lr': 0.0003565840516038196, 'samples': 10608384, 'steps': 55251, 'loss/train': 1.5403051376342773} -11/07/2021 04:59:39 - INFO - __main__ - Step 55253: {'lr': 0.00035657925128578064, 'samples': 10608576, 'steps': 55252, 'loss/train': 1.1264894008636475} -11/07/2021 04:59:40 - INFO - __main__ - Step 55254: {'lr': 0.00035657445091971863, 'samples': 10608768, 'steps': 55253, 'loss/train': 1.2137291431427002} -11/07/2021 04:59:40 - INFO - __main__ - Step 55255: {'lr': 0.00035656965050563584, 'samples': 10608960, 'steps': 55254, 'loss/train': 1.276440978050232} -11/07/2021 04:59:40 - INFO - __main__ - Step 55256: {'lr': 0.0003565648500435344, 'samples': 10609152, 'steps': 55255, 'loss/train': 1.6435093879699707} -11/07/2021 04:59:41 - INFO - __main__ - Step 55257: {'lr': 0.0003565600495334165, 'samples': 10609344, 'steps': 55256, 'loss/train': 0.828242838382721} -11/07/2021 04:59:42 - INFO - __main__ - Step 55258: {'lr': 0.0003565552489752843, 'samples': 10609536, 'steps': 55257, 'loss/train': 1.0416570901870728} -11/07/2021 04:59:42 - INFO - __main__ - Step 55259: {'lr': 0.0003565504483691399, 'samples': 10609728, 'steps': 55258, 'loss/train': 1.0516154766082764} -11/07/2021 04:59:42 - INFO - __main__ - Step 55260: {'lr': 0.0003565456477149856, 'samples': 10609920, 'steps': 55259, 'loss/train': 0.9261599779129028} -11/07/2021 04:59:43 - INFO - __main__ - Step 55261: {'lr': 0.0003565408470128234, 'samples': 10610112, 'steps': 55260, 'loss/train': 1.4984734058380127} -11/07/2021 04:59:44 - INFO - __main__ - Step 55262: {'lr': 0.00035653604626265556, 'samples': 10610304, 'steps': 55261, 'loss/train': 0.5827086567878723} -11/07/2021 04:59:44 - INFO - __main__ - Step 55263: {'lr': 0.00035653124546448423, 'samples': 10610496, 'steps': 55262, 'loss/train': 1.7296804189682007} -11/07/2021 04:59:45 - INFO - __main__ - Step 55264: {'lr': 0.0003565264446183116, 'samples': 10610688, 'steps': 55263, 'loss/train': 2.3289999961853027} -11/07/2021 04:59:45 - INFO - __main__ - Step 55265: {'lr': 0.00035652164372413975, 'samples': 10610880, 'steps': 55264, 'loss/train': 1.4187769889831543} -11/07/2021 04:59:45 - INFO - __main__ - Step 55266: {'lr': 0.0003565168427819709, 'samples': 10611072, 'steps': 55265, 'loss/train': 2.162388801574707} -11/07/2021 04:59:46 - INFO - __main__ - Step 55267: {'lr': 0.00035651204179180723, 'samples': 10611264, 'steps': 55266, 'loss/train': 1.417816162109375} -11/07/2021 04:59:47 - INFO - __main__ - Step 55268: {'lr': 0.00035650724075365084, 'samples': 10611456, 'steps': 55267, 'loss/train': 1.6270649433135986} -11/07/2021 04:59:47 - INFO - __main__ - Step 55269: {'lr': 0.000356502439667504, 'samples': 10611648, 'steps': 55268, 'loss/train': 2.0392963886260986} -11/07/2021 04:59:48 - INFO - __main__ - Step 55270: {'lr': 0.0003564976385333687, 'samples': 10611840, 'steps': 55269, 'loss/train': 1.2095744609832764} -11/07/2021 04:59:48 - INFO - __main__ - Step 55271: {'lr': 0.00035649283735124723, 'samples': 10612032, 'steps': 55270, 'loss/train': 1.201027512550354} -11/07/2021 04:59:48 - INFO - __main__ - Step 55272: {'lr': 0.0003564880361211418, 'samples': 10612224, 'steps': 55271, 'loss/train': 1.771641731262207} -11/07/2021 04:59:49 - INFO - __main__ - Step 55273: {'lr': 0.00035648323484305445, 'samples': 10612416, 'steps': 55272, 'loss/train': 1.5814708471298218} -11/07/2021 04:59:50 - INFO - __main__ - Step 55274: {'lr': 0.00035647843351698736, 'samples': 10612608, 'steps': 55273, 'loss/train': 1.9617000818252563} -11/07/2021 04:59:50 - INFO - __main__ - Step 55275: {'lr': 0.0003564736321429428, 'samples': 10612800, 'steps': 55274, 'loss/train': 1.4196951389312744} -11/07/2021 04:59:50 - INFO - __main__ - Step 55276: {'lr': 0.00035646883072092285, 'samples': 10612992, 'steps': 55275, 'loss/train': 1.2456954717636108} -11/07/2021 04:59:51 - INFO - __main__ - Step 55277: {'lr': 0.00035646402925092966, 'samples': 10613184, 'steps': 55276, 'loss/train': 1.528760552406311} -11/07/2021 04:59:52 - INFO - __main__ - Step 55278: {'lr': 0.00035645922773296546, 'samples': 10613376, 'steps': 55277, 'loss/train': 1.3044077157974243} -11/07/2021 04:59:52 - INFO - __main__ - Step 55279: {'lr': 0.0003564544261670324, 'samples': 10613568, 'steps': 55278, 'loss/train': 1.3315811157226562} -11/07/2021 04:59:52 - INFO - __main__ - Step 55280: {'lr': 0.0003564496245531326, 'samples': 10613760, 'steps': 55279, 'loss/train': 1.7874959707260132} -11/07/2021 04:59:53 - INFO - __main__ - Step 55281: {'lr': 0.0003564448228912682, 'samples': 10613952, 'steps': 55280, 'loss/train': 1.3334084749221802} -11/07/2021 04:59:53 - INFO - __main__ - Step 55282: {'lr': 0.0003564400211814414, 'samples': 10614144, 'steps': 55281, 'loss/train': 1.3982524871826172} -11/07/2021 04:59:54 - INFO - __main__ - Step 55283: {'lr': 0.0003564352194236544, 'samples': 10614336, 'steps': 55282, 'loss/train': 1.5548148155212402} -11/07/2021 04:59:55 - INFO - __main__ - Step 55284: {'lr': 0.00035643041761790936, 'samples': 10614528, 'steps': 55283, 'loss/train': 1.3802969455718994} -11/07/2021 04:59:55 - INFO - __main__ - Step 55285: {'lr': 0.00035642561576420834, 'samples': 10614720, 'steps': 55284, 'loss/train': 1.5726593732833862} -11/07/2021 04:59:55 - INFO - __main__ - Step 55286: {'lr': 0.00035642081386255366, 'samples': 10614912, 'steps': 55285, 'loss/train': 1.7341140508651733} -11/07/2021 04:59:56 - INFO - __main__ - Step 55287: {'lr': 0.0003564160119129473, 'samples': 10615104, 'steps': 55286, 'loss/train': 1.3809142112731934} -11/07/2021 04:59:56 - INFO - __main__ - Step 55288: {'lr': 0.0003564112099153916, 'samples': 10615296, 'steps': 55287, 'loss/train': 0.09288747608661652} -11/07/2021 04:59:57 - INFO - __main__ - Step 55289: {'lr': 0.00035640640786988866, 'samples': 10615488, 'steps': 55288, 'loss/train': 1.3767549991607666} -11/07/2021 04:59:58 - INFO - __main__ - Step 55290: {'lr': 0.0003564016057764406, 'samples': 10615680, 'steps': 55289, 'loss/train': 1.3744242191314697} -11/07/2021 04:59:58 - INFO - __main__ - Step 55291: {'lr': 0.00035639680363504965, 'samples': 10615872, 'steps': 55290, 'loss/train': 0.11196830868721008} -11/07/2021 04:59:59 - INFO - __main__ - Step 55292: {'lr': 0.0003563920014457179, 'samples': 10616064, 'steps': 55291, 'loss/train': 1.2871259450912476} -11/07/2021 04:59:59 - INFO - __main__ - Step 55293: {'lr': 0.0003563871992084476, 'samples': 10616256, 'steps': 55292, 'loss/train': 1.16878342628479} -11/07/2021 05:00:00 - INFO - __main__ - Step 55294: {'lr': 0.0003563823969232409, 'samples': 10616448, 'steps': 55293, 'loss/train': 1.460994005203247} -11/07/2021 05:00:00 - INFO - __main__ - Step 55295: {'lr': 0.0003563775945900999, 'samples': 10616640, 'steps': 55294, 'loss/train': 0.4720584750175476} -11/07/2021 05:00:01 - INFO - __main__ - Step 55296: {'lr': 0.00035637279220902677, 'samples': 10616832, 'steps': 55295, 'loss/train': 1.453580379486084} -11/07/2021 05:00:01 - INFO - __main__ - Step 55297: {'lr': 0.00035636798978002374, 'samples': 10617024, 'steps': 55296, 'loss/train': 1.009641408920288} -11/07/2021 05:00:01 - INFO - __main__ - Step 55298: {'lr': 0.00035636318730309285, 'samples': 10617216, 'steps': 55297, 'loss/train': 1.3926947116851807} -11/07/2021 05:00:02 - INFO - __main__ - Step 55299: {'lr': 0.0003563583847782364, 'samples': 10617408, 'steps': 55298, 'loss/train': 1.8583132028579712} -11/07/2021 05:00:03 - INFO - __main__ - Step 55300: {'lr': 0.0003563535822054565, 'samples': 10617600, 'steps': 55299, 'loss/train': 1.485907793045044} -11/07/2021 05:00:03 - INFO - __main__ - Step 55301: {'lr': 0.00035634877958475535, 'samples': 10617792, 'steps': 55300, 'loss/train': 1.32669198513031} -11/07/2021 05:00:03 - INFO - __main__ - Step 55302: {'lr': 0.0003563439769161351, 'samples': 10617984, 'steps': 55301, 'loss/train': 1.3650391101837158} -11/07/2021 05:00:04 - INFO - __main__ - Step 55303: {'lr': 0.00035633917419959784, 'samples': 10618176, 'steps': 55302, 'loss/train': 1.4098504781723022} -11/07/2021 05:00:05 - INFO - __main__ - Step 55304: {'lr': 0.0003563343714351458, 'samples': 10618368, 'steps': 55303, 'loss/train': 0.8533596992492676} -11/07/2021 05:00:06 - INFO - __main__ - Step 55305: {'lr': 0.0003563295686227811, 'samples': 10618560, 'steps': 55304, 'loss/train': 1.6199250221252441} -11/07/2021 05:00:06 - INFO - __main__ - Step 55306: {'lr': 0.000356324765762506, 'samples': 10618752, 'steps': 55305, 'loss/train': 1.3163352012634277} -11/07/2021 05:00:06 - INFO - __main__ - Step 55307: {'lr': 0.0003563199628543226, 'samples': 10618944, 'steps': 55306, 'loss/train': 0.8771881461143494} -11/07/2021 05:00:07 - INFO - __main__ - Step 55308: {'lr': 0.00035631515989823306, 'samples': 10619136, 'steps': 55307, 'loss/train': 1.5897128582000732} -11/07/2021 05:00:08 - INFO - __main__ - Step 55309: {'lr': 0.0003563103568942395, 'samples': 10619328, 'steps': 55308, 'loss/train': 0.20608165860176086} -11/07/2021 05:00:08 - INFO - __main__ - Step 55310: {'lr': 0.0003563055538423441, 'samples': 10619520, 'steps': 55309, 'loss/train': 1.151322603225708} -11/07/2021 05:00:08 - INFO - __main__ - Step 55311: {'lr': 0.00035630075074254917, 'samples': 10619712, 'steps': 55310, 'loss/train': 1.5774955749511719} -11/07/2021 05:00:09 - INFO - __main__ - Step 55312: {'lr': 0.0003562959475948567, 'samples': 10619904, 'steps': 55311, 'loss/train': 1.6166630983352661} -11/07/2021 05:00:09 - INFO - __main__ - Step 55313: {'lr': 0.00035629114439926897, 'samples': 10620096, 'steps': 55312, 'loss/train': 1.3984489440917969} -11/07/2021 05:00:10 - INFO - __main__ - Step 55314: {'lr': 0.00035628634115578806, 'samples': 10620288, 'steps': 55313, 'loss/train': 1.7488480806350708} -11/07/2021 05:00:11 - INFO - __main__ - Step 55315: {'lr': 0.00035628153786441616, 'samples': 10620480, 'steps': 55314, 'loss/train': 1.669127345085144} -11/07/2021 05:00:11 - INFO - __main__ - Step 55316: {'lr': 0.0003562767345251554, 'samples': 10620672, 'steps': 55315, 'loss/train': 1.605141282081604} -11/07/2021 05:00:11 - INFO - __main__ - Step 55317: {'lr': 0.00035627193113800797, 'samples': 10620864, 'steps': 55316, 'loss/train': 1.0980522632598877} -11/07/2021 05:00:12 - INFO - __main__ - Step 55318: {'lr': 0.0003562671277029761, 'samples': 10621056, 'steps': 55317, 'loss/train': 1.114978313446045} -11/07/2021 05:00:13 - INFO - __main__ - Step 55319: {'lr': 0.00035626232422006186, 'samples': 10621248, 'steps': 55318, 'loss/train': 0.24382823705673218} -11/07/2021 05:00:13 - INFO - __main__ - Step 55320: {'lr': 0.0003562575206892676, 'samples': 10621440, 'steps': 55319, 'loss/train': 1.6088790893554688} -11/07/2021 05:00:13 - INFO - __main__ - Step 55321: {'lr': 0.0003562527171105952, 'samples': 10621632, 'steps': 55320, 'loss/train': 1.1404860019683838} -11/07/2021 05:00:14 - INFO - __main__ - Step 55322: {'lr': 0.000356247913484047, 'samples': 10621824, 'steps': 55321, 'loss/train': 1.7770678997039795} -11/07/2021 05:00:14 - INFO - __main__ - Step 55323: {'lr': 0.00035624310980962516, 'samples': 10622016, 'steps': 55322, 'loss/train': 1.3695993423461914} -11/07/2021 05:00:16 - INFO - __main__ - Step 55324: {'lr': 0.0003562383060873318, 'samples': 10622208, 'steps': 55323, 'loss/train': 1.3157083988189697} -11/07/2021 05:00:16 - INFO - __main__ - Step 55325: {'lr': 0.000356233502317169, 'samples': 10622400, 'steps': 55324, 'loss/train': 1.2763516902923584} -11/07/2021 05:00:17 - INFO - __main__ - Step 55326: {'lr': 0.00035622869849913916, 'samples': 10622592, 'steps': 55325, 'loss/train': 1.2261382341384888} -11/07/2021 05:00:17 - INFO - __main__ - Step 55327: {'lr': 0.00035622389463324424, 'samples': 10622784, 'steps': 55326, 'loss/train': 1.374090313911438} -11/07/2021 05:00:17 - INFO - __main__ - Step 55328: {'lr': 0.0003562190907194865, 'samples': 10622976, 'steps': 55327, 'loss/train': 1.3394628763198853} -11/07/2021 05:00:18 - INFO - __main__ - Step 55329: {'lr': 0.00035621428675786804, 'samples': 10623168, 'steps': 55328, 'loss/train': 0.39241358637809753} -11/07/2021 05:00:19 - INFO - __main__ - Step 55330: {'lr': 0.0003562094827483911, 'samples': 10623360, 'steps': 55329, 'loss/train': 0.10898163914680481} -11/07/2021 05:00:19 - INFO - __main__ - Step 55331: {'lr': 0.0003562046786910578, 'samples': 10623552, 'steps': 55330, 'loss/train': 1.525092363357544} -11/07/2021 05:00:19 - INFO - __main__ - Step 55332: {'lr': 0.0003561998745858703, 'samples': 10623744, 'steps': 55331, 'loss/train': 1.3611594438552856} -11/07/2021 05:00:20 - INFO - __main__ - Step 55333: {'lr': 0.00035619507043283075, 'samples': 10623936, 'steps': 55332, 'loss/train': 1.5670605897903442} -11/07/2021 05:00:20 - INFO - __main__ - Step 55334: {'lr': 0.0003561902662319414, 'samples': 10624128, 'steps': 55333, 'loss/train': 0.6823264360427856} -11/07/2021 05:00:21 - INFO - __main__ - Step 55335: {'lr': 0.00035618546198320426, 'samples': 10624320, 'steps': 55334, 'loss/train': 1.4306527376174927} -11/07/2021 05:00:22 - INFO - __main__ - Step 55336: {'lr': 0.0003561806576866217, 'samples': 10624512, 'steps': 55335, 'loss/train': 0.6125316619873047} -11/07/2021 05:00:22 - INFO - __main__ - Step 55337: {'lr': 0.0003561758533421957, 'samples': 10624704, 'steps': 55336, 'loss/train': 1.3668783903121948} -11/07/2021 05:00:22 - INFO - __main__ - Step 55338: {'lr': 0.00035617104894992854, 'samples': 10624896, 'steps': 55337, 'loss/train': 1.2590347528457642} -11/07/2021 05:00:23 - INFO - __main__ - Step 55339: {'lr': 0.00035616624450982227, 'samples': 10625088, 'steps': 55338, 'loss/train': 1.9527186155319214} -11/07/2021 05:00:24 - INFO - __main__ - Step 55340: {'lr': 0.0003561614400218792, 'samples': 10625280, 'steps': 55339, 'loss/train': 1.564045786857605} -11/07/2021 05:00:24 - INFO - __main__ - Step 55341: {'lr': 0.00035615663548610145, 'samples': 10625472, 'steps': 55340, 'loss/train': 1.387307047843933} -11/07/2021 05:00:24 - INFO - __main__ - Step 55342: {'lr': 0.0003561518309024911, 'samples': 10625664, 'steps': 55341, 'loss/train': 1.4752954244613647} -11/07/2021 05:00:25 - INFO - __main__ - Step 55343: {'lr': 0.0003561470262710504, 'samples': 10625856, 'steps': 55342, 'loss/train': 1.4978200197219849} -11/07/2021 05:00:25 - INFO - __main__ - Step 55344: {'lr': 0.00035614222159178143, 'samples': 10626048, 'steps': 55343, 'loss/train': 1.1438692808151245} -11/07/2021 05:00:26 - INFO - __main__ - Step 55345: {'lr': 0.00035613741686468646, 'samples': 10626240, 'steps': 55344, 'loss/train': 1.4912155866622925} -11/07/2021 05:00:27 - INFO - __main__ - Step 55346: {'lr': 0.0003561326120897676, 'samples': 10626432, 'steps': 55345, 'loss/train': 1.2749402523040771} -11/07/2021 05:00:27 - INFO - __main__ - Step 55347: {'lr': 0.00035612780726702707, 'samples': 10626624, 'steps': 55346, 'loss/train': 1.9267258644104004} -11/07/2021 05:00:27 - INFO - __main__ - Step 55348: {'lr': 0.00035612300239646694, 'samples': 10626816, 'steps': 55347, 'loss/train': 1.3484121561050415} -11/07/2021 05:00:28 - INFO - __main__ - Step 55349: {'lr': 0.00035611819747808943, 'samples': 10627008, 'steps': 55348, 'loss/train': 1.1575568914413452} -11/07/2021 05:00:28 - INFO - __main__ - Step 55350: {'lr': 0.00035611339251189665, 'samples': 10627200, 'steps': 55349, 'loss/train': 1.8071938753128052} -11/07/2021 05:00:29 - INFO - __main__ - Step 55351: {'lr': 0.0003561085874978909, 'samples': 10627392, 'steps': 55350, 'loss/train': 2.0694077014923096} -11/07/2021 05:00:29 - INFO - __main__ - Step 55352: {'lr': 0.00035610378243607424, 'samples': 10627584, 'steps': 55351, 'loss/train': 1.7644639015197754} -11/07/2021 05:00:30 - INFO - __main__ - Step 55353: {'lr': 0.0003560989773264488, 'samples': 10627776, 'steps': 55352, 'loss/train': 1.836050271987915} -11/07/2021 05:00:30 - INFO - __main__ - Step 55354: {'lr': 0.00035609417216901683, 'samples': 10627968, 'steps': 55353, 'loss/train': 0.966948390007019} -11/07/2021 05:00:30 - INFO - __main__ - Step 55355: {'lr': 0.00035608936696378046, 'samples': 10628160, 'steps': 55354, 'loss/train': 1.9758682250976562} -11/07/2021 05:00:31 - INFO - __main__ - Step 55356: {'lr': 0.0003560845617107419, 'samples': 10628352, 'steps': 55355, 'loss/train': 1.2718393802642822} -11/07/2021 05:00:32 - INFO - __main__ - Step 55357: {'lr': 0.0003560797564099032, 'samples': 10628544, 'steps': 55356, 'loss/train': 1.1412488222122192} -11/07/2021 05:00:32 - INFO - __main__ - Step 55358: {'lr': 0.00035607495106126664, 'samples': 10628736, 'steps': 55357, 'loss/train': 1.7440805435180664} -11/07/2021 05:00:33 - INFO - __main__ - Step 55359: {'lr': 0.0003560701456648343, 'samples': 10628928, 'steps': 55358, 'loss/train': 1.2522573471069336} -11/07/2021 05:00:33 - INFO - __main__ - Step 55360: {'lr': 0.0003560653402206085, 'samples': 10629120, 'steps': 55359, 'loss/train': 1.4632554054260254} -11/07/2021 05:00:34 - INFO - __main__ - Step 55361: {'lr': 0.0003560605347285912, 'samples': 10629312, 'steps': 55360, 'loss/train': 1.911437749862671} -11/07/2021 05:00:34 - INFO - __main__ - Step 55362: {'lr': 0.0003560557291887847, 'samples': 10629504, 'steps': 55361, 'loss/train': 1.4185771942138672} -11/07/2021 05:00:35 - INFO - __main__ - Step 55363: {'lr': 0.0003560509236011911, 'samples': 10629696, 'steps': 55362, 'loss/train': 1.55713951587677} -11/07/2021 05:00:35 - INFO - __main__ - Step 55364: {'lr': 0.0003560461179658125, 'samples': 10629888, 'steps': 55363, 'loss/train': 2.0547432899475098} -11/07/2021 05:00:35 - INFO - __main__ - Step 55365: {'lr': 0.0003560413122826513, 'samples': 10630080, 'steps': 55364, 'loss/train': 1.1069855690002441} -11/07/2021 05:00:36 - INFO - __main__ - Step 55366: {'lr': 0.0003560365065517095, 'samples': 10630272, 'steps': 55365, 'loss/train': 1.6910406351089478} -11/07/2021 05:00:37 - INFO - __main__ - Step 55367: {'lr': 0.0003560317007729893, 'samples': 10630464, 'steps': 55366, 'loss/train': 1.2973557710647583} -11/07/2021 05:00:37 - INFO - __main__ - Step 55368: {'lr': 0.00035602689494649274, 'samples': 10630656, 'steps': 55367, 'loss/train': 1.5025098323822021} -11/07/2021 05:00:37 - INFO - __main__ - Step 55369: {'lr': 0.0003560220890722222, 'samples': 10630848, 'steps': 55368, 'loss/train': 1.8217743635177612} -11/07/2021 05:00:38 - INFO - __main__ - Step 55370: {'lr': 0.00035601728315017966, 'samples': 10631040, 'steps': 55369, 'loss/train': 1.04408597946167} -11/07/2021 05:00:39 - INFO - __main__ - Step 55371: {'lr': 0.00035601247718036744, 'samples': 10631232, 'steps': 55370, 'loss/train': 1.1525126695632935} -11/07/2021 05:00:39 - INFO - __main__ - Step 55372: {'lr': 0.00035600767116278765, 'samples': 10631424, 'steps': 55371, 'loss/train': 1.5420783758163452} -11/07/2021 05:00:39 - INFO - __main__ - Step 55373: {'lr': 0.0003560028650974424, 'samples': 10631616, 'steps': 55372, 'loss/train': 1.541002869606018} -11/07/2021 05:00:40 - INFO - __main__ - Step 55374: {'lr': 0.0003559980589843339, 'samples': 10631808, 'steps': 55373, 'loss/train': 1.1891919374465942} -11/07/2021 05:00:40 - INFO - __main__ - Step 55375: {'lr': 0.0003559932528234643, 'samples': 10632000, 'steps': 55374, 'loss/train': 1.2719550132751465} -11/07/2021 05:00:41 - INFO - __main__ - Step 55376: {'lr': 0.0003559884466148358, 'samples': 10632192, 'steps': 55375, 'loss/train': 1.1132653951644897} -11/07/2021 05:00:41 - INFO - __main__ - Step 55377: {'lr': 0.0003559836403584505, 'samples': 10632384, 'steps': 55376, 'loss/train': 1.6261625289916992} -11/07/2021 05:00:42 - INFO - __main__ - Step 55378: {'lr': 0.00035597883405431066, 'samples': 10632576, 'steps': 55377, 'loss/train': 1.1378587484359741} -11/07/2021 05:00:42 - INFO - __main__ - Step 55379: {'lr': 0.0003559740277024183, 'samples': 10632768, 'steps': 55378, 'loss/train': 1.080365777015686} -11/07/2021 05:00:43 - INFO - __main__ - Step 55380: {'lr': 0.0003559692213027758, 'samples': 10632960, 'steps': 55379, 'loss/train': 1.2772960662841797} -11/07/2021 05:00:43 - INFO - __main__ - Step 55381: {'lr': 0.00035596441485538513, 'samples': 10633152, 'steps': 55380, 'loss/train': 0.5054352283477783} -11/07/2021 05:00:44 - INFO - __main__ - Step 55382: {'lr': 0.00035595960836024856, 'samples': 10633344, 'steps': 55381, 'loss/train': 0.09342030435800552} -11/07/2021 05:00:44 - INFO - __main__ - Step 55383: {'lr': 0.00035595480181736816, 'samples': 10633536, 'steps': 55382, 'loss/train': 0.9672507047653198} -11/07/2021 05:00:45 - INFO - __main__ - Step 55384: {'lr': 0.0003559499952267462, 'samples': 10633728, 'steps': 55383, 'loss/train': 1.3447973728179932} -11/07/2021 05:00:45 - INFO - __main__ - Step 55385: {'lr': 0.00035594518858838485, 'samples': 10633920, 'steps': 55384, 'loss/train': 1.415655255317688} -11/07/2021 05:00:46 - INFO - __main__ - Step 55386: {'lr': 0.0003559403819022862, 'samples': 10634112, 'steps': 55385, 'loss/train': 1.2938896417617798} -11/07/2021 05:00:46 - INFO - __main__ - Step 55387: {'lr': 0.0003559355751684525, 'samples': 10634304, 'steps': 55386, 'loss/train': 1.2487860918045044} -11/07/2021 05:00:47 - INFO - __main__ - Step 55388: {'lr': 0.00035593076838688576, 'samples': 10634496, 'steps': 55387, 'loss/train': 1.5711008310317993} -11/07/2021 05:00:47 - INFO - __main__ - Step 55389: {'lr': 0.0003559259615575883, 'samples': 10634688, 'steps': 55388, 'loss/train': 0.8426490426063538} -11/07/2021 05:00:47 - INFO - __main__ - Step 55390: {'lr': 0.00035592115468056223, 'samples': 10634880, 'steps': 55389, 'loss/train': 1.5957858562469482} -11/07/2021 05:00:48 - INFO - __main__ - Step 55391: {'lr': 0.0003559163477558098, 'samples': 10635072, 'steps': 55390, 'loss/train': 1.5772674083709717} -11/07/2021 05:00:49 - INFO - __main__ - Step 55392: {'lr': 0.000355911540783333, 'samples': 10635264, 'steps': 55391, 'loss/train': 1.4916237592697144} -11/07/2021 05:00:49 - INFO - __main__ - Step 55393: {'lr': 0.0003559067337631341, 'samples': 10635456, 'steps': 55392, 'loss/train': 1.1380609273910522} -11/07/2021 05:00:49 - INFO - __main__ - Step 55394: {'lr': 0.0003559019266952153, 'samples': 10635648, 'steps': 55393, 'loss/train': 1.0099992752075195} -11/07/2021 05:00:50 - INFO - __main__ - Step 55395: {'lr': 0.0003558971195795787, 'samples': 10635840, 'steps': 55394, 'loss/train': 1.6600886583328247} -11/07/2021 05:00:50 - INFO - __main__ - Step 55396: {'lr': 0.00035589231241622653, 'samples': 10636032, 'steps': 55395, 'loss/train': 1.3273447751998901} -11/07/2021 05:00:51 - INFO - __main__ - Step 55397: {'lr': 0.0003558875052051609, 'samples': 10636224, 'steps': 55396, 'loss/train': 1.3793827295303345} -11/07/2021 05:00:52 - INFO - __main__ - Step 55398: {'lr': 0.000355882697946384, 'samples': 10636416, 'steps': 55397, 'loss/train': 1.4172426462173462} -11/07/2021 05:00:52 - INFO - __main__ - Step 55399: {'lr': 0.00035587789063989793, 'samples': 10636608, 'steps': 55398, 'loss/train': 1.429591417312622} -11/07/2021 05:00:52 - INFO - __main__ - Step 55400: {'lr': 0.0003558730832857049, 'samples': 10636800, 'steps': 55399, 'loss/train': 1.3588968515396118} -11/07/2021 05:00:53 - INFO - __main__ - Step 55401: {'lr': 0.00035586827588380724, 'samples': 10636992, 'steps': 55400, 'loss/train': 1.4501574039459229} -11/07/2021 05:00:54 - INFO - __main__ - Step 55402: {'lr': 0.00035586346843420694, 'samples': 10637184, 'steps': 55401, 'loss/train': 1.075702428817749} -11/07/2021 05:00:54 - INFO - __main__ - Step 55403: {'lr': 0.0003558586609369061, 'samples': 10637376, 'steps': 55402, 'loss/train': 1.8202695846557617} -11/07/2021 05:00:54 - INFO - __main__ - Step 55404: {'lr': 0.000355853853391907, 'samples': 10637568, 'steps': 55403, 'loss/train': 2.1382062435150146} -11/07/2021 05:00:55 - INFO - __main__ - Step 55405: {'lr': 0.0003558490457992118, 'samples': 10637760, 'steps': 55404, 'loss/train': 0.784355878829956} -11/07/2021 05:00:55 - INFO - __main__ - Step 55406: {'lr': 0.00035584423815882265, 'samples': 10637952, 'steps': 55405, 'loss/train': 1.167901873588562} -11/07/2021 05:00:56 - INFO - __main__ - Step 55407: {'lr': 0.00035583943047074173, 'samples': 10638144, 'steps': 55406, 'loss/train': 1.8354178667068481} -11/07/2021 05:00:57 - INFO - __main__ - Step 55408: {'lr': 0.00035583462273497125, 'samples': 10638336, 'steps': 55407, 'loss/train': 1.2057093381881714} -11/07/2021 05:00:57 - INFO - __main__ - Step 55409: {'lr': 0.0003558298149515132, 'samples': 10638528, 'steps': 55408, 'loss/train': 1.6236366033554077} -11/07/2021 05:00:57 - INFO - __main__ - Step 55410: {'lr': 0.00035582500712037, 'samples': 10638720, 'steps': 55409, 'loss/train': 1.6326333284378052} -11/07/2021 05:00:58 - INFO - __main__ - Step 55411: {'lr': 0.0003558201992415436, 'samples': 10638912, 'steps': 55410, 'loss/train': 0.08839976787567139} -11/07/2021 05:00:59 - INFO - __main__ - Step 55412: {'lr': 0.00035581539131503625, 'samples': 10639104, 'steps': 55411, 'loss/train': 1.2671127319335938} -11/07/2021 05:00:59 - INFO - __main__ - Step 55413: {'lr': 0.00035581058334085015, 'samples': 10639296, 'steps': 55412, 'loss/train': 1.4644861221313477} -11/07/2021 05:00:59 - INFO - __main__ - Step 55414: {'lr': 0.00035580577531898745, 'samples': 10639488, 'steps': 55413, 'loss/train': 1.4764949083328247} -11/07/2021 05:01:00 - INFO - __main__ - Step 55415: {'lr': 0.00035580096724945027, 'samples': 10639680, 'steps': 55414, 'loss/train': 1.5854401588439941} -11/07/2021 05:01:00 - INFO - __main__ - Step 55416: {'lr': 0.00035579615913224077, 'samples': 10639872, 'steps': 55415, 'loss/train': 1.243757724761963} -11/07/2021 05:01:01 - INFO - __main__ - Step 55417: {'lr': 0.0003557913509673612, 'samples': 10640064, 'steps': 55416, 'loss/train': 1.207960844039917} -11/07/2021 05:01:02 - INFO - __main__ - Step 55418: {'lr': 0.0003557865427548137, 'samples': 10640256, 'steps': 55417, 'loss/train': 0.07647102326154709} -11/07/2021 05:01:02 - INFO - __main__ - Step 55419: {'lr': 0.0003557817344946004, 'samples': 10640448, 'steps': 55418, 'loss/train': 1.532102108001709} -11/07/2021 05:01:02 - INFO - __main__ - Step 55420: {'lr': 0.0003557769261867235, 'samples': 10640640, 'steps': 55419, 'loss/train': 1.1410948038101196} -11/07/2021 05:01:03 - INFO - __main__ - Step 55421: {'lr': 0.0003557721178311851, 'samples': 10640832, 'steps': 55420, 'loss/train': 1.5957534313201904} -11/07/2021 05:01:04 - INFO - __main__ - Step 55422: {'lr': 0.0003557673094279874, 'samples': 10641024, 'steps': 55421, 'loss/train': 1.580186128616333} -11/07/2021 05:01:04 - INFO - __main__ - Step 55423: {'lr': 0.00035576250097713263, 'samples': 10641216, 'steps': 55422, 'loss/train': 1.1744462251663208} -11/07/2021 05:01:05 - INFO - __main__ - Step 55424: {'lr': 0.00035575769247862295, 'samples': 10641408, 'steps': 55423, 'loss/train': 1.4780709743499756} -11/07/2021 05:01:05 - INFO - __main__ - Step 55425: {'lr': 0.0003557528839324604, 'samples': 10641600, 'steps': 55424, 'loss/train': 0.10940485447645187} -11/07/2021 05:01:05 - INFO - __main__ - Step 55426: {'lr': 0.0003557480753386473, 'samples': 10641792, 'steps': 55425, 'loss/train': 1.5092653036117554} -11/07/2021 05:01:06 - INFO - __main__ - Step 55427: {'lr': 0.0003557432666971857, 'samples': 10641984, 'steps': 55426, 'loss/train': 1.1131150722503662} -11/07/2021 05:01:07 - INFO - __main__ - Step 55428: {'lr': 0.0003557384580080778, 'samples': 10642176, 'steps': 55427, 'loss/train': 1.2832558155059814} -11/07/2021 05:01:07 - INFO - __main__ - Step 55429: {'lr': 0.0003557336492713258, 'samples': 10642368, 'steps': 55428, 'loss/train': 1.6966832876205444} -11/07/2021 05:01:07 - INFO - __main__ - Step 55430: {'lr': 0.00035572884048693193, 'samples': 10642560, 'steps': 55429, 'loss/train': 1.5837956666946411} -11/07/2021 05:01:08 - INFO - __main__ - Step 55431: {'lr': 0.0003557240316548982, 'samples': 10642752, 'steps': 55430, 'loss/train': 1.6265196800231934} -11/07/2021 05:01:09 - INFO - __main__ - Step 55432: {'lr': 0.0003557192227752268, 'samples': 10642944, 'steps': 55431, 'loss/train': 1.322920322418213} -11/07/2021 05:01:09 - INFO - __main__ - Step 55433: {'lr': 0.00035571441384792005, 'samples': 10643136, 'steps': 55432, 'loss/train': 1.5318617820739746} -11/07/2021 05:01:09 - INFO - __main__ - Step 55434: {'lr': 0.00035570960487298, 'samples': 10643328, 'steps': 55433, 'loss/train': 1.135300636291504} -11/07/2021 05:01:10 - INFO - __main__ - Step 55435: {'lr': 0.00035570479585040883, 'samples': 10643520, 'steps': 55434, 'loss/train': 1.3599398136138916} -11/07/2021 05:01:10 - INFO - __main__ - Step 55436: {'lr': 0.00035569998678020866, 'samples': 10643712, 'steps': 55435, 'loss/train': 1.7021390199661255} -11/07/2021 05:01:11 - INFO - __main__ - Step 55437: {'lr': 0.0003556951776623817, 'samples': 10643904, 'steps': 55436, 'loss/train': 1.6679959297180176} -11/07/2021 05:01:12 - INFO - __main__ - Step 55438: {'lr': 0.0003556903684969302, 'samples': 10644096, 'steps': 55437, 'loss/train': 1.413353681564331} -11/07/2021 05:01:12 - INFO - __main__ - Step 55439: {'lr': 0.0003556855592838562, 'samples': 10644288, 'steps': 55438, 'loss/train': 0.949391782283783} -11/07/2021 05:01:12 - INFO - __main__ - Step 55440: {'lr': 0.00035568075002316194, 'samples': 10644480, 'steps': 55439, 'loss/train': 1.5333319902420044} -11/07/2021 05:01:13 - INFO - __main__ - Step 55441: {'lr': 0.0003556759407148496, 'samples': 10644672, 'steps': 55440, 'loss/train': 1.7259225845336914} -11/07/2021 05:01:14 - INFO - __main__ - Step 55442: {'lr': 0.00035567113135892125, 'samples': 10644864, 'steps': 55441, 'loss/train': 1.1740769147872925} -11/07/2021 05:01:14 - INFO - __main__ - Step 55443: {'lr': 0.0003556663219553791, 'samples': 10645056, 'steps': 55442, 'loss/train': 1.4690876007080078} -11/07/2021 05:01:14 - INFO - __main__ - Step 55444: {'lr': 0.00035566151250422543, 'samples': 10645248, 'steps': 55443, 'loss/train': 1.029263973236084} -11/07/2021 05:01:15 - INFO - __main__ - Step 55445: {'lr': 0.0003556567030054622, 'samples': 10645440, 'steps': 55444, 'loss/train': 2.324265480041504} -11/07/2021 05:01:15 - INFO - __main__ - Step 55446: {'lr': 0.00035565189345909177, 'samples': 10645632, 'steps': 55445, 'loss/train': 1.2199026346206665} -11/07/2021 05:01:16 - INFO - __main__ - Step 55447: {'lr': 0.0003556470838651162, 'samples': 10645824, 'steps': 55446, 'loss/train': 0.14488187432289124} -11/07/2021 05:01:17 - INFO - __main__ - Step 55448: {'lr': 0.0003556422742235377, 'samples': 10646016, 'steps': 55447, 'loss/train': 1.4290181398391724} -11/07/2021 05:01:17 - INFO - __main__ - Step 55449: {'lr': 0.0003556374645343584, 'samples': 10646208, 'steps': 55448, 'loss/train': 1.3962857723236084} -11/07/2021 05:01:17 - INFO - __main__ - Step 55450: {'lr': 0.0003556326547975805, 'samples': 10646400, 'steps': 55449, 'loss/train': 1.8636422157287598} -11/07/2021 05:01:18 - INFO - __main__ - Step 55451: {'lr': 0.0003556278450132062, 'samples': 10646592, 'steps': 55450, 'loss/train': 0.9242614507675171} -11/07/2021 05:01:18 - INFO - __main__ - Step 55452: {'lr': 0.0003556230351812375, 'samples': 10646784, 'steps': 55451, 'loss/train': 1.8774685859680176} -11/07/2021 05:01:19 - INFO - __main__ - Step 55453: {'lr': 0.00035561822530167677, 'samples': 10646976, 'steps': 55452, 'loss/train': 1.392649531364441} -11/07/2021 05:01:19 - INFO - __main__ - Step 55454: {'lr': 0.0003556134153745261, 'samples': 10647168, 'steps': 55453, 'loss/train': 1.306005597114563} -11/07/2021 05:01:20 - INFO - __main__ - Step 55455: {'lr': 0.0003556086053997877, 'samples': 10647360, 'steps': 55454, 'loss/train': 1.3837898969650269} -11/07/2021 05:01:20 - INFO - __main__ - Step 55456: {'lr': 0.0003556037953774636, 'samples': 10647552, 'steps': 55455, 'loss/train': 2.020146369934082} -11/07/2021 05:01:20 - INFO - __main__ - Step 55457: {'lr': 0.0003555989853075561, 'samples': 10647744, 'steps': 55456, 'loss/train': 1.6230862140655518} -11/07/2021 05:01:21 - INFO - __main__ - Step 55458: {'lr': 0.0003555941751900673, 'samples': 10647936, 'steps': 55457, 'loss/train': 1.6130120754241943} -11/07/2021 05:01:22 - INFO - __main__ - Step 55459: {'lr': 0.00035558936502499944, 'samples': 10648128, 'steps': 55458, 'loss/train': 1.3010731935501099} -11/07/2021 05:01:22 - INFO - __main__ - Step 55460: {'lr': 0.00035558455481235463, 'samples': 10648320, 'steps': 55459, 'loss/train': 1.4402084350585938} -11/07/2021 05:01:22 - INFO - __main__ - Step 55461: {'lr': 0.000355579744552135, 'samples': 10648512, 'steps': 55460, 'loss/train': 1.2482751607894897} -11/07/2021 05:01:23 - INFO - __main__ - Step 55462: {'lr': 0.00035557493424434285, 'samples': 10648704, 'steps': 55461, 'loss/train': 1.2822860479354858} -11/07/2021 05:01:24 - INFO - __main__ - Step 55463: {'lr': 0.0003555701238889802, 'samples': 10648896, 'steps': 55462, 'loss/train': 1.7497222423553467} -11/07/2021 05:01:24 - INFO - __main__ - Step 55464: {'lr': 0.0003555653134860493, 'samples': 10649088, 'steps': 55463, 'loss/train': 1.5999925136566162} -11/07/2021 05:01:24 - INFO - __main__ - Step 55465: {'lr': 0.00035556050303555233, 'samples': 10649280, 'steps': 55464, 'loss/train': 1.547693133354187} -11/07/2021 05:01:25 - INFO - __main__ - Step 55466: {'lr': 0.00035555569253749135, 'samples': 10649472, 'steps': 55465, 'loss/train': 1.3012789487838745} -11/07/2021 05:01:25 - INFO - __main__ - Step 55467: {'lr': 0.0003555508819918687, 'samples': 10649664, 'steps': 55466, 'loss/train': 1.346777081489563} -11/07/2021 05:01:26 - INFO - __main__ - Step 55468: {'lr': 0.0003555460713986864, 'samples': 10649856, 'steps': 55467, 'loss/train': 1.7407342195510864} -11/07/2021 05:01:27 - INFO - __main__ - Step 55469: {'lr': 0.00035554126075794666, 'samples': 10650048, 'steps': 55468, 'loss/train': 1.5766143798828125} -11/07/2021 05:01:27 - INFO - __main__ - Step 55470: {'lr': 0.0003555364500696517, 'samples': 10650240, 'steps': 55469, 'loss/train': 1.2244343757629395} -11/07/2021 05:01:28 - INFO - __main__ - Step 55471: {'lr': 0.0003555316393338036, 'samples': 10650432, 'steps': 55470, 'loss/train': 0.45889508724212646} -11/07/2021 05:01:28 - INFO - __main__ - Step 55472: {'lr': 0.0003555268285504045, 'samples': 10650624, 'steps': 55471, 'loss/train': 1.283272624015808} -11/07/2021 05:01:29 - INFO - __main__ - Step 55473: {'lr': 0.00035552201771945675, 'samples': 10650816, 'steps': 55472, 'loss/train': 1.3844774961471558} -11/07/2021 05:01:29 - INFO - __main__ - Step 55474: {'lr': 0.0003555172068409624, 'samples': 10651008, 'steps': 55473, 'loss/train': 1.8402692079544067} -11/07/2021 05:01:30 - INFO - __main__ - Step 55475: {'lr': 0.0003555123959149236, 'samples': 10651200, 'steps': 55474, 'loss/train': 1.477421760559082} -11/07/2021 05:01:30 - INFO - __main__ - Step 55476: {'lr': 0.00035550758494134257, 'samples': 10651392, 'steps': 55475, 'loss/train': 1.8838911056518555} -11/07/2021 05:01:30 - INFO - __main__ - Step 55477: {'lr': 0.0003555027739202214, 'samples': 10651584, 'steps': 55476, 'loss/train': 1.3513555526733398} -11/07/2021 05:01:31 - INFO - __main__ - Step 55478: {'lr': 0.00035549796285156234, 'samples': 10651776, 'steps': 55477, 'loss/train': 0.6545446515083313} -11/07/2021 05:01:32 - INFO - __main__ - Step 55479: {'lr': 0.0003554931517353675, 'samples': 10651968, 'steps': 55478, 'loss/train': 1.3153272867202759} -11/07/2021 05:01:32 - INFO - __main__ - Step 55480: {'lr': 0.0003554883405716391, 'samples': 10652160, 'steps': 55479, 'loss/train': 1.3092068433761597} -11/07/2021 05:01:32 - INFO - __main__ - Step 55481: {'lr': 0.0003554835293603793, 'samples': 10652352, 'steps': 55480, 'loss/train': 2.0189783573150635} -11/07/2021 05:01:33 - INFO - __main__ - Step 55482: {'lr': 0.0003554787181015903, 'samples': 10652544, 'steps': 55481, 'loss/train': 1.1473562717437744} -11/07/2021 05:01:33 - INFO - __main__ - Step 55483: {'lr': 0.0003554739067952741, 'samples': 10652736, 'steps': 55482, 'loss/train': 1.3377685546875} -11/07/2021 05:01:34 - INFO - __main__ - Step 55484: {'lr': 0.00035546909544143304, 'samples': 10652928, 'steps': 55483, 'loss/train': 1.6772104501724243} -11/07/2021 05:01:34 - INFO - __main__ - Step 55485: {'lr': 0.00035546428404006913, 'samples': 10653120, 'steps': 55484, 'loss/train': 1.154433250427246} -11/07/2021 05:01:35 - INFO - __main__ - Step 55486: {'lr': 0.0003554594725911848, 'samples': 10653312, 'steps': 55485, 'loss/train': 0.08047390729188919} -11/07/2021 05:01:35 - INFO - __main__ - Step 55487: {'lr': 0.00035545466109478195, 'samples': 10653504, 'steps': 55486, 'loss/train': 1.0241944789886475} -11/07/2021 05:01:35 - INFO - __main__ - Step 55488: {'lr': 0.00035544984955086296, 'samples': 10653696, 'steps': 55487, 'loss/train': 1.5227360725402832} -11/07/2021 05:01:37 - INFO - __main__ - Step 55489: {'lr': 0.00035544503795942984, 'samples': 10653888, 'steps': 55488, 'loss/train': 1.5348587036132812} -11/07/2021 05:01:37 - INFO - __main__ - Step 55490: {'lr': 0.00035544022632048476, 'samples': 10654080, 'steps': 55489, 'loss/train': 2.0114195346832275} -11/07/2021 05:01:37 - INFO - __main__ - Step 55491: {'lr': 0.00035543541463402994, 'samples': 10654272, 'steps': 55490, 'loss/train': 1.1516433954238892} -11/07/2021 05:01:38 - INFO - __main__ - Step 55492: {'lr': 0.0003554306029000676, 'samples': 10654464, 'steps': 55491, 'loss/train': 1.52472984790802} -11/07/2021 05:01:38 - INFO - __main__ - Step 55493: {'lr': 0.00035542579111859986, 'samples': 10654656, 'steps': 55492, 'loss/train': 1.7366708517074585} -11/07/2021 05:01:39 - INFO - __main__ - Step 55494: {'lr': 0.0003554209792896289, 'samples': 10654848, 'steps': 55493, 'loss/train': 1.614952564239502} -11/07/2021 05:01:39 - INFO - __main__ - Step 55495: {'lr': 0.00035541616741315685, 'samples': 10655040, 'steps': 55494, 'loss/train': 1.4215108156204224} -11/07/2021 05:01:40 - INFO - __main__ - Step 55496: {'lr': 0.0003554113554891859, 'samples': 10655232, 'steps': 55495, 'loss/train': 1.2625516653060913} -11/07/2021 05:01:40 - INFO - __main__ - Step 55497: {'lr': 0.0003554065435177183, 'samples': 10655424, 'steps': 55496, 'loss/train': 1.1632428169250488} -11/07/2021 05:01:40 - INFO - __main__ - Step 55498: {'lr': 0.00035540173149875597, 'samples': 10655616, 'steps': 55497, 'loss/train': 1.403335690498352} -11/07/2021 05:01:42 - INFO - __main__ - Step 55499: {'lr': 0.00035539691943230135, 'samples': 10655808, 'steps': 55498, 'loss/train': 1.8241478204727173} -11/07/2021 05:01:42 - INFO - __main__ - Step 55500: {'lr': 0.00035539210731835646, 'samples': 10656000, 'steps': 55499, 'loss/train': 1.243905782699585} -11/07/2021 05:01:42 - INFO - __main__ - Step 55501: {'lr': 0.00035538729515692356, 'samples': 10656192, 'steps': 55500, 'loss/train': 1.7358616590499878} -11/07/2021 05:01:43 - INFO - __main__ - Step 55502: {'lr': 0.0003553824829480048, 'samples': 10656384, 'steps': 55501, 'loss/train': 1.4769762754440308} -11/07/2021 05:01:43 - INFO - __main__ - Step 55503: {'lr': 0.00035537767069160234, 'samples': 10656576, 'steps': 55502, 'loss/train': 1.0820908546447754} -11/07/2021 05:01:44 - INFO - __main__ - Step 55504: {'lr': 0.00035537285838771823, 'samples': 10656768, 'steps': 55503, 'loss/train': 1.6202404499053955} -11/07/2021 05:01:44 - INFO - __main__ - Step 55505: {'lr': 0.00035536804603635474, 'samples': 10656960, 'steps': 55504, 'loss/train': 1.3159245252609253} -11/07/2021 05:01:45 - INFO - __main__ - Step 55506: {'lr': 0.00035536323363751405, 'samples': 10657152, 'steps': 55505, 'loss/train': 1.5448861122131348} -11/07/2021 05:01:45 - INFO - __main__ - Step 55507: {'lr': 0.0003553584211911983, 'samples': 10657344, 'steps': 55506, 'loss/train': 1.380665898323059} -11/07/2021 05:01:45 - INFO - __main__ - Step 55508: {'lr': 0.00035535360869740973, 'samples': 10657536, 'steps': 55507, 'loss/train': 1.0124974250793457} -11/07/2021 05:01:46 - INFO - __main__ - Step 55509: {'lr': 0.00035534879615615046, 'samples': 10657728, 'steps': 55508, 'loss/train': 1.0134326219558716} -11/07/2021 05:01:47 - INFO - __main__ - Step 55510: {'lr': 0.0003553439835674226, 'samples': 10657920, 'steps': 55509, 'loss/train': 1.1719768047332764} -11/07/2021 05:01:47 - INFO - __main__ - Step 55511: {'lr': 0.00035533917093122835, 'samples': 10658112, 'steps': 55510, 'loss/train': 1.3605214357376099} -11/07/2021 05:01:48 - INFO - __main__ - Step 55512: {'lr': 0.00035533435824756986, 'samples': 10658304, 'steps': 55511, 'loss/train': 1.351001501083374} -11/07/2021 05:01:48 - INFO - __main__ - Step 55513: {'lr': 0.00035532954551644944, 'samples': 10658496, 'steps': 55512, 'loss/train': 1.2918845415115356} -11/07/2021 05:01:48 - INFO - __main__ - Step 55514: {'lr': 0.0003553247327378691, 'samples': 10658688, 'steps': 55513, 'loss/train': 1.2629348039627075} -11/07/2021 05:01:49 - INFO - __main__ - Step 55515: {'lr': 0.0003553199199118311, 'samples': 10658880, 'steps': 55514, 'loss/train': 1.4175992012023926} -11/07/2021 05:01:50 - INFO - __main__ - Step 55516: {'lr': 0.00035531510703833754, 'samples': 10659072, 'steps': 55515, 'loss/train': 1.5937676429748535} -11/07/2021 05:01:50 - INFO - __main__ - Step 55517: {'lr': 0.00035531029411739056, 'samples': 10659264, 'steps': 55516, 'loss/train': 1.3809469938278198} -11/07/2021 05:01:50 - INFO - __main__ - Step 55518: {'lr': 0.00035530548114899243, 'samples': 10659456, 'steps': 55517, 'loss/train': 1.5462132692337036} -11/07/2021 05:01:51 - INFO - __main__ - Step 55519: {'lr': 0.00035530066813314534, 'samples': 10659648, 'steps': 55518, 'loss/train': 1.0150903463363647} -11/07/2021 05:01:52 - INFO - __main__ - Step 55520: {'lr': 0.0003552958550698513, 'samples': 10659840, 'steps': 55519, 'loss/train': 1.4693259000778198} -11/07/2021 05:01:52 - INFO - __main__ - Step 55521: {'lr': 0.00035529104195911255, 'samples': 10660032, 'steps': 55520, 'loss/train': 0.9689898490905762} -11/07/2021 05:01:52 - INFO - __main__ - Step 55522: {'lr': 0.00035528622880093145, 'samples': 10660224, 'steps': 55521, 'loss/train': 1.226699948310852} -11/07/2021 05:01:53 - INFO - __main__ - Step 55523: {'lr': 0.00035528141559530984, 'samples': 10660416, 'steps': 55522, 'loss/train': 1.4950664043426514} -11/07/2021 05:01:53 - INFO - __main__ - Step 55524: {'lr': 0.0003552766023422501, 'samples': 10660608, 'steps': 55523, 'loss/train': 1.5928208827972412} -11/07/2021 05:01:54 - INFO - __main__ - Step 55525: {'lr': 0.00035527178904175435, 'samples': 10660800, 'steps': 55524, 'loss/train': 1.644692063331604} -11/07/2021 05:01:54 - INFO - __main__ - Step 55526: {'lr': 0.0003552669756938247, 'samples': 10660992, 'steps': 55525, 'loss/train': 1.6959644556045532} -11/07/2021 05:01:55 - INFO - __main__ - Step 55527: {'lr': 0.0003552621622984634, 'samples': 10661184, 'steps': 55526, 'loss/train': 1.4864704608917236} -11/07/2021 05:01:55 - INFO - __main__ - Step 55528: {'lr': 0.00035525734885567275, 'samples': 10661376, 'steps': 55527, 'loss/train': 1.743637204170227} -11/07/2021 05:01:55 - INFO - __main__ - Step 55529: {'lr': 0.0003552525353654546, 'samples': 10661568, 'steps': 55528, 'loss/train': 4.9168701171875} -11/07/2021 05:01:56 - INFO - __main__ - Step 55530: {'lr': 0.0003552477218278113, 'samples': 10661760, 'steps': 55529, 'loss/train': 1.2728878259658813} -11/07/2021 05:01:57 - INFO - __main__ - Step 55531: {'lr': 0.00035524290824274504, 'samples': 10661952, 'steps': 55530, 'loss/train': 1.0321156978607178} -11/07/2021 05:01:57 - INFO - __main__ - Step 55532: {'lr': 0.0003552380946102579, 'samples': 10662144, 'steps': 55531, 'loss/train': 0.8566840291023254} -11/07/2021 05:01:57 - INFO - __main__ - Step 55533: {'lr': 0.0003552332809303521, 'samples': 10662336, 'steps': 55532, 'loss/train': 0.9766098260879517} -11/07/2021 05:01:58 - INFO - __main__ - Step 55534: {'lr': 0.0003552284672030298, 'samples': 10662528, 'steps': 55533, 'loss/train': 1.8043036460876465} -11/07/2021 05:01:59 - INFO - __main__ - Step 55535: {'lr': 0.0003552236534282933, 'samples': 10662720, 'steps': 55534, 'loss/train': 1.1812506914138794} -11/07/2021 05:01:59 - INFO - __main__ - Step 55536: {'lr': 0.00035521883960614456, 'samples': 10662912, 'steps': 55535, 'loss/train': 1.427696704864502} -11/07/2021 05:02:00 - INFO - __main__ - Step 55537: {'lr': 0.0003552140257365858, 'samples': 10663104, 'steps': 55536, 'loss/train': 1.419637680053711} -11/07/2021 05:02:00 - INFO - __main__ - Step 55538: {'lr': 0.00035520921181961924, 'samples': 10663296, 'steps': 55537, 'loss/train': 1.5478235483169556} -11/07/2021 05:02:00 - INFO - __main__ - Step 55539: {'lr': 0.00035520439785524703, 'samples': 10663488, 'steps': 55538, 'loss/train': 1.291942834854126} -11/07/2021 05:02:01 - INFO - __main__ - Step 55540: {'lr': 0.00035519958384347134, 'samples': 10663680, 'steps': 55539, 'loss/train': 1.566218376159668} -11/07/2021 05:02:02 - INFO - __main__ - Step 55541: {'lr': 0.00035519476978429433, 'samples': 10663872, 'steps': 55540, 'loss/train': 1.5057703256607056} -11/07/2021 05:02:02 - INFO - __main__ - Step 55542: {'lr': 0.0003551899556777183, 'samples': 10664064, 'steps': 55541, 'loss/train': 1.5911173820495605} -11/07/2021 05:02:02 - INFO - __main__ - Step 55543: {'lr': 0.00035518514152374514, 'samples': 10664256, 'steps': 55542, 'loss/train': 1.2359411716461182} -11/07/2021 05:02:03 - INFO - __main__ - Step 55544: {'lr': 0.00035518032732237724, 'samples': 10664448, 'steps': 55543, 'loss/train': 1.1860450506210327} -11/07/2021 05:02:04 - INFO - __main__ - Step 55545: {'lr': 0.00035517551307361674, 'samples': 10664640, 'steps': 55544, 'loss/train': 3.10489821434021} -11/07/2021 05:02:04 - INFO - __main__ - Step 55546: {'lr': 0.0003551706987774657, 'samples': 10664832, 'steps': 55545, 'loss/train': 1.326438307762146} -11/07/2021 05:02:05 - INFO - __main__ - Step 55547: {'lr': 0.00035516588443392644, 'samples': 10665024, 'steps': 55546, 'loss/train': 1.4802407026290894} -11/07/2021 05:02:05 - INFO - __main__ - Step 55548: {'lr': 0.00035516107004300107, 'samples': 10665216, 'steps': 55547, 'loss/train': 1.7567200660705566} -11/07/2021 05:02:05 - INFO - __main__ - Step 55549: {'lr': 0.00035515625560469174, 'samples': 10665408, 'steps': 55548, 'loss/train': 1.3075168132781982} -11/07/2021 05:02:06 - INFO - __main__ - Step 55550: {'lr': 0.00035515144111900054, 'samples': 10665600, 'steps': 55549, 'loss/train': 1.2171063423156738} -11/07/2021 05:02:07 - INFO - __main__ - Step 55551: {'lr': 0.00035514662658592977, 'samples': 10665792, 'steps': 55550, 'loss/train': 1.5514367818832397} -11/07/2021 05:02:07 - INFO - __main__ - Step 55552: {'lr': 0.0003551418120054816, 'samples': 10665984, 'steps': 55551, 'loss/train': 1.5149608850479126} -11/07/2021 05:02:07 - INFO - __main__ - Step 55553: {'lr': 0.0003551369973776581, 'samples': 10666176, 'steps': 55552, 'loss/train': 1.4682872295379639} -11/07/2021 05:02:08 - INFO - __main__ - Step 55554: {'lr': 0.0003551321827024615, 'samples': 10666368, 'steps': 55553, 'loss/train': 1.1639363765716553} -11/07/2021 05:02:09 - INFO - __main__ - Step 55555: {'lr': 0.0003551273679798939, 'samples': 10666560, 'steps': 55554, 'loss/train': 1.7590302228927612} -11/07/2021 05:02:09 - INFO - __main__ - Step 55556: {'lr': 0.00035512255320995764, 'samples': 10666752, 'steps': 55555, 'loss/train': 1.9666401147842407} -11/07/2021 05:02:09 - INFO - __main__ - Step 55557: {'lr': 0.0003551177383926547, 'samples': 10666944, 'steps': 55556, 'loss/train': 1.5923014879226685} -11/07/2021 05:02:10 - INFO - __main__ - Step 55558: {'lr': 0.00035511292352798736, 'samples': 10667136, 'steps': 55557, 'loss/train': 1.565259575843811} -11/07/2021 05:02:10 - INFO - __main__ - Step 55559: {'lr': 0.0003551081086159578, 'samples': 10667328, 'steps': 55558, 'loss/train': 1.5437698364257812} -11/07/2021 05:02:11 - INFO - __main__ - Step 55560: {'lr': 0.0003551032936565681, 'samples': 10667520, 'steps': 55559, 'loss/train': 1.3968523740768433} -11/07/2021 05:02:12 - INFO - __main__ - Step 55561: {'lr': 0.0003550984786498205, 'samples': 10667712, 'steps': 55560, 'loss/train': 1.0897365808486938} -11/07/2021 05:02:12 - INFO - __main__ - Step 55562: {'lr': 0.0003550936635957171, 'samples': 10667904, 'steps': 55561, 'loss/train': 1.755570888519287} -11/07/2021 05:02:12 - INFO - __main__ - Step 55563: {'lr': 0.00035508884849426014, 'samples': 10668096, 'steps': 55562, 'loss/train': 1.15757417678833} -11/07/2021 05:02:13 - INFO - __main__ - Step 55564: {'lr': 0.0003550840333454518, 'samples': 10668288, 'steps': 55563, 'loss/train': 1.2781257629394531} -11/07/2021 05:02:13 - INFO - __main__ - Step 55565: {'lr': 0.00035507921814929415, 'samples': 10668480, 'steps': 55564, 'loss/train': 1.5428166389465332} -11/07/2021 05:02:14 - INFO - __main__ - Step 55566: {'lr': 0.0003550744029057895, 'samples': 10668672, 'steps': 55565, 'loss/train': 1.2315104007720947} -11/07/2021 05:02:14 - INFO - __main__ - Step 55567: {'lr': 0.0003550695876149399, 'samples': 10668864, 'steps': 55566, 'loss/train': 1.3412801027297974} -11/07/2021 05:02:15 - INFO - __main__ - Step 55568: {'lr': 0.00035506477227674753, 'samples': 10669056, 'steps': 55567, 'loss/train': 0.994350790977478} -11/07/2021 05:02:15 - INFO - __main__ - Step 55569: {'lr': 0.0003550599568912147, 'samples': 10669248, 'steps': 55568, 'loss/train': 1.5082281827926636} -11/07/2021 05:02:15 - INFO - __main__ - Step 55570: {'lr': 0.00035505514145834337, 'samples': 10669440, 'steps': 55569, 'loss/train': 0.8763818144798279} -11/07/2021 05:02:16 - INFO - __main__ - Step 55571: {'lr': 0.0003550503259781359, 'samples': 10669632, 'steps': 55570, 'loss/train': 1.2236778736114502} -11/07/2021 05:02:17 - INFO - __main__ - Step 55572: {'lr': 0.0003550455104505943, 'samples': 10669824, 'steps': 55571, 'loss/train': 1.1714478731155396} -11/07/2021 05:02:17 - INFO - __main__ - Step 55573: {'lr': 0.00035504069487572086, 'samples': 10670016, 'steps': 55572, 'loss/train': 1.3182233572006226} -11/07/2021 05:02:17 - INFO - __main__ - Step 55574: {'lr': 0.00035503587925351767, 'samples': 10670208, 'steps': 55573, 'loss/train': 1.1601752042770386} -11/07/2021 05:02:18 - INFO - __main__ - Step 55575: {'lr': 0.00035503106358398694, 'samples': 10670400, 'steps': 55574, 'loss/train': 1.5089037418365479} -11/07/2021 05:02:19 - INFO - __main__ - Step 55576: {'lr': 0.0003550262478671309, 'samples': 10670592, 'steps': 55575, 'loss/train': 1.5794835090637207} -11/07/2021 05:02:19 - INFO - __main__ - Step 55577: {'lr': 0.00035502143210295163, 'samples': 10670784, 'steps': 55576, 'loss/train': 1.2077217102050781} -11/07/2021 05:02:20 - INFO - __main__ - Step 55578: {'lr': 0.0003550166162914513, 'samples': 10670976, 'steps': 55577, 'loss/train': 1.2896077632904053} -11/07/2021 05:02:20 - INFO - __main__ - Step 55579: {'lr': 0.00035501180043263203, 'samples': 10671168, 'steps': 55578, 'loss/train': 1.2451173067092896} -11/07/2021 05:02:20 - INFO - __main__ - Step 55580: {'lr': 0.00035500698452649613, 'samples': 10671360, 'steps': 55579, 'loss/train': 1.1873743534088135} -11/07/2021 05:02:21 - INFO - __main__ - Step 55581: {'lr': 0.00035500216857304575, 'samples': 10671552, 'steps': 55580, 'loss/train': 1.361046552658081} -11/07/2021 05:02:22 - INFO - __main__ - Step 55582: {'lr': 0.000354997352572283, 'samples': 10671744, 'steps': 55581, 'loss/train': 1.1923409700393677} -11/07/2021 05:02:22 - INFO - __main__ - Step 55583: {'lr': 0.00035499253652421, 'samples': 10671936, 'steps': 55582, 'loss/train': 1.2904736995697021} -11/07/2021 05:02:22 - INFO - __main__ - Step 55584: {'lr': 0.000354987720428829, 'samples': 10672128, 'steps': 55583, 'loss/train': 1.4541096687316895} -11/07/2021 05:02:23 - INFO - __main__ - Step 55585: {'lr': 0.00035498290428614217, 'samples': 10672320, 'steps': 55584, 'loss/train': 1.910554051399231} -11/07/2021 05:02:24 - INFO - __main__ - Step 55586: {'lr': 0.0003549780880961516, 'samples': 10672512, 'steps': 55585, 'loss/train': 1.4025523662567139} -11/07/2021 05:02:24 - INFO - __main__ - Step 55587: {'lr': 0.00035497327185885966, 'samples': 10672704, 'steps': 55586, 'loss/train': 1.4680031538009644} -11/07/2021 05:02:24 - INFO - __main__ - Step 55588: {'lr': 0.00035496845557426824, 'samples': 10672896, 'steps': 55587, 'loss/train': 1.2862597703933716} -11/07/2021 05:02:25 - INFO - __main__ - Step 55589: {'lr': 0.0003549636392423798, 'samples': 10673088, 'steps': 55588, 'loss/train': 4.9805216789245605} -11/07/2021 05:02:25 - INFO - __main__ - Step 55590: {'lr': 0.00035495882286319625, 'samples': 10673280, 'steps': 55589, 'loss/train': 1.4303516149520874} -11/07/2021 05:02:26 - INFO - __main__ - Step 55591: {'lr': 0.0003549540064367199, 'samples': 10673472, 'steps': 55590, 'loss/train': 1.1181601285934448} -11/07/2021 05:02:26 - INFO - __main__ - Step 55592: {'lr': 0.0003549491899629529, 'samples': 10673664, 'steps': 55591, 'loss/train': 1.3412623405456543} -11/07/2021 05:02:27 - INFO - __main__ - Step 55593: {'lr': 0.00035494437344189746, 'samples': 10673856, 'steps': 55592, 'loss/train': 1.5310654640197754} -11/07/2021 05:02:27 - INFO - __main__ - Step 55594: {'lr': 0.0003549395568735556, 'samples': 10674048, 'steps': 55593, 'loss/train': 1.5789437294006348} -11/07/2021 05:02:28 - INFO - __main__ - Step 55595: {'lr': 0.00035493474025792966, 'samples': 10674240, 'steps': 55594, 'loss/train': 1.375770092010498} -11/07/2021 05:02:29 - INFO - __main__ - Step 55596: {'lr': 0.0003549299235950218, 'samples': 10674432, 'steps': 55595, 'loss/train': 1.112752914428711} -11/07/2021 05:02:29 - INFO - __main__ - Step 55597: {'lr': 0.000354925106884834, 'samples': 10674624, 'steps': 55596, 'loss/train': 1.0414875745773315} -11/07/2021 05:02:29 - INFO - __main__ - Step 55598: {'lr': 0.0003549202901273687, 'samples': 10674816, 'steps': 55597, 'loss/train': 1.5901310443878174} -11/07/2021 05:02:30 - INFO - __main__ - Step 55599: {'lr': 0.00035491547332262786, 'samples': 10675008, 'steps': 55598, 'loss/train': 1.6778441667556763} -11/07/2021 05:02:30 - INFO - __main__ - Step 55600: {'lr': 0.00035491065647061377, 'samples': 10675200, 'steps': 55599, 'loss/train': 1.326326608657837} -11/07/2021 05:02:31 - INFO - __main__ - Step 55601: {'lr': 0.0003549058395713285, 'samples': 10675392, 'steps': 55600, 'loss/train': 1.043556809425354} -11/07/2021 05:02:31 - INFO - __main__ - Step 55602: {'lr': 0.00035490102262477436, 'samples': 10675584, 'steps': 55601, 'loss/train': 1.8972359895706177} -11/07/2021 05:02:32 - INFO - __main__ - Step 55603: {'lr': 0.0003548962056309534, 'samples': 10675776, 'steps': 55602, 'loss/train': 0.05763842165470123} -11/07/2021 05:02:32 - INFO - __main__ - Step 55604: {'lr': 0.0003548913885898678, 'samples': 10675968, 'steps': 55603, 'loss/train': 1.331835389137268} -11/07/2021 05:02:32 - INFO - __main__ - Step 55605: {'lr': 0.0003548865715015198, 'samples': 10676160, 'steps': 55604, 'loss/train': 1.4535555839538574} -11/07/2021 05:02:34 - INFO - __main__ - Step 55606: {'lr': 0.00035488175436591146, 'samples': 10676352, 'steps': 55605, 'loss/train': 1.5322768688201904} -11/07/2021 05:02:34 - INFO - __main__ - Step 55607: {'lr': 0.00035487693718304504, 'samples': 10676544, 'steps': 55606, 'loss/train': 1.1713974475860596} -11/07/2021 05:02:34 - INFO - __main__ - Step 55608: {'lr': 0.00035487211995292276, 'samples': 10676736, 'steps': 55607, 'loss/train': 1.6466498374938965} -11/07/2021 05:02:35 - INFO - __main__ - Step 55609: {'lr': 0.00035486730267554666, 'samples': 10676928, 'steps': 55608, 'loss/train': 1.2568548917770386} -11/07/2021 05:02:35 - INFO - __main__ - Step 55610: {'lr': 0.000354862485350919, 'samples': 10677120, 'steps': 55609, 'loss/train': 1.1440668106079102} -11/07/2021 05:02:35 - INFO - __main__ - Step 55611: {'lr': 0.0003548576679790419, 'samples': 10677312, 'steps': 55610, 'loss/train': 0.8220343589782715} -11/07/2021 05:02:36 - INFO - __main__ - Step 55612: {'lr': 0.00035485285055991754, 'samples': 10677504, 'steps': 55611, 'loss/train': 1.3758190870285034} -11/07/2021 05:02:37 - INFO - __main__ - Step 55613: {'lr': 0.00035484803309354814, 'samples': 10677696, 'steps': 55612, 'loss/train': 1.9407711029052734} -11/07/2021 05:02:37 - INFO - __main__ - Step 55614: {'lr': 0.0003548432155799358, 'samples': 10677888, 'steps': 55613, 'loss/train': 1.3740770816802979} -11/07/2021 05:02:38 - INFO - __main__ - Step 55615: {'lr': 0.00035483839801908276, 'samples': 10678080, 'steps': 55614, 'loss/train': 1.1971131563186646} -11/07/2021 05:02:38 - INFO - __main__ - Step 55616: {'lr': 0.00035483358041099117, 'samples': 10678272, 'steps': 55615, 'loss/train': 1.2182449102401733} -11/07/2021 05:02:39 - INFO - __main__ - Step 55617: {'lr': 0.00035482876275566317, 'samples': 10678464, 'steps': 55616, 'loss/train': 1.621694564819336} -11/07/2021 05:02:39 - INFO - __main__ - Step 55618: {'lr': 0.00035482394505310087, 'samples': 10678656, 'steps': 55617, 'loss/train': 1.561873435974121} -11/07/2021 05:02:40 - INFO - __main__ - Step 55619: {'lr': 0.0003548191273033066, 'samples': 10678848, 'steps': 55618, 'loss/train': 0.8010305762290955} -11/07/2021 05:02:40 - INFO - __main__ - Step 55620: {'lr': 0.0003548143095062825, 'samples': 10679040, 'steps': 55619, 'loss/train': 1.3462319374084473} -11/07/2021 05:02:40 - INFO - __main__ - Step 55621: {'lr': 0.00035480949166203057, 'samples': 10679232, 'steps': 55620, 'loss/train': 1.859246015548706} -11/07/2021 05:02:41 - INFO - __main__ - Step 55622: {'lr': 0.00035480467377055314, 'samples': 10679424, 'steps': 55621, 'loss/train': 1.6003825664520264} -11/07/2021 05:02:42 - INFO - __main__ - Step 55623: {'lr': 0.00035479985583185237, 'samples': 10679616, 'steps': 55622, 'loss/train': 0.9864547848701477} -11/07/2021 05:02:42 - INFO - __main__ - Step 55624: {'lr': 0.0003547950378459304, 'samples': 10679808, 'steps': 55623, 'loss/train': 1.4512523412704468} -11/07/2021 05:02:42 - INFO - __main__ - Step 55625: {'lr': 0.00035479021981278935, 'samples': 10680000, 'steps': 55624, 'loss/train': 1.546105146408081} -11/07/2021 05:02:43 - INFO - __main__ - Step 55626: {'lr': 0.0003547854017324315, 'samples': 10680192, 'steps': 55625, 'loss/train': 1.1211549043655396} -11/07/2021 05:02:44 - INFO - __main__ - Step 55627: {'lr': 0.000354780583604859, 'samples': 10680384, 'steps': 55626, 'loss/train': 2.3880438804626465} -11/07/2021 05:02:44 - INFO - __main__ - Step 55628: {'lr': 0.0003547757654300739, 'samples': 10680576, 'steps': 55627, 'loss/train': 1.8930439949035645} -11/07/2021 05:02:45 - INFO - __main__ - Step 55629: {'lr': 0.0003547709472080785, 'samples': 10680768, 'steps': 55628, 'loss/train': 1.3211060762405396} -11/07/2021 05:02:45 - INFO - __main__ - Step 55630: {'lr': 0.00035476612893887494, 'samples': 10680960, 'steps': 55629, 'loss/train': 0.43241170048713684} -11/07/2021 05:02:45 - INFO - __main__ - Step 55631: {'lr': 0.0003547613106224653, 'samples': 10681152, 'steps': 55630, 'loss/train': 1.4644253253936768} -11/07/2021 05:02:46 - INFO - __main__ - Step 55632: {'lr': 0.0003547564922588519, 'samples': 10681344, 'steps': 55631, 'loss/train': 1.2657135725021362} -11/07/2021 05:02:47 - INFO - __main__ - Step 55633: {'lr': 0.0003547516738480369, 'samples': 10681536, 'steps': 55632, 'loss/train': 0.6447150707244873} -11/07/2021 05:02:47 - INFO - __main__ - Step 55634: {'lr': 0.0003547468553900223, 'samples': 10681728, 'steps': 55633, 'loss/train': 0.8582543134689331} -11/07/2021 05:02:47 - INFO - __main__ - Step 55635: {'lr': 0.0003547420368848104, 'samples': 10681920, 'steps': 55634, 'loss/train': 1.463858962059021} -11/07/2021 05:02:48 - INFO - __main__ - Step 55636: {'lr': 0.0003547372183324034, 'samples': 10682112, 'steps': 55635, 'loss/train': 1.176918625831604} -11/07/2021 05:02:49 - INFO - __main__ - Step 55637: {'lr': 0.0003547323997328034, 'samples': 10682304, 'steps': 55636, 'loss/train': 1.400640606880188} -11/07/2021 05:02:49 - INFO - __main__ - Step 55638: {'lr': 0.0003547275810860126, 'samples': 10682496, 'steps': 55637, 'loss/train': 1.6146177053451538} -11/07/2021 05:02:50 - INFO - __main__ - Step 55639: {'lr': 0.00035472276239203315, 'samples': 10682688, 'steps': 55638, 'loss/train': 1.731985092163086} -11/07/2021 05:02:50 - INFO - __main__ - Step 55640: {'lr': 0.00035471794365086724, 'samples': 10682880, 'steps': 55639, 'loss/train': 1.5149266719818115} -11/07/2021 05:02:50 - INFO - __main__ - Step 55641: {'lr': 0.00035471312486251707, 'samples': 10683072, 'steps': 55640, 'loss/train': 1.0393422842025757} -11/07/2021 05:02:51 - INFO - __main__ - Step 55642: {'lr': 0.0003547083060269848, 'samples': 10683264, 'steps': 55641, 'loss/train': 1.256230115890503} -11/07/2021 05:02:52 - INFO - __main__ - Step 55643: {'lr': 0.00035470348714427256, 'samples': 10683456, 'steps': 55642, 'loss/train': 1.4536901712417603} -11/07/2021 05:02:52 - INFO - __main__ - Step 55644: {'lr': 0.0003546986682143825, 'samples': 10683648, 'steps': 55643, 'loss/train': 1.0605077743530273} -11/07/2021 05:02:53 - INFO - __main__ - Step 55645: {'lr': 0.0003546938492373169, 'samples': 10683840, 'steps': 55644, 'loss/train': 1.6237866878509521} -11/07/2021 05:02:53 - INFO - __main__ - Step 55646: {'lr': 0.0003546890302130778, 'samples': 10684032, 'steps': 55645, 'loss/train': 1.383773922920227} -11/07/2021 05:02:54 - INFO - __main__ - Step 55647: {'lr': 0.0003546842111416675, 'samples': 10684224, 'steps': 55646, 'loss/train': 2.5310633182525635} -11/07/2021 05:02:54 - INFO - __main__ - Step 55648: {'lr': 0.0003546793920230881, 'samples': 10684416, 'steps': 55647, 'loss/train': 1.7178682088851929} -11/07/2021 05:02:55 - INFO - __main__ - Step 55649: {'lr': 0.0003546745728573418, 'samples': 10684608, 'steps': 55648, 'loss/train': 1.7007197141647339} -11/07/2021 05:02:55 - INFO - __main__ - Step 55650: {'lr': 0.0003546697536444307, 'samples': 10684800, 'steps': 55649, 'loss/train': 1.089084267616272} -11/07/2021 05:02:55 - INFO - __main__ - Step 55651: {'lr': 0.00035466493438435703, 'samples': 10684992, 'steps': 55650, 'loss/train': 1.3870054483413696} -11/07/2021 05:02:57 - INFO - __main__ - Step 55652: {'lr': 0.000354660115077123, 'samples': 10685184, 'steps': 55651, 'loss/train': 1.2411152124404907} -11/07/2021 05:02:57 - INFO - __main__ - Step 55653: {'lr': 0.0003546552957227307, 'samples': 10685376, 'steps': 55652, 'loss/train': 1.4214160442352295} -11/07/2021 05:02:57 - INFO - __main__ - Step 55654: {'lr': 0.0003546504763211823, 'samples': 10685568, 'steps': 55653, 'loss/train': 1.6649715900421143} -11/07/2021 05:02:58 - INFO - __main__ - Step 55655: {'lr': 0.0003546456568724801, 'samples': 10685760, 'steps': 55654, 'loss/train': 2.0860495567321777} -11/07/2021 05:02:58 - INFO - __main__ - Step 55656: {'lr': 0.0003546408373766262, 'samples': 10685952, 'steps': 55655, 'loss/train': 1.3127493858337402} -11/07/2021 05:02:59 - INFO - __main__ - Step 55657: {'lr': 0.0003546360178336226, 'samples': 10686144, 'steps': 55656, 'loss/train': 1.2331385612487793} -11/07/2021 05:02:59 - INFO - __main__ - Step 55658: {'lr': 0.0003546311982434717, 'samples': 10686336, 'steps': 55657, 'loss/train': 1.3542340993881226} -11/07/2021 05:03:00 - INFO - __main__ - Step 55659: {'lr': 0.00035462637860617563, 'samples': 10686528, 'steps': 55658, 'loss/train': 1.4579474925994873} -11/07/2021 05:03:00 - INFO - __main__ - Step 55660: {'lr': 0.00035462155892173654, 'samples': 10686720, 'steps': 55659, 'loss/train': 1.4526863098144531} -11/07/2021 05:03:00 - INFO - __main__ - Step 55661: {'lr': 0.0003546167391901566, 'samples': 10686912, 'steps': 55660, 'loss/train': 1.1624071598052979} -11/07/2021 05:03:01 - INFO - __main__ - Step 55662: {'lr': 0.0003546119194114379, 'samples': 10687104, 'steps': 55661, 'loss/train': 1.5463212728500366} -11/07/2021 05:03:02 - INFO - __main__ - Step 55663: {'lr': 0.00035460709958558273, 'samples': 10687296, 'steps': 55662, 'loss/train': 1.1025784015655518} -11/07/2021 05:03:02 - INFO - __main__ - Step 55664: {'lr': 0.0003546022797125932, 'samples': 10687488, 'steps': 55663, 'loss/train': 1.408887267112732} -11/07/2021 05:03:02 - INFO - __main__ - Step 55665: {'lr': 0.00035459745979247146, 'samples': 10687680, 'steps': 55664, 'loss/train': 1.5203648805618286} -11/07/2021 05:03:03 - INFO - __main__ - Step 55666: {'lr': 0.00035459263982521975, 'samples': 10687872, 'steps': 55665, 'loss/train': 1.1913645267486572} -11/07/2021 05:03:03 - INFO - __main__ - Step 55667: {'lr': 0.00035458781981084026, 'samples': 10688064, 'steps': 55666, 'loss/train': 1.3048712015151978} -11/07/2021 05:03:04 - INFO - __main__ - Step 55668: {'lr': 0.00035458299974933506, 'samples': 10688256, 'steps': 55667, 'loss/train': 1.9954164028167725} -11/07/2021 05:03:05 - INFO - __main__ - Step 55669: {'lr': 0.00035457817964070637, 'samples': 10688448, 'steps': 55668, 'loss/train': 1.4409780502319336} -11/07/2021 05:03:05 - INFO - __main__ - Step 55670: {'lr': 0.0003545733594849564, 'samples': 10688640, 'steps': 55669, 'loss/train': 1.484114408493042} -11/07/2021 05:03:05 - INFO - __main__ - Step 55671: {'lr': 0.0003545685392820873, 'samples': 10688832, 'steps': 55670, 'loss/train': 1.255584716796875} -11/07/2021 05:03:06 - INFO - __main__ - Step 55672: {'lr': 0.0003545637190321012, 'samples': 10689024, 'steps': 55671, 'loss/train': 0.7551189064979553} -11/07/2021 05:03:07 - INFO - __main__ - Step 55673: {'lr': 0.00035455889873500026, 'samples': 10689216, 'steps': 55672, 'loss/train': 1.4032310247421265} -11/07/2021 05:03:07 - INFO - __main__ - Step 55674: {'lr': 0.00035455407839078673, 'samples': 10689408, 'steps': 55673, 'loss/train': 1.6993948221206665} -11/07/2021 05:03:07 - INFO - __main__ - Step 55675: {'lr': 0.00035454925799946273, 'samples': 10689600, 'steps': 55674, 'loss/train': 1.3456084728240967} -11/07/2021 05:03:08 - INFO - __main__ - Step 55676: {'lr': 0.0003545444375610306, 'samples': 10689792, 'steps': 55675, 'loss/train': 1.4696476459503174} -11/07/2021 05:03:08 - INFO - __main__ - Step 55677: {'lr': 0.0003545396170754922, 'samples': 10689984, 'steps': 55676, 'loss/train': 0.8574563264846802} -11/07/2021 05:03:09 - INFO - __main__ - Step 55678: {'lr': 0.0003545347965428498, 'samples': 10690176, 'steps': 55677, 'loss/train': 1.7760615348815918} -11/07/2021 05:03:09 - INFO - __main__ - Step 55679: {'lr': 0.00035452997596310576, 'samples': 10690368, 'steps': 55678, 'loss/train': 1.7549160718917847} -11/07/2021 05:03:10 - INFO - __main__ - Step 55680: {'lr': 0.00035452515533626204, 'samples': 10690560, 'steps': 55679, 'loss/train': 1.2228102684020996} -11/07/2021 05:03:10 - INFO - __main__ - Step 55681: {'lr': 0.00035452033466232095, 'samples': 10690752, 'steps': 55680, 'loss/train': 1.4908599853515625} -11/07/2021 05:03:11 - INFO - __main__ - Step 55682: {'lr': 0.0003545155139412847, 'samples': 10690944, 'steps': 55681, 'loss/train': 1.7345000505447388} -11/07/2021 05:03:11 - INFO - __main__ - Step 55683: {'lr': 0.00035451069317315526, 'samples': 10691136, 'steps': 55682, 'loss/train': 1.1505171060562134} -11/07/2021 05:03:12 - INFO - __main__ - Step 55684: {'lr': 0.00035450587235793493, 'samples': 10691328, 'steps': 55683, 'loss/train': 1.6514390707015991} -11/07/2021 05:03:12 - INFO - __main__ - Step 55685: {'lr': 0.0003545010514956258, 'samples': 10691520, 'steps': 55684, 'loss/train': 1.8190395832061768} -11/07/2021 05:03:13 - INFO - __main__ - Step 55686: {'lr': 0.0003544962305862302, 'samples': 10691712, 'steps': 55685, 'loss/train': 1.4316520690917969} -11/07/2021 05:03:13 - INFO - __main__ - Step 55687: {'lr': 0.0003544914096297502, 'samples': 10691904, 'steps': 55686, 'loss/train': 1.3914636373519897} -11/07/2021 05:03:13 - INFO - __main__ - Step 55688: {'lr': 0.000354486588626188, 'samples': 10692096, 'steps': 55687, 'loss/train': 1.4303710460662842} -11/07/2021 05:03:14 - INFO - __main__ - Step 55689: {'lr': 0.00035448176757554574, 'samples': 10692288, 'steps': 55688, 'loss/train': 1.674943208694458} -11/07/2021 05:03:15 - INFO - __main__ - Step 55690: {'lr': 0.0003544769464778256, 'samples': 10692480, 'steps': 55689, 'loss/train': 2.552509069442749} -11/07/2021 05:03:15 - INFO - __main__ - Step 55691: {'lr': 0.00035447212533302975, 'samples': 10692672, 'steps': 55690, 'loss/train': 1.3160301446914673} -11/07/2021 05:03:15 - INFO - __main__ - Step 55692: {'lr': 0.00035446730414116036, 'samples': 10692864, 'steps': 55691, 'loss/train': 1.3368175029754639} -11/07/2021 05:03:16 - INFO - __main__ - Step 55693: {'lr': 0.00035446248290221967, 'samples': 10693056, 'steps': 55692, 'loss/train': 1.7469947338104248} -11/07/2021 05:03:17 - INFO - __main__ - Step 55694: {'lr': 0.00035445766161620976, 'samples': 10693248, 'steps': 55693, 'loss/train': 1.2765860557556152} -11/07/2021 05:03:17 - INFO - __main__ - Step 55695: {'lr': 0.00035445284028313284, 'samples': 10693440, 'steps': 55694, 'loss/train': 1.7284281253814697} -11/07/2021 05:03:17 - INFO - __main__ - Step 55696: {'lr': 0.00035444801890299103, 'samples': 10693632, 'steps': 55695, 'loss/train': 1.036617398262024} -11/07/2021 05:03:18 - INFO - __main__ - Step 55697: {'lr': 0.0003544431974757866, 'samples': 10693824, 'steps': 55696, 'loss/train': 0.9842028021812439} -11/07/2021 05:03:18 - INFO - __main__ - Step 55698: {'lr': 0.00035443837600152174, 'samples': 10694016, 'steps': 55697, 'loss/train': 1.3776626586914062} -11/07/2021 05:03:19 - INFO - __main__ - Step 55699: {'lr': 0.00035443355448019854, 'samples': 10694208, 'steps': 55698, 'loss/train': 1.433046579360962} -11/07/2021 05:03:19 - INFO - __main__ - Step 55700: {'lr': 0.0003544287329118191, 'samples': 10694400, 'steps': 55699, 'loss/train': 1.37983238697052} -11/07/2021 05:03:20 - INFO - __main__ - Step 55701: {'lr': 0.0003544239112963857, 'samples': 10694592, 'steps': 55700, 'loss/train': 1.3031537532806396} -11/07/2021 05:03:20 - INFO - __main__ - Step 55702: {'lr': 0.0003544190896339006, 'samples': 10694784, 'steps': 55701, 'loss/train': 1.7372462749481201} -11/07/2021 05:03:21 - INFO - __main__ - Step 55703: {'lr': 0.00035441426792436574, 'samples': 10694976, 'steps': 55702, 'loss/train': 1.5571116209030151} -11/07/2021 05:03:22 - INFO - __main__ - Step 55704: {'lr': 0.0003544094461677836, 'samples': 10695168, 'steps': 55703, 'loss/train': 1.8758482933044434} -11/07/2021 05:03:22 - INFO - __main__ - Step 55705: {'lr': 0.000354404624364156, 'samples': 10695360, 'steps': 55704, 'loss/train': 1.7318722009658813} -11/07/2021 05:03:22 - INFO - __main__ - Step 55706: {'lr': 0.00035439980251348533, 'samples': 10695552, 'steps': 55705, 'loss/train': 1.0945961475372314} -11/07/2021 05:03:23 - INFO - __main__ - Step 55707: {'lr': 0.0003543949806157738, 'samples': 10695744, 'steps': 55706, 'loss/train': 1.7378387451171875} -11/07/2021 05:03:23 - INFO - __main__ - Step 55708: {'lr': 0.0003543901586710234, 'samples': 10695936, 'steps': 55707, 'loss/train': 1.4655539989471436} -11/07/2021 05:03:23 - INFO - __main__ - Step 55709: {'lr': 0.00035438533667923644, 'samples': 10696128, 'steps': 55708, 'loss/train': 1.4681276082992554} -11/07/2021 05:03:24 - INFO - __main__ - Step 55710: {'lr': 0.0003543805146404151, 'samples': 10696320, 'steps': 55709, 'loss/train': 1.5186320543289185} -11/07/2021 05:03:25 - INFO - __main__ - Step 55711: {'lr': 0.0003543756925545615, 'samples': 10696512, 'steps': 55710, 'loss/train': 1.5182175636291504} -11/07/2021 05:03:25 - INFO - __main__ - Step 55712: {'lr': 0.0003543708704216778, 'samples': 10696704, 'steps': 55711, 'loss/train': 1.3943164348602295} -11/07/2021 05:03:25 - INFO - __main__ - Step 55713: {'lr': 0.00035436604824176616, 'samples': 10696896, 'steps': 55712, 'loss/train': 1.1336770057678223} -11/07/2021 05:03:26 - INFO - __main__ - Step 55714: {'lr': 0.0003543612260148288, 'samples': 10697088, 'steps': 55713, 'loss/train': 1.567400336265564} -11/07/2021 05:03:27 - INFO - __main__ - Step 55715: {'lr': 0.0003543564037408679, 'samples': 10697280, 'steps': 55714, 'loss/train': 1.5476655960083008} -11/07/2021 05:03:27 - INFO - __main__ - Step 55716: {'lr': 0.00035435158141988564, 'samples': 10697472, 'steps': 55715, 'loss/train': 1.5898628234863281} -11/07/2021 05:03:27 - INFO - __main__ - Step 55717: {'lr': 0.0003543467590518842, 'samples': 10697664, 'steps': 55716, 'loss/train': 1.419777274131775} -11/07/2021 05:03:28 - INFO - __main__ - Step 55718: {'lr': 0.00035434193663686566, 'samples': 10697856, 'steps': 55717, 'loss/train': 1.6237761974334717} -11/07/2021 05:03:28 - INFO - __main__ - Step 55719: {'lr': 0.0003543371141748323, 'samples': 10698048, 'steps': 55718, 'loss/train': 1.4816151857376099} -11/07/2021 05:03:30 - INFO - __main__ - Step 55720: {'lr': 0.0003543322916657862, 'samples': 10698240, 'steps': 55719, 'loss/train': 1.4831697940826416} -11/07/2021 05:03:30 - INFO - __main__ - Step 55721: {'lr': 0.0003543274691097295, 'samples': 10698432, 'steps': 55720, 'loss/train': 1.7541534900665283} -11/07/2021 05:03:30 - INFO - __main__ - Step 55722: {'lr': 0.00035432264650666457, 'samples': 10698624, 'steps': 55721, 'loss/train': 1.258467674255371} -11/07/2021 05:03:31 - INFO - __main__ - Step 55723: {'lr': 0.0003543178238565935, 'samples': 10698816, 'steps': 55722, 'loss/train': 1.677546739578247} -11/07/2021 05:03:31 - INFO - __main__ - Step 55724: {'lr': 0.0003543130011595183, 'samples': 10699008, 'steps': 55723, 'loss/train': 1.0825533866882324} -11/07/2021 05:03:32 - INFO - __main__ - Step 55725: {'lr': 0.0003543081784154414, 'samples': 10699200, 'steps': 55724, 'loss/train': 0.9049617648124695} -11/07/2021 05:03:32 - INFO - __main__ - Step 55726: {'lr': 0.00035430335562436474, 'samples': 10699392, 'steps': 55725, 'loss/train': 1.016931414604187} -11/07/2021 05:03:33 - INFO - __main__ - Step 55727: {'lr': 0.00035429853278629063, 'samples': 10699584, 'steps': 55726, 'loss/train': 1.0655796527862549} -11/07/2021 05:03:33 - INFO - __main__ - Step 55728: {'lr': 0.00035429370990122124, 'samples': 10699776, 'steps': 55727, 'loss/train': 1.3815515041351318} -11/07/2021 05:03:33 - INFO - __main__ - Step 55729: {'lr': 0.0003542888869691586, 'samples': 10699968, 'steps': 55728, 'loss/train': 1.3427400588989258} -11/07/2021 05:03:34 - INFO - __main__ - Step 55730: {'lr': 0.00035428406399010516, 'samples': 10700160, 'steps': 55729, 'loss/train': 1.446705937385559} -11/07/2021 05:03:35 - INFO - __main__ - Step 55731: {'lr': 0.00035427924096406287, 'samples': 10700352, 'steps': 55730, 'loss/train': 1.5031720399856567} -11/07/2021 05:03:35 - INFO - __main__ - Step 55732: {'lr': 0.00035427441789103397, 'samples': 10700544, 'steps': 55731, 'loss/train': 1.099146842956543} -11/07/2021 05:03:35 - INFO - __main__ - Step 55733: {'lr': 0.0003542695947710206, 'samples': 10700736, 'steps': 55732, 'loss/train': 1.984749674797058} -11/07/2021 05:03:36 - INFO - __main__ - Step 55734: {'lr': 0.00035426477160402495, 'samples': 10700928, 'steps': 55733, 'loss/train': 1.5043107271194458} -11/07/2021 05:03:37 - INFO - __main__ - Step 55735: {'lr': 0.0003542599483900492, 'samples': 10701120, 'steps': 55734, 'loss/train': 1.2688812017440796} -11/07/2021 05:03:37 - INFO - __main__ - Step 55736: {'lr': 0.00035425512512909555, 'samples': 10701312, 'steps': 55735, 'loss/train': 1.0769466161727905} -11/07/2021 05:03:37 - INFO - __main__ - Step 55737: {'lr': 0.00035425030182116617, 'samples': 10701504, 'steps': 55736, 'loss/train': 1.056416392326355} -11/07/2021 05:03:38 - INFO - __main__ - Step 55738: {'lr': 0.0003542454784662632, 'samples': 10701696, 'steps': 55737, 'loss/train': 1.3985483646392822} -11/07/2021 05:03:38 - INFO - __main__ - Step 55739: {'lr': 0.00035424065506438877, 'samples': 10701888, 'steps': 55738, 'loss/train': 1.5039695501327515} -11/07/2021 05:03:39 - INFO - __main__ - Step 55740: {'lr': 0.0003542358316155452, 'samples': 10702080, 'steps': 55739, 'loss/train': 1.6511571407318115} -11/07/2021 05:03:39 - INFO - __main__ - Step 55741: {'lr': 0.00035423100811973453, 'samples': 10702272, 'steps': 55740, 'loss/train': 1.7982109785079956} -11/07/2021 05:03:40 - INFO - __main__ - Step 55742: {'lr': 0.00035422618457695893, 'samples': 10702464, 'steps': 55741, 'loss/train': 1.3135054111480713} -11/07/2021 05:03:40 - INFO - __main__ - Step 55743: {'lr': 0.0003542213609872207, 'samples': 10702656, 'steps': 55742, 'loss/train': 1.3639512062072754} -11/07/2021 05:03:41 - INFO - __main__ - Step 55744: {'lr': 0.0003542165373505219, 'samples': 10702848, 'steps': 55743, 'loss/train': 1.1558784246444702} -11/07/2021 05:03:42 - INFO - __main__ - Step 55745: {'lr': 0.0003542117136668647, 'samples': 10703040, 'steps': 55744, 'loss/train': 1.5514709949493408} -11/07/2021 05:03:42 - INFO - __main__ - Step 55746: {'lr': 0.0003542068899362514, 'samples': 10703232, 'steps': 55745, 'loss/train': 1.05830717086792} -11/07/2021 05:03:43 - INFO - __main__ - Step 55747: {'lr': 0.000354202066158684, 'samples': 10703424, 'steps': 55746, 'loss/train': 1.4797271490097046} -11/07/2021 05:03:43 - INFO - __main__ - Step 55748: {'lr': 0.0003541972423341648, 'samples': 10703616, 'steps': 55747, 'loss/train': 0.926233172416687} -11/07/2021 05:03:43 - INFO - __main__ - Step 55749: {'lr': 0.0003541924184626959, 'samples': 10703808, 'steps': 55748, 'loss/train': 1.4752252101898193} -11/07/2021 05:03:44 - INFO - __main__ - Step 55750: {'lr': 0.00035418759454427953, 'samples': 10704000, 'steps': 55749, 'loss/train': 1.860127329826355} -11/07/2021 05:03:45 - INFO - __main__ - Step 55751: {'lr': 0.00035418277057891776, 'samples': 10704192, 'steps': 55750, 'loss/train': 1.6169946193695068} -11/07/2021 05:03:45 - INFO - __main__ - Step 55752: {'lr': 0.00035417794656661297, 'samples': 10704384, 'steps': 55751, 'loss/train': 1.3335211277008057} -11/07/2021 05:03:45 - INFO - __main__ - Step 55753: {'lr': 0.0003541731225073671, 'samples': 10704576, 'steps': 55752, 'loss/train': 1.571130394935608} -11/07/2021 05:03:46 - INFO - __main__ - Step 55754: {'lr': 0.0003541682984011825, 'samples': 10704768, 'steps': 55753, 'loss/train': 1.1665571928024292} -11/07/2021 05:03:46 - INFO - __main__ - Step 55755: {'lr': 0.00035416347424806124, 'samples': 10704960, 'steps': 55754, 'loss/train': 1.2701736688613892} -11/07/2021 05:03:47 - INFO - __main__ - Step 55756: {'lr': 0.00035415865004800553, 'samples': 10705152, 'steps': 55755, 'loss/train': 1.2953274250030518} -11/07/2021 05:03:47 - INFO - __main__ - Step 55757: {'lr': 0.00035415382580101753, 'samples': 10705344, 'steps': 55756, 'loss/train': 1.617814302444458} -11/07/2021 05:03:48 - INFO - __main__ - Step 55758: {'lr': 0.00035414900150709946, 'samples': 10705536, 'steps': 55757, 'loss/train': 1.571497917175293} -11/07/2021 05:03:48 - INFO - __main__ - Step 55759: {'lr': 0.00035414417716625343, 'samples': 10705728, 'steps': 55758, 'loss/train': 1.2555686235427856} -11/07/2021 05:03:48 - INFO - __main__ - Step 55760: {'lr': 0.00035413935277848156, 'samples': 10705920, 'steps': 55759, 'loss/train': 1.4754409790039062} -11/07/2021 05:03:50 - INFO - __main__ - Step 55761: {'lr': 0.00035413452834378624, 'samples': 10706112, 'steps': 55760, 'loss/train': 1.7791800498962402} -11/07/2021 05:03:50 - INFO - __main__ - Step 55762: {'lr': 0.0003541297038621694, 'samples': 10706304, 'steps': 55761, 'loss/train': 1.4712127447128296} -11/07/2021 05:03:50 - INFO - __main__ - Step 55763: {'lr': 0.00035412487933363335, 'samples': 10706496, 'steps': 55762, 'loss/train': 0.13739466667175293} -11/07/2021 05:03:51 - INFO - __main__ - Step 55764: {'lr': 0.00035412005475818033, 'samples': 10706688, 'steps': 55763, 'loss/train': 1.9544419050216675} -11/07/2021 05:03:51 - INFO - __main__ - Step 55765: {'lr': 0.0003541152301358124, 'samples': 10706880, 'steps': 55764, 'loss/train': 1.2634907960891724} -11/07/2021 05:03:52 - INFO - __main__ - Step 55766: {'lr': 0.0003541104054665316, 'samples': 10707072, 'steps': 55765, 'loss/train': 1.4438755512237549} -11/07/2021 05:03:52 - INFO - __main__ - Step 55767: {'lr': 0.0003541055807503404, 'samples': 10707264, 'steps': 55766, 'loss/train': 1.4670195579528809} -11/07/2021 05:03:53 - INFO - __main__ - Step 55768: {'lr': 0.0003541007559872408, 'samples': 10707456, 'steps': 55767, 'loss/train': 1.658206820487976} -11/07/2021 05:03:53 - INFO - __main__ - Step 55769: {'lr': 0.000354095931177235, 'samples': 10707648, 'steps': 55768, 'loss/train': 1.565147876739502} -11/07/2021 05:03:53 - INFO - __main__ - Step 55770: {'lr': 0.0003540911063203252, 'samples': 10707840, 'steps': 55769, 'loss/train': 1.3767871856689453} -11/07/2021 05:03:54 - INFO - __main__ - Step 55771: {'lr': 0.00035408628141651356, 'samples': 10708032, 'steps': 55770, 'loss/train': 1.4693639278411865} -11/07/2021 05:03:55 - INFO - __main__ - Step 55772: {'lr': 0.0003540814564658022, 'samples': 10708224, 'steps': 55771, 'loss/train': 1.3036214113235474} -11/07/2021 05:03:55 - INFO - __main__ - Step 55773: {'lr': 0.00035407663146819337, 'samples': 10708416, 'steps': 55772, 'loss/train': 1.8937538862228394} -11/07/2021 05:03:55 - INFO - __main__ - Step 55774: {'lr': 0.0003540718064236892, 'samples': 10708608, 'steps': 55773, 'loss/train': 1.8074778318405151} -11/07/2021 05:03:56 - INFO - __main__ - Step 55775: {'lr': 0.0003540669813322919, 'samples': 10708800, 'steps': 55774, 'loss/train': 1.460472583770752} -11/07/2021 05:03:56 - INFO - __main__ - Step 55776: {'lr': 0.00035406215619400357, 'samples': 10708992, 'steps': 55775, 'loss/train': 1.9324228763580322} -11/07/2021 05:03:57 - INFO - __main__ - Step 55777: {'lr': 0.00035405733100882654, 'samples': 10709184, 'steps': 55776, 'loss/train': 1.4910401105880737} -11/07/2021 05:03:58 - INFO - __main__ - Step 55778: {'lr': 0.0003540525057767628, 'samples': 10709376, 'steps': 55777, 'loss/train': 1.679534912109375} -11/07/2021 05:03:58 - INFO - __main__ - Step 55779: {'lr': 0.0003540476804978146, 'samples': 10709568, 'steps': 55778, 'loss/train': 1.5839797258377075} -11/07/2021 05:03:58 - INFO - __main__ - Step 55780: {'lr': 0.00035404285517198417, 'samples': 10709760, 'steps': 55779, 'loss/train': 1.5468313694000244} -11/07/2021 05:03:59 - INFO - __main__ - Step 55781: {'lr': 0.00035403802979927355, 'samples': 10709952, 'steps': 55780, 'loss/train': 1.651582956314087} -11/07/2021 05:04:00 - INFO - __main__ - Step 55782: {'lr': 0.0003540332043796851, 'samples': 10710144, 'steps': 55781, 'loss/train': 1.212729811668396} -11/07/2021 05:04:00 - INFO - __main__ - Step 55783: {'lr': 0.00035402837891322083, 'samples': 10710336, 'steps': 55782, 'loss/train': 1.1240630149841309} -11/07/2021 05:04:00 - INFO - __main__ - Step 55784: {'lr': 0.00035402355339988307, 'samples': 10710528, 'steps': 55783, 'loss/train': 1.4452277421951294} -11/07/2021 05:04:01 - INFO - __main__ - Step 55785: {'lr': 0.00035401872783967384, 'samples': 10710720, 'steps': 55784, 'loss/train': 1.333119511604309} -11/07/2021 05:04:01 - INFO - __main__ - Step 55786: {'lr': 0.00035401390223259536, 'samples': 10710912, 'steps': 55785, 'loss/train': 1.4963150024414062} -11/07/2021 05:04:02 - INFO - __main__ - Step 55787: {'lr': 0.0003540090765786498, 'samples': 10711104, 'steps': 55786, 'loss/train': 1.3810827732086182} -11/07/2021 05:04:03 - INFO - __main__ - Step 55788: {'lr': 0.0003540042508778394, 'samples': 10711296, 'steps': 55787, 'loss/train': 6.768846035003662} -11/07/2021 05:04:03 - INFO - __main__ - Step 55789: {'lr': 0.00035399942513016623, 'samples': 10711488, 'steps': 55788, 'loss/train': 1.3474509716033936} -11/07/2021 05:04:03 - INFO - __main__ - Step 55790: {'lr': 0.0003539945993356326, 'samples': 10711680, 'steps': 55789, 'loss/train': 1.1473783254623413} -11/07/2021 05:04:04 - INFO - __main__ - Step 55791: {'lr': 0.0003539897734942406, 'samples': 10711872, 'steps': 55790, 'loss/train': 1.2376493215560913} -11/07/2021 05:04:04 - INFO - __main__ - Step 55792: {'lr': 0.00035398494760599243, 'samples': 10712064, 'steps': 55791, 'loss/train': 1.5866944789886475} -11/07/2021 05:04:05 - INFO - __main__ - Step 55793: {'lr': 0.00035398012167089016, 'samples': 10712256, 'steps': 55792, 'loss/train': 1.3174208402633667} -11/07/2021 05:04:05 - INFO - __main__ - Step 55794: {'lr': 0.0003539752956889361, 'samples': 10712448, 'steps': 55793, 'loss/train': 1.541314721107483} -11/07/2021 05:04:06 - INFO - __main__ - Step 55795: {'lr': 0.00035397046966013235, 'samples': 10712640, 'steps': 55794, 'loss/train': 1.03879714012146} -11/07/2021 05:04:06 - INFO - __main__ - Step 55796: {'lr': 0.00035396564358448115, 'samples': 10712832, 'steps': 55795, 'loss/train': 1.6715527772903442} -11/07/2021 05:04:06 - INFO - __main__ - Step 55797: {'lr': 0.00035396081746198467, 'samples': 10713024, 'steps': 55796, 'loss/train': 0.9951236844062805} -11/07/2021 05:04:08 - INFO - __main__ - Step 55798: {'lr': 0.000353955991292645, 'samples': 10713216, 'steps': 55797, 'loss/train': 1.7825127840042114} -11/07/2021 05:04:08 - INFO - __main__ - Step 55799: {'lr': 0.00035395116507646435, 'samples': 10713408, 'steps': 55798, 'loss/train': 1.3425874710083008} -11/07/2021 05:04:08 - INFO - __main__ - Step 55800: {'lr': 0.00035394633881344497, 'samples': 10713600, 'steps': 55799, 'loss/train': 1.4844225645065308} -11/07/2021 05:04:09 - INFO - __main__ - Step 55801: {'lr': 0.00035394151250358886, 'samples': 10713792, 'steps': 55800, 'loss/train': 1.30772066116333} -11/07/2021 05:04:09 - INFO - __main__ - Step 55802: {'lr': 0.00035393668614689837, 'samples': 10713984, 'steps': 55801, 'loss/train': 1.5883336067199707} -11/07/2021 05:04:09 - INFO - __main__ - Step 55803: {'lr': 0.00035393185974337565, 'samples': 10714176, 'steps': 55802, 'loss/train': 1.5440160036087036} -11/07/2021 05:04:10 - INFO - __main__ - Step 55804: {'lr': 0.0003539270332930228, 'samples': 10714368, 'steps': 55803, 'loss/train': 1.5361167192459106} -11/07/2021 05:04:11 - INFO - __main__ - Step 55805: {'lr': 0.00035392220679584206, 'samples': 10714560, 'steps': 55804, 'loss/train': 0.9911054372787476} -11/07/2021 05:04:11 - INFO - __main__ - Step 55806: {'lr': 0.0003539173802518356, 'samples': 10714752, 'steps': 55805, 'loss/train': 1.6084593534469604} -11/07/2021 05:04:12 - INFO - __main__ - Step 55807: {'lr': 0.0003539125536610055, 'samples': 10714944, 'steps': 55806, 'loss/train': 0.6804617643356323} -11/07/2021 05:04:12 - INFO - __main__ - Step 55808: {'lr': 0.00035390772702335405, 'samples': 10715136, 'steps': 55807, 'loss/train': 1.5012800693511963} -11/07/2021 05:04:13 - INFO - __main__ - Step 55809: {'lr': 0.0003539029003388833, 'samples': 10715328, 'steps': 55808, 'loss/train': 1.6742792129516602} -11/07/2021 05:04:13 - INFO - __main__ - Step 55810: {'lr': 0.0003538980736075956, 'samples': 10715520, 'steps': 55809, 'loss/train': 1.4297534227371216} -11/07/2021 05:04:14 - INFO - __main__ - Step 55811: {'lr': 0.0003538932468294931, 'samples': 10715712, 'steps': 55810, 'loss/train': 1.3954731225967407} -11/07/2021 05:04:14 - INFO - __main__ - Step 55812: {'lr': 0.0003538884200045778, 'samples': 10715904, 'steps': 55811, 'loss/train': 1.2371412515640259} -11/07/2021 05:04:14 - INFO - __main__ - Step 55813: {'lr': 0.00035388359313285196, 'samples': 10716096, 'steps': 55812, 'loss/train': 1.278853178024292} -11/07/2021 05:04:15 - INFO - __main__ - Step 55814: {'lr': 0.0003538787662143178, 'samples': 10716288, 'steps': 55813, 'loss/train': 1.3808411359786987} -11/07/2021 05:04:16 - INFO - __main__ - Step 55815: {'lr': 0.00035387393924897747, 'samples': 10716480, 'steps': 55814, 'loss/train': 1.3120583295822144} -11/07/2021 05:04:16 - INFO - __main__ - Step 55816: {'lr': 0.0003538691122368332, 'samples': 10716672, 'steps': 55815, 'loss/train': 1.2973705530166626} -11/07/2021 05:04:16 - INFO - __main__ - Step 55817: {'lr': 0.00035386428517788707, 'samples': 10716864, 'steps': 55816, 'loss/train': 1.9615147113800049} -11/07/2021 05:04:17 - INFO - __main__ - Step 55818: {'lr': 0.00035385945807214124, 'samples': 10717056, 'steps': 55817, 'loss/train': 1.3233554363250732} -11/07/2021 05:04:18 - INFO - __main__ - Step 55819: {'lr': 0.000353854630919598, 'samples': 10717248, 'steps': 55818, 'loss/train': 1.0138968229293823} -11/07/2021 05:04:18 - INFO - __main__ - Step 55820: {'lr': 0.0003538498037202595, 'samples': 10717440, 'steps': 55819, 'loss/train': 1.7565664052963257} -11/07/2021 05:04:18 - INFO - __main__ - Step 55821: {'lr': 0.0003538449764741278, 'samples': 10717632, 'steps': 55820, 'loss/train': 1.3925102949142456} -11/07/2021 05:04:19 - INFO - __main__ - Step 55822: {'lr': 0.00035384014918120527, 'samples': 10717824, 'steps': 55821, 'loss/train': 1.0944126844406128} -11/07/2021 05:04:19 - INFO - __main__ - Step 55823: {'lr': 0.00035383532184149393, 'samples': 10718016, 'steps': 55822, 'loss/train': 1.1503760814666748} -11/07/2021 05:04:20 - INFO - __main__ - Step 55824: {'lr': 0.00035383049445499596, 'samples': 10718208, 'steps': 55823, 'loss/train': 1.5366030931472778} -11/07/2021 05:04:20 - INFO - __main__ - Step 55825: {'lr': 0.0003538256670217135, 'samples': 10718400, 'steps': 55824, 'loss/train': 1.2309882640838623} -11/07/2021 05:04:21 - INFO - __main__ - Step 55826: {'lr': 0.0003538208395416489, 'samples': 10718592, 'steps': 55825, 'loss/train': 1.2972712516784668} -11/07/2021 05:04:21 - INFO - __main__ - Step 55827: {'lr': 0.00035381601201480426, 'samples': 10718784, 'steps': 55826, 'loss/train': 1.76887845993042} -11/07/2021 05:04:21 - INFO - __main__ - Step 55828: {'lr': 0.00035381118444118167, 'samples': 10718976, 'steps': 55827, 'loss/train': 0.9605786204338074} -11/07/2021 05:04:23 - INFO - __main__ - Step 55829: {'lr': 0.00035380635682078334, 'samples': 10719168, 'steps': 55828, 'loss/train': 1.267890453338623} -11/07/2021 05:04:23 - INFO - __main__ - Step 55830: {'lr': 0.00035380152915361144, 'samples': 10719360, 'steps': 55829, 'loss/train': 1.2921608686447144} -11/07/2021 05:04:23 - INFO - __main__ - Step 55831: {'lr': 0.00035379670143966826, 'samples': 10719552, 'steps': 55830, 'loss/train': 2.0029077529907227} -11/07/2021 05:04:24 - INFO - __main__ - Step 55832: {'lr': 0.00035379187367895584, 'samples': 10719744, 'steps': 55831, 'loss/train': 1.0866672992706299} -11/07/2021 05:04:24 - INFO - __main__ - Step 55833: {'lr': 0.0003537870458714765, 'samples': 10719936, 'steps': 55832, 'loss/train': 0.10541039705276489} -11/07/2021 05:04:25 - INFO - __main__ - Step 55834: {'lr': 0.0003537822180172322, 'samples': 10720128, 'steps': 55833, 'loss/train': 1.5007840394973755} -11/07/2021 05:04:25 - INFO - __main__ - Step 55835: {'lr': 0.00035377739011622524, 'samples': 10720320, 'steps': 55834, 'loss/train': 1.2568243741989136} -11/07/2021 05:04:26 - INFO - __main__ - Step 55836: {'lr': 0.0003537725621684578, 'samples': 10720512, 'steps': 55835, 'loss/train': 1.7705588340759277} -11/07/2021 05:04:26 - INFO - __main__ - Step 55837: {'lr': 0.0003537677341739321, 'samples': 10720704, 'steps': 55836, 'loss/train': 1.0530240535736084} -11/07/2021 05:04:26 - INFO - __main__ - Step 55838: {'lr': 0.0003537629061326503, 'samples': 10720896, 'steps': 55837, 'loss/train': 0.9166146516799927} -11/07/2021 05:04:28 - INFO - __main__ - Step 55839: {'lr': 0.0003537580780446144, 'samples': 10721088, 'steps': 55838, 'loss/train': 1.3045827150344849} -11/07/2021 05:04:28 - INFO - __main__ - Step 55840: {'lr': 0.0003537532499098268, 'samples': 10721280, 'steps': 55839, 'loss/train': 1.0616631507873535} -11/07/2021 05:04:28 - INFO - __main__ - Step 55841: {'lr': 0.0003537484217282895, 'samples': 10721472, 'steps': 55840, 'loss/train': 1.56183922290802} -11/07/2021 05:04:29 - INFO - __main__ - Step 55842: {'lr': 0.00035374359350000484, 'samples': 10721664, 'steps': 55841, 'loss/train': 1.5610754489898682} -11/07/2021 05:04:29 - INFO - __main__ - Step 55843: {'lr': 0.0003537387652249749, 'samples': 10721856, 'steps': 55842, 'loss/train': 0.9415774941444397} -11/07/2021 05:04:30 - INFO - __main__ - Step 55844: {'lr': 0.0003537339369032019, 'samples': 10722048, 'steps': 55843, 'loss/train': 1.4559112787246704} -11/07/2021 05:04:30 - INFO - __main__ - Step 55845: {'lr': 0.0003537291085346879, 'samples': 10722240, 'steps': 55844, 'loss/train': 0.9914204478263855} -11/07/2021 05:04:31 - INFO - __main__ - Step 55846: {'lr': 0.0003537242801194353, 'samples': 10722432, 'steps': 55845, 'loss/train': 1.1230731010437012} -11/07/2021 05:04:31 - INFO - __main__ - Step 55847: {'lr': 0.000353719451657446, 'samples': 10722624, 'steps': 55846, 'loss/train': 2.628389596939087} -11/07/2021 05:04:31 - INFO - __main__ - Step 55848: {'lr': 0.0003537146231487224, 'samples': 10722816, 'steps': 55847, 'loss/train': 1.2518551349639893} -11/07/2021 05:04:32 - INFO - __main__ - Step 55849: {'lr': 0.0003537097945932666, 'samples': 10723008, 'steps': 55848, 'loss/train': 1.021565318107605} -11/07/2021 05:04:33 - INFO - __main__ - Step 55850: {'lr': 0.00035370496599108073, 'samples': 10723200, 'steps': 55849, 'loss/train': 1.3686603307724} -11/07/2021 05:04:33 - INFO - __main__ - Step 55851: {'lr': 0.00035370013734216697, 'samples': 10723392, 'steps': 55850, 'loss/train': 1.6993813514709473} -11/07/2021 05:04:34 - INFO - __main__ - Step 55852: {'lr': 0.0003536953086465276, 'samples': 10723584, 'steps': 55851, 'loss/train': 1.298002004623413} -11/07/2021 05:04:34 - INFO - __main__ - Step 55853: {'lr': 0.0003536904799041647, 'samples': 10723776, 'steps': 55852, 'loss/train': 1.31694495677948} -11/07/2021 05:04:35 - INFO - __main__ - Step 55854: {'lr': 0.00035368565111508043, 'samples': 10723968, 'steps': 55853, 'loss/train': 1.5860368013381958} -11/07/2021 05:04:35 - INFO - __main__ - Step 55855: {'lr': 0.000353680822279277, 'samples': 10724160, 'steps': 55854, 'loss/train': 1.274109959602356} -11/07/2021 05:04:36 - INFO - __main__ - Step 55856: {'lr': 0.00035367599339675664, 'samples': 10724352, 'steps': 55855, 'loss/train': 0.953221321105957} -11/07/2021 05:04:36 - INFO - __main__ - Step 55857: {'lr': 0.0003536711644675215, 'samples': 10724544, 'steps': 55856, 'loss/train': 1.5896235704421997} -11/07/2021 05:04:36 - INFO - __main__ - Step 55858: {'lr': 0.0003536663354915737, 'samples': 10724736, 'steps': 55857, 'loss/train': 0.6878846287727356} -11/07/2021 05:04:38 - INFO - __main__ - Step 55859: {'lr': 0.00035366150646891543, 'samples': 10724928, 'steps': 55858, 'loss/train': 1.3998024463653564} -11/07/2021 05:04:38 - INFO - __main__ - Step 55860: {'lr': 0.0003536566773995489, 'samples': 10725120, 'steps': 55859, 'loss/train': 1.8037703037261963} -11/07/2021 05:04:38 - INFO - __main__ - Step 55861: {'lr': 0.0003536518482834763, 'samples': 10725312, 'steps': 55860, 'loss/train': 2.0232062339782715} -11/07/2021 05:04:39 - INFO - __main__ - Step 55862: {'lr': 0.0003536470191206997, 'samples': 10725504, 'steps': 55861, 'loss/train': 1.6955820322036743} -11/07/2021 05:04:39 - INFO - __main__ - Step 55863: {'lr': 0.00035364218991122145, 'samples': 10725696, 'steps': 55862, 'loss/train': 1.434757113456726} -11/07/2021 05:04:40 - INFO - __main__ - Step 55864: {'lr': 0.00035363736065504355, 'samples': 10725888, 'steps': 55863, 'loss/train': 1.400452971458435} -11/07/2021 05:04:40 - INFO - __main__ - Step 55865: {'lr': 0.0003536325313521683, 'samples': 10726080, 'steps': 55864, 'loss/train': 1.664194107055664} -11/07/2021 05:04:41 - INFO - __main__ - Step 55866: {'lr': 0.0003536277020025978, 'samples': 10726272, 'steps': 55865, 'loss/train': 1.6159415245056152} -11/07/2021 05:04:41 - INFO - __main__ - Step 55867: {'lr': 0.0003536228726063343, 'samples': 10726464, 'steps': 55866, 'loss/train': 0.9347060322761536} -11/07/2021 05:04:41 - INFO - __main__ - Step 55868: {'lr': 0.00035361804316337987, 'samples': 10726656, 'steps': 55867, 'loss/train': 1.5989532470703125} -11/07/2021 05:04:42 - INFO - __main__ - Step 55869: {'lr': 0.00035361321367373676, 'samples': 10726848, 'steps': 55868, 'loss/train': 1.2443060874938965} -11/07/2021 05:04:43 - INFO - __main__ - Step 55870: {'lr': 0.00035360838413740715, 'samples': 10727040, 'steps': 55869, 'loss/train': 1.1219351291656494} -11/07/2021 05:04:43 - INFO - __main__ - Step 55871: {'lr': 0.0003536035545543933, 'samples': 10727232, 'steps': 55870, 'loss/train': 0.5671005249023438} -11/07/2021 05:04:43 - INFO - __main__ - Step 55872: {'lr': 0.00035359872492469715, 'samples': 10727424, 'steps': 55871, 'loss/train': 1.500485897064209} -11/07/2021 05:04:44 - INFO - __main__ - Step 55873: {'lr': 0.0003535938952483211, 'samples': 10727616, 'steps': 55872, 'loss/train': 1.4232797622680664} -11/07/2021 05:04:45 - INFO - __main__ - Step 55874: {'lr': 0.00035358906552526714, 'samples': 10727808, 'steps': 55873, 'loss/train': 1.3123780488967896} -11/07/2021 05:04:45 - INFO - __main__ - Step 55875: {'lr': 0.0003535842357555376, 'samples': 10728000, 'steps': 55874, 'loss/train': 1.4959659576416016} -11/07/2021 05:04:46 - INFO - __main__ - Step 55876: {'lr': 0.0003535794059391346, 'samples': 10728192, 'steps': 55875, 'loss/train': 1.2305139303207397} -11/07/2021 05:04:46 - INFO - __main__ - Step 55877: {'lr': 0.00035357457607606034, 'samples': 10728384, 'steps': 55876, 'loss/train': 1.3052294254302979} -11/07/2021 05:04:46 - INFO - __main__ - Step 55878: {'lr': 0.00035356974616631697, 'samples': 10728576, 'steps': 55877, 'loss/train': 1.7017009258270264} -11/07/2021 05:04:47 - INFO - __main__ - Step 55879: {'lr': 0.00035356491620990667, 'samples': 10728768, 'steps': 55878, 'loss/train': 1.325434923171997} -11/07/2021 05:04:48 - INFO - __main__ - Step 55880: {'lr': 0.0003535600862068316, 'samples': 10728960, 'steps': 55879, 'loss/train': 1.3903403282165527} -11/07/2021 05:04:48 - INFO - __main__ - Step 55881: {'lr': 0.00035355525615709393, 'samples': 10729152, 'steps': 55880, 'loss/train': 1.5887025594711304} -11/07/2021 05:04:49 - INFO - __main__ - Step 55882: {'lr': 0.0003535504260606959, 'samples': 10729344, 'steps': 55881, 'loss/train': 1.132631778717041} -11/07/2021 05:04:49 - INFO - __main__ - Step 55883: {'lr': 0.00035354559591763965, 'samples': 10729536, 'steps': 55882, 'loss/train': 1.4556214809417725} -11/07/2021 05:04:49 - INFO - __main__ - Step 55884: {'lr': 0.0003535407657279273, 'samples': 10729728, 'steps': 55883, 'loss/train': 1.1831425428390503} -11/07/2021 05:04:50 - INFO - __main__ - Step 55885: {'lr': 0.00035353593549156115, 'samples': 10729920, 'steps': 55884, 'loss/train': 1.3290823698043823} -11/07/2021 05:04:51 - INFO - __main__ - Step 55886: {'lr': 0.00035353110520854324, 'samples': 10730112, 'steps': 55885, 'loss/train': 1.6130807399749756} -11/07/2021 05:04:51 - INFO - __main__ - Step 55887: {'lr': 0.0003535262748788759, 'samples': 10730304, 'steps': 55886, 'loss/train': 1.4945546388626099} -11/07/2021 05:04:51 - INFO - __main__ - Step 55888: {'lr': 0.00035352144450256115, 'samples': 10730496, 'steps': 55887, 'loss/train': 1.2880640029907227} -11/07/2021 05:04:52 - INFO - __main__ - Step 55889: {'lr': 0.00035351661407960125, 'samples': 10730688, 'steps': 55888, 'loss/train': 1.4798877239227295} -11/07/2021 05:04:53 - INFO - __main__ - Step 55890: {'lr': 0.0003535117836099983, 'samples': 10730880, 'steps': 55889, 'loss/train': 1.4757639169692993} -11/07/2021 05:04:53 - INFO - __main__ - Step 55891: {'lr': 0.00035350695309375465, 'samples': 10731072, 'steps': 55890, 'loss/train': 1.1573599576950073} -11/07/2021 05:04:53 - INFO - __main__ - Step 55892: {'lr': 0.00035350212253087233, 'samples': 10731264, 'steps': 55891, 'loss/train': 1.365740180015564} -11/07/2021 05:04:54 - INFO - __main__ - Step 55893: {'lr': 0.0003534972919213535, 'samples': 10731456, 'steps': 55892, 'loss/train': 1.3830736875534058} -11/07/2021 05:04:54 - INFO - __main__ - Step 55894: {'lr': 0.0003534924612652004, 'samples': 10731648, 'steps': 55893, 'loss/train': 1.2669957876205444} -11/07/2021 05:04:55 - INFO - __main__ - Step 55895: {'lr': 0.00035348763056241515, 'samples': 10731840, 'steps': 55894, 'loss/train': 1.4290146827697754} -11/07/2021 05:04:55 - INFO - __main__ - Step 55896: {'lr': 0.0003534827998130001, 'samples': 10732032, 'steps': 55895, 'loss/train': 1.075005292892456} -11/07/2021 05:04:56 - INFO - __main__ - Step 55897: {'lr': 0.00035347796901695716, 'samples': 10732224, 'steps': 55896, 'loss/train': 1.3419417142868042} -11/07/2021 05:04:56 - INFO - __main__ - Step 55898: {'lr': 0.0003534731381742888, 'samples': 10732416, 'steps': 55897, 'loss/train': 1.0262254476547241} -11/07/2021 05:04:56 - INFO - __main__ - Step 55899: {'lr': 0.0003534683072849969, 'samples': 10732608, 'steps': 55898, 'loss/train': 1.3884958028793335} -11/07/2021 05:04:57 - INFO - __main__ - Step 55900: {'lr': 0.0003534634763490838, 'samples': 10732800, 'steps': 55899, 'loss/train': 1.6960127353668213} -11/07/2021 05:04:58 - INFO - __main__ - Step 55901: {'lr': 0.0003534586453665517, 'samples': 10732992, 'steps': 55900, 'loss/train': 1.274144172668457} -11/07/2021 05:04:58 - INFO - __main__ - Step 55902: {'lr': 0.00035345381433740273, 'samples': 10733184, 'steps': 55901, 'loss/train': 1.7366596460342407} -11/07/2021 05:04:59 - INFO - __main__ - Step 55903: {'lr': 0.00035344898326163907, 'samples': 10733376, 'steps': 55902, 'loss/train': 1.1894418001174927} -11/07/2021 05:04:59 - INFO - __main__ - Step 55904: {'lr': 0.00035344415213926284, 'samples': 10733568, 'steps': 55903, 'loss/train': 1.2441020011901855} -11/07/2021 05:05:00 - INFO - __main__ - Step 55905: {'lr': 0.0003534393209702764, 'samples': 10733760, 'steps': 55904, 'loss/train': 0.24876174330711365} -11/07/2021 05:05:00 - INFO - __main__ - Step 55906: {'lr': 0.0003534344897546816, 'samples': 10733952, 'steps': 55905, 'loss/train': 1.4499990940093994} -11/07/2021 05:05:01 - INFO - __main__ - Step 55907: {'lr': 0.00035342965849248097, 'samples': 10734144, 'steps': 55906, 'loss/train': 1.3530652523040771} -11/07/2021 05:05:01 - INFO - __main__ - Step 55908: {'lr': 0.00035342482718367645, 'samples': 10734336, 'steps': 55907, 'loss/train': 0.10861533880233765} -11/07/2021 05:05:01 - INFO - __main__ - Step 55909: {'lr': 0.0003534199958282703, 'samples': 10734528, 'steps': 55908, 'loss/train': 1.851309895515442} -11/07/2021 05:05:02 - INFO - __main__ - Step 55910: {'lr': 0.00035341516442626475, 'samples': 10734720, 'steps': 55909, 'loss/train': 1.528367519378662} -11/07/2021 05:05:03 - INFO - __main__ - Step 55911: {'lr': 0.0003534103329776619, 'samples': 10734912, 'steps': 55910, 'loss/train': 1.3974149227142334} -11/07/2021 05:05:03 - INFO - __main__ - Step 55912: {'lr': 0.000353405501482464, 'samples': 10735104, 'steps': 55911, 'loss/train': 1.1010369062423706} -11/07/2021 05:05:04 - INFO - __main__ - Step 55913: {'lr': 0.0003534006699406731, 'samples': 10735296, 'steps': 55912, 'loss/train': 1.5172953605651855} -11/07/2021 05:05:04 - INFO - __main__ - Step 55914: {'lr': 0.0003533958383522915, 'samples': 10735488, 'steps': 55913, 'loss/train': 1.2249624729156494} -11/07/2021 05:05:05 - INFO - __main__ - Step 55915: {'lr': 0.0003533910067173213, 'samples': 10735680, 'steps': 55914, 'loss/train': 1.1259907484054565} -11/07/2021 05:05:05 - INFO - __main__ - Step 55916: {'lr': 0.0003533861750357647, 'samples': 10735872, 'steps': 55915, 'loss/train': 1.15132737159729} -11/07/2021 05:05:06 - INFO - __main__ - Step 55917: {'lr': 0.0003533813433076239, 'samples': 10736064, 'steps': 55916, 'loss/train': 1.443205714225769} -11/07/2021 05:05:06 - INFO - __main__ - Step 55918: {'lr': 0.00035337651153290113, 'samples': 10736256, 'steps': 55917, 'loss/train': 1.978428602218628} -11/07/2021 05:05:06 - INFO - __main__ - Step 55919: {'lr': 0.00035337167971159837, 'samples': 10736448, 'steps': 55918, 'loss/train': 1.5240490436553955} -11/07/2021 05:05:07 - INFO - __main__ - Step 55920: {'lr': 0.000353366847843718, 'samples': 10736640, 'steps': 55919, 'loss/train': 1.230600357055664} -11/07/2021 05:05:08 - INFO - __main__ - Step 55921: {'lr': 0.0003533620159292621, 'samples': 10736832, 'steps': 55920, 'loss/train': 1.642690896987915} -11/07/2021 05:05:08 - INFO - __main__ - Step 55922: {'lr': 0.0003533571839682329, 'samples': 10737024, 'steps': 55921, 'loss/train': 1.8003747463226318} -11/07/2021 05:05:09 - INFO - __main__ - Step 55923: {'lr': 0.00035335235196063254, 'samples': 10737216, 'steps': 55922, 'loss/train': 0.1256265640258789} -11/07/2021 05:05:09 - INFO - __main__ - Step 55924: {'lr': 0.0003533475199064632, 'samples': 10737408, 'steps': 55923, 'loss/train': 1.00397527217865} -11/07/2021 05:05:09 - INFO - __main__ - Step 55925: {'lr': 0.00035334268780572707, 'samples': 10737600, 'steps': 55924, 'loss/train': 1.1774753332138062} -11/07/2021 05:05:10 - INFO - __main__ - Step 55926: {'lr': 0.0003533378556584263, 'samples': 10737792, 'steps': 55925, 'loss/train': 1.18112051486969} -11/07/2021 05:05:11 - INFO - __main__ - Step 55927: {'lr': 0.0003533330234645631, 'samples': 10737984, 'steps': 55926, 'loss/train': 1.4713926315307617} -11/07/2021 05:05:11 - INFO - __main__ - Step 55928: {'lr': 0.00035332819122413963, 'samples': 10738176, 'steps': 55927, 'loss/train': 1.5009284019470215} -11/07/2021 05:05:11 - INFO - __main__ - Step 55929: {'lr': 0.00035332335893715805, 'samples': 10738368, 'steps': 55928, 'loss/train': 1.3760688304901123} -11/07/2021 05:05:12 - INFO - __main__ - Step 55930: {'lr': 0.00035331852660362055, 'samples': 10738560, 'steps': 55929, 'loss/train': 1.3465180397033691} -11/07/2021 05:05:13 - INFO - __main__ - Step 55931: {'lr': 0.00035331369422352937, 'samples': 10738752, 'steps': 55930, 'loss/train': 1.4027389287948608} -11/07/2021 05:05:13 - INFO - __main__ - Step 55932: {'lr': 0.00035330886179688666, 'samples': 10738944, 'steps': 55931, 'loss/train': 1.3508884906768799} -11/07/2021 05:05:13 - INFO - __main__ - Step 55933: {'lr': 0.0003533040293236945, 'samples': 10739136, 'steps': 55932, 'loss/train': 1.6447728872299194} -11/07/2021 05:05:14 - INFO - __main__ - Step 55934: {'lr': 0.0003532991968039552, 'samples': 10739328, 'steps': 55933, 'loss/train': 1.617796540260315} -11/07/2021 05:05:14 - INFO - __main__ - Step 55935: {'lr': 0.0003532943642376708, 'samples': 10739520, 'steps': 55934, 'loss/train': 0.9896909594535828} -11/07/2021 05:05:15 - INFO - __main__ - Step 55936: {'lr': 0.00035328953162484355, 'samples': 10739712, 'steps': 55935, 'loss/train': 0.7301599383354187} -11/07/2021 05:05:16 - INFO - __main__ - Step 55937: {'lr': 0.00035328469896547566, 'samples': 10739904, 'steps': 55936, 'loss/train': 1.390870213508606} -11/07/2021 05:05:16 - INFO - __main__ - Step 55938: {'lr': 0.0003532798662595693, 'samples': 10740096, 'steps': 55937, 'loss/train': 1.366762399673462} -11/07/2021 05:05:16 - INFO - __main__ - Step 55939: {'lr': 0.00035327503350712666, 'samples': 10740288, 'steps': 55938, 'loss/train': 1.447092890739441} -11/07/2021 05:05:17 - INFO - __main__ - Step 55940: {'lr': 0.0003532702007081498, 'samples': 10740480, 'steps': 55939, 'loss/train': 1.8277941942214966} -11/07/2021 05:05:18 - INFO - __main__ - Step 55941: {'lr': 0.000353265367862641, 'samples': 10740672, 'steps': 55940, 'loss/train': 1.4005780220031738} -11/07/2021 05:05:18 - INFO - __main__ - Step 55942: {'lr': 0.0003532605349706025, 'samples': 10740864, 'steps': 55941, 'loss/train': 1.4999957084655762} -11/07/2021 05:05:18 - INFO - __main__ - Step 55943: {'lr': 0.00035325570203203626, 'samples': 10741056, 'steps': 55942, 'loss/train': 1.7539501190185547} -11/07/2021 05:05:19 - INFO - __main__ - Step 55944: {'lr': 0.0003532508690469447, 'samples': 10741248, 'steps': 55943, 'loss/train': 1.5305148363113403} -11/07/2021 05:05:19 - INFO - __main__ - Step 55945: {'lr': 0.0003532460360153299, 'samples': 10741440, 'steps': 55944, 'loss/train': 1.5526245832443237} -11/07/2021 05:05:20 - INFO - __main__ - Step 55946: {'lr': 0.000353241202937194, 'samples': 10741632, 'steps': 55945, 'loss/train': 1.1486482620239258} -11/07/2021 05:05:21 - INFO - __main__ - Step 55947: {'lr': 0.00035323636981253914, 'samples': 10741824, 'steps': 55946, 'loss/train': 1.5427560806274414} -11/07/2021 05:05:21 - INFO - __main__ - Step 55948: {'lr': 0.00035323153664136765, 'samples': 10742016, 'steps': 55947, 'loss/train': 1.8074579238891602} -11/07/2021 05:05:21 - INFO - __main__ - Step 55949: {'lr': 0.00035322670342368155, 'samples': 10742208, 'steps': 55948, 'loss/train': 1.2773897647857666} -11/07/2021 05:05:22 - INFO - __main__ - Step 55950: {'lr': 0.0003532218701594832, 'samples': 10742400, 'steps': 55949, 'loss/train': 1.4659587144851685} -11/07/2021 05:05:22 - INFO - __main__ - Step 55951: {'lr': 0.0003532170368487746, 'samples': 10742592, 'steps': 55950, 'loss/train': 1.7059035301208496} -11/07/2021 05:05:23 - INFO - __main__ - Step 55952: {'lr': 0.00035321220349155796, 'samples': 10742784, 'steps': 55951, 'loss/train': 1.6169774532318115} -11/07/2021 05:05:24 - INFO - __main__ - Step 55953: {'lr': 0.00035320737008783556, 'samples': 10742976, 'steps': 55952, 'loss/train': 1.169887661933899} -11/07/2021 05:05:24 - INFO - __main__ - Step 55954: {'lr': 0.0003532025366376095, 'samples': 10743168, 'steps': 55953, 'loss/train': 1.4586212635040283} -11/07/2021 05:05:24 - INFO - __main__ - Step 55955: {'lr': 0.0003531977031408819, 'samples': 10743360, 'steps': 55954, 'loss/train': 1.5239309072494507} -11/07/2021 05:05:25 - INFO - __main__ - Step 55956: {'lr': 0.0003531928695976551, 'samples': 10743552, 'steps': 55955, 'loss/train': 1.4125745296478271} -11/07/2021 05:05:25 - INFO - __main__ - Step 55957: {'lr': 0.00035318803600793117, 'samples': 10743744, 'steps': 55956, 'loss/train': 1.0789803266525269} -11/07/2021 05:05:26 - INFO - __main__ - Step 55958: {'lr': 0.00035318320237171224, 'samples': 10743936, 'steps': 55957, 'loss/train': 1.5693883895874023} -11/07/2021 05:05:26 - INFO - __main__ - Step 55959: {'lr': 0.0003531783686890006, 'samples': 10744128, 'steps': 55958, 'loss/train': 1.3762418031692505} -11/07/2021 05:05:27 - INFO - __main__ - Step 55960: {'lr': 0.0003531735349597984, 'samples': 10744320, 'steps': 55959, 'loss/train': 0.825796902179718} -11/07/2021 05:05:27 - INFO - __main__ - Step 55961: {'lr': 0.0003531687011841077, 'samples': 10744512, 'steps': 55960, 'loss/train': 1.4723906517028809} -11/07/2021 05:05:27 - INFO - __main__ - Step 55962: {'lr': 0.0003531638673619309, 'samples': 10744704, 'steps': 55961, 'loss/train': 1.387729525566101} -11/07/2021 05:05:28 - INFO - __main__ - Step 55963: {'lr': 0.00035315903349327, 'samples': 10744896, 'steps': 55962, 'loss/train': 1.4891746044158936} -11/07/2021 05:05:29 - INFO - __main__ - Step 55964: {'lr': 0.00035315419957812725, 'samples': 10745088, 'steps': 55963, 'loss/train': 1.6799993515014648} -11/07/2021 05:05:29 - INFO - __main__ - Step 55965: {'lr': 0.0003531493656165047, 'samples': 10745280, 'steps': 55964, 'loss/train': 1.3721928596496582} -11/07/2021 05:05:29 - INFO - __main__ - Step 55966: {'lr': 0.00035314453160840476, 'samples': 10745472, 'steps': 55965, 'loss/train': 1.483290433883667} -11/07/2021 05:05:30 - INFO - __main__ - Step 55967: {'lr': 0.00035313969755382946, 'samples': 10745664, 'steps': 55966, 'loss/train': 1.7456120252609253} -11/07/2021 05:05:31 - INFO - __main__ - Step 55968: {'lr': 0.000353134863452781, 'samples': 10745856, 'steps': 55967, 'loss/train': 1.7259849309921265} -11/07/2021 05:05:31 - INFO - __main__ - Step 55969: {'lr': 0.00035313002930526156, 'samples': 10746048, 'steps': 55968, 'loss/train': 0.07837814092636108} -11/07/2021 05:05:31 - INFO - __main__ - Step 55970: {'lr': 0.00035312519511127325, 'samples': 10746240, 'steps': 55969, 'loss/train': 1.245185375213623} -11/07/2021 05:05:32 - INFO - __main__ - Step 55971: {'lr': 0.0003531203608708184, 'samples': 10746432, 'steps': 55970, 'loss/train': 0.6822187900543213} -11/07/2021 05:05:32 - INFO - __main__ - Step 55972: {'lr': 0.00035311552658389914, 'samples': 10746624, 'steps': 55971, 'loss/train': 0.39193999767303467} -11/07/2021 05:05:33 - INFO - __main__ - Step 55973: {'lr': 0.00035311069225051755, 'samples': 10746816, 'steps': 55972, 'loss/train': 1.1932096481323242} -11/07/2021 05:05:34 - INFO - __main__ - Step 55974: {'lr': 0.0003531058578706759, 'samples': 10747008, 'steps': 55973, 'loss/train': 1.864783525466919} -11/07/2021 05:05:34 - INFO - __main__ - Step 55975: {'lr': 0.00035310102344437636, 'samples': 10747200, 'steps': 55974, 'loss/train': 1.5394617319107056} -11/07/2021 05:05:34 - INFO - __main__ - Step 55976: {'lr': 0.00035309618897162097, 'samples': 10747392, 'steps': 55975, 'loss/train': 2.1839776039123535} -11/07/2021 05:05:35 - INFO - __main__ - Step 55977: {'lr': 0.0003530913544524121, 'samples': 10747584, 'steps': 55976, 'loss/train': 1.5453792810440063} -11/07/2021 05:05:35 - INFO - __main__ - Step 55978: {'lr': 0.00035308651988675194, 'samples': 10747776, 'steps': 55977, 'loss/train': 1.2105815410614014} -11/07/2021 05:05:36 - INFO - __main__ - Step 55979: {'lr': 0.0003530816852746426, 'samples': 10747968, 'steps': 55978, 'loss/train': 1.77792489528656} -11/07/2021 05:05:37 - INFO - __main__ - Step 55980: {'lr': 0.00035307685061608605, 'samples': 10748160, 'steps': 55979, 'loss/train': 1.562185287475586} -11/07/2021 05:05:37 - INFO - __main__ - Step 55981: {'lr': 0.00035307201591108485, 'samples': 10748352, 'steps': 55980, 'loss/train': 0.111997589468956} -11/07/2021 05:05:37 - INFO - __main__ - Step 55982: {'lr': 0.0003530671811596409, 'samples': 10748544, 'steps': 55981, 'loss/train': 0.3349896967411041} -11/07/2021 05:05:38 - INFO - __main__ - Step 55983: {'lr': 0.00035306234636175646, 'samples': 10748736, 'steps': 55982, 'loss/train': 0.15526923537254333} -11/07/2021 05:05:39 - INFO - __main__ - Step 55984: {'lr': 0.0003530575115174337, 'samples': 10748928, 'steps': 55983, 'loss/train': 1.426676630973816} -11/07/2021 05:05:39 - INFO - __main__ - Step 55985: {'lr': 0.00035305267662667485, 'samples': 10749120, 'steps': 55984, 'loss/train': 1.652669072151184} -11/07/2021 05:05:40 - INFO - __main__ - Step 55986: {'lr': 0.0003530478416894821, 'samples': 10749312, 'steps': 55985, 'loss/train': 1.0717411041259766} -11/07/2021 05:05:40 - INFO - __main__ - Step 55987: {'lr': 0.00035304300670585754, 'samples': 10749504, 'steps': 55986, 'loss/train': 1.5535953044891357} -11/07/2021 05:05:40 - INFO - __main__ - Step 55988: {'lr': 0.0003530381716758034, 'samples': 10749696, 'steps': 55987, 'loss/train': 1.174253225326538} -11/07/2021 05:05:41 - INFO - __main__ - Step 55989: {'lr': 0.00035303333659932187, 'samples': 10749888, 'steps': 55988, 'loss/train': 1.393289566040039} -11/07/2021 05:05:42 - INFO - __main__ - Step 55990: {'lr': 0.000353028501476415, 'samples': 10750080, 'steps': 55989, 'loss/train': 1.339763879776001} -11/07/2021 05:05:42 - INFO - __main__ - Step 55991: {'lr': 0.0003530236663070852, 'samples': 10750272, 'steps': 55990, 'loss/train': 1.4543182849884033} -11/07/2021 05:05:42 - INFO - __main__ - Step 55992: {'lr': 0.00035301883109133456, 'samples': 10750464, 'steps': 55991, 'loss/train': 1.587518334388733} -11/07/2021 05:05:43 - INFO - __main__ - Step 55993: {'lr': 0.0003530139958291651, 'samples': 10750656, 'steps': 55992, 'loss/train': 1.3030308485031128} -11/07/2021 05:05:44 - INFO - __main__ - Step 55994: {'lr': 0.0003530091605205792, 'samples': 10750848, 'steps': 55993, 'loss/train': 0.8324307799339294} -11/07/2021 05:05:44 - INFO - __main__ - Step 55995: {'lr': 0.0003530043251655789, 'samples': 10751040, 'steps': 55994, 'loss/train': 0.6881075501441956} -11/07/2021 05:05:44 - INFO - __main__ - Step 55996: {'lr': 0.00035299948976416645, 'samples': 10751232, 'steps': 55995, 'loss/train': 1.4833433628082275} -11/07/2021 05:05:45 - INFO - __main__ - Step 55997: {'lr': 0.00035299465431634403, 'samples': 10751424, 'steps': 55996, 'loss/train': 1.2558081150054932} -11/07/2021 05:05:45 - INFO - __main__ - Step 55998: {'lr': 0.00035298981882211385, 'samples': 10751616, 'steps': 55997, 'loss/train': 1.4812978506088257} -11/07/2021 05:05:46 - INFO - __main__ - Step 55999: {'lr': 0.00035298498328147803, 'samples': 10751808, 'steps': 55998, 'loss/train': 0.9314523935317993} -11/07/2021 05:05:47 - INFO - __main__ - Step 56000: {'lr': 0.00035298014769443874, 'samples': 10752000, 'steps': 55999, 'loss/train': 1.2715140581130981} -11/07/2021 05:05:47 - INFO - __main__ - Step 56001: {'lr': 0.0003529753120609982, 'samples': 10752192, 'steps': 56000, 'loss/train': 1.534266710281372} -11/07/2021 05:05:47 - INFO - __main__ - Step 56002: {'lr': 0.0003529704763811585, 'samples': 10752384, 'steps': 56001, 'loss/train': 1.180860996246338} -11/07/2021 05:05:48 - INFO - __main__ - Step 56003: {'lr': 0.000352965640654922, 'samples': 10752576, 'steps': 56002, 'loss/train': 1.4908504486083984} -11/07/2021 05:05:48 - INFO - __main__ - Step 56004: {'lr': 0.0003529608048822908, 'samples': 10752768, 'steps': 56003, 'loss/train': 1.4740095138549805} -11/07/2021 05:05:49 - INFO - __main__ - Step 56005: {'lr': 0.0003529559690632669, 'samples': 10752960, 'steps': 56004, 'loss/train': 2.202659845352173} -11/07/2021 05:05:50 - INFO - __main__ - Step 56006: {'lr': 0.00035295113319785276, 'samples': 10753152, 'steps': 56005, 'loss/train': 1.436906337738037} -11/07/2021 05:05:50 - INFO - __main__ - Step 56007: {'lr': 0.0003529462972860504, 'samples': 10753344, 'steps': 56006, 'loss/train': 1.2278133630752563} -11/07/2021 05:05:50 - INFO - __main__ - Step 56008: {'lr': 0.000352941461327862, 'samples': 10753536, 'steps': 56007, 'loss/train': 1.1644611358642578} -11/07/2021 05:05:51 - INFO - __main__ - Step 56009: {'lr': 0.0003529366253232897, 'samples': 10753728, 'steps': 56008, 'loss/train': 1.4787629842758179} -11/07/2021 05:05:52 - INFO - __main__ - Step 56010: {'lr': 0.00035293178927233587, 'samples': 10753920, 'steps': 56009, 'loss/train': 1.521426796913147} -11/07/2021 05:05:52 - INFO - __main__ - Step 56011: {'lr': 0.0003529269531750025, 'samples': 10754112, 'steps': 56010, 'loss/train': 1.2113900184631348} -11/07/2021 05:05:52 - INFO - __main__ - Step 56012: {'lr': 0.0003529221170312919, 'samples': 10754304, 'steps': 56011, 'loss/train': 1.088667392730713} -11/07/2021 05:05:53 - INFO - __main__ - Step 56013: {'lr': 0.0003529172808412061, 'samples': 10754496, 'steps': 56012, 'loss/train': 0.11348990350961685} -11/07/2021 05:05:53 - INFO - __main__ - Step 56014: {'lr': 0.0003529124446047474, 'samples': 10754688, 'steps': 56013, 'loss/train': 1.4001039266586304} -11/07/2021 05:05:54 - INFO - __main__ - Step 56015: {'lr': 0.0003529076083219179, 'samples': 10754880, 'steps': 56014, 'loss/train': 1.681990146636963} -11/07/2021 05:05:55 - INFO - __main__ - Step 56016: {'lr': 0.0003529027719927199, 'samples': 10755072, 'steps': 56015, 'loss/train': 1.2354339361190796} -11/07/2021 05:05:55 - INFO - __main__ - Step 56017: {'lr': 0.00035289793561715544, 'samples': 10755264, 'steps': 56016, 'loss/train': 1.2206889390945435} -11/07/2021 05:05:55 - INFO - __main__ - Step 56018: {'lr': 0.0003528930991952267, 'samples': 10755456, 'steps': 56017, 'loss/train': 0.7317473888397217} -11/07/2021 05:05:56 - INFO - __main__ - Step 56019: {'lr': 0.00035288826272693606, 'samples': 10755648, 'steps': 56018, 'loss/train': 1.7954611778259277} -11/07/2021 05:05:57 - INFO - __main__ - Step 56020: {'lr': 0.0003528834262122855, 'samples': 10755840, 'steps': 56019, 'loss/train': 1.266148328781128} -11/07/2021 05:05:57 - INFO - __main__ - Step 56021: {'lr': 0.00035287858965127723, 'samples': 10756032, 'steps': 56020, 'loss/train': 0.9832165241241455} -11/07/2021 05:05:57 - INFO - __main__ - Step 56022: {'lr': 0.00035287375304391343, 'samples': 10756224, 'steps': 56021, 'loss/train': 1.249596118927002} -11/07/2021 05:05:58 - INFO - __main__ - Step 56023: {'lr': 0.00035286891639019636, 'samples': 10756416, 'steps': 56022, 'loss/train': 1.4130103588104248} -11/07/2021 05:05:58 - INFO - __main__ - Step 56024: {'lr': 0.00035286407969012813, 'samples': 10756608, 'steps': 56023, 'loss/train': 1.6560721397399902} -11/07/2021 05:05:59 - INFO - __main__ - Step 56025: {'lr': 0.00035285924294371085, 'samples': 10756800, 'steps': 56024, 'loss/train': 1.474733591079712} -11/07/2021 05:05:59 - INFO - __main__ - Step 56026: {'lr': 0.00035285440615094696, 'samples': 10756992, 'steps': 56025, 'loss/train': 1.5125707387924194} -11/07/2021 05:06:00 - INFO - __main__ - Step 56027: {'lr': 0.0003528495693118383, 'samples': 10757184, 'steps': 56026, 'loss/train': 1.1230933666229248} -11/07/2021 05:06:00 - INFO - __main__ - Step 56028: {'lr': 0.0003528447324263873, 'samples': 10757376, 'steps': 56027, 'loss/train': 0.8970708250999451} -11/07/2021 05:06:00 - INFO - __main__ - Step 56029: {'lr': 0.000352839895494596, 'samples': 10757568, 'steps': 56028, 'loss/train': 1.7706984281539917} -11/07/2021 05:06:02 - INFO - __main__ - Step 56030: {'lr': 0.00035283505851646665, 'samples': 10757760, 'steps': 56029, 'loss/train': 1.450102686882019} -11/07/2021 05:06:02 - INFO - __main__ - Step 56031: {'lr': 0.0003528302214920014, 'samples': 10757952, 'steps': 56030, 'loss/train': 1.749725341796875} -11/07/2021 05:06:02 - INFO - __main__ - Step 56032: {'lr': 0.0003528253844212024, 'samples': 10758144, 'steps': 56031, 'loss/train': 0.9640790224075317} -11/07/2021 05:06:03 - INFO - __main__ - Step 56033: {'lr': 0.00035282054730407196, 'samples': 10758336, 'steps': 56032, 'loss/train': 1.684749960899353} -11/07/2021 05:06:03 - INFO - __main__ - Step 56034: {'lr': 0.00035281571014061214, 'samples': 10758528, 'steps': 56033, 'loss/train': 1.329773187637329} -11/07/2021 05:06:04 - INFO - __main__ - Step 56035: {'lr': 0.0003528108729308251, 'samples': 10758720, 'steps': 56034, 'loss/train': 1.843616247177124} -11/07/2021 05:06:04 - INFO - __main__ - Step 56036: {'lr': 0.0003528060356747131, 'samples': 10758912, 'steps': 56035, 'loss/train': 1.5963677167892456} -11/07/2021 05:06:05 - INFO - __main__ - Step 56037: {'lr': 0.0003528011983722783, 'samples': 10759104, 'steps': 56036, 'loss/train': 1.7013540267944336} -11/07/2021 05:06:05 - INFO - __main__ - Step 56038: {'lr': 0.0003527963610235229, 'samples': 10759296, 'steps': 56037, 'loss/train': 0.8886352777481079} -11/07/2021 05:06:05 - INFO - __main__ - Step 56039: {'lr': 0.000352791523628449, 'samples': 10759488, 'steps': 56038, 'loss/train': 1.77224600315094} -11/07/2021 05:06:06 - INFO - __main__ - Step 56040: {'lr': 0.0003527866861870588, 'samples': 10759680, 'steps': 56039, 'loss/train': 1.5709130764007568} -11/07/2021 05:06:07 - INFO - __main__ - Step 56041: {'lr': 0.00035278184869935454, 'samples': 10759872, 'steps': 56040, 'loss/train': 0.9209262728691101} -11/07/2021 05:06:07 - INFO - __main__ - Step 56042: {'lr': 0.0003527770111653383, 'samples': 10760064, 'steps': 56041, 'loss/train': 1.5137721300125122} -11/07/2021 05:06:07 - INFO - __main__ - Step 56043: {'lr': 0.0003527721735850124, 'samples': 10760256, 'steps': 56042, 'loss/train': 1.4074609279632568} -11/07/2021 05:06:08 - INFO - __main__ - Step 56044: {'lr': 0.0003527673359583789, 'samples': 10760448, 'steps': 56043, 'loss/train': 1.074844241142273} -11/07/2021 05:06:09 - INFO - __main__ - Step 56045: {'lr': 0.00035276249828544004, 'samples': 10760640, 'steps': 56044, 'loss/train': 1.5094329118728638} -11/07/2021 05:06:09 - INFO - __main__ - Step 56046: {'lr': 0.0003527576605661981, 'samples': 10760832, 'steps': 56045, 'loss/train': 1.6409003734588623} -11/07/2021 05:06:10 - INFO - __main__ - Step 56047: {'lr': 0.00035275282280065493, 'samples': 10761024, 'steps': 56046, 'loss/train': 1.4655380249023438} -11/07/2021 05:06:10 - INFO - __main__ - Step 56048: {'lr': 0.00035274798498881305, 'samples': 10761216, 'steps': 56047, 'loss/train': 0.4239441454410553} -11/07/2021 05:06:10 - INFO - __main__ - Step 56049: {'lr': 0.00035274314713067454, 'samples': 10761408, 'steps': 56048, 'loss/train': 1.879326581954956} -11/07/2021 05:06:11 - INFO - __main__ - Step 56050: {'lr': 0.00035273830922624147, 'samples': 10761600, 'steps': 56049, 'loss/train': 1.8466169834136963} -11/07/2021 05:06:12 - INFO - __main__ - Step 56051: {'lr': 0.00035273347127551616, 'samples': 10761792, 'steps': 56050, 'loss/train': 1.1744219064712524} -11/07/2021 05:06:12 - INFO - __main__ - Step 56052: {'lr': 0.00035272863327850067, 'samples': 10761984, 'steps': 56051, 'loss/train': 1.4762969017028809} -11/07/2021 05:06:12 - INFO - __main__ - Step 56053: {'lr': 0.00035272379523519734, 'samples': 10762176, 'steps': 56052, 'loss/train': 1.756905436515808} -11/07/2021 05:06:13 - INFO - __main__ - Step 56054: {'lr': 0.0003527189571456082, 'samples': 10762368, 'steps': 56053, 'loss/train': 0.1097700297832489} -11/07/2021 05:06:14 - INFO - __main__ - Step 56055: {'lr': 0.00035271411900973545, 'samples': 10762560, 'steps': 56054, 'loss/train': 1.5177136659622192} -11/07/2021 05:06:14 - INFO - __main__ - Step 56056: {'lr': 0.00035270928082758134, 'samples': 10762752, 'steps': 56055, 'loss/train': 0.9365915060043335} -11/07/2021 05:06:14 - INFO - __main__ - Step 56057: {'lr': 0.00035270444259914794, 'samples': 10762944, 'steps': 56056, 'loss/train': 1.0476480722427368} -11/07/2021 05:06:15 - INFO - __main__ - Step 56058: {'lr': 0.0003526996043244376, 'samples': 10763136, 'steps': 56057, 'loss/train': 1.4696296453475952} -11/07/2021 05:06:15 - INFO - __main__ - Step 56059: {'lr': 0.0003526947660034524, 'samples': 10763328, 'steps': 56058, 'loss/train': 1.3283686637878418} -11/07/2021 05:06:16 - INFO - __main__ - Step 56060: {'lr': 0.0003526899276361945, 'samples': 10763520, 'steps': 56059, 'loss/train': 1.6950527429580688} -11/07/2021 05:06:16 - INFO - __main__ - Step 56061: {'lr': 0.00035268508922266614, 'samples': 10763712, 'steps': 56060, 'loss/train': 1.4874831438064575} -11/07/2021 05:06:17 - INFO - __main__ - Step 56062: {'lr': 0.00035268025076286936, 'samples': 10763904, 'steps': 56061, 'loss/train': 1.465022087097168} -11/07/2021 05:06:17 - INFO - __main__ - Step 56063: {'lr': 0.00035267541225680654, 'samples': 10764096, 'steps': 56062, 'loss/train': 1.7769290208816528} -11/07/2021 05:06:17 - INFO - __main__ - Step 56064: {'lr': 0.00035267057370447967, 'samples': 10764288, 'steps': 56063, 'loss/train': 1.2261261940002441} -11/07/2021 05:06:19 - INFO - __main__ - Step 56065: {'lr': 0.00035266573510589114, 'samples': 10764480, 'steps': 56064, 'loss/train': 2.025089979171753} -11/07/2021 05:06:19 - INFO - __main__ - Step 56066: {'lr': 0.00035266089646104296, 'samples': 10764672, 'steps': 56065, 'loss/train': 1.5993165969848633} -11/07/2021 05:06:19 - INFO - __main__ - Step 56067: {'lr': 0.00035265605776993735, 'samples': 10764864, 'steps': 56066, 'loss/train': 0.9580615162849426} -11/07/2021 05:06:20 - INFO - __main__ - Step 56068: {'lr': 0.0003526512190325765, 'samples': 10765056, 'steps': 56067, 'loss/train': 0.8672080039978027} -11/07/2021 05:06:20 - INFO - __main__ - Step 56069: {'lr': 0.0003526463802489626, 'samples': 10765248, 'steps': 56068, 'loss/train': 1.4725104570388794} -11/07/2021 05:06:20 - INFO - __main__ - Step 56070: {'lr': 0.00035264154141909787, 'samples': 10765440, 'steps': 56069, 'loss/train': 0.6661514043807983} -11/07/2021 05:06:21 - INFO - __main__ - Step 56071: {'lr': 0.00035263670254298443, 'samples': 10765632, 'steps': 56070, 'loss/train': 0.22711573541164398} -11/07/2021 05:06:22 - INFO - __main__ - Step 56072: {'lr': 0.0003526318636206244, 'samples': 10765824, 'steps': 56071, 'loss/train': 1.1294758319854736} -11/07/2021 05:06:22 - INFO - __main__ - Step 56073: {'lr': 0.0003526270246520201, 'samples': 10766016, 'steps': 56072, 'loss/train': 1.2055062055587769} -11/07/2021 05:06:22 - INFO - __main__ - Step 56074: {'lr': 0.0003526221856371737, 'samples': 10766208, 'steps': 56073, 'loss/train': 1.413435935974121} -11/07/2021 05:06:23 - INFO - __main__ - Step 56075: {'lr': 0.0003526173465760872, 'samples': 10766400, 'steps': 56074, 'loss/train': 1.345708966255188} -11/07/2021 05:06:24 - INFO - __main__ - Step 56076: {'lr': 0.000352612507468763, 'samples': 10766592, 'steps': 56075, 'loss/train': 1.6085463762283325} -11/07/2021 05:06:24 - INFO - __main__ - Step 56077: {'lr': 0.00035260766831520315, 'samples': 10766784, 'steps': 56076, 'loss/train': 0.28465864062309265} -11/07/2021 05:06:24 - INFO - __main__ - Step 56078: {'lr': 0.0003526028291154099, 'samples': 10766976, 'steps': 56077, 'loss/train': 0.41470253467559814} -11/07/2021 05:06:25 - INFO - __main__ - Step 56079: {'lr': 0.00035259798986938537, 'samples': 10767168, 'steps': 56078, 'loss/train': 1.6819130182266235} -11/07/2021 05:06:25 - INFO - __main__ - Step 56080: {'lr': 0.00035259315057713177, 'samples': 10767360, 'steps': 56079, 'loss/train': 1.3918805122375488} -11/07/2021 05:06:26 - INFO - __main__ - Step 56081: {'lr': 0.0003525883112386513, 'samples': 10767552, 'steps': 56080, 'loss/train': 1.782894253730774} -11/07/2021 05:06:27 - INFO - __main__ - Step 56082: {'lr': 0.00035258347185394606, 'samples': 10767744, 'steps': 56081, 'loss/train': 1.506486177444458} -11/07/2021 05:06:27 - INFO - __main__ - Step 56083: {'lr': 0.00035257863242301834, 'samples': 10767936, 'steps': 56082, 'loss/train': 1.3411083221435547} -11/07/2021 05:06:27 - INFO - __main__ - Step 56084: {'lr': 0.0003525737929458703, 'samples': 10768128, 'steps': 56083, 'loss/train': 1.1377899646759033} -11/07/2021 05:06:28 - INFO - __main__ - Step 56085: {'lr': 0.0003525689534225041, 'samples': 10768320, 'steps': 56084, 'loss/train': 1.076027750968933} -11/07/2021 05:06:29 - INFO - __main__ - Step 56086: {'lr': 0.00035256411385292186, 'samples': 10768512, 'steps': 56085, 'loss/train': 1.695565938949585} -11/07/2021 05:06:29 - INFO - __main__ - Step 56087: {'lr': 0.0003525592742371258, 'samples': 10768704, 'steps': 56086, 'loss/train': 1.4092981815338135} -11/07/2021 05:06:29 - INFO - __main__ - Step 56088: {'lr': 0.0003525544345751182, 'samples': 10768896, 'steps': 56087, 'loss/train': 1.2346290349960327} -11/07/2021 05:06:30 - INFO - __main__ - Step 56089: {'lr': 0.00035254959486690103, 'samples': 10769088, 'steps': 56088, 'loss/train': 1.3800259828567505} -11/07/2021 05:06:30 - INFO - __main__ - Step 56090: {'lr': 0.0003525447551124766, 'samples': 10769280, 'steps': 56089, 'loss/train': 1.3414525985717773} -11/07/2021 05:06:31 - INFO - __main__ - Step 56091: {'lr': 0.0003525399153118472, 'samples': 10769472, 'steps': 56090, 'loss/train': 1.544366478919983} -11/07/2021 05:06:32 - INFO - __main__ - Step 56092: {'lr': 0.00035253507546501484, 'samples': 10769664, 'steps': 56091, 'loss/train': 1.2946702241897583} -11/07/2021 05:06:32 - INFO - __main__ - Step 56093: {'lr': 0.0003525302355719818, 'samples': 10769856, 'steps': 56092, 'loss/train': 1.568245768547058} -11/07/2021 05:06:32 - INFO - __main__ - Step 56094: {'lr': 0.0003525253956327501, 'samples': 10770048, 'steps': 56093, 'loss/train': 1.3921455144882202} -11/07/2021 05:06:33 - INFO - __main__ - Step 56095: {'lr': 0.0003525205556473221, 'samples': 10770240, 'steps': 56094, 'loss/train': 1.4071180820465088} -11/07/2021 05:06:33 - INFO - __main__ - Step 56096: {'lr': 0.0003525157156157, 'samples': 10770432, 'steps': 56095, 'loss/train': 1.4553344249725342} -11/07/2021 05:06:34 - INFO - __main__ - Step 56097: {'lr': 0.00035251087553788584, 'samples': 10770624, 'steps': 56096, 'loss/train': 1.5578862428665161} -11/07/2021 05:06:34 - INFO - __main__ - Step 56098: {'lr': 0.00035250603541388183, 'samples': 10770816, 'steps': 56097, 'loss/train': 0.07733270525932312} -11/07/2021 05:06:35 - INFO - __main__ - Step 56099: {'lr': 0.00035250119524369016, 'samples': 10771008, 'steps': 56098, 'loss/train': 1.6780366897583008} -11/07/2021 05:06:35 - INFO - __main__ - Step 56100: {'lr': 0.00035249635502731315, 'samples': 10771200, 'steps': 56099, 'loss/train': 1.8048059940338135} -11/07/2021 05:06:36 - INFO - __main__ - Step 56101: {'lr': 0.0003524915147647528, 'samples': 10771392, 'steps': 56100, 'loss/train': 1.3484421968460083} -11/07/2021 05:06:37 - INFO - __main__ - Step 56102: {'lr': 0.00035248667445601133, 'samples': 10771584, 'steps': 56101, 'loss/train': 1.3193823099136353} -11/07/2021 05:06:37 - INFO - __main__ - Step 56103: {'lr': 0.00035248183410109096, 'samples': 10771776, 'steps': 56102, 'loss/train': 0.33234304189682007} -11/07/2021 05:06:37 - INFO - __main__ - Step 56104: {'lr': 0.0003524769936999939, 'samples': 10771968, 'steps': 56103, 'loss/train': 1.1785374879837036} -11/07/2021 05:06:38 - INFO - __main__ - Step 56105: {'lr': 0.0003524721532527222, 'samples': 10772160, 'steps': 56104, 'loss/train': 0.7846789360046387} -11/07/2021 05:06:38 - INFO - __main__ - Step 56106: {'lr': 0.0003524673127592782, 'samples': 10772352, 'steps': 56105, 'loss/train': 1.1164886951446533} -11/07/2021 05:06:39 - INFO - __main__ - Step 56107: {'lr': 0.000352462472219664, 'samples': 10772544, 'steps': 56106, 'loss/train': 1.6663761138916016} -11/07/2021 05:06:39 - INFO - __main__ - Step 56108: {'lr': 0.0003524576316338818, 'samples': 10772736, 'steps': 56107, 'loss/train': 0.842548131942749} -11/07/2021 05:06:40 - INFO - __main__ - Step 56109: {'lr': 0.0003524527910019337, 'samples': 10772928, 'steps': 56108, 'loss/train': 1.3627212047576904} -11/07/2021 05:06:40 - INFO - __main__ - Step 56110: {'lr': 0.00035244795032382206, 'samples': 10773120, 'steps': 56109, 'loss/train': 1.4599909782409668} -11/07/2021 05:06:41 - INFO - __main__ - Step 56111: {'lr': 0.00035244310959954886, 'samples': 10773312, 'steps': 56110, 'loss/train': 1.293717861175537} -11/07/2021 05:06:42 - INFO - __main__ - Step 56112: {'lr': 0.0003524382688291164, 'samples': 10773504, 'steps': 56111, 'loss/train': 1.4754217863082886} -11/07/2021 05:06:42 - INFO - __main__ - Step 56113: {'lr': 0.0003524334280125269, 'samples': 10773696, 'steps': 56112, 'loss/train': 0.8247331976890564} -11/07/2021 05:06:42 - INFO - __main__ - Step 56114: {'lr': 0.0003524285871497824, 'samples': 10773888, 'steps': 56113, 'loss/train': 1.2718819379806519} -11/07/2021 05:06:43 - INFO - __main__ - Step 56115: {'lr': 0.0003524237462408852, 'samples': 10774080, 'steps': 56114, 'loss/train': 1.5664552450180054} -11/07/2021 05:06:43 - INFO - __main__ - Step 56116: {'lr': 0.0003524189052858374, 'samples': 10774272, 'steps': 56115, 'loss/train': 1.324585199356079} -11/07/2021 05:06:43 - INFO - __main__ - Step 56117: {'lr': 0.0003524140642846413, 'samples': 10774464, 'steps': 56116, 'loss/train': 0.9505982995033264} -11/07/2021 05:06:44 - INFO - __main__ - Step 56118: {'lr': 0.0003524092232372989, 'samples': 10774656, 'steps': 56117, 'loss/train': 1.560680627822876} -11/07/2021 05:06:45 - INFO - __main__ - Step 56119: {'lr': 0.00035240438214381253, 'samples': 10774848, 'steps': 56118, 'loss/train': 1.2786351442337036} -11/07/2021 05:06:45 - INFO - __main__ - Step 56120: {'lr': 0.00035239954100418436, 'samples': 10775040, 'steps': 56119, 'loss/train': 1.2073078155517578} -11/07/2021 05:06:45 - INFO - __main__ - Step 56121: {'lr': 0.00035239469981841656, 'samples': 10775232, 'steps': 56120, 'loss/train': 1.5953010320663452} -11/07/2021 05:06:46 - INFO - __main__ - Step 56122: {'lr': 0.0003523898585865112, 'samples': 10775424, 'steps': 56121, 'loss/train': 1.4239513874053955} -11/07/2021 05:06:47 - INFO - __main__ - Step 56123: {'lr': 0.0003523850173084706, 'samples': 10775616, 'steps': 56122, 'loss/train': 1.1879708766937256} -11/07/2021 05:06:47 - INFO - __main__ - Step 56124: {'lr': 0.00035238017598429686, 'samples': 10775808, 'steps': 56123, 'loss/train': 1.3142179250717163} -11/07/2021 05:06:47 - INFO - __main__ - Step 56125: {'lr': 0.0003523753346139922, 'samples': 10776000, 'steps': 56124, 'loss/train': 1.1931241750717163} -11/07/2021 05:06:48 - INFO - __main__ - Step 56126: {'lr': 0.0003523704931975588, 'samples': 10776192, 'steps': 56125, 'loss/train': 1.5110180377960205} -11/07/2021 05:06:48 - INFO - __main__ - Step 56127: {'lr': 0.0003523656517349989, 'samples': 10776384, 'steps': 56126, 'loss/train': 1.1871814727783203} -11/07/2021 05:06:49 - INFO - __main__ - Step 56128: {'lr': 0.0003523608102263145, 'samples': 10776576, 'steps': 56127, 'loss/train': 1.6022156476974487} -11/07/2021 05:06:50 - INFO - __main__ - Step 56129: {'lr': 0.00035235596867150797, 'samples': 10776768, 'steps': 56128, 'loss/train': 1.578641653060913} -11/07/2021 05:06:50 - INFO - __main__ - Step 56130: {'lr': 0.0003523511270705814, 'samples': 10776960, 'steps': 56129, 'loss/train': 1.1083091497421265} -11/07/2021 05:06:50 - INFO - __main__ - Step 56131: {'lr': 0.000352346285423537, 'samples': 10777152, 'steps': 56130, 'loss/train': 1.749462604522705} -11/07/2021 05:06:51 - INFO - __main__ - Step 56132: {'lr': 0.0003523414437303769, 'samples': 10777344, 'steps': 56131, 'loss/train': 1.507034182548523} -11/07/2021 05:06:52 - INFO - __main__ - Step 56133: {'lr': 0.0003523366019911035, 'samples': 10777536, 'steps': 56132, 'loss/train': 1.1592656373977661} -11/07/2021 05:06:52 - INFO - __main__ - Step 56134: {'lr': 0.00035233176020571863, 'samples': 10777728, 'steps': 56133, 'loss/train': 1.5731182098388672} -11/07/2021 05:06:52 - INFO - __main__ - Step 56135: {'lr': 0.0003523269183742246, 'samples': 10777920, 'steps': 56134, 'loss/train': 0.8437652587890625} -11/07/2021 05:06:53 - INFO - __main__ - Step 56136: {'lr': 0.0003523220764966238, 'samples': 10778112, 'steps': 56135, 'loss/train': 1.5683997869491577} -11/07/2021 05:06:53 - INFO - __main__ - Step 56137: {'lr': 0.00035231723457291816, 'samples': 10778304, 'steps': 56136, 'loss/train': 1.260100245475769} -11/07/2021 05:06:54 - INFO - __main__ - Step 56138: {'lr': 0.00035231239260311, 'samples': 10778496, 'steps': 56137, 'loss/train': 1.6461832523345947} -11/07/2021 05:06:55 - INFO - __main__ - Step 56139: {'lr': 0.0003523075505872014, 'samples': 10778688, 'steps': 56138, 'loss/train': 1.358130931854248} -11/07/2021 05:06:55 - INFO - __main__ - Step 56140: {'lr': 0.00035230270852519465, 'samples': 10778880, 'steps': 56139, 'loss/train': 1.5266367197036743} -11/07/2021 05:06:56 - INFO - __main__ - Step 56141: {'lr': 0.00035229786641709183, 'samples': 10779072, 'steps': 56140, 'loss/train': 1.1808722019195557} -11/07/2021 05:06:56 - INFO - __main__ - Step 56142: {'lr': 0.00035229302426289524, 'samples': 10779264, 'steps': 56141, 'loss/train': 0.1280687153339386} -11/07/2021 05:06:57 - INFO - __main__ - Step 56143: {'lr': 0.00035228818206260693, 'samples': 10779456, 'steps': 56142, 'loss/train': 1.2151098251342773} -11/07/2021 05:06:57 - INFO - __main__ - Step 56144: {'lr': 0.00035228333981622914, 'samples': 10779648, 'steps': 56143, 'loss/train': 1.38080894947052} -11/07/2021 05:06:58 - INFO - __main__ - Step 56145: {'lr': 0.0003522784975237641, 'samples': 10779840, 'steps': 56144, 'loss/train': 1.393256425857544} -11/07/2021 05:06:58 - INFO - __main__ - Step 56146: {'lr': 0.00035227365518521387, 'samples': 10780032, 'steps': 56145, 'loss/train': 1.5399317741394043} -11/07/2021 05:06:58 - INFO - __main__ - Step 56147: {'lr': 0.00035226881280058084, 'samples': 10780224, 'steps': 56146, 'loss/train': 1.4262508153915405} -11/07/2021 05:07:00 - INFO - __main__ - Step 56148: {'lr': 0.00035226397036986694, 'samples': 10780416, 'steps': 56147, 'loss/train': 1.5341914892196655} -11/07/2021 05:07:00 - INFO - __main__ - Step 56149: {'lr': 0.0003522591278930745, 'samples': 10780608, 'steps': 56148, 'loss/train': 1.5461366176605225} -11/07/2021 05:07:01 - INFO - __main__ - Step 56150: {'lr': 0.0003522542853702057, 'samples': 10780800, 'steps': 56149, 'loss/train': 1.8080079555511475} -11/07/2021 05:07:01 - INFO - __main__ - Step 56151: {'lr': 0.0003522494428012627, 'samples': 10780992, 'steps': 56150, 'loss/train': 1.4833968877792358} -11/07/2021 05:07:01 - INFO - __main__ - Step 56152: {'lr': 0.0003522446001862476, 'samples': 10781184, 'steps': 56151, 'loss/train': 1.6682887077331543} -11/07/2021 05:07:02 - INFO - __main__ - Step 56153: {'lr': 0.00035223975752516273, 'samples': 10781376, 'steps': 56152, 'loss/train': 1.2973426580429077} -11/07/2021 05:07:02 - INFO - __main__ - Step 56154: {'lr': 0.0003522349148180103, 'samples': 10781568, 'steps': 56153, 'loss/train': 0.6574332118034363} -11/07/2021 05:07:03 - INFO - __main__ - Step 56155: {'lr': 0.00035223007206479226, 'samples': 10781760, 'steps': 56154, 'loss/train': 1.3152788877487183} -11/07/2021 05:07:03 - INFO - __main__ - Step 56156: {'lr': 0.00035222522926551094, 'samples': 10781952, 'steps': 56155, 'loss/train': 1.5688040256500244} -11/07/2021 05:07:04 - INFO - __main__ - Step 56157: {'lr': 0.0003522203864201685, 'samples': 10782144, 'steps': 56156, 'loss/train': 1.280598521232605} -11/07/2021 05:07:04 - INFO - __main__ - Step 56158: {'lr': 0.00035221554352876715, 'samples': 10782336, 'steps': 56157, 'loss/train': 1.8648959398269653} -11/07/2021 05:07:04 - INFO - __main__ - Step 56159: {'lr': 0.00035221070059130913, 'samples': 10782528, 'steps': 56158, 'loss/train': 1.2692580223083496} -11/07/2021 05:07:05 - INFO - __main__ - Step 56160: {'lr': 0.0003522058576077965, 'samples': 10782720, 'steps': 56159, 'loss/train': 1.649580955505371} -11/07/2021 05:07:06 - INFO - __main__ - Step 56161: {'lr': 0.00035220101457823143, 'samples': 10782912, 'steps': 56160, 'loss/train': 1.2421942949295044} -11/07/2021 05:07:06 - INFO - __main__ - Step 56162: {'lr': 0.0003521961715026162, 'samples': 10783104, 'steps': 56161, 'loss/train': 1.789180040359497} -11/07/2021 05:07:07 - INFO - __main__ - Step 56163: {'lr': 0.0003521913283809529, 'samples': 10783296, 'steps': 56162, 'loss/train': 1.1353594064712524} -11/07/2021 05:07:07 - INFO - __main__ - Step 56164: {'lr': 0.00035218648521324387, 'samples': 10783488, 'steps': 56163, 'loss/train': 1.6117337942123413} -11/07/2021 05:07:08 - INFO - __main__ - Step 56165: {'lr': 0.0003521816419994911, 'samples': 10783680, 'steps': 56164, 'loss/train': 0.9769127368927002} -11/07/2021 05:07:08 - INFO - __main__ - Step 56166: {'lr': 0.0003521767987396969, 'samples': 10783872, 'steps': 56165, 'loss/train': 1.6191201210021973} -11/07/2021 05:07:09 - INFO - __main__ - Step 56167: {'lr': 0.00035217195543386345, 'samples': 10784064, 'steps': 56166, 'loss/train': 1.4446793794631958} -11/07/2021 05:07:09 - INFO - __main__ - Step 56168: {'lr': 0.0003521671120819928, 'samples': 10784256, 'steps': 56167, 'loss/train': 1.4271960258483887} -11/07/2021 05:07:09 - INFO - __main__ - Step 56169: {'lr': 0.0003521622686840873, 'samples': 10784448, 'steps': 56168, 'loss/train': 0.05827701464295387} -11/07/2021 05:07:10 - INFO - __main__ - Step 56170: {'lr': 0.000352157425240149, 'samples': 10784640, 'steps': 56169, 'loss/train': 1.6075183153152466} -11/07/2021 05:07:11 - INFO - __main__ - Step 56171: {'lr': 0.00035215258175018015, 'samples': 10784832, 'steps': 56170, 'loss/train': 1.5340136289596558} -11/07/2021 05:07:11 - INFO - __main__ - Step 56172: {'lr': 0.00035214773821418295, 'samples': 10785024, 'steps': 56171, 'loss/train': 1.220860242843628} -11/07/2021 05:07:11 - INFO - __main__ - Step 56173: {'lr': 0.00035214289463215954, 'samples': 10785216, 'steps': 56172, 'loss/train': 1.3255250453948975} -11/07/2021 05:07:12 - INFO - __main__ - Step 56174: {'lr': 0.00035213805100411217, 'samples': 10785408, 'steps': 56173, 'loss/train': 1.3527663946151733} -11/07/2021 05:07:13 - INFO - __main__ - Step 56175: {'lr': 0.00035213320733004297, 'samples': 10785600, 'steps': 56174, 'loss/train': 1.3792458772659302} -11/07/2021 05:07:13 - INFO - __main__ - Step 56176: {'lr': 0.00035212836360995405, 'samples': 10785792, 'steps': 56175, 'loss/train': 1.4815794229507446} -11/07/2021 05:07:14 - INFO - __main__ - Step 56177: {'lr': 0.0003521235198438477, 'samples': 10785984, 'steps': 56176, 'loss/train': 1.5355722904205322} -11/07/2021 05:07:14 - INFO - __main__ - Step 56178: {'lr': 0.000352118676031726, 'samples': 10786176, 'steps': 56177, 'loss/train': 1.8288989067077637} -11/07/2021 05:07:14 - INFO - __main__ - Step 56179: {'lr': 0.0003521138321735913, 'samples': 10786368, 'steps': 56178, 'loss/train': 1.0465120077133179} -11/07/2021 05:07:15 - INFO - __main__ - Step 56180: {'lr': 0.0003521089882694456, 'samples': 10786560, 'steps': 56179, 'loss/train': 1.408577799797058} -11/07/2021 05:07:16 - INFO - __main__ - Step 56181: {'lr': 0.0003521041443192913, 'samples': 10786752, 'steps': 56180, 'loss/train': 1.7961503267288208} -11/07/2021 05:07:16 - INFO - __main__ - Step 56182: {'lr': 0.00035209930032313033, 'samples': 10786944, 'steps': 56181, 'loss/train': 1.2707103490829468} -11/07/2021 05:07:16 - INFO - __main__ - Step 56183: {'lr': 0.000352094456280965, 'samples': 10787136, 'steps': 56182, 'loss/train': 1.4756022691726685} -11/07/2021 05:07:17 - INFO - __main__ - Step 56184: {'lr': 0.0003520896121927975, 'samples': 10787328, 'steps': 56183, 'loss/train': 1.4517836570739746} -11/07/2021 05:07:17 - INFO - __main__ - Step 56185: {'lr': 0.00035208476805863, 'samples': 10787520, 'steps': 56184, 'loss/train': 1.2510775327682495} -11/07/2021 05:07:18 - INFO - __main__ - Step 56186: {'lr': 0.00035207992387846466, 'samples': 10787712, 'steps': 56185, 'loss/train': 1.7733508348464966} -11/07/2021 05:07:19 - INFO - __main__ - Step 56187: {'lr': 0.0003520750796523037, 'samples': 10787904, 'steps': 56186, 'loss/train': 1.5007990598678589} -11/07/2021 05:07:19 - INFO - __main__ - Step 56188: {'lr': 0.0003520702353801493, 'samples': 10788096, 'steps': 56187, 'loss/train': 1.7201709747314453} -11/07/2021 05:07:19 - INFO - __main__ - Step 56189: {'lr': 0.0003520653910620036, 'samples': 10788288, 'steps': 56188, 'loss/train': 1.6831419467926025} -11/07/2021 05:07:20 - INFO - __main__ - Step 56190: {'lr': 0.0003520605466978688, 'samples': 10788480, 'steps': 56189, 'loss/train': 1.3703277111053467} -11/07/2021 05:07:20 - INFO - __main__ - Step 56191: {'lr': 0.00035205570228774715, 'samples': 10788672, 'steps': 56190, 'loss/train': 1.1786553859710693} -11/07/2021 05:07:21 - INFO - __main__ - Step 56192: {'lr': 0.0003520508578316407, 'samples': 10788864, 'steps': 56191, 'loss/train': 0.9848109483718872} -11/07/2021 05:07:21 - INFO - __main__ - Step 56193: {'lr': 0.0003520460133295518, 'samples': 10789056, 'steps': 56192, 'loss/train': 0.5717485547065735} -11/07/2021 05:07:22 - INFO - __main__ - Step 56194: {'lr': 0.0003520411687814825, 'samples': 10789248, 'steps': 56193, 'loss/train': 0.6043590903282166} -11/07/2021 05:07:22 - INFO - __main__ - Step 56195: {'lr': 0.000352036324187435, 'samples': 10789440, 'steps': 56194, 'loss/train': 1.6420927047729492} -11/07/2021 05:07:22 - INFO - __main__ - Step 56196: {'lr': 0.0003520314795474115, 'samples': 10789632, 'steps': 56195, 'loss/train': 1.801336646080017} -11/07/2021 05:07:23 - INFO - __main__ - Step 56197: {'lr': 0.00035202663486141417, 'samples': 10789824, 'steps': 56196, 'loss/train': 1.2203136682510376} -11/07/2021 05:07:24 - INFO - __main__ - Step 56198: {'lr': 0.00035202179012944527, 'samples': 10790016, 'steps': 56197, 'loss/train': 1.20452082157135} -11/07/2021 05:07:24 - INFO - __main__ - Step 56199: {'lr': 0.0003520169453515069, 'samples': 10790208, 'steps': 56198, 'loss/train': 1.4479241371154785} -11/07/2021 05:07:25 - INFO - __main__ - Step 56200: {'lr': 0.00035201210052760123, 'samples': 10790400, 'steps': 56199, 'loss/train': 1.5330617427825928} -11/07/2021 05:07:25 - INFO - __main__ - Step 56201: {'lr': 0.0003520072556577306, 'samples': 10790592, 'steps': 56200, 'loss/train': 1.4841582775115967} -11/07/2021 05:07:26 - INFO - __main__ - Step 56202: {'lr': 0.000352002410741897, 'samples': 10790784, 'steps': 56201, 'loss/train': 1.36457359790802} -11/07/2021 05:07:26 - INFO - __main__ - Step 56203: {'lr': 0.00035199756578010267, 'samples': 10790976, 'steps': 56202, 'loss/train': 1.483276128768921} -11/07/2021 05:07:27 - INFO - __main__ - Step 56204: {'lr': 0.0003519927207723498, 'samples': 10791168, 'steps': 56203, 'loss/train': 4.350569725036621} -11/07/2021 05:07:27 - INFO - __main__ - Step 56205: {'lr': 0.00035198787571864067, 'samples': 10791360, 'steps': 56204, 'loss/train': 1.2586426734924316} -11/07/2021 05:07:27 - INFO - __main__ - Step 56206: {'lr': 0.0003519830306189773, 'samples': 10791552, 'steps': 56205, 'loss/train': 1.167547345161438} -11/07/2021 05:07:28 - INFO - __main__ - Step 56207: {'lr': 0.000351978185473362, 'samples': 10791744, 'steps': 56206, 'loss/train': 2.1130430698394775} -11/07/2021 05:07:29 - INFO - __main__ - Step 56208: {'lr': 0.0003519733402817968, 'samples': 10791936, 'steps': 56207, 'loss/train': 1.4643226861953735} -11/07/2021 05:07:29 - INFO - __main__ - Step 56209: {'lr': 0.0003519684950442841, 'samples': 10792128, 'steps': 56208, 'loss/train': 1.52162504196167} -11/07/2021 05:07:29 - INFO - __main__ - Step 56210: {'lr': 0.00035196364976082593, 'samples': 10792320, 'steps': 56209, 'loss/train': 1.4099293947219849} -11/07/2021 05:07:30 - INFO - __main__ - Step 56211: {'lr': 0.0003519588044314245, 'samples': 10792512, 'steps': 56210, 'loss/train': 1.165474534034729} -11/07/2021 05:07:30 - INFO - __main__ - Step 56212: {'lr': 0.000351953959056082, 'samples': 10792704, 'steps': 56211, 'loss/train': 1.2444922924041748} -11/07/2021 05:07:31 - INFO - __main__ - Step 56213: {'lr': 0.0003519491136348006, 'samples': 10792896, 'steps': 56212, 'loss/train': 1.6387226581573486} -11/07/2021 05:07:32 - INFO - __main__ - Step 56214: {'lr': 0.0003519442681675826, 'samples': 10793088, 'steps': 56213, 'loss/train': 1.2214232683181763} -11/07/2021 05:07:32 - INFO - __main__ - Step 56215: {'lr': 0.00035193942265443, 'samples': 10793280, 'steps': 56214, 'loss/train': 0.08244670182466507} -11/07/2021 05:07:32 - INFO - __main__ - Step 56216: {'lr': 0.0003519345770953452, 'samples': 10793472, 'steps': 56215, 'loss/train': 1.309668779373169} -11/07/2021 05:07:33 - INFO - __main__ - Step 56217: {'lr': 0.00035192973149033007, 'samples': 10793664, 'steps': 56216, 'loss/train': 1.4655251502990723} -11/07/2021 05:07:34 - INFO - __main__ - Step 56218: {'lr': 0.0003519248858393871, 'samples': 10793856, 'steps': 56217, 'loss/train': 1.0780271291732788} -11/07/2021 05:07:34 - INFO - __main__ - Step 56219: {'lr': 0.0003519200401425183, 'samples': 10794048, 'steps': 56218, 'loss/train': 1.5708234310150146} -11/07/2021 05:07:34 - INFO - __main__ - Step 56220: {'lr': 0.0003519151943997259, 'samples': 10794240, 'steps': 56219, 'loss/train': 1.6604366302490234} -11/07/2021 05:07:35 - INFO - __main__ - Step 56221: {'lr': 0.0003519103486110121, 'samples': 10794432, 'steps': 56220, 'loss/train': 1.2300477027893066} -11/07/2021 05:07:35 - INFO - __main__ - Step 56222: {'lr': 0.0003519055027763791, 'samples': 10794624, 'steps': 56221, 'loss/train': 1.3391817808151245} -11/07/2021 05:07:36 - INFO - __main__ - Step 56223: {'lr': 0.00035190065689582895, 'samples': 10794816, 'steps': 56222, 'loss/train': 1.343144178390503} -11/07/2021 05:07:36 - INFO - __main__ - Step 56224: {'lr': 0.00035189581096936395, 'samples': 10795008, 'steps': 56223, 'loss/train': 1.6980105638504028} -11/07/2021 05:07:37 - INFO - __main__ - Step 56225: {'lr': 0.0003518909649969864, 'samples': 10795200, 'steps': 56224, 'loss/train': 1.4061853885650635} -11/07/2021 05:07:37 - INFO - __main__ - Step 56226: {'lr': 0.00035188611897869824, 'samples': 10795392, 'steps': 56225, 'loss/train': 1.4199899435043335} -11/07/2021 05:07:37 - INFO - __main__ - Step 56227: {'lr': 0.00035188127291450183, 'samples': 10795584, 'steps': 56226, 'loss/train': 1.4231295585632324} -11/07/2021 05:07:39 - INFO - __main__ - Step 56228: {'lr': 0.00035187642680439927, 'samples': 10795776, 'steps': 56227, 'loss/train': 1.2420918941497803} -11/07/2021 05:07:39 - INFO - __main__ - Step 56229: {'lr': 0.0003518715806483928, 'samples': 10795968, 'steps': 56228, 'loss/train': 1.7138904333114624} -11/07/2021 05:07:39 - INFO - __main__ - Step 56230: {'lr': 0.0003518667344464845, 'samples': 10796160, 'steps': 56229, 'loss/train': 1.467958927154541} -11/07/2021 05:07:40 - INFO - __main__ - Step 56231: {'lr': 0.00035186188819867663, 'samples': 10796352, 'steps': 56230, 'loss/train': 1.091019630432129} -11/07/2021 05:07:40 - INFO - __main__ - Step 56232: {'lr': 0.00035185704190497137, 'samples': 10796544, 'steps': 56231, 'loss/train': 0.6361316442489624} -11/07/2021 05:07:41 - INFO - __main__ - Step 56233: {'lr': 0.0003518521955653709, 'samples': 10796736, 'steps': 56232, 'loss/train': 1.327677607536316} -11/07/2021 05:07:41 - INFO - __main__ - Step 56234: {'lr': 0.0003518473491798774, 'samples': 10796928, 'steps': 56233, 'loss/train': 1.552869439125061} -11/07/2021 05:07:42 - INFO - __main__ - Step 56235: {'lr': 0.00035184250274849306, 'samples': 10797120, 'steps': 56234, 'loss/train': 1.4740413427352905} -11/07/2021 05:07:42 - INFO - __main__ - Step 56236: {'lr': 0.0003518376562712201, 'samples': 10797312, 'steps': 56235, 'loss/train': 1.5292969942092896} -11/07/2021 05:07:42 - INFO - __main__ - Step 56237: {'lr': 0.00035183280974806065, 'samples': 10797504, 'steps': 56236, 'loss/train': 1.5130194425582886} -11/07/2021 05:07:43 - INFO - __main__ - Step 56238: {'lr': 0.0003518279631790169, 'samples': 10797696, 'steps': 56237, 'loss/train': 1.3904306888580322} -11/07/2021 05:07:44 - INFO - __main__ - Step 56239: {'lr': 0.000351823116564091, 'samples': 10797888, 'steps': 56238, 'loss/train': 0.7780100703239441} -11/07/2021 05:07:44 - INFO - __main__ - Step 56240: {'lr': 0.0003518182699032852, 'samples': 10798080, 'steps': 56239, 'loss/train': 1.3004306554794312} -11/07/2021 05:07:44 - INFO - __main__ - Step 56241: {'lr': 0.0003518134231966017, 'samples': 10798272, 'steps': 56240, 'loss/train': 1.8354072570800781} -11/07/2021 05:07:45 - INFO - __main__ - Step 56242: {'lr': 0.0003518085764440426, 'samples': 10798464, 'steps': 56241, 'loss/train': 1.4560760259628296} -11/07/2021 05:07:46 - INFO - __main__ - Step 56243: {'lr': 0.00035180372964561013, 'samples': 10798656, 'steps': 56242, 'loss/train': 1.2428865432739258} -11/07/2021 05:07:46 - INFO - __main__ - Step 56244: {'lr': 0.00035179888280130646, 'samples': 10798848, 'steps': 56243, 'loss/train': 2.055394411087036} -11/07/2021 05:07:47 - INFO - __main__ - Step 56245: {'lr': 0.00035179403591113377, 'samples': 10799040, 'steps': 56244, 'loss/train': 1.4973167181015015} -11/07/2021 05:07:47 - INFO - __main__ - Step 56246: {'lr': 0.0003517891889750943, 'samples': 10799232, 'steps': 56245, 'loss/train': 1.0132272243499756} -11/07/2021 05:07:47 - INFO - __main__ - Step 56247: {'lr': 0.0003517843419931902, 'samples': 10799424, 'steps': 56246, 'loss/train': 1.3247162103652954} -11/07/2021 05:07:48 - INFO - __main__ - Step 56248: {'lr': 0.0003517794949654236, 'samples': 10799616, 'steps': 56247, 'loss/train': 1.4394179582595825} -11/07/2021 05:07:49 - INFO - __main__ - Step 56249: {'lr': 0.00035177464789179675, 'samples': 10799808, 'steps': 56248, 'loss/train': 1.0051782131195068} -11/07/2021 05:07:49 - INFO - __main__ - Step 56250: {'lr': 0.0003517698007723118, 'samples': 10800000, 'steps': 56249, 'loss/train': 0.5667877197265625} -11/07/2021 05:07:49 - INFO - __main__ - Step 56251: {'lr': 0.00035176495360697096, 'samples': 10800192, 'steps': 56250, 'loss/train': 1.3332971334457397} -11/07/2021 05:07:50 - INFO - __main__ - Step 56252: {'lr': 0.0003517601063957764, 'samples': 10800384, 'steps': 56251, 'loss/train': 1.1086777448654175} -11/07/2021 05:07:51 - INFO - __main__ - Step 56253: {'lr': 0.0003517552591387303, 'samples': 10800576, 'steps': 56252, 'loss/train': 1.2256686687469482} -11/07/2021 05:07:51 - INFO - __main__ - Step 56254: {'lr': 0.0003517504118358349, 'samples': 10800768, 'steps': 56253, 'loss/train': 0.9534670114517212} -11/07/2021 05:07:52 - INFO - __main__ - Step 56255: {'lr': 0.0003517455644870923, 'samples': 10800960, 'steps': 56254, 'loss/train': 1.9628669023513794} -11/07/2021 05:07:52 - INFO - __main__ - Step 56256: {'lr': 0.00035174071709250475, 'samples': 10801152, 'steps': 56255, 'loss/train': 1.3649989366531372} -11/07/2021 05:07:52 - INFO - __main__ - Step 56257: {'lr': 0.00035173586965207436, 'samples': 10801344, 'steps': 56256, 'loss/train': 0.8693755269050598} -11/07/2021 05:07:53 - INFO - __main__ - Step 56258: {'lr': 0.0003517310221658033, 'samples': 10801536, 'steps': 56257, 'loss/train': 1.0500729084014893} -11/07/2021 05:07:54 - INFO - __main__ - Step 56259: {'lr': 0.00035172617463369397, 'samples': 10801728, 'steps': 56258, 'loss/train': 1.4382660388946533} -11/07/2021 05:07:54 - INFO - __main__ - Step 56260: {'lr': 0.0003517213270557482, 'samples': 10801920, 'steps': 56259, 'loss/train': 1.8214768171310425} -11/07/2021 05:07:54 - INFO - __main__ - Step 56261: {'lr': 0.00035171647943196854, 'samples': 10802112, 'steps': 56260, 'loss/train': 1.5306284427642822} -11/07/2021 05:07:55 - INFO - __main__ - Step 56262: {'lr': 0.00035171163176235694, 'samples': 10802304, 'steps': 56261, 'loss/train': 1.4659202098846436} -11/07/2021 05:07:55 - INFO - __main__ - Step 56263: {'lr': 0.00035170678404691563, 'samples': 10802496, 'steps': 56262, 'loss/train': 1.4727448225021362} -11/07/2021 05:07:55 - INFO - __main__ - Step 56264: {'lr': 0.00035170193628564683, 'samples': 10802688, 'steps': 56263, 'loss/train': 1.5459659099578857} -11/07/2021 05:07:57 - INFO - __main__ - Step 56265: {'lr': 0.0003516970884785527, 'samples': 10802880, 'steps': 56264, 'loss/train': 1.6038678884506226} -11/07/2021 05:07:57 - INFO - __main__ - Step 56266: {'lr': 0.00035169224062563543, 'samples': 10803072, 'steps': 56265, 'loss/train': 1.2403324842453003} -11/07/2021 05:07:57 - INFO - __main__ - Step 56267: {'lr': 0.0003516873927268972, 'samples': 10803264, 'steps': 56266, 'loss/train': 1.416727900505066} -11/07/2021 05:07:58 - INFO - __main__ - Step 56268: {'lr': 0.0003516825447823403, 'samples': 10803456, 'steps': 56267, 'loss/train': 1.4993882179260254} -11/07/2021 05:07:58 - INFO - __main__ - Step 56269: {'lr': 0.0003516776967919667, 'samples': 10803648, 'steps': 56268, 'loss/train': 0.9666994214057922} -11/07/2021 05:07:59 - INFO - __main__ - Step 56270: {'lr': 0.0003516728487557787, 'samples': 10803840, 'steps': 56269, 'loss/train': 2.310224771499634} -11/07/2021 05:08:00 - INFO - __main__ - Step 56271: {'lr': 0.00035166800067377855, 'samples': 10804032, 'steps': 56270, 'loss/train': 1.0139963626861572} -11/07/2021 05:08:00 - INFO - __main__ - Step 56272: {'lr': 0.00035166315254596826, 'samples': 10804224, 'steps': 56271, 'loss/train': 1.0522022247314453} -11/07/2021 05:08:00 - INFO - __main__ - Step 56273: {'lr': 0.0003516583043723502, 'samples': 10804416, 'steps': 56272, 'loss/train': 1.325087308883667} -11/07/2021 05:08:01 - INFO - __main__ - Step 56274: {'lr': 0.0003516534561529264, 'samples': 10804608, 'steps': 56273, 'loss/train': 1.4703959226608276} -11/07/2021 05:08:01 - INFO - __main__ - Step 56275: {'lr': 0.00035164860788769925, 'samples': 10804800, 'steps': 56274, 'loss/train': 2.523444175720215} -11/07/2021 05:08:02 - INFO - __main__ - Step 56276: {'lr': 0.0003516437595766708, 'samples': 10804992, 'steps': 56275, 'loss/train': 1.155405044555664} -11/07/2021 05:08:03 - INFO - __main__ - Step 56277: {'lr': 0.00035163891121984316, 'samples': 10805184, 'steps': 56276, 'loss/train': 1.262868046760559} -11/07/2021 05:08:03 - INFO - __main__ - Step 56278: {'lr': 0.0003516340628172186, 'samples': 10805376, 'steps': 56277, 'loss/train': 0.8349221348762512} -11/07/2021 05:08:03 - INFO - __main__ - Step 56279: {'lr': 0.0003516292143687993, 'samples': 10805568, 'steps': 56278, 'loss/train': 1.7897318601608276} -11/07/2021 05:08:04 - INFO - __main__ - Step 56280: {'lr': 0.00035162436587458744, 'samples': 10805760, 'steps': 56279, 'loss/train': 0.9219061732292175} -11/07/2021 05:08:04 - INFO - __main__ - Step 56281: {'lr': 0.0003516195173345853, 'samples': 10805952, 'steps': 56280, 'loss/train': 1.3079655170440674} -11/07/2021 05:08:05 - INFO - __main__ - Step 56282: {'lr': 0.0003516146687487949, 'samples': 10806144, 'steps': 56281, 'loss/train': 0.2008887082338333} -11/07/2021 05:08:05 - INFO - __main__ - Step 56283: {'lr': 0.0003516098201172185, 'samples': 10806336, 'steps': 56282, 'loss/train': 1.6396210193634033} -11/07/2021 05:08:06 - INFO - __main__ - Step 56284: {'lr': 0.00035160497143985823, 'samples': 10806528, 'steps': 56283, 'loss/train': 1.391641616821289} -11/07/2021 05:08:06 - INFO - __main__ - Step 56285: {'lr': 0.0003516001227167164, 'samples': 10806720, 'steps': 56284, 'loss/train': 1.7935125827789307} -11/07/2021 05:08:07 - INFO - __main__ - Step 56286: {'lr': 0.0003515952739477951, 'samples': 10806912, 'steps': 56285, 'loss/train': 1.2115530967712402} -11/07/2021 05:08:08 - INFO - __main__ - Step 56287: {'lr': 0.0003515904251330965, 'samples': 10807104, 'steps': 56286, 'loss/train': 1.4226312637329102} -11/07/2021 05:08:08 - INFO - __main__ - Step 56288: {'lr': 0.00035158557627262295, 'samples': 10807296, 'steps': 56287, 'loss/train': 1.071256160736084} -11/07/2021 05:08:08 - INFO - __main__ - Step 56289: {'lr': 0.00035158072736637643, 'samples': 10807488, 'steps': 56288, 'loss/train': 1.5754724740982056} -11/07/2021 05:08:09 - INFO - __main__ - Step 56290: {'lr': 0.0003515758784143592, 'samples': 10807680, 'steps': 56289, 'loss/train': 2.0535340309143066} -11/07/2021 05:08:09 - INFO - __main__ - Step 56291: {'lr': 0.00035157102941657336, 'samples': 10807872, 'steps': 56290, 'loss/train': 1.3907785415649414} -11/07/2021 05:08:10 - INFO - __main__ - Step 56292: {'lr': 0.0003515661803730213, 'samples': 10808064, 'steps': 56291, 'loss/train': 1.1638755798339844} -11/07/2021 05:08:10 - INFO - __main__ - Step 56293: {'lr': 0.000351561331283705, 'samples': 10808256, 'steps': 56292, 'loss/train': 1.2919719219207764} -11/07/2021 05:08:11 - INFO - __main__ - Step 56294: {'lr': 0.0003515564821486268, 'samples': 10808448, 'steps': 56293, 'loss/train': 1.6496127843856812} -11/07/2021 05:08:11 - INFO - __main__ - Step 56295: {'lr': 0.00035155163296778883, 'samples': 10808640, 'steps': 56294, 'loss/train': 1.5217833518981934} -11/07/2021 05:08:11 - INFO - __main__ - Step 56296: {'lr': 0.0003515467837411932, 'samples': 10808832, 'steps': 56295, 'loss/train': 1.1412055492401123} -11/07/2021 05:08:12 - INFO - __main__ - Step 56297: {'lr': 0.0003515419344688422, 'samples': 10809024, 'steps': 56296, 'loss/train': 0.5805878043174744} -11/07/2021 05:08:13 - INFO - __main__ - Step 56298: {'lr': 0.00035153708515073793, 'samples': 10809216, 'steps': 56297, 'loss/train': 1.531552791595459} -11/07/2021 05:08:13 - INFO - __main__ - Step 56299: {'lr': 0.00035153223578688263, 'samples': 10809408, 'steps': 56298, 'loss/train': 0.08228524029254913} -11/07/2021 05:08:14 - INFO - __main__ - Step 56300: {'lr': 0.0003515273863772785, 'samples': 10809600, 'steps': 56299, 'loss/train': 1.5238845348358154} -11/07/2021 05:08:14 - INFO - __main__ - Step 56301: {'lr': 0.00035152253692192765, 'samples': 10809792, 'steps': 56300, 'loss/train': 1.3679463863372803} -11/07/2021 05:08:15 - INFO - __main__ - Step 56302: {'lr': 0.0003515176874208324, 'samples': 10809984, 'steps': 56301, 'loss/train': 1.4546902179718018} -11/07/2021 05:08:15 - INFO - __main__ - Step 56303: {'lr': 0.0003515128378739948, 'samples': 10810176, 'steps': 56302, 'loss/train': 1.1979960203170776} -11/07/2021 05:08:16 - INFO - __main__ - Step 56304: {'lr': 0.0003515079882814171, 'samples': 10810368, 'steps': 56303, 'loss/train': 1.2700610160827637} -11/07/2021 05:08:16 - INFO - __main__ - Step 56305: {'lr': 0.00035150313864310137, 'samples': 10810560, 'steps': 56304, 'loss/train': 1.5382988452911377} -11/07/2021 05:08:16 - INFO - __main__ - Step 56306: {'lr': 0.00035149828895904994, 'samples': 10810752, 'steps': 56305, 'loss/train': 1.3243350982666016} -11/07/2021 05:08:17 - INFO - __main__ - Step 56307: {'lr': 0.00035149343922926497, 'samples': 10810944, 'steps': 56306, 'loss/train': 1.6069839000701904} -11/07/2021 05:08:18 - INFO - __main__ - Step 56308: {'lr': 0.0003514885894537486, 'samples': 10811136, 'steps': 56307, 'loss/train': 1.2906118631362915} -11/07/2021 05:08:18 - INFO - __main__ - Step 56309: {'lr': 0.00035148373963250307, 'samples': 10811328, 'steps': 56308, 'loss/train': 1.5618865489959717} -11/07/2021 05:08:18 - INFO - __main__ - Step 56310: {'lr': 0.0003514788897655305, 'samples': 10811520, 'steps': 56309, 'loss/train': 0.7043637633323669} -11/07/2021 05:08:19 - INFO - __main__ - Step 56311: {'lr': 0.0003514740398528331, 'samples': 10811712, 'steps': 56310, 'loss/train': 0.9927510619163513} -11/07/2021 05:08:19 - INFO - __main__ - Step 56312: {'lr': 0.0003514691898944131, 'samples': 10811904, 'steps': 56311, 'loss/train': 1.4340620040893555} -11/07/2021 05:08:20 - INFO - __main__ - Step 56313: {'lr': 0.0003514643398902727, 'samples': 10812096, 'steps': 56312, 'loss/train': 1.3973286151885986} -11/07/2021 05:08:20 - INFO - __main__ - Step 56314: {'lr': 0.00035145948984041393, 'samples': 10812288, 'steps': 56313, 'loss/train': 1.5491747856140137} -11/07/2021 05:08:21 - INFO - __main__ - Step 56315: {'lr': 0.00035145463974483915, 'samples': 10812480, 'steps': 56314, 'loss/train': 1.3057949542999268} -11/07/2021 05:08:21 - INFO - __main__ - Step 56316: {'lr': 0.00035144978960355045, 'samples': 10812672, 'steps': 56315, 'loss/train': 1.265416145324707} -11/07/2021 05:08:22 - INFO - __main__ - Step 56317: {'lr': 0.00035144493941655, 'samples': 10812864, 'steps': 56316, 'loss/train': 1.378902792930603} -11/07/2021 05:08:23 - INFO - __main__ - Step 56318: {'lr': 0.00035144008918384006, 'samples': 10813056, 'steps': 56317, 'loss/train': 0.857494592666626} -11/07/2021 05:08:23 - INFO - __main__ - Step 56319: {'lr': 0.0003514352389054228, 'samples': 10813248, 'steps': 56318, 'loss/train': 1.1948238611221313} -11/07/2021 05:08:23 - INFO - __main__ - Step 56320: {'lr': 0.00035143038858130034, 'samples': 10813440, 'steps': 56319, 'loss/train': 1.2425715923309326} -11/07/2021 05:08:24 - INFO - __main__ - Step 56321: {'lr': 0.00035142553821147494, 'samples': 10813632, 'steps': 56320, 'loss/train': 1.6433122158050537} -11/07/2021 05:08:24 - INFO - __main__ - Step 56322: {'lr': 0.00035142068779594885, 'samples': 10813824, 'steps': 56321, 'loss/train': 2.380887031555176} -11/07/2021 05:08:25 - INFO - __main__ - Step 56323: {'lr': 0.00035141583733472407, 'samples': 10814016, 'steps': 56322, 'loss/train': 1.6240476369857788} -11/07/2021 05:08:26 - INFO - __main__ - Step 56324: {'lr': 0.0003514109868278028, 'samples': 10814208, 'steps': 56323, 'loss/train': 0.8962580561637878} -11/07/2021 05:08:26 - INFO - __main__ - Step 56325: {'lr': 0.0003514061362751874, 'samples': 10814400, 'steps': 56324, 'loss/train': 1.420181393623352} -11/07/2021 05:08:26 - INFO - __main__ - Step 56326: {'lr': 0.0003514012856768799, 'samples': 10814592, 'steps': 56325, 'loss/train': 1.265038251876831} -11/07/2021 05:08:27 - INFO - __main__ - Step 56327: {'lr': 0.0003513964350328826, 'samples': 10814784, 'steps': 56326, 'loss/train': 1.5866719484329224} -11/07/2021 05:08:27 - INFO - __main__ - Step 56328: {'lr': 0.0003513915843431977, 'samples': 10814976, 'steps': 56327, 'loss/train': 1.5536901950836182} -11/07/2021 05:08:28 - INFO - __main__ - Step 56329: {'lr': 0.0003513867336078272, 'samples': 10815168, 'steps': 56328, 'loss/train': 1.133144736289978} -11/07/2021 05:08:28 - INFO - __main__ - Step 56330: {'lr': 0.00035138188282677344, 'samples': 10815360, 'steps': 56329, 'loss/train': 1.1731499433517456} -11/07/2021 05:08:29 - INFO - __main__ - Step 56331: {'lr': 0.00035137703200003857, 'samples': 10815552, 'steps': 56330, 'loss/train': 1.340118408203125} -11/07/2021 05:08:29 - INFO - __main__ - Step 56332: {'lr': 0.00035137218112762475, 'samples': 10815744, 'steps': 56331, 'loss/train': 2.1245827674865723} -11/07/2021 05:08:30 - INFO - __main__ - Step 56333: {'lr': 0.0003513673302095342, 'samples': 10815936, 'steps': 56332, 'loss/train': 1.8567603826522827} -11/07/2021 05:08:30 - INFO - __main__ - Step 56334: {'lr': 0.0003513624792457691, 'samples': 10816128, 'steps': 56333, 'loss/train': 1.5586357116699219} -11/07/2021 05:08:31 - INFO - __main__ - Step 56335: {'lr': 0.00035135762823633167, 'samples': 10816320, 'steps': 56334, 'loss/train': 1.6616904735565186} -11/07/2021 05:08:31 - INFO - __main__ - Step 56336: {'lr': 0.00035135277718122403, 'samples': 10816512, 'steps': 56335, 'loss/train': 2.636472225189209} -11/07/2021 05:08:31 - INFO - __main__ - Step 56337: {'lr': 0.0003513479260804484, 'samples': 10816704, 'steps': 56336, 'loss/train': 1.2617383003234863} -11/07/2021 05:08:32 - INFO - __main__ - Step 56338: {'lr': 0.0003513430749340069, 'samples': 10816896, 'steps': 56337, 'loss/train': 1.1958850622177124} -11/07/2021 05:08:33 - INFO - __main__ - Step 56339: {'lr': 0.0003513382237419018, 'samples': 10817088, 'steps': 56338, 'loss/train': 1.488937497138977} -11/07/2021 05:08:33 - INFO - __main__ - Step 56340: {'lr': 0.00035133337250413534, 'samples': 10817280, 'steps': 56339, 'loss/train': 1.2550724744796753} -11/07/2021 05:08:33 - INFO - __main__ - Step 56341: {'lr': 0.00035132852122070953, 'samples': 10817472, 'steps': 56340, 'loss/train': 1.411402940750122} -11/07/2021 05:08:34 - INFO - __main__ - Step 56342: {'lr': 0.0003513236698916267, 'samples': 10817664, 'steps': 56341, 'loss/train': 1.3002254962921143} -11/07/2021 05:08:34 - INFO - __main__ - Step 56343: {'lr': 0.00035131881851688896, 'samples': 10817856, 'steps': 56342, 'loss/train': 0.9825994372367859} -11/07/2021 05:08:35 - INFO - __main__ - Step 56344: {'lr': 0.00035131396709649855, 'samples': 10818048, 'steps': 56343, 'loss/train': 1.5272952318191528} -11/07/2021 05:08:36 - INFO - __main__ - Step 56345: {'lr': 0.00035130911563045764, 'samples': 10818240, 'steps': 56344, 'loss/train': 2.537260055541992} -11/07/2021 05:08:36 - INFO - __main__ - Step 56346: {'lr': 0.00035130426411876834, 'samples': 10818432, 'steps': 56345, 'loss/train': 1.7120434045791626} -11/07/2021 05:08:36 - INFO - __main__ - Step 56347: {'lr': 0.00035129941256143295, 'samples': 10818624, 'steps': 56346, 'loss/train': 1.48082435131073} -11/07/2021 05:08:37 - INFO - __main__ - Step 56348: {'lr': 0.0003512945609584536, 'samples': 10818816, 'steps': 56347, 'loss/train': 0.07550205290317535} -11/07/2021 05:08:38 - INFO - __main__ - Step 56349: {'lr': 0.0003512897093098325, 'samples': 10819008, 'steps': 56348, 'loss/train': 1.1048388481140137} -11/07/2021 05:08:38 - INFO - __main__ - Step 56350: {'lr': 0.0003512848576155718, 'samples': 10819200, 'steps': 56349, 'loss/train': 2.077885389328003} -11/07/2021 05:08:38 - INFO - __main__ - Step 56351: {'lr': 0.0003512800058756738, 'samples': 10819392, 'steps': 56350, 'loss/train': 1.0637279748916626} -11/07/2021 05:08:39 - INFO - __main__ - Step 56352: {'lr': 0.00035127515409014046, 'samples': 10819584, 'steps': 56351, 'loss/train': 1.535597324371338} -11/07/2021 05:08:39 - INFO - __main__ - Step 56353: {'lr': 0.00035127030225897413, 'samples': 10819776, 'steps': 56352, 'loss/train': 1.1597362756729126} -11/07/2021 05:08:40 - INFO - __main__ - Step 56354: {'lr': 0.000351265450382177, 'samples': 10819968, 'steps': 56353, 'loss/train': 1.274021863937378} -11/07/2021 05:08:41 - INFO - __main__ - Step 56355: {'lr': 0.0003512605984597512, 'samples': 10820160, 'steps': 56354, 'loss/train': 1.341858983039856} -11/07/2021 05:08:41 - INFO - __main__ - Step 56356: {'lr': 0.00035125574649169894, 'samples': 10820352, 'steps': 56355, 'loss/train': 1.5707485675811768} -11/07/2021 05:08:41 - INFO - __main__ - Step 56357: {'lr': 0.0003512508944780224, 'samples': 10820544, 'steps': 56356, 'loss/train': 1.7568302154541016} -11/07/2021 05:08:42 - INFO - __main__ - Step 56358: {'lr': 0.0003512460424187237, 'samples': 10820736, 'steps': 56357, 'loss/train': 1.2920538187026978} -11/07/2021 05:08:43 - INFO - __main__ - Step 56359: {'lr': 0.00035124119031380526, 'samples': 10820928, 'steps': 56358, 'loss/train': 1.617993712425232} -11/07/2021 05:08:43 - INFO - __main__ - Step 56360: {'lr': 0.000351236338163269, 'samples': 10821120, 'steps': 56359, 'loss/train': 0.6446110606193542} -11/07/2021 05:08:43 - INFO - __main__ - Step 56361: {'lr': 0.00035123148596711716, 'samples': 10821312, 'steps': 56360, 'loss/train': 1.295314908027649} -11/07/2021 05:08:44 - INFO - __main__ - Step 56362: {'lr': 0.0003512266337253521, 'samples': 10821504, 'steps': 56361, 'loss/train': 1.4957098960876465} -11/07/2021 05:08:44 - INFO - __main__ - Step 56363: {'lr': 0.0003512217814379758, 'samples': 10821696, 'steps': 56362, 'loss/train': 1.2495609521865845} -11/07/2021 05:08:45 - INFO - __main__ - Step 56364: {'lr': 0.0003512169291049905, 'samples': 10821888, 'steps': 56363, 'loss/train': 1.2257405519485474} -11/07/2021 05:08:46 - INFO - __main__ - Step 56365: {'lr': 0.0003512120767263985, 'samples': 10822080, 'steps': 56364, 'loss/train': 1.4817039966583252} -11/07/2021 05:08:46 - INFO - __main__ - Step 56366: {'lr': 0.0003512072243022018, 'samples': 10822272, 'steps': 56365, 'loss/train': 1.5123552083969116} -11/07/2021 05:08:46 - INFO - __main__ - Step 56367: {'lr': 0.00035120237183240276, 'samples': 10822464, 'steps': 56366, 'loss/train': 1.4283339977264404} -11/07/2021 05:08:47 - INFO - __main__ - Step 56368: {'lr': 0.00035119751931700344, 'samples': 10822656, 'steps': 56367, 'loss/train': 1.0413459539413452} -11/07/2021 05:08:48 - INFO - __main__ - Step 56369: {'lr': 0.00035119266675600615, 'samples': 10822848, 'steps': 56368, 'loss/train': 1.5881069898605347} -11/07/2021 05:08:48 - INFO - __main__ - Step 56370: {'lr': 0.00035118781414941296, 'samples': 10823040, 'steps': 56369, 'loss/train': 1.1666054725646973} -11/07/2021 05:08:48 - INFO - __main__ - Step 56371: {'lr': 0.00035118296149722614, 'samples': 10823232, 'steps': 56370, 'loss/train': 1.1436271667480469} -11/07/2021 05:08:49 - INFO - __main__ - Step 56372: {'lr': 0.0003511781087994478, 'samples': 10823424, 'steps': 56371, 'loss/train': 1.313245415687561} -11/07/2021 05:08:49 - INFO - __main__ - Step 56373: {'lr': 0.00035117325605608013, 'samples': 10823616, 'steps': 56372, 'loss/train': 1.2382103204727173} -11/07/2021 05:08:49 - INFO - __main__ - Step 56374: {'lr': 0.0003511684032671254, 'samples': 10823808, 'steps': 56373, 'loss/train': 1.6699844598770142} -11/07/2021 05:08:51 - INFO - __main__ - Step 56375: {'lr': 0.0003511635504325857, 'samples': 10824000, 'steps': 56374, 'loss/train': 1.621235966682434} -11/07/2021 05:08:51 - INFO - __main__ - Step 56376: {'lr': 0.0003511586975524634, 'samples': 10824192, 'steps': 56375, 'loss/train': 1.34029221534729} -11/07/2021 05:08:52 - INFO - __main__ - Step 56377: {'lr': 0.0003511538446267604, 'samples': 10824384, 'steps': 56376, 'loss/train': 5.697155952453613} -11/07/2021 05:08:52 - INFO - __main__ - Step 56378: {'lr': 0.00035114899165547916, 'samples': 10824576, 'steps': 56377, 'loss/train': 1.3295198678970337} -11/07/2021 05:08:52 - INFO - __main__ - Step 56379: {'lr': 0.00035114413863862164, 'samples': 10824768, 'steps': 56378, 'loss/train': 1.9706774950027466} -11/07/2021 05:08:53 - INFO - __main__ - Step 56380: {'lr': 0.0003511392855761902, 'samples': 10824960, 'steps': 56379, 'loss/train': 5.348339557647705} -11/07/2021 05:08:54 - INFO - __main__ - Step 56381: {'lr': 0.0003511344324681869, 'samples': 10825152, 'steps': 56380, 'loss/train': 5.333381175994873} -11/07/2021 05:08:54 - INFO - __main__ - Step 56382: {'lr': 0.00035112957931461407, 'samples': 10825344, 'steps': 56381, 'loss/train': 1.400259256362915} -11/07/2021 05:08:54 - INFO - __main__ - Step 56383: {'lr': 0.00035112472611547376, 'samples': 10825536, 'steps': 56382, 'loss/train': 1.722835659980774} -11/07/2021 05:08:55 - INFO - __main__ - Step 56384: {'lr': 0.0003511198728707682, 'samples': 10825728, 'steps': 56383, 'loss/train': 1.4241292476654053} -11/07/2021 05:08:55 - INFO - __main__ - Step 56385: {'lr': 0.0003511150195804996, 'samples': 10825920, 'steps': 56384, 'loss/train': 1.08267343044281} -11/07/2021 05:08:55 - INFO - __main__ - Step 56386: {'lr': 0.00035111016624467007, 'samples': 10826112, 'steps': 56385, 'loss/train': 1.0685404539108276} -11/07/2021 05:08:56 - INFO - __main__ - Step 56387: {'lr': 0.00035110531286328193, 'samples': 10826304, 'steps': 56386, 'loss/train': 1.584810733795166} -11/07/2021 05:08:57 - INFO - __main__ - Step 56388: {'lr': 0.0003511004594363373, 'samples': 10826496, 'steps': 56387, 'loss/train': 1.4250186681747437} -11/07/2021 05:08:57 - INFO - __main__ - Step 56389: {'lr': 0.0003510956059638384, 'samples': 10826688, 'steps': 56388, 'loss/train': 1.1023499965667725} -11/07/2021 05:08:57 - INFO - __main__ - Step 56390: {'lr': 0.0003510907524457873, 'samples': 10826880, 'steps': 56389, 'loss/train': 1.2967067956924438} -11/07/2021 05:08:58 - INFO - __main__ - Step 56391: {'lr': 0.0003510858988821863, 'samples': 10827072, 'steps': 56390, 'loss/train': 1.3536230325698853} -11/07/2021 05:08:59 - INFO - __main__ - Step 56392: {'lr': 0.00035108104527303754, 'samples': 10827264, 'steps': 56391, 'loss/train': 1.3348649740219116} -11/07/2021 05:08:59 - INFO - __main__ - Step 56393: {'lr': 0.0003510761916183432, 'samples': 10827456, 'steps': 56392, 'loss/train': 1.6952288150787354} -11/07/2021 05:09:00 - INFO - __main__ - Step 56394: {'lr': 0.00035107133791810555, 'samples': 10827648, 'steps': 56393, 'loss/train': 1.2137962579727173} -11/07/2021 05:09:00 - INFO - __main__ - Step 56395: {'lr': 0.00035106648417232666, 'samples': 10827840, 'steps': 56394, 'loss/train': 0.9549675583839417} -11/07/2021 05:09:00 - INFO - __main__ - Step 56396: {'lr': 0.0003510616303810088, 'samples': 10828032, 'steps': 56395, 'loss/train': 1.2758619785308838} -11/07/2021 05:09:01 - INFO - __main__ - Step 56397: {'lr': 0.00035105677654415416, 'samples': 10828224, 'steps': 56396, 'loss/train': 0.17087025940418243} -11/07/2021 05:09:02 - INFO - __main__ - Step 56398: {'lr': 0.0003510519226617648, 'samples': 10828416, 'steps': 56397, 'loss/train': 1.5702942609786987} -11/07/2021 05:09:02 - INFO - __main__ - Step 56399: {'lr': 0.00035104706873384305, 'samples': 10828608, 'steps': 56398, 'loss/train': 0.874310314655304} -11/07/2021 05:09:02 - INFO - __main__ - Step 56400: {'lr': 0.0003510422147603911, 'samples': 10828800, 'steps': 56399, 'loss/train': 1.2134251594543457} -11/07/2021 05:09:03 - INFO - __main__ - Step 56401: {'lr': 0.00035103736074141103, 'samples': 10828992, 'steps': 56400, 'loss/train': 1.54283607006073} -11/07/2021 05:09:04 - INFO - __main__ - Step 56402: {'lr': 0.0003510325066769051, 'samples': 10829184, 'steps': 56401, 'loss/train': 1.7283002138137817} -11/07/2021 05:09:04 - INFO - __main__ - Step 56403: {'lr': 0.00035102765256687555, 'samples': 10829376, 'steps': 56402, 'loss/train': 1.5847009420394897} -11/07/2021 05:09:04 - INFO - __main__ - Step 56404: {'lr': 0.0003510227984113244, 'samples': 10829568, 'steps': 56403, 'loss/train': 1.4769731760025024} -11/07/2021 05:09:05 - INFO - __main__ - Step 56405: {'lr': 0.00035101794421025395, 'samples': 10829760, 'steps': 56404, 'loss/train': 0.45974522829055786} -11/07/2021 05:09:05 - INFO - __main__ - Step 56406: {'lr': 0.00035101308996366635, 'samples': 10829952, 'steps': 56405, 'loss/train': 1.4863005876541138} -11/07/2021 05:09:06 - INFO - __main__ - Step 56407: {'lr': 0.00035100823567156385, 'samples': 10830144, 'steps': 56406, 'loss/train': 1.0604636669158936} -11/07/2021 05:09:07 - INFO - __main__ - Step 56408: {'lr': 0.0003510033813339486, 'samples': 10830336, 'steps': 56407, 'loss/train': 1.907752513885498} -11/07/2021 05:09:07 - INFO - __main__ - Step 56409: {'lr': 0.00035099852695082286, 'samples': 10830528, 'steps': 56408, 'loss/train': 1.43251633644104} -11/07/2021 05:09:07 - INFO - __main__ - Step 56410: {'lr': 0.0003509936725221886, 'samples': 10830720, 'steps': 56409, 'loss/train': 1.3085565567016602} -11/07/2021 05:09:08 - INFO - __main__ - Step 56411: {'lr': 0.0003509888180480483, 'samples': 10830912, 'steps': 56410, 'loss/train': 1.3520587682724} -11/07/2021 05:09:09 - INFO - __main__ - Step 56412: {'lr': 0.00035098396352840384, 'samples': 10831104, 'steps': 56411, 'loss/train': 1.17833411693573} -11/07/2021 05:09:09 - INFO - __main__ - Step 56413: {'lr': 0.00035097910896325765, 'samples': 10831296, 'steps': 56412, 'loss/train': 1.0977505445480347} -11/07/2021 05:09:09 - INFO - __main__ - Step 56414: {'lr': 0.0003509742543526118, 'samples': 10831488, 'steps': 56413, 'loss/train': 1.566825032234192} -11/07/2021 05:09:10 - INFO - __main__ - Step 56415: {'lr': 0.00035096939969646854, 'samples': 10831680, 'steps': 56414, 'loss/train': 1.2906500101089478} -11/07/2021 05:09:10 - INFO - __main__ - Step 56416: {'lr': 0.00035096454499483, 'samples': 10831872, 'steps': 56415, 'loss/train': 1.7458585500717163} -11/07/2021 05:09:11 - INFO - __main__ - Step 56417: {'lr': 0.0003509596902476985, 'samples': 10832064, 'steps': 56416, 'loss/train': 1.7231554985046387} -11/07/2021 05:09:11 - INFO - __main__ - Step 56418: {'lr': 0.000350954835455076, 'samples': 10832256, 'steps': 56417, 'loss/train': 1.106741189956665} -11/07/2021 05:09:12 - INFO - __main__ - Step 56419: {'lr': 0.00035094998061696483, 'samples': 10832448, 'steps': 56418, 'loss/train': 1.2603288888931274} -11/07/2021 05:09:12 - INFO - __main__ - Step 56420: {'lr': 0.0003509451257333671, 'samples': 10832640, 'steps': 56419, 'loss/train': 1.025185465812683} -11/07/2021 05:09:13 - INFO - __main__ - Step 56421: {'lr': 0.00035094027080428514, 'samples': 10832832, 'steps': 56420, 'loss/train': 1.6788630485534668} -11/07/2021 05:09:13 - INFO - __main__ - Step 56422: {'lr': 0.00035093541582972105, 'samples': 10833024, 'steps': 56421, 'loss/train': 1.6398028135299683} -11/07/2021 05:09:14 - INFO - __main__ - Step 56423: {'lr': 0.000350930560809677, 'samples': 10833216, 'steps': 56422, 'loss/train': 1.3926358222961426} -11/07/2021 05:09:14 - INFO - __main__ - Step 56424: {'lr': 0.0003509257057441552, 'samples': 10833408, 'steps': 56423, 'loss/train': 2.116044759750366} -11/07/2021 05:09:14 - INFO - __main__ - Step 56425: {'lr': 0.00035092085063315783, 'samples': 10833600, 'steps': 56424, 'loss/train': 1.327752709388733} -11/07/2021 05:09:15 - INFO - __main__ - Step 56426: {'lr': 0.00035091599547668707, 'samples': 10833792, 'steps': 56425, 'loss/train': 1.8574451208114624} -11/07/2021 05:09:16 - INFO - __main__ - Step 56427: {'lr': 0.00035091114027474514, 'samples': 10833984, 'steps': 56426, 'loss/train': 1.6053627729415894} -11/07/2021 05:09:16 - INFO - __main__ - Step 56428: {'lr': 0.0003509062850273342, 'samples': 10834176, 'steps': 56427, 'loss/train': 1.2255128622055054} -11/07/2021 05:09:16 - INFO - __main__ - Step 56429: {'lr': 0.0003509014297344565, 'samples': 10834368, 'steps': 56428, 'loss/train': 1.2436903715133667} -11/07/2021 05:09:17 - INFO - __main__ - Step 56430: {'lr': 0.0003508965743961141, 'samples': 10834560, 'steps': 56429, 'loss/train': 1.6321382522583008} -11/07/2021 05:09:17 - INFO - __main__ - Step 56431: {'lr': 0.00035089171901230926, 'samples': 10834752, 'steps': 56430, 'loss/train': 1.8084721565246582} -11/07/2021 05:09:18 - INFO - __main__ - Step 56432: {'lr': 0.0003508868635830442, 'samples': 10834944, 'steps': 56431, 'loss/train': 1.4079978466033936} -11/07/2021 05:09:19 - INFO - __main__ - Step 56433: {'lr': 0.00035088200810832104, 'samples': 10835136, 'steps': 56432, 'loss/train': 1.562827467918396} -11/07/2021 05:09:19 - INFO - __main__ - Step 56434: {'lr': 0.00035087715258814203, 'samples': 10835328, 'steps': 56433, 'loss/train': 1.4147230386734009} -11/07/2021 05:09:19 - INFO - __main__ - Step 56435: {'lr': 0.00035087229702250936, 'samples': 10835520, 'steps': 56434, 'loss/train': 1.3920665979385376} -11/07/2021 05:09:20 - INFO - __main__ - Step 56436: {'lr': 0.00035086744141142514, 'samples': 10835712, 'steps': 56435, 'loss/train': 1.5755733251571655} -11/07/2021 05:09:21 - INFO - __main__ - Step 56437: {'lr': 0.0003508625857548916, 'samples': 10835904, 'steps': 56436, 'loss/train': 1.351709246635437} -11/07/2021 05:09:21 - INFO - __main__ - Step 56438: {'lr': 0.000350857730052911, 'samples': 10836096, 'steps': 56437, 'loss/train': 1.2981946468353271} -11/07/2021 05:09:21 - INFO - __main__ - Step 56439: {'lr': 0.0003508528743054854, 'samples': 10836288, 'steps': 56438, 'loss/train': 1.1369142532348633} -11/07/2021 05:09:22 - INFO - __main__ - Step 56440: {'lr': 0.00035084801851261707, 'samples': 10836480, 'steps': 56439, 'loss/train': 0.850168764591217} -11/07/2021 05:09:22 - INFO - __main__ - Step 56441: {'lr': 0.00035084316267430815, 'samples': 10836672, 'steps': 56440, 'loss/train': 1.2398172616958618} -11/07/2021 05:09:23 - INFO - __main__ - Step 56442: {'lr': 0.0003508383067905609, 'samples': 10836864, 'steps': 56441, 'loss/train': 1.5632760524749756} -11/07/2021 05:09:24 - INFO - __main__ - Step 56443: {'lr': 0.0003508334508613775, 'samples': 10837056, 'steps': 56442, 'loss/train': 1.3541842699050903} -11/07/2021 05:09:24 - INFO - __main__ - Step 56444: {'lr': 0.00035082859488676005, 'samples': 10837248, 'steps': 56443, 'loss/train': 1.5581953525543213} -11/07/2021 05:09:24 - INFO - __main__ - Step 56445: {'lr': 0.0003508237388667108, 'samples': 10837440, 'steps': 56444, 'loss/train': 1.1634643077850342} -11/07/2021 05:09:25 - INFO - __main__ - Step 56446: {'lr': 0.00035081888280123194, 'samples': 10837632, 'steps': 56445, 'loss/train': 1.3987843990325928} -11/07/2021 05:09:25 - INFO - __main__ - Step 56447: {'lr': 0.0003508140266903256, 'samples': 10837824, 'steps': 56446, 'loss/train': 1.2198574542999268} -11/07/2021 05:09:26 - INFO - __main__ - Step 56448: {'lr': 0.0003508091705339941, 'samples': 10838016, 'steps': 56447, 'loss/train': 1.7012450695037842} -11/07/2021 05:09:27 - INFO - __main__ - Step 56449: {'lr': 0.00035080431433223946, 'samples': 10838208, 'steps': 56448, 'loss/train': 1.41193425655365} -11/07/2021 05:09:27 - INFO - __main__ - Step 56450: {'lr': 0.000350799458085064, 'samples': 10838400, 'steps': 56449, 'loss/train': 0.7745003700256348} -11/07/2021 05:09:27 - INFO - __main__ - Step 56451: {'lr': 0.00035079460179246984, 'samples': 10838592, 'steps': 56450, 'loss/train': 1.8149513006210327} -11/07/2021 05:09:28 - INFO - __main__ - Step 56452: {'lr': 0.0003507897454544592, 'samples': 10838784, 'steps': 56451, 'loss/train': 1.5369768142700195} -11/07/2021 05:09:29 - INFO - __main__ - Step 56453: {'lr': 0.0003507848890710342, 'samples': 10838976, 'steps': 56452, 'loss/train': 1.4429296255111694} -11/07/2021 05:09:29 - INFO - __main__ - Step 56454: {'lr': 0.00035078003264219713, 'samples': 10839168, 'steps': 56453, 'loss/train': 1.3574390411376953} -11/07/2021 05:09:29 - INFO - __main__ - Step 56455: {'lr': 0.0003507751761679502, 'samples': 10839360, 'steps': 56454, 'loss/train': 1.4801967144012451} -11/07/2021 05:09:30 - INFO - __main__ - Step 56456: {'lr': 0.0003507703196482955, 'samples': 10839552, 'steps': 56455, 'loss/train': 1.9251022338867188} -11/07/2021 05:09:30 - INFO - __main__ - Step 56457: {'lr': 0.0003507654630832352, 'samples': 10839744, 'steps': 56456, 'loss/train': 1.4896724224090576} -11/07/2021 05:09:31 - INFO - __main__ - Step 56458: {'lr': 0.0003507606064727715, 'samples': 10839936, 'steps': 56457, 'loss/train': 1.2481746673583984} -11/07/2021 05:09:31 - INFO - __main__ - Step 56459: {'lr': 0.0003507557498169067, 'samples': 10840128, 'steps': 56458, 'loss/train': 1.343714952468872} -11/07/2021 05:09:32 - INFO - __main__ - Step 56460: {'lr': 0.0003507508931156429, 'samples': 10840320, 'steps': 56459, 'loss/train': 1.4095211029052734} -11/07/2021 05:09:32 - INFO - __main__ - Step 56461: {'lr': 0.0003507460363689823, 'samples': 10840512, 'steps': 56460, 'loss/train': 1.118160367012024} -11/07/2021 05:09:33 - INFO - __main__ - Step 56462: {'lr': 0.00035074117957692707, 'samples': 10840704, 'steps': 56461, 'loss/train': 1.6819826364517212} -11/07/2021 05:09:33 - INFO - __main__ - Step 56463: {'lr': 0.0003507363227394795, 'samples': 10840896, 'steps': 56462, 'loss/train': 0.5558393597602844} -11/07/2021 05:09:34 - INFO - __main__ - Step 56464: {'lr': 0.00035073146585664163, 'samples': 10841088, 'steps': 56463, 'loss/train': 1.30038583278656} -11/07/2021 05:09:34 - INFO - __main__ - Step 56465: {'lr': 0.00035072660892841566, 'samples': 10841280, 'steps': 56464, 'loss/train': 1.0113273859024048} -11/07/2021 05:09:35 - INFO - __main__ - Step 56466: {'lr': 0.0003507217519548039, 'samples': 10841472, 'steps': 56465, 'loss/train': 1.5108157396316528} -11/07/2021 05:09:35 - INFO - __main__ - Step 56467: {'lr': 0.00035071689493580845, 'samples': 10841664, 'steps': 56466, 'loss/train': 1.5632741451263428} -11/07/2021 05:09:35 - INFO - __main__ - Step 56468: {'lr': 0.0003507120378714315, 'samples': 10841856, 'steps': 56467, 'loss/train': 1.402575135231018} -11/07/2021 05:09:36 - INFO - __main__ - Step 56469: {'lr': 0.0003507071807616753, 'samples': 10842048, 'steps': 56468, 'loss/train': 1.387196660041809} -11/07/2021 05:09:37 - INFO - __main__ - Step 56470: {'lr': 0.0003507023236065421, 'samples': 10842240, 'steps': 56469, 'loss/train': 1.0838427543640137} -11/07/2021 05:09:37 - INFO - __main__ - Step 56471: {'lr': 0.0003506974664060338, 'samples': 10842432, 'steps': 56470, 'loss/train': 1.2613595724105835} -11/07/2021 05:09:37 - INFO - __main__ - Step 56472: {'lr': 0.00035069260916015287, 'samples': 10842624, 'steps': 56471, 'loss/train': 2.4340803623199463} -11/07/2021 05:09:38 - INFO - __main__ - Step 56473: {'lr': 0.0003506877518689014, 'samples': 10842816, 'steps': 56472, 'loss/train': 1.6305314302444458} -11/07/2021 05:09:39 - INFO - __main__ - Step 56474: {'lr': 0.0003506828945322816, 'samples': 10843008, 'steps': 56473, 'loss/train': 0.9941365718841553} -11/07/2021 05:09:39 - INFO - __main__ - Step 56475: {'lr': 0.0003506780371502956, 'samples': 10843200, 'steps': 56474, 'loss/train': 1.4905797243118286} -11/07/2021 05:09:40 - INFO - __main__ - Step 56476: {'lr': 0.00035067317972294564, 'samples': 10843392, 'steps': 56475, 'loss/train': 1.0587031841278076} -11/07/2021 05:09:40 - INFO - __main__ - Step 56477: {'lr': 0.00035066832225023393, 'samples': 10843584, 'steps': 56476, 'loss/train': 1.3000357151031494} -11/07/2021 05:09:40 - INFO - __main__ - Step 56478: {'lr': 0.0003506634647321626, 'samples': 10843776, 'steps': 56477, 'loss/train': 1.6559810638427734} -11/07/2021 05:09:41 - INFO - __main__ - Step 56479: {'lr': 0.0003506586071687338, 'samples': 10843968, 'steps': 56478, 'loss/train': 1.014644742012024} -11/07/2021 05:09:42 - INFO - __main__ - Step 56480: {'lr': 0.0003506537495599499, 'samples': 10844160, 'steps': 56479, 'loss/train': 0.08396033942699432} -11/07/2021 05:09:42 - INFO - __main__ - Step 56481: {'lr': 0.0003506488919058129, 'samples': 10844352, 'steps': 56480, 'loss/train': 1.287361979484558} -11/07/2021 05:09:42 - INFO - __main__ - Step 56482: {'lr': 0.00035064403420632505, 'samples': 10844544, 'steps': 56481, 'loss/train': 1.5210411548614502} -11/07/2021 05:09:43 - INFO - __main__ - Step 56483: {'lr': 0.0003506391764614887, 'samples': 10844736, 'steps': 56482, 'loss/train': 1.29570734500885} -11/07/2021 05:09:44 - INFO - __main__ - Step 56484: {'lr': 0.00035063431867130576, 'samples': 10844928, 'steps': 56483, 'loss/train': 1.594150424003601} -11/07/2021 05:09:44 - INFO - __main__ - Step 56485: {'lr': 0.00035062946083577853, 'samples': 10845120, 'steps': 56484, 'loss/train': 1.563456654548645} -11/07/2021 05:09:45 - INFO - __main__ - Step 56486: {'lr': 0.00035062460295490926, 'samples': 10845312, 'steps': 56485, 'loss/train': 1.0996873378753662} -11/07/2021 05:09:45 - INFO - __main__ - Step 56487: {'lr': 0.00035061974502870007, 'samples': 10845504, 'steps': 56486, 'loss/train': 1.7642879486083984} -11/07/2021 05:09:45 - INFO - __main__ - Step 56488: {'lr': 0.0003506148870571533, 'samples': 10845696, 'steps': 56487, 'loss/train': 1.9007972478866577} -11/07/2021 05:09:46 - INFO - __main__ - Step 56489: {'lr': 0.00035061002904027084, 'samples': 10845888, 'steps': 56488, 'loss/train': 1.7326982021331787} -11/07/2021 05:09:47 - INFO - __main__ - Step 56490: {'lr': 0.0003506051709780551, 'samples': 10846080, 'steps': 56489, 'loss/train': 1.564028024673462} -11/07/2021 05:09:47 - INFO - __main__ - Step 56491: {'lr': 0.0003506003128705083, 'samples': 10846272, 'steps': 56490, 'loss/train': 0.7779012322425842} -11/07/2021 05:09:47 - INFO - __main__ - Step 56492: {'lr': 0.0003505954547176325, 'samples': 10846464, 'steps': 56491, 'loss/train': 1.4085956811904907} -11/07/2021 05:09:48 - INFO - __main__ - Step 56493: {'lr': 0.00035059059651942995, 'samples': 10846656, 'steps': 56492, 'loss/train': 1.0903558731079102} -11/07/2021 05:09:48 - INFO - __main__ - Step 56494: {'lr': 0.00035058573827590286, 'samples': 10846848, 'steps': 56493, 'loss/train': 1.7710188627243042} -11/07/2021 05:09:50 - INFO - __main__ - Step 56495: {'lr': 0.0003505808799870533, 'samples': 10847040, 'steps': 56494, 'loss/train': 0.8494094014167786} -11/07/2021 05:09:50 - INFO - __main__ - Step 56496: {'lr': 0.0003505760216528836, 'samples': 10847232, 'steps': 56495, 'loss/train': 1.1221890449523926} -11/07/2021 05:09:50 - INFO - __main__ - Step 56497: {'lr': 0.0003505711632733959, 'samples': 10847424, 'steps': 56496, 'loss/train': 1.116998553276062} -11/07/2021 05:09:51 - INFO - __main__ - Step 56498: {'lr': 0.00035056630484859235, 'samples': 10847616, 'steps': 56497, 'loss/train': 1.4646931886672974} -11/07/2021 05:09:51 - INFO - __main__ - Step 56499: {'lr': 0.00035056144637847525, 'samples': 10847808, 'steps': 56498, 'loss/train': 0.979411780834198} -11/07/2021 05:09:51 - INFO - __main__ - Step 56500: {'lr': 0.0003505565878630467, 'samples': 10848000, 'steps': 56499, 'loss/train': 1.0676548480987549} -11/07/2021 05:09:52 - INFO - __main__ - Step 56501: {'lr': 0.0003505517293023088, 'samples': 10848192, 'steps': 56500, 'loss/train': 0.17799589037895203} -11/07/2021 05:09:53 - INFO - __main__ - Step 56502: {'lr': 0.0003505468706962639, 'samples': 10848384, 'steps': 56501, 'loss/train': 0.748681902885437} -11/07/2021 05:09:53 - INFO - __main__ - Step 56503: {'lr': 0.00035054201204491413, 'samples': 10848576, 'steps': 56502, 'loss/train': 1.7646546363830566} -11/07/2021 05:09:53 - INFO - __main__ - Step 56504: {'lr': 0.00035053715334826176, 'samples': 10848768, 'steps': 56503, 'loss/train': 1.495108723640442} -11/07/2021 05:09:54 - INFO - __main__ - Step 56505: {'lr': 0.0003505322946063089, 'samples': 10848960, 'steps': 56504, 'loss/train': 2.6900439262390137} -11/07/2021 05:09:55 - INFO - __main__ - Step 56506: {'lr': 0.0003505274358190576, 'samples': 10849152, 'steps': 56505, 'loss/train': 1.8099464178085327} -11/07/2021 05:09:55 - INFO - __main__ - Step 56507: {'lr': 0.00035052257698651025, 'samples': 10849344, 'steps': 56506, 'loss/train': 1.2279366254806519} -11/07/2021 05:09:56 - INFO - __main__ - Step 56508: {'lr': 0.000350517718108669, 'samples': 10849536, 'steps': 56507, 'loss/train': 1.1620947122573853} -11/07/2021 05:09:56 - INFO - __main__ - Step 56509: {'lr': 0.000350512859185536, 'samples': 10849728, 'steps': 56508, 'loss/train': 1.5747660398483276} -11/07/2021 05:09:56 - INFO - __main__ - Step 56510: {'lr': 0.00035050800021711346, 'samples': 10849920, 'steps': 56509, 'loss/train': 0.7256755828857422} -11/07/2021 05:09:57 - INFO - __main__ - Step 56511: {'lr': 0.00035050314120340357, 'samples': 10850112, 'steps': 56510, 'loss/train': 1.4492433071136475} -11/07/2021 05:09:58 - INFO - __main__ - Step 56512: {'lr': 0.00035049828214440856, 'samples': 10850304, 'steps': 56511, 'loss/train': 2.0569992065429688} -11/07/2021 05:09:58 - INFO - __main__ - Step 56513: {'lr': 0.00035049342304013055, 'samples': 10850496, 'steps': 56512, 'loss/train': 1.1229181289672852} -11/07/2021 05:09:58 - INFO - __main__ - Step 56514: {'lr': 0.0003504885638905717, 'samples': 10850688, 'steps': 56513, 'loss/train': 1.1955887079238892} -11/07/2021 05:09:59 - INFO - __main__ - Step 56515: {'lr': 0.0003504837046957343, 'samples': 10850880, 'steps': 56514, 'loss/train': 1.7722307443618774} -11/07/2021 05:10:00 - INFO - __main__ - Step 56516: {'lr': 0.0003504788454556205, 'samples': 10851072, 'steps': 56515, 'loss/train': 1.2696478366851807} -11/07/2021 05:10:00 - INFO - __main__ - Step 56517: {'lr': 0.00035047398617023246, 'samples': 10851264, 'steps': 56516, 'loss/train': 1.5104753971099854} -11/07/2021 05:10:00 - INFO - __main__ - Step 56518: {'lr': 0.0003504691268395724, 'samples': 10851456, 'steps': 56517, 'loss/train': 1.338602066040039} -11/07/2021 05:10:01 - INFO - __main__ - Step 56519: {'lr': 0.00035046426746364247, 'samples': 10851648, 'steps': 56518, 'loss/train': 1.8242599964141846} -11/07/2021 05:10:01 - INFO - __main__ - Step 56520: {'lr': 0.0003504594080424449, 'samples': 10851840, 'steps': 56519, 'loss/train': 1.4481475353240967} -11/07/2021 05:10:01 - INFO - __main__ - Step 56521: {'lr': 0.00035045454857598194, 'samples': 10852032, 'steps': 56520, 'loss/train': 1.4232033491134644} -11/07/2021 05:10:03 - INFO - __main__ - Step 56522: {'lr': 0.0003504496890642556, 'samples': 10852224, 'steps': 56521, 'loss/train': 2.073962688446045} -11/07/2021 05:10:03 - INFO - __main__ - Step 56523: {'lr': 0.0003504448295072683, 'samples': 10852416, 'steps': 56522, 'loss/train': 1.0623143911361694} -11/07/2021 05:10:03 - INFO - __main__ - Step 56524: {'lr': 0.00035043996990502204, 'samples': 10852608, 'steps': 56523, 'loss/train': 2.2309913635253906} -11/07/2021 05:10:04 - INFO - __main__ - Step 56525: {'lr': 0.00035043511025751906, 'samples': 10852800, 'steps': 56524, 'loss/train': 1.4322583675384521} -11/07/2021 05:10:04 - INFO - __main__ - Step 56526: {'lr': 0.00035043025056476164, 'samples': 10852992, 'steps': 56525, 'loss/train': 1.4538013935089111} -11/07/2021 05:10:05 - INFO - __main__ - Step 56527: {'lr': 0.00035042539082675184, 'samples': 10853184, 'steps': 56526, 'loss/train': 0.9756379723548889} -11/07/2021 05:10:05 - INFO - __main__ - Step 56528: {'lr': 0.00035042053104349195, 'samples': 10853376, 'steps': 56527, 'loss/train': 0.7582591772079468} -11/07/2021 05:10:06 - INFO - __main__ - Step 56529: {'lr': 0.00035041567121498406, 'samples': 10853568, 'steps': 56528, 'loss/train': 1.4369869232177734} -11/07/2021 05:10:06 - INFO - __main__ - Step 56530: {'lr': 0.0003504108113412305, 'samples': 10853760, 'steps': 56529, 'loss/train': 1.3216538429260254} -11/07/2021 05:10:06 - INFO - __main__ - Step 56531: {'lr': 0.0003504059514222333, 'samples': 10853952, 'steps': 56530, 'loss/train': 1.1601468324661255} -11/07/2021 05:10:07 - INFO - __main__ - Step 56532: {'lr': 0.00035040109145799474, 'samples': 10854144, 'steps': 56531, 'loss/train': 1.9203786849975586} -11/07/2021 05:10:08 - INFO - __main__ - Step 56533: {'lr': 0.0003503962314485171, 'samples': 10854336, 'steps': 56532, 'loss/train': 1.3713005781173706} -11/07/2021 05:10:08 - INFO - __main__ - Step 56534: {'lr': 0.00035039137139380235, 'samples': 10854528, 'steps': 56533, 'loss/train': 1.756475567817688} -11/07/2021 05:10:08 - INFO - __main__ - Step 56535: {'lr': 0.0003503865112938528, 'samples': 10854720, 'steps': 56534, 'loss/train': 1.4186993837356567} -11/07/2021 05:10:09 - INFO - __main__ - Step 56536: {'lr': 0.00035038165114867066, 'samples': 10854912, 'steps': 56535, 'loss/train': 0.7980080246925354} -11/07/2021 05:10:10 - INFO - __main__ - Step 56537: {'lr': 0.00035037679095825815, 'samples': 10855104, 'steps': 56536, 'loss/train': 1.6508228778839111} -11/07/2021 05:10:10 - INFO - __main__ - Step 56538: {'lr': 0.00035037193072261734, 'samples': 10855296, 'steps': 56537, 'loss/train': 0.7000250816345215} -11/07/2021 05:10:11 - INFO - __main__ - Step 56539: {'lr': 0.00035036707044175055, 'samples': 10855488, 'steps': 56538, 'loss/train': 1.0380233526229858} -11/07/2021 05:10:11 - INFO - __main__ - Step 56540: {'lr': 0.00035036221011565985, 'samples': 10855680, 'steps': 56539, 'loss/train': 1.4951800107955933} -11/07/2021 05:10:11 - INFO - __main__ - Step 56541: {'lr': 0.00035035734974434745, 'samples': 10855872, 'steps': 56540, 'loss/train': 1.3978549242019653} -11/07/2021 05:10:12 - INFO - __main__ - Step 56542: {'lr': 0.00035035248932781564, 'samples': 10856064, 'steps': 56541, 'loss/train': 1.6059826612472534} -11/07/2021 05:10:13 - INFO - __main__ - Step 56543: {'lr': 0.0003503476288660665, 'samples': 10856256, 'steps': 56542, 'loss/train': 1.4883650541305542} -11/07/2021 05:10:13 - INFO - __main__ - Step 56544: {'lr': 0.0003503427683591024, 'samples': 10856448, 'steps': 56543, 'loss/train': 1.5489416122436523} -11/07/2021 05:10:13 - INFO - __main__ - Step 56545: {'lr': 0.00035033790780692527, 'samples': 10856640, 'steps': 56544, 'loss/train': 0.9137527346611023} -11/07/2021 05:10:14 - INFO - __main__ - Step 56546: {'lr': 0.0003503330472095375, 'samples': 10856832, 'steps': 56545, 'loss/train': 1.1663609743118286} -11/07/2021 05:10:15 - INFO - __main__ - Step 56547: {'lr': 0.0003503281865669411, 'samples': 10857024, 'steps': 56546, 'loss/train': 1.150452971458435} -11/07/2021 05:10:15 - INFO - __main__ - Step 56548: {'lr': 0.00035032332587913844, 'samples': 10857216, 'steps': 56547, 'loss/train': 1.3628579378128052} -11/07/2021 05:10:16 - INFO - __main__ - Step 56549: {'lr': 0.00035031846514613164, 'samples': 10857408, 'steps': 56548, 'loss/train': 0.8619349598884583} -11/07/2021 05:10:16 - INFO - __main__ - Step 56550: {'lr': 0.00035031360436792294, 'samples': 10857600, 'steps': 56549, 'loss/train': 1.1280677318572998} -11/07/2021 05:10:16 - INFO - __main__ - Step 56551: {'lr': 0.00035030874354451434, 'samples': 10857792, 'steps': 56550, 'loss/train': 1.2040126323699951} -11/07/2021 05:10:17 - INFO - __main__ - Step 56552: {'lr': 0.0003503038826759083, 'samples': 10857984, 'steps': 56551, 'loss/train': 1.8396841287612915} -11/07/2021 05:10:18 - INFO - __main__ - Step 56553: {'lr': 0.00035029902176210675, 'samples': 10858176, 'steps': 56552, 'loss/train': 1.0404289960861206} -11/07/2021 05:10:18 - INFO - __main__ - Step 56554: {'lr': 0.0003502941608031121, 'samples': 10858368, 'steps': 56553, 'loss/train': 1.653855562210083} -11/07/2021 05:10:19 - INFO - __main__ - Step 56555: {'lr': 0.00035028929979892645, 'samples': 10858560, 'steps': 56554, 'loss/train': 1.0883740186691284} -11/07/2021 05:10:19 - INFO - __main__ - Step 56556: {'lr': 0.00035028443874955196, 'samples': 10858752, 'steps': 56555, 'loss/train': 1.2312816381454468} -11/07/2021 05:10:19 - INFO - __main__ - Step 56557: {'lr': 0.00035027957765499084, 'samples': 10858944, 'steps': 56556, 'loss/train': 1.2569242715835571} -11/07/2021 05:10:20 - INFO - __main__ - Step 56558: {'lr': 0.00035027471651524533, 'samples': 10859136, 'steps': 56557, 'loss/train': 1.6510467529296875} -11/07/2021 05:10:21 - INFO - __main__ - Step 56559: {'lr': 0.00035026985533031754, 'samples': 10859328, 'steps': 56558, 'loss/train': 1.7253813743591309} -11/07/2021 05:10:21 - INFO - __main__ - Step 56560: {'lr': 0.00035026499410020974, 'samples': 10859520, 'steps': 56559, 'loss/train': 1.6616827249526978} -11/07/2021 05:10:21 - INFO - __main__ - Step 56561: {'lr': 0.00035026013282492404, 'samples': 10859712, 'steps': 56560, 'loss/train': 1.174570918083191} -11/07/2021 05:10:22 - INFO - __main__ - Step 56562: {'lr': 0.0003502552715044627, 'samples': 10859904, 'steps': 56561, 'loss/train': 1.5358526706695557} -11/07/2021 05:10:23 - INFO - __main__ - Step 56563: {'lr': 0.0003502504101388279, 'samples': 10860096, 'steps': 56562, 'loss/train': 1.172845482826233} -11/07/2021 05:10:23 - INFO - __main__ - Step 56564: {'lr': 0.0003502455487280218, 'samples': 10860288, 'steps': 56563, 'loss/train': 1.251356601715088} -11/07/2021 05:10:23 - INFO - __main__ - Step 56565: {'lr': 0.00035024068727204655, 'samples': 10860480, 'steps': 56564, 'loss/train': 1.361531138420105} -11/07/2021 05:10:24 - INFO - __main__ - Step 56566: {'lr': 0.0003502358257709044, 'samples': 10860672, 'steps': 56565, 'loss/train': 1.2823978662490845} -11/07/2021 05:10:24 - INFO - __main__ - Step 56567: {'lr': 0.00035023096422459756, 'samples': 10860864, 'steps': 56566, 'loss/train': 1.017927885055542} -11/07/2021 05:10:25 - INFO - __main__ - Step 56568: {'lr': 0.0003502261026331282, 'samples': 10861056, 'steps': 56567, 'loss/train': 1.5585192441940308} -11/07/2021 05:10:26 - INFO - __main__ - Step 56569: {'lr': 0.0003502212409964985, 'samples': 10861248, 'steps': 56568, 'loss/train': 1.7004319429397583} -11/07/2021 05:10:26 - INFO - __main__ - Step 56570: {'lr': 0.00035021637931471075, 'samples': 10861440, 'steps': 56569, 'loss/train': 1.6190402507781982} -11/07/2021 05:10:26 - INFO - __main__ - Step 56571: {'lr': 0.00035021151758776693, 'samples': 10861632, 'steps': 56570, 'loss/train': 1.1929931640625} -11/07/2021 05:10:27 - INFO - __main__ - Step 56572: {'lr': 0.00035020665581566934, 'samples': 10861824, 'steps': 56571, 'loss/train': 1.413413405418396} -11/07/2021 05:10:28 - INFO - __main__ - Step 56573: {'lr': 0.0003502017939984202, 'samples': 10862016, 'steps': 56572, 'loss/train': 1.2944855690002441} -11/07/2021 05:10:28 - INFO - __main__ - Step 56574: {'lr': 0.0003501969321360217, 'samples': 10862208, 'steps': 56573, 'loss/train': 0.9877818822860718} -11/07/2021 05:10:28 - INFO - __main__ - Step 56575: {'lr': 0.00035019207022847596, 'samples': 10862400, 'steps': 56574, 'loss/train': 1.2913336753845215} -11/07/2021 05:10:29 - INFO - __main__ - Step 56576: {'lr': 0.0003501872082757852, 'samples': 10862592, 'steps': 56575, 'loss/train': 1.257947564125061} -11/07/2021 05:10:29 - INFO - __main__ - Step 56577: {'lr': 0.0003501823462779518, 'samples': 10862784, 'steps': 56576, 'loss/train': 1.541757345199585} -11/07/2021 05:10:29 - INFO - __main__ - Step 56578: {'lr': 0.00035017748423497766, 'samples': 10862976, 'steps': 56577, 'loss/train': 1.3554177284240723} -11/07/2021 05:10:31 - INFO - __main__ - Step 56579: {'lr': 0.00035017262214686505, 'samples': 10863168, 'steps': 56578, 'loss/train': 1.756501317024231} -11/07/2021 05:10:31 - INFO - __main__ - Step 56580: {'lr': 0.00035016776001361625, 'samples': 10863360, 'steps': 56579, 'loss/train': 1.479548692703247} -11/07/2021 05:10:31 - INFO - __main__ - Step 56581: {'lr': 0.00035016289783523335, 'samples': 10863552, 'steps': 56580, 'loss/train': 0.9331073760986328} -11/07/2021 05:10:32 - INFO - __main__ - Step 56582: {'lr': 0.00035015803561171864, 'samples': 10863744, 'steps': 56581, 'loss/train': 1.2737088203430176} -11/07/2021 05:10:32 - INFO - __main__ - Step 56583: {'lr': 0.0003501531733430743, 'samples': 10863936, 'steps': 56582, 'loss/train': 1.0593665838241577} -11/07/2021 05:10:33 - INFO - __main__ - Step 56584: {'lr': 0.00035014831102930246, 'samples': 10864128, 'steps': 56583, 'loss/train': 1.5288864374160767} -11/07/2021 05:10:33 - INFO - __main__ - Step 56585: {'lr': 0.0003501434486704053, 'samples': 10864320, 'steps': 56584, 'loss/train': 1.3636438846588135} -11/07/2021 05:10:34 - INFO - __main__ - Step 56586: {'lr': 0.0003501385862663851, 'samples': 10864512, 'steps': 56585, 'loss/train': 1.6007615327835083} -11/07/2021 05:10:34 - INFO - __main__ - Step 56587: {'lr': 0.00035013372381724397, 'samples': 10864704, 'steps': 56586, 'loss/train': 1.267218828201294} -11/07/2021 05:10:34 - INFO - __main__ - Step 56588: {'lr': 0.00035012886132298413, 'samples': 10864896, 'steps': 56587, 'loss/train': 1.598380208015442} -11/07/2021 05:10:35 - INFO - __main__ - Step 56589: {'lr': 0.0003501239987836078, 'samples': 10865088, 'steps': 56588, 'loss/train': 1.4377321004867554} -11/07/2021 05:10:36 - INFO - __main__ - Step 56590: {'lr': 0.00035011913619911706, 'samples': 10865280, 'steps': 56589, 'loss/train': 1.3788068294525146} -11/07/2021 05:10:36 - INFO - __main__ - Step 56591: {'lr': 0.0003501142735695143, 'samples': 10865472, 'steps': 56590, 'loss/train': 0.7732943296432495} -11/07/2021 05:10:36 - INFO - __main__ - Step 56592: {'lr': 0.0003501094108948015, 'samples': 10865664, 'steps': 56591, 'loss/train': 1.038304328918457} -11/07/2021 05:10:37 - INFO - __main__ - Step 56593: {'lr': 0.000350104548174981, 'samples': 10865856, 'steps': 56592, 'loss/train': 1.422461748123169} -11/07/2021 05:10:38 - INFO - __main__ - Step 56594: {'lr': 0.00035009968541005487, 'samples': 10866048, 'steps': 56593, 'loss/train': 1.973090410232544} -11/07/2021 05:10:38 - INFO - __main__ - Step 56595: {'lr': 0.00035009482260002544, 'samples': 10866240, 'steps': 56594, 'loss/train': 1.0853878259658813} -11/07/2021 05:10:38 - INFO - __main__ - Step 56596: {'lr': 0.00035008995974489477, 'samples': 10866432, 'steps': 56595, 'loss/train': 1.6085518598556519} -11/07/2021 05:10:39 - INFO - __main__ - Step 56597: {'lr': 0.0003500850968446652, 'samples': 10866624, 'steps': 56596, 'loss/train': 1.4332517385482788} -11/07/2021 05:10:39 - INFO - __main__ - Step 56598: {'lr': 0.00035008023389933876, 'samples': 10866816, 'steps': 56597, 'loss/train': 1.1358370780944824} -11/07/2021 05:10:40 - INFO - __main__ - Step 56599: {'lr': 0.00035007537090891766, 'samples': 10867008, 'steps': 56598, 'loss/train': 1.6242140531539917} -11/07/2021 05:10:40 - INFO - __main__ - Step 56600: {'lr': 0.0003500705078734042, 'samples': 10867200, 'steps': 56599, 'loss/train': 1.2923790216445923} -11/07/2021 05:10:41 - INFO - __main__ - Step 56601: {'lr': 0.0003500656447928005, 'samples': 10867392, 'steps': 56600, 'loss/train': 1.4352679252624512} -11/07/2021 05:10:41 - INFO - __main__ - Step 56602: {'lr': 0.00035006078166710877, 'samples': 10867584, 'steps': 56601, 'loss/train': 1.1847213506698608} -11/07/2021 05:10:41 - INFO - __main__ - Step 56603: {'lr': 0.00035005591849633123, 'samples': 10867776, 'steps': 56602, 'loss/train': 1.1905523538589478} -11/07/2021 05:10:42 - INFO - __main__ - Step 56604: {'lr': 0.00035005105528047, 'samples': 10867968, 'steps': 56603, 'loss/train': 1.476470708847046} -11/07/2021 05:10:43 - INFO - __main__ - Step 56605: {'lr': 0.00035004619201952736, 'samples': 10868160, 'steps': 56604, 'loss/train': 1.518057942390442} -11/07/2021 05:10:43 - INFO - __main__ - Step 56606: {'lr': 0.00035004132871350535, 'samples': 10868352, 'steps': 56605, 'loss/train': 1.1097615957260132} -11/07/2021 05:10:44 - INFO - __main__ - Step 56607: {'lr': 0.0003500364653624063, 'samples': 10868544, 'steps': 56606, 'loss/train': 2.138749122619629} -11/07/2021 05:10:44 - INFO - __main__ - Step 56608: {'lr': 0.0003500316019662324, 'samples': 10868736, 'steps': 56607, 'loss/train': 1.003953456878662} -11/07/2021 05:10:45 - INFO - __main__ - Step 56609: {'lr': 0.00035002673852498577, 'samples': 10868928, 'steps': 56608, 'loss/train': 1.2726805210113525} -11/07/2021 05:10:45 - INFO - __main__ - Step 56610: {'lr': 0.0003500218750386687, 'samples': 10869120, 'steps': 56609, 'loss/train': 1.379153847694397} -11/07/2021 05:10:46 - INFO - __main__ - Step 56611: {'lr': 0.0003500170115072833, 'samples': 10869312, 'steps': 56610, 'loss/train': 1.613093376159668} -11/07/2021 05:10:46 - INFO - __main__ - Step 56612: {'lr': 0.00035001214793083167, 'samples': 10869504, 'steps': 56611, 'loss/train': 0.7998729348182678} -11/07/2021 05:10:46 - INFO - __main__ - Step 56613: {'lr': 0.00035000728430931616, 'samples': 10869696, 'steps': 56612, 'loss/train': 1.0273258686065674} -11/07/2021 05:10:48 - INFO - __main__ - Step 56614: {'lr': 0.000350002420642739, 'samples': 10869888, 'steps': 56613, 'loss/train': 1.4873912334442139} -11/07/2021 05:10:48 - INFO - __main__ - Step 56615: {'lr': 0.0003499975569311022, 'samples': 10870080, 'steps': 56614, 'loss/train': 1.6536808013916016} -11/07/2021 05:10:48 - INFO - __main__ - Step 56616: {'lr': 0.00034999269317440804, 'samples': 10870272, 'steps': 56615, 'loss/train': 1.554644227027893} -11/07/2021 05:10:49 - INFO - __main__ - Step 56617: {'lr': 0.0003499878293726588, 'samples': 10870464, 'steps': 56616, 'loss/train': 1.8007792234420776} -11/07/2021 05:10:49 - INFO - __main__ - Step 56618: {'lr': 0.0003499829655258565, 'samples': 10870656, 'steps': 56617, 'loss/train': 1.3087400197982788} -11/07/2021 05:10:50 - INFO - __main__ - Step 56619: {'lr': 0.00034997810163400343, 'samples': 10870848, 'steps': 56618, 'loss/train': 1.185659646987915} -11/07/2021 05:10:51 - INFO - __main__ - Step 56620: {'lr': 0.0003499732376971018, 'samples': 10871040, 'steps': 56619, 'loss/train': 1.4963005781173706} -11/07/2021 05:10:51 - INFO - __main__ - Step 56621: {'lr': 0.0003499683737151538, 'samples': 10871232, 'steps': 56620, 'loss/train': 1.4350378513336182} -11/07/2021 05:10:51 - INFO - __main__ - Step 56622: {'lr': 0.0003499635096881615, 'samples': 10871424, 'steps': 56621, 'loss/train': 1.1455438137054443} -11/07/2021 05:10:52 - INFO - __main__ - Step 56623: {'lr': 0.0003499586456161273, 'samples': 10871616, 'steps': 56622, 'loss/train': 0.8691271543502808} -11/07/2021 05:10:52 - INFO - __main__ - Step 56624: {'lr': 0.0003499537814990532, 'samples': 10871808, 'steps': 56623, 'loss/train': 1.3309210538864136} -11/07/2021 05:10:53 - INFO - __main__ - Step 56625: {'lr': 0.0003499489173369415, 'samples': 10872000, 'steps': 56624, 'loss/train': 1.5248233079910278} -11/07/2021 05:10:53 - INFO - __main__ - Step 56626: {'lr': 0.00034994405312979433, 'samples': 10872192, 'steps': 56625, 'loss/train': 1.2739338874816895} -11/07/2021 05:10:54 - INFO - __main__ - Step 56627: {'lr': 0.00034993918887761386, 'samples': 10872384, 'steps': 56626, 'loss/train': 1.1588736772537231} -11/07/2021 05:10:54 - INFO - __main__ - Step 56628: {'lr': 0.0003499343245804025, 'samples': 10872576, 'steps': 56627, 'loss/train': 1.2341482639312744} -11/07/2021 05:10:54 - INFO - __main__ - Step 56629: {'lr': 0.00034992946023816216, 'samples': 10872768, 'steps': 56628, 'loss/train': 2.0720772743225098} -11/07/2021 05:10:55 - INFO - __main__ - Step 56630: {'lr': 0.00034992459585089515, 'samples': 10872960, 'steps': 56629, 'loss/train': 0.9724142551422119} -11/07/2021 05:10:56 - INFO - __main__ - Step 56631: {'lr': 0.00034991973141860366, 'samples': 10873152, 'steps': 56630, 'loss/train': 1.3173853158950806} -11/07/2021 05:10:56 - INFO - __main__ - Step 56632: {'lr': 0.00034991486694128986, 'samples': 10873344, 'steps': 56631, 'loss/train': 1.7120763063430786} -11/07/2021 05:10:57 - INFO - __main__ - Step 56633: {'lr': 0.000349910002418956, 'samples': 10873536, 'steps': 56632, 'loss/train': 1.405206322669983} -11/07/2021 05:10:57 - INFO - __main__ - Step 56634: {'lr': 0.0003499051378516043, 'samples': 10873728, 'steps': 56633, 'loss/train': 1.1220430135726929} -11/07/2021 05:10:57 - INFO - __main__ - Step 56635: {'lr': 0.0003499002732392368, 'samples': 10873920, 'steps': 56634, 'loss/train': 1.4978506565093994} -11/07/2021 05:10:58 - INFO - __main__ - Step 56636: {'lr': 0.0003498954085818558, 'samples': 10874112, 'steps': 56635, 'loss/train': 1.1060702800750732} -11/07/2021 05:10:59 - INFO - __main__ - Step 56637: {'lr': 0.00034989054387946344, 'samples': 10874304, 'steps': 56636, 'loss/train': 1.8852922916412354} -11/07/2021 05:10:59 - INFO - __main__ - Step 56638: {'lr': 0.000349885679132062, 'samples': 10874496, 'steps': 56637, 'loss/train': 1.8907239437103271} -11/07/2021 05:10:59 - INFO - __main__ - Step 56639: {'lr': 0.00034988081433965355, 'samples': 10874688, 'steps': 56638, 'loss/train': 1.0390472412109375} -11/07/2021 05:11:00 - INFO - __main__ - Step 56640: {'lr': 0.00034987594950224043, 'samples': 10874880, 'steps': 56639, 'loss/train': 0.5694819688796997} -11/07/2021 05:11:01 - INFO - __main__ - Step 56641: {'lr': 0.0003498710846198247, 'samples': 10875072, 'steps': 56640, 'loss/train': 1.0915600061416626} -11/07/2021 05:11:01 - INFO - __main__ - Step 56642: {'lr': 0.0003498662196924086, 'samples': 10875264, 'steps': 56641, 'loss/train': 0.9697006940841675} -11/07/2021 05:11:01 - INFO - __main__ - Step 56643: {'lr': 0.00034986135471999424, 'samples': 10875456, 'steps': 56642, 'loss/train': 1.376035451889038} -11/07/2021 05:11:02 - INFO - __main__ - Step 56644: {'lr': 0.00034985648970258404, 'samples': 10875648, 'steps': 56643, 'loss/train': 1.46683669090271} -11/07/2021 05:11:02 - INFO - __main__ - Step 56645: {'lr': 0.00034985162464018, 'samples': 10875840, 'steps': 56644, 'loss/train': 1.4045829772949219} -11/07/2021 05:11:03 - INFO - __main__ - Step 56646: {'lr': 0.00034984675953278433, 'samples': 10876032, 'steps': 56645, 'loss/train': 1.4965193271636963} -11/07/2021 05:11:03 - INFO - __main__ - Step 56647: {'lr': 0.00034984189438039926, 'samples': 10876224, 'steps': 56646, 'loss/train': 1.2718865871429443} -11/07/2021 05:11:04 - INFO - __main__ - Step 56648: {'lr': 0.00034983702918302696, 'samples': 10876416, 'steps': 56647, 'loss/train': 1.1979362964630127} -11/07/2021 05:11:04 - INFO - __main__ - Step 56649: {'lr': 0.00034983216394066964, 'samples': 10876608, 'steps': 56648, 'loss/train': 1.4846811294555664} -11/07/2021 05:11:05 - INFO - __main__ - Step 56650: {'lr': 0.00034982729865332953, 'samples': 10876800, 'steps': 56649, 'loss/train': 1.5367149114608765} -11/07/2021 05:11:06 - INFO - __main__ - Step 56651: {'lr': 0.0003498224333210087, 'samples': 10876992, 'steps': 56650, 'loss/train': 1.163350224494934} -11/07/2021 05:11:06 - INFO - __main__ - Step 56652: {'lr': 0.0003498175679437095, 'samples': 10877184, 'steps': 56651, 'loss/train': 1.3177233934402466} -11/07/2021 05:11:06 - INFO - __main__ - Step 56653: {'lr': 0.00034981270252143406, 'samples': 10877376, 'steps': 56652, 'loss/train': 1.9447318315505981} -11/07/2021 05:11:07 - INFO - __main__ - Step 56654: {'lr': 0.0003498078370541845, 'samples': 10877568, 'steps': 56653, 'loss/train': 1.667618751525879} -11/07/2021 05:11:07 - INFO - __main__ - Step 56655: {'lr': 0.00034980297154196306, 'samples': 10877760, 'steps': 56654, 'loss/train': 1.3392319679260254} -11/07/2021 05:11:07 - INFO - __main__ - Step 56656: {'lr': 0.0003497981059847719, 'samples': 10877952, 'steps': 56655, 'loss/train': 1.136358380317688} -11/07/2021 05:11:08 - INFO - __main__ - Step 56657: {'lr': 0.00034979324038261327, 'samples': 10878144, 'steps': 56656, 'loss/train': 1.5484172105789185} -11/07/2021 05:11:09 - INFO - __main__ - Step 56658: {'lr': 0.00034978837473548946, 'samples': 10878336, 'steps': 56657, 'loss/train': 0.7881152629852295} -11/07/2021 05:11:09 - INFO - __main__ - Step 56659: {'lr': 0.0003497835090434025, 'samples': 10878528, 'steps': 56658, 'loss/train': 2.1221213340759277} -11/07/2021 05:11:09 - INFO - __main__ - Step 56660: {'lr': 0.00034977864330635455, 'samples': 10878720, 'steps': 56659, 'loss/train': 1.5315827131271362} -11/07/2021 05:11:10 - INFO - __main__ - Step 56661: {'lr': 0.00034977377752434797, 'samples': 10878912, 'steps': 56660, 'loss/train': 0.46029800176620483} -11/07/2021 05:11:11 - INFO - __main__ - Step 56662: {'lr': 0.0003497689116973848, 'samples': 10879104, 'steps': 56661, 'loss/train': 1.756382703781128} -11/07/2021 05:11:11 - INFO - __main__ - Step 56663: {'lr': 0.00034976404582546736, 'samples': 10879296, 'steps': 56662, 'loss/train': 1.5322246551513672} -11/07/2021 05:11:11 - INFO - __main__ - Step 56664: {'lr': 0.00034975917990859773, 'samples': 10879488, 'steps': 56663, 'loss/train': 1.0125632286071777} -11/07/2021 05:11:12 - INFO - __main__ - Step 56665: {'lr': 0.00034975431394677827, 'samples': 10879680, 'steps': 56664, 'loss/train': 1.1704699993133545} -11/07/2021 05:11:12 - INFO - __main__ - Step 56666: {'lr': 0.0003497494479400109, 'samples': 10879872, 'steps': 56665, 'loss/train': 1.2864733934402466} -11/07/2021 05:11:13 - INFO - __main__ - Step 56667: {'lr': 0.00034974458188829805, 'samples': 10880064, 'steps': 56666, 'loss/train': 1.3400623798370361} -11/07/2021 05:11:13 - INFO - __main__ - Step 56668: {'lr': 0.0003497397157916418, 'samples': 10880256, 'steps': 56667, 'loss/train': 1.3853057622909546} -11/07/2021 05:11:14 - INFO - __main__ - Step 56669: {'lr': 0.00034973484965004437, 'samples': 10880448, 'steps': 56668, 'loss/train': 1.6519192457199097} -11/07/2021 05:11:14 - INFO - __main__ - Step 56670: {'lr': 0.0003497299834635079, 'samples': 10880640, 'steps': 56669, 'loss/train': 1.7198807001113892} -11/07/2021 05:11:14 - INFO - __main__ - Step 56671: {'lr': 0.0003497251172320348, 'samples': 10880832, 'steps': 56670, 'loss/train': 1.3893827199935913} -11/07/2021 05:11:16 - INFO - __main__ - Step 56672: {'lr': 0.00034972025095562697, 'samples': 10881024, 'steps': 56671, 'loss/train': 1.578684687614441} -11/07/2021 05:11:16 - INFO - __main__ - Step 56673: {'lr': 0.00034971538463428683, 'samples': 10881216, 'steps': 56672, 'loss/train': 0.8849255442619324} -11/07/2021 05:11:16 - INFO - __main__ - Step 56674: {'lr': 0.0003497105182680164, 'samples': 10881408, 'steps': 56673, 'loss/train': 0.7655577659606934} -11/07/2021 05:11:17 - INFO - __main__ - Step 56675: {'lr': 0.00034970565185681794, 'samples': 10881600, 'steps': 56674, 'loss/train': 1.4446046352386475} -11/07/2021 05:11:17 - INFO - __main__ - Step 56676: {'lr': 0.0003497007854006937, 'samples': 10881792, 'steps': 56675, 'loss/train': 1.8495018482208252} -11/07/2021 05:11:18 - INFO - __main__ - Step 56677: {'lr': 0.0003496959188996458, 'samples': 10881984, 'steps': 56676, 'loss/train': 1.4334365129470825} -11/07/2021 05:11:18 - INFO - __main__ - Step 56678: {'lr': 0.00034969105235367647, 'samples': 10882176, 'steps': 56677, 'loss/train': 1.2246066331863403} -11/07/2021 05:11:19 - INFO - __main__ - Step 56679: {'lr': 0.0003496861857627879, 'samples': 10882368, 'steps': 56678, 'loss/train': 0.0722784623503685} -11/07/2021 05:11:19 - INFO - __main__ - Step 56680: {'lr': 0.0003496813191269822, 'samples': 10882560, 'steps': 56679, 'loss/train': 4.06576681137085} -11/07/2021 05:11:19 - INFO - __main__ - Step 56681: {'lr': 0.0003496764524462617, 'samples': 10882752, 'steps': 56680, 'loss/train': 1.331288456916809} -11/07/2021 05:11:20 - INFO - __main__ - Step 56682: {'lr': 0.00034967158572062854, 'samples': 10882944, 'steps': 56681, 'loss/train': 1.4976335763931274} -11/07/2021 05:11:21 - INFO - __main__ - Step 56683: {'lr': 0.00034966671895008485, 'samples': 10883136, 'steps': 56682, 'loss/train': 1.457160234451294} -11/07/2021 05:11:21 - INFO - __main__ - Step 56684: {'lr': 0.0003496618521346329, 'samples': 10883328, 'steps': 56683, 'loss/train': 1.4467800855636597} -11/07/2021 05:11:22 - INFO - __main__ - Step 56685: {'lr': 0.00034965698527427493, 'samples': 10883520, 'steps': 56684, 'loss/train': 1.098656415939331} -11/07/2021 05:11:22 - INFO - __main__ - Step 56686: {'lr': 0.00034965211836901293, 'samples': 10883712, 'steps': 56685, 'loss/train': 0.9556757807731628} -11/07/2021 05:11:23 - INFO - __main__ - Step 56687: {'lr': 0.00034964725141884936, 'samples': 10883904, 'steps': 56686, 'loss/train': 1.6815333366394043} -11/07/2021 05:11:23 - INFO - __main__ - Step 56688: {'lr': 0.00034964238442378615, 'samples': 10884096, 'steps': 56687, 'loss/train': 1.2224161624908447} -11/07/2021 05:11:24 - INFO - __main__ - Step 56689: {'lr': 0.00034963751738382564, 'samples': 10884288, 'steps': 56688, 'loss/train': 1.469492793083191} -11/07/2021 05:11:24 - INFO - __main__ - Step 56690: {'lr': 0.00034963265029897006, 'samples': 10884480, 'steps': 56689, 'loss/train': 0.7678528428077698} -11/07/2021 05:11:24 - INFO - __main__ - Step 56691: {'lr': 0.00034962778316922156, 'samples': 10884672, 'steps': 56690, 'loss/train': 1.1522170305252075} -11/07/2021 05:11:25 - INFO - __main__ - Step 56692: {'lr': 0.0003496229159945823, 'samples': 10884864, 'steps': 56691, 'loss/train': 0.4534689486026764} -11/07/2021 05:11:26 - INFO - __main__ - Step 56693: {'lr': 0.0003496180487750544, 'samples': 10885056, 'steps': 56692, 'loss/train': 1.801413655281067} -11/07/2021 05:11:26 - INFO - __main__ - Step 56694: {'lr': 0.00034961318151064026, 'samples': 10885248, 'steps': 56693, 'loss/train': 1.435295820236206} -11/07/2021 05:11:26 - INFO - __main__ - Step 56695: {'lr': 0.00034960831420134187, 'samples': 10885440, 'steps': 56694, 'loss/train': 1.5555894374847412} -11/07/2021 05:11:27 - INFO - __main__ - Step 56696: {'lr': 0.0003496034468471616, 'samples': 10885632, 'steps': 56695, 'loss/train': 1.4497580528259277} -11/07/2021 05:11:28 - INFO - __main__ - Step 56697: {'lr': 0.00034959857944810144, 'samples': 10885824, 'steps': 56696, 'loss/train': 1.1744581460952759} -11/07/2021 05:11:28 - INFO - __main__ - Step 56698: {'lr': 0.0003495937120041638, 'samples': 10886016, 'steps': 56697, 'loss/train': 1.328554630279541} -11/07/2021 05:11:29 - INFO - __main__ - Step 56699: {'lr': 0.00034958884451535073, 'samples': 10886208, 'steps': 56698, 'loss/train': 0.9245701432228088} -11/07/2021 05:11:29 - INFO - __main__ - Step 56700: {'lr': 0.00034958397698166445, 'samples': 10886400, 'steps': 56699, 'loss/train': 1.1948953866958618} -11/07/2021 05:11:29 - INFO - __main__ - Step 56701: {'lr': 0.00034957910940310716, 'samples': 10886592, 'steps': 56700, 'loss/train': 1.4919748306274414} -11/07/2021 05:11:30 - INFO - __main__ - Step 56702: {'lr': 0.00034957424177968114, 'samples': 10886784, 'steps': 56701, 'loss/train': 1.282505750656128} -11/07/2021 05:11:31 - INFO - __main__ - Step 56703: {'lr': 0.0003495693741113884, 'samples': 10886976, 'steps': 56702, 'loss/train': 1.3276407718658447} -11/07/2021 05:11:31 - INFO - __main__ - Step 56704: {'lr': 0.00034956450639823125, 'samples': 10887168, 'steps': 56703, 'loss/train': 1.5844906568527222} -11/07/2021 05:11:31 - INFO - __main__ - Step 56705: {'lr': 0.00034955963864021194, 'samples': 10887360, 'steps': 56704, 'loss/train': 1.1592485904693604} -11/07/2021 05:11:32 - INFO - __main__ - Step 56706: {'lr': 0.00034955477083733257, 'samples': 10887552, 'steps': 56705, 'loss/train': 1.3726892471313477} -11/07/2021 05:11:33 - INFO - __main__ - Step 56707: {'lr': 0.0003495499029895953, 'samples': 10887744, 'steps': 56706, 'loss/train': 0.03601754084229469} -11/07/2021 05:11:33 - INFO - __main__ - Step 56708: {'lr': 0.00034954503509700244, 'samples': 10887936, 'steps': 56707, 'loss/train': 1.2998552322387695} -11/07/2021 05:11:33 - INFO - __main__ - Step 56709: {'lr': 0.0003495401671595561, 'samples': 10888128, 'steps': 56708, 'loss/train': 0.6695010662078857} -11/07/2021 05:11:34 - INFO - __main__ - Step 56710: {'lr': 0.0003495352991772585, 'samples': 10888320, 'steps': 56709, 'loss/train': 1.436187744140625} -11/07/2021 05:11:34 - INFO - __main__ - Step 56711: {'lr': 0.0003495304311501118, 'samples': 10888512, 'steps': 56710, 'loss/train': 0.6216771006584167} -11/07/2021 05:11:34 - INFO - __main__ - Step 56712: {'lr': 0.0003495255630781183, 'samples': 10888704, 'steps': 56711, 'loss/train': 1.65614914894104} -11/07/2021 05:11:36 - INFO - __main__ - Step 56713: {'lr': 0.00034952069496128007, 'samples': 10888896, 'steps': 56712, 'loss/train': 1.5235693454742432} -11/07/2021 05:11:36 - INFO - __main__ - Step 56714: {'lr': 0.0003495158267995994, 'samples': 10889088, 'steps': 56713, 'loss/train': 1.5222333669662476} -11/07/2021 05:11:36 - INFO - __main__ - Step 56715: {'lr': 0.0003495109585930784, 'samples': 10889280, 'steps': 56714, 'loss/train': 1.6087963581085205} -11/07/2021 05:11:37 - INFO - __main__ - Step 56716: {'lr': 0.0003495060903417192, 'samples': 10889472, 'steps': 56715, 'loss/train': 1.353843331336975} -11/07/2021 05:11:37 - INFO - __main__ - Step 56717: {'lr': 0.00034950122204552417, 'samples': 10889664, 'steps': 56716, 'loss/train': 1.246916651725769} -11/07/2021 05:11:38 - INFO - __main__ - Step 56718: {'lr': 0.00034949635370449546, 'samples': 10889856, 'steps': 56717, 'loss/train': 1.7605196237564087} -11/07/2021 05:11:38 - INFO - __main__ - Step 56719: {'lr': 0.00034949148531863517, 'samples': 10890048, 'steps': 56718, 'loss/train': 1.7312897443771362} -11/07/2021 05:11:39 - INFO - __main__ - Step 56720: {'lr': 0.0003494866168879456, 'samples': 10890240, 'steps': 56719, 'loss/train': 0.5320704579353333} -11/07/2021 05:11:39 - INFO - __main__ - Step 56721: {'lr': 0.0003494817484124289, 'samples': 10890432, 'steps': 56720, 'loss/train': 1.625646710395813} -11/07/2021 05:11:39 - INFO - __main__ - Step 56722: {'lr': 0.0003494768798920872, 'samples': 10890624, 'steps': 56721, 'loss/train': 1.09530508518219} -11/07/2021 05:11:40 - INFO - __main__ - Step 56723: {'lr': 0.0003494720113269227, 'samples': 10890816, 'steps': 56722, 'loss/train': 1.383299469947815} -11/07/2021 05:11:41 - INFO - __main__ - Step 56724: {'lr': 0.00034946714271693783, 'samples': 10891008, 'steps': 56723, 'loss/train': 1.5900954008102417} -11/07/2021 05:11:41 - INFO - __main__ - Step 56725: {'lr': 0.0003494622740621345, 'samples': 10891200, 'steps': 56724, 'loss/train': 1.601185917854309} -11/07/2021 05:11:41 - INFO - __main__ - Step 56726: {'lr': 0.00034945740536251505, 'samples': 10891392, 'steps': 56725, 'loss/train': 1.5290385484695435} -11/07/2021 05:11:42 - INFO - __main__ - Step 56727: {'lr': 0.0003494525366180815, 'samples': 10891584, 'steps': 56726, 'loss/train': 1.253729224205017} -11/07/2021 05:11:43 - INFO - __main__ - Step 56728: {'lr': 0.0003494476678288363, 'samples': 10891776, 'steps': 56727, 'loss/train': 0.7405962347984314} -11/07/2021 05:11:43 - INFO - __main__ - Step 56729: {'lr': 0.00034944279899478146, 'samples': 10891968, 'steps': 56728, 'loss/train': 1.7755745649337769} -11/07/2021 05:11:44 - INFO - __main__ - Step 56730: {'lr': 0.00034943793011591926, 'samples': 10892160, 'steps': 56729, 'loss/train': 1.3615187406539917} -11/07/2021 05:11:44 - INFO - __main__ - Step 56731: {'lr': 0.0003494330611922518, 'samples': 10892352, 'steps': 56730, 'loss/train': 1.5941202640533447} -11/07/2021 05:11:44 - INFO - __main__ - Step 56732: {'lr': 0.0003494281922237814, 'samples': 10892544, 'steps': 56731, 'loss/train': 1.1688631772994995} -11/07/2021 05:11:45 - INFO - __main__ - Step 56733: {'lr': 0.0003494233232105102, 'samples': 10892736, 'steps': 56732, 'loss/train': 1.40535569190979} -11/07/2021 05:11:46 - INFO - __main__ - Step 56734: {'lr': 0.0003494184541524403, 'samples': 10892928, 'steps': 56733, 'loss/train': 1.4211196899414062} -11/07/2021 05:11:46 - INFO - __main__ - Step 56735: {'lr': 0.0003494135850495741, 'samples': 10893120, 'steps': 56734, 'loss/train': 1.3987970352172852} -11/07/2021 05:11:46 - INFO - __main__ - Step 56736: {'lr': 0.0003494087159019136, 'samples': 10893312, 'steps': 56735, 'loss/train': 1.4669206142425537} -11/07/2021 05:11:47 - INFO - __main__ - Step 56737: {'lr': 0.0003494038467094611, 'samples': 10893504, 'steps': 56736, 'loss/train': 1.8312269449234009} -11/07/2021 05:11:48 - INFO - __main__ - Step 56738: {'lr': 0.00034939897747221873, 'samples': 10893696, 'steps': 56737, 'loss/train': 1.2512260675430298} -11/07/2021 05:11:48 - INFO - __main__ - Step 56739: {'lr': 0.00034939410819018874, 'samples': 10893888, 'steps': 56738, 'loss/train': 1.0880860090255737} -11/07/2021 05:11:48 - INFO - __main__ - Step 56740: {'lr': 0.0003493892388633733, 'samples': 10894080, 'steps': 56739, 'loss/train': 1.3743757009506226} -11/07/2021 05:11:49 - INFO - __main__ - Step 56741: {'lr': 0.0003493843694917745, 'samples': 10894272, 'steps': 56740, 'loss/train': 1.1670089960098267} -11/07/2021 05:11:49 - INFO - __main__ - Step 56742: {'lr': 0.00034937950007539475, 'samples': 10894464, 'steps': 56741, 'loss/train': 1.5157989263534546} -11/07/2021 05:11:50 - INFO - __main__ - Step 56743: {'lr': 0.0003493746306142361, 'samples': 10894656, 'steps': 56742, 'loss/train': 1.471632957458496} -11/07/2021 05:11:51 - INFO - __main__ - Step 56744: {'lr': 0.00034936976110830077, 'samples': 10894848, 'steps': 56743, 'loss/train': 1.2681918144226074} -11/07/2021 05:11:51 - INFO - __main__ - Step 56745: {'lr': 0.000349364891557591, 'samples': 10895040, 'steps': 56744, 'loss/train': 1.4375859498977661} -11/07/2021 05:11:51 - INFO - __main__ - Step 56746: {'lr': 0.00034936002196210895, 'samples': 10895232, 'steps': 56745, 'loss/train': 1.1087936162948608} -11/07/2021 05:11:52 - INFO - __main__ - Step 56747: {'lr': 0.0003493551523218567, 'samples': 10895424, 'steps': 56746, 'loss/train': 1.2363958358764648} -11/07/2021 05:11:52 - INFO - __main__ - Step 56748: {'lr': 0.0003493502826368366, 'samples': 10895616, 'steps': 56747, 'loss/train': 1.2666784524917603} -11/07/2021 05:11:53 - INFO - __main__ - Step 56749: {'lr': 0.0003493454129070508, 'samples': 10895808, 'steps': 56748, 'loss/train': 1.105308175086975} -11/07/2021 05:11:54 - INFO - __main__ - Step 56750: {'lr': 0.0003493405431325015, 'samples': 10896000, 'steps': 56749, 'loss/train': 0.38008758425712585} -11/07/2021 05:11:54 - INFO - __main__ - Step 56751: {'lr': 0.0003493356733131909, 'samples': 10896192, 'steps': 56750, 'loss/train': 1.7625583410263062} -11/07/2021 05:11:54 - INFO - __main__ - Step 56752: {'lr': 0.0003493308034491212, 'samples': 10896384, 'steps': 56751, 'loss/train': 0.9974585771560669} -11/07/2021 05:11:55 - INFO - __main__ - Step 56753: {'lr': 0.00034932593354029454, 'samples': 10896576, 'steps': 56752, 'loss/train': 1.030988335609436} -11/07/2021 05:11:56 - INFO - __main__ - Step 56754: {'lr': 0.00034932106358671314, 'samples': 10896768, 'steps': 56753, 'loss/train': 1.3519301414489746} -11/07/2021 05:11:56 - INFO - __main__ - Step 56755: {'lr': 0.0003493161935883792, 'samples': 10896960, 'steps': 56754, 'loss/train': 1.558119773864746} -11/07/2021 05:11:57 - INFO - __main__ - Step 56756: {'lr': 0.0003493113235452949, 'samples': 10897152, 'steps': 56755, 'loss/train': 1.1805732250213623} -11/07/2021 05:11:57 - INFO - __main__ - Step 56757: {'lr': 0.00034930645345746246, 'samples': 10897344, 'steps': 56756, 'loss/train': 0.9049232602119446} -11/07/2021 05:11:57 - INFO - __main__ - Step 56758: {'lr': 0.0003493015833248841, 'samples': 10897536, 'steps': 56757, 'loss/train': 1.5116055011749268} -11/07/2021 05:11:58 - INFO - __main__ - Step 56759: {'lr': 0.00034929671314756197, 'samples': 10897728, 'steps': 56758, 'loss/train': 1.3431657552719116} -11/07/2021 05:11:59 - INFO - __main__ - Step 56760: {'lr': 0.0003492918429254983, 'samples': 10897920, 'steps': 56759, 'loss/train': 1.3007172346115112} -11/07/2021 05:11:59 - INFO - __main__ - Step 56761: {'lr': 0.00034928697265869515, 'samples': 10898112, 'steps': 56760, 'loss/train': 1.5657540559768677} -11/07/2021 05:11:59 - INFO - __main__ - Step 56762: {'lr': 0.00034928210234715497, 'samples': 10898304, 'steps': 56761, 'loss/train': 1.4907721281051636} -11/07/2021 05:12:00 - INFO - __main__ - Step 56763: {'lr': 0.0003492772319908797, 'samples': 10898496, 'steps': 56762, 'loss/train': 1.4233965873718262} -11/07/2021 05:12:01 - INFO - __main__ - Step 56764: {'lr': 0.0003492723615898716, 'samples': 10898688, 'steps': 56763, 'loss/train': 0.4662286937236786} -11/07/2021 05:12:01 - INFO - __main__ - Step 56765: {'lr': 0.000349267491144133, 'samples': 10898880, 'steps': 56764, 'loss/train': 1.4547139406204224} -11/07/2021 05:12:01 - INFO - __main__ - Step 56766: {'lr': 0.00034926262065366597, 'samples': 10899072, 'steps': 56765, 'loss/train': 1.2869064807891846} -11/07/2021 05:12:02 - INFO - __main__ - Step 56767: {'lr': 0.0003492577501184727, 'samples': 10899264, 'steps': 56766, 'loss/train': 1.4037586450576782} -11/07/2021 05:12:02 - INFO - __main__ - Step 56768: {'lr': 0.0003492528795385556, 'samples': 10899456, 'steps': 56767, 'loss/train': 1.3813951015472412} -11/07/2021 05:12:03 - INFO - __main__ - Step 56769: {'lr': 0.00034924800891391645, 'samples': 10899648, 'steps': 56768, 'loss/train': 0.9622254371643066} -11/07/2021 05:12:03 - INFO - __main__ - Step 56770: {'lr': 0.0003492431382445578, 'samples': 10899840, 'steps': 56769, 'loss/train': 1.509605884552002} -11/07/2021 05:12:04 - INFO - __main__ - Step 56771: {'lr': 0.00034923826753048163, 'samples': 10900032, 'steps': 56770, 'loss/train': 1.247928500175476} -11/07/2021 05:12:04 - INFO - __main__ - Step 56772: {'lr': 0.00034923339677169033, 'samples': 10900224, 'steps': 56771, 'loss/train': 1.6541073322296143} -11/07/2021 05:12:05 - INFO - __main__ - Step 56773: {'lr': 0.000349228525968186, 'samples': 10900416, 'steps': 56772, 'loss/train': 1.0791624784469604} -11/07/2021 05:12:06 - INFO - __main__ - Step 56774: {'lr': 0.0003492236551199707, 'samples': 10900608, 'steps': 56773, 'loss/train': 1.03981351852417} -11/07/2021 05:12:06 - INFO - __main__ - Step 56775: {'lr': 0.0003492187842270469, 'samples': 10900800, 'steps': 56774, 'loss/train': 1.2804206609725952} -11/07/2021 05:12:06 - INFO - __main__ - Step 56776: {'lr': 0.00034921391328941655, 'samples': 10900992, 'steps': 56775, 'loss/train': 1.37317955493927} -11/07/2021 05:12:07 - INFO - __main__ - Step 56777: {'lr': 0.00034920904230708195, 'samples': 10901184, 'steps': 56776, 'loss/train': 1.294616937637329} -11/07/2021 05:12:07 - INFO - __main__ - Step 56778: {'lr': 0.0003492041712800453, 'samples': 10901376, 'steps': 56777, 'loss/train': 1.3605133295059204} -11/07/2021 05:12:08 - INFO - __main__ - Step 56779: {'lr': 0.0003491993002083088, 'samples': 10901568, 'steps': 56778, 'loss/train': 1.0155563354492188} -11/07/2021 05:12:09 - INFO - __main__ - Step 56780: {'lr': 0.00034919442909187465, 'samples': 10901760, 'steps': 56779, 'loss/train': 1.3637478351593018} -11/07/2021 05:12:09 - INFO - __main__ - Step 56781: {'lr': 0.000349189557930745, 'samples': 10901952, 'steps': 56780, 'loss/train': 1.6369366645812988} -11/07/2021 05:12:09 - INFO - __main__ - Step 56782: {'lr': 0.000349184686724922, 'samples': 10902144, 'steps': 56781, 'loss/train': 1.3192890882492065} -11/07/2021 05:12:10 - INFO - __main__ - Step 56783: {'lr': 0.00034917981547440797, 'samples': 10902336, 'steps': 56782, 'loss/train': 1.9538573026657104} -11/07/2021 05:12:11 - INFO - __main__ - Step 56784: {'lr': 0.00034917494417920504, 'samples': 10902528, 'steps': 56783, 'loss/train': 1.6415321826934814} -11/07/2021 05:12:11 - INFO - __main__ - Step 56785: {'lr': 0.0003491700728393154, 'samples': 10902720, 'steps': 56784, 'loss/train': 1.7147635221481323} -11/07/2021 05:12:11 - INFO - __main__ - Step 56786: {'lr': 0.0003491652014547413, 'samples': 10902912, 'steps': 56785, 'loss/train': 1.1865392923355103} -11/07/2021 05:12:12 - INFO - __main__ - Step 56787: {'lr': 0.00034916033002548486, 'samples': 10903104, 'steps': 56786, 'loss/train': 1.6632952690124512} -11/07/2021 05:12:12 - INFO - __main__ - Step 56788: {'lr': 0.00034915545855154827, 'samples': 10903296, 'steps': 56787, 'loss/train': 1.759561538696289} -11/07/2021 05:12:13 - INFO - __main__ - Step 56789: {'lr': 0.00034915058703293377, 'samples': 10903488, 'steps': 56788, 'loss/train': 1.39176607131958} -11/07/2021 05:12:13 - INFO - __main__ - Step 56790: {'lr': 0.0003491457154696436, 'samples': 10903680, 'steps': 56789, 'loss/train': 1.5938973426818848} -11/07/2021 05:12:14 - INFO - __main__ - Step 56791: {'lr': 0.0003491408438616798, 'samples': 10903872, 'steps': 56790, 'loss/train': 1.3176683187484741} -11/07/2021 05:12:14 - INFO - __main__ - Step 56792: {'lr': 0.0003491359722090448, 'samples': 10904064, 'steps': 56791, 'loss/train': 1.5389387607574463} -11/07/2021 05:12:14 - INFO - __main__ - Step 56793: {'lr': 0.00034913110051174056, 'samples': 10904256, 'steps': 56792, 'loss/train': 1.2145445346832275} -11/07/2021 05:12:15 - INFO - __main__ - Step 56794: {'lr': 0.0003491262287697694, 'samples': 10904448, 'steps': 56793, 'loss/train': 1.434438705444336} -11/07/2021 05:12:16 - INFO - __main__ - Step 56795: {'lr': 0.0003491213569831335, 'samples': 10904640, 'steps': 56794, 'loss/train': 1.6607800722122192} -11/07/2021 05:12:16 - INFO - __main__ - Step 56796: {'lr': 0.000349116485151835, 'samples': 10904832, 'steps': 56795, 'loss/train': 1.0760871171951294} -11/07/2021 05:12:16 - INFO - __main__ - Step 56797: {'lr': 0.00034911161327587625, 'samples': 10905024, 'steps': 56796, 'loss/train': 1.4420219659805298} -11/07/2021 05:12:17 - INFO - __main__ - Step 56798: {'lr': 0.00034910674135525926, 'samples': 10905216, 'steps': 56797, 'loss/train': 1.4551119804382324} -11/07/2021 05:12:18 - INFO - __main__ - Step 56799: {'lr': 0.0003491018693899863, 'samples': 10905408, 'steps': 56798, 'loss/train': 0.805732786655426} -11/07/2021 05:12:18 - INFO - __main__ - Step 56800: {'lr': 0.00034909699738005964, 'samples': 10905600, 'steps': 56799, 'loss/train': 1.4538215398788452} -11/07/2021 05:12:18 - INFO - __main__ - Step 56801: {'lr': 0.0003490921253254813, 'samples': 10905792, 'steps': 56800, 'loss/train': 1.2486374378204346} -11/07/2021 05:12:19 - INFO - __main__ - Step 56802: {'lr': 0.00034908725322625365, 'samples': 10905984, 'steps': 56801, 'loss/train': 1.6391202211380005} -11/07/2021 05:12:19 - INFO - __main__ - Step 56803: {'lr': 0.0003490823810823788, 'samples': 10906176, 'steps': 56802, 'loss/train': 1.2304691076278687} -11/07/2021 05:12:20 - INFO - __main__ - Step 56804: {'lr': 0.0003490775088938589, 'samples': 10906368, 'steps': 56803, 'loss/train': 1.4793990850448608} -11/07/2021 05:12:21 - INFO - __main__ - Step 56805: {'lr': 0.00034907263666069624, 'samples': 10906560, 'steps': 56804, 'loss/train': 1.2749805450439453} -11/07/2021 05:12:21 - INFO - __main__ - Step 56806: {'lr': 0.000349067764382893, 'samples': 10906752, 'steps': 56805, 'loss/train': 1.2632070779800415} -11/07/2021 05:12:21 - INFO - __main__ - Step 56807: {'lr': 0.0003490628920604513, 'samples': 10906944, 'steps': 56806, 'loss/train': 1.7383389472961426} -11/07/2021 05:12:22 - INFO - __main__ - Step 56808: {'lr': 0.00034905801969337347, 'samples': 10907136, 'steps': 56807, 'loss/train': 1.5192008018493652} -11/07/2021 05:12:23 - INFO - __main__ - Step 56809: {'lr': 0.0003490531472816616, 'samples': 10907328, 'steps': 56808, 'loss/train': 1.4717756509780884} -11/07/2021 05:12:23 - INFO - __main__ - Step 56810: {'lr': 0.00034904827482531785, 'samples': 10907520, 'steps': 56809, 'loss/train': 0.5518280267715454} -11/07/2021 05:12:23 - INFO - __main__ - Step 56811: {'lr': 0.0003490434023243445, 'samples': 10907712, 'steps': 56810, 'loss/train': 1.182074785232544} -11/07/2021 05:12:24 - INFO - __main__ - Step 56812: {'lr': 0.0003490385297787438, 'samples': 10907904, 'steps': 56811, 'loss/train': 1.262606143951416} -11/07/2021 05:12:24 - INFO - __main__ - Step 56813: {'lr': 0.00034903365718851775, 'samples': 10908096, 'steps': 56812, 'loss/train': 0.9040560722351074} -11/07/2021 05:12:25 - INFO - __main__ - Step 56814: {'lr': 0.00034902878455366876, 'samples': 10908288, 'steps': 56813, 'loss/train': 1.0892393589019775} -11/07/2021 05:12:25 - INFO - __main__ - Step 56815: {'lr': 0.0003490239118741989, 'samples': 10908480, 'steps': 56814, 'loss/train': 1.5409772396087646} -11/07/2021 05:12:26 - INFO - __main__ - Step 56816: {'lr': 0.00034901903915011035, 'samples': 10908672, 'steps': 56815, 'loss/train': 1.5004373788833618} -11/07/2021 05:12:26 - INFO - __main__ - Step 56817: {'lr': 0.0003490141663814054, 'samples': 10908864, 'steps': 56816, 'loss/train': 1.1160506010055542} -11/07/2021 05:12:26 - INFO - __main__ - Step 56818: {'lr': 0.00034900929356808613, 'samples': 10909056, 'steps': 56817, 'loss/train': 1.5083330869674683} -11/07/2021 05:12:28 - INFO - __main__ - Step 56819: {'lr': 0.00034900442071015485, 'samples': 10909248, 'steps': 56818, 'loss/train': 1.148646593093872} -11/07/2021 05:12:28 - INFO - __main__ - Step 56820: {'lr': 0.00034899954780761373, 'samples': 10909440, 'steps': 56819, 'loss/train': 1.3670462369918823} -11/07/2021 05:12:28 - INFO - __main__ - Step 56821: {'lr': 0.00034899467486046486, 'samples': 10909632, 'steps': 56820, 'loss/train': 1.1212408542633057} -11/07/2021 05:12:29 - INFO - __main__ - Step 56822: {'lr': 0.0003489898018687106, 'samples': 10909824, 'steps': 56821, 'loss/train': 1.2553880214691162} -11/07/2021 05:12:29 - INFO - __main__ - Step 56823: {'lr': 0.000348984928832353, 'samples': 10910016, 'steps': 56822, 'loss/train': 1.1198461055755615} -11/07/2021 05:12:30 - INFO - __main__ - Step 56824: {'lr': 0.00034898005575139437, 'samples': 10910208, 'steps': 56823, 'loss/train': 1.5854177474975586} -11/07/2021 05:12:30 - INFO - __main__ - Step 56825: {'lr': 0.00034897518262583683, 'samples': 10910400, 'steps': 56824, 'loss/train': 1.3185606002807617} -11/07/2021 05:12:31 - INFO - __main__ - Step 56826: {'lr': 0.00034897030945568264, 'samples': 10910592, 'steps': 56825, 'loss/train': 1.1018697023391724} -11/07/2021 05:12:31 - INFO - __main__ - Step 56827: {'lr': 0.0003489654362409339, 'samples': 10910784, 'steps': 56826, 'loss/train': 0.7537766098976135} -11/07/2021 05:12:31 - INFO - __main__ - Step 56828: {'lr': 0.00034896056298159287, 'samples': 10910976, 'steps': 56827, 'loss/train': 1.3221607208251953} -11/07/2021 05:12:33 - INFO - __main__ - Step 56829: {'lr': 0.0003489556896776618, 'samples': 10911168, 'steps': 56828, 'loss/train': 0.6373487710952759} -11/07/2021 05:12:33 - INFO - __main__ - Step 56830: {'lr': 0.00034895081632914274, 'samples': 10911360, 'steps': 56829, 'loss/train': 1.5407037734985352} -11/07/2021 05:12:33 - INFO - __main__ - Step 56831: {'lr': 0.000348945942936038, 'samples': 10911552, 'steps': 56830, 'loss/train': 1.3099194765090942} -11/07/2021 05:12:34 - INFO - __main__ - Step 56832: {'lr': 0.0003489410694983497, 'samples': 10911744, 'steps': 56831, 'loss/train': 1.4125101566314697} -11/07/2021 05:12:34 - INFO - __main__ - Step 56833: {'lr': 0.00034893619601608015, 'samples': 10911936, 'steps': 56832, 'loss/train': 1.600282073020935} -11/07/2021 05:12:34 - INFO - __main__ - Step 56834: {'lr': 0.0003489313224892314, 'samples': 10912128, 'steps': 56833, 'loss/train': 1.6528139114379883} -11/07/2021 05:12:35 - INFO - __main__ - Step 56835: {'lr': 0.0003489264489178058, 'samples': 10912320, 'steps': 56834, 'loss/train': 1.6586995124816895} -11/07/2021 05:12:36 - INFO - __main__ - Step 56836: {'lr': 0.00034892157530180546, 'samples': 10912512, 'steps': 56835, 'loss/train': 0.987562894821167} -11/07/2021 05:12:36 - INFO - __main__ - Step 56837: {'lr': 0.0003489167016412326, 'samples': 10912704, 'steps': 56836, 'loss/train': 1.5761076211929321} -11/07/2021 05:12:36 - INFO - __main__ - Step 56838: {'lr': 0.00034891182793608935, 'samples': 10912896, 'steps': 56837, 'loss/train': 1.2682623863220215} -11/07/2021 05:12:37 - INFO - __main__ - Step 56839: {'lr': 0.000348906954186378, 'samples': 10913088, 'steps': 56838, 'loss/train': 2.0079851150512695} -11/07/2021 05:12:38 - INFO - __main__ - Step 56840: {'lr': 0.0003489020803921007, 'samples': 10913280, 'steps': 56839, 'loss/train': 1.529241681098938} -11/07/2021 05:12:38 - INFO - __main__ - Step 56841: {'lr': 0.00034889720655325955, 'samples': 10913472, 'steps': 56840, 'loss/train': 1.412021517753601} -11/07/2021 05:12:38 - INFO - __main__ - Step 56842: {'lr': 0.000348892332669857, 'samples': 10913664, 'steps': 56841, 'loss/train': 1.6484094858169556} -11/07/2021 05:12:39 - INFO - __main__ - Step 56843: {'lr': 0.000348887458741895, 'samples': 10913856, 'steps': 56842, 'loss/train': 1.524601936340332} -11/07/2021 05:12:39 - INFO - __main__ - Step 56844: {'lr': 0.0003488825847693758, 'samples': 10914048, 'steps': 56843, 'loss/train': 1.6736701726913452} -11/07/2021 05:12:40 - INFO - __main__ - Step 56845: {'lr': 0.0003488777107523017, 'samples': 10914240, 'steps': 56844, 'loss/train': 1.7258293628692627} -11/07/2021 05:12:40 - INFO - __main__ - Step 56846: {'lr': 0.0003488728366906748, 'samples': 10914432, 'steps': 56845, 'loss/train': 1.5056270360946655} -11/07/2021 05:12:41 - INFO - __main__ - Step 56847: {'lr': 0.0003488679625844974, 'samples': 10914624, 'steps': 56846, 'loss/train': 1.5097498893737793} -11/07/2021 05:12:41 - INFO - __main__ - Step 56848: {'lr': 0.0003488630884337715, 'samples': 10914816, 'steps': 56847, 'loss/train': 1.4018149375915527} -11/07/2021 05:12:42 - INFO - __main__ - Step 56849: {'lr': 0.0003488582142384995, 'samples': 10915008, 'steps': 56848, 'loss/train': 1.080633521080017} -11/07/2021 05:12:43 - INFO - __main__ - Step 56850: {'lr': 0.00034885333999868344, 'samples': 10915200, 'steps': 56849, 'loss/train': 0.059797029942274094} -11/07/2021 05:12:43 - INFO - __main__ - Step 56851: {'lr': 0.0003488484657143257, 'samples': 10915392, 'steps': 56850, 'loss/train': 1.1406599283218384} -11/07/2021 05:12:43 - INFO - __main__ - Step 56852: {'lr': 0.00034884359138542825, 'samples': 10915584, 'steps': 56851, 'loss/train': 1.5817950963974} -11/07/2021 05:12:44 - INFO - __main__ - Step 56853: {'lr': 0.0003488387170119935, 'samples': 10915776, 'steps': 56852, 'loss/train': 1.3233317136764526} -11/07/2021 05:12:44 - INFO - __main__ - Step 56854: {'lr': 0.0003488338425940235, 'samples': 10915968, 'steps': 56853, 'loss/train': 0.7318007349967957} -11/07/2021 05:12:45 - INFO - __main__ - Step 56855: {'lr': 0.00034882896813152056, 'samples': 10916160, 'steps': 56854, 'loss/train': 1.2505193948745728} -11/07/2021 05:12:46 - INFO - __main__ - Step 56856: {'lr': 0.0003488240936244867, 'samples': 10916352, 'steps': 56855, 'loss/train': 2.2404658794403076} -11/07/2021 05:12:46 - INFO - __main__ - Step 56857: {'lr': 0.0003488192190729243, 'samples': 10916544, 'steps': 56856, 'loss/train': 1.4771580696105957} -11/07/2021 05:12:46 - INFO - __main__ - Step 56858: {'lr': 0.0003488143444768355, 'samples': 10916736, 'steps': 56857, 'loss/train': 1.3698559999465942} -11/07/2021 05:12:47 - INFO - __main__ - Step 56859: {'lr': 0.0003488094698362224, 'samples': 10916928, 'steps': 56858, 'loss/train': 1.3732186555862427} -11/07/2021 05:12:48 - INFO - __main__ - Step 56860: {'lr': 0.00034880459515108735, 'samples': 10917120, 'steps': 56859, 'loss/train': 1.0488653182983398} -11/07/2021 05:12:48 - INFO - __main__ - Step 56861: {'lr': 0.0003487997204214325, 'samples': 10917312, 'steps': 56860, 'loss/train': 1.0818208456039429} -11/07/2021 05:12:48 - INFO - __main__ - Step 56862: {'lr': 0.00034879484564725993, 'samples': 10917504, 'steps': 56861, 'loss/train': 1.702939748764038} -11/07/2021 05:12:49 - INFO - __main__ - Step 56863: {'lr': 0.00034878997082857195, 'samples': 10917696, 'steps': 56862, 'loss/train': 1.3372565507888794} -11/07/2021 05:12:49 - INFO - __main__ - Step 56864: {'lr': 0.0003487850959653708, 'samples': 10917888, 'steps': 56863, 'loss/train': 1.1413240432739258} -11/07/2021 05:12:49 - INFO - __main__ - Step 56865: {'lr': 0.0003487802210576585, 'samples': 10918080, 'steps': 56864, 'loss/train': 1.5832221508026123} -11/07/2021 05:12:51 - INFO - __main__ - Step 56866: {'lr': 0.0003487753461054375, 'samples': 10918272, 'steps': 56865, 'loss/train': 1.3116753101348877} -11/07/2021 05:12:51 - INFO - __main__ - Step 56867: {'lr': 0.00034877047110870975, 'samples': 10918464, 'steps': 56866, 'loss/train': 1.2290250062942505} -11/07/2021 05:12:51 - INFO - __main__ - Step 56868: {'lr': 0.0003487655960674776, 'samples': 10918656, 'steps': 56867, 'loss/train': 1.3250553607940674} -11/07/2021 05:12:52 - INFO - __main__ - Step 56869: {'lr': 0.00034876072098174315, 'samples': 10918848, 'steps': 56868, 'loss/train': 1.3140314817428589} -11/07/2021 05:12:52 - INFO - __main__ - Step 56870: {'lr': 0.00034875584585150864, 'samples': 10919040, 'steps': 56869, 'loss/train': 1.451603651046753} -11/07/2021 05:12:53 - INFO - __main__ - Step 56871: {'lr': 0.0003487509706767763, 'samples': 10919232, 'steps': 56870, 'loss/train': 1.445232629776001} -11/07/2021 05:12:53 - INFO - __main__ - Step 56872: {'lr': 0.00034874609545754826, 'samples': 10919424, 'steps': 56871, 'loss/train': 0.06420867890119553} -11/07/2021 05:12:54 - INFO - __main__ - Step 56873: {'lr': 0.00034874122019382684, 'samples': 10919616, 'steps': 56872, 'loss/train': 1.2108557224273682} -11/07/2021 05:12:54 - INFO - __main__ - Step 56874: {'lr': 0.0003487363448856141, 'samples': 10919808, 'steps': 56873, 'loss/train': 1.455207347869873} -11/07/2021 05:12:55 - INFO - __main__ - Step 56875: {'lr': 0.00034873146953291224, 'samples': 10920000, 'steps': 56874, 'loss/train': 1.3070580959320068} -11/07/2021 05:12:55 - INFO - __main__ - Step 56876: {'lr': 0.0003487265941357236, 'samples': 10920192, 'steps': 56875, 'loss/train': 1.1097195148468018} -11/07/2021 05:12:56 - INFO - __main__ - Step 56877: {'lr': 0.00034872171869405015, 'samples': 10920384, 'steps': 56876, 'loss/train': 1.4130849838256836} -11/07/2021 05:12:56 - INFO - __main__ - Step 56878: {'lr': 0.0003487168432078943, 'samples': 10920576, 'steps': 56877, 'loss/train': 1.3187248706817627} -11/07/2021 05:12:57 - INFO - __main__ - Step 56879: {'lr': 0.0003487119676772582, 'samples': 10920768, 'steps': 56878, 'loss/train': 2.050884246826172} -11/07/2021 05:12:57 - INFO - __main__ - Step 56880: {'lr': 0.00034870709210214397, 'samples': 10920960, 'steps': 56879, 'loss/train': 0.8796589374542236} -11/07/2021 05:12:58 - INFO - __main__ - Step 56881: {'lr': 0.00034870221648255383, 'samples': 10921152, 'steps': 56880, 'loss/train': 1.1586881875991821} -11/07/2021 05:12:58 - INFO - __main__ - Step 56882: {'lr': 0.00034869734081849, 'samples': 10921344, 'steps': 56881, 'loss/train': 1.4075803756713867} -11/07/2021 05:12:59 - INFO - __main__ - Step 56883: {'lr': 0.0003486924651099547, 'samples': 10921536, 'steps': 56882, 'loss/train': 0.9032168984413147} -11/07/2021 05:12:59 - INFO - __main__ - Step 56884: {'lr': 0.00034868758935695, 'samples': 10921728, 'steps': 56883, 'loss/train': 1.346758246421814} -11/07/2021 05:12:59 - INFO - __main__ - Step 56885: {'lr': 0.0003486827135594783, 'samples': 10921920, 'steps': 56884, 'loss/train': 1.114176869392395} -11/07/2021 05:13:00 - INFO - __main__ - Step 56886: {'lr': 0.0003486778377175417, 'samples': 10922112, 'steps': 56885, 'loss/train': 1.0794364213943481} -11/07/2021 05:13:01 - INFO - __main__ - Step 56887: {'lr': 0.00034867296183114236, 'samples': 10922304, 'steps': 56886, 'loss/train': 1.1506068706512451} -11/07/2021 05:13:01 - INFO - __main__ - Step 56888: {'lr': 0.0003486680859002825, 'samples': 10922496, 'steps': 56887, 'loss/train': 1.1032979488372803} -11/07/2021 05:13:01 - INFO - __main__ - Step 56889: {'lr': 0.00034866320992496427, 'samples': 10922688, 'steps': 56888, 'loss/train': 1.5184299945831299} -11/07/2021 05:13:02 - INFO - __main__ - Step 56890: {'lr': 0.00034865833390518996, 'samples': 10922880, 'steps': 56889, 'loss/train': 1.0353816747665405} -11/07/2021 05:13:03 - INFO - __main__ - Step 56891: {'lr': 0.0003486534578409618, 'samples': 10923072, 'steps': 56890, 'loss/train': 1.490349292755127} -11/07/2021 05:13:03 - INFO - __main__ - Step 56892: {'lr': 0.0003486485817322819, 'samples': 10923264, 'steps': 56891, 'loss/train': 1.4208921194076538} -11/07/2021 05:13:03 - INFO - __main__ - Step 56893: {'lr': 0.0003486437055791524, 'samples': 10923456, 'steps': 56892, 'loss/train': 1.3553944826126099} -11/07/2021 05:13:04 - INFO - __main__ - Step 56894: {'lr': 0.00034863882938157553, 'samples': 10923648, 'steps': 56893, 'loss/train': 1.4005050659179688} -11/07/2021 05:13:04 - INFO - __main__ - Step 56895: {'lr': 0.0003486339531395536, 'samples': 10923840, 'steps': 56894, 'loss/train': 1.583556056022644} -11/07/2021 05:13:05 - INFO - __main__ - Step 56896: {'lr': 0.0003486290768530887, 'samples': 10924032, 'steps': 56895, 'loss/train': 1.2132513523101807} -11/07/2021 05:13:06 - INFO - __main__ - Step 56897: {'lr': 0.00034862420052218313, 'samples': 10924224, 'steps': 56896, 'loss/train': 1.1575571298599243} -11/07/2021 05:13:06 - INFO - __main__ - Step 56898: {'lr': 0.00034861932414683897, 'samples': 10924416, 'steps': 56897, 'loss/train': 1.5526455640792847} -11/07/2021 05:13:06 - INFO - __main__ - Step 56899: {'lr': 0.00034861444772705846, 'samples': 10924608, 'steps': 56898, 'loss/train': 1.6995787620544434} -11/07/2021 05:13:07 - INFO - __main__ - Step 56900: {'lr': 0.0003486095712628438, 'samples': 10924800, 'steps': 56899, 'loss/train': 1.4922962188720703} -11/07/2021 05:13:08 - INFO - __main__ - Step 56901: {'lr': 0.00034860469475419723, 'samples': 10924992, 'steps': 56900, 'loss/train': 1.801711082458496} -11/07/2021 05:13:08 - INFO - __main__ - Step 56902: {'lr': 0.00034859981820112084, 'samples': 10925184, 'steps': 56901, 'loss/train': 1.2205525636672974} -11/07/2021 05:13:08 - INFO - __main__ - Step 56903: {'lr': 0.00034859494160361694, 'samples': 10925376, 'steps': 56902, 'loss/train': 1.3201030492782593} -11/07/2021 05:13:09 - INFO - __main__ - Step 56904: {'lr': 0.00034859006496168764, 'samples': 10925568, 'steps': 56903, 'loss/train': 1.0855777263641357} -11/07/2021 05:13:09 - INFO - __main__ - Step 56905: {'lr': 0.0003485851882753352, 'samples': 10925760, 'steps': 56904, 'loss/train': 1.3407800197601318} -11/07/2021 05:13:10 - INFO - __main__ - Step 56906: {'lr': 0.00034858031154456177, 'samples': 10925952, 'steps': 56905, 'loss/train': 0.8941053152084351} -11/07/2021 05:13:11 - INFO - __main__ - Step 56907: {'lr': 0.0003485754347693696, 'samples': 10926144, 'steps': 56906, 'loss/train': 1.1388531923294067} -11/07/2021 05:13:11 - INFO - __main__ - Step 56908: {'lr': 0.0003485705579497609, 'samples': 10926336, 'steps': 56907, 'loss/train': 1.4479374885559082} -11/07/2021 05:13:11 - INFO - __main__ - Step 56909: {'lr': 0.0003485656810857378, 'samples': 10926528, 'steps': 56908, 'loss/train': 1.2756643295288086} -11/07/2021 05:13:12 - INFO - __main__ - Step 56910: {'lr': 0.00034856080417730253, 'samples': 10926720, 'steps': 56909, 'loss/train': 1.2452208995819092} -11/07/2021 05:13:12 - INFO - __main__ - Step 56911: {'lr': 0.0003485559272244572, 'samples': 10926912, 'steps': 56910, 'loss/train': 1.669407606124878} -11/07/2021 05:13:13 - INFO - __main__ - Step 56912: {'lr': 0.0003485510502272042, 'samples': 10927104, 'steps': 56911, 'loss/train': 2.0323190689086914} -11/07/2021 05:13:13 - INFO - __main__ - Step 56913: {'lr': 0.0003485461731855456, 'samples': 10927296, 'steps': 56912, 'loss/train': 1.4654431343078613} -11/07/2021 05:13:14 - INFO - __main__ - Step 56914: {'lr': 0.0003485412960994836, 'samples': 10927488, 'steps': 56913, 'loss/train': 1.3183684349060059} -11/07/2021 05:13:14 - INFO - __main__ - Step 56915: {'lr': 0.0003485364189690203, 'samples': 10927680, 'steps': 56914, 'loss/train': 1.2402470111846924} -11/07/2021 05:13:14 - INFO - __main__ - Step 56916: {'lr': 0.0003485315417941581, 'samples': 10927872, 'steps': 56915, 'loss/train': 1.2380595207214355} -11/07/2021 05:13:15 - INFO - __main__ - Step 56917: {'lr': 0.00034852666457489917, 'samples': 10928064, 'steps': 56916, 'loss/train': 1.0708080530166626} -11/07/2021 05:13:16 - INFO - __main__ - Step 56918: {'lr': 0.00034852178731124557, 'samples': 10928256, 'steps': 56917, 'loss/train': 1.747732162475586} -11/07/2021 05:13:16 - INFO - __main__ - Step 56919: {'lr': 0.00034851691000319963, 'samples': 10928448, 'steps': 56918, 'loss/train': 1.5586053133010864} -11/07/2021 05:13:16 - INFO - __main__ - Step 56920: {'lr': 0.0003485120326507635, 'samples': 10928640, 'steps': 56919, 'loss/train': 0.9507009387016296} -11/07/2021 05:13:17 - INFO - __main__ - Step 56921: {'lr': 0.0003485071552539393, 'samples': 10928832, 'steps': 56920, 'loss/train': 1.2531992197036743} -11/07/2021 05:13:18 - INFO - __main__ - Step 56922: {'lr': 0.0003485022778127293, 'samples': 10929024, 'steps': 56921, 'loss/train': 1.6206005811691284} -11/07/2021 05:13:18 - INFO - __main__ - Step 56923: {'lr': 0.0003484974003271357, 'samples': 10929216, 'steps': 56922, 'loss/train': 1.4933346509933472} -11/07/2021 05:13:19 - INFO - __main__ - Step 56924: {'lr': 0.0003484925227971607, 'samples': 10929408, 'steps': 56923, 'loss/train': 0.821574866771698} -11/07/2021 05:13:19 - INFO - __main__ - Step 56925: {'lr': 0.0003484876452228065, 'samples': 10929600, 'steps': 56924, 'loss/train': 1.5044890642166138} -11/07/2021 05:13:19 - INFO - __main__ - Step 56926: {'lr': 0.00034848276760407525, 'samples': 10929792, 'steps': 56925, 'loss/train': 1.297538161277771} -11/07/2021 05:13:20 - INFO - __main__ - Step 56927: {'lr': 0.0003484778899409693, 'samples': 10929984, 'steps': 56926, 'loss/train': 1.383144736289978} -11/07/2021 05:13:21 - INFO - __main__ - Step 56928: {'lr': 0.0003484730122334906, 'samples': 10930176, 'steps': 56927, 'loss/train': 1.371925711631775} -11/07/2021 05:13:21 - INFO - __main__ - Step 56929: {'lr': 0.00034846813448164153, 'samples': 10930368, 'steps': 56928, 'loss/train': 1.3051584959030151} -11/07/2021 05:13:21 - INFO - __main__ - Step 56930: {'lr': 0.00034846325668542425, 'samples': 10930560, 'steps': 56929, 'loss/train': 1.477121114730835} -11/07/2021 05:13:22 - INFO - __main__ - Step 56931: {'lr': 0.00034845837884484086, 'samples': 10930752, 'steps': 56930, 'loss/train': 0.9537971019744873} -11/07/2021 05:13:23 - INFO - __main__ - Step 56932: {'lr': 0.00034845350095989377, 'samples': 10930944, 'steps': 56931, 'loss/train': 0.9450234770774841} -11/07/2021 05:13:23 - INFO - __main__ - Step 56933: {'lr': 0.000348448623030585, 'samples': 10931136, 'steps': 56932, 'loss/train': 1.4369124174118042} -11/07/2021 05:13:23 - INFO - __main__ - Step 56934: {'lr': 0.00034844374505691686, 'samples': 10931328, 'steps': 56933, 'loss/train': 0.9749782681465149} -11/07/2021 05:13:24 - INFO - __main__ - Step 56935: {'lr': 0.0003484388670388914, 'samples': 10931520, 'steps': 56934, 'loss/train': 1.6764055490493774} -11/07/2021 05:13:24 - INFO - __main__ - Step 56936: {'lr': 0.0003484339889765109, 'samples': 10931712, 'steps': 56935, 'loss/train': 1.48472261428833} -11/07/2021 05:13:25 - INFO - __main__ - Step 56937: {'lr': 0.0003484291108697776, 'samples': 10931904, 'steps': 56936, 'loss/train': 1.3301887512207031} -11/07/2021 05:13:25 - INFO - __main__ - Step 56938: {'lr': 0.0003484242327186936, 'samples': 10932096, 'steps': 56937, 'loss/train': 1.0789657831192017} -11/07/2021 05:13:26 - INFO - __main__ - Step 56939: {'lr': 0.0003484193545232612, 'samples': 10932288, 'steps': 56938, 'loss/train': 1.1669780015945435} -11/07/2021 05:13:26 - INFO - __main__ - Step 56940: {'lr': 0.00034841447628348267, 'samples': 10932480, 'steps': 56939, 'loss/train': 1.3737448453903198} -11/07/2021 05:13:26 - INFO - __main__ - Step 56941: {'lr': 0.00034840959799936, 'samples': 10932672, 'steps': 56940, 'loss/train': 1.536058783531189} -11/07/2021 05:13:27 - INFO - __main__ - Step 56942: {'lr': 0.0003484047196708955, 'samples': 10932864, 'steps': 56941, 'loss/train': 1.282861351966858} -11/07/2021 05:13:28 - INFO - __main__ - Step 56943: {'lr': 0.00034839984129809125, 'samples': 10933056, 'steps': 56942, 'loss/train': 1.2766464948654175} -11/07/2021 05:13:28 - INFO - __main__ - Step 56944: {'lr': 0.00034839496288094964, 'samples': 10933248, 'steps': 56943, 'loss/train': 1.8850005865097046} -11/07/2021 05:13:28 - INFO - __main__ - Step 56945: {'lr': 0.0003483900844194728, 'samples': 10933440, 'steps': 56944, 'loss/train': 1.4289957284927368} -11/07/2021 05:13:29 - INFO - __main__ - Step 56946: {'lr': 0.00034838520591366285, 'samples': 10933632, 'steps': 56945, 'loss/train': 1.6287003755569458} -11/07/2021 05:13:30 - INFO - __main__ - Step 56947: {'lr': 0.0003483803273635221, 'samples': 10933824, 'steps': 56946, 'loss/train': 0.452557772397995} -11/07/2021 05:13:30 - INFO - __main__ - Step 56948: {'lr': 0.0003483754487690527, 'samples': 10934016, 'steps': 56947, 'loss/train': 1.4415332078933716} -11/07/2021 05:13:31 - INFO - __main__ - Step 56949: {'lr': 0.0003483705701302567, 'samples': 10934208, 'steps': 56948, 'loss/train': 1.4060859680175781} -11/07/2021 05:13:31 - INFO - __main__ - Step 56950: {'lr': 0.0003483656914471366, 'samples': 10934400, 'steps': 56949, 'loss/train': 1.652616024017334} -11/07/2021 05:13:31 - INFO - __main__ - Step 56951: {'lr': 0.00034836081271969436, 'samples': 10934592, 'steps': 56950, 'loss/train': 1.4206058979034424} -11/07/2021 05:13:32 - INFO - __main__ - Step 56952: {'lr': 0.0003483559339479323, 'samples': 10934784, 'steps': 56951, 'loss/train': 1.4728578329086304} -11/07/2021 05:13:33 - INFO - __main__ - Step 56953: {'lr': 0.00034835105513185253, 'samples': 10934976, 'steps': 56952, 'loss/train': 1.665027141571045} -11/07/2021 05:13:33 - INFO - __main__ - Step 56954: {'lr': 0.00034834617627145737, 'samples': 10935168, 'steps': 56953, 'loss/train': 1.2767750024795532} -11/07/2021 05:13:33 - INFO - __main__ - Step 56955: {'lr': 0.00034834129736674885, 'samples': 10935360, 'steps': 56954, 'loss/train': 2.0450494289398193} -11/07/2021 05:13:34 - INFO - __main__ - Step 56956: {'lr': 0.0003483364184177293, 'samples': 10935552, 'steps': 56955, 'loss/train': 1.1888480186462402} -11/07/2021 05:13:34 - INFO - __main__ - Step 56957: {'lr': 0.0003483315394244009, 'samples': 10935744, 'steps': 56956, 'loss/train': 1.5797548294067383} -11/07/2021 05:13:35 - INFO - __main__ - Step 56958: {'lr': 0.00034832666038676576, 'samples': 10935936, 'steps': 56957, 'loss/train': 1.4554880857467651} -11/07/2021 05:13:35 - INFO - __main__ - Step 56959: {'lr': 0.0003483217813048262, 'samples': 10936128, 'steps': 56958, 'loss/train': 1.3941136598587036} -11/07/2021 05:13:36 - INFO - __main__ - Step 56960: {'lr': 0.0003483169021785844, 'samples': 10936320, 'steps': 56959, 'loss/train': 2.511237382888794} -11/07/2021 05:13:36 - INFO - __main__ - Step 56961: {'lr': 0.00034831202300804245, 'samples': 10936512, 'steps': 56960, 'loss/train': 1.3640533685684204} -11/07/2021 05:13:36 - INFO - __main__ - Step 56962: {'lr': 0.0003483071437932026, 'samples': 10936704, 'steps': 56961, 'loss/train': 1.2520326375961304} -11/07/2021 05:13:37 - INFO - __main__ - Step 56963: {'lr': 0.0003483022645340671, 'samples': 10936896, 'steps': 56962, 'loss/train': 1.1164780855178833} -11/07/2021 05:13:38 - INFO - __main__ - Step 56964: {'lr': 0.0003482973852306381, 'samples': 10937088, 'steps': 56963, 'loss/train': 1.4276697635650635} -11/07/2021 05:13:38 - INFO - __main__ - Step 56965: {'lr': 0.00034829250588291785, 'samples': 10937280, 'steps': 56964, 'loss/train': 1.3328008651733398} -11/07/2021 05:13:38 - INFO - __main__ - Step 56966: {'lr': 0.00034828762649090843, 'samples': 10937472, 'steps': 56965, 'loss/train': 1.4390015602111816} -11/07/2021 05:13:39 - INFO - __main__ - Step 56967: {'lr': 0.0003482827470546123, 'samples': 10937664, 'steps': 56966, 'loss/train': 1.0958737134933472} -11/07/2021 05:13:40 - INFO - __main__ - Step 56968: {'lr': 0.00034827786757403136, 'samples': 10937856, 'steps': 56967, 'loss/train': 1.070756196975708} -11/07/2021 05:13:40 - INFO - __main__ - Step 56969: {'lr': 0.00034827298804916793, 'samples': 10938048, 'steps': 56968, 'loss/train': 1.1565850973129272} -11/07/2021 05:13:41 - INFO - __main__ - Step 56970: {'lr': 0.00034826810848002416, 'samples': 10938240, 'steps': 56969, 'loss/train': 1.0730781555175781} -11/07/2021 05:13:41 - INFO - __main__ - Step 56971: {'lr': 0.00034826322886660234, 'samples': 10938432, 'steps': 56970, 'loss/train': 1.6203216314315796} -11/07/2021 05:13:41 - INFO - __main__ - Step 56972: {'lr': 0.00034825834920890463, 'samples': 10938624, 'steps': 56971, 'loss/train': 1.631622314453125} -11/07/2021 05:13:42 - INFO - __main__ - Step 56973: {'lr': 0.00034825346950693325, 'samples': 10938816, 'steps': 56972, 'loss/train': 0.08236096799373627} -11/07/2021 05:13:43 - INFO - __main__ - Step 56974: {'lr': 0.00034824858976069043, 'samples': 10939008, 'steps': 56973, 'loss/train': 1.3933860063552856} -11/07/2021 05:13:43 - INFO - __main__ - Step 56975: {'lr': 0.00034824370997017817, 'samples': 10939200, 'steps': 56974, 'loss/train': 1.330894112586975} -11/07/2021 05:13:43 - INFO - __main__ - Step 56976: {'lr': 0.0003482388301353989, 'samples': 10939392, 'steps': 56975, 'loss/train': 1.251906156539917} -11/07/2021 05:13:44 - INFO - __main__ - Step 56977: {'lr': 0.0003482339502563547, 'samples': 10939584, 'steps': 56976, 'loss/train': 1.060488224029541} -11/07/2021 05:13:45 - INFO - __main__ - Step 56978: {'lr': 0.0003482290703330478, 'samples': 10939776, 'steps': 56977, 'loss/train': 1.015341877937317} -11/07/2021 05:13:45 - INFO - __main__ - Step 56979: {'lr': 0.0003482241903654804, 'samples': 10939968, 'steps': 56978, 'loss/train': 1.4945625066757202} -11/07/2021 05:13:45 - INFO - __main__ - Step 56980: {'lr': 0.00034821931035365465, 'samples': 10940160, 'steps': 56979, 'loss/train': 1.133074402809143} -11/07/2021 05:13:46 - INFO - __main__ - Step 56981: {'lr': 0.0003482144302975729, 'samples': 10940352, 'steps': 56980, 'loss/train': 1.8464810848236084} -11/07/2021 05:13:46 - INFO - __main__ - Step 56982: {'lr': 0.0003482095501972372, 'samples': 10940544, 'steps': 56981, 'loss/train': 1.4704564809799194} -11/07/2021 05:13:47 - INFO - __main__ - Step 56983: {'lr': 0.0003482046700526498, 'samples': 10940736, 'steps': 56982, 'loss/train': 1.6985701322555542} -11/07/2021 05:13:47 - INFO - __main__ - Step 56984: {'lr': 0.0003481997898638128, 'samples': 10940928, 'steps': 56983, 'loss/train': 1.6070499420166016} -11/07/2021 05:13:48 - INFO - __main__ - Step 56985: {'lr': 0.0003481949096307285, 'samples': 10941120, 'steps': 56984, 'loss/train': 1.2578685283660889} -11/07/2021 05:13:48 - INFO - __main__ - Step 56986: {'lr': 0.0003481900293533992, 'samples': 10941312, 'steps': 56985, 'loss/train': 1.5594573020935059} -11/07/2021 05:13:48 - INFO - __main__ - Step 56987: {'lr': 0.00034818514903182696, 'samples': 10941504, 'steps': 56986, 'loss/train': 1.0292149782180786} -11/07/2021 05:13:50 - INFO - __main__ - Step 56988: {'lr': 0.000348180268666014, 'samples': 10941696, 'steps': 56987, 'loss/train': 1.2681105136871338} -11/07/2021 05:13:50 - INFO - __main__ - Step 56989: {'lr': 0.00034817538825596253, 'samples': 10941888, 'steps': 56988, 'loss/train': 1.165054202079773} -11/07/2021 05:13:50 - INFO - __main__ - Step 56990: {'lr': 0.0003481705078016747, 'samples': 10942080, 'steps': 56989, 'loss/train': 1.1151914596557617} -11/07/2021 05:13:51 - INFO - __main__ - Step 56991: {'lr': 0.0003481656273031527, 'samples': 10942272, 'steps': 56990, 'loss/train': 1.0866490602493286} -11/07/2021 05:13:51 - INFO - __main__ - Step 56992: {'lr': 0.0003481607467603989, 'samples': 10942464, 'steps': 56991, 'loss/train': 0.044805631041526794} -11/07/2021 05:13:52 - INFO - __main__ - Step 56993: {'lr': 0.00034815586617341533, 'samples': 10942656, 'steps': 56992, 'loss/train': 1.5680711269378662} -11/07/2021 05:13:53 - INFO - __main__ - Step 56994: {'lr': 0.0003481509855422043, 'samples': 10942848, 'steps': 56993, 'loss/train': 1.6193270683288574} -11/07/2021 05:13:53 - INFO - __main__ - Step 56995: {'lr': 0.0003481461048667679, 'samples': 10943040, 'steps': 56994, 'loss/train': 0.08559868484735489} -11/07/2021 05:13:53 - INFO - __main__ - Step 56996: {'lr': 0.00034814122414710837, 'samples': 10943232, 'steps': 56995, 'loss/train': 1.2014765739440918} -11/07/2021 05:13:54 - INFO - __main__ - Step 56997: {'lr': 0.0003481363433832279, 'samples': 10943424, 'steps': 56996, 'loss/train': 1.3474739789962769} -11/07/2021 05:13:55 - INFO - __main__ - Step 56998: {'lr': 0.00034813146257512876, 'samples': 10943616, 'steps': 56997, 'loss/train': 1.2970685958862305} -11/07/2021 05:13:55 - INFO - __main__ - Step 56999: {'lr': 0.0003481265817228131, 'samples': 10943808, 'steps': 56998, 'loss/train': 1.4136161804199219} -11/07/2021 05:13:56 - INFO - __main__ - Step 57000: {'lr': 0.00034812170082628303, 'samples': 10944000, 'steps': 56999, 'loss/train': 1.2367044687271118} -11/07/2021 05:13:56 - INFO - __main__ - Step 57001: {'lr': 0.00034811681988554095, 'samples': 10944192, 'steps': 57000, 'loss/train': 1.0630079507827759} -11/07/2021 05:13:56 - INFO - __main__ - Step 57002: {'lr': 0.0003481119389005889, 'samples': 10944384, 'steps': 57001, 'loss/train': 1.4385117292404175} -11/07/2021 05:13:58 - INFO - __main__ - Step 57003: {'lr': 0.0003481070578714291, 'samples': 10944576, 'steps': 57002, 'loss/train': 0.06309520453214645} -11/07/2021 05:13:58 - INFO - __main__ - Step 57004: {'lr': 0.0003481021767980638, 'samples': 10944768, 'steps': 57003, 'loss/train': 1.4560445547103882} -11/07/2021 05:13:58 - INFO - __main__ - Step 57005: {'lr': 0.00034809729568049513, 'samples': 10944960, 'steps': 57004, 'loss/train': 1.5791494846343994} -11/07/2021 05:13:59 - INFO - __main__ - Step 57006: {'lr': 0.0003480924145187254, 'samples': 10945152, 'steps': 57005, 'loss/train': 1.7447997331619263} -11/07/2021 05:13:59 - INFO - __main__ - Step 57007: {'lr': 0.0003480875333127567, 'samples': 10945344, 'steps': 57006, 'loss/train': 1.5612694025039673} -11/07/2021 05:13:59 - INFO - __main__ - Step 57008: {'lr': 0.0003480826520625913, 'samples': 10945536, 'steps': 57007, 'loss/train': 1.7285468578338623} -11/07/2021 05:14:00 - INFO - __main__ - Step 57009: {'lr': 0.0003480777707682313, 'samples': 10945728, 'steps': 57008, 'loss/train': 0.1764259934425354} -11/07/2021 05:14:01 - INFO - __main__ - Step 57010: {'lr': 0.00034807288942967905, 'samples': 10945920, 'steps': 57009, 'loss/train': 1.6600234508514404} -11/07/2021 05:14:01 - INFO - __main__ - Step 57011: {'lr': 0.0003480680080469366, 'samples': 10946112, 'steps': 57010, 'loss/train': 1.1775566339492798} -11/07/2021 05:14:01 - INFO - __main__ - Step 57012: {'lr': 0.0003480631266200063, 'samples': 10946304, 'steps': 57011, 'loss/train': 1.5337494611740112} -11/07/2021 05:14:02 - INFO - __main__ - Step 57013: {'lr': 0.0003480582451488902, 'samples': 10946496, 'steps': 57012, 'loss/train': 1.730421543121338} -11/07/2021 05:14:03 - INFO - __main__ - Step 57014: {'lr': 0.00034805336363359066, 'samples': 10946688, 'steps': 57013, 'loss/train': 1.591624140739441} -11/07/2021 05:14:03 - INFO - __main__ - Step 57015: {'lr': 0.00034804848207410974, 'samples': 10946880, 'steps': 57014, 'loss/train': 1.498093843460083} -11/07/2021 05:14:04 - INFO - __main__ - Step 57016: {'lr': 0.00034804360047044965, 'samples': 10947072, 'steps': 57015, 'loss/train': 1.7804088592529297} -11/07/2021 05:14:04 - INFO - __main__ - Step 57017: {'lr': 0.0003480387188226126, 'samples': 10947264, 'steps': 57016, 'loss/train': 1.5107934474945068} -11/07/2021 05:14:04 - INFO - __main__ - Step 57018: {'lr': 0.0003480338371306009, 'samples': 10947456, 'steps': 57017, 'loss/train': 1.2875913381576538} -11/07/2021 05:14:05 - INFO - __main__ - Step 57019: {'lr': 0.0003480289553944166, 'samples': 10947648, 'steps': 57018, 'loss/train': 1.4271272420883179} -11/07/2021 05:14:06 - INFO - __main__ - Step 57020: {'lr': 0.000348024073614062, 'samples': 10947840, 'steps': 57019, 'loss/train': 1.0144290924072266} -11/07/2021 05:14:06 - INFO - __main__ - Step 57021: {'lr': 0.0003480191917895393, 'samples': 10948032, 'steps': 57020, 'loss/train': 1.7339799404144287} -11/07/2021 05:14:06 - INFO - __main__ - Step 57022: {'lr': 0.0003480143099208506, 'samples': 10948224, 'steps': 57021, 'loss/train': 1.292941927909851} -11/07/2021 05:14:07 - INFO - __main__ - Step 57023: {'lr': 0.00034800942800799817, 'samples': 10948416, 'steps': 57022, 'loss/train': 1.318372130393982} -11/07/2021 05:14:08 - INFO - __main__ - Step 57024: {'lr': 0.00034800454605098417, 'samples': 10948608, 'steps': 57023, 'loss/train': 0.3450126349925995} -11/07/2021 05:14:08 - INFO - __main__ - Step 57025: {'lr': 0.00034799966404981095, 'samples': 10948800, 'steps': 57024, 'loss/train': 1.3935389518737793} -11/07/2021 05:14:08 - INFO - __main__ - Step 57026: {'lr': 0.00034799478200448056, 'samples': 10948992, 'steps': 57025, 'loss/train': 1.5002765655517578} -11/07/2021 05:14:09 - INFO - __main__ - Step 57027: {'lr': 0.0003479898999149952, 'samples': 10949184, 'steps': 57026, 'loss/train': 1.3063820600509644} -11/07/2021 05:14:09 - INFO - __main__ - Step 57028: {'lr': 0.00034798501778135704, 'samples': 10949376, 'steps': 57027, 'loss/train': 1.380514144897461} -11/07/2021 05:14:10 - INFO - __main__ - Step 57029: {'lr': 0.0003479801356035684, 'samples': 10949568, 'steps': 57028, 'loss/train': 1.4907722473144531} -11/07/2021 05:14:11 - INFO - __main__ - Step 57030: {'lr': 0.0003479752533816315, 'samples': 10949760, 'steps': 57029, 'loss/train': 1.2079057693481445} -11/07/2021 05:14:11 - INFO - __main__ - Step 57031: {'lr': 0.0003479703711155484, 'samples': 10949952, 'steps': 57030, 'loss/train': 1.1674896478652954} -11/07/2021 05:14:11 - INFO - __main__ - Step 57032: {'lr': 0.00034796548880532135, 'samples': 10950144, 'steps': 57031, 'loss/train': 1.5546785593032837} -11/07/2021 05:14:12 - INFO - __main__ - Step 57033: {'lr': 0.0003479606064509526, 'samples': 10950336, 'steps': 57032, 'loss/train': 1.2576812505722046} -11/07/2021 05:14:13 - INFO - __main__ - Step 57034: {'lr': 0.00034795572405244425, 'samples': 10950528, 'steps': 57033, 'loss/train': 1.206067681312561} -11/07/2021 05:14:13 - INFO - __main__ - Step 57035: {'lr': 0.0003479508416097986, 'samples': 10950720, 'steps': 57034, 'loss/train': 1.2598367929458618} -11/07/2021 05:14:13 - INFO - __main__ - Step 57036: {'lr': 0.0003479459591230177, 'samples': 10950912, 'steps': 57035, 'loss/train': 1.8784977197647095} -11/07/2021 05:14:14 - INFO - __main__ - Step 57037: {'lr': 0.0003479410765921041, 'samples': 10951104, 'steps': 57036, 'loss/train': 1.462232232093811} -11/07/2021 05:14:14 - INFO - __main__ - Step 57038: {'lr': 0.0003479361940170596, 'samples': 10951296, 'steps': 57037, 'loss/train': 1.3565127849578857} -11/07/2021 05:14:15 - INFO - __main__ - Step 57039: {'lr': 0.0003479313113978866, 'samples': 10951488, 'steps': 57038, 'loss/train': 1.4616706371307373} -11/07/2021 05:14:15 - INFO - __main__ - Step 57040: {'lr': 0.00034792642873458725, 'samples': 10951680, 'steps': 57039, 'loss/train': 0.4259514808654785} -11/07/2021 05:14:16 - INFO - __main__ - Step 57041: {'lr': 0.00034792154602716376, 'samples': 10951872, 'steps': 57040, 'loss/train': 0.5904067158699036} -11/07/2021 05:14:16 - INFO - __main__ - Step 57042: {'lr': 0.0003479166632756184, 'samples': 10952064, 'steps': 57041, 'loss/train': 1.4015944004058838} -11/07/2021 05:14:16 - INFO - __main__ - Step 57043: {'lr': 0.0003479117804799532, 'samples': 10952256, 'steps': 57042, 'loss/train': 0.7780531048774719} -11/07/2021 05:14:18 - INFO - __main__ - Step 57044: {'lr': 0.00034790689764017046, 'samples': 10952448, 'steps': 57043, 'loss/train': 1.5652540922164917} -11/07/2021 05:14:18 - INFO - __main__ - Step 57045: {'lr': 0.00034790201475627246, 'samples': 10952640, 'steps': 57044, 'loss/train': 1.007209300994873} -11/07/2021 05:14:18 - INFO - __main__ - Step 57046: {'lr': 0.00034789713182826126, 'samples': 10952832, 'steps': 57045, 'loss/train': 1.5317529439926147} -11/07/2021 05:14:19 - INFO - __main__ - Step 57047: {'lr': 0.0003478922488561392, 'samples': 10953024, 'steps': 57046, 'loss/train': 1.1437493562698364} -11/07/2021 05:14:19 - INFO - __main__ - Step 57048: {'lr': 0.0003478873658399084, 'samples': 10953216, 'steps': 57047, 'loss/train': 0.6343510150909424} -11/07/2021 05:14:20 - INFO - __main__ - Step 57049: {'lr': 0.000347882482779571, 'samples': 10953408, 'steps': 57048, 'loss/train': 0.871766984462738} -11/07/2021 05:14:20 - INFO - __main__ - Step 57050: {'lr': 0.00034787759967512923, 'samples': 10953600, 'steps': 57049, 'loss/train': 1.715659260749817} -11/07/2021 05:14:21 - INFO - __main__ - Step 57051: {'lr': 0.00034787271652658534, 'samples': 10953792, 'steps': 57050, 'loss/train': 1.4466074705123901} -11/07/2021 05:14:21 - INFO - __main__ - Step 57052: {'lr': 0.0003478678333339416, 'samples': 10953984, 'steps': 57051, 'loss/train': 1.6088135242462158} -11/07/2021 05:14:21 - INFO - __main__ - Step 57053: {'lr': 0.0003478629500972, 'samples': 10954176, 'steps': 57052, 'loss/train': 1.1456817388534546} -11/07/2021 05:14:22 - INFO - __main__ - Step 57054: {'lr': 0.0003478580668163631, 'samples': 10954368, 'steps': 57053, 'loss/train': 1.8548530340194702} -11/07/2021 05:14:23 - INFO - __main__ - Step 57055: {'lr': 0.0003478531834914326, 'samples': 10954560, 'steps': 57054, 'loss/train': 1.2103031873703003} -11/07/2021 05:14:23 - INFO - __main__ - Step 57056: {'lr': 0.0003478483001224111, 'samples': 10954752, 'steps': 57055, 'loss/train': 1.7151169776916504} -11/07/2021 05:14:23 - INFO - __main__ - Step 57057: {'lr': 0.00034784341670930066, 'samples': 10954944, 'steps': 57056, 'loss/train': 1.577838659286499} -11/07/2021 05:14:24 - INFO - __main__ - Step 57058: {'lr': 0.00034783853325210344, 'samples': 10955136, 'steps': 57057, 'loss/train': 1.2713603973388672} -11/07/2021 05:14:25 - INFO - __main__ - Step 57059: {'lr': 0.0003478336497508217, 'samples': 10955328, 'steps': 57058, 'loss/train': 1.584445595741272} -11/07/2021 05:14:25 - INFO - __main__ - Step 57060: {'lr': 0.0003478287662054576, 'samples': 10955520, 'steps': 57059, 'loss/train': 1.4578912258148193} -11/07/2021 05:14:25 - INFO - __main__ - Step 57061: {'lr': 0.0003478238826160135, 'samples': 10955712, 'steps': 57060, 'loss/train': 1.5543626546859741} -11/07/2021 05:14:26 - INFO - __main__ - Step 57062: {'lr': 0.00034781899898249136, 'samples': 10955904, 'steps': 57061, 'loss/train': 1.0813395977020264} -11/07/2021 05:14:26 - INFO - __main__ - Step 57063: {'lr': 0.0003478141153048935, 'samples': 10956096, 'steps': 57062, 'loss/train': 1.8367377519607544} -11/07/2021 05:14:27 - INFO - __main__ - Step 57064: {'lr': 0.0003478092315832221, 'samples': 10956288, 'steps': 57063, 'loss/train': 1.458410382270813} -11/07/2021 05:14:28 - INFO - __main__ - Step 57065: {'lr': 0.00034780434781747936, 'samples': 10956480, 'steps': 57064, 'loss/train': 1.5763148069381714} -11/07/2021 05:14:28 - INFO - __main__ - Step 57066: {'lr': 0.0003477994640076675, 'samples': 10956672, 'steps': 57065, 'loss/train': 1.4608738422393799} -11/07/2021 05:14:28 - INFO - __main__ - Step 57067: {'lr': 0.00034779458015378874, 'samples': 10956864, 'steps': 57066, 'loss/train': 1.340052843093872} -11/07/2021 05:14:29 - INFO - __main__ - Step 57068: {'lr': 0.00034778969625584523, 'samples': 10957056, 'steps': 57067, 'loss/train': 1.2458049058914185} -11/07/2021 05:14:30 - INFO - __main__ - Step 57069: {'lr': 0.0003477848123138392, 'samples': 10957248, 'steps': 57068, 'loss/train': 1.28065824508667} -11/07/2021 05:14:30 - INFO - __main__ - Step 57070: {'lr': 0.0003477799283277728, 'samples': 10957440, 'steps': 57069, 'loss/train': 0.7120200395584106} -11/07/2021 05:14:30 - INFO - __main__ - Step 57071: {'lr': 0.0003477750442976483, 'samples': 10957632, 'steps': 57070, 'loss/train': 0.8300448656082153} -11/07/2021 05:14:31 - INFO - __main__ - Step 57072: {'lr': 0.0003477701602234679, 'samples': 10957824, 'steps': 57071, 'loss/train': 1.402589201927185} -11/07/2021 05:14:31 - INFO - __main__ - Step 57073: {'lr': 0.00034776527610523377, 'samples': 10958016, 'steps': 57072, 'loss/train': 1.1367018222808838} -11/07/2021 05:14:31 - INFO - __main__ - Step 57074: {'lr': 0.00034776039194294806, 'samples': 10958208, 'steps': 57073, 'loss/train': 1.4829801321029663} -11/07/2021 05:14:32 - INFO - __main__ - Step 57075: {'lr': 0.0003477555077366131, 'samples': 10958400, 'steps': 57074, 'loss/train': 1.6662720441818237} -11/07/2021 05:14:33 - INFO - __main__ - Step 57076: {'lr': 0.000347750623486231, 'samples': 10958592, 'steps': 57075, 'loss/train': 1.5730881690979004} -11/07/2021 05:14:33 - INFO - __main__ - Step 57077: {'lr': 0.00034774573919180396, 'samples': 10958784, 'steps': 57076, 'loss/train': 1.4155805110931396} -11/07/2021 05:14:33 - INFO - __main__ - Step 57078: {'lr': 0.0003477408548533342, 'samples': 10958976, 'steps': 57077, 'loss/train': 1.7398052215576172} -11/07/2021 05:14:34 - INFO - __main__ - Step 57079: {'lr': 0.0003477359704708239, 'samples': 10959168, 'steps': 57078, 'loss/train': 1.2042269706726074} -11/07/2021 05:14:35 - INFO - __main__ - Step 57080: {'lr': 0.00034773108604427527, 'samples': 10959360, 'steps': 57079, 'loss/train': 0.755284309387207} -11/07/2021 05:14:35 - INFO - __main__ - Step 57081: {'lr': 0.0003477262015736906, 'samples': 10959552, 'steps': 57080, 'loss/train': 1.5055509805679321} -11/07/2021 05:14:35 - INFO - __main__ - Step 57082: {'lr': 0.000347721317059072, 'samples': 10959744, 'steps': 57081, 'loss/train': 1.6597017049789429} -11/07/2021 05:14:36 - INFO - __main__ - Step 57083: {'lr': 0.00034771643250042163, 'samples': 10959936, 'steps': 57082, 'loss/train': 1.3603308200836182} -11/07/2021 05:14:36 - INFO - __main__ - Step 57084: {'lr': 0.0003477115478977417, 'samples': 10960128, 'steps': 57083, 'loss/train': 1.0547682046890259} -11/07/2021 05:14:37 - INFO - __main__ - Step 57085: {'lr': 0.0003477066632510346, 'samples': 10960320, 'steps': 57084, 'loss/train': 2.257406234741211} -11/07/2021 05:14:37 - INFO - __main__ - Step 57086: {'lr': 0.00034770177856030223, 'samples': 10960512, 'steps': 57085, 'loss/train': 1.6284343004226685} -11/07/2021 05:14:38 - INFO - __main__ - Step 57087: {'lr': 0.00034769689382554704, 'samples': 10960704, 'steps': 57086, 'loss/train': 1.7002869844436646} -11/07/2021 05:14:38 - INFO - __main__ - Step 57088: {'lr': 0.0003476920090467711, 'samples': 10960896, 'steps': 57087, 'loss/train': 1.0626585483551025} -11/07/2021 05:14:39 - INFO - __main__ - Step 57089: {'lr': 0.0003476871242239767, 'samples': 10961088, 'steps': 57088, 'loss/train': 0.4999178349971771} -11/07/2021 05:14:39 - INFO - __main__ - Step 57090: {'lr': 0.0003476822393571659, 'samples': 10961280, 'steps': 57089, 'loss/train': 1.420108675956726} -11/07/2021 05:14:40 - INFO - __main__ - Step 57091: {'lr': 0.00034767735444634105, 'samples': 10961472, 'steps': 57090, 'loss/train': 1.3181227445602417} -11/07/2021 05:14:40 - INFO - __main__ - Step 57092: {'lr': 0.00034767246949150425, 'samples': 10961664, 'steps': 57091, 'loss/train': 1.2863893508911133} -11/07/2021 05:14:41 - INFO - __main__ - Step 57093: {'lr': 0.0003476675844926578, 'samples': 10961856, 'steps': 57092, 'loss/train': 1.6348007917404175} -11/07/2021 05:14:41 - INFO - __main__ - Step 57094: {'lr': 0.0003476626994498038, 'samples': 10962048, 'steps': 57093, 'loss/train': 1.8778717517852783} -11/07/2021 05:14:42 - INFO - __main__ - Step 57095: {'lr': 0.0003476578143629445, 'samples': 10962240, 'steps': 57094, 'loss/train': 1.701960563659668} -11/07/2021 05:14:42 - INFO - __main__ - Step 57096: {'lr': 0.0003476529292320821, 'samples': 10962432, 'steps': 57095, 'loss/train': 1.5509767532348633} -11/07/2021 05:14:43 - INFO - __main__ - Step 57097: {'lr': 0.00034764804405721885, 'samples': 10962624, 'steps': 57096, 'loss/train': 1.1595499515533447} -11/07/2021 05:14:43 - INFO - __main__ - Step 57098: {'lr': 0.0003476431588383568, 'samples': 10962816, 'steps': 57097, 'loss/train': 0.8355369567871094} -11/07/2021 05:14:43 - INFO - __main__ - Step 57099: {'lr': 0.0003476382735754983, 'samples': 10963008, 'steps': 57098, 'loss/train': 1.2774282693862915} -11/07/2021 05:14:45 - INFO - __main__ - Step 57100: {'lr': 0.00034763338826864556, 'samples': 10963200, 'steps': 57099, 'loss/train': 1.3770716190338135} -11/07/2021 05:14:45 - INFO - __main__ - Step 57101: {'lr': 0.0003476285029178006, 'samples': 10963392, 'steps': 57100, 'loss/train': 1.096310019493103} -11/07/2021 05:14:46 - INFO - __main__ - Step 57102: {'lr': 0.0003476236175229659, 'samples': 10963584, 'steps': 57101, 'loss/train': 1.3786247968673706} -11/07/2021 05:14:46 - INFO - __main__ - Step 57103: {'lr': 0.0003476187320841434, 'samples': 10963776, 'steps': 57102, 'loss/train': 1.2944613695144653} -11/07/2021 05:14:46 - INFO - __main__ - Step 57104: {'lr': 0.0003476138466013354, 'samples': 10963968, 'steps': 57103, 'loss/train': 1.6037278175354004} -11/07/2021 05:14:47 - INFO - __main__ - Step 57105: {'lr': 0.00034760896107454407, 'samples': 10964160, 'steps': 57104, 'loss/train': 0.710163414478302} -11/07/2021 05:14:47 - INFO - __main__ - Step 57106: {'lr': 0.0003476040755037717, 'samples': 10964352, 'steps': 57105, 'loss/train': 2.0947957038879395} -11/07/2021 05:14:48 - INFO - __main__ - Step 57107: {'lr': 0.00034759918988902045, 'samples': 10964544, 'steps': 57106, 'loss/train': 1.7483853101730347} -11/07/2021 05:14:49 - INFO - __main__ - Step 57108: {'lr': 0.00034759430423029255, 'samples': 10964736, 'steps': 57107, 'loss/train': 1.576919674873352} -11/07/2021 05:14:49 - INFO - __main__ - Step 57109: {'lr': 0.0003475894185275901, 'samples': 10964928, 'steps': 57108, 'loss/train': 1.459820032119751} -11/07/2021 05:14:49 - INFO - __main__ - Step 57110: {'lr': 0.00034758453278091537, 'samples': 10965120, 'steps': 57109, 'loss/train': 1.5835328102111816} -11/07/2021 05:14:50 - INFO - __main__ - Step 57111: {'lr': 0.00034757964699027054, 'samples': 10965312, 'steps': 57110, 'loss/train': 1.4095795154571533} -11/07/2021 05:14:51 - INFO - __main__ - Step 57112: {'lr': 0.0003475747611556579, 'samples': 10965504, 'steps': 57111, 'loss/train': 1.0903464555740356} -11/07/2021 05:14:51 - INFO - __main__ - Step 57113: {'lr': 0.0003475698752770795, 'samples': 10965696, 'steps': 57112, 'loss/train': 1.3601086139678955} -11/07/2021 05:14:51 - INFO - __main__ - Step 57114: {'lr': 0.0003475649893545376, 'samples': 10965888, 'steps': 57113, 'loss/train': 1.4585551023483276} -11/07/2021 05:14:52 - INFO - __main__ - Step 57115: {'lr': 0.0003475601033880346, 'samples': 10966080, 'steps': 57114, 'loss/train': 1.3388257026672363} -11/07/2021 05:14:52 - INFO - __main__ - Step 57116: {'lr': 0.00034755521737757237, 'samples': 10966272, 'steps': 57115, 'loss/train': 1.212584376335144} -11/07/2021 05:14:53 - INFO - __main__ - Step 57117: {'lr': 0.0003475503313231533, 'samples': 10966464, 'steps': 57116, 'loss/train': 1.2603864669799805} -11/07/2021 05:14:53 - INFO - __main__ - Step 57118: {'lr': 0.0003475454452247795, 'samples': 10966656, 'steps': 57117, 'loss/train': 1.2596713304519653} -11/07/2021 05:14:54 - INFO - __main__ - Step 57119: {'lr': 0.00034754055908245326, 'samples': 10966848, 'steps': 57118, 'loss/train': 1.3811181783676147} -11/07/2021 05:14:54 - INFO - __main__ - Step 57120: {'lr': 0.0003475356728961767, 'samples': 10967040, 'steps': 57119, 'loss/train': 0.9532086849212646} -11/07/2021 05:14:54 - INFO - __main__ - Step 57121: {'lr': 0.0003475307866659522, 'samples': 10967232, 'steps': 57120, 'loss/train': 1.3746074438095093} -11/07/2021 05:14:56 - INFO - __main__ - Step 57122: {'lr': 0.00034752590039178175, 'samples': 10967424, 'steps': 57121, 'loss/train': 1.6336432695388794} -11/07/2021 05:14:56 - INFO - __main__ - Step 57123: {'lr': 0.00034752101407366763, 'samples': 10967616, 'steps': 57122, 'loss/train': 1.1915686130523682} -11/07/2021 05:14:56 - INFO - __main__ - Step 57124: {'lr': 0.00034751612771161214, 'samples': 10967808, 'steps': 57123, 'loss/train': 1.6695116758346558} -11/07/2021 05:14:57 - INFO - __main__ - Step 57125: {'lr': 0.0003475112413056173, 'samples': 10968000, 'steps': 57124, 'loss/train': 1.7698873281478882} -11/07/2021 05:14:57 - INFO - __main__ - Step 57126: {'lr': 0.0003475063548556854, 'samples': 10968192, 'steps': 57125, 'loss/train': 1.1600044965744019} -11/07/2021 05:14:58 - INFO - __main__ - Step 57127: {'lr': 0.0003475014683618186, 'samples': 10968384, 'steps': 57126, 'loss/train': 1.1192550659179688} -11/07/2021 05:14:58 - INFO - __main__ - Step 57128: {'lr': 0.00034749658182401923, 'samples': 10968576, 'steps': 57127, 'loss/train': 1.7815827131271362} -11/07/2021 05:14:59 - INFO - __main__ - Step 57129: {'lr': 0.00034749169524228937, 'samples': 10968768, 'steps': 57128, 'loss/train': 1.80890953540802} -11/07/2021 05:14:59 - INFO - __main__ - Step 57130: {'lr': 0.0003474868086166312, 'samples': 10968960, 'steps': 57129, 'loss/train': 1.3178973197937012} -11/07/2021 05:14:59 - INFO - __main__ - Step 57131: {'lr': 0.0003474819219470471, 'samples': 10969152, 'steps': 57130, 'loss/train': 1.3103485107421875} -11/07/2021 05:15:01 - INFO - __main__ - Step 57132: {'lr': 0.0003474770352335391, 'samples': 10969344, 'steps': 57131, 'loss/train': 0.8342475295066833} -11/07/2021 05:15:01 - INFO - __main__ - Step 57133: {'lr': 0.00034747214847610943, 'samples': 10969536, 'steps': 57132, 'loss/train': 1.472228765487671} -11/07/2021 05:15:01 - INFO - __main__ - Step 57134: {'lr': 0.00034746726167476027, 'samples': 10969728, 'steps': 57133, 'loss/train': 1.7928417921066284} -11/07/2021 05:15:02 - INFO - __main__ - Step 57135: {'lr': 0.00034746237482949393, 'samples': 10969920, 'steps': 57134, 'loss/train': 1.3290101289749146} -11/07/2021 05:15:02 - INFO - __main__ - Step 57136: {'lr': 0.0003474574879403126, 'samples': 10970112, 'steps': 57135, 'loss/train': 0.19079530239105225} -11/07/2021 05:15:03 - INFO - __main__ - Step 57137: {'lr': 0.0003474526010072183, 'samples': 10970304, 'steps': 57136, 'loss/train': 1.43719482421875} -11/07/2021 05:15:04 - INFO - __main__ - Step 57138: {'lr': 0.0003474477140302134, 'samples': 10970496, 'steps': 57137, 'loss/train': 1.7045570611953735} -11/07/2021 05:15:04 - INFO - __main__ - Step 57139: {'lr': 0.0003474428270093001, 'samples': 10970688, 'steps': 57138, 'loss/train': 1.9332865476608276} -11/07/2021 05:15:04 - INFO - __main__ - Step 57140: {'lr': 0.00034743793994448057, 'samples': 10970880, 'steps': 57139, 'loss/train': 1.4491996765136719} -11/07/2021 05:15:05 - INFO - __main__ - Step 57141: {'lr': 0.000347433052835757, 'samples': 10971072, 'steps': 57140, 'loss/train': 1.4185638427734375} -11/07/2021 05:15:06 - INFO - __main__ - Step 57142: {'lr': 0.00034742816568313165, 'samples': 10971264, 'steps': 57141, 'loss/train': 0.08232451230287552} -11/07/2021 05:15:06 - INFO - __main__ - Step 57143: {'lr': 0.0003474232784866066, 'samples': 10971456, 'steps': 57142, 'loss/train': 1.1138741970062256} -11/07/2021 05:15:06 - INFO - __main__ - Step 57144: {'lr': 0.0003474183912461841, 'samples': 10971648, 'steps': 57143, 'loss/train': 1.3590716123580933} -11/07/2021 05:15:07 - INFO - __main__ - Step 57145: {'lr': 0.00034741350396186646, 'samples': 10971840, 'steps': 57144, 'loss/train': 1.4189975261688232} -11/07/2021 05:15:07 - INFO - __main__ - Step 57146: {'lr': 0.0003474086166336557, 'samples': 10972032, 'steps': 57145, 'loss/train': 1.466606855392456} -11/07/2021 05:15:07 - INFO - __main__ - Step 57147: {'lr': 0.0003474037292615542, 'samples': 10972224, 'steps': 57146, 'loss/train': 1.2200415134429932} -11/07/2021 05:15:09 - INFO - __main__ - Step 57148: {'lr': 0.000347398841845564, 'samples': 10972416, 'steps': 57147, 'loss/train': 1.6551554203033447} -11/07/2021 05:15:09 - INFO - __main__ - Step 57149: {'lr': 0.0003473939543856875, 'samples': 10972608, 'steps': 57148, 'loss/train': 1.3456071615219116} -11/07/2021 05:15:09 - INFO - __main__ - Step 57150: {'lr': 0.00034738906688192673, 'samples': 10972800, 'steps': 57149, 'loss/train': 1.497469186782837} -11/07/2021 05:15:10 - INFO - __main__ - Step 57151: {'lr': 0.0003473841793342839, 'samples': 10972992, 'steps': 57150, 'loss/train': 1.4696048498153687} -11/07/2021 05:15:10 - INFO - __main__ - Step 57152: {'lr': 0.00034737929174276133, 'samples': 10973184, 'steps': 57151, 'loss/train': 1.2160767316818237} -11/07/2021 05:15:11 - INFO - __main__ - Step 57153: {'lr': 0.0003473744041073611, 'samples': 10973376, 'steps': 57152, 'loss/train': 1.4955682754516602} -11/07/2021 05:15:11 - INFO - __main__ - Step 57154: {'lr': 0.0003473695164280855, 'samples': 10973568, 'steps': 57153, 'loss/train': 1.8641687631607056} -11/07/2021 05:15:12 - INFO - __main__ - Step 57155: {'lr': 0.0003473646287049368, 'samples': 10973760, 'steps': 57154, 'loss/train': 1.1599198579788208} -11/07/2021 05:15:12 - INFO - __main__ - Step 57156: {'lr': 0.00034735974093791697, 'samples': 10973952, 'steps': 57155, 'loss/train': 0.8260247707366943} -11/07/2021 05:15:12 - INFO - __main__ - Step 57157: {'lr': 0.00034735485312702835, 'samples': 10974144, 'steps': 57156, 'loss/train': 1.145938515663147} -11/07/2021 05:15:13 - INFO - __main__ - Step 57158: {'lr': 0.00034734996527227313, 'samples': 10974336, 'steps': 57157, 'loss/train': 1.5853530168533325} -11/07/2021 05:15:14 - INFO - __main__ - Step 57159: {'lr': 0.0003473450773736536, 'samples': 10974528, 'steps': 57158, 'loss/train': 1.3499584197998047} -11/07/2021 05:15:14 - INFO - __main__ - Step 57160: {'lr': 0.00034734018943117183, 'samples': 10974720, 'steps': 57159, 'loss/train': 1.316514492034912} -11/07/2021 05:15:14 - INFO - __main__ - Step 57161: {'lr': 0.00034733530144483003, 'samples': 10974912, 'steps': 57160, 'loss/train': 1.3778836727142334} -11/07/2021 05:15:15 - INFO - __main__ - Step 57162: {'lr': 0.0003473304134146305, 'samples': 10975104, 'steps': 57161, 'loss/train': 2.1690492630004883} -11/07/2021 05:15:16 - INFO - __main__ - Step 57163: {'lr': 0.0003473255253405754, 'samples': 10975296, 'steps': 57162, 'loss/train': 1.465073823928833} -11/07/2021 05:15:16 - INFO - __main__ - Step 57164: {'lr': 0.0003473206372226668, 'samples': 10975488, 'steps': 57163, 'loss/train': 0.9232267141342163} -11/07/2021 05:15:16 - INFO - __main__ - Step 57165: {'lr': 0.0003473157490609071, 'samples': 10975680, 'steps': 57164, 'loss/train': 1.0334287881851196} -11/07/2021 05:15:17 - INFO - __main__ - Step 57166: {'lr': 0.0003473108608552985, 'samples': 10975872, 'steps': 57165, 'loss/train': 1.4061572551727295} -11/07/2021 05:15:17 - INFO - __main__ - Step 57167: {'lr': 0.00034730597260584304, 'samples': 10976064, 'steps': 57166, 'loss/train': 1.1580924987792969} -11/07/2021 05:15:18 - INFO - __main__ - Step 57168: {'lr': 0.0003473010843125431, 'samples': 10976256, 'steps': 57167, 'loss/train': 1.3049694299697876} -11/07/2021 05:15:18 - INFO - __main__ - Step 57169: {'lr': 0.0003472961959754007, 'samples': 10976448, 'steps': 57168, 'loss/train': 1.7472347021102905} -11/07/2021 05:15:19 - INFO - __main__ - Step 57170: {'lr': 0.0003472913075944182, 'samples': 10976640, 'steps': 57169, 'loss/train': 1.2301182746887207} -11/07/2021 05:15:19 - INFO - __main__ - Step 57171: {'lr': 0.00034728641916959767, 'samples': 10976832, 'steps': 57170, 'loss/train': 1.4124161005020142} -11/07/2021 05:15:19 - INFO - __main__ - Step 57172: {'lr': 0.00034728153070094143, 'samples': 10977024, 'steps': 57171, 'loss/train': 1.0823720693588257} -11/07/2021 05:15:21 - INFO - __main__ - Step 57173: {'lr': 0.0003472766421884516, 'samples': 10977216, 'steps': 57172, 'loss/train': 1.1575038433074951} -11/07/2021 05:15:21 - INFO - __main__ - Step 57174: {'lr': 0.00034727175363213046, 'samples': 10977408, 'steps': 57173, 'loss/train': 0.38192084431648254} -11/07/2021 05:15:21 - INFO - __main__ - Step 57175: {'lr': 0.0003472668650319801, 'samples': 10977600, 'steps': 57174, 'loss/train': 1.71419095993042} -11/07/2021 05:15:22 - INFO - __main__ - Step 57176: {'lr': 0.0003472619763880029, 'samples': 10977792, 'steps': 57175, 'loss/train': 1.3020073175430298} -11/07/2021 05:15:22 - INFO - __main__ - Step 57177: {'lr': 0.00034725708770020085, 'samples': 10977984, 'steps': 57176, 'loss/train': 1.2572638988494873} -11/07/2021 05:15:23 - INFO - __main__ - Step 57178: {'lr': 0.0003472521989685763, 'samples': 10978176, 'steps': 57177, 'loss/train': 1.4011561870574951} -11/07/2021 05:15:23 - INFO - __main__ - Step 57179: {'lr': 0.00034724731019313145, 'samples': 10978368, 'steps': 57178, 'loss/train': 1.1475541591644287} -11/07/2021 05:15:24 - INFO - __main__ - Step 57180: {'lr': 0.0003472424213738684, 'samples': 10978560, 'steps': 57179, 'loss/train': 1.1881182193756104} -11/07/2021 05:15:24 - INFO - __main__ - Step 57181: {'lr': 0.0003472375325107894, 'samples': 10978752, 'steps': 57180, 'loss/train': 1.7085241079330444} -11/07/2021 05:15:24 - INFO - __main__ - Step 57182: {'lr': 0.00034723264360389674, 'samples': 10978944, 'steps': 57181, 'loss/train': 1.2377347946166992} -11/07/2021 05:15:25 - INFO - __main__ - Step 57183: {'lr': 0.0003472277546531925, 'samples': 10979136, 'steps': 57182, 'loss/train': 1.4597644805908203} -11/07/2021 05:15:26 - INFO - __main__ - Step 57184: {'lr': 0.00034722286565867897, 'samples': 10979328, 'steps': 57183, 'loss/train': 1.2952302694320679} -11/07/2021 05:15:26 - INFO - __main__ - Step 57185: {'lr': 0.00034721797662035824, 'samples': 10979520, 'steps': 57184, 'loss/train': 0.7012817859649658} -11/07/2021 05:15:26 - INFO - __main__ - Step 57186: {'lr': 0.00034721308753823266, 'samples': 10979712, 'steps': 57185, 'loss/train': 1.0798956155776978} -11/07/2021 05:15:27 - INFO - __main__ - Step 57187: {'lr': 0.00034720819841230433, 'samples': 10979904, 'steps': 57186, 'loss/train': 1.4146571159362793} -11/07/2021 05:15:28 - INFO - __main__ - Step 57188: {'lr': 0.0003472033092425755, 'samples': 10980096, 'steps': 57187, 'loss/train': 1.2016068696975708} -11/07/2021 05:15:28 - INFO - __main__ - Step 57189: {'lr': 0.00034719842002904844, 'samples': 10980288, 'steps': 57188, 'loss/train': 1.0058929920196533} -11/07/2021 05:15:29 - INFO - __main__ - Step 57190: {'lr': 0.00034719353077172516, 'samples': 10980480, 'steps': 57189, 'loss/train': 1.4530718326568604} -11/07/2021 05:15:29 - INFO - __main__ - Step 57191: {'lr': 0.00034718864147060803, 'samples': 10980672, 'steps': 57190, 'loss/train': 1.6307939291000366} -11/07/2021 05:15:29 - INFO - __main__ - Step 57192: {'lr': 0.00034718375212569916, 'samples': 10980864, 'steps': 57191, 'loss/train': 1.438184142112732} -11/07/2021 05:15:30 - INFO - __main__ - Step 57193: {'lr': 0.0003471788627370008, 'samples': 10981056, 'steps': 57192, 'loss/train': 1.6724183559417725} -11/07/2021 05:15:31 - INFO - __main__ - Step 57194: {'lr': 0.0003471739733045151, 'samples': 10981248, 'steps': 57193, 'loss/train': 0.655161440372467} -11/07/2021 05:15:31 - INFO - __main__ - Step 57195: {'lr': 0.00034716908382824435, 'samples': 10981440, 'steps': 57194, 'loss/train': 1.3965442180633545} -11/07/2021 05:15:31 - INFO - __main__ - Step 57196: {'lr': 0.0003471641943081908, 'samples': 10981632, 'steps': 57195, 'loss/train': 1.3838998079299927} -11/07/2021 05:15:32 - INFO - __main__ - Step 57197: {'lr': 0.0003471593047443564, 'samples': 10981824, 'steps': 57196, 'loss/train': 1.01152765750885} -11/07/2021 05:15:32 - INFO - __main__ - Step 57198: {'lr': 0.00034715441513674363, 'samples': 10982016, 'steps': 57197, 'loss/train': 1.327661156654358} -11/07/2021 05:15:33 - INFO - __main__ - Step 57199: {'lr': 0.00034714952548535455, 'samples': 10982208, 'steps': 57198, 'loss/train': 0.8171754479408264} -11/07/2021 05:15:34 - INFO - __main__ - Step 57200: {'lr': 0.0003471446357901914, 'samples': 10982400, 'steps': 57199, 'loss/train': 1.1679540872573853} -11/07/2021 05:15:34 - INFO - __main__ - Step 57201: {'lr': 0.0003471397460512563, 'samples': 10982592, 'steps': 57200, 'loss/train': 1.601515531539917} -11/07/2021 05:15:34 - INFO - __main__ - Step 57202: {'lr': 0.0003471348562685517, 'samples': 10982784, 'steps': 57201, 'loss/train': 1.4043967723846436} -11/07/2021 05:15:35 - INFO - __main__ - Step 57203: {'lr': 0.0003471299664420795, 'samples': 10982976, 'steps': 57202, 'loss/train': 0.9429094195365906} -11/07/2021 05:15:36 - INFO - __main__ - Step 57204: {'lr': 0.00034712507657184207, 'samples': 10983168, 'steps': 57203, 'loss/train': 1.6474299430847168} -11/07/2021 05:15:36 - INFO - __main__ - Step 57205: {'lr': 0.00034712018665784155, 'samples': 10983360, 'steps': 57204, 'loss/train': 1.2825877666473389} -11/07/2021 05:15:36 - INFO - __main__ - Step 57206: {'lr': 0.0003471152967000802, 'samples': 10983552, 'steps': 57205, 'loss/train': 1.379895806312561} -11/07/2021 05:15:37 - INFO - __main__ - Step 57207: {'lr': 0.0003471104066985602, 'samples': 10983744, 'steps': 57206, 'loss/train': 1.354645848274231} -11/07/2021 05:15:37 - INFO - __main__ - Step 57208: {'lr': 0.0003471055166532837, 'samples': 10983936, 'steps': 57207, 'loss/train': 1.132021188735962} -11/07/2021 05:15:38 - INFO - __main__ - Step 57209: {'lr': 0.00034710062656425304, 'samples': 10984128, 'steps': 57208, 'loss/train': 0.8864858150482178} -11/07/2021 05:15:38 - INFO - __main__ - Step 57210: {'lr': 0.0003470957364314703, 'samples': 10984320, 'steps': 57209, 'loss/train': 1.4582781791687012} -11/07/2021 05:15:39 - INFO - __main__ - Step 57211: {'lr': 0.0003470908462549377, 'samples': 10984512, 'steps': 57210, 'loss/train': 1.2331348657608032} -11/07/2021 05:15:39 - INFO - __main__ - Step 57212: {'lr': 0.00034708595603465743, 'samples': 10984704, 'steps': 57211, 'loss/train': 0.7234694957733154} -11/07/2021 05:15:39 - INFO - __main__ - Step 57213: {'lr': 0.0003470810657706318, 'samples': 10984896, 'steps': 57212, 'loss/train': 1.3726696968078613} -11/07/2021 05:15:41 - INFO - __main__ - Step 57214: {'lr': 0.0003470761754628629, 'samples': 10985088, 'steps': 57213, 'loss/train': 1.3842049837112427} -11/07/2021 05:15:41 - INFO - __main__ - Step 57215: {'lr': 0.000347071285111353, 'samples': 10985280, 'steps': 57214, 'loss/train': 1.4608348608016968} -11/07/2021 05:15:41 - INFO - __main__ - Step 57216: {'lr': 0.00034706639471610424, 'samples': 10985472, 'steps': 57215, 'loss/train': 0.8314490914344788} -11/07/2021 05:15:42 - INFO - __main__ - Step 57217: {'lr': 0.0003470615042771189, 'samples': 10985664, 'steps': 57216, 'loss/train': 1.5083117485046387} -11/07/2021 05:15:42 - INFO - __main__ - Step 57218: {'lr': 0.00034705661379439914, 'samples': 10985856, 'steps': 57217, 'loss/train': 0.9466352462768555} -11/07/2021 05:15:43 - INFO - __main__ - Step 57219: {'lr': 0.0003470517232679471, 'samples': 10986048, 'steps': 57218, 'loss/train': 1.3346738815307617} -11/07/2021 05:15:43 - INFO - __main__ - Step 57220: {'lr': 0.0003470468326977651, 'samples': 10986240, 'steps': 57219, 'loss/train': 0.9492648243904114} -11/07/2021 05:15:44 - INFO - __main__ - Step 57221: {'lr': 0.0003470419420838553, 'samples': 10986432, 'steps': 57220, 'loss/train': 1.3113689422607422} -11/07/2021 05:15:44 - INFO - __main__ - Step 57222: {'lr': 0.0003470370514262199, 'samples': 10986624, 'steps': 57221, 'loss/train': 1.5532441139221191} -11/07/2021 05:15:44 - INFO - __main__ - Step 57223: {'lr': 0.0003470321607248611, 'samples': 10986816, 'steps': 57222, 'loss/train': 1.6135445833206177} -11/07/2021 05:15:45 - INFO - __main__ - Step 57224: {'lr': 0.0003470272699797811, 'samples': 10987008, 'steps': 57223, 'loss/train': 1.5716966390609741} -11/07/2021 05:15:46 - INFO - __main__ - Step 57225: {'lr': 0.0003470223791909821, 'samples': 10987200, 'steps': 57224, 'loss/train': 1.6298424005508423} -11/07/2021 05:15:46 - INFO - __main__ - Step 57226: {'lr': 0.0003470174883584664, 'samples': 10987392, 'steps': 57225, 'loss/train': 1.3984442949295044} -11/07/2021 05:15:46 - INFO - __main__ - Step 57227: {'lr': 0.00034701259748223595, 'samples': 10987584, 'steps': 57226, 'loss/train': 1.1414973735809326} -11/07/2021 05:15:47 - INFO - __main__ - Step 57228: {'lr': 0.00034700770656229324, 'samples': 10987776, 'steps': 57227, 'loss/train': 1.8051258325576782} -11/07/2021 05:15:47 - INFO - __main__ - Step 57229: {'lr': 0.00034700281559864034, 'samples': 10987968, 'steps': 57228, 'loss/train': 1.304807186126709} -11/07/2021 05:15:48 - INFO - __main__ - Step 57230: {'lr': 0.00034699792459127945, 'samples': 10988160, 'steps': 57229, 'loss/train': 1.508192539215088} -11/07/2021 05:15:48 - INFO - __main__ - Step 57231: {'lr': 0.00034699303354021285, 'samples': 10988352, 'steps': 57230, 'loss/train': 1.1588743925094604} -11/07/2021 05:15:49 - INFO - __main__ - Step 57232: {'lr': 0.0003469881424454426, 'samples': 10988544, 'steps': 57231, 'loss/train': 1.6050984859466553} -11/07/2021 05:15:49 - INFO - __main__ - Step 57233: {'lr': 0.000346983251306971, 'samples': 10988736, 'steps': 57232, 'loss/train': 1.877519965171814} -11/07/2021 05:15:50 - INFO - __main__ - Step 57234: {'lr': 0.0003469783601248002, 'samples': 10988928, 'steps': 57233, 'loss/train': 1.5269972085952759} -11/07/2021 05:15:51 - INFO - __main__ - Step 57235: {'lr': 0.0003469734688989326, 'samples': 10989120, 'steps': 57234, 'loss/train': 1.4625635147094727} -11/07/2021 05:15:51 - INFO - __main__ - Step 57236: {'lr': 0.0003469685776293702, 'samples': 10989312, 'steps': 57235, 'loss/train': 1.305212378501892} -11/07/2021 05:15:51 - INFO - __main__ - Step 57237: {'lr': 0.0003469636863161152, 'samples': 10989504, 'steps': 57236, 'loss/train': 1.4039185047149658} -11/07/2021 05:15:52 - INFO - __main__ - Step 57238: {'lr': 0.0003469587949591698, 'samples': 10989696, 'steps': 57237, 'loss/train': 1.2485064268112183} -11/07/2021 05:15:52 - INFO - __main__ - Step 57239: {'lr': 0.0003469539035585364, 'samples': 10989888, 'steps': 57238, 'loss/train': 1.3334019184112549} -11/07/2021 05:15:53 - INFO - __main__ - Step 57240: {'lr': 0.00034694901211421695, 'samples': 10990080, 'steps': 57239, 'loss/train': 0.6343439221382141} -11/07/2021 05:15:53 - INFO - __main__ - Step 57241: {'lr': 0.00034694412062621384, 'samples': 10990272, 'steps': 57240, 'loss/train': 1.6191811561584473} -11/07/2021 05:15:54 - INFO - __main__ - Step 57242: {'lr': 0.0003469392290945292, 'samples': 10990464, 'steps': 57241, 'loss/train': 0.6367524862289429} -11/07/2021 05:15:54 - INFO - __main__ - Step 57243: {'lr': 0.00034693433751916525, 'samples': 10990656, 'steps': 57242, 'loss/train': 1.3679172992706299} -11/07/2021 05:15:54 - INFO - __main__ - Step 57244: {'lr': 0.0003469294459001242, 'samples': 10990848, 'steps': 57243, 'loss/train': 1.4669983386993408} -11/07/2021 05:15:56 - INFO - __main__ - Step 57245: {'lr': 0.0003469245542374082, 'samples': 10991040, 'steps': 57244, 'loss/train': 1.5077030658721924} -11/07/2021 05:15:56 - INFO - __main__ - Step 57246: {'lr': 0.00034691966253101947, 'samples': 10991232, 'steps': 57245, 'loss/train': 1.504335880279541} -11/07/2021 05:15:56 - INFO - __main__ - Step 57247: {'lr': 0.00034691477078096025, 'samples': 10991424, 'steps': 57246, 'loss/train': 1.3656114339828491} -11/07/2021 05:15:57 - INFO - __main__ - Step 57248: {'lr': 0.0003469098789872327, 'samples': 10991616, 'steps': 57247, 'loss/train': 1.659846305847168} -11/07/2021 05:15:57 - INFO - __main__ - Step 57249: {'lr': 0.0003469049871498392, 'samples': 10991808, 'steps': 57248, 'loss/train': 0.7325455546379089} -11/07/2021 05:15:58 - INFO - __main__ - Step 57250: {'lr': 0.0003469000952687817, 'samples': 10992000, 'steps': 57249, 'loss/train': 3.3924875259399414} -11/07/2021 05:15:59 - INFO - __main__ - Step 57251: {'lr': 0.0003468952033440625, 'samples': 10992192, 'steps': 57250, 'loss/train': 1.5785741806030273} -11/07/2021 05:15:59 - INFO - __main__ - Step 57252: {'lr': 0.00034689031137568384, 'samples': 10992384, 'steps': 57251, 'loss/train': 1.597221851348877} -11/07/2021 05:15:59 - INFO - __main__ - Step 57253: {'lr': 0.0003468854193636479, 'samples': 10992576, 'steps': 57252, 'loss/train': 1.3004043102264404} -11/07/2021 05:16:00 - INFO - __main__ - Step 57254: {'lr': 0.00034688052730795683, 'samples': 10992768, 'steps': 57253, 'loss/train': 1.6935105323791504} -11/07/2021 05:16:01 - INFO - __main__ - Step 57255: {'lr': 0.00034687563520861294, 'samples': 10992960, 'steps': 57254, 'loss/train': 1.0508880615234375} -11/07/2021 05:16:01 - INFO - __main__ - Step 57256: {'lr': 0.0003468707430656184, 'samples': 10993152, 'steps': 57255, 'loss/train': 1.217911958694458} -11/07/2021 05:16:01 - INFO - __main__ - Step 57257: {'lr': 0.00034686585087897537, 'samples': 10993344, 'steps': 57256, 'loss/train': 1.1200474500656128} -11/07/2021 05:16:02 - INFO - __main__ - Step 57258: {'lr': 0.0003468609586486861, 'samples': 10993536, 'steps': 57257, 'loss/train': 1.9295845031738281} -11/07/2021 05:16:02 - INFO - __main__ - Step 57259: {'lr': 0.00034685606637475274, 'samples': 10993728, 'steps': 57258, 'loss/train': 1.585288405418396} -11/07/2021 05:16:03 - INFO - __main__ - Step 57260: {'lr': 0.0003468511740571776, 'samples': 10993920, 'steps': 57259, 'loss/train': 0.9167661666870117} -11/07/2021 05:16:03 - INFO - __main__ - Step 57261: {'lr': 0.00034684628169596277, 'samples': 10994112, 'steps': 57260, 'loss/train': 1.277349829673767} -11/07/2021 05:16:04 - INFO - __main__ - Step 57262: {'lr': 0.0003468413892911105, 'samples': 10994304, 'steps': 57261, 'loss/train': 1.2273873090744019} -11/07/2021 05:16:04 - INFO - __main__ - Step 57263: {'lr': 0.00034683649684262303, 'samples': 10994496, 'steps': 57262, 'loss/train': 1.5148195028305054} -11/07/2021 05:16:05 - INFO - __main__ - Step 57264: {'lr': 0.0003468316043505025, 'samples': 10994688, 'steps': 57263, 'loss/train': 1.4055837392807007} -11/07/2021 05:16:06 - INFO - __main__ - Step 57265: {'lr': 0.00034682671181475113, 'samples': 10994880, 'steps': 57264, 'loss/train': 1.6199654340744019} -11/07/2021 05:16:06 - INFO - __main__ - Step 57266: {'lr': 0.00034682181923537114, 'samples': 10995072, 'steps': 57265, 'loss/train': 1.3538107872009277} -11/07/2021 05:16:06 - INFO - __main__ - Step 57267: {'lr': 0.0003468169266123647, 'samples': 10995264, 'steps': 57266, 'loss/train': 1.1905224323272705} -11/07/2021 05:16:07 - INFO - __main__ - Step 57268: {'lr': 0.0003468120339457341, 'samples': 10995456, 'steps': 57267, 'loss/train': 1.4119234085083008} -11/07/2021 05:16:07 - INFO - __main__ - Step 57269: {'lr': 0.00034680714123548146, 'samples': 10995648, 'steps': 57268, 'loss/train': 1.2339471578598022} -11/07/2021 05:16:07 - INFO - __main__ - Step 57270: {'lr': 0.0003468022484816091, 'samples': 10995840, 'steps': 57269, 'loss/train': 1.278130292892456} -11/07/2021 05:16:08 - INFO - __main__ - Step 57271: {'lr': 0.0003467973556841191, 'samples': 10996032, 'steps': 57270, 'loss/train': 1.2380174398422241} -11/07/2021 05:16:09 - INFO - __main__ - Step 57272: {'lr': 0.00034679246284301365, 'samples': 10996224, 'steps': 57271, 'loss/train': 1.3780403137207031} -11/07/2021 05:16:09 - INFO - __main__ - Step 57273: {'lr': 0.000346787569958295, 'samples': 10996416, 'steps': 57272, 'loss/train': 1.2759188413619995} -11/07/2021 05:16:09 - INFO - __main__ - Step 57274: {'lr': 0.0003467826770299654, 'samples': 10996608, 'steps': 57273, 'loss/train': 1.464417576789856} -11/07/2021 05:16:10 - INFO - __main__ - Step 57275: {'lr': 0.000346777784058027, 'samples': 10996800, 'steps': 57274, 'loss/train': 1.413720965385437} -11/07/2021 05:16:11 - INFO - __main__ - Step 57276: {'lr': 0.0003467728910424821, 'samples': 10996992, 'steps': 57275, 'loss/train': 1.4004560708999634} -11/07/2021 05:16:11 - INFO - __main__ - Step 57277: {'lr': 0.0003467679979833328, 'samples': 10997184, 'steps': 57276, 'loss/train': 1.57266366481781} -11/07/2021 05:16:11 - INFO - __main__ - Step 57278: {'lr': 0.00034676310488058126, 'samples': 10997376, 'steps': 57277, 'loss/train': 1.1300008296966553} -11/07/2021 05:16:12 - INFO - __main__ - Step 57279: {'lr': 0.00034675821173422983, 'samples': 10997568, 'steps': 57278, 'loss/train': 0.7691164612770081} -11/07/2021 05:16:12 - INFO - __main__ - Step 57280: {'lr': 0.0003467533185442806, 'samples': 10997760, 'steps': 57279, 'loss/train': 1.7687597274780273} -11/07/2021 05:16:13 - INFO - __main__ - Step 57281: {'lr': 0.00034674842531073587, 'samples': 10997952, 'steps': 57280, 'loss/train': 1.3839212656021118} -11/07/2021 05:16:14 - INFO - __main__ - Step 57282: {'lr': 0.0003467435320335978, 'samples': 10998144, 'steps': 57281, 'loss/train': 1.2992281913757324} -11/07/2021 05:16:14 - INFO - __main__ - Step 57283: {'lr': 0.00034673863871286854, 'samples': 10998336, 'steps': 57282, 'loss/train': 1.5022506713867188} -11/07/2021 05:16:14 - INFO - __main__ - Step 57284: {'lr': 0.00034673374534855035, 'samples': 10998528, 'steps': 57283, 'loss/train': 1.6627693176269531} -11/07/2021 05:16:15 - INFO - __main__ - Step 57285: {'lr': 0.0003467288519406454, 'samples': 10998720, 'steps': 57284, 'loss/train': 1.5031355619430542} -11/07/2021 05:16:16 - INFO - __main__ - Step 57286: {'lr': 0.00034672395848915594, 'samples': 10998912, 'steps': 57285, 'loss/train': 1.4156684875488281} -11/07/2021 05:16:16 - INFO - __main__ - Step 57287: {'lr': 0.00034671906499408417, 'samples': 10999104, 'steps': 57286, 'loss/train': 1.271929383277893} -11/07/2021 05:16:16 - INFO - __main__ - Step 57288: {'lr': 0.0003467141714554323, 'samples': 10999296, 'steps': 57287, 'loss/train': 1.4576336145401} -11/07/2021 05:16:17 - INFO - __main__ - Step 57289: {'lr': 0.0003467092778732025, 'samples': 10999488, 'steps': 57288, 'loss/train': 1.3043655157089233} -11/07/2021 05:16:17 - INFO - __main__ - Step 57290: {'lr': 0.00034670438424739695, 'samples': 10999680, 'steps': 57289, 'loss/train': 1.2958300113677979} -11/07/2021 05:16:18 - INFO - __main__ - Step 57291: {'lr': 0.000346699490578018, 'samples': 10999872, 'steps': 57290, 'loss/train': 1.3538079261779785} -11/07/2021 05:16:19 - INFO - __main__ - Step 57292: {'lr': 0.00034669459686506766, 'samples': 11000064, 'steps': 57291, 'loss/train': 0.9389482736587524} -11/07/2021 05:16:19 - INFO - __main__ - Step 57293: {'lr': 0.0003466897031085482, 'samples': 11000256, 'steps': 57292, 'loss/train': 1.2801103591918945} -11/07/2021 05:16:19 - INFO - __main__ - Step 57294: {'lr': 0.000346684809308462, 'samples': 11000448, 'steps': 57293, 'loss/train': 1.7676334381103516} -11/07/2021 05:16:20 - INFO - __main__ - Step 57295: {'lr': 0.00034667991546481096, 'samples': 11000640, 'steps': 57294, 'loss/train': 1.8828591108322144} -11/07/2021 05:16:21 - INFO - __main__ - Step 57296: {'lr': 0.0003466750215775975, 'samples': 11000832, 'steps': 57295, 'loss/train': 1.4249674081802368} -11/07/2021 05:16:21 - INFO - __main__ - Step 57297: {'lr': 0.0003466701276468238, 'samples': 11001024, 'steps': 57296, 'loss/train': 1.5335332155227661} -11/07/2021 05:16:21 - INFO - __main__ - Step 57298: {'lr': 0.00034666523367249196, 'samples': 11001216, 'steps': 57297, 'loss/train': 1.4811491966247559} -11/07/2021 05:16:22 - INFO - __main__ - Step 57299: {'lr': 0.0003466603396546043, 'samples': 11001408, 'steps': 57298, 'loss/train': 1.5754340887069702} -11/07/2021 05:16:22 - INFO - __main__ - Step 57300: {'lr': 0.00034665544559316303, 'samples': 11001600, 'steps': 57299, 'loss/train': 1.0971513986587524} -11/07/2021 05:16:23 - INFO - __main__ - Step 57301: {'lr': 0.0003466505514881703, 'samples': 11001792, 'steps': 57300, 'loss/train': 3.5548441410064697} -11/07/2021 05:16:23 - INFO - __main__ - Step 57302: {'lr': 0.00034664565733962823, 'samples': 11001984, 'steps': 57301, 'loss/train': 1.138931155204773} -11/07/2021 05:16:24 - INFO - __main__ - Step 57303: {'lr': 0.0003466407631475392, 'samples': 11002176, 'steps': 57302, 'loss/train': 1.2977111339569092} -11/07/2021 05:16:24 - INFO - __main__ - Step 57304: {'lr': 0.00034663586891190524, 'samples': 11002368, 'steps': 57303, 'loss/train': 1.4463646411895752} -11/07/2021 05:16:24 - INFO - __main__ - Step 57305: {'lr': 0.0003466309746327288, 'samples': 11002560, 'steps': 57304, 'loss/train': 1.1357953548431396} -11/07/2021 05:16:26 - INFO - __main__ - Step 57306: {'lr': 0.0003466260803100118, 'samples': 11002752, 'steps': 57305, 'loss/train': 1.6303383111953735} -11/07/2021 05:16:26 - INFO - __main__ - Step 57307: {'lr': 0.0003466211859437566, 'samples': 11002944, 'steps': 57306, 'loss/train': 1.6040101051330566} -11/07/2021 05:16:27 - INFO - __main__ - Step 57308: {'lr': 0.00034661629153396543, 'samples': 11003136, 'steps': 57307, 'loss/train': 1.4108153581619263} -11/07/2021 05:16:27 - INFO - __main__ - Step 57309: {'lr': 0.00034661139708064043, 'samples': 11003328, 'steps': 57308, 'loss/train': 0.22060233354568481} -11/07/2021 05:16:27 - INFO - __main__ - Step 57310: {'lr': 0.00034660650258378384, 'samples': 11003520, 'steps': 57309, 'loss/train': 1.1796612739562988} -11/07/2021 05:16:28 - INFO - __main__ - Step 57311: {'lr': 0.00034660160804339784, 'samples': 11003712, 'steps': 57310, 'loss/train': 1.29084312915802} -11/07/2021 05:16:29 - INFO - __main__ - Step 57312: {'lr': 0.0003465967134594847, 'samples': 11003904, 'steps': 57311, 'loss/train': 1.0948700904846191} -11/07/2021 05:16:29 - INFO - __main__ - Step 57313: {'lr': 0.0003465918188320465, 'samples': 11004096, 'steps': 57312, 'loss/train': 0.959750235080719} -11/07/2021 05:16:29 - INFO - __main__ - Step 57314: {'lr': 0.0003465869241610855, 'samples': 11004288, 'steps': 57313, 'loss/train': 1.9232094287872314} -11/07/2021 05:16:30 - INFO - __main__ - Step 57315: {'lr': 0.00034658202944660396, 'samples': 11004480, 'steps': 57314, 'loss/train': 1.5287576913833618} -11/07/2021 05:16:30 - INFO - __main__ - Step 57316: {'lr': 0.000346577134688604, 'samples': 11004672, 'steps': 57315, 'loss/train': 1.2158355712890625} -11/07/2021 05:16:31 - INFO - __main__ - Step 57317: {'lr': 0.00034657223988708796, 'samples': 11004864, 'steps': 57316, 'loss/train': 1.6573148965835571} -11/07/2021 05:16:31 - INFO - __main__ - Step 57318: {'lr': 0.0003465673450420579, 'samples': 11005056, 'steps': 57317, 'loss/train': 1.4946718215942383} -11/07/2021 05:16:32 - INFO - __main__ - Step 57319: {'lr': 0.0003465624501535161, 'samples': 11005248, 'steps': 57318, 'loss/train': 1.2168070077896118} -11/07/2021 05:16:32 - INFO - __main__ - Step 57320: {'lr': 0.0003465575552214648, 'samples': 11005440, 'steps': 57319, 'loss/train': 1.6642897129058838} -11/07/2021 05:16:32 - INFO - __main__ - Step 57321: {'lr': 0.00034655266024590604, 'samples': 11005632, 'steps': 57320, 'loss/train': 1.0355887413024902} -11/07/2021 05:16:33 - INFO - __main__ - Step 57322: {'lr': 0.0003465477652268422, 'samples': 11005824, 'steps': 57321, 'loss/train': 1.2140164375305176} -11/07/2021 05:16:34 - INFO - __main__ - Step 57323: {'lr': 0.0003465428701642755, 'samples': 11006016, 'steps': 57322, 'loss/train': 1.493344783782959} -11/07/2021 05:16:34 - INFO - __main__ - Step 57324: {'lr': 0.00034653797505820795, 'samples': 11006208, 'steps': 57323, 'loss/train': 1.6135051250457764} -11/07/2021 05:16:35 - INFO - __main__ - Step 57325: {'lr': 0.000346533079908642, 'samples': 11006400, 'steps': 57324, 'loss/train': 1.1621938943862915} -11/07/2021 05:16:35 - INFO - __main__ - Step 57326: {'lr': 0.0003465281847155796, 'samples': 11006592, 'steps': 57325, 'loss/train': 1.454559087753296} -11/07/2021 05:16:36 - INFO - __main__ - Step 57327: {'lr': 0.00034652328947902317, 'samples': 11006784, 'steps': 57326, 'loss/train': 1.4118322134017944} -11/07/2021 05:16:36 - INFO - __main__ - Step 57328: {'lr': 0.0003465183941989748, 'samples': 11006976, 'steps': 57327, 'loss/train': 0.8050600290298462} -11/07/2021 05:16:37 - INFO - __main__ - Step 57329: {'lr': 0.00034651349887543674, 'samples': 11007168, 'steps': 57328, 'loss/train': 1.7745147943496704} -11/07/2021 05:16:37 - INFO - __main__ - Step 57330: {'lr': 0.00034650860350841125, 'samples': 11007360, 'steps': 57329, 'loss/train': 1.2334222793579102} -11/07/2021 05:16:37 - INFO - __main__ - Step 57331: {'lr': 0.0003465037080979004, 'samples': 11007552, 'steps': 57330, 'loss/train': 1.2701380252838135} -11/07/2021 05:16:38 - INFO - __main__ - Step 57332: {'lr': 0.0003464988126439065, 'samples': 11007744, 'steps': 57331, 'loss/train': 1.4824724197387695} -11/07/2021 05:16:39 - INFO - __main__ - Step 57333: {'lr': 0.0003464939171464317, 'samples': 11007936, 'steps': 57332, 'loss/train': 1.4551417827606201} -11/07/2021 05:16:39 - INFO - __main__ - Step 57334: {'lr': 0.0003464890216054782, 'samples': 11008128, 'steps': 57333, 'loss/train': 1.0542746782302856} -11/07/2021 05:16:39 - INFO - __main__ - Step 57335: {'lr': 0.0003464841260210483, 'samples': 11008320, 'steps': 57334, 'loss/train': 1.463664174079895} -11/07/2021 05:16:40 - INFO - __main__ - Step 57336: {'lr': 0.0003464792303931441, 'samples': 11008512, 'steps': 57335, 'loss/train': 1.3808726072311401} -11/07/2021 05:16:41 - INFO - __main__ - Step 57337: {'lr': 0.0003464743347217679, 'samples': 11008704, 'steps': 57336, 'loss/train': 1.4817286729812622} -11/07/2021 05:16:41 - INFO - __main__ - Step 57338: {'lr': 0.00034646943900692187, 'samples': 11008896, 'steps': 57337, 'loss/train': 1.192395806312561} -11/07/2021 05:16:41 - INFO - __main__ - Step 57339: {'lr': 0.0003464645432486081, 'samples': 11009088, 'steps': 57338, 'loss/train': 1.324694275856018} -11/07/2021 05:16:42 - INFO - __main__ - Step 57340: {'lr': 0.000346459647446829, 'samples': 11009280, 'steps': 57339, 'loss/train': 1.774898648262024} -11/07/2021 05:16:42 - INFO - __main__ - Step 57341: {'lr': 0.0003464547516015866, 'samples': 11009472, 'steps': 57340, 'loss/train': 1.6069287061691284} -11/07/2021 05:16:43 - INFO - __main__ - Step 57342: {'lr': 0.0003464498557128832, 'samples': 11009664, 'steps': 57341, 'loss/train': 5.762038707733154} -11/07/2021 05:16:43 - INFO - __main__ - Step 57343: {'lr': 0.00034644495978072094, 'samples': 11009856, 'steps': 57342, 'loss/train': 1.7801626920700073} -11/07/2021 05:16:44 - INFO - __main__ - Step 57344: {'lr': 0.00034644006380510215, 'samples': 11010048, 'steps': 57343, 'loss/train': 1.6430482864379883} -11/07/2021 05:16:44 - INFO - __main__ - Step 57345: {'lr': 0.0003464351677860289, 'samples': 11010240, 'steps': 57344, 'loss/train': 1.46976637840271} -11/07/2021 05:16:45 - INFO - __main__ - Step 57346: {'lr': 0.00034643027172350345, 'samples': 11010432, 'steps': 57345, 'loss/train': 1.1630475521087646} -11/07/2021 05:16:45 - INFO - __main__ - Step 57347: {'lr': 0.000346425375617528, 'samples': 11010624, 'steps': 57346, 'loss/train': 0.7415656447410583} -11/07/2021 05:16:46 - INFO - __main__ - Step 57348: {'lr': 0.00034642047946810477, 'samples': 11010816, 'steps': 57347, 'loss/train': 1.3568874597549438} -11/07/2021 05:16:46 - INFO - __main__ - Step 57349: {'lr': 0.000346415583275236, 'samples': 11011008, 'steps': 57348, 'loss/train': 1.4117162227630615} -11/07/2021 05:16:47 - INFO - __main__ - Step 57350: {'lr': 0.00034641068703892387, 'samples': 11011200, 'steps': 57349, 'loss/train': 1.1161599159240723} -11/07/2021 05:16:47 - INFO - __main__ - Step 57351: {'lr': 0.00034640579075917053, 'samples': 11011392, 'steps': 57350, 'loss/train': 1.0881834030151367} -11/07/2021 05:16:47 - INFO - __main__ - Step 57352: {'lr': 0.0003464008944359782, 'samples': 11011584, 'steps': 57351, 'loss/train': 1.755181074142456} -11/07/2021 05:16:48 - INFO - __main__ - Step 57353: {'lr': 0.00034639599806934917, 'samples': 11011776, 'steps': 57352, 'loss/train': 1.1692019701004028} -11/07/2021 05:16:49 - INFO - __main__ - Step 57354: {'lr': 0.0003463911016592856, 'samples': 11011968, 'steps': 57353, 'loss/train': 1.4031453132629395} -11/07/2021 05:16:49 - INFO - __main__ - Step 57355: {'lr': 0.0003463862052057896, 'samples': 11012160, 'steps': 57354, 'loss/train': 1.7824376821517944} -11/07/2021 05:16:49 - INFO - __main__ - Step 57356: {'lr': 0.00034638130870886353, 'samples': 11012352, 'steps': 57355, 'loss/train': 1.1180835962295532} -11/07/2021 05:16:50 - INFO - __main__ - Step 57357: {'lr': 0.0003463764121685096, 'samples': 11012544, 'steps': 57356, 'loss/train': 1.5490951538085938} -11/07/2021 05:16:51 - INFO - __main__ - Step 57358: {'lr': 0.0003463715155847298, 'samples': 11012736, 'steps': 57357, 'loss/train': 1.4867855310440063} -11/07/2021 05:16:51 - INFO - __main__ - Step 57359: {'lr': 0.00034636661895752653, 'samples': 11012928, 'steps': 57358, 'loss/train': 1.299237608909607} -11/07/2021 05:16:52 - INFO - __main__ - Step 57360: {'lr': 0.000346361722286902, 'samples': 11013120, 'steps': 57359, 'loss/train': 1.4953867197036743} -11/07/2021 05:16:52 - INFO - __main__ - Step 57361: {'lr': 0.0003463568255728583, 'samples': 11013312, 'steps': 57360, 'loss/train': 1.8217616081237793} -11/07/2021 05:16:52 - INFO - __main__ - Step 57362: {'lr': 0.0003463519288153977, 'samples': 11013504, 'steps': 57361, 'loss/train': 1.428085207939148} -11/07/2021 05:16:53 - INFO - __main__ - Step 57363: {'lr': 0.00034634703201452243, 'samples': 11013696, 'steps': 57362, 'loss/train': 1.5637208223342896} -11/07/2021 05:16:54 - INFO - __main__ - Step 57364: {'lr': 0.00034634213517023473, 'samples': 11013888, 'steps': 57363, 'loss/train': 1.333274245262146} -11/07/2021 05:16:54 - INFO - __main__ - Step 57365: {'lr': 0.0003463372382825367, 'samples': 11014080, 'steps': 57364, 'loss/train': 0.20709101855754852} -11/07/2021 05:16:54 - INFO - __main__ - Step 57366: {'lr': 0.0003463323413514306, 'samples': 11014272, 'steps': 57365, 'loss/train': 1.1538246870040894} -11/07/2021 05:16:55 - INFO - __main__ - Step 57367: {'lr': 0.0003463274443769186, 'samples': 11014464, 'steps': 57366, 'loss/train': 1.3712096214294434} -11/07/2021 05:16:55 - INFO - __main__ - Step 57368: {'lr': 0.000346322547359003, 'samples': 11014656, 'steps': 57367, 'loss/train': 1.385015606880188} -11/07/2021 05:16:56 - INFO - __main__ - Step 57369: {'lr': 0.00034631765029768594, 'samples': 11014848, 'steps': 57368, 'loss/train': 1.4773645401000977} -11/07/2021 05:16:56 - INFO - __main__ - Step 57370: {'lr': 0.0003463127531929696, 'samples': 11015040, 'steps': 57369, 'loss/train': 1.287975788116455} -11/07/2021 05:16:57 - INFO - __main__ - Step 57371: {'lr': 0.0003463078560448562, 'samples': 11015232, 'steps': 57370, 'loss/train': 1.7418196201324463} -11/07/2021 05:16:57 - INFO - __main__ - Step 57372: {'lr': 0.000346302958853348, 'samples': 11015424, 'steps': 57371, 'loss/train': 1.3799270391464233} -11/07/2021 05:16:57 - INFO - __main__ - Step 57373: {'lr': 0.0003462980616184472, 'samples': 11015616, 'steps': 57372, 'loss/train': 1.3816124200820923} -11/07/2021 05:16:58 - INFO - __main__ - Step 57374: {'lr': 0.0003462931643401559, 'samples': 11015808, 'steps': 57373, 'loss/train': 1.3825258016586304} -11/07/2021 05:16:59 - INFO - __main__ - Step 57375: {'lr': 0.00034628826701847644, 'samples': 11016000, 'steps': 57374, 'loss/train': 0.2318015843629837} -11/07/2021 05:16:59 - INFO - __main__ - Step 57376: {'lr': 0.000346283369653411, 'samples': 11016192, 'steps': 57375, 'loss/train': 1.0265570878982544} -11/07/2021 05:17:00 - INFO - __main__ - Step 57377: {'lr': 0.0003462784722449617, 'samples': 11016384, 'steps': 57376, 'loss/train': 1.0038529634475708} -11/07/2021 05:17:00 - INFO - __main__ - Step 57378: {'lr': 0.00034627357479313087, 'samples': 11016576, 'steps': 57377, 'loss/train': 1.564623236656189} -11/07/2021 05:17:02 - INFO - __main__ - Step 57379: {'lr': 0.0003462686772979206, 'samples': 11016768, 'steps': 57378, 'loss/train': 0.4925709664821625} -11/07/2021 05:17:02 - INFO - __main__ - Step 57380: {'lr': 0.00034626377975933314, 'samples': 11016960, 'steps': 57379, 'loss/train': 1.9429572820663452} -11/07/2021 05:17:02 - INFO - __main__ - Step 57381: {'lr': 0.00034625888217737076, 'samples': 11017152, 'steps': 57380, 'loss/train': 1.6184098720550537} -11/07/2021 05:17:03 - INFO - __main__ - Step 57382: {'lr': 0.0003462539845520356, 'samples': 11017344, 'steps': 57381, 'loss/train': 1.3695964813232422} -11/07/2021 05:17:03 - INFO - __main__ - Step 57383: {'lr': 0.0003462490868833298, 'samples': 11017536, 'steps': 57382, 'loss/train': 1.2670353651046753} -11/07/2021 05:17:03 - INFO - __main__ - Step 57384: {'lr': 0.00034624418917125575, 'samples': 11017728, 'steps': 57383, 'loss/train': 0.5824760794639587} -11/07/2021 05:17:05 - INFO - __main__ - Step 57385: {'lr': 0.00034623929141581555, 'samples': 11017920, 'steps': 57384, 'loss/train': 1.0204366445541382} -11/07/2021 05:17:05 - INFO - __main__ - Step 57386: {'lr': 0.0003462343936170114, 'samples': 11018112, 'steps': 57385, 'loss/train': 1.1853617429733276} -11/07/2021 05:17:05 - INFO - __main__ - Step 57387: {'lr': 0.0003462294957748455, 'samples': 11018304, 'steps': 57386, 'loss/train': 1.394788384437561} -11/07/2021 05:17:06 - INFO - __main__ - Step 57388: {'lr': 0.00034622459788932004, 'samples': 11018496, 'steps': 57387, 'loss/train': 1.415103554725647} -11/07/2021 05:17:06 - INFO - __main__ - Step 57389: {'lr': 0.00034621969996043725, 'samples': 11018688, 'steps': 57388, 'loss/train': 1.2047784328460693} -11/07/2021 05:17:07 - INFO - __main__ - Step 57390: {'lr': 0.0003462148019881994, 'samples': 11018880, 'steps': 57389, 'loss/train': 1.1877517700195312} -11/07/2021 05:17:07 - INFO - __main__ - Step 57391: {'lr': 0.0003462099039726087, 'samples': 11019072, 'steps': 57390, 'loss/train': 1.1441655158996582} -11/07/2021 05:17:08 - INFO - __main__ - Step 57392: {'lr': 0.0003462050059136672, 'samples': 11019264, 'steps': 57391, 'loss/train': 1.7648218870162964} -11/07/2021 05:17:08 - INFO - __main__ - Step 57393: {'lr': 0.00034620010781137724, 'samples': 11019456, 'steps': 57392, 'loss/train': 1.5704514980316162} -11/07/2021 05:17:08 - INFO - __main__ - Step 57394: {'lr': 0.000346195209665741, 'samples': 11019648, 'steps': 57393, 'loss/train': 1.6239277124404907} -11/07/2021 05:17:09 - INFO - __main__ - Step 57395: {'lr': 0.0003461903114767607, 'samples': 11019840, 'steps': 57394, 'loss/train': 0.7149443626403809} -11/07/2021 05:17:10 - INFO - __main__ - Step 57396: {'lr': 0.00034618541324443844, 'samples': 11020032, 'steps': 57395, 'loss/train': 1.5315989255905151} -11/07/2021 05:17:10 - INFO - __main__ - Step 57397: {'lr': 0.0003461805149687767, 'samples': 11020224, 'steps': 57396, 'loss/train': 1.3829823732376099} -11/07/2021 05:17:10 - INFO - __main__ - Step 57398: {'lr': 0.0003461756166497773, 'samples': 11020416, 'steps': 57397, 'loss/train': 1.4139355421066284} -11/07/2021 05:17:11 - INFO - __main__ - Step 57399: {'lr': 0.00034617071828744274, 'samples': 11020608, 'steps': 57398, 'loss/train': 1.1383767127990723} -11/07/2021 05:17:12 - INFO - __main__ - Step 57400: {'lr': 0.00034616581988177516, 'samples': 11020800, 'steps': 57399, 'loss/train': 1.0450670719146729} -11/07/2021 05:17:12 - INFO - __main__ - Step 57401: {'lr': 0.00034616092143277674, 'samples': 11020992, 'steps': 57400, 'loss/train': 0.9170766472816467} -11/07/2021 05:17:13 - INFO - __main__ - Step 57402: {'lr': 0.0003461560229404497, 'samples': 11021184, 'steps': 57401, 'loss/train': 2.8225150108337402} -11/07/2021 05:17:13 - INFO - __main__ - Step 57403: {'lr': 0.0003461511244047962, 'samples': 11021376, 'steps': 57402, 'loss/train': 1.3104650974273682} -11/07/2021 05:17:13 - INFO - __main__ - Step 57404: {'lr': 0.0003461462258258185, 'samples': 11021568, 'steps': 57403, 'loss/train': 1.458613634109497} -11/07/2021 05:17:14 - INFO - __main__ - Step 57405: {'lr': 0.00034614132720351884, 'samples': 11021760, 'steps': 57404, 'loss/train': 0.919306218624115} -11/07/2021 05:17:15 - INFO - __main__ - Step 57406: {'lr': 0.00034613642853789927, 'samples': 11021952, 'steps': 57405, 'loss/train': 1.053566813468933} -11/07/2021 05:17:15 - INFO - __main__ - Step 57407: {'lr': 0.00034613152982896224, 'samples': 11022144, 'steps': 57406, 'loss/train': 1.1296557188034058} -11/07/2021 05:17:15 - INFO - __main__ - Step 57408: {'lr': 0.0003461266310767097, 'samples': 11022336, 'steps': 57407, 'loss/train': 1.511297583580017} -11/07/2021 05:17:16 - INFO - __main__ - Step 57409: {'lr': 0.00034612173228114405, 'samples': 11022528, 'steps': 57408, 'loss/train': 1.3894857168197632} -11/07/2021 05:17:17 - INFO - __main__ - Step 57410: {'lr': 0.00034611683344226745, 'samples': 11022720, 'steps': 57409, 'loss/train': 1.1479789018630981} -11/07/2021 05:17:17 - INFO - __main__ - Step 57411: {'lr': 0.0003461119345600821, 'samples': 11022912, 'steps': 57410, 'loss/train': 1.1791572570800781} -11/07/2021 05:17:17 - INFO - __main__ - Step 57412: {'lr': 0.0003461070356345902, 'samples': 11023104, 'steps': 57411, 'loss/train': 1.347753643989563} -11/07/2021 05:17:18 - INFO - __main__ - Step 57413: {'lr': 0.0003461021366657939, 'samples': 11023296, 'steps': 57412, 'loss/train': 1.4777131080627441} -11/07/2021 05:17:18 - INFO - __main__ - Step 57414: {'lr': 0.00034609723765369546, 'samples': 11023488, 'steps': 57413, 'loss/train': 0.8746947646141052} -11/07/2021 05:17:19 - INFO - __main__ - Step 57415: {'lr': 0.00034609233859829707, 'samples': 11023680, 'steps': 57414, 'loss/train': 1.1914379596710205} -11/07/2021 05:17:20 - INFO - __main__ - Step 57416: {'lr': 0.00034608743949960096, 'samples': 11023872, 'steps': 57415, 'loss/train': 0.7074412703514099} -11/07/2021 05:17:20 - INFO - __main__ - Step 57417: {'lr': 0.00034608254035760946, 'samples': 11024064, 'steps': 57416, 'loss/train': 1.6975936889648438} -11/07/2021 05:17:20 - INFO - __main__ - Step 57418: {'lr': 0.0003460776411723245, 'samples': 11024256, 'steps': 57417, 'loss/train': 1.3936597108840942} -11/07/2021 05:17:21 - INFO - __main__ - Step 57419: {'lr': 0.00034607274194374847, 'samples': 11024448, 'steps': 57418, 'loss/train': 1.178491234779358} -11/07/2021 05:17:21 - INFO - __main__ - Step 57420: {'lr': 0.00034606784267188364, 'samples': 11024640, 'steps': 57419, 'loss/train': 1.1270482540130615} -11/07/2021 05:17:22 - INFO - __main__ - Step 57421: {'lr': 0.000346062943356732, 'samples': 11024832, 'steps': 57420, 'loss/train': 1.1398437023162842} -11/07/2021 05:17:22 - INFO - __main__ - Step 57422: {'lr': 0.00034605804399829595, 'samples': 11025024, 'steps': 57421, 'loss/train': 1.578539252281189} -11/07/2021 05:17:23 - INFO - __main__ - Step 57423: {'lr': 0.00034605314459657763, 'samples': 11025216, 'steps': 57422, 'loss/train': 1.3543661832809448} -11/07/2021 05:17:23 - INFO - __main__ - Step 57424: {'lr': 0.00034604824515157916, 'samples': 11025408, 'steps': 57423, 'loss/train': 1.1689528226852417} -11/07/2021 05:17:23 - INFO - __main__ - Step 57425: {'lr': 0.0003460433456633029, 'samples': 11025600, 'steps': 57424, 'loss/train': 1.2760167121887207} -11/07/2021 05:17:25 - INFO - __main__ - Step 57426: {'lr': 0.000346038446131751, 'samples': 11025792, 'steps': 57425, 'loss/train': 1.5373750925064087} -11/07/2021 05:17:25 - INFO - __main__ - Step 57427: {'lr': 0.0003460335465569256, 'samples': 11025984, 'steps': 57426, 'loss/train': 0.09772712737321854} -11/07/2021 05:17:25 - INFO - __main__ - Step 57428: {'lr': 0.0003460286469388291, 'samples': 11026176, 'steps': 57427, 'loss/train': 1.454162836074829} -11/07/2021 05:17:26 - INFO - __main__ - Step 57429: {'lr': 0.0003460237472774634, 'samples': 11026368, 'steps': 57428, 'loss/train': 1.8001880645751953} -11/07/2021 05:17:26 - INFO - __main__ - Step 57430: {'lr': 0.000346018847572831, 'samples': 11026560, 'steps': 57429, 'loss/train': 1.9741418361663818} -11/07/2021 05:17:27 - INFO - __main__ - Step 57431: {'lr': 0.00034601394782493393, 'samples': 11026752, 'steps': 57430, 'loss/train': 1.4095287322998047} -11/07/2021 05:17:28 - INFO - __main__ - Step 57432: {'lr': 0.00034600904803377454, 'samples': 11026944, 'steps': 57431, 'loss/train': 1.6216919422149658} -11/07/2021 05:17:28 - INFO - __main__ - Step 57433: {'lr': 0.0003460041481993549, 'samples': 11027136, 'steps': 57432, 'loss/train': 1.2803337574005127} -11/07/2021 05:17:28 - INFO - __main__ - Step 57434: {'lr': 0.0003459992483216773, 'samples': 11027328, 'steps': 57433, 'loss/train': 1.4107896089553833} -11/07/2021 05:17:29 - INFO - __main__ - Step 57435: {'lr': 0.0003459943484007438, 'samples': 11027520, 'steps': 57434, 'loss/train': 0.09461843967437744} -11/07/2021 05:17:30 - INFO - __main__ - Step 57436: {'lr': 0.0003459894484365568, 'samples': 11027712, 'steps': 57435, 'loss/train': 1.2363675832748413} -11/07/2021 05:17:30 - INFO - __main__ - Step 57437: {'lr': 0.0003459845484291185, 'samples': 11027904, 'steps': 57436, 'loss/train': 1.6568247079849243} -11/07/2021 05:17:30 - INFO - __main__ - Step 57438: {'lr': 0.00034597964837843097, 'samples': 11028096, 'steps': 57437, 'loss/train': 0.8117554187774658} -11/07/2021 05:17:31 - INFO - __main__ - Step 57439: {'lr': 0.00034597474828449646, 'samples': 11028288, 'steps': 57438, 'loss/train': 1.149634599685669} -11/07/2021 05:17:31 - INFO - __main__ - Step 57440: {'lr': 0.00034596984814731736, 'samples': 11028480, 'steps': 57439, 'loss/train': 1.4476789236068726} -11/07/2021 05:17:32 - INFO - __main__ - Step 57441: {'lr': 0.0003459649479668956, 'samples': 11028672, 'steps': 57440, 'loss/train': 1.3072500228881836} -11/07/2021 05:17:33 - INFO - __main__ - Step 57442: {'lr': 0.00034596004774323355, 'samples': 11028864, 'steps': 57441, 'loss/train': 1.5590335130691528} -11/07/2021 05:17:33 - INFO - __main__ - Step 57443: {'lr': 0.0003459551474763334, 'samples': 11029056, 'steps': 57442, 'loss/train': 1.6526044607162476} -11/07/2021 05:17:33 - INFO - __main__ - Step 57444: {'lr': 0.00034595024716619726, 'samples': 11029248, 'steps': 57443, 'loss/train': 1.0462483167648315} -11/07/2021 05:17:34 - INFO - __main__ - Step 57445: {'lr': 0.0003459453468128276, 'samples': 11029440, 'steps': 57444, 'loss/train': 1.490347981452942} -11/07/2021 05:17:35 - INFO - __main__ - Step 57446: {'lr': 0.0003459404464162263, 'samples': 11029632, 'steps': 57445, 'loss/train': 1.1569639444351196} -11/07/2021 05:17:35 - INFO - __main__ - Step 57447: {'lr': 0.0003459355459763957, 'samples': 11029824, 'steps': 57446, 'loss/train': 1.3507537841796875} -11/07/2021 05:17:35 - INFO - __main__ - Step 57448: {'lr': 0.0003459306454933381, 'samples': 11030016, 'steps': 57447, 'loss/train': 1.0689138174057007} -11/07/2021 05:17:36 - INFO - __main__ - Step 57449: {'lr': 0.0003459257449670555, 'samples': 11030208, 'steps': 57448, 'loss/train': 1.300590991973877} -11/07/2021 05:17:36 - INFO - __main__ - Step 57450: {'lr': 0.0003459208443975504, 'samples': 11030400, 'steps': 57449, 'loss/train': 2.5017642974853516} -11/07/2021 05:17:37 - INFO - __main__ - Step 57451: {'lr': 0.00034591594378482484, 'samples': 11030592, 'steps': 57450, 'loss/train': 1.2393287420272827} -11/07/2021 05:17:37 - INFO - __main__ - Step 57452: {'lr': 0.00034591104312888096, 'samples': 11030784, 'steps': 57451, 'loss/train': 2.2869598865509033} -11/07/2021 05:17:38 - INFO - __main__ - Step 57453: {'lr': 0.00034590614242972106, 'samples': 11030976, 'steps': 57452, 'loss/train': 1.5786266326904297} -11/07/2021 05:17:38 - INFO - __main__ - Step 57454: {'lr': 0.00034590124168734735, 'samples': 11031168, 'steps': 57453, 'loss/train': 1.2358040809631348} -11/07/2021 05:17:38 - INFO - __main__ - Step 57455: {'lr': 0.00034589634090176195, 'samples': 11031360, 'steps': 57454, 'loss/train': 1.4128271341323853} -11/07/2021 05:17:39 - INFO - __main__ - Step 57456: {'lr': 0.0003458914400729672, 'samples': 11031552, 'steps': 57455, 'loss/train': 1.3198496103286743} -11/07/2021 05:17:40 - INFO - __main__ - Step 57457: {'lr': 0.00034588653920096524, 'samples': 11031744, 'steps': 57456, 'loss/train': 0.814330518245697} -11/07/2021 05:17:40 - INFO - __main__ - Step 57458: {'lr': 0.00034588163828575837, 'samples': 11031936, 'steps': 57457, 'loss/train': 1.571532130241394} -11/07/2021 05:17:41 - INFO - __main__ - Step 57459: {'lr': 0.0003458767373273486, 'samples': 11032128, 'steps': 57458, 'loss/train': 1.1901860237121582} -11/07/2021 05:17:41 - INFO - __main__ - Step 57460: {'lr': 0.00034587183632573825, 'samples': 11032320, 'steps': 57459, 'loss/train': 1.4375938177108765} -11/07/2021 05:17:41 - INFO - __main__ - Step 57461: {'lr': 0.00034586693528092954, 'samples': 11032512, 'steps': 57460, 'loss/train': 1.5013798475265503} -11/07/2021 05:17:42 - INFO - __main__ - Step 57462: {'lr': 0.0003458620341929247, 'samples': 11032704, 'steps': 57461, 'loss/train': 0.18268518149852753} -11/07/2021 05:17:43 - INFO - __main__ - Step 57463: {'lr': 0.0003458571330617259, 'samples': 11032896, 'steps': 57462, 'loss/train': 1.1528363227844238} -11/07/2021 05:17:43 - INFO - __main__ - Step 57464: {'lr': 0.00034585223188733535, 'samples': 11033088, 'steps': 57463, 'loss/train': 2.0035576820373535} -11/07/2021 05:17:43 - INFO - __main__ - Step 57465: {'lr': 0.0003458473306697553, 'samples': 11033280, 'steps': 57464, 'loss/train': 1.2071844339370728} -11/07/2021 05:17:44 - INFO - __main__ - Step 57466: {'lr': 0.0003458424294089879, 'samples': 11033472, 'steps': 57465, 'loss/train': 1.8875221014022827} -11/07/2021 05:17:45 - INFO - __main__ - Step 57467: {'lr': 0.00034583752810503533, 'samples': 11033664, 'steps': 57466, 'loss/train': 1.198325276374817} -11/07/2021 05:17:45 - INFO - __main__ - Step 57468: {'lr': 0.0003458326267578999, 'samples': 11033856, 'steps': 57467, 'loss/train': 1.4165171384811401} -11/07/2021 05:17:45 - INFO - __main__ - Step 57469: {'lr': 0.0003458277253675837, 'samples': 11034048, 'steps': 57468, 'loss/train': 1.3195197582244873} -11/07/2021 05:17:46 - INFO - __main__ - Step 57470: {'lr': 0.0003458228239340891, 'samples': 11034240, 'steps': 57469, 'loss/train': 1.482831358909607} -11/07/2021 05:17:46 - INFO - __main__ - Step 57471: {'lr': 0.0003458179224574182, 'samples': 11034432, 'steps': 57470, 'loss/train': 0.546582818031311} -11/07/2021 05:17:47 - INFO - __main__ - Step 57472: {'lr': 0.00034581302093757317, 'samples': 11034624, 'steps': 57471, 'loss/train': 1.2985109090805054} -11/07/2021 05:17:48 - INFO - __main__ - Step 57473: {'lr': 0.0003458081193745563, 'samples': 11034816, 'steps': 57472, 'loss/train': 1.4421230554580688} -11/07/2021 05:17:48 - INFO - __main__ - Step 57474: {'lr': 0.00034580321776836974, 'samples': 11035008, 'steps': 57473, 'loss/train': 1.6130874156951904} -11/07/2021 05:17:49 - INFO - __main__ - Step 57475: {'lr': 0.0003457983161190158, 'samples': 11035200, 'steps': 57474, 'loss/train': 1.1718443632125854} -11/07/2021 05:17:49 - INFO - __main__ - Step 57476: {'lr': 0.00034579341442649654, 'samples': 11035392, 'steps': 57475, 'loss/train': 1.7045835256576538} -11/07/2021 05:17:49 - INFO - __main__ - Step 57477: {'lr': 0.00034578851269081426, 'samples': 11035584, 'steps': 57476, 'loss/train': 1.056429386138916} -11/07/2021 05:17:50 - INFO - __main__ - Step 57478: {'lr': 0.0003457836109119712, 'samples': 11035776, 'steps': 57477, 'loss/train': 1.4926329851150513} -11/07/2021 05:17:51 - INFO - __main__ - Step 57479: {'lr': 0.0003457787090899695, 'samples': 11035968, 'steps': 57478, 'loss/train': 1.235234022140503} -11/07/2021 05:17:51 - INFO - __main__ - Step 57480: {'lr': 0.00034577380722481137, 'samples': 11036160, 'steps': 57479, 'loss/train': 1.5416814088821411} -11/07/2021 05:17:51 - INFO - __main__ - Step 57481: {'lr': 0.00034576890531649905, 'samples': 11036352, 'steps': 57480, 'loss/train': 0.5756336450576782} -11/07/2021 05:17:52 - INFO - __main__ - Step 57482: {'lr': 0.0003457640033650348, 'samples': 11036544, 'steps': 57481, 'loss/train': 1.221463680267334} -11/07/2021 05:17:53 - INFO - __main__ - Step 57483: {'lr': 0.00034575910137042064, 'samples': 11036736, 'steps': 57482, 'loss/train': 0.822562575340271} -11/07/2021 05:17:53 - INFO - __main__ - Step 57484: {'lr': 0.000345754199332659, 'samples': 11036928, 'steps': 57483, 'loss/train': 1.3301583528518677} -11/07/2021 05:17:54 - INFO - __main__ - Step 57485: {'lr': 0.00034574929725175203, 'samples': 11037120, 'steps': 57484, 'loss/train': 0.14026418328285217} -11/07/2021 05:17:54 - INFO - __main__ - Step 57486: {'lr': 0.0003457443951277018, 'samples': 11037312, 'steps': 57485, 'loss/train': 1.0388625860214233} -11/07/2021 05:17:54 - INFO - __main__ - Step 57487: {'lr': 0.00034573949296051065, 'samples': 11037504, 'steps': 57486, 'loss/train': 1.5076392889022827} -11/07/2021 05:17:55 - INFO - __main__ - Step 57488: {'lr': 0.0003457345907501808, 'samples': 11037696, 'steps': 57487, 'loss/train': 1.0548630952835083} -11/07/2021 05:17:56 - INFO - __main__ - Step 57489: {'lr': 0.0003457296884967144, 'samples': 11037888, 'steps': 57488, 'loss/train': 0.9093506336212158} -11/07/2021 05:17:56 - INFO - __main__ - Step 57490: {'lr': 0.0003457247862001137, 'samples': 11038080, 'steps': 57489, 'loss/train': 1.5272330045700073} -11/07/2021 05:17:56 - INFO - __main__ - Step 57491: {'lr': 0.0003457198838603809, 'samples': 11038272, 'steps': 57490, 'loss/train': 1.4084599018096924} -11/07/2021 05:17:57 - INFO - __main__ - Step 57492: {'lr': 0.0003457149814775182, 'samples': 11038464, 'steps': 57491, 'loss/train': 0.740615725517273} -11/07/2021 05:17:59 - INFO - __main__ - Step 57493: {'lr': 0.00034571007905152774, 'samples': 11038656, 'steps': 57492, 'loss/train': 1.2653871774673462} -11/07/2021 05:17:59 - INFO - __main__ - Step 57494: {'lr': 0.00034570517658241186, 'samples': 11038848, 'steps': 57493, 'loss/train': 1.5141576528549194} -11/07/2021 05:17:59 - INFO - __main__ - Step 57495: {'lr': 0.00034570027407017264, 'samples': 11039040, 'steps': 57494, 'loss/train': 1.4731392860412598} -11/07/2021 05:18:00 - INFO - __main__ - Step 57496: {'lr': 0.0003456953715148124, 'samples': 11039232, 'steps': 57495, 'loss/train': 1.3965580463409424} -11/07/2021 05:18:00 - INFO - __main__ - Step 57497: {'lr': 0.0003456904689163333, 'samples': 11039424, 'steps': 57496, 'loss/train': 1.3600486516952515} -11/07/2021 05:18:01 - INFO - __main__ - Step 57498: {'lr': 0.0003456855662747376, 'samples': 11039616, 'steps': 57497, 'loss/train': 1.4234179258346558} -11/07/2021 05:18:01 - INFO - __main__ - Step 57499: {'lr': 0.0003456806635900274, 'samples': 11039808, 'steps': 57498, 'loss/train': 0.7817096710205078} -11/07/2021 05:18:02 - INFO - __main__ - Step 57500: {'lr': 0.00034567576086220493, 'samples': 11040000, 'steps': 57499, 'loss/train': 1.321328043937683} -11/07/2021 05:18:02 - INFO - __main__ - Step 57501: {'lr': 0.0003456708580912725, 'samples': 11040192, 'steps': 57500, 'loss/train': 1.4732120037078857} -11/07/2021 05:18:03 - INFO - __main__ - Step 57502: {'lr': 0.0003456659552772322, 'samples': 11040384, 'steps': 57501, 'loss/train': 1.3813444375991821} -11/07/2021 05:18:03 - INFO - __main__ - Step 57503: {'lr': 0.0003456610524200863, 'samples': 11040576, 'steps': 57502, 'loss/train': 1.4180666208267212} -11/07/2021 05:18:03 - INFO - __main__ - Step 57504: {'lr': 0.00034565614951983706, 'samples': 11040768, 'steps': 57503, 'loss/train': 1.3131844997406006} -11/07/2021 05:18:04 - INFO - __main__ - Step 57505: {'lr': 0.00034565124657648665, 'samples': 11040960, 'steps': 57504, 'loss/train': 1.6327060461044312} -11/07/2021 05:18:05 - INFO - __main__ - Step 57506: {'lr': 0.0003456463435900372, 'samples': 11041152, 'steps': 57505, 'loss/train': 1.7291350364685059} -11/07/2021 05:18:05 - INFO - __main__ - Step 57507: {'lr': 0.0003456414405604911, 'samples': 11041344, 'steps': 57506, 'loss/train': 1.431210994720459} -11/07/2021 05:18:05 - INFO - __main__ - Step 57508: {'lr': 0.0003456365374878503, 'samples': 11041536, 'steps': 57507, 'loss/train': 1.4372285604476929} -11/07/2021 05:18:06 - INFO - __main__ - Step 57509: {'lr': 0.00034563163437211717, 'samples': 11041728, 'steps': 57508, 'loss/train': 1.177987813949585} -11/07/2021 05:18:07 - INFO - __main__ - Step 57510: {'lr': 0.000345626731213294, 'samples': 11041920, 'steps': 57509, 'loss/train': 1.9565181732177734} -11/07/2021 05:18:07 - INFO - __main__ - Step 57511: {'lr': 0.00034562182801138277, 'samples': 11042112, 'steps': 57510, 'loss/train': 1.3832385540008545} -11/07/2021 05:18:08 - INFO - __main__ - Step 57512: {'lr': 0.00034561692476638595, 'samples': 11042304, 'steps': 57511, 'loss/train': 1.446972131729126} -11/07/2021 05:18:08 - INFO - __main__ - Step 57513: {'lr': 0.00034561202147830554, 'samples': 11042496, 'steps': 57512, 'loss/train': 1.1404516696929932} -11/07/2021 05:18:08 - INFO - __main__ - Step 57514: {'lr': 0.00034560711814714387, 'samples': 11042688, 'steps': 57513, 'loss/train': 1.307263970375061} -11/07/2021 05:18:10 - INFO - __main__ - Step 57515: {'lr': 0.0003456022147729031, 'samples': 11042880, 'steps': 57514, 'loss/train': 1.6337566375732422} -11/07/2021 05:18:10 - INFO - __main__ - Step 57516: {'lr': 0.00034559731135558536, 'samples': 11043072, 'steps': 57515, 'loss/train': 1.3496122360229492} -11/07/2021 05:18:10 - INFO - __main__ - Step 57517: {'lr': 0.000345592407895193, 'samples': 11043264, 'steps': 57516, 'loss/train': 1.1995166540145874} -11/07/2021 05:18:11 - INFO - __main__ - Step 57518: {'lr': 0.00034558750439172826, 'samples': 11043456, 'steps': 57517, 'loss/train': 0.35492417216300964} -11/07/2021 05:18:11 - INFO - __main__ - Step 57519: {'lr': 0.0003455826008451932, 'samples': 11043648, 'steps': 57518, 'loss/train': 1.1940852403640747} -11/07/2021 05:18:12 - INFO - __main__ - Step 57520: {'lr': 0.00034557769725559014, 'samples': 11043840, 'steps': 57519, 'loss/train': 1.813337802886963} -11/07/2021 05:18:12 - INFO - __main__ - Step 57521: {'lr': 0.00034557279362292117, 'samples': 11044032, 'steps': 57520, 'loss/train': 1.3919909000396729} -11/07/2021 05:18:13 - INFO - __main__ - Step 57522: {'lr': 0.00034556788994718855, 'samples': 11044224, 'steps': 57521, 'loss/train': 1.758271336555481} -11/07/2021 05:18:13 - INFO - __main__ - Step 57523: {'lr': 0.00034556298622839463, 'samples': 11044416, 'steps': 57522, 'loss/train': 1.1725791692733765} -11/07/2021 05:18:13 - INFO - __main__ - Step 57524: {'lr': 0.0003455580824665414, 'samples': 11044608, 'steps': 57523, 'loss/train': 1.4767088890075684} -11/07/2021 05:18:15 - INFO - __main__ - Step 57525: {'lr': 0.0003455531786616313, 'samples': 11044800, 'steps': 57524, 'loss/train': 1.4721578359603882} -11/07/2021 05:18:15 - INFO - __main__ - Step 57526: {'lr': 0.0003455482748136663, 'samples': 11044992, 'steps': 57525, 'loss/train': 0.6027123332023621} -11/07/2021 05:18:15 - INFO - __main__ - Step 57527: {'lr': 0.00034554337092264874, 'samples': 11045184, 'steps': 57526, 'loss/train': 0.8254349231719971} -11/07/2021 05:18:16 - INFO - __main__ - Step 57528: {'lr': 0.00034553846698858083, 'samples': 11045376, 'steps': 57527, 'loss/train': 1.0931326150894165} -11/07/2021 05:18:16 - INFO - __main__ - Step 57529: {'lr': 0.00034553356301146473, 'samples': 11045568, 'steps': 57528, 'loss/train': 1.4469027519226074} -11/07/2021 05:18:17 - INFO - __main__ - Step 57530: {'lr': 0.0003455286589913027, 'samples': 11045760, 'steps': 57529, 'loss/train': 1.4669450521469116} -11/07/2021 05:18:17 - INFO - __main__ - Step 57531: {'lr': 0.0003455237549280969, 'samples': 11045952, 'steps': 57530, 'loss/train': 1.434045433998108} -11/07/2021 05:18:18 - INFO - __main__ - Step 57532: {'lr': 0.0003455188508218496, 'samples': 11046144, 'steps': 57531, 'loss/train': 0.8300938606262207} -11/07/2021 05:18:18 - INFO - __main__ - Step 57533: {'lr': 0.000345513946672563, 'samples': 11046336, 'steps': 57532, 'loss/train': 1.4491974115371704} -11/07/2021 05:18:18 - INFO - __main__ - Step 57534: {'lr': 0.0003455090424802393, 'samples': 11046528, 'steps': 57533, 'loss/train': 1.086493730545044} -11/07/2021 05:18:20 - INFO - __main__ - Step 57535: {'lr': 0.00034550413824488066, 'samples': 11046720, 'steps': 57534, 'loss/train': 1.7283111810684204} -11/07/2021 05:18:20 - INFO - __main__ - Step 57536: {'lr': 0.0003454992339664893, 'samples': 11046912, 'steps': 57535, 'loss/train': 1.2079789638519287} -11/07/2021 05:18:20 - INFO - __main__ - Step 57537: {'lr': 0.00034549432964506755, 'samples': 11047104, 'steps': 57536, 'loss/train': 1.3897489309310913} -11/07/2021 05:18:21 - INFO - __main__ - Step 57538: {'lr': 0.0003454894252806175, 'samples': 11047296, 'steps': 57537, 'loss/train': 1.3062047958374023} -11/07/2021 05:18:21 - INFO - __main__ - Step 57539: {'lr': 0.00034548452087314135, 'samples': 11047488, 'steps': 57538, 'loss/train': 1.1824064254760742} -11/07/2021 05:18:21 - INFO - __main__ - Step 57540: {'lr': 0.0003454796164226414, 'samples': 11047680, 'steps': 57539, 'loss/train': 2.041522979736328} -11/07/2021 05:18:22 - INFO - __main__ - Step 57541: {'lr': 0.00034547471192911973, 'samples': 11047872, 'steps': 57540, 'loss/train': 1.3433326482772827} -11/07/2021 05:18:23 - INFO - __main__ - Step 57542: {'lr': 0.0003454698073925787, 'samples': 11048064, 'steps': 57541, 'loss/train': 1.5176191329956055} -11/07/2021 05:18:23 - INFO - __main__ - Step 57543: {'lr': 0.00034546490281302033, 'samples': 11048256, 'steps': 57542, 'loss/train': 1.421345829963684} -11/07/2021 05:18:23 - INFO - __main__ - Step 57544: {'lr': 0.000345459998190447, 'samples': 11048448, 'steps': 57543, 'loss/train': 1.42875075340271} -11/07/2021 05:18:24 - INFO - __main__ - Step 57545: {'lr': 0.000345455093524861, 'samples': 11048640, 'steps': 57544, 'loss/train': 1.1425549983978271} -11/07/2021 05:18:25 - INFO - __main__ - Step 57546: {'lr': 0.00034545018881626435, 'samples': 11048832, 'steps': 57545, 'loss/train': 0.5950518250465393} -11/07/2021 05:18:25 - INFO - __main__ - Step 57547: {'lr': 0.00034544528406465927, 'samples': 11049024, 'steps': 57546, 'loss/train': 1.4897198677062988} -11/07/2021 05:18:25 - INFO - __main__ - Step 57548: {'lr': 0.000345440379270048, 'samples': 11049216, 'steps': 57547, 'loss/train': 0.9663727879524231} -11/07/2021 05:18:26 - INFO - __main__ - Step 57549: {'lr': 0.0003454354744324328, 'samples': 11049408, 'steps': 57548, 'loss/train': 1.471144199371338} -11/07/2021 05:18:26 - INFO - __main__ - Step 57550: {'lr': 0.00034543056955181584, 'samples': 11049600, 'steps': 57549, 'loss/train': 1.6009119749069214} -11/07/2021 05:18:27 - INFO - __main__ - Step 57551: {'lr': 0.0003454256646281993, 'samples': 11049792, 'steps': 57550, 'loss/train': 1.3860677480697632} -11/07/2021 05:18:28 - INFO - __main__ - Step 57552: {'lr': 0.0003454207596615855, 'samples': 11049984, 'steps': 57551, 'loss/train': 0.10142990201711655} -11/07/2021 05:18:28 - INFO - __main__ - Step 57553: {'lr': 0.00034541585465197653, 'samples': 11050176, 'steps': 57552, 'loss/train': 0.9701891541481018} -11/07/2021 05:18:28 - INFO - __main__ - Step 57554: {'lr': 0.0003454109495993747, 'samples': 11050368, 'steps': 57553, 'loss/train': 1.6230173110961914} -11/07/2021 05:18:29 - INFO - __main__ - Step 57555: {'lr': 0.0003454060445037821, 'samples': 11050560, 'steps': 57554, 'loss/train': 1.0044591426849365} -11/07/2021 05:18:30 - INFO - __main__ - Step 57556: {'lr': 0.0003454011393652011, 'samples': 11050752, 'steps': 57555, 'loss/train': 1.0634393692016602} -11/07/2021 05:18:30 - INFO - __main__ - Step 57557: {'lr': 0.0003453962341836337, 'samples': 11050944, 'steps': 57556, 'loss/train': 1.2863399982452393} -11/07/2021 05:18:30 - INFO - __main__ - Step 57558: {'lr': 0.0003453913289590823, 'samples': 11051136, 'steps': 57557, 'loss/train': 1.1702903509140015} -11/07/2021 05:18:31 - INFO - __main__ - Step 57559: {'lr': 0.00034538642369154907, 'samples': 11051328, 'steps': 57558, 'loss/train': 0.8804982304573059} -11/07/2021 05:18:31 - INFO - __main__ - Step 57560: {'lr': 0.00034538151838103614, 'samples': 11051520, 'steps': 57559, 'loss/train': 1.1462171077728271} -11/07/2021 05:18:32 - INFO - __main__ - Step 57561: {'lr': 0.00034537661302754577, 'samples': 11051712, 'steps': 57560, 'loss/train': 1.5659589767456055} -11/07/2021 05:18:33 - INFO - __main__ - Step 57562: {'lr': 0.00034537170763108017, 'samples': 11051904, 'steps': 57561, 'loss/train': 1.5989017486572266} -11/07/2021 05:18:33 - INFO - __main__ - Step 57563: {'lr': 0.00034536680219164156, 'samples': 11052096, 'steps': 57562, 'loss/train': 0.07066918164491653} -11/07/2021 05:18:33 - INFO - __main__ - Step 57564: {'lr': 0.0003453618967092322, 'samples': 11052288, 'steps': 57563, 'loss/train': 1.3893033266067505} -11/07/2021 05:18:34 - INFO - __main__ - Step 57565: {'lr': 0.00034535699118385413, 'samples': 11052480, 'steps': 57564, 'loss/train': 1.46445894241333} -11/07/2021 05:18:35 - INFO - __main__ - Step 57566: {'lr': 0.00034535208561550974, 'samples': 11052672, 'steps': 57565, 'loss/train': 1.139594554901123} -11/07/2021 05:18:35 - INFO - __main__ - Step 57567: {'lr': 0.00034534718000420113, 'samples': 11052864, 'steps': 57566, 'loss/train': 1.5781636238098145} -11/07/2021 05:18:35 - INFO - __main__ - Step 57568: {'lr': 0.0003453422743499306, 'samples': 11053056, 'steps': 57567, 'loss/train': 1.1728266477584839} -11/07/2021 05:18:36 - INFO - __main__ - Step 57569: {'lr': 0.00034533736865270025, 'samples': 11053248, 'steps': 57568, 'loss/train': 1.7905948162078857} -11/07/2021 05:18:36 - INFO - __main__ - Step 57570: {'lr': 0.0003453324629125124, 'samples': 11053440, 'steps': 57569, 'loss/train': 1.189206600189209} -11/07/2021 05:18:37 - INFO - __main__ - Step 57571: {'lr': 0.00034532755712936926, 'samples': 11053632, 'steps': 57570, 'loss/train': 1.337283968925476} -11/07/2021 05:18:38 - INFO - __main__ - Step 57572: {'lr': 0.0003453226513032729, 'samples': 11053824, 'steps': 57571, 'loss/train': 1.6351426839828491} -11/07/2021 05:18:38 - INFO - __main__ - Step 57573: {'lr': 0.00034531774543422567, 'samples': 11054016, 'steps': 57572, 'loss/train': 1.2395817041397095} -11/07/2021 05:18:38 - INFO - __main__ - Step 57574: {'lr': 0.00034531283952222975, 'samples': 11054208, 'steps': 57573, 'loss/train': 1.7429171800613403} -11/07/2021 05:18:39 - INFO - __main__ - Step 57575: {'lr': 0.00034530793356728727, 'samples': 11054400, 'steps': 57574, 'loss/train': 0.9734483957290649} -11/07/2021 05:18:40 - INFO - __main__ - Step 57576: {'lr': 0.0003453030275694006, 'samples': 11054592, 'steps': 57575, 'loss/train': 1.240654706954956} -11/07/2021 05:18:40 - INFO - __main__ - Step 57577: {'lr': 0.0003452981215285718, 'samples': 11054784, 'steps': 57576, 'loss/train': 1.734090805053711} -11/07/2021 05:18:40 - INFO - __main__ - Step 57578: {'lr': 0.0003452932154448031, 'samples': 11054976, 'steps': 57577, 'loss/train': 1.6185129880905151} -11/07/2021 05:18:41 - INFO - __main__ - Step 57579: {'lr': 0.0003452883093180968, 'samples': 11055168, 'steps': 57578, 'loss/train': 1.7786346673965454} -11/07/2021 05:18:41 - INFO - __main__ - Step 57580: {'lr': 0.0003452834031484551, 'samples': 11055360, 'steps': 57579, 'loss/train': 1.3384336233139038} -11/07/2021 05:18:42 - INFO - __main__ - Step 57581: {'lr': 0.0003452784969358801, 'samples': 11055552, 'steps': 57580, 'loss/train': 1.6141666173934937} -11/07/2021 05:18:42 - INFO - __main__ - Step 57582: {'lr': 0.0003452735906803741, 'samples': 11055744, 'steps': 57581, 'loss/train': 1.5685594081878662} -11/07/2021 05:18:43 - INFO - __main__ - Step 57583: {'lr': 0.0003452686843819393, 'samples': 11055936, 'steps': 57582, 'loss/train': 1.4723563194274902} -11/07/2021 05:18:43 - INFO - __main__ - Step 57584: {'lr': 0.0003452637780405778, 'samples': 11056128, 'steps': 57583, 'loss/train': 0.8280128836631775} -11/07/2021 05:18:43 - INFO - __main__ - Step 57585: {'lr': 0.000345258871656292, 'samples': 11056320, 'steps': 57584, 'loss/train': 1.4360042810440063} -11/07/2021 05:18:45 - INFO - __main__ - Step 57586: {'lr': 0.0003452539652290841, 'samples': 11056512, 'steps': 57585, 'loss/train': 1.7037127017974854} -11/07/2021 05:18:45 - INFO - __main__ - Step 57587: {'lr': 0.00034524905875895614, 'samples': 11056704, 'steps': 57586, 'loss/train': 0.9621776342391968} -11/07/2021 05:18:46 - INFO - __main__ - Step 57588: {'lr': 0.00034524415224591046, 'samples': 11056896, 'steps': 57587, 'loss/train': 1.1307048797607422} -11/07/2021 05:18:46 - INFO - __main__ - Step 57589: {'lr': 0.00034523924568994913, 'samples': 11057088, 'steps': 57588, 'loss/train': 1.5178391933441162} -11/07/2021 05:18:46 - INFO - __main__ - Step 57590: {'lr': 0.00034523433909107454, 'samples': 11057280, 'steps': 57589, 'loss/train': 0.6705071926116943} -11/07/2021 05:18:47 - INFO - __main__ - Step 57591: {'lr': 0.00034522943244928885, 'samples': 11057472, 'steps': 57590, 'loss/train': 1.5455048084259033} -11/07/2021 05:18:48 - INFO - __main__ - Step 57592: {'lr': 0.0003452245257645943, 'samples': 11057664, 'steps': 57591, 'loss/train': 1.3068667650222778} -11/07/2021 05:18:48 - INFO - __main__ - Step 57593: {'lr': 0.00034521961903699296, 'samples': 11057856, 'steps': 57592, 'loss/train': 1.2720032930374146} -11/07/2021 05:18:48 - INFO - __main__ - Step 57594: {'lr': 0.00034521471226648716, 'samples': 11058048, 'steps': 57593, 'loss/train': 1.7495051622390747} -11/07/2021 05:18:49 - INFO - __main__ - Step 57595: {'lr': 0.000345209805453079, 'samples': 11058240, 'steps': 57594, 'loss/train': 1.0688161849975586} -11/07/2021 05:18:49 - INFO - __main__ - Step 57596: {'lr': 0.00034520489859677083, 'samples': 11058432, 'steps': 57595, 'loss/train': 1.3923890590667725} -11/07/2021 05:18:50 - INFO - __main__ - Step 57597: {'lr': 0.0003451999916975648, 'samples': 11058624, 'steps': 57596, 'loss/train': 1.1420775651931763} -11/07/2021 05:18:50 - INFO - __main__ - Step 57598: {'lr': 0.00034519508475546314, 'samples': 11058816, 'steps': 57597, 'loss/train': 1.9673023223876953} -11/07/2021 05:18:51 - INFO - __main__ - Step 57599: {'lr': 0.0003451901777704681, 'samples': 11059008, 'steps': 57598, 'loss/train': 1.1575087308883667} -11/07/2021 05:18:51 - INFO - __main__ - Step 57600: {'lr': 0.00034518527074258175, 'samples': 11059200, 'steps': 57599, 'loss/train': 1.737684726715088} -11/07/2021 05:18:52 - INFO - __main__ - Step 57601: {'lr': 0.00034518036367180637, 'samples': 11059392, 'steps': 57600, 'loss/train': 0.9970178008079529} -11/07/2021 05:18:53 - INFO - __main__ - Step 57602: {'lr': 0.00034517545655814424, 'samples': 11059584, 'steps': 57601, 'loss/train': 0.5880791544914246} -11/07/2021 05:18:53 - INFO - __main__ - Step 57603: {'lr': 0.0003451705494015975, 'samples': 11059776, 'steps': 57602, 'loss/train': 1.185686469078064} -11/07/2021 05:18:53 - INFO - __main__ - Step 57604: {'lr': 0.0003451656422021684, 'samples': 11059968, 'steps': 57603, 'loss/train': 1.592069387435913} -11/07/2021 05:18:54 - INFO - __main__ - Step 57605: {'lr': 0.0003451607349598591, 'samples': 11060160, 'steps': 57604, 'loss/train': 1.4268330335617065} -11/07/2021 05:18:54 - INFO - __main__ - Step 57606: {'lr': 0.0003451558276746719, 'samples': 11060352, 'steps': 57605, 'loss/train': 1.9687608480453491} -11/07/2021 05:18:55 - INFO - __main__ - Step 57607: {'lr': 0.0003451509203466089, 'samples': 11060544, 'steps': 57606, 'loss/train': 1.3777413368225098} -11/07/2021 05:18:56 - INFO - __main__ - Step 57608: {'lr': 0.00034514601297567235, 'samples': 11060736, 'steps': 57607, 'loss/train': 1.1087727546691895} -11/07/2021 05:18:56 - INFO - __main__ - Step 57609: {'lr': 0.00034514110556186446, 'samples': 11060928, 'steps': 57608, 'loss/train': 1.738145112991333} -11/07/2021 05:18:56 - INFO - __main__ - Step 57610: {'lr': 0.0003451361981051875, 'samples': 11061120, 'steps': 57609, 'loss/train': 1.6119134426116943} -11/07/2021 05:18:57 - INFO - __main__ - Step 57611: {'lr': 0.00034513129060564365, 'samples': 11061312, 'steps': 57610, 'loss/train': 0.7874797582626343} -11/07/2021 05:18:58 - INFO - __main__ - Step 57612: {'lr': 0.00034512638306323506, 'samples': 11061504, 'steps': 57611, 'loss/train': 0.8196049928665161} -11/07/2021 05:18:58 - INFO - __main__ - Step 57613: {'lr': 0.000345121475477964, 'samples': 11061696, 'steps': 57612, 'loss/train': 1.529039978981018} -11/07/2021 05:18:58 - INFO - __main__ - Step 57614: {'lr': 0.0003451165678498327, 'samples': 11061888, 'steps': 57613, 'loss/train': 1.3116601705551147} -11/07/2021 05:18:59 - INFO - __main__ - Step 57615: {'lr': 0.00034511166017884334, 'samples': 11062080, 'steps': 57614, 'loss/train': 1.3582158088684082} -11/07/2021 05:18:59 - INFO - __main__ - Step 57616: {'lr': 0.0003451067524649981, 'samples': 11062272, 'steps': 57615, 'loss/train': 0.7368661761283875} -11/07/2021 05:19:00 - INFO - __main__ - Step 57617: {'lr': 0.00034510184470829924, 'samples': 11062464, 'steps': 57616, 'loss/train': 1.6011773347854614} -11/07/2021 05:19:00 - INFO - __main__ - Step 57618: {'lr': 0.000345096936908749, 'samples': 11062656, 'steps': 57617, 'loss/train': 0.5298988819122314} -11/07/2021 05:19:01 - INFO - __main__ - Step 57619: {'lr': 0.0003450920290663495, 'samples': 11062848, 'steps': 57618, 'loss/train': 1.0885212421417236} -11/07/2021 05:19:01 - INFO - __main__ - Step 57620: {'lr': 0.000345087121181103, 'samples': 11063040, 'steps': 57619, 'loss/train': 1.5097908973693848} -11/07/2021 05:19:01 - INFO - __main__ - Step 57621: {'lr': 0.0003450822132530117, 'samples': 11063232, 'steps': 57620, 'loss/train': 1.131121277809143} -11/07/2021 05:19:02 - INFO - __main__ - Step 57622: {'lr': 0.0003450773052820779, 'samples': 11063424, 'steps': 57621, 'loss/train': 0.9881262183189392} -11/07/2021 05:19:03 - INFO - __main__ - Step 57623: {'lr': 0.0003450723972683036, 'samples': 11063616, 'steps': 57622, 'loss/train': 1.750808835029602} -11/07/2021 05:19:03 - INFO - __main__ - Step 57624: {'lr': 0.00034506748921169124, 'samples': 11063808, 'steps': 57623, 'loss/train': 1.2427629232406616} -11/07/2021 05:19:03 - INFO - __main__ - Step 57625: {'lr': 0.00034506258111224294, 'samples': 11064000, 'steps': 57624, 'loss/train': 1.133847713470459} -11/07/2021 05:19:04 - INFO - __main__ - Step 57626: {'lr': 0.00034505767296996086, 'samples': 11064192, 'steps': 57625, 'loss/train': 1.138538122177124} -11/07/2021 05:19:05 - INFO - __main__ - Step 57627: {'lr': 0.0003450527647848473, 'samples': 11064384, 'steps': 57626, 'loss/train': 1.8103456497192383} -11/07/2021 05:19:05 - INFO - __main__ - Step 57628: {'lr': 0.0003450478565569044, 'samples': 11064576, 'steps': 57627, 'loss/train': 1.8080732822418213} -11/07/2021 05:19:06 - INFO - __main__ - Step 57629: {'lr': 0.0003450429482861344, 'samples': 11064768, 'steps': 57628, 'loss/train': 1.4648878574371338} -11/07/2021 05:19:06 - INFO - __main__ - Step 57630: {'lr': 0.0003450380399725396, 'samples': 11064960, 'steps': 57629, 'loss/train': 0.7530885338783264} -11/07/2021 05:19:06 - INFO - __main__ - Step 57631: {'lr': 0.000345033131616122, 'samples': 11065152, 'steps': 57630, 'loss/train': 1.634304404258728} -11/07/2021 05:19:07 - INFO - __main__ - Step 57632: {'lr': 0.000345028223216884, 'samples': 11065344, 'steps': 57631, 'loss/train': 1.7826693058013916} -11/07/2021 05:19:08 - INFO - __main__ - Step 57633: {'lr': 0.0003450233147748278, 'samples': 11065536, 'steps': 57632, 'loss/train': 1.7429877519607544} -11/07/2021 05:19:08 - INFO - __main__ - Step 57634: {'lr': 0.00034501840628995545, 'samples': 11065728, 'steps': 57633, 'loss/train': 1.4022407531738281} -11/07/2021 05:19:08 - INFO - __main__ - Step 57635: {'lr': 0.0003450134977622693, 'samples': 11065920, 'steps': 57634, 'loss/train': 1.4085102081298828} -11/07/2021 05:19:09 - INFO - __main__ - Step 57636: {'lr': 0.0003450085891917716, 'samples': 11066112, 'steps': 57635, 'loss/train': 1.1837139129638672} -11/07/2021 05:19:09 - INFO - __main__ - Step 57637: {'lr': 0.00034500368057846444, 'samples': 11066304, 'steps': 57636, 'loss/train': 1.6431742906570435} -11/07/2021 05:19:10 - INFO - __main__ - Step 57638: {'lr': 0.00034499877192235005, 'samples': 11066496, 'steps': 57637, 'loss/train': 1.51119065284729} -11/07/2021 05:19:11 - INFO - __main__ - Step 57639: {'lr': 0.00034499386322343087, 'samples': 11066688, 'steps': 57638, 'loss/train': 1.151750087738037} -11/07/2021 05:19:11 - INFO - __main__ - Step 57640: {'lr': 0.00034498895448170874, 'samples': 11066880, 'steps': 57639, 'loss/train': 1.271364450454712} -11/07/2021 05:19:11 - INFO - __main__ - Step 57641: {'lr': 0.0003449840456971861, 'samples': 11067072, 'steps': 57640, 'loss/train': 1.3291971683502197} -11/07/2021 05:19:12 - INFO - __main__ - Step 57642: {'lr': 0.0003449791368698651, 'samples': 11067264, 'steps': 57641, 'loss/train': 1.3007110357284546} -11/07/2021 05:19:13 - INFO - __main__ - Step 57643: {'lr': 0.000344974227999748, 'samples': 11067456, 'steps': 57642, 'loss/train': 1.3085644245147705} -11/07/2021 05:19:13 - INFO - __main__ - Step 57644: {'lr': 0.0003449693190868369, 'samples': 11067648, 'steps': 57643, 'loss/train': 1.3239974975585938} -11/07/2021 05:19:13 - INFO - __main__ - Step 57645: {'lr': 0.0003449644101311341, 'samples': 11067840, 'steps': 57644, 'loss/train': 1.547965168952942} -11/07/2021 05:19:14 - INFO - __main__ - Step 57646: {'lr': 0.00034495950113264194, 'samples': 11068032, 'steps': 57645, 'loss/train': 1.2187222242355347} -11/07/2021 05:19:14 - INFO - __main__ - Step 57647: {'lr': 0.0003449545920913624, 'samples': 11068224, 'steps': 57646, 'loss/train': 1.7817707061767578} -11/07/2021 05:19:15 - INFO - __main__ - Step 57648: {'lr': 0.0003449496830072978, 'samples': 11068416, 'steps': 57647, 'loss/train': 1.0762932300567627} -11/07/2021 05:19:15 - INFO - __main__ - Step 57649: {'lr': 0.0003449447738804503, 'samples': 11068608, 'steps': 57648, 'loss/train': 0.5625360608100891} -11/07/2021 05:19:16 - INFO - __main__ - Step 57650: {'lr': 0.00034493986471082215, 'samples': 11068800, 'steps': 57649, 'loss/train': 1.4757633209228516} -11/07/2021 05:19:16 - INFO - __main__ - Step 57651: {'lr': 0.0003449349554984156, 'samples': 11068992, 'steps': 57650, 'loss/train': 1.2945477962493896} -11/07/2021 05:19:16 - INFO - __main__ - Step 57652: {'lr': 0.0003449300462432328, 'samples': 11069184, 'steps': 57651, 'loss/train': 1.314429759979248} -11/07/2021 05:19:17 - INFO - __main__ - Step 57653: {'lr': 0.0003449251369452761, 'samples': 11069376, 'steps': 57652, 'loss/train': 1.6082700490951538} -11/07/2021 05:19:18 - INFO - __main__ - Step 57654: {'lr': 0.00034492022760454743, 'samples': 11069568, 'steps': 57653, 'loss/train': 1.409935474395752} -11/07/2021 05:19:18 - INFO - __main__ - Step 57655: {'lr': 0.00034491531822104923, 'samples': 11069760, 'steps': 57654, 'loss/train': 1.408873438835144} -11/07/2021 05:19:18 - INFO - __main__ - Step 57656: {'lr': 0.00034491040879478364, 'samples': 11069952, 'steps': 57655, 'loss/train': 1.2753372192382812} -11/07/2021 05:19:19 - INFO - __main__ - Step 57657: {'lr': 0.0003449054993257529, 'samples': 11070144, 'steps': 57656, 'loss/train': 1.4293252229690552} -11/07/2021 05:19:20 - INFO - __main__ - Step 57658: {'lr': 0.0003449005898139592, 'samples': 11070336, 'steps': 57657, 'loss/train': 1.550768494606018} -11/07/2021 05:19:20 - INFO - __main__ - Step 57659: {'lr': 0.0003448956802594048, 'samples': 11070528, 'steps': 57658, 'loss/train': 0.6354227662086487} -11/07/2021 05:19:20 - INFO - __main__ - Step 57660: {'lr': 0.00034489077066209185, 'samples': 11070720, 'steps': 57659, 'loss/train': 1.4722617864608765} -11/07/2021 05:19:21 - INFO - __main__ - Step 57661: {'lr': 0.0003448858610220226, 'samples': 11070912, 'steps': 57660, 'loss/train': 1.1395282745361328} -11/07/2021 05:19:21 - INFO - __main__ - Step 57662: {'lr': 0.00034488095133919914, 'samples': 11071104, 'steps': 57661, 'loss/train': 1.1864697933197021} -11/07/2021 05:19:22 - INFO - __main__ - Step 57663: {'lr': 0.0003448760416136239, 'samples': 11071296, 'steps': 57662, 'loss/train': 1.638628602027893} -11/07/2021 05:19:22 - INFO - __main__ - Step 57664: {'lr': 0.00034487113184529896, 'samples': 11071488, 'steps': 57663, 'loss/train': 1.009995937347412} -11/07/2021 05:19:23 - INFO - __main__ - Step 57665: {'lr': 0.0003448662220342265, 'samples': 11071680, 'steps': 57664, 'loss/train': 1.5353615283966064} -11/07/2021 05:19:23 - INFO - __main__ - Step 57666: {'lr': 0.0003448613121804088, 'samples': 11071872, 'steps': 57665, 'loss/train': 1.1033000946044922} -11/07/2021 05:19:23 - INFO - __main__ - Step 57667: {'lr': 0.0003448564022838481, 'samples': 11072064, 'steps': 57666, 'loss/train': 1.711601734161377} -11/07/2021 05:19:25 - INFO - __main__ - Step 57668: {'lr': 0.0003448514923445466, 'samples': 11072256, 'steps': 57667, 'loss/train': 0.8116577863693237} -11/07/2021 05:19:25 - INFO - __main__ - Step 57669: {'lr': 0.00034484658236250636, 'samples': 11072448, 'steps': 57668, 'loss/train': 1.245047926902771} -11/07/2021 05:19:25 - INFO - __main__ - Step 57670: {'lr': 0.0003448416723377298, 'samples': 11072640, 'steps': 57669, 'loss/train': 1.4965254068374634} -11/07/2021 05:19:26 - INFO - __main__ - Step 57671: {'lr': 0.00034483676227021906, 'samples': 11072832, 'steps': 57670, 'loss/train': 1.5550516843795776} -11/07/2021 05:19:26 - INFO - __main__ - Step 57672: {'lr': 0.00034483185215997624, 'samples': 11073024, 'steps': 57671, 'loss/train': 1.3319071531295776} -11/07/2021 05:19:27 - INFO - __main__ - Step 57673: {'lr': 0.00034482694200700377, 'samples': 11073216, 'steps': 57672, 'loss/train': 1.562532901763916} -11/07/2021 05:19:27 - INFO - __main__ - Step 57674: {'lr': 0.00034482203181130365, 'samples': 11073408, 'steps': 57673, 'loss/train': 1.730484962463379} -11/07/2021 05:19:28 - INFO - __main__ - Step 57675: {'lr': 0.00034481712157287826, 'samples': 11073600, 'steps': 57674, 'loss/train': 1.526288628578186} -11/07/2021 05:19:28 - INFO - __main__ - Step 57676: {'lr': 0.00034481221129172967, 'samples': 11073792, 'steps': 57675, 'loss/train': 1.6786359548568726} -11/07/2021 05:19:28 - INFO - __main__ - Step 57677: {'lr': 0.0003448073009678602, 'samples': 11073984, 'steps': 57676, 'loss/train': 1.3379011154174805} -11/07/2021 05:19:29 - INFO - __main__ - Step 57678: {'lr': 0.00034480239060127204, 'samples': 11074176, 'steps': 57677, 'loss/train': 1.4021776914596558} -11/07/2021 05:19:30 - INFO - __main__ - Step 57679: {'lr': 0.00034479748019196734, 'samples': 11074368, 'steps': 57678, 'loss/train': 1.0051445960998535} -11/07/2021 05:19:30 - INFO - __main__ - Step 57680: {'lr': 0.00034479256973994843, 'samples': 11074560, 'steps': 57679, 'loss/train': 0.7099761366844177} -11/07/2021 05:19:30 - INFO - __main__ - Step 57681: {'lr': 0.0003447876592452174, 'samples': 11074752, 'steps': 57680, 'loss/train': 1.466721773147583} -11/07/2021 05:19:31 - INFO - __main__ - Step 57682: {'lr': 0.00034478274870777646, 'samples': 11074944, 'steps': 57681, 'loss/train': 1.3075916767120361} -11/07/2021 05:19:32 - INFO - __main__ - Step 57683: {'lr': 0.00034477783812762795, 'samples': 11075136, 'steps': 57682, 'loss/train': 1.4150981903076172} -11/07/2021 05:19:32 - INFO - __main__ - Step 57684: {'lr': 0.00034477292750477396, 'samples': 11075328, 'steps': 57683, 'loss/train': 1.0988235473632812} -11/07/2021 05:19:33 - INFO - __main__ - Step 57685: {'lr': 0.00034476801683921683, 'samples': 11075520, 'steps': 57684, 'loss/train': 1.3911079168319702} -11/07/2021 05:19:33 - INFO - __main__ - Step 57686: {'lr': 0.00034476310613095867, 'samples': 11075712, 'steps': 57685, 'loss/train': 0.05851629748940468} -11/07/2021 05:19:33 - INFO - __main__ - Step 57687: {'lr': 0.0003447581953800017, 'samples': 11075904, 'steps': 57686, 'loss/train': 1.8319309949874878} -11/07/2021 05:19:34 - INFO - __main__ - Step 57688: {'lr': 0.00034475328458634814, 'samples': 11076096, 'steps': 57687, 'loss/train': 1.9513481855392456} -11/07/2021 05:19:35 - INFO - __main__ - Step 57689: {'lr': 0.00034474837375000016, 'samples': 11076288, 'steps': 57688, 'loss/train': 1.4049649238586426} -11/07/2021 05:19:35 - INFO - __main__ - Step 57690: {'lr': 0.0003447434628709601, 'samples': 11076480, 'steps': 57689, 'loss/train': 2.0631494522094727} -11/07/2021 05:19:35 - INFO - __main__ - Step 57691: {'lr': 0.00034473855194923006, 'samples': 11076672, 'steps': 57690, 'loss/train': 1.1817691326141357} -11/07/2021 05:19:36 - INFO - __main__ - Step 57692: {'lr': 0.0003447336409848124, 'samples': 11076864, 'steps': 57691, 'loss/train': 1.365451693534851} -11/07/2021 05:19:37 - INFO - __main__ - Step 57693: {'lr': 0.0003447287299777091, 'samples': 11077056, 'steps': 57692, 'loss/train': 1.5198798179626465} -11/07/2021 05:19:37 - INFO - __main__ - Step 57694: {'lr': 0.0003447238189279225, 'samples': 11077248, 'steps': 57693, 'loss/train': 1.849091649055481} -11/07/2021 05:19:37 - INFO - __main__ - Step 57695: {'lr': 0.0003447189078354548, 'samples': 11077440, 'steps': 57694, 'loss/train': 1.4110535383224487} -11/07/2021 05:19:38 - INFO - __main__ - Step 57696: {'lr': 0.00034471399670030824, 'samples': 11077632, 'steps': 57695, 'loss/train': 1.1762892007827759} -11/07/2021 05:19:38 - INFO - __main__ - Step 57697: {'lr': 0.00034470908552248504, 'samples': 11077824, 'steps': 57696, 'loss/train': 1.0973211526870728} -11/07/2021 05:19:38 - INFO - __main__ - Step 57698: {'lr': 0.00034470417430198743, 'samples': 11078016, 'steps': 57697, 'loss/train': 1.0146803855895996} -11/07/2021 05:19:40 - INFO - __main__ - Step 57699: {'lr': 0.00034469926303881747, 'samples': 11078208, 'steps': 57698, 'loss/train': 1.2770438194274902} -11/07/2021 05:19:40 - INFO - __main__ - Step 57700: {'lr': 0.0003446943517329776, 'samples': 11078400, 'steps': 57699, 'loss/train': 1.2319482564926147} -11/07/2021 05:19:40 - INFO - __main__ - Step 57701: {'lr': 0.0003446894403844698, 'samples': 11078592, 'steps': 57700, 'loss/train': 1.2217903137207031} -11/07/2021 05:19:41 - INFO - __main__ - Step 57702: {'lr': 0.0003446845289932965, 'samples': 11078784, 'steps': 57701, 'loss/train': 1.4680088758468628} -11/07/2021 05:19:41 - INFO - __main__ - Step 57703: {'lr': 0.0003446796175594598, 'samples': 11078976, 'steps': 57702, 'loss/train': 0.3309529423713684} -11/07/2021 05:19:42 - INFO - __main__ - Step 57704: {'lr': 0.00034467470608296185, 'samples': 11079168, 'steps': 57703, 'loss/train': 1.5323333740234375} -11/07/2021 05:19:42 - INFO - __main__ - Step 57705: {'lr': 0.00034466979456380497, 'samples': 11079360, 'steps': 57704, 'loss/train': 1.2461626529693604} -11/07/2021 05:19:43 - INFO - __main__ - Step 57706: {'lr': 0.0003446648830019914, 'samples': 11079552, 'steps': 57705, 'loss/train': 1.397922158241272} -11/07/2021 05:19:43 - INFO - __main__ - Step 57707: {'lr': 0.00034465997139752327, 'samples': 11079744, 'steps': 57706, 'loss/train': 1.5268123149871826} -11/07/2021 05:19:43 - INFO - __main__ - Step 57708: {'lr': 0.00034465505975040273, 'samples': 11079936, 'steps': 57707, 'loss/train': 0.03303880989551544} -11/07/2021 05:19:44 - INFO - __main__ - Step 57709: {'lr': 0.0003446501480606322, 'samples': 11080128, 'steps': 57708, 'loss/train': 1.4570459127426147} -11/07/2021 05:19:45 - INFO - __main__ - Step 57710: {'lr': 0.0003446452363282137, 'samples': 11080320, 'steps': 57709, 'loss/train': 1.3838202953338623} -11/07/2021 05:19:45 - INFO - __main__ - Step 57711: {'lr': 0.00034464032455314955, 'samples': 11080512, 'steps': 57710, 'loss/train': 1.2123501300811768} -11/07/2021 05:19:45 - INFO - __main__ - Step 57712: {'lr': 0.0003446354127354419, 'samples': 11080704, 'steps': 57711, 'loss/train': 1.649638056755066} -11/07/2021 05:19:46 - INFO - __main__ - Step 57713: {'lr': 0.000344630500875093, 'samples': 11080896, 'steps': 57712, 'loss/train': 1.2207626104354858} -11/07/2021 05:19:47 - INFO - __main__ - Step 57714: {'lr': 0.0003446255889721051, 'samples': 11081088, 'steps': 57713, 'loss/train': 1.644190788269043} -11/07/2021 05:19:47 - INFO - __main__ - Step 57715: {'lr': 0.00034462067702648036, 'samples': 11081280, 'steps': 57714, 'loss/train': 1.2539130449295044} -11/07/2021 05:19:47 - INFO - __main__ - Step 57716: {'lr': 0.000344615765038221, 'samples': 11081472, 'steps': 57715, 'loss/train': 1.253875494003296} -11/07/2021 05:19:48 - INFO - __main__ - Step 57717: {'lr': 0.0003446108530073292, 'samples': 11081664, 'steps': 57716, 'loss/train': 1.1340068578720093} -11/07/2021 05:19:48 - INFO - __main__ - Step 57718: {'lr': 0.0003446059409338072, 'samples': 11081856, 'steps': 57717, 'loss/train': 0.8219293355941772} -11/07/2021 05:19:49 - INFO - __main__ - Step 57719: {'lr': 0.00034460102881765723, 'samples': 11082048, 'steps': 57718, 'loss/train': 1.338723063468933} -11/07/2021 05:19:50 - INFO - __main__ - Step 57720: {'lr': 0.0003445961166588816, 'samples': 11082240, 'steps': 57719, 'loss/train': 1.2686856985092163} -11/07/2021 05:19:50 - INFO - __main__ - Step 57721: {'lr': 0.0003445912044574823, 'samples': 11082432, 'steps': 57720, 'loss/train': 1.2591438293457031} -11/07/2021 05:19:50 - INFO - __main__ - Step 57722: {'lr': 0.00034458629221346173, 'samples': 11082624, 'steps': 57721, 'loss/train': 1.7226529121398926} -11/07/2021 05:19:51 - INFO - __main__ - Step 57723: {'lr': 0.000344581379926822, 'samples': 11082816, 'steps': 57722, 'loss/train': 1.2006354331970215} -11/07/2021 05:19:52 - INFO - __main__ - Step 57724: {'lr': 0.00034457646759756535, 'samples': 11083008, 'steps': 57723, 'loss/train': 1.7096425294876099} -11/07/2021 05:19:52 - INFO - __main__ - Step 57725: {'lr': 0.00034457155522569393, 'samples': 11083200, 'steps': 57724, 'loss/train': 1.5500774383544922} -11/07/2021 05:19:52 - INFO - __main__ - Step 57726: {'lr': 0.00034456664281121017, 'samples': 11083392, 'steps': 57725, 'loss/train': 1.4748237133026123} -11/07/2021 05:19:53 - INFO - __main__ - Step 57727: {'lr': 0.00034456173035411606, 'samples': 11083584, 'steps': 57726, 'loss/train': 1.2925790548324585} -11/07/2021 05:19:53 - INFO - __main__ - Step 57728: {'lr': 0.00034455681785441395, 'samples': 11083776, 'steps': 57727, 'loss/train': 1.6779370307922363} -11/07/2021 05:19:54 - INFO - __main__ - Step 57729: {'lr': 0.00034455190531210595, 'samples': 11083968, 'steps': 57728, 'loss/train': 1.0728123188018799} -11/07/2021 05:19:55 - INFO - __main__ - Step 57730: {'lr': 0.0003445469927271944, 'samples': 11084160, 'steps': 57729, 'loss/train': 1.1827887296676636} -11/07/2021 05:19:55 - INFO - __main__ - Step 57731: {'lr': 0.0003445420800996813, 'samples': 11084352, 'steps': 57730, 'loss/train': 1.102344036102295} -11/07/2021 05:19:55 - INFO - __main__ - Step 57732: {'lr': 0.0003445371674295691, 'samples': 11084544, 'steps': 57731, 'loss/train': 1.6247098445892334} -11/07/2021 05:19:56 - INFO - __main__ - Step 57733: {'lr': 0.0003445322547168599, 'samples': 11084736, 'steps': 57732, 'loss/train': 1.6746764183044434} -11/07/2021 05:19:57 - INFO - __main__ - Step 57734: {'lr': 0.0003445273419615559, 'samples': 11084928, 'steps': 57733, 'loss/train': 1.0753048658370972} -11/07/2021 05:19:57 - INFO - __main__ - Step 57735: {'lr': 0.00034452242916365935, 'samples': 11085120, 'steps': 57734, 'loss/train': 1.6022965908050537} -11/07/2021 05:19:58 - INFO - __main__ - Step 57736: {'lr': 0.0003445175163231724, 'samples': 11085312, 'steps': 57735, 'loss/train': 1.5820335149765015} -11/07/2021 05:19:58 - INFO - __main__ - Step 57737: {'lr': 0.00034451260344009737, 'samples': 11085504, 'steps': 57736, 'loss/train': 1.6642982959747314} -11/07/2021 05:19:58 - INFO - __main__ - Step 57738: {'lr': 0.00034450769051443635, 'samples': 11085696, 'steps': 57737, 'loss/train': 1.0080724954605103} -11/07/2021 05:19:59 - INFO - __main__ - Step 57739: {'lr': 0.0003445027775461917, 'samples': 11085888, 'steps': 57738, 'loss/train': 1.4903745651245117} -11/07/2021 05:20:00 - INFO - __main__ - Step 57740: {'lr': 0.0003444978645353656, 'samples': 11086080, 'steps': 57739, 'loss/train': 0.07775591313838959} -11/07/2021 05:20:00 - INFO - __main__ - Step 57741: {'lr': 0.0003444929514819601, 'samples': 11086272, 'steps': 57740, 'loss/train': 1.0781891345977783} -11/07/2021 05:20:01 - INFO - __main__ - Step 57742: {'lr': 0.00034448803838597766, 'samples': 11086464, 'steps': 57741, 'loss/train': 2.499934673309326} -11/07/2021 05:20:01 - INFO - __main__ - Step 57743: {'lr': 0.00034448312524742027, 'samples': 11086656, 'steps': 57742, 'loss/train': 1.4848999977111816} -11/07/2021 05:20:01 - INFO - __main__ - Step 57744: {'lr': 0.00034447821206629026, 'samples': 11086848, 'steps': 57743, 'loss/train': 1.5241488218307495} -11/07/2021 05:20:02 - INFO - __main__ - Step 57745: {'lr': 0.0003444732988425898, 'samples': 11087040, 'steps': 57744, 'loss/train': 1.348928451538086} -11/07/2021 05:20:03 - INFO - __main__ - Step 57746: {'lr': 0.0003444683855763212, 'samples': 11087232, 'steps': 57745, 'loss/train': 1.2769927978515625} -11/07/2021 05:20:03 - INFO - __main__ - Step 57747: {'lr': 0.0003444634722674866, 'samples': 11087424, 'steps': 57746, 'loss/train': 1.7812557220458984} -11/07/2021 05:20:03 - INFO - __main__ - Step 57748: {'lr': 0.0003444585589160882, 'samples': 11087616, 'steps': 57747, 'loss/train': 1.227088451385498} -11/07/2021 05:20:04 - INFO - __main__ - Step 57749: {'lr': 0.0003444536455221282, 'samples': 11087808, 'steps': 57748, 'loss/train': 1.3041777610778809} -11/07/2021 05:20:04 - INFO - __main__ - Step 57750: {'lr': 0.00034444873208560884, 'samples': 11088000, 'steps': 57749, 'loss/train': 1.9908219575881958} -11/07/2021 05:20:05 - INFO - __main__ - Step 57751: {'lr': 0.00034444381860653233, 'samples': 11088192, 'steps': 57750, 'loss/train': 1.521040678024292} -11/07/2021 05:20:05 - INFO - __main__ - Step 57752: {'lr': 0.00034443890508490093, 'samples': 11088384, 'steps': 57751, 'loss/train': 1.2209283113479614} -11/07/2021 05:20:06 - INFO - __main__ - Step 57753: {'lr': 0.0003444339915207168, 'samples': 11088576, 'steps': 57752, 'loss/train': 1.6212396621704102} -11/07/2021 05:20:06 - INFO - __main__ - Step 57754: {'lr': 0.0003444290779139823, 'samples': 11088768, 'steps': 57753, 'loss/train': 1.6818703413009644} -11/07/2021 05:20:07 - INFO - __main__ - Step 57755: {'lr': 0.00034442416426469936, 'samples': 11088960, 'steps': 57754, 'loss/train': 1.79239022731781} -11/07/2021 05:20:08 - INFO - __main__ - Step 57756: {'lr': 0.0003444192505728704, 'samples': 11089152, 'steps': 57755, 'loss/train': 1.2616841793060303} -11/07/2021 05:20:08 - INFO - __main__ - Step 57757: {'lr': 0.0003444143368384975, 'samples': 11089344, 'steps': 57756, 'loss/train': 1.4383338689804077} -11/07/2021 05:20:08 - INFO - __main__ - Step 57758: {'lr': 0.000344409423061583, 'samples': 11089536, 'steps': 57757, 'loss/train': 1.6081862449645996} -11/07/2021 05:20:09 - INFO - __main__ - Step 57759: {'lr': 0.00034440450924212913, 'samples': 11089728, 'steps': 57758, 'loss/train': 1.5299433469772339} -11/07/2021 05:20:09 - INFO - __main__ - Step 57760: {'lr': 0.00034439959538013805, 'samples': 11089920, 'steps': 57759, 'loss/train': 1.4348293542861938} -11/07/2021 05:20:10 - INFO - __main__ - Step 57761: {'lr': 0.0003443946814756119, 'samples': 11090112, 'steps': 57760, 'loss/train': 1.2355751991271973} -11/07/2021 05:20:10 - INFO - __main__ - Step 57762: {'lr': 0.000344389767528553, 'samples': 11090304, 'steps': 57761, 'loss/train': 0.541526198387146} -11/07/2021 05:20:11 - INFO - __main__ - Step 57763: {'lr': 0.0003443848535389635, 'samples': 11090496, 'steps': 57762, 'loss/train': 1.4673749208450317} -11/07/2021 05:20:11 - INFO - __main__ - Step 57764: {'lr': 0.00034437993950684566, 'samples': 11090688, 'steps': 57763, 'loss/train': 1.3057758808135986} -11/07/2021 05:20:11 - INFO - __main__ - Step 57765: {'lr': 0.00034437502543220166, 'samples': 11090880, 'steps': 57764, 'loss/train': 1.5854928493499756} -11/07/2021 05:20:12 - INFO - __main__ - Step 57766: {'lr': 0.0003443701113150337, 'samples': 11091072, 'steps': 57765, 'loss/train': 0.4549166262149811} -11/07/2021 05:20:13 - INFO - __main__ - Step 57767: {'lr': 0.00034436519715534415, 'samples': 11091264, 'steps': 57766, 'loss/train': 1.3708440065383911} -11/07/2021 05:20:13 - INFO - __main__ - Step 57768: {'lr': 0.00034436028295313503, 'samples': 11091456, 'steps': 57767, 'loss/train': 1.161154866218567} -11/07/2021 05:20:13 - INFO - __main__ - Step 57769: {'lr': 0.00034435536870840855, 'samples': 11091648, 'steps': 57768, 'loss/train': 1.197624683380127} -11/07/2021 05:20:14 - INFO - __main__ - Step 57770: {'lr': 0.0003443504544211671, 'samples': 11091840, 'steps': 57769, 'loss/train': 1.1574995517730713} -11/07/2021 05:20:15 - INFO - __main__ - Step 57771: {'lr': 0.0003443455400914127, 'samples': 11092032, 'steps': 57770, 'loss/train': 1.2135539054870605} -11/07/2021 05:20:15 - INFO - __main__ - Step 57772: {'lr': 0.0003443406257191477, 'samples': 11092224, 'steps': 57771, 'loss/train': 1.3909350633621216} -11/07/2021 05:20:16 - INFO - __main__ - Step 57773: {'lr': 0.0003443357113043743, 'samples': 11092416, 'steps': 57772, 'loss/train': 1.4927105903625488} -11/07/2021 05:20:16 - INFO - __main__ - Step 57774: {'lr': 0.00034433079684709466, 'samples': 11092608, 'steps': 57773, 'loss/train': 1.1110316514968872} -11/07/2021 05:20:16 - INFO - __main__ - Step 57775: {'lr': 0.000344325882347311, 'samples': 11092800, 'steps': 57774, 'loss/train': 1.4093879461288452} -11/07/2021 05:20:17 - INFO - __main__ - Step 57776: {'lr': 0.00034432096780502564, 'samples': 11092992, 'steps': 57775, 'loss/train': 1.352190613746643} -11/07/2021 05:20:18 - INFO - __main__ - Step 57777: {'lr': 0.0003443160532202406, 'samples': 11093184, 'steps': 57776, 'loss/train': 0.969149649143219} -11/07/2021 05:20:18 - INFO - __main__ - Step 57778: {'lr': 0.00034431113859295827, 'samples': 11093376, 'steps': 57777, 'loss/train': 1.5390814542770386} -11/07/2021 05:20:18 - INFO - __main__ - Step 57779: {'lr': 0.00034430622392318073, 'samples': 11093568, 'steps': 57778, 'loss/train': 1.5301694869995117} -11/07/2021 05:20:19 - INFO - __main__ - Step 57780: {'lr': 0.0003443013092109103, 'samples': 11093760, 'steps': 57779, 'loss/train': 1.3802093267440796} -11/07/2021 05:20:20 - INFO - __main__ - Step 57781: {'lr': 0.0003442963944561492, 'samples': 11093952, 'steps': 57780, 'loss/train': 1.5616902112960815} -11/07/2021 05:20:20 - INFO - __main__ - Step 57782: {'lr': 0.0003442914796588995, 'samples': 11094144, 'steps': 57781, 'loss/train': 2.0523765087127686} -11/07/2021 05:20:20 - INFO - __main__ - Step 57783: {'lr': 0.00034428656481916357, 'samples': 11094336, 'steps': 57782, 'loss/train': 0.9525910019874573} -11/07/2021 05:20:21 - INFO - __main__ - Step 57784: {'lr': 0.00034428164993694356, 'samples': 11094528, 'steps': 57783, 'loss/train': 1.1512936353683472} -11/07/2021 05:20:21 - INFO - __main__ - Step 57785: {'lr': 0.0003442767350122417, 'samples': 11094720, 'steps': 57784, 'loss/train': 1.297159194946289} -11/07/2021 05:20:22 - INFO - __main__ - Step 57786: {'lr': 0.0003442718200450602, 'samples': 11094912, 'steps': 57785, 'loss/train': 1.5386817455291748} -11/07/2021 05:20:22 - INFO - __main__ - Step 57787: {'lr': 0.0003442669050354013, 'samples': 11095104, 'steps': 57786, 'loss/train': 1.2106409072875977} -11/07/2021 05:20:23 - INFO - __main__ - Step 57788: {'lr': 0.00034426198998326713, 'samples': 11095296, 'steps': 57787, 'loss/train': 1.3910138607025146} -11/07/2021 05:20:23 - INFO - __main__ - Step 57789: {'lr': 0.00034425707488866, 'samples': 11095488, 'steps': 57788, 'loss/train': 1.5607638359069824} -11/07/2021 05:20:23 - INFO - __main__ - Step 57790: {'lr': 0.0003442521597515821, 'samples': 11095680, 'steps': 57789, 'loss/train': 0.755548894405365} -11/07/2021 05:20:24 - INFO - __main__ - Step 57791: {'lr': 0.00034424724457203553, 'samples': 11095872, 'steps': 57790, 'loss/train': 1.1952698230743408} -11/07/2021 05:20:25 - INFO - __main__ - Step 57792: {'lr': 0.0003442423293500227, 'samples': 11096064, 'steps': 57791, 'loss/train': 1.4297170639038086} -11/07/2021 05:20:25 - INFO - __main__ - Step 57793: {'lr': 0.0003442374140855457, 'samples': 11096256, 'steps': 57792, 'loss/train': 1.6370017528533936} -11/07/2021 05:20:25 - INFO - __main__ - Step 57794: {'lr': 0.00034423249877860683, 'samples': 11096448, 'steps': 57793, 'loss/train': 0.8426752090454102} -11/07/2021 05:20:26 - INFO - __main__ - Step 57795: {'lr': 0.0003442275834292082, 'samples': 11096640, 'steps': 57794, 'loss/train': 1.2816393375396729} -11/07/2021 05:20:27 - INFO - __main__ - Step 57796: {'lr': 0.0003442226680373521, 'samples': 11096832, 'steps': 57795, 'loss/train': 1.638270616531372} -11/07/2021 05:20:27 - INFO - __main__ - Step 57797: {'lr': 0.00034421775260304067, 'samples': 11097024, 'steps': 57796, 'loss/train': 1.542790412902832} -11/07/2021 05:20:28 - INFO - __main__ - Step 57798: {'lr': 0.0003442128371262762, 'samples': 11097216, 'steps': 57797, 'loss/train': 1.4426237344741821} -11/07/2021 05:20:28 - INFO - __main__ - Step 57799: {'lr': 0.00034420792160706087, 'samples': 11097408, 'steps': 57798, 'loss/train': 0.5713027715682983} -11/07/2021 05:20:28 - INFO - __main__ - Step 57800: {'lr': 0.0003442030060453969, 'samples': 11097600, 'steps': 57799, 'loss/train': 1.7395669221878052} -11/07/2021 05:20:29 - INFO - __main__ - Step 57801: {'lr': 0.0003441980904412866, 'samples': 11097792, 'steps': 57800, 'loss/train': 1.0744584798812866} -11/07/2021 05:20:30 - INFO - __main__ - Step 57802: {'lr': 0.000344193174794732, 'samples': 11097984, 'steps': 57801, 'loss/train': 2.3064522743225098} -11/07/2021 05:20:30 - INFO - __main__ - Step 57803: {'lr': 0.00034418825910573545, 'samples': 11098176, 'steps': 57802, 'loss/train': 1.4305062294006348} -11/07/2021 05:20:31 - INFO - __main__ - Step 57804: {'lr': 0.00034418334337429907, 'samples': 11098368, 'steps': 57803, 'loss/train': 0.11569163203239441} -11/07/2021 05:20:31 - INFO - __main__ - Step 57805: {'lr': 0.00034417842760042517, 'samples': 11098560, 'steps': 57804, 'loss/train': 1.8115553855895996} -11/07/2021 05:20:32 - INFO - __main__ - Step 57806: {'lr': 0.0003441735117841159, 'samples': 11098752, 'steps': 57805, 'loss/train': 1.549162745475769} -11/07/2021 05:20:32 - INFO - __main__ - Step 57807: {'lr': 0.0003441685959253736, 'samples': 11098944, 'steps': 57806, 'loss/train': 1.1044977903366089} -11/07/2021 05:20:33 - INFO - __main__ - Step 57808: {'lr': 0.0003441636800242003, 'samples': 11099136, 'steps': 57807, 'loss/train': 1.107480525970459} -11/07/2021 05:20:33 - INFO - __main__ - Step 57809: {'lr': 0.0003441587640805983, 'samples': 11099328, 'steps': 57808, 'loss/train': 1.224845290184021} -11/07/2021 05:20:34 - INFO - __main__ - Step 57810: {'lr': 0.0003441538480945697, 'samples': 11099520, 'steps': 57809, 'loss/train': 1.0226614475250244} -11/07/2021 05:20:34 - INFO - __main__ - Step 57811: {'lr': 0.00034414893206611695, 'samples': 11099712, 'steps': 57810, 'loss/train': 1.5952225923538208} -11/07/2021 05:20:35 - INFO - __main__ - Step 57812: {'lr': 0.0003441440159952422, 'samples': 11099904, 'steps': 57811, 'loss/train': 1.1762220859527588} -11/07/2021 05:20:36 - INFO - __main__ - Step 57813: {'lr': 0.00034413909988194753, 'samples': 11100096, 'steps': 57812, 'loss/train': 1.836982011795044} -11/07/2021 05:20:36 - INFO - __main__ - Step 57814: {'lr': 0.0003441341837262353, 'samples': 11100288, 'steps': 57813, 'loss/train': 0.7086502909660339} -11/07/2021 05:20:36 - INFO - __main__ - Step 57815: {'lr': 0.00034412926752810756, 'samples': 11100480, 'steps': 57814, 'loss/train': 0.8831301331520081} -11/07/2021 05:20:37 - INFO - __main__ - Step 57816: {'lr': 0.0003441243512875667, 'samples': 11100672, 'steps': 57815, 'loss/train': 1.4944149255752563} -11/07/2021 05:20:38 - INFO - __main__ - Step 57817: {'lr': 0.00034411943500461484, 'samples': 11100864, 'steps': 57816, 'loss/train': 1.751255750656128} -11/07/2021 05:20:38 - INFO - __main__ - Step 57818: {'lr': 0.0003441145186792542, 'samples': 11101056, 'steps': 57817, 'loss/train': 1.6801643371582031} -11/07/2021 05:20:38 - INFO - __main__ - Step 57819: {'lr': 0.000344109602311487, 'samples': 11101248, 'steps': 57818, 'loss/train': 1.4103548526763916} -11/07/2021 05:20:39 - INFO - __main__ - Step 57820: {'lr': 0.0003441046859013155, 'samples': 11101440, 'steps': 57819, 'loss/train': 1.3571488857269287} -11/07/2021 05:20:39 - INFO - __main__ - Step 57821: {'lr': 0.00034409976944874186, 'samples': 11101632, 'steps': 57820, 'loss/train': 1.3241790533065796} -11/07/2021 05:20:40 - INFO - __main__ - Step 57822: {'lr': 0.0003440948529537683, 'samples': 11101824, 'steps': 57821, 'loss/train': 1.1724662780761719} -11/07/2021 05:20:40 - INFO - __main__ - Step 57823: {'lr': 0.00034408993641639707, 'samples': 11102016, 'steps': 57822, 'loss/train': 1.1723467111587524} -11/07/2021 05:20:41 - INFO - __main__ - Step 57824: {'lr': 0.0003440850198366304, 'samples': 11102208, 'steps': 57823, 'loss/train': 1.08247971534729} -11/07/2021 05:20:41 - INFO - __main__ - Step 57825: {'lr': 0.0003440801032144704, 'samples': 11102400, 'steps': 57824, 'loss/train': 1.039486050605774} -11/07/2021 05:20:42 - INFO - __main__ - Step 57826: {'lr': 0.00034407518654991945, 'samples': 11102592, 'steps': 57825, 'loss/train': 1.1007189750671387} -11/07/2021 05:20:43 - INFO - __main__ - Step 57827: {'lr': 0.00034407026984297964, 'samples': 11102784, 'steps': 57826, 'loss/train': 1.5922685861587524} -11/07/2021 05:20:43 - INFO - __main__ - Step 57828: {'lr': 0.00034406535309365317, 'samples': 11102976, 'steps': 57827, 'loss/train': 1.230177402496338} -11/07/2021 05:20:43 - INFO - __main__ - Step 57829: {'lr': 0.0003440604363019423, 'samples': 11103168, 'steps': 57828, 'loss/train': 1.265795111656189} -11/07/2021 05:20:44 - INFO - __main__ - Step 57830: {'lr': 0.0003440555194678493, 'samples': 11103360, 'steps': 57829, 'loss/train': 1.4641492366790771} -11/07/2021 05:20:44 - INFO - __main__ - Step 57831: {'lr': 0.0003440506025913763, 'samples': 11103552, 'steps': 57830, 'loss/train': 1.6361924409866333} -11/07/2021 05:20:45 - INFO - __main__ - Step 57832: {'lr': 0.0003440456856725256, 'samples': 11103744, 'steps': 57831, 'loss/train': 1.487054467201233} -11/07/2021 05:20:45 - INFO - __main__ - Step 57833: {'lr': 0.0003440407687112993, 'samples': 11103936, 'steps': 57832, 'loss/train': 1.1568161249160767} -11/07/2021 05:20:46 - INFO - __main__ - Step 57834: {'lr': 0.0003440358517076997, 'samples': 11104128, 'steps': 57833, 'loss/train': 1.13609778881073} -11/07/2021 05:20:46 - INFO - __main__ - Step 57835: {'lr': 0.00034403093466172903, 'samples': 11104320, 'steps': 57834, 'loss/train': 1.3248300552368164} -11/07/2021 05:20:46 - INFO - __main__ - Step 57836: {'lr': 0.00034402601757338946, 'samples': 11104512, 'steps': 57835, 'loss/train': 1.3437557220458984} -11/07/2021 05:20:47 - INFO - __main__ - Step 57837: {'lr': 0.00034402110044268327, 'samples': 11104704, 'steps': 57836, 'loss/train': 1.1121588945388794} -11/07/2021 05:20:48 - INFO - __main__ - Step 57838: {'lr': 0.00034401618326961253, 'samples': 11104896, 'steps': 57837, 'loss/train': 1.7878296375274658} -11/07/2021 05:20:48 - INFO - __main__ - Step 57839: {'lr': 0.0003440112660541795, 'samples': 11105088, 'steps': 57838, 'loss/train': 1.859351396560669} -11/07/2021 05:20:48 - INFO - __main__ - Step 57840: {'lr': 0.0003440063487963866, 'samples': 11105280, 'steps': 57839, 'loss/train': 1.1802302598953247} -11/07/2021 05:20:49 - INFO - __main__ - Step 57841: {'lr': 0.00034400143149623574, 'samples': 11105472, 'steps': 57840, 'loss/train': 1.8758044242858887} -11/07/2021 05:20:50 - INFO - __main__ - Step 57842: {'lr': 0.0003439965141537294, 'samples': 11105664, 'steps': 57841, 'loss/train': 1.8026816844940186} -11/07/2021 05:20:50 - INFO - __main__ - Step 57843: {'lr': 0.00034399159676886965, 'samples': 11105856, 'steps': 57842, 'loss/train': 0.5418456792831421} -11/07/2021 05:20:51 - INFO - __main__ - Step 57844: {'lr': 0.00034398667934165873, 'samples': 11106048, 'steps': 57843, 'loss/train': 0.05089479684829712} -11/07/2021 05:20:51 - INFO - __main__ - Step 57845: {'lr': 0.00034398176187209887, 'samples': 11106240, 'steps': 57844, 'loss/train': 1.1053050756454468} -11/07/2021 05:20:51 - INFO - __main__ - Step 57846: {'lr': 0.0003439768443601923, 'samples': 11106432, 'steps': 57845, 'loss/train': 1.5870858430862427} -11/07/2021 05:20:52 - INFO - __main__ - Step 57847: {'lr': 0.0003439719268059411, 'samples': 11106624, 'steps': 57846, 'loss/train': 1.7755992412567139} -11/07/2021 05:20:53 - INFO - __main__ - Step 57848: {'lr': 0.0003439670092093478, 'samples': 11106816, 'steps': 57847, 'loss/train': 0.8469088673591614} -11/07/2021 05:20:53 - INFO - __main__ - Step 57849: {'lr': 0.00034396209157041424, 'samples': 11107008, 'steps': 57848, 'loss/train': 1.2248122692108154} -11/07/2021 05:20:53 - INFO - __main__ - Step 57850: {'lr': 0.0003439571738891428, 'samples': 11107200, 'steps': 57849, 'loss/train': 0.9531872868537903} -11/07/2021 05:20:54 - INFO - __main__ - Step 57851: {'lr': 0.00034395225616553585, 'samples': 11107392, 'steps': 57850, 'loss/train': 1.5660516023635864} -11/07/2021 05:20:54 - INFO - __main__ - Step 57852: {'lr': 0.00034394733839959534, 'samples': 11107584, 'steps': 57851, 'loss/train': 1.6531728506088257} -11/07/2021 05:20:55 - INFO - __main__ - Step 57853: {'lr': 0.0003439424205913236, 'samples': 11107776, 'steps': 57852, 'loss/train': 1.7772634029388428} -11/07/2021 05:20:56 - INFO - __main__ - Step 57854: {'lr': 0.000343937502740723, 'samples': 11107968, 'steps': 57853, 'loss/train': 1.7304883003234863} -11/07/2021 05:20:56 - INFO - __main__ - Step 57855: {'lr': 0.00034393258484779555, 'samples': 11108160, 'steps': 57854, 'loss/train': 1.537498116493225} -11/07/2021 05:20:56 - INFO - __main__ - Step 57856: {'lr': 0.0003439276669125435, 'samples': 11108352, 'steps': 57855, 'loss/train': 1.427783727645874} -11/07/2021 05:20:57 - INFO - __main__ - Step 57857: {'lr': 0.00034392274893496903, 'samples': 11108544, 'steps': 57856, 'loss/train': 1.1278772354125977} -11/07/2021 05:20:58 - INFO - __main__ - Step 57858: {'lr': 0.0003439178309150745, 'samples': 11108736, 'steps': 57857, 'loss/train': 1.3305517435073853} -11/07/2021 05:20:58 - INFO - __main__ - Step 57859: {'lr': 0.000343912912852862, 'samples': 11108928, 'steps': 57858, 'loss/train': 1.2788364887237549} -11/07/2021 05:20:58 - INFO - __main__ - Step 57860: {'lr': 0.00034390799474833385, 'samples': 11109120, 'steps': 57859, 'loss/train': 0.5940954089164734} -11/07/2021 05:20:59 - INFO - __main__ - Step 57861: {'lr': 0.0003439030766014922, 'samples': 11109312, 'steps': 57860, 'loss/train': 1.5349797010421753} -11/07/2021 05:20:59 - INFO - __main__ - Step 57862: {'lr': 0.0003438981584123392, 'samples': 11109504, 'steps': 57861, 'loss/train': 1.8759766817092896} -11/07/2021 05:21:00 - INFO - __main__ - Step 57863: {'lr': 0.0003438932401808772, 'samples': 11109696, 'steps': 57862, 'loss/train': 0.8557454943656921} -11/07/2021 05:21:01 - INFO - __main__ - Step 57864: {'lr': 0.0003438883219071083, 'samples': 11109888, 'steps': 57863, 'loss/train': 1.0207797288894653} -11/07/2021 05:21:01 - INFO - __main__ - Step 57865: {'lr': 0.00034388340359103485, 'samples': 11110080, 'steps': 57864, 'loss/train': 1.1741703748703003} -11/07/2021 05:21:01 - INFO - __main__ - Step 57866: {'lr': 0.0003438784852326589, 'samples': 11110272, 'steps': 57865, 'loss/train': 0.4235229194164276} -11/07/2021 05:21:02 - INFO - __main__ - Step 57867: {'lr': 0.0003438735668319828, 'samples': 11110464, 'steps': 57866, 'loss/train': 1.6470001935958862} -11/07/2021 05:21:03 - INFO - __main__ - Step 57868: {'lr': 0.00034386864838900877, 'samples': 11110656, 'steps': 57867, 'loss/train': 1.5702577829360962} -11/07/2021 05:21:03 - INFO - __main__ - Step 57869: {'lr': 0.00034386372990373893, 'samples': 11110848, 'steps': 57868, 'loss/train': 1.312443733215332} -11/07/2021 05:21:03 - INFO - __main__ - Step 57870: {'lr': 0.0003438588113761755, 'samples': 11111040, 'steps': 57869, 'loss/train': 0.07350760698318481} -11/07/2021 05:21:04 - INFO - __main__ - Step 57871: {'lr': 0.00034385389280632077, 'samples': 11111232, 'steps': 57870, 'loss/train': 1.0477763414382935} -11/07/2021 05:21:04 - INFO - __main__ - Step 57872: {'lr': 0.00034384897419417694, 'samples': 11111424, 'steps': 57871, 'loss/train': 0.7560630440711975} -11/07/2021 05:21:05 - INFO - __main__ - Step 57873: {'lr': 0.0003438440555397462, 'samples': 11111616, 'steps': 57872, 'loss/train': 1.059000015258789} -11/07/2021 05:21:06 - INFO - __main__ - Step 57874: {'lr': 0.00034383913684303075, 'samples': 11111808, 'steps': 57873, 'loss/train': 1.5997111797332764} -11/07/2021 05:21:06 - INFO - __main__ - Step 57875: {'lr': 0.00034383421810403294, 'samples': 11112000, 'steps': 57874, 'loss/train': 1.3373414278030396} -11/07/2021 05:21:07 - INFO - __main__ - Step 57876: {'lr': 0.00034382929932275476, 'samples': 11112192, 'steps': 57875, 'loss/train': 1.5026295185089111} -11/07/2021 05:21:07 - INFO - __main__ - Step 57877: {'lr': 0.0003438243804991986, 'samples': 11112384, 'steps': 57876, 'loss/train': 1.6113172769546509} -11/07/2021 05:21:08 - INFO - __main__ - Step 57878: {'lr': 0.0003438194616333666, 'samples': 11112576, 'steps': 57877, 'loss/train': 0.31013643741607666} -11/07/2021 05:21:08 - INFO - __main__ - Step 57879: {'lr': 0.00034381454272526096, 'samples': 11112768, 'steps': 57878, 'loss/train': 1.2493027448654175} -11/07/2021 05:21:09 - INFO - __main__ - Step 57880: {'lr': 0.000343809623774884, 'samples': 11112960, 'steps': 57879, 'loss/train': 1.2290037870407104} -11/07/2021 05:21:09 - INFO - __main__ - Step 57881: {'lr': 0.0003438047047822379, 'samples': 11113152, 'steps': 57880, 'loss/train': 1.3986181020736694} -11/07/2021 05:21:09 - INFO - __main__ - Step 57882: {'lr': 0.0003437997857473248, 'samples': 11113344, 'steps': 57881, 'loss/train': 1.0933270454406738} -11/07/2021 05:21:10 - INFO - __main__ - Step 57883: {'lr': 0.0003437948666701469, 'samples': 11113536, 'steps': 57882, 'loss/train': 0.9028867483139038} -11/07/2021 05:21:11 - INFO - __main__ - Step 57884: {'lr': 0.00034378994755070657, 'samples': 11113728, 'steps': 57883, 'loss/train': 1.2105731964111328} -11/07/2021 05:21:11 - INFO - __main__ - Step 57885: {'lr': 0.00034378502838900587, 'samples': 11113920, 'steps': 57884, 'loss/train': 1.6737838983535767} -11/07/2021 05:21:11 - INFO - __main__ - Step 57886: {'lr': 0.00034378010918504714, 'samples': 11114112, 'steps': 57885, 'loss/train': 1.116660714149475} -11/07/2021 05:21:12 - INFO - __main__ - Step 57887: {'lr': 0.0003437751899388325, 'samples': 11114304, 'steps': 57886, 'loss/train': 1.4971961975097656} -11/07/2021 05:21:13 - INFO - __main__ - Step 57888: {'lr': 0.00034377027065036423, 'samples': 11114496, 'steps': 57887, 'loss/train': 1.456732153892517} -11/07/2021 05:21:13 - INFO - __main__ - Step 57889: {'lr': 0.0003437653513196446, 'samples': 11114688, 'steps': 57888, 'loss/train': 1.1172996759414673} -11/07/2021 05:21:14 - INFO - __main__ - Step 57890: {'lr': 0.0003437604319466756, 'samples': 11114880, 'steps': 57889, 'loss/train': 1.5059787034988403} -11/07/2021 05:21:14 - INFO - __main__ - Step 57891: {'lr': 0.0003437555125314597, 'samples': 11115072, 'steps': 57890, 'loss/train': 0.9523252248764038} -11/07/2021 05:21:14 - INFO - __main__ - Step 57892: {'lr': 0.00034375059307399896, 'samples': 11115264, 'steps': 57891, 'loss/train': 1.4915522336959839} -11/07/2021 05:21:15 - INFO - __main__ - Step 57893: {'lr': 0.00034374567357429563, 'samples': 11115456, 'steps': 57892, 'loss/train': 1.5016074180603027} -11/07/2021 05:21:16 - INFO - __main__ - Step 57894: {'lr': 0.000343740754032352, 'samples': 11115648, 'steps': 57893, 'loss/train': 1.9699833393096924} -11/07/2021 05:21:16 - INFO - __main__ - Step 57895: {'lr': 0.00034373583444817024, 'samples': 11115840, 'steps': 57894, 'loss/train': 1.5629128217697144} -11/07/2021 05:21:17 - INFO - __main__ - Step 57896: {'lr': 0.0003437309148217526, 'samples': 11116032, 'steps': 57895, 'loss/train': 1.4169114828109741} -11/07/2021 05:21:17 - INFO - __main__ - Step 57897: {'lr': 0.00034372599515310117, 'samples': 11116224, 'steps': 57896, 'loss/train': 1.3311491012573242} -11/07/2021 05:21:17 - INFO - __main__ - Step 57898: {'lr': 0.00034372107544221824, 'samples': 11116416, 'steps': 57897, 'loss/train': 1.322851538658142} -11/07/2021 05:21:18 - INFO - __main__ - Step 57899: {'lr': 0.00034371615568910607, 'samples': 11116608, 'steps': 57898, 'loss/train': 1.0532596111297607} -11/07/2021 05:21:19 - INFO - __main__ - Step 57900: {'lr': 0.00034371123589376683, 'samples': 11116800, 'steps': 57899, 'loss/train': 1.5819395780563354} -11/07/2021 05:21:19 - INFO - __main__ - Step 57901: {'lr': 0.00034370631605620285, 'samples': 11116992, 'steps': 57900, 'loss/train': 1.5906492471694946} -11/07/2021 05:21:19 - INFO - __main__ - Step 57902: {'lr': 0.0003437013961764162, 'samples': 11117184, 'steps': 57901, 'loss/train': 1.4747021198272705} -11/07/2021 05:21:20 - INFO - __main__ - Step 57903: {'lr': 0.00034369647625440906, 'samples': 11117376, 'steps': 57902, 'loss/train': 1.3367058038711548} -11/07/2021 05:21:21 - INFO - __main__ - Step 57904: {'lr': 0.00034369155629018376, 'samples': 11117568, 'steps': 57903, 'loss/train': 1.4811495542526245} -11/07/2021 05:21:21 - INFO - __main__ - Step 57905: {'lr': 0.00034368663628374255, 'samples': 11117760, 'steps': 57904, 'loss/train': 1.115447759628296} -11/07/2021 05:21:22 - INFO - __main__ - Step 57906: {'lr': 0.0003436817162350876, 'samples': 11117952, 'steps': 57905, 'loss/train': 1.1253905296325684} -11/07/2021 05:21:22 - INFO - __main__ - Step 57907: {'lr': 0.00034367679614422103, 'samples': 11118144, 'steps': 57906, 'loss/train': 1.396866798400879} -11/07/2021 05:21:22 - INFO - __main__ - Step 57908: {'lr': 0.0003436718760111452, 'samples': 11118336, 'steps': 57907, 'loss/train': 1.3769924640655518} -11/07/2021 05:21:23 - INFO - __main__ - Step 57909: {'lr': 0.0003436669558358623, 'samples': 11118528, 'steps': 57908, 'loss/train': 1.8341175317764282} -11/07/2021 05:21:24 - INFO - __main__ - Step 57910: {'lr': 0.00034366203561837446, 'samples': 11118720, 'steps': 57909, 'loss/train': 1.081642508506775} -11/07/2021 05:21:24 - INFO - __main__ - Step 57911: {'lr': 0.00034365711535868396, 'samples': 11118912, 'steps': 57910, 'loss/train': 1.3062201738357544} -11/07/2021 05:21:24 - INFO - __main__ - Step 57912: {'lr': 0.000343652195056793, 'samples': 11119104, 'steps': 57911, 'loss/train': 1.5675636529922485} -11/07/2021 05:21:25 - INFO - __main__ - Step 57913: {'lr': 0.0003436472747127038, 'samples': 11119296, 'steps': 57912, 'loss/train': 1.618319034576416} -11/07/2021 05:21:26 - INFO - __main__ - Step 57914: {'lr': 0.0003436423543264186, 'samples': 11119488, 'steps': 57913, 'loss/train': 1.3111189603805542} -11/07/2021 05:21:26 - INFO - __main__ - Step 57915: {'lr': 0.00034363743389793965, 'samples': 11119680, 'steps': 57914, 'loss/train': 1.3982800245285034} -11/07/2021 05:21:26 - INFO - __main__ - Step 57916: {'lr': 0.0003436325134272691, 'samples': 11119872, 'steps': 57915, 'loss/train': 1.8558919429779053} -11/07/2021 05:21:27 - INFO - __main__ - Step 57917: {'lr': 0.0003436275929144091, 'samples': 11120064, 'steps': 57916, 'loss/train': 0.7404921054840088} -11/07/2021 05:21:27 - INFO - __main__ - Step 57918: {'lr': 0.000343622672359362, 'samples': 11120256, 'steps': 57917, 'loss/train': 1.2649706602096558} -11/07/2021 05:21:28 - INFO - __main__ - Step 57919: {'lr': 0.0003436177517621299, 'samples': 11120448, 'steps': 57918, 'loss/train': 1.645738959312439} -11/07/2021 05:21:29 - INFO - __main__ - Step 57920: {'lr': 0.0003436128311227152, 'samples': 11120640, 'steps': 57919, 'loss/train': 1.0767428874969482} -11/07/2021 05:21:29 - INFO - __main__ - Step 57921: {'lr': 0.00034360791044111996, 'samples': 11120832, 'steps': 57920, 'loss/train': 1.6540600061416626} -11/07/2021 05:21:29 - INFO - __main__ - Step 57922: {'lr': 0.00034360298971734647, 'samples': 11121024, 'steps': 57921, 'loss/train': 0.6858277916908264} -11/07/2021 05:21:30 - INFO - __main__ - Step 57923: {'lr': 0.00034359806895139686, 'samples': 11121216, 'steps': 57922, 'loss/train': 1.1156251430511475} -11/07/2021 05:21:31 - INFO - __main__ - Step 57924: {'lr': 0.0003435931481432735, 'samples': 11121408, 'steps': 57923, 'loss/train': 1.3785035610198975} -11/07/2021 05:21:31 - INFO - __main__ - Step 57925: {'lr': 0.00034358822729297847, 'samples': 11121600, 'steps': 57924, 'loss/train': 2.4129350185394287} -11/07/2021 05:21:31 - INFO - __main__ - Step 57926: {'lr': 0.00034358330640051396, 'samples': 11121792, 'steps': 57925, 'loss/train': 1.0540449619293213} -11/07/2021 05:21:32 - INFO - __main__ - Step 57927: {'lr': 0.0003435783854658823, 'samples': 11121984, 'steps': 57926, 'loss/train': 0.7716109156608582} -11/07/2021 05:21:32 - INFO - __main__ - Step 57928: {'lr': 0.00034357346448908566, 'samples': 11122176, 'steps': 57927, 'loss/train': 1.7647292613983154} -11/07/2021 05:21:32 - INFO - __main__ - Step 57929: {'lr': 0.00034356854347012626, 'samples': 11122368, 'steps': 57928, 'loss/train': 5.723478317260742} -11/07/2021 05:21:34 - INFO - __main__ - Step 57930: {'lr': 0.00034356362240900635, 'samples': 11122560, 'steps': 57929, 'loss/train': 1.1204917430877686} -11/07/2021 05:21:34 - INFO - __main__ - Step 57931: {'lr': 0.0003435587013057281, 'samples': 11122752, 'steps': 57930, 'loss/train': 1.4171696901321411} -11/07/2021 05:21:34 - INFO - __main__ - Step 57932: {'lr': 0.0003435537801602937, 'samples': 11122944, 'steps': 57931, 'loss/train': 0.584794819355011} -11/07/2021 05:21:35 - INFO - __main__ - Step 57933: {'lr': 0.00034354885897270546, 'samples': 11123136, 'steps': 57932, 'loss/train': 0.9820351600646973} -11/07/2021 05:21:35 - INFO - __main__ - Step 57934: {'lr': 0.0003435439377429655, 'samples': 11123328, 'steps': 57933, 'loss/train': 1.352911353111267} -11/07/2021 05:21:36 - INFO - __main__ - Step 57935: {'lr': 0.00034353901647107615, 'samples': 11123520, 'steps': 57934, 'loss/train': 1.4055920839309692} -11/07/2021 05:21:36 - INFO - __main__ - Step 57936: {'lr': 0.0003435340951570395, 'samples': 11123712, 'steps': 57935, 'loss/train': 1.2950204610824585} -11/07/2021 05:21:37 - INFO - __main__ - Step 57937: {'lr': 0.00034352917380085784, 'samples': 11123904, 'steps': 57936, 'loss/train': 1.9416735172271729} -11/07/2021 05:21:37 - INFO - __main__ - Step 57938: {'lr': 0.00034352425240253344, 'samples': 11124096, 'steps': 57937, 'loss/train': 1.0612602233886719} -11/07/2021 05:21:37 - INFO - __main__ - Step 57939: {'lr': 0.0003435193309620684, 'samples': 11124288, 'steps': 57938, 'loss/train': 1.3730577230453491} -11/07/2021 05:21:38 - INFO - __main__ - Step 57940: {'lr': 0.000343514409479465, 'samples': 11124480, 'steps': 57939, 'loss/train': 1.103216290473938} -11/07/2021 05:21:39 - INFO - __main__ - Step 57941: {'lr': 0.00034350948795472543, 'samples': 11124672, 'steps': 57940, 'loss/train': 1.063675880432129} -11/07/2021 05:21:39 - INFO - __main__ - Step 57942: {'lr': 0.000343504566387852, 'samples': 11124864, 'steps': 57941, 'loss/train': 1.0157917737960815} -11/07/2021 05:21:40 - INFO - __main__ - Step 57943: {'lr': 0.0003434996447788468, 'samples': 11125056, 'steps': 57942, 'loss/train': 1.411668062210083} -11/07/2021 05:21:40 - INFO - __main__ - Step 57944: {'lr': 0.0003434947231277121, 'samples': 11125248, 'steps': 57943, 'loss/train': 1.6276054382324219} -11/07/2021 05:21:40 - INFO - __main__ - Step 57945: {'lr': 0.0003434898014344501, 'samples': 11125440, 'steps': 57944, 'loss/train': 1.142353892326355} -11/07/2021 05:21:42 - INFO - __main__ - Step 57946: {'lr': 0.00034348487969906307, 'samples': 11125632, 'steps': 57945, 'loss/train': 2.2820980548858643} -11/07/2021 05:21:42 - INFO - __main__ - Step 57947: {'lr': 0.00034347995792155316, 'samples': 11125824, 'steps': 57946, 'loss/train': 1.163718819618225} -11/07/2021 05:21:42 - INFO - __main__ - Step 57948: {'lr': 0.00034347503610192265, 'samples': 11126016, 'steps': 57947, 'loss/train': 1.7779464721679688} -11/07/2021 05:21:43 - INFO - __main__ - Step 57949: {'lr': 0.0003434701142401738, 'samples': 11126208, 'steps': 57948, 'loss/train': 1.4960453510284424} -11/07/2021 05:21:43 - INFO - __main__ - Step 57950: {'lr': 0.0003434651923363087, 'samples': 11126400, 'steps': 57949, 'loss/train': 0.7504159808158875} -11/07/2021 05:21:44 - INFO - __main__ - Step 57951: {'lr': 0.0003434602703903296, 'samples': 11126592, 'steps': 57950, 'loss/train': 1.6045472621917725} -11/07/2021 05:21:44 - INFO - __main__ - Step 57952: {'lr': 0.0003434553484022388, 'samples': 11126784, 'steps': 57951, 'loss/train': 0.257572740316391} -11/07/2021 05:21:45 - INFO - __main__ - Step 57953: {'lr': 0.0003434504263720384, 'samples': 11126976, 'steps': 57952, 'loss/train': 1.4461199045181274} -11/07/2021 05:21:45 - INFO - __main__ - Step 57954: {'lr': 0.0003434455042997307, 'samples': 11127168, 'steps': 57953, 'loss/train': 1.3689465522766113} -11/07/2021 05:21:45 - INFO - __main__ - Step 57955: {'lr': 0.00034344058218531794, 'samples': 11127360, 'steps': 57954, 'loss/train': 1.4795900583267212} -11/07/2021 05:21:47 - INFO - __main__ - Step 57956: {'lr': 0.0003434356600288023, 'samples': 11127552, 'steps': 57955, 'loss/train': 1.458519458770752} -11/07/2021 05:21:47 - INFO - __main__ - Step 57957: {'lr': 0.00034343073783018593, 'samples': 11127744, 'steps': 57956, 'loss/train': 1.0316636562347412} -11/07/2021 05:21:47 - INFO - __main__ - Step 57958: {'lr': 0.00034342581558947113, 'samples': 11127936, 'steps': 57957, 'loss/train': 1.6033358573913574} -11/07/2021 05:21:48 - INFO - __main__ - Step 57959: {'lr': 0.00034342089330666, 'samples': 11128128, 'steps': 57958, 'loss/train': 1.5310497283935547} -11/07/2021 05:21:48 - INFO - __main__ - Step 57960: {'lr': 0.00034341597098175503, 'samples': 11128320, 'steps': 57959, 'loss/train': 1.3717107772827148} -11/07/2021 05:21:49 - INFO - __main__ - Step 57961: {'lr': 0.0003434110486147582, 'samples': 11128512, 'steps': 57960, 'loss/train': 1.3544975519180298} -11/07/2021 05:21:50 - INFO - __main__ - Step 57962: {'lr': 0.0003434061262056718, 'samples': 11128704, 'steps': 57961, 'loss/train': 1.8260358572006226} -11/07/2021 05:21:50 - INFO - __main__ - Step 57963: {'lr': 0.0003434012037544981, 'samples': 11128896, 'steps': 57962, 'loss/train': 1.7426804304122925} -11/07/2021 05:21:50 - INFO - __main__ - Step 57964: {'lr': 0.0003433962812612391, 'samples': 11129088, 'steps': 57963, 'loss/train': 1.6939276456832886} -11/07/2021 05:21:51 - INFO - __main__ - Step 57965: {'lr': 0.0003433913587258973, 'samples': 11129280, 'steps': 57964, 'loss/train': 0.47931137681007385} -11/07/2021 05:21:51 - INFO - __main__ - Step 57966: {'lr': 0.0003433864361484748, 'samples': 11129472, 'steps': 57965, 'loss/train': 0.7440065145492554} -11/07/2021 05:21:52 - INFO - __main__ - Step 57967: {'lr': 0.00034338151352897376, 'samples': 11129664, 'steps': 57966, 'loss/train': 1.2602134943008423} -11/07/2021 05:21:52 - INFO - __main__ - Step 57968: {'lr': 0.00034337659086739646, 'samples': 11129856, 'steps': 57967, 'loss/train': 1.6563085317611694} -11/07/2021 05:21:53 - INFO - __main__ - Step 57969: {'lr': 0.0003433716681637451, 'samples': 11130048, 'steps': 57968, 'loss/train': 1.4218497276306152} -11/07/2021 05:21:53 - INFO - __main__ - Step 57970: {'lr': 0.0003433667454180219, 'samples': 11130240, 'steps': 57969, 'loss/train': 1.4764411449432373} -11/07/2021 05:21:53 - INFO - __main__ - Step 57971: {'lr': 0.00034336182263022916, 'samples': 11130432, 'steps': 57970, 'loss/train': 1.9545987844467163} -11/07/2021 05:21:55 - INFO - __main__ - Step 57972: {'lr': 0.000343356899800369, 'samples': 11130624, 'steps': 57971, 'loss/train': 1.9532370567321777} -11/07/2021 05:21:55 - INFO - __main__ - Step 57973: {'lr': 0.0003433519769284436, 'samples': 11130816, 'steps': 57972, 'loss/train': 0.43979793787002563} -11/07/2021 05:21:55 - INFO - __main__ - Step 57974: {'lr': 0.00034334705401445527, 'samples': 11131008, 'steps': 57973, 'loss/train': 1.2245796918869019} -11/07/2021 05:21:56 - INFO - __main__ - Step 57975: {'lr': 0.00034334213105840616, 'samples': 11131200, 'steps': 57974, 'loss/train': 1.6564574241638184} -11/07/2021 05:21:56 - INFO - __main__ - Step 57976: {'lr': 0.00034333720806029863, 'samples': 11131392, 'steps': 57975, 'loss/train': 1.4846664667129517} -11/07/2021 05:21:57 - INFO - __main__ - Step 57977: {'lr': 0.00034333228502013473, 'samples': 11131584, 'steps': 57976, 'loss/train': 1.1061686277389526} -11/07/2021 05:21:57 - INFO - __main__ - Step 57978: {'lr': 0.00034332736193791675, 'samples': 11131776, 'steps': 57977, 'loss/train': 1.5870442390441895} -11/07/2021 05:21:58 - INFO - __main__ - Step 57979: {'lr': 0.0003433224388136469, 'samples': 11131968, 'steps': 57978, 'loss/train': 1.3707860708236694} -11/07/2021 05:21:58 - INFO - __main__ - Step 57980: {'lr': 0.0003433175156473274, 'samples': 11132160, 'steps': 57979, 'loss/train': 1.1279058456420898} -11/07/2021 05:21:58 - INFO - __main__ - Step 57981: {'lr': 0.0003433125924389604, 'samples': 11132352, 'steps': 57980, 'loss/train': 1.3661913871765137} -11/07/2021 05:21:59 - INFO - __main__ - Step 57982: {'lr': 0.00034330766918854827, 'samples': 11132544, 'steps': 57981, 'loss/train': 1.43588125705719} -11/07/2021 05:22:00 - INFO - __main__ - Step 57983: {'lr': 0.0003433027458960932, 'samples': 11132736, 'steps': 57982, 'loss/train': 1.4345775842666626} -11/07/2021 05:22:00 - INFO - __main__ - Step 57984: {'lr': 0.00034329782256159724, 'samples': 11132928, 'steps': 57983, 'loss/train': 1.5670498609542847} -11/07/2021 05:22:00 - INFO - __main__ - Step 57985: {'lr': 0.00034329289918506276, 'samples': 11133120, 'steps': 57984, 'loss/train': 0.8577389717102051} -11/07/2021 05:22:01 - INFO - __main__ - Step 57986: {'lr': 0.0003432879757664919, 'samples': 11133312, 'steps': 57985, 'loss/train': 0.9772616028785706} -11/07/2021 05:22:02 - INFO - __main__ - Step 57987: {'lr': 0.00034328305230588694, 'samples': 11133504, 'steps': 57986, 'loss/train': 1.9733684062957764} -11/07/2021 05:22:02 - INFO - __main__ - Step 57988: {'lr': 0.0003432781288032501, 'samples': 11133696, 'steps': 57987, 'loss/train': 1.7668211460113525} -11/07/2021 05:22:03 - INFO - __main__ - Step 57989: {'lr': 0.00034327320525858357, 'samples': 11133888, 'steps': 57988, 'loss/train': 1.6571251153945923} -11/07/2021 05:22:03 - INFO - __main__ - Step 57990: {'lr': 0.00034326828167188957, 'samples': 11134080, 'steps': 57989, 'loss/train': 1.3920128345489502} -11/07/2021 05:22:03 - INFO - __main__ - Step 57991: {'lr': 0.0003432633580431703, 'samples': 11134272, 'steps': 57990, 'loss/train': 1.3259575366973877} -11/07/2021 05:22:04 - INFO - __main__ - Step 57992: {'lr': 0.00034325843437242804, 'samples': 11134464, 'steps': 57991, 'loss/train': 1.3787813186645508} -11/07/2021 05:22:05 - INFO - __main__ - Step 57993: {'lr': 0.0003432535106596649, 'samples': 11134656, 'steps': 57992, 'loss/train': 1.1121562719345093} -11/07/2021 05:22:05 - INFO - __main__ - Step 57994: {'lr': 0.00034324858690488324, 'samples': 11134848, 'steps': 57993, 'loss/train': 0.5191564559936523} -11/07/2021 05:22:05 - INFO - __main__ - Step 57995: {'lr': 0.0003432436631080851, 'samples': 11135040, 'steps': 57994, 'loss/train': 1.6217098236083984} -11/07/2021 05:22:06 - INFO - __main__ - Step 57996: {'lr': 0.00034323873926927296, 'samples': 11135232, 'steps': 57995, 'loss/train': 1.472947359085083} -11/07/2021 05:22:06 - INFO - __main__ - Step 57997: {'lr': 0.00034323381538844884, 'samples': 11135424, 'steps': 57996, 'loss/train': 0.7900754809379578} -11/07/2021 05:22:07 - INFO - __main__ - Step 57998: {'lr': 0.0003432288914656149, 'samples': 11135616, 'steps': 57997, 'loss/train': 1.040427327156067} -11/07/2021 05:22:08 - INFO - __main__ - Step 57999: {'lr': 0.00034322396750077354, 'samples': 11135808, 'steps': 57998, 'loss/train': 1.0184991359710693} -11/07/2021 05:22:08 - INFO - __main__ - Step 58000: {'lr': 0.0003432190434939269, 'samples': 11136000, 'steps': 57999, 'loss/train': 1.4191187620162964} -11/07/2021 05:22:08 - INFO - __main__ - Step 58001: {'lr': 0.0003432141194450772, 'samples': 11136192, 'steps': 58000, 'loss/train': 1.4723877906799316} -11/07/2021 05:22:09 - INFO - __main__ - Step 58002: {'lr': 0.0003432091953542267, 'samples': 11136384, 'steps': 58001, 'loss/train': 1.513293981552124} -11/07/2021 05:22:10 - INFO - __main__ - Step 58003: {'lr': 0.00034320427122137745, 'samples': 11136576, 'steps': 58002, 'loss/train': 1.0501506328582764} -11/07/2021 05:22:10 - INFO - __main__ - Step 58004: {'lr': 0.0003431993470465319, 'samples': 11136768, 'steps': 58003, 'loss/train': 1.3065688610076904} -11/07/2021 05:22:10 - INFO - __main__ - Step 58005: {'lr': 0.00034319442282969206, 'samples': 11136960, 'steps': 58004, 'loss/train': 0.4899785816669464} -11/07/2021 05:22:11 - INFO - __main__ - Step 58006: {'lr': 0.0003431894985708603, 'samples': 11137152, 'steps': 58005, 'loss/train': 1.4666774272918701} -11/07/2021 05:22:11 - INFO - __main__ - Step 58007: {'lr': 0.0003431845742700388, 'samples': 11137344, 'steps': 58006, 'loss/train': 1.3265217542648315} -11/07/2021 05:22:12 - INFO - __main__ - Step 58008: {'lr': 0.00034317964992722975, 'samples': 11137536, 'steps': 58007, 'loss/train': 1.5669384002685547} -11/07/2021 05:22:12 - INFO - __main__ - Step 58009: {'lr': 0.00034317472554243545, 'samples': 11137728, 'steps': 58008, 'loss/train': 0.9563673138618469} -11/07/2021 05:22:13 - INFO - __main__ - Step 58010: {'lr': 0.00034316980111565796, 'samples': 11137920, 'steps': 58009, 'loss/train': 1.1143641471862793} -11/07/2021 05:22:13 - INFO - __main__ - Step 58011: {'lr': 0.00034316487664689974, 'samples': 11138112, 'steps': 58010, 'loss/train': 0.9312244057655334} -11/07/2021 05:22:13 - INFO - __main__ - Step 58012: {'lr': 0.00034315995213616266, 'samples': 11138304, 'steps': 58011, 'loss/train': 1.4314597845077515} -11/07/2021 05:22:14 - INFO - __main__ - Step 58013: {'lr': 0.0003431550275834493, 'samples': 11138496, 'steps': 58012, 'loss/train': 1.2774111032485962} -11/07/2021 05:22:15 - INFO - __main__ - Step 58014: {'lr': 0.0003431501029887617, 'samples': 11138688, 'steps': 58013, 'loss/train': 1.5383182764053345} -11/07/2021 05:22:15 - INFO - __main__ - Step 58015: {'lr': 0.00034314517835210207, 'samples': 11138880, 'steps': 58014, 'loss/train': 1.4472438097000122} -11/07/2021 05:22:16 - INFO - __main__ - Step 58016: {'lr': 0.00034314025367347266, 'samples': 11139072, 'steps': 58015, 'loss/train': 1.0739012956619263} -11/07/2021 05:22:16 - INFO - __main__ - Step 58017: {'lr': 0.00034313532895287574, 'samples': 11139264, 'steps': 58016, 'loss/train': 1.1794275045394897} -11/07/2021 05:22:17 - INFO - __main__ - Step 58018: {'lr': 0.00034313040419031336, 'samples': 11139456, 'steps': 58017, 'loss/train': 1.309901237487793} -11/07/2021 05:22:17 - INFO - __main__ - Step 58019: {'lr': 0.00034312547938578796, 'samples': 11139648, 'steps': 58018, 'loss/train': 1.4783639907836914} -11/07/2021 05:22:18 - INFO - __main__ - Step 58020: {'lr': 0.0003431205545393016, 'samples': 11139840, 'steps': 58019, 'loss/train': 1.6573526859283447} -11/07/2021 05:22:18 - INFO - __main__ - Step 58021: {'lr': 0.00034311562965085664, 'samples': 11140032, 'steps': 58020, 'loss/train': 1.2112683057785034} -11/07/2021 05:22:18 - INFO - __main__ - Step 58022: {'lr': 0.0003431107047204552, 'samples': 11140224, 'steps': 58021, 'loss/train': 1.7318570613861084} -11/07/2021 05:22:19 - INFO - __main__ - Step 58023: {'lr': 0.00034310577974809944, 'samples': 11140416, 'steps': 58022, 'loss/train': 1.3370510339736938} -11/07/2021 05:22:20 - INFO - __main__ - Step 58024: {'lr': 0.0003431008547337917, 'samples': 11140608, 'steps': 58023, 'loss/train': 1.460934042930603} -11/07/2021 05:22:20 - INFO - __main__ - Step 58025: {'lr': 0.0003430959296775341, 'samples': 11140800, 'steps': 58024, 'loss/train': 1.3419275283813477} -11/07/2021 05:22:21 - INFO - __main__ - Step 58026: {'lr': 0.00034309100457932895, 'samples': 11140992, 'steps': 58025, 'loss/train': 1.6616933345794678} -11/07/2021 05:22:21 - INFO - __main__ - Step 58027: {'lr': 0.0003430860794391784, 'samples': 11141184, 'steps': 58026, 'loss/train': 1.6319591999053955} -11/07/2021 05:22:22 - INFO - __main__ - Step 58028: {'lr': 0.00034308115425708477, 'samples': 11141376, 'steps': 58027, 'loss/train': 1.709490418434143} -11/07/2021 05:22:22 - INFO - __main__ - Step 58029: {'lr': 0.0003430762290330501, 'samples': 11141568, 'steps': 58028, 'loss/train': 1.3632644414901733} -11/07/2021 05:22:22 - INFO - __main__ - Step 58030: {'lr': 0.00034307130376707684, 'samples': 11141760, 'steps': 58029, 'loss/train': 1.4385491609573364} -11/07/2021 05:22:23 - INFO - __main__ - Step 58031: {'lr': 0.000343066378459167, 'samples': 11141952, 'steps': 58030, 'loss/train': 1.7479932308197021} -11/07/2021 05:22:23 - INFO - __main__ - Step 58032: {'lr': 0.00034306145310932293, 'samples': 11142144, 'steps': 58031, 'loss/train': 0.8931760787963867} -11/07/2021 05:22:24 - INFO - __main__ - Step 58033: {'lr': 0.0003430565277175468, 'samples': 11142336, 'steps': 58032, 'loss/train': 1.4687832593917847} -11/07/2021 05:22:25 - INFO - __main__ - Step 58034: {'lr': 0.0003430516022838408, 'samples': 11142528, 'steps': 58033, 'loss/train': 1.2242742776870728} -11/07/2021 05:22:25 - INFO - __main__ - Step 58035: {'lr': 0.00034304667680820714, 'samples': 11142720, 'steps': 58034, 'loss/train': 1.1620845794677734} -11/07/2021 05:22:25 - INFO - __main__ - Step 58036: {'lr': 0.0003430417512906482, 'samples': 11142912, 'steps': 58035, 'loss/train': 1.0705658197402954} -11/07/2021 05:22:26 - INFO - __main__ - Step 58037: {'lr': 0.0003430368257311661, 'samples': 11143104, 'steps': 58036, 'loss/train': 1.4266974925994873} -11/07/2021 05:22:26 - INFO - __main__ - Step 58038: {'lr': 0.0003430319001297629, 'samples': 11143296, 'steps': 58037, 'loss/train': 0.85700923204422} -11/07/2021 05:22:27 - INFO - __main__ - Step 58039: {'lr': 0.00034302697448644105, 'samples': 11143488, 'steps': 58038, 'loss/train': 1.4314415454864502} -11/07/2021 05:22:27 - INFO - __main__ - Step 58040: {'lr': 0.00034302204880120267, 'samples': 11143680, 'steps': 58039, 'loss/train': 1.265537142753601} -11/07/2021 05:22:28 - INFO - __main__ - Step 58041: {'lr': 0.00034301712307404996, 'samples': 11143872, 'steps': 58040, 'loss/train': 1.2173185348510742} -11/07/2021 05:22:28 - INFO - __main__ - Step 58042: {'lr': 0.00034301219730498524, 'samples': 11144064, 'steps': 58041, 'loss/train': 1.1953152418136597} -11/07/2021 05:22:28 - INFO - __main__ - Step 58043: {'lr': 0.00034300727149401064, 'samples': 11144256, 'steps': 58042, 'loss/train': 1.4818683862686157} -11/07/2021 05:22:29 - INFO - __main__ - Step 58044: {'lr': 0.00034300234564112837, 'samples': 11144448, 'steps': 58043, 'loss/train': 1.2073689699172974} -11/07/2021 05:22:30 - INFO - __main__ - Step 58045: {'lr': 0.0003429974197463407, 'samples': 11144640, 'steps': 58044, 'loss/train': 1.2426390647888184} -11/07/2021 05:22:30 - INFO - __main__ - Step 58046: {'lr': 0.00034299249380964977, 'samples': 11144832, 'steps': 58045, 'loss/train': 2.0916635990142822} -11/07/2021 05:22:30 - INFO - __main__ - Step 58047: {'lr': 0.0003429875678310579, 'samples': 11145024, 'steps': 58046, 'loss/train': 1.402531623840332} -11/07/2021 05:22:31 - INFO - __main__ - Step 58048: {'lr': 0.0003429826418105673, 'samples': 11145216, 'steps': 58047, 'loss/train': 1.5624163150787354} -11/07/2021 05:22:32 - INFO - __main__ - Step 58049: {'lr': 0.0003429777157481801, 'samples': 11145408, 'steps': 58048, 'loss/train': 1.217465877532959} -11/07/2021 05:22:32 - INFO - __main__ - Step 58050: {'lr': 0.0003429727896438986, 'samples': 11145600, 'steps': 58049, 'loss/train': 1.2060452699661255} -11/07/2021 05:22:32 - INFO - __main__ - Step 58051: {'lr': 0.00034296786349772494, 'samples': 11145792, 'steps': 58050, 'loss/train': 1.6606749296188354} -11/07/2021 05:22:33 - INFO - __main__ - Step 58052: {'lr': 0.0003429629373096615, 'samples': 11145984, 'steps': 58051, 'loss/train': 1.473239779472351} -11/07/2021 05:22:33 - INFO - __main__ - Step 58053: {'lr': 0.0003429580110797103, 'samples': 11146176, 'steps': 58052, 'loss/train': 0.9374370574951172} -11/07/2021 05:22:34 - INFO - __main__ - Step 58054: {'lr': 0.0003429530848078737, 'samples': 11146368, 'steps': 58053, 'loss/train': 1.3914765119552612} -11/07/2021 05:22:34 - INFO - __main__ - Step 58055: {'lr': 0.0003429481584941538, 'samples': 11146560, 'steps': 58054, 'loss/train': 1.4052411317825317} -11/07/2021 05:22:35 - INFO - __main__ - Step 58056: {'lr': 0.0003429432321385531, 'samples': 11146752, 'steps': 58055, 'loss/train': 1.6026771068572998} -11/07/2021 05:22:35 - INFO - __main__ - Step 58057: {'lr': 0.00034293830574107345, 'samples': 11146944, 'steps': 58056, 'loss/train': 1.494822382926941} -11/07/2021 05:22:36 - INFO - __main__ - Step 58058: {'lr': 0.0003429333793017173, 'samples': 11147136, 'steps': 58057, 'loss/train': 0.8916078209877014} -11/07/2021 05:22:37 - INFO - __main__ - Step 58059: {'lr': 0.00034292845282048667, 'samples': 11147328, 'steps': 58058, 'loss/train': 1.2187190055847168} -11/07/2021 05:22:37 - INFO - __main__ - Step 58060: {'lr': 0.00034292352629738406, 'samples': 11147520, 'steps': 58059, 'loss/train': 0.9712035655975342} -11/07/2021 05:22:37 - INFO - __main__ - Step 58061: {'lr': 0.00034291859973241146, 'samples': 11147712, 'steps': 58060, 'loss/train': 0.9141193628311157} -11/07/2021 05:22:38 - INFO - __main__ - Step 58062: {'lr': 0.0003429136731255712, 'samples': 11147904, 'steps': 58061, 'loss/train': 1.4545624256134033} -11/07/2021 05:22:38 - INFO - __main__ - Step 58063: {'lr': 0.0003429087464768655, 'samples': 11148096, 'steps': 58062, 'loss/train': 1.2438966035842896} -11/07/2021 05:22:39 - INFO - __main__ - Step 58064: {'lr': 0.00034290381978629655, 'samples': 11148288, 'steps': 58063, 'loss/train': 1.4399888515472412} -11/07/2021 05:22:39 - INFO - __main__ - Step 58065: {'lr': 0.00034289889305386654, 'samples': 11148480, 'steps': 58064, 'loss/train': 1.438434362411499} -11/07/2021 05:22:40 - INFO - __main__ - Step 58066: {'lr': 0.0003428939662795777, 'samples': 11148672, 'steps': 58065, 'loss/train': 1.2491456270217896} -11/07/2021 05:22:40 - INFO - __main__ - Step 58067: {'lr': 0.0003428890394634323, 'samples': 11148864, 'steps': 58066, 'loss/train': 1.3859294652938843} -11/07/2021 05:22:40 - INFO - __main__ - Step 58068: {'lr': 0.0003428841126054326, 'samples': 11149056, 'steps': 58067, 'loss/train': 1.482081413269043} -11/07/2021 05:22:42 - INFO - __main__ - Step 58069: {'lr': 0.0003428791857055806, 'samples': 11149248, 'steps': 58068, 'loss/train': 1.2527201175689697} -11/07/2021 05:22:42 - INFO - __main__ - Step 58070: {'lr': 0.0003428742587638788, 'samples': 11149440, 'steps': 58069, 'loss/train': 0.22418178617954254} -11/07/2021 05:22:42 - INFO - __main__ - Step 58071: {'lr': 0.0003428693317803293, 'samples': 11149632, 'steps': 58070, 'loss/train': 1.7594146728515625} -11/07/2021 05:22:43 - INFO - __main__ - Step 58072: {'lr': 0.00034286440475493423, 'samples': 11149824, 'steps': 58071, 'loss/train': 1.462848424911499} -11/07/2021 05:22:43 - INFO - __main__ - Step 58073: {'lr': 0.0003428594776876959, 'samples': 11150016, 'steps': 58072, 'loss/train': 1.330108880996704} -11/07/2021 05:22:44 - INFO - __main__ - Step 58074: {'lr': 0.0003428545505786166, 'samples': 11150208, 'steps': 58073, 'loss/train': 1.428093433380127} -11/07/2021 05:22:44 - INFO - __main__ - Step 58075: {'lr': 0.0003428496234276984, 'samples': 11150400, 'steps': 58074, 'loss/train': 1.7277567386627197} -11/07/2021 05:22:45 - INFO - __main__ - Step 58076: {'lr': 0.0003428446962349437, 'samples': 11150592, 'steps': 58075, 'loss/train': 1.0090595483779907} -11/07/2021 05:22:45 - INFO - __main__ - Step 58077: {'lr': 0.0003428397690003545, 'samples': 11150784, 'steps': 58076, 'loss/train': 1.258705496788025} -11/07/2021 05:22:45 - INFO - __main__ - Step 58078: {'lr': 0.00034283484172393315, 'samples': 11150976, 'steps': 58077, 'loss/train': 1.2631856203079224} -11/07/2021 05:22:47 - INFO - __main__ - Step 58079: {'lr': 0.0003428299144056818, 'samples': 11151168, 'steps': 58078, 'loss/train': 1.2879300117492676} -11/07/2021 05:22:47 - INFO - __main__ - Step 58080: {'lr': 0.00034282498704560284, 'samples': 11151360, 'steps': 58079, 'loss/train': 1.1683639287948608} -11/07/2021 05:22:47 - INFO - __main__ - Step 58081: {'lr': 0.0003428200596436983, 'samples': 11151552, 'steps': 58080, 'loss/train': 1.3141639232635498} -11/07/2021 05:22:48 - INFO - __main__ - Step 58082: {'lr': 0.00034281513219997054, 'samples': 11151744, 'steps': 58081, 'loss/train': 1.1433618068695068} -11/07/2021 05:22:48 - INFO - __main__ - Step 58083: {'lr': 0.0003428102047144217, 'samples': 11151936, 'steps': 58082, 'loss/train': 1.0904260873794556} -11/07/2021 05:22:48 - INFO - __main__ - Step 58084: {'lr': 0.00034280527718705397, 'samples': 11152128, 'steps': 58083, 'loss/train': 1.9198188781738281} -11/07/2021 05:22:50 - INFO - __main__ - Step 58085: {'lr': 0.0003428003496178696, 'samples': 11152320, 'steps': 58084, 'loss/train': 1.529852032661438} -11/07/2021 05:22:50 - INFO - __main__ - Step 58086: {'lr': 0.00034279542200687087, 'samples': 11152512, 'steps': 58085, 'loss/train': 1.5440113544464111} -11/07/2021 05:22:50 - INFO - __main__ - Step 58087: {'lr': 0.0003427904943540599, 'samples': 11152704, 'steps': 58086, 'loss/train': 1.61406672000885} -11/07/2021 05:22:51 - INFO - __main__ - Step 58088: {'lr': 0.000342785566659439, 'samples': 11152896, 'steps': 58087, 'loss/train': 1.048874855041504} -11/07/2021 05:22:52 - INFO - __main__ - Step 58089: {'lr': 0.00034278063892301036, 'samples': 11153088, 'steps': 58088, 'loss/train': 0.7622469067573547} -11/07/2021 05:22:52 - INFO - __main__ - Step 58090: {'lr': 0.00034277571114477623, 'samples': 11153280, 'steps': 58089, 'loss/train': 0.9306669235229492} -11/07/2021 05:22:52 - INFO - __main__ - Step 58091: {'lr': 0.0003427707833247388, 'samples': 11153472, 'steps': 58090, 'loss/train': 1.3199565410614014} -11/07/2021 05:22:53 - INFO - __main__ - Step 58092: {'lr': 0.0003427658554629002, 'samples': 11153664, 'steps': 58091, 'loss/train': 1.4994642734527588} -11/07/2021 05:22:53 - INFO - __main__ - Step 58093: {'lr': 0.00034276092755926275, 'samples': 11153856, 'steps': 58092, 'loss/train': 1.5093677043914795} -11/07/2021 05:22:54 - INFO - __main__ - Step 58094: {'lr': 0.0003427559996138287, 'samples': 11154048, 'steps': 58093, 'loss/train': 2.099083662033081} -11/07/2021 05:22:55 - INFO - __main__ - Step 58095: {'lr': 0.00034275107162660024, 'samples': 11154240, 'steps': 58094, 'loss/train': 1.3972128629684448} -11/07/2021 05:22:55 - INFO - __main__ - Step 58096: {'lr': 0.0003427461435975796, 'samples': 11154432, 'steps': 58095, 'loss/train': 1.568275809288025} -11/07/2021 05:22:56 - INFO - __main__ - Step 58097: {'lr': 0.0003427412155267688, 'samples': 11154624, 'steps': 58096, 'loss/train': 1.3446893692016602} -11/07/2021 05:22:56 - INFO - __main__ - Step 58098: {'lr': 0.00034273628741417043, 'samples': 11154816, 'steps': 58097, 'loss/train': 1.7160266637802124} -11/07/2021 05:22:56 - INFO - __main__ - Step 58099: {'lr': 0.0003427313592597865, 'samples': 11155008, 'steps': 58098, 'loss/train': 1.2969858646392822} -11/07/2021 05:22:57 - INFO - __main__ - Step 58100: {'lr': 0.00034272643106361916, 'samples': 11155200, 'steps': 58099, 'loss/train': 1.284481406211853} -11/07/2021 05:22:58 - INFO - __main__ - Step 58101: {'lr': 0.00034272150282567084, 'samples': 11155392, 'steps': 58100, 'loss/train': 1.4279965162277222} -11/07/2021 05:22:58 - INFO - __main__ - Step 58102: {'lr': 0.00034271657454594355, 'samples': 11155584, 'steps': 58101, 'loss/train': 1.6952944993972778} -11/07/2021 05:22:58 - INFO - __main__ - Step 58103: {'lr': 0.0003427116462244396, 'samples': 11155776, 'steps': 58102, 'loss/train': 1.5189787149429321} -11/07/2021 05:22:59 - INFO - __main__ - Step 58104: {'lr': 0.00034270671786116127, 'samples': 11155968, 'steps': 58103, 'loss/train': 1.3295122385025024} -11/07/2021 05:22:59 - INFO - __main__ - Step 58105: {'lr': 0.00034270178945611067, 'samples': 11156160, 'steps': 58104, 'loss/train': 1.4877725839614868} -11/07/2021 05:23:00 - INFO - __main__ - Step 58106: {'lr': 0.00034269686100929015, 'samples': 11156352, 'steps': 58105, 'loss/train': 1.7005438804626465} -11/07/2021 05:23:00 - INFO - __main__ - Step 58107: {'lr': 0.0003426919325207018, 'samples': 11156544, 'steps': 58106, 'loss/train': 1.6490744352340698} -11/07/2021 05:23:01 - INFO - __main__ - Step 58108: {'lr': 0.0003426870039903479, 'samples': 11156736, 'steps': 58107, 'loss/train': 1.5698260068893433} -11/07/2021 05:23:01 - INFO - __main__ - Step 58109: {'lr': 0.00034268207541823066, 'samples': 11156928, 'steps': 58108, 'loss/train': 1.6872550249099731} -11/07/2021 05:23:01 - INFO - __main__ - Step 58110: {'lr': 0.0003426771468043523, 'samples': 11157120, 'steps': 58109, 'loss/train': 2.1855580806732178} -11/07/2021 05:23:03 - INFO - __main__ - Step 58111: {'lr': 0.00034267221814871505, 'samples': 11157312, 'steps': 58110, 'loss/train': 1.670572280883789} -11/07/2021 05:23:03 - INFO - __main__ - Step 58112: {'lr': 0.0003426672894513212, 'samples': 11157504, 'steps': 58111, 'loss/train': 1.4893500804901123} -11/07/2021 05:23:03 - INFO - __main__ - Step 58113: {'lr': 0.00034266236071217284, 'samples': 11157696, 'steps': 58112, 'loss/train': 1.5400220155715942} -11/07/2021 05:23:04 - INFO - __main__ - Step 58114: {'lr': 0.00034265743193127217, 'samples': 11157888, 'steps': 58113, 'loss/train': 1.7129415273666382} -11/07/2021 05:23:04 - INFO - __main__ - Step 58115: {'lr': 0.00034265250310862164, 'samples': 11158080, 'steps': 58114, 'loss/train': 1.34105384349823} -11/07/2021 05:23:05 - INFO - __main__ - Step 58116: {'lr': 0.0003426475742442232, 'samples': 11158272, 'steps': 58115, 'loss/train': 1.7803500890731812} -11/07/2021 05:23:05 - INFO - __main__ - Step 58117: {'lr': 0.0003426426453380793, 'samples': 11158464, 'steps': 58116, 'loss/train': 1.460178256034851} -11/07/2021 05:23:06 - INFO - __main__ - Step 58118: {'lr': 0.000342637716390192, 'samples': 11158656, 'steps': 58117, 'loss/train': 1.3733336925506592} -11/07/2021 05:23:06 - INFO - __main__ - Step 58119: {'lr': 0.0003426327874005636, 'samples': 11158848, 'steps': 58118, 'loss/train': 1.0330922603607178} -11/07/2021 05:23:06 - INFO - __main__ - Step 58120: {'lr': 0.00034262785836919617, 'samples': 11159040, 'steps': 58119, 'loss/train': 1.5005682706832886} -11/07/2021 05:23:07 - INFO - __main__ - Step 58121: {'lr': 0.00034262292929609217, 'samples': 11159232, 'steps': 58120, 'loss/train': 0.6388111710548401} -11/07/2021 05:23:08 - INFO - __main__ - Step 58122: {'lr': 0.0003426180001812537, 'samples': 11159424, 'steps': 58121, 'loss/train': 0.8463659286499023} -11/07/2021 05:23:08 - INFO - __main__ - Step 58123: {'lr': 0.000342613071024683, 'samples': 11159616, 'steps': 58122, 'loss/train': 0.7747419476509094} -11/07/2021 05:23:08 - INFO - __main__ - Step 58124: {'lr': 0.0003426081418263823, 'samples': 11159808, 'steps': 58123, 'loss/train': 1.5754873752593994} -11/07/2021 05:23:09 - INFO - __main__ - Step 58125: {'lr': 0.00034260321258635377, 'samples': 11160000, 'steps': 58124, 'loss/train': 0.8849248886108398} -11/07/2021 05:23:09 - INFO - __main__ - Step 58126: {'lr': 0.0003425982833045996, 'samples': 11160192, 'steps': 58125, 'loss/train': 1.6146043539047241} -11/07/2021 05:23:10 - INFO - __main__ - Step 58127: {'lr': 0.0003425933539811221, 'samples': 11160384, 'steps': 58126, 'loss/train': 1.31283438205719} -11/07/2021 05:23:11 - INFO - __main__ - Step 58128: {'lr': 0.0003425884246159235, 'samples': 11160576, 'steps': 58127, 'loss/train': 1.4597915410995483} -11/07/2021 05:23:11 - INFO - __main__ - Step 58129: {'lr': 0.00034258349520900595, 'samples': 11160768, 'steps': 58128, 'loss/train': 1.814573049545288} -11/07/2021 05:23:11 - INFO - __main__ - Step 58130: {'lr': 0.0003425785657603718, 'samples': 11160960, 'steps': 58129, 'loss/train': 1.185489535331726} -11/07/2021 05:23:12 - INFO - __main__ - Step 58131: {'lr': 0.0003425736362700231, 'samples': 11161152, 'steps': 58130, 'loss/train': 1.199737310409546} -11/07/2021 05:23:13 - INFO - __main__ - Step 58132: {'lr': 0.00034256870673796217, 'samples': 11161344, 'steps': 58131, 'loss/train': 1.3147960901260376} -11/07/2021 05:23:13 - INFO - __main__ - Step 58133: {'lr': 0.0003425637771641911, 'samples': 11161536, 'steps': 58132, 'loss/train': 1.3148967027664185} -11/07/2021 05:23:13 - INFO - __main__ - Step 58134: {'lr': 0.00034255884754871233, 'samples': 11161728, 'steps': 58133, 'loss/train': 1.83072030544281} -11/07/2021 05:23:14 - INFO - __main__ - Step 58135: {'lr': 0.000342553917891528, 'samples': 11161920, 'steps': 58134, 'loss/train': 1.1407413482666016} -11/07/2021 05:23:14 - INFO - __main__ - Step 58136: {'lr': 0.0003425489881926402, 'samples': 11162112, 'steps': 58135, 'loss/train': 2.0290093421936035} -11/07/2021 05:23:15 - INFO - __main__ - Step 58137: {'lr': 0.0003425440584520514, 'samples': 11162304, 'steps': 58136, 'loss/train': 1.5655841827392578} -11/07/2021 05:23:15 - INFO - __main__ - Step 58138: {'lr': 0.00034253912866976353, 'samples': 11162496, 'steps': 58137, 'loss/train': 1.5796418190002441} -11/07/2021 05:23:16 - INFO - __main__ - Step 58139: {'lr': 0.000342534198845779, 'samples': 11162688, 'steps': 58138, 'loss/train': 1.5528148412704468} -11/07/2021 05:23:16 - INFO - __main__ - Step 58140: {'lr': 0.0003425292689801, 'samples': 11162880, 'steps': 58139, 'loss/train': 1.3445820808410645} -11/07/2021 05:23:16 - INFO - __main__ - Step 58141: {'lr': 0.00034252433907272875, 'samples': 11163072, 'steps': 58140, 'loss/train': 1.4922312498092651} -11/07/2021 05:23:18 - INFO - __main__ - Step 58142: {'lr': 0.0003425194091236674, 'samples': 11163264, 'steps': 58141, 'loss/train': 1.2161821126937866} -11/07/2021 05:23:18 - INFO - __main__ - Step 58143: {'lr': 0.0003425144791329183, 'samples': 11163456, 'steps': 58142, 'loss/train': 1.1257246732711792} -11/07/2021 05:23:18 - INFO - __main__ - Step 58144: {'lr': 0.00034250954910048357, 'samples': 11163648, 'steps': 58143, 'loss/train': 1.5302990674972534} -11/07/2021 05:23:19 - INFO - __main__ - Step 58145: {'lr': 0.0003425046190263655, 'samples': 11163840, 'steps': 58144, 'loss/train': 1.6194462776184082} -11/07/2021 05:23:19 - INFO - __main__ - Step 58146: {'lr': 0.00034249968891056625, 'samples': 11164032, 'steps': 58145, 'loss/train': 1.2853859663009644} -11/07/2021 05:23:20 - INFO - __main__ - Step 58147: {'lr': 0.00034249475875308813, 'samples': 11164224, 'steps': 58146, 'loss/train': 1.7340830564498901} -11/07/2021 05:23:20 - INFO - __main__ - Step 58148: {'lr': 0.00034248982855393317, 'samples': 11164416, 'steps': 58147, 'loss/train': 1.2193033695220947} -11/07/2021 05:23:21 - INFO - __main__ - Step 58149: {'lr': 0.0003424848983131038, 'samples': 11164608, 'steps': 58148, 'loss/train': 1.3887706995010376} -11/07/2021 05:23:21 - INFO - __main__ - Step 58150: {'lr': 0.0003424799680306022, 'samples': 11164800, 'steps': 58149, 'loss/train': 0.44565680623054504} -11/07/2021 05:23:21 - INFO - __main__ - Step 58151: {'lr': 0.0003424750377064305, 'samples': 11164992, 'steps': 58150, 'loss/train': 1.300445556640625} -11/07/2021 05:23:22 - INFO - __main__ - Step 58152: {'lr': 0.000342470107340591, 'samples': 11165184, 'steps': 58151, 'loss/train': 1.3930526971817017} -11/07/2021 05:23:23 - INFO - __main__ - Step 58153: {'lr': 0.0003424651769330859, 'samples': 11165376, 'steps': 58152, 'loss/train': 1.7067426443099976} -11/07/2021 05:23:23 - INFO - __main__ - Step 58154: {'lr': 0.0003424602464839173, 'samples': 11165568, 'steps': 58153, 'loss/train': 0.9218025207519531} -11/07/2021 05:23:24 - INFO - __main__ - Step 58155: {'lr': 0.0003424553159930877, 'samples': 11165760, 'steps': 58154, 'loss/train': 1.6319758892059326} -11/07/2021 05:23:24 - INFO - __main__ - Step 58156: {'lr': 0.00034245038546059904, 'samples': 11165952, 'steps': 58155, 'loss/train': 1.5520331859588623} -11/07/2021 05:23:24 - INFO - __main__ - Step 58157: {'lr': 0.0003424454548864538, 'samples': 11166144, 'steps': 58156, 'loss/train': 1.245050072669983} -11/07/2021 05:23:25 - INFO - __main__ - Step 58158: {'lr': 0.00034244052427065397, 'samples': 11166336, 'steps': 58157, 'loss/train': 1.8263821601867676} -11/07/2021 05:23:26 - INFO - __main__ - Step 58159: {'lr': 0.00034243559361320187, 'samples': 11166528, 'steps': 58158, 'loss/train': 3.1753933429718018} -11/07/2021 05:23:26 - INFO - __main__ - Step 58160: {'lr': 0.00034243066291409977, 'samples': 11166720, 'steps': 58159, 'loss/train': 1.89552903175354} -11/07/2021 05:23:26 - INFO - __main__ - Step 58161: {'lr': 0.0003424257321733497, 'samples': 11166912, 'steps': 58160, 'loss/train': 1.6489208936691284} -11/07/2021 05:23:27 - INFO - __main__ - Step 58162: {'lr': 0.00034242080139095416, 'samples': 11167104, 'steps': 58161, 'loss/train': 1.6356033086776733} -11/07/2021 05:23:28 - INFO - __main__ - Step 58163: {'lr': 0.0003424158705669152, 'samples': 11167296, 'steps': 58162, 'loss/train': 1.5166915655136108} -11/07/2021 05:23:28 - INFO - __main__ - Step 58164: {'lr': 0.0003424109397012351, 'samples': 11167488, 'steps': 58163, 'loss/train': 1.524658441543579} -11/07/2021 05:23:28 - INFO - __main__ - Step 58165: {'lr': 0.000342406008793916, 'samples': 11167680, 'steps': 58164, 'loss/train': 1.2651325464248657} -11/07/2021 05:23:29 - INFO - __main__ - Step 58166: {'lr': 0.00034240107784496023, 'samples': 11167872, 'steps': 58165, 'loss/train': 1.3366292715072632} -11/07/2021 05:23:29 - INFO - __main__ - Step 58167: {'lr': 0.00034239614685436994, 'samples': 11168064, 'steps': 58166, 'loss/train': 1.7601878643035889} -11/07/2021 05:23:30 - INFO - __main__ - Step 58168: {'lr': 0.0003423912158221473, 'samples': 11168256, 'steps': 58167, 'loss/train': 1.148177981376648} -11/07/2021 05:23:31 - INFO - __main__ - Step 58169: {'lr': 0.0003423862847482947, 'samples': 11168448, 'steps': 58168, 'loss/train': 0.06079781800508499} -11/07/2021 05:23:31 - INFO - __main__ - Step 58170: {'lr': 0.0003423813536328143, 'samples': 11168640, 'steps': 58169, 'loss/train': 1.6206070184707642} -11/07/2021 05:23:31 - INFO - __main__ - Step 58171: {'lr': 0.00034237642247570815, 'samples': 11168832, 'steps': 58170, 'loss/train': 1.9088107347488403} -11/07/2021 05:23:32 - INFO - __main__ - Step 58172: {'lr': 0.0003423714912769787, 'samples': 11169024, 'steps': 58171, 'loss/train': 1.0276298522949219} -11/07/2021 05:23:32 - INFO - __main__ - Step 58173: {'lr': 0.000342366560036628, 'samples': 11169216, 'steps': 58172, 'loss/train': 1.4985283613204956} -11/07/2021 05:23:33 - INFO - __main__ - Step 58174: {'lr': 0.0003423616287546585, 'samples': 11169408, 'steps': 58173, 'loss/train': 1.5972003936767578} -11/07/2021 05:23:33 - INFO - __main__ - Step 58175: {'lr': 0.00034235669743107214, 'samples': 11169600, 'steps': 58174, 'loss/train': 1.5434128046035767} -11/07/2021 05:23:34 - INFO - __main__ - Step 58176: {'lr': 0.0003423517660658713, 'samples': 11169792, 'steps': 58175, 'loss/train': 0.8475615978240967} -11/07/2021 05:23:34 - INFO - __main__ - Step 58177: {'lr': 0.0003423468346590583, 'samples': 11169984, 'steps': 58176, 'loss/train': 1.3889529705047607} -11/07/2021 05:23:34 - INFO - __main__ - Step 58178: {'lr': 0.00034234190321063516, 'samples': 11170176, 'steps': 58177, 'loss/train': 1.2486295700073242} -11/07/2021 05:23:36 - INFO - __main__ - Step 58179: {'lr': 0.00034233697172060415, 'samples': 11170368, 'steps': 58178, 'loss/train': 1.5169450044631958} -11/07/2021 05:23:36 - INFO - __main__ - Step 58180: {'lr': 0.00034233204018896754, 'samples': 11170560, 'steps': 58179, 'loss/train': 1.3016443252563477} -11/07/2021 05:23:37 - INFO - __main__ - Step 58181: {'lr': 0.00034232710861572754, 'samples': 11170752, 'steps': 58180, 'loss/train': 0.5447980761528015} -11/07/2021 05:23:37 - INFO - __main__ - Step 58182: {'lr': 0.0003423221770008864, 'samples': 11170944, 'steps': 58181, 'loss/train': 1.4304301738739014} -11/07/2021 05:23:37 - INFO - __main__ - Step 58183: {'lr': 0.0003423172453444462, 'samples': 11171136, 'steps': 58182, 'loss/train': 1.4617197513580322} -11/07/2021 05:23:38 - INFO - __main__ - Step 58184: {'lr': 0.00034231231364640946, 'samples': 11171328, 'steps': 58183, 'loss/train': 1.0902422666549683} -11/07/2021 05:23:39 - INFO - __main__ - Step 58185: {'lr': 0.0003423073819067781, 'samples': 11171520, 'steps': 58184, 'loss/train': 1.501054048538208} -11/07/2021 05:23:39 - INFO - __main__ - Step 58186: {'lr': 0.00034230245012555445, 'samples': 11171712, 'steps': 58185, 'loss/train': 0.9810585379600525} -11/07/2021 05:23:39 - INFO - __main__ - Step 58187: {'lr': 0.00034229751830274077, 'samples': 11171904, 'steps': 58186, 'loss/train': 1.3098068237304688} -11/07/2021 05:23:40 - INFO - __main__ - Step 58188: {'lr': 0.0003422925864383392, 'samples': 11172096, 'steps': 58187, 'loss/train': 1.1051206588745117} -11/07/2021 05:23:41 - INFO - __main__ - Step 58189: {'lr': 0.00034228765453235213, 'samples': 11172288, 'steps': 58188, 'loss/train': 1.5620949268341064} -11/07/2021 05:23:41 - INFO - __main__ - Step 58190: {'lr': 0.0003422827225847816, 'samples': 11172480, 'steps': 58189, 'loss/train': 1.223131537437439} -11/07/2021 05:23:41 - INFO - __main__ - Step 58191: {'lr': 0.0003422777905956299, 'samples': 11172672, 'steps': 58190, 'loss/train': 1.2403318881988525} -11/07/2021 05:23:42 - INFO - __main__ - Step 58192: {'lr': 0.0003422728585648992, 'samples': 11172864, 'steps': 58191, 'loss/train': 1.8370261192321777} -11/07/2021 05:23:42 - INFO - __main__ - Step 58193: {'lr': 0.00034226792649259184, 'samples': 11173056, 'steps': 58192, 'loss/train': 1.4494093656539917} -11/07/2021 05:23:43 - INFO - __main__ - Step 58194: {'lr': 0.00034226299437870993, 'samples': 11173248, 'steps': 58193, 'loss/train': 1.1527293920516968} -11/07/2021 05:23:44 - INFO - __main__ - Step 58195: {'lr': 0.0003422580622232558, 'samples': 11173440, 'steps': 58194, 'loss/train': 1.4890687465667725} -11/07/2021 05:23:44 - INFO - __main__ - Step 58196: {'lr': 0.0003422531300262316, 'samples': 11173632, 'steps': 58195, 'loss/train': 1.525909662246704} -11/07/2021 05:23:44 - INFO - __main__ - Step 58197: {'lr': 0.00034224819778763953, 'samples': 11173824, 'steps': 58196, 'loss/train': 1.4138767719268799} -11/07/2021 05:23:45 - INFO - __main__ - Step 58198: {'lr': 0.0003422432655074819, 'samples': 11174016, 'steps': 58197, 'loss/train': 1.4295481443405151} -11/07/2021 05:23:45 - INFO - __main__ - Step 58199: {'lr': 0.0003422383331857608, 'samples': 11174208, 'steps': 58198, 'loss/train': 1.5134727954864502} -11/07/2021 05:23:46 - INFO - __main__ - Step 58200: {'lr': 0.00034223340082247856, 'samples': 11174400, 'steps': 58199, 'loss/train': 2.110922336578369} -11/07/2021 05:23:46 - INFO - __main__ - Step 58201: {'lr': 0.0003422284684176374, 'samples': 11174592, 'steps': 58200, 'loss/train': 1.659425973892212} -11/07/2021 05:23:47 - INFO - __main__ - Step 58202: {'lr': 0.00034222353597123946, 'samples': 11174784, 'steps': 58201, 'loss/train': 1.4581602811813354} -11/07/2021 05:23:47 - INFO - __main__ - Step 58203: {'lr': 0.00034221860348328703, 'samples': 11174976, 'steps': 58202, 'loss/train': 1.4331773519515991} -11/07/2021 05:23:47 - INFO - __main__ - Step 58204: {'lr': 0.0003422136709537824, 'samples': 11175168, 'steps': 58203, 'loss/train': 1.7570655345916748} -11/07/2021 05:23:48 - INFO - __main__ - Step 58205: {'lr': 0.00034220873838272767, 'samples': 11175360, 'steps': 58204, 'loss/train': 1.2941737174987793} -11/07/2021 05:23:49 - INFO - __main__ - Step 58206: {'lr': 0.00034220380577012506, 'samples': 11175552, 'steps': 58205, 'loss/train': 1.502335548400879} -11/07/2021 05:23:49 - INFO - __main__ - Step 58207: {'lr': 0.00034219887311597686, 'samples': 11175744, 'steps': 58206, 'loss/train': 1.3283244371414185} -11/07/2021 05:23:49 - INFO - __main__ - Step 58208: {'lr': 0.0003421939404202853, 'samples': 11175936, 'steps': 58207, 'loss/train': 1.7608331441879272} -11/07/2021 05:23:50 - INFO - __main__ - Step 58209: {'lr': 0.0003421890076830525, 'samples': 11176128, 'steps': 58208, 'loss/train': 1.7661632299423218} -11/07/2021 05:23:51 - INFO - __main__ - Step 58210: {'lr': 0.00034218407490428085, 'samples': 11176320, 'steps': 58209, 'loss/train': 1.0454431772232056} -11/07/2021 05:23:51 - INFO - __main__ - Step 58211: {'lr': 0.0003421791420839724, 'samples': 11176512, 'steps': 58210, 'loss/train': 1.4422022104263306} -11/07/2021 05:23:52 - INFO - __main__ - Step 58212: {'lr': 0.00034217420922212947, 'samples': 11176704, 'steps': 58211, 'loss/train': 1.4320636987686157} -11/07/2021 05:23:52 - INFO - __main__ - Step 58213: {'lr': 0.0003421692763187543, 'samples': 11176896, 'steps': 58212, 'loss/train': 1.5016170740127563} -11/07/2021 05:23:52 - INFO - __main__ - Step 58214: {'lr': 0.00034216434337384905, 'samples': 11177088, 'steps': 58213, 'loss/train': 1.1252275705337524} -11/07/2021 05:23:53 - INFO - __main__ - Step 58215: {'lr': 0.000342159410387416, 'samples': 11177280, 'steps': 58214, 'loss/train': 1.9015330076217651} -11/07/2021 05:23:54 - INFO - __main__ - Step 58216: {'lr': 0.0003421544773594573, 'samples': 11177472, 'steps': 58215, 'loss/train': 1.9007363319396973} -11/07/2021 05:23:54 - INFO - __main__ - Step 58217: {'lr': 0.0003421495442899753, 'samples': 11177664, 'steps': 58216, 'loss/train': 1.3868484497070312} -11/07/2021 05:23:54 - INFO - __main__ - Step 58218: {'lr': 0.0003421446111789721, 'samples': 11177856, 'steps': 58217, 'loss/train': 2.0489532947540283} -11/07/2021 05:23:55 - INFO - __main__ - Step 58219: {'lr': 0.00034213967802644986, 'samples': 11178048, 'steps': 58218, 'loss/train': 1.278505802154541} -11/07/2021 05:23:56 - INFO - __main__ - Step 58220: {'lr': 0.000342134744832411, 'samples': 11178240, 'steps': 58219, 'loss/train': 1.5730618238449097} -11/07/2021 05:23:56 - INFO - __main__ - Step 58221: {'lr': 0.0003421298115968576, 'samples': 11178432, 'steps': 58220, 'loss/train': 2.0743625164031982} -11/07/2021 05:23:57 - INFO - __main__ - Step 58222: {'lr': 0.0003421248783197919, 'samples': 11178624, 'steps': 58221, 'loss/train': 1.1445319652557373} -11/07/2021 05:23:57 - INFO - __main__ - Step 58223: {'lr': 0.0003421199450012162, 'samples': 11178816, 'steps': 58222, 'loss/train': 1.6939197778701782} -11/07/2021 05:23:57 - INFO - __main__ - Step 58224: {'lr': 0.00034211501164113276, 'samples': 11179008, 'steps': 58223, 'loss/train': 1.6914745569229126} -11/07/2021 05:23:58 - INFO - __main__ - Step 58225: {'lr': 0.0003421100782395436, 'samples': 11179200, 'steps': 58224, 'loss/train': 1.6748243570327759} -11/07/2021 05:23:59 - INFO - __main__ - Step 58226: {'lr': 0.000342105144796451, 'samples': 11179392, 'steps': 58225, 'loss/train': 1.6589128971099854} -11/07/2021 05:23:59 - INFO - __main__ - Step 58227: {'lr': 0.0003421002113118574, 'samples': 11179584, 'steps': 58226, 'loss/train': 1.6836780309677124} -11/07/2021 05:23:59 - INFO - __main__ - Step 58228: {'lr': 0.00034209527778576477, 'samples': 11179776, 'steps': 58227, 'loss/train': 1.0992323160171509} -11/07/2021 05:24:00 - INFO - __main__ - Step 58229: {'lr': 0.0003420903442181755, 'samples': 11179968, 'steps': 58228, 'loss/train': 1.1824052333831787} -11/07/2021 05:24:00 - INFO - __main__ - Step 58230: {'lr': 0.0003420854106090917, 'samples': 11180160, 'steps': 58229, 'loss/train': 1.4953030347824097} -11/07/2021 05:24:01 - INFO - __main__ - Step 58231: {'lr': 0.00034208047695851563, 'samples': 11180352, 'steps': 58230, 'loss/train': 1.0680210590362549} -11/07/2021 05:24:01 - INFO - __main__ - Step 58232: {'lr': 0.0003420755432664495, 'samples': 11180544, 'steps': 58231, 'loss/train': 1.3415437936782837} -11/07/2021 05:24:02 - INFO - __main__ - Step 58233: {'lr': 0.0003420706095328956, 'samples': 11180736, 'steps': 58232, 'loss/train': 1.3045610189437866} -11/07/2021 05:24:02 - INFO - __main__ - Step 58234: {'lr': 0.0003420656757578561, 'samples': 11180928, 'steps': 58233, 'loss/train': 1.4776599407196045} -11/07/2021 05:24:02 - INFO - __main__ - Step 58235: {'lr': 0.00034206074194133323, 'samples': 11181120, 'steps': 58234, 'loss/train': 1.7522863149642944} -11/07/2021 05:24:04 - INFO - __main__ - Step 58236: {'lr': 0.00034205580808332916, 'samples': 11181312, 'steps': 58235, 'loss/train': 1.7411361932754517} -11/07/2021 05:24:04 - INFO - __main__ - Step 58237: {'lr': 0.0003420508741838462, 'samples': 11181504, 'steps': 58236, 'loss/train': 1.7615766525268555} -11/07/2021 05:24:04 - INFO - __main__ - Step 58238: {'lr': 0.0003420459402428865, 'samples': 11181696, 'steps': 58237, 'loss/train': 1.363251805305481} -11/07/2021 05:24:05 - INFO - __main__ - Step 58239: {'lr': 0.00034204100626045235, 'samples': 11181888, 'steps': 58238, 'loss/train': 1.4591209888458252} -11/07/2021 05:24:05 - INFO - __main__ - Step 58240: {'lr': 0.00034203607223654594, 'samples': 11182080, 'steps': 58239, 'loss/train': 1.4060337543487549} -11/07/2021 05:24:06 - INFO - __main__ - Step 58241: {'lr': 0.00034203113817116957, 'samples': 11182272, 'steps': 58240, 'loss/train': 0.6312339901924133} -11/07/2021 05:24:06 - INFO - __main__ - Step 58242: {'lr': 0.0003420262040643253, 'samples': 11182464, 'steps': 58241, 'loss/train': 1.2740561962127686} -11/07/2021 05:24:07 - INFO - __main__ - Step 58243: {'lr': 0.0003420212699160154, 'samples': 11182656, 'steps': 58242, 'loss/train': 1.509224534034729} -11/07/2021 05:24:07 - INFO - __main__ - Step 58244: {'lr': 0.00034201633572624216, 'samples': 11182848, 'steps': 58243, 'loss/train': 1.5922558307647705} -11/07/2021 05:24:07 - INFO - __main__ - Step 58245: {'lr': 0.00034201140149500784, 'samples': 11183040, 'steps': 58244, 'loss/train': 1.5326972007751465} -11/07/2021 05:24:08 - INFO - __main__ - Step 58246: {'lr': 0.0003420064672223146, 'samples': 11183232, 'steps': 58245, 'loss/train': 1.5039807558059692} -11/07/2021 05:24:09 - INFO - __main__ - Step 58247: {'lr': 0.0003420015329081647, 'samples': 11183424, 'steps': 58246, 'loss/train': 1.651671051979065} -11/07/2021 05:24:09 - INFO - __main__ - Step 58248: {'lr': 0.00034199659855256023, 'samples': 11183616, 'steps': 58247, 'loss/train': 1.4716250896453857} -11/07/2021 05:24:09 - INFO - __main__ - Step 58249: {'lr': 0.00034199166415550353, 'samples': 11183808, 'steps': 58248, 'loss/train': 1.0323662757873535} -11/07/2021 05:24:10 - INFO - __main__ - Step 58250: {'lr': 0.0003419867297169968, 'samples': 11184000, 'steps': 58249, 'loss/train': 1.5270559787750244} -11/07/2021 05:24:10 - INFO - __main__ - Step 58251: {'lr': 0.00034198179523704233, 'samples': 11184192, 'steps': 58250, 'loss/train': 1.4787980318069458} -11/07/2021 05:24:11 - INFO - __main__ - Step 58252: {'lr': 0.0003419768607156423, 'samples': 11184384, 'steps': 58251, 'loss/train': 1.374104380607605} -11/07/2021 05:24:12 - INFO - __main__ - Step 58253: {'lr': 0.0003419719261527988, 'samples': 11184576, 'steps': 58252, 'loss/train': 1.5750901699066162} -11/07/2021 05:24:12 - INFO - __main__ - Step 58254: {'lr': 0.0003419669915485142, 'samples': 11184768, 'steps': 58253, 'loss/train': 1.468117117881775} -11/07/2021 05:24:12 - INFO - __main__ - Step 58255: {'lr': 0.00034196205690279076, 'samples': 11184960, 'steps': 58254, 'loss/train': 1.0962551832199097} -11/07/2021 05:24:13 - INFO - __main__ - Step 58256: {'lr': 0.00034195712221563057, 'samples': 11185152, 'steps': 58255, 'loss/train': 1.4864016771316528} -11/07/2021 05:24:14 - INFO - __main__ - Step 58257: {'lr': 0.00034195218748703596, 'samples': 11185344, 'steps': 58256, 'loss/train': 1.6173681020736694} -11/07/2021 05:24:14 - INFO - __main__ - Step 58258: {'lr': 0.00034194725271700915, 'samples': 11185536, 'steps': 58257, 'loss/train': 1.283270001411438} -11/07/2021 05:24:14 - INFO - __main__ - Step 58259: {'lr': 0.0003419423179055523, 'samples': 11185728, 'steps': 58258, 'loss/train': 0.7892928719520569} -11/07/2021 05:24:15 - INFO - __main__ - Step 58260: {'lr': 0.0003419373830526676, 'samples': 11185920, 'steps': 58259, 'loss/train': 1.3765954971313477} -11/07/2021 05:24:15 - INFO - __main__ - Step 58261: {'lr': 0.0003419324481583574, 'samples': 11186112, 'steps': 58260, 'loss/train': 1.7961735725402832} -11/07/2021 05:24:16 - INFO - __main__ - Step 58262: {'lr': 0.00034192751322262375, 'samples': 11186304, 'steps': 58261, 'loss/train': 1.456167221069336} -11/07/2021 05:24:16 - INFO - __main__ - Step 58263: {'lr': 0.0003419225782454691, 'samples': 11186496, 'steps': 58262, 'loss/train': 1.5626648664474487} -11/07/2021 05:24:17 - INFO - __main__ - Step 58264: {'lr': 0.00034191764322689553, 'samples': 11186688, 'steps': 58263, 'loss/train': 1.3266459703445435} -11/07/2021 05:24:17 - INFO - __main__ - Step 58265: {'lr': 0.00034191270816690526, 'samples': 11186880, 'steps': 58264, 'loss/train': 1.2717241048812866} -11/07/2021 05:24:17 - INFO - __main__ - Step 58266: {'lr': 0.0003419077730655006, 'samples': 11187072, 'steps': 58265, 'loss/train': 1.8614730834960938} -11/07/2021 05:24:18 - INFO - __main__ - Step 58267: {'lr': 0.00034190283792268365, 'samples': 11187264, 'steps': 58266, 'loss/train': 1.3185659646987915} -11/07/2021 05:24:19 - INFO - __main__ - Step 58268: {'lr': 0.0003418979027384567, 'samples': 11187456, 'steps': 58267, 'loss/train': 1.5168559551239014} -11/07/2021 05:24:19 - INFO - __main__ - Step 58269: {'lr': 0.00034189296751282203, 'samples': 11187648, 'steps': 58268, 'loss/train': 1.7645275592803955} -11/07/2021 05:24:20 - INFO - __main__ - Step 58270: {'lr': 0.0003418880322457817, 'samples': 11187840, 'steps': 58269, 'loss/train': 1.0933140516281128} -11/07/2021 05:24:20 - INFO - __main__ - Step 58271: {'lr': 0.0003418830969373382, 'samples': 11188032, 'steps': 58270, 'loss/train': 1.7920719385147095} -11/07/2021 05:24:20 - INFO - __main__ - Step 58272: {'lr': 0.00034187816158749354, 'samples': 11188224, 'steps': 58271, 'loss/train': 0.6926540732383728} -11/07/2021 05:24:21 - INFO - __main__ - Step 58273: {'lr': 0.00034187322619624996, 'samples': 11188416, 'steps': 58272, 'loss/train': 1.59482741355896} -11/07/2021 05:24:22 - INFO - __main__ - Step 58274: {'lr': 0.0003418682907636097, 'samples': 11188608, 'steps': 58273, 'loss/train': 1.5063611268997192} -11/07/2021 05:24:22 - INFO - __main__ - Step 58275: {'lr': 0.000341863355289575, 'samples': 11188800, 'steps': 58274, 'loss/train': 1.543867826461792} -11/07/2021 05:24:22 - INFO - __main__ - Step 58276: {'lr': 0.0003418584197741481, 'samples': 11188992, 'steps': 58275, 'loss/train': 1.5246760845184326} -11/07/2021 05:24:23 - INFO - __main__ - Step 58277: {'lr': 0.00034185348421733125, 'samples': 11189184, 'steps': 58276, 'loss/train': 1.4306000471115112} -11/07/2021 05:24:24 - INFO - __main__ - Step 58278: {'lr': 0.0003418485486191267, 'samples': 11189376, 'steps': 58277, 'loss/train': 1.5192270278930664} -11/07/2021 05:24:24 - INFO - __main__ - Step 58279: {'lr': 0.0003418436129795365, 'samples': 11189568, 'steps': 58278, 'loss/train': 1.6188006401062012} -11/07/2021 05:24:24 - INFO - __main__ - Step 58280: {'lr': 0.000341838677298563, 'samples': 11189760, 'steps': 58279, 'loss/train': 1.1027847528457642} -11/07/2021 05:24:25 - INFO - __main__ - Step 58281: {'lr': 0.00034183374157620847, 'samples': 11189952, 'steps': 58280, 'loss/train': 1.3313562870025635} -11/07/2021 05:24:25 - INFO - __main__ - Step 58282: {'lr': 0.000341828805812475, 'samples': 11190144, 'steps': 58281, 'loss/train': 1.4884618520736694} -11/07/2021 05:24:26 - INFO - __main__ - Step 58283: {'lr': 0.0003418238700073649, 'samples': 11190336, 'steps': 58282, 'loss/train': 1.4345486164093018} -11/07/2021 05:24:26 - INFO - __main__ - Step 58284: {'lr': 0.0003418189341608804, 'samples': 11190528, 'steps': 58283, 'loss/train': 1.6635472774505615} -11/07/2021 05:24:27 - INFO - __main__ - Step 58285: {'lr': 0.0003418139982730237, 'samples': 11190720, 'steps': 58284, 'loss/train': 1.0728845596313477} -11/07/2021 05:24:27 - INFO - __main__ - Step 58286: {'lr': 0.0003418090623437971, 'samples': 11190912, 'steps': 58285, 'loss/train': 1.3892258405685425} -11/07/2021 05:24:27 - INFO - __main__ - Step 58287: {'lr': 0.00034180412637320267, 'samples': 11191104, 'steps': 58286, 'loss/train': 0.9549578428268433} -11/07/2021 05:24:28 - INFO - __main__ - Step 58288: {'lr': 0.0003417991903612427, 'samples': 11191296, 'steps': 58287, 'loss/train': 1.3454868793487549} -11/07/2021 05:24:29 - INFO - __main__ - Step 58289: {'lr': 0.0003417942543079195, 'samples': 11191488, 'steps': 58288, 'loss/train': 1.5178730487823486} -11/07/2021 05:24:29 - INFO - __main__ - Step 58290: {'lr': 0.00034178931821323517, 'samples': 11191680, 'steps': 58289, 'loss/train': 1.457436203956604} -11/07/2021 05:24:30 - INFO - __main__ - Step 58291: {'lr': 0.0003417843820771921, 'samples': 11191872, 'steps': 58290, 'loss/train': 1.162864089012146} -11/07/2021 05:24:30 - INFO - __main__ - Step 58292: {'lr': 0.00034177944589979225, 'samples': 11192064, 'steps': 58291, 'loss/train': 1.137751817703247} -11/07/2021 05:24:30 - INFO - __main__ - Step 58293: {'lr': 0.0003417745096810381, 'samples': 11192256, 'steps': 58292, 'loss/train': 1.3616067171096802} -11/07/2021 05:24:31 - INFO - __main__ - Step 58294: {'lr': 0.00034176957342093174, 'samples': 11192448, 'steps': 58293, 'loss/train': 1.521599292755127} -11/07/2021 05:24:32 - INFO - __main__ - Step 58295: {'lr': 0.0003417646371194754, 'samples': 11192640, 'steps': 58294, 'loss/train': 1.423263430595398} -11/07/2021 05:24:32 - INFO - __main__ - Step 58296: {'lr': 0.00034175970077667136, 'samples': 11192832, 'steps': 58295, 'loss/train': 1.610305905342102} -11/07/2021 05:24:32 - INFO - __main__ - Step 58297: {'lr': 0.00034175476439252177, 'samples': 11193024, 'steps': 58296, 'loss/train': 1.8208974599838257} -11/07/2021 05:24:33 - INFO - __main__ - Step 58298: {'lr': 0.00034174982796702895, 'samples': 11193216, 'steps': 58297, 'loss/train': 1.125916600227356} -11/07/2021 05:24:34 - INFO - __main__ - Step 58299: {'lr': 0.00034174489150019506, 'samples': 11193408, 'steps': 58298, 'loss/train': 1.8532830476760864} -11/07/2021 05:24:34 - INFO - __main__ - Step 58300: {'lr': 0.0003417399549920224, 'samples': 11193600, 'steps': 58299, 'loss/train': 1.7013945579528809} -11/07/2021 05:24:35 - INFO - __main__ - Step 58301: {'lr': 0.00034173501844251305, 'samples': 11193792, 'steps': 58300, 'loss/train': 1.583761215209961} -11/07/2021 05:24:35 - INFO - __main__ - Step 58302: {'lr': 0.0003417300818516693, 'samples': 11193984, 'steps': 58301, 'loss/train': 1.596790075302124} -11/07/2021 05:24:35 - INFO - __main__ - Step 58303: {'lr': 0.00034172514521949336, 'samples': 11194176, 'steps': 58302, 'loss/train': 1.9282759428024292} -11/07/2021 05:24:36 - INFO - __main__ - Step 58304: {'lr': 0.0003417202085459876, 'samples': 11194368, 'steps': 58303, 'loss/train': 2.0007357597351074} -11/07/2021 05:24:36 - INFO - __main__ - Step 58305: {'lr': 0.00034171527183115413, 'samples': 11194560, 'steps': 58304, 'loss/train': 1.590613842010498} -11/07/2021 05:24:37 - INFO - __main__ - Step 58306: {'lr': 0.0003417103350749951, 'samples': 11194752, 'steps': 58305, 'loss/train': 0.5088095664978027} -11/07/2021 05:24:37 - INFO - __main__ - Step 58307: {'lr': 0.00034170539827751284, 'samples': 11194944, 'steps': 58306, 'loss/train': 1.890604019165039} -11/07/2021 05:24:38 - INFO - __main__ - Step 58308: {'lr': 0.0003417004614387095, 'samples': 11195136, 'steps': 58307, 'loss/train': 1.2942551374435425} -11/07/2021 05:24:38 - INFO - __main__ - Step 58309: {'lr': 0.0003416955245585874, 'samples': 11195328, 'steps': 58308, 'loss/train': 0.6271637678146362} -11/07/2021 05:24:39 - INFO - __main__ - Step 58310: {'lr': 0.00034169058763714865, 'samples': 11195520, 'steps': 58309, 'loss/train': 2.029214859008789} -11/07/2021 05:24:39 - INFO - __main__ - Step 58311: {'lr': 0.0003416856506743956, 'samples': 11195712, 'steps': 58310, 'loss/train': 1.5270578861236572} -11/07/2021 05:24:40 - INFO - __main__ - Step 58312: {'lr': 0.00034168071367033043, 'samples': 11195904, 'steps': 58311, 'loss/train': 1.3987207412719727} -11/07/2021 05:24:40 - INFO - __main__ - Step 58313: {'lr': 0.0003416757766249553, 'samples': 11196096, 'steps': 58312, 'loss/train': 1.6209709644317627} -11/07/2021 05:24:40 - INFO - __main__ - Step 58314: {'lr': 0.0003416708395382725, 'samples': 11196288, 'steps': 58313, 'loss/train': 1.304992437362671} -11/07/2021 05:24:41 - INFO - __main__ - Step 58315: {'lr': 0.00034166590241028425, 'samples': 11196480, 'steps': 58314, 'loss/train': 1.3999801874160767} -11/07/2021 05:24:42 - INFO - __main__ - Step 58316: {'lr': 0.00034166096524099264, 'samples': 11196672, 'steps': 58315, 'loss/train': 1.3416448831558228} -11/07/2021 05:24:42 - INFO - __main__ - Step 58317: {'lr': 0.00034165602803040013, 'samples': 11196864, 'steps': 58316, 'loss/train': 0.8841568827629089} -11/07/2021 05:24:42 - INFO - __main__ - Step 58318: {'lr': 0.00034165109077850884, 'samples': 11197056, 'steps': 58317, 'loss/train': 1.7505240440368652} -11/07/2021 05:24:43 - INFO - __main__ - Step 58319: {'lr': 0.00034164615348532094, 'samples': 11197248, 'steps': 58318, 'loss/train': 1.6183518171310425} -11/07/2021 05:24:44 - INFO - __main__ - Step 58320: {'lr': 0.0003416412161508387, 'samples': 11197440, 'steps': 58319, 'loss/train': 1.959389328956604} -11/07/2021 05:24:44 - INFO - __main__ - Step 58321: {'lr': 0.0003416362787750643, 'samples': 11197632, 'steps': 58320, 'loss/train': 1.081329107284546} -11/07/2021 05:24:44 - INFO - __main__ - Step 58322: {'lr': 0.00034163134135800004, 'samples': 11197824, 'steps': 58321, 'loss/train': 1.529457688331604} -11/07/2021 05:24:45 - INFO - __main__ - Step 58323: {'lr': 0.00034162640389964814, 'samples': 11198016, 'steps': 58322, 'loss/train': 1.1754611730575562} -11/07/2021 05:24:45 - INFO - __main__ - Step 58324: {'lr': 0.0003416214664000108, 'samples': 11198208, 'steps': 58323, 'loss/train': 1.4142574071884155} -11/07/2021 05:24:46 - INFO - __main__ - Step 58325: {'lr': 0.00034161652885909025, 'samples': 11198400, 'steps': 58324, 'loss/train': 1.1935970783233643} -11/07/2021 05:24:47 - INFO - __main__ - Step 58326: {'lr': 0.0003416115912768887, 'samples': 11198592, 'steps': 58325, 'loss/train': 1.3951812982559204} -11/07/2021 05:24:47 - INFO - __main__ - Step 58327: {'lr': 0.0003416066536534083, 'samples': 11198784, 'steps': 58326, 'loss/train': 0.9472230672836304} -11/07/2021 05:24:47 - INFO - __main__ - Step 58328: {'lr': 0.0003416017159886514, 'samples': 11198976, 'steps': 58327, 'loss/train': 0.9106329083442688} -11/07/2021 05:24:48 - INFO - __main__ - Step 58329: {'lr': 0.0003415967782826202, 'samples': 11199168, 'steps': 58328, 'loss/train': 0.9734601974487305} -11/07/2021 05:24:49 - INFO - __main__ - Step 58330: {'lr': 0.0003415918405353169, 'samples': 11199360, 'steps': 58329, 'loss/train': 0.8111278414726257} -11/07/2021 05:24:49 - INFO - __main__ - Step 58331: {'lr': 0.0003415869027467437, 'samples': 11199552, 'steps': 58330, 'loss/train': 1.3817026615142822} -11/07/2021 05:24:50 - INFO - __main__ - Step 58332: {'lr': 0.000341581964916903, 'samples': 11199744, 'steps': 58331, 'loss/train': 2.877706527709961} -11/07/2021 05:24:50 - INFO - __main__ - Step 58333: {'lr': 0.00034157702704579667, 'samples': 11199936, 'steps': 58332, 'loss/train': 1.1789413690567017} -11/07/2021 05:24:50 - INFO - __main__ - Step 58334: {'lr': 0.00034157208913342726, 'samples': 11200128, 'steps': 58333, 'loss/train': 1.6798967123031616} -11/07/2021 05:24:51 - INFO - __main__ - Step 58335: {'lr': 0.00034156715117979685, 'samples': 11200320, 'steps': 58334, 'loss/train': 1.5536830425262451} -11/07/2021 05:24:52 - INFO - __main__ - Step 58336: {'lr': 0.00034156221318490767, 'samples': 11200512, 'steps': 58335, 'loss/train': 1.310221791267395} -11/07/2021 05:24:52 - INFO - __main__ - Step 58337: {'lr': 0.000341557275148762, 'samples': 11200704, 'steps': 58336, 'loss/train': 1.6157326698303223} -11/07/2021 05:24:52 - INFO - __main__ - Step 58338: {'lr': 0.0003415523370713621, 'samples': 11200896, 'steps': 58337, 'loss/train': 1.3565797805786133} -11/07/2021 05:24:53 - INFO - __main__ - Step 58339: {'lr': 0.00034154739895271005, 'samples': 11201088, 'steps': 58338, 'loss/train': 1.564904808998108} -11/07/2021 05:24:54 - INFO - __main__ - Step 58340: {'lr': 0.00034154246079280817, 'samples': 11201280, 'steps': 58339, 'loss/train': 1.5634486675262451} -11/07/2021 05:24:54 - INFO - __main__ - Step 58341: {'lr': 0.0003415375225916586, 'samples': 11201472, 'steps': 58340, 'loss/train': 1.7276787757873535} -11/07/2021 05:24:55 - INFO - __main__ - Step 58342: {'lr': 0.0003415325843492637, 'samples': 11201664, 'steps': 58341, 'loss/train': 1.4368934631347656} -11/07/2021 05:24:55 - INFO - __main__ - Step 58343: {'lr': 0.00034152764606562564, 'samples': 11201856, 'steps': 58342, 'loss/train': 1.7426483631134033} -11/07/2021 05:24:55 - INFO - __main__ - Step 58344: {'lr': 0.0003415227077407466, 'samples': 11202048, 'steps': 58343, 'loss/train': 2.328885555267334} -11/07/2021 05:24:56 - INFO - __main__ - Step 58345: {'lr': 0.00034151776937462895, 'samples': 11202240, 'steps': 58344, 'loss/train': 1.487534761428833} -11/07/2021 05:24:57 - INFO - __main__ - Step 58346: {'lr': 0.0003415128309672747, 'samples': 11202432, 'steps': 58345, 'loss/train': 1.504127860069275} -11/07/2021 05:24:57 - INFO - __main__ - Step 58347: {'lr': 0.0003415078925186862, 'samples': 11202624, 'steps': 58346, 'loss/train': 1.621259331703186} -11/07/2021 05:24:57 - INFO - __main__ - Step 58348: {'lr': 0.00034150295402886566, 'samples': 11202816, 'steps': 58347, 'loss/train': 1.4061305522918701} -11/07/2021 05:24:58 - INFO - __main__ - Step 58349: {'lr': 0.0003414980154978153, 'samples': 11203008, 'steps': 58348, 'loss/train': 1.718531847000122} -11/07/2021 05:24:58 - INFO - __main__ - Step 58350: {'lr': 0.00034149307692553734, 'samples': 11203200, 'steps': 58349, 'loss/train': 1.1638323068618774} -11/07/2021 05:24:59 - INFO - __main__ - Step 58351: {'lr': 0.000341488138312034, 'samples': 11203392, 'steps': 58350, 'loss/train': 1.4727329015731812} -11/07/2021 05:24:59 - INFO - __main__ - Step 58352: {'lr': 0.00034148319965730757, 'samples': 11203584, 'steps': 58351, 'loss/train': 1.5973743200302124} -11/07/2021 05:25:00 - INFO - __main__ - Step 58353: {'lr': 0.0003414782609613602, 'samples': 11203776, 'steps': 58352, 'loss/train': 1.1058869361877441} -11/07/2021 05:25:00 - INFO - __main__ - Step 58354: {'lr': 0.0003414733222241941, 'samples': 11203968, 'steps': 58353, 'loss/train': 1.8483293056488037} -11/07/2021 05:25:00 - INFO - __main__ - Step 58355: {'lr': 0.00034146838344581155, 'samples': 11204160, 'steps': 58354, 'loss/train': 1.3488630056381226} -11/07/2021 05:25:01 - INFO - __main__ - Step 58356: {'lr': 0.00034146344462621477, 'samples': 11204352, 'steps': 58355, 'loss/train': 1.172558307647705} -11/07/2021 05:25:02 - INFO - __main__ - Step 58357: {'lr': 0.00034145850576540595, 'samples': 11204544, 'steps': 58356, 'loss/train': 1.4694602489471436} -11/07/2021 05:25:02 - INFO - __main__ - Step 58358: {'lr': 0.00034145356686338736, 'samples': 11204736, 'steps': 58357, 'loss/train': 1.4156039953231812} -11/07/2021 05:25:02 - INFO - __main__ - Step 58359: {'lr': 0.00034144862792016123, 'samples': 11204928, 'steps': 58358, 'loss/train': 1.4292247295379639} -11/07/2021 05:25:03 - INFO - __main__ - Step 58360: {'lr': 0.00034144368893572973, 'samples': 11205120, 'steps': 58359, 'loss/train': 0.8911574482917786} -11/07/2021 05:25:04 - INFO - __main__ - Step 58361: {'lr': 0.00034143874991009513, 'samples': 11205312, 'steps': 58360, 'loss/train': 1.5435965061187744} -11/07/2021 05:25:04 - INFO - __main__ - Step 58362: {'lr': 0.0003414338108432596, 'samples': 11205504, 'steps': 58361, 'loss/train': 1.7827941179275513} -11/07/2021 05:25:05 - INFO - __main__ - Step 58363: {'lr': 0.0003414288717352254, 'samples': 11205696, 'steps': 58362, 'loss/train': 1.3278061151504517} -11/07/2021 05:25:05 - INFO - __main__ - Step 58364: {'lr': 0.00034142393258599485, 'samples': 11205888, 'steps': 58363, 'loss/train': 2.042924642562866} -11/07/2021 05:25:05 - INFO - __main__ - Step 58365: {'lr': 0.00034141899339557003, 'samples': 11206080, 'steps': 58364, 'loss/train': 0.7355446219444275} -11/07/2021 05:25:06 - INFO - __main__ - Step 58366: {'lr': 0.0003414140541639532, 'samples': 11206272, 'steps': 58365, 'loss/train': 1.257541537284851} -11/07/2021 05:25:07 - INFO - __main__ - Step 58367: {'lr': 0.0003414091148911466, 'samples': 11206464, 'steps': 58366, 'loss/train': 1.490370750427246} -11/07/2021 05:25:07 - INFO - __main__ - Step 58368: {'lr': 0.00034140417557715255, 'samples': 11206656, 'steps': 58367, 'loss/train': 1.6572939157485962} -11/07/2021 05:25:07 - INFO - __main__ - Step 58369: {'lr': 0.0003413992362219731, 'samples': 11206848, 'steps': 58368, 'loss/train': 1.513646125793457} -11/07/2021 05:25:08 - INFO - __main__ - Step 58370: {'lr': 0.0003413942968256106, 'samples': 11207040, 'steps': 58369, 'loss/train': 1.2397743463516235} -11/07/2021 05:25:09 - INFO - __main__ - Step 58371: {'lr': 0.00034138935738806727, 'samples': 11207232, 'steps': 58370, 'loss/train': 1.7745050191879272} -11/07/2021 05:25:09 - INFO - __main__ - Step 58372: {'lr': 0.0003413844179093453, 'samples': 11207424, 'steps': 58371, 'loss/train': 1.7837297916412354} -11/07/2021 05:25:09 - INFO - __main__ - Step 58373: {'lr': 0.0003413794783894468, 'samples': 11207616, 'steps': 58372, 'loss/train': 1.6627751588821411} -11/07/2021 05:25:10 - INFO - __main__ - Step 58374: {'lr': 0.0003413745388283742, 'samples': 11207808, 'steps': 58373, 'loss/train': 1.1967734098434448} -11/07/2021 05:25:10 - INFO - __main__ - Step 58375: {'lr': 0.00034136959922612977, 'samples': 11208000, 'steps': 58374, 'loss/train': 1.3841203451156616} -11/07/2021 05:25:10 - INFO - __main__ - Step 58376: {'lr': 0.00034136465958271546, 'samples': 11208192, 'steps': 58375, 'loss/train': 1.028459072113037} -11/07/2021 05:25:11 - INFO - __main__ - Step 58377: {'lr': 0.00034135971989813363, 'samples': 11208384, 'steps': 58376, 'loss/train': 1.339853286743164} -11/07/2021 05:25:12 - INFO - __main__ - Step 58378: {'lr': 0.0003413547801723866, 'samples': 11208576, 'steps': 58377, 'loss/train': 1.0697388648986816} -11/07/2021 05:25:12 - INFO - __main__ - Step 58379: {'lr': 0.00034134984040547645, 'samples': 11208768, 'steps': 58378, 'loss/train': 1.5722737312316895} -11/07/2021 05:25:13 - INFO - __main__ - Step 58380: {'lr': 0.0003413449005974055, 'samples': 11208960, 'steps': 58379, 'loss/train': 1.5390830039978027} -11/07/2021 05:25:13 - INFO - __main__ - Step 58381: {'lr': 0.00034133996074817597, 'samples': 11209152, 'steps': 58380, 'loss/train': 1.4299684762954712} -11/07/2021 05:25:14 - INFO - __main__ - Step 58382: {'lr': 0.00034133502085779006, 'samples': 11209344, 'steps': 58381, 'loss/train': 1.7696834802627563} -11/07/2021 05:25:14 - INFO - __main__ - Step 58383: {'lr': 0.00034133008092624995, 'samples': 11209536, 'steps': 58382, 'loss/train': 1.5855791568756104} -11/07/2021 05:25:15 - INFO - __main__ - Step 58384: {'lr': 0.0003413251409535579, 'samples': 11209728, 'steps': 58383, 'loss/train': 1.531802773475647} -11/07/2021 05:25:15 - INFO - __main__ - Step 58385: {'lr': 0.0003413202009397163, 'samples': 11209920, 'steps': 58384, 'loss/train': 1.2706406116485596} -11/07/2021 05:25:16 - INFO - __main__ - Step 58386: {'lr': 0.0003413152608847271, 'samples': 11210112, 'steps': 58385, 'loss/train': 0.9080643653869629} -11/07/2021 05:25:17 - INFO - __main__ - Step 58387: {'lr': 0.0003413103207885927, 'samples': 11210304, 'steps': 58386, 'loss/train': 1.0522125959396362} -11/07/2021 05:25:17 - INFO - __main__ - Step 58388: {'lr': 0.00034130538065131524, 'samples': 11210496, 'steps': 58387, 'loss/train': 1.045793890953064} -11/07/2021 05:25:17 - INFO - __main__ - Step 58389: {'lr': 0.000341300440472897, 'samples': 11210688, 'steps': 58388, 'loss/train': 1.702425479888916} -11/07/2021 05:25:18 - INFO - __main__ - Step 58390: {'lr': 0.00034129550025334014, 'samples': 11210880, 'steps': 58389, 'loss/train': 1.2906677722930908} -11/07/2021 05:25:18 - INFO - __main__ - Step 58391: {'lr': 0.00034129055999264704, 'samples': 11211072, 'steps': 58390, 'loss/train': 1.4244874715805054} -11/07/2021 05:25:19 - INFO - __main__ - Step 58392: {'lr': 0.0003412856196908198, 'samples': 11211264, 'steps': 58391, 'loss/train': 1.1508504152297974} -11/07/2021 05:25:19 - INFO - __main__ - Step 58393: {'lr': 0.00034128067934786064, 'samples': 11211456, 'steps': 58392, 'loss/train': 1.6703565120697021} -11/07/2021 05:25:20 - INFO - __main__ - Step 58394: {'lr': 0.0003412757389637718, 'samples': 11211648, 'steps': 58393, 'loss/train': 1.8441166877746582} -11/07/2021 05:25:20 - INFO - __main__ - Step 58395: {'lr': 0.00034127079853855545, 'samples': 11211840, 'steps': 58394, 'loss/train': 1.4765968322753906} -11/07/2021 05:25:20 - INFO - __main__ - Step 58396: {'lr': 0.00034126585807221397, 'samples': 11212032, 'steps': 58395, 'loss/train': 2.049560546875} -11/07/2021 05:25:21 - INFO - __main__ - Step 58397: {'lr': 0.0003412609175647495, 'samples': 11212224, 'steps': 58396, 'loss/train': 1.4930609464645386} -11/07/2021 05:25:22 - INFO - __main__ - Step 58398: {'lr': 0.0003412559770161643, 'samples': 11212416, 'steps': 58397, 'loss/train': 1.710405945777893} -11/07/2021 05:25:22 - INFO - __main__ - Step 58399: {'lr': 0.0003412510364264606, 'samples': 11212608, 'steps': 58398, 'loss/train': 1.7443203926086426} -11/07/2021 05:25:23 - INFO - __main__ - Step 58400: {'lr': 0.0003412460957956405, 'samples': 11212800, 'steps': 58399, 'loss/train': 2.1306657791137695} -11/07/2021 05:25:23 - INFO - __main__ - Step 58401: {'lr': 0.00034124115512370636, 'samples': 11212992, 'steps': 58400, 'loss/train': 1.4786614179611206} -11/07/2021 05:25:23 - INFO - __main__ - Step 58402: {'lr': 0.0003412362144106603, 'samples': 11213184, 'steps': 58401, 'loss/train': 1.1887379884719849} -11/07/2021 05:25:24 - INFO - __main__ - Step 58403: {'lr': 0.00034123127365650463, 'samples': 11213376, 'steps': 58402, 'loss/train': 1.3642297983169556} -11/07/2021 05:25:25 - INFO - __main__ - Step 58404: {'lr': 0.0003412263328612416, 'samples': 11213568, 'steps': 58403, 'loss/train': 1.8511093854904175} -11/07/2021 05:25:25 - INFO - __main__ - Step 58405: {'lr': 0.00034122139202487334, 'samples': 11213760, 'steps': 58404, 'loss/train': 1.587825059890747} -11/07/2021 05:25:25 - INFO - __main__ - Step 58406: {'lr': 0.00034121645114740224, 'samples': 11213952, 'steps': 58405, 'loss/train': 1.443624496459961} -11/07/2021 05:25:26 - INFO - __main__ - Step 58407: {'lr': 0.00034121151022883033, 'samples': 11214144, 'steps': 58406, 'loss/train': 1.4731860160827637} -11/07/2021 05:25:26 - INFO - __main__ - Step 58408: {'lr': 0.00034120656926915995, 'samples': 11214336, 'steps': 58407, 'loss/train': 1.2097426652908325} -11/07/2021 05:25:27 - INFO - __main__ - Step 58409: {'lr': 0.0003412016282683932, 'samples': 11214528, 'steps': 58408, 'loss/train': 1.3646695613861084} -11/07/2021 05:25:28 - INFO - __main__ - Step 58410: {'lr': 0.0003411966872265325, 'samples': 11214720, 'steps': 58409, 'loss/train': 1.5305606126785278} -11/07/2021 05:25:28 - INFO - __main__ - Step 58411: {'lr': 0.00034119174614357994, 'samples': 11214912, 'steps': 58410, 'loss/train': 1.4746593236923218} -11/07/2021 05:25:28 - INFO - __main__ - Step 58412: {'lr': 0.00034118680501953784, 'samples': 11215104, 'steps': 58411, 'loss/train': 1.6140037775039673} -11/07/2021 05:25:29 - INFO - __main__ - Step 58413: {'lr': 0.00034118186385440833, 'samples': 11215296, 'steps': 58412, 'loss/train': 1.4457831382751465} -11/07/2021 05:25:30 - INFO - __main__ - Step 58414: {'lr': 0.00034117692264819374, 'samples': 11215488, 'steps': 58413, 'loss/train': 0.9754199385643005} -11/07/2021 05:25:30 - INFO - __main__ - Step 58415: {'lr': 0.0003411719814008961, 'samples': 11215680, 'steps': 58414, 'loss/train': 1.1841983795166016} -11/07/2021 05:25:30 - INFO - __main__ - Step 58416: {'lr': 0.0003411670401125179, 'samples': 11215872, 'steps': 58415, 'loss/train': 1.4019126892089844} -11/07/2021 05:25:31 - INFO - __main__ - Step 58417: {'lr': 0.00034116209878306116, 'samples': 11216064, 'steps': 58416, 'loss/train': 1.2930548191070557} -11/07/2021 05:25:31 - INFO - __main__ - Step 58418: {'lr': 0.00034115715741252824, 'samples': 11216256, 'steps': 58417, 'loss/train': 1.7811188697814941} -11/07/2021 05:25:32 - INFO - __main__ - Step 58419: {'lr': 0.0003411522160009213, 'samples': 11216448, 'steps': 58418, 'loss/train': 1.5482412576675415} -11/07/2021 05:25:32 - INFO - __main__ - Step 58420: {'lr': 0.00034114727454824257, 'samples': 11216640, 'steps': 58419, 'loss/train': 1.6688786745071411} -11/07/2021 05:25:33 - INFO - __main__ - Step 58421: {'lr': 0.00034114233305449426, 'samples': 11216832, 'steps': 58420, 'loss/train': 1.3504208326339722} -11/07/2021 05:25:33 - INFO - __main__ - Step 58422: {'lr': 0.00034113739151967864, 'samples': 11217024, 'steps': 58421, 'loss/train': 1.7886126041412354} -11/07/2021 05:25:33 - INFO - __main__ - Step 58423: {'lr': 0.00034113244994379794, 'samples': 11217216, 'steps': 58422, 'loss/train': 1.0460597276687622} -11/07/2021 05:25:35 - INFO - __main__ - Step 58424: {'lr': 0.00034112750832685434, 'samples': 11217408, 'steps': 58423, 'loss/train': 1.436403751373291} -11/07/2021 05:25:35 - INFO - __main__ - Step 58425: {'lr': 0.0003411225666688501, 'samples': 11217600, 'steps': 58424, 'loss/train': 2.3052642345428467} -11/07/2021 05:25:35 - INFO - __main__ - Step 58426: {'lr': 0.0003411176249697875, 'samples': 11217792, 'steps': 58425, 'loss/train': 1.1679171323776245} -11/07/2021 05:25:36 - INFO - __main__ - Step 58427: {'lr': 0.0003411126832296686, 'samples': 11217984, 'steps': 58426, 'loss/train': 1.7709113359451294} -11/07/2021 05:25:36 - INFO - __main__ - Step 58428: {'lr': 0.00034110774144849575, 'samples': 11218176, 'steps': 58427, 'loss/train': 1.904578447341919} -11/07/2021 05:25:37 - INFO - __main__ - Step 58429: {'lr': 0.00034110279962627115, 'samples': 11218368, 'steps': 58428, 'loss/train': 0.8743123412132263} -11/07/2021 05:25:38 - INFO - __main__ - Step 58430: {'lr': 0.0003410978577629971, 'samples': 11218560, 'steps': 58429, 'loss/train': 2.0276880264282227} -11/07/2021 05:25:38 - INFO - __main__ - Step 58431: {'lr': 0.0003410929158586757, 'samples': 11218752, 'steps': 58430, 'loss/train': 0.9819093942642212} -11/07/2021 05:25:38 - INFO - __main__ - Step 58432: {'lr': 0.0003410879739133093, 'samples': 11218944, 'steps': 58431, 'loss/train': 1.8218625783920288} -11/07/2021 05:25:39 - INFO - __main__ - Step 58433: {'lr': 0.00034108303192690003, 'samples': 11219136, 'steps': 58432, 'loss/train': 2.471243381500244} -11/07/2021 05:25:40 - INFO - __main__ - Step 58434: {'lr': 0.0003410780898994501, 'samples': 11219328, 'steps': 58433, 'loss/train': 1.8734984397888184} -11/07/2021 05:25:40 - INFO - __main__ - Step 58435: {'lr': 0.00034107314783096183, 'samples': 11219520, 'steps': 58434, 'loss/train': 1.4329745769500732} -11/07/2021 05:25:41 - INFO - __main__ - Step 58436: {'lr': 0.0003410682057214374, 'samples': 11219712, 'steps': 58435, 'loss/train': 0.6696116924285889} -11/07/2021 05:25:41 - INFO - __main__ - Step 58437: {'lr': 0.00034106326357087905, 'samples': 11219904, 'steps': 58436, 'loss/train': 1.388970971107483} -11/07/2021 05:25:41 - INFO - __main__ - Step 58438: {'lr': 0.000341058321379289, 'samples': 11220096, 'steps': 58437, 'loss/train': 1.5257045030593872} -11/07/2021 05:25:42 - INFO - __main__ - Step 58439: {'lr': 0.0003410533791466695, 'samples': 11220288, 'steps': 58438, 'loss/train': 1.4143130779266357} -11/07/2021 05:25:43 - INFO - __main__ - Step 58440: {'lr': 0.0003410484368730227, 'samples': 11220480, 'steps': 58439, 'loss/train': 1.3513290882110596} -11/07/2021 05:25:43 - INFO - __main__ - Step 58441: {'lr': 0.00034104349455835094, 'samples': 11220672, 'steps': 58440, 'loss/train': 0.796983003616333} -11/07/2021 05:25:43 - INFO - __main__ - Step 58442: {'lr': 0.0003410385522026563, 'samples': 11220864, 'steps': 58441, 'loss/train': 1.6240644454956055} -11/07/2021 05:25:44 - INFO - __main__ - Step 58443: {'lr': 0.0003410336098059412, 'samples': 11221056, 'steps': 58442, 'loss/train': 0.7649230360984802} -11/07/2021 05:25:44 - INFO - __main__ - Step 58444: {'lr': 0.0003410286673682077, 'samples': 11221248, 'steps': 58443, 'loss/train': 1.2710825204849243} -11/07/2021 05:25:45 - INFO - __main__ - Step 58445: {'lr': 0.0003410237248894581, 'samples': 11221440, 'steps': 58444, 'loss/train': 1.3829941749572754} -11/07/2021 05:25:45 - INFO - __main__ - Step 58446: {'lr': 0.00034101878236969464, 'samples': 11221632, 'steps': 58445, 'loss/train': 2.1312994956970215} -11/07/2021 05:25:46 - INFO - __main__ - Step 58447: {'lr': 0.0003410138398089195, 'samples': 11221824, 'steps': 58446, 'loss/train': 1.766077995300293} -11/07/2021 05:25:46 - INFO - __main__ - Step 58448: {'lr': 0.0003410088972071349, 'samples': 11222016, 'steps': 58447, 'loss/train': 1.6206458806991577} -11/07/2021 05:25:47 - INFO - __main__ - Step 58449: {'lr': 0.0003410039545643431, 'samples': 11222208, 'steps': 58448, 'loss/train': 1.5594794750213623} -11/07/2021 05:25:48 - INFO - __main__ - Step 58450: {'lr': 0.0003409990118805463, 'samples': 11222400, 'steps': 58449, 'loss/train': 1.4494882822036743} -11/07/2021 05:25:48 - INFO - __main__ - Step 58451: {'lr': 0.0003409940691557468, 'samples': 11222592, 'steps': 58450, 'loss/train': 1.6536080837249756} -11/07/2021 05:25:48 - INFO - __main__ - Step 58452: {'lr': 0.0003409891263899467, 'samples': 11222784, 'steps': 58451, 'loss/train': 1.4545527696609497} -11/07/2021 05:25:49 - INFO - __main__ - Step 58453: {'lr': 0.0003409841835831484, 'samples': 11222976, 'steps': 58452, 'loss/train': 1.3133459091186523} -11/07/2021 05:25:49 - INFO - __main__ - Step 58454: {'lr': 0.000340979240735354, 'samples': 11223168, 'steps': 58453, 'loss/train': 1.4204963445663452} -11/07/2021 05:25:49 - INFO - __main__ - Step 58455: {'lr': 0.00034097429784656574, 'samples': 11223360, 'steps': 58454, 'loss/train': 1.6007115840911865} -11/07/2021 05:25:50 - INFO - __main__ - Step 58456: {'lr': 0.00034096935491678595, 'samples': 11223552, 'steps': 58455, 'loss/train': 1.6012096405029297} -11/07/2021 05:25:51 - INFO - __main__ - Step 58457: {'lr': 0.0003409644119460166, 'samples': 11223744, 'steps': 58456, 'loss/train': 1.7056620121002197} -11/07/2021 05:25:51 - INFO - __main__ - Step 58458: {'lr': 0.00034095946893426024, 'samples': 11223936, 'steps': 58457, 'loss/train': 0.8120853900909424} -11/07/2021 05:25:51 - INFO - __main__ - Step 58459: {'lr': 0.0003409545258815189, 'samples': 11224128, 'steps': 58458, 'loss/train': 1.0179810523986816} -11/07/2021 05:25:52 - INFO - __main__ - Step 58460: {'lr': 0.00034094958278779486, 'samples': 11224320, 'steps': 58459, 'loss/train': 1.7241183519363403} -11/07/2021 05:25:53 - INFO - __main__ - Step 58461: {'lr': 0.00034094463965309035, 'samples': 11224512, 'steps': 58460, 'loss/train': 1.5440194606781006} -11/07/2021 05:25:53 - INFO - __main__ - Step 58462: {'lr': 0.00034093969647740755, 'samples': 11224704, 'steps': 58461, 'loss/train': 0.582253098487854} -11/07/2021 05:25:54 - INFO - __main__ - Step 58463: {'lr': 0.00034093475326074874, 'samples': 11224896, 'steps': 58462, 'loss/train': 1.6896227598190308} -11/07/2021 05:25:54 - INFO - __main__ - Step 58464: {'lr': 0.00034092981000311614, 'samples': 11225088, 'steps': 58463, 'loss/train': 1.6384936571121216} -11/07/2021 05:25:54 - INFO - __main__ - Step 58465: {'lr': 0.00034092486670451197, 'samples': 11225280, 'steps': 58464, 'loss/train': 0.5751922130584717} -11/07/2021 05:25:55 - INFO - __main__ - Step 58466: {'lr': 0.0003409199233649385, 'samples': 11225472, 'steps': 58465, 'loss/train': 0.8946777582168579} -11/07/2021 05:25:56 - INFO - __main__ - Step 58467: {'lr': 0.0003409149799843979, 'samples': 11225664, 'steps': 58466, 'loss/train': 1.3113489151000977} -11/07/2021 05:25:56 - INFO - __main__ - Step 58468: {'lr': 0.00034091003656289235, 'samples': 11225856, 'steps': 58467, 'loss/train': 1.8885964155197144} -11/07/2021 05:25:56 - INFO - __main__ - Step 58469: {'lr': 0.00034090509310042414, 'samples': 11226048, 'steps': 58468, 'loss/train': 1.6570892333984375} -11/07/2021 05:25:57 - INFO - __main__ - Step 58470: {'lr': 0.00034090014959699554, 'samples': 11226240, 'steps': 58469, 'loss/train': 1.4603313207626343} -11/07/2021 05:25:59 - INFO - __main__ - Step 58471: {'lr': 0.0003408952060526087, 'samples': 11226432, 'steps': 58470, 'loss/train': 1.2665852308273315} -11/07/2021 05:25:59 - INFO - __main__ - Step 58472: {'lr': 0.00034089026246726596, 'samples': 11226624, 'steps': 58471, 'loss/train': 1.663528561592102} -11/07/2021 05:26:00 - INFO - __main__ - Step 58473: {'lr': 0.00034088531884096944, 'samples': 11226816, 'steps': 58472, 'loss/train': 1.2827757596969604} -11/07/2021 05:26:00 - INFO - __main__ - Step 58474: {'lr': 0.0003408803751737214, 'samples': 11227008, 'steps': 58473, 'loss/train': 1.6015524864196777} -11/07/2021 05:26:00 - INFO - __main__ - Step 58475: {'lr': 0.00034087543146552404, 'samples': 11227200, 'steps': 58474, 'loss/train': 1.0194486379623413} -11/07/2021 05:26:01 - INFO - __main__ - Step 58476: {'lr': 0.0003408704877163796, 'samples': 11227392, 'steps': 58475, 'loss/train': 1.4756325483322144} -11/07/2021 05:26:01 - INFO - __main__ - Step 58477: {'lr': 0.00034086554392629033, 'samples': 11227584, 'steps': 58476, 'loss/train': 0.9150516986846924} -11/07/2021 05:26:01 - INFO - __main__ - Step 58478: {'lr': 0.00034086060009525844, 'samples': 11227776, 'steps': 58477, 'loss/train': 0.882000207901001} -11/07/2021 05:26:02 - INFO - __main__ - Step 58479: {'lr': 0.0003408556562232862, 'samples': 11227968, 'steps': 58478, 'loss/train': 1.1304144859313965} -11/07/2021 05:26:03 - INFO - __main__ - Step 58480: {'lr': 0.00034085071231037585, 'samples': 11228160, 'steps': 58479, 'loss/train': 1.2820016145706177} -11/07/2021 05:26:03 - INFO - __main__ - Step 58481: {'lr': 0.0003408457683565295, 'samples': 11228352, 'steps': 58480, 'loss/train': 1.3621982336044312} -11/07/2021 05:26:03 - INFO - __main__ - Step 58482: {'lr': 0.00034084082436174946, 'samples': 11228544, 'steps': 58481, 'loss/train': 1.0864423513412476} -11/07/2021 05:26:04 - INFO - __main__ - Step 58483: {'lr': 0.0003408358803260379, 'samples': 11228736, 'steps': 58482, 'loss/train': 1.4017298221588135} -11/07/2021 05:26:04 - INFO - __main__ - Step 58484: {'lr': 0.00034083093624939716, 'samples': 11228928, 'steps': 58483, 'loss/train': 1.4749741554260254} -11/07/2021 05:26:05 - INFO - __main__ - Step 58485: {'lr': 0.00034082599213182933, 'samples': 11229120, 'steps': 58484, 'loss/train': 1.3955676555633545} -11/07/2021 05:26:05 - INFO - __main__ - Step 58486: {'lr': 0.0003408210479733368, 'samples': 11229312, 'steps': 58485, 'loss/train': 1.6664291620254517} -11/07/2021 05:26:06 - INFO - __main__ - Step 58487: {'lr': 0.0003408161037739217, 'samples': 11229504, 'steps': 58486, 'loss/train': 1.0070327520370483} -11/07/2021 05:26:06 - INFO - __main__ - Step 58488: {'lr': 0.0003408111595335862, 'samples': 11229696, 'steps': 58487, 'loss/train': 1.5712045431137085} -11/07/2021 05:26:06 - INFO - __main__ - Step 58489: {'lr': 0.00034080621525233264, 'samples': 11229888, 'steps': 58488, 'loss/train': 1.3353732824325562} -11/07/2021 05:26:08 - INFO - __main__ - Step 58490: {'lr': 0.0003408012709301632, 'samples': 11230080, 'steps': 58489, 'loss/train': 1.323580026626587} -11/07/2021 05:26:08 - INFO - __main__ - Step 58491: {'lr': 0.00034079632656708005, 'samples': 11230272, 'steps': 58490, 'loss/train': 1.2277162075042725} -11/07/2021 05:26:08 - INFO - __main__ - Step 58492: {'lr': 0.00034079138216308553, 'samples': 11230464, 'steps': 58491, 'loss/train': 1.6625176668167114} -11/07/2021 05:26:09 - INFO - __main__ - Step 58493: {'lr': 0.00034078643771818184, 'samples': 11230656, 'steps': 58492, 'loss/train': 1.116775393486023} -11/07/2021 05:26:09 - INFO - __main__ - Step 58494: {'lr': 0.00034078149323237114, 'samples': 11230848, 'steps': 58493, 'loss/train': 1.5711719989776611} -11/07/2021 05:26:10 - INFO - __main__ - Step 58495: {'lr': 0.00034077654870565566, 'samples': 11231040, 'steps': 58494, 'loss/train': 1.6955015659332275} -11/07/2021 05:26:10 - INFO - __main__ - Step 58496: {'lr': 0.00034077160413803774, 'samples': 11231232, 'steps': 58495, 'loss/train': 1.8912805318832397} -11/07/2021 05:26:11 - INFO - __main__ - Step 58497: {'lr': 0.0003407666595295195, 'samples': 11231424, 'steps': 58496, 'loss/train': 2.1351826190948486} -11/07/2021 05:26:11 - INFO - __main__ - Step 58498: {'lr': 0.0003407617148801033, 'samples': 11231616, 'steps': 58497, 'loss/train': 1.5520429611206055} -11/07/2021 05:26:11 - INFO - __main__ - Step 58499: {'lr': 0.0003407567701897911, 'samples': 11231808, 'steps': 58498, 'loss/train': 1.2427788972854614} -11/07/2021 05:26:12 - INFO - __main__ - Step 58500: {'lr': 0.0003407518254585854, 'samples': 11232000, 'steps': 58499, 'loss/train': 1.039374828338623} -11/07/2021 05:26:13 - INFO - __main__ - Step 58501: {'lr': 0.0003407468806864883, 'samples': 11232192, 'steps': 58500, 'loss/train': 1.1369225978851318} -11/07/2021 05:26:13 - INFO - __main__ - Step 58502: {'lr': 0.0003407419358735021, 'samples': 11232384, 'steps': 58501, 'loss/train': 1.0871407985687256} -11/07/2021 05:26:13 - INFO - __main__ - Step 58503: {'lr': 0.0003407369910196289, 'samples': 11232576, 'steps': 58502, 'loss/train': 1.1347147226333618} -11/07/2021 05:26:14 - INFO - __main__ - Step 58504: {'lr': 0.0003407320461248711, 'samples': 11232768, 'steps': 58503, 'loss/train': 1.7463244199752808} -11/07/2021 05:26:15 - INFO - __main__ - Step 58505: {'lr': 0.00034072710118923086, 'samples': 11232960, 'steps': 58504, 'loss/train': 1.2943141460418701} -11/07/2021 05:26:15 - INFO - __main__ - Step 58506: {'lr': 0.0003407221562127103, 'samples': 11233152, 'steps': 58505, 'loss/train': 1.6389752626419067} -11/07/2021 05:26:15 - INFO - __main__ - Step 58507: {'lr': 0.0003407172111953117, 'samples': 11233344, 'steps': 58506, 'loss/train': 1.3285409212112427} -11/07/2021 05:26:16 - INFO - __main__ - Step 58508: {'lr': 0.00034071226613703744, 'samples': 11233536, 'steps': 58507, 'loss/train': 1.5552165508270264} -11/07/2021 05:26:16 - INFO - __main__ - Step 58509: {'lr': 0.0003407073210378897, 'samples': 11233728, 'steps': 58508, 'loss/train': 1.6005282402038574} -11/07/2021 05:26:17 - INFO - __main__ - Step 58510: {'lr': 0.00034070237589787047, 'samples': 11233920, 'steps': 58509, 'loss/train': 1.6873674392700195} -11/07/2021 05:26:18 - INFO - __main__ - Step 58511: {'lr': 0.00034069743071698215, 'samples': 11234112, 'steps': 58510, 'loss/train': 1.2324090003967285} -11/07/2021 05:26:18 - INFO - __main__ - Step 58512: {'lr': 0.000340692485495227, 'samples': 11234304, 'steps': 58511, 'loss/train': 1.2363803386688232} -11/07/2021 05:26:18 - INFO - __main__ - Step 58513: {'lr': 0.0003406875402326073, 'samples': 11234496, 'steps': 58512, 'loss/train': 1.2501964569091797} -11/07/2021 05:26:19 - INFO - __main__ - Step 58514: {'lr': 0.00034068259492912514, 'samples': 11234688, 'steps': 58513, 'loss/train': 1.5018353462219238} -11/07/2021 05:26:19 - INFO - __main__ - Step 58515: {'lr': 0.00034067764958478283, 'samples': 11234880, 'steps': 58514, 'loss/train': 1.2529922723770142} -11/07/2021 05:26:20 - INFO - __main__ - Step 58516: {'lr': 0.0003406727041995825, 'samples': 11235072, 'steps': 58515, 'loss/train': 1.340499997138977} -11/07/2021 05:26:20 - INFO - __main__ - Step 58517: {'lr': 0.00034066775877352644, 'samples': 11235264, 'steps': 58516, 'loss/train': 2.417407751083374} -11/07/2021 05:26:21 - INFO - __main__ - Step 58518: {'lr': 0.00034066281330661697, 'samples': 11235456, 'steps': 58517, 'loss/train': 1.1057500839233398} -11/07/2021 05:26:21 - INFO - __main__ - Step 58519: {'lr': 0.0003406578677988562, 'samples': 11235648, 'steps': 58518, 'loss/train': 1.3503586053848267} -11/07/2021 05:26:21 - INFO - __main__ - Step 58520: {'lr': 0.00034065292225024643, 'samples': 11235840, 'steps': 58519, 'loss/train': 1.4391413927078247} -11/07/2021 05:26:22 - INFO - __main__ - Step 58521: {'lr': 0.0003406479766607898, 'samples': 11236032, 'steps': 58520, 'loss/train': 1.568670392036438} -11/07/2021 05:26:23 - INFO - __main__ - Step 58522: {'lr': 0.00034064303103048863, 'samples': 11236224, 'steps': 58521, 'loss/train': 1.5107706785202026} -11/07/2021 05:26:23 - INFO - __main__ - Step 58523: {'lr': 0.000340638085359345, 'samples': 11236416, 'steps': 58522, 'loss/train': 1.541881799697876} -11/07/2021 05:26:23 - INFO - __main__ - Step 58524: {'lr': 0.00034063313964736135, 'samples': 11236608, 'steps': 58523, 'loss/train': 1.410552740097046} -11/07/2021 05:26:24 - INFO - __main__ - Step 58525: {'lr': 0.0003406281938945398, 'samples': 11236800, 'steps': 58524, 'loss/train': 1.5633823871612549} -11/07/2021 05:26:25 - INFO - __main__ - Step 58526: {'lr': 0.0003406232481008825, 'samples': 11236992, 'steps': 58525, 'loss/train': 1.2339831590652466} -11/07/2021 05:26:25 - INFO - __main__ - Step 58527: {'lr': 0.0003406183022663919, 'samples': 11237184, 'steps': 58526, 'loss/train': 1.4524608850479126} -11/07/2021 05:26:26 - INFO - __main__ - Step 58528: {'lr': 0.00034061335639107006, 'samples': 11237376, 'steps': 58527, 'loss/train': 1.383617877960205} -11/07/2021 05:26:26 - INFO - __main__ - Step 58529: {'lr': 0.0003406084104749192, 'samples': 11237568, 'steps': 58528, 'loss/train': 1.4862842559814453} -11/07/2021 05:26:26 - INFO - __main__ - Step 58530: {'lr': 0.00034060346451794156, 'samples': 11237760, 'steps': 58529, 'loss/train': 1.6672933101654053} -11/07/2021 05:26:27 - INFO - __main__ - Step 58531: {'lr': 0.0003405985185201394, 'samples': 11237952, 'steps': 58530, 'loss/train': 1.3401219844818115} -11/07/2021 05:26:28 - INFO - __main__ - Step 58532: {'lr': 0.000340593572481515, 'samples': 11238144, 'steps': 58531, 'loss/train': 1.2921035289764404} -11/07/2021 05:26:28 - INFO - __main__ - Step 58533: {'lr': 0.0003405886264020706, 'samples': 11238336, 'steps': 58532, 'loss/train': 1.5293786525726318} -11/07/2021 05:26:28 - INFO - __main__ - Step 58534: {'lr': 0.0003405836802818082, 'samples': 11238528, 'steps': 58533, 'loss/train': 0.5165374279022217} -11/07/2021 05:26:29 - INFO - __main__ - Step 58535: {'lr': 0.00034057873412073026, 'samples': 11238720, 'steps': 58534, 'loss/train': 1.6103554964065552} -11/07/2021 05:26:30 - INFO - __main__ - Step 58536: {'lr': 0.0003405737879188389, 'samples': 11238912, 'steps': 58535, 'loss/train': 1.6690616607666016} -11/07/2021 05:26:30 - INFO - __main__ - Step 58537: {'lr': 0.0003405688416761364, 'samples': 11239104, 'steps': 58536, 'loss/train': 1.1031736135482788} -11/07/2021 05:26:30 - INFO - __main__ - Step 58538: {'lr': 0.00034056389539262506, 'samples': 11239296, 'steps': 58537, 'loss/train': 0.9342900514602661} -11/07/2021 05:26:31 - INFO - __main__ - Step 58539: {'lr': 0.000340558949068307, 'samples': 11239488, 'steps': 58538, 'loss/train': 1.6302703619003296} -11/07/2021 05:26:31 - INFO - __main__ - Step 58540: {'lr': 0.0003405540027031845, 'samples': 11239680, 'steps': 58539, 'loss/train': 1.5585918426513672} -11/07/2021 05:26:32 - INFO - __main__ - Step 58541: {'lr': 0.00034054905629725965, 'samples': 11239872, 'steps': 58540, 'loss/train': 0.9911255836486816} -11/07/2021 05:26:33 - INFO - __main__ - Step 58542: {'lr': 0.00034054410985053483, 'samples': 11240064, 'steps': 58541, 'loss/train': 1.3347887992858887} -11/07/2021 05:26:33 - INFO - __main__ - Step 58543: {'lr': 0.00034053916336301225, 'samples': 11240256, 'steps': 58542, 'loss/train': 1.497240662574768} -11/07/2021 05:26:33 - INFO - __main__ - Step 58544: {'lr': 0.00034053421683469416, 'samples': 11240448, 'steps': 58543, 'loss/train': 0.7741641402244568} -11/07/2021 05:26:34 - INFO - __main__ - Step 58545: {'lr': 0.00034052927026558265, 'samples': 11240640, 'steps': 58544, 'loss/train': 1.7934575080871582} -11/07/2021 05:26:35 - INFO - __main__ - Step 58546: {'lr': 0.00034052432365568015, 'samples': 11240832, 'steps': 58545, 'loss/train': 1.5654975175857544} -11/07/2021 05:26:35 - INFO - __main__ - Step 58547: {'lr': 0.0003405193770049888, 'samples': 11241024, 'steps': 58546, 'loss/train': 1.5136960744857788} -11/07/2021 05:26:35 - INFO - __main__ - Step 58548: {'lr': 0.0003405144303135108, 'samples': 11241216, 'steps': 58547, 'loss/train': 1.2865959405899048} -11/07/2021 05:26:36 - INFO - __main__ - Step 58549: {'lr': 0.00034050948358124836, 'samples': 11241408, 'steps': 58548, 'loss/train': 0.9187461137771606} -11/07/2021 05:26:36 - INFO - __main__ - Step 58550: {'lr': 0.00034050453680820373, 'samples': 11241600, 'steps': 58549, 'loss/train': 1.1021056175231934} -11/07/2021 05:26:37 - INFO - __main__ - Step 58551: {'lr': 0.0003404995899943791, 'samples': 11241792, 'steps': 58550, 'loss/train': 1.6945784091949463} -11/07/2021 05:26:37 - INFO - __main__ - Step 58552: {'lr': 0.00034049464313977684, 'samples': 11241984, 'steps': 58551, 'loss/train': 1.5661370754241943} -11/07/2021 05:26:38 - INFO - __main__ - Step 58553: {'lr': 0.0003404896962443991, 'samples': 11242176, 'steps': 58552, 'loss/train': 1.3892261981964111} -11/07/2021 05:26:38 - INFO - __main__ - Step 58554: {'lr': 0.0003404847493082481, 'samples': 11242368, 'steps': 58553, 'loss/train': 1.0884599685668945} -11/07/2021 05:26:38 - INFO - __main__ - Step 58555: {'lr': 0.000340479802331326, 'samples': 11242560, 'steps': 58554, 'loss/train': 1.1438909769058228} -11/07/2021 05:26:39 - INFO - __main__ - Step 58556: {'lr': 0.0003404748553136351, 'samples': 11242752, 'steps': 58555, 'loss/train': 1.5107654333114624} -11/07/2021 05:26:40 - INFO - __main__ - Step 58557: {'lr': 0.00034046990825517765, 'samples': 11242944, 'steps': 58556, 'loss/train': 1.5175063610076904} -11/07/2021 05:26:40 - INFO - __main__ - Step 58558: {'lr': 0.0003404649611559559, 'samples': 11243136, 'steps': 58557, 'loss/train': 1.0964844226837158} -11/07/2021 05:26:41 - INFO - __main__ - Step 58559: {'lr': 0.0003404600140159719, 'samples': 11243328, 'steps': 58558, 'loss/train': 1.0572022199630737} -11/07/2021 05:26:41 - INFO - __main__ - Step 58560: {'lr': 0.0003404550668352282, 'samples': 11243520, 'steps': 58559, 'loss/train': 1.190142035484314} -11/07/2021 05:26:41 - INFO - __main__ - Step 58561: {'lr': 0.00034045011961372676, 'samples': 11243712, 'steps': 58560, 'loss/train': 1.0817368030548096} -11/07/2021 05:26:42 - INFO - __main__ - Step 58562: {'lr': 0.0003404451723514699, 'samples': 11243904, 'steps': 58561, 'loss/train': 1.7233643531799316} -11/07/2021 05:26:43 - INFO - __main__ - Step 58563: {'lr': 0.00034044022504845986, 'samples': 11244096, 'steps': 58562, 'loss/train': 1.3554329872131348} -11/07/2021 05:26:43 - INFO - __main__ - Step 58564: {'lr': 0.00034043527770469874, 'samples': 11244288, 'steps': 58563, 'loss/train': 1.447244644165039} -11/07/2021 05:26:43 - INFO - __main__ - Step 58565: {'lr': 0.00034043033032018897, 'samples': 11244480, 'steps': 58564, 'loss/train': 1.2000093460083008} -11/07/2021 05:26:44 - INFO - __main__ - Step 58566: {'lr': 0.00034042538289493266, 'samples': 11244672, 'steps': 58565, 'loss/train': 1.7884174585342407} -11/07/2021 05:26:45 - INFO - __main__ - Step 58567: {'lr': 0.00034042043542893214, 'samples': 11244864, 'steps': 58566, 'loss/train': 0.39903920888900757} -11/07/2021 05:26:45 - INFO - __main__ - Step 58568: {'lr': 0.0003404154879221895, 'samples': 11245056, 'steps': 58567, 'loss/train': 0.9793217778205872} -11/07/2021 05:26:46 - INFO - __main__ - Step 58569: {'lr': 0.00034041054037470703, 'samples': 11245248, 'steps': 58568, 'loss/train': 1.5822800397872925} -11/07/2021 05:26:46 - INFO - __main__ - Step 58570: {'lr': 0.00034040559278648695, 'samples': 11245440, 'steps': 58569, 'loss/train': 2.0370893478393555} -11/07/2021 05:26:46 - INFO - __main__ - Step 58571: {'lr': 0.00034040064515753154, 'samples': 11245632, 'steps': 58570, 'loss/train': 1.6098743677139282} -11/07/2021 05:26:47 - INFO - __main__ - Step 58572: {'lr': 0.000340395697487843, 'samples': 11245824, 'steps': 58571, 'loss/train': 1.3138717412948608} -11/07/2021 05:26:48 - INFO - __main__ - Step 58573: {'lr': 0.00034039074977742356, 'samples': 11246016, 'steps': 58572, 'loss/train': 0.9125752449035645} -11/07/2021 05:26:48 - INFO - __main__ - Step 58574: {'lr': 0.00034038580202627543, 'samples': 11246208, 'steps': 58573, 'loss/train': 1.0024455785751343} -11/07/2021 05:26:49 - INFO - __main__ - Step 58575: {'lr': 0.0003403808542344009, 'samples': 11246400, 'steps': 58574, 'loss/train': 1.3768975734710693} -11/07/2021 05:26:49 - INFO - __main__ - Step 58576: {'lr': 0.00034037590640180205, 'samples': 11246592, 'steps': 58575, 'loss/train': 1.6127654314041138} -11/07/2021 05:26:49 - INFO - __main__ - Step 58577: {'lr': 0.00034037095852848125, 'samples': 11246784, 'steps': 58576, 'loss/train': 0.5709400177001953} -11/07/2021 05:26:51 - INFO - __main__ - Step 58578: {'lr': 0.00034036601061444074, 'samples': 11246976, 'steps': 58577, 'loss/train': 1.6432132720947266} -11/07/2021 05:26:51 - INFO - __main__ - Step 58579: {'lr': 0.00034036106265968263, 'samples': 11247168, 'steps': 58578, 'loss/train': 1.5485974550247192} -11/07/2021 05:26:51 - INFO - __main__ - Step 58580: {'lr': 0.00034035611466420927, 'samples': 11247360, 'steps': 58579, 'loss/train': 2.261461019515991} -11/07/2021 05:26:52 - INFO - __main__ - Step 58581: {'lr': 0.00034035116662802287, 'samples': 11247552, 'steps': 58580, 'loss/train': 1.7287871837615967} -11/07/2021 05:26:52 - INFO - __main__ - Step 58582: {'lr': 0.0003403462185511256, 'samples': 11247744, 'steps': 58581, 'loss/train': 1.6491888761520386} -11/07/2021 05:26:53 - INFO - __main__ - Step 58583: {'lr': 0.0003403412704335196, 'samples': 11247936, 'steps': 58582, 'loss/train': 2.915558338165283} -11/07/2021 05:26:54 - INFO - __main__ - Step 58584: {'lr': 0.0003403363222752074, 'samples': 11248128, 'steps': 58583, 'loss/train': 1.3191951513290405} -11/07/2021 05:26:54 - INFO - __main__ - Step 58585: {'lr': 0.0003403313740761909, 'samples': 11248320, 'steps': 58584, 'loss/train': 1.1483147144317627} -11/07/2021 05:26:54 - INFO - __main__ - Step 58586: {'lr': 0.00034032642583647254, 'samples': 11248512, 'steps': 58585, 'loss/train': 0.8842759132385254} -11/07/2021 05:26:55 - INFO - __main__ - Step 58587: {'lr': 0.0003403214775560545, 'samples': 11248704, 'steps': 58586, 'loss/train': 1.4254627227783203} -11/07/2021 05:26:56 - INFO - __main__ - Step 58588: {'lr': 0.000340316529234939, 'samples': 11248896, 'steps': 58587, 'loss/train': 1.6152998208999634} -11/07/2021 05:26:56 - INFO - __main__ - Step 58589: {'lr': 0.00034031158087312823, 'samples': 11249088, 'steps': 58588, 'loss/train': 1.426893949508667} -11/07/2021 05:26:56 - INFO - __main__ - Step 58590: {'lr': 0.0003403066324706245, 'samples': 11249280, 'steps': 58589, 'loss/train': 1.4237428903579712} -11/07/2021 05:26:57 - INFO - __main__ - Step 58591: {'lr': 0.00034030168402742996, 'samples': 11249472, 'steps': 58590, 'loss/train': 1.5858216285705566} -11/07/2021 05:26:57 - INFO - __main__ - Step 58592: {'lr': 0.0003402967355435469, 'samples': 11249664, 'steps': 58591, 'loss/train': 2.0844335556030273} -11/07/2021 05:26:58 - INFO - __main__ - Step 58593: {'lr': 0.00034029178701897744, 'samples': 11249856, 'steps': 58592, 'loss/train': 1.3354320526123047} -11/07/2021 05:26:58 - INFO - __main__ - Step 58594: {'lr': 0.00034028683845372407, 'samples': 11250048, 'steps': 58593, 'loss/train': 1.568726897239685} -11/07/2021 05:26:59 - INFO - __main__ - Step 58595: {'lr': 0.00034028188984778867, 'samples': 11250240, 'steps': 58594, 'loss/train': 1.2948017120361328} -11/07/2021 05:26:59 - INFO - __main__ - Step 58596: {'lr': 0.0003402769412011737, 'samples': 11250432, 'steps': 58595, 'loss/train': 1.8752646446228027} -11/07/2021 05:26:59 - INFO - __main__ - Step 58597: {'lr': 0.00034027199251388137, 'samples': 11250624, 'steps': 58596, 'loss/train': 1.518560528755188} -11/07/2021 05:27:00 - INFO - __main__ - Step 58598: {'lr': 0.0003402670437859138, 'samples': 11250816, 'steps': 58597, 'loss/train': 1.5436047315597534} -11/07/2021 05:27:01 - INFO - __main__ - Step 58599: {'lr': 0.0003402620950172733, 'samples': 11251008, 'steps': 58598, 'loss/train': 1.5812362432479858} -11/07/2021 05:27:01 - INFO - __main__ - Step 58600: {'lr': 0.00034025714620796225, 'samples': 11251200, 'steps': 58599, 'loss/train': 1.1292755603790283} -11/07/2021 05:27:02 - INFO - __main__ - Step 58601: {'lr': 0.0003402521973579826, 'samples': 11251392, 'steps': 58600, 'loss/train': 1.4832994937896729} -11/07/2021 05:27:02 - INFO - __main__ - Step 58602: {'lr': 0.00034024724846733667, 'samples': 11251584, 'steps': 58601, 'loss/train': 1.6459180116653442} -11/07/2021 05:27:03 - INFO - __main__ - Step 58603: {'lr': 0.0003402422995360268, 'samples': 11251776, 'steps': 58602, 'loss/train': 1.2370795011520386} -11/07/2021 05:27:03 - INFO - __main__ - Step 58604: {'lr': 0.00034023735056405507, 'samples': 11251968, 'steps': 58603, 'loss/train': 1.4220401048660278} -11/07/2021 05:27:04 - INFO - __main__ - Step 58605: {'lr': 0.00034023240155142383, 'samples': 11252160, 'steps': 58604, 'loss/train': 1.5945957899093628} -11/07/2021 05:27:04 - INFO - __main__ - Step 58606: {'lr': 0.00034022745249813523, 'samples': 11252352, 'steps': 58605, 'loss/train': 1.4449801445007324} -11/07/2021 05:27:04 - INFO - __main__ - Step 58607: {'lr': 0.0003402225034041916, 'samples': 11252544, 'steps': 58606, 'loss/train': 1.0904531478881836} -11/07/2021 05:27:05 - INFO - __main__ - Step 58608: {'lr': 0.000340217554269595, 'samples': 11252736, 'steps': 58607, 'loss/train': 1.895560622215271} -11/07/2021 05:27:06 - INFO - __main__ - Step 58609: {'lr': 0.00034021260509434784, 'samples': 11252928, 'steps': 58608, 'loss/train': 1.7363203763961792} -11/07/2021 05:27:06 - INFO - __main__ - Step 58610: {'lr': 0.0003402076558784522, 'samples': 11253120, 'steps': 58609, 'loss/train': 0.9608591198921204} -11/07/2021 05:27:06 - INFO - __main__ - Step 58611: {'lr': 0.00034020270662191046, 'samples': 11253312, 'steps': 58610, 'loss/train': 1.9516892433166504} -11/07/2021 05:27:07 - INFO - __main__ - Step 58612: {'lr': 0.00034019775732472467, 'samples': 11253504, 'steps': 58611, 'loss/train': 1.3757413625717163} -11/07/2021 05:27:07 - INFO - __main__ - Step 58613: {'lr': 0.0003401928079868973, 'samples': 11253696, 'steps': 58612, 'loss/train': 1.1356873512268066} -11/07/2021 05:27:08 - INFO - __main__ - Step 58614: {'lr': 0.0003401878586084304, 'samples': 11253888, 'steps': 58613, 'loss/train': 1.5409858226776123} -11/07/2021 05:27:08 - INFO - __main__ - Step 58615: {'lr': 0.0003401829091893262, 'samples': 11254080, 'steps': 58614, 'loss/train': 1.800312876701355} -11/07/2021 05:27:09 - INFO - __main__ - Step 58616: {'lr': 0.000340177959729587, 'samples': 11254272, 'steps': 58615, 'loss/train': 1.058474063873291} -11/07/2021 05:27:09 - INFO - __main__ - Step 58617: {'lr': 0.000340173010229215, 'samples': 11254464, 'steps': 58616, 'loss/train': 1.5124789476394653} -11/07/2021 05:27:09 - INFO - __main__ - Step 58618: {'lr': 0.0003401680606882124, 'samples': 11254656, 'steps': 58617, 'loss/train': 1.286466360092163} -11/07/2021 05:27:11 - INFO - __main__ - Step 58619: {'lr': 0.0003401631111065815, 'samples': 11254848, 'steps': 58618, 'loss/train': 1.4471435546875} -11/07/2021 05:27:11 - INFO - __main__ - Step 58620: {'lr': 0.0003401581614843244, 'samples': 11255040, 'steps': 58619, 'loss/train': 1.771852731704712} -11/07/2021 05:27:11 - INFO - __main__ - Step 58621: {'lr': 0.00034015321182144357, 'samples': 11255232, 'steps': 58620, 'loss/train': 1.1483772993087769} -11/07/2021 05:27:12 - INFO - __main__ - Step 58622: {'lr': 0.00034014826211794104, 'samples': 11255424, 'steps': 58621, 'loss/train': 1.7596633434295654} -11/07/2021 05:27:12 - INFO - __main__ - Step 58623: {'lr': 0.0003401433123738191, 'samples': 11255616, 'steps': 58622, 'loss/train': 1.252971887588501} -11/07/2021 05:27:12 - INFO - __main__ - Step 58624: {'lr': 0.00034013836258907994, 'samples': 11255808, 'steps': 58623, 'loss/train': 1.7156128883361816} -11/07/2021 05:27:13 - INFO - __main__ - Step 58625: {'lr': 0.0003401334127637258, 'samples': 11256000, 'steps': 58624, 'loss/train': 1.6319975852966309} -11/07/2021 05:27:14 - INFO - __main__ - Step 58626: {'lr': 0.000340128462897759, 'samples': 11256192, 'steps': 58625, 'loss/train': 0.9937305450439453} -11/07/2021 05:27:14 - INFO - __main__ - Step 58627: {'lr': 0.0003401235129911817, 'samples': 11256384, 'steps': 58626, 'loss/train': 1.6375449895858765} -11/07/2021 05:27:14 - INFO - __main__ - Step 58628: {'lr': 0.0003401185630439961, 'samples': 11256576, 'steps': 58627, 'loss/train': 1.6889230012893677} -11/07/2021 05:27:15 - INFO - __main__ - Step 58629: {'lr': 0.0003401136130562045, 'samples': 11256768, 'steps': 58628, 'loss/train': 1.2075716257095337} -11/07/2021 05:27:16 - INFO - __main__ - Step 58630: {'lr': 0.0003401086630278091, 'samples': 11256960, 'steps': 58629, 'loss/train': 1.2659410238265991} -11/07/2021 05:27:16 - INFO - __main__ - Step 58631: {'lr': 0.00034010371295881207, 'samples': 11257152, 'steps': 58630, 'loss/train': 1.9190737009048462} -11/07/2021 05:27:16 - INFO - __main__ - Step 58632: {'lr': 0.00034009876284921576, 'samples': 11257344, 'steps': 58631, 'loss/train': 1.6319178342819214} -11/07/2021 05:27:17 - INFO - __main__ - Step 58633: {'lr': 0.00034009381269902236, 'samples': 11257536, 'steps': 58632, 'loss/train': 1.64049232006073} -11/07/2021 05:27:17 - INFO - __main__ - Step 58634: {'lr': 0.000340088862508234, 'samples': 11257728, 'steps': 58633, 'loss/train': 0.9824512004852295} -11/07/2021 05:27:18 - INFO - __main__ - Step 58635: {'lr': 0.00034008391227685305, 'samples': 11257920, 'steps': 58634, 'loss/train': 1.4872363805770874} -11/07/2021 05:27:18 - INFO - __main__ - Step 58636: {'lr': 0.00034007896200488163, 'samples': 11258112, 'steps': 58635, 'loss/train': 1.282004475593567} -11/07/2021 05:27:19 - INFO - __main__ - Step 58637: {'lr': 0.0003400740116923221, 'samples': 11258304, 'steps': 58636, 'loss/train': 1.1979315280914307} -11/07/2021 05:27:19 - INFO - __main__ - Step 58638: {'lr': 0.00034006906133917655, 'samples': 11258496, 'steps': 58637, 'loss/train': 1.8014849424362183} -11/07/2021 05:27:20 - INFO - __main__ - Step 58639: {'lr': 0.0003400641109454473, 'samples': 11258688, 'steps': 58638, 'loss/train': 1.707274317741394} -11/07/2021 05:27:21 - INFO - __main__ - Step 58640: {'lr': 0.0003400591605111364, 'samples': 11258880, 'steps': 58639, 'loss/train': 1.3305047750473022} -11/07/2021 05:27:21 - INFO - __main__ - Step 58641: {'lr': 0.0003400542100362464, 'samples': 11259072, 'steps': 58640, 'loss/train': 1.6776947975158691} -11/07/2021 05:27:21 - INFO - __main__ - Step 58642: {'lr': 0.0003400492595207793, 'samples': 11259264, 'steps': 58641, 'loss/train': 1.1673380136489868} -11/07/2021 05:27:22 - INFO - __main__ - Step 58643: {'lr': 0.00034004430896473743, 'samples': 11259456, 'steps': 58642, 'loss/train': 1.5140269994735718} -11/07/2021 05:27:22 - INFO - __main__ - Step 58644: {'lr': 0.000340039358368123, 'samples': 11259648, 'steps': 58643, 'loss/train': 1.3781821727752686} -11/07/2021 05:27:22 - INFO - __main__ - Step 58645: {'lr': 0.00034003440773093817, 'samples': 11259840, 'steps': 58644, 'loss/train': 1.7038558721542358} -11/07/2021 05:27:24 - INFO - __main__ - Step 58646: {'lr': 0.0003400294570531852, 'samples': 11260032, 'steps': 58645, 'loss/train': 0.6562949419021606} -11/07/2021 05:27:24 - INFO - __main__ - Step 58647: {'lr': 0.0003400245063348664, 'samples': 11260224, 'steps': 58646, 'loss/train': 1.6678837537765503} -11/07/2021 05:27:24 - INFO - __main__ - Step 58648: {'lr': 0.000340019555575984, 'samples': 11260416, 'steps': 58647, 'loss/train': 1.872270941734314} -11/07/2021 05:27:25 - INFO - __main__ - Step 58649: {'lr': 0.00034001460477654013, 'samples': 11260608, 'steps': 58648, 'loss/train': 1.8131369352340698} -11/07/2021 05:27:25 - INFO - __main__ - Step 58650: {'lr': 0.00034000965393653703, 'samples': 11260800, 'steps': 58649, 'loss/train': 1.475797414779663} -11/07/2021 05:27:26 - INFO - __main__ - Step 58651: {'lr': 0.00034000470305597697, 'samples': 11260992, 'steps': 58650, 'loss/train': 1.2250440120697021} -11/07/2021 05:27:26 - INFO - __main__ - Step 58652: {'lr': 0.0003399997521348622, 'samples': 11261184, 'steps': 58651, 'loss/train': 1.5154170989990234} -11/07/2021 05:27:27 - INFO - __main__ - Step 58653: {'lr': 0.00033999480117319494, 'samples': 11261376, 'steps': 58652, 'loss/train': 1.315185308456421} -11/07/2021 05:27:27 - INFO - __main__ - Step 58654: {'lr': 0.0003399898501709774, 'samples': 11261568, 'steps': 58653, 'loss/train': 1.6343590021133423} -11/07/2021 05:27:27 - INFO - __main__ - Step 58655: {'lr': 0.00033998489912821187, 'samples': 11261760, 'steps': 58654, 'loss/train': 0.7975795865058899} -11/07/2021 05:27:28 - INFO - __main__ - Step 58656: {'lr': 0.00033997994804490047, 'samples': 11261952, 'steps': 58655, 'loss/train': 1.5882381200790405} -11/07/2021 05:27:29 - INFO - __main__ - Step 58657: {'lr': 0.0003399749969210455, 'samples': 11262144, 'steps': 58656, 'loss/train': 1.467847466468811} -11/07/2021 05:27:29 - INFO - __main__ - Step 58658: {'lr': 0.0003399700457566492, 'samples': 11262336, 'steps': 58657, 'loss/train': 1.6790921688079834} -11/07/2021 05:27:30 - INFO - __main__ - Step 58659: {'lr': 0.00033996509455171375, 'samples': 11262528, 'steps': 58658, 'loss/train': 1.463994026184082} -11/07/2021 05:27:30 - INFO - __main__ - Step 58660: {'lr': 0.0003399601433062415, 'samples': 11262720, 'steps': 58659, 'loss/train': 1.6266387701034546} -11/07/2021 05:27:30 - INFO - __main__ - Step 58661: {'lr': 0.00033995519202023453, 'samples': 11262912, 'steps': 58660, 'loss/train': 1.5797277688980103} -11/07/2021 05:27:31 - INFO - __main__ - Step 58662: {'lr': 0.00033995024069369517, 'samples': 11263104, 'steps': 58661, 'loss/train': 1.788406491279602} -11/07/2021 05:27:32 - INFO - __main__ - Step 58663: {'lr': 0.0003399452893266256, 'samples': 11263296, 'steps': 58662, 'loss/train': 1.2432971000671387} -11/07/2021 05:27:32 - INFO - __main__ - Step 58664: {'lr': 0.000339940337919028, 'samples': 11263488, 'steps': 58663, 'loss/train': 1.4610928297042847} -11/07/2021 05:27:32 - INFO - __main__ - Step 58665: {'lr': 0.0003399353864709048, 'samples': 11263680, 'steps': 58664, 'loss/train': 1.2338680028915405} -11/07/2021 05:27:33 - INFO - __main__ - Step 58666: {'lr': 0.000339930434982258, 'samples': 11263872, 'steps': 58665, 'loss/train': 1.294327735900879} -11/07/2021 05:27:34 - INFO - __main__ - Step 58667: {'lr': 0.00033992548345309, 'samples': 11264064, 'steps': 58666, 'loss/train': 1.6519348621368408} -11/07/2021 05:27:34 - INFO - __main__ - Step 58668: {'lr': 0.000339920531883403, 'samples': 11264256, 'steps': 58667, 'loss/train': 1.3834352493286133} -11/07/2021 05:27:34 - INFO - __main__ - Step 58669: {'lr': 0.0003399155802731991, 'samples': 11264448, 'steps': 58668, 'loss/train': 1.2895777225494385} -11/07/2021 05:27:35 - INFO - __main__ - Step 58670: {'lr': 0.0003399106286224807, 'samples': 11264640, 'steps': 58669, 'loss/train': 1.0402488708496094} -11/07/2021 05:27:35 - INFO - __main__ - Step 58671: {'lr': 0.0003399056769312499, 'samples': 11264832, 'steps': 58670, 'loss/train': 1.2308584451675415} -11/07/2021 05:27:36 - INFO - __main__ - Step 58672: {'lr': 0.000339900725199509, 'samples': 11265024, 'steps': 58671, 'loss/train': 1.3313902616500854} -11/07/2021 05:27:37 - INFO - __main__ - Step 58673: {'lr': 0.0003398957734272602, 'samples': 11265216, 'steps': 58672, 'loss/train': 1.8147152662277222} -11/07/2021 05:27:37 - INFO - __main__ - Step 58674: {'lr': 0.00033989082161450584, 'samples': 11265408, 'steps': 58673, 'loss/train': 1.1897612810134888} -11/07/2021 05:27:37 - INFO - __main__ - Step 58675: {'lr': 0.000339885869761248, 'samples': 11265600, 'steps': 58674, 'loss/train': 3.0839974880218506} -11/07/2021 05:27:38 - INFO - __main__ - Step 58676: {'lr': 0.000339880917867489, 'samples': 11265792, 'steps': 58675, 'loss/train': 1.751492977142334} -11/07/2021 05:27:39 - INFO - __main__ - Step 58677: {'lr': 0.00033987596593323103, 'samples': 11265984, 'steps': 58676, 'loss/train': 1.605707049369812} -11/07/2021 05:27:39 - INFO - __main__ - Step 58678: {'lr': 0.00033987101395847636, 'samples': 11266176, 'steps': 58677, 'loss/train': 1.7508043050765991} -11/07/2021 05:27:40 - INFO - __main__ - Step 58679: {'lr': 0.00033986606194322716, 'samples': 11266368, 'steps': 58678, 'loss/train': 1.5047215223312378} -11/07/2021 05:27:40 - INFO - __main__ - Step 58680: {'lr': 0.00033986110988748567, 'samples': 11266560, 'steps': 58679, 'loss/train': 1.4525678157806396} -11/07/2021 05:27:40 - INFO - __main__ - Step 58681: {'lr': 0.00033985615779125427, 'samples': 11266752, 'steps': 58680, 'loss/train': 1.2383021116256714} -11/07/2021 05:27:41 - INFO - __main__ - Step 58682: {'lr': 0.00033985120565453497, 'samples': 11266944, 'steps': 58681, 'loss/train': 1.4485909938812256} -11/07/2021 05:27:42 - INFO - __main__ - Step 58683: {'lr': 0.00033984625347733015, 'samples': 11267136, 'steps': 58682, 'loss/train': 1.7783548831939697} -11/07/2021 05:27:42 - INFO - __main__ - Step 58684: {'lr': 0.000339841301259642, 'samples': 11267328, 'steps': 58683, 'loss/train': 1.653826117515564} -11/07/2021 05:27:42 - INFO - __main__ - Step 58685: {'lr': 0.0003398363490014727, 'samples': 11267520, 'steps': 58684, 'loss/train': 1.6136869192123413} -11/07/2021 05:27:43 - INFO - __main__ - Step 58686: {'lr': 0.0003398313967028245, 'samples': 11267712, 'steps': 58685, 'loss/train': 1.4425431489944458} -11/07/2021 05:27:43 - INFO - __main__ - Step 58687: {'lr': 0.00033982644436369975, 'samples': 11267904, 'steps': 58686, 'loss/train': 1.4149539470672607} -11/07/2021 05:27:44 - INFO - __main__ - Step 58688: {'lr': 0.00033982149198410057, 'samples': 11268096, 'steps': 58687, 'loss/train': 1.8159171342849731} -11/07/2021 05:27:44 - INFO - __main__ - Step 58689: {'lr': 0.0003398165395640292, 'samples': 11268288, 'steps': 58688, 'loss/train': 1.5644479990005493} -11/07/2021 05:27:45 - INFO - __main__ - Step 58690: {'lr': 0.00033981158710348787, 'samples': 11268480, 'steps': 58689, 'loss/train': 1.5640636682510376} -11/07/2021 05:27:45 - INFO - __main__ - Step 58691: {'lr': 0.0003398066346024788, 'samples': 11268672, 'steps': 58690, 'loss/train': 1.2179890871047974} -11/07/2021 05:27:45 - INFO - __main__ - Step 58692: {'lr': 0.0003398016820610043, 'samples': 11268864, 'steps': 58691, 'loss/train': 1.3885226249694824} -11/07/2021 05:27:46 - INFO - __main__ - Step 58693: {'lr': 0.00033979672947906646, 'samples': 11269056, 'steps': 58692, 'loss/train': 1.5098356008529663} -11/07/2021 05:27:47 - INFO - __main__ - Step 58694: {'lr': 0.0003397917768566677, 'samples': 11269248, 'steps': 58693, 'loss/train': 1.6539536714553833} -11/07/2021 05:27:47 - INFO - __main__ - Step 58695: {'lr': 0.0003397868241938101, 'samples': 11269440, 'steps': 58694, 'loss/train': 1.2934186458587646} -11/07/2021 05:27:47 - INFO - __main__ - Step 58696: {'lr': 0.00033978187149049597, 'samples': 11269632, 'steps': 58695, 'loss/train': 1.6360303163528442} -11/07/2021 05:27:48 - INFO - __main__ - Step 58697: {'lr': 0.0003397769187467275, 'samples': 11269824, 'steps': 58696, 'loss/train': 1.910764455795288} -11/07/2021 05:27:49 - INFO - __main__ - Step 58698: {'lr': 0.0003397719659625069, 'samples': 11270016, 'steps': 58697, 'loss/train': 1.394666314125061} -11/07/2021 05:27:49 - INFO - __main__ - Step 58699: {'lr': 0.0003397670131378365, 'samples': 11270208, 'steps': 58698, 'loss/train': 1.1060389280319214} -11/07/2021 05:27:50 - INFO - __main__ - Step 58700: {'lr': 0.0003397620602727184, 'samples': 11270400, 'steps': 58699, 'loss/train': 1.065557837486267} -11/07/2021 05:27:50 - INFO - __main__ - Step 58701: {'lr': 0.00033975710736715504, 'samples': 11270592, 'steps': 58700, 'loss/train': 2.4465560913085938} -11/07/2021 05:27:50 - INFO - __main__ - Step 58702: {'lr': 0.00033975215442114836, 'samples': 11270784, 'steps': 58701, 'loss/train': 1.1995782852172852} -11/07/2021 05:27:51 - INFO - __main__ - Step 58703: {'lr': 0.00033974720143470084, 'samples': 11270976, 'steps': 58702, 'loss/train': 1.7081576585769653} -11/07/2021 05:27:52 - INFO - __main__ - Step 58704: {'lr': 0.00033974224840781453, 'samples': 11271168, 'steps': 58703, 'loss/train': 1.3235079050064087} -11/07/2021 05:27:52 - INFO - __main__ - Step 58705: {'lr': 0.0003397372953404918, 'samples': 11271360, 'steps': 58704, 'loss/train': 1.443793535232544} -11/07/2021 05:27:52 - INFO - __main__ - Step 58706: {'lr': 0.0003397323422327348, 'samples': 11271552, 'steps': 58705, 'loss/train': 0.9678148031234741} -11/07/2021 05:27:53 - INFO - __main__ - Step 58707: {'lr': 0.0003397273890845458, 'samples': 11271744, 'steps': 58706, 'loss/train': 1.5049041509628296} -11/07/2021 05:27:54 - INFO - __main__ - Step 58708: {'lr': 0.0003397224358959271, 'samples': 11271936, 'steps': 58707, 'loss/train': 1.630176305770874} -11/07/2021 05:27:54 - INFO - __main__ - Step 58709: {'lr': 0.0003397174826668808, 'samples': 11272128, 'steps': 58708, 'loss/train': 1.4808259010314941} -11/07/2021 05:27:54 - INFO - __main__ - Step 58710: {'lr': 0.00033971252939740915, 'samples': 11272320, 'steps': 58709, 'loss/train': 1.1939408779144287} -11/07/2021 05:27:55 - INFO - __main__ - Step 58711: {'lr': 0.00033970757608751446, 'samples': 11272512, 'steps': 58710, 'loss/train': 1.1783385276794434} -11/07/2021 05:27:55 - INFO - __main__ - Step 58712: {'lr': 0.0003397026227371989, 'samples': 11272704, 'steps': 58711, 'loss/train': 1.3982597589492798} -11/07/2021 05:27:56 - INFO - __main__ - Step 58713: {'lr': 0.0003396976693464647, 'samples': 11272896, 'steps': 58712, 'loss/train': 1.225518822669983} -11/07/2021 05:27:57 - INFO - __main__ - Step 58714: {'lr': 0.0003396927159153141, 'samples': 11273088, 'steps': 58713, 'loss/train': 2.111703872680664} -11/07/2021 05:27:57 - INFO - __main__ - Step 58715: {'lr': 0.0003396877624437495, 'samples': 11273280, 'steps': 58714, 'loss/train': 1.869307041168213} -11/07/2021 05:27:57 - INFO - __main__ - Step 58716: {'lr': 0.0003396828089317728, 'samples': 11273472, 'steps': 58715, 'loss/train': 1.187577247619629} -11/07/2021 05:27:58 - INFO - __main__ - Step 58717: {'lr': 0.0003396778553793865, 'samples': 11273664, 'steps': 58716, 'loss/train': 1.9779194593429565} -11/07/2021 05:27:58 - INFO - __main__ - Step 58718: {'lr': 0.00033967290178659273, 'samples': 11273856, 'steps': 58717, 'loss/train': 1.1186343431472778} -11/07/2021 05:27:59 - INFO - __main__ - Step 58719: {'lr': 0.0003396679481533937, 'samples': 11274048, 'steps': 58718, 'loss/train': 1.6696780920028687} -11/07/2021 05:27:59 - INFO - __main__ - Step 58720: {'lr': 0.0003396629944797917, 'samples': 11274240, 'steps': 58719, 'loss/train': 1.3711998462677002} -11/07/2021 05:28:00 - INFO - __main__ - Step 58721: {'lr': 0.0003396580407657889, 'samples': 11274432, 'steps': 58720, 'loss/train': 1.3863716125488281} -11/07/2021 05:28:00 - INFO - __main__ - Step 58722: {'lr': 0.0003396530870113877, 'samples': 11274624, 'steps': 58721, 'loss/train': 1.036597490310669} -11/07/2021 05:28:00 - INFO - __main__ - Step 58723: {'lr': 0.0003396481332165901, 'samples': 11274816, 'steps': 58722, 'loss/train': 1.3757930994033813} -11/07/2021 05:28:01 - INFO - __main__ - Step 58724: {'lr': 0.00033964317938139845, 'samples': 11275008, 'steps': 58723, 'loss/train': 1.1915156841278076} -11/07/2021 05:28:02 - INFO - __main__ - Step 58725: {'lr': 0.00033963822550581494, 'samples': 11275200, 'steps': 58724, 'loss/train': 1.6021989583969116} -11/07/2021 05:28:02 - INFO - __main__ - Step 58726: {'lr': 0.0003396332715898418, 'samples': 11275392, 'steps': 58725, 'loss/train': 1.5126571655273438} -11/07/2021 05:28:02 - INFO - __main__ - Step 58727: {'lr': 0.00033962831763348133, 'samples': 11275584, 'steps': 58726, 'loss/train': 1.6027170419692993} -11/07/2021 05:28:03 - INFO - __main__ - Step 58728: {'lr': 0.00033962336363673585, 'samples': 11275776, 'steps': 58727, 'loss/train': 1.2824872732162476} -11/07/2021 05:28:04 - INFO - __main__ - Step 58729: {'lr': 0.00033961840959960735, 'samples': 11275968, 'steps': 58728, 'loss/train': 1.62641441822052} -11/07/2021 05:28:04 - INFO - __main__ - Step 58730: {'lr': 0.0003396134555220982, 'samples': 11276160, 'steps': 58729, 'loss/train': 1.0455607175827026} -11/07/2021 05:28:05 - INFO - __main__ - Step 58731: {'lr': 0.0003396085014042105, 'samples': 11276352, 'steps': 58730, 'loss/train': 2.2827987670898438} -11/07/2021 05:28:05 - INFO - __main__ - Step 58732: {'lr': 0.00033960354724594665, 'samples': 11276544, 'steps': 58731, 'loss/train': 1.1796807050704956} -11/07/2021 05:28:05 - INFO - __main__ - Step 58733: {'lr': 0.0003395985930473089, 'samples': 11276736, 'steps': 58732, 'loss/train': 1.3315881490707397} -11/07/2021 05:28:06 - INFO - __main__ - Step 58734: {'lr': 0.00033959363880829935, 'samples': 11276928, 'steps': 58733, 'loss/train': 0.8745399713516235} -11/07/2021 05:28:07 - INFO - __main__ - Step 58735: {'lr': 0.00033958868452892035, 'samples': 11277120, 'steps': 58734, 'loss/train': 1.1936465501785278} -11/07/2021 05:28:07 - INFO - __main__ - Step 58736: {'lr': 0.000339583730209174, 'samples': 11277312, 'steps': 58735, 'loss/train': 1.7472937107086182} -11/07/2021 05:28:07 - INFO - __main__ - Step 58737: {'lr': 0.0003395787758490626, 'samples': 11277504, 'steps': 58736, 'loss/train': 1.8023500442504883} -11/07/2021 05:28:08 - INFO - __main__ - Step 58738: {'lr': 0.0003395738214485884, 'samples': 11277696, 'steps': 58737, 'loss/train': 1.734580397605896} -11/07/2021 05:28:08 - INFO - __main__ - Step 58739: {'lr': 0.0003395688670077536, 'samples': 11277888, 'steps': 58738, 'loss/train': 1.074816107749939} -11/07/2021 05:28:09 - INFO - __main__ - Step 58740: {'lr': 0.0003395639125265605, 'samples': 11278080, 'steps': 58739, 'loss/train': 1.2014753818511963} -11/07/2021 05:28:10 - INFO - __main__ - Step 58741: {'lr': 0.00033955895800501126, 'samples': 11278272, 'steps': 58740, 'loss/train': 1.6427022218704224} -11/07/2021 05:28:10 - INFO - __main__ - Step 58742: {'lr': 0.0003395540034431082, 'samples': 11278464, 'steps': 58741, 'loss/train': 1.4095505475997925} -11/07/2021 05:28:10 - INFO - __main__ - Step 58743: {'lr': 0.0003395490488408534, 'samples': 11278656, 'steps': 58742, 'loss/train': 1.2669202089309692} -11/07/2021 05:28:11 - INFO - __main__ - Step 58744: {'lr': 0.00033954409419824924, 'samples': 11278848, 'steps': 58743, 'loss/train': 1.5797938108444214} -11/07/2021 05:28:12 - INFO - __main__ - Step 58745: {'lr': 0.0003395391395152978, 'samples': 11279040, 'steps': 58744, 'loss/train': 1.3473795652389526} -11/07/2021 05:28:12 - INFO - __main__ - Step 58746: {'lr': 0.0003395341847920015, 'samples': 11279232, 'steps': 58745, 'loss/train': 1.8958699703216553} -11/07/2021 05:28:12 - INFO - __main__ - Step 58747: {'lr': 0.00033952923002836244, 'samples': 11279424, 'steps': 58746, 'loss/train': 1.3172633647918701} -11/07/2021 05:28:13 - INFO - __main__ - Step 58748: {'lr': 0.0003395242752243829, 'samples': 11279616, 'steps': 58747, 'loss/train': 1.4201595783233643} -11/07/2021 05:28:13 - INFO - __main__ - Step 58749: {'lr': 0.00033951932038006513, 'samples': 11279808, 'steps': 58748, 'loss/train': 1.725259780883789} -11/07/2021 05:28:14 - INFO - __main__ - Step 58750: {'lr': 0.00033951436549541124, 'samples': 11280000, 'steps': 58749, 'loss/train': 1.2477748394012451} -11/07/2021 05:28:15 - INFO - __main__ - Step 58751: {'lr': 0.0003395094105704236, 'samples': 11280192, 'steps': 58750, 'loss/train': 2.0528318881988525} -11/07/2021 05:28:15 - INFO - __main__ - Step 58752: {'lr': 0.00033950445560510445, 'samples': 11280384, 'steps': 58751, 'loss/train': 1.4452126026153564} -11/07/2021 05:28:15 - INFO - __main__ - Step 58753: {'lr': 0.00033949950059945593, 'samples': 11280576, 'steps': 58752, 'loss/train': 1.1500120162963867} -11/07/2021 05:28:16 - INFO - __main__ - Step 58754: {'lr': 0.00033949454555348035, 'samples': 11280768, 'steps': 58753, 'loss/train': 1.5976330041885376} -11/07/2021 05:28:17 - INFO - __main__ - Step 58755: {'lr': 0.0003394895904671799, 'samples': 11280960, 'steps': 58754, 'loss/train': 1.6130250692367554} -11/07/2021 05:28:17 - INFO - __main__ - Step 58756: {'lr': 0.00033948463534055683, 'samples': 11281152, 'steps': 58755, 'loss/train': 1.5885192155838013} -11/07/2021 05:28:17 - INFO - __main__ - Step 58757: {'lr': 0.0003394796801736133, 'samples': 11281344, 'steps': 58756, 'loss/train': 4.94766902923584} -11/07/2021 05:28:18 - INFO - __main__ - Step 58758: {'lr': 0.0003394747249663517, 'samples': 11281536, 'steps': 58757, 'loss/train': 1.3459274768829346} -11/07/2021 05:28:18 - INFO - __main__ - Step 58759: {'lr': 0.0003394697697187741, 'samples': 11281728, 'steps': 58758, 'loss/train': 1.4971816539764404} -11/07/2021 05:28:19 - INFO - __main__ - Step 58760: {'lr': 0.00033946481443088286, 'samples': 11281920, 'steps': 58759, 'loss/train': 1.644182801246643} -11/07/2021 05:28:19 - INFO - __main__ - Step 58761: {'lr': 0.00033945985910268007, 'samples': 11282112, 'steps': 58760, 'loss/train': 1.4899896383285522} -11/07/2021 05:28:20 - INFO - __main__ - Step 58762: {'lr': 0.0003394549037341681, 'samples': 11282304, 'steps': 58761, 'loss/train': 1.335142970085144} -11/07/2021 05:28:20 - INFO - __main__ - Step 58763: {'lr': 0.00033944994832534915, 'samples': 11282496, 'steps': 58762, 'loss/train': 0.785372257232666} -11/07/2021 05:28:21 - INFO - __main__ - Step 58764: {'lr': 0.0003394449928762254, 'samples': 11282688, 'steps': 58763, 'loss/train': 1.4672189950942993} -11/07/2021 05:28:21 - INFO - __main__ - Step 58765: {'lr': 0.0003394400373867991, 'samples': 11282880, 'steps': 58764, 'loss/train': 1.681606411933899} -11/07/2021 05:28:22 - INFO - __main__ - Step 58766: {'lr': 0.00033943508185707257, 'samples': 11283072, 'steps': 58765, 'loss/train': 0.9648610949516296} -11/07/2021 05:28:22 - INFO - __main__ - Step 58767: {'lr': 0.0003394301262870479, 'samples': 11283264, 'steps': 58766, 'loss/train': 1.4518312215805054} -11/07/2021 05:28:23 - INFO - __main__ - Step 58768: {'lr': 0.00033942517067672744, 'samples': 11283456, 'steps': 58767, 'loss/train': 1.7672967910766602} -11/07/2021 05:28:23 - INFO - __main__ - Step 58769: {'lr': 0.00033942021502611334, 'samples': 11283648, 'steps': 58768, 'loss/train': 1.2715245485305786} -11/07/2021 05:28:23 - INFO - __main__ - Step 58770: {'lr': 0.0003394152593352079, 'samples': 11283840, 'steps': 58769, 'loss/train': 1.7486598491668701} -11/07/2021 05:28:25 - INFO - __main__ - Step 58771: {'lr': 0.0003394103036040133, 'samples': 11284032, 'steps': 58770, 'loss/train': 1.5962742567062378} -11/07/2021 05:28:25 - INFO - __main__ - Step 58772: {'lr': 0.00033940534783253185, 'samples': 11284224, 'steps': 58771, 'loss/train': 1.1509003639221191} -11/07/2021 05:28:25 - INFO - __main__ - Step 58773: {'lr': 0.00033940039202076574, 'samples': 11284416, 'steps': 58772, 'loss/train': 1.5305585861206055} -11/07/2021 05:28:26 - INFO - __main__ - Step 58774: {'lr': 0.0003393954361687172, 'samples': 11284608, 'steps': 58773, 'loss/train': 1.8478020429611206} -11/07/2021 05:28:26 - INFO - __main__ - Step 58775: {'lr': 0.0003393904802763883, 'samples': 11284800, 'steps': 58774, 'loss/train': 1.253279685974121} -11/07/2021 05:28:27 - INFO - __main__ - Step 58776: {'lr': 0.00033938552434378155, 'samples': 11284992, 'steps': 58775, 'loss/train': 1.685002088546753} -11/07/2021 05:28:27 - INFO - __main__ - Step 58777: {'lr': 0.00033938056837089903, 'samples': 11285184, 'steps': 58776, 'loss/train': 0.8082150816917419} -11/07/2021 05:28:28 - INFO - __main__ - Step 58778: {'lr': 0.00033937561235774307, 'samples': 11285376, 'steps': 58777, 'loss/train': 1.5093408823013306} -11/07/2021 05:28:28 - INFO - __main__ - Step 58779: {'lr': 0.00033937065630431577, 'samples': 11285568, 'steps': 58778, 'loss/train': 1.5160646438598633} -11/07/2021 05:28:28 - INFO - __main__ - Step 58780: {'lr': 0.00033936570021061947, 'samples': 11285760, 'steps': 58779, 'loss/train': 1.2714723348617554} -11/07/2021 05:28:29 - INFO - __main__ - Step 58781: {'lr': 0.0003393607440766563, 'samples': 11285952, 'steps': 58780, 'loss/train': 1.4022120237350464} -11/07/2021 05:28:30 - INFO - __main__ - Step 58782: {'lr': 0.0003393557879024286, 'samples': 11286144, 'steps': 58781, 'loss/train': 1.0381698608398438} -11/07/2021 05:28:30 - INFO - __main__ - Step 58783: {'lr': 0.00033935083168793855, 'samples': 11286336, 'steps': 58782, 'loss/train': 1.210511326789856} -11/07/2021 05:28:30 - INFO - __main__ - Step 58784: {'lr': 0.00033934587543318846, 'samples': 11286528, 'steps': 58783, 'loss/train': 1.061765432357788} -11/07/2021 05:28:31 - INFO - __main__ - Step 58785: {'lr': 0.00033934091913818043, 'samples': 11286720, 'steps': 58784, 'loss/train': 1.9269541501998901} -11/07/2021 05:28:32 - INFO - __main__ - Step 58786: {'lr': 0.0003393359628029168, 'samples': 11286912, 'steps': 58785, 'loss/train': 1.7752442359924316} -11/07/2021 05:28:32 - INFO - __main__ - Step 58787: {'lr': 0.0003393310064273997, 'samples': 11287104, 'steps': 58786, 'loss/train': 1.9661850929260254} -11/07/2021 05:28:32 - INFO - __main__ - Step 58788: {'lr': 0.0003393260500116315, 'samples': 11287296, 'steps': 58787, 'loss/train': 1.5297590494155884} -11/07/2021 05:28:33 - INFO - __main__ - Step 58789: {'lr': 0.0003393210935556143, 'samples': 11287488, 'steps': 58788, 'loss/train': 1.4794427156448364} -11/07/2021 05:28:33 - INFO - __main__ - Step 58790: {'lr': 0.00033931613705935046, 'samples': 11287680, 'steps': 58789, 'loss/train': 1.4250047206878662} -11/07/2021 05:28:34 - INFO - __main__ - Step 58791: {'lr': 0.000339311180522842, 'samples': 11287872, 'steps': 58790, 'loss/train': 1.4402660131454468} -11/07/2021 05:28:34 - INFO - __main__ - Step 58792: {'lr': 0.00033930622394609143, 'samples': 11288064, 'steps': 58791, 'loss/train': 1.288271188735962} -11/07/2021 05:28:35 - INFO - __main__ - Step 58793: {'lr': 0.00033930126732910083, 'samples': 11288256, 'steps': 58792, 'loss/train': 1.3805677890777588} -11/07/2021 05:28:35 - INFO - __main__ - Step 58794: {'lr': 0.0003392963106718725, 'samples': 11288448, 'steps': 58793, 'loss/train': 1.5357708930969238} -11/07/2021 05:28:35 - INFO - __main__ - Step 58795: {'lr': 0.00033929135397440857, 'samples': 11288640, 'steps': 58794, 'loss/train': 0.8117380142211914} -11/07/2021 05:28:36 - INFO - __main__ - Step 58796: {'lr': 0.0003392863972367114, 'samples': 11288832, 'steps': 58795, 'loss/train': 1.312749981880188} -11/07/2021 05:28:37 - INFO - __main__ - Step 58797: {'lr': 0.0003392814404587831, 'samples': 11289024, 'steps': 58796, 'loss/train': 1.5030581951141357} -11/07/2021 05:28:37 - INFO - __main__ - Step 58798: {'lr': 0.00033927648364062593, 'samples': 11289216, 'steps': 58797, 'loss/train': 1.2318079471588135} -11/07/2021 05:28:37 - INFO - __main__ - Step 58799: {'lr': 0.00033927152678224216, 'samples': 11289408, 'steps': 58798, 'loss/train': 1.2372905015945435} -11/07/2021 05:28:38 - INFO - __main__ - Step 58800: {'lr': 0.00033926656988363406, 'samples': 11289600, 'steps': 58799, 'loss/train': 0.903574526309967} -11/07/2021 05:28:39 - INFO - __main__ - Step 58801: {'lr': 0.00033926161294480384, 'samples': 11289792, 'steps': 58800, 'loss/train': 1.9908605813980103} -11/07/2021 05:28:39 - INFO - __main__ - Step 58802: {'lr': 0.00033925665596575374, 'samples': 11289984, 'steps': 58801, 'loss/train': 1.9544095993041992} -11/07/2021 05:28:40 - INFO - __main__ - Step 58803: {'lr': 0.00033925169894648586, 'samples': 11290176, 'steps': 58802, 'loss/train': 1.858659029006958} -11/07/2021 05:28:40 - INFO - __main__ - Step 58804: {'lr': 0.0003392467418870026, 'samples': 11290368, 'steps': 58803, 'loss/train': 1.8051953315734863} -11/07/2021 05:28:40 - INFO - __main__ - Step 58805: {'lr': 0.0003392417847873061, 'samples': 11290560, 'steps': 58804, 'loss/train': 1.6961629390716553} -11/07/2021 05:28:41 - INFO - __main__ - Step 58806: {'lr': 0.00033923682764739867, 'samples': 11290752, 'steps': 58805, 'loss/train': 1.0150158405303955} -11/07/2021 05:28:42 - INFO - __main__ - Step 58807: {'lr': 0.0003392318704672825, 'samples': 11290944, 'steps': 58806, 'loss/train': 1.145486831665039} -11/07/2021 05:28:42 - INFO - __main__ - Step 58808: {'lr': 0.00033922691324695975, 'samples': 11291136, 'steps': 58807, 'loss/train': 1.3180099725723267} -11/07/2021 05:28:42 - INFO - __main__ - Step 58809: {'lr': 0.00033922195598643293, 'samples': 11291328, 'steps': 58808, 'loss/train': 1.2919305562973022} -11/07/2021 05:28:43 - INFO - __main__ - Step 58810: {'lr': 0.0003392169986857039, 'samples': 11291520, 'steps': 58809, 'loss/train': 1.4855728149414062} -11/07/2021 05:28:43 - INFO - __main__ - Step 58811: {'lr': 0.0003392120413447751, 'samples': 11291712, 'steps': 58810, 'loss/train': 1.737269401550293} -11/07/2021 05:28:44 - INFO - __main__ - Step 58812: {'lr': 0.0003392070839636487, 'samples': 11291904, 'steps': 58811, 'loss/train': 1.4681472778320312} -11/07/2021 05:28:44 - INFO - __main__ - Step 58813: {'lr': 0.000339202126542327, 'samples': 11292096, 'steps': 58812, 'loss/train': 1.1999744176864624} -11/07/2021 05:28:45 - INFO - __main__ - Step 58814: {'lr': 0.00033919716908081224, 'samples': 11292288, 'steps': 58813, 'loss/train': 1.0629862546920776} -11/07/2021 05:28:45 - INFO - __main__ - Step 58815: {'lr': 0.0003391922115791065, 'samples': 11292480, 'steps': 58814, 'loss/train': 1.4069360494613647} -11/07/2021 05:28:46 - INFO - __main__ - Step 58816: {'lr': 0.0003391872540372123, 'samples': 11292672, 'steps': 58815, 'loss/train': 1.1592175960540771} -11/07/2021 05:28:47 - INFO - __main__ - Step 58817: {'lr': 0.00033918229645513154, 'samples': 11292864, 'steps': 58816, 'loss/train': 1.3755083084106445} -11/07/2021 05:28:47 - INFO - __main__ - Step 58818: {'lr': 0.0003391773388328667, 'samples': 11293056, 'steps': 58817, 'loss/train': 1.0568621158599854} -11/07/2021 05:28:47 - INFO - __main__ - Step 58819: {'lr': 0.0003391723811704199, 'samples': 11293248, 'steps': 58818, 'loss/train': 2.00492000579834} -11/07/2021 05:28:48 - INFO - __main__ - Step 58820: {'lr': 0.0003391674234677934, 'samples': 11293440, 'steps': 58819, 'loss/train': 1.5136122703552246} -11/07/2021 05:28:48 - INFO - __main__ - Step 58821: {'lr': 0.0003391624657249894, 'samples': 11293632, 'steps': 58820, 'loss/train': 1.2482664585113525} -11/07/2021 05:28:49 - INFO - __main__ - Step 58822: {'lr': 0.0003391575079420102, 'samples': 11293824, 'steps': 58821, 'loss/train': 1.6979384422302246} -11/07/2021 05:28:50 - INFO - __main__ - Step 58823: {'lr': 0.00033915255011885803, 'samples': 11294016, 'steps': 58822, 'loss/train': 1.4658546447753906} -11/07/2021 05:28:50 - INFO - __main__ - Step 58824: {'lr': 0.000339147592255535, 'samples': 11294208, 'steps': 58823, 'loss/train': 0.37755846977233887} -11/07/2021 05:28:50 - INFO - __main__ - Step 58825: {'lr': 0.00033914263435204356, 'samples': 11294400, 'steps': 58824, 'loss/train': 1.4825007915496826} -11/07/2021 05:28:51 - INFO - __main__ - Step 58826: {'lr': 0.0003391376764083858, 'samples': 11294592, 'steps': 58825, 'loss/train': 1.3988101482391357} -11/07/2021 05:28:52 - INFO - __main__ - Step 58827: {'lr': 0.00033913271842456394, 'samples': 11294784, 'steps': 58826, 'loss/train': 1.2597273588180542} -11/07/2021 05:28:52 - INFO - __main__ - Step 58828: {'lr': 0.0003391277604005802, 'samples': 11294976, 'steps': 58827, 'loss/train': 1.4019348621368408} -11/07/2021 05:28:52 - INFO - __main__ - Step 58829: {'lr': 0.00033912280233643706, 'samples': 11295168, 'steps': 58828, 'loss/train': 1.0812780857086182} -11/07/2021 05:28:53 - INFO - __main__ - Step 58830: {'lr': 0.00033911784423213645, 'samples': 11295360, 'steps': 58829, 'loss/train': 1.0912331342697144} -11/07/2021 05:28:53 - INFO - __main__ - Step 58831: {'lr': 0.00033911288608768063, 'samples': 11295552, 'steps': 58830, 'loss/train': 1.7023320198059082} -11/07/2021 05:28:54 - INFO - __main__ - Step 58832: {'lr': 0.000339107927903072, 'samples': 11295744, 'steps': 58831, 'loss/train': 1.2451249361038208} -11/07/2021 05:28:55 - INFO - __main__ - Step 58833: {'lr': 0.00033910296967831267, 'samples': 11295936, 'steps': 58832, 'loss/train': 1.6281076669692993} -11/07/2021 05:28:55 - INFO - __main__ - Step 58834: {'lr': 0.00033909801141340497, 'samples': 11296128, 'steps': 58833, 'loss/train': 1.525278925895691} -11/07/2021 05:28:55 - INFO - __main__ - Step 58835: {'lr': 0.00033909305310835105, 'samples': 11296320, 'steps': 58834, 'loss/train': 3.20565128326416} -11/07/2021 05:28:56 - INFO - __main__ - Step 58836: {'lr': 0.00033908809476315325, 'samples': 11296512, 'steps': 58835, 'loss/train': 0.47229987382888794} -11/07/2021 05:28:56 - INFO - __main__ - Step 58837: {'lr': 0.0003390831363778136, 'samples': 11296704, 'steps': 58836, 'loss/train': 1.7827147245407104} -11/07/2021 05:28:57 - INFO - __main__ - Step 58838: {'lr': 0.00033907817795233454, 'samples': 11296896, 'steps': 58837, 'loss/train': 1.7282392978668213} -11/07/2021 05:28:57 - INFO - __main__ - Step 58839: {'lr': 0.0003390732194867182, 'samples': 11297088, 'steps': 58838, 'loss/train': 1.4342314004898071} -11/07/2021 05:28:58 - INFO - __main__ - Step 58840: {'lr': 0.00033906826098096686, 'samples': 11297280, 'steps': 58839, 'loss/train': 1.4809050559997559} -11/07/2021 05:28:58 - INFO - __main__ - Step 58841: {'lr': 0.0003390633024350827, 'samples': 11297472, 'steps': 58840, 'loss/train': 1.2768079042434692} -11/07/2021 05:28:59 - INFO - __main__ - Step 58842: {'lr': 0.000339058343849068, 'samples': 11297664, 'steps': 58841, 'loss/train': 1.1015459299087524} -11/07/2021 05:29:00 - INFO - __main__ - Step 58843: {'lr': 0.00033905338522292514, 'samples': 11297856, 'steps': 58842, 'loss/train': 1.8206262588500977} -11/07/2021 05:29:00 - INFO - __main__ - Step 58844: {'lr': 0.00033904842655665604, 'samples': 11298048, 'steps': 58843, 'loss/train': 1.1822291612625122} -11/07/2021 05:29:00 - INFO - __main__ - Step 58845: {'lr': 0.00033904346785026306, 'samples': 11298240, 'steps': 58844, 'loss/train': 1.5804479122161865} -11/07/2021 05:29:01 - INFO - __main__ - Step 58846: {'lr': 0.0003390385091037486, 'samples': 11298432, 'steps': 58845, 'loss/train': 0.22993512451648712} -11/07/2021 05:29:01 - INFO - __main__ - Step 58847: {'lr': 0.0003390335503171146, 'samples': 11298624, 'steps': 58846, 'loss/train': 1.4215235710144043} -11/07/2021 05:29:02 - INFO - __main__ - Step 58848: {'lr': 0.0003390285914903636, 'samples': 11298816, 'steps': 58847, 'loss/train': 1.3228076696395874} -11/07/2021 05:29:02 - INFO - __main__ - Step 58849: {'lr': 0.0003390236326234977, 'samples': 11299008, 'steps': 58848, 'loss/train': 1.8202475309371948} -11/07/2021 05:29:03 - INFO - __main__ - Step 58850: {'lr': 0.000339018673716519, 'samples': 11299200, 'steps': 58849, 'loss/train': 1.0453081130981445} -11/07/2021 05:29:03 - INFO - __main__ - Step 58851: {'lr': 0.0003390137147694299, 'samples': 11299392, 'steps': 58850, 'loss/train': 1.7012423276901245} -11/07/2021 05:29:03 - INFO - __main__ - Step 58852: {'lr': 0.0003390087557822326, 'samples': 11299584, 'steps': 58851, 'loss/train': 1.2014970779418945} -11/07/2021 05:29:05 - INFO - __main__ - Step 58853: {'lr': 0.00033900379675492933, 'samples': 11299776, 'steps': 58852, 'loss/train': 1.6210826635360718} -11/07/2021 05:29:05 - INFO - __main__ - Step 58854: {'lr': 0.00033899883768752234, 'samples': 11299968, 'steps': 58853, 'loss/train': 0.15507566928863525} -11/07/2021 05:29:05 - INFO - __main__ - Step 58855: {'lr': 0.00033899387858001386, 'samples': 11300160, 'steps': 58854, 'loss/train': 1.646939754486084} -11/07/2021 05:29:06 - INFO - __main__ - Step 58856: {'lr': 0.0003389889194324061, 'samples': 11300352, 'steps': 58855, 'loss/train': 1.5895023345947266} -11/07/2021 05:29:06 - INFO - __main__ - Step 58857: {'lr': 0.0003389839602447013, 'samples': 11300544, 'steps': 58856, 'loss/train': 1.5853663682937622} -11/07/2021 05:29:07 - INFO - __main__ - Step 58858: {'lr': 0.0003389790010169017, 'samples': 11300736, 'steps': 58857, 'loss/train': 1.2243292331695557} -11/07/2021 05:29:07 - INFO - __main__ - Step 58859: {'lr': 0.00033897404174900955, 'samples': 11300928, 'steps': 58858, 'loss/train': 1.537453532218933} -11/07/2021 05:29:08 - INFO - __main__ - Step 58860: {'lr': 0.000338969082441027, 'samples': 11301120, 'steps': 58859, 'loss/train': 1.625871181488037} -11/07/2021 05:29:08 - INFO - __main__ - Step 58861: {'lr': 0.00033896412309295643, 'samples': 11301312, 'steps': 58860, 'loss/train': 1.698410153388977} -11/07/2021 05:29:08 - INFO - __main__ - Step 58862: {'lr': 0.00033895916370479994, 'samples': 11301504, 'steps': 58861, 'loss/train': 1.4595767259597778} -11/07/2021 05:29:09 - INFO - __main__ - Step 58863: {'lr': 0.00033895420427655995, 'samples': 11301696, 'steps': 58862, 'loss/train': 1.8079336881637573} -11/07/2021 05:29:10 - INFO - __main__ - Step 58864: {'lr': 0.0003389492448082384, 'samples': 11301888, 'steps': 58863, 'loss/train': 1.5572354793548584} -11/07/2021 05:29:10 - INFO - __main__ - Step 58865: {'lr': 0.0003389442852998378, 'samples': 11302080, 'steps': 58864, 'loss/train': 0.9346509575843811} -11/07/2021 05:29:10 - INFO - __main__ - Step 58866: {'lr': 0.0003389393257513602, 'samples': 11302272, 'steps': 58865, 'loss/train': 1.4819879531860352} -11/07/2021 05:29:11 - INFO - __main__ - Step 58867: {'lr': 0.00033893436616280796, 'samples': 11302464, 'steps': 58866, 'loss/train': 1.6216272115707397} -11/07/2021 05:29:11 - INFO - __main__ - Step 58868: {'lr': 0.0003389294065341833, 'samples': 11302656, 'steps': 58867, 'loss/train': 1.5425323247909546} -11/07/2021 05:29:12 - INFO - __main__ - Step 58869: {'lr': 0.0003389244468654884, 'samples': 11302848, 'steps': 58868, 'loss/train': 1.6218205690383911} -11/07/2021 05:29:13 - INFO - __main__ - Step 58870: {'lr': 0.0003389194871567255, 'samples': 11303040, 'steps': 58869, 'loss/train': 1.5652034282684326} -11/07/2021 05:29:13 - INFO - __main__ - Step 58871: {'lr': 0.00033891452740789687, 'samples': 11303232, 'steps': 58870, 'loss/train': 1.0977128744125366} -11/07/2021 05:29:13 - INFO - __main__ - Step 58872: {'lr': 0.0003389095676190047, 'samples': 11303424, 'steps': 58871, 'loss/train': 1.8839526176452637} -11/07/2021 05:29:14 - INFO - __main__ - Step 58873: {'lr': 0.00033890460779005126, 'samples': 11303616, 'steps': 58872, 'loss/train': 0.8943089246749878} -11/07/2021 05:29:15 - INFO - __main__ - Step 58874: {'lr': 0.0003388996479210388, 'samples': 11303808, 'steps': 58873, 'loss/train': 1.4530586004257202} -11/07/2021 05:29:15 - INFO - __main__ - Step 58875: {'lr': 0.0003388946880119695, 'samples': 11304000, 'steps': 58874, 'loss/train': 1.6234910488128662} -11/07/2021 05:29:15 - INFO - __main__ - Step 58876: {'lr': 0.0003388897280628457, 'samples': 11304192, 'steps': 58875, 'loss/train': 1.7356258630752563} -11/07/2021 05:29:16 - INFO - __main__ - Step 58877: {'lr': 0.00033888476807366946, 'samples': 11304384, 'steps': 58876, 'loss/train': 1.4881302118301392} -11/07/2021 05:29:16 - INFO - __main__ - Step 58878: {'lr': 0.00033887980804444314, 'samples': 11304576, 'steps': 58877, 'loss/train': 2.574214220046997} -11/07/2021 05:29:17 - INFO - __main__ - Step 58879: {'lr': 0.00033887484797516895, 'samples': 11304768, 'steps': 58878, 'loss/train': 1.7607316970825195} -11/07/2021 05:29:18 - INFO - __main__ - Step 58880: {'lr': 0.00033886988786584914, 'samples': 11304960, 'steps': 58879, 'loss/train': 1.4334523677825928} -11/07/2021 05:29:18 - INFO - __main__ - Step 58881: {'lr': 0.0003388649277164859, 'samples': 11305152, 'steps': 58880, 'loss/train': 1.0518630743026733} -11/07/2021 05:29:18 - INFO - __main__ - Step 58882: {'lr': 0.0003388599675270815, 'samples': 11305344, 'steps': 58881, 'loss/train': 1.4622739553451538} -11/07/2021 05:29:19 - INFO - __main__ - Step 58883: {'lr': 0.00033885500729763824, 'samples': 11305536, 'steps': 58882, 'loss/train': 1.1759334802627563} -11/07/2021 05:29:19 - INFO - __main__ - Step 58884: {'lr': 0.00033885004702815825, 'samples': 11305728, 'steps': 58883, 'loss/train': 1.3764007091522217} -11/07/2021 05:29:20 - INFO - __main__ - Step 58885: {'lr': 0.00033884508671864377, 'samples': 11305920, 'steps': 58884, 'loss/train': 2.0678844451904297} -11/07/2021 05:29:20 - INFO - __main__ - Step 58886: {'lr': 0.0003388401263690971, 'samples': 11306112, 'steps': 58885, 'loss/train': 1.4492619037628174} -11/07/2021 05:29:21 - INFO - __main__ - Step 58887: {'lr': 0.00033883516597952033, 'samples': 11306304, 'steps': 58886, 'loss/train': 1.3749444484710693} -11/07/2021 05:29:21 - INFO - __main__ - Step 58888: {'lr': 0.00033883020554991594, 'samples': 11306496, 'steps': 58887, 'loss/train': 1.6271275281906128} -11/07/2021 05:29:21 - INFO - __main__ - Step 58889: {'lr': 0.000338825245080286, 'samples': 11306688, 'steps': 58888, 'loss/train': 1.6742115020751953} -11/07/2021 05:29:22 - INFO - __main__ - Step 58890: {'lr': 0.0003388202845706328, 'samples': 11306880, 'steps': 58889, 'loss/train': 1.6185718774795532} -11/07/2021 05:29:23 - INFO - __main__ - Step 58891: {'lr': 0.0003388153240209585, 'samples': 11307072, 'steps': 58890, 'loss/train': 1.3241333961486816} -11/07/2021 05:29:23 - INFO - __main__ - Step 58892: {'lr': 0.0003388103634312654, 'samples': 11307264, 'steps': 58891, 'loss/train': 0.517514169216156} -11/07/2021 05:29:23 - INFO - __main__ - Step 58893: {'lr': 0.0003388054028015557, 'samples': 11307456, 'steps': 58892, 'loss/train': 1.2490746974945068} -11/07/2021 05:29:24 - INFO - __main__ - Step 58894: {'lr': 0.00033880044213183163, 'samples': 11307648, 'steps': 58893, 'loss/train': 1.1121854782104492} -11/07/2021 05:29:25 - INFO - __main__ - Step 58895: {'lr': 0.00033879548142209546, 'samples': 11307840, 'steps': 58894, 'loss/train': 1.2886314392089844} -11/07/2021 05:29:25 - INFO - __main__ - Step 58896: {'lr': 0.0003387905206723496, 'samples': 11308032, 'steps': 58895, 'loss/train': 1.453001856803894} -11/07/2021 05:29:25 - INFO - __main__ - Step 58897: {'lr': 0.00033878555988259583, 'samples': 11308224, 'steps': 58896, 'loss/train': 1.716269612312317} -11/07/2021 05:29:26 - INFO - __main__ - Step 58898: {'lr': 0.0003387805990528368, 'samples': 11308416, 'steps': 58897, 'loss/train': 1.284360408782959} -11/07/2021 05:29:26 - INFO - __main__ - Step 58899: {'lr': 0.0003387756381830746, 'samples': 11308608, 'steps': 58898, 'loss/train': 1.240405559539795} -11/07/2021 05:29:27 - INFO - __main__ - Step 58900: {'lr': 0.00033877067727331145, 'samples': 11308800, 'steps': 58899, 'loss/train': 1.0199034214019775} -11/07/2021 05:29:27 - INFO - __main__ - Step 58901: {'lr': 0.00033876571632354956, 'samples': 11308992, 'steps': 58900, 'loss/train': 1.4096803665161133} -11/07/2021 05:29:28 - INFO - __main__ - Step 58902: {'lr': 0.0003387607553337913, 'samples': 11309184, 'steps': 58901, 'loss/train': 1.220066785812378} -11/07/2021 05:29:28 - INFO - __main__ - Step 58903: {'lr': 0.00033875579430403877, 'samples': 11309376, 'steps': 58902, 'loss/train': 1.6530935764312744} -11/07/2021 05:29:29 - INFO - __main__ - Step 58904: {'lr': 0.00033875083323429425, 'samples': 11309568, 'steps': 58903, 'loss/train': 1.5301777124404907} -11/07/2021 05:29:30 - INFO - __main__ - Step 58905: {'lr': 0.0003387458721245599, 'samples': 11309760, 'steps': 58904, 'loss/train': 1.2797760963439941} -11/07/2021 05:29:30 - INFO - __main__ - Step 58906: {'lr': 0.0003387409109748381, 'samples': 11309952, 'steps': 58905, 'loss/train': 1.5946542024612427} -11/07/2021 05:29:30 - INFO - __main__ - Step 58907: {'lr': 0.0003387359497851311, 'samples': 11310144, 'steps': 58906, 'loss/train': 1.783267855644226} -11/07/2021 05:29:31 - INFO - __main__ - Step 58908: {'lr': 0.00033873098855544093, 'samples': 11310336, 'steps': 58907, 'loss/train': 1.5928608179092407} -11/07/2021 05:29:31 - INFO - __main__ - Step 58909: {'lr': 0.00033872602728576997, 'samples': 11310528, 'steps': 58908, 'loss/train': 1.4806081056594849} -11/07/2021 05:29:32 - INFO - __main__ - Step 58910: {'lr': 0.0003387210659761204, 'samples': 11310720, 'steps': 58909, 'loss/train': 1.586470365524292} -11/07/2021 05:29:32 - INFO - __main__ - Step 58911: {'lr': 0.00033871610462649456, 'samples': 11310912, 'steps': 58910, 'loss/train': 1.1386555433273315} -11/07/2021 05:29:33 - INFO - __main__ - Step 58912: {'lr': 0.00033871114323689457, 'samples': 11311104, 'steps': 58911, 'loss/train': 1.499022126197815} -11/07/2021 05:29:33 - INFO - __main__ - Step 58913: {'lr': 0.0003387061818073227, 'samples': 11311296, 'steps': 58912, 'loss/train': 1.3436602354049683} -11/07/2021 05:29:33 - INFO - __main__ - Step 58914: {'lr': 0.00033870122033778123, 'samples': 11311488, 'steps': 58913, 'loss/train': 1.4523167610168457} -11/07/2021 05:29:34 - INFO - __main__ - Step 58915: {'lr': 0.00033869625882827233, 'samples': 11311680, 'steps': 58914, 'loss/train': 1.2665297985076904} -11/07/2021 05:29:35 - INFO - __main__ - Step 58916: {'lr': 0.00033869129727879827, 'samples': 11311872, 'steps': 58915, 'loss/train': 1.5188469886779785} -11/07/2021 05:29:35 - INFO - __main__ - Step 58917: {'lr': 0.0003386863356893612, 'samples': 11312064, 'steps': 58916, 'loss/train': 1.2079638242721558} -11/07/2021 05:29:36 - INFO - __main__ - Step 58918: {'lr': 0.00033868137405996363, 'samples': 11312256, 'steps': 58917, 'loss/train': 1.0151643753051758} -11/07/2021 05:29:36 - INFO - __main__ - Step 58919: {'lr': 0.0003386764123906075, 'samples': 11312448, 'steps': 58918, 'loss/train': 1.3737975358963013} -11/07/2021 05:29:36 - INFO - __main__ - Step 58920: {'lr': 0.00033867145068129515, 'samples': 11312640, 'steps': 58919, 'loss/train': 1.2140005826950073} -11/07/2021 05:29:37 - INFO - __main__ - Step 58921: {'lr': 0.0003386664889320287, 'samples': 11312832, 'steps': 58920, 'loss/train': 1.5475101470947266} -11/07/2021 05:29:38 - INFO - __main__ - Step 58922: {'lr': 0.0003386615271428106, 'samples': 11313024, 'steps': 58921, 'loss/train': 1.5680527687072754} -11/07/2021 05:29:38 - INFO - __main__ - Step 58923: {'lr': 0.000338656565313643, 'samples': 11313216, 'steps': 58922, 'loss/train': 0.8294448852539062} -11/07/2021 05:29:38 - INFO - __main__ - Step 58924: {'lr': 0.0003386516034445281, 'samples': 11313408, 'steps': 58923, 'loss/train': 1.2829402685165405} -11/07/2021 05:29:39 - INFO - __main__ - Step 58925: {'lr': 0.0003386466415354682, 'samples': 11313600, 'steps': 58924, 'loss/train': 1.3706296682357788} -11/07/2021 05:29:40 - INFO - __main__ - Step 58926: {'lr': 0.00033864167958646543, 'samples': 11313792, 'steps': 58925, 'loss/train': 1.8204190731048584} -11/07/2021 05:29:40 - INFO - __main__ - Step 58927: {'lr': 0.00033863671759752206, 'samples': 11313984, 'steps': 58926, 'loss/train': 1.4258006811141968} -11/07/2021 05:29:40 - INFO - __main__ - Step 58928: {'lr': 0.0003386317555686404, 'samples': 11314176, 'steps': 58927, 'loss/train': 1.1298774480819702} -11/07/2021 05:29:41 - INFO - __main__ - Step 58929: {'lr': 0.0003386267934998226, 'samples': 11314368, 'steps': 58928, 'loss/train': 1.2495743036270142} -11/07/2021 05:29:41 - INFO - __main__ - Step 58930: {'lr': 0.00033862183139107106, 'samples': 11314560, 'steps': 58929, 'loss/train': 1.1795114278793335} -11/07/2021 05:29:41 - INFO - __main__ - Step 58931: {'lr': 0.0003386168692423878, 'samples': 11314752, 'steps': 58930, 'loss/train': 1.692266821861267} -11/07/2021 05:29:43 - INFO - __main__ - Step 58932: {'lr': 0.0003386119070537751, 'samples': 11314944, 'steps': 58931, 'loss/train': 1.6516591310501099} -11/07/2021 05:29:43 - INFO - __main__ - Step 58933: {'lr': 0.0003386069448252353, 'samples': 11315136, 'steps': 58932, 'loss/train': 1.7982105016708374} -11/07/2021 05:29:43 - INFO - __main__ - Step 58934: {'lr': 0.00033860198255677054, 'samples': 11315328, 'steps': 58933, 'loss/train': 1.8225808143615723} -11/07/2021 05:29:44 - INFO - __main__ - Step 58935: {'lr': 0.0003385970202483831, 'samples': 11315520, 'steps': 58934, 'loss/train': 0.9737790822982788} -11/07/2021 05:29:44 - INFO - __main__ - Step 58936: {'lr': 0.0003385920579000752, 'samples': 11315712, 'steps': 58935, 'loss/train': 1.3228092193603516} -11/07/2021 05:29:45 - INFO - __main__ - Step 58937: {'lr': 0.0003385870955118492, 'samples': 11315904, 'steps': 58936, 'loss/train': 1.6627357006072998} -11/07/2021 05:29:45 - INFO - __main__ - Step 58938: {'lr': 0.0003385821330837071, 'samples': 11316096, 'steps': 58937, 'loss/train': 1.279924988746643} -11/07/2021 05:29:46 - INFO - __main__ - Step 58939: {'lr': 0.0003385771706156513, 'samples': 11316288, 'steps': 58938, 'loss/train': 2.1263813972473145} -11/07/2021 05:29:46 - INFO - __main__ - Step 58940: {'lr': 0.00033857220810768395, 'samples': 11316480, 'steps': 58939, 'loss/train': 1.8346434831619263} -11/07/2021 05:29:46 - INFO - __main__ - Step 58941: {'lr': 0.00033856724555980736, 'samples': 11316672, 'steps': 58940, 'loss/train': 1.4390860795974731} -11/07/2021 05:29:47 - INFO - __main__ - Step 58942: {'lr': 0.00033856228297202373, 'samples': 11316864, 'steps': 58941, 'loss/train': 0.9148387312889099} -11/07/2021 05:29:48 - INFO - __main__ - Step 58943: {'lr': 0.0003385573203443354, 'samples': 11317056, 'steps': 58942, 'loss/train': 1.4333701133728027} -11/07/2021 05:29:48 - INFO - __main__ - Step 58944: {'lr': 0.0003385523576767444, 'samples': 11317248, 'steps': 58943, 'loss/train': 1.6836155652999878} -11/07/2021 05:29:48 - INFO - __main__ - Step 58945: {'lr': 0.0003385473949692531, 'samples': 11317440, 'steps': 58944, 'loss/train': 1.46369206905365} -11/07/2021 05:29:49 - INFO - __main__ - Step 58946: {'lr': 0.0003385424322218637, 'samples': 11317632, 'steps': 58945, 'loss/train': 1.2269657850265503} -11/07/2021 05:29:50 - INFO - __main__ - Step 58947: {'lr': 0.0003385374694345784, 'samples': 11317824, 'steps': 58946, 'loss/train': 1.8922995328903198} -11/07/2021 05:29:50 - INFO - __main__ - Step 58948: {'lr': 0.00033853250660739954, 'samples': 11318016, 'steps': 58947, 'loss/train': 1.7637218236923218} -11/07/2021 05:29:51 - INFO - __main__ - Step 58949: {'lr': 0.00033852754374032927, 'samples': 11318208, 'steps': 58948, 'loss/train': 1.931194543838501} -11/07/2021 05:29:51 - INFO - __main__ - Step 58950: {'lr': 0.00033852258083336996, 'samples': 11318400, 'steps': 58949, 'loss/train': 1.311229944229126} -11/07/2021 05:29:51 - INFO - __main__ - Step 58951: {'lr': 0.0003385176178865236, 'samples': 11318592, 'steps': 58950, 'loss/train': 1.9002926349639893} -11/07/2021 05:29:52 - INFO - __main__ - Step 58952: {'lr': 0.00033851265489979267, 'samples': 11318784, 'steps': 58951, 'loss/train': 1.1847608089447021} -11/07/2021 05:29:53 - INFO - __main__ - Step 58953: {'lr': 0.00033850769187317923, 'samples': 11318976, 'steps': 58952, 'loss/train': 1.194960117340088} -11/07/2021 05:29:53 - INFO - __main__ - Step 58954: {'lr': 0.00033850272880668565, 'samples': 11319168, 'steps': 58953, 'loss/train': 1.077144742012024} -11/07/2021 05:29:53 - INFO - __main__ - Step 58955: {'lr': 0.000338497765700314, 'samples': 11319360, 'steps': 58954, 'loss/train': 1.4415621757507324} -11/07/2021 05:29:54 - INFO - __main__ - Step 58956: {'lr': 0.00033849280255406674, 'samples': 11319552, 'steps': 58955, 'loss/train': 1.3159661293029785} -11/07/2021 05:29:55 - INFO - __main__ - Step 58957: {'lr': 0.000338487839367946, 'samples': 11319744, 'steps': 58956, 'loss/train': 1.506406545639038} -11/07/2021 05:29:55 - INFO - __main__ - Step 58958: {'lr': 0.00033848287614195394, 'samples': 11319936, 'steps': 58957, 'loss/train': 1.6731747388839722} -11/07/2021 05:29:55 - INFO - __main__ - Step 58959: {'lr': 0.00033847791287609287, 'samples': 11320128, 'steps': 58958, 'loss/train': 1.0841224193572998} -11/07/2021 05:29:56 - INFO - __main__ - Step 58960: {'lr': 0.00033847294957036503, 'samples': 11320320, 'steps': 58959, 'loss/train': 1.33205246925354} -11/07/2021 05:29:56 - INFO - __main__ - Step 58961: {'lr': 0.0003384679862247726, 'samples': 11320512, 'steps': 58960, 'loss/train': 0.9158821105957031} -11/07/2021 05:29:57 - INFO - __main__ - Step 58962: {'lr': 0.0003384630228393179, 'samples': 11320704, 'steps': 58961, 'loss/train': 0.9067651033401489} -11/07/2021 05:29:58 - INFO - __main__ - Step 58963: {'lr': 0.0003384580594140031, 'samples': 11320896, 'steps': 58962, 'loss/train': 1.540272831916809} -11/07/2021 05:29:58 - INFO - __main__ - Step 58964: {'lr': 0.00033845309594883054, 'samples': 11321088, 'steps': 58963, 'loss/train': 1.5439705848693848} -11/07/2021 05:29:58 - INFO - __main__ - Step 58965: {'lr': 0.0003384481324438023, 'samples': 11321280, 'steps': 58964, 'loss/train': 1.2622952461242676} -11/07/2021 05:29:59 - INFO - __main__ - Step 58966: {'lr': 0.00033844316889892074, 'samples': 11321472, 'steps': 58965, 'loss/train': 1.2017014026641846} -11/07/2021 05:30:00 - INFO - __main__ - Step 58967: {'lr': 0.000338438205314188, 'samples': 11321664, 'steps': 58966, 'loss/train': 1.4321461915969849} -11/07/2021 05:30:00 - INFO - __main__ - Step 58968: {'lr': 0.00033843324168960644, 'samples': 11321856, 'steps': 58967, 'loss/train': 1.3554356098175049} -11/07/2021 05:30:00 - INFO - __main__ - Step 58969: {'lr': 0.0003384282780251782, 'samples': 11322048, 'steps': 58968, 'loss/train': 1.3642568588256836} -11/07/2021 05:30:01 - INFO - __main__ - Step 58970: {'lr': 0.0003384233143209056, 'samples': 11322240, 'steps': 58969, 'loss/train': 1.3941218852996826} -11/07/2021 05:30:01 - INFO - __main__ - Step 58971: {'lr': 0.0003384183505767907, 'samples': 11322432, 'steps': 58970, 'loss/train': 1.179962158203125} -11/07/2021 05:30:01 - INFO - __main__ - Step 58972: {'lr': 0.0003384133867928359, 'samples': 11322624, 'steps': 58971, 'loss/train': 1.2346917390823364} -11/07/2021 05:30:02 - INFO - __main__ - Step 58973: {'lr': 0.0003384084229690434, 'samples': 11322816, 'steps': 58972, 'loss/train': 1.7636467218399048} -11/07/2021 05:30:03 - INFO - __main__ - Step 58974: {'lr': 0.0003384034591054154, 'samples': 11323008, 'steps': 58973, 'loss/train': 1.005846381187439} -11/07/2021 05:30:03 - INFO - __main__ - Step 58975: {'lr': 0.0003383984952019542, 'samples': 11323200, 'steps': 58974, 'loss/train': 1.4979660511016846} -11/07/2021 05:30:03 - INFO - __main__ - Step 58976: {'lr': 0.00033839353125866194, 'samples': 11323392, 'steps': 58975, 'loss/train': 1.52721107006073} -11/07/2021 05:30:04 - INFO - __main__ - Step 58977: {'lr': 0.00033838856727554106, 'samples': 11323584, 'steps': 58976, 'loss/train': 1.274423599243164} -11/07/2021 05:30:05 - INFO - __main__ - Step 58978: {'lr': 0.00033838360325259354, 'samples': 11323776, 'steps': 58977, 'loss/train': 0.9597126841545105} -11/07/2021 05:30:05 - INFO - __main__ - Step 58979: {'lr': 0.00033837863918982175, 'samples': 11323968, 'steps': 58978, 'loss/train': 1.0574196577072144} -11/07/2021 05:30:05 - INFO - __main__ - Step 58980: {'lr': 0.0003383736750872279, 'samples': 11324160, 'steps': 58979, 'loss/train': 1.7264882326126099} -11/07/2021 05:30:06 - INFO - __main__ - Step 58981: {'lr': 0.00033836871094481433, 'samples': 11324352, 'steps': 58980, 'loss/train': 1.2755435705184937} -11/07/2021 05:30:06 - INFO - __main__ - Step 58982: {'lr': 0.0003383637467625831, 'samples': 11324544, 'steps': 58981, 'loss/train': 1.6883162260055542} -11/07/2021 05:30:07 - INFO - __main__ - Step 58983: {'lr': 0.00033835878254053647, 'samples': 11324736, 'steps': 58982, 'loss/train': 1.2053639888763428} -11/07/2021 05:30:07 - INFO - __main__ - Step 58984: {'lr': 0.00033835381827867686, 'samples': 11324928, 'steps': 58983, 'loss/train': 1.5472948551177979} -11/07/2021 05:30:08 - INFO - __main__ - Step 58985: {'lr': 0.00033834885397700633, 'samples': 11325120, 'steps': 58984, 'loss/train': 1.3101754188537598} -11/07/2021 05:30:08 - INFO - __main__ - Step 58986: {'lr': 0.00033834388963552715, 'samples': 11325312, 'steps': 58985, 'loss/train': 1.4082560539245605} -11/07/2021 05:30:09 - INFO - __main__ - Step 58987: {'lr': 0.0003383389252542416, 'samples': 11325504, 'steps': 58986, 'loss/train': 1.0450400114059448} -11/07/2021 05:30:10 - INFO - __main__ - Step 58988: {'lr': 0.0003383339608331519, 'samples': 11325696, 'steps': 58987, 'loss/train': 1.324913501739502} -11/07/2021 05:30:10 - INFO - __main__ - Step 58989: {'lr': 0.00033832899637226024, 'samples': 11325888, 'steps': 58988, 'loss/train': 1.4061994552612305} -11/07/2021 05:30:10 - INFO - __main__ - Step 58990: {'lr': 0.0003383240318715689, 'samples': 11326080, 'steps': 58989, 'loss/train': 1.8055460453033447} -11/07/2021 05:30:11 - INFO - __main__ - Step 58991: {'lr': 0.0003383190673310802, 'samples': 11326272, 'steps': 58990, 'loss/train': 1.3656814098358154} -11/07/2021 05:30:11 - INFO - __main__ - Step 58992: {'lr': 0.0003383141027507962, 'samples': 11326464, 'steps': 58991, 'loss/train': 1.1166648864746094} -11/07/2021 05:30:12 - INFO - __main__ - Step 58993: {'lr': 0.0003383091381307193, 'samples': 11326656, 'steps': 58992, 'loss/train': 1.576315999031067} -11/07/2021 05:30:12 - INFO - __main__ - Step 58994: {'lr': 0.0003383041734708516, 'samples': 11326848, 'steps': 58993, 'loss/train': 1.656105637550354} -11/07/2021 05:30:13 - INFO - __main__ - Step 58995: {'lr': 0.0003382992087711954, 'samples': 11327040, 'steps': 58994, 'loss/train': 1.2767597436904907} -11/07/2021 05:30:13 - INFO - __main__ - Step 58996: {'lr': 0.00033829424403175297, 'samples': 11327232, 'steps': 58995, 'loss/train': 0.18723994493484497} -11/07/2021 05:30:13 - INFO - __main__ - Step 58997: {'lr': 0.00033828927925252657, 'samples': 11327424, 'steps': 58996, 'loss/train': 1.48435378074646} -11/07/2021 05:30:14 - INFO - __main__ - Step 58998: {'lr': 0.0003382843144335183, 'samples': 11327616, 'steps': 58997, 'loss/train': 1.5496824979782104} -11/07/2021 05:30:15 - INFO - __main__ - Step 58999: {'lr': 0.0003382793495747305, 'samples': 11327808, 'steps': 58998, 'loss/train': 1.3105796575546265} -11/07/2021 05:30:15 - INFO - __main__ - Step 59000: {'lr': 0.0003382743846761654, 'samples': 11328000, 'steps': 58999, 'loss/train': 1.9641363620758057} -11/07/2021 05:30:15 - INFO - __main__ - Step 59001: {'lr': 0.0003382694197378252, 'samples': 11328192, 'steps': 59000, 'loss/train': 0.6021393537521362} -11/07/2021 05:30:16 - INFO - __main__ - Step 59002: {'lr': 0.00033826445475971216, 'samples': 11328384, 'steps': 59001, 'loss/train': 1.301620602607727} -11/07/2021 05:30:16 - INFO - __main__ - Step 59003: {'lr': 0.0003382594897418285, 'samples': 11328576, 'steps': 59002, 'loss/train': 1.00771963596344} -11/07/2021 05:30:17 - INFO - __main__ - Step 59004: {'lr': 0.0003382545246841766, 'samples': 11328768, 'steps': 59003, 'loss/train': 1.8510748147964478} -11/07/2021 05:30:18 - INFO - __main__ - Step 59005: {'lr': 0.00033824955958675843, 'samples': 11328960, 'steps': 59004, 'loss/train': 0.6068124175071716} -11/07/2021 05:30:18 - INFO - __main__ - Step 59006: {'lr': 0.00033824459444957645, 'samples': 11329152, 'steps': 59005, 'loss/train': 1.2799570560455322} -11/07/2021 05:30:18 - INFO - __main__ - Step 59007: {'lr': 0.0003382396292726328, 'samples': 11329344, 'steps': 59006, 'loss/train': 1.6679545640945435} -11/07/2021 05:30:19 - INFO - __main__ - Step 59008: {'lr': 0.00033823466405592974, 'samples': 11329536, 'steps': 59007, 'loss/train': 1.59792160987854} -11/07/2021 05:30:20 - INFO - __main__ - Step 59009: {'lr': 0.00033822969879946947, 'samples': 11329728, 'steps': 59008, 'loss/train': 1.542983889579773} -11/07/2021 05:30:20 - INFO - __main__ - Step 59010: {'lr': 0.0003382247335032542, 'samples': 11329920, 'steps': 59009, 'loss/train': 1.476171851158142} -11/07/2021 05:30:20 - INFO - __main__ - Step 59011: {'lr': 0.0003382197681672864, 'samples': 11330112, 'steps': 59010, 'loss/train': 0.20667408406734467} -11/07/2021 05:30:21 - INFO - __main__ - Step 59012: {'lr': 0.000338214802791568, 'samples': 11330304, 'steps': 59011, 'loss/train': 1.7993354797363281} -11/07/2021 05:30:21 - INFO - __main__ - Step 59013: {'lr': 0.00033820983737610147, 'samples': 11330496, 'steps': 59012, 'loss/train': 1.5575295686721802} -11/07/2021 05:30:22 - INFO - __main__ - Step 59014: {'lr': 0.00033820487192088883, 'samples': 11330688, 'steps': 59013, 'loss/train': 1.5250554084777832} -11/07/2021 05:30:23 - INFO - __main__ - Step 59015: {'lr': 0.0003381999064259325, 'samples': 11330880, 'steps': 59014, 'loss/train': 1.177808165550232} -11/07/2021 05:30:23 - INFO - __main__ - Step 59016: {'lr': 0.00033819494089123466, 'samples': 11331072, 'steps': 59015, 'loss/train': 1.3401293754577637} -11/07/2021 05:30:23 - INFO - __main__ - Step 59017: {'lr': 0.00033818997531679756, 'samples': 11331264, 'steps': 59016, 'loss/train': 0.44552716612815857} -11/07/2021 05:30:24 - INFO - __main__ - Step 59018: {'lr': 0.0003381850097026234, 'samples': 11331456, 'steps': 59017, 'loss/train': 1.4919835329055786} -11/07/2021 05:30:25 - INFO - __main__ - Step 59019: {'lr': 0.0003381800440487144, 'samples': 11331648, 'steps': 59018, 'loss/train': 1.3549867868423462} -11/07/2021 05:30:25 - INFO - __main__ - Step 59020: {'lr': 0.00033817507835507283, 'samples': 11331840, 'steps': 59019, 'loss/train': 1.3828877210617065} -11/07/2021 05:30:25 - INFO - __main__ - Step 59021: {'lr': 0.00033817011262170097, 'samples': 11332032, 'steps': 59020, 'loss/train': 1.3331918716430664} -11/07/2021 05:30:26 - INFO - __main__ - Step 59022: {'lr': 0.000338165146848601, 'samples': 11332224, 'steps': 59021, 'loss/train': 1.3515325784683228} -11/07/2021 05:30:26 - INFO - __main__ - Step 59023: {'lr': 0.0003381601810357752, 'samples': 11332416, 'steps': 59022, 'loss/train': 1.296303391456604} -11/07/2021 05:30:27 - INFO - __main__ - Step 59024: {'lr': 0.00033815521518322576, 'samples': 11332608, 'steps': 59023, 'loss/train': 1.0616830587387085} -11/07/2021 05:30:27 - INFO - __main__ - Step 59025: {'lr': 0.00033815024929095496, 'samples': 11332800, 'steps': 59024, 'loss/train': 1.3384326696395874} -11/07/2021 05:30:28 - INFO - __main__ - Step 59026: {'lr': 0.000338145283358965, 'samples': 11332992, 'steps': 59025, 'loss/train': 1.268005132675171} -11/07/2021 05:30:28 - INFO - __main__ - Step 59027: {'lr': 0.0003381403173872581, 'samples': 11333184, 'steps': 59026, 'loss/train': 0.9674777984619141} -11/07/2021 05:30:29 - INFO - __main__ - Step 59028: {'lr': 0.00033813535137583656, 'samples': 11333376, 'steps': 59027, 'loss/train': 1.3868147134780884} -11/07/2021 05:30:29 - INFO - __main__ - Step 59029: {'lr': 0.0003381303853247026, 'samples': 11333568, 'steps': 59028, 'loss/train': 1.801058292388916} -11/07/2021 05:30:30 - INFO - __main__ - Step 59030: {'lr': 0.0003381254192338585, 'samples': 11333760, 'steps': 59029, 'loss/train': 1.4851211309432983} -11/07/2021 05:30:30 - INFO - __main__ - Step 59031: {'lr': 0.00033812045310330636, 'samples': 11333952, 'steps': 59030, 'loss/train': 0.4006422758102417} -11/07/2021 05:30:31 - INFO - __main__ - Step 59032: {'lr': 0.0003381154869330485, 'samples': 11334144, 'steps': 59031, 'loss/train': 0.8292285799980164} -11/07/2021 05:30:31 - INFO - __main__ - Step 59033: {'lr': 0.00033811052072308724, 'samples': 11334336, 'steps': 59032, 'loss/train': 1.8231481313705444} -11/07/2021 05:30:31 - INFO - __main__ - Step 59034: {'lr': 0.0003381055544734247, 'samples': 11334528, 'steps': 59033, 'loss/train': 1.622146725654602} -11/07/2021 05:30:32 - INFO - __main__ - Step 59035: {'lr': 0.00033810058818406307, 'samples': 11334720, 'steps': 59034, 'loss/train': 1.0690467357635498} -11/07/2021 05:30:33 - INFO - __main__ - Step 59036: {'lr': 0.0003380956218550049, 'samples': 11334912, 'steps': 59035, 'loss/train': 1.2485395669937134} -11/07/2021 05:30:33 - INFO - __main__ - Step 59037: {'lr': 0.000338090655486252, 'samples': 11335104, 'steps': 59036, 'loss/train': 1.5792678594589233} -11/07/2021 05:30:33 - INFO - __main__ - Step 59038: {'lr': 0.00033808568907780687, 'samples': 11335296, 'steps': 59037, 'loss/train': 1.1977735757827759} -11/07/2021 05:30:34 - INFO - __main__ - Step 59039: {'lr': 0.00033808072262967164, 'samples': 11335488, 'steps': 59038, 'loss/train': 1.333406686782837} -11/07/2021 05:30:35 - INFO - __main__ - Step 59040: {'lr': 0.00033807575614184864, 'samples': 11335680, 'steps': 59039, 'loss/train': 1.4398648738861084} -11/07/2021 05:30:35 - INFO - __main__ - Step 59041: {'lr': 0.0003380707896143401, 'samples': 11335872, 'steps': 59040, 'loss/train': 1.0140451192855835} -11/07/2021 05:30:36 - INFO - __main__ - Step 59042: {'lr': 0.0003380658230471482, 'samples': 11336064, 'steps': 59041, 'loss/train': 1.574953317642212} -11/07/2021 05:30:36 - INFO - __main__ - Step 59043: {'lr': 0.0003380608564402752, 'samples': 11336256, 'steps': 59042, 'loss/train': 1.8984801769256592} -11/07/2021 05:30:36 - INFO - __main__ - Step 59044: {'lr': 0.0003380558897937233, 'samples': 11336448, 'steps': 59043, 'loss/train': 1.3492224216461182} -11/07/2021 05:30:37 - INFO - __main__ - Step 59045: {'lr': 0.0003380509231074948, 'samples': 11336640, 'steps': 59044, 'loss/train': 1.5896109342575073} -11/07/2021 05:30:38 - INFO - __main__ - Step 59046: {'lr': 0.0003380459563815919, 'samples': 11336832, 'steps': 59045, 'loss/train': 1.0907433032989502} -11/07/2021 05:30:38 - INFO - __main__ - Step 59047: {'lr': 0.0003380409896160169, 'samples': 11337024, 'steps': 59046, 'loss/train': 1.303443193435669} -11/07/2021 05:30:38 - INFO - __main__ - Step 59048: {'lr': 0.00033803602281077194, 'samples': 11337216, 'steps': 59047, 'loss/train': 1.4601738452911377} -11/07/2021 05:30:39 - INFO - __main__ - Step 59049: {'lr': 0.0003380310559658593, 'samples': 11337408, 'steps': 59048, 'loss/train': 1.196200966835022} -11/07/2021 05:30:40 - INFO - __main__ - Step 59050: {'lr': 0.00033802608908128126, 'samples': 11337600, 'steps': 59049, 'loss/train': 1.0969765186309814} -11/07/2021 05:30:40 - INFO - __main__ - Step 59051: {'lr': 0.00033802112215704, 'samples': 11337792, 'steps': 59050, 'loss/train': 1.753443717956543} -11/07/2021 05:30:40 - INFO - __main__ - Step 59052: {'lr': 0.0003380161551931378, 'samples': 11337984, 'steps': 59051, 'loss/train': 1.0757197141647339} -11/07/2021 05:30:41 - INFO - __main__ - Step 59053: {'lr': 0.00033801118818957686, 'samples': 11338176, 'steps': 59052, 'loss/train': 1.2961983680725098} -11/07/2021 05:30:41 - INFO - __main__ - Step 59054: {'lr': 0.00033800622114635943, 'samples': 11338368, 'steps': 59053, 'loss/train': 1.1351161003112793} -11/07/2021 05:30:42 - INFO - __main__ - Step 59055: {'lr': 0.0003380012540634878, 'samples': 11338560, 'steps': 59054, 'loss/train': 1.7041480541229248} -11/07/2021 05:30:42 - INFO - __main__ - Step 59056: {'lr': 0.00033799628694096407, 'samples': 11338752, 'steps': 59055, 'loss/train': 1.5331214666366577} -11/07/2021 05:30:43 - INFO - __main__ - Step 59057: {'lr': 0.0003379913197787907, 'samples': 11338944, 'steps': 59056, 'loss/train': 1.6381770372390747} -11/07/2021 05:30:43 - INFO - __main__ - Step 59058: {'lr': 0.00033798635257696976, 'samples': 11339136, 'steps': 59057, 'loss/train': 0.44634076952934265} -11/07/2021 05:30:43 - INFO - __main__ - Step 59059: {'lr': 0.0003379813853355034, 'samples': 11339328, 'steps': 59058, 'loss/train': 1.2636781930923462} -11/07/2021 05:30:45 - INFO - __main__ - Step 59060: {'lr': 0.0003379764180543941, 'samples': 11339520, 'steps': 59059, 'loss/train': 1.602419376373291} -11/07/2021 05:30:45 - INFO - __main__ - Step 59061: {'lr': 0.000337971450733644, 'samples': 11339712, 'steps': 59060, 'loss/train': 1.3686432838439941} -11/07/2021 05:30:45 - INFO - __main__ - Step 59062: {'lr': 0.00033796648337325525, 'samples': 11339904, 'steps': 59061, 'loss/train': 0.6409185528755188} -11/07/2021 05:30:46 - INFO - __main__ - Step 59063: {'lr': 0.0003379615159732302, 'samples': 11340096, 'steps': 59062, 'loss/train': 1.3427462577819824} -11/07/2021 05:30:46 - INFO - __main__ - Step 59064: {'lr': 0.00033795654853357104, 'samples': 11340288, 'steps': 59063, 'loss/train': 1.4081156253814697} -11/07/2021 05:30:47 - INFO - __main__ - Step 59065: {'lr': 0.00033795158105428, 'samples': 11340480, 'steps': 59064, 'loss/train': 1.1225422620773315} -11/07/2021 05:30:47 - INFO - __main__ - Step 59066: {'lr': 0.0003379466135353594, 'samples': 11340672, 'steps': 59065, 'loss/train': 1.297689437866211} -11/07/2021 05:30:48 - INFO - __main__ - Step 59067: {'lr': 0.0003379416459768114, 'samples': 11340864, 'steps': 59066, 'loss/train': 1.8279924392700195} -11/07/2021 05:30:48 - INFO - __main__ - Step 59068: {'lr': 0.00033793667837863815, 'samples': 11341056, 'steps': 59067, 'loss/train': 1.3760242462158203} -11/07/2021 05:30:48 - INFO - __main__ - Step 59069: {'lr': 0.0003379317107408421, 'samples': 11341248, 'steps': 59068, 'loss/train': 1.5519757270812988} -11/07/2021 05:30:49 - INFO - __main__ - Step 59070: {'lr': 0.0003379267430634253, 'samples': 11341440, 'steps': 59069, 'loss/train': 1.4017212390899658} -11/07/2021 05:30:50 - INFO - __main__ - Step 59071: {'lr': 0.00033792177534639015, 'samples': 11341632, 'steps': 59070, 'loss/train': 1.1278568506240845} -11/07/2021 05:30:50 - INFO - __main__ - Step 59072: {'lr': 0.00033791680758973874, 'samples': 11341824, 'steps': 59071, 'loss/train': 1.3602644205093384} -11/07/2021 05:30:51 - INFO - __main__ - Step 59073: {'lr': 0.0003379118397934734, 'samples': 11342016, 'steps': 59072, 'loss/train': 5.711589813232422} -11/07/2021 05:30:51 - INFO - __main__ - Step 59074: {'lr': 0.00033790687195759636, 'samples': 11342208, 'steps': 59073, 'loss/train': 1.1390502452850342} -11/07/2021 05:30:51 - INFO - __main__ - Step 59075: {'lr': 0.00033790190408210973, 'samples': 11342400, 'steps': 59074, 'loss/train': 1.4508646726608276} -11/07/2021 05:30:52 - INFO - __main__ - Step 59076: {'lr': 0.000337896936167016, 'samples': 11342592, 'steps': 59075, 'loss/train': 1.3428006172180176} -11/07/2021 05:30:53 - INFO - __main__ - Step 59077: {'lr': 0.00033789196821231717, 'samples': 11342784, 'steps': 59076, 'loss/train': 1.171927809715271} -11/07/2021 05:30:53 - INFO - __main__ - Step 59078: {'lr': 0.00033788700021801564, 'samples': 11342976, 'steps': 59077, 'loss/train': 1.3192864656448364} -11/07/2021 05:30:53 - INFO - __main__ - Step 59079: {'lr': 0.00033788203218411357, 'samples': 11343168, 'steps': 59078, 'loss/train': 1.6850391626358032} -11/07/2021 05:30:54 - INFO - __main__ - Step 59080: {'lr': 0.0003378770641106132, 'samples': 11343360, 'steps': 59079, 'loss/train': 1.1569558382034302} -11/07/2021 05:30:55 - INFO - __main__ - Step 59081: {'lr': 0.00033787209599751676, 'samples': 11343552, 'steps': 59080, 'loss/train': 1.3070340156555176} -11/07/2021 05:30:55 - INFO - __main__ - Step 59082: {'lr': 0.0003378671278448265, 'samples': 11343744, 'steps': 59081, 'loss/train': 1.6367872953414917} -11/07/2021 05:30:56 - INFO - __main__ - Step 59083: {'lr': 0.00033786215965254474, 'samples': 11343936, 'steps': 59082, 'loss/train': 0.9003011584281921} -11/07/2021 05:30:56 - INFO - __main__ - Step 59084: {'lr': 0.00033785719142067364, 'samples': 11344128, 'steps': 59083, 'loss/train': 1.2933342456817627} -11/07/2021 05:30:56 - INFO - __main__ - Step 59085: {'lr': 0.0003378522231492154, 'samples': 11344320, 'steps': 59084, 'loss/train': 1.5280778408050537} -11/07/2021 05:30:57 - INFO - __main__ - Step 59086: {'lr': 0.0003378472548381723, 'samples': 11344512, 'steps': 59085, 'loss/train': 1.450378656387329} -11/07/2021 05:30:58 - INFO - __main__ - Step 59087: {'lr': 0.0003378422864875466, 'samples': 11344704, 'steps': 59086, 'loss/train': 1.1537388563156128} -11/07/2021 05:30:58 - INFO - __main__ - Step 59088: {'lr': 0.0003378373180973405, 'samples': 11344896, 'steps': 59087, 'loss/train': 1.1885035037994385} -11/07/2021 05:30:58 - INFO - __main__ - Step 59089: {'lr': 0.0003378323496675563, 'samples': 11345088, 'steps': 59088, 'loss/train': 1.5443912744522095} -11/07/2021 05:30:59 - INFO - __main__ - Step 59090: {'lr': 0.0003378273811981961, 'samples': 11345280, 'steps': 59089, 'loss/train': 1.4305788278579712} -11/07/2021 05:30:59 - INFO - __main__ - Step 59091: {'lr': 0.00033782241268926237, 'samples': 11345472, 'steps': 59090, 'loss/train': 1.343381404876709} -11/07/2021 05:31:00 - INFO - __main__ - Step 59092: {'lr': 0.00033781744414075723, 'samples': 11345664, 'steps': 59091, 'loss/train': 1.6727418899536133} -11/07/2021 05:31:00 - INFO - __main__ - Step 59093: {'lr': 0.0003378124755526828, 'samples': 11345856, 'steps': 59092, 'loss/train': 1.842724323272705} -11/07/2021 05:31:01 - INFO - __main__ - Step 59094: {'lr': 0.0003378075069250414, 'samples': 11346048, 'steps': 59093, 'loss/train': 1.3655223846435547} -11/07/2021 05:31:01 - INFO - __main__ - Step 59095: {'lr': 0.00033780253825783533, 'samples': 11346240, 'steps': 59094, 'loss/train': 1.0376087427139282} -11/07/2021 05:31:02 - INFO - __main__ - Step 59096: {'lr': 0.0003377975695510668, 'samples': 11346432, 'steps': 59095, 'loss/train': 1.179636001586914} -11/07/2021 05:31:03 - INFO - __main__ - Step 59097: {'lr': 0.0003377926008047381, 'samples': 11346624, 'steps': 59096, 'loss/train': 1.4483702182769775} -11/07/2021 05:31:03 - INFO - __main__ - Step 59098: {'lr': 0.0003377876320188514, 'samples': 11346816, 'steps': 59097, 'loss/train': 1.4322985410690308} -11/07/2021 05:31:03 - INFO - __main__ - Step 59099: {'lr': 0.0003377826631934089, 'samples': 11347008, 'steps': 59098, 'loss/train': 1.5368103981018066} -11/07/2021 05:31:04 - INFO - __main__ - Step 59100: {'lr': 0.0003377776943284129, 'samples': 11347200, 'steps': 59099, 'loss/train': 1.2427552938461304} -11/07/2021 05:31:04 - INFO - __main__ - Step 59101: {'lr': 0.00033777272542386564, 'samples': 11347392, 'steps': 59100, 'loss/train': 0.9969795346260071} -11/07/2021 05:31:05 - INFO - __main__ - Step 59102: {'lr': 0.0003377677564797693, 'samples': 11347584, 'steps': 59101, 'loss/train': 1.987402319908142} -11/07/2021 05:31:05 - INFO - __main__ - Step 59103: {'lr': 0.00033776278749612617, 'samples': 11347776, 'steps': 59102, 'loss/train': 1.5692646503448486} -11/07/2021 05:31:06 - INFO - __main__ - Step 59104: {'lr': 0.00033775781847293846, 'samples': 11347968, 'steps': 59103, 'loss/train': 0.8707871437072754} -11/07/2021 05:31:06 - INFO - __main__ - Step 59105: {'lr': 0.00033775284941020854, 'samples': 11348160, 'steps': 59104, 'loss/train': 0.0916455090045929} -11/07/2021 05:31:06 - INFO - __main__ - Step 59106: {'lr': 0.0003377478803079385, 'samples': 11348352, 'steps': 59105, 'loss/train': 1.0275636911392212} -11/07/2021 05:31:07 - INFO - __main__ - Step 59107: {'lr': 0.00033774291116613054, 'samples': 11348544, 'steps': 59106, 'loss/train': 1.5135724544525146} -11/07/2021 05:31:08 - INFO - __main__ - Step 59108: {'lr': 0.000337737941984787, 'samples': 11348736, 'steps': 59107, 'loss/train': 1.7488468885421753} -11/07/2021 05:31:08 - INFO - __main__ - Step 59109: {'lr': 0.00033773297276391015, 'samples': 11348928, 'steps': 59108, 'loss/train': 1.8064600229263306} -11/07/2021 05:31:09 - INFO - __main__ - Step 59110: {'lr': 0.00033772800350350215, 'samples': 11349120, 'steps': 59109, 'loss/train': 1.6492990255355835} -11/07/2021 05:31:09 - INFO - __main__ - Step 59111: {'lr': 0.0003377230342035653, 'samples': 11349312, 'steps': 59110, 'loss/train': 1.475067138671875} -11/07/2021 05:31:09 - INFO - __main__ - Step 59112: {'lr': 0.00033771806486410176, 'samples': 11349504, 'steps': 59111, 'loss/train': 1.3603543043136597} -11/07/2021 05:31:10 - INFO - __main__ - Step 59113: {'lr': 0.0003377130954851138, 'samples': 11349696, 'steps': 59112, 'loss/train': 1.298151969909668} -11/07/2021 05:31:11 - INFO - __main__ - Step 59114: {'lr': 0.0003377081260666037, 'samples': 11349888, 'steps': 59113, 'loss/train': 2.65168833732605} -11/07/2021 05:31:11 - INFO - __main__ - Step 59115: {'lr': 0.00033770315660857367, 'samples': 11350080, 'steps': 59114, 'loss/train': 1.5206751823425293} -11/07/2021 05:31:11 - INFO - __main__ - Step 59116: {'lr': 0.00033769818711102594, 'samples': 11350272, 'steps': 59115, 'loss/train': 1.7334089279174805} -11/07/2021 05:31:12 - INFO - __main__ - Step 59117: {'lr': 0.0003376932175739628, 'samples': 11350464, 'steps': 59116, 'loss/train': 1.4664421081542969} -11/07/2021 05:31:13 - INFO - __main__ - Step 59118: {'lr': 0.00033768824799738646, 'samples': 11350656, 'steps': 59117, 'loss/train': 1.2359026670455933} -11/07/2021 05:31:13 - INFO - __main__ - Step 59119: {'lr': 0.0003376832783812991, 'samples': 11350848, 'steps': 59118, 'loss/train': 1.3090336322784424} -11/07/2021 05:31:13 - INFO - __main__ - Step 59120: {'lr': 0.000337678308725703, 'samples': 11351040, 'steps': 59119, 'loss/train': 1.4215831756591797} -11/07/2021 05:31:14 - INFO - __main__ - Step 59121: {'lr': 0.0003376733390306004, 'samples': 11351232, 'steps': 59120, 'loss/train': 1.9562761783599854} -11/07/2021 05:31:14 - INFO - __main__ - Step 59122: {'lr': 0.00033766836929599353, 'samples': 11351424, 'steps': 59121, 'loss/train': 1.4182853698730469} -11/07/2021 05:31:15 - INFO - __main__ - Step 59123: {'lr': 0.00033766339952188474, 'samples': 11351616, 'steps': 59122, 'loss/train': 0.6436710953712463} -11/07/2021 05:31:16 - INFO - __main__ - Step 59124: {'lr': 0.0003376584297082761, 'samples': 11351808, 'steps': 59123, 'loss/train': 1.6214978694915771} -11/07/2021 05:31:16 - INFO - __main__ - Step 59125: {'lr': 0.00033765345985517, 'samples': 11352000, 'steps': 59124, 'loss/train': 1.309025526046753} -11/07/2021 05:31:16 - INFO - __main__ - Step 59126: {'lr': 0.0003376484899625685, 'samples': 11352192, 'steps': 59125, 'loss/train': 1.4658406972885132} -11/07/2021 05:31:17 - INFO - __main__ - Step 59127: {'lr': 0.00033764352003047397, 'samples': 11352384, 'steps': 59126, 'loss/train': 1.7807698249816895} -11/07/2021 05:31:17 - INFO - __main__ - Step 59128: {'lr': 0.00033763855005888865, 'samples': 11352576, 'steps': 59127, 'loss/train': 1.494262456893921} -11/07/2021 05:31:18 - INFO - __main__ - Step 59129: {'lr': 0.00033763358004781474, 'samples': 11352768, 'steps': 59128, 'loss/train': 0.5428523421287537} -11/07/2021 05:31:18 - INFO - __main__ - Step 59130: {'lr': 0.00033762860999725456, 'samples': 11352960, 'steps': 59129, 'loss/train': 1.6502593755722046} -11/07/2021 05:31:19 - INFO - __main__ - Step 59131: {'lr': 0.0003376236399072101, 'samples': 11353152, 'steps': 59130, 'loss/train': 1.2911310195922852} -11/07/2021 05:31:19 - INFO - __main__ - Step 59132: {'lr': 0.000337618669777684, 'samples': 11353344, 'steps': 59131, 'loss/train': 1.6087331771850586} -11/07/2021 05:31:19 - INFO - __main__ - Step 59133: {'lr': 0.0003376136996086782, 'samples': 11353536, 'steps': 59132, 'loss/train': 1.5826588869094849} -11/07/2021 05:31:21 - INFO - __main__ - Step 59134: {'lr': 0.00033760872940019496, 'samples': 11353728, 'steps': 59133, 'loss/train': 1.4108322858810425} -11/07/2021 05:31:21 - INFO - __main__ - Step 59135: {'lr': 0.00033760375915223664, 'samples': 11353920, 'steps': 59134, 'loss/train': 1.2831298112869263} -11/07/2021 05:31:21 - INFO - __main__ - Step 59136: {'lr': 0.00033759878886480534, 'samples': 11354112, 'steps': 59135, 'loss/train': 1.5412404537200928} -11/07/2021 05:31:22 - INFO - __main__ - Step 59137: {'lr': 0.00033759381853790344, 'samples': 11354304, 'steps': 59136, 'loss/train': 1.5404393672943115} -11/07/2021 05:31:22 - INFO - __main__ - Step 59138: {'lr': 0.0003375888481715331, 'samples': 11354496, 'steps': 59137, 'loss/train': 0.9630423784255981} -11/07/2021 05:31:23 - INFO - __main__ - Step 59139: {'lr': 0.0003375838777656966, 'samples': 11354688, 'steps': 59138, 'loss/train': 1.5023905038833618} -11/07/2021 05:31:23 - INFO - __main__ - Step 59140: {'lr': 0.00033757890732039617, 'samples': 11354880, 'steps': 59139, 'loss/train': 1.1749709844589233} -11/07/2021 05:31:24 - INFO - __main__ - Step 59141: {'lr': 0.000337573936835634, 'samples': 11355072, 'steps': 59140, 'loss/train': 1.4763453006744385} -11/07/2021 05:31:24 - INFO - __main__ - Step 59142: {'lr': 0.0003375689663114123, 'samples': 11355264, 'steps': 59141, 'loss/train': 1.478682041168213} -11/07/2021 05:31:24 - INFO - __main__ - Step 59143: {'lr': 0.00033756399574773343, 'samples': 11355456, 'steps': 59142, 'loss/train': 1.1878386735916138} -11/07/2021 05:31:25 - INFO - __main__ - Step 59144: {'lr': 0.00033755902514459964, 'samples': 11355648, 'steps': 59143, 'loss/train': 1.773189663887024} -11/07/2021 05:31:26 - INFO - __main__ - Step 59145: {'lr': 0.0003375540545020131, 'samples': 11355840, 'steps': 59144, 'loss/train': 1.5469133853912354} -11/07/2021 05:31:26 - INFO - __main__ - Step 59146: {'lr': 0.00033754908381997595, 'samples': 11356032, 'steps': 59145, 'loss/train': 1.284981608390808} -11/07/2021 05:31:26 - INFO - __main__ - Step 59147: {'lr': 0.00033754411309849065, 'samples': 11356224, 'steps': 59146, 'loss/train': 1.224838137626648} -11/07/2021 05:31:27 - INFO - __main__ - Step 59148: {'lr': 0.0003375391423375592, 'samples': 11356416, 'steps': 59147, 'loss/train': 1.4976599216461182} -11/07/2021 05:31:28 - INFO - __main__ - Step 59149: {'lr': 0.00033753417153718405, 'samples': 11356608, 'steps': 59148, 'loss/train': 1.3317590951919556} -11/07/2021 05:31:28 - INFO - __main__ - Step 59150: {'lr': 0.0003375292006973673, 'samples': 11356800, 'steps': 59149, 'loss/train': 1.0247522592544556} -11/07/2021 05:31:29 - INFO - __main__ - Step 59151: {'lr': 0.0003375242298181113, 'samples': 11356992, 'steps': 59150, 'loss/train': 0.06391794979572296} -11/07/2021 05:31:29 - INFO - __main__ - Step 59152: {'lr': 0.0003375192588994183, 'samples': 11357184, 'steps': 59151, 'loss/train': 1.327622890472412} -11/07/2021 05:31:29 - INFO - __main__ - Step 59153: {'lr': 0.0003375142879412903, 'samples': 11357376, 'steps': 59152, 'loss/train': 1.6796025037765503} -11/07/2021 05:31:30 - INFO - __main__ - Step 59154: {'lr': 0.0003375093169437298, 'samples': 11357568, 'steps': 59153, 'loss/train': 1.3426998853683472} -11/07/2021 05:31:31 - INFO - __main__ - Step 59155: {'lr': 0.00033750434590673893, 'samples': 11357760, 'steps': 59154, 'loss/train': 1.3947049379348755} -11/07/2021 05:31:31 - INFO - __main__ - Step 59156: {'lr': 0.00033749937483031994, 'samples': 11357952, 'steps': 59155, 'loss/train': 1.1491570472717285} -11/07/2021 05:31:31 - INFO - __main__ - Step 59157: {'lr': 0.00033749440371447513, 'samples': 11358144, 'steps': 59156, 'loss/train': 1.46199631690979} -11/07/2021 05:31:32 - INFO - __main__ - Step 59158: {'lr': 0.00033748943255920667, 'samples': 11358336, 'steps': 59157, 'loss/train': 1.4713354110717773} -11/07/2021 05:31:33 - INFO - __main__ - Step 59159: {'lr': 0.00033748446136451683, 'samples': 11358528, 'steps': 59158, 'loss/train': 1.4283231496810913} -11/07/2021 05:31:33 - INFO - __main__ - Step 59160: {'lr': 0.00033747949013040784, 'samples': 11358720, 'steps': 59159, 'loss/train': 1.6834089756011963} -11/07/2021 05:31:34 - INFO - __main__ - Step 59161: {'lr': 0.000337474518856882, 'samples': 11358912, 'steps': 59160, 'loss/train': 1.418248176574707} -11/07/2021 05:31:34 - INFO - __main__ - Step 59162: {'lr': 0.0003374695475439413, 'samples': 11359104, 'steps': 59161, 'loss/train': 1.3154340982437134} -11/07/2021 05:31:34 - INFO - __main__ - Step 59163: {'lr': 0.0003374645761915883, 'samples': 11359296, 'steps': 59162, 'loss/train': 1.5452814102172852} -11/07/2021 05:31:35 - INFO - __main__ - Step 59164: {'lr': 0.00033745960479982515, 'samples': 11359488, 'steps': 59163, 'loss/train': 1.2473890781402588} -11/07/2021 05:31:36 - INFO - __main__ - Step 59165: {'lr': 0.00033745463336865407, 'samples': 11359680, 'steps': 59164, 'loss/train': 1.9435663223266602} -11/07/2021 05:31:36 - INFO - __main__ - Step 59166: {'lr': 0.0003374496618980772, 'samples': 11359872, 'steps': 59165, 'loss/train': 1.3976154327392578} -11/07/2021 05:31:36 - INFO - __main__ - Step 59167: {'lr': 0.0003374446903880969, 'samples': 11360064, 'steps': 59166, 'loss/train': 1.1069480180740356} -11/07/2021 05:31:37 - INFO - __main__ - Step 59168: {'lr': 0.0003374397188387153, 'samples': 11360256, 'steps': 59167, 'loss/train': 0.9928202629089355} -11/07/2021 05:31:38 - INFO - __main__ - Step 59169: {'lr': 0.0003374347472499348, 'samples': 11360448, 'steps': 59168, 'loss/train': 1.838614821434021} -11/07/2021 05:31:38 - INFO - __main__ - Step 59170: {'lr': 0.00033742977562175756, 'samples': 11360640, 'steps': 59169, 'loss/train': 1.390904426574707} -11/07/2021 05:31:39 - INFO - __main__ - Step 59171: {'lr': 0.00033742480395418574, 'samples': 11360832, 'steps': 59170, 'loss/train': 0.5628034472465515} -11/07/2021 05:31:39 - INFO - __main__ - Step 59172: {'lr': 0.0003374198322472217, 'samples': 11361024, 'steps': 59171, 'loss/train': 1.525457739830017} -11/07/2021 05:31:39 - INFO - __main__ - Step 59173: {'lr': 0.00033741486050086763, 'samples': 11361216, 'steps': 59172, 'loss/train': 1.7237218618392944} -11/07/2021 05:31:40 - INFO - __main__ - Step 59174: {'lr': 0.00033740988871512574, 'samples': 11361408, 'steps': 59173, 'loss/train': 1.40801203250885} -11/07/2021 05:31:41 - INFO - __main__ - Step 59175: {'lr': 0.0003374049168899983, 'samples': 11361600, 'steps': 59174, 'loss/train': 1.4984530210494995} -11/07/2021 05:31:41 - INFO - __main__ - Step 59176: {'lr': 0.00033739994502548766, 'samples': 11361792, 'steps': 59175, 'loss/train': 1.8369193077087402} -11/07/2021 05:31:41 - INFO - __main__ - Step 59177: {'lr': 0.0003373949731215958, 'samples': 11361984, 'steps': 59176, 'loss/train': 1.3676249980926514} -11/07/2021 05:31:42 - INFO - __main__ - Step 59178: {'lr': 0.0003373900011783252, 'samples': 11362176, 'steps': 59177, 'loss/train': 1.2269113063812256} -11/07/2021 05:31:43 - INFO - __main__ - Step 59179: {'lr': 0.000337385029195678, 'samples': 11362368, 'steps': 59178, 'loss/train': 1.5693867206573486} -11/07/2021 05:31:43 - INFO - __main__ - Step 59180: {'lr': 0.00033738005717365646, 'samples': 11362560, 'steps': 59179, 'loss/train': 1.3788961172103882} -11/07/2021 05:31:43 - INFO - __main__ - Step 59181: {'lr': 0.00033737508511226283, 'samples': 11362752, 'steps': 59180, 'loss/train': 1.3437258005142212} -11/07/2021 05:31:44 - INFO - __main__ - Step 59182: {'lr': 0.00033737011301149933, 'samples': 11362944, 'steps': 59181, 'loss/train': 1.7837194204330444} -11/07/2021 05:31:44 - INFO - __main__ - Step 59183: {'lr': 0.0003373651408713682, 'samples': 11363136, 'steps': 59182, 'loss/train': 1.8440576791763306} -11/07/2021 05:31:44 - INFO - __main__ - Step 59184: {'lr': 0.00033736016869187165, 'samples': 11363328, 'steps': 59183, 'loss/train': 1.4563645124435425} -11/07/2021 05:31:45 - INFO - __main__ - Step 59185: {'lr': 0.0003373551964730119, 'samples': 11363520, 'steps': 59184, 'loss/train': 1.5352476835250854} -11/07/2021 05:31:46 - INFO - __main__ - Step 59186: {'lr': 0.00033735022421479136, 'samples': 11363712, 'steps': 59185, 'loss/train': 1.0495479106903076} -11/07/2021 05:31:46 - INFO - __main__ - Step 59187: {'lr': 0.00033734525191721215, 'samples': 11363904, 'steps': 59186, 'loss/train': 1.6984713077545166} -11/07/2021 05:31:47 - INFO - __main__ - Step 59188: {'lr': 0.00033734027958027646, 'samples': 11364096, 'steps': 59187, 'loss/train': 1.4865436553955078} -11/07/2021 05:31:47 - INFO - __main__ - Step 59189: {'lr': 0.00033733530720398666, 'samples': 11364288, 'steps': 59188, 'loss/train': 1.7580646276474} -11/07/2021 05:31:48 - INFO - __main__ - Step 59190: {'lr': 0.00033733033478834483, 'samples': 11364480, 'steps': 59189, 'loss/train': 1.0829137563705444} -11/07/2021 05:31:48 - INFO - __main__ - Step 59191: {'lr': 0.00033732536233335334, 'samples': 11364672, 'steps': 59190, 'loss/train': 1.535908579826355} -11/07/2021 05:31:49 - INFO - __main__ - Step 59192: {'lr': 0.0003373203898390145, 'samples': 11364864, 'steps': 59191, 'loss/train': 1.6308199167251587} -11/07/2021 05:31:49 - INFO - __main__ - Step 59193: {'lr': 0.0003373154173053303, 'samples': 11365056, 'steps': 59192, 'loss/train': 1.6149977445602417} -11/07/2021 05:31:49 - INFO - __main__ - Step 59194: {'lr': 0.0003373104447323031, 'samples': 11365248, 'steps': 59193, 'loss/train': 1.3431729078292847} -11/07/2021 05:31:50 - INFO - __main__ - Step 59195: {'lr': 0.00033730547211993525, 'samples': 11365440, 'steps': 59194, 'loss/train': 1.1915044784545898} -11/07/2021 05:31:51 - INFO - __main__ - Step 59196: {'lr': 0.00033730049946822883, 'samples': 11365632, 'steps': 59195, 'loss/train': 1.6732431650161743} -11/07/2021 05:31:51 - INFO - __main__ - Step 59197: {'lr': 0.0003372955267771862, 'samples': 11365824, 'steps': 59196, 'loss/train': 1.5167385339736938} -11/07/2021 05:31:51 - INFO - __main__ - Step 59198: {'lr': 0.00033729055404680953, 'samples': 11366016, 'steps': 59197, 'loss/train': 1.1936794519424438} -11/07/2021 05:31:52 - INFO - __main__ - Step 59199: {'lr': 0.00033728558127710115, 'samples': 11366208, 'steps': 59198, 'loss/train': 1.2849947214126587} -11/07/2021 05:31:53 - INFO - __main__ - Step 59200: {'lr': 0.0003372806084680632, 'samples': 11366400, 'steps': 59199, 'loss/train': 1.5322794914245605} -11/07/2021 05:31:53 - INFO - __main__ - Step 59201: {'lr': 0.0003372756356196979, 'samples': 11366592, 'steps': 59200, 'loss/train': 1.5394585132598877} -11/07/2021 05:31:54 - INFO - __main__ - Step 59202: {'lr': 0.0003372706627320076, 'samples': 11366784, 'steps': 59201, 'loss/train': 1.2204450368881226} -11/07/2021 05:31:54 - INFO - __main__ - Step 59203: {'lr': 0.0003372656898049944, 'samples': 11366976, 'steps': 59202, 'loss/train': 1.5385537147521973} -11/07/2021 05:31:54 - INFO - __main__ - Step 59204: {'lr': 0.0003372607168386607, 'samples': 11367168, 'steps': 59203, 'loss/train': 1.9647362232208252} -11/07/2021 05:31:55 - INFO - __main__ - Step 59205: {'lr': 0.00033725574383300865, 'samples': 11367360, 'steps': 59204, 'loss/train': 1.1615335941314697} -11/07/2021 05:31:56 - INFO - __main__ - Step 59206: {'lr': 0.0003372507707880406, 'samples': 11367552, 'steps': 59205, 'loss/train': 1.3706697225570679} -11/07/2021 05:31:56 - INFO - __main__ - Step 59207: {'lr': 0.0003372457977037586, 'samples': 11367744, 'steps': 59206, 'loss/train': 1.6664659976959229} -11/07/2021 05:31:56 - INFO - __main__ - Step 59208: {'lr': 0.000337240824580165, 'samples': 11367936, 'steps': 59207, 'loss/train': 1.6000585556030273} -11/07/2021 05:31:57 - INFO - __main__ - Step 59209: {'lr': 0.00033723585141726196, 'samples': 11368128, 'steps': 59208, 'loss/train': 1.851723074913025} -11/07/2021 05:31:58 - INFO - __main__ - Step 59210: {'lr': 0.0003372308782150519, 'samples': 11368320, 'steps': 59209, 'loss/train': 0.06964382529258728} -11/07/2021 05:31:58 - INFO - __main__ - Step 59211: {'lr': 0.0003372259049735369, 'samples': 11368512, 'steps': 59210, 'loss/train': 1.5304545164108276} -11/07/2021 05:31:59 - INFO - __main__ - Step 59212: {'lr': 0.00033722093169271934, 'samples': 11368704, 'steps': 59211, 'loss/train': 1.4610363245010376} -11/07/2021 05:31:59 - INFO - __main__ - Step 59213: {'lr': 0.00033721595837260125, 'samples': 11368896, 'steps': 59212, 'loss/train': 1.2715320587158203} -11/07/2021 05:31:59 - INFO - __main__ - Step 59214: {'lr': 0.00033721098501318506, 'samples': 11369088, 'steps': 59213, 'loss/train': 1.2266206741333008} -11/07/2021 05:32:00 - INFO - __main__ - Step 59215: {'lr': 0.00033720601161447294, 'samples': 11369280, 'steps': 59214, 'loss/train': 1.958136796951294} -11/07/2021 05:32:01 - INFO - __main__ - Step 59216: {'lr': 0.0003372010381764671, 'samples': 11369472, 'steps': 59215, 'loss/train': 1.6986103057861328} -11/07/2021 05:32:01 - INFO - __main__ - Step 59217: {'lr': 0.00033719606469916985, 'samples': 11369664, 'steps': 59216, 'loss/train': 1.4668993949890137} -11/07/2021 05:32:01 - INFO - __main__ - Step 59218: {'lr': 0.0003371910911825834, 'samples': 11369856, 'steps': 59217, 'loss/train': 2.378601312637329} -11/07/2021 05:32:02 - INFO - __main__ - Step 59219: {'lr': 0.00033718611762671003, 'samples': 11370048, 'steps': 59218, 'loss/train': 1.9074461460113525} -11/07/2021 05:32:02 - INFO - __main__ - Step 59220: {'lr': 0.0003371811440315519, 'samples': 11370240, 'steps': 59219, 'loss/train': 1.6932467222213745} -11/07/2021 05:32:03 - INFO - __main__ - Step 59221: {'lr': 0.0003371761703971113, 'samples': 11370432, 'steps': 59220, 'loss/train': 1.7494654655456543} -11/07/2021 05:32:03 - INFO - __main__ - Step 59222: {'lr': 0.0003371711967233905, 'samples': 11370624, 'steps': 59221, 'loss/train': 1.582100749015808} -11/07/2021 05:32:04 - INFO - __main__ - Step 59223: {'lr': 0.00033716622301039164, 'samples': 11370816, 'steps': 59222, 'loss/train': 1.5961817502975464} -11/07/2021 05:32:04 - INFO - __main__ - Step 59224: {'lr': 0.000337161249258117, 'samples': 11371008, 'steps': 59223, 'loss/train': 0.8752351403236389} -11/07/2021 05:32:05 - INFO - __main__ - Step 59225: {'lr': 0.0003371562754665689, 'samples': 11371200, 'steps': 59224, 'loss/train': 1.7890576124191284} -11/07/2021 05:32:05 - INFO - __main__ - Step 59226: {'lr': 0.0003371513016357496, 'samples': 11371392, 'steps': 59225, 'loss/train': 1.5614650249481201} -11/07/2021 05:32:06 - INFO - __main__ - Step 59227: {'lr': 0.0003371463277656611, 'samples': 11371584, 'steps': 59226, 'loss/train': 1.256270170211792} -11/07/2021 05:32:06 - INFO - __main__ - Step 59228: {'lr': 0.00033714135385630597, 'samples': 11371776, 'steps': 59227, 'loss/train': 1.6196098327636719} -11/07/2021 05:32:07 - INFO - __main__ - Step 59229: {'lr': 0.0003371363799076862, 'samples': 11371968, 'steps': 59228, 'loss/train': 1.5933330059051514} -11/07/2021 05:32:07 - INFO - __main__ - Step 59230: {'lr': 0.00033713140591980407, 'samples': 11372160, 'steps': 59229, 'loss/train': 1.7267251014709473} -11/07/2021 05:32:07 - INFO - __main__ - Step 59231: {'lr': 0.00033712643189266197, 'samples': 11372352, 'steps': 59230, 'loss/train': 1.4047694206237793} -11/07/2021 05:32:08 - INFO - __main__ - Step 59232: {'lr': 0.00033712145782626205, 'samples': 11372544, 'steps': 59231, 'loss/train': 1.4500529766082764} -11/07/2021 05:32:09 - INFO - __main__ - Step 59233: {'lr': 0.0003371164837206065, 'samples': 11372736, 'steps': 59232, 'loss/train': 1.6374399662017822} -11/07/2021 05:32:09 - INFO - __main__ - Step 59234: {'lr': 0.00033711150957569763, 'samples': 11372928, 'steps': 59233, 'loss/train': 1.4036811590194702} -11/07/2021 05:32:09 - INFO - __main__ - Step 59235: {'lr': 0.00033710653539153763, 'samples': 11373120, 'steps': 59234, 'loss/train': 1.540671467781067} -11/07/2021 05:32:10 - INFO - __main__ - Step 59236: {'lr': 0.0003371015611681288, 'samples': 11373312, 'steps': 59235, 'loss/train': 1.4164243936538696} -11/07/2021 05:32:11 - INFO - __main__ - Step 59237: {'lr': 0.0003370965869054733, 'samples': 11373504, 'steps': 59236, 'loss/train': 0.0903257355093956} -11/07/2021 05:32:11 - INFO - __main__ - Step 59238: {'lr': 0.0003370916126035735, 'samples': 11373696, 'steps': 59237, 'loss/train': 1.7022573947906494} -11/07/2021 05:32:11 - INFO - __main__ - Step 59239: {'lr': 0.0003370866382624315, 'samples': 11373888, 'steps': 59238, 'loss/train': 1.0951852798461914} -11/07/2021 05:32:12 - INFO - __main__ - Step 59240: {'lr': 0.00033708166388204963, 'samples': 11374080, 'steps': 59239, 'loss/train': 1.3774245977401733} -11/07/2021 05:32:12 - INFO - __main__ - Step 59241: {'lr': 0.0003370766894624301, 'samples': 11374272, 'steps': 59240, 'loss/train': 1.5817006826400757} -11/07/2021 05:32:13 - INFO - __main__ - Step 59242: {'lr': 0.00033707171500357516, 'samples': 11374464, 'steps': 59241, 'loss/train': 1.5087922811508179} -11/07/2021 05:32:14 - INFO - __main__ - Step 59243: {'lr': 0.000337066740505487, 'samples': 11374656, 'steps': 59242, 'loss/train': 2.273547410964966} -11/07/2021 05:32:14 - INFO - __main__ - Step 59244: {'lr': 0.00033706176596816795, 'samples': 11374848, 'steps': 59243, 'loss/train': 1.559385895729065} -11/07/2021 05:32:15 - INFO - __main__ - Step 59245: {'lr': 0.0003370567913916203, 'samples': 11375040, 'steps': 59244, 'loss/train': 1.7910820245742798} -11/07/2021 05:32:15 - INFO - __main__ - Step 59246: {'lr': 0.0003370518167758461, 'samples': 11375232, 'steps': 59245, 'loss/train': 1.7979004383087158} -11/07/2021 05:32:15 - INFO - __main__ - Step 59247: {'lr': 0.00033704684212084774, 'samples': 11375424, 'steps': 59246, 'loss/train': 1.5317434072494507} -11/07/2021 05:32:16 - INFO - __main__ - Step 59248: {'lr': 0.0003370418674266273, 'samples': 11375616, 'steps': 59247, 'loss/train': 1.1110860109329224} -11/07/2021 05:32:17 - INFO - __main__ - Step 59249: {'lr': 0.00033703689269318725, 'samples': 11375808, 'steps': 59248, 'loss/train': 1.7913658618927002} -11/07/2021 05:32:17 - INFO - __main__ - Step 59250: {'lr': 0.00033703191792052974, 'samples': 11376000, 'steps': 59249, 'loss/train': 1.4231507778167725} -11/07/2021 05:32:17 - INFO - __main__ - Step 59251: {'lr': 0.00033702694310865696, 'samples': 11376192, 'steps': 59250, 'loss/train': 1.6132559776306152} -11/07/2021 05:32:18 - INFO - __main__ - Step 59252: {'lr': 0.00033702196825757114, 'samples': 11376384, 'steps': 59251, 'loss/train': 1.4366536140441895} -11/07/2021 05:32:19 - INFO - __main__ - Step 59253: {'lr': 0.00033701699336727465, 'samples': 11376576, 'steps': 59252, 'loss/train': 1.3314954042434692} -11/07/2021 05:32:19 - INFO - __main__ - Step 59254: {'lr': 0.00033701201843776957, 'samples': 11376768, 'steps': 59253, 'loss/train': 1.6341077089309692} -11/07/2021 05:32:19 - INFO - __main__ - Step 59255: {'lr': 0.0003370070434690583, 'samples': 11376960, 'steps': 59254, 'loss/train': 1.0928893089294434} -11/07/2021 05:32:20 - INFO - __main__ - Step 59256: {'lr': 0.0003370020684611429, 'samples': 11377152, 'steps': 59255, 'loss/train': 1.1169596910476685} -11/07/2021 05:32:20 - INFO - __main__ - Step 59257: {'lr': 0.0003369970934140257, 'samples': 11377344, 'steps': 59256, 'loss/train': 1.2681905031204224} -11/07/2021 05:32:22 - INFO - __main__ - Step 59258: {'lr': 0.00033699211832770906, 'samples': 11377536, 'steps': 59257, 'loss/train': 1.5688832998275757} -11/07/2021 05:32:22 - INFO - __main__ - Step 59259: {'lr': 0.000336987143202195, 'samples': 11377728, 'steps': 59258, 'loss/train': 1.8637508153915405} -11/07/2021 05:32:22 - INFO - __main__ - Step 59260: {'lr': 0.000336982168037486, 'samples': 11377920, 'steps': 59259, 'loss/train': 1.576521635055542} -11/07/2021 05:32:23 - INFO - __main__ - Step 59261: {'lr': 0.0003369771928335841, 'samples': 11378112, 'steps': 59260, 'loss/train': 1.802741527557373} -11/07/2021 05:32:23 - INFO - __main__ - Step 59262: {'lr': 0.00033697221759049163, 'samples': 11378304, 'steps': 59261, 'loss/train': 1.3999284505844116} -11/07/2021 05:32:23 - INFO - __main__ - Step 59263: {'lr': 0.0003369672423082108, 'samples': 11378496, 'steps': 59262, 'loss/train': 1.166931390762329} -11/07/2021 05:32:24 - INFO - __main__ - Step 59264: {'lr': 0.00033696226698674386, 'samples': 11378688, 'steps': 59263, 'loss/train': 3.1869373321533203} -11/07/2021 05:32:25 - INFO - __main__ - Step 59265: {'lr': 0.0003369572916260931, 'samples': 11378880, 'steps': 59264, 'loss/train': 0.38798093795776367} -11/07/2021 05:32:25 - INFO - __main__ - Step 59266: {'lr': 0.0003369523162262608, 'samples': 11379072, 'steps': 59265, 'loss/train': 1.6349838972091675} -11/07/2021 05:32:26 - INFO - __main__ - Step 59267: {'lr': 0.00033694734078724904, 'samples': 11379264, 'steps': 59266, 'loss/train': 1.0898051261901855} -11/07/2021 05:32:26 - INFO - __main__ - Step 59268: {'lr': 0.00033694236530906014, 'samples': 11379456, 'steps': 59267, 'loss/train': 1.725724458694458} -11/07/2021 05:32:26 - INFO - __main__ - Step 59269: {'lr': 0.00033693738979169636, 'samples': 11379648, 'steps': 59268, 'loss/train': 1.2573586702346802} -11/07/2021 05:32:28 - INFO - __main__ - Step 59270: {'lr': 0.0003369324142351599, 'samples': 11379840, 'steps': 59269, 'loss/train': 0.08163659274578094} -11/07/2021 05:32:28 - INFO - __main__ - Step 59271: {'lr': 0.0003369274386394531, 'samples': 11380032, 'steps': 59270, 'loss/train': 1.5909442901611328} -11/07/2021 05:32:28 - INFO - __main__ - Step 59272: {'lr': 0.0003369224630045781, 'samples': 11380224, 'steps': 59271, 'loss/train': 1.4559556245803833} -11/07/2021 05:32:29 - INFO - __main__ - Step 59273: {'lr': 0.0003369174873305373, 'samples': 11380416, 'steps': 59272, 'loss/train': 1.5236685276031494} -11/07/2021 05:32:29 - INFO - __main__ - Step 59274: {'lr': 0.0003369125116173327, 'samples': 11380608, 'steps': 59273, 'loss/train': 1.7690908908843994} -11/07/2021 05:32:30 - INFO - __main__ - Step 59275: {'lr': 0.00033690753586496666, 'samples': 11380800, 'steps': 59274, 'loss/train': 1.5433930158615112} -11/07/2021 05:32:30 - INFO - __main__ - Step 59276: {'lr': 0.00033690256007344144, 'samples': 11380992, 'steps': 59275, 'loss/train': 1.5260899066925049} -11/07/2021 05:32:31 - INFO - __main__ - Step 59277: {'lr': 0.0003368975842427592, 'samples': 11381184, 'steps': 59276, 'loss/train': 1.5196844339370728} -11/07/2021 05:32:31 - INFO - __main__ - Step 59278: {'lr': 0.00033689260837292234, 'samples': 11381376, 'steps': 59277, 'loss/train': 1.7671854496002197} -11/07/2021 05:32:31 - INFO - __main__ - Step 59279: {'lr': 0.000336887632463933, 'samples': 11381568, 'steps': 59278, 'loss/train': 2.06708025932312} -11/07/2021 05:32:33 - INFO - __main__ - Step 59280: {'lr': 0.00033688265651579354, 'samples': 11381760, 'steps': 59279, 'loss/train': 1.5717920064926147} -11/07/2021 05:32:33 - INFO - __main__ - Step 59281: {'lr': 0.0003368776805285059, 'samples': 11381952, 'steps': 59280, 'loss/train': 1.348695158958435} -11/07/2021 05:32:33 - INFO - __main__ - Step 59282: {'lr': 0.0003368727045020726, 'samples': 11382144, 'steps': 59281, 'loss/train': 1.636444091796875} -11/07/2021 05:32:34 - INFO - __main__ - Step 59283: {'lr': 0.00033686772843649583, 'samples': 11382336, 'steps': 59282, 'loss/train': 1.4910632371902466} -11/07/2021 05:32:34 - INFO - __main__ - Step 59284: {'lr': 0.00033686275233177777, 'samples': 11382528, 'steps': 59283, 'loss/train': 1.386777639389038} -11/07/2021 05:32:34 - INFO - __main__ - Step 59285: {'lr': 0.00033685777618792066, 'samples': 11382720, 'steps': 59284, 'loss/train': 1.2180293798446655} -11/07/2021 05:32:36 - INFO - __main__ - Step 59286: {'lr': 0.0003368528000049269, 'samples': 11382912, 'steps': 59285, 'loss/train': 0.7874096632003784} -11/07/2021 05:32:36 - INFO - __main__ - Step 59287: {'lr': 0.00033684782378279847, 'samples': 11383104, 'steps': 59286, 'loss/train': 1.564002275466919} -11/07/2021 05:32:36 - INFO - __main__ - Step 59288: {'lr': 0.0003368428475215378, 'samples': 11383296, 'steps': 59287, 'loss/train': 1.4068653583526611} -11/07/2021 05:32:37 - INFO - __main__ - Step 59289: {'lr': 0.00033683787122114713, 'samples': 11383488, 'steps': 59288, 'loss/train': 1.694163203239441} -11/07/2021 05:32:37 - INFO - __main__ - Step 59290: {'lr': 0.0003368328948816286, 'samples': 11383680, 'steps': 59289, 'loss/train': 1.6267966032028198} -11/07/2021 05:32:38 - INFO - __main__ - Step 59291: {'lr': 0.0003368279185029845, 'samples': 11383872, 'steps': 59290, 'loss/train': 1.035529375076294} -11/07/2021 05:32:38 - INFO - __main__ - Step 59292: {'lr': 0.0003368229420852171, 'samples': 11384064, 'steps': 59291, 'loss/train': 1.2174526453018188} -11/07/2021 05:32:39 - INFO - __main__ - Step 59293: {'lr': 0.00033681796562832865, 'samples': 11384256, 'steps': 59292, 'loss/train': 1.5012623071670532} -11/07/2021 05:32:39 - INFO - __main__ - Step 59294: {'lr': 0.0003368129891323213, 'samples': 11384448, 'steps': 59293, 'loss/train': 0.7952998876571655} -11/07/2021 05:32:39 - INFO - __main__ - Step 59295: {'lr': 0.0003368080125971974, 'samples': 11384640, 'steps': 59294, 'loss/train': 1.5874347686767578} -11/07/2021 05:32:41 - INFO - __main__ - Step 59296: {'lr': 0.00033680303602295913, 'samples': 11384832, 'steps': 59295, 'loss/train': 1.1530067920684814} -11/07/2021 05:32:41 - INFO - __main__ - Step 59297: {'lr': 0.00033679805940960877, 'samples': 11385024, 'steps': 59296, 'loss/train': 1.5158717632293701} -11/07/2021 05:32:41 - INFO - __main__ - Step 59298: {'lr': 0.0003367930827571485, 'samples': 11385216, 'steps': 59297, 'loss/train': 1.4791208505630493} -11/07/2021 05:32:42 - INFO - __main__ - Step 59299: {'lr': 0.00033678810606558077, 'samples': 11385408, 'steps': 59298, 'loss/train': 1.3377068042755127} -11/07/2021 05:32:42 - INFO - __main__ - Step 59300: {'lr': 0.00033678312933490753, 'samples': 11385600, 'steps': 59299, 'loss/train': 1.330207347869873} -11/07/2021 05:32:43 - INFO - __main__ - Step 59301: {'lr': 0.00033677815256513114, 'samples': 11385792, 'steps': 59300, 'loss/train': 1.4737035036087036} -11/07/2021 05:32:43 - INFO - __main__ - Step 59302: {'lr': 0.0003367731757562538, 'samples': 11385984, 'steps': 59301, 'loss/train': 1.0610145330429077} -11/07/2021 05:32:44 - INFO - __main__ - Step 59303: {'lr': 0.0003367681989082779, 'samples': 11386176, 'steps': 59302, 'loss/train': 1.8311078548431396} -11/07/2021 05:32:44 - INFO - __main__ - Step 59304: {'lr': 0.0003367632220212056, 'samples': 11386368, 'steps': 59303, 'loss/train': 1.2422478199005127} -11/07/2021 05:32:44 - INFO - __main__ - Step 59305: {'lr': 0.0003367582450950391, 'samples': 11386560, 'steps': 59304, 'loss/train': 1.722801685333252} -11/07/2021 05:32:45 - INFO - __main__ - Step 59306: {'lr': 0.0003367532681297807, 'samples': 11386752, 'steps': 59305, 'loss/train': 1.5947935581207275} -11/07/2021 05:32:46 - INFO - __main__ - Step 59307: {'lr': 0.0003367482911254325, 'samples': 11386944, 'steps': 59306, 'loss/train': 1.0572227239608765} -11/07/2021 05:32:46 - INFO - __main__ - Step 59308: {'lr': 0.000336743314081997, 'samples': 11387136, 'steps': 59307, 'loss/train': 1.228071689605713} -11/07/2021 05:32:46 - INFO - __main__ - Step 59309: {'lr': 0.0003367383369994762, 'samples': 11387328, 'steps': 59308, 'loss/train': 1.5417029857635498} -11/07/2021 05:32:47 - INFO - __main__ - Step 59310: {'lr': 0.0003367333598778725, 'samples': 11387520, 'steps': 59309, 'loss/train': 1.4989715814590454} -11/07/2021 05:32:48 - INFO - __main__ - Step 59311: {'lr': 0.0003367283827171881, 'samples': 11387712, 'steps': 59310, 'loss/train': 1.4128915071487427} -11/07/2021 05:32:48 - INFO - __main__ - Step 59312: {'lr': 0.0003367234055174252, 'samples': 11387904, 'steps': 59311, 'loss/train': 0.8536984920501709} -11/07/2021 05:32:49 - INFO - __main__ - Step 59313: {'lr': 0.00033671842827858605, 'samples': 11388096, 'steps': 59312, 'loss/train': 1.2938698530197144} -11/07/2021 05:32:49 - INFO - __main__ - Step 59314: {'lr': 0.000336713451000673, 'samples': 11388288, 'steps': 59313, 'loss/train': 0.43849876523017883} -11/07/2021 05:32:49 - INFO - __main__ - Step 59315: {'lr': 0.00033670847368368805, 'samples': 11388480, 'steps': 59314, 'loss/train': 1.4717206954956055} -11/07/2021 05:32:50 - INFO - __main__ - Step 59316: {'lr': 0.00033670349632763377, 'samples': 11388672, 'steps': 59315, 'loss/train': 1.661509394645691} -11/07/2021 05:32:51 - INFO - __main__ - Step 59317: {'lr': 0.0003366985189325121, 'samples': 11388864, 'steps': 59316, 'loss/train': 2.1882638931274414} -11/07/2021 05:32:51 - INFO - __main__ - Step 59318: {'lr': 0.00033669354149832556, 'samples': 11389056, 'steps': 59317, 'loss/train': 1.328861951828003} -11/07/2021 05:32:52 - INFO - __main__ - Step 59319: {'lr': 0.0003366885640250761, 'samples': 11389248, 'steps': 59318, 'loss/train': 1.3705939054489136} -11/07/2021 05:32:52 - INFO - __main__ - Step 59320: {'lr': 0.00033668358651276614, 'samples': 11389440, 'steps': 59319, 'loss/train': 1.318787693977356} -11/07/2021 05:32:52 - INFO - __main__ - Step 59321: {'lr': 0.000336678608961398, 'samples': 11389632, 'steps': 59320, 'loss/train': 0.34411898255348206} -11/07/2021 05:32:53 - INFO - __main__ - Step 59322: {'lr': 0.00033667363137097374, 'samples': 11389824, 'steps': 59321, 'loss/train': 1.7547041177749634} -11/07/2021 05:32:54 - INFO - __main__ - Step 59323: {'lr': 0.0003366686537414957, 'samples': 11390016, 'steps': 59322, 'loss/train': 1.3817046880722046} -11/07/2021 05:32:54 - INFO - __main__ - Step 59324: {'lr': 0.00033666367607296607, 'samples': 11390208, 'steps': 59323, 'loss/train': 1.3879252672195435} -11/07/2021 05:32:54 - INFO - __main__ - Step 59325: {'lr': 0.0003366586983653871, 'samples': 11390400, 'steps': 59324, 'loss/train': 1.6638904809951782} -11/07/2021 05:32:55 - INFO - __main__ - Step 59326: {'lr': 0.0003366537206187611, 'samples': 11390592, 'steps': 59325, 'loss/train': 2.0016846656799316} -11/07/2021 05:32:56 - INFO - __main__ - Step 59327: {'lr': 0.0003366487428330903, 'samples': 11390784, 'steps': 59326, 'loss/train': 1.3757736682891846} -11/07/2021 05:32:56 - INFO - __main__ - Step 59328: {'lr': 0.0003366437650083768, 'samples': 11390976, 'steps': 59327, 'loss/train': 1.6433217525482178} -11/07/2021 05:32:57 - INFO - __main__ - Step 59329: {'lr': 0.0003366387871446231, 'samples': 11391168, 'steps': 59328, 'loss/train': 1.3558849096298218} -11/07/2021 05:32:57 - INFO - __main__ - Step 59330: {'lr': 0.00033663380924183123, 'samples': 11391360, 'steps': 59329, 'loss/train': 1.678908109664917} -11/07/2021 05:32:57 - INFO - __main__ - Step 59331: {'lr': 0.0003366288313000035, 'samples': 11391552, 'steps': 59330, 'loss/train': 0.7552284598350525} -11/07/2021 05:32:58 - INFO - __main__ - Step 59332: {'lr': 0.00033662385331914216, 'samples': 11391744, 'steps': 59331, 'loss/train': 0.9863568544387817} -11/07/2021 05:32:59 - INFO - __main__ - Step 59333: {'lr': 0.0003366188752992495, 'samples': 11391936, 'steps': 59332, 'loss/train': 1.226762294769287} -11/07/2021 05:32:59 - INFO - __main__ - Step 59334: {'lr': 0.00033661389724032765, 'samples': 11392128, 'steps': 59333, 'loss/train': 1.5386178493499756} -11/07/2021 05:32:59 - INFO - __main__ - Step 59335: {'lr': 0.0003366089191423789, 'samples': 11392320, 'steps': 59334, 'loss/train': 1.459900140762329} -11/07/2021 05:33:00 - INFO - __main__ - Step 59336: {'lr': 0.00033660394100540553, 'samples': 11392512, 'steps': 59335, 'loss/train': 1.12985360622406} -11/07/2021 05:33:00 - INFO - __main__ - Step 59337: {'lr': 0.00033659896282940975, 'samples': 11392704, 'steps': 59336, 'loss/train': 1.3907475471496582} -11/07/2021 05:33:01 - INFO - __main__ - Step 59338: {'lr': 0.0003365939846143938, 'samples': 11392896, 'steps': 59337, 'loss/train': 1.3147752285003662} -11/07/2021 05:33:02 - INFO - __main__ - Step 59339: {'lr': 0.00033658900636036, 'samples': 11393088, 'steps': 59338, 'loss/train': 1.8776735067367554} -11/07/2021 05:33:02 - INFO - __main__ - Step 59340: {'lr': 0.00033658402806731054, 'samples': 11393280, 'steps': 59339, 'loss/train': 1.6488615274429321} -11/07/2021 05:33:02 - INFO - __main__ - Step 59341: {'lr': 0.00033657904973524754, 'samples': 11393472, 'steps': 59340, 'loss/train': 1.708038330078125} -11/07/2021 05:33:03 - INFO - __main__ - Step 59342: {'lr': 0.00033657407136417343, 'samples': 11393664, 'steps': 59341, 'loss/train': 1.3855866193771362} -11/07/2021 05:33:04 - INFO - __main__ - Step 59343: {'lr': 0.0003365690929540904, 'samples': 11393856, 'steps': 59342, 'loss/train': 1.318496823310852} -11/07/2021 05:33:04 - INFO - __main__ - Step 59344: {'lr': 0.0003365641145050006, 'samples': 11394048, 'steps': 59343, 'loss/train': 1.5625256299972534} -11/07/2021 05:33:04 - INFO - __main__ - Step 59345: {'lr': 0.0003365591360169064, 'samples': 11394240, 'steps': 59344, 'loss/train': 1.9332079887390137} -11/07/2021 05:33:05 - INFO - __main__ - Step 59346: {'lr': 0.00033655415748981, 'samples': 11394432, 'steps': 59345, 'loss/train': 1.0971368551254272} -11/07/2021 05:33:05 - INFO - __main__ - Step 59347: {'lr': 0.00033654917892371363, 'samples': 11394624, 'steps': 59346, 'loss/train': 1.528804898262024} -11/07/2021 05:33:06 - INFO - __main__ - Step 59348: {'lr': 0.00033654420031861953, 'samples': 11394816, 'steps': 59347, 'loss/train': 1.6762912273406982} -11/07/2021 05:33:06 - INFO - __main__ - Step 59349: {'lr': 0.0003365392216745299, 'samples': 11395008, 'steps': 59348, 'loss/train': 1.4819291830062866} -11/07/2021 05:33:07 - INFO - __main__ - Step 59350: {'lr': 0.0003365342429914471, 'samples': 11395200, 'steps': 59349, 'loss/train': 0.7258336544036865} -11/07/2021 05:33:07 - INFO - __main__ - Step 59351: {'lr': 0.0003365292642693733, 'samples': 11395392, 'steps': 59350, 'loss/train': 1.3492298126220703} -11/07/2021 05:33:07 - INFO - __main__ - Step 59352: {'lr': 0.0003365242855083107, 'samples': 11395584, 'steps': 59351, 'loss/train': 1.3703134059906006} -11/07/2021 05:33:09 - INFO - __main__ - Step 59353: {'lr': 0.00033651930670826157, 'samples': 11395776, 'steps': 59352, 'loss/train': 1.5654878616333008} -11/07/2021 05:33:09 - INFO - __main__ - Step 59354: {'lr': 0.0003365143278692283, 'samples': 11395968, 'steps': 59353, 'loss/train': 1.1283808946609497} -11/07/2021 05:33:09 - INFO - __main__ - Step 59355: {'lr': 0.0003365093489912129, 'samples': 11396160, 'steps': 59354, 'loss/train': 1.5003823041915894} -11/07/2021 05:33:10 - INFO - __main__ - Step 59356: {'lr': 0.00033650437007421775, 'samples': 11396352, 'steps': 59355, 'loss/train': 0.9820141196250916} -11/07/2021 05:33:10 - INFO - __main__ - Step 59357: {'lr': 0.0003364993911182451, 'samples': 11396544, 'steps': 59356, 'loss/train': 1.8636622428894043} -11/07/2021 05:33:11 - INFO - __main__ - Step 59358: {'lr': 0.0003364944121232971, 'samples': 11396736, 'steps': 59357, 'loss/train': 1.063173532485962} -11/07/2021 05:33:11 - INFO - __main__ - Step 59359: {'lr': 0.0003364894330893761, 'samples': 11396928, 'steps': 59358, 'loss/train': 1.4838443994522095} -11/07/2021 05:33:12 - INFO - __main__ - Step 59360: {'lr': 0.0003364844540164843, 'samples': 11397120, 'steps': 59359, 'loss/train': 1.0383440256118774} -11/07/2021 05:33:12 - INFO - __main__ - Step 59361: {'lr': 0.00033647947490462386, 'samples': 11397312, 'steps': 59360, 'loss/train': 1.0313713550567627} -11/07/2021 05:33:12 - INFO - __main__ - Step 59362: {'lr': 0.0003364744957537972, 'samples': 11397504, 'steps': 59361, 'loss/train': 0.9415063858032227} -11/07/2021 05:33:13 - INFO - __main__ - Step 59363: {'lr': 0.00033646951656400635, 'samples': 11397696, 'steps': 59362, 'loss/train': 1.3204634189605713} -11/07/2021 05:33:14 - INFO - __main__ - Step 59364: {'lr': 0.0003364645373352538, 'samples': 11397888, 'steps': 59363, 'loss/train': 1.4480024576187134} -11/07/2021 05:33:15 - INFO - __main__ - Step 59365: {'lr': 0.00033645955806754156, 'samples': 11398080, 'steps': 59364, 'loss/train': 1.6689462661743164} -11/07/2021 05:33:15 - INFO - __main__ - Step 59366: {'lr': 0.00033645457876087205, 'samples': 11398272, 'steps': 59365, 'loss/train': 1.1205670833587646} -11/07/2021 05:33:15 - INFO - __main__ - Step 59367: {'lr': 0.0003364495994152474, 'samples': 11398464, 'steps': 59366, 'loss/train': 0.1568594127893448} -11/07/2021 05:33:16 - INFO - __main__ - Step 59368: {'lr': 0.00033644462003066996, 'samples': 11398656, 'steps': 59367, 'loss/train': 1.8210835456848145} -11/07/2021 05:33:17 - INFO - __main__ - Step 59369: {'lr': 0.00033643964060714183, 'samples': 11398848, 'steps': 59368, 'loss/train': 2.4489545822143555} -11/07/2021 05:33:18 - INFO - __main__ - Step 59370: {'lr': 0.00033643466114466537, 'samples': 11399040, 'steps': 59369, 'loss/train': 1.9088011980056763} -11/07/2021 05:33:18 - INFO - __main__ - Step 59371: {'lr': 0.0003364296816432428, 'samples': 11399232, 'steps': 59370, 'loss/train': 2.0525920391082764} -11/07/2021 05:33:18 - INFO - __main__ - Step 59372: {'lr': 0.0003364247021028763, 'samples': 11399424, 'steps': 59371, 'loss/train': 1.4817010164260864} -11/07/2021 05:33:19 - INFO - __main__ - Step 59373: {'lr': 0.0003364197225235682, 'samples': 11399616, 'steps': 59372, 'loss/train': 1.2891323566436768} -11/07/2021 05:33:19 - INFO - __main__ - Step 59374: {'lr': 0.0003364147429053207, 'samples': 11399808, 'steps': 59373, 'loss/train': 1.1993621587753296} -11/07/2021 05:33:20 - INFO - __main__ - Step 59375: {'lr': 0.00033640976324813605, 'samples': 11400000, 'steps': 59374, 'loss/train': 0.8058171272277832} -11/07/2021 05:33:20 - INFO - __main__ - Step 59376: {'lr': 0.00033640478355201646, 'samples': 11400192, 'steps': 59375, 'loss/train': 1.5635567903518677} -11/07/2021 05:33:21 - INFO - __main__ - Step 59377: {'lr': 0.00033639980381696425, 'samples': 11400384, 'steps': 59376, 'loss/train': 1.3642702102661133} -11/07/2021 05:33:21 - INFO - __main__ - Step 59378: {'lr': 0.0003363948240429816, 'samples': 11400576, 'steps': 59377, 'loss/train': 1.5507620573043823} -11/07/2021 05:33:21 - INFO - __main__ - Step 59379: {'lr': 0.0003363898442300708, 'samples': 11400768, 'steps': 59378, 'loss/train': 1.1319968700408936} -11/07/2021 05:33:22 - INFO - __main__ - Step 59380: {'lr': 0.0003363848643782341, 'samples': 11400960, 'steps': 59379, 'loss/train': 1.0250396728515625} -11/07/2021 05:33:23 - INFO - __main__ - Step 59381: {'lr': 0.00033637988448747365, 'samples': 11401152, 'steps': 59380, 'loss/train': 0.688690721988678} -11/07/2021 05:33:23 - INFO - __main__ - Step 59382: {'lr': 0.00033637490455779175, 'samples': 11401344, 'steps': 59381, 'loss/train': 1.5102119445800781} -11/07/2021 05:33:23 - INFO - __main__ - Step 59383: {'lr': 0.0003363699245891907, 'samples': 11401536, 'steps': 59382, 'loss/train': 1.6710865497589111} -11/07/2021 05:33:24 - INFO - __main__ - Step 59384: {'lr': 0.00033636494458167267, 'samples': 11401728, 'steps': 59383, 'loss/train': 0.4653959572315216} -11/07/2021 05:33:24 - INFO - __main__ - Step 59385: {'lr': 0.00033635996453523987, 'samples': 11401920, 'steps': 59384, 'loss/train': 1.7350064516067505} -11/07/2021 05:33:25 - INFO - __main__ - Step 59386: {'lr': 0.0003363549844498947, 'samples': 11402112, 'steps': 59385, 'loss/train': 1.4382284879684448} -11/07/2021 05:33:26 - INFO - __main__ - Step 59387: {'lr': 0.00033635000432563926, 'samples': 11402304, 'steps': 59386, 'loss/train': 0.8000993132591248} -11/07/2021 05:33:26 - INFO - __main__ - Step 59388: {'lr': 0.0003363450241624759, 'samples': 11402496, 'steps': 59387, 'loss/train': 1.293431282043457} -11/07/2021 05:33:26 - INFO - __main__ - Step 59389: {'lr': 0.00033634004396040673, 'samples': 11402688, 'steps': 59388, 'loss/train': 1.5316147804260254} -11/07/2021 05:33:27 - INFO - __main__ - Step 59390: {'lr': 0.0003363350637194341, 'samples': 11402880, 'steps': 59389, 'loss/train': 1.2599658966064453} -11/07/2021 05:33:28 - INFO - __main__ - Step 59391: {'lr': 0.0003363300834395602, 'samples': 11403072, 'steps': 59390, 'loss/train': 1.994467854499817} -11/07/2021 05:33:28 - INFO - __main__ - Step 59392: {'lr': 0.0003363251031207873, 'samples': 11403264, 'steps': 59391, 'loss/train': 1.5025508403778076} -11/07/2021 05:33:28 - INFO - __main__ - Step 59393: {'lr': 0.00033632012276311763, 'samples': 11403456, 'steps': 59392, 'loss/train': 1.3745367527008057} -11/07/2021 05:33:29 - INFO - __main__ - Step 59394: {'lr': 0.00033631514236655345, 'samples': 11403648, 'steps': 59393, 'loss/train': 2.2225964069366455} -11/07/2021 05:33:29 - INFO - __main__ - Step 59395: {'lr': 0.00033631016193109704, 'samples': 11403840, 'steps': 59394, 'loss/train': 1.3247920274734497} -11/07/2021 05:33:30 - INFO - __main__ - Step 59396: {'lr': 0.00033630518145675057, 'samples': 11404032, 'steps': 59395, 'loss/train': 1.5393571853637695} -11/07/2021 05:33:30 - INFO - __main__ - Step 59397: {'lr': 0.0003363002009435163, 'samples': 11404224, 'steps': 59396, 'loss/train': 1.3608369827270508} -11/07/2021 05:33:31 - INFO - __main__ - Step 59398: {'lr': 0.00033629522039139656, 'samples': 11404416, 'steps': 59397, 'loss/train': 1.306970238685608} -11/07/2021 05:33:31 - INFO - __main__ - Step 59399: {'lr': 0.00033629023980039346, 'samples': 11404608, 'steps': 59398, 'loss/train': 1.4013481140136719} -11/07/2021 05:33:32 - INFO - __main__ - Step 59400: {'lr': 0.00033628525917050935, 'samples': 11404800, 'steps': 59399, 'loss/train': 0.9148676991462708} -11/07/2021 05:33:32 - INFO - __main__ - Step 59401: {'lr': 0.0003362802785017464, 'samples': 11404992, 'steps': 59400, 'loss/train': 1.1169158220291138} -11/07/2021 05:33:33 - INFO - __main__ - Step 59402: {'lr': 0.00033627529779410695, 'samples': 11405184, 'steps': 59401, 'loss/train': 1.1892825365066528} -11/07/2021 05:33:33 - INFO - __main__ - Step 59403: {'lr': 0.0003362703170475931, 'samples': 11405376, 'steps': 59402, 'loss/train': 1.4537960290908813} -11/07/2021 05:33:34 - INFO - __main__ - Step 59404: {'lr': 0.00033626533626220724, 'samples': 11405568, 'steps': 59403, 'loss/train': 1.6124074459075928} -11/07/2021 05:33:34 - INFO - __main__ - Step 59405: {'lr': 0.0003362603554379515, 'samples': 11405760, 'steps': 59404, 'loss/train': 1.7371422052383423} -11/07/2021 05:33:34 - INFO - __main__ - Step 59406: {'lr': 0.0003362553745748281, 'samples': 11405952, 'steps': 59405, 'loss/train': 1.1758849620819092} -11/07/2021 05:33:36 - INFO - __main__ - Step 59407: {'lr': 0.00033625039367283957, 'samples': 11406144, 'steps': 59406, 'loss/train': 1.7903153896331787} -11/07/2021 05:33:36 - INFO - __main__ - Step 59408: {'lr': 0.00033624541273198785, 'samples': 11406336, 'steps': 59407, 'loss/train': 1.4561078548431396} -11/07/2021 05:33:36 - INFO - __main__ - Step 59409: {'lr': 0.0003362404317522752, 'samples': 11406528, 'steps': 59408, 'loss/train': 1.1592931747436523} -11/07/2021 05:33:37 - INFO - __main__ - Step 59410: {'lr': 0.000336235450733704, 'samples': 11406720, 'steps': 59409, 'loss/train': 1.768731713294983} -11/07/2021 05:33:37 - INFO - __main__ - Step 59411: {'lr': 0.00033623046967627647, 'samples': 11406912, 'steps': 59410, 'loss/train': 1.1054468154907227} -11/07/2021 05:33:38 - INFO - __main__ - Step 59412: {'lr': 0.00033622548857999477, 'samples': 11407104, 'steps': 59411, 'loss/train': 2.166207790374756} -11/07/2021 05:33:38 - INFO - __main__ - Step 59413: {'lr': 0.00033622050744486117, 'samples': 11407296, 'steps': 59412, 'loss/train': 1.1738817691802979} -11/07/2021 05:33:39 - INFO - __main__ - Step 59414: {'lr': 0.000336215526270878, 'samples': 11407488, 'steps': 59413, 'loss/train': 1.745837926864624} -11/07/2021 05:33:39 - INFO - __main__ - Step 59415: {'lr': 0.00033621054505804745, 'samples': 11407680, 'steps': 59414, 'loss/train': 1.676180124282837} -11/07/2021 05:33:40 - INFO - __main__ - Step 59416: {'lr': 0.0003362055638063717, 'samples': 11407872, 'steps': 59415, 'loss/train': 1.809029221534729} -11/07/2021 05:33:40 - INFO - __main__ - Step 59417: {'lr': 0.00033620058251585314, 'samples': 11408064, 'steps': 59416, 'loss/train': 0.9265207648277283} -11/07/2021 05:33:41 - INFO - __main__ - Step 59418: {'lr': 0.00033619560118649383, 'samples': 11408256, 'steps': 59417, 'loss/train': 1.4864901304244995} -11/07/2021 05:33:41 - INFO - __main__ - Step 59419: {'lr': 0.0003361906198182961, 'samples': 11408448, 'steps': 59418, 'loss/train': 1.5386531352996826} -11/07/2021 05:33:42 - INFO - __main__ - Step 59420: {'lr': 0.0003361856384112623, 'samples': 11408640, 'steps': 59419, 'loss/train': 1.6746221780776978} -11/07/2021 05:33:42 - INFO - __main__ - Step 59421: {'lr': 0.00033618065696539457, 'samples': 11408832, 'steps': 59420, 'loss/train': 1.4639761447906494} -11/07/2021 05:33:42 - INFO - __main__ - Step 59422: {'lr': 0.00033617567548069517, 'samples': 11409024, 'steps': 59421, 'loss/train': 0.8389047980308533} -11/07/2021 05:33:43 - INFO - __main__ - Step 59423: {'lr': 0.00033617069395716626, 'samples': 11409216, 'steps': 59422, 'loss/train': 1.4436959028244019} -11/07/2021 05:33:44 - INFO - __main__ - Step 59424: {'lr': 0.0003361657123948103, 'samples': 11409408, 'steps': 59423, 'loss/train': 1.450130581855774} -11/07/2021 05:33:44 - INFO - __main__ - Step 59425: {'lr': 0.00033616073079362923, 'samples': 11409600, 'steps': 59424, 'loss/train': 1.641268253326416} -11/07/2021 05:33:44 - INFO - __main__ - Step 59426: {'lr': 0.00033615574915362556, 'samples': 11409792, 'steps': 59425, 'loss/train': 1.3853462934494019} -11/07/2021 05:33:45 - INFO - __main__ - Step 59427: {'lr': 0.0003361507674748015, 'samples': 11409984, 'steps': 59426, 'loss/train': 1.1510624885559082} -11/07/2021 05:33:46 - INFO - __main__ - Step 59428: {'lr': 0.00033614578575715914, 'samples': 11410176, 'steps': 59427, 'loss/train': 1.7111918926239014} -11/07/2021 05:33:46 - INFO - __main__ - Step 59429: {'lr': 0.0003361408040007008, 'samples': 11410368, 'steps': 59428, 'loss/train': 1.0449142456054688} -11/07/2021 05:33:46 - INFO - __main__ - Step 59430: {'lr': 0.00033613582220542884, 'samples': 11410560, 'steps': 59429, 'loss/train': 1.3424932956695557} -11/07/2021 05:33:47 - INFO - __main__ - Step 59431: {'lr': 0.00033613084037134534, 'samples': 11410752, 'steps': 59430, 'loss/train': 1.526412010192871} -11/07/2021 05:33:47 - INFO - __main__ - Step 59432: {'lr': 0.00033612585849845256, 'samples': 11410944, 'steps': 59431, 'loss/train': 1.7384799718856812} -11/07/2021 05:33:48 - INFO - __main__ - Step 59433: {'lr': 0.00033612087658675287, 'samples': 11411136, 'steps': 59432, 'loss/train': 1.1954818964004517} -11/07/2021 05:33:49 - INFO - __main__ - Step 59434: {'lr': 0.0003361158946362485, 'samples': 11411328, 'steps': 59433, 'loss/train': 1.625868320465088} -11/07/2021 05:33:49 - INFO - __main__ - Step 59435: {'lr': 0.00033611091264694156, 'samples': 11411520, 'steps': 59434, 'loss/train': 0.24433954060077667} -11/07/2021 05:33:49 - INFO - __main__ - Step 59436: {'lr': 0.0003361059306188344, 'samples': 11411712, 'steps': 59435, 'loss/train': 1.3391706943511963} -11/07/2021 05:33:50 - INFO - __main__ - Step 59437: {'lr': 0.0003361009485519292, 'samples': 11411904, 'steps': 59436, 'loss/train': 0.8222254514694214} -11/07/2021 05:33:51 - INFO - __main__ - Step 59438: {'lr': 0.0003360959664462282, 'samples': 11412096, 'steps': 59437, 'loss/train': 1.3256622552871704} -11/07/2021 05:33:51 - INFO - __main__ - Step 59439: {'lr': 0.0003360909843017338, 'samples': 11412288, 'steps': 59438, 'loss/train': 1.7633172273635864} -11/07/2021 05:33:52 - INFO - __main__ - Step 59440: {'lr': 0.0003360860021184481, 'samples': 11412480, 'steps': 59439, 'loss/train': 1.453478217124939} -11/07/2021 05:33:52 - INFO - __main__ - Step 59441: {'lr': 0.0003360810198963733, 'samples': 11412672, 'steps': 59440, 'loss/train': 1.3727055788040161} -11/07/2021 05:33:52 - INFO - __main__ - Step 59442: {'lr': 0.0003360760376355118, 'samples': 11412864, 'steps': 59441, 'loss/train': 1.7543045282363892} -11/07/2021 05:33:53 - INFO - __main__ - Step 59443: {'lr': 0.00033607105533586573, 'samples': 11413056, 'steps': 59442, 'loss/train': 1.4854484796524048} -11/07/2021 05:33:54 - INFO - __main__ - Step 59444: {'lr': 0.0003360660729974374, 'samples': 11413248, 'steps': 59443, 'loss/train': 1.4913972616195679} -11/07/2021 05:33:54 - INFO - __main__ - Step 59445: {'lr': 0.00033606109062022906, 'samples': 11413440, 'steps': 59444, 'loss/train': 0.49917852878570557} -11/07/2021 05:33:54 - INFO - __main__ - Step 59446: {'lr': 0.0003360561082042428, 'samples': 11413632, 'steps': 59445, 'loss/train': 1.382643699645996} -11/07/2021 05:33:55 - INFO - __main__ - Step 59447: {'lr': 0.00033605112574948106, 'samples': 11413824, 'steps': 59446, 'loss/train': 1.754879117012024} -11/07/2021 05:33:56 - INFO - __main__ - Step 59448: {'lr': 0.000336046143255946, 'samples': 11414016, 'steps': 59447, 'loss/train': 0.3582473695278168} -11/07/2021 05:33:56 - INFO - __main__ - Step 59449: {'lr': 0.0003360411607236399, 'samples': 11414208, 'steps': 59448, 'loss/train': 1.2509737014770508} -11/07/2021 05:33:57 - INFO - __main__ - Step 59450: {'lr': 0.0003360361781525649, 'samples': 11414400, 'steps': 59449, 'loss/train': 1.4894764423370361} -11/07/2021 05:33:57 - INFO - __main__ - Step 59451: {'lr': 0.00033603119554272343, 'samples': 11414592, 'steps': 59450, 'loss/train': 1.4741876125335693} -11/07/2021 05:33:57 - INFO - __main__ - Step 59452: {'lr': 0.0003360262128941176, 'samples': 11414784, 'steps': 59451, 'loss/train': 1.1519569158554077} -11/07/2021 05:33:58 - INFO - __main__ - Step 59453: {'lr': 0.00033602123020674965, 'samples': 11414976, 'steps': 59452, 'loss/train': 1.4954636096954346} -11/07/2021 05:33:59 - INFO - __main__ - Step 59454: {'lr': 0.0003360162474806219, 'samples': 11415168, 'steps': 59453, 'loss/train': 1.335933804512024} -11/07/2021 05:33:59 - INFO - __main__ - Step 59455: {'lr': 0.0003360112647157366, 'samples': 11415360, 'steps': 59454, 'loss/train': 0.730075478553772} -11/07/2021 05:33:59 - INFO - __main__ - Step 59456: {'lr': 0.0003360062819120958, 'samples': 11415552, 'steps': 59455, 'loss/train': 1.5944722890853882} -11/07/2021 05:34:00 - INFO - __main__ - Step 59457: {'lr': 0.000336001299069702, 'samples': 11415744, 'steps': 59456, 'loss/train': 1.1954927444458008} -11/07/2021 05:34:00 - INFO - __main__ - Step 59458: {'lr': 0.0003359963161885573, 'samples': 11415936, 'steps': 59457, 'loss/train': 1.7233270406723022} -11/07/2021 05:34:01 - INFO - __main__ - Step 59459: {'lr': 0.000335991333268664, 'samples': 11416128, 'steps': 59458, 'loss/train': 1.4710155725479126} -11/07/2021 05:34:02 - INFO - __main__ - Step 59460: {'lr': 0.0003359863503100244, 'samples': 11416320, 'steps': 59459, 'loss/train': 1.1441378593444824} -11/07/2021 05:34:02 - INFO - __main__ - Step 59461: {'lr': 0.0003359813673126406, 'samples': 11416512, 'steps': 59460, 'loss/train': 1.2662721872329712} -11/07/2021 05:34:02 - INFO - __main__ - Step 59462: {'lr': 0.000335976384276515, 'samples': 11416704, 'steps': 59461, 'loss/train': 1.6323987245559692} -11/07/2021 05:34:03 - INFO - __main__ - Step 59463: {'lr': 0.0003359714012016497, 'samples': 11416896, 'steps': 59462, 'loss/train': 1.9028390645980835} -11/07/2021 05:34:04 - INFO - __main__ - Step 59464: {'lr': 0.000335966418088047, 'samples': 11417088, 'steps': 59463, 'loss/train': 0.28088605403900146} -11/07/2021 05:34:04 - INFO - __main__ - Step 59465: {'lr': 0.0003359614349357092, 'samples': 11417280, 'steps': 59464, 'loss/train': 1.1726419925689697} -11/07/2021 05:34:04 - INFO - __main__ - Step 59466: {'lr': 0.00033595645174463843, 'samples': 11417472, 'steps': 59465, 'loss/train': 1.3974151611328125} -11/07/2021 05:34:05 - INFO - __main__ - Step 59467: {'lr': 0.0003359514685148371, 'samples': 11417664, 'steps': 59466, 'loss/train': 1.5635926723480225} -11/07/2021 05:34:05 - INFO - __main__ - Step 59468: {'lr': 0.0003359464852463074, 'samples': 11417856, 'steps': 59467, 'loss/train': 0.8446754217147827} -11/07/2021 05:34:06 - INFO - __main__ - Step 59469: {'lr': 0.00033594150193905144, 'samples': 11418048, 'steps': 59468, 'loss/train': 1.2928434610366821} -11/07/2021 05:34:06 - INFO - __main__ - Step 59470: {'lr': 0.0003359365185930716, 'samples': 11418240, 'steps': 59469, 'loss/train': 1.5282357931137085} -11/07/2021 05:34:07 - INFO - __main__ - Step 59471: {'lr': 0.00033593153520837006, 'samples': 11418432, 'steps': 59470, 'loss/train': 1.4693994522094727} -11/07/2021 05:34:07 - INFO - __main__ - Step 59472: {'lr': 0.0003359265517849491, 'samples': 11418624, 'steps': 59471, 'loss/train': 1.5970423221588135} -11/07/2021 05:34:08 - INFO - __main__ - Step 59473: {'lr': 0.000335921568322811, 'samples': 11418816, 'steps': 59472, 'loss/train': 1.3727434873580933} -11/07/2021 05:34:09 - INFO - __main__ - Step 59474: {'lr': 0.00033591658482195796, 'samples': 11419008, 'steps': 59473, 'loss/train': 1.4155181646347046} -11/07/2021 05:34:09 - INFO - __main__ - Step 59475: {'lr': 0.0003359116012823923, 'samples': 11419200, 'steps': 59474, 'loss/train': 1.4483219385147095} -11/07/2021 05:34:10 - INFO - __main__ - Step 59476: {'lr': 0.0003359066177041161, 'samples': 11419392, 'steps': 59475, 'loss/train': 1.1662133932113647} -11/07/2021 05:34:10 - INFO - __main__ - Step 59477: {'lr': 0.0003359016340871317, 'samples': 11419584, 'steps': 59476, 'loss/train': 2.426244020462036} -11/07/2021 05:34:10 - INFO - __main__ - Step 59478: {'lr': 0.0003358966504314414, 'samples': 11419776, 'steps': 59477, 'loss/train': 1.0725919008255005} -11/07/2021 05:34:11 - INFO - __main__ - Step 59479: {'lr': 0.00033589166673704735, 'samples': 11419968, 'steps': 59478, 'loss/train': 0.5581346750259399} -11/07/2021 05:34:12 - INFO - __main__ - Step 59480: {'lr': 0.0003358866830039519, 'samples': 11420160, 'steps': 59479, 'loss/train': 1.908988118171692} -11/07/2021 05:34:12 - INFO - __main__ - Step 59481: {'lr': 0.0003358816992321572, 'samples': 11420352, 'steps': 59480, 'loss/train': 0.7702450752258301} -11/07/2021 05:34:12 - INFO - __main__ - Step 59482: {'lr': 0.0003358767154216655, 'samples': 11420544, 'steps': 59481, 'loss/train': 1.5035277605056763} -11/07/2021 05:34:13 - INFO - __main__ - Step 59483: {'lr': 0.00033587173157247915, 'samples': 11420736, 'steps': 59482, 'loss/train': 1.2740265130996704} -11/07/2021 05:34:13 - INFO - __main__ - Step 59484: {'lr': 0.00033586674768460025, 'samples': 11420928, 'steps': 59483, 'loss/train': 1.1467206478118896} -11/07/2021 05:34:14 - INFO - __main__ - Step 59485: {'lr': 0.0003358617637580311, 'samples': 11421120, 'steps': 59484, 'loss/train': 1.1890020370483398} -11/07/2021 05:34:14 - INFO - __main__ - Step 59486: {'lr': 0.00033585677979277407, 'samples': 11421312, 'steps': 59485, 'loss/train': 1.4078155755996704} -11/07/2021 05:34:15 - INFO - __main__ - Step 59487: {'lr': 0.00033585179578883123, 'samples': 11421504, 'steps': 59486, 'loss/train': 1.1714547872543335} -11/07/2021 05:34:15 - INFO - __main__ - Step 59488: {'lr': 0.00033584681174620497, 'samples': 11421696, 'steps': 59487, 'loss/train': 1.5593702793121338} -11/07/2021 05:34:15 - INFO - __main__ - Step 59489: {'lr': 0.00033584182766489736, 'samples': 11421888, 'steps': 59488, 'loss/train': 1.2370959520339966} -11/07/2021 05:34:17 - INFO - __main__ - Step 59490: {'lr': 0.0003358368435449108, 'samples': 11422080, 'steps': 59489, 'loss/train': 1.6344785690307617} -11/07/2021 05:34:17 - INFO - __main__ - Step 59491: {'lr': 0.0003358318593862474, 'samples': 11422272, 'steps': 59490, 'loss/train': 1.0064419507980347} -11/07/2021 05:34:17 - INFO - __main__ - Step 59492: {'lr': 0.0003358268751889096, 'samples': 11422464, 'steps': 59491, 'loss/train': 1.6573501825332642} -11/07/2021 05:34:18 - INFO - __main__ - Step 59493: {'lr': 0.0003358218909528995, 'samples': 11422656, 'steps': 59492, 'loss/train': 1.7153048515319824} -11/07/2021 05:34:18 - INFO - __main__ - Step 59494: {'lr': 0.00033581690667821933, 'samples': 11422848, 'steps': 59493, 'loss/train': 1.686608910560608} -11/07/2021 05:34:19 - INFO - __main__ - Step 59495: {'lr': 0.00033581192236487153, 'samples': 11423040, 'steps': 59494, 'loss/train': 1.7390670776367188} -11/07/2021 05:34:19 - INFO - __main__ - Step 59496: {'lr': 0.00033580693801285805, 'samples': 11423232, 'steps': 59495, 'loss/train': 1.3494672775268555} -11/07/2021 05:34:20 - INFO - __main__ - Step 59497: {'lr': 0.0003358019536221814, 'samples': 11423424, 'steps': 59496, 'loss/train': 1.100712537765503} -11/07/2021 05:34:20 - INFO - __main__ - Step 59498: {'lr': 0.00033579696919284357, 'samples': 11423616, 'steps': 59497, 'loss/train': 1.6030791997909546} -11/07/2021 05:34:20 - INFO - __main__ - Step 59499: {'lr': 0.00033579198472484707, 'samples': 11423808, 'steps': 59498, 'loss/train': 1.0974394083023071} -11/07/2021 05:34:21 - INFO - __main__ - Step 59500: {'lr': 0.000335787000218194, 'samples': 11424000, 'steps': 59499, 'loss/train': 1.6031955480575562} -11/07/2021 05:34:22 - INFO - __main__ - Step 59501: {'lr': 0.0003357820156728866, 'samples': 11424192, 'steps': 59500, 'loss/train': 0.9540095925331116} -11/07/2021 05:34:22 - INFO - __main__ - Step 59502: {'lr': 0.0003357770310889272, 'samples': 11424384, 'steps': 59501, 'loss/train': 1.1483746767044067} -11/07/2021 05:34:23 - INFO - __main__ - Step 59503: {'lr': 0.0003357720464663179, 'samples': 11424576, 'steps': 59502, 'loss/train': 0.8712205290794373} -11/07/2021 05:34:23 - INFO - __main__ - Step 59504: {'lr': 0.0003357670618050611, 'samples': 11424768, 'steps': 59503, 'loss/train': 1.2671444416046143} -11/07/2021 05:34:24 - INFO - __main__ - Step 59505: {'lr': 0.000335762077105159, 'samples': 11424960, 'steps': 59504, 'loss/train': 2.224961042404175} -11/07/2021 05:34:25 - INFO - __main__ - Step 59506: {'lr': 0.0003357570923666138, 'samples': 11425152, 'steps': 59505, 'loss/train': 2.035517930984497} -11/07/2021 05:34:25 - INFO - __main__ - Step 59507: {'lr': 0.0003357521075894278, 'samples': 11425344, 'steps': 59506, 'loss/train': 1.5490002632141113} -11/07/2021 05:34:25 - INFO - __main__ - Step 59508: {'lr': 0.00033574712277360325, 'samples': 11425536, 'steps': 59507, 'loss/train': 1.7147842645645142} -11/07/2021 05:34:26 - INFO - __main__ - Step 59509: {'lr': 0.00033574213791914235, 'samples': 11425728, 'steps': 59508, 'loss/train': 0.10911858081817627} -11/07/2021 05:34:27 - INFO - __main__ - Step 59510: {'lr': 0.00033573715302604736, 'samples': 11425920, 'steps': 59509, 'loss/train': 1.6349005699157715} -11/07/2021 05:34:27 - INFO - __main__ - Step 59511: {'lr': 0.0003357321680943205, 'samples': 11426112, 'steps': 59510, 'loss/train': 1.656241774559021} -11/07/2021 05:34:27 - INFO - __main__ - Step 59512: {'lr': 0.00033572718312396404, 'samples': 11426304, 'steps': 59511, 'loss/train': 1.4408379793167114} -11/07/2021 05:34:28 - INFO - __main__ - Step 59513: {'lr': 0.0003357221981149803, 'samples': 11426496, 'steps': 59512, 'loss/train': 1.3564294576644897} -11/07/2021 05:34:28 - INFO - __main__ - Step 59514: {'lr': 0.0003357172130673714, 'samples': 11426688, 'steps': 59513, 'loss/train': 1.758360743522644} -11/07/2021 05:34:29 - INFO - __main__ - Step 59515: {'lr': 0.00033571222798113977, 'samples': 11426880, 'steps': 59514, 'loss/train': 1.6956180334091187} -11/07/2021 05:34:29 - INFO - __main__ - Step 59516: {'lr': 0.0003357072428562874, 'samples': 11427072, 'steps': 59515, 'loss/train': 1.64950692653656} -11/07/2021 05:34:30 - INFO - __main__ - Step 59517: {'lr': 0.0003357022576928167, 'samples': 11427264, 'steps': 59516, 'loss/train': 1.238654613494873} -11/07/2021 05:34:30 - INFO - __main__ - Step 59518: {'lr': 0.0003356972724907299, 'samples': 11427456, 'steps': 59517, 'loss/train': 1.1894230842590332} -11/07/2021 05:34:30 - INFO - __main__ - Step 59519: {'lr': 0.0003356922872500292, 'samples': 11427648, 'steps': 59518, 'loss/train': 1.35769522190094} -11/07/2021 05:34:31 - INFO - __main__ - Step 59520: {'lr': 0.0003356873019707169, 'samples': 11427840, 'steps': 59519, 'loss/train': 1.5582650899887085} -11/07/2021 05:34:32 - INFO - __main__ - Step 59521: {'lr': 0.0003356823166527952, 'samples': 11428032, 'steps': 59520, 'loss/train': 1.5470657348632812} -11/07/2021 05:34:32 - INFO - __main__ - Step 59522: {'lr': 0.00033567733129626645, 'samples': 11428224, 'steps': 59521, 'loss/train': 1.1028765439987183} -11/07/2021 05:34:33 - INFO - __main__ - Step 59523: {'lr': 0.00033567234590113274, 'samples': 11428416, 'steps': 59522, 'loss/train': 1.334879994392395} -11/07/2021 05:34:33 - INFO - __main__ - Step 59524: {'lr': 0.00033566736046739643, 'samples': 11428608, 'steps': 59523, 'loss/train': 1.5988858938217163} -11/07/2021 05:34:33 - INFO - __main__ - Step 59525: {'lr': 0.0003356623749950597, 'samples': 11428800, 'steps': 59524, 'loss/train': 1.3079609870910645} -11/07/2021 05:34:34 - INFO - __main__ - Step 59526: {'lr': 0.0003356573894841248, 'samples': 11428992, 'steps': 59525, 'loss/train': 1.1951123476028442} -11/07/2021 05:34:34 - INFO - __main__ - Step 59527: {'lr': 0.0003356524039345941, 'samples': 11429184, 'steps': 59526, 'loss/train': 1.3614507913589478} -11/07/2021 05:34:35 - INFO - __main__ - Step 59528: {'lr': 0.00033564741834646967, 'samples': 11429376, 'steps': 59527, 'loss/train': 1.3990288972854614} -11/07/2021 05:34:35 - INFO - __main__ - Step 59529: {'lr': 0.0003356424327197539, 'samples': 11429568, 'steps': 59528, 'loss/train': 1.2418543100357056} -11/07/2021 05:34:36 - INFO - __main__ - Step 59530: {'lr': 0.00033563744705444886, 'samples': 11429760, 'steps': 59529, 'loss/train': 1.0261796712875366} -11/07/2021 05:34:37 - INFO - __main__ - Step 59531: {'lr': 0.000335632461350557, 'samples': 11429952, 'steps': 59530, 'loss/train': 1.293760061264038} -11/07/2021 05:34:37 - INFO - __main__ - Step 59532: {'lr': 0.00033562747560808044, 'samples': 11430144, 'steps': 59531, 'loss/train': 1.2552067041397095} -11/07/2021 05:34:37 - INFO - __main__ - Step 59533: {'lr': 0.00033562248982702144, 'samples': 11430336, 'steps': 59532, 'loss/train': 1.2043218612670898} -11/07/2021 05:34:38 - INFO - __main__ - Step 59534: {'lr': 0.0003356175040073823, 'samples': 11430528, 'steps': 59533, 'loss/train': 1.0706124305725098} -11/07/2021 05:34:38 - INFO - __main__ - Step 59535: {'lr': 0.0003356125181491653, 'samples': 11430720, 'steps': 59534, 'loss/train': 1.805811882019043} -11/07/2021 05:34:39 - INFO - __main__ - Step 59536: {'lr': 0.0003356075322523725, 'samples': 11430912, 'steps': 59535, 'loss/train': 1.2499884366989136} -11/07/2021 05:34:39 - INFO - __main__ - Step 59537: {'lr': 0.00033560254631700634, 'samples': 11431104, 'steps': 59536, 'loss/train': 1.4227045774459839} -11/07/2021 05:34:40 - INFO - __main__ - Step 59538: {'lr': 0.0003355975603430689, 'samples': 11431296, 'steps': 59537, 'loss/train': 1.4031585454940796} -11/07/2021 05:34:40 - INFO - __main__ - Step 59539: {'lr': 0.0003355925743305626, 'samples': 11431488, 'steps': 59538, 'loss/train': 0.8719915747642517} -11/07/2021 05:34:40 - INFO - __main__ - Step 59540: {'lr': 0.0003355875882794896, 'samples': 11431680, 'steps': 59539, 'loss/train': 1.7507216930389404} -11/07/2021 05:34:41 - INFO - __main__ - Step 59541: {'lr': 0.00033558260218985214, 'samples': 11431872, 'steps': 59540, 'loss/train': 1.453427791595459} -11/07/2021 05:34:42 - INFO - __main__ - Step 59542: {'lr': 0.00033557761606165253, 'samples': 11432064, 'steps': 59541, 'loss/train': 0.9681723117828369} -11/07/2021 05:34:42 - INFO - __main__ - Step 59543: {'lr': 0.00033557262989489294, 'samples': 11432256, 'steps': 59542, 'loss/train': 1.5702011585235596} -11/07/2021 05:34:43 - INFO - __main__ - Step 59544: {'lr': 0.0003355676436895756, 'samples': 11432448, 'steps': 59543, 'loss/train': 1.639803409576416} -11/07/2021 05:34:43 - INFO - __main__ - Step 59545: {'lr': 0.0003355626574457029, 'samples': 11432640, 'steps': 59544, 'loss/train': 1.6117422580718994} -11/07/2021 05:34:44 - INFO - __main__ - Step 59546: {'lr': 0.00033555767116327686, 'samples': 11432832, 'steps': 59545, 'loss/train': 1.8059355020523071} -11/07/2021 05:34:44 - INFO - __main__ - Step 59547: {'lr': 0.00033555268484229987, 'samples': 11433024, 'steps': 59546, 'loss/train': 1.1739661693572998} -11/07/2021 05:34:45 - INFO - __main__ - Step 59548: {'lr': 0.0003355476984827743, 'samples': 11433216, 'steps': 59547, 'loss/train': 1.4571211338043213} -11/07/2021 05:34:45 - INFO - __main__ - Step 59549: {'lr': 0.0003355427120847021, 'samples': 11433408, 'steps': 59548, 'loss/train': 1.7085621356964111} -11/07/2021 05:34:45 - INFO - __main__ - Step 59550: {'lr': 0.0003355377256480858, 'samples': 11433600, 'steps': 59549, 'loss/train': 1.1984351873397827} -11/07/2021 05:34:46 - INFO - __main__ - Step 59551: {'lr': 0.00033553273917292744, 'samples': 11433792, 'steps': 59550, 'loss/train': 1.194305181503296} -11/07/2021 05:34:47 - INFO - __main__ - Step 59552: {'lr': 0.0003355277526592293, 'samples': 11433984, 'steps': 59551, 'loss/train': 1.199188232421875} -11/07/2021 05:34:47 - INFO - __main__ - Step 59553: {'lr': 0.00033552276610699375, 'samples': 11434176, 'steps': 59552, 'loss/train': 1.4422672986984253} -11/07/2021 05:34:47 - INFO - __main__ - Step 59554: {'lr': 0.00033551777951622297, 'samples': 11434368, 'steps': 59553, 'loss/train': 1.435340404510498} -11/07/2021 05:34:48 - INFO - __main__ - Step 59555: {'lr': 0.0003355127928869192, 'samples': 11434560, 'steps': 59554, 'loss/train': 1.4675737619400024} -11/07/2021 05:34:49 - INFO - __main__ - Step 59556: {'lr': 0.0003355078062190847, 'samples': 11434752, 'steps': 59555, 'loss/train': 0.8876587748527527} -11/07/2021 05:34:49 - INFO - __main__ - Step 59557: {'lr': 0.00033550281951272163, 'samples': 11434944, 'steps': 59556, 'loss/train': 1.6628034114837646} -11/07/2021 05:34:50 - INFO - __main__ - Step 59558: {'lr': 0.0003354978327678323, 'samples': 11435136, 'steps': 59557, 'loss/train': 1.1888867616653442} -11/07/2021 05:34:50 - INFO - __main__ - Step 59559: {'lr': 0.00033549284598441897, 'samples': 11435328, 'steps': 59558, 'loss/train': 1.5983210802078247} -11/07/2021 05:34:50 - INFO - __main__ - Step 59560: {'lr': 0.0003354878591624839, 'samples': 11435520, 'steps': 59559, 'loss/train': 1.2895994186401367} -11/07/2021 05:34:51 - INFO - __main__ - Step 59561: {'lr': 0.0003354828723020294, 'samples': 11435712, 'steps': 59560, 'loss/train': 1.5360382795333862} -11/07/2021 05:34:52 - INFO - __main__ - Step 59562: {'lr': 0.0003354778854030576, 'samples': 11435904, 'steps': 59561, 'loss/train': 1.4257394075393677} -11/07/2021 05:34:52 - INFO - __main__ - Step 59563: {'lr': 0.0003354728984655708, 'samples': 11436096, 'steps': 59562, 'loss/train': 1.2033840417861938} -11/07/2021 05:34:52 - INFO - __main__ - Step 59564: {'lr': 0.0003354679114895711, 'samples': 11436288, 'steps': 59563, 'loss/train': 1.349900722503662} -11/07/2021 05:34:53 - INFO - __main__ - Step 59565: {'lr': 0.000335462924475061, 'samples': 11436480, 'steps': 59564, 'loss/train': 0.9771448373794556} -11/07/2021 05:34:54 - INFO - __main__ - Step 59566: {'lr': 0.00033545793742204255, 'samples': 11436672, 'steps': 59565, 'loss/train': 1.3499360084533691} -11/07/2021 05:34:54 - INFO - __main__ - Step 59567: {'lr': 0.00033545295033051814, 'samples': 11436864, 'steps': 59566, 'loss/train': 1.3435114622116089} -11/07/2021 05:34:54 - INFO - __main__ - Step 59568: {'lr': 0.00033544796320048996, 'samples': 11437056, 'steps': 59567, 'loss/train': 1.2455247640609741} -11/07/2021 05:34:55 - INFO - __main__ - Step 59569: {'lr': 0.0003354429760319602, 'samples': 11437248, 'steps': 59568, 'loss/train': 1.316182017326355} -11/07/2021 05:34:55 - INFO - __main__ - Step 59570: {'lr': 0.00033543798882493123, 'samples': 11437440, 'steps': 59569, 'loss/train': 0.7195746302604675} -11/07/2021 05:34:55 - INFO - __main__ - Step 59571: {'lr': 0.0003354330015794051, 'samples': 11437632, 'steps': 59570, 'loss/train': 1.4050893783569336} -11/07/2021 05:34:56 - INFO - __main__ - Step 59572: {'lr': 0.00033542801429538424, 'samples': 11437824, 'steps': 59571, 'loss/train': 1.6291940212249756} -11/07/2021 05:34:57 - INFO - __main__ - Step 59573: {'lr': 0.0003354230269728709, 'samples': 11438016, 'steps': 59572, 'loss/train': 1.7440979480743408} -11/07/2021 05:34:57 - INFO - __main__ - Step 59574: {'lr': 0.0003354180396118671, 'samples': 11438208, 'steps': 59573, 'loss/train': 1.2694685459136963} -11/07/2021 05:34:58 - INFO - __main__ - Step 59575: {'lr': 0.0003354130522123754, 'samples': 11438400, 'steps': 59574, 'loss/train': 1.6482088565826416} -11/07/2021 05:34:59 - INFO - __main__ - Step 59576: {'lr': 0.0003354080647743978, 'samples': 11438592, 'steps': 59575, 'loss/train': 1.1161706447601318} -11/07/2021 05:34:59 - INFO - __main__ - Step 59577: {'lr': 0.0003354030772979367, 'samples': 11438784, 'steps': 59576, 'loss/train': 1.1914986371994019} -11/07/2021 05:34:59 - INFO - __main__ - Step 59578: {'lr': 0.00033539808978299423, 'samples': 11438976, 'steps': 59577, 'loss/train': 1.3084155321121216} -11/07/2021 05:35:00 - INFO - __main__ - Step 59579: {'lr': 0.0003353931022295728, 'samples': 11439168, 'steps': 59578, 'loss/train': 2.5183029174804688} -11/07/2021 05:35:00 - INFO - __main__ - Step 59580: {'lr': 0.0003353881146376745, 'samples': 11439360, 'steps': 59579, 'loss/train': 1.261258840560913} -11/07/2021 05:35:00 - INFO - __main__ - Step 59581: {'lr': 0.0003353831270073016, 'samples': 11439552, 'steps': 59580, 'loss/train': 0.11749255657196045} -11/07/2021 05:35:02 - INFO - __main__ - Step 59582: {'lr': 0.0003353781393384564, 'samples': 11439744, 'steps': 59581, 'loss/train': 1.3081586360931396} -11/07/2021 05:35:02 - INFO - __main__ - Step 59583: {'lr': 0.0003353731516311411, 'samples': 11439936, 'steps': 59582, 'loss/train': 0.18103912472724915} -11/07/2021 05:35:03 - INFO - __main__ - Step 59584: {'lr': 0.00033536816388535814, 'samples': 11440128, 'steps': 59583, 'loss/train': 1.3822505474090576} -11/07/2021 05:35:03 - INFO - __main__ - Step 59585: {'lr': 0.0003353631761011094, 'samples': 11440320, 'steps': 59584, 'loss/train': 1.2396767139434814} -11/07/2021 05:35:03 - INFO - __main__ - Step 59586: {'lr': 0.00033535818827839744, 'samples': 11440512, 'steps': 59585, 'loss/train': 1.3074694871902466} -11/07/2021 05:35:05 - INFO - __main__ - Step 59587: {'lr': 0.0003353532004172244, 'samples': 11440704, 'steps': 59586, 'loss/train': 1.5764880180358887} -11/07/2021 05:35:05 - INFO - __main__ - Step 59588: {'lr': 0.00033534821251759246, 'samples': 11440896, 'steps': 59587, 'loss/train': 0.9902772307395935} -11/07/2021 05:35:05 - INFO - __main__ - Step 59589: {'lr': 0.00033534322457950396, 'samples': 11441088, 'steps': 59588, 'loss/train': 1.802744746208191} -11/07/2021 05:35:06 - INFO - __main__ - Step 59590: {'lr': 0.00033533823660296115, 'samples': 11441280, 'steps': 59589, 'loss/train': 1.0557581186294556} -11/07/2021 05:35:06 - INFO - __main__ - Step 59591: {'lr': 0.00033533324858796623, 'samples': 11441472, 'steps': 59590, 'loss/train': 1.397140622138977} -11/07/2021 05:35:07 - INFO - __main__ - Step 59592: {'lr': 0.00033532826053452145, 'samples': 11441664, 'steps': 59591, 'loss/train': 0.15451475977897644} -11/07/2021 05:35:07 - INFO - __main__ - Step 59593: {'lr': 0.00033532327244262906, 'samples': 11441856, 'steps': 59592, 'loss/train': 1.3034030199050903} -11/07/2021 05:35:08 - INFO - __main__ - Step 59594: {'lr': 0.0003353182843122913, 'samples': 11442048, 'steps': 59593, 'loss/train': 1.8378833532333374} -11/07/2021 05:35:08 - INFO - __main__ - Step 59595: {'lr': 0.0003353132961435105, 'samples': 11442240, 'steps': 59594, 'loss/train': 1.328703761100769} -11/07/2021 05:35:08 - INFO - __main__ - Step 59596: {'lr': 0.00033530830793628886, 'samples': 11442432, 'steps': 59595, 'loss/train': 1.4518554210662842} -11/07/2021 05:35:10 - INFO - __main__ - Step 59597: {'lr': 0.00033530331969062853, 'samples': 11442624, 'steps': 59596, 'loss/train': 1.4871795177459717} -11/07/2021 05:35:10 - INFO - __main__ - Step 59598: {'lr': 0.00033529833140653187, 'samples': 11442816, 'steps': 59597, 'loss/train': 1.5746878385543823} -11/07/2021 05:35:10 - INFO - __main__ - Step 59599: {'lr': 0.0003352933430840011, 'samples': 11443008, 'steps': 59598, 'loss/train': 0.10077402740716934} -11/07/2021 05:35:11 - INFO - __main__ - Step 59600: {'lr': 0.0003352883547230385, 'samples': 11443200, 'steps': 59599, 'loss/train': 1.2615989446640015} -11/07/2021 05:35:11 - INFO - __main__ - Step 59601: {'lr': 0.00033528336632364624, 'samples': 11443392, 'steps': 59600, 'loss/train': 1.404905080795288} -11/07/2021 05:35:12 - INFO - __main__ - Step 59602: {'lr': 0.00033527837788582663, 'samples': 11443584, 'steps': 59601, 'loss/train': 0.9862393736839294} -11/07/2021 05:35:12 - INFO - __main__ - Step 59603: {'lr': 0.00033527338940958197, 'samples': 11443776, 'steps': 59602, 'loss/train': 1.3578568696975708} -11/07/2021 05:35:13 - INFO - __main__ - Step 59604: {'lr': 0.00033526840089491433, 'samples': 11443968, 'steps': 59603, 'loss/train': 1.252523422241211} -11/07/2021 05:35:13 - INFO - __main__ - Step 59605: {'lr': 0.00033526341234182613, 'samples': 11444160, 'steps': 59604, 'loss/train': 1.8080463409423828} -11/07/2021 05:35:14 - INFO - __main__ - Step 59606: {'lr': 0.00033525842375031946, 'samples': 11444352, 'steps': 59605, 'loss/train': 1.431477427482605} -11/07/2021 05:35:15 - INFO - __main__ - Step 59607: {'lr': 0.00033525343512039673, 'samples': 11444544, 'steps': 59606, 'loss/train': 1.2721199989318848} -11/07/2021 05:35:15 - INFO - __main__ - Step 59608: {'lr': 0.0003352484464520601, 'samples': 11444736, 'steps': 59607, 'loss/train': 0.9697229862213135} -11/07/2021 05:35:15 - INFO - __main__ - Step 59609: {'lr': 0.0003352434577453119, 'samples': 11444928, 'steps': 59608, 'loss/train': 1.3642055988311768} -11/07/2021 05:35:16 - INFO - __main__ - Step 59610: {'lr': 0.00033523846900015427, 'samples': 11445120, 'steps': 59609, 'loss/train': 1.4536397457122803} -11/07/2021 05:35:16 - INFO - __main__ - Step 59611: {'lr': 0.00033523348021658947, 'samples': 11445312, 'steps': 59610, 'loss/train': 1.5773667097091675} -11/07/2021 05:35:17 - INFO - __main__ - Step 59612: {'lr': 0.00033522849139461973, 'samples': 11445504, 'steps': 59611, 'loss/train': 1.2811578512191772} -11/07/2021 05:35:18 - INFO - __main__ - Step 59613: {'lr': 0.0003352235025342475, 'samples': 11445696, 'steps': 59612, 'loss/train': 1.6257545948028564} -11/07/2021 05:35:18 - INFO - __main__ - Step 59614: {'lr': 0.00033521851363547473, 'samples': 11445888, 'steps': 59613, 'loss/train': 1.0231727361679077} -11/07/2021 05:35:18 - INFO - __main__ - Step 59615: {'lr': 0.0003352135246983039, 'samples': 11446080, 'steps': 59614, 'loss/train': 1.655920386314392} -11/07/2021 05:35:19 - INFO - __main__ - Step 59616: {'lr': 0.0003352085357227372, 'samples': 11446272, 'steps': 59615, 'loss/train': 1.7154494524002075} -11/07/2021 05:35:19 - INFO - __main__ - Step 59617: {'lr': 0.00033520354670877673, 'samples': 11446464, 'steps': 59616, 'loss/train': 1.5022478103637695} -11/07/2021 05:35:20 - INFO - __main__ - Step 59618: {'lr': 0.00033519855765642493, 'samples': 11446656, 'steps': 59617, 'loss/train': 1.3677871227264404} -11/07/2021 05:35:21 - INFO - __main__ - Step 59619: {'lr': 0.00033519356856568397, 'samples': 11446848, 'steps': 59618, 'loss/train': 1.5715504884719849} -11/07/2021 05:35:21 - INFO - __main__ - Step 59620: {'lr': 0.00033518857943655607, 'samples': 11447040, 'steps': 59619, 'loss/train': 1.1762737035751343} -11/07/2021 05:35:21 - INFO - __main__ - Step 59621: {'lr': 0.00033518359026904357, 'samples': 11447232, 'steps': 59620, 'loss/train': 1.3297492265701294} -11/07/2021 05:35:22 - INFO - __main__ - Step 59622: {'lr': 0.00033517860106314863, 'samples': 11447424, 'steps': 59621, 'loss/train': 0.13469816744327545} -11/07/2021 05:35:23 - INFO - __main__ - Step 59623: {'lr': 0.00033517361181887353, 'samples': 11447616, 'steps': 59622, 'loss/train': 1.3062771558761597} -11/07/2021 05:35:23 - INFO - __main__ - Step 59624: {'lr': 0.0003351686225362205, 'samples': 11447808, 'steps': 59623, 'loss/train': 1.686296820640564} -11/07/2021 05:35:23 - INFO - __main__ - Step 59625: {'lr': 0.00033516363321519185, 'samples': 11448000, 'steps': 59624, 'loss/train': 1.2708745002746582} -11/07/2021 05:35:24 - INFO - __main__ - Step 59626: {'lr': 0.0003351586438557897, 'samples': 11448192, 'steps': 59625, 'loss/train': 1.0592166185379028} -11/07/2021 05:35:24 - INFO - __main__ - Step 59627: {'lr': 0.00033515365445801635, 'samples': 11448384, 'steps': 59626, 'loss/train': 1.2782230377197266} -11/07/2021 05:35:25 - INFO - __main__ - Step 59628: {'lr': 0.00033514866502187417, 'samples': 11448576, 'steps': 59627, 'loss/train': 0.7311087846755981} -11/07/2021 05:35:26 - INFO - __main__ - Step 59629: {'lr': 0.0003351436755473654, 'samples': 11448768, 'steps': 59628, 'loss/train': 1.175594449043274} -11/07/2021 05:35:26 - INFO - __main__ - Step 59630: {'lr': 0.00033513868603449203, 'samples': 11448960, 'steps': 59629, 'loss/train': 1.260723352432251} -11/07/2021 05:35:26 - INFO - __main__ - Step 59631: {'lr': 0.00033513369648325653, 'samples': 11449152, 'steps': 59630, 'loss/train': 1.033092737197876} -11/07/2021 05:35:27 - INFO - __main__ - Step 59632: {'lr': 0.00033512870689366114, 'samples': 11449344, 'steps': 59631, 'loss/train': 1.294837474822998} -11/07/2021 05:35:27 - INFO - __main__ - Step 59633: {'lr': 0.0003351237172657081, 'samples': 11449536, 'steps': 59632, 'loss/train': 1.1664807796478271} -11/07/2021 05:35:28 - INFO - __main__ - Step 59634: {'lr': 0.00033511872759939954, 'samples': 11449728, 'steps': 59633, 'loss/train': 1.6271213293075562} -11/07/2021 05:35:28 - INFO - __main__ - Step 59635: {'lr': 0.0003351137378947378, 'samples': 11449920, 'steps': 59634, 'loss/train': 1.7285903692245483} -11/07/2021 05:35:29 - INFO - __main__ - Step 59636: {'lr': 0.00033510874815172523, 'samples': 11450112, 'steps': 59635, 'loss/train': 0.9194626212120056} -11/07/2021 05:35:29 - INFO - __main__ - Step 59637: {'lr': 0.00033510375837036386, 'samples': 11450304, 'steps': 59636, 'loss/train': 1.944482445716858} -11/07/2021 05:35:29 - INFO - __main__ - Step 59638: {'lr': 0.0003350987685506561, 'samples': 11450496, 'steps': 59637, 'loss/train': 1.3527714014053345} -11/07/2021 05:35:31 - INFO - __main__ - Step 59639: {'lr': 0.0003350937786926041, 'samples': 11450688, 'steps': 59638, 'loss/train': 1.75435471534729} -11/07/2021 05:35:31 - INFO - __main__ - Step 59640: {'lr': 0.0003350887887962102, 'samples': 11450880, 'steps': 59639, 'loss/train': 1.2585010528564453} -11/07/2021 05:35:31 - INFO - __main__ - Step 59641: {'lr': 0.00033508379886147655, 'samples': 11451072, 'steps': 59640, 'loss/train': 1.3809635639190674} -11/07/2021 05:35:32 - INFO - __main__ - Step 59642: {'lr': 0.00033507880888840547, 'samples': 11451264, 'steps': 59641, 'loss/train': 1.4172636270523071} -11/07/2021 05:35:32 - INFO - __main__ - Step 59643: {'lr': 0.00033507381887699927, 'samples': 11451456, 'steps': 59642, 'loss/train': 1.5943095684051514} -11/07/2021 05:35:33 - INFO - __main__ - Step 59644: {'lr': 0.0003350688288272601, 'samples': 11451648, 'steps': 59643, 'loss/train': 0.06723592430353165} -11/07/2021 05:35:34 - INFO - __main__ - Step 59645: {'lr': 0.00033506383873919016, 'samples': 11451840, 'steps': 59644, 'loss/train': 1.517072319984436} -11/07/2021 05:35:34 - INFO - __main__ - Step 59646: {'lr': 0.0003350588486127918, 'samples': 11452032, 'steps': 59645, 'loss/train': 0.43619540333747864} -11/07/2021 05:35:34 - INFO - __main__ - Step 59647: {'lr': 0.0003350538584480672, 'samples': 11452224, 'steps': 59646, 'loss/train': 1.0386179685592651} -11/07/2021 05:35:35 - INFO - __main__ - Step 59648: {'lr': 0.0003350488682450187, 'samples': 11452416, 'steps': 59647, 'loss/train': 2.321737051010132} -11/07/2021 05:35:36 - INFO - __main__ - Step 59649: {'lr': 0.00033504387800364856, 'samples': 11452608, 'steps': 59648, 'loss/train': 1.195865511894226} -11/07/2021 05:35:36 - INFO - __main__ - Step 59650: {'lr': 0.00033503888772395886, 'samples': 11452800, 'steps': 59649, 'loss/train': 2.187549591064453} -11/07/2021 05:35:37 - INFO - __main__ - Step 59651: {'lr': 0.0003350338974059519, 'samples': 11452992, 'steps': 59650, 'loss/train': 1.7402242422103882} -11/07/2021 05:35:37 - INFO - __main__ - Step 59652: {'lr': 0.0003350289070496301, 'samples': 11453184, 'steps': 59651, 'loss/train': 1.593725323677063} -11/07/2021 05:35:37 - INFO - __main__ - Step 59653: {'lr': 0.0003350239166549955, 'samples': 11453376, 'steps': 59652, 'loss/train': 1.6116315126419067} -11/07/2021 05:35:38 - INFO - __main__ - Step 59654: {'lr': 0.0003350189262220504, 'samples': 11453568, 'steps': 59653, 'loss/train': 1.701385736465454} -11/07/2021 05:35:39 - INFO - __main__ - Step 59655: {'lr': 0.0003350139357507972, 'samples': 11453760, 'steps': 59654, 'loss/train': 1.0990419387817383} -11/07/2021 05:35:39 - INFO - __main__ - Step 59656: {'lr': 0.00033500894524123796, 'samples': 11453952, 'steps': 59655, 'loss/train': 1.5260257720947266} -11/07/2021 05:35:39 - INFO - __main__ - Step 59657: {'lr': 0.0003350039546933751, 'samples': 11454144, 'steps': 59656, 'loss/train': 1.3701422214508057} -11/07/2021 05:35:40 - INFO - __main__ - Step 59658: {'lr': 0.00033499896410721066, 'samples': 11454336, 'steps': 59657, 'loss/train': 1.5399134159088135} -11/07/2021 05:35:40 - INFO - __main__ - Step 59659: {'lr': 0.000334993973482747, 'samples': 11454528, 'steps': 59658, 'loss/train': 0.7803982496261597} -11/07/2021 05:35:41 - INFO - __main__ - Step 59660: {'lr': 0.0003349889828199864, 'samples': 11454720, 'steps': 59659, 'loss/train': 1.2550472021102905} -11/07/2021 05:35:41 - INFO - __main__ - Step 59661: {'lr': 0.000334983992118931, 'samples': 11454912, 'steps': 59660, 'loss/train': 1.2362215518951416} -11/07/2021 05:35:42 - INFO - __main__ - Step 59662: {'lr': 0.00033497900137958325, 'samples': 11455104, 'steps': 59661, 'loss/train': 1.4623883962631226} -11/07/2021 05:35:42 - INFO - __main__ - Step 59663: {'lr': 0.00033497401060194525, 'samples': 11455296, 'steps': 59662, 'loss/train': 1.6779707670211792} -11/07/2021 05:35:42 - INFO - __main__ - Step 59664: {'lr': 0.00033496901978601924, 'samples': 11455488, 'steps': 59663, 'loss/train': 1.2709845304489136} -11/07/2021 05:35:44 - INFO - __main__ - Step 59665: {'lr': 0.0003349640289318075, 'samples': 11455680, 'steps': 59664, 'loss/train': 1.0757722854614258} -11/07/2021 05:35:44 - INFO - __main__ - Step 59666: {'lr': 0.0003349590380393123, 'samples': 11455872, 'steps': 59665, 'loss/train': 0.8987736105918884} -11/07/2021 05:35:44 - INFO - __main__ - Step 59667: {'lr': 0.0003349540471085358, 'samples': 11456064, 'steps': 59666, 'loss/train': 0.9906978607177734} -11/07/2021 05:35:45 - INFO - __main__ - Step 59668: {'lr': 0.00033494905613948035, 'samples': 11456256, 'steps': 59667, 'loss/train': 1.535966396331787} -11/07/2021 05:35:45 - INFO - __main__ - Step 59669: {'lr': 0.00033494406513214826, 'samples': 11456448, 'steps': 59668, 'loss/train': 1.8228522539138794} -11/07/2021 05:35:46 - INFO - __main__ - Step 59670: {'lr': 0.0003349390740865416, 'samples': 11456640, 'steps': 59669, 'loss/train': 1.481791377067566} -11/07/2021 05:35:46 - INFO - __main__ - Step 59671: {'lr': 0.0003349340830026627, 'samples': 11456832, 'steps': 59670, 'loss/train': 0.6913386583328247} -11/07/2021 05:35:47 - INFO - __main__ - Step 59672: {'lr': 0.0003349290918805138, 'samples': 11457024, 'steps': 59671, 'loss/train': 0.9363782405853271} -11/07/2021 05:35:47 - INFO - __main__ - Step 59673: {'lr': 0.0003349241007200972, 'samples': 11457216, 'steps': 59672, 'loss/train': 1.3432589769363403} -11/07/2021 05:35:48 - INFO - __main__ - Step 59674: {'lr': 0.0003349191095214151, 'samples': 11457408, 'steps': 59673, 'loss/train': 1.3509225845336914} -11/07/2021 05:35:49 - INFO - __main__ - Step 59675: {'lr': 0.00033491411828446974, 'samples': 11457600, 'steps': 59674, 'loss/train': 1.407131314277649} -11/07/2021 05:35:49 - INFO - __main__ - Step 59676: {'lr': 0.00033490912700926345, 'samples': 11457792, 'steps': 59675, 'loss/train': 1.3684331178665161} -11/07/2021 05:35:49 - INFO - __main__ - Step 59677: {'lr': 0.00033490413569579837, 'samples': 11457984, 'steps': 59676, 'loss/train': 1.229500651359558} -11/07/2021 05:35:50 - INFO - __main__ - Step 59678: {'lr': 0.00033489914434407683, 'samples': 11458176, 'steps': 59677, 'loss/train': 1.3191747665405273} -11/07/2021 05:35:50 - INFO - __main__ - Step 59679: {'lr': 0.00033489415295410096, 'samples': 11458368, 'steps': 59678, 'loss/train': 1.3091589212417603} -11/07/2021 05:35:51 - INFO - __main__ - Step 59680: {'lr': 0.0003348891615258732, 'samples': 11458560, 'steps': 59679, 'loss/train': 1.3246545791625977} -11/07/2021 05:35:52 - INFO - __main__ - Step 59681: {'lr': 0.0003348841700593956, 'samples': 11458752, 'steps': 59680, 'loss/train': 0.14527994394302368} -11/07/2021 05:35:52 - INFO - __main__ - Step 59682: {'lr': 0.00033487917855467056, 'samples': 11458944, 'steps': 59681, 'loss/train': 1.6974310874938965} -11/07/2021 05:35:52 - INFO - __main__ - Step 59683: {'lr': 0.0003348741870117003, 'samples': 11459136, 'steps': 59682, 'loss/train': 1.2273606061935425} -11/07/2021 05:35:53 - INFO - __main__ - Step 59684: {'lr': 0.000334869195430487, 'samples': 11459328, 'steps': 59683, 'loss/train': 1.6151094436645508} -11/07/2021 05:35:54 - INFO - __main__ - Step 59685: {'lr': 0.0003348642038110329, 'samples': 11459520, 'steps': 59684, 'loss/train': 1.2376044988632202} -11/07/2021 05:35:54 - INFO - __main__ - Step 59686: {'lr': 0.0003348592121533404, 'samples': 11459712, 'steps': 59685, 'loss/train': 1.2281603813171387} -11/07/2021 05:35:54 - INFO - __main__ - Step 59687: {'lr': 0.00033485422045741154, 'samples': 11459904, 'steps': 59686, 'loss/train': 1.5677322149276733} -11/07/2021 05:35:55 - INFO - __main__ - Step 59688: {'lr': 0.00033484922872324875, 'samples': 11460096, 'steps': 59687, 'loss/train': 1.1358038187026978} -11/07/2021 05:35:55 - INFO - __main__ - Step 59689: {'lr': 0.0003348442369508542, 'samples': 11460288, 'steps': 59688, 'loss/train': 1.6422333717346191} -11/07/2021 05:35:55 - INFO - __main__ - Step 59690: {'lr': 0.0003348392451402302, 'samples': 11460480, 'steps': 59689, 'loss/train': 1.289177656173706} -11/07/2021 05:35:56 - INFO - __main__ - Step 59691: {'lr': 0.00033483425329137886, 'samples': 11460672, 'steps': 59690, 'loss/train': 1.566542148590088} -11/07/2021 05:35:57 - INFO - __main__ - Step 59692: {'lr': 0.00033482926140430253, 'samples': 11460864, 'steps': 59691, 'loss/train': 1.6093891859054565} -11/07/2021 05:35:57 - INFO - __main__ - Step 59693: {'lr': 0.00033482426947900346, 'samples': 11461056, 'steps': 59692, 'loss/train': 1.5558502674102783} -11/07/2021 05:35:57 - INFO - __main__ - Step 59694: {'lr': 0.0003348192775154839, 'samples': 11461248, 'steps': 59693, 'loss/train': 1.9984288215637207} -11/07/2021 05:35:58 - INFO - __main__ - Step 59695: {'lr': 0.000334814285513746, 'samples': 11461440, 'steps': 59694, 'loss/train': 1.259392261505127} -11/07/2021 05:35:59 - INFO - __main__ - Step 59696: {'lr': 0.0003348092934737922, 'samples': 11461632, 'steps': 59695, 'loss/train': 1.1630260944366455} -11/07/2021 05:35:59 - INFO - __main__ - Step 59697: {'lr': 0.00033480430139562456, 'samples': 11461824, 'steps': 59696, 'loss/train': 0.7738115191459656} -11/07/2021 05:35:59 - INFO - __main__ - Step 59698: {'lr': 0.00033479930927924543, 'samples': 11462016, 'steps': 59697, 'loss/train': 1.451158046722412} -11/07/2021 05:36:00 - INFO - __main__ - Step 59699: {'lr': 0.000334794317124657, 'samples': 11462208, 'steps': 59698, 'loss/train': 1.1373018026351929} -11/07/2021 05:36:00 - INFO - __main__ - Step 59700: {'lr': 0.00033478932493186163, 'samples': 11462400, 'steps': 59699, 'loss/train': 1.2634257078170776} -11/07/2021 05:36:01 - INFO - __main__ - Step 59701: {'lr': 0.0003347843327008615, 'samples': 11462592, 'steps': 59700, 'loss/train': 1.2875890731811523} -11/07/2021 05:36:02 - INFO - __main__ - Step 59702: {'lr': 0.0003347793404316589, 'samples': 11462784, 'steps': 59701, 'loss/train': 1.8182542324066162} -11/07/2021 05:36:02 - INFO - __main__ - Step 59703: {'lr': 0.00033477434812425596, 'samples': 11462976, 'steps': 59702, 'loss/train': 0.7015295624732971} -11/07/2021 05:36:02 - INFO - __main__ - Step 59704: {'lr': 0.00033476935577865497, 'samples': 11463168, 'steps': 59703, 'loss/train': 1.2705014944076538} -11/07/2021 05:36:03 - INFO - __main__ - Step 59705: {'lr': 0.0003347643633948583, 'samples': 11463360, 'steps': 59704, 'loss/train': 0.9029524922370911} -11/07/2021 05:36:04 - INFO - __main__ - Step 59706: {'lr': 0.00033475937097286805, 'samples': 11463552, 'steps': 59705, 'loss/train': 1.3314130306243896} -11/07/2021 05:36:04 - INFO - __main__ - Step 59707: {'lr': 0.00033475437851268657, 'samples': 11463744, 'steps': 59706, 'loss/train': 0.4221527874469757} -11/07/2021 05:36:04 - INFO - __main__ - Step 59708: {'lr': 0.0003347493860143161, 'samples': 11463936, 'steps': 59707, 'loss/train': 1.3227791786193848} -11/07/2021 05:36:05 - INFO - __main__ - Step 59709: {'lr': 0.0003347443934777589, 'samples': 11464128, 'steps': 59708, 'loss/train': 1.4634250402450562} -11/07/2021 05:36:05 - INFO - __main__ - Step 59710: {'lr': 0.0003347394009030171, 'samples': 11464320, 'steps': 59709, 'loss/train': 1.2356635332107544} -11/07/2021 05:36:06 - INFO - __main__ - Step 59711: {'lr': 0.00033473440829009303, 'samples': 11464512, 'steps': 59710, 'loss/train': 1.7734612226486206} -11/07/2021 05:36:06 - INFO - __main__ - Step 59712: {'lr': 0.00033472941563898897, 'samples': 11464704, 'steps': 59711, 'loss/train': 1.698994517326355} -11/07/2021 05:36:07 - INFO - __main__ - Step 59713: {'lr': 0.00033472442294970716, 'samples': 11464896, 'steps': 59712, 'loss/train': 1.3743351697921753} -11/07/2021 05:36:07 - INFO - __main__ - Step 59714: {'lr': 0.00033471943022224984, 'samples': 11465088, 'steps': 59713, 'loss/train': 1.2542681694030762} -11/07/2021 05:36:08 - INFO - __main__ - Step 59715: {'lr': 0.0003347144374566192, 'samples': 11465280, 'steps': 59714, 'loss/train': 1.762437105178833} -11/07/2021 05:36:09 - INFO - __main__ - Step 59716: {'lr': 0.00033470944465281753, 'samples': 11465472, 'steps': 59715, 'loss/train': 1.3514084815979004} -11/07/2021 05:36:09 - INFO - __main__ - Step 59717: {'lr': 0.00033470445181084716, 'samples': 11465664, 'steps': 59716, 'loss/train': 1.3770685195922852} -11/07/2021 05:36:09 - INFO - __main__ - Step 59718: {'lr': 0.0003346994589307102, 'samples': 11465856, 'steps': 59717, 'loss/train': 1.4346739053726196} -11/07/2021 05:36:10 - INFO - __main__ - Step 59719: {'lr': 0.00033469446601240907, 'samples': 11466048, 'steps': 59718, 'loss/train': 1.4784272909164429} -11/07/2021 05:36:10 - INFO - __main__ - Step 59720: {'lr': 0.00033468947305594586, 'samples': 11466240, 'steps': 59719, 'loss/train': 0.5607002377510071} -11/07/2021 05:36:11 - INFO - __main__ - Step 59721: {'lr': 0.0003346844800613229, 'samples': 11466432, 'steps': 59720, 'loss/train': 1.163059949874878} -11/07/2021 05:36:11 - INFO - __main__ - Step 59722: {'lr': 0.00033467948702854233, 'samples': 11466624, 'steps': 59721, 'loss/train': 1.3342009782791138} -11/07/2021 05:36:12 - INFO - __main__ - Step 59723: {'lr': 0.00033467449395760656, 'samples': 11466816, 'steps': 59722, 'loss/train': 1.665111780166626} -11/07/2021 05:36:12 - INFO - __main__ - Step 59724: {'lr': 0.0003346695008485179, 'samples': 11467008, 'steps': 59723, 'loss/train': 1.8015192747116089} -11/07/2021 05:36:13 - INFO - __main__ - Step 59725: {'lr': 0.00033466450770127824, 'samples': 11467200, 'steps': 59724, 'loss/train': 1.6405117511749268} -11/07/2021 05:36:13 - INFO - __main__ - Step 59726: {'lr': 0.0003346595145158902, 'samples': 11467392, 'steps': 59725, 'loss/train': 0.12103454768657684} -11/07/2021 05:36:14 - INFO - __main__ - Step 59727: {'lr': 0.00033465452129235584, 'samples': 11467584, 'steps': 59726, 'loss/train': 2.292454957962036} -11/07/2021 05:36:14 - INFO - __main__ - Step 59728: {'lr': 0.00033464952803067746, 'samples': 11467776, 'steps': 59727, 'loss/train': 1.4133906364440918} -11/07/2021 05:36:15 - INFO - __main__ - Step 59729: {'lr': 0.0003346445347308573, 'samples': 11467968, 'steps': 59728, 'loss/train': 1.6800386905670166} -11/07/2021 05:36:15 - INFO - __main__ - Step 59730: {'lr': 0.0003346395413928977, 'samples': 11468160, 'steps': 59729, 'loss/train': 1.228143334388733} -11/07/2021 05:36:16 - INFO - __main__ - Step 59731: {'lr': 0.0003346345480168007, 'samples': 11468352, 'steps': 59730, 'loss/train': 1.40749990940094} -11/07/2021 05:36:16 - INFO - __main__ - Step 59732: {'lr': 0.00033462955460256876, 'samples': 11468544, 'steps': 59731, 'loss/train': 1.4132229089736938} -11/07/2021 05:36:17 - INFO - __main__ - Step 59733: {'lr': 0.00033462456115020405, 'samples': 11468736, 'steps': 59732, 'loss/train': 1.8561713695526123} -11/07/2021 05:36:17 - INFO - __main__ - Step 59734: {'lr': 0.0003346195676597088, 'samples': 11468928, 'steps': 59733, 'loss/train': 1.4148104190826416} -11/07/2021 05:36:17 - INFO - __main__ - Step 59735: {'lr': 0.00033461457413108524, 'samples': 11469120, 'steps': 59734, 'loss/train': 1.4156752824783325} -11/07/2021 05:36:18 - INFO - __main__ - Step 59736: {'lr': 0.00033460958056433574, 'samples': 11469312, 'steps': 59735, 'loss/train': 1.3613808155059814} -11/07/2021 05:36:19 - INFO - __main__ - Step 59737: {'lr': 0.00033460458695946244, 'samples': 11469504, 'steps': 59736, 'loss/train': 1.300649881362915} -11/07/2021 05:36:19 - INFO - __main__ - Step 59738: {'lr': 0.0003345995933164676, 'samples': 11469696, 'steps': 59737, 'loss/train': 1.3083850145339966} -11/07/2021 05:36:19 - INFO - __main__ - Step 59739: {'lr': 0.0003345945996353535, 'samples': 11469888, 'steps': 59738, 'loss/train': 1.737492561340332} -11/07/2021 05:36:20 - INFO - __main__ - Step 59740: {'lr': 0.0003345896059161224, 'samples': 11470080, 'steps': 59739, 'loss/train': 1.0234007835388184} -11/07/2021 05:36:20 - INFO - __main__ - Step 59741: {'lr': 0.00033458461215877644, 'samples': 11470272, 'steps': 59740, 'loss/train': 1.4739450216293335} -11/07/2021 05:36:21 - INFO - __main__ - Step 59742: {'lr': 0.000334579618363318, 'samples': 11470464, 'steps': 59741, 'loss/train': 1.3406312465667725} -11/07/2021 05:36:21 - INFO - __main__ - Step 59743: {'lr': 0.0003345746245297494, 'samples': 11470656, 'steps': 59742, 'loss/train': 0.7481667399406433} -11/07/2021 05:36:22 - INFO - __main__ - Step 59744: {'lr': 0.00033456963065807264, 'samples': 11470848, 'steps': 59743, 'loss/train': 1.0869067907333374} -11/07/2021 05:36:22 - INFO - __main__ - Step 59745: {'lr': 0.0003345646367482902, 'samples': 11471040, 'steps': 59744, 'loss/train': 1.4960869550704956} -11/07/2021 05:36:22 - INFO - __main__ - Step 59746: {'lr': 0.00033455964280040417, 'samples': 11471232, 'steps': 59745, 'loss/train': 1.6462482213974} -11/07/2021 05:36:24 - INFO - __main__ - Step 59747: {'lr': 0.0003345546488144169, 'samples': 11471424, 'steps': 59746, 'loss/train': 1.2318847179412842} -11/07/2021 05:36:24 - INFO - __main__ - Step 59748: {'lr': 0.0003345496547903306, 'samples': 11471616, 'steps': 59747, 'loss/train': 1.2419209480285645} -11/07/2021 05:36:24 - INFO - __main__ - Step 59749: {'lr': 0.0003345446607281475, 'samples': 11471808, 'steps': 59748, 'loss/train': 0.16311971843242645} -11/07/2021 05:36:25 - INFO - __main__ - Step 59750: {'lr': 0.00033453966662786995, 'samples': 11472000, 'steps': 59749, 'loss/train': 1.2368395328521729} -11/07/2021 05:36:25 - INFO - __main__ - Step 59751: {'lr': 0.0003345346724895001, 'samples': 11472192, 'steps': 59750, 'loss/train': 1.3162906169891357} -11/07/2021 05:36:26 - INFO - __main__ - Step 59752: {'lr': 0.0003345296783130402, 'samples': 11472384, 'steps': 59751, 'loss/train': 1.7774964570999146} -11/07/2021 05:36:26 - INFO - __main__ - Step 59753: {'lr': 0.0003345246840984926, 'samples': 11472576, 'steps': 59752, 'loss/train': 1.8524725437164307} -11/07/2021 05:36:27 - INFO - __main__ - Step 59754: {'lr': 0.0003345196898458594, 'samples': 11472768, 'steps': 59753, 'loss/train': 1.4533371925354004} -11/07/2021 05:36:27 - INFO - __main__ - Step 59755: {'lr': 0.00033451469555514294, 'samples': 11472960, 'steps': 59754, 'loss/train': 1.2159703969955444} -11/07/2021 05:36:27 - INFO - __main__ - Step 59756: {'lr': 0.0003345097012263456, 'samples': 11473152, 'steps': 59755, 'loss/train': 1.1995917558670044} -11/07/2021 05:36:29 - INFO - __main__ - Step 59757: {'lr': 0.0003345047068594694, 'samples': 11473344, 'steps': 59756, 'loss/train': 1.2755703926086426} -11/07/2021 05:36:29 - INFO - __main__ - Step 59758: {'lr': 0.0003344997124545166, 'samples': 11473536, 'steps': 59757, 'loss/train': 1.3318367004394531} -11/07/2021 05:36:29 - INFO - __main__ - Step 59759: {'lr': 0.00033449471801148963, 'samples': 11473728, 'steps': 59758, 'loss/train': 2.1833062171936035} -11/07/2021 05:36:30 - INFO - __main__ - Step 59760: {'lr': 0.00033448972353039065, 'samples': 11473920, 'steps': 59759, 'loss/train': 1.5835164785385132} -11/07/2021 05:36:30 - INFO - __main__ - Step 59761: {'lr': 0.00033448472901122185, 'samples': 11474112, 'steps': 59760, 'loss/train': 1.106222152709961} -11/07/2021 05:36:31 - INFO - __main__ - Step 59762: {'lr': 0.0003344797344539855, 'samples': 11474304, 'steps': 59761, 'loss/train': 1.3897550106048584} -11/07/2021 05:36:31 - INFO - __main__ - Step 59763: {'lr': 0.000334474739858684, 'samples': 11474496, 'steps': 59762, 'loss/train': 0.879180371761322} -11/07/2021 05:36:32 - INFO - __main__ - Step 59764: {'lr': 0.0003344697452253195, 'samples': 11474688, 'steps': 59763, 'loss/train': 1.3495070934295654} -11/07/2021 05:36:32 - INFO - __main__ - Step 59765: {'lr': 0.00033446475055389413, 'samples': 11474880, 'steps': 59764, 'loss/train': 1.703831434249878} -11/07/2021 05:36:32 - INFO - __main__ - Step 59766: {'lr': 0.00033445975584441023, 'samples': 11475072, 'steps': 59765, 'loss/train': 1.5049314498901367} -11/07/2021 05:36:33 - INFO - __main__ - Step 59767: {'lr': 0.00033445476109687013, 'samples': 11475264, 'steps': 59766, 'loss/train': 1.7458064556121826} -11/07/2021 05:36:34 - INFO - __main__ - Step 59768: {'lr': 0.000334449766311276, 'samples': 11475456, 'steps': 59767, 'loss/train': 1.2554872035980225} -11/07/2021 05:36:34 - INFO - __main__ - Step 59769: {'lr': 0.00033444477148763006, 'samples': 11475648, 'steps': 59768, 'loss/train': 0.7513704895973206} -11/07/2021 05:36:34 - INFO - __main__ - Step 59770: {'lr': 0.0003344397766259348, 'samples': 11475840, 'steps': 59769, 'loss/train': 1.1398470401763916} -11/07/2021 05:36:35 - INFO - __main__ - Step 59771: {'lr': 0.0003344347817261921, 'samples': 11476032, 'steps': 59770, 'loss/train': 1.2013721466064453} -11/07/2021 05:36:35 - INFO - __main__ - Step 59772: {'lr': 0.0003344297867884044, 'samples': 11476224, 'steps': 59771, 'loss/train': 0.7768096327781677} -11/07/2021 05:36:36 - INFO - __main__ - Step 59773: {'lr': 0.000334424791812574, 'samples': 11476416, 'steps': 59772, 'loss/train': 1.5392483472824097} -11/07/2021 05:36:37 - INFO - __main__ - Step 59774: {'lr': 0.00033441979679870305, 'samples': 11476608, 'steps': 59773, 'loss/train': 1.5798436403274536} -11/07/2021 05:36:37 - INFO - __main__ - Step 59775: {'lr': 0.00033441480174679385, 'samples': 11476800, 'steps': 59774, 'loss/train': 1.1530206203460693} -11/07/2021 05:36:37 - INFO - __main__ - Step 59776: {'lr': 0.00033440980665684866, 'samples': 11476992, 'steps': 59775, 'loss/train': 1.7026039361953735} -11/07/2021 05:36:38 - INFO - __main__ - Step 59777: {'lr': 0.00033440481152886977, 'samples': 11477184, 'steps': 59776, 'loss/train': 2.033388376235962} -11/07/2021 05:36:39 - INFO - __main__ - Step 59778: {'lr': 0.00033439981636285935, 'samples': 11477376, 'steps': 59777, 'loss/train': 0.8706176280975342} -11/07/2021 05:36:39 - INFO - __main__ - Step 59779: {'lr': 0.0003343948211588196, 'samples': 11477568, 'steps': 59778, 'loss/train': 1.307417869567871} -11/07/2021 05:36:39 - INFO - __main__ - Step 59780: {'lr': 0.00033438982591675284, 'samples': 11477760, 'steps': 59779, 'loss/train': 0.745901346206665} -11/07/2021 05:36:40 - INFO - __main__ - Step 59781: {'lr': 0.00033438483063666136, 'samples': 11477952, 'steps': 59780, 'loss/train': 1.1092472076416016} -11/07/2021 05:36:40 - INFO - __main__ - Step 59782: {'lr': 0.0003343798353185474, 'samples': 11478144, 'steps': 59781, 'loss/train': 1.6200780868530273} -11/07/2021 05:36:41 - INFO - __main__ - Step 59783: {'lr': 0.0003343748399624131, 'samples': 11478336, 'steps': 59782, 'loss/train': 0.8787214756011963} -11/07/2021 05:36:42 - INFO - __main__ - Step 59784: {'lr': 0.00033436984456826097, 'samples': 11478528, 'steps': 59783, 'loss/train': 1.573609709739685} -11/07/2021 05:36:42 - INFO - __main__ - Step 59785: {'lr': 0.000334364849136093, 'samples': 11478720, 'steps': 59784, 'loss/train': 1.411788821220398} -11/07/2021 05:36:42 - INFO - __main__ - Step 59786: {'lr': 0.0003343598536659115, 'samples': 11478912, 'steps': 59785, 'loss/train': 1.3767591714859009} -11/07/2021 05:36:43 - INFO - __main__ - Step 59787: {'lr': 0.00033435485815771875, 'samples': 11479104, 'steps': 59786, 'loss/train': 1.462869644165039} -11/07/2021 05:36:44 - INFO - __main__ - Step 59788: {'lr': 0.00033434986261151705, 'samples': 11479296, 'steps': 59787, 'loss/train': 1.5607069730758667} -11/07/2021 05:36:44 - INFO - __main__ - Step 59789: {'lr': 0.0003343448670273086, 'samples': 11479488, 'steps': 59788, 'loss/train': 1.6731963157653809} -11/07/2021 05:36:44 - INFO - __main__ - Step 59790: {'lr': 0.00033433987140509566, 'samples': 11479680, 'steps': 59789, 'loss/train': 0.9215992093086243} -11/07/2021 05:36:45 - INFO - __main__ - Step 59791: {'lr': 0.0003343348757448804, 'samples': 11479872, 'steps': 59790, 'loss/train': 1.42835533618927} -11/07/2021 05:36:45 - INFO - __main__ - Step 59792: {'lr': 0.0003343298800466652, 'samples': 11480064, 'steps': 59791, 'loss/train': 0.590241551399231} -11/07/2021 05:36:46 - INFO - __main__ - Step 59793: {'lr': 0.0003343248843104523, 'samples': 11480256, 'steps': 59792, 'loss/train': 1.6024614572525024} -11/07/2021 05:36:46 - INFO - __main__ - Step 59794: {'lr': 0.00033431988853624384, 'samples': 11480448, 'steps': 59793, 'loss/train': 1.5865528583526611} -11/07/2021 05:36:47 - INFO - __main__ - Step 59795: {'lr': 0.00033431489272404215, 'samples': 11480640, 'steps': 59794, 'loss/train': 1.3040661811828613} -11/07/2021 05:36:47 - INFO - __main__ - Step 59796: {'lr': 0.0003343098968738495, 'samples': 11480832, 'steps': 59795, 'loss/train': 1.4046781063079834} -11/07/2021 05:36:47 - INFO - __main__ - Step 59797: {'lr': 0.00033430490098566813, 'samples': 11481024, 'steps': 59796, 'loss/train': 1.5291950702667236} -11/07/2021 05:36:48 - INFO - __main__ - Step 59798: {'lr': 0.00033429990505950025, 'samples': 11481216, 'steps': 59797, 'loss/train': 1.2005763053894043} -11/07/2021 05:36:49 - INFO - __main__ - Step 59799: {'lr': 0.0003342949090953481, 'samples': 11481408, 'steps': 59798, 'loss/train': 1.9645662307739258} -11/07/2021 05:36:49 - INFO - __main__ - Step 59800: {'lr': 0.000334289913093214, 'samples': 11481600, 'steps': 59799, 'loss/train': 1.816665768623352} -11/07/2021 05:36:49 - INFO - __main__ - Step 59801: {'lr': 0.0003342849170531001, 'samples': 11481792, 'steps': 59800, 'loss/train': 1.27961266040802} -11/07/2021 05:36:50 - INFO - __main__ - Step 59802: {'lr': 0.00033427992097500876, 'samples': 11481984, 'steps': 59801, 'loss/train': 1.76497220993042} -11/07/2021 05:36:51 - INFO - __main__ - Step 59803: {'lr': 0.00033427492485894216, 'samples': 11482176, 'steps': 59802, 'loss/train': 1.549760103225708} -11/07/2021 05:36:51 - INFO - __main__ - Step 59804: {'lr': 0.0003342699287049027, 'samples': 11482368, 'steps': 59803, 'loss/train': 1.2277553081512451} -11/07/2021 05:36:51 - INFO - __main__ - Step 59805: {'lr': 0.0003342649325128924, 'samples': 11482560, 'steps': 59804, 'loss/train': 1.6004462242126465} -11/07/2021 05:36:52 - INFO - __main__ - Step 59806: {'lr': 0.00033425993628291367, 'samples': 11482752, 'steps': 59805, 'loss/train': 1.6093926429748535} -11/07/2021 05:36:52 - INFO - __main__ - Step 59807: {'lr': 0.0003342549400149687, 'samples': 11482944, 'steps': 59806, 'loss/train': 0.9378297924995422} -11/07/2021 05:36:53 - INFO - __main__ - Step 59808: {'lr': 0.0003342499437090597, 'samples': 11483136, 'steps': 59807, 'loss/train': 1.5748845338821411} -11/07/2021 05:36:54 - INFO - __main__ - Step 59809: {'lr': 0.000334244947365189, 'samples': 11483328, 'steps': 59808, 'loss/train': 1.2187085151672363} -11/07/2021 05:36:54 - INFO - __main__ - Step 59810: {'lr': 0.00033423995098335886, 'samples': 11483520, 'steps': 59809, 'loss/train': 1.9742186069488525} -11/07/2021 05:36:54 - INFO - __main__ - Step 59811: {'lr': 0.00033423495456357156, 'samples': 11483712, 'steps': 59810, 'loss/train': 1.3039319515228271} -11/07/2021 05:36:55 - INFO - __main__ - Step 59812: {'lr': 0.00033422995810582917, 'samples': 11483904, 'steps': 59811, 'loss/train': 1.3863568305969238} -11/07/2021 05:36:56 - INFO - __main__ - Step 59813: {'lr': 0.0003342249616101341, 'samples': 11484096, 'steps': 59812, 'loss/train': 1.435603380203247} -11/07/2021 05:36:56 - INFO - __main__ - Step 59814: {'lr': 0.0003342199650764886, 'samples': 11484288, 'steps': 59813, 'loss/train': 1.6086353063583374} -11/07/2021 05:36:56 - INFO - __main__ - Step 59815: {'lr': 0.0003342149685048949, 'samples': 11484480, 'steps': 59814, 'loss/train': 1.496732234954834} -11/07/2021 05:36:57 - INFO - __main__ - Step 59816: {'lr': 0.0003342099718953551, 'samples': 11484672, 'steps': 59815, 'loss/train': 1.3912758827209473} -11/07/2021 05:36:57 - INFO - __main__ - Step 59817: {'lr': 0.00033420497524787177, 'samples': 11484864, 'steps': 59816, 'loss/train': 1.4049148559570312} -11/07/2021 05:36:58 - INFO - __main__ - Step 59818: {'lr': 0.0003341999785624468, 'samples': 11485056, 'steps': 59817, 'loss/train': 1.3746356964111328} -11/07/2021 05:36:58 - INFO - __main__ - Step 59819: {'lr': 0.0003341949818390827, 'samples': 11485248, 'steps': 59818, 'loss/train': 0.8529001474380493} -11/07/2021 05:36:59 - INFO - __main__ - Step 59820: {'lr': 0.00033418998507778164, 'samples': 11485440, 'steps': 59819, 'loss/train': 1.4577114582061768} -11/07/2021 05:36:59 - INFO - __main__ - Step 59821: {'lr': 0.00033418498827854587, 'samples': 11485632, 'steps': 59820, 'loss/train': 1.522295355796814} -11/07/2021 05:36:59 - INFO - __main__ - Step 59822: {'lr': 0.0003341799914413776, 'samples': 11485824, 'steps': 59821, 'loss/train': 1.6530967950820923} -11/07/2021 05:37:01 - INFO - __main__ - Step 59823: {'lr': 0.0003341749945662792, 'samples': 11486016, 'steps': 59822, 'loss/train': 1.5433629751205444} -11/07/2021 05:37:01 - INFO - __main__ - Step 59824: {'lr': 0.00033416999765325286, 'samples': 11486208, 'steps': 59823, 'loss/train': 1.4311084747314453} -11/07/2021 05:37:01 - INFO - __main__ - Step 59825: {'lr': 0.0003341650007023008, 'samples': 11486400, 'steps': 59824, 'loss/train': 1.3693621158599854} -11/07/2021 05:37:02 - INFO - __main__ - Step 59826: {'lr': 0.0003341600037134252, 'samples': 11486592, 'steps': 59825, 'loss/train': 1.2301878929138184} -11/07/2021 05:37:02 - INFO - __main__ - Step 59827: {'lr': 0.00033415500668662845, 'samples': 11486784, 'steps': 59826, 'loss/train': 1.6107709407806396} -11/07/2021 05:37:02 - INFO - __main__ - Step 59828: {'lr': 0.00033415000962191277, 'samples': 11486976, 'steps': 59827, 'loss/train': 1.178155779838562} -11/07/2021 05:37:03 - INFO - __main__ - Step 59829: {'lr': 0.0003341450125192804, 'samples': 11487168, 'steps': 59828, 'loss/train': 1.3227167129516602} -11/07/2021 05:37:04 - INFO - __main__ - Step 59830: {'lr': 0.0003341400153787336, 'samples': 11487360, 'steps': 59829, 'loss/train': 1.284824013710022} -11/07/2021 05:37:04 - INFO - __main__ - Step 59831: {'lr': 0.00033413501820027456, 'samples': 11487552, 'steps': 59830, 'loss/train': 1.378790259361267} -11/07/2021 05:37:04 - INFO - __main__ - Step 59832: {'lr': 0.00033413002098390567, 'samples': 11487744, 'steps': 59831, 'loss/train': 0.932711124420166} -11/07/2021 05:37:05 - INFO - __main__ - Step 59833: {'lr': 0.00033412502372962894, 'samples': 11487936, 'steps': 59832, 'loss/train': 1.0881677865982056} -11/07/2021 05:37:06 - INFO - __main__ - Step 59834: {'lr': 0.0003341200264374469, 'samples': 11488128, 'steps': 59833, 'loss/train': 1.1093249320983887} -11/07/2021 05:37:06 - INFO - __main__ - Step 59835: {'lr': 0.0003341150291073616, 'samples': 11488320, 'steps': 59834, 'loss/train': 1.4371024370193481} -11/07/2021 05:37:06 - INFO - __main__ - Step 59836: {'lr': 0.0003341100317393754, 'samples': 11488512, 'steps': 59835, 'loss/train': 1.6734120845794678} -11/07/2021 05:37:07 - INFO - __main__ - Step 59837: {'lr': 0.00033410503433349055, 'samples': 11488704, 'steps': 59836, 'loss/train': 1.3474565744400024} -11/07/2021 05:37:07 - INFO - __main__ - Step 59838: {'lr': 0.00033410003688970927, 'samples': 11488896, 'steps': 59837, 'loss/train': 3.1182456016540527} -11/07/2021 05:37:08 - INFO - __main__ - Step 59839: {'lr': 0.0003340950394080337, 'samples': 11489088, 'steps': 59838, 'loss/train': 1.438690423965454} -11/07/2021 05:37:09 - INFO - __main__ - Step 59840: {'lr': 0.0003340900418884663, 'samples': 11489280, 'steps': 59839, 'loss/train': 1.6547439098358154} -11/07/2021 05:37:09 - INFO - __main__ - Step 59841: {'lr': 0.00033408504433100916, 'samples': 11489472, 'steps': 59840, 'loss/train': 1.5318498611450195} -11/07/2021 05:37:09 - INFO - __main__ - Step 59842: {'lr': 0.0003340800467356647, 'samples': 11489664, 'steps': 59841, 'loss/train': 0.697304368019104} -11/07/2021 05:37:10 - INFO - __main__ - Step 59843: {'lr': 0.00033407504910243504, 'samples': 11489856, 'steps': 59842, 'loss/train': 1.1265060901641846} -11/07/2021 05:37:10 - INFO - __main__ - Step 59844: {'lr': 0.0003340700514313224, 'samples': 11490048, 'steps': 59843, 'loss/train': 1.5800620317459106} -11/07/2021 05:37:11 - INFO - __main__ - Step 59845: {'lr': 0.0003340650537223291, 'samples': 11490240, 'steps': 59844, 'loss/train': 1.636988878250122} -11/07/2021 05:37:11 - INFO - __main__ - Step 59846: {'lr': 0.0003340600559754574, 'samples': 11490432, 'steps': 59845, 'loss/train': 2.1109626293182373} -11/07/2021 05:37:12 - INFO - __main__ - Step 59847: {'lr': 0.0003340550581907095, 'samples': 11490624, 'steps': 59846, 'loss/train': 1.8847805261611938} -11/07/2021 05:37:12 - INFO - __main__ - Step 59848: {'lr': 0.0003340500603680878, 'samples': 11490816, 'steps': 59847, 'loss/train': 1.22675359249115} -11/07/2021 05:37:12 - INFO - __main__ - Step 59849: {'lr': 0.00033404506250759436, 'samples': 11491008, 'steps': 59848, 'loss/train': 1.5579403638839722} -11/07/2021 05:37:13 - INFO - __main__ - Step 59850: {'lr': 0.0003340400646092315, 'samples': 11491200, 'steps': 59849, 'loss/train': 1.0249091386795044} -11/07/2021 05:37:14 - INFO - __main__ - Step 59851: {'lr': 0.0003340350666730015, 'samples': 11491392, 'steps': 59850, 'loss/train': 1.398000717163086} -11/07/2021 05:37:14 - INFO - __main__ - Step 59852: {'lr': 0.0003340300686989066, 'samples': 11491584, 'steps': 59851, 'loss/train': 1.31829035282135} -11/07/2021 05:37:15 - INFO - __main__ - Step 59853: {'lr': 0.0003340250706869491, 'samples': 11491776, 'steps': 59852, 'loss/train': 1.0441431999206543} -11/07/2021 05:37:15 - INFO - __main__ - Step 59854: {'lr': 0.00033402007263713115, 'samples': 11491968, 'steps': 59853, 'loss/train': 1.3283215761184692} -11/07/2021 05:37:16 - INFO - __main__ - Step 59855: {'lr': 0.000334015074549455, 'samples': 11492160, 'steps': 59854, 'loss/train': 1.2623116970062256} -11/07/2021 05:37:16 - INFO - __main__ - Step 59856: {'lr': 0.000334010076423923, 'samples': 11492352, 'steps': 59855, 'loss/train': 1.3793851137161255} -11/07/2021 05:37:17 - INFO - __main__ - Step 59857: {'lr': 0.00033400507826053733, 'samples': 11492544, 'steps': 59856, 'loss/train': 1.8009610176086426} -11/07/2021 05:37:17 - INFO - __main__ - Step 59858: {'lr': 0.0003340000800593004, 'samples': 11492736, 'steps': 59857, 'loss/train': 0.09556188434362411} -11/07/2021 05:37:17 - INFO - __main__ - Step 59859: {'lr': 0.0003339950818202142, 'samples': 11492928, 'steps': 59858, 'loss/train': 1.0893874168395996} -11/07/2021 05:37:18 - INFO - __main__ - Step 59860: {'lr': 0.00033399008354328106, 'samples': 11493120, 'steps': 59859, 'loss/train': 1.4364213943481445} -11/07/2021 05:37:19 - INFO - __main__ - Step 59861: {'lr': 0.0003339850852285034, 'samples': 11493312, 'steps': 59860, 'loss/train': 1.5607722997665405} -11/07/2021 05:37:19 - INFO - __main__ - Step 59862: {'lr': 0.00033398008687588333, 'samples': 11493504, 'steps': 59861, 'loss/train': 1.3319916725158691} -11/07/2021 05:37:19 - INFO - __main__ - Step 59863: {'lr': 0.00033397508848542306, 'samples': 11493696, 'steps': 59862, 'loss/train': 1.4987218379974365} -11/07/2021 05:37:20 - INFO - __main__ - Step 59864: {'lr': 0.000333970090057125, 'samples': 11493888, 'steps': 59863, 'loss/train': 1.1037565469741821} -11/07/2021 05:37:21 - INFO - __main__ - Step 59865: {'lr': 0.00033396509159099133, 'samples': 11494080, 'steps': 59864, 'loss/train': 1.326676845550537} -11/07/2021 05:37:21 - INFO - __main__ - Step 59866: {'lr': 0.00033396009308702426, 'samples': 11494272, 'steps': 59865, 'loss/train': 1.9202079772949219} -11/07/2021 05:37:22 - INFO - __main__ - Step 59867: {'lr': 0.000333955094545226, 'samples': 11494464, 'steps': 59866, 'loss/train': 1.259358286857605} -11/07/2021 05:37:22 - INFO - __main__ - Step 59868: {'lr': 0.00033395009596559887, 'samples': 11494656, 'steps': 59867, 'loss/train': 1.3198281526565552} -11/07/2021 05:37:22 - INFO - __main__ - Step 59869: {'lr': 0.00033394509734814516, 'samples': 11494848, 'steps': 59868, 'loss/train': 1.099117636680603} -11/07/2021 05:37:23 - INFO - __main__ - Step 59870: {'lr': 0.0003339400986928671, 'samples': 11495040, 'steps': 59869, 'loss/train': 1.5058186054229736} -11/07/2021 05:37:24 - INFO - __main__ - Step 59871: {'lr': 0.000333935099999767, 'samples': 11495232, 'steps': 59870, 'loss/train': 1.140355110168457} -11/07/2021 05:37:24 - INFO - __main__ - Step 59872: {'lr': 0.00033393010126884696, 'samples': 11495424, 'steps': 59871, 'loss/train': 2.3761146068573} -11/07/2021 05:37:24 - INFO - __main__ - Step 59873: {'lr': 0.00033392510250010926, 'samples': 11495616, 'steps': 59872, 'loss/train': 1.3409818410873413} -11/07/2021 05:37:25 - INFO - __main__ - Step 59874: {'lr': 0.00033392010369355627, 'samples': 11495808, 'steps': 59873, 'loss/train': 1.6499170064926147} -11/07/2021 05:37:25 - INFO - __main__ - Step 59875: {'lr': 0.00033391510484919015, 'samples': 11496000, 'steps': 59874, 'loss/train': 0.8844736814498901} -11/07/2021 05:37:26 - INFO - __main__ - Step 59876: {'lr': 0.00033391010596701314, 'samples': 11496192, 'steps': 59875, 'loss/train': 1.285159945487976} -11/07/2021 05:37:27 - INFO - __main__ - Step 59877: {'lr': 0.0003339051070470276, 'samples': 11496384, 'steps': 59876, 'loss/train': 2.0157523155212402} -11/07/2021 05:37:27 - INFO - __main__ - Step 59878: {'lr': 0.00033390010808923573, 'samples': 11496576, 'steps': 59877, 'loss/train': 1.7896143198013306} -11/07/2021 05:37:27 - INFO - __main__ - Step 59879: {'lr': 0.00033389510909363974, 'samples': 11496768, 'steps': 59878, 'loss/train': 1.4786338806152344} -11/07/2021 05:37:28 - INFO - __main__ - Step 59880: {'lr': 0.00033389011006024183, 'samples': 11496960, 'steps': 59879, 'loss/train': 1.577348232269287} -11/07/2021 05:37:28 - INFO - __main__ - Step 59881: {'lr': 0.0003338851109890444, 'samples': 11497152, 'steps': 59880, 'loss/train': 0.7143099904060364} -11/07/2021 05:37:29 - INFO - __main__ - Step 59882: {'lr': 0.00033388011188004965, 'samples': 11497344, 'steps': 59881, 'loss/train': 1.6632063388824463} -11/07/2021 05:37:29 - INFO - __main__ - Step 59883: {'lr': 0.00033387511273325976, 'samples': 11497536, 'steps': 59882, 'loss/train': 1.4234802722930908} -11/07/2021 05:37:30 - INFO - __main__ - Step 59884: {'lr': 0.0003338701135486771, 'samples': 11497728, 'steps': 59883, 'loss/train': 2.193471908569336} -11/07/2021 05:37:30 - INFO - __main__ - Step 59885: {'lr': 0.0003338651143263038, 'samples': 11497920, 'steps': 59884, 'loss/train': 1.4223037958145142} -11/07/2021 05:37:31 - INFO - __main__ - Step 59886: {'lr': 0.0003338601150661423, 'samples': 11498112, 'steps': 59885, 'loss/train': 0.952494740486145} -11/07/2021 05:37:31 - INFO - __main__ - Step 59887: {'lr': 0.0003338551157681946, 'samples': 11498304, 'steps': 59886, 'loss/train': 1.3072333335876465} -11/07/2021 05:37:32 - INFO - __main__ - Step 59888: {'lr': 0.00033385011643246313, 'samples': 11498496, 'steps': 59887, 'loss/train': 0.570316731929779} -11/07/2021 05:37:32 - INFO - __main__ - Step 59889: {'lr': 0.00033384511705895003, 'samples': 11498688, 'steps': 59888, 'loss/train': 1.7107895612716675} -11/07/2021 05:37:33 - INFO - __main__ - Step 59890: {'lr': 0.00033384011764765764, 'samples': 11498880, 'steps': 59889, 'loss/train': 1.3058995008468628} -11/07/2021 05:37:33 - INFO - __main__ - Step 59891: {'lr': 0.0003338351181985882, 'samples': 11499072, 'steps': 59890, 'loss/train': 1.1536494493484497} -11/07/2021 05:37:33 - INFO - __main__ - Step 59892: {'lr': 0.000333830118711744, 'samples': 11499264, 'steps': 59891, 'loss/train': 1.3105016946792603} -11/07/2021 05:37:34 - INFO - __main__ - Step 59893: {'lr': 0.00033382511918712723, 'samples': 11499456, 'steps': 59892, 'loss/train': 1.7648695707321167} -11/07/2021 05:37:35 - INFO - __main__ - Step 59894: {'lr': 0.00033382011962474004, 'samples': 11499648, 'steps': 59893, 'loss/train': 1.2767893075942993} -11/07/2021 05:37:35 - INFO - __main__ - Step 59895: {'lr': 0.0003338151200245849, 'samples': 11499840, 'steps': 59894, 'loss/train': 1.6090312004089355} -11/07/2021 05:37:35 - INFO - __main__ - Step 59896: {'lr': 0.000333810120386664, 'samples': 11500032, 'steps': 59895, 'loss/train': 1.5503777265548706} -11/07/2021 05:37:36 - INFO - __main__ - Step 59897: {'lr': 0.00033380512071097947, 'samples': 11500224, 'steps': 59896, 'loss/train': 1.195521593093872} -11/07/2021 05:37:37 - INFO - __main__ - Step 59898: {'lr': 0.00033380012099753364, 'samples': 11500416, 'steps': 59897, 'loss/train': 1.4737271070480347} -11/07/2021 05:37:37 - INFO - __main__ - Step 59899: {'lr': 0.00033379512124632885, 'samples': 11500608, 'steps': 59898, 'loss/train': 1.5121731758117676} -11/07/2021 05:37:38 - INFO - __main__ - Step 59900: {'lr': 0.0003337901214573672, 'samples': 11500800, 'steps': 59899, 'loss/train': 1.6407800912857056} -11/07/2021 05:37:38 - INFO - __main__ - Step 59901: {'lr': 0.000333785121630651, 'samples': 11500992, 'steps': 59900, 'loss/train': 1.5833220481872559} -11/07/2021 05:37:38 - INFO - __main__ - Step 59902: {'lr': 0.0003337801217661826, 'samples': 11501184, 'steps': 59901, 'loss/train': 1.5912500619888306} -11/07/2021 05:37:40 - INFO - __main__ - Step 59903: {'lr': 0.0003337751218639641, 'samples': 11501376, 'steps': 59902, 'loss/train': 1.6189994812011719} -11/07/2021 05:37:40 - INFO - __main__ - Step 59904: {'lr': 0.0003337701219239978, 'samples': 11501568, 'steps': 59903, 'loss/train': 1.056644082069397} -11/07/2021 05:37:40 - INFO - __main__ - Step 59905: {'lr': 0.00033376512194628605, 'samples': 11501760, 'steps': 59904, 'loss/train': 1.5313489437103271} -11/07/2021 05:37:41 - INFO - __main__ - Step 59906: {'lr': 0.000333760121930831, 'samples': 11501952, 'steps': 59905, 'loss/train': 1.311906099319458} -11/07/2021 05:37:41 - INFO - __main__ - Step 59907: {'lr': 0.0003337551218776349, 'samples': 11502144, 'steps': 59906, 'loss/train': 1.4480106830596924} -11/07/2021 05:37:42 - INFO - __main__ - Step 59908: {'lr': 0.0003337501217867001, 'samples': 11502336, 'steps': 59907, 'loss/train': 0.07434665411710739} -11/07/2021 05:37:42 - INFO - __main__ - Step 59909: {'lr': 0.00033374512165802874, 'samples': 11502528, 'steps': 59908, 'loss/train': 1.4887604713439941} -11/07/2021 05:37:43 - INFO - __main__ - Step 59910: {'lr': 0.00033374012149162314, 'samples': 11502720, 'steps': 59909, 'loss/train': 1.267632007598877} -11/07/2021 05:37:43 - INFO - __main__ - Step 59911: {'lr': 0.0003337351212874856, 'samples': 11502912, 'steps': 59910, 'loss/train': 1.438001036643982} -11/07/2021 05:37:43 - INFO - __main__ - Step 59912: {'lr': 0.00033373012104561815, 'samples': 11503104, 'steps': 59911, 'loss/train': 1.8732619285583496} -11/07/2021 05:37:44 - INFO - __main__ - Step 59913: {'lr': 0.0003337251207660233, 'samples': 11503296, 'steps': 59912, 'loss/train': 1.391196608543396} -11/07/2021 05:37:45 - INFO - __main__ - Step 59914: {'lr': 0.00033372012044870317, 'samples': 11503488, 'steps': 59913, 'loss/train': 1.5033156871795654} -11/07/2021 05:37:45 - INFO - __main__ - Step 59915: {'lr': 0.00033371512009366006, 'samples': 11503680, 'steps': 59914, 'loss/train': 1.3974770307540894} -11/07/2021 05:37:45 - INFO - __main__ - Step 59916: {'lr': 0.0003337101197008962, 'samples': 11503872, 'steps': 59915, 'loss/train': 1.5923370122909546} -11/07/2021 05:37:46 - INFO - __main__ - Step 59917: {'lr': 0.00033370511927041386, 'samples': 11504064, 'steps': 59916, 'loss/train': 1.885499358177185} -11/07/2021 05:37:47 - INFO - __main__ - Step 59918: {'lr': 0.0003337001188022153, 'samples': 11504256, 'steps': 59917, 'loss/train': 1.192004919052124} -11/07/2021 05:37:47 - INFO - __main__ - Step 59919: {'lr': 0.0003336951182963027, 'samples': 11504448, 'steps': 59918, 'loss/train': 1.1246466636657715} -11/07/2021 05:37:48 - INFO - __main__ - Step 59920: {'lr': 0.0003336901177526784, 'samples': 11504640, 'steps': 59919, 'loss/train': 1.2675156593322754} -11/07/2021 05:37:48 - INFO - __main__ - Step 59921: {'lr': 0.0003336851171713447, 'samples': 11504832, 'steps': 59920, 'loss/train': 1.1757452487945557} -11/07/2021 05:37:48 - INFO - __main__ - Step 59922: {'lr': 0.00033368011655230366, 'samples': 11505024, 'steps': 59921, 'loss/train': 1.2680805921554565} -11/07/2021 05:37:49 - INFO - __main__ - Step 59923: {'lr': 0.0003336751158955577, 'samples': 11505216, 'steps': 59922, 'loss/train': 1.0946545600891113} -11/07/2021 05:37:50 - INFO - __main__ - Step 59924: {'lr': 0.00033367011520110906, 'samples': 11505408, 'steps': 59923, 'loss/train': 1.6121041774749756} -11/07/2021 05:37:50 - INFO - __main__ - Step 59925: {'lr': 0.00033366511446896, 'samples': 11505600, 'steps': 59924, 'loss/train': 1.5153909921646118} -11/07/2021 05:37:50 - INFO - __main__ - Step 59926: {'lr': 0.0003336601136991126, 'samples': 11505792, 'steps': 59925, 'loss/train': 0.9676465392112732} -11/07/2021 05:37:51 - INFO - __main__ - Step 59927: {'lr': 0.0003336551128915693, 'samples': 11505984, 'steps': 59926, 'loss/train': 1.4178122282028198} -11/07/2021 05:37:51 - INFO - __main__ - Step 59928: {'lr': 0.00033365011204633234, 'samples': 11506176, 'steps': 59927, 'loss/train': 1.9650468826293945} -11/07/2021 05:37:52 - INFO - __main__ - Step 59929: {'lr': 0.0003336451111634038, 'samples': 11506368, 'steps': 59928, 'loss/train': 0.666279673576355} -11/07/2021 05:37:53 - INFO - __main__ - Step 59930: {'lr': 0.00033364011024278616, 'samples': 11506560, 'steps': 59929, 'loss/train': 1.2978079319000244} -11/07/2021 05:37:53 - INFO - __main__ - Step 59931: {'lr': 0.0003336351092844816, 'samples': 11506752, 'steps': 59930, 'loss/train': 1.436763882637024} -11/07/2021 05:37:53 - INFO - __main__ - Step 59932: {'lr': 0.0003336301082884924, 'samples': 11506944, 'steps': 59931, 'loss/train': 1.1624747514724731} -11/07/2021 05:37:54 - INFO - __main__ - Step 59933: {'lr': 0.00033362510725482063, 'samples': 11507136, 'steps': 59932, 'loss/train': 1.6544556617736816} -11/07/2021 05:37:55 - INFO - __main__ - Step 59934: {'lr': 0.0003336201061834687, 'samples': 11507328, 'steps': 59933, 'loss/train': 1.6201013326644897} -11/07/2021 05:37:55 - INFO - __main__ - Step 59935: {'lr': 0.0003336151050744389, 'samples': 11507520, 'steps': 59934, 'loss/train': 1.6059478521347046} -11/07/2021 05:37:55 - INFO - __main__ - Step 59936: {'lr': 0.00033361010392773336, 'samples': 11507712, 'steps': 59935, 'loss/train': 1.707397222518921} -11/07/2021 05:37:56 - INFO - __main__ - Step 59937: {'lr': 0.0003336051027433544, 'samples': 11507904, 'steps': 59936, 'loss/train': 0.16855694353580475} -11/07/2021 05:37:56 - INFO - __main__ - Step 59938: {'lr': 0.00033360010152130436, 'samples': 11508096, 'steps': 59937, 'loss/train': 1.3239763975143433} -11/07/2021 05:37:57 - INFO - __main__ - Step 59939: {'lr': 0.00033359510026158534, 'samples': 11508288, 'steps': 59938, 'loss/train': 1.1314833164215088} -11/07/2021 05:37:58 - INFO - __main__ - Step 59940: {'lr': 0.00033359009896419966, 'samples': 11508480, 'steps': 59939, 'loss/train': 1.8635438680648804} -11/07/2021 05:37:58 - INFO - __main__ - Step 59941: {'lr': 0.00033358509762914957, 'samples': 11508672, 'steps': 59940, 'loss/train': 1.7521969079971313} -11/07/2021 05:37:59 - INFO - __main__ - Step 59942: {'lr': 0.0003335800962564374, 'samples': 11508864, 'steps': 59941, 'loss/train': 0.7541856169700623} -11/07/2021 05:37:59 - INFO - __main__ - Step 59943: {'lr': 0.0003335750948460652, 'samples': 11509056, 'steps': 59942, 'loss/train': 1.1702239513397217} -11/07/2021 05:37:59 - INFO - __main__ - Step 59944: {'lr': 0.0003335700933980354, 'samples': 11509248, 'steps': 59943, 'loss/train': 1.7087632417678833} -11/07/2021 05:38:00 - INFO - __main__ - Step 59945: {'lr': 0.0003335650919123503, 'samples': 11509440, 'steps': 59944, 'loss/train': 1.7990319728851318} -11/07/2021 05:38:01 - INFO - __main__ - Step 59946: {'lr': 0.0003335600903890119, 'samples': 11509632, 'steps': 59945, 'loss/train': 1.8563764095306396} -11/07/2021 05:38:01 - INFO - __main__ - Step 59947: {'lr': 0.0003335550888280227, 'samples': 11509824, 'steps': 59946, 'loss/train': 1.5483802556991577} -11/07/2021 05:38:01 - INFO - __main__ - Step 59948: {'lr': 0.00033355008722938485, 'samples': 11510016, 'steps': 59947, 'loss/train': 0.8849313855171204} -11/07/2021 05:38:02 - INFO - __main__ - Step 59949: {'lr': 0.0003335450855931006, 'samples': 11510208, 'steps': 59948, 'loss/train': 1.6003526449203491} -11/07/2021 05:38:03 - INFO - __main__ - Step 59950: {'lr': 0.00033354008391917224, 'samples': 11510400, 'steps': 59949, 'loss/train': 1.5374506711959839} -11/07/2021 05:38:03 - INFO - __main__ - Step 59951: {'lr': 0.00033353508220760204, 'samples': 11510592, 'steps': 59950, 'loss/train': 1.5414222478866577} -11/07/2021 05:38:03 - INFO - __main__ - Step 59952: {'lr': 0.00033353008045839224, 'samples': 11510784, 'steps': 59951, 'loss/train': 1.1849223375320435} -11/07/2021 05:38:04 - INFO - __main__ - Step 59953: {'lr': 0.000333525078671545, 'samples': 11510976, 'steps': 59952, 'loss/train': 0.8675971031188965} -11/07/2021 05:38:04 - INFO - __main__ - Step 59954: {'lr': 0.0003335200768470627, 'samples': 11511168, 'steps': 59953, 'loss/train': 0.0594203881919384} -11/07/2021 05:38:05 - INFO - __main__ - Step 59955: {'lr': 0.0003335150749849475, 'samples': 11511360, 'steps': 59954, 'loss/train': 1.1955112218856812} -11/07/2021 05:38:05 - INFO - __main__ - Step 59956: {'lr': 0.0003335100730852017, 'samples': 11511552, 'steps': 59955, 'loss/train': 1.3597326278686523} -11/07/2021 05:38:06 - INFO - __main__ - Step 59957: {'lr': 0.0003335050711478276, 'samples': 11511744, 'steps': 59956, 'loss/train': 1.4074528217315674} -11/07/2021 05:38:06 - INFO - __main__ - Step 59958: {'lr': 0.0003335000691728273, 'samples': 11511936, 'steps': 59957, 'loss/train': 1.0630269050598145} -11/07/2021 05:38:07 - INFO - __main__ - Step 59959: {'lr': 0.0003334950671602033, 'samples': 11512128, 'steps': 59958, 'loss/train': 1.3670204877853394} -11/07/2021 05:38:08 - INFO - __main__ - Step 59960: {'lr': 0.00033349006510995766, 'samples': 11512320, 'steps': 59959, 'loss/train': 1.0078097581863403} -11/07/2021 05:38:08 - INFO - __main__ - Step 59961: {'lr': 0.00033348506302209265, 'samples': 11512512, 'steps': 59960, 'loss/train': 1.460436224937439} -11/07/2021 05:38:08 - INFO - __main__ - Step 59962: {'lr': 0.00033348006089661055, 'samples': 11512704, 'steps': 59961, 'loss/train': 1.4430351257324219} -11/07/2021 05:38:09 - INFO - __main__ - Step 59963: {'lr': 0.0003334750587335136, 'samples': 11512896, 'steps': 59962, 'loss/train': 1.1543771028518677} -11/07/2021 05:38:09 - INFO - __main__ - Step 59964: {'lr': 0.00033347005653280414, 'samples': 11513088, 'steps': 59963, 'loss/train': 1.6782102584838867} -11/07/2021 05:38:09 - INFO - __main__ - Step 59965: {'lr': 0.0003334650542944844, 'samples': 11513280, 'steps': 59964, 'loss/train': 1.6661664247512817} -11/07/2021 05:38:10 - INFO - __main__ - Step 59966: {'lr': 0.00033346005201855656, 'samples': 11513472, 'steps': 59965, 'loss/train': 1.1616204977035522} -11/07/2021 05:38:11 - INFO - __main__ - Step 59967: {'lr': 0.00033345504970502284, 'samples': 11513664, 'steps': 59966, 'loss/train': 0.9831913709640503} -11/07/2021 05:38:11 - INFO - __main__ - Step 59968: {'lr': 0.0003334500473538856, 'samples': 11513856, 'steps': 59967, 'loss/train': 1.378980278968811} -11/07/2021 05:38:11 - INFO - __main__ - Step 59969: {'lr': 0.00033344504496514703, 'samples': 11514048, 'steps': 59968, 'loss/train': 1.2002038955688477} -11/07/2021 05:38:12 - INFO - __main__ - Step 59970: {'lr': 0.0003334400425388095, 'samples': 11514240, 'steps': 59969, 'loss/train': 1.185613989830017} -11/07/2021 05:38:13 - INFO - __main__ - Step 59971: {'lr': 0.00033343504007487515, 'samples': 11514432, 'steps': 59970, 'loss/train': 1.4303959608078003} -11/07/2021 05:38:13 - INFO - __main__ - Step 59972: {'lr': 0.00033343003757334625, 'samples': 11514624, 'steps': 59971, 'loss/train': 1.2609548568725586} -11/07/2021 05:38:14 - INFO - __main__ - Step 59973: {'lr': 0.000333425035034225, 'samples': 11514816, 'steps': 59972, 'loss/train': 1.406761884689331} -11/07/2021 05:38:14 - INFO - __main__ - Step 59974: {'lr': 0.00033342003245751374, 'samples': 11515008, 'steps': 59973, 'loss/train': 1.5263012647628784} -11/07/2021 05:38:14 - INFO - __main__ - Step 59975: {'lr': 0.0003334150298432147, 'samples': 11515200, 'steps': 59974, 'loss/train': 1.870259404182434} -11/07/2021 05:38:15 - INFO - __main__ - Step 59976: {'lr': 0.00033341002719133016, 'samples': 11515392, 'steps': 59975, 'loss/train': 1.5945241451263428} -11/07/2021 05:38:16 - INFO - __main__ - Step 59977: {'lr': 0.0003334050245018624, 'samples': 11515584, 'steps': 59976, 'loss/train': 1.0896097421646118} -11/07/2021 05:38:16 - INFO - __main__ - Step 59978: {'lr': 0.00033340002177481353, 'samples': 11515776, 'steps': 59977, 'loss/train': 1.4379078149795532} -11/07/2021 05:38:16 - INFO - __main__ - Step 59979: {'lr': 0.00033339501901018595, 'samples': 11515968, 'steps': 59978, 'loss/train': 1.8286679983139038} -11/07/2021 05:38:17 - INFO - __main__ - Step 59980: {'lr': 0.0003333900162079818, 'samples': 11516160, 'steps': 59979, 'loss/train': 1.4866057634353638} -11/07/2021 05:38:18 - INFO - __main__ - Step 59981: {'lr': 0.00033338501336820347, 'samples': 11516352, 'steps': 59980, 'loss/train': 1.0197144746780396} -11/07/2021 05:38:18 - INFO - __main__ - Step 59982: {'lr': 0.0003333800104908531, 'samples': 11516544, 'steps': 59981, 'loss/train': 1.3618757724761963} -11/07/2021 05:38:18 - INFO - __main__ - Step 59983: {'lr': 0.00033337500757593306, 'samples': 11516736, 'steps': 59982, 'loss/train': 1.2537387609481812} -11/07/2021 05:38:19 - INFO - __main__ - Step 59984: {'lr': 0.0003333700046234454, 'samples': 11516928, 'steps': 59983, 'loss/train': 0.8415775299072266} -11/07/2021 05:38:19 - INFO - __main__ - Step 59985: {'lr': 0.00033336500163339255, 'samples': 11517120, 'steps': 59984, 'loss/train': 1.416278600692749} -11/07/2021 05:38:20 - INFO - __main__ - Step 59986: {'lr': 0.00033335999860577677, 'samples': 11517312, 'steps': 59985, 'loss/train': 1.417700171470642} -11/07/2021 05:38:21 - INFO - __main__ - Step 59987: {'lr': 0.0003333549955406002, 'samples': 11517504, 'steps': 59986, 'loss/train': 1.4902400970458984} -11/07/2021 05:38:21 - INFO - __main__ - Step 59988: {'lr': 0.0003333499924378652, 'samples': 11517696, 'steps': 59987, 'loss/train': 1.3031017780303955} -11/07/2021 05:38:21 - INFO - __main__ - Step 59989: {'lr': 0.00033334498929757394, 'samples': 11517888, 'steps': 59988, 'loss/train': 1.293977975845337} -11/07/2021 05:38:22 - INFO - __main__ - Step 59990: {'lr': 0.0003333399861197287, 'samples': 11518080, 'steps': 59989, 'loss/train': 0.5613684058189392} -11/07/2021 05:38:23 - INFO - __main__ - Step 59991: {'lr': 0.00033333498290433184, 'samples': 11518272, 'steps': 59990, 'loss/train': 1.4361369609832764} -11/07/2021 05:38:23 - INFO - __main__ - Step 59992: {'lr': 0.00033332997965138545, 'samples': 11518464, 'steps': 59991, 'loss/train': 1.5548150539398193} -11/07/2021 05:38:24 - INFO - __main__ - Step 59993: {'lr': 0.0003333249763608919, 'samples': 11518656, 'steps': 59992, 'loss/train': 1.6068527698516846} -11/07/2021 05:38:24 - INFO - __main__ - Step 59994: {'lr': 0.00033331997303285334, 'samples': 11518848, 'steps': 59993, 'loss/train': 0.06748134642839432} -11/07/2021 05:38:24 - INFO - __main__ - Step 59995: {'lr': 0.00033331496966727207, 'samples': 11519040, 'steps': 59994, 'loss/train': 1.4003791809082031} -11/07/2021 05:38:25 - INFO - __main__ - Step 59996: {'lr': 0.00033330996626415046, 'samples': 11519232, 'steps': 59995, 'loss/train': 1.4762942790985107} -11/07/2021 05:38:26 - INFO - __main__ - Step 59997: {'lr': 0.0003333049628234906, 'samples': 11519424, 'steps': 59996, 'loss/train': 1.3110620975494385} -11/07/2021 05:38:26 - INFO - __main__ - Step 59998: {'lr': 0.0003332999593452948, 'samples': 11519616, 'steps': 59997, 'loss/train': 1.3451272249221802} -11/07/2021 05:38:27 - INFO - __main__ - Step 59999: {'lr': 0.0003332949558295654, 'samples': 11519808, 'steps': 59998, 'loss/train': 1.0439751148223877} -11/07/2021 05:38:27 - INFO - __main__ - Step 60000: {'lr': 0.0003332899522763045, 'samples': 11520000, 'steps': 59999, 'loss/train': 1.3764021396636963} -11/07/2021 05:38:27 - INFO - __main__ - Evaluating and saving model checkpoint -11/07/2021 05:41:40 - INFO - __main__ - Step 60000: {'loss/eval': 1.3816074132919312, 'perplexity': 3.9812960624694824} +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5a3a6af8c5ea712bc974f401994aeef7b737fa4e9e7e83264b090830e5ed50 +size 11396737